Repository: quickwit-oss/quickwit
Branch: main
Commit: 06f0ef088a49
Files: 1206
Total size: 12.3 MB

Directory structure:
gitextract_hf8mrikh/

├── .cargo/
│   └── config.toml
├── .claude/
│   └── skills/
│       ├── bump-tantivy/
│       │   └── SKILL.md
│       ├── fix-clippy/
│       │   └── SKILL.md
│       ├── fmt/
│       │   └── SKILL.md
│       ├── rationalize-deps/
│       │   └── SKILL.md
│       └── simple-pr/
│           └── SKILL.md
├── .devcontainer/
│   ├── devcontainer.json
│   ├── post-create.sh
│   └── welcome.txt
├── .dockerignore
├── .gitattributes
├── .github/
│   ├── ISSUE_TEMPLATE/
│   │   ├── bug_report.md
│   │   ├── documentation_request.md
│   │   ├── feature_request.md
│   │   └── tutorial_request.md
│   ├── PULL_REQUEST_TEMPLATE.md
│   ├── actions/
│   │   ├── cargo-build-macos-binary/
│   │   │   └── action.yml
│   │   └── cross-build-binary/
│   │       └── action.yml
│   ├── dependabot.yml
│   └── workflows/
│       ├── ci.yml
│       ├── coverage.yml
│       ├── dependency.yml
│       ├── publish_cross_images.yml
│       ├── publish_docker_images.yml
│       ├── publish_lambda.yaml
│       ├── publish_nightly_packages.yml
│       ├── publish_release_packages.yml
│       ├── requirements.txt
│       ├── scorecard.yml
│       └── ui-ci.yml
├── .gitignore
├── .localstack/
│   └── init.sh
├── CHANGELOG.md
├── CODE_OF_CONDUCT.md
├── CODE_STYLE.md
├── CONTRIBUTING.md
├── Dockerfile
├── LICENSE
├── LICENSE-3rdparty.csv
├── Makefile
├── README.md
├── SECURITY.md
├── _typos.toml
├── build/
│   └── cross-images/
│       ├── aarch64-unknown-linux-gnu.dockerfile
│       ├── aarch64-unknown-linux-musl.dockerfile
│       ├── x86_64-unknown-linux-gnu.dockerfile
│       └── x86_64-unknown-linux-musl.dockerfile
├── config/
│   ├── quickwit.yaml
│   ├── templates/
│   │   ├── gh-archive.yaml
│   │   └── stackoverflow.yaml
│   └── tutorials/
│       ├── fluentbit-logs/
│       │   └── index-config.yaml
│       ├── gh-archive/
│       │   ├── index-config-for-clickhouse.yaml
│       │   ├── index-config.yaml
│       │   ├── kafka-source.yaml
│       │   └── kinesis-source.yaml
│       ├── grafana/
│       │   └── docker-compose.yml
│       ├── hdfs-logs/
│       │   ├── index-config-partitioned.yaml
│       │   ├── index-config-retention-policy.yaml
│       │   ├── index-config.yaml
│       │   ├── searcher-1.yaml
│       │   ├── searcher-2.yaml
│       │   └── searcher-3.yaml
│       ├── otel-logs/
│       │   ├── index-config.yaml
│       │   ├── kafka-source.yaml
│       │   └── otel-values.yaml
│       ├── otel-traces/
│       │   ├── index-config.yaml
│       │   └── kafka-source.yaml
│       ├── stackoverflow/
│       │   ├── index-config.yaml
│       │   ├── pulsar-source.yaml
│       │   └── send_messages_to_pulsar.py
│       ├── vector-otel-logs/
│       │   └── vector.toml
│       └── wikipedia/
│           ├── index-config.yaml
│           └── multilang-index-config.yaml
├── distribution/
│   ├── docker/
│   │   └── ubuntu/
│   │       └── Dockerfile
│   ├── ecs/
│   │   ├── .gitignore
│   │   ├── README.md
│   │   ├── example/
│   │   │   ├── .terraform.lock.hcl
│   │   │   ├── bastion.tf
│   │   │   ├── image.tf
│   │   │   ├── kafka.tf
│   │   │   ├── terraform.tf
│   │   │   └── vpc.tf
│   │   └── quickwit/
│   │       ├── cluster.tf
│   │       ├── configs.tf
│   │       ├── iam.tf
│   │       ├── outputs.tf
│   │       ├── quickwit-control-plane.tf
│   │       ├── quickwit-indexer.tf
│   │       ├── quickwit-janitor.tf
│   │       ├── quickwit-metastore.tf
│   │       ├── quickwit-searcher.tf
│   │       ├── rds.tf
│   │       ├── s3.tf
│   │       ├── service/
│   │       │   ├── config.tf
│   │       │   ├── ecs.tf
│   │       │   └── variables.tf
│   │       └── variables.tf
│   └── kubernetes/
│       └── README.md
├── docker-compose.yml
├── docs/
│   ├── assets/
│   │   └── sqs-file-source.tf
│   ├── configuration/
│   │   ├── _category_.yaml
│   │   ├── index-config.md
│   │   ├── index.md
│   │   ├── lambda-config.md
│   │   ├── metastore-config.md
│   │   ├── node-config.md
│   │   ├── ports-config.md
│   │   ├── source-config.md
│   │   ├── storage-config.md
│   │   └── template-config.md
│   ├── deployment/
│   │   ├── _category_.yaml
│   │   ├── cluster-sizing.md
│   │   ├── deployment-modes.md
│   │   └── kubernetes/
│   │       ├── _category_.yaml
│   │       ├── gke.md
│   │       ├── glasskube.md
│   │       └── helm.md
│   ├── distributed-tracing/
│   │   ├── _category_.yaml
│   │   ├── otel-service.md
│   │   ├── overview.md
│   │   ├── plug-quickwit-to-jaeger.md
│   │   └── send-traces/
│   │       ├── _category_.yaml
│   │       ├── using-otel-collector.md
│   │       └── using-otel-sdk-python.md
│   ├── get-started/
│   │   ├── _category_.yaml
│   │   ├── installation.md
│   │   ├── query-language-intro.md
│   │   ├── quickstart.md
│   │   └── tutorials/
│   │       ├── _category_.yaml
│   │       ├── prometheus-metrics.md
│   │       ├── trace-analytics-with-grafana.md
│   │       ├── tutorial-hdfs-logs-distributed-search-aws-s3.md
│   │       ├── tutorial-hdfs-logs.md
│   │       └── tutorial-jaeger.md
│   ├── guides/
│   │   ├── _category_.yaml
│   │   ├── aws-setup.md
│   │   ├── schemaless.md
│   │   └── storage-setup/
│   │       ├── _category_.yaml
│   │       └── aws-s3.md
│   ├── ingest-data/
│   │   ├── _category_.yaml
│   │   ├── index.md
│   │   ├── ingest-api.md
│   │   ├── ingest-local-file.md
│   │   ├── kafka.md
│   │   ├── kinesis.md
│   │   ├── pulsar.md
│   │   └── sqs-files.md
│   ├── internals/
│   │   ├── backward-compatibility.md
│   │   ├── date-time.md
│   │   ├── ingest-v2.md
│   │   ├── scroll.md
│   │   ├── searcher-split-cache.md
│   │   ├── sorting.md
│   │   ├── split-format.md
│   │   └── template-index.md
│   ├── log-management/
│   │   ├── _category_.yaml
│   │   ├── otel-service.md
│   │   ├── overview.md
│   │   ├── send-logs/
│   │   │   ├── _category_.yaml
│   │   │   ├── send-docker-logs.md
│   │   │   ├── using-fluentbit.md
│   │   │   ├── using-otel-collector-with-helm.md
│   │   │   ├── using-otel-collector.md
│   │   │   └── using-vector.md
│   │   └── supported-agents.md
│   ├── operating/
│   │   ├── _category_.yaml
│   │   ├── aws-costs.md
│   │   ├── data-directory.md
│   │   ├── monitoring.md
│   │   └── upgrades.md
│   ├── overview/
│   │   ├── _category_.yaml
│   │   ├── architecture.md
│   │   ├── concepts/
│   │   │   ├── _category_.yaml
│   │   │   ├── deletes.md
│   │   │   ├── indexing.md
│   │   │   └── querying.md
│   │   ├── index.md
│   │   └── introduction.md
│   ├── reference/
│   │   ├── _category_.yaml
│   │   ├── aggregation.md
│   │   ├── cli.md
│   │   ├── es_compatible_api.md
│   │   ├── metrics.md
│   │   ├── query-language.md
│   │   ├── rest-api.md
│   │   └── updating-mapper.md
│   └── telemetry.md
├── install.sh
├── monitoring/
│   ├── grafana/
│   │   ├── README.md
│   │   ├── dashboards/
│   │   │   ├── indexers.json
│   │   │   ├── ingesters.json
│   │   │   ├── metastore.json
│   │   │   └── searchers.json
│   │   └── provisioning/
│   │       ├── dashboards/
│   │       │   └── default.yaml
│   │       └── datasources/
│   │           └── default.yaml
│   ├── otel-collector-config.yaml
│   └── prometheus.yaml
└── quickwit/
    ├── .cargo/
    │   └── config.toml
    ├── .cargo-dev/
    │   └── config.toml
    ├── .config/
    │   └── nextest.toml
    ├── .license_header.txt
    ├── CLAUDE.md
    ├── Cargo.toml
    ├── Cross.toml
    ├── Makefile
    ├── NOTICE
    ├── clippy.toml
    ├── deny.toml
    ├── dependency-licenses.html
    ├── license-tool.toml
    ├── quickwit-actors/
    │   ├── Cargo.toml
    │   ├── LICENSE
    │   ├── README.md
    │   ├── benches/
    │   │   └── bench.rs
    │   ├── examples/
    │   │   └── ping_actor.rs
    │   └── src/
    │       ├── actor.rs
    │       ├── actor_context.rs
    │       ├── actor_handle.rs
    │       ├── actor_state.rs
    │       ├── channel_with_priority.rs
    │       ├── command.rs
    │       ├── envelope.rs
    │       ├── lib.rs
    │       ├── mailbox.rs
    │       ├── observation.rs
    │       ├── registry.rs
    │       ├── scheduler.rs
    │       ├── spawn_builder.rs
    │       ├── supervisor.rs
    │       ├── tests.rs
    │       └── universe.rs
    ├── quickwit-aws/
    │   ├── Cargo.toml
    │   └── src/
    │       ├── error.rs
    │       ├── lib.rs
    │       └── retry.rs
    ├── quickwit-cli/
    │   ├── Cargo.toml
    │   ├── src/
    │   │   ├── checklist.rs
    │   │   ├── cli.rs
    │   │   ├── cli_doc_ext.toml
    │   │   ├── generate_markdown.rs
    │   │   ├── index.rs
    │   │   ├── jemalloc.rs
    │   │   ├── lib.rs
    │   │   ├── logger.rs
    │   │   ├── main.rs
    │   │   ├── metrics.rs
    │   │   ├── service.rs
    │   │   ├── source.rs
    │   │   ├── split.rs
    │   │   ├── stats.rs
    │   │   └── tool.rs
    │   └── tests/
    │       ├── Pipfile
    │       ├── cli.rs
    │       ├── helpers.rs
    │       └── prepare_tests.sh
    ├── quickwit-cluster/
    │   ├── Cargo.toml
    │   └── src/
    │       ├── change.rs
    │       ├── cluster.rs
    │       ├── grpc_gossip.rs
    │       ├── grpc_service.rs
    │       ├── lib.rs
    │       ├── member.rs
    │       ├── metrics.rs
    │       └── node.rs
    ├── quickwit-codegen/
    │   ├── Cargo.toml
    │   ├── README.md
    │   ├── example/
    │   │   ├── Cargo.toml
    │   │   ├── build.rs
    │   │   └── src/
    │   │       ├── codegen/
    │   │       │   └── hello.rs
    │   │       ├── error.rs
    │   │       ├── hello.proto
    │   │       └── lib.rs
    │   └── src/
    │       ├── codegen.rs
    │       └── lib.rs
    ├── quickwit-common/
    │   ├── Cargo.toml
    │   ├── build.rs
    │   └── src/
    │       ├── alloc_tracker.rs
    │       ├── binary_heap.rs
    │       ├── coolid.rs
    │       ├── cpus.rs
    │       ├── fs.rs
    │       ├── io.rs
    │       ├── jemalloc_profiled.rs
    │       ├── kill_switch.rs
    │       ├── lib.rs
    │       ├── metrics.rs
    │       ├── net.rs
    │       ├── path_hasher.rs
    │       ├── pretty.rs
    │       ├── progress.rs
    │       ├── pubsub.rs
    │       ├── rand.rs
    │       ├── rate_limited_tracing.rs
    │       ├── rate_limiter.rs
    │       ├── rendezvous_hasher.rs
    │       ├── retry.rs
    │       ├── ring_buffer.rs
    │       ├── runtimes.rs
    │       ├── shared_consts.rs
    │       ├── socket_addr_legacy_hash.rs
    │       ├── sorted_iter.rs
    │       ├── stream_utils.rs
    │       ├── temp_dir.rs
    │       ├── test_utils.rs
    │       ├── thread_pool.rs
    │       ├── tower/
    │       │   ├── box_layer.rs
    │       │   ├── box_service.rs
    │       │   ├── buffer.rs
    │       │   ├── change.rs
    │       │   ├── circuit_breaker.rs
    │       │   ├── delay.rs
    │       │   ├── estimate_rate.rs
    │       │   ├── event_listener.rs
    │       │   ├── load_shed.rs
    │       │   ├── metrics.rs
    │       │   ├── mod.rs
    │       │   ├── one_task_per_call_layer.rs
    │       │   ├── pool.rs
    │       │   ├── rate.rs
    │       │   ├── rate_estimator.rs
    │       │   ├── rate_limit.rs
    │       │   ├── retry.rs
    │       │   ├── timeout.rs
    │       │   └── transport.rs
    │       ├── type_map.rs
    │       └── uri.rs
    ├── quickwit-config/
    │   ├── Cargo.toml
    │   ├── resources/
    │   │   └── tests/
    │   │       ├── index_config/
    │   │       │   ├── hdfs-logs-create-config.yaml
    │   │       │   ├── hdfs-logs.json
    │   │       │   ├── hdfs-logs.toml
    │   │       │   ├── hdfs-logs.yaml
    │   │       │   ├── minimal-hdfs-logs.yaml
    │   │       │   └── partial-hdfs-logs.yaml
    │   │       ├── node_config/
    │   │       │   ├── quickwit.json
    │   │       │   ├── quickwit.toml
    │   │       │   ├── quickwit.wrongkey.yaml
    │   │       │   └── quickwit.yaml
    │   │       └── source_config/
    │   │           ├── ingest-api-source.json
    │   │           ├── kafka-source.json
    │   │           └── kinesis-source.yaml
    │   └── src/
    │       ├── cluster_config/
    │       │   └── mod.rs
    │       ├── config_value.rs
    │       ├── index_config/
    │       │   ├── mod.rs
    │       │   └── serialize.rs
    │       ├── index_template/
    │       │   ├── mod.rs
    │       │   └── serialize.rs
    │       ├── lib.rs
    │       ├── merge_policy_config.rs
    │       ├── metastore_config.rs
    │       ├── node_config/
    │       │   ├── mod.rs
    │       │   └── serialize.rs
    │       ├── qw_env_vars.rs
    │       ├── serde_utils.rs
    │       ├── service.rs
    │       ├── source_config/
    │       │   ├── mod.rs
    │       │   └── serialize.rs
    │       ├── storage_config.rs
    │       └── templating.rs
    ├── quickwit-control-plane/
    │   ├── Cargo.toml
    │   ├── README.md
    │   └── src/
    │       ├── control_plane.rs
    │       ├── cooldown_map.rs
    │       ├── debouncer.rs
    │       ├── indexing_plan.rs
    │       ├── indexing_scheduler/
    │       │   ├── change_tracker.rs
    │       │   ├── mod.rs
    │       │   └── scheduling/
    │       │       ├── README.md
    │       │       ├── mod.rs
    │       │       ├── scheduling_logic.rs
    │       │       └── scheduling_logic_model.rs
    │       ├── ingest/
    │       │   ├── ingest_controller.rs
    │       │   ├── mod.rs
    │       │   ├── scaling_arbiter.rs
    │       │   └── wait_handle.rs
    │       ├── lib.rs
    │       ├── metrics.rs
    │       ├── model/
    │       │   ├── mod.rs
    │       │   └── shard_table.rs
    │       └── tests.rs
    ├── quickwit-datetime/
    │   ├── Cargo.toml
    │   ├── README.md
    │   └── src/
    │       ├── date_time_format.rs
    │       ├── date_time_parsing.rs
    │       ├── java_date_time_format.rs
    │       └── lib.rs
    ├── quickwit-directories/
    │   ├── Cargo.toml
    │   └── src/
    │       ├── bundle_directory.rs
    │       ├── caching_directory.rs
    │       ├── debug_proxy_directory.rs
    │       ├── hot_directory.rs
    │       ├── lib.rs
    │       ├── storage_directory.rs
    │       └── union_directory.rs
    ├── quickwit-doc-mapper/
    │   ├── Cargo.toml
    │   ├── benches/
    │   │   ├── data/
    │   │   │   ├── simple-parse-bench.json
    │   │   │   └── simple-routing-expression-bench.json
    │   │   ├── doc_to_json_bench.rs
    │   │   └── routing_expression_bench.rs
    │   └── src/
    │       ├── doc_mapper/
    │       │   ├── date_time_type.rs
    │       │   ├── doc_mapper_builder.rs
    │       │   ├── doc_mapper_impl.rs
    │       │   ├── field_mapping_entry.rs
    │       │   ├── field_mapping_type.rs
    │       │   ├── field_presence.rs
    │       │   ├── mapping_tree.rs
    │       │   ├── mod.rs
    │       │   ├── tantivy_val_to_json.rs
    │       │   └── tokenizer_entry.rs
    │       ├── doc_mapping.rs
    │       ├── error.rs
    │       ├── lib.rs
    │       ├── query_builder.rs
    │       ├── routing_expression/
    │       │   └── mod.rs
    │       └── tag_pruning.rs
    ├── quickwit-index-management/
    │   ├── Cargo.toml
    │   └── src/
    │       ├── garbage_collection.rs
    │       ├── index.rs
    │       └── lib.rs
    ├── quickwit-indexing/
    │   ├── Cargo.toml
    │   ├── README.md
    │   ├── benches/
    │   │   ├── data/
    │   │   │   ├── bench_data.json
    │   │   │   ├── bench_data_heavy_transform.json
    │   │   │   └── bench_data_light_transform.json
    │   │   └── doc_process_vrl_bench.rs
    │   ├── data/
    │   │   └── test_corpus.json
    │   ├── failpoints/
    │   │   └── mod.rs
    │   └── src/
    │       ├── actors/
    │       │   ├── cooperative_indexing.rs
    │       │   ├── doc_processor.rs
    │       │   ├── index_serializer.rs
    │       │   ├── indexer.rs
    │       │   ├── indexing_pipeline.rs
    │       │   ├── indexing_service.rs
    │       │   ├── merge_executor.rs
    │       │   ├── merge_pipeline.rs
    │       │   ├── merge_planner.rs
    │       │   ├── merge_scheduler_service.rs
    │       │   ├── merge_split_downloader.rs
    │       │   ├── mod.rs
    │       │   ├── packager.rs
    │       │   ├── publisher.rs
    │       │   ├── sequencer.rs
    │       │   ├── uploader.rs
    │       │   └── vrl_processing.rs
    │       ├── controlled_directory.rs
    │       ├── lib.rs
    │       ├── merge_policy/
    │       │   ├── const_write_amplification.rs
    │       │   ├── mod.rs
    │       │   ├── nop_merge_policy.rs
    │       │   └── stable_log_merge_policy.rs
    │       ├── metrics.rs
    │       ├── models/
    │       │   ├── indexed_split.rs
    │       │   ├── indexing_service_message.rs
    │       │   ├── indexing_statistics.rs
    │       │   ├── merge_planner_message.rs
    │       │   ├── merge_scratch.rs
    │       │   ├── merge_statistics.rs
    │       │   ├── mod.rs
    │       │   ├── packaged_split.rs
    │       │   ├── processed_doc.rs
    │       │   ├── publish_lock.rs
    │       │   ├── publisher_message.rs
    │       │   ├── raw_doc_batch.rs
    │       │   ├── shard_positions.rs
    │       │   └── split_attrs.rs
    │       ├── source/
    │       │   ├── doc_file_reader.rs
    │       │   ├── file_source.rs
    │       │   ├── gcp_pubsub_source.rs
    │       │   ├── ingest/
    │       │   │   └── mod.rs
    │       │   ├── ingest_api_source.rs
    │       │   ├── kafka_source.rs
    │       │   ├── kinesis/
    │       │   │   ├── api.rs
    │       │   │   ├── helpers.rs
    │       │   │   ├── kinesis_source.rs
    │       │   │   ├── mod.rs
    │       │   │   └── shard_consumer.rs
    │       │   ├── mod.rs
    │       │   ├── pulsar_source.rs
    │       │   ├── queue_sources/
    │       │   │   ├── coordinator.rs
    │       │   │   ├── design.md
    │       │   │   ├── helpers.rs
    │       │   │   ├── local_state.rs
    │       │   │   ├── memory_queue.rs
    │       │   │   ├── message.rs
    │       │   │   ├── mod.rs
    │       │   │   ├── shared_state.rs
    │       │   │   ├── sqs_queue.rs
    │       │   │   └── visibility.rs
    │       │   ├── source_factory.rs
    │       │   ├── stdin_source.rs
    │       │   ├── vec_source.rs
    │       │   └── void_source.rs
    │       ├── split_store/
    │       │   ├── indexing_split_cache.rs
    │       │   ├── indexing_split_store.rs
    │       │   ├── mod.rs
    │       │   └── split_store_quota.rs
    │       └── test_utils.rs
    ├── quickwit-ingest/
    │   ├── Cargo.toml
    │   ├── build.rs
    │   └── src/
    │       ├── codegen/
    │       │   └── ingest_service.rs
    │       ├── doc_batch.rs
    │       ├── error.rs
    │       ├── ingest_api_service.rs
    │       ├── ingest_service.proto
    │       ├── ingest_v2/
    │       │   ├── broadcast/
    │       │   │   ├── capacity_score.rs
    │       │   │   ├── local_shards.rs
    │       │   │   └── mod.rs
    │       │   ├── debouncing.rs
    │       │   ├── doc_mapper.rs
    │       │   ├── fetch.rs
    │       │   ├── helpers.rs
    │       │   ├── idle.rs
    │       │   ├── ingest.md
    │       │   ├── ingester.rs
    │       │   ├── metrics.rs
    │       │   ├── mod.rs
    │       │   ├── models.rs
    │       │   ├── mrecord.rs
    │       │   ├── mrecordlog_utils.rs
    │       │   ├── publish_tracker.rs
    │       │   ├── rate_meter.rs
    │       │   ├── replication.md
    │       │   ├── replication.rs
    │       │   ├── router.rs
    │       │   ├── routing_table.rs
    │       │   ├── state.rs
    │       │   ├── wal_capacity_tracker.rs
    │       │   └── workbench.rs
    │       ├── lib.rs
    │       ├── memory_capacity.rs
    │       ├── metrics.rs
    │       ├── mrecordlog_async.rs
    │       ├── notifications.rs
    │       ├── position.rs
    │       └── queue.rs
    ├── quickwit-integration-tests/
    │   ├── Cargo.toml
    │   ├── src/
    │   │   ├── lib.rs
    │   │   ├── test_utils/
    │   │   │   ├── cluster_sandbox.rs
    │   │   │   ├── mod.rs
    │   │   │   └── shutdown.rs
    │   │   └── tests/
    │   │       ├── basic_tests.rs
    │   │       ├── ingest_v1_tests.rs
    │   │       ├── ingest_v2_tests.rs
    │   │       ├── mod.rs
    │   │       ├── no_cp_tests.rs
    │   │       ├── otlp_tests.rs
    │   │       ├── sqs_tests.rs
    │   │       ├── tls_tests.rs
    │   │       └── update_tests/
    │   │           ├── create_on_update.rs
    │   │           ├── doc_mapping_tests.rs
    │   │           ├── mod.rs
    │   │           ├── restart_indexer_tests.rs
    │   │           └── search_settings_tests.rs
    │   └── test_data/
    │       ├── README.md
    │       ├── ca.crt
    │       ├── ca.key
    │       ├── ca.srl
    │       ├── regenerate-certs.sh
    │       ├── server.crt
    │       ├── server.csr
    │       ├── server.key
    │       └── server.v3.ext
    ├── quickwit-jaeger/
    │   ├── Cargo.toml
    │   └── src/
    │       ├── lib.rs
    │       ├── metrics.rs
    │       ├── v1.rs
    │       └── v2.rs
    ├── quickwit-janitor/
    │   ├── Cargo.toml
    │   └── src/
    │       ├── actors/
    │       │   ├── delete_task_pipeline.rs
    │       │   ├── delete_task_planner.rs
    │       │   ├── delete_task_service.rs
    │       │   ├── garbage_collector.rs
    │       │   ├── mod.rs
    │       │   └── retention_policy_executor.rs
    │       ├── error.rs
    │       ├── janitor_service.rs
    │       ├── lib.rs
    │       ├── metrics.rs
    │       └── retention_policy_execution.rs
    ├── quickwit-lambda-client/
    │   ├── Cargo.toml
    │   ├── README.md
    │   ├── build.rs
    │   └── src/
    │       ├── deploy.rs
    │       ├── invoker.rs
    │       ├── lib.rs
    │       └── metrics.rs
    ├── quickwit-lambda-server/
    │   ├── Cargo.toml
    │   └── src/
    │       ├── bin/
    │       │   └── leaf_search.rs
    │       ├── context.rs
    │       ├── error.rs
    │       ├── handler.rs
    │       └── lib.rs
    ├── quickwit-macros/
    │   ├── Cargo.toml
    │   └── src/
    │       └── lib.rs
    ├── quickwit-metastore/
    │   ├── Cargo.toml
    │   ├── README.md
    │   ├── build.rs
    │   ├── migrations/
    │   │   └── postgresql/
    │   │       ├── 10_add-split-incarnation-id.down.sql
    │   │       ├── 10_add-split-incarnation-id.up.sql
    │   │       ├── 11_add-split-maturity-timestamp-field.down.sql
    │   │       ├── 11_add-split-maturity-timestamp-field.up.sql
    │   │       ├── 12_create-shards.down.sql
    │   │       ├── 12_create-shards.up.sql
    │   │       ├── 13_migrate-otel-indexes-v0_6.down.sql
    │   │       ├── 13_migrate-otel-indexes-v0_6.up.sql
    │   │       ├── 14_update-shard-id.down.sql
    │   │       ├── 14_update-shard-id.up.sql
    │   │       ├── 15_create-templates.down.sql
    │   │       ├── 15_create-templates.up.sql
    │   │       ├── 16_create-index-split-uid.down.sql
    │   │       ├── 16_create-index-split-uid.up.sql
    │   │       ├── 17_create-index-split-timestamp.down.sql
    │   │       ├── 17_create-index-split-timestamp.up.sql
    │   │       ├── 18_create-index-shard-index-uid.down.sql
    │   │       ├── 18_create-index-shard-index-uid.up.sql
    │   │       ├── 19_add-split-node-id-field.down.sql
    │   │       ├── 19_add-split-node-id-field.up.sql
    │   │       ├── 1_create-indexes.down.sql
    │   │       ├── 1_create-indexes.up.sql
    │   │       ├── 20_add-shard-doc-mapping-uid-field.down.sql
    │   │       ├── 20_add-shard-doc-mapping-uid-field.up.sql
    │   │       ├── 21_add-shard-update-timestamp-field.down.sql
    │   │       ├── 21_add-shard-update-timestamp-field.up.sql
    │   │       ├── 22_change-splits-pkey.down.sql
    │   │       ├── 22_change-splits-pkey.up.sql
    │   │       ├── 23_change-indexes-unique-index.down.sql
    │   │       ├── 23_change-indexes-unique-index.up.sql
    │   │       ├── 24_add-arbitrary-kv.down.sql
    │   │       ├── 24_add-arbitrary-kv.up.sql
    │   │       ├── 25_add-split-size.down.sql
    │   │       ├── 25_add-split-size.up.sql
    │   │       ├── 2_create-splits.down.sql
    │   │       ├── 2_create-splits.up.sql
    │   │       ├── 3_add-split-publish-timestamp-field.down.sql
    │   │       ├── 3_add-split-publish-timestamp-field.up.sql
    │   │       ├── 4_create-delete_tasks.down.sql
    │   │       ├── 4_create-delete_tasks.up.sql
    │   │       ├── 5_add-delete-opstamp-splits.down.sql
    │   │       ├── 5_add-delete-opstamp-splits.up.sql
    │   │       ├── 6_delete-update-index-update-timestamp-on-split-update-trigger.up.sql
    │   │       ├── 7_delete-split-table-triggers.up.sql
    │   │       ├── 8_delete-update-timestamp-on-indexes-table.up.sql
    │   │       ├── 9_add-split-incarnation-id.down.sql
    │   │       └── 9_add-split-incarnation-id.up.sql
    │   ├── src/
    │   │   ├── backward_compatibility_tests/
    │   │   │   ├── README.md
    │   │   │   └── mod.rs
    │   │   ├── checkpoint.rs
    │   │   ├── error.rs
    │   │   ├── lib.rs
    │   │   ├── metastore/
    │   │   │   ├── control_plane_metastore.rs
    │   │   │   ├── file_backed/
    │   │   │   │   ├── file_backed_index/
    │   │   │   │   │   ├── mod.rs
    │   │   │   │   │   ├── serialize.rs
    │   │   │   │   │   └── shards.rs
    │   │   │   │   ├── file_backed_metastore_factory.rs
    │   │   │   │   ├── index_id_matcher.rs
    │   │   │   │   ├── index_template_matcher.rs
    │   │   │   │   ├── lazy_file_backed_index.rs
    │   │   │   │   ├── manifest.rs
    │   │   │   │   ├── mod.rs
    │   │   │   │   ├── state.rs
    │   │   │   │   └── store_operations.rs
    │   │   │   ├── index_metadata/
    │   │   │   │   ├── mod.rs
    │   │   │   │   └── serialize.rs
    │   │   │   ├── mod.rs
    │   │   │   └── postgres/
    │   │   │       ├── error.rs
    │   │   │       ├── factory.rs
    │   │   │       ├── metastore.rs
    │   │   │       ├── metrics.rs
    │   │   │       ├── migrator.rs
    │   │   │       ├── mod.rs
    │   │   │       ├── model.rs
    │   │   │       ├── pool.rs
    │   │   │       ├── queries/
    │   │   │       │   ├── index_templates/
    │   │   │       │   │   ├── find.sql
    │   │   │       │   │   ├── insert.sql
    │   │   │       │   │   └── upsert.sql
    │   │   │       │   ├── indexes_metadata.sql
    │   │   │       │   └── shards/
    │   │   │       │       ├── acquire.sql
    │   │   │       │       ├── delete.sql
    │   │   │       │       ├── fetch.sql
    │   │   │       │       ├── find_not_deletable.sql
    │   │   │       │       ├── insert.sql
    │   │   │       │       ├── open.sql
    │   │   │       │       ├── prune_age.sql
    │   │   │       │       └── prune_count.sql
    │   │   │       ├── split_stream.rs
    │   │   │       ├── tags.rs
    │   │   │       └── utils.rs
    │   │   ├── metastore_factory.rs
    │   │   ├── metastore_resolver.rs
    │   │   ├── split_metadata.rs
    │   │   ├── split_metadata_version.rs
    │   │   └── tests/
    │   │       ├── delete_task.rs
    │   │       ├── get_identity.rs
    │   │       ├── index.rs
    │   │       ├── list_splits.rs
    │   │       ├── mod.rs
    │   │       ├── shard.rs
    │   │       ├── source.rs
    │   │       ├── split.rs
    │   │       └── template.rs
    │   └── test-data/
    │       ├── .gitignore
    │       ├── file-backed-index/
    │       │   ├── v0.7.expected.json
    │       │   ├── v0.7.json
    │       │   ├── v0.8.expected.json
    │       │   ├── v0.8.json
    │       │   ├── v0.9.expected.json
    │       │   └── v0.9.json
    │       ├── index-metadata/
    │       │   ├── v0.7.expected.json
    │       │   ├── v0.7.json
    │       │   ├── v0.8.expected.json
    │       │   ├── v0.8.json
    │       │   ├── v0.9.expected.json
    │       │   └── v0.9.json
    │       ├── manifest/
    │       │   ├── v0.7.expected.json
    │       │   ├── v0.7.json
    │       │   ├── v0.8.expected.json
    │       │   ├── v0.8.json
    │       │   ├── v0.9.expected.json
    │       │   └── v0.9.json
    │       └── split-metadata/
    │           ├── v0.7.expected.json
    │           ├── v0.7.json
    │           ├── v0.8.expected.json
    │           ├── v0.8.json
    │           ├── v0.9.expected.json
    │           └── v0.9.json
    ├── quickwit-metastore-utils/
    │   ├── Cargo.toml
    │   └── src/
    │       ├── bin/
    │       │   ├── README.md
    │       │   ├── proxy.rs
    │       │   └── replay.rs
    │       ├── grpc_request.rs
    │       └── lib.rs
    ├── quickwit-opentelemetry/
    │   ├── Cargo.toml
    │   └── src/
    │       ├── lib.rs
    │       └── otlp/
    │           ├── logs.rs
    │           ├── metrics.rs
    │           ├── mod.rs
    │           ├── test_utils.rs
    │           └── traces.rs
    ├── quickwit-proto/
    │   ├── .gitignore
    │   ├── Cargo.toml
    │   ├── build.rs
    │   ├── protos/
    │   │   ├── quickwit/
    │   │   │   ├── cluster.proto
    │   │   │   ├── common.proto
    │   │   │   ├── control_plane.proto
    │   │   │   ├── developer.proto
    │   │   │   ├── indexing.proto
    │   │   │   ├── ingest.proto
    │   │   │   ├── ingester.proto
    │   │   │   ├── metastore.proto
    │   │   │   ├── router.proto
    │   │   │   └── search.proto
    │   │   └── third-party/
    │   │       ├── gogoproto/
    │   │       │   └── gogo.proto
    │   │       ├── google/
    │   │       │   └── protobuf/
    │   │       │       ├── any.proto
    │   │       │       ├── api.proto
    │   │       │       ├── descriptor.proto
    │   │       │       ├── duration.proto
    │   │       │       ├── empty.proto
    │   │       │       ├── field_mask.proto
    │   │       │       ├── source_context.proto
    │   │       │       ├── struct.proto
    │   │       │       ├── timestamp.proto
    │   │       │       ├── type.proto
    │   │       │       └── wrappers.proto
    │   │       ├── jaeger/
    │   │       │   ├── model.proto
    │   │       │   ├── storage/
    │   │       │   │   └── v2/
    │   │       │   │       └── trace_storage.proto
    │   │       │   └── storage.proto
    │   │       └── opentelemetry/
    │   │           └── proto/
    │   │               ├── collector/
    │   │               │   ├── README.md
    │   │               │   ├── logs/
    │   │               │   │   └── v1/
    │   │               │   │       ├── logs_service.proto
    │   │               │   │       └── logs_service_http.yaml
    │   │               │   ├── metrics/
    │   │               │   │   └── v1/
    │   │               │   │       ├── metrics_service.proto
    │   │               │   │       └── metrics_service_http.yaml
    │   │               │   └── trace/
    │   │               │       └── v1/
    │   │               │           ├── trace_service.proto
    │   │               │           └── trace_service_http.yaml
    │   │               ├── common/
    │   │               │   └── v1/
    │   │               │       └── common.proto
    │   │               ├── logs/
    │   │               │   └── v1/
    │   │               │       └── logs.proto
    │   │               ├── metrics/
    │   │               │   └── v1/
    │   │               │       └── metrics.proto
    │   │               ├── resource/
    │   │               │   └── v1/
    │   │               │       └── resource.proto
    │   │               └── trace/
    │   │                   └── v1/
    │   │                       └── trace.proto
    │   └── src/
    │       ├── cluster/
    │       │   └── mod.rs
    │       ├── codegen/
    │       │   ├── jaeger/
    │       │   │   ├── jaeger.api_v2.rs
    │       │   │   ├── jaeger.storage.v1.rs
    │       │   │   ├── jaeger.storage.v2.rs
    │       │   │   ├── opentelemetry.proto.common.v1.rs
    │       │   │   ├── opentelemetry.proto.resource.v1.rs
    │       │   │   └── opentelemetry.proto.trace.v1.rs
    │       │   ├── opentelemetry/
    │       │   │   ├── opentelemetry.proto.collector.logs.v1.rs
    │       │   │   ├── opentelemetry.proto.collector.metrics.v1.rs
    │       │   │   ├── opentelemetry.proto.collector.trace.v1.rs
    │       │   │   ├── opentelemetry.proto.common.v1.rs
    │       │   │   ├── opentelemetry.proto.logs.v1.rs
    │       │   │   ├── opentelemetry.proto.metrics.v1.rs
    │       │   │   ├── opentelemetry.proto.resource.v1.rs
    │       │   │   └── opentelemetry.proto.trace.v1.rs
    │       │   └── quickwit/
    │       │       ├── quickwit.cluster.rs
    │       │       ├── quickwit.common.rs
    │       │       ├── quickwit.control_plane.rs
    │       │       ├── quickwit.developer.rs
    │       │       ├── quickwit.indexing.rs
    │       │       ├── quickwit.ingest.ingester.rs
    │       │       ├── quickwit.ingest.router.rs
    │       │       ├── quickwit.ingest.rs
    │       │       ├── quickwit.metastore.rs
    │       │       └── quickwit.search.rs
    │       ├── control_plane/
    │       │   └── mod.rs
    │       ├── developer/
    │       │   └── mod.rs
    │       ├── error.rs
    │       ├── getters.rs
    │       ├── indexing/
    │       │   └── mod.rs
    │       ├── ingest/
    │       │   ├── ingester.rs
    │       │   ├── mod.rs
    │       │   └── router.rs
    │       ├── lib.rs
    │       ├── metastore/
    │       │   ├── events.rs
    │       │   └── mod.rs
    │       ├── search/
    │       │   ├── mod.rs
    │       │   ├── span_id.rs
    │       │   └── trace_id.rs
    │       └── types/
    │           ├── doc_mapping_uid.rs
    │           ├── doc_uid.rs
    │           ├── index_uid.rs
    │           ├── mod.rs
    │           ├── pipeline_uid.rs
    │           ├── position.rs
    │           └── shard_id.rs
    ├── quickwit-query/
    │   ├── Cargo.toml
    │   ├── README.md
    │   ├── benches/
    │   │   └── tokenizers_bench.rs
    │   └── src/
    │       ├── aggregations.rs
    │       ├── elastic_query_dsl/
    │       │   ├── bool_query.rs
    │       │   ├── exists_query.rs
    │       │   ├── match_bool_prefix.rs
    │       │   ├── match_phrase_query.rs
    │       │   ├── match_query.rs
    │       │   ├── mod.rs
    │       │   ├── multi_match.rs
    │       │   ├── one_field_map.rs
    │       │   ├── phrase_prefix_query.rs
    │       │   ├── prefix_query.rs
    │       │   ├── query_string_query.rs
    │       │   ├── range_query.rs
    │       │   ├── regex_query.rs
    │       │   ├── string_or_struct.rs
    │       │   ├── term_query.rs
    │       │   ├── terms_query.rs
    │       │   ├── visitor.rs
    │       │   └── wildcard_query.rs
    │       ├── error.rs
    │       ├── json_literal.rs
    │       ├── lib.rs
    │       ├── not_nan_f32.rs
    │       ├── query_ast/
    │       │   ├── bool_query.rs
    │       │   ├── cache_node.rs
    │       │   ├── field_presence.rs
    │       │   ├── full_text_query.rs
    │       │   ├── mod.rs
    │       │   ├── phrase_prefix_query.rs
    │       │   ├── range_query.rs
    │       │   ├── regex_query.rs
    │       │   ├── tantivy_query_ast.rs
    │       │   ├── term_query.rs
    │       │   ├── term_set_query.rs
    │       │   ├── user_input_query.rs
    │       │   ├── utils.rs
    │       │   ├── visitor.rs
    │       │   └── wildcard_query.rs
    │       └── tokenizers/
    │           ├── chinese_compatible.rs
    │           ├── code_tokenizer.rs
    │           ├── mod.rs
    │           └── tokenizer_manager.rs
    ├── quickwit-rest-client/
    │   ├── Cargo.toml
    │   ├── README.md
    │   ├── resources/
    │   │   └── tests/
    │   │       └── documents_to_ingest.json
    │   └── src/
    │       ├── error.rs
    │       ├── lib.rs
    │       ├── models.rs
    │       └── rest_client.rs
    ├── quickwit-search/
    │   ├── Cargo.toml
    │   ├── README.md
    │   └── src/
    │       ├── client.rs
    │       ├── cluster_client.rs
    │       ├── collector.rs
    │       ├── error.rs
    │       ├── fetch_docs.rs
    │       ├── find_trace_ids_collector.rs
    │       ├── invoker.rs
    │       ├── leaf.rs
    │       ├── leaf_cache.rs
    │       ├── lib.rs
    │       ├── list_fields.rs
    │       ├── list_fields_cache.rs
    │       ├── list_terms.rs
    │       ├── metrics.rs
    │       ├── metrics_trackers.rs
    │       ├── retry/
    │       │   ├── mod.rs
    │       │   └── search.rs
    │       ├── root.rs
    │       ├── scroll_context.rs
    │       ├── search_job_placer.rs
    │       ├── search_permit_provider.rs
    │       ├── search_response_rest.rs
    │       ├── service.rs
    │       ├── tests.rs
    │       └── top_k_collector.rs
    ├── quickwit-serve/
    │   ├── Cargo.toml
    │   ├── README.md
    │   ├── build.rs
    │   ├── resources/
    │   │   └── tests/
    │   │       └── jaeger_ui_trace.json
    │   └── src/
    │       ├── build_info.rs
    │       ├── cluster_api/
    │       │   ├── mod.rs
    │       │   └── rest_handler.rs
    │       ├── decompression.rs
    │       ├── delete_task_api/
    │       │   ├── handler.rs
    │       │   └── mod.rs
    │       ├── developer_api/
    │       │   ├── debug.rs
    │       │   ├── heap_prof.rs
    │       │   ├── heap_prof_disabled.rs
    │       │   ├── log_level.rs
    │       │   ├── mod.rs
    │       │   ├── pprof.rs
    │       │   ├── pprof_disabled.rs
    │       │   └── server.rs
    │       ├── elasticsearch_api/
    │       │   ├── bulk.rs
    │       │   ├── bulk_v2.rs
    │       │   ├── filter.rs
    │       │   ├── mod.rs
    │       │   ├── model/
    │       │   │   ├── bulk_body.rs
    │       │   │   ├── bulk_query_params.rs
    │       │   │   ├── cat_indices.rs
    │       │   │   ├── error.rs
    │       │   │   ├── field_capability.rs
    │       │   │   ├── mappings.rs
    │       │   │   ├── mod.rs
    │       │   │   ├── multi_search.rs
    │       │   │   ├── scroll.rs
    │       │   │   ├── search_body.rs
    │       │   │   ├── search_query_params.rs
    │       │   │   ├── search_response.rs
    │       │   │   └── stats.rs
    │       │   └── rest_handler.rs
    │       ├── format.rs
    │       ├── grpc.rs
    │       ├── health_check_api/
    │       │   ├── handler.rs
    │       │   └── mod.rs
    │       ├── index_api/
    │       │   ├── index_resource.rs
    │       │   ├── mod.rs
    │       │   ├── rest_handler.rs
    │       │   ├── source_resource.rs
    │       │   └── split_resource.rs
    │       ├── indexing_api/
    │       │   ├── mod.rs
    │       │   └── rest_handler.rs
    │       ├── ingest_api/
    │       │   ├── mod.rs
    │       │   ├── response.rs
    │       │   └── rest_handler.rs
    │       ├── jaeger_api/
    │       │   ├── mod.rs
    │       │   ├── model.rs
    │       │   ├── parse_duration.rs
    │       │   └── rest_handler.rs
    │       ├── lib.rs
    │       ├── load_shield.rs
    │       ├── metrics.rs
    │       ├── metrics_api.rs
    │       ├── node_info_handler.rs
    │       ├── openapi.rs
    │       ├── otlp_api/
    │       │   ├── mod.rs
    │       │   └── rest_handler.rs
    │       ├── rate_modulator.rs
    │       ├── rest.rs
    │       ├── rest_api_response.rs
    │       ├── search_api/
    │       │   ├── grpc_adapter.rs
    │       │   ├── mod.rs
    │       │   └── rest_handler.rs
    │       ├── simple_list.rs
    │       ├── tcp_listener.rs
    │       ├── template_api/
    │       │   ├── mod.rs
    │       │   └── rest_handler.rs
    │       └── ui_handler.rs
    ├── quickwit-storage/
    │   ├── Cargo.toml
    │   ├── src/
    │   │   ├── bundle_storage.rs
    │   │   ├── cache/
    │   │   │   ├── base_cache.rs
    │   │   │   ├── byte_range_cache.rs
    │   │   │   ├── memory_sized_cache.rs
    │   │   │   ├── mod.rs
    │   │   │   ├── quickwit_cache.rs
    │   │   │   ├── slice_address.rs
    │   │   │   ├── storage_with_cache.rs
    │   │   │   └── stored_item.rs
    │   │   ├── debouncer.rs
    │   │   ├── error.rs
    │   │   ├── file_descriptor_cache.rs
    │   │   ├── lib.rs
    │   │   ├── local_file_storage.rs
    │   │   ├── metrics.rs
    │   │   ├── object_storage/
    │   │   │   ├── azure_blob_storage.rs
    │   │   │   ├── error.rs
    │   │   │   ├── mod.rs
    │   │   │   ├── policy.rs
    │   │   │   ├── s3_compatible_storage.rs
    │   │   │   └── s3_compatible_storage_resolver.rs
    │   │   ├── opendal_storage/
    │   │   │   ├── base.rs
    │   │   │   ├── google_cloud_storage.rs
    │   │   │   └── mod.rs
    │   │   ├── payload.rs
    │   │   ├── prefix_storage.rs
    │   │   ├── ram_storage.rs
    │   │   ├── split.rs
    │   │   ├── split_cache/
    │   │   │   ├── download_task.rs
    │   │   │   ├── mod.rs
    │   │   │   ├── split_table.rs
    │   │   │   └── tests.rs
    │   │   ├── storage.rs
    │   │   ├── storage_factory.rs
    │   │   ├── storage_resolver.rs
    │   │   ├── timeout_and_retry_storage.rs
    │   │   └── versioned_component.rs
    │   └── tests/
    │       ├── azure_storage.rs
    │       ├── google_cloud_storage.rs
    │       └── s3_storage.rs
    ├── quickwit-telemetry/
    │   ├── Cargo.toml
    │   └── src/
    │       ├── lib.rs
    │       ├── payload.rs
    │       ├── sender.rs
    │       └── sink.rs
    ├── quickwit-ui/
    │   ├── .gitignore
    │   ├── .gitignore_for_build_directory
    │   ├── Makefile
    │   ├── README.md
    │   ├── biome.json
    │   ├── build/
    │   │   └── .gitignore
    │   ├── e2e/
    │   │   └── homepage.spec.ts
    │   ├── index.html
    │   ├── jest/
    │   │   └── setup.js
    │   ├── jest.config.js
    │   ├── mocks/
    │   │   ├── monacoMock.js
    │   │   ├── swaggerUIMock.js
    │   │   └── x-charts.js
    │   ├── package.json
    │   ├── playwright.config.ts
    │   ├── public/
    │   │   ├── manifest.json
    │   │   └── robots.txt
    │   ├── src/
    │   │   ├── components/
    │   │   │   ├── ApiUrlFooter.tsx
    │   │   │   ├── IndexSideBar.tsx
    │   │   │   ├── IndexSummary.tsx
    │   │   │   ├── IndexesTable.tsx
    │   │   │   ├── JsonEditor.tsx
    │   │   │   ├── LayoutUtils.tsx
    │   │   │   ├── Loader.tsx
    │   │   │   ├── QueryActionBar.tsx
    │   │   │   ├── QueryEditor/
    │   │   │   │   ├── AggregationEditor.tsx
    │   │   │   │   ├── QueryEditor.tsx
    │   │   │   │   └── config.ts
    │   │   │   ├── ResponseErrorDisplay.tsx
    │   │   │   ├── SearchResult/
    │   │   │   │   ├── AggregationResult.tsx
    │   │   │   │   ├── ResultTable.tsx
    │   │   │   │   ├── Row.tsx
    │   │   │   │   └── SearchResult.tsx
    │   │   │   ├── SideBar.tsx
    │   │   │   ├── TimeRangeSelect.tsx
    │   │   │   └── TopBar.tsx
    │   │   ├── index.css
    │   │   ├── index.test.js
    │   │   ├── index.tsx
    │   │   ├── providers/
    │   │   │   ├── EditorProvider.tsx
    │   │   │   └── LocalStorageProvider.tsx
    │   │   ├── services/
    │   │   │   ├── client.test.ts
    │   │   │   └── client.ts
    │   │   ├── utils/
    │   │   │   ├── SearchComponentProps.ts
    │   │   │   ├── models.ts
    │   │   │   ├── theme.ts
    │   │   │   └── urls.ts
    │   │   └── views/
    │   │       ├── ApiView.tsx
    │   │       ├── App.tsx
    │   │       ├── ClusterView.test.jsx
    │   │       ├── ClusterView.tsx
    │   │       ├── IndexView.test.jsx
    │   │       ├── IndexView.tsx
    │   │       ├── IndexesView.test.jsx
    │   │       ├── IndexesView.tsx
    │   │       ├── NodeInfoView.test.jsx
    │   │       ├── NodeInfoView.tsx
    │   │       ├── SearchView.test.jsx
    │   │       └── SearchView.tsx
    │   ├── tsconfig.json
    │   └── vite.config.ts
    ├── rest-api-tests/
    │   ├── Pipfile
    │   ├── README.md
    │   ├── docker-compose.yaml
    │   ├── run_tests.py
    │   └── scenarii/
    │       ├── aggregations/
    │       │   ├── 0001-aggregations.yaml
    │       │   ├── 0002-doc-len.yaml
    │       │   ├── _ctx.yaml
    │       │   ├── _setup.quickwit.yaml
    │       │   └── _teardown.quickwit.yaml
    │       ├── concat_fields/
    │       │   ├── 0001_concat_field.yaml
    │       │   ├── _ctx.yaml
    │       │   ├── _setup.quickwit.yaml
    │       │   └── _teardown.quickwit.yaml
    │       ├── default_search_fields/
    │       │   ├── 0001_default_fields.yaml
    │       │   ├── 0002_invalid_default_fields.yaml
    │       │   ├── _ctx.yaml
    │       │   ├── _setup.quickwit.yaml
    │       │   └── _teardown.quickwit.yaml
    │       ├── es_compatibility/
    │       │   ├── 0001-noquery.yaml
    │       │   ├── 0002-query_string.yaml
    │       │   ├── 0003-match.yaml
    │       │   ├── 0004-term_aggregations.yaml
    │       │   ├── 0005-query_string_query.yaml
    │       │   ├── 0006-term_query.yaml
    │       │   ├── 0007-range_queries.yaml
    │       │   ├── 0008-sort_by.yaml
    │       │   ├── 0009-bool_query.yaml
    │       │   ├── 0010-match_phrase_prefix_query.yaml
    │       │   ├── 0011-exists-query.yaml
    │       │   ├── 0012-scroll-api.yaml
    │       │   ├── 0013-phrase-query.yaml
    │       │   ├── 0014-multi-match-query.yaml
    │       │   ├── 0015-terms-query.yaml
    │       │   ├── 0016-misc-query.yaml
    │       │   ├── 0017-match-bool-prefix-query.yaml
    │       │   ├── 0018-search_after.yaml
    │       │   ├── 0019-count.yaml
    │       │   ├── 0020-stats.yaml
    │       │   ├── 0021-cat-indices.yaml
    │       │   ├── 0022-source.yaml
    │       │   ├── 0023-extra_filters.yaml
    │       │   ├── 0024-delete_indices.yaml
    │       │   ├── 0025-msearch.yaml
    │       │   ├── 0026-resolve.yaml
    │       │   ├── 0027-cluster-health.yaml
    │       │   ├── 0028-fast_only_field_query.yaml
    │       │   ├── 0029-wildcard.yaml
    │       │   ├── 0030-prefix.yaml
    │       │   ├── 0031-regex.yaml
    │       │   ├── 0032-mappings.yaml
    │       │   ├── _ctx.elasticsearch.yaml
    │       │   ├── _ctx.quickwit.yaml
    │       │   ├── _ctx.yaml
    │       │   ├── _setup.elasticsearch.yaml
    │       │   ├── _setup.quickwit.yaml
    │       │   ├── _teardown.elasticsearch.yaml
    │       │   ├── _teardown.quickwit.yaml
    │       │   ├── bulk/
    │       │   │   ├── 0001-happy-path.yaml
    │       │   │   ├── 0002-malformed-action.yaml
    │       │   │   ├── 0003-validation-failed-index-missing.yaml
    │       │   │   ├── 0004-put-request.yaml
    │       │   │   ├── 0005-document-parsing-exception.yaml
    │       │   │   ├── 0006-partial-index-not-found.yaml
    │       │   │   ├── 0007-illegal-index-name.yaml
    │       │   │   ├── _ctx.elasticsearch.yaml
    │       │   │   ├── _ctx.quickwit.yaml
    │       │   │   ├── _ctx.yaml
    │       │   │   ├── _setup.elasticsearch.yaml
    │       │   │   ├── _setup.quickwit.yaml
    │       │   │   ├── _teardown.elasticsearch.yaml
    │       │   │   └── _teardown.quickwit.yaml
    │       │   └── multi-indices/
    │       │       ├── 0001-muti_indices_query.yaml
    │       │       ├── 0002-muti_indices_scroll.yaml
    │       │       ├── 0003-multi_indices_aggs.yaml
    │       │       ├── 0004-missing_index_query.yaml
    │       │       ├── _ctx.yaml
    │       │       ├── _setup.elasticsearch.yaml
    │       │       ├── _setup.quickwit.yaml
    │       │       ├── _teardown.elasticsearch.yaml
    │       │       └── _teardown.quickwit.yaml
    │       ├── es_compatibility_info/
    │       │   ├── 0001-info.yaml
    │       │   ├── _ctx.elasticsearch.yaml
    │       │   ├── _ctx.quickwit.yaml
    │       │   └── _ctx.yaml
    │       ├── es_field_capabilities/
    │       │   ├── 0001-field-capabilities.yaml
    │       │   ├── _ctx.elasticsearch.yaml
    │       │   ├── _ctx.quickwit.yaml
    │       │   ├── _ctx.yaml
    │       │   ├── _setup.elasticsearch.yaml
    │       │   ├── _setup.quickwit.yaml
    │       │   ├── _teardown.elasticsearch.yaml
    │       │   └── _teardown.quickwit.yaml
    │       ├── multi_splits/
    │       │   ├── 0001-request-optimizations.yaml
    │       │   ├── _ctx.yaml
    │       │   ├── _setup.quickwit.yaml
    │       │   └── _teardown.quickwit.yaml
    │       ├── qw_search_api/
    │       │   ├── 0001_ts_range.yaml
    │       │   ├── 0002_negative_search.yaml
    │       │   ├── 0003_exists_search.yaml
    │       │   ├── 0004_exact_string.yaml
    │       │   ├── 0005_fast_field_search.yaml
    │       │   ├── _ctx.yaml
    │       │   ├── _setup.quickwit.yaml
    │       │   └── _teardown.quickwit.yaml
    │       ├── search_after/
    │       │   ├── 0001-search_after_edge_case.yaml
    │       │   ├── _ctx.yaml
    │       │   ├── _setup.quickwit.yaml
    │       │   └── _teardown.quickwit.yaml
    │       ├── sort_orders/
    │       │   ├── 0001-sort-elasticapi.yaml
    │       │   ├── _ctx.yaml
    │       │   ├── _setup.quickwit.yaml
    │       │   └── _teardown.quickwit.yaml
    │       └── tag_fields/
    │           ├── 0001_allowed_types.yaml
    │           ├── 0002_negative_tags.yaml
    │           ├── _ctx.yaml
    │           ├── _setup.quickwit.yaml
    │           └── _teardown.quickwit.yaml
    ├── rust-toolchain.toml
    ├── rustfmt.toml
    └── scripts/
        ├── about.hbs
        ├── about.toml
        ├── check_license_headers.sh
        ├── check_log_format.sh
        └── dep-tree.py

================================================
FILE CONTENTS
================================================

================================================
FILE: .cargo/config.toml
================================================
[build]
rustflags = ["--cfg", "tokio_unstable"]
rustdocflags = ["--cfg", "tokio_unstable"]

[target.x86_64-unknown-linux-gnu]
# Targeting x86-64-v2 gives a ~2% performance boost while only
# disallowing Intel CPUs older than 2008 and AMD CPUs older than 2011.
# None of those very old CPUs are used in GCP
# (https://cloud.google.com/compute/docs/cpu-platforms). Unfortunately,
# AWS does not seem to disclose the exact CPUs they use.
rustflags = ["-C", "target-cpu=x86-64-v2", "--cfg", "tokio_unstable"]


================================================
FILE: .claude/skills/bump-tantivy/SKILL.md
================================================
---
name: bump-tantivy
description: Bump tantivy to the latest commit on main branch, fix compilation issues, and open a PR
disable-model-invocation: true
---

# Bump Tantivy

Follow these steps to bump tantivy to its latest version:

## Step 1: Check that we are on the main branch

Run: `git branch --show-current`

If the current branch is not `main`, abort and ask the user to switch to the main branch first.

## Step 2: Ensure main is up to date

Run: `git pull origin main`

This ensures we're working from the latest code.

## Step 3: Get the latest tantivy SHA

Run: `gh api repos/quickwit-oss/tantivy/commits/main --jq '.sha'`

Extract the first 7 characters as the short SHA.

## Step 4: Update Cargo.toml

Edit `quickwit/Cargo.toml` and update the `rev` field in the tantivy dependency to the new short SHA.

The line looks like:
```toml
tantivy = { git = "https://github.com/quickwit-oss/tantivy/", rev = "XXXXXXX", ... }
```

## Step 5: Run cargo check and fix compilation errors

Run `cargo check` in the `quickwit` directory to verify compilation.

If there are compilation errors:
- If the fix is straightforward (simple API changes, renames, etc.), fix them without asking
- If the fix is complex or unclear, ask the user before proceeding

Repeat until cargo check passes.

## Step 6: Format code

Run `make fmt` from the `quickwit/` directory to format the code.

## Step 7: Update licenses

Run `make update-licenses` from the `quickwit/` directory, then move the generated file:
```
mv quickwit/LICENSE-3rdparty.csv ./LICENSE-3rdparty.csv
```

## Step 8: Create a new branch

Get the git username: `git config user.name | tr ' ' '-' | tr '[:upper:]' '[:lower:]'`

Get today's date: `date +%Y-%m-%d`

Create and checkout a new branch named: `{username}/bump-tantivy-{date}`

Example: `paul/bump-tantivy-2024-03-15`

## Step 9: Commit changes

Stage all modified files and create a commit with message:
```
Bump tantivy to {short-sha}
```

## Step 10: Push and open a PR

Push the branch and open a PR using:
```
gh pr create --title "Bump tantivy to {short-sha}" --body "Updates tantivy dependency to the latest commit on main."
```

Report the PR URL to the user when complete.


================================================
FILE: .claude/skills/fix-clippy/SKILL.md
================================================
---
name: fix-clippy
description: Fix all clippy lint warnings in the project
---

# Fix Clippy

Clippy issues are **warnings**, not errors. Never grep for `error` when looking for clippy issues.

## Step 1: Auto-fix

Run `make fix` to automatically fix clippy warnings:

```
make fix
```

## Step 2: Fix remaining warnings manually

Check for remaining warnings that couldn't be auto-fixed:

```
cargo clippy --tests 2>&1 | grep "^warning:" | sort -u
```

For each remaining warning, find the exact location and fix it manually.


================================================
FILE: .claude/skills/fmt/SKILL.md
================================================
---
name: fmt
description: Run `make fmt` to check the code format.
---

# Format Check

Run `make fmt` from the `quickwit/` subdirectory to check code formatting:

```
cd /Users/paul.masurel/git/quickwit/quickwit && make fmt
```

This command checks:
1. Rust code formatting
2. License headers
3. Log format policy (no trailing punctuation, no uppercase first character)

If there are log format issues, fix them by:
- Making the first character lowercase
- Removing trailing punctuation (periods, exclamation marks, etc.)

Fix any issues found and re-run until clean.


================================================
FILE: .claude/skills/rationalize-deps/SKILL.md
================================================
---
name: rationalize-deps
description: Analyze Cargo.toml dependencies and attempt to remove unused features to reduce compile times and binary size
---

# Rationalize Dependencies

This skill analyzes Cargo.toml dependencies to identify and remove unused features.

## Overview

Many crates enable features by default that may not be needed. This skill:
1. Identifies dependencies with default features enabled
2. Tests if `default-features = false` works
3. Identifies which specific features are actually needed
4. Verifies compilation after changes

## Step 1: Identify the target

Ask the user which crate(s) to analyze:
- A specific crate name (e.g., "tokio", "serde")
- A specific workspace member (e.g., "quickwit-search")
- "all" to scan the entire workspace

## Step 2: Analyze current dependencies

For the workspace Cargo.toml (`quickwit/Cargo.toml`), list dependencies that:
- Do NOT have `default-features = false`
- Have default features that might be unnecessary

Run: `cargo tree -p <crate> -f "{p} {f}" --edges features` to see what features are actually used.

## Step 3: For each candidate dependency

### 3a: Check the crate's default features

Look up the crate on crates.io or check its Cargo.toml to understand:
- What features are enabled by default
- What each feature provides

Use: `cargo metadata --format-version=1 | jq '.packages[] | select(.name == "<crate>") | .features'`

### 3b: Try disabling default features

Modify the dependency in `quickwit/Cargo.toml`:

From:
```toml
some-crate = { version = "1.0" }
```

To:
```toml
some-crate = { version = "1.0", default-features = false }
```

### 3c: Run cargo check

Run: `cargo check --workspace` (or target specific packages for faster feedback)

If compilation fails:
1. Read the error messages to identify which features are needed
2. Add only the required features explicitly:
   ```toml
   some-crate = { version = "1.0", default-features = false, features = ["needed-feature"] }
   ```
3. Re-run cargo check

### 3d: Binary search for minimal features

If there are many default features, use binary search:
1. Start with no features
2. If it fails, add half the default features
3. Continue until you find the minimal set

## Step 4: Document findings

For each dependency analyzed, report:
- Original configuration
- New configuration (if changed)
- Features that were removed
- Any features that are required

## Step 5: Verify full build

After all changes, run:
```bash
cargo check --workspace --all-targets
cargo test --workspace --no-run
```

## Common Patterns

### Serde
Often only needs `derive`:
```toml
serde = { version = "1.0", default-features = false, features = ["derive", "std"] }
```

### Tokio
Identify which runtime features are actually used:
```toml
tokio = { version = "1.0", default-features = false, features = ["rt-multi-thread", "macros", "sync"] }
```

### Reqwest
Often doesn't need all TLS backends:
```toml
reqwest = { version = "0.11", default-features = false, features = ["rustls-tls", "json"] }
```

## Rollback

If changes cause issues:
```bash
git checkout quickwit/Cargo.toml
cargo check --workspace
```

## Tips

- Start with large crates that have many default features (tokio, reqwest, hyper)
- Use `cargo bloat --crates` to identify large dependencies
- Check `cargo tree -d` for duplicate dependencies that might indicate feature conflicts
- Some features are needed only for tests - consider using `[dev-dependencies]` features


================================================
FILE: .claude/skills/simple-pr/SKILL.md
================================================
---
name: simple-pr
description: Create a simple PR from staged changes with an auto-generated commit message
disable-model-invocation: true
---

# Simple PR

Follow these steps to create a simple PR from staged changes:

## Step 1: Check workspace state

Run: `git status`

Verify that all changes have been staged (no unstaged changes). If there are unstaged changes, abort and ask the user to stage their changes first with `git add`.

Also verify that we are on the `main` branch. If not, abort and ask the user to switch to main first.

## Step 2: Ensure main is up to date

Run: `git pull origin main`

This ensures we're working from the latest code.

## Step 3: Review staged changes

Run: `git diff --cached`

Review the staged changes to understand what the PR will contain.

## Step 4: Generate commit message

Based on the staged changes, generate a concise commit message (1-2 sentences) that describes the "why" rather than the "what".

Display the proposed commit message to the user and ask for confirmation before proceeding.

## Step 5: Create a new branch

Get the git username: `git config user.name | tr ' ' '-' | tr '[:upper:]' '[:lower:]'`

Create a short, descriptive branch name based on the changes (e.g., `fix-typo-in-readme`, `add-retry-logic`, `update-deps`).

Create and checkout the branch: `git checkout -b {username}/{short-descriptive-name}`

## Step 6: Commit changes

Commit with the message from step 3:
```
git commit -m "{commit-message}"
```

## Step 7: Push and open a PR

Push the branch and open a PR:
```
git push -u origin {branch-name}
gh pr create --title "{commit-message-title}" --body "{longer-description-if-needed}"
```

Report the PR URL to the user when complete.


================================================
FILE: .devcontainer/devcontainer.json
================================================
{
    "name": "Quickwit",
    "image": "mcr.microsoft.com/devcontainers/rust:bookworm",
    "customizations": {
        "codespaces": {
            "openFiles": [
                "CONTRIBUTING.md"
            ]
        },
        "vscode": {
            "extensions": [
                "rust-lang.rust-analyzer"
            ]
        }
    },
    "hostRequirements": {
        "cpus": 4,
        "memory": "16gb"
    },
    "runArgs": [
        "--init"
    ],
    "mounts": [
        {
            "source": "/var/run/docker.sock",
            "target": "/var/run/docker.sock",
            "type": "bind"
        }
    ],
    "features": {
        "docker-from-docker": {
            "version": "latest",
            "moby": true
        },
        "ghcr.io/devcontainers/features/node:1": {
            "version": "24"
        },
        "ghcr.io/devcontainers/features/aws-cli:1": {},
        "ghcr.io/devcontainers-contrib/features/protoc:1": {}
    },
    "postCreateCommand": ".devcontainer/post-create.sh"
}


================================================
FILE: .devcontainer/post-create.sh
================================================
#!/bin/bash

# Define success and error color codes
SUCCESS_COLOR="\e[32m"
ERROR_COLOR="\e[31m"
RESET_COLOR="\e[0m"

# Define success tracking variables
rustupToolchainNightlyInstalled=false
cmakeInstalled=false


# Define installation functions

#Installing manually for now until we figure out why "ghcr.io/devcontainers-community/features/cmake": {} is not working
install_cmake() {
    echo -e "Installing CMake..."
    sudo apt-get update
    sudo apt-get install -y cmake > /dev/null 2>&1
    if [[ "$(cmake --version)" =~ "cmake version" ]]; then
        echo -e "${SUCCESS_COLOR}CMake installed successfully.${RESET_COLOR}"
        cmakeInstalled=true
    else
        echo -e "${ERROR_COLOR}CMake installation failed. Please install it manually.${RESET_COLOR}"
    fi
}

install_rustup_toolchain_nightly() {
    echo -e "Installing Rustup nightly toolchain..."
    rustup toolchain install nightly > /dev/null 2>&1
    rustup component add rustfmt --toolchain nightly > /dev/null 2>&1
    if [[ "$(rustup toolchain list)" =~ "nightly" && "$(rustup component list --toolchain nightly | grep rustfmt)" =~ "installed" ]]; then
        echo -e "${SUCCESS_COLOR}Rustup nightly toolchain and rustfmt installed successfully.${RESET_COLOR}"
        rustupToolchainNightlyInstalled=true
    else
        echo -e "${ERROR_COLOR}Rustup nightly toolchain and/or rustfmt installation failed. Please install them manually.${RESET_COLOR}"
    fi
}

# Install tools
install_cmake
install_rustup_toolchain_nightly

# Copy our custom welcome message to replace the default github welcome message
sudo cp .devcontainer/welcome.txt /usr/local/etc/vscode-dev-containers/first-run-notice.txt


# Check the success tracking variables
if $rustupToolchainNightlyInstalled && $cmakeInstalled; then
    echo -e "${SUCCESS_COLOR}All tools installed successfully.${RESET_COLOR}"
else
    echo -e "${ERROR_COLOR}One or more tools failed to install. Please check the output for errors and install the failed tools manually.${RESET_COLOR}"
fi


================================================
FILE: .devcontainer/welcome.txt
================================================
👋 Welcome to the project!
All the necessary tools have already been installed for you 🎉. 
You can go ahead and start hacking! Happy coding💻.

 Here are some useful commands you can run:

🔧 `make test-all` - starts necessary Docker services and runs all tests.
🔧 `make -k test-all docker-compose-down` - the same as above, but tears down the Docker services after running all the tests.
🔧 `make fmt` - runs formatter, this command requires the nightly toolchain to be installed by running `rustup toolchain install nightly`.
🔧 `make fix` - runs formatter and clippy checks.
🔧 `make typos` - runs the spellcheck tool over the codebase. (Install by running `cargo install typos`)
🔧 `make build-docs` - builds docs.
🔧 `make docker-compose-up` - starts Docker services.
🔧 `make docker-compose-down` - stops Docker services.
🔧 `make docker-compose-logs` - shows Docker logs.


================================================
FILE: .dockerignore
================================================
**/*.md
**/*.txt
**/.*
**/build
**/Dockerfile
**/node_modules
**/qwdata
**/target
docs
examples
!.git/
!quickwit-ui/build/.gitignore
!quickwit-ui/.gitignore_for_build_directory


================================================
FILE: .gitattributes
================================================
**/codegen/** linguist-generated


================================================
FILE: .github/ISSUE_TEMPLATE/bug_report.md
================================================
---
name: Bug report
about: Create a report to help us improve
title: ""
labels: bug
assignees: ""
---

**Describe the bug**
A clear and concise description of what the bug is.

**Steps to reproduce (if applicable)**
Steps to reproduce the behavior:

1.
2.

**Expected behavior**
A clear and concise description of what you expected to happen.

**Configuration:**
Please provide:

1. Output of `quickwit --version`
2. The index_config.yaml


================================================
FILE: .github/ISSUE_TEMPLATE/documentation_request.md
================================================
---
name: Documentation request
about: Suggest a documentation enhancement
title: "[Documentation topic]"
labels: documentation
assignees: ""
---

<!--

Hi 👋, thank you for submitting a documentation enhancement to Quickwit!

Don't forget to replace the title of this issue with a short
sentence that describes the topic of your enhancement!

-->

## My documentation idea

Use this section to give a description of what your enhancement is about.

Examples:

> I would like to add how to configure MinIO storage for Quickwit:
>

**What do you all think?**
👍 I would love to see it!
🚀 I would love to help!

Thank you for your request!


================================================
FILE: .github/ISSUE_TEMPLATE/feature_request.md
================================================
---
name: Feature request
about: Suggest an idea for this project
title: ""
labels: enhancement
assignees: ""
---

**Is your feature request related to a problem? Please describe.**
A clear and concise description of what the problem is. Ex. I'm always frustrated when [...]

**Describe the solution you'd like**
A clear and concise description of what you want to happen.

**Describe alternatives you've considered**
A clear and concise description of any alternative solutions or features you've considered.

**Additional context**
Add any other context or information about the feature request here.


================================================
FILE: .github/ISSUE_TEMPLATE/tutorial_request.md
================================================
---
name: Tutorial request
about: Suggest a Quickwit tutorial
title: "[Tutorial topic]"
labels: tutorial
assignees: ""
---

<!--

Hi 👋, thank you for submitting a tutorial to Quickwit!

Don't forget to replace the title of this issue with a short
sentence that describes the topic of your tutorial!

-->

## My tutorial idea

Use this section to give a description of what your tutorial is about.

Examples:

> I would like to write a tutorial that shows how to use Quickwit:
>
> - "for storing traces..."
> - "with Grafana/Jaeger/MinIO..."
> - "for ingesting terabytes per day with Kafka..."

Are there any particular tools, concepts, languages or platforms that readers
will learn about?

**What do you all think?**
👍 I would love to see it!
🚀 I would love to help!

Thank you for your request!


================================================
FILE: .github/PULL_REQUEST_TEMPLATE.md
================================================
### Description

Describe the proposed changes made in this PR.

### How was this PR tested?

Describe how you tested this PR.


================================================
FILE: .github/actions/cargo-build-macos-binary/action.yml
================================================
name: "Build Quickwit binary for macOS"
description: "Build React app and Rust binary for macOS with cargo build."
inputs:
  target:
    description: "Target"
    required: true
  version:
    description: "Binary version"
    required: true
  token:
    description: "GitHub access token"
    required: true
runs:
  using: "composite"
  steps:
    - run: echo "ASSET_FULL_NAME=quickwit-${{ inputs.version }}-${{ inputs.target }}" >> $GITHUB_ENV
      shell: bash
    - uses: actions/setup-node@v3
      with:
        node-version: 24
        cache: "yarn"
        cache-dependency-path: quickwit/quickwit-ui/yarn.lock
    - run: yarn global add node-gyp
      shell: bash
    - run: make build-ui
      shell: bash
    - name: Install protoc
      run: brew install protobuf
      shell: bash
    - name: Install rustup
      shell: bash
      run: curl https://sh.rustup.rs -sSf | sh -s -- --default-toolchain none -y
    - name: Add target ${{ inputs.target }}
      run: rustup target add ${{ inputs.target }}
      shell: bash
      working-directory: ./quickwit
    - name: Retrieve and export commit date, hash, and tags
      run: |
        echo "QW_COMMIT_DATE=$(TZ=UTC0 git log -1 --format=%cd --date=format-local:%Y-%m-%dT%H:%M:%SZ)" >> $GITHUB_ENV
        echo "QW_COMMIT_HASH=$(git rev-parse HEAD)" >> $GITHUB_ENV
        echo "QW_COMMIT_TAGS=$(git tag --points-at HEAD | tr '\n' ',')" >> $GITHUB_ENV
      shell: bash
    - name: Build binary
      run: cargo build --release --features release-macos-feature-vendored-set --target ${{ matrix.target }} --bin quickwit
      shell: bash
      working-directory: ./quickwit
      env:
        QW_COMMIT_DATE: ${{ env.QW_COMMIT_DATE }}
        QW_COMMIT_HASH: ${{ env.QW_COMMIT_HASH }}
        QW_COMMIT_TAGS: ${{ env.QW_COMMIT_TAGS }}
    - name: Bundle archive
      run: |
        make archive BINARY_FILE=quickwit/target/${{ inputs.target }}/release/quickwit \
          BINARY_VERSION=${{ inputs.version }} ARCHIVE_NAME=${{ env.ASSET_FULL_NAME }}
      shell: bash
    - name: Save binary archive for three days
      uses: actions/upload-artifact@v4.4.0
      with:
        name: ${{ env.ASSET_FULL_NAME }}.tar.gz
        path: ./${{ env.ASSET_FULL_NAME }}.tar.gz
        retention-days: 3
    - name: Deploy archive to GitHub release
      uses: quickwit-inc/upload-to-github-release@9b2c40fba23bf8dea05b7d2eece24cbc95d4a190
      env:
        GITHUB_TOKEN: ${{ inputs.token }}
      with:
        file: ${{ env.ASSET_FULL_NAME }}.tar.gz
        overwrite: true
        draft: ${{ inputs.version != 'nightly' }}
        tag_name: ${{ inputs.version }}


================================================
FILE: .github/actions/cross-build-binary/action.yml
================================================
name: "Build Quickwit binary with cargo cross"
description: "Build React app and Rust binary with cargo cross."
inputs:
  target:
    description: "Target"
    required: true
  version:
    description: "Binary version"
    required: true
  token:
    description: "GitHub access token"
    required: true
runs:
  using: "composite"
  steps:
    - run: echo "ASSET_FULL_NAME=quickwit-${{ inputs.version }}-${{ inputs.target }}" >> $GITHUB_ENV
      shell: bash
    - uses: actions/setup-node@v3
      with:
        node-version: 24
        cache: "yarn"
        cache-dependency-path: quickwit/quickwit-ui/yarn.lock
    - run: yarn global add node-gyp
      shell: bash
    - run: make build-ui
      shell: bash
    - name: Install rustup
      shell: bash
      run: curl https://sh.rustup.rs -sSf | sh -s -- --default-toolchain none -y
    - name: Install cross
      run: cargo install cross
      shell: bash
    - name: Retrieve and export commit date, hash, and tags
      run: |
        echo "QW_COMMIT_DATE=$(TZ=UTC0 git log -1 --format=%cd --date=format-local:%Y-%m-%dT%H:%M:%SZ)" >> $GITHUB_ENV
        echo "QW_COMMIT_HASH=$(git rev-parse HEAD)" >> $GITHUB_ENV
        echo "QW_COMMIT_TAGS=$(git tag --points-at HEAD | tr '\n' ',')" >> $GITHUB_ENV
      shell: bash
    - name: Build Quickwit
      run: cross build --release --features release-feature-vendored-set --target ${{ inputs.target }} --bin quickwit
      shell: bash
      env:
        QW_COMMIT_DATE: ${{ env.QW_COMMIT_DATE }}
        QW_COMMIT_HASH: ${{ env.QW_COMMIT_HASH }}
        QW_COMMIT_TAGS: ${{ env.QW_COMMIT_TAGS }}
      working-directory: ./quickwit
    - name: Bundle archive
      run: |
        make archive BINARY_FILE=quickwit/target/${{ inputs.target }}/release/quickwit \
          BINARY_VERSION=${{ inputs.version }} ARCHIVE_NAME=${{ env.ASSET_FULL_NAME }}
      shell: bash
    - name: Save binary archive for three days
      uses: actions/upload-artifact@v4.4.0
      with:
        name: ${{ env.ASSET_FULL_NAME }}.tar.gz
        path: ./${{ env.ASSET_FULL_NAME }}.tar.gz
        retention-days: 3
    - name: Upload archive
      uses: quickwit-inc/upload-to-github-release@9b2c40fba23bf8dea05b7d2eece24cbc95d4a190
      env:
        GITHUB_TOKEN: ${{ inputs.token }}
      with:
        file: ${{ env.ASSET_FULL_NAME }}.tar.gz
        overwrite: true
        draft: ${{ inputs.version != 'nightly' }}
        tag_name: ${{ inputs.version }}


================================================
FILE: .github/dependabot.yml
================================================
version: 2
updates:
  # Rust dependencies
  - package-ecosystem: cargo
    directory: "/quickwit"
    schedule:
      interval: "monthly"
    groups:
      rust-dependencies:
        patterns:
          - "*"
    open-pull-requests-limit: 10
    ignore:
      - dependency-name: "*"
        update-types: ["version-update:semver-patch"]

  # Docker dependencies
  - package-ecosystem: docker
    directory: "/"
    schedule:
      interval: "monthly"
    open-pull-requests-limit: 10

  # GitHub Actions
  - package-ecosystem: github-actions
    directory: "/"
    schedule:
      interval: "monthly"
    groups:
      github-actions:
        patterns:
          - "*"
    open-pull-requests-limit: 10

  # NPM dependencies
  - package-ecosystem: npm
    directory: "/"
    schedule:
      interval: "monthly"
    groups:
      npm-dependencies:
        patterns:
          - "*"
    open-pull-requests-limit: 10


================================================
FILE: .github/workflows/ci.yml
================================================
name: CI

on:
  workflow_dispatch:
  pull_request:
  push:
    branches:
      - main
      - trigger-ci-workflow
    paths:
      - "quickwit/**"
      - "!quickwit/quickwit-ui/**"

permissions:
  contents: read

env:
  CARGO_INCREMENTAL: 0
  QW_DISABLE_TELEMETRY: 1
  QW_TEST_DATABASE_URL: postgres://quickwit-dev:quickwit-dev@localhost:5432/quickwit-metastore-dev
  RUST_BACKTRACE: 1
  RUSTDOCFLAGS: -Dwarnings -Arustdoc::private_intra_doc_links
  RUSTFLAGS: -Dwarnings --cfg tokio_unstable

# Ensures that we cancel running jobs for the same PR / same workflow.
concurrency:
  group: ${{ github.workflow }}-${{ github.event.pull_request.number || github.ref }}
  cancel-in-progress: true

jobs:
  tests:
    name: Unit tests
    runs-on: "ubuntu-latest"
    timeout-minutes: 60
    permissions:
      contents: read
      actions: write
    services:
      # PostgreSQL service container
      postgres:
        image: postgres:latest
        ports:
          - 5432:5432
        env:
          POSTGRES_USER: quickwit-dev
          POSTGRES_PASSWORD: quickwit-dev
          POSTGRES_DB: quickwit-metastore-dev
        # Set health checks to wait until postgres has started
        options: >-
          --health-cmd pg_isready
          --health-interval 10s
          --health-timeout 5s
          --health-retries 5
    steps:
      - name: Cleanup Disk Space
        run: |
          df -h

          if [ "$(df -BG / | awk 'NR==2 {gsub("G","",$4); print $4}')" -lt 30 ]; then
            echo "Less than 30GiB available. Running cleanup..."
            sudo rm -rf /usr/share/dotnet
            sudo rm -rf /usr/local/lib/android
            sudo rm -rf /usr/share/swift
            sudo rm -rf /usr/local/.ghcup
            sudo rm -rf /opt/hostedtoolcache/CodeQL
            df -h
          else
            echo "30GiB or more available. Skipping cleanup."
          fi

      - uses: actions/checkout@8e8c483db84b4bee98b60c0593521ed34d9990e8 # v6.0.1
      - name: Install Ubuntu packages
        run: |
          sudo apt-get update
          sudo apt-get -y install protobuf-compiler
      - uses: actions/setup-python@83679a892e2d95755f2dac6acb0bfd1e9ac5d548 # v.6.1.0
        with:
          python-version: '3.11'
      - uses: dorny/paths-filter@de90cc6fb38fc0963ad72b210f1f284cd68cea36 # v3.0.2
        id: modified
        with:
          filters: |
            rust_src:
              - quickwit/**/*.rs
              - quickwit/**/*.toml
              - quickwit/**/*.proto
              - quickwit/rest-api-tests/**
              - .github/workflows/ci.yml
      - name: Setup stable Rust Toolchain
        if: steps.modified.outputs.rust_src == 'true'
        uses: dtolnay/rust-toolchain@f7ccc83f9ed1e5b9c81d8a67d7ad1a747e22a561 # master
        with:
          toolchain: stable
      - name: Setup cache
        uses: Swatinem/rust-cache@779680da715d629ac1d338a641029a2f4372abb5 # v2.8.2
        if: steps.modified.outputs.rust_src == 'true'
        with:
          workspaces: "./quickwit -> target"
          shared-key: "quickwit-cargo"
      - name: Install nextest
        if: always() && steps.modified.outputs.rust_src == 'true'
        uses: taiki-e/install-action@aba36d755ec7ca22d38b12111787c26115943952
        with:
          tool: cargo-nextest
      - name: cargo build
        if: always() && steps.modified.outputs.rust_src == 'true'
        run: cargo build --features=postgres --tests --bin quickwit
        working-directory: ./quickwit
      - name: cargo nextest
        if: always() && steps.modified.outputs.rust_src == 'true'
        run: cargo nextest run --features=postgres --retries 1
        working-directory: ./quickwit
      - name: Install python packages
        if: always() && steps.modified.outputs.rust_src == 'true'
        run: |
          pip install --user --require-hashes -r ${{ github.workspace }}/.github/workflows/requirements.txt
          pipenv install --deploy --ignore-pipfile
        working-directory: ./quickwit/rest-api-tests
      - name: Run REST API tests
        if: always() && steps.modified.outputs.rust_src == 'true'
        run: pipenv run python3 ./run_tests.py --binary ../target/debug/quickwit
        working-directory: ./quickwit/rest-api-tests

  lints:
    name: Lints
    runs-on: "ubuntu-latest"
    timeout-minutes: 60
    permissions:
      contents: read
      actions: write
    steps:
      - uses: actions/checkout@8e8c483db84b4bee98b60c0593521ed34d9990e8 # v6.0.1
      - uses: dorny/paths-filter@de90cc6fb38fc0963ad72b210f1f284cd68cea36 # v3.0.2
        id: modified
        with:
          filters: |
            rust_src:
              - quickwit/**/*.rs
              - quickwit/**/*.toml
              - quickwit/**/*.proto
              - .github/workflows/ci.yml
      - name: Install Ubuntu packages
        if: always() && steps.modified.outputs.rust_src == 'true'
        run: |
          sudo apt-get update
          sudo apt-get -y install protobuf-compiler
      - name: Setup nightly Rust Toolchain (for rustfmt)
        if: steps.modified.outputs.rust_src == 'true'
        uses: dtolnay/rust-toolchain@f7ccc83f9ed1e5b9c81d8a67d7ad1a747e22a561 # master
        with:
          toolchain: nightly
          components: rustfmt
      - name: Setup stable Rust Toolchain
        if: steps.modified.outputs.rust_src == 'true'
        uses: dtolnay/rust-toolchain@f7ccc83f9ed1e5b9c81d8a67d7ad1a747e22a561 # master
        with:
          toolchain: stable
      - name: Setup cache
        if: steps.modified.outputs.rust_src == 'true'
        uses: Swatinem/rust-cache@779680da715d629ac1d338a641029a2f4372abb5 # v2.8.2
        with:
          workspaces: "./quickwit -> target"
          shared-key: "quickwit-cargo"
      - name: Install cargo deny
        if: always() && steps.modified.outputs.rust_src == 'true'
        uses: taiki-e/cache-cargo-install-action@34ce5120836e5f9f1508d8713d7fdea0e8facd6f # v3.0.1
        with:
          # 0.18 requires rustc 1.85
          tool: cargo-deny@0.17.0
      - name: Install cargo machete
        if: always() && steps.modified.outputs.rust_src == 'true'
        uses: taiki-e/cache-cargo-install-action@34ce5120836e5f9f1508d8713d7fdea0e8facd6f # v3.0.1
        with:
          tool: cargo-machete
      - name: cargo clippy
        if: always() && steps.modified.outputs.rust_src == 'true'
        run: cargo clippy --workspace --tests --all-features
        working-directory: ./quickwit
      - name: cargo deny
        if: always() && steps.modified.outputs.rust_src == 'true'
        run: cargo deny check licenses
        working-directory: ./quickwit
      - name: cargo machete
        if: always() && steps.modified.outputs.rust_src == 'true'
        run: cargo machete
        working-directory: ./quickwit
      - name: cargo doc
        if: always() && steps.modified.outputs.rust_src == 'true'
        run: cargo doc --no-deps
        working-directory: ./quickwit
      - name: License headers check
        if: always()
        run: bash scripts/check_license_headers.sh
        working-directory: ./quickwit
      - name: rustfmt
        if: always() && steps.modified.outputs.rust_src == 'true'
        run: cargo +nightly fmt --all -- --check
        working-directory: ./quickwit

  thirdparty-license:
    name: Check Datadog third-party license file
    runs-on: ubuntu-latest
    permissions:
      contents: read
      actions: write
    steps:
      - uses: actions/checkout@8e8c483db84b4bee98b60c0593521ed34d9990e8 # v6.0.1
      - name: Install Rust toolchain
        uses: dtolnay/rust-toolchain@f7ccc83f9ed1e5b9c81d8a67d7ad1a747e22a561 # master
        with:
          toolchain: stable

      - name: Cache cargo tools
        uses: actions/cache@9255dc7a253b0ccc959486e2bca901246202afeb # v5.0.1
        with:
          path: ~/.cargo/bin
          key: ${{ runner.os }}-cargo-tools-${{ hashFiles('**/Cargo.lock') }}

      - name: Install dd-rust-license-tool
        run: dd-rust-license-tool --help || cargo install --git https://github.com/DataDog/rust-license-tool.git --force

      - name: Check Datadog third-party license file
        run: dd-rust-license-tool --config quickwit/license-tool.toml --manifest-path quickwit/Cargo.toml check


================================================
FILE: .github/workflows/coverage.yml
================================================
name: Code coverage

on:
  workflow_dispatch:
  push:
    branches:
      - main
      - trigger-coverage-workflow
    paths:
      - quickwit/Cargo.toml
      - quickwit/Cargo.lock
      - quickwit/quickwit-*/**

permissions:
  contents: read

env:
  AWS_REGION: us-east-1
  AWS_ACCESS_KEY_ID: "placeholder"
  AWS_SECRET_ACCESS_KEY: "placeholder"
  CARGO_INCREMENTAL: 0
  PUBSUB_EMULATOR_HOST: "localhost:8681"
  QW_DISABLE_TELEMETRY: 1
  QW_S3_ENDPOINT: "http://localhost:4566" # Services are exposed as localhost because we are not running coverage in a container.
  QW_S3_FORCE_PATH_STYLE_ACCESS: 1
  QW_TEST_DATABASE_URL: postgres://quickwit-dev:quickwit-dev@localhost:5432/quickwit-metastore-dev
  RUSTFLAGS: -Dwarnings --cfg tokio_unstable

jobs:
  test:
    name: Coverage
    runs-on: gh-ubuntu-arm64
    timeout-minutes: 40
    permissions:
      contents: read
      actions: write
    # Setting a containing will require to fix the QW_S3_ENDPOINT to http://localstack:4566
    services:
      localstack:
        image: localstack/localstack:latest
        ports:
          - "4566:4566"
          - "4571:4571"
          - "8080:8080"
        env:
          SERVICES: kinesis,s3,sqs
        options: >-
          --health-cmd "curl -k https://localhost:4566"
          --health-interval 10s
          --health-timeout 5s
          --health-retries 5

      postgres:
        image: postgres:latest
        ports:
          - "5432:5432"
        env:
          POSTGRES_USER: quickwit-dev
          POSTGRES_PASSWORD: quickwit-dev
          POSTGRES_DB: quickwit-metastore-dev
        options: >-
          --health-cmd pg_isready
          --health-interval 10s
          --health-timeout 5s
          --health-retries 5

      kafka-broker:
        image: confluentinc/confluent-local:7.4.11
        ports:
          - "9092:9092"
          - "9101:9101"
        env:
          # Mode KRaft (Single Node)
          KAFKA_NODE_ID: 1
          KAFKA_PROCESS_ROLES: 'broker,controller'
          KAFKA_CONTROLLER_QUORUM_VOTERS: '1@localhost:9093'
          KAFKA_LOG4J_LOGGERS: "org.apache.kafka.image.loader.MetadataLoader=WARN"

          # Listeners
          KAFKA_LISTENER_SECURITY_PROTOCOL_MAP: 'CONTROLLER:PLAINTEXT,EXTERNAL:PLAINTEXT'
          KAFKA_LISTENERS: 'EXTERNAL://0.0.0.0:9092,CONTROLLER://0.0.0.0:9093'
          KAFKA_ADVERTISED_LISTENERS: 'EXTERNAL://localhost:9092'
          KAFKA_CONTROLLER_LISTENER_NAMES: 'CONTROLLER'
          KAFKA_INTER_BROKER_LISTENER_NAME: 'EXTERNAL'

          # Configuration simplifiée
          KAFKA_OFFSETS_TOPIC_REPLICATION_FACTOR: 1
          KAFKA_GROUP_INITIAL_REBALANCE_DELAY_MS: 0
          KAFKA_TRANSACTION_STATE_LOG_REPLICATION_FACTOR: 1
          KAFKA_TRANSACTION_STATE_LOG_MIN_ISR: 1

          # ID du Cluster (Nécessaire pour KRaft)
          CLUSTER_ID: 'MkU3OEVBNTcwNTJENDM2Qk'

          KAFKA_HEAP_OPTS: -Xms256M -Xmx256M

        options: >-
          --health-cmd "ub kafka-ready -b localhost:9092 1 5"
          --health-interval 10s
          --health-timeout 5s
          --health-retries 5

      gcp-pubsub-emulator:
        image: thekevjames/gcloud-pubsub-emulator:550.0.0
        ports:
          - "8681:8681"
        env:
          PUBSUB_PROJECT1: "quickwit-emulator,emulator_topic:emulator_subscription"

    steps:
      - uses: actions/checkout@8e8c483db84b4bee98b60c0593521ed34d9990e8 # v6.0.1

      - name: Install lib libsasl2
        run: |
          sudo apt update
          sudo apt install libsasl2-dev
          sudo apt install libsasl2-2

      - uses: actions/setup-python@83679a892e2d95755f2dac6acb0bfd1e9ac5d548 # v.6.1.0
        with:
          python-version: '3.11'

      - uses: actions/cache@9255dc7a253b0ccc959486e2bca901246202afeb # v5.0.1
        with:
          path: |
            ~/.cargo/git
            ~/.cargo/registry
          key: ${{ runner.os }}-cargo-test-${{ hashFiles('Cargo.lock') }}
          restore-keys: |
            ${{ runner.os }}-cargo-test-${{ hashFiles('Cargo.lock') }}
            ${{ runner.os }}-cargo-test

      - name: Install python packages
        run: |
          pip install --user --require-hashes -r ${{ github.workspace }}/.github/workflows/requirements.txt
          pipenv install --deploy --ignore-pipfile
        working-directory: ./quickwit/quickwit-cli/tests

      - name: Prepare LocalStack S3
        run: pipenv run ./prepare_tests.sh
        working-directory: ./quickwit/quickwit-cli/tests

      # GitHub Actions does not allow services to be started with a custom command,
      # so we are running Azurite as a container manually.
      - name: Run Azurite service
        run: DOCKER_SERVICES=azurite make docker-compose-up

      # GitHub Actions does not allow services to be started with a custom command,
      # so we are running fake gcs server as a container manually.
      - name: Run Fake GCS Server service
        run: DOCKER_SERVICES=fake-gcs-server make docker-compose-up

      - name: Run Pulsar service
        run: DOCKER_SERVICES=pulsar make docker-compose-up

      - name: Install Rust
        run: rustup update stable

      - name: Install cargo-llvm-cov, cargo-nextest, and protoc
        uses: taiki-e/install-action@90558ad1e179036f31467972b00dec6cb80701fa # v2.66.3
        with:
          tool: cargo-llvm-cov,nextest,protoc

      # We limit the number of jobs to 4 to avoid OOM errors when linking the binary.
      - name: Generate code coverage
        run: |
          cargo llvm-cov clean --workspace
          cargo llvm-cov nextest --no-report --test failpoints --features fail/failpoints --retries 4
          # increase stack size for test_all_with_s3_localstack_cli, see quickwit#4963
          RUST_MIN_STACK=67108864 CARGO_BUILD_JOBS=4 cargo llvm-cov nextest --no-report --all-features --retries 4
          cargo llvm-cov report --lcov --output-path lcov.info
        working-directory: ./quickwit

      - name: Upload coverage to Codecov
        uses: codecov/codecov-action@671740ac38dd9b0130fbe1cec585b89eea48d3de # v5.5.2
        with:
          token: ${{ secrets.CODECOV_TOKEN }} # not required for public repos
          files: ./quickwit/lcov.info

  on-failure:
    if: ${{ github.repository_owner == 'quickwit-oss' && failure() }}
    name: On Failure
    needs: [test]
    runs-on: ubuntu-latest
    steps:
      - name: Send Message
        uses: sarisia/actions-status-discord@eb045afee445dc055c18d3d90bd0f244fd062708 # v1.16.0
        with:
          webhook: ${{ secrets.DISCORD_WEBHOOK }}
          nodetail: true
          color: "#FF0000"
          title: ""
          description: |
            ### ❌ [${{ github.event.pull_request.title }}](${{ github.event.pull_request.html_url }})

            @${{ github.actor }} quickwit coverage CI failed on your PR.

            Coverage CI contains tests that are not running in the regular CI because they are too lengthy.
            For this reason it is possible for it to break even if the tests were passing on your PR.
            This is not a catastrophy, but you are responsible for fixing it!

            You can run the full test suite locally with `make test-all`.

            Please report in this channel that you are working on it/fixed it/or if it is a flaky test/
            or if you need help.

            **[View logs](https://github.com/${{ github.repository }}/actions/runs/${{ github.run_id }})**


================================================
FILE: .github/workflows/dependency.yml
================================================
name: "Dependency Review"
on: [pull_request]

permissions:
  contents: read

# Ensures that we cancel running jobs for the same PR / same workflow.
concurrency:
  group: ${{ github.workflow }}-${{ github.event.pull_request.number || github.ref }}
  cancel-in-progress: true

jobs:
  dependency-review:
    runs-on: ubuntu-latest
    steps:
      - name: "Checkout Repository"
        uses: actions/checkout@8e8c483db84b4bee98b60c0593521ed34d9990e8 # v6.0.1
      - name: "Dependency Review"
        uses: actions/dependency-review-action@98884d411b0f1c583e5ee579e7e897d4623019c2 # v4.8.1
        with:
          # This is an minor vuln on the rsa crate, used for
          # google storage.
          allow-ghsas: GHSA-c38w-74pg-36hr,GHSA-4grx-2x9w-596c


================================================
FILE: .github/workflows/publish_cross_images.yml
================================================
name: Publish custom cross images

on:
  workflow_dispatch:
  push:
    branches:
      - main
    paths:
      - "build/cross-images/**"

permissions:
  contents: read

jobs:
  build-cross-images:
    name: Publish cross images
    runs-on: ubuntu-latest
    environment:
        name: production
    steps:
      - name: Check out the repo
        uses: actions/checkout@8e8c483db84b4bee98b60c0593521ed34d9990e8 # v6.0.1
      - name: Log in to Docker Hub
        uses: docker/login-action@5e57cd118135c172c3672efd75eb46360885c0ef # v3.6.0
        with:
          username: ${{ secrets.DOCKERHUB_USERNAME }}
          password: ${{ secrets.DOCKERHUB_ACCESS_TOKEN }}
      - name: Build and push cross images
        run: make cross-images


================================================
FILE: .github/workflows/publish_docker_images.yml
================================================
name: Build and publish Docker images

on:
  workflow_dispatch:
  push:
    branches:
      - main
      - release-0.9
    paths:
      - "quickwit/**"
    tags:
      - airmail
      - happy-plazza
      - qw*
      - v*

permissions:
  contents: read

env:
  REGISTRY_IMAGE: quickwit/quickwit

jobs:
  docker:
    strategy:
      matrix:
        include:
          - os: ubuntu-latest
            platform: linux/amd64
            platform_suffix: amd64
          - os: gh-ubuntu-arm64
            platform: linux/arm64
            platform_suffix: arm64
    runs-on: ${{ matrix.os }}
    permissions:
      contents: read
      actions: write
    environment:
      name: production
    steps:
      - name: Cleanup Disk Space
        run: |
          df -h
          sudo rm -rf /opt/hostedtoolcache/CodeQL
          sudo rm -rf /usr/local/.ghcup
          sudo rm -rf /usr/local/lib/android
          sudo rm -rf /usr/share/dotnet
          sudo rm -rf /usr/share/swift
          df -h

      - name: Checkout
        uses: actions/checkout@8e8c483db84b4bee98b60c0593521ed34d9990e8 # v6.0.1

      - name: Login to Docker Hub
        uses: docker/login-action@5e57cd118135c172c3672efd75eb46360885c0ef # v3.6.0
        with:
          username: ${{ secrets.DOCKERHUB_USERNAME }}
          password: ${{ secrets.DOCKERHUB_ACCESS_TOKEN }}

      - name: Set up QEMU
        uses: docker/setup-qemu-action@c7c53464625b32c7a7e944ae62b3e17d2b600130 # v3.7.0

      - name: Set up Docker Buildx
        uses: docker/setup-buildx-action@8d2750c68a42422c14e847fe6c8ac0403b4cbd6f # v3.12.0

      - name: Docker meta
        id: meta
        uses: docker/metadata-action@c299e40c65443455700f0fdfc63efafe5b349051 # v5.10.0
        with:
          images: |
            ${{ env.REGISTRY_IMAGE }}
          labels: |
            org.opencontainers.image.title=Quickwit
            maintainer=Quickwit, Inc. <hello@quickwit.io>
            org.opencontainers.image.vendor=Quickwit, Inc.
            org.opencontainers.image.licenses=Apache-2.0

      - name: Retrieve commit date, hash, and tags
        run: |
          echo "QW_COMMIT_DATE=$(TZ=UTC0 git log -1 --format=%cd --date=format-local:%Y-%m-%dT%H:%M:%SZ)" >> $GITHUB_ENV
          echo "QW_COMMIT_HASH=$(git rev-parse HEAD)" >> $GITHUB_ENV
          echo "QW_COMMIT_TAGS=$(git tag --points-at HEAD | tr '\n' ',')" >> $GITHUB_ENV
          if [[ "${{ github.event_name }}" == "push" && "${{ github.ref_type }}" == "tag" && "${GITHUB_REF#refs/tags/}" == *"jemprof"* ]]; then
            echo "CARGO_FEATURES=release-jemalloc-profiled" >> $GITHUB_ENV
          else
            echo "CARGO_FEATURES=release-feature-set" >> $GITHUB_ENV
          fi

      - name: Build and push image
        uses: docker/build-push-action@263435318d21b8e681c14492fe198d362a7d2c83 # v6.18.0
        id: build
        with:
          context: .
          platforms: ${{ matrix.platform }}
          build-args: |
            QW_COMMIT_DATE=${{ env.QW_COMMIT_DATE }}
            QW_COMMIT_HASH=${{ env.QW_COMMIT_HASH }}
            QW_COMMIT_TAGS=${{ env.QW_COMMIT_TAGS }}
            CARGO_FEATURES=${{ env.CARGO_FEATURES }}
          labels: ${{ steps.meta.outputs.labels }}
          outputs: type=image,name=${{ env.REGISTRY_IMAGE }},push-by-digest=true,name-canonical=true,push=true

      - name: Export digest
        run: |
          mkdir -p /tmp/digests
          digest="${{ steps.build.outputs.digest }}"
          touch "/tmp/digests/${digest#sha256:}"

      - name: Upload digest
        uses: actions/upload-artifact@b7c566a772e6b6bfb58ed0dc250532a479d7789f # v6.0.0
        with:
          name: digest-${{ matrix.platform_suffix }}
          path: /tmp/digests/*
          if-no-files-found: error
          retention-days: 1

  merge:
    runs-on: ubuntu-latest
    needs: [docker]
    permissions:
      contents: read
      actions: read
    environment: production
    steps:
      - name: Download digests
        uses: actions/download-artifact@37930b1c2abaa49bbe596cd826c3c89aef350131 # v7.0.0
        with:
          pattern: digest-*
          path: /tmp/digests
          merge-multiple: true

      - name: Set up Docker Buildx
        uses: docker/setup-buildx-action@8d2750c68a42422c14e847fe6c8ac0403b4cbd6f # v3.12.0

      - name: Docker meta
        id: meta
        uses: docker/metadata-action@c299e40c65443455700f0fdfc63efafe5b349051 # v5.10.0
        with:
          images: ${{ env.REGISTRY_IMAGE }}
          flavor: |
            latest=false
          tags: |
            type=edge,branch=main
            type=edge,branch=main,suffix=-slim-bookworm
            type=semver,pattern={{version}}
            type=semver,pattern={{version}},value=latest
            type=semver,pattern={{version}},suffix=-slim-bookworm
            type=ref,event=tag
            type=raw,value=v0.9.0-rc,enable=${{ github.ref == 'refs/heads/release-0.9' }}
      - name: Login to Docker Hub
        uses: docker/login-action@5e57cd118135c172c3672efd75eb46360885c0ef # v3.6.0
        with:
          username: ${{ secrets.DOCKERHUB_USERNAME }}
          password: ${{ secrets.DOCKERHUB_ACCESS_TOKEN }}
      - name: Create manifest list and push tags
        working-directory: /tmp/digests
        run: |
          docker buildx imagetools create $(jq -cr '.tags | map("-t " + .) | join(" ")' <<< "$DOCKER_METADATA_OUTPUT_JSON") \
            $(printf '${{ env.REGISTRY_IMAGE }}@sha256:%s ' *)
      - name: Inspect image
        run: |
          docker buildx imagetools inspect ${{ env.REGISTRY_IMAGE }}:${{ steps.meta.outputs.version }}


================================================
FILE: .github/workflows/publish_lambda.yaml
================================================
# This workflow creates a new release for a quickwit search aws lambda.
# The artifact is a zip file containing a binary for ARM 64,
# ready to be deployed by the deployer.
#
# See quickwit-lambda-client/README.md
name: Release Lambda binary

on:
  push:
    tags:
      - 'lambda-*'
  workflow_dispatch:
    inputs:
      version:
        description: 'Version tag (e.g., v0.8.0)'
        required: false
        default: 'dev'

permissions:
  contents: read

jobs:
  build-lambda:
    name: Build Lambda ARM64
    runs-on: ubuntu-latest
    permissions:
      contents: write
      actions: write
    steps:
      - uses: actions/checkout@8e8c483db84b4bee98b60c0593521ed34d9990e8 # v6.0.1

      - name: Set version
        run: |
          if [ "${{ github.ref_type }}" = "tag" ]; then
            # Extract version from tag (e.g., lambda-v0.8.0 -> v0.8.0)
            echo "ASSET_VERSION=${GITHUB_REF_NAME#lambda-}" >> $GITHUB_ENV
          elif [ -n "${{ github.event.inputs.version }}" ] && [ "${{ github.event.inputs.version }}" != "dev" ]; then
            echo "ASSET_VERSION=${{ github.event.inputs.version }}" >> $GITHUB_ENV
          else
            echo "ASSET_VERSION=dev-$(git rev-parse --short HEAD)" >> $GITHUB_ENV
          fi

      - name: Install rustup
        run: curl https://sh.rustup.rs -sSf | sh -s -- --default-toolchain none -y

      - name: Install cross
        run: cargo install cross

      - name: Retrieve and export commit date, hash, and tags
        run: |
          echo "QW_COMMIT_DATE=$(TZ=UTC0 git log -1 --format=%cd --date=format-local:%Y-%m-%dT%H:%M:%SZ)" >> $GITHUB_ENV
          echo "QW_COMMIT_HASH=$(git rev-parse HEAD)" >> $GITHUB_ENV
          echo "QW_COMMIT_TAGS=$(git tag --points-at HEAD | tr '\n' ',')" >> $GITHUB_ENV

      - name: Build Lambda binary
        run: cross build --release --features lambda-release --target aarch64-unknown-linux-gnu -p quickwit-lambda-server --bin quickwit-aws-lambda-leaf-search
        env:
          QW_COMMIT_DATE: ${{ env.QW_COMMIT_DATE }}
          QW_COMMIT_HASH: ${{ env.QW_COMMIT_HASH }}
          QW_COMMIT_TAGS: ${{ env.QW_COMMIT_TAGS }}
        working-directory: ./quickwit

      - name: Create Lambda zip
        run: |
          cd quickwit/target/aarch64-unknown-linux-gnu/release
          cp quickwit-aws-lambda-leaf-search bootstrap
          zip quickwit-aws-lambda-${{ env.ASSET_VERSION }}-aarch64.zip bootstrap
          mv quickwit-aws-lambda-${{ env.ASSET_VERSION }}-aarch64.zip ../../../../

      - name: Upload to GitHub release
        uses: quickwit-inc/upload-to-github-release@9b2c40fba23bf8dea05b7d2eece24cbc95d4a190
        env:
          GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }}
        with:
          file: quickwit-aws-lambda-${{ env.ASSET_VERSION }}-aarch64.zip
          overwrite: true
          draft: true
          tag_name: ${{ env.ASSET_VERSION }}


================================================
FILE: .github/workflows/publish_nightly_packages.yml
================================================
name: Build and publish nightly packages

on:
  workflow_dispatch:
  schedule:
    - cron: "0 5 * * *"

permissions:
  contents: read

jobs:
  build-macos-binaries:
    name: Build ${{ matrix.target }}
    runs-on: macos-latest
    permissions:
      contents: write
      actions: write
    strategy:
      fail-fast: false
      matrix:
        target: [x86_64-apple-darwin, aarch64-apple-darwin]
    steps:
      - uses: actions/checkout@8e8c483db84b4bee98b60c0593521ed34d9990e8 # v6.0.1
      - uses: ./.github/actions/cargo-build-macos-binary
        with:
          target: ${{ matrix.target }}
          version: nightly
          token: ${{ secrets.GITHUB_TOKEN }}
  build-linux-binaries:
    strategy:
      fail-fast: false
      matrix:
        target: [x86_64-unknown-linux-gnu, aarch64-unknown-linux-gnu]
    name: Build ${{ matrix.target }}
    runs-on: ubuntu-latest
    permissions:
      contents: write
      actions: write
    steps:
      - uses: actions/checkout@8e8c483db84b4bee98b60c0593521ed34d9990e8 # v6.0.1
      - uses: ./.github/actions/cross-build-binary
        with:
          target: ${{ matrix.target }}
          version: nightly
          token: ${{ secrets.GITHUB_TOKEN }}


================================================
FILE: .github/workflows/publish_release_packages.yml
================================================
name: Build and publish release packages

on:
  push:
    tags:
      - "v*"

permissions:
  contents: read

jobs:
  build-macos-binaries:
    name: Build ${{ matrix.target }}
    runs-on: macos-latest
    permissions:
      contents: write
      actions: write
    strategy:
      matrix:
        target: [x86_64-apple-darwin, aarch64-apple-darwin]

    steps:
      - uses: actions/checkout@8e8c483db84b4bee98b60c0593521ed34d9990e8 # v6.0.1
      - name: Extract asset version
        run: echo "ASSET_VERSION=${GITHUB_REF/refs\/tags\//}" >> $GITHUB_ENV
      - uses: ./.github/actions/cargo-build-macos-binary
        with:
          target: ${{ matrix.target }}
          version: ${{ env.ASSET_VERSION }}
          token: ${{ secrets.GITHUB_TOKEN }}

  build-linux-binaries:
    strategy:
      matrix:
        target: [x86_64-unknown-linux-gnu, aarch64-unknown-linux-gnu]
    name: Build ${{ matrix.target }}
    runs-on: ubuntu-latest
    permissions:
      contents: write
      actions: write
    steps:
      - uses: actions/checkout@8e8c483db84b4bee98b60c0593521ed34d9990e8 # v6.0.1
      - name: Extract asset version
        run: echo "ASSET_VERSION=${GITHUB_REF/refs\/tags\//}" >> $GITHUB_ENV
      - uses: ./.github/actions/cross-build-binary
        with:
          target: ${{ matrix.target }}
          version: ${{ env.ASSET_VERSION }}
          token: ${{ secrets.GITHUB_TOKEN }}


================================================
FILE: .github/workflows/requirements.txt
================================================
# contains pinned dependencies for installing pipenv to ensure repeatable builds in CI/CD workflows
certifi==2025.10.5 \
    --hash=sha256:0f212c2744a9bb6de0c56639a6f68afe01ecd92d91f14ae897c4fe7bbeeef0de \
    --hash=sha256:47c09d31ccf2acf0be3f701ea53595ee7e0b8fa08801c6624be771df09ae7b43
distlib==0.4.0 \
    --hash=sha256:9659f7d87e46584a30b5780e43ac7a2143098441670ff0a49d5f9034c54a6c16 \
    --hash=sha256:feec40075be03a04501a973d81f633735b4b69f98b05450592310c0f401a4e0d
filelock==3.20.3 \
    --hash=sha256:18c57ee915c7ec61cff0ecf7f0f869936c7c30191bb0cf406f1341778d0834e1 \
    --hash=sha256:4b0dda527ee31078689fc205ec4f1c1bf7d56cf88b6dc9426c4f230e46c2dce1
packaging==25.0 \
    --hash=sha256:29572ef2b1f17581046b3a2227d5c611fb25ec70ca1ba8554b24b0e69331a484 \
    --hash=sha256:d443872c98d677bf60f6a1f2f8c1cb748e8fe762d2bf9d3148b5599295b0fc4f
pipenv==2025.0.4 \
    --hash=sha256:36fc2a7841ccdb2f58a9f787b296c2e15dea3b5b79b84d4071812f28b7e8d7a2 \
    --hash=sha256:e1fbe4cfd25ab179f123d1fbb1fa1cdc0b3ffcdb1f21c775dcaa12ccc356f2bb
platformdirs==4.5.0 \
    --hash=sha256:70ddccdd7c99fc5942e9fc25636a8b34d04c24b335100223152c2803e4063312 \
    --hash=sha256:e578a81bb873cbb89a41fcc904c7ef523cc18284b7e3b3ccf06aca1403b7ebd3
virtualenv==20.36.1 \
    --hash=sha256:575a8d6b124ef88f6f51d56d656132389f961062a9177016a50e4f507bbcc19f \
    --hash=sha256:8befb5c81842c641f8ee658481e42641c68b5eab3521d8e092d18320902466ba


================================================
FILE: .github/workflows/scorecard.yml
================================================
name: OpenSSF Scorecard
on:
  schedule:
    - cron: '0 0 * * 0'
  push:
    branches:
      - main

permissions:
  contents: read

jobs:
  analysis:
    name: Scorecards analysis
    runs-on: ubuntu-latest
    permissions:
      # Needed to upload the results to code-scanning dashboard.
      security-events: write
      # Needed to publish results
      id-token: write
      actions: read
      contents: read

    steps:
      - name: 'Checkout code'
        uses: actions/checkout@8e8c483db84b4bee98b60c0593521ed34d9990e8 # v6.0.1
        with:
          persist-credentials: false

      - name: 'Run analysis'
        uses: ossf/scorecard-action@4eaacf0543bb3f2c246792bd56e8cdeffafb205a # v2.4.3
        with:
          results_file: results.sarif
          results_format: sarif
          repo_token: ${{ secrets.GITHUB_TOKEN }}
          publish_results: true

      # Upload the results as artifacts.
      - name: 'Upload artifact'
        uses: actions/upload-artifact@b7c566a772e6b6bfb58ed0dc250532a479d7789f # v6.0.0
        with:
          name: SARIF file
          path: results.sarif
          retention-days: 5

      # Upload the results to GitHub's code scanning dashboard.
      - name: 'Upload to code-scanning'
        uses: github/codeql-action/upload-sarif@cdefb33c0f6224e58673d9004f47f7cb3e328b89 # v4.31.10
        with:
          sarif_file: results.sarif


================================================
FILE: .github/workflows/ui-ci.yml
================================================
name: UI CI

on:
  workflow_dispatch:
  pull_request:
    paths:
      - "quickwit/quickwit-ui/**"
      - ".github/workflows/ui-ci.yml"
  push:
    branches:
      - main
      - trigger-ci-workflow
    paths:
      - "quickwit/quickwit-ui/**"
      - ".github/workflows/ui-ci.yml"

permissions:
  contents: read

jobs:
  checks:
    name: Lint, type check & unit tests
    runs-on: ubuntu-latest
    steps:
      - uses: actions/checkout@8e8c483db84b4bee98b60c0593521ed34d9990e8 # v6.0.1
      - uses: actions/setup-node@395ad3262231945c25e8478fd5baf05154b1d79f # v6.1.0
        with:
          node-version: 24
          cache: "yarn"
          cache-dependency-path: quickwit/quickwit-ui/yarn.lock
      - name: Install JS dependencies
        run: yarn --cwd quickwit-ui install
        working-directory: ./quickwit
      - name: Lint
        run: yarn --cwd quickwit-ui lint
        working-directory: ./quickwit
      - name: Type check
        run: yarn --cwd quickwit-ui type
        working-directory: ./quickwit
      - name: Unit tests
        run: yarn --cwd quickwit-ui test
        working-directory: ./quickwit

  e2e:
    name: Playwright e2e
    runs-on: ubuntu-latest
    permissions:
      contents: read
      actions: write
    services:
      postgres:
        image: postgres:latest
        ports:
          - 5432:5432
        env:
          POSTGRES_USER: quickwit-dev
          POSTGRES_PASSWORD: quickwit-dev
          POSTGRES_DB: quickwit-metastore-dev
        options: >-
          --health-cmd pg_isready
          --health-interval 10s
          --health-timeout 5s
          --health-retries 5
    env:
      CARGO_INCREMENTAL: 0
      RUST_BACKTRACE: 1
      RUSTFLAGS: -Dwarnings --cfg tokio_unstable
      RUSTDOCFLAGS: -Dwarnings -Arustdoc::private_intra_doc_links
      QW_TEST_DATABASE_URL: postgres://quickwit-dev:quickwit-dev@postgres:5432/quickwit-metastore-dev
    steps:
      - uses: actions/checkout@8e8c483db84b4bee98b60c0593521ed34d9990e8 # v6.0.1
      - uses: actions/setup-node@395ad3262231945c25e8478fd5baf05154b1d79f # v6.1.0
        with:
          node-version: 24
          cache: "yarn"
          cache-dependency-path: quickwit/quickwit-ui/yarn.lock
      - name: Setup stable Rust Toolchain
        uses: dtolnay/rust-toolchain@f7ccc83f9ed1e5b9c81d8a67d7ad1a747e22a561 # master
        with:
          toolchain: stable
      - name: Setup Rust cache
        uses: Swatinem/rust-cache@779680da715d629ac1d338a641029a2f4372abb5 # v2.8.2
        with:
          workspaces: "./quickwit -> target"
          shared-key: "quickwit-cargo"
      - name: Install JS dependencies
        run: yarn --cwd quickwit-ui install
        working-directory: ./quickwit
      - name: Install Playwright browsers
        run: npx playwright install chromium --with-deps --only-shell
        working-directory: ./quickwit/quickwit-ui
      - name: Build UI
        run: CI=false yarn --cwd quickwit-ui build
        working-directory: ./quickwit
      - name: Build Quickwit
        run: |
          sudo apt-get update && sudo apt-get -y install protobuf-compiler
          cargo build --features=postgres
        working-directory: ./quickwit
      - name: Run e2e tests
        run: |
          mkdir -p qwdata
          cargo run --features=postgres -- run --service searcher --service metastore --config ../config/quickwit.yaml &
          yarn --cwd quickwit-ui e2e-test
        working-directory: ./quickwit


================================================
FILE: .gitignore
================================================
# Generated by Cargo
# will have compiled files and executables
**/target/**
**/proptest-regressions
**/perf.data*
**/flamegraph.svg
local/**
quickwit/quickwit-ui/package-lock.json
**/.DS_Store

TODO.md
QUESTIONS.txt


# Remove Cargo.lock from gitignore if creating an executable, leave it for libraries
# More information here https://doc.rust-lang.org/cargo/guide/cargo-toml-vs-cargo-lock.html
#Cargo.lock

# These are backup files generated by rustfmt
**/*.rs.bk

.env
.idea
.vscode
.vscode-license
deps
elastic-search-artifacts
qwdata

# Generated by prost/tonic build
*_descriptor.bin


================================================
FILE: .localstack/init.sh
================================================
#!/usr/bin/env bash

set -eu

awslocal s3 mb s3://quickwit-dev
awslocal s3 mb s3://quickwit-integration-tests && awslocal s3 rm --recursive s3://quickwit-integration-tests

if ! awslocal kinesis list-streams | grep -q quickwit-dev-stream ; then
    awslocal kinesis create-stream --stream-name quickwit-dev-stream --shard-count 3
fi


================================================
FILE: CHANGELOG.md
================================================
<!--
# Changelog
All notable changes to this project will be documented in this file.

The format is based on [Keep a Changelog](https://keepachangelog.com/en/1.0.0/),
and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0.html).

## [Unreleased]

### Added

### Fixed
- (Jaeger) Query resource attributes when Jaeger request carries tags

### Changed

### Deprecated

### Removed

### Security

--->

# [0.9.0]

### Added
- Add Ingest V2 (#5600, #5566, #5463, #5375, #5350, #5252 #5202)
- Add SQS source (#5374, #5335, #5148)
- Disable control plane check for searcher (#5599, #5360)
- Partially implement `_elastic/_cluster/health` (#5595)
- Make Jaeger span attribute-to-tag conversion exhaustive (#5574)
- Use `content_length_limit` for ES bulk limit (#5573)
- Limit and monitor warmup memory usage (#5568)
- Add eviction metrics to caches (#5523)
- Record object storage request latencies (#5521)
- Add some kind of throttling on the janitor to prevent it from overloading (#5510)
- Prevent single split searches from different `leaf_search` from interleaving (#5509)
- Retry on S3 internal error (#5504)
- Allow specifying OTEL index ID in header (#5503)
- Add a metric to count storage errors and their error code (#5497)
- Add support for concatenated fields (#4773, #5369, #5331)
- Add number of splits per root/leaf search histograms (#5472)
- Introduce a searcher config option to timeout get requests (#5467)
- Add fingerprint to task in cluster state (#5464)
- Enrich root/leaf search spans with number of docs and splits (#5450)
- Add some additional search metrics (#5447)
- Improve GC resilience and add metrics (#5420)
- Enable force shutdown with 2nd Ctrl+C (#5414)
- Add request_timeout_secs config to searcher config (#5402)
- Memoize S3 client (#5377)
- Add more env var config for Postgres (#5365)
- Enable str fast field range queries (#5324)
- Allow querying non-existing fields (#5308)
- Support updating doc mapper through api (#5253)
- Add optional special handling for hex in code tokenizer (#5200)
- Added a circuit breaker layer (#5134)
- Various performance optimizations in Tantivy (https://github.com/quickwit-oss/tantivy/blob/main/CHANGELOG.md)

### Changed
- Parse datetimes and timestamps with leading and/or trailing whitespace (#5544)
- Restrict maturity period to retention (#5543)
- Wait for merge at end of local ingest (#5542)
- Log PostgreSQL metastore error (#5530)
- Update azure multipart policy (#5553)
- Stop relying on our own version of pulsar-rs (#5487)
- Handle nested OTLP values in attributes and log bodies (#5485)
- Improve merge pipeline finalization (#5475)
- Allow failed splits in root search (#5440)
- Batch delete from GC (#5404, #5380)
- Make some S3 errors retryable (#5384)
- Change default timestamps in OTEL logs (#5366)
- Only return root spans for Jaeger HTTP API (#5358)
- Share aggregation limit on node (#5357)

### Fixed
- Fix existence queries for nested fields (#5581)
- Fix lenient option with wildcard queries (#5575)
- Fix incompatible ES Java date format (#5462)
- Fix bulk api response order (#5434)
- Fix pulsar finalize (#5471)
- Fix pulsar URI scheme (#5470)
- Fix grafana searchers dashboard (#5455)
- Fix jaeger http endpoint (#5378)
- Fix file re-ingestion after EOF (#5330)
- Fix configuration interpolation (#5403)
- Fix jaeger duration parse error (#5518)
- Fix unit conversion in jaeger http search endpoint (#5519)

### Removed
- Remove support for 2-digit years in java datetime parser (#5596)
- Remove DocMapper trait (#5508)
- Remove support for AWS Lambda (#5884)
- Remove search stream endpoint (#5886)

# [0.8.1]

### Fixed

- Bug in the chitchat digest message serialization (chitchat#144)

## [0.8.0]

### Added

- Remove some noisy logs (#4447)
- Add `/{index}/_stats` and `/_stats` ES API (#4442)
- Use `search_after` in ES scroll API (#4280)
- Add support for wildcard exclusion in index patterns (#4458)
- Add `.` support in DSL indentifiers (#3989)
- Add cat indices ES API (#4465)
- Limit concurrent merges (#4473)
- Add Index Template API and auto create index (#4456) (only available with ingest V2)
- Add support for compressed ES `_bulk` requests (#4506)
- Add support for slash `/` character in field names (#4510)
- Handle SIGTERM shutdown signal (#4539)
- Add `start_timestamp` and `end_timestamp` filter to ES `_field_caps` API (#4547)
- Limit the number of merge pipelines that can be spawned concurrently (#4574)
- Add support for `_source_excludes` and `_source_includes` query parameters in ES API (#4572)
- Add gRPC metrics layer to clients and servers (#4591)
- Add additional cluster metrics (#4597)
- Add index patterns query param on GET `/indexes` endpoint (#4600)
- Add support for GCS file backed metastore (#4604)
- Add default search fields for OTEL traces index (#4602)
- Add support for delete index in ES API (#4606)
- Add a handler to dynamically change the log level (#4662)
- Add REST endpoint to parse a query into a query AST (#4652)
- Add postgresql index and use `IN` instead of many `OR` (#4670)
- Add support for `_source_excludes`, `_source_includes`, `extra_filters` in `_msearch` ES API (#4696)
- Handle `track_total_size` on request ES body (#4710)
- Add a metric for the number number of indexes (#4711)
- Add various performance optimizations in Quickwit and Tantivy

More details in tantivy's [changelog](https://github.com/quickwit-oss/tantivy/blob/main/CHANGELOG.md).

### Fixed

- Fix aggregation result on empty index (#4449)
- Fix Gzip file source (#4457)
- Rate limit noisy logs (#4483)
- Prevent the exponential backoff from overflowing after 64 attempts (#4501)
- Remove field presence in ES `_field_caps` API (#4492)
- Remove `source` in ES parameter, remove unsupported field `fields` in response (#4590)
- Fix aggregation `split_size` parameter, add docs and test (#4627)
- Various fixes in chitchat (gossip): more details in [chitchat commit history](https://github.com/quickwit-oss/chitchat/commits/main/?since=2024-01-08&until=2024-03-13)
- Various fixes in mrecordlog (WAL): more details in [mrecordlog commit history](https://github.com/quickwit-oss/mrecordlog/commits/main/?since=2024-01-08&until=2024-03-13)

### Changed

- (Breaking) [Add ZSTD compression to chitchat's Deltas](https://github.com/quickwit-oss/chitchat/pull/112)

### Removed

### Migration from 0.7.x to 0.8.0

To deploy Quickwit 0.8.0, you must either:
- **shutdown down** your cluster **entirely** before deploying, or
- **restart all** the nodes of your cluster after deploying.

Because we made some breaking changes in the gossip protocol (chitchat), nodes running different versions of Quickwit cannot communicate with each other and crash upon receiving messages that do not match their release version. The new protocol is now versioned, and future updates of the gossip protocol will be backward compatible.


## [0.7.1]

### Added

- Add es _count API (#4410)
- Add _elastic/_field_caps API (#4350)
- Make gRPC message size configurable (#4388)
- Add API endpoint to get some control-plan internal info (#4339)
- Add Google Cloud Storage Implementation available for storage paths starting with `gs://` (#4344)

### Changed

- Return 404 on index not found in ES Bulk API (#4425)
- Allow $ and @ characters in field names (#4413)

### Fixed
- Assign all sources/shards, even if this requires exceeding the indexer #4363
- Fix traces doc mapping (service name set as  fast) and update default otel logs index ID to `otel-logs-v0_7` (#4401)
- Fix parsing multi-line queries (#4409)
- Fix range query for optional fast field panics with Index out of bounds (#4362)

### Migration from 0.7.0 to 0.7.1

Quickwit 0.7.1 will create the new index `otel-logs-v0_7` which is now used by default when ingesting data with the OTEL gRPC and HTTP API.

In the traces index `otel-traces-v0_7`, the `service_name` field is now fast. No migration is done if `otel-traces-v0_7` already exists. If you want `service_name` field to be fast, you have to delete first the existing `otel-traces-v0_7` index or create your own index.

## [0.7.0]

### Added

- Elasticsearch-compatible API
  - Added scroll and search_after APIs and support for multi-index search queries
  - Added exists, multi-match, match phrase prefix, match bool prefix, bool queries
  - Added `_field_caps` API
- Added support for OTLP over HTTP API (Protobuf only) (#4335)
- Added Jaeger REST endpoints for Grafana tracing support (#4197)
- Added support for injecting custom HTTP headers and moved REST config parameters into REST config section (#4198)
- Added support for OTLP trace data in arbitrary sources
- Commit Kafka offsets on suggest truncate (#3638)
- Honor `auto.offset.reset` parameter in Kafka source (#4095)
- Added exact count optimization (#4019)
- Added stream splits gRPC (#4109)
- Adding a split cache in Searchers (#3857)
- Added `coerce` and `output_format` options for numeric fields (#3704)
- Added `PhraseMatchQuery` and `MultiMatchQuery` (#3727)
- Added Elasticsearch's `TermsQuery` (#3747)
- Added GCP PubSub source (#3720)
- Parse timestamp strings (#3639)
- Added Digital Ocean storage flavor (#3632)
- Added new tokenizers: `source_code_default`, `source_code`, `multilang` (#3647, #3655, #3608)


### Fixed

- Fixed dates in UI (#4277)
- Fixed duplicate splits planned on pipeline crash-respawn (#3854)
- Fixed sorting (#3799)

More details in tantivy's [changelog](https://github.com/quickwit-oss/tantivy/blob/main/CHANGELOG.md).

### Changed

- Improve OTEL traces index config (#4311)
  - OTEL endpoints are now using by default indexes `otel-logs-v0_7` and `otel-traces-v0_7` instead of `otel-logs-v0_6` and `otel-traces-v0_6`
  - OTEL indexes have more fields stored as "fast" and have Trace and Span ID bytes field in hex format

- Increased the gRPC payload limits from 10MiB to 20MiB (#4227)
- Reject malformed Elasticsearch API requests (#4175)
- Better logging when doc processing fails (#4323)
- Search performance improvements
- Indexing performance improvements

### Removed

### Migration from 0.6.x to 0.7

The format of the index and internal objects stored in the metastore of 0.7 is backward compatible with 0.6.

If you are using the OTEL indexes and ingesting data into indexes the `otel-logs-v0_6` and `otel-traces-v0_6`, you must stop indexing before upgrading.
Indeed, the first time you start Quickwit 0.7, it will update the doc mapping fields of Trace ID and Span ID of those two indexes by changing their input/output formats from base64 to hex. This is automatic: you don't have to perform any manual operation.
Quickwit 0.7 will create new indexes `otel-logs-v0_7` and `otel-traces-v0_7`, which are now used by default when ingesting data with the OTEL gRPC and HTTP API. The Jaeger gRPC and HTTP APIs will query both `otel-traces-v0_6` and `otel-traces-v0_7` by default.
It's possible to define the index ID you want to use for OTEL gRPC endpoints and Jaeger gRPC API by setting the request header `qw-otel-logs-index` or `qw-otel-traces-index` to the index ID you want to target.


## [0.6.1]

### Added
- Support of phrase prefix queries in the query language.

### Fixed
- Fix timestamp field which was not allowed when defined in an object mapping.
- Fix querying of integer on a JSON field (no document were returned).


## [0.6.0] - 2023-06-03

### Added
- Elasticsearch/Opensearch compatible API.
- New columnar format:
    - Fast fields can now have any cardinality (Optional, Multivalued, restricted). In fact cardinality is now only used to format the output.
    - Dynamic Fields are now fast fields.
- String fast fields now can be normalized.
- Various parameters of object storages can now be configured.
- The ingest API makes it possible to force a commit, or wait for a scheduled commit to occur.
- Ability to parse non-JSON data using VRL to extract some structure from documents.
- Object storage can now use the `virtual-hosted–style`.
- `date_histogram` aggregation.
- `percentiles` aggregation.
- Added support for Prefix Phrase query.
- Added support for range queries.
- The query language now supports different date formats.
- Added support for base16 input/output configuration for bytes field. You can search for bytes fields using base16 encoded values.
- Autotagging: fields used in the partition key are automatically added to tags.
- Added arm64 docker image.
- Added CORS configuration for the REST API.


### Fixed
- Major bug fix that required to restart quickwit when deleting and recreating an index with the same name.
- The number of concurrent GET requests to object stores is now limited. This fixes a bug observed with when requested a lot of documents from MinIO.
- Quickwit now searches into resource attributes when receiving a Jaeger request carrying tags
- Object storage can be figured to:
    - avoid Bulk delete API (workaround for Google Cloud Storage).
    - Use virtual-host style addresses (workaround for Alibaba Object Storage Service).
- Fix aggregation min doc_count empty merge bug.
- Fix: Sort order for term aggregations.
- Switch to ms in histogram for date type (aligning with ES).

### Improvements

- Search performance improvement.
- Aggregation performance improvement.
- Aggregation memory improvement.

More details in tantivy's [changelog](https://github.com/quickwit-oss/tantivy/blob/main/CHANGELOG.md).

### Changed
- Datetime now have up to a nanosecond precision.
- By default, quickwit now uses the node's hostname as the default node ID.
- By default, Quickwit is in dynamic mode and all dynamic fields are marked as fast fields.
- JSON field uses by default the raw tokanizer and is set to fast field.
- Various performance/compression improvements.
- OTEL indexes Trace ID and Span ID are now bytes fields.
- OTEL indexes stores timestamps with nanosecond precision.
- pan status is now indexed in the OTEL trace index.
- Default and raw tokenizers filter tokesn longer than 255 bytes instead of 40 bytes.


## [0.5.0] - 2023-03-16

### Added
- gRPC OpenTelemetry Protocol support for traces
- gRPC OpenTelemetry Protocol support for logs
- Control plane (indexing tasks scheduling)
- Ingest API rate limiter
- Pulsar source
- VRL transform for data sources
- REST API enhanced to fully manage indexes, sources, and splits
- OpenAPI specification and swagger UI for all REST available endpoints
- Large responses from REST API can be compressed
- Add bulk stage splits method to metastore
- MacOS M1 binary
- Doc mapping field names starting with `_` are now valid

### Fixed
- Fix UI index completion on search page
- Fix CLI index describe command to show stats on published splits
- Fix REST API to always return on error a body formatted as `{"message": "error message"}`
- Fixed REST status code when deleting unexisting index, source and when fetching splits on unexisting index

### Changed
- Source config schema (breaking or not? use serde rename to be not breaking?)
- RocksDB replaced by [mrecordlog](https://github.com/quickwit-oss/mrecordlog) to store ingest API queues records
- (Breaking) Indexing partition key new DSL
- (Breaking) Helm chart updated with the new CLI
- (Breaking) CLI indexes, sources, and splits commands use the REST API
- (Breaking) Index new format: you need to reindex all your data

## [0.4.0] - 2022-12-03

### Added
- Boolean, datetime, and IP address fields
- Chinese tokenizer
- Distributed indexing (Kafka only)
- gRPC metastore server
- Index partitioning
- Kubernetes
- Node config templating
- Prometheus metrics
- Retention policies
- REST API for CRUD operations on indexes/sources
- Support for Azure Blob Storage
- Support for BM25 document scoring
- Support for deletions
- Support for slop in phrase queries
- Support for snippeting

### Fixed
- Fixed cache misses during search fetch docs phase
- Fixed credentials leak in metastore URI
- Fixed GC scalability issues
- Fixed support for multi-source

### Changed
- Changed default docstore block size to 1 MiB and compression algorithm to ZSTD

- Quickwit now relies on sqlx rather than Diesel for PostgreSQL interactions.
Migrating from 0.3 should work as expected. Migrating from earlier version however is
not supported.

### Removed
- Removed support for i64 as timestamp field
- Removed support for sorting index by field

### Security
- Forbid access to paths with `..` at storage level

## [0.3.1] - 2022-06-22

### Added
- Add support for Google Cloud Storage
- Sort hits by timestamp desc by default in search UI
- Add `description` attribute to field mappings
- Display split state in output of `quickwit split list` command

### Fixed
- Clean up local split cache after index deletion
- Fix API URLs displayed for copy and paste in UI
- Fix custom S3 endpoint with trailing `/`
- Fix `quickwit index create` command with `--overwrite` option

## [0.3.0] - 2022-05-31

### Added
- Embedded UI for displaying search hits and cluster state
- Schemaless indexing with JSON field
- Ingest API (Elasticsearch-compatible)
- Aggregation queries
- Support for Amazon Kinesis

### Fixed
- Switched cluster membership algorithm from S.W.I.M. to Chitchat

### Removed
- u64 as date field

## [0.2.1] - 2022-02-28

### Added
- Query validation against index schema before dispatch to leaf nodes (#1109, @linxGnu)
- Support for custom S3 endpoint (#1108)
- Warm up terms and fastfields concurrently (#1147)

### Fixed
- Minor bug in leaf search stream (#1110)
- Default index root URI and metastore URI correctly default to data dir (#1140, @ddelemeny)

### Removed
- QW_ENV environment variable

### Security
- Compiled binaries with Rust 1.58.1, which fixes CVE-2022-21658

## [0.2.0] - 2022-01-12

## [0.1.0] - 2021-07-13


================================================
FILE: CODE_OF_CONDUCT.md
================================================
# Contributor Covenant Code of Conduct

## Our Pledge

We as members, contributors, and leaders pledge to make participation in our
community a harassment-free experience for everyone, regardless of age, body
size, visible or invisible disability, ethnicity, sex characteristics, gender
identity and expression, level of experience, education, socio-economic status,
nationality, personal appearance, race, caste, color, religion, or sexual identity
and orientation.

We pledge to act and interact in ways that contribute to an open, welcoming,
diverse, inclusive, and healthy community.

## Our Standards

Examples of behavior that contributes to a positive environment for our
community include:

* Demonstrating empathy and kindness toward other people
* Being respectful of differing opinions, viewpoints, and experiences
* Giving and gracefully accepting constructive feedback
* Accepting responsibility and apologizing to those affected by our mistakes,
  and learning from the experience
* Focusing on what is best not just for us as individuals, but for the
  overall community

Examples of unacceptable behavior include:

* The use of sexualized language or imagery, and sexual attention or
  advances of any kind
* Trolling, insulting or derogatory comments, and personal or political attacks
* Public or private harassment
* Publishing others' private information, such as a physical or email
  address, without their explicit permission
* Other conduct which could reasonably be considered inappropriate in a
  professional setting

## Enforcement Responsibilities

Community leaders are responsible for clarifying and enforcing our standards of
acceptable behavior and will take appropriate and fair corrective action in
response to any behavior that they deem inappropriate, threatening, offensive,
or harmful.

Community leaders have the right and responsibility to remove, edit, or reject
comments, commits, code, wiki edits, issues, and other contributions that are
not aligned to this Code of Conduct, and will communicate reasons for moderation
decisions when appropriate.

## Scope

This Code of Conduct applies within all community spaces, and also applies when
an individual is officially representing the community in public spaces.
Examples of representing our community include using an official e-mail address,
posting via an official social media account, or acting as an appointed
representative at an online or offline event.

## Enforcement

Instances of abusive, harassing, or otherwise unacceptable behavior may be
reported to the community leaders responsible for enforcement at adrien+cc at quickwit dot io.
All complaints will be reviewed and investigated promptly and fairly.

All community leaders are obligated to respect the privacy and security of the
reporter of any incident.

## Enforcement Guidelines

Community leaders will follow these Community Impact Guidelines in determining
the consequences for any action they deem in violation of this Code of Conduct:

### 1. Correction

**Community Impact**: Use of inappropriate language or other behavior deemed
unprofessional or unwelcome in the community.

**Consequence**: A private, written warning from community leaders, providing
clarity around the nature of the violation and an explanation of why the
behavior was inappropriate. A public apology may be requested.

### 2. Warning

**Community Impact**: A violation through a single incident or series
of actions.

**Consequence**: A warning with consequences for continued behavior. No
interaction with the people involved, including unsolicited interaction with
those enforcing the Code of Conduct, for a specified period of time. This
includes avoiding interactions in community spaces as well as external channels
like social media. Violating these terms may lead to a temporary or
permanent ban.

### 3. Temporary Ban

**Community Impact**: A serious violation of community standards, including
sustained inappropriate behavior.

**Consequence**: A temporary ban from any sort of interaction or public
communication with the community for a specified period of time. No public or
private interaction with the people involved, including unsolicited interaction
with those enforcing the Code of Conduct, is allowed during this period.
Violating these terms may lead to a permanent ban.

### 4. Permanent Ban

**Community Impact**: Demonstrating a pattern of violation of community
standards, including sustained inappropriate behavior,  harassment of an
individual, or aggression toward or disparagement of classes of individuals.

**Consequence**: A permanent ban from any sort of public interaction within
the community.

## Attribution

This Code of Conduct is adapted from the [Contributor Covenant][homepage],
version 2.0, available at
[https://www.contributor-covenant.org/version/2/0/code_of_conduct.html][v2.0].

Community Impact Guidelines were inspired by
[Mozilla's code of conduct enforcement ladder][Mozilla CoC].

For answers to common questions about this code of conduct, see the FAQ at
[https://www.contributor-covenant.org/faq][FAQ]. Translations are available
at [https://www.contributor-covenant.org/translations][translations].

[homepage]: https://www.contributor-covenant.org
[v2.0]: https://www.contributor-covenant.org/version/2/0/code_of_conduct.html
[Mozilla CoC]: https://github.com/mozilla/diversity
[FAQ]: https://www.contributor-covenant.org/faq
[translations]: https://www.contributor-covenant.org/translations


================================================
FILE: CODE_STYLE.md
================================================
# Quickwit Coding Style

This document resumes a couple of points we try to embrace in our coding style. Some of these points take an opinionated side on a trade-off story.
The description will try to make that clear.

The driving motivation of this code style is to make your code more readable.

Readable is one word that hides several dimensions:
- the reader understands the intent very rapidly
- the reader can proofread. It can become confident that the code is correct very easily.

Noticing how the two are different should not require too much squinting.
Shoot for *proofreadability*.

## Code reviews

Do a pass on your own code before sending it for review to avoid wasting the review time.
Also, a trivial code style issues can come in the way and avoid spotting
deeper issues with the code.

As a reviewer, your first mission is proofreading. If you find a logical bug, feel good. You did an awesome job today.

Your second goal is to make sure the code quality stays high.

You can express "nitpicks": suggestions about some local aspect of the code that do not matter too much. Just prepend "nitpick:" to your comment.
You can also express an opinion/advice that you know is not universal.
Make sure you make it clear to the reviewee that it is fine to ignore the comment.

Do not use rhetorical questions... If you are 95% sure of something, there is no need to express it as a question.
Prefer `I believe this should be n+1` to `Shouldn't this be n+1?`.

The issue with rhetorical questions is that when you will have a genuine
question, reviewees may over interpret it as an affirmation.

As a reviewee, if you are not used to CRs, it can feel like an adversarial process. Relax. This is normal to end up with a lot of comments on your first few CRs.

You might feel like the comments are unjustified, try as much as possible to not feel frustrated.
If you want to discuss it, the best place is the chat, or maybe send a PR to modify this document.

But remember to pick your battles... If you think it does not matter much but it takes 2 secs to fix, just consider doing what is suggested by the reviewer or this style guide.

## Rust gives us a lot of tools... this does not mean we need to abuse them.

Rust is an amazing language. It offers all kinds of tools to allow for zero-cost code reuse. Within these tools, however, generics and macros tend to hurt readability (and compile-time). Let's ONLY use them where necessary.

The same goes with the chaining iterator style.
When coupled with error handling, rust's chaining iterator style can
hurt readability.
Using a good old procedural for-loop is fine and recommended in that case.

**example needed**


## Naming

Function and variable names are key for readability.

A good function name is often sufficient for the reader to build reasonable expectations of what it does.

If this implies long names, let's have very long names.

Trying to fit this rule has an interesting side effect.
Nobody likes to type long function names. It just feels ugly.
But these are frequently symptoms of a badly organized code, and it can
help spot refactoring opportunities.

**example needed**

## Explanatory variables

One incredibly powerful tool and simple tool to help make your code
more readable is to introduce explanatory variables.

Explanatory variables are intermediary variables that were not really
necessary, but make it possible -through their names- to convey their
semantics to the reader.

**example needed**

## Shadowing

As much as possible, do not use reuse the same variable name in a function.
It is never necessary, very rarely helpful and can hurt.

## Types

Rust handles type elision. That's great.
Chances are, your editor even automatically hints the type of
your variables.

Sometimes, however, it can be helpful for the reviewer to have the type of some very strategic variables.

**example needed**

## Early returns

We prefer early return.
Rather than chaining `else` statement, we prefer to isolate
corner case in short `if` statement to prevent nesting

**example needed**

## Invariants

A good idea to help reviewers proofread your code is to
identify invariants and express them as `debug_assert`.

These assert will not be part of the release binary and won't hurt the execution time.

**example needed**

## Errors and log messages

Error and log messages follow the same format. They should be concise, lowercase (except proper names), and without trailing punctuation.

As a loose rule, where it does not hurt readability, log messages should rely on `tracing` 
structured logging instead of templating. 

In other words, prefer:
`warn!(remaining=remaining_attempts, "trubulizor rpc plane retry failed")`
to 
`warn!("trubulizor rpc plane retry failed ({remaining_attempts} attempts remaining)")`

### Error Examples
- "failed to start actor runtimes"
- "cannot join PostgreSQL URI {} with path {:?}"
- "could not find split metadata in Metastore {}"
- "unknown output format {:?}"
 
### Log examples


## Comments

We use on the same code style, [rustc's doc comments](https://doc.rust-lang.org/1.0.0/style/style/comments.html).
In particular, the summary line should be written in third-person singular present indicative form.

No rustdoc in Quickwit or in private API is ok.
No rustdoc on Tantivy public API is not ok.

We usually do not expect comments to contain any implementation details.
To some extent, it is normal for the user to have to look at the code.

When it is not clear, comments should convey:
- intent
- context (links to a Wikipedia page or a paper, link to the original issue can be helpful too)
- hidden contracts... but really you should avoid those.

Inline comments in the code can be very useful to help the reader understand
the justification of a thorny piece of code.

**example needed**

## Hidden contracts

We call hidden contract, a pre-condition on the arguments that is not enforced by their types.

Sometimes, hidden contracts are unavoidable.

For instance, a binary search requires the array to be sorted.

Whenever possible, you should avoid having hidden contracts.

To avoid hidden contracts, you should consider:
- changing your argument types to have the type system enforce the contract
- internalize the contract enforcement.

For instance, the following function is not good because it hides a contract on values not being empty:

```
fn min(&self, values: &[usize]) -> usize {
	let mut min_val = usize::MAX;
	for val in values {
		min_val = min_val.min(val)
	}
	min_val
}
```
It can be done by changing the prototype to a `Result` or an `Option`.

In addition, while the author might have thought that the `usize::MAX` trick was a nice touch, it can easily backfire. Panicking is often better than returning a wrong result.

The better approach here is of course an `Option<usize>` like `Iterator::min` does.

Another way to internalize the contract enforcement is to move some logic from the caller to within the function.

For instance:
```
// The algorithms requires splits to be sorted by `end_time`
fn merge_candidates(splits: &mut Vec<SplitMetadata>) -> Vec<SplitMetadata>
```

It is tempting to rely on the fact that splits `Vec` is always sorted on the caller side and put this as a hidden contract.
If it is not too much work, just redoing the sorting within merge candidates
is a good idea. For the above function, that extra work is tiny.

By the way, did you know Rust's std sort is inspired by timsort?
It will perform in linear time if the array is already sorted...

When implementing a function with a hidden contract, as long as it does not hurt the overall performance, add an assert statement to your code to check the contract. (For instance, check that the array is sorted).

**example needed*

## Tests

Test do not need to match the same quality as the original code.

When a bug is encountered, it is ok to introduce a test that seems weirdly
overfitted to the specific issue. A comment should then add a link to the issue.

Unit test should run fast, and if possible they should not do any IO.
Code should be structured to make unit testing possible.

Some of our unit tests would not be considered good unit tests in some companies, and that's ok.

Here are the controversial bits:

### Not just for spotting regression

Our unit tests are not here just to spot regression.
They are also here to check the correctness of our code.

### Not just testing public API

Unit test do not only test public API.
Complex code often calls half a dozen smaller functions.

The cardinality of the corner case of the complex code
can make it difficult to test all corner case.

On the other hand, the smaller functions could be tested
exhaustively.

For this reason, testing internal private functions is actually encouraged.

### Not always "unit" tests

Ideally, unit tests should be testing one thing and one thing only, but if they don't and it helps cover more ground, this is ok.

### Not necessarily deterministic.

Finally, unit tests are not necessarily deterministic. We really like proptests.
When proptesting, make sure to reduce as much as possible the space of exploration to get the most out of it.

## async vs sync

Your async code should block for at most 500 microseconds.
If you are unsure whether your code blocks for 500 microseconds, or if it is a non-trivial question, it should run via `tokio::spawn_block`.


================================================
FILE: CONTRIBUTING.md
================================================
# Contributing to Quickwit
There are many ways to contribute to Quickwit.
Code contributions are welcome of course, but also
bug reports, feature requests, and evangelizing are as valuable.

# Submitting a PR
Check if your issue is already listed on [github](https://github.com/quickwit-oss/quickwit/issues).
If it is not, create your own issue.

Please add the following phrase at the end of your commit `Closes #<Issue Number>`.
It will automatically link your PR in the issue page. Also, once your PR is merged, it will
close the issue. If your PR only partially addresses the issue and you would like to
keep it open, just write `See #<Issue Number>`.

Feel free to send your contribution in an unfinished state to get early feedback.
In that case, simply mark the PR with the tag [WIP] (standing for work in progress).

## PR verification checks
When you submit a pull request to the project, the CI system runs several verification checks. After your PR is merged, a more exhaustive list of tests will be run.

You will be notified by email from the CI system if any issues are discovered, but if you want to run these checks locally before submitting PR or in order to verify changes you can use the following commands in the root directory:
1. To verify that all tests are passing, run `make test-all`.
2. To fix code style and format as well as catch common mistakes run `make fix`. Alternatively, run `make -k test-all docker-compose-down` to tear down the Docker services after running all the tests.
3. To build docs run `make build-rustdoc`.

# Development

## Setup & run tests

### Local Development

1. Install Rust, CMake, Docker (https://docs.docker.com/engine/install/) and Docker Compose (https://docs.docker.com/compose/install/)
2. Install node@24 and `npm install -g yarn`
3. Install awslocal https://github.com/localstack/awscli-local
4. Install protoc https://grpc.io/docs/protoc-installation/ (you may need to install the latest binaries rather than your distro's flavor)
5. Install nextest https://nexte.st/docs/installation/pre-built-binaries/

### GitHub Codespaces

[![Open in GitHub Codespaces](https://github.com/codespaces/badge.svg)](https://codespaces.new/quickwit-oss/quickwit?devcontainer_path=.devcontainer/devcontainer.json)

GitHub Codespaces provides a fully configured development environment in the cloud, making it easy to get started with Quickwit development. By clicking the badge above, you can create a codespace with all the necessary tools installed and configured.

### Running tests
Run `make test-all` to run all tests.

## Useful commands
* `make test-all` - starts necessary Docker services and runs all tests.
* `make -k test-all docker-compose-down` - the same as above, but tears down the Docker services after running all the tests.
* `make fmt` - runs formatter, this command requires the nightly toolchain to be installed by running `rustup toolchain install nightly`.
* `make fix` - runs formatter and clippy checks as well as removing unused dependencies (requires `cargo install cargo-machete`).
* `make typos` - runs the spellcheck tool over the codebase. (Install by running `cargo install typos-cli`)
* `make doc` - builds docs.
* `make docker-compose-up` - starts Docker services.
* `make docker-compose-down` - stops Docker services.
* `make docker-compose-logs` - shows Docker logs.

## Start the UI
1. Switch to the `quickwit` subdirectory of the project and create a data directory `qwdata` there if it doesn't exist
2. Start a server `cargo r run --config ../config/quickwit.yaml`
3. `yarn --cwd quickwit-ui install` and `yarn --cwd quickwit-ui start`
4. Open your browser at `http://localhost:3000/ui` if it doesn't open automatically

## Running UI Tests
1. Run `yarn --cwd quickwit-ui install` and `yarn --cwd quickwit-ui test` in the `quickwit` directory

## Running UI e2e tests
1. Ensure to run a searcher `cargo r run --service searcher --config ../config/quickwit.yaml`
2. Run `yarn --cwd quickwit-ui e2e-test`

## Running services such as Amazon Kinesis or S3, Kafka, or PostgreSQL locally.
1. Ensure Docker and Docker Compose are correctly installed on your machine (see above)
2. Run `make docker-compose-up` to launch all the services or `make docker-compose-up DOCKER_SERVICES=kafka,postgres` to launch a subset of services.

## Tracing with Jaeger
1. Ensure Docker and Docker Compose are correctly installed on your machine (see above)
2. Start the Jaeger services (UI, collector, agent, ...) running the command `make docker-compose-up DOCKER_SERVICES=jaeger`
3. Start Quickwit with the following environment variables:

```
OTEL_EXPORTER_OTLP_ENDPOINT=http://localhost:4317
QW_ENABLE_OPENTELEMETRY_OTLP_EXPORTER=true
```

4. Open your browser and visit [localhost:16686](http://localhost:16686/)

## Using tokio console
1. Install tokio-console by running `cargo install tokio-console`.
2. Install the quickwit binary in the quickwit-cli folder `RUSTFLAGS="--cfg tokio_unstable" cargo install --path . --features tokio-console`
3. Launch a long running command such as index and activate tokio with the: `QW_ENABLE_TOKIO_CONSOLE=1 quickwit index ...`
4. Run `tokio-console`.

## Building binaries

Currently, we use [cross](https://github.com/rust-embedded/cross) to build Quickwit binaries for different architectures.
For this to work, we've had to customize the docker images cross uses. These customizations can be found in docker files located in the `./cross-images` folder. To make cross take into account any change on those
docker files, you will need to build and push the images on Docker Hub by running `make cross-images`.
We also have nightly builds that are pushed to Docker Hub. This helps continuously check that our binaries are still built even with external dependency updates. Successful builds let you access the artifacts for the next three days. Release builds always have their artifacts attached to the release.

## Docker images

Each merge on the `main` branch triggers the build of a new Docker image available on DockerHub at `quickwit/quickwit:edge`. Tagging a commit also creates a new image `quickwit/quickwit:<tag name>` if the tag name starts with `v*` or `qw*`. The Docker images are based on Debian.

### Notes on the embedded UI
As the react UI is embedded in the rust binary, we need to build the react app before building the binary. Hence `make cross-image` depends on the command `build-ui`.

## Testing release (alpha, beta, rc)

The following Quickwit installation command `curl -L https://install.quickwit.io | sh` always installs the latest stable version of quickwit. To make it easier in installing and testing new (alpha, beta, rc) releases, you can manually pull and execute the script as `./install.sh --allow-any-latest-version`. This will force the script to install any latest available release package.

## Tracking licenses

We keep track of the licenses used by the open source crates used by this project using
[`rust-license-tool`](https://github.com/DataDog/rust-license-tool). The listing is checked every
time CI is run. To update the listing, install the tool with `cargo install --git
https://github.com/DataDog/rust-license-tool` and then run `dd-rust-license-tool write`. If there are
any errors, you may need to update the listing of exceptions in `license-tool.toml`.

# Documentation

Quickwit documentation is located in the docs directory.

## Generating the CLI docs.

The [CLI doc page](docs/reference/cli.md) is partly generated by a script.
To update it, first run the script:

```bash
cargo run --bin generate_markdown > ../docs/reference/cli_insert.md
```

Then manually edit the [doc page](docs/reference/cli.md) to update it and delete the generated file.
There are two comments to indicate where you want to insert the new docs and where it ends:

```markdown
[comment]: <> (Insert auto generated CLI docs from here.)

...docs to insert...

[comment]: <> (End of auto generated CLI docs.)
```


================================================
FILE: Dockerfile
================================================
FROM node:24@sha256:b2b2184ba9b78c022e1d6a7924ec6fba577adf28f15c9d9c457730cc4ad3807a AS ui-builder

COPY quickwit/quickwit-ui /quickwit/quickwit-ui

WORKDIR /quickwit/quickwit-ui

RUN touch .gitignore_for_build_directory \
    && NODE_ENV=production make install build


FROM rust:bookworm@sha256:b5efaabfd787a695d2e46b37d3d9c54040e11f4c10bc2e714bbadbfcc0cd6c39 AS bin-builder

ARG CARGO_FEATURES=release-feature-set
ARG CARGO_PROFILE=release
ARG QW_COMMIT_DATE
ARG QW_COMMIT_HASH
ARG QW_COMMIT_TAGS

ENV QW_COMMIT_DATE=$QW_COMMIT_DATE
ENV QW_COMMIT_HASH=$QW_COMMIT_HASH
ENV QW_COMMIT_TAGS=$QW_COMMIT_TAGS

RUN apt-get -y update \
    && apt-get -y install ca-certificates \
    clang \
    cmake \
    libssl-dev \
    llvm \
    protobuf-compiler \
    && rm -rf /var/lib/apt/lists/*

COPY quickwit /quickwit
COPY config/quickwit.yaml /quickwit/config/quickwit.yaml
COPY --from=ui-builder /quickwit/quickwit-ui/build /quickwit/quickwit-ui/build

WORKDIR /quickwit

RUN rustup toolchain install

RUN echo "Building workspace with feature(s) '$CARGO_FEATURES' and profile '$CARGO_PROFILE'" \
    && RUSTFLAGS="--cfg tokio_unstable" \
    cargo build \
    -p quickwit-cli \
    --features $CARGO_FEATURES \
    --bin quickwit \
    $(test "$CARGO_PROFILE" = "release" && echo "--release") \
    && echo "Copying binaries to /quickwit/bin" \
    && mkdir -p /quickwit/bin \
    && find target/$CARGO_PROFILE -maxdepth 1 -perm /a+x -type f -exec mv {} /quickwit/bin \;


FROM debian:bookworm-slim@sha256:e899040a73d36e2b36fa33216943539d9957cba8172b858097c2cabcdb20a3e2 AS quickwit

LABEL org.opencontainers.image.title="Quickwit"
LABEL maintainer="Quickwit, Inc. <hello@quickwit.io>"
LABEL org.opencontainers.image.vendor="Quickwit, Inc."
LABEL org.opencontainers.image.licenses="Apache-2.0"

RUN apt-get -y update \
    && apt-get -y install ca-certificates \
    libssl3 \
    && rm -rf /var/lib/apt/lists/*

WORKDIR /quickwit
RUN mkdir config qwdata
COPY --from=bin-builder /quickwit/bin/quickwit /usr/local/bin/quickwit
COPY --from=bin-builder /quickwit/config/quickwit.yaml /quickwit/config/quickwit.yaml

ENV QW_CONFIG=/quickwit/config/quickwit.yaml
ENV QW_DATA_DIR=/quickwit/qwdata
ENV QW_LISTEN_ADDRESS=0.0.0.0

RUN quickwit --version

ENTRYPOINT ["quickwit"]


================================================
FILE: LICENSE
================================================
                                 Apache License
                           Version 2.0, January 2004
                        http://www.apache.org/licenses/

   TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION

   1. Definitions.

      "License" shall mean the terms and conditions for use, reproduction,
      and distribution as defined by Sections 1 through 9 of this document.

      "Licensor" shall mean the copyright owner or entity authorized by
      the copyright owner that is granting the License.

      "Legal Entity" shall mean the union of the acting entity and all
      other entities that control, are controlled by, or are under common
      control with that entity. For the purposes of this definition,
      "control" means (i) the power, direct or indirect, to cause the
      direction or management of such entity, whether by contract or
      otherwise, or (ii) ownership of fifty percent (50%) or more of the
      outstanding shares, or (iii) beneficial ownership of such entity.

      "You" (or "Your") shall mean an individual or Legal Entity
      exercising permissions granted by this License.

      "Source" form shall mean the preferred form for making modifications,
      including but not limited to software source code, documentation
      source, and configuration files.

      "Object" form shall mean any form resulting from mechanical
      transformation or translation of a Source form, including but
      not limited to compiled object code, generated documentation,
      and conversions to other media types.

      "Work" shall mean the work of authorship, whether in Source or
      Object form, made available under the License, as indicated by a
      copyright notice that is included in or attached to the work
      (an example is provided in the Appendix below).

      "Derivative Works" shall mean any work, whether in Source or Object
      form, that is based on (or derived from) the Work and for which the
      editorial revisions, annotations, elaborations, or other modifications
      represent, as a whole, an original work of authorship. For the purposes
      of this License, Derivative Works shall not include works that remain
      separable from, or merely link (or bind by name) to the interfaces of,
      the Work and Derivative Works thereof.

      "Contribution" shall mean any work of authorship, including
      the original version of the Work and any modifications or additions
      to that Work or Derivative Works thereof, that is intentionally
      submitted to Licensor for inclusion in the Work by the copyright owner
      or by an individual or Legal Entity authorized to submit on behalf of
      the copyright owner. For the purposes of this definition, "submitted"
      means any form of electronic, verbal, or written communication sent
      to the Licensor or its representatives, including but not limited to
      communication on electronic mailing lists, source code control systems,
      and issue tracking systems that are managed by, or on behalf of, the
      Licensor for the purpose of discussing and improving the Work, but
      excluding communication that is conspicuously marked or otherwise
      designated in writing by the copyright owner as "Not a Contribution."

      "Contributor" shall mean Licensor and any individual or Legal Entity
      on behalf of whom a Contribution has been received by Licensor and
      subsequently incorporated within the Work.

   2. Grant of Copyright License. Subject to the terms and conditions of
      this License, each Contributor hereby grants to You a perpetual,
      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
      copyright license to reproduce, prepare Derivative Works of,
      publicly display, publicly perform, sublicense, and distribute the
      Work and such Derivative Works in Source or Object form.

   3. Grant of Patent License. Subject to the terms and conditions of
      this License, each Contributor hereby grants to You a perpetual,
      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
      (except as stated in this section) patent license to make, have made,
      use, offer to sell, sell, import, and otherwise transfer the Work,
      where such license applies only to those patent claims licensable
      by such Contributor that are necessarily infringed by their
      Contribution(s) alone or by combination of their Contribution(s)
      with the Work to which such Contribution(s) was submitted. If You
      institute patent litigation against any entity (including a
      cross-claim or counterclaim in a lawsuit) alleging that the Work
      or a Contribution incorporated within the Work constitutes direct
      or contributory patent infringement, then any patent licenses
      granted to You under this License for that Work shall terminate
      as of the date such litigation is filed.

   4. Redistribution. You may reproduce and distribute copies of the
      Work or Derivative Works thereof in any medium, with or without
      modifications, and in Source or Object form, provided that You
      meet the following conditions:

      (a) You must give any other recipients of the Work or
          Derivative Works a copy of this License; and

      (b) You must cause any modified files to carry prominent notices
          stating that You changed the files; and

      (c) You must retain, in the Source form of any Derivative Works
          that You distribute, all copyright, patent, trademark, and
          attribution notices from the Source form of the Work,
          excluding those notices that do not pertain to any part of
          the Derivative Works; and

      (d) If the Work includes a "NOTICE" text file as part of its
          distribution, then any Derivative Works that You distribute must
          include a readable copy of the attribution notices contained
          within such NOTICE file, excluding those notices that do not
          pertain to any part of the Derivative Works, in at least one
          of the following places: within a NOTICE text file distributed
          as part of the Derivative Works; within the Source form or
          documentation, if provided along with the Derivative Works; or,
          within a display generated by the Derivative Works, if and
          wherever such third-party notices normally appear. The contents
          of the NOTICE file are for informational purposes only and
          do not modify the License. You may add Your own attribution
          notices within Derivative Works that You distribute, alongside
          or as an addendum to the NOTICE text from the Work, provided
          that such additional attribution notices cannot be construed
          as modifying the License.

      You may add Your own copyright statement to Your modifications and
      may provide additional or different license terms and conditions
      for use, reproduction, or distribution of Your modifications, or
      for any such Derivative Works as a whole, provided Your use,
      reproduction, and distribution of the Work otherwise complies with
      the conditions stated in this License.

   5. Submission of Contributions. Unless You explicitly state otherwise,
      any Contribution intentionally submitted for inclusion in the Work
      by You to the Licensor shall be under the terms and conditions of
      this License, without any additional terms or conditions.
      Notwithstanding the above, nothing herein shall supersede or modify
      the terms of any separate license agreement you may have executed
      with Licensor regarding such Contributions.

   6. Trademarks. This License does not grant permission to use the trade
      names, trademarks, service marks, or product names of the Licensor,
      except as required for reasonable and customary use in describing the
      origin of the Work and reproducing the content of the NOTICE file.

   7. Disclaimer of Warranty. Unless required by applicable law or
      agreed to in writing, Licensor provides the Work (and each
      Contributor provides its Contributions) on an "AS IS" BASIS,
      WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
      implied, including, without limitation, any warranties or conditions
      of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
      PARTICULAR PURPOSE. You are solely responsible for determining the
      appropriateness of using or redistributing the Work and assume any
      risks associated with Your exercise of permissions under this License.

   8. Limitation of Liability. In no event and under no legal theory,
      whether in tort (including negligence), contract, or otherwise,
      unless required by applicable law (such as deliberate and grossly
      negligent acts) or agreed to in writing, shall any Contributor be
      liable to You for damages, including any direct, indirect, special,
      incidental, or consequential damages of any character arising as a
      result of this License or out of the use or inability to use the
      Work (including but not limited to damages for loss of goodwill,
      work stoppage, computer failure or malfunction, or any and all
      other commercial damages or losses), even if such Contributor
      has been advised of the possibility of such damages.

   9. Accepting Warranty or Additional Liability. While redistributing
      the Work or Derivative Works thereof, You may choose to offer,
      and charge a fee for, acceptance of support, warranty, indemnity,
      or other liability obligations and/or rights consistent with this
      License. However, in accepting such obligations, You may act only
      on Your own behalf and on Your sole responsibility, not on behalf
      of any other Contributor, and only if You agree to indemnify,
      defend, and hold each Contributor harmless for any liability
      incurred by, or claims asserted against, such Contributor by reason
      of your accepting any such warranty or additional liability.

   END OF TERMS AND CONDITIONS

   APPENDIX: How to apply the Apache License to your work.

      To apply the Apache License to your work, attach the following
      boilerplate notice, with the fields enclosed by brackets "[]"
      replaced with your own identifying information. (Don't include
      the brackets!)  The text should be enclosed in the appropriate
      comment syntax for the file format. We also recommend that a
      file or class name and description of purpose be included on the
      same "printed page" as the copyright notice for easier
      identification within third-party archives.

   Copyright 2021-Present Datadog, Inc.

   Licensed under the Apache License, Version 2.0 (the "License");
   you may not use this file except in compliance with the License.
   You may obtain a copy of the License at

       http://www.apache.org/licenses/LICENSE-2.0

   Unless required by applicable law or agreed to in writing, software
   distributed under the License is distributed on an "AS IS" BASIS,
   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
   See the License for the specific language governing permissions and
   limitations under the License.


================================================
FILE: LICENSE-3rdparty.csv
================================================
Component,Origin,License,Copyright
adler2,https://github.com/oyvindln/adler2,0BSD OR MIT OR Apache-2.0,"Jonas Schievink <jonasschievink@gmail.com>, oyvindln <oyvindln@users.noreply.github.com>"
advapi32-sys,https://github.com/retep998/winapi-rs,MIT,Peter Atashian <retep998@gmail.com>
ahash,https://github.com/tkaitchuck/ahash,MIT OR Apache-2.0,Tom Kaitchuck <Tom.Kaitchuck@gmail.com>
aho-corasick,https://github.com/BurntSushi/aho-corasick,Unlicense OR MIT,Andrew Gallant <jamslam@gmail.com>
aliasable,https://github.com/avitex/rust-aliasable,MIT,avitex <avitex@wfxlabs.com>
alloca,https://github.com/playXE/alloca-rs,MIT,"Adel Prokurov <adel.prokurov@gmail.com>, StackOverflowExcept1on"
allocator-api2,https://github.com/zakarumych/allocator-api2,MIT OR Apache-2.0,Zakarum <zaq.dev@icloud.com>
android_system_properties,https://github.com/nical/android_system_properties,MIT OR Apache-2.0,Nicolas Silva <nical@fastmail.com>
anes,https://github.com/zrzka/anes-rs,MIT OR Apache-2.0,Robert Vojta <rvojta@me.com>
ansi-str,https://github.com/zhiburt/ansi-str,MIT,Maxim Zhiburt <zhiburt@gmail.com>
ansitok,https://gitlab.com/zhiburt/ansitok,MIT,Maxim Zhiburt <zhiburt@gmail.com>
anstream,https://github.com/rust-cli/anstyle,MIT OR Apache-2.0,The anstream Authors
anstyle,https://github.com/rust-cli/anstyle,MIT OR Apache-2.0,The anstyle Authors
anstyle-parse,https://github.com/rust-cli/anstyle,MIT OR Apache-2.0,The anstyle-parse Authors
anstyle-query,https://github.com/rust-cli/anstyle,MIT OR Apache-2.0,The anstyle-query Authors
anstyle-wincon,https://github.com/rust-cli/anstyle,MIT OR Apache-2.0,The anstyle-wincon Authors
anyhow,https://github.com/dtolnay/anyhow,MIT OR Apache-2.0,David Tolnay <dtolnay@gmail.com>
arc-swap,https://github.com/vorner/arc-swap,MIT OR Apache-2.0,Michal 'vorner' Vaner <vorner@vorner.cz>
arrayvec,https://github.com/bluss/arrayvec,MIT OR Apache-2.0,bluss
assert-json-diff,https://github.com/davidpdrsn/assert-json-diff,MIT,David Pedersen <david.pdrsn@gmail.com>
async-compression,https://github.com/Nullus157/async-compression,MIT OR Apache-2.0,"Wim Looman <wim@nemo157.com>, Allen Bui <fairingrey@gmail.com>"
async-speed-limit,https://github.com/tikv/async-speed-limit,MIT OR Apache-2.0,The TiKV Project Developers
async-stream,https://github.com/tokio-rs/async-stream,MIT,Carl Lerche <me@carllerche.com>
async-stream-impl,https://github.com/tokio-rs/async-stream,MIT,Carl Lerche <me@carllerche.com>
async-trait,https://github.com/dtolnay/async-trait,MIT OR Apache-2.0,David Tolnay <dtolnay@gmail.com>
atomic-waker,https://github.com/smol-rs/atomic-waker,Apache-2.0 OR MIT,"Stjepan Glavina <stjepang@gmail.com>, Contributors to futures-rs"
aws-config,https://github.com/smithy-lang/smithy-rs,Apache-2.0,"AWS Rust SDK Team <aws-sdk-rust@amazon.com>, Russell Cohen <rcoh@amazon.com>"
aws-credential-types,https://github.com/smithy-lang/smithy-rs,Apache-2.0,AWS Rust SDK Team <aws-sdk-rust@amazon.com>
aws-lc-rs,https://github.com/aws/aws-lc-rs,ISC AND (Apache-2.0 OR ISC),AWS-LibCrypto
aws-lc-sys,https://github.com/aws/aws-lc-rs,ISC AND (Apache-2.0 OR ISC) AND OpenSSL,AWS-LC
aws-runtime,https://github.com/smithy-lang/smithy-rs,Apache-2.0,AWS Rust SDK Team <aws-sdk-rust@amazon.com>
aws-sdk-lambda,https://github.com/awslabs/aws-sdk-rust,Apache-2.0,"AWS Rust SDK Team <aws-sdk-rust@amazon.com>, Russell Cohen <rcoh@amazon.com>"
aws-sdk-s3,https://github.com/awslabs/aws-sdk-rust,Apache-2.0,"AWS Rust SDK Team <aws-sdk-rust@amazon.com>, Russell Cohen <rcoh@amazon.com>"
aws-sdk-sso,https://github.com/awslabs/aws-sdk-rust,Apache-2.0,"AWS Rust SDK Team <aws-sdk-rust@amazon.com>, Russell Cohen <rcoh@amazon.com>"
aws-sdk-ssooidc,https://github.com/awslabs/aws-sdk-rust,Apache-2.0,"AWS Rust SDK Team <aws-sdk-rust@amazon.com>, Russell Cohen <rcoh@amazon.com>"
aws-sdk-sts,https://github.com/awslabs/aws-sdk-rust,Apache-2.0,"AWS Rust SDK Team <aws-sdk-rust@amazon.com>, Russell Cohen <rcoh@amazon.com>"
aws-sigv4,https://github.com/smithy-lang/smithy-rs,Apache-2.0,"AWS Rust SDK Team <aws-sdk-rust@amazon.com>, David Barsky <me@davidbarsky.com>"
aws-smithy-async,https://github.com/smithy-lang/smithy-rs,Apache-2.0,"AWS Rust SDK Team <aws-sdk-rust@amazon.com>, John DiSanti <jdisanti@amazon.com>"
aws-smithy-checksums,https://github.com/smithy-lang/smithy-rs,Apache-2.0,"AWS Rust SDK Team <aws-sdk-rust@amazon.com>, Zelda Hessler <zhessler@amazon.com>"
aws-smithy-eventstream,https://github.com/smithy-lang/smithy-rs,Apache-2.0,"AWS Rust SDK Team <aws-sdk-rust@amazon.com>, John DiSanti <jdisanti@amazon.com>"
aws-smithy-http,https://github.com/smithy-lang/smithy-rs,Apache-2.0,"AWS Rust SDK Team <aws-sdk-rust@amazon.com>, Russell Cohen <rcoh@amazon.com>"
aws-smithy-http-client,https://github.com/smithy-lang/smithy-rs,Apache-2.0,AWS Rust SDK Team <aws-sdk-rust@amazon.com>
aws-smithy-json,https://github.com/smithy-lang/smithy-rs,Apache-2.0,"AWS Rust SDK Team <aws-sdk-rust@amazon.com>, John DiSanti <jdisanti@amazon.com>"
aws-smithy-observability,https://github.com/awslabs/smithy-rs,Apache-2.0,AWS Rust SDK Team <aws-sdk-rust@amazon.com>
aws-smithy-protocol-test,https://github.com/smithy-lang/smithy-rs,Apache-2.0,"AWS Rust SDK Team <aws-sdk-rust@amazon.com>, Russell Cohen <rcoh@amazon.com>"
aws-smithy-query,https://github.com/smithy-lang/smithy-rs,Apache-2.0,"AWS Rust SDK Team <aws-sdk-rust@amazon.com>, John DiSanti <jdisanti@amazon.com>"
aws-smithy-runtime,https://github.com/smithy-lang/smithy-rs,Apache-2.0,"AWS Rust SDK Team <aws-sdk-rust@amazon.com>, Zelda Hessler <zhessler@amazon.com>"
aws-smithy-runtime-api,https://github.com/smithy-lang/smithy-rs,Apache-2.0,"AWS Rust SDK Team <aws-sdk-rust@amazon.com>, Zelda Hessler <zhessler@amazon.com>"
aws-smithy-types,https://github.com/smithy-lang/smithy-rs,Apache-2.0,"AWS Rust SDK Team <aws-sdk-rust@amazon.com>, Russell Cohen <rcoh@amazon.com>"
aws-smithy-xml,https://github.com/smithy-lang/smithy-rs,Apache-2.0,"AWS Rust SDK Team <aws-sdk-rust@amazon.com>, Russell Cohen <rcoh@amazon.com>"
aws-types,https://github.com/smithy-lang/smithy-rs,Apache-2.0,"AWS Rust SDK Team <aws-sdk-rust@amazon.com>, Russell Cohen <rcoh@amazon.com>"
axum,https://github.com/tokio-rs/axum,MIT,The axum Authors
axum-core,https://github.com/tokio-rs/axum,MIT,The axum-core Authors
base16ct,https://github.com/RustCrypto/formats/tree/master/base16ct,Apache-2.0 OR MIT,RustCrypto Developers
base64,https://github.com/marshallpierce/rust-base64,MIT OR Apache-2.0,Marshall Pierce <marshall@mpierce.org>
base64-simd,https://github.com/Nugine/simd,MIT,The base64-simd Authors
base64ct,https://github.com/RustCrypto/formats,Apache-2.0 OR MIT,RustCrypto Developers
bit-set,https://github.com/contain-rs/bit-set,Apache-2.0 OR MIT,Alexis Beingessner <a.beingessner@gmail.com>
bit-vec,https://github.com/contain-rs/bit-vec,Apache-2.0 OR MIT,Alexis Beingessner <a.beingessner@gmail.com>
bitflags,https://github.com/bitflags/bitflags,MIT OR Apache-2.0,The Rust Project Developers
bitpacking,https://github.com/quickwit-oss/bitpacking,MIT,Paul Masurel <paul.masurel@gmail.com>
block-buffer,https://github.com/RustCrypto/utils,MIT OR Apache-2.0,RustCrypto Developers
bon,https://github.com/elastio/bon,MIT OR Apache-2.0,The bon Authors
bon-macros,https://github.com/elastio/bon,MIT OR Apache-2.0,The bon-macros Authors
bpu_trasher,https://github.com/pseitz/bpu_trasher,MIT,Pascal Seitz <pascal.seitz@gmail.com>
bs58,https://github.com/Nullus157/bs58-rs,MIT OR Apache-2.0,The bs58 Authors
bumpalo,https://github.com/fitzgen/bumpalo,MIT OR Apache-2.0,Nick Fitzgerald <fitzgen@gmail.com>
bytecount,https://github.com/llogiq/bytecount,Apache-2.0 OR MIT,"Andre Bogus <bogusandre@gmail.de>, Joshua Landau <joshua@landau.ws>"
byteorder,https://github.com/BurntSushi/byteorder,Unlicense OR MIT,Andrew Gallant <jamslam@gmail.com>
bytes,https://github.com/tokio-rs/bytes,MIT,"Carl Lerche <me@carllerche.com>, Sean McArthur <sean@seanmonstar.com>"
bytes-utils,https://github.com/vorner/bytes-utils,Apache-2.0 OR MIT,Michal 'vorner' Vaner <vorner@vorner.cz>
bytesize,https://github.com/bytesize-rs/bytesize,Apache-2.0,"Hyunsik Choi <hyunsik.choi@gmail.com>, MrCroxx <mrcroxx@outlook.com>, Rob Ede <robjtede@icloud.com>"
bytestring,https://github.com/actix/actix-net,MIT OR Apache-2.0,"Nikolay Kim <fafhrd91@gmail.com>, Rob Ede <robjtede@icloud.com>"
camino,https://github.com/camino-rs/camino,MIT OR Apache-2.0,"Without Boats <saoirse@without.boats>, Ashley Williams <ashley666ashley@gmail.com>, Steve Klabnik <steve@steveklabnik.com>, Rain <rain@sunshowers.io>"
cargo-platform,https://github.com/rust-lang/cargo,MIT OR Apache-2.0,The cargo-platform Authors
cargo_metadata,https://github.com/oli-obk/cargo_metadata,MIT,Oliver Schneider <git-spam-no-reply9815368754983@oli-obk.de>
cast,https://github.com/japaric/cast.rs,MIT OR Apache-2.0,Jorge Aparicio <jorge@japaric.io>
cbor-diag,https://github.com/Nullus157/cbor-diag-rs,MIT OR Apache-2.0,The cbor-diag Authors
cc,https://github.com/rust-lang/cc-rs,MIT OR Apache-2.0,Alex Crichton <alex@alexcrichton.com>
census,https://github.com/quickwit-inc/census,MIT,Paul Masurel <paul.masurel@gmail.com>
cfg-if,https://github.com/rust-lang/cfg-if,MIT OR Apache-2.0,Alex Crichton <alex@alexcrichton.com>
chitchat,https://github.com/quickwit-oss/chitchat,MIT,"Quickwit, Inc. <hello@quickwit.io>"
chrono,https://github.com/chronotope/chrono,MIT OR Apache-2.0,The chrono Authors
ciborium,https://github.com/enarx/ciborium,Apache-2.0,Nathaniel McCallum <npmccallum@profian.com>
ciborium-io,https://github.com/enarx/ciborium,Apache-2.0,Nathaniel McCallum <npmccallum@profian.com>
ciborium-ll,https://github.com/enarx/ciborium,Apache-2.0,Nathaniel McCallum <npmccallum@profian.com>
clap,https://github.com/clap-rs/clap,MIT OR Apache-2.0,The clap Authors
clap_builder,https://github.com/clap-rs/clap,MIT OR Apache-2.0,The clap_builder Authors
clap_lex,https://github.com/clap-rs/clap,MIT OR Apache-2.0,The clap_lex Authors
coarsetime,https://github.com/jedisct1/rust-coarsetime,ISC,Frank Denis <github@pureftpd.org>
cobs,https://github.com/jamesmunns/cobs.rs,MIT OR Apache-2.0,"Allen Welkie <>, James Munns <james@onevariable.com>"
colorchoice,https://github.com/rust-cli/anstyle,MIT OR Apache-2.0,The colorchoice Authors
colored,https://github.com/mackwic/colored,MPL-2.0,Thomas Wickham <mackwic@gmail.com>
compression-codecs,https://github.com/Nullus157/async-compression,MIT OR Apache-2.0,"Wim Looman <wim@nemo157.com>, Allen Bui <fairingrey@gmail.com>"
compression-core,https://github.com/Nullus157/async-compression,MIT OR Apache-2.0,"Wim Looman <wim@nemo157.com>, Allen Bui <fairingrey@gmail.com>"
console,https://github.com/console-rs/console,MIT,The console Authors
const-oid,https://github.com/RustCrypto/formats/tree/master/const-oid,Apache-2.0 OR MIT,RustCrypto Developers
core-foundation,https://github.com/servo/core-foundation-rs,MIT OR Apache-2.0,The Servo Project Developers
core-foundation-sys,https://github.com/servo/core-foundation-rs,MIT OR Apache-2.0,The Servo Project Developers
cpufeatures,https://github.com/RustCrypto/utils,MIT OR Apache-2.0,RustCrypto Developers
crc32c,https://github.com/zowens/crc32c,Apache-2.0 OR MIT,Zack Owens
crc32fast,https://github.com/srijs/rust-crc32fast,MIT OR Apache-2.0,"Sam Rijs <srijs@airpost.net>, Alex Crichton <alex@alexcrichton.com>"
criterion-plot,https://github.com/criterion-rs/criterion.rs,Apache-2.0 OR MIT,"Jorge Aparicio <japaricious@gmail.com>, Brook Heisler <brookheisler@gmail.com>"
cron,https://github.com/zslayton/cron,MIT OR Apache-2.0,Zack Slayton <zack.slayton@gmail.com>
crossbeam-channel,https://github.com/crossbeam-rs/crossbeam,MIT OR Apache-2.0,The crossbeam-channel Authors
crossbeam-deque,https://github.com/crossbeam-rs/crossbeam,MIT OR Apache-2.0,The crossbeam-deque Authors
crossbeam-epoch,https://github.com/crossbeam-rs/crossbeam,MIT OR Apache-2.0,The crossbeam-epoch Authors
crossbeam-utils,https://github.com/crossbeam-rs/crossbeam,MIT OR Apache-2.0,The crossbeam-utils Authors
crunchy,https://github.com/eira-fransham/crunchy,MIT,Eira Fransham <jackefransham@gmail.com>
crypto-bigint,https://github.com/RustCrypto/crypto-bigint,Apache-2.0 OR MIT,RustCrypto Developers
crypto-common,https://github.com/RustCrypto/traits,MIT OR Apache-2.0,RustCrypto Developers
darling,https://github.com/TedDriggs/darling,MIT,Ted Driggs <ted.driggs@outlook.com>
darling_core,https://github.com/TedDriggs/darling,MIT,Ted Driggs <ted.driggs@outlook.com>
darling_macro,https://github.com/TedDriggs/darling,MIT,Ted Driggs <ted.driggs@outlook.com>
dashmap,https://github.com/xacrimon/dashmap,MIT,Acrimon <joel.wejdenstal@gmail.com>
data-encoding,https://github.com/ia0/data-encoding,MIT,Julien Cretin <git@ia0.eu>
deadpool,https://github.com/bikeshedder/deadpool,MIT OR Apache-2.0,Michael P. Jung <michael.jung@terreon.de>
deadpool-runtime,https://github.com/bikeshedder/deadpool,MIT OR Apache-2.0,Michael P. Jung <michael.jung@terreon.de>
der,https://github.com/RustCrypto/formats/tree/master/der,Apache-2.0 OR MIT,RustCrypto Developers
deranged,https://github.com/jhpratt/deranged,MIT OR Apache-2.0,Jacob Pratt <jacob@jhpratt.dev>
dialoguer,https://github.com/console-rs/dialoguer,MIT,The dialoguer Authors
diff,https://github.com/utkarshkukreti/diff.rs,MIT OR Apache-2.0,Utkarsh Kukreti <utkarshkukreti@gmail.com>
difflib,https://github.com/DimaKudosh/difflib,MIT,Dima Kudosh <dimakudosh@gmail.com>
digest,https://github.com/RustCrypto/traits,MIT OR Apache-2.0,RustCrypto Developers
displaydoc,https://github.com/yaahc/displaydoc,MIT OR Apache-2.0,Jane Lusby <jlusby@yaah.dev>
downcast,https://github.com/fkoep/downcast-rs,MIT,Felix Köpge <fkoep@mailbox.org>
downcast-rs,https://github.com/marcianx/downcast-rs,MIT OR Apache-2.0,The downcast-rs Authors
dtoa,https://github.com/dtolnay/dtoa,MIT OR Apache-2.0,David Tolnay <dtolnay@gmail.com>
dyn-clone,https://github.com/dtolnay/dyn-clone,MIT OR Apache-2.0,David Tolnay <dtolnay@gmail.com>
ecdsa,https://github.com/RustCrypto/signatures/tree/master/ecdsa,Apache-2.0 OR MIT,RustCrypto Developers
either,https://github.com/rayon-rs/either,MIT OR Apache-2.0,bluss
elasticsearch-dsl,https://github.com/vinted/elasticsearch-dsl-rs,MIT OR Apache-2.0,"Evaldas Buinauskas <evaldas.buinauskas@vinted.com>, Search Platform <search-platform@vinted.com>"
elliptic-curve,https://github.com/RustCrypto/traits/tree/master/elliptic-curve,Apache-2.0 OR MIT,RustCrypto Developers
embedded-io,https://github.com/embassy-rs/embedded-io,MIT OR Apache-2.0,The embedded-io Authors
embedded-io,https://github.com/rust-embedded/embedded-hal,MIT OR Apache-2.0,The embedded-io Authors
encode_unicode,https://github.com/tormol/encode_unicode,Apache-2.0 OR MIT,Torbjørn Birch Moltu <t.b.moltu@lyse.net>
encoding_rs,https://github.com/hsivonen/encoding_rs,(Apache-2.0 OR MIT) AND BSD-3-Clause,Henri Sivonen <hsivonen@hsivonen.fi>
enum-iterator,https://github.com/stephaneyfx/enum-iterator,0BSD,Stephane Raux <stephaneyfx@gmail.com>
enum-iterator-derive,https://github.com/stephaneyfx/enum-iterator,0BSD,Stephane Raux <stephaneyfx@gmail.com>
env_filter,https://github.com/rust-cli/env_logger,MIT OR Apache-2.0,The env_filter Authors
env_logger,https://github.com/rust-cli/env_logger,MIT OR Apache-2.0,The env_logger Authors
equivalent,https://github.com/indexmap-rs/equivalent,Apache-2.0 OR MIT,The equivalent Authors
erased-serde,https://github.com/dtolnay/erased-serde,MIT OR Apache-2.0,David Tolnay <dtolnay@gmail.com>
errno,https://github.com/lambda-fairy/rust-errno,MIT OR Apache-2.0,"Chris Wong <lambda.fairy@gmail.com>, Dan Gohman <dev@sunfishcode.online>"
error-chain,https://github.com/rust-lang-nursery/error-chain,MIT OR Apache-2.0,"Brian Anderson <banderson@mozilla.com>, Paul Colomiets <paul@colomiets.name>, Colin Kiegel <kiegel@gmx.de>, Yamakaky <yamakaky@yamaworld.fr>, Andrew Gauger <andygauge@gmail.com>"
fail,https://github.com/tikv/fail-rs,Apache-2.0,The TiKV Project Developers
fastdivide,https://github.com/fulmicoton/fastdivide,zlib-acknowledgement OR MIT,Paul Masurel <paul.masurel@gmail.com>
fastrand,https://github.com/smol-rs/fastrand,Apache-2.0 OR MIT,Stjepan Glavina <stjepang@gmail.com>
ff,https://github.com/zkcrypto/ff,MIT OR Apache-2.0,"Sean Bowe <ewillbefull@gmail.com>, Jack Grigg <thestr4d@gmail.com>"
find-msvc-tools,https://github.com/rust-lang/cc-rs,MIT OR Apache-2.0,The find-msvc-tools Authors
fixedbitset,https://github.com/petgraph/fixedbitset,MIT OR Apache-2.0,bluss
flate2,https://github.com/rust-lang/flate2-rs,MIT OR Apache-2.0,"Alex Crichton <alex@alexcrichton.com>, Josh Triplett <josh@joshtriplett.org>"
float-cmp,https://github.com/mikedilger/float-cmp,MIT,Mike Dilger <mike@mikedilger.com>
flume,https://github.com/zesterer/flume,Apache-2.0 OR MIT,Joshua Barretto <joshua.s.barretto@gmail.com>
fnv,https://github.com/servo/rust-fnv,Apache-2.0  OR  MIT,Alex Crichton <alex@alexcrichton.com>
foldhash,https://github.com/orlp/foldhash,Zlib,Orson Peters <orsonpeters@gmail.com>
form_urlencoded,https://github.com/servo/rust-url,MIT OR Apache-2.0,The rust-url developers
fragile,https://github.com/mitsuhiko/fragile,Apache-2.0,Armin Ronacher <armin.ronacher@active-4.com>
fs4,https://github.com/al8n/fs4-rs,MIT OR Apache-2.0,"Dan Burkert <dan@danburkert.com>, Al Liu <scygliu1@gmail.com>"
fslock,https://github.com/brunoczim/fslock,MIT,The fslock Authors
futures,https://github.com/rust-lang/futures-rs,MIT OR Apache-2.0,The futures Authors
futures-channel,https://github.com/rust-lang/futures-rs,MIT OR Apache-2.0,The futures-channel Authors
futures-core,https://github.com/rust-lang/futures-rs,MIT OR Apache-2.0,The futures-core Authors
futures-executor,https://github.com/rust-lang/futures-rs,MIT OR Apache-2.0,The futures-executor Authors
futures-io,https://github.com/rust-lang/futures-rs,MIT OR Apache-2.0,The futures-io Authors
futures-macro,https://github.com/rust-lang/futures-rs,MIT OR Apache-2.0,The futures-macro Authors
futures-sink,https://github.com/rust-lang/futures-rs,MIT OR Apache-2.0,The futures-sink Authors
futures-task,https://github.com/rust-lang/futures-rs,MIT OR Apache-2.0,The futures-task Authors
futures-timer,https://github.com/async-rs/futures-timer,MIT OR Apache-2.0,Alex Crichton <alex@alexcrichton.com>
futures-util,https://github.com/rust-lang/futures-rs,MIT OR Apache-2.0,The futures-util Authors
generic-array,https://github.com/fizyk20/generic-array,MIT,"Bartłomiej Kamiński <fizyk20@gmail.com>, Aaron Trent <novacrazy@gmail.com>"
getrandom,https://github.com/rust-random/getrandom,MIT OR Apache-2.0,The Rand Project Developers
glob,https://github.com/rust-lang/glob,MIT OR Apache-2.0,The Rust Project Developers
governor,https://github.com/boinkor-net/governor,MIT,Andreas Fuchs <asf@boinkor.net>
group,https://github.com/zkcrypto/group,MIT OR Apache-2.0,"Sean Bowe <ewillbefull@gmail.com>, Jack Grigg <jack@z.cash>"
h2,https://github.com/hyperium/h2,MIT,"Carl Lerche <me@carllerche.com>, Sean McArthur <sean@seanmonstar.com>"
half,https://github.com/VoidStarKat/half-rs,MIT OR Apache-2.0,Kathryn Long <squeeself@gmail.com>
hashbrown,https://github.com/rust-lang/hashbrown,MIT OR Apache-2.0,Amanieu d'Antras <amanieu@gmail.com>
headers,https://github.com/hyperium/headers,MIT,Sean McArthur <sean@seanmonstar.com>
headers-core,https://github.com/hyperium/headers,MIT,Sean McArthur <sean@seanmonstar.com>
heck,https://github.com/withoutboats/heck,MIT OR Apache-2.0,The heck Authors
heck,https://github.com/withoutboats/heck,MIT OR Apache-2.0,Without Boats <woboats@gmail.com>
hermit-abi,https://github.com/hermit-os/hermit-rs,MIT OR Apache-2.0,Stefan Lankes
hex,https://github.com/KokaKiwi/rust-hex,MIT OR Apache-2.0,KokaKiwi <kokakiwi@kokakiwi.net>
hmac,https://github.com/RustCrypto/MACs,MIT OR Apache-2.0,RustCrypto Developers
home,https://github.com/rust-lang/cargo,MIT OR Apache-2.0,Brian Anderson <andersrb@gmail.com>
hostname,https://github.com/djc/hostname,MIT,The hostname Authors
htmlescape,https://github.com/veddan/rust-htmlescape,Apache-2.0  OR  MIT  OR  MPL-2.0,Viktor Dahl <pazaconyoman@gmail.com>
http,https://github.com/hyperium/http,MIT OR Apache-2.0,"Alex Crichton <alex@alexcrichton.com>, Carl Lerche <me@carllerche.com>, Sean McArthur <sean@seanmonstar.com>"
http-body,https://github.com/hyperium/http-body,MIT,"Carl Lerche <me@carllerche.com>, Lucio Franco <luciofranco14@gmail.com>, Sean McArthur <sean@seanmonstar.com>"
http-body-util,https://github.com/hyperium/http-body,MIT,"Carl Lerche <me@carllerche.com>, Lucio Franco <luciofranco14@gmail.com>, Sean McArthur <sean@seanmonstar.com>"
http-serde,https://gitlab.com/kornelski/http-serde,Apache-2.0 OR MIT,Kornel <kornel@geekhood.net>
httparse,https://github.com/seanmonstar/httparse,MIT OR Apache-2.0,Sean McArthur <sean@seanmonstar.com>
httpdate,https://github.com/pyfisch/httpdate,MIT OR Apache-2.0,Pyfisch <pyfisch@posteo.org>
humantime,https://github.com/chronotope/humantime,MIT OR Apache-2.0,The humantime Authors
hyper,https://github.com/hyperium/hyper,MIT,Sean McArthur <sean@seanmonstar.com>
hyper-rustls,https://github.com/rustls/hyper-rustls,Apache-2.0 OR ISC OR MIT,The hyper-rustls Authors
hyper-timeout,https://github.com/hjr3/hyper-timeout,MIT OR Apache-2.0,Herman J. Radtke III <herman@hermanradtke.com>
hyper-util,https://github.com/hyperium/hyper-util,MIT,Sean McArthur <sean@seanmonstar.com>
hyperloglogplus,https://github.com/tabac/hyperloglog.rs,MIT,Tasos Bakogiannis <t.bakogiannis@gmail.com>
iana-time-zone,https://github.com/strawlab/iana-time-zone,MIT OR Apache-2.0,"Andrew Straw <strawman@astraw.com>, René Kijewski <rene.kijewski@fu-berlin.de>, Ryan Lopopolo <rjl@hyperbo.la>"
iana-time-zone-haiku,https://github.com/strawlab/iana-time-zone,MIT OR Apache-2.0,René Kijewski <crates.io@k6i.de>
icu_collections,https://github.com/unicode-org/icu4x,Unicode-3.0,The ICU4X Project Developers
icu_locale_core,https://github.com/unicode-org/icu4x,Unicode-3.0,The ICU4X Project Developers
icu_normalizer,https://github.com/unicode-org/icu4x,Unicode-3.0,The ICU4X Project Developers
icu_normalizer_data,https://github.com/unicode-org/icu4x,Unicode-3.0,The ICU4X Project Developers
icu_properties,https://github.com/unicode-org/icu4x,Unicode-3.0,The ICU4X Project Developers
icu_properties_data,https://github.com/unicode-org/icu4x,Unicode-3.0,The ICU4X Project Developers
icu_provider,https://github.com/unicode-org/icu4x,Unicode-3.0,The ICU4X Project Developers
ident_case,https://github.com/TedDriggs/ident_case,MIT OR Apache-2.0,Ted Driggs <ted.driggs@outlook.com>
idna,https://github.com/servo/rust-url,MIT OR Apache-2.0,The rust-url developers
idna_adapter,https://github.com/hsivonen/idna_adapter,Apache-2.0 OR MIT,The rust-url developers
indexmap,https://github.com/bluss/indexmap,Apache-2.0 OR MIT,The indexmap Authors
indexmap,https://github.com/indexmap-rs/indexmap,Apache-2.0 OR MIT,The indexmap Authors
indicatif,https://github.com/console-rs/indicatif,MIT,The indicatif Authors
inventory,https://github.com/dtolnay/inventory,MIT OR Apache-2.0,David Tolnay <dtolnay@gmail.com>
ipnet,https://github.com/krisprice/ipnet,MIT OR Apache-2.0,Kris Price <kris@krisprice.nz>
ipnetwork,https://github.com/achanda/ipnetwork,MIT OR Apache-2.0,"Abhishek Chanda <abhishek.becs@gmail.com>, Linus Färnstrand <faern@faern.net>"
iri-string,https://github.com/lo48576/iri-string,MIT OR Apache-2.0,YOSHIOKA Takuma <nop_thread@nops.red>
is-terminal,https://github.com/sunfishcode/is-terminal,MIT,"softprops <d.tangren@gmail.com>, Dan Gohman <dev@sunfishcode.online>"
is_terminal_polyfill,https://github.com/polyfill-rs/is_terminal_polyfill,MIT OR Apache-2.0,The is_terminal_polyfill Authors
itertools,https://github.com/rust-itertools/itertools,MIT OR Apache-2.0,bluss
itoa,https://github.com/dtolnay/itoa,MIT OR Apache-2.0,David Tolnay <dtolnay@gmail.com>
jobserver,https://github.com/rust-lang/jobserver-rs,MIT OR Apache-2.0,Alex Crichton <alex@alexcrichton.com>
js-sys,https://github.com/wasm-bindgen/wasm-bindgen/tree/master/crates/js-sys,MIT OR Apache-2.0,The wasm-bindgen Developers
json_comments,https://github.com/tmccombs/json-comments-rs,Apache-2.0,Thayne McCombs <astrothayne@gmail.com>
lambda_runtime,https://github.com/awslabs/aws-lambda-rust-runtime,Apache-2.0,"David Calavera <dcalaver@amazon.com>, Harold Sun <sunhua@amazon.com>"
lambda_runtime_api_client,https://github.com/awslabs/aws-lambda-rust-runtime,Apache-2.0,"David Calavera <dcalaver@amazon.com>, Harold Sun <sunhua@amazon.com>"
lazy_static,https://github.com/rust-lang-nursery/lazy-static.rs,MIT OR Apache-2.0,Marvin Löbel <loebel.marvin@gmail.com>
levenshtein_automata,https://github.com/tantivy-search/levenshtein-automata,MIT,Paul Masurel <paul.masurel@gmail.com>
libc,https://github.com/rust-lang/libc,MIT OR Apache-2.0,The Rust Project Developers
libm,https://github.com/rust-lang/compiler-builtins,MIT,Jorge Aparicio <jorge@japaric.io>
linked-hash-map,https://github.com/contain-rs/linked-hash-map,MIT OR Apache-2.0,"Stepan Koltsov <stepan.koltsov@gmail.com>, Andrew Paseltiner <apaseltiner@gmail.com>"
linux-raw-sys,https://github.com/sunfishcode/linux-raw-sys,Apache-2.0 WITH LLVM-exception OR Apache-2.0 OR MIT,Dan Gohman <dev@sunfishcode.online>
litemap,https://github.com/unicode-org/icu4x,Unicode-3.0,The ICU4X Project Developers
lock_api,https://github.com/Amanieu/parking_lot,MIT OR Apache-2.0,Amanieu d'Antras <amanieu@gmail.com>
log,https://github.com/rust-lang/log,MIT OR Apache-2.0,The Rust Project Developers
lru,https://github.com/jeromefroe/lru-rs,MIT,Jerome Froelich <jeromefroelic@hotmail.com>
lru-slab,https://github.com/Ralith/lru-slab,MIT OR Apache-2.0 OR Zlib,Benjamin Saunders <ben.e.saunders@gmail.com>
lz4_flex,https://github.com/pseitz/lz4_flex,MIT,"Pascal Seitz <pascal.seitz@gmail.com>, Arthur Silva <arthurprs@gmail.com>, ticki <Ticki@users.noreply.github.com>"
matchers,https://github.com/hawkw/matchers,MIT,Eliza Weisman <eliza@buoyant.io>
matchit,https://github.com/ibraheemdev/matchit,MIT AND BSD-3-Clause,Ibraheem Ahmed <ibraheem@ibraheem.ca>
md-5,https://github.com/RustCrypto/hashes,MIT OR Apache-2.0,RustCrypto Developers
md5,https://github.com/stainless-steel/md5,Apache-2.0 OR MIT,"Ivan Ukhov <ivan.ukhov@gmail.com>, Kamal Ahmad <shibe@openmailbox.org>, Konstantin Stepanov <milezv@gmail.com>, Lukas Kalbertodt <lukas.kalbertodt@gmail.com>, Nathan Musoke <nathan.musoke@gmail.com>, Scott Mabin <scott@mabez.dev>, Tony Arcieri <bascule@gmail.com>, Wim de With <register@dewith.io>, Yosef Dinerstein <yosefdi@gmail.com>"
measure_time,https://github.com/PSeitz/rust_measure_time,MIT,Pascal Seitz <pascal.seitz@gmail.com>
memchr,https://github.com/BurntSushi/memchr,Unlicense OR MIT,"Andrew Gallant <jamslam@gmail.com>, bluss"
memmap2,https://github.com/RazrFalcon/memmap2-rs,MIT OR Apache-2.0,"Dan Burkert <dan@danburkert.com>, Yevhenii Reizner <razrfalcon@gmail.com>"
mime,https://github.com/hyperium/mime,MIT OR Apache-2.0,Sean McArthur <sean@seanmonstar.com>
mime_guess,https://github.com/abonander/mime_guess,MIT,Austin Bonander <austin.bonander@gmail.com>
mini-internal,https://github.com/dtolnay/miniserde,MIT OR Apache-2.0,David Tolnay <dtolnay@gmail.com>
mini-moka,https://github.com/moka-rs/mini-moka,MIT OR Apache-2.0,The mini-moka Authors
minimal-lexical,https://github.com/Alexhuszagh/minimal-lexical,MIT OR Apache-2.0,Alex Huszagh <ahuszagh@gmail.com>
miniserde,https://github.com/dtolnay/miniserde,MIT OR Apache-2.0,David Tolnay <dtolnay@gmail.com>
miniz_oxide,https://github.com/Frommi/miniz_oxide/tree/master/miniz_oxide,MIT OR Zlib OR Apache-2.0,"Frommi <daniil.liferenko@gmail.com>, oyvindln <oyvindln@users.noreply.github.com>, Rich Geldreich richgel99@gmail.com"
mio,https://github.com/tokio-rs/mio,MIT,"Carl Lerche <me@carllerche.com>, Thomas de Zeeuw <thomasdezeeuw@gmail.com>, Tokio Contributors <team@tokio.rs>"
mockall,https://github.com/asomers/mockall,MIT OR Apache-2.0,Alan Somers <asomers@gmail.com>
mockall_derive,https://github.com/asomers/mockall,MIT OR Apache-2.0,Alan Somers <asomers@gmail.com>
mrecordlog,https://github.com/quickwit-oss/mrecordlog,MIT,The mrecordlog Authors
multimap,https://github.com/havarnov/multimap,MIT OR Apache-2.0,Håvar Nøvik <havar.novik@gmail.com>
murmurhash32,https://github.com/quickwit-inc/murmurhash32,MIT,Paul Masurel <paul.masurel@gmail.com>
new_string_template,https://github.com/hasezoey/new_string_template,MIT,hasezoey <hasezoey@gmail.com>
no-std-net,https://github.com/dunmatt/no-std-net,MIT,M@ Dunlap <mattdunlap@gmail.com>
nom,https://github.com/Geal/nom,MIT,contact@geoffroycouprie.com
nom,https://github.com/rust-bakery/nom,MIT,contact@geoffroycouprie.com
nonzero_ext,https://github.com/antifuchs/nonzero_ext,Apache-2.0,Andreas Fuchs <asf@boinkor.net>
normalize-line-endings,https://github.com/derekdreery/normalize-line-endings,Apache-2.0,Richard Dodd <richdodj@gmail.com>
nu-ansi-term,https://github.com/nushell/nu-ansi-term,MIT,"ogham@bsago.me, Ryan Scheel (Havvy) <ryan.havvy@gmail.com>, Josh Triplett <josh@joshtriplett.org>, The Nushell Project Developers"
num-bigint,https://github.com/rust-num/num-bigint,MIT OR Apache-2.0,The Rust Project Developers
num-conv,https://github.com/jhpratt/num-conv,MIT OR Apache-2.0,Jacob Pratt <jacob@jhpratt.dev>
num-integer,https://github.com/rust-num/num-integer,MIT OR Apache-2.0,The Rust Project Developers
num-rational,https://github.com/rust-num/num-rational,MIT OR Apache-2.0,The Rust Project Developers
num-traits,https://github.com/rust-num/num-traits,MIT OR Apache-2.0,The Rust Project Developers
num_cpus,https://github.com/seanmonstar/num_cpus,MIT OR Apache-2.0,Sean McArthur <sean@seanmonstar.com>
numfmt,https://github.com/kurtlawrence/numfmt,MIT,Kurt Lawrence <kurtlawrence.info>
objc2-core-foundation,https://github.com/madsmtm/objc2,Zlib OR Apache-2.0 OR MIT,The objc2-core-foundation Authors
objc2-io-kit,https://github.com/madsmtm/objc2,Zlib OR Apache-2.0 OR MIT,The objc2-io-kit Authors
once_cell,https://github.com/matklad/once_cell,MIT OR Apache-2.0,Aleksey Kladov <aleksey.kladov@gmail.com>
once_cell_polyfill,https://github.com/polyfill-rs/once_cell_polyfill,MIT OR Apache-2.0,The once_cell_polyfill Authors
oneshot,https://github.com/faern/oneshot,MIT OR Apache-2.0,Linus Färnstrand <faern@faern.net>
oorandom,https://hg.sr.ht/~icefox/oorandom,MIT,Simon Heath <icefox@dreamquest.io>
openssl-probe,https://github.com/alexcrichton/openssl-probe,MIT OR Apache-2.0,Alex Crichton <alex@alexcrichton.com>
opentelemetry,https://github.com/open-telemetry/opentelemetry-rust/tree/main/opentelemetry,Apache-2.0,The opentelemetry Authors
opentelemetry-appender-tracing,https://github.com/open-telemetry/opentelemetry-rust/tree/main/opentelemetry-appender-tracing,Apache-2.0,The opentelemetry-appender-tracing Authors
opentelemetry-http,https://github.com/open-telemetry/opentelemetry-rust/tree/main/opentelemetry-http,Apache-2.0,The opentelemetry-http Authors
opentelemetry-otlp,https://github.com/open-telemetry/opentelemetry-rust/tree/main/opentelemetry-otlp,Apache-2.0,The opentelemetry-otlp Authors
opentelemetry-proto,https://github.com/open-telemetry/opentelemetry-rust/tree/main/opentelemetry-proto,Apache-2.0,The opentelemetry-proto Authors
opentelemetry_sdk,https://github.com/open-telemetry/opentelemetry-rust/tree/main/opentelemetry-sdk,Apache-2.0,The opentelemetry_sdk Authors
ordered-float,https://github.com/reem/rust-ordered-float,MIT,"Jonathan Reem <jonathan.reem@gmail.com>, Matt Brubeck <mbrubeck@limpet.net>"
ouroboros,https://github.com/someguynamedjosh/ouroboros,MIT OR Apache-2.0,Josh <someguynamedjosh@github.com>
ouroboros_macro,https://github.com/someguynamedjosh/ouroboros,MIT OR Apache-2.0,Josh <someguynamedjosh@github.com>
outref,https://github.com/Nugine/outref,MIT,The outref Authors
ownedbytes,https://github.com/quickwit-oss/tantivy,MIT,"Paul Masurel <paul@quickwit.io>, Pascal Seitz <pascal@quickwit.io>"
p256,https://github.com/RustCrypto/elliptic-curves/tree/master/p256,Apache-2.0 OR MIT,RustCrypto Developers
page_size,https://github.com/Elzair/page_size_rs,MIT OR Apache-2.0,Philip Woods <elzairthesorcerer@gmail.com>
papergrid,https://github.com/zhiburt/tabled,MIT,Maxim Zhiburt <zhiburt@gmail.com>
parking_lot,https://github.com/Amanieu/parking_lot,MIT OR Apache-2.0,Amanieu d'Antras <amanieu@gmail.com>
parking_lot_core,https://github.com/Amanieu/parking_lot,MIT OR Apache-2.0,Amanieu d'Antras <amanieu@gmail.com>
peakmem-alloc,https://github.com/PSeitz/peakmem-alloc,MIT,Pascal Seitz <pascal.seitz@gmail.com>
percent-encoding,https://github.com/servo/rust-url,MIT OR Apache-2.0,The rust-url developers
perf-event,https://github.com/jimblandy/perf-event,MIT OR Apache-2.0,Jim Blandy <jimb@red-bean.com>
perf-event-open-sys,https://github.com/jimblandy/perf-event-open-sys,MIT OR Apache-2.0,Jim Blandy <jimb@red-bean.com>
petgraph,https://github.com/petgraph/petgraph,MIT OR Apache-2.0,"bluss, mitchmindtree"
pin-project,https://github.com/taiki-e/pin-project,Apache-2.0 OR MIT,The pin-project Authors
pin-project-internal,https://github.com/taiki-e/pin-project,Apache-2.0 OR MIT,The pin-project-internal Authors
pin-project-lite,https://github.com/taiki-e/pin-project-lite,Apache-2.0 OR MIT,The pin-project-lite Authors
pin-utils,https://github.com/rust-lang-nursery/pin-utils,MIT OR Apache-2.0,Josef Brandl <mail@josefbrandl.de>
pkcs8,https://github.com/RustCrypto/formats/tree/master/pkcs8,Apache-2.0 OR MIT,RustCrypto Developers
plotters,https://github.com/plotters-rs/plotters,MIT,Hao Hou <haohou302@gmail.com>
plotters-backend,https://github.com/plotters-rs/plotters,MIT,Hao Hou <haohou302@gmail.com>
plotters-svg,https://github.com/plotters-rs/plotters,MIT,Hao Hou <haohou302@gmail.com>
pnet,https://github.com/libpnet/libpnet,MIT OR Apache-2.0,Robert Clipsham <robert@octarineparrot.com>
pnet_base,https://github.com/libpnet/libpnet,MIT OR Apache-2.0,"Robert Clipsham <robert@octarineparrot.com>, Linus Färnstrand <faern@faern.net>"
pnet_datalink,https://github.com/libpnet/libpnet,MIT OR Apache-2.0,"Robert Clipsham <robert@octarineparrot.com>, Linus Färnstrand <faern@faern.net>"
pnet_macros,https://github.com/libpnet/libpnet,MIT OR Apache-2.0,"Robert Clipsham <robert@octarineparrot.com>, Pierre Chifflier <chifflier@wzdftpd.net>"
pnet_macros_support,https://github.com/libpnet/libpnet,MIT OR Apache-2.0,Robert Clipsham <robert@octarineparrot.com>
pnet_packet,https://github.com/libpnet/libpnet,MIT OR Apache-2.0,Robert Clipsham <robert@octarineparrot.com>
pnet_sys,https://github.com/libpnet/libpnet,MIT OR Apache-2.0,"Robert Clipsham <robert@octarineparrot.com>, Linus Färnstrand <faern@faern.net>"
pnet_transport,https://github.com/libpnet/libpnet,MIT OR Apache-2.0,Robert Clipsham <robert@octarineparrot.com>
portable-atomic,https://github.com/taiki-e/portable-atomic,Apache-2.0 OR MIT,The portable-atomic Authors
postcard,https://github.com/jamesmunns/postcard,MIT OR Apache-2.0,James Munns <james@onevariable.com>
potential_utf,https://github.com/unicode-org/icu4x,Unicode-3.0,The ICU4X Project Developers
powerfmt,https://github.com/jhpratt/powerfmt,MIT OR Apache-2.0,Jacob Pratt <jacob@jhpratt.dev>
ppv-lite86,https://github.com/cryptocorrosion/cryptocorrosion,MIT OR Apache-2.0,The CryptoCorrosion Contributors
predicates,https://github.com/assert-rs/predicates-rs,MIT OR Apache-2.0,Nick Stevens <nick@bitcurry.com>
predicates-core,https://github.com/assert-rs/predicates-rs/tree/master/crates/core,MIT OR Apache-2.0,Nick Stevens <nick@bitcurry.com>
predicates-tree,https://github.com/assert-rs/predicates-rs/tree/master/crates/tree,MIT OR Apache-2.0,Nick Stevens <nick@bitcurry.com>
pretty_assertions,https://github.com/rust-pretty-assertions/rust-pretty-assertions,MIT OR Apache-2.0,"Colin Kiegel <kiegel@gmx.de>, Florent Fayolle <florent.fayolle69@gmail.com>, Tom Milligan <code@tommilligan.net>"
prettyplease,https://github.com/dtolnay/prettyplease,MIT OR Apache-2.0,David Tolnay <dtolnay@gmail.com>
proc-macro-error,https://gitlab.com/CreepySkeleton/proc-macro-error,MIT OR Apache-2.0,CreepySkeleton <creepy-skeleton@yandex.ru>
proc-macro-error-attr,https://gitlab.com/CreepySkeleton/proc-macro-error,MIT OR Apache-2.0,CreepySkeleton <creepy-skeleton@yandex.ru>
proc-macro-error-attr2,https://github.com/GnomedDev/proc-macro-error-2,MIT OR Apache-2.0,"CreepySkeleton <creepy-skeleton@yandex.ru>, GnomedDev <david2005thomas@gmail.com>"
proc-macro-error2,https://github.com/GnomedDev/proc-macro-error-2,MIT OR Apache-2.0,"CreepySkeleton <creepy-skeleton@yandex.ru>, GnomedDev <david2005thomas@gmail.com>"
proc-macro2,https://github.com/dtolnay/proc-macro2,MIT OR Apache-2.0,"David Tolnay <dtolnay@gmail.com>, Alex Crichton <alex@alexcrichton.com>"
proc-macro2-diagnostics,https://github.com/SergioBenitez/proc-macro2-diagnostics,MIT OR Apache-2.0,Sergio Benitez <sb@sergio.bz>
procfs,https://github.com/eminence/procfs,MIT OR Apache-2.0,Andrew Chin <achin@eminence32.net>
procfs-core,https://github.com/eminence/procfs,MIT OR Apache-2.0,Andrew Chin <achin@eminence32.net>
prometheus,https://github.com/tikv/rust-prometheus,Apache-2.0,"overvenus@gmail.com, siddontang@gmail.com, vistaswx@gmail.com"
prost,https://github.com/tokio-rs/prost,Apache-2.0,"Dan Burkert <dan@danburkert.com>, Lucio Franco <luciofranco14@gmail.com>, Casper Meijn <casper@meijn.net>, Tokio Contributors <team@tokio.rs>"
prost-build,https://github.com/tokio-rs/prost,Apache-2.0,"Dan Burkert <dan@danburkert.com>, Lucio Franco <luciofranco14@gmail.com>, Casper Meijn <casper@meijn.net>, Tokio Contributors <team@tokio.rs>"
prost-derive,https://github.com/tokio-rs/prost,Apache-2.0,"Dan Burkert <dan@danburkert.com>, Lucio Franco <luciofranco14@gmail.com>, Casper Meijn <casper@meijn.net>, Tokio Contributors <team@tokio.rs>"
prost-types,https://github.com/tokio-rs/prost,Apache-2.0,"Dan Burkert <dan@danburkert.com>, Lucio Franco <luciofranco14@gmail.com>, Casper Meijn <casper@meijn.net>, Tokio Contributors <team@tokio.rs>"
pulldown-cmark,https://github.com/raphlinus/pulldown-cmark,MIT,"Raph Levien <raph.levien@gmail.com>, Marcus Klaas de Vries <mail@marcusklaas.nl>"
pulldown-cmark-to-cmark,https://github.com/Byron/pulldown-cmark-to-cmark,Apache-2.0,"Sebastian Thiel <byronimo@gmail.com>, Dylan Owen <dyltotheo@gmail.com>, Alessandro Ogier <alessandro.ogier@gmail.com>, Zixian Cai <2891235+caizixian@users.noreply.github.com>, Andrew Lyjak <andrew.lyjak@gmail.com>"
quanta,https://github.com/metrics-rs/quanta,MIT,Toby Lawrence <toby@nuclearfurnace.com>
quick-error,http://github.com/tailhook/quick-error,MIT OR Apache-2.0,"Paul Colomiets <paul@colomiets.name>, Colin Kiegel <kiegel@gmx.de>"
quick_cache,https://github.com/arthurprs/quick-cache,MIT,Arthur Silva <arthurprs@gmail.com>
quinn,https://github.com/quinn-rs/quinn,MIT OR Apache-2.0,The quinn Authors
quinn-proto,https://github.com/quinn-rs/quinn,MIT OR Apache-2.0,The quinn-proto Authors
quinn-udp,https://github.com/quinn-rs/quinn,MIT OR Apache-2.0,The quinn-udp Authors
quote,https://github.com/dtolnay/quote,MIT OR Apache-2.0,David Tolnay <dtolnay@gmail.com>
r-efi,https://github.com/r-efi/r-efi,MIT OR Apache-2.0 OR LGPL-2.1-or-later,The r-efi Authors
rand,https://github.com/rust-random/rand,MIT OR Apache-2.0,"The Rand Project Developers, The Rust Project Developers"
rand_chacha,https://github.com/rust-random/rand,MIT OR Apache-2.0,"The Rand Project Developers, The Rust Project Developers, The CryptoCorrosion Contributors"
rand_core,https://github.com/rust-random/rand,MIT OR Apache-2.0,"The Rand Project Developers, The Rust Project Developers"
rand_xorshift,https://github.com/rust-random/rngs,MIT OR Apache-2.0,"The Rand Project Developers, The Rust Project Developers"
raw-cpuid,https://github.com/gz/rust-cpuid,MIT,Gerd Zellweger <mail@gerdzellweger.com>
rayon,https://github.com/rayon-rs/rayon,MIT OR Apache-2.0,The rayon Authors
rayon-core,https://github.com/rayon-rs/rayon,MIT OR Apache-2.0,The rayon-core Authors
redox_syscall,https://gitlab.redox-os.org/redox-os/syscall,MIT,Jeremy Soller <jackpot51@gmail.com>
ref-cast,https://github.com/dtolnay/ref-cast,MIT OR Apache-2.0,David Tolnay <dtolnay@gmail.com>
ref-cast-impl,https://github.com/dtolnay/ref-cast,MIT OR Apache-2.0,David Tolnay <dtolnay@gmail.com>
regex,https://github.com/rust-lang/regex,MIT OR Apache-2.0,"The Rust Project Developers, Andrew Gallant <jamslam@gmail.com>"
regex-automata,https://github.com/rust-lang/regex,MIT OR Apache-2.0,"The Rust Project Developers, Andrew Gallant <jamslam@gmail.com>"
regex-lite,https://github.com/rust-lang/regex,MIT OR Apache-2.0,"The Rust Project Developers, Andrew Gallant <jamslam@gmail.com>"
regex-syntax,https://github.com/rust-lang/regex,MIT OR Apache-2.0,"The Rust Project Developers, Andrew Gallant <jamslam@gmail.com>"
reqwest,https://github.com/seanmonstar/reqwest,MIT OR Apache-2.0,Sean McArthur <sean@seanmonstar.com>
reqwest-middleware,https://github.com/TrueLayer/reqwest-middleware,MIT OR Apache-2.0,Rodrigo Gryzinski <rodrigo.gryzinski@truelayer.com>
reqwest-retry,https://github.com/TrueLayer/reqwest-middleware,MIT OR Apache-2.0,Rodrigo Gryzinski <rodrigo.gryzinski@truelayer.com>
retry-policies,https://github.com/TrueLayer/retry-policies,MIT OR Apache-2.0,Luca Palmieri <lpalmieri@truelayer.com>
rfc6979,https://github.com/RustCrypto/signatures/tree/master/rfc6979,Apache-2.0 OR MIT,RustCrypto Developers
ring,https://github.com/briansmith/ring,Apache-2.0 AND ISC,The ring Authors
roxmltree,https://github.com/RazrFalcon/roxmltree,MIT OR Apache-2.0,Evgeniy Reizner <razrfalcon@gmail.com>
rust-embed,https://pyrossh.dev/repos/rust-embed,MIT,pyrossh
rust-embed-impl,https://pyrossh.dev/repos/rust-embed,MIT,pyrossh
rust-embed-utils,https://pyrossh.dev/repos/rust-embed,MIT,pyrossh
rustc-hash,https://github.com/rust-lang/rustc-hash,Apache-2.0 OR MIT,The Rust Project Developers
rustix,https://github.com/bytecodealliance/rustix,Apache-2.0 WITH LLVM-exception OR Apache-2.0 OR MIT,"Dan Gohman <dev@sunfishcode.online>, Jakub Konka <kubkon@jakubkonka.com>"
rustls,https://github.com/rustls/rustls,Apache-2.0 OR ISC OR MIT,The rustls Authors
rustls-native-certs,https://github.com/rustls/rustls-native-certs,Apache-2.0 OR ISC OR MIT,The rustls-native-certs Authors
rustls-pemfile,https://github.com/rustls/pemfile,Apache-2.0 OR ISC OR MIT,The rustls-pemfile Authors
rustls-pki-types,https://github.com/rustls/pki-types,MIT OR Apache-2.0,The rustls-pki-types Authors
rustls-webpki,https://github.com/rustls/webpki,ISC,The rustls-webpki Authors
rustop,https://chiselapp.com/user/fifr/repository/rustop,MIT,Frank Fischer <frank-fischer@shadow-soft.de>
rustversion,https://github.com/dtolnay/rustversion,MIT OR Apache-2.0,David Tolnay <dtolnay@gmail.com>
rusty-fork,https://github.com/altsysrq/rusty-fork,MIT OR Apache-2.0,Jason Lingle
ryu,https://github.com/dtolnay/ryu,Apache-2.0 OR BSL-1.0,David Tolnay <dtolnay@gmail.com>
same-file,https://github.com/BurntSushi/same-file,Unlicense OR MIT,Andrew Gallant <jamslam@gmail.com>
scc,https://github.com/wvwwvwwv/scalable-concurrent-containers,Apache-2.0,wvwwvwwv <wvwwvwwv@me.com>
schannel,https://github.com/steffengy/schannel-rs,MIT,"Steven Fackler <sfackler@gmail.com>, Steffen Butzer <steffen.butzer@outlook.com>"
schemars,https://github.com/GREsau/schemars,MIT,Graham Esau <gesau@hotmail.co.uk>
scoped-tls,https://github.com/alexcrichton/scoped-tls,MIT OR Apache-2.0,Alex Crichton <alex@alexcrichton.com>
scopeguard,https://github.com/bluss/scopeguard,MIT OR Apache-2.0,bluss
sct,https://github.com/rustls/sct.rs,Apache-2.0 OR ISC OR MIT,Joseph Birr-Pixton <jpixton@gmail.com>
sdd,https://github.com/wvwwvwwv/scalable-delayed-dealloc,Apache-2.0,wvwwvwwv <wvwwvwwv@me.com>
sec1,https://github.com/RustCrypto/formats/tree/master/sec1,Apache-2.0 OR MIT,RustCrypto Developers
security-framework,https://github.com/kornelski/rust-security-framework,MIT OR Apache-2.0,"Steven Fackler <sfackler@gmail.com>, Kornel <kornel@geekhood.net>"
security-framework-sys,https://github.com/kornelski/rust-security-framework,MIT OR Apache-2.0,"Steven Fackler <sfackler@gmail.com>, Kornel <kornel@geekhood.net>"
semver,https://github.com/dtolnay/semver,MIT OR Apache-2.0,David Tolnay <dtolnay@gmail.com>
separator,https://github.com/saghm/rust-separator,MIT,Saghm Rossi <saghmrossi@gmail.com>
serde,https://github.com/serde-rs/serde,MIT OR Apache-2.0,"Erick Tryzelaar <erick.tryzelaar@gmail.com>, David Tolnay <dtolnay@gmail.com>"
serde_core,https://github.com/serde-rs/serde,MIT OR Apache-2.0,"Erick Tryzelaar <erick.tryzelaar@gmail.com>, David Tolnay <dtolnay@gmail.com>"
serde_derive,https://github.com/serde-rs/serde,MIT OR Apache-2.0,"Erick Tryzelaar <erick.tryzelaar@gmail.com>, David Tolnay <dtolnay@gmail.com>"
serde_json,https://github.com/serde-rs/json,MIT OR Apache-2.0,"Erick Tryzelaar <erick.tryzelaar@gmail.com>, David Tolnay <dtolnay@gmail.com>"
serde_json_borrow,https://github.com/PSeitz/serde_json_borrow,MIT,Pascal Seitz <pascal.seitz@gmail.com>
serde_path_to_error,https://github.com/dtolnay/path-to-error,MIT OR Apache-2.0,David Tolnay <dtolnay@gmail.com>
serde_qs,https://github.com/samscott89/serde_qs,MIT OR Apache-2.0,Sam Scott <sam@osohq.com>
serde_spanned,https://github.com/toml-rs/toml,MIT OR Apache-2.0,The serde_spanned Authors
serde_urlencoded,https://github.com/nox/serde_urlencoded,MIT OR Apache-2.0,Anthony Ramine <n.oxyde@gmail.com>
serde_with,https://github.com/jonasbb/serde_with,MIT OR Apache-2.0,"Jonas Bushart, Marcin Kaźmierczak"
serde_with_macros,https://github.com/jonasbb/serde_with,MIT OR Apache-2.0,Jonas Bushart
serde_yaml,https://github.com/dtolnay/serde-yaml,MIT OR Apache-2.0,David Tolnay <dtolnay@gmail.com>
serial_test_derive,https://github.com/palfrey/serial_test,MIT,Tom Parker-Shemilt <palfrey@tevp.net>
sha1,https://github.com/RustCrypto/hashes,MIT OR Apache-2.0,RustCrypto Developers
sha2,https://github.com/RustCrypto/hashes,MIT OR Apache-2.0,RustCrypto Developers
sharded-slab,https://github.com/hawkw/sharded-slab,MIT,Eliza Weisman <eliza@buoyant.io>
shell-words,https://github.com/tmiasko/shell-words,MIT OR Apache-2.0,Tomasz Miąsko <tomasz.miasko@gmail.com>
shlex,https://github.com/comex/rust-shlex,MIT OR Apache-2.0,"comex <comexk@gmail.com>, Fenhl <fenhl@fenhl.net>, Adrian Taylor <adetaylor@chromium.org>, Alex Touchet <alextouchet@outlook.com>, Daniel Parks <dp+git@oxidized.org>, Garrett Berg <googberg@gmail.com>"
signal-hook-registry,https://github.com/vorner/signal-hook,MIT OR Apache-2.0,"Michal 'vorner' Vaner <vorner@vorner.cz>, Masaki Hara <ackie.h.gmai@gmail.com>"
signature,https://github.com/RustCrypto/traits/tree/master/signature,Apache-2.0 OR MIT,RustCrypto Developers
simd-adler32,https://github.com/mcountryman/simd-adler32,MIT,Marvin Countryman <me@maar.vin>
siphasher,https://github.com/jedisct1/rust-siphash,MIT OR Apache-2.0,Frank Denis <github@pureftpd.org>
sketches-ddsketch,https://github.com/mheffner/rust-sketches-ddsketch,Apache-2.0,Mike Heffner <mikeh@fesnel.com>
slab,https://github.com/tokio-rs/slab,MIT,Carl Lerche <me@carllerche.com>
smallvec,https://github.com/servo/rust-smallvec,MIT OR Apache-2.0,The Servo Project Developers
socket2,https://github.com/rust-lang/socket2,MIT OR Apache-2.0,"Alex Crichton <alex@alexcrichton.com>, Thomas de Zeeuw <thomasdezeeuw@gmail.com>"
spin,https://github.com/mvdnes/spin-rs,MIT,"Mathijs van de Nes <git@mathijs.vd-nes.nl>, John Ericson <git@JohnEricson.me>, Joshua Barretto <joshua.s.barretto@gmail.com>"
spinning_top,https://github.com/rust-osdev/spinning_top,MIT OR Apache-2.0,Philipp Oppermann <dev@phil-opp.com>
spki,https://github.com/RustCrypto/formats/tree/master/spki,Apache-2.0 OR MIT,RustCrypto Developers
stable_deref_trait,https://github.com/storyyeller/stable_deref_trait,MIT OR Apache-2.0,Robert Grosse <n210241048576@gmail.com>
static_assertions,https://github.com/nvzqz/static-assertions-rs,MIT OR Apache-2.0,Nikolai Vazquez
strsim,https://github.com/rapidfuzz/strsim-rs,MIT,"Danny Guo <danny@dannyguo.com>, maxbachmann <oss@maxbachmann.de>"
subtle,https://github.com/dalek-cryptography/subtle,BSD-3-Clause,"Isis Lovecruft <isis@patternsinthevoid.net>, Henry de Valence <hdevalence@hdevalence.ca>"
syn,https://github.com/dtolnay/syn,MIT OR Apache-2.0,David Tolnay <dtolnay@gmail.com>
sync_wrapper,https://github.com/Actyx/sync_wrapper,Apache-2.0,Actyx AG <developer@actyx.io>
synstructure,https://github.com/mystor/synstructure,MIT,Nika Layzell <nika@thelayzells.com>
sysinfo,https://github.com/GuillaumeGomez/sysinfo,MIT,Guillaume Gomez <guillaume1.gomez@gmail.com>
tabled,https://github.com/zhiburt/tabled,MIT,Maxim Zhiburt <zhiburt@gmail.com>
tabled_derive,https://github.com/zhiburt/tabled,MIT,Maxim Zhiburt <zhiburt@gmail.com>
tagptr,https://github.com/oliver-giersch/tagptr,MIT OR Apache-2.0,Oliver Giersch
tantivy,https://github.com/quickwit-oss/tantivy,MIT,Paul Masurel <paul.masurel@gmail.com>
tantivy-bitpacker,https://github.com/quickwit-oss/tantivy,MIT,Paul Masurel <paul.masurel@gmail.com>
tantivy-columnar,https://github.com/quickwit-oss/tantivy,MIT,The tantivy-columnar Authors
tantivy-common,https://github.com/quickwit-oss/tantivy,MIT,"Paul Masurel <paul@quickwit.io>, Pascal Seitz <pascal@quickwit.io>"
tantivy-fst,https://github.com/quickwit-inc/fst,Unlicense OR MIT,Andrew Gallant <jamslam@gmail.com>
tantivy-query-grammar,https://github.com/quickwit-oss/tantivy,MIT,Paul Masurel <paul.masurel@gmail.com>
tantivy-sstable,https://github.com/quickwit-oss/tantivy,MIT,The tantivy-sstable Authors
tantivy-stacker,https://github.com/quickwit-oss/tantivy,MIT,The tantivy-stacker Authors
tantivy-tokenizer-api,https://github.com/quickwit-oss/tantivy,MIT,The tantivy-tokenizer-api Authors
tempfile,https://github.com/Stebalien/tempfile,MIT OR Apache-2.0,"Steven Allen <steven@stebalien.com>, The Rust Project Developers, Ashley Mannix <ashleymannix@live.com.au>, Jason White <me@jasonwhite.io>"
termtree,https://github.com/rust-cli/termtree,MIT,The termtree Authors
testing_table,https://github.com/zhiburt/tabled,MIT,Maxim Zhiburt <zhiburt@gmail.com>
thiserror,https://github.com/dtolnay/thiserror,MIT OR Apache-2.0,David Tolnay <dtolnay@gmail.com>
thiserror-impl,https://github.com/dtolnay/thiserror,MIT OR Apache-2.0,David Tolnay <dtolnay@gmail.com>
thousands,https://github.com/tov/thousands-rs,MIT OR Apache-2.0,Jesse A. Tov <jesse.tov@gmail.com>
thread_local,https://github.com/Amanieu/thread_local-rs,MIT OR Apache-2.0,Amanieu d'Antras <amanieu@gmail.com>
time,https://github.com/time-rs/time,MIT OR Apache-2.0,"Jacob Pratt <open-source@jhpratt.dev>, Time contributors"
time-core,https://github.com/time-rs/time,MIT OR Apache-2.0,"Jacob Pratt <open-source@jhpratt.dev>, Time contributors"
time-fmt,https://github.com/MiSawa/time-fmt,MIT OR Apache-2.0,mi_sawa <mi.sawa.1216+git@gmail.com>
time-macros,https://github.com/time-rs/time,MIT OR Apache-2.0,"Jacob Pratt <open-source@jhpratt.dev>, Time contributors"
tinystr,https://github.com/unicode-org/icu4x,Unicode-3.0,The ICU4X Project Developers
tinytemplate,https://github.com/bheisler/TinyTemplate,Apache-2.0 OR MIT,Brook Heisler <brookheisler@gmail.com>
tinyvec,https://github.com/Lokathor/tinyvec,Zlib OR Apache-2.0 OR MIT,Lokathor <zefria@gmail.com>
tinyvec_macros,https://github.com/Soveu/tinyvec_macros,MIT OR Apache-2.0 OR Zlib,Soveu <marx.tomasz@gmail.com>
tokio,https://github.com/tokio-rs/tokio,MIT,Tokio Contributors <team@tokio.rs>
tokio-macros,https://github.com/tokio-rs/tokio,MIT,Tokio Contributors <team@tokio.rs>
tokio-metrics,https://github.com/tokio-rs/tokio-metrics,MIT,Tokio Contributors <team@tokio.rs>
tokio-rustls,https://github.com/rustls/tokio-rustls,MIT OR Apache-2.0,The tokio-rustls Authors
tokio-stream,https://github.com/tokio-rs/tokio,MIT,Tokio Contributors <team@tokio.rs>
tokio-util,https://github.com/tokio-rs/tokio,MIT,Tokio Contributors <team@tokio.rs>
toml,https://github.com/toml-rs/toml,MIT OR Apache-2.0,The toml Authors
toml_datetime,https://github.com/toml-rs/toml,MIT OR Apache-2.0,The toml_datetime Authors
toml_parser,https://github.com/toml-rs/toml,MIT OR Apache-2.0,The toml_parser Authors
toml_writer,https://github.com/toml-rs/toml,MIT OR Apache-2.0,The toml_writer Authors
tonic,https://github.com/hyperium/tonic,MIT,Lucio Franco <luciofranco14@gmail.com>
tonic-build,https://github.com/hyperium/tonic,MIT,Lucio Franco <luciofranco14@gmail.com>
tonic-health,https://github.com/hyperium/tonic,MIT,James Nugent <james@jen20.com>
tonic-prost,https://github.com/hyperium/tonic,MIT,Lucio Franco <luciofranco14@gmail.com>
tonic-prost-build,https://github.com/hyperium/tonic,MIT,Lucio Franco <luciofranco14@gmail.com>
tonic-reflection,https://github.com/hyperium/tonic,MIT,"James Nugent <james@jen20.com>, Samani G. Gikandi <samani@gojulas.com>"
tower,https://github.com/tower-rs/tower,MIT,Tower Maintainers <team@tower-rs.com>
tower-http,https://github.com/tower-rs/tower-http,MIT,Tower Maintainers <team@tower-rs.com>
tower-layer,https://github.com/tower-rs/tower,MIT,Tower Maintainers <team@tower-rs.com>
tower-service,https://github.com/tower-rs/tower,MIT,Tower Maintainers <team@tower-rs.com>
tracing,https://github.com/tokio-rs/tracing,MIT,"Eliza Weisman <eliza@buoyant.io>, Tokio Contributors <team@tokio.rs>"
tracing-attributes,https://github.com/tokio-rs/tracing,MIT,"Tokio Contributors <team@tokio.rs>, Eliza Weisman <eliza@buoyant.io>, David Barsky <dbarsky@amazon.com>"
tracing-core,https://github.com/tokio-rs/tracing,MIT,Tokio Contributors <team@tokio.rs>
tracing-log,https://github.com/tokio-rs/tracing,MIT,Tokio Contributors <team@tokio.rs>
tracing-opentelemetry,https://github.com/tokio-rs/tracing-opentelemetry,MIT,The tracing-opentelemetry Authors
tracing-serde,https://github.com/tokio-rs/tracing,MIT,Tokio Contributors <team@tokio.rs>
tracing-subscriber,https://github.com/tokio-rs/tracing,MIT,"Eliza Weisman <eliza@buoyant.io>, David Barsky <me@davidbarsky.com>, Tokio Contributors <team@tokio.rs>"
triomphe,https://github.com/Manishearth/triomphe,MIT OR Apache-2.0,"Manish Goregaokar <manishsmail@gmail.com>, The Servo Project Developers"
try-lock,https://github.com/seanmonstar/try-lock,MIT,Sean McArthur <sean@seanmonstar.com>
ttl_cache,https://github.com/stusmall/ttl_cache,MIT OR Apache-2.0,Stu Small <stuart.alan.small@gmail.com>
typeid,https://github.com/dtolnay/typeid,MIT OR Apache-2.0,David Tolnay <dtolnay@gmail.com>
typenum,https://github.com/paholg/typenum,MIT OR Apache-2.0,"Paho Lurie-Gregg <paho@paholg.com>, Andre Bogus <bogusandre@gmail.com>"
typetag,https://github.com/dtolnay/typetag,MIT OR Apache-2.0,David Tolnay <dtolnay@gmail.com>
typetag-impl,https://github.com/dtolnay/typetag,MIT OR Apache-2.0,David Tolnay <dtolnay@gmail.com>
ulid,https://github.com/dylanhart/ulid-rs,MIT,dylanhart <dylan96hart@gmail.com>
unarray,https://github.com/cameron1024/unarray,MIT OR Apache-2.0,The unarray Authors
unicase,https://github.com/seanmonstar/unicase,MIT OR Apache-2.0,Sean McArthur <sean@seanmonstar.com>
unicode-ident,https://github.com/dtolnay/unicode-ident,(MIT OR Apache-2.0) AND Unicode-3.0,David Tolnay <dtolnay@gmail.com>
unicode-width,https://github.com/unicode-rs/unicode-width,MIT OR Apache-2.0,"kwantam <kwantam@gmail.com>, Manish Goregaokar <manishsmail@gmail.com>"
unit-prefix,https://codeberg.org/commons-rs/unit-prefix,MIT,"Fabio Valentini <decathorpe@gmail.com>, Benjamin Sago <ogham@bsago.me>"
unsafe-libyaml,https://github.com/dtolnay/unsafe-libyaml,MIT,David Tolnay <dtolnay@gmail.com>
untrusted,https://github.com/briansmith/untrusted,ISC,Brian Smith <brian@briansmith.org>
ureq-proto,https://github.com/algesten/ureq-proto,MIT OR Apache-2.0,Martin Algesten <martin@algesten.se>
url,https://github.com/servo/rust-url,MIT OR Apache-2.0,The rust-url developers
urlencoding,https://github.com/kornelski/rust_urlencoding,MIT,"Kornel <kornel@geekhood.net>, Bertram Truong <b@bertramtruong.com>"
username,https://pijul.org/darcs/user,MIT OR Apache-2.0,Pierre-Étienne Meunier <pierre-etienne.meunier@aalto.fi>
utf-8,https://github.com/SimonSapin/rust-utf8,MIT OR Apache-2.0,Simon Sapin <simon.sapin@exyr.org>
utf8-ranges,https://github.com/BurntSushi/utf8-ranges,Unlicense OR MIT,Andrew Gallant <jamslam@gmail.com>
utf8_iter,https://github.com/hsivonen/utf8_iter,Apache-2.0 OR MIT,Henri Sivonen <hsivonen@hsivonen.fi>
utf8parse,https://github.com/alacritty/vte,Apache-2.0 OR MIT,"Joe Wilm <joe@jwilm.com>, Christian Duerr <contact@christianduerr.com>"
utoipa,https://github.com/juhaku/utoipa,MIT OR Apache-2.0,Juha Kukkonen <juha7kukkonen@gmail.com>
utoipa-gen,https://github.com/juhaku/utoipa,MIT OR Apache-2.0,Juha Kukkonen <juha7kukkonen@gmail.com>
uuid,https://github.com/uuid-rs/uuid,Apache-2.0 OR MIT,"Ashley Mannix<ashleymannix@live.com.au>, Dylan DPC<dylan.dpc@gmail.com>, Hunar Roop Kahlon<hunar.roop@gmail.com>"
valuable,https://github.com/tokio-rs/valuable,MIT,The valuable Authors
vsimd,https://github.com/Nugine/simd,MIT,The vsimd Authors
vte,https://github.com/alacritty/vte,Apache-2.0 OR MIT,"Joe Wilm <joe@jwilm.com>, Christian Duerr <contact@christianduerr.com>"
wait-timeout,https://github.com/alexcrichton/wait-timeout,MIT OR Apache-2.0,Alex Crichton <alex@alexcrichton.com>
walkdir,https://github.com/BurntSushi/walkdir,Unlicense OR MIT,Andrew Gallant <jamslam@gmail.com>
want,https://github.com/seanmonstar/want,MIT,Sean McArthur <sean@seanmonstar.com>
warp,https://github.com/seanmonstar/warp,MIT,Sean McArthur <sean@seanmonstar.com>
wasi,https://github.com/bytecodealliance/wasi,Apache-2.0 WITH LLVM-exception OR Apache-2.0 OR MIT,The Cranelift Project Developers
wasip2,https://github.com/bytecodealliance/wasi-rs,Apache-2.0 WITH LLVM-exception OR Apache-2.0 OR MIT,The wasip2 Authors
wasix,https://github.com/wasix-org/wasix-abi-rust,Apache-2.0 WITH LLVM-exception OR Apache-2.0 OR MIT,"The Cranelift Project Developers, john-sharratt"
wasm-bindgen,https://github.com/wasm-bindgen/wasm-bindgen,MIT OR Apache-2.0,The wasm-bindgen Developers
wasm-bindgen-futures,https://github.com/wasm-bindgen/wasm-bindgen/tree/master/crates/futures,MIT OR Apache-2.0,The wasm-bindgen Developers
wasm-bindgen-macro,https://github.com/wasm-bindgen/wasm-bindgen/tree/master/crates/macro,MIT OR Apache-2.0,The wasm-bindgen Developers
wasm-bindgen-macro-support,https://github.com/wasm-bindgen/wasm-bindgen/tree/master/crates/macro-support,MIT OR Apache-2.0,The wasm-bindgen Developers
wasm-bindgen-shared,https://github.com/wasm-bindgen/wasm-bindgen/tree/master/crates/shared,MIT OR Apache-2.0,The wasm-bindgen Developers
wasmtimer,https://github.com/whizsid/wasmtimer-rs,MIT,"WhizSid <whizsid@aol.com>, Pierre Krieger <pierre.krieger1708@gmail.com>"
web-sys,https://github.com/wasm-bindgen/wasm-bindgen/tree/master/crates/web-sys,MIT OR Apache-2.0,The wasm-bindgen Developers
web-time,https://github.com/daxpedda/web-time,MIT OR Apache-2.0,The web-time Authors
webpki-roots,https://github.com/rustls/webpki-roots,CDLA-Permissive-2.0,The webpki-roots Authors
winapi,https://github.com/retep998/winapi-rs,MIT,Peter Atashian <retep998@gmail.com>
winapi,https://github.com/retep998/winapi-rs,MIT OR Apache-2.0,Peter Atashian <retep998@gmail.com>
winapi-i686-pc-windows-gnu,https://github.com/retep998/winapi-rs,MIT OR Apache-2.0,Peter Atashian <retep998@gmail.com>
winapi-util,https://github.com/BurntSushi/winapi-util,Unlicense OR MIT,Andrew Gallant <jamslam@gmail.com>
winapi-x86_64-pc-windows-gnu,https://github.com/retep998/winapi-rs,MIT OR Apache-2.0,Peter Atashian <retep998@gmail.com>
windows,https://github.com/microsoft/windows-rs,MIT OR Apache-2.0,Microsoft
windows-collections,https://github.com/microsoft/windows-rs,MIT OR Apache-2.0,The windows-collections Authors
windows-core,https://github.com/microsoft/windows-rs,MIT OR Apache-2.0,Microsoft
windows-core,https://github.com/microsoft/windows-rs,MIT OR Apache-2.0,The windows-core Authors
windows-future,https://github.com/microsoft/windows-rs,MIT OR Apache-2.0,The windows-future Authors
windows-implement,https://github.com/microsoft/windows-rs,MIT OR Apache-2.0,The windows-implement Authors
windows-interface,https://github.com/microsoft/windows-rs,MIT OR Apache-2.0,The windows-interface Authors
windows-link,https://github.com/microsoft/windows-rs,MIT OR Apache-2.0,Microsoft
windows-link,https://github.com/microsoft/windows-rs,MIT OR Apache-2.0,The windows-link Authors
windows-numerics,https://github.com/microsoft/windows-rs,MIT OR Apache-2.0,The windows-numerics Authors
windows-result,https://github.com/microsoft/windows-rs,MIT OR Apache-2.0,Microsoft
windows-result,https://github.com/microsoft/windows-rs,MIT OR Apache-2.0,The windows-result Authors
windows-strings,https://github.com/microsoft/windows-rs,MIT OR Apache-2.0,Microsoft
windows-strings,https://github.com/microsoft/windows-rs,MIT OR Apache-2.0,The windows-strings Authors
windows-sys,https://github.com/microsoft/windows-rs,MIT OR Apache-2.0,Microsoft
windows-sys,https://github.com/microsoft/windows-rs,MIT OR Apache-2.0,The windows-sys Authors
windows-targets,https://github.com/microsoft/windows-rs,MIT OR Apache-2.0,Microsoft
windows-targets,https://github.com/microsoft/windows-rs,MIT OR Apache-2.0,The windows-targets Authors
windows-threading,https://github.com/microsoft/windows-rs,MIT OR Apache-2.0,Microsoft
windows_aarch64_gnullvm,https://github.com/microsoft/windows-rs,MIT OR Apache-2.0,Microsoft
windows_aarch64_gnullvm,https://github.com/microsoft/windows-rs,MIT OR Apache-2.0,The windows_aarch64_gnullvm Authors
windows_aarch64_msvc,https://github.com/microsoft/windows-rs,MIT OR Apache-2.0,Microsoft
windows_aarch64_msvc,https://github.com/microsoft/windows-rs,MIT OR Apache-2.0,The windows_aarch64_msvc Authors
windows_i686_gnu,https://github.com/microsoft/windows-rs,MIT OR Apache-2.0,Microsoft
windows_i686_gnu,https://github.com/microsoft/windows-rs,MIT OR Apache-2.0,The windows_i686_gnu Authors
windows_i686_gnullvm,https://github.com/microsoft/windows-rs,MIT OR Apache-2.0,Microsoft
windows_i686_gnullvm,https://github.com/microsoft/windows-rs,MIT OR Apache-2.0,The windows_i686_gnullvm Authors
windows_i686_msvc,https://github.com/microsoft/windows-rs,MIT OR Apache-2.0,Microsoft
windows_i686_msvc,https://github.com/microsoft/windows-rs,MIT OR Apache-2.0,The windows_i686_msvc Authors
windows_x86_64_gnu,https://github.com/microsoft/windows-rs,MIT OR Apache-2.0,Microsoft
windows_x86_64_gnu,https://github.com/microsoft/windows-rs,MIT OR Apache-2.0,The windows_x86_64_gnu Authors
windows_x86_64_gnullvm,https://github.com/microsoft/windows-rs,MIT OR Apache-2.0,Microsoft
windows_x86_64_gnullvm,https://github.com/microsoft/windows-rs,MIT OR Apache-2.0,The windows_x86_64_gnullvm Authors
windows_x86_64_msvc,https://github.com/microsoft/windows-rs,MIT OR Apache-2.0,Microsoft
windows_x86_64_msvc,https://github.com/microsoft/windows-rs,MIT OR Apache-2.0,The windows_x86_64_msvc Authors
winnow,https://github.com/winnow-rs/winnow,MIT,The winnow Authors
wit-bindgen,https://github.com/bytecodealliance/wit-bindgen,Apache-2.0 WITH LLVM-exception OR Apache-2.0 OR MIT,Alex Crichton <alex@alexcrichton.com>
writeable,https://github.com/unicode-org/icu4x,Unicode-3.0,The ICU4X Project Developers
xmlparser,https://github.com/RazrFalcon/xmlparser,MIT OR Apache-2.0,Yevhenii Reizner <razrfalcon@gmail.com>
yansi,https://github.com/SergioBenitez/yansi,MIT OR Apache-2.0,Sergio Benitez <sb@sergio.bz>
yoke,https://github.com/unicode-org/icu4x,Unicode-3.0,Manish Goregaokar <manishsmail@gmail.com>
yoke-derive,https://github.com/unicode-org/icu4x,Unicode-3.0,Manish Goregaokar <manishsmail@gmail.com>
zerocopy,https://github.com/google/zerocopy,BSD-2-Clause OR Apache-2.0 OR MIT,"Joshua Liebow-Feeser <joshlf@google.com>, Jack Wrenn <jswrenn@amazon.com>"
zerocopy-derive,https://github.com/google/zerocopy,BSD-2-Clause OR Apache-2.0 OR MIT,"Joshua Liebow-Feeser <joshlf@google.com>, Jack Wrenn <jswrenn@amazon.com>"
zerofrom,https://github.com/unicode-org/icu4x,Unicode-3.0,Manish Goregaokar <manishsmail@gmail.com>
zerofrom-derive,https://github.com/unicode-org/icu4x,Unicode-3.0,Manish Goregaokar <manishsmail@gmail.com>
zeroize,https://github.com/RustCrypto/utils,Apache-2.0 OR MIT,The RustCrypto Project Developers
zerotrie,https://github.com/unicode-org/icu4x,Unicode-3.0,The ICU4X Project Developers
zerovec,https://github.com/unicode-org/icu4x,Unicode-3.0,The ICU4X Project Developers
zerovec-derive,https://github.com/unicode-org/icu4x,Unicode-3.0,Manish Goregaokar <manishsmail@gmail.com>
zmij,https://github.com/dtolnay/zmij,MIT,David Tolnay <dtolnay@gmail.com>
zstd,https://github.com/gyscos/zstd-rs,MIT,Alexandre Bury <alexandre.bury@gmail.com>
zstd-safe,https://github.com/gyscos/zstd-rs,MIT OR Apache-2.0,Alexandre Bury <alexandre.bury@gmail.com>
zstd-sys,https://github.com/gyscos/zstd-rs,MIT OR Apache-2.0,Alexandre Bury <alexandre.bury@gmail.com>


================================================
FILE: Makefile
================================================
DOCKER_SERVICES ?= all

QUICKWIT_SRC = quickwit

help:
	@grep '^[^\.#[:space:]].*:' Makefile


IMAGE_TAG := $(shell git branch --show-current | tr '\#/' '-')

QW_COMMIT_DATE := $(shell TZ=UTC0 git log -1 --format=%cd --date=format-local:'%Y-%m-%dT%H:%M:%SZ')
QW_COMMIT_HASH := $(shell git rev-parse HEAD)
QW_COMMIT_TAGS := $(shell git tag --points-at HEAD | tr '\n' ',')

docker-build:
	@docker build \
		--build-arg QW_COMMIT_DATE=$(QW_COMMIT_DATE) \
		--build-arg QW_COMMIT_HASH=$(QW_COMMIT_HASH) \
		--build-arg QW_COMMIT_TAGS=$(QW_COMMIT_TAGS) \
		-t quickwit/quickwit:$(IMAGE_TAG) .

# Usage:
# `make docker-compose-up` starts all the services.
# `make docker-compose-up DOCKER_SERVICES='jaeger,localstack'` starts the subset of services matching the profiles.
docker-compose-up:
	@echo "Launching ${DOCKER_SERVICES} Docker service(s)"
	COMPOSE_PROFILES=$(DOCKER_SERVICES) docker compose -f docker-compose.yml up -d --remove-orphans --wait

docker-compose-down:
	docker compose -p quickwit down --remove-orphans

docker-compose-logs:
	docker compose logs -f docker-compose.yml -t

docker-compose-monitoring:
	COMPOSE_PROFILES=monitoring docker compose -f docker-compose.yml up -d --remove-orphans

docker-rm-postgres-volume:
	docker volume rm quickwit_postgres_data

docker-rm-volumes:
	docker volume rm quickwit_azurite_data quickwit_fake_gcs_server_data quickwit_grafana_conf quickwit_grafana_data quickwit_localstack_data quickwit_postgres_data

doc:
	@$(MAKE) -C $(QUICKWIT_SRC) doc

fmt:
	@$(MAKE) -C $(QUICKWIT_SRC) fmt

fix:
	@$(MAKE) -C $(QUICKWIT_SRC) fix

typos:
	typos

# Usage:
# `make test-all` starts the Docker services and runs all the tests.
# `make -k test-all docker-compose-down`, tears down the Docker services after running all the tests.
test-all: docker-compose-up
	@$(MAKE) -C $(QUICKWIT_SRC) test-all

test-failpoints:
	@$(MAKE) -C $(QUICKWIT_SRC) test-failpoints

# This will build and push all custom cross images for cross-compilation.
# You will need to login into Docker Hub with the `quickwit` account.
IMAGE_TAGS = x86_64-unknown-linux-gnu aarch64-unknown-linux-gnu x86_64-unknown-linux-musl aarch64-unknown-linux-musl

.PHONY: cross-images
cross-images:
	@for tag in ${IMAGE_TAGS}; do \
		docker build --tag quickwit/cross:$$tag --file ./build/cross-images/$$tag.dockerfile ./build/cross-images; \
		docker push quickwit/cross:$$tag; \
	done

# TODO: to be replaced by https://github.com/quickwit-oss/quickwit/issues/237
.PHONY: build
build: build-ui
	$(MAKE) -C $(QUICKWIT_SRC) build

# Usage:
# `BINARY_FILE=path/to/quickwit/binary BINARY_VERSION=0.1.0 ARCHIVE_NAME=quickwit make archive`
# - BINARY_FILE: Path of the quickwit binary file.
# - BINARY_VERSION: Version of the quickwit binary.
# - ARCHIVE_NAME: Name of the resulting archive file (without extension).
.PHONY: archive
archive:
	@echo "Archiving release binary & assets"
	@mkdir -p "./quickwit-${BINARY_VERSION}/config"
	@mkdir -p "./quickwit-${BINARY_VERSION}/qwdata"
	@cp ./config/quickwit.yaml "./quickwit-${BINARY_VERSION}/config"
	@cp ./LICENSE "./quickwit-${BINARY_VERSION}"
	@cp "${BINARY_FILE}" "./quickwit-${BINARY_VERSION}"
	@tar -czf "${ARCHIVE_NAME}.tar.gz" "./quickwit-${BINARY_VERSION}"
	@rm -rf "./quickwit-${BINARY_VERSION}"

workspace-deps-tree:
	$(MAKE) -C $(QUICKWIT_SRC) workspace-deps-tree

.PHONY: build-rustdoc
build-rustdoc:
	$(MAKE) -C $(QUICKWIT_SRC) build-rustdoc

.PHONY: build-ui
build-ui:
	$(MAKE) -C $(QUICKWIT_SRC) build-ui


================================================
FILE: README.md
================================================
[![CI](https://github.com/quickwit-oss/quickwit/actions/workflows/ci.yml/badge.svg)](https://github.com/quickwit-oss/quickwit/actions?query=workflow%3ACI+branch%3Amain)
[![codecov](https://codecov.io/gh/quickwit-oss/quickwit/branch/main/graph/badge.svg?token=06SRGAV5SS)](https://codecov.io/gh/quickwit-oss/quickwit)
[![OpenSSF Scorecard](https://api.scorecard.dev/projects/github.com/quickwit-oss/quickwit/badge)](https://scorecard.dev/viewer/?uri=github.com/quickwit-oss/quickwit)
[![Contributor Covenant](https://img.shields.io/badge/Contributor%20Covenant-2.0-4baaaa.svg)](CODE_OF_CONDUCT.md)
[![License: Apache 2.0](https://img.shields.io/badge/license-Apache%202.0-blue?style=flat-square)](LICENSE)
[![Twitter Follow](https://img.shields.io/twitter/follow/Quickwit_Inc?color=%231DA1F2&logo=Twitter&style=plastic)](https://twitter.com/Quickwit_Inc)
[![Discord](https://img.shields.io/discord/908281611840282624?logo=Discord&logoColor=%23FFFFFF&style=plastic)](https://discord.quickwit.io)
<br/>

<br/>
<br/>
<p align="center">
  <img src="docs/assets/images/logo_horizontal.svg#gh-light-mode-only" alt="Quickwit Cloud-Native Search Engine" height="40">
  <img src="docs/assets/images/quickwit-dark-theme-logo.png#gh-dark-mode-only" alt="Quickwit Cloud-Native Search Engine" height="40">
</p>

<h2 align="center">
Cloud-native search engine for observability (logs, traces, and soon metrics!). An open-source alternative to Datadog, Elasticsearch,  Loki, and Tempo.
</h2>

<h4 align="center">
  <a href="https://quickwit.io/docs/get-started/quickstart">Quickstart</a> |
  <a href="https://quickwit.io/docs/">Docs</a> |
  <a href="https://quickwit.io/tutorials">Tutorials</a> |
  <a href="https://discord.quickwit.io">Chat</a> |
  <a href="https://quickwit.io/docs/get-started/installation">Download</a>
</h4>
<br/>

<b>We just released Quickwit 0.8! Read the [blog post](https://quickwit.io/blog/quickwit-0.8) to learn about the latest powerful features!</b>

### **Quickwit is the fastest search engine on cloud storage. It's the perfect fit for observability use cases**

- [Log management](https://quickwit.io/docs/log-management/overview)
- [Distributed tracing](https://quickwit.io/docs/distributed-tracing/overview)
- Metrics support is on the roadmap

### 🚀 Quickstart

- [Search and analytics on Stack Overflow dataset](https://quickwit.io/docs/get-started/quickstart)
- [Trace analytics with Grafana](https://quickwit.io/docs/get-started/tutorials/trace-analytics-with-grafana)
- [Distributed tracing with Jaeger](https://quickwit.io/docs/get-started/tutorials/tutorial-jaeger)

<br/>

<video src="https://github.com/quickwit-oss/quickwit/assets/653704/020b94b9-deeb-4376-9a3a-b82e1168094c" controls="controls" style="max-width: 1200px;">
</video>

<br/>

# 💡 Features

- Full-text search and aggregation queries
- Elasticsearch-compatible API, use Quickwit with any Elasticsearch or OpenSearch client
- [Jaeger-native](https://quickwit.io/docs/distributed-tracing/plug-quickwit-to-jaeger)
- OTEL-native for [logs](https://quickwit.io/docs/log-management/overview) and [traces](https://quickwit.io/docs/distributed-tracing/overview)
- [Schemaless](https://quickwit.io/docs/guides/schemaless) or strict schema indexing
- Schemaless analytics
- Sub-second search on cloud storage (Amazon S3, Azure Blob Storage, Google Cloud Storage, …)
- Decoupled compute and storage, stateless indexers & searchers
- [Grafana data source](https://github.com/quickwit-oss/quickwit-datasource)
- Kubernetes ready - See our [helm-chart](https://quickwit.io/docs/deployment/kubernetes/helm)
- RESTful API

## Enterprise ready

- Multiple [data sources](https://quickwit.io/docs/ingest-data/) Kafka / Kinesis / Pulsar native
- Multi-tenancy: indexing with many indexes and partitioning
- Retention policies
- Delete tasks (for GDPR use cases)
- Distributed and highly available* engine that scales out in seconds (*HA indexing only with Kafka)

# 📑 Architecture overview

![Quickwit Distributed Tracing](./docs/assets/images/quickwit-overview-light.svg#gh-light-mode-only)![Quickwit Distributed Tracing](./docs/assets/images/quickwit-overview-dark.svg#gh-dark-mode-only)

- [Architecture overview]([https://quickwit.io/docs/distributed-tracing/overview](https://quickwit.io/docs/overview/architecture))
- [Log management](https://quickwit.io/docs/log-management/overview)
- [Distributed traces](https://quickwit.io/docs/distributed-tracing/overview)


# 📕 Documentation

- [Installation](https://quickwit.io/docs/get-started/installation)
- [Log management with Quickwit](https://quickwit.io/docs/log-management/overview)
- [Distributed Tracing with Quickwit](https://quickwit.io/docs/distributed-tracing/overview)
- [Ingest data](https://quickwit.io/docs/ingest-data/)
- [REST API](https://quickwit.io/docs/reference/rest-api)

# 📚 Resources

- [Blog posts](https://quickwit.io/blog/)
- [Youtube channel](https://www.youtube.com/@quickwit8103)
- [Discord](https://discord.quickwit.io)

# 🔮 Roadmap

- Quickwit 0.9 (July 2024)
  - Indexing and search performance improvements
  - Index configuration updates (retention policy, indexing and search settings)
  - Concatenated field

- Quickwit 0.10 (October 2024)
  - Schema (doc mapping) updates
  - Native distributed ingestion
  - Index templates

# 🙋 FAQ

### How can I switch from Elasticsearch or OpenSearch to Quickwit?

Quickwit supports a large subset of Elasticsearch/OpenSearch API.

For instance, it has an ES-compatible ingest API to make it easier to migrate your log shippers (Vector, Fluent Bit, Syslog, ...) to Quickwit.

On the search side, the most popular Elasticsearch endpoints, query DSL, and even aggregations are supported.

The list of available endpoints and queries is available [here](https://quickwit.io/docs/reference/es_compatible_api), while the list of supported aggregations is available [here](https://quickwit.io/docs/reference/aggregation).

Let us know if part of the API you are using is missing!

If the client you are using is refusing to connect to Quickwit due to missing headers, you can use the `extra_headers` option in the [node configuration](https://quickwit.io/docs/configuration/node-config#rest-configuration) to impersonate any compatible version of Elasticsearch or OpenSearch.

### How is Quickwit different from traditional search engines like Elasticsearch or Solr?

The core difference and advantage of Quickwit is its architecture built from the ground to search on cloud storage. We optimized IO paths, revamped the index data structures and made search stateless and sub-second on cloud storage.

### How does Quickwit compare to Elastic in terms of cost?

We estimate that Quickwit can be up to 10x cheaper on average than Elastic. To understand how, check out our [blog post](https://quickwit.io/blog/commoncrawl/) about searching the web on AWS S3.

### What license does Quickwit use?

Quickwit is open-source under the Apache License, Version 2.0 - Apache-2.0.

### Is it possible to set up Quickwit for a High Availability (HA)?

HA is available for search, for indexing it's available only with a Kafka source.

# 🤝 Contribute and spread the word

We are always thrilled to receive contributions: code, documentation, issues, or feedback. Here's how you can help us build the future of log management:

- Start by checking out the [GitHub issues labeled "Good first issue"](https://github.com/quickwit-oss/quickwit/issues?q=is%3Aissue+is%3Aopen+label%3A%22good+first+issue%22). These are a great place for newcomers to contribute.
- Read our [Contributor Covenant Code of Conduct](./CODE_OF_CONDUCT.md) to understand our community standards.
- [Create a fork of Quickwit](https://github.com/quickwit-oss/quickwit/fork) to have your own copy of the repository where you can make changes.
- To understand how to contribute, read our [contributing guide](./CONTRIBUTING.md).
- Set up your development environment following our [development setup guide](./CONTRIBUTING.md#development).
- Once you've made your changes and tested them, you can contribute by [submitting a pull request](./CONTRIBUTING.md#submitting-a-pr).

✨ After your contributions are accepted, don't forget to claim your swag by emailing us at hello@quickwit.io. Thank you for contributing!

# 💬 Join Our Community

We welcome everyone to our community! Whether you're contributing code or just saying hello, we'd love to hear from you. Here's how you can connect with us:

- Join the conversation on [Discord](https://discord.quickwit.io).
- Follow us on [Twitter](https://twitter.com/Quickwit_Inc).
- Check out our [website](https://quickwit.io/) and [blog](https://quickwit.io/blog) for the latest updates.
- Watch our [YouTube](https://www.youtube.com/channel/UCvZVuRm2FiDq1_ul0mY85wA) channel for video content.


================================================
FILE: SECURITY.md
================================================
# Security Policy

## Supported Versions

| Version | Supported          |
| ------- | ------------------ |
| 0.3.1   | :white_check_mark: |
| < 0.3.1   | :x:                |

## Reporting a Vulnerability

To disclose a vulnerability in our code, please notify us by email at security@quickwit.io or private message _@fulmicoton_ or _@guilload_ on our Discord 
server ([discord.quickwit.io](https://discord.quickwit.io)). We will open a draft security advisory on our repository and grant you access so you can
share with us more details about the vulnerability. After releasing a fix, we will publish the security advisory to publicly disclose the security vulnerability
to the project's community.


================================================
FILE: _typos.toml
================================================
[files]
extend-exclude = ["**/*.json"]

[default.extend-words]
# Don't correct the surname "Teh"
strat = "strat"


================================================
FILE: build/cross-images/aarch64-unknown-linux-gnu.dockerfile
================================================
FROM ghcr.io/cross-rs/aarch64-unknown-linux-gnu:0.2.4@sha256:3356619b020614effd22e83cec41236e69f17ce581ffe35e252898b0c693b4e2

ARG PBC_URL="https://github.com/protocolbuffers/protobuf/releases/download/v21.5/protoc-21.5-linux-x86_64.zip"

#TODO: 
# We can switch to static linking (remove `libsasl2-dev:arm64`) using 
# `rdkafka/gssapi-vendored` feature when there is a release including: 
# https://github.com/MaterializeInc/rust-sasl/pull/48

RUN dpkg --add-architecture arm64 && \
    apt-get update && \
    apt-get install -y clang-3.9 \
        libclang-3.9-dev \
        binutils-aarch64-linux-gnu \
        libsasl2-dev:arm64 \
        unzip && \
    rm -rf /var/lib/apt/lists/*

RUN curl -fLO $PBC_URL && \
    unzip protoc-21.5-linux-x86_64.zip -d ./protobuf && \
    mv ./protobuf/bin/protoc /usr/bin/ && \
    rm -rf ./protobuf protoc-21.5-linux-x86_64.zip

ENV LIBZ_SYS_STATIC=1 \
    PKG_CONFIG_ALLOW_CROSS=true \
    PKG_CONFIG_ALL_STATIC=true \
    X86_64_UNKNOWN_LINUX_MUSL_OPENSSL_STATIC=1 \
    X86_64_UNKNOWN_LINUX_MUSL_OPENSSL_DIR=/usr/local/musl/


================================================
FILE: build/cross-images/aarch64-unknown-linux-musl.dockerfile
================================================
FROM rustembedded/cross:aarch64-unknown-linux-musl@sha256:22627e0ba533781062127b13601c37216fdca27123390b07dfabd3f31f3c84a0


# The Rust toolchain to use when building our image.  Set by `hooks/build`.
# ARG TOOLCHAIN=stable

# The OpenSSL version to use. Here is the place to check for new releases:
#
# - https://www.openssl.org/source/
#
# ALSO UPDATE hooks/build!
ARG OPENSSL_VERSION=1.1.1i
ARG ZLIB_VERSION=1.2.11

RUN echo "Building OpenSSL" && \
    cd /tmp && \
    short_version="$(echo "$OPENSSL_VERSION" | sed s'/[a-z]$//' )" && \
    curl -fLO "https://www.openssl.org/source/openssl-$OPENSSL_VERSION.tar.gz" || \
        curl -fLO "https://www.openssl.org/source/old/$short_version/openssl-$OPENSSL_VERSION.tar.gz" && \
    tar xvzf "openssl-$OPENSSL_VERSION.tar.gz" && cd "openssl-$OPENSSL_VERSION" && \
    AR=aarch64-linux-musl-ar CC=aarch64-linux-musl-gcc ./Configure no-zlib -fPIC --prefix=/usr/local/aarch64-linux-musl -DOPENSSL_NO_SECURE_MEMORY linux-aarch64 && \
    env C_INCLUDE_PATH=/usr/local/aarch64-linux-musl/include/ make depend && \
    env C_INCLUDE_PATH=/usr/local/aarch64-linux-musl/include/ make && \
    make install && \
    rm -r /tmp/*

RUN echo "Building zlib" && \
    cd /tmp && \
    curl -fLO "https://zlib.net/fossils/zlib-$ZLIB_VERSION.tar.gz" && \
    tar xzf "zlib-$ZLIB_VERSION.tar.gz" && cd "zlib-$ZLIB_VERSION" && \
    AR=aarch64-linux-musl-ar CC=aarch64-linux-musl-gcc ./configure --static --prefix=/usr/local/aarch64-linux-musl && \
    make && make install && \
    rm -r /tmp/*

ENV AARCH64_UNKNOWN_LINUX_MUSL_OPENSSL_STATIC=1 \
    CC=aarch64-linux-musl-gcc \
    CFLAGS=-I/usr/local/aarch64-linux-musl/include \
    LIBZ_SYS_STATIC=1 \
    LIB_LDFLAGS=-L/usr/local/aarch64-linux-musl/lib \
    OPENSSL_INCLUDE_DIR=/usr/local/aarch64-linux-musl/include/openssl \
    OPENSSL_LIB_DIR=/usr/local/aarch64-linux-musl/lib \
    PKG_CONFIG_ALLOW_CROSS=true \
    PKG_CONFIG_ALL_STATIC=true \
    TARGET=aarch64-unknown-linux-musl \
    AARCH64_UNKNOWN_LINUX_MUSL_OPENSSL_DIR=/usr/local/aarch64-linux-musl \
    OPENSSL_ROOT_DIR=/usr/local/aarch64-linux-musl


================================================
FILE: build/cross-images/x86_64-unknown-linux-gnu.dockerfile
================================================
FROM ghcr.io/cross-rs/x86_64-unknown-linux-gnu:0.2.4@sha256:7c9067212c2283be2a1d5585af5ecebd4c4a2e18091e2a6aafd23f9b4b81d496

ARG PBC_URL="https://github.com/protocolbuffers/protobuf/releases/download/v21.5/protoc-21.5-linux-x86_64.zip"

RUN apt-get update && \
    apt-get install -y clang-3.9 \
        libclang-3.9-dev \
        libsasl2-dev \
        unzip && \
    rm -rf /var/lib/apt/lists/*

RUN curl -fLO $PBC_URL && \
    unzip protoc-21.5-linux-x86_64.zip -d ./protobuf && \
    mv ./protobuf/bin/protoc /usr/bin/ && \
    rm -rf ./protobuf protoc-21.5-linux-x86_64.zip


================================================
FILE: build/cross-images/x86_64-unknown-linux-musl.dockerfile
================================================
FROM quickwit/cross-base:x86_64-unknown-linux-musl@sha256:5bcc7843aab64f89bf85c464fa2c5a00ecc634a8b1ac88c84a864f60054450cb
# See https://github.com/quickwit-inc/rust-musl-builder

RUN echo "Upgrading CMake" && \
    sudo apt-get remove cmake -y && \
    curl -fLO https://www.cmake.org/files/v3.12/cmake-3.12.1.tar.gz && \
    tar -xvzf cmake-3.12.1.tar.gz && \
    cd cmake-3.12.1/ && ./configure && \
    sudo make install
    
ENV CC=musl-gcc \
    CFLAGS=-I/usr/local/musl/include \
    LIB_LDFLAGS=-L/usr/lib/x86_64-linux-gnu


================================================
FILE: config/quickwit.yaml
================================================
# ============================ Node Configuration ==============================
#
# Website: https://quickwit.io
# Docs: https://quickwit.io/docs/configuration/node-config
#
# Configure AWS credentials: https://quickwit.io/docs/guides/aws-setup#aws-credentials
#
# -------------------------------- General settings --------------------------------
#
# Config file format version.
#
version: 0.8
#
# Node ID. Must be unique within a cluster. If not set, a random node ID is generated on each startup.
#
# node_id: node-1
#
# Quickwit opens three sockets.
# - for its HTTP server, hosting the UI and the REST API (TCP)
# - for its gRPC service (TCP)
# - for its Gossip cluster membership service (UDP)
#
# All three services are bound to the same host and a different port. The host can be an IP address or a hostname.
#
# Default HTTP server host is `127.0.0.1` and default HTTP port is 7280.
# The default host value was chosen to avoid exposing the node to the open-world without users' explicit consent.
# This allows for testing Quickwit in single-node mode or with multiple nodes running on the same host and listening
# on different ports. However, in cluster mode, using this value is never appropriate because it causes the node to
# ignore incoming traffic.
# There are two options to set up a node in cluster mode:
#   1. specify the node's hostname or IP
#   2. pass `0.0.0.0` and let Quickwit do its best to discover the node's IP (see `advertise_address`)
#
# listen_address: 127.0.0.1
#
# rest:
#   listen_port: 7280
#   cors_allow_origins:
#     - "http://localhost:3000"
#   extra_headers:
#     x-header-1: header-value-1
#     x-header-2: header-value-2
#
# grpc:
#   max_message_size: 10 MiB
#
# IP address advertised by the node, i.e. the IP address that peer nodes should use to connect to the node for RPCs.
# The environment variable `QW_ADVERTISE_ADDRESS` can also be used to override this value.
# The default advertise address is `listen_address`. If `listen_address` is unspecified (`0.0.0.0`),
# Quickwit attempts to sniff the node's IP by scanning the available network interfaces.
# advertise_address: 192.168.0.42
#
# In order to join a cluster, one needs to specify a list of
# seeds to connect to. If no port is specified, Quickwit will assume
# the seeds are using the same port as the current node gossip port.
# By default, the peer seed list is empty.
#
# peer_seeds:
#   - quickwit-searcher-0.local
#   - quickwit-searcher-1.local:10000
#
# Path to directory where temporary data (caches, intermediate indexing data structures)
# is stored. Defaults to `./qwdata`.
#
# data_dir: /path/to/data/dir
#
# Metastore URI. Defaults to `data_dir/indexes#polling_interval=30s`,
# which is a file-backed metastore and mostly convenient for testing. A cluster would
# require a metastore backed by Amzon S3 or PostgreSQL.
#
# metastore_uri: s3://your-bucket/indexes
# metastore_uri: postgres://username:password@host:port/db
#
# When using a file-backed metastore, the state of the metastore will be cached forever.
# If you are indexing and searching from different processes, it is possible to periodically
# refresh the state of the metastore on the searcher using the `polling_interval` hashtag.
#
# metastore_uri: s3://your-bucket/indexes#polling_interval=30s
#
# Default index root URI, which defines where index data (splits) is stored,
# following the scheme `{default_index_root_uri}/{index-id}`. Defaults to `{data_dir}/indexes`.
#
# default_index_root_uri: s3://your-bucket/indexes
#
# -------------------------------- Storage settings --------------------------------
# https://quickwit.io/docs/configuration/node-config#storage-configuration
#
# Hardcoding credentials into configuration files is not secure and strongly
# discouraged. Prefer the alternative authentication methods that your storage
# backend may provide.
#
# storage:
#   azure:
#     account: ${QW_AZURE_STORAGE_ACCOUNT}
#     access_key: ${QW_AZURE_STORAGE_ACCESS_KEY}
#
#   s3:
#     access_key_id: ${AWS_ACCESS_KEY_ID}
#     secret_access_key: ${AWS_SECRET_ACCESS_KEY}
#     region: ${AWS_REGION}
#     endpoint: ${QW_S3_ENDPOINT}
#     force_path_style_access: ${QW_S3_FORCE_PATH_STYLE_ACCESS:-false}
#     disable_multi_object_delete: false
#     disable_multipart_upload: false
#
# -------------------------------- Metastore settings --------------------------------
# https://quickwit.io/docs/configuration/node-config#metastore-configuration
#
# metastore:
#   postgres:
#     min_connections: 0
#     max_connections: 10
#     acquire_connection_timeout: 10s
#     idle_connection_timeout: 10min
#     max_connection_lifetime: 30min
#
# -------------------------------- Indexer settings --------------------------------
# https://quickwit.io/docs/configuration/node-config#indexer-configuration

indexer:
  enable_otlp_endpoint: ${QW_ENABLE_OTLP_ENDPOINT:-true}
#   split_store_max_num_bytes: 100G
#   split_store_max_num_splits: 1000
#   max_concurrent_split_uploads: 12
#
#
# -------------------------------- Ingest API settings ------------------------------
# https://quickwit.io/docs/configuration/node-config#ingest-api-configuration
#
# ingest_api:
#   max_queue_memory_usage: 2GiB
#   max_queue_disk_usage: 4GiB
#   content_length_limit: 10MiB
#
# -------------------------------- Searcher settings --------------------------------
# https://quickwit.io/docs/configuration/node-config#searcher-configuration
#
# searcher:
#   fast_field_cache_capacity: 1G
#   split_footer_cache_capacity: 500M
#   partial_request_cache_capacity: 64M
#   max_num_concurrent_split_streams: 100
#   max_num_concurrent_split_searches: 100
#   aggregation_memory_limit: 500M
#   aggregation_bucket_limit: 65000
#   split_cache:
#      max_num_bytes: 1G
#      max_num_splits: 10000
#      num_concurrent_downloads: 1
# -------------------------------- Jaeger settings --------------------------------

jaeger:
  enable_endpoint: ${QW_ENABLE_JAEGER_ENDPOINT:-true}


================================================
FILE: config/templates/gh-archive.yaml
================================================
version: 0.8

template_id: gh-archive

index_id_patterns:
  - gh-archive*

description: Index config template for the GH Archive dataset (gharchive.org)

priority: 0

doc_mapping:
  field_mappings:
    - name: id
      type: text
      tokenizer: raw
    - name: type
      type: text
      fast: true
      tokenizer: raw
    - name: public
      type: bool
      fast: true
    - name: payload
      type: json
      tokenizer: default
    - name: org
      type: json
      tokenizer: default
    - name: repo
      type: json
      tokenizer: default
    - name: actor
      type: json
      tokenizer: default
    - name: other
      type: json
      tokenizer: default
    - name: created_at
      type: datetime
      fast: true
      input_formats:
        - rfc3339
      fast_precision: seconds
  timestamp_field: created_at

indexing_settings:
  commit_timeout_secs: 10


================================================
FILE: config/templates/stackoverflow.yaml
================================================
version: 0.8

template_id: stackoverflow

index_id_patterns:
  - stackoverflow*

description: Index config template for the Stackoverflow tutorial (quickwit.io/docs/get-started/quickstart)

priority: 0

doc_mapping:
  field_mappings:
    - name: title
      type: text
      tokenizer: default
      record: position
      stored: true
    - name: body
      type: text
      tokenizer: default
      record: position
      stored: true
    - name: creationDate
      type: datetime
      fast: true
      input_formats:
        - rfc3339
      fast_precision: seconds
  timestamp_field: creationDate

search_settings:
  default_search_fields: [title, body]

indexing_settings:
  commit_timeout_secs: 10


================================================
FILE: config/tutorials/fluentbit-logs/index-config.yaml
================================================
version: 0.8

index_id: fluentbit-logs

doc_mapping:
  mode: dynamic
  field_mappings:
    - name: timestamp
      type: datetime
      input_formats:
        - unix_timestamp
      output_format: unix_timestamp_secs
      fast: true
  timestamp_field: timestamp

indexing_settings:
  commit_timeout_secs: 10


================================================
FILE: config/tutorials/gh-archive/index-config-for-clickhouse.yaml
================================================
#
# Index config file for gh-archive dataset.
#
version: 0.8

index_id: gh-archive

doc_mapping:
  store_source: false
  field_mappings:
    - name: id
      type: u64
      fast: true
    - name: created_at
      type: datetime
      input_formats:
        - unix_timestamp
      output_format: unix_timestamp_secs
      fast_precision: seconds
      fast: true
    - name: event_type
      type: text
      tokenizer: raw
    - name: title
      type: text
      tokenizer: default
      record: position
    - name: body
      type: text
      tokenizer: default
      record: position
  timestamp_field: created_at

search_settings:
  default_search_fields: [title, body]


================================================
FILE: config/tutorials/gh-archive/index-config.yaml
================================================
#
# Index config file for gh-archive dataset.
#
version: 0.8

index_id: gh-archive

doc_mapping:
  field_mappings:
    - name: id
      type: text
      tokenizer: raw
    - name: type
      type: text
      fast: true
      tokenizer: raw
    - name: public
      type: bool
      fast: true
    - name: payload
      type: json
      tokenizer: default
    - name: org
      type: json
      tokenizer: default
    - name: repo
      type: json
      tokenizer: default
    - name: actor
      type: json
      tokenizer: default
    - name: other
      type: json
      tokenizer: default
    - name: created_at
      type: datetime
      fast: true
      input_formats:
        - rfc3339
      fast_precision: seconds
  timestamp_field: created_at

indexing_settings:
  commit_timeout_secs: 10


================================================
FILE: config/tutorials/gh-archive/kafka-source.yaml
================================================
version: 0.8
source_id: kafka-source
source_type: kafka
num_pipelines: 2
params:
  topic: gh-archive
  client_params:
    bootstrap.servers: localhost:9092


================================================
FILE: config/tutorials/gh-archive/kinesis-source.yaml
================================================
version: 0.8
source_id: kinesis-source
source_type: kinesis
params:
  stream_name: gh-archive


================================================
FILE: config/tutorials/grafana/docker-compose.yml
================================================
version: "3.9"

networks:
  default:
    name: quickwit-grafana
    # ipam:
    #   config:
    #   - subnet: 172.16.7.0/24
    #     gateway: 172.16.7.1

services:
  quickwit:
    image: quickwit/quickwit:${QUICKWIT_VERSION:-0.7.1}
  grafana:
    image: grafana/grafana-oss:${GRAFANA_VERSION:-9.4.7}
    container_name: grafana
    ports:
      - "${MAP_HOST_GRAFANA:-127.0.0.1}:3000:3000"
    environment:
      GF_AUTH_DISABLE_LOGIN_FORM: "true"
      GF_AUTH_ANONYMOUS_ENABLED: "true"
      GF_AUTH_ANONYMOUS_ORG_ROLE: Admin
    volumes:
      - ./monitoring/grafana/dashboards:/var/lib/grafana/dashboards
      - ./monitoring/grafana/provisioning:/etc/grafana/provisioning

  jaeger:
    image: jaegertracing/all-in-one:${JAEGER_VERSION:-1.48.0}
    container_name: jaeger
    ports:
      - "${MAP_HOST_JAEGER:-127.0.0.1}:16686:16686" # Frontend
    profiles:
      - jaeger
      - monitoring

  otel-collector:
    image: otel/opentelemetry-collector:${OTEL_VERSION:-0.84.0}
    container_name: otel-collector
    ports:
      - "${MAP_HOST_OTEL:-127.0.0.1}:1888:1888"   # pprof extension
      - "${MAP_HOST_OTEL:-127.0.0.1}:8888:8888"   # Prometheus metrics exposed by the collector
      - "${MAP_HOST_OTEL:-127.0.0.1}:8889:8889"   # Prometheus exporter metrics
      - "${MAP_HOST_OTEL:-127.0.0.1}:13133:13133" # health_check extension
      - "${MAP_HOST_OTEL:-127.0.0.1}:4317:4317"   # OTLP gRPC receiver
      - "${MAP_HOST_OTEL:-127.0.0.1}:4318:4318"   # OTLP http receiver
      - "${MAP_HOST_OTEL:-127.0.0.1}:55679:55679" # zpages extension
    profiles:
      - otel
      - monitoring
    volumes:
      - ./monitoring/otel-collector-config.yaml:/etc/otel-collector-config.yaml
    command: ["--config=/etc/otel-collector-config.yaml"]

  prometheus:
    image: prom/prometheus:${PROMETHEUS_VERSION:-v2.43.0}
    container_name: prometheus
    ports:
      - "${MAP_HOST_PROMETHEUS:-127.0.0.1}:9090:9090"
    profiles:
      - prometheus
      - monitoring
    volumes:
      - ./monitoring/prometheus.yaml:/etc/prometheus/prometheus.yml
    extra_hosts:
      - "host.docker.internal:host-gateway"

  gcp-pubsub-emulator:
    # It is not an official docker image
    # if we prefer we can build a docker from the official docker image (gcloud cli)
    # and install the pubsub emulator https://cloud.google.com/pubsub/docs/emulator
    image: thekevjames/gcloud-pubsub-emulator:${GCLOUD_EMULATOR:-455.0.0}
    container_name: gcp-pubsub-emulator
    ports:
      - "${MAP_HOST_GCLOUD_EMULATOR:-127.0.0.1}:8681:8681"
    environment:
      # create a fake gcp project and a topic / subscription
      - PUBSUB_PROJECT1=quickwit-emulator,emulator_topic:emulator_subscription
    profiles:
      - all
      - gcp-pubsub

volumes:
  localstack_data:
  postgres_data:
  azurite_data:


================================================
FILE: config/tutorials/hdfs-logs/index-config-partitioned.yaml
================================================
#
# Index config file for hdfs-logs dataset with partitioning configured.
#

version: 0.8

index_id: hdfs-logs-partitioned

doc_mapping:
  field_mappings:
    - name: timestamp
      type: datetime
      input_formats:
        - unix_timestamp
      output_format: unix_timestamp_secs
      fast_precision: seconds
      fast: true
    - name: tenant_id
      type: u64
    - name: severity_text
      type: text
      tokenizer: raw
    - name: body
      type: text
      tokenizer: default
      record: position
    - name: resource
      type: json
      tokenizer: raw
  tag_fields: [tenant_id]
  partition_key: tenant_id
  max_num_partitions: 1000
  timestamp_field: timestamp

search_settings:
  default_search_fields: [severity_text, body]

indexing_settings:
  commit_timeout_secs: 30
  split_num_docs_target: 10000000
  merge_policy:
    type: "limit_merge"
    merge_factor: 10
    max_merge_ops: 3
    maturation_period: 48 hours


================================================
FILE: config/tutorials/hdfs-logs/index-config-retention-policy.yaml
================================================
#
# Index config file for hdfs-logs dataset with a retention policy configured.
#

version: 0.8

index_id: hdfs-logs-retention-policy

doc_mapping:
  field_mappings:
    - name: timestamp
      type: datetime
      input_formats:
        - unix_timestamp
      output_format: unix_timestamp_secs
      fast_precision: seconds
      fast: true
    - name: tenant_id
      type: u64
    - name: severity_text
      type: text
      tokenizer: raw
    - name: body
      type: text
      tokenizer: default
      record: position
    - name: resource
      type: json
      tokenizer: raw
  tag_fields: [tenant_id]
  timestamp_field: timestamp

search_settings:
  default_search_fields: [severity_text, body]

retention:
  period: 90 days
  schedule: daily

indexing_settings:
  commit_timeout_secs: 10
  split_num_docs_target: 10000000


================================================
FILE: config/tutorials/hdfs-logs/index-config.yaml
================================================
#
# Index config file for hdfs-logs dataset.
#

version: 0.8

index_id: hdfs-logs

doc_mapping:
  field_mappings:
    - name: timestamp
      type: datetime
      input_formats:
        - unix_timestamp
      output_format: unix_timestamp_secs
      fast_precision: seconds
      fast: true
    - name: tenant_id
      type: u64
    - name: severity_text
      type: text
      tokenizer: raw
    - name: body
      type: text
      tokenizer: default
      record: position
    - name: resource
      type: json
      tokenizer: raw
  tag_fields: [tenant_id]
  timestamp_field: timestamp

search_settings:
  default_search_fields: [severity_text, body]


================================================
FILE: config/tutorials/hdfs-logs/searcher-1.yaml
================================================
version: 0.8
node_id: searcher-1
listen_address: 127.0.0.1
rest:
  listen_port: 7280
ingest_api:
  max_queue_memory_usage: 4GiB
  max_queue_disk_usage: 8GiB
peer_seeds:
  - 127.0.0.1:7290 # searcher-2
  - 127.0.0.1:7300 # searcher-3


================================================
FILE: config/tutorials/hdfs-logs/searcher-2.yaml
================================================
version: 0.8
node_id: searcher-2
listen_address: 127.0.0.1
rest:
  listen_port: 7290
peer_seeds:
  - 127.0.0.1:7280 # searcher-1
  - 127.0.0.1:7300 # searcher-3


================================================
FILE: config/tutorials/hdfs-logs/searcher-3.yaml
================================================
version: 0.8
node_id: searcher-3
listen_address: 127.0.0.1
rest:
  listen_port: 7300
peer_seeds:
  - 127.0.0.1:7280 # searcher-1
  - 127.0.0.1:7290 # searcher-2


================================================
FILE: config/tutorials/otel-logs/index-config.yaml
================================================
#
# Index config file for receiving logs in OpenTelemetry format.
# Link: https://github.com/open-telemetry/opentelemetry-specification/blob/main/specification/logs/data-model.md
#

version: 0.8

index_id: otel-log-v0

doc_mapping:
  field_mappings:
    - name: timestamp
      type: datetime
      input_formats:
        - unix_timestamp
      output_format: unix_timestamp_secs
      fast: true
    - name: severity
      type: text
      tokenizer: raw
      fast: true
    - name: body
      type: text
      tokenizer: default
      record: position
    - name: attributes
      type: json
    - name: resource
      type: json
  timestamp_field: timestamp

search_settings:
  default_search_fields: [severity, body]


================================================
FILE: config/tutorials/otel-logs/kafka-source.yaml
================================================
version: 0.8
source_id: kafka-source
source_type: kafka
input_format: otlp_logs_proto
params:
  topic: otlp_logs
  client_params:
    bootstrap.servers: localhost:9092


================================================
FILE: config/tutorials/otel-logs/otel-values.yaml
================================================
mode: "daemonset"
presets:
  logsCollection:
    enabled: true
  kubernetesAttributes:
    enabled: true
config:
  exporters:
    otlp:
      endpoint: quickwit-indexer.qw-tutorial.svc.cluster.local:7281
      tls:
        insecure: true
  service:
    pipelines:
      logs:
        exporters:
          - otlp


================================================
FILE: config/tutorials/otel-traces/index-config.yaml
================================================
#
# Index config file for receiving logs in OpenTelemetry format.
# Link: https://github.com/open-telemetry/opentelemetry-specification/blob/main/specification/logs/data-model.md
#

version: 0.8

index_id: otel-trace-v0

doc_mapping:
  mode: lenient
  field_mappings:
    - name: trace_id
      type: bytes
    - name: trace_state
      type: text
      indexed: false
    - name: resource_attributes
      type: json
      tokenizer: raw
    - name: resource_dropped_attributes_count
      type: u64
      indexed: false
    - name: service_name
      type: text
      tokenizer: raw
    - name: span_id
      type: bytes
    - name: span_kind
      type: u64
    - name: span_name
      type: text
      tokenizer: raw
    - name: span_start_timestamp_secs
      type: datetime
      indexed: true
      fast_precision: seconds
      fast: true
      input_formats: [unix_timestamp]
      output_format: unix_timestamp_secs
    - name: span_start_timestamp_nanos
      type: i64
      indexed: false
    - name: span_end_timestamp_nanos
      type: i64
      indexed: false
    - name: span_duration_secs
      type: i64
      indexed: false
    - name: span_attributes
      type: json
      tokenizer: raw
    - name: span_dropped_attributes_count
      type: u64
      indexed: false
    - name: span_dropped_events_count
      type: u64
      indexed: false
    - name: span_dropped_links_count
      type: u64
      indexed: false
    - name: span_status
      type: json
      indexed: false
    - name: parent_span_id
      type: bytes
    - name: events
      type: array<json>
      tokenizer: raw
    - name: links
      type: array<json>
      tokenizer: raw

  timestamp_field: span_start_timestamp_secs

  partition_key: service_name
  max_num_partitions: 100

indexing_settings:
  commit_timeout_secs: 30

search_settings:
  default_search_fields: []


================================================
FILE: config/tutorials/otel-traces/kafka-source.yaml
================================================
version: 0.8
source_id: kafka-source
source_type: kafka
input_format: otlp_traces_proto
params:
  topic: otlp_spans
  client_params:
    bootstrap.servers: localhost:9092


================================================
FILE: config/tutorials/stackoverflow/index-config.yaml
================================================
#
# Index config file for stackoverflow dataset.
#
version: 0.8

index_id: stackoverflow

doc_mapping:
  field_mappings:
    - name: title
      type: text
      tokenizer: default
      record: position
      stored: true
    - name: body
      type: text
      tokenizer: default
      record: position
      stored: true
    - name: creationDate
      type: datetime
      fast: true
      input_formats:
        - rfc3339
      fast_precision: seconds
  timestamp_field: creationDate

search_settings:
  default_search_fields: [title, body]

indexing_settings:
  commit_timeout_secs: 10


================================================
FILE: config/tutorials/stackoverflow/pulsar-source.yaml
================================================
version: 0.8
source_id: pulsar-source
source_type: pulsar
params:
  topics:
    - quickwit/pulsar/stackoverflow
  address: pulsar://localhost:6650


================================================
FILE: config/tutorials/stackoverflow/send_messages_to_pulsar.py
================================================
import json
import pulsar

client = pulsar.Client('pulsar://localhost:6650')
producer = client.create_producer('stackoverflow')

with open('stackoverflow.posts.transformed-10000.json', encoding='utf8') as file:
   for i, line in enumerate(file):
       producer.send(line.encode('utf-8'))
       if i % 100 == 0:
           print(f"{i}/10000 messages sent.", i)

client.close()


================================================
FILE: config/tutorials/vector-otel-logs/vector.toml
================================================
[sources.generate_syslog]
type = "demo_logs"
format = "syslog"
count = 100000
interval = 0.001

[transforms.remap_syslog]
inputs = [ "generate_syslog"]
type = "remap"
source = '''
  structured = parse_syslog!(.message)
  .timestamp_nanos, err = to_unix_timestamp(structured.timestamp, unit: "nanoseconds")
  .body = structured
  .service_name = structured.appname
  .resource_attributes.source_type = .source_type
  .resource_attributes.host.hostname = structured.hostname
  .resource_attributes.service.name = structured.appname
  .attributes.syslog.procid = structured.procid
  .attributes.syslog.facility = structured.facility
  .attributes.syslog.version = structured.version
  .severity_text = if includes(["emerg", "err", "crit", "alert"], structured.severity) {
    "ERROR"
  } else if structured.severity == "warning" {
    "WARN"
  } else if structured.severity == "debug" {
    "DEBUG"
  } else if includes(["info", "notice"], structured.severity) {
    "INFO"
  } else {
   structured.severity
  }
  .scope_name = structured.msgid
  del(.message)
  del(.timestamp)
  del(.source_type)
'''

[sinks.emit_syslog]
inputs = ["remap_syslog"]
type = "console"
encoding.codec = "json"

[sinks.quickwit_logs]
type = "http"
method = "post"
inputs = ["remap_syslog"]
encoding.codec = "json"
framing.method = "newline_delimited"
uri = "http://127.0.0.1:7280/api/v1/otel-logs-v0_7/ingest"


================================================
FILE: config/tutorials/wikipedia/index-config.yaml
================================================
#
# Index config file for wikipedia dataset.
#

version: 0.8

index_id: wikipedia

doc_mapping:
  field_mappings:
    - name: title
      type: text
      tokenizer: default
      record: position
      stored: true
      fieldnorms: true
    - name: body
      type: text
      tokenizer: default
      record: position
      stored: true
      fieldnorms: true
    - name: url
      type: text
      tokenizer: raw

search_settings:
  default_search_fields: [title, body]

indexing_settings:
  commit_timeout_secs: 10


================================================
FILE: config/tutorials/wikipedia/multilang-index-config.yaml
================================================
#
# Index config file for multilang wikipedia datasets.
#

version: 0.8

index_id: multilang-wikipedia

doc_mapping:
  tokenizers:
    - name: multilang
      type: multilang
  field_mappings:
    - name: title
      type: text
      tokenizer: multilang
      record: position
      stored: true
      fieldnorms: true
    - name: body
      type: text
      tokenizer: multilang
      record: position
      stored: true
      fieldnorms: true
    - name: url
      type: text
      tokenizer: raw

search_settings:
  default_search_fields: [title, body]

indexing_settings:
  commit_timeout_secs: 10


================================================
FILE: distribution/docker/ubuntu/Dockerfile
================================================
FROM ubuntu:noble@sha256:66460d557b25769b102175144d538d88219c077c678a49af4afca6fbfc1b5252 AS builder

RUN apt-get update && apt-get install -y curl
RUN curl -L https://install.quickwit.io | sh


FROM ubuntu:noble@sha256:66460d557b25769b102175144d538d88219c077c678a49af4afca6fbfc1b5252 AS quickwit

LABEL org.opencontainers.image.title="Quickwit"
LABEL maintainer="Quickwit, Inc. <hello@quickwit.io>"
LABEL org.opencontainers.image.vendor="Quickwit, Inc."
LABEL org.opencontainers.image.licenses="Apache-2.0"

RUN apt-get -y update \
    && apt-get -y install ca-certificates \
    libssl3 \
    && rm -rf /var/lib/apt/lists/*

WORKDIR /quickwit
RUN mkdir config qwdata
COPY --from=builder /quickwit-v*/quickwit /usr/local/bin/quickwit
COPY --from=builder /quickwit-v*/config/quickwit.yaml /quickwit/config/quickwit.yaml

ENV QW_CONFIG=/quickwit/config/quickwit.yaml
ENV QW_DATA_DIR=/quickwit/qwdata
ENV QW_LISTEN_ADDRESS=0.0.0.0

RUN quickwit --version

ENTRYPOINT ["quickwit"]


================================================
FILE: distribution/ecs/.gitignore
================================================
.terraform
terraform.tfstate*
.terraform.tfstate*
terraform.tfvars


================================================
FILE: distribution/ecs/README.md
================================================
# ECS deployment for quickwit

## Run Quickwit in your infrastructure

Create a Quickwit module using:

```terraform
module "quickwit" {
  source = "github.com/quickwit-oss/quickwit/distribution/ecs/quickwit"

  vpc_id                       =       # VPC in which all resources will be created
  subnet_ids                   = [...] # At least 2 private subnets must be specified
  quickwit_ingress_cidr_blocks = [...] # List of CIDR blocks allowed to access to the Quickwit API
}
```

The Quickwit cluster is running on a private subnet. For ECS to pull the image:
- if using the default Docker Hub image `quickwit/quickwit`, the subnets
specified must be configured with a NAT Gateway (no public IPs are attached to
the tasks)
- if using an image hosted on ECR, a VPC endpoint for ECR can be used instead of
a NAT Gateway


## Module configurations

To get the list of available configurations, check the `./quickwit/variables.tf`
file.

### Tips

Metastore database backups are disabled as restoring one would lead to
inconsistencies with the index store on S3. To ensure high availability, you
should enable `rds_config.multi_az` instead. To use your own Postgres database
instead of creating a new RDS instance, configure the
`external_postgres_uri_secret_arn` variable (e.g ARN of an SSM parameter with
the value `postgres://user:password@domain:port/db`).

Using NAT Gateways for the image registry is quite costly (approx. $0.05/hour/AZ). If
you are not already using NAT Gateways in the AZs where Quickwit will be
deployed, you should probably push the Quickwit image to ECR and use ECR
interface VPC endpoints instead (approx. ~$0.01/hour/AZ).

When using the default image, you will quickly run into the Docker Hub rate
limiting. We recommend pushing the Quickwit image to ECR and configure that as
`quickwit_image`. Note that the architecture of the image that you push to ECR
must match the `quickwit_cpu_architecture` variable (`ARM64` by default).

Sidecar container and custom logging configurations can be configured using the
variables `sidecar_container_definitions`, `sidecar_container_dependencies`,
`log_configuration`, `enable_cloudwatch_logging`. See [custom log
routing](https://docs.aws.amazon.com/AmazonECS/latest/developerguide/using_firelens.html).

You can use sidecars to inject additional secrets as files. This can be
useful for configuring sources such as Kafka. See `./example/kafka.tf` for an
example.

To access external AWS services like the Kinesis source, use the
`quickwit_indexer.extra_task_policy_arns` variable to attach the necessary
IAM policies to indexers.

## Running the example stack

We provide an example of self contained deployment with an ad-hoc VPC. 

> [!IMPORTANT]
> This stack costs ~$200/month to run (Fargate tasks, NAT Gateways
> and RDS)

### Deploy the Quickwit module and connect through a bastion

To make it easy to access your Quickwit cluster, the example stack includes
a bastion instance. Access is secured using an SSH key pair that you need to
provide (e.g generated with `ssh-keygen -t ed25519`).

In the `./example` directory, create a `terraform.tfvars` file with the public
key of your RSA key pair:

```terraform
bastion_public_key = "ssh-ed25519 ..."
```

> [!NOTE]
> You can skip the creation of the bastion by not specifying the
> `bastion_public_key` variable, but that would make it hard to access and
> experiment with the created Quickwit cluster.

In the same directory (`./example`) run:

```bash
terraform init
terraform apply
```

The successful `apply` command should output the IP of the bastion EC2 instance.
You can port forward Quickwit's search UI using:

```bash
ssh -N -L 7280:searcher.quickwit:7280 -i {your-private-key-file} ubuntu@{bastion_ip}
```

To ingest some example dataset, log into the bastion:

```bash
ssh -i {your-private-key-file} ubuntu@{bastion_ip}

# create the log index
wget https://raw.githubusercontent.com/quickwit-oss/quickwit/main/config/tutorials/hdfs-logs/index-config.yaml
curl -X POST \
  -H "content-type: application/yaml" \
  --data-binary @index-config.yaml \
  http://indexer.quickwit:7280/api/v1/indexes

# import some data
wget https://quickwit-datasets-public.s3.amazonaws.com/hdfs-logs-multitenants-10000.json
curl -X POST \
  -H "content-type: application/json" \
  --data-binary @hdfs-logs-multitenants-10000.json \
  http://indexer.quickwit:7280/api/v1/hdfs-logs/ingest?commit=force
```

If your SSH tunnel to the searcher is still running, you should be able to see
the ingested data in the UI.

### Setup an ECR repository to avoid throttling from Docker Hub

By default, the example stack uses Docker Hub to pull the Quickwit image. This
is convenient but it quickly runs into rate limiting. To avoid this, in the
`terraform.tfvars` file, set the `dockerhub_pull_through_creds_secret_arn` to a
AWS Secret with the following content:

```json
{"username":"...","accessToken":"..."}
```

This will:
- provision an ECR repository and a pull through cache rule
- configure the Quickwit module to use that repository


================================================
FILE: distribution/ecs/example/.terraform.lock.hcl
================================================
# This file is maintained automatically by "terraform init".
# Manual edits may be lost in future updates.

provider "registry.terraform.io/hashicorp/aws" {
  version     = "5.39.1"
  constraints = ">= 4.66.1, >= 5.36.0, ~> 5.39.1"
  hashes = [
    "h1:hQLlAd6O1LdQHy1GdWtgT5fcOlc3TWW+SaaFkpe+e8E=",
    "zh:05c50a5d8edb3ba4ebc4eb6e0d0b5e319142f5983b27821710ed7d475d335bdc",
    "zh:082986a5784dd21957e632371b289e549f051a4ea21d5c78c6d744c3537f03c5",
    "zh:192ae622ba562eacc4921ed549a794506179233d724fdd15a4f147f3400724a0",
    "zh:19a1d4637a62de90b0da174c0bf01000cd900488f7e8f709d8a37f082c59756b",
    "zh:1d7689a8583515f1705972d7ce57ccfab96215b19905530d2c78c02dcfaff583",
    "zh:22c446a21209a52ab74b4ba1ede0b220531e97ce479430047e493a2c45e1d8cb",
    "zh:4154de82290ab4e9f81bac1ea62342de8b3b7a608f99258c190d4dd1c6663e47",
    "zh:6bc4859ccdc54f28af9286b2fa090a31dcb345138d68c471510b737f6a052011",
    "zh:73c69e000e0b321e78a4a12fef60d37285f2afec0ea7be9e06163d985101cb59",
    "zh:890a3422f5e445b49bae30facf448d0ec9cd647e9155d0b685b5b39e9d331a94",
    "zh:9b12af85486a96aedd8d7984b0ff811a4b42e3d88dad1a3fb4c0b580d04fa425",
    "zh:9cd88bec0f5205df9032e3126d4e57edd1c5cc8d45cda25626882dafc485a3b0",
    "zh:a3a8e3276d0fbf051bbafa192a2998b05745f2cf285ac8c36a9ad167a75c037f",
    "zh:d47e4dcf4c0ad71b9a7c720be4f3a89f6786a82e77bbe8d950794562792a1da5",
    "zh:f74e5b2af508c7de80a6ae5198df54a795eeba5058a0cd247828943f0c54f6e0",
  ]
}

provider "registry.terraform.io/hashicorp/random" {
  version     = "3.6.0"
  constraints = ">= 3.1.0"
  hashes = [
    "h1:R5Ucn26riKIEijcsiOMBR3uOAjuOMfI1x7XvH4P6B1w=",
    "zh:03360ed3ecd31e8c5dac9c95fe0858be50f3e9a0d0c654b5e504109c2159287d",
    "zh:1c67ac51254ba2a2bb53a25e8ae7e4d076103483f55f39b426ec55e47d1fe211",
    "zh:24a17bba7f6d679538ff51b3a2f378cedadede97af8a1db7dad4fd8d6d50f829",
    "zh:30ffb297ffd1633175d6545d37c2217e2cef9545a6e03946e514c59c0859b77d",
    "zh:454ce4b3dbc73e6775f2f6605d45cee6e16c3872a2e66a2c97993d6e5cbd7055",
    "zh:78d5eefdd9e494defcb3c68d282b8f96630502cac21d1ea161f53cfe9bb483b3",
    "zh:91df0a9fab329aff2ff4cf26797592eb7a3a90b4a0c04d64ce186654e0cc6e17",
    "zh:aa57384b85622a9f7bfb5d4512ca88e61f22a9cea9f30febaa4c98c68ff0dc21",
    "zh:c4a3e329ba786ffb6f2b694e1fd41d413a7010f3a53c20b432325a94fa71e839",
    "zh:e2699bc9116447f96c53d55f2a00570f982e6f9935038c3810603572693712d0",
    "zh:e747c0fd5d7684e5bfad8aa0ca441903f15ae7a98a737ff6aca24ba223207e2c",
    "zh:f1ca75f417ce490368f047b63ec09fd003711ae48487fba90b4aba2ccf71920e",
  ]
}


================================================
FILE: distribution/ecs/example/bastion.tf
================================================
variable "bastion_public_key" {
  description = "The public key used to connect to the bastion host. If empty, no bastion is created."
  default     = ""
}

output "bastion_ip" {
  value = var.bastion_public_key != "" ? aws_instance.bastion[0].public_ip : null
}

data "aws_ami" "ubuntu" {
  most_recent = true

  filter {
    name   = "name"
    values = ["ubuntu/images/hvm-ssd/ubuntu-jammy-22.04-amd64-server-*"]
  }

  filter {
    name   = "virtualization-type"
    values = ["hvm"]
  }

  owners = ["099720109477"] # Canonical
}

resource "aws_security_group" "allow_ssh" {
  count       = var.bastion_public_key != "" ? 1 : 0
  name        = "qw_ecs_bastion_allow_ssh"
  description = "Allow SSH inbound traffic from everywhere"
  vpc_id      = module.vpc.vpc_id

  ingress {
    from_port   = 22
    to_port     = 22
    protocol    = "tcp"
    cidr_blocks = ["0.0.0.0/0"]
  }

  egress {
    from_port   = 0
    to_port     = 0
    protocol    = "-1"
    cidr_blocks = ["0.0.0.0/0"]
  }
}

resource "aws_instance" "bastion" {
  count                       = var.bastion_public_key != "" ? 1 : 0
  ami                         = data.aws_ami.ubuntu.id
  instance_type               = "t3.nano"
  key_name                    = aws_key_pair.bastion_key[0].key_name
  subnet_id                   = module.vpc.public_subnets[0]
  associate_public_ip_address = true
  vpc_security_group_ids      = [aws_security_group.allow_ssh[0].id]

  tags = {
    Name = "quickwit-ecs-bastion"
  }
}

resource "aws_key_pair" "bastion_key" {
  count      = var.bastion_public_key != "" ? 1 : 0
  key_name   = "quickwit-ecs-bastion-key"
  public_key = var.bastion_public_key
}


================================================
FILE: distribution/ecs/example/image.tf
================================================
variable "dockerhub_pull_through_creds_secret_arn" {
  description = "If left empty, image is pulled directly from Docker Hub, which might be throttled."
  default     = ""
}

locals {
  ecr_repository_prefix = "quickwit-ecs-example"
}

# This repo is populated by the pull through cache below
resource "aws_ecr_repository" "quickwit" {
  count                = var.dockerhub_pull_through_creds_secret_arn == "" ? 0 : 1
  name                 = "${local.ecr_repository_prefix}/quickwit/quickwit"
  image_tag_mutability = "MUTABLE"
  force_delete         = true
  image_scanning_configuration {
    scan_on_push = false
  }
}

resource "aws_ecr_pull_through_cache_rule" "docker_hub" {
  count                 = var.dockerhub_pull_through_creds_secret_arn == "" ? 0 : 1
  ecr_repository_prefix = local.ecr_repository_prefix
  upstream_registry_url = "registry-1.docker.io"
  credential_arn        = var.dockerhub_pull_through_creds_secret_arn
}


locals {
  ecr_domain     = "${data.aws_caller_identity.current.account_id}.dkr.ecr.${data.aws_region.current.name}.amazonaws.com"
  image_prefix   = var.dockerhub_pull_through_creds_secret_arn == "" ? "" : "${local.ecr_domain}/${local.ecr_repository_prefix}/"
  quickwit_image = "${local.image_prefix}quickwit/quickwit"
}


================================================
FILE: distribution/ecs/example/kafka.tf
================================================
# Example configuration for injecting SSL keys for securing a Kafka connection
# You can then create a secured Kafka source along these lines:
# 
# version: 0.8
# source_id: kafka-source
# source_type: kafka
# num_pipelines: 2
# params:
#   topic: your-topic
#   client_params:
#     bootstrap.servers: "your-kafka-broker.com"
#     security.protocol: "SSL"
#     ssl.ca.location: "/quickwit/keys/ca.pem"
#     ssl.certificate.location: "/quickwit/keys/service.cert"
#     ssl.key.location: "/quickwit/keys/service.key"


locals {
  ca_pem       = "echo \"$CA_PEM\" > /quickwit/cfg/ca.pem"
  service_cert = "echo \"$SERVICE_CERT\" > /quickwit/cfg/service.cert"
  service_key  = "echo \"$SERVICE_KEY\" > /quickwit/cfg/service.key"
  example_kafka_sidecar_container_definitions = {
    kafka_key_init = {
      name                      = "kafka_key_init"
      essential                 = false
      image                     = "busybox"
      command                   = ["sh", "-c", "${local.ca_pem} && ${local.service_cert} && ${local.service_key}"]
      enable_cloudwatch_logging = true
      mount_points = [
        {
          sourceVolume  = "quickwit-keys"
          containerPath = "/quickwit/keys"
        }
      ]
      secrets = [
        {
          name      = "CA_PEM"
          valueFrom = "arn:aws:secretsmanager:eu-west-1:123456789:secret:your_kafka_ca_pem"
        },
        {
          name      = "SERVICE_CERT"
          valueFrom = "arn:aws:secretsmanager:eu-west-1:123456789:secret:your_kafka_service_cert"
        },
        {
          name      = "SERVICE_KEY"
          valueFrom = "arn:aws:secretsmanager:eu-west-1:123456789:secret:your_kafka_service_key"
        }
      ]
    }
  }

  example_kafka_sidecar_container_dependencies = [
    {
      condition     = "SUCCESS"
      containerName = "kafka_key_init"
    }
  ]
}


================================================
FILE: distribution/ecs/example/terraform.tf
================================================
terraform {
  backend "local" {}
  required_providers {
    aws = {
      source  = "hashicorp/aws"
      version = "~> 5.39.1"
    }
  }
}

provider "aws" {
  region = "eu-west-1"
  default_tags {
    tags = {
      provisioner = "terraform"
    }
  }
}

data "aws_region" "current" {}

data "aws_caller_identity" "current" {}

module "quickwit" {
  source                       = "../quickwit"
  vpc_id                       = module.vpc.vpc_id
  subnet_ids                   = module.vpc.private_subnets
  quickwit_ingress_cidr_blocks = [module.vpc.vpc_cidr_block]

  ## Optional configurations:

  # - ECR if you provide the `dockerhub_pull_through_creds_secret_arn` variable
  # - Docker Hub otherwise (subject to throttling)
  quickwit_image = "${local.quickwit_image}:latest"

  # quickwit_index_s3_prefix  = "my-bucket/my-prefix"
  # quickwit_domain           = "quickwit"
  # quickwit_cpu_architecture = "ARM64"

  # quickwit_indexer = {
  #   desired_count         = 3
  #   memory                = 8192
  #   cpu                   = 4096
  #   ephemeral_storage_gib = 50
  #   extra_task_policy_arns = ["arn:aws:iam::aws:policy/AmazonKinesisFullAccess"]
  # }

  # quickwit_metastore = {
  #   desired_count = 1
  #   memory        = 512
  #   cpu           = 256
  # }

  # quickwit_searcher = {
  #   desired_count         = 1
  #   memory                = 2048
  #   cpu                   = 1024
  # }

  # quickwit_control_plane = {
  #   memory = 512
  #   cpu    = 256
  # }

  # quickwit_janitor = {
  #   memory = 512
  #   cpu    = 256
  # }

  # rds_config = {
  #   instance_class = "db.t4g.micro"
  #   multi_az       = false
  # }

  # external_postgres_uri_secret_arn = aws_ssm_parameter.postgres_uri.arn

  ## Example logging configuration 
  # sidecar_container_definitions  = {
  #   my_sidecar_container = see http://docs.aws.amazon.com/AmazonECS/latest/APIReference/API_ContainerDefinition.html
  # }
  # sidecar_container_dependencies = [{condition = "START", containerName = "my_sidecar_container"}]
  # log_configuration              = see https://registry.terraform.io/providers/hashicorp/aws/latest/docs/resources/ecs_service#log_configuration
  # enable_cloudwatch_logging      = false

  ## Example Kafka key injection (see kafka.tf)
  # sidecar_container_definitions  = local.example_kafka_sidecar_container_definitions
  # sidecar_container_dependencies = local.example_kafka_sidecar_container_dependencies
}


output "indexer_service_name" {
  value = module.quickwit.indexer_service_name
}

output "searcher_service_name" {
  value = module.quickwit.searcher_service_name
}


================================================
FILE: distribution/ecs/example/vpc.tf
================================================
module "vpc" {
  source  = "terraform-aws-modules/vpc/aws"
  version = "5.5.3"

  name = "quickwit-ecs"
  cidr = "10.0.0.0/16"

  azs             = ["${data.aws_region.current.name}a", "${data.aws_region.current.name}b"]
  private_subnets = ["10.0.1.0/24", "10.0.2.0/24"]
  public_subnets  = ["10.0.101.0/24", "10.0.102.0/24"]

  enable_nat_gateway = true
}


================================================
FILE: distribution/ecs/quickwit/cluster.tf
================================================
module "ecs_cluster" {
  source  = "terraform-aws-modules/ecs/aws//modules/cluster"
  version = "5.9.3"

  cluster_name = "quickwit-${local.module_id}"
}

resource "aws_service_discovery_private_dns_namespace" "quickwit_internal" {
  name        = var.quickwit_domain
  description = "Internal quickwit domain"
  vpc         = var.vpc_id
}

resource "aws_security_group" "quickwit_cluster_member_sg" {
  name        = "quickwit-cluster-member-${local.module_id}"
  description = "Security group for members of the Quickwit cluster"
  vpc_id      = var.vpc_id
}


================================================
FILE: distribution/ecs/quickwit/configs.tf
================================================
locals {
  quickwit_peer_list = [
    "${aws_service_discovery_service.metastore.name}.${aws_service_discovery_private_dns_namespace.quickwit_internal.name}",
    "${aws_service_discovery_service.control_plane.name}.${aws_service_discovery_private_dns_namespace.quickwit_internal.name}",
    "${aws_service_discovery_service.janitor.name}.${aws_service_discovery_private_dns_namespace.quickwit_internal.name}",
    "${aws_service_discovery_service.indexer.name}.${aws_service_discovery_private_dns_namespace.quickwit_internal.name}",
    "${aws_service_discovery_service.searcher.name}.${aws_service_discovery_private_dns_namespace.quickwit_internal.name}",
  ]

  # id to avoid conflicts when deploying this module multiple times (random by default)
  module_id = var.module_id == "" ? random_id.module.hex : var.module_id
  s3_id     = var.module_id == "" ? random_id.module.hex : "${var.module_id}-${random_id.module.hex}"

  quickwit_index_s3_prefix = var.quickwit_index_s3_prefix == "" ? aws_s3_bucket.index[0].id : var.quickwit_index_s3_prefix

  use_external_rds        = var.external_postgres_uri_secret_arn != ""
  postgres_uri_secret_arn = var.external_postgres_uri_secret_arn != "" ? var.external_postgres_uri_secret_arn : aws_ssm_parameter.postgres_credential[0].arn
}

resource "random_id" "module" {
  byte_length = 3
}


================================================
FILE: distribution/ecs/quickwit/iam.tf
================================================
data "aws_iam_policy_document" "quickwit_task_permission" {
  # Reference: https://quickwit.io/docs/guides/aws-setup#amazon-s3
  statement {
    actions = [
      "s3:ListBucket",
      "s3:GetObject",
      "s3:PutObject",
      "s3:DeleteObject"
    ]

    resources = [
      "arn:aws:s3:::${local.quickwit_index_s3_prefix}*",
    ]
  }
}

resource "aws_iam_policy" "quickwit_task_permission" {
  name = "quickwit-task-policy-${local.module_id}"
  path = "/"

  policy = data.aws_iam_policy_document.quickwit_task_permission.json
}

data "aws_iam_policy_document" "quickwit_task_execution_permission" {
  statement {
    actions = [
      "logs:PutLogEvents",
      "logs:CreateLogStream"
    ]

    resources = ["*"]
  }
  statement {
    actions = [
      "ecr:GetDownloadUrlForLayer",
      "ecr:GetAuthorizationToken",
      "ecr:BatchGetImage",
      "ecr:BatchCheckLayerAvailability",
      "ecr:CreateRepository",
      "ecr:BatchImportUpstreamImage"
    ]

    resources = ["*"]
  }

  statement {
    actions = ["ssm:GetParameters"]

    resources = [local.postgres_uri_secret_arn]
  }

  statement {
    actions = ["secretsmanager:GetSecretValue"]

    resources = ["arn:aws:secretsmanager:*:*:secret:*"]
  }

}

resource "aws_iam_policy" "quickwit_task_execution_permission" {
  name = "quickwit-task-execution-policy-${local.module_id}"
  path = "/"

  policy = data.aws_iam_policy_document.quickwit_task_execution_permission.json
}


================================================
FILE: distribution/ecs/quickwit/outputs.tf
================================================
output "indexer_service_name" {
  value = "${aws_service_discovery_service.indexer.name}.${aws_service_discovery_private_dns_namespace.quickwit_internal.name}"
}

output "searcher_service_name" {
  value = "${aws_service_discovery_service.searcher.name}.${aws_service_discovery_private_dns_namespace.quickwit_internal.name}"
}

output "janitor_service_name" {
  value = "${aws_service_discovery_service.janitor.name}.${aws_service_discovery_private_dns_namespace.quickwit_internal.name}"
}

output "control_plane_service_name" {
  value = "${aws_service_discovery_service.control_plane.name}.${aws_service_discovery_private_dns_namespace.quickwit_internal.name}"
}

output "metastore_service_name" {
  value = "${aws_service_discovery_service.metastore.name}.${aws_service_discovery_private_dns_namespace.quickwit_internal.name}"
}


================================================
FILE: distribution/ecs/quickwit/quickwit-control-plane.tf
================================================
module "quickwit_control_plane" {
  source                         = "./service"
  service_name                   = "control_plane"
  service_discovery_registry_arn = aws_service_discovery_service.control_plane.arn
  cluster_arn                    = module.ecs_cluster.arn
  postgres_uri_secret_arn        = local.postgres_uri_secret_arn
  quickwit_peer_list             = local.quickwit_peer_list
  s3_access_policy_arn           = aws_iam_policy.quickwit_task_permission.arn
  task_execution_policy_arn      = aws_iam_policy.quickwit_task_execution_permission.arn
  module_id                      = local.module_id
  quickwit_cluster_member_sg_id  = aws_security_group.quickwit_cluster_member_sg.id

  subnet_ids                     = var.subnet_ids
  ingress_cidr_blocks            = var.quickwit_ingress_cidr_blocks
  quickwit_image                 = var.quickwit_image
  quickwit_cpu_architecture      = var.quickwit_cpu_architecture
  sidecar_container_definitions  = var.sidecar_container_definitions
  sidecar_container_dependencies = var.sidecar_container_dependencies
  log_configuration              = var.log_configuration
  enable_cloudwatch_logging      = var.enable_cloudwatch_logging
  service_config                 = var.quickwit_control_plane
  quickwit_index_s3_prefix       = local.quickwit_index_s3_prefix
}

resource "aws_service_discovery_service" "control_plane" {
  name = "control-plane"

  dns_config {
    namespace_id = aws_service_discovery_private_dns_namespace.quickwit_internal.id

    dns_records {
      ttl  = 10
      type = "A"
    }

    routing_policy = "MULTIVALUE"
  }
}


================================================
FILE: distribution/ecs/quickwit/quickwit-indexer.tf
================================================
module "quickwit_indexer" {
  source                         = "./service"
  service_name                   = "indexer"
  service_discovery_registry_arn = aws_service_discovery_service.indexer.arn
  cluster_arn                    = module.ecs_cluster.arn
  postgres_uri_secret_arn        = local.postgres_uri_secret_arn
  quickwit_peer_list             = local.quickwit_peer_list
  s3_access_policy_arn           = aws_iam_policy.quickwit_task_permission.arn
  task_execution_policy_arn      = aws_iam_policy.quickwit_task_execution_permission.arn
  module_id                      = local.module_id
  quickwit_cluster_member_sg_id  = aws_security_group.quickwit_cluster_member_sg.id

  subnet_ids                     = var.subnet_ids
  ingress_cidr_blocks            = var.quickwit_ingress_cidr_blocks
  quickwit_image                 = var.quickwit_image
  quickwit_cpu_architecture      = var.quickwit_cpu_architecture
  sidecar_container_definitions  = var.sidecar_container_definitions
  sidecar_container_dependencies = var.sidecar_container_dependencies
  log_configuration              = var.log_configuration
  enable_cloudwatch_logging      = var.enable_cloudwatch_logging
  service_config                 = var.quickwit_indexer
  quickwit_index_s3_prefix       = local.quickwit_index_s3_prefix
  # Longer termination grace period for indexers because we are waiting for the
  # data persisted in the ingesters to be indexed and committed. Should be
  # larger than the largest commit timeout.
  stop_timeout = 120
}

resource "aws_service_discovery_service" "indexer" {
  name = "indexer"

  dns_config {
    namespace_id = aws_service_discovery_private_dns_namespace.quickwit_internal.id

    dns_records {
      ttl  = 10
      type = "A"
    }

    routing_policy = "MULTIVALUE"
  }
}


================================================
FILE: distribution/ecs/quickwit/quickwit-janitor.tf
================================================
module "quickwit_janitor" {
  source                         = "./service"
  service_name                   = "janitor"
  service_discovery_registry_arn = aws_service_discovery_service.janitor.arn
  cluster_arn                    = module.ecs_cluster.arn
  postgres_uri_secret_arn        = local.postgres_uri_secret_arn
  quickwit_peer_list             = local.quickwit_peer_list
  s3_access_policy_arn           = aws_iam_policy.quickwit_task_permission.arn
  task_execution_policy_arn      = aws_iam_policy.quickwit_task_execution_permission.arn
  module_id                      = local.module_id
  quickwit_cluster_member_sg_id  = aws_security_group.quickwit_cluster_member_sg.id

  subnet_ids                     = var.subnet_ids
  ingress_cidr_blocks            = var.quickwit_ingress_cidr_blocks
  quickwit_image                 = var.quickwit_image
  quickwit_cpu_architecture      = var.quickwit_cpu_architecture
  sidecar_container_definitions  = var.sidecar_container_definitions
  sidecar_container_dependencies = var.sidecar_container_dependencies
  log_configuration              = var.log_configuration
  enable_cloudwatch_logging      = var.enable_cloudwatch_logging
  service_config                 = var.quickwit_janitor
  quickwit_index_s3_prefix       = local.quickwit_index_s3_prefix
}

resource "aws_service_discovery_service" "janitor" {
  name = "janitor"

  dns_config {
    namespace_id = aws_service_discovery_private_dns_namespace.quickwit_internal.id

    dns_records {
      ttl  = 10
      type = "A"
    }

    routing_policy = "MULTIVALUE"
  }
}


================================================
FILE: distribution/ecs/quickwit/quickwit-metastore.tf
================================================
module "quickwit_metastore" {
  source                         = "./service"
  service_name                   = "metastore"
  service_discovery_registry_arn = aws_service_discovery_service.metastore.arn
  cluster_arn                    = module.ecs_cluster.arn
  postgres_uri_secret_arn        = local.postgres_uri_secret_arn
  quickwit_peer_list             = local.quickwit_peer_list
  s3_access_policy_arn           = aws_iam_policy.quickwit_task_permission.arn
  task_execution_policy_arn      = aws_iam_policy.quickwit_task_execution_permission.arn
  module_id                      = local.module_id
  quickwit_cluster_member_sg_id  = aws_security_group.quickwit_cluster_member_sg.id

  subnet_ids                     = var.subnet_ids
  ingress_cidr_blocks            = var.quickwit_ingress_cidr_blocks
  quickwit_image                 = var.quickwit_image
  quickwit_cpu_architecture      = var.quickwit_cpu_architecture
  sidecar_container_definitions  = var.sidecar_container_definitions
  sidecar_container_dependencies = var.sidecar_container_dependencies
  log_configuration              = var.log_configuration
  enable_cloudwatch_logging      = var.enable_cloudwatch_logging
  service_config                 = var.quickwit_metastore
  quickwit_index_s3_prefix       = local.quickwit_index_s3_prefix
}

resource "aws_service_discovery_service" "metastore" {
  name = "metastore"

  dns_config {
    namespace_id = aws_service_discovery_private_dns_namespace.quickwit_internal.id

    dns_records {
      ttl  = 10
      type = "A"
    }

    routing_policy = "MULTIVALUE"
  }
}


================================================
FILE: distribution/ecs/quickwit/quickwit-searcher.tf
================================================
module "quickwit_searcher" {
  source                         = "./service"
  service_name                   = "searcher"
  service_discovery_registry_arn = aws_service_discovery_service.searcher.arn
  cluster_arn                    = module.ecs_cluster.arn
  postgres_uri_secret_arn        = local.postgres_uri_secret_arn
  quickwit_peer_list             = local.quickwit_peer_list
  s3_access_policy_arn           = aws_iam_policy.quickwit_task_permission.arn
  task_execution_policy_arn      = aws_iam_policy.quickwit_task_execution_permission.arn
  module_id                      = local.module_id
  quickwit_cluster_member_sg_id  = aws_security_group.quickwit_cluster_member_sg.id

  subnet_ids                     = var.subnet_ids
  ingress_cidr_blocks            = var.quickwit_ingress_cidr_blocks
  quickwit_image                 = var.quickwit_image
  quickwit_cpu_architecture      = var.quickwit_cpu_architecture
  sidecar_container_definitions  = var.sidecar_container_definitions
  sidecar_container_dependencies = var.sidecar_container_dependencies
  log_configuration              = var.log_configuration
  enable_cloudwatch_logging      = var.enable_cloudwatch_logging
  service_config                 = var.quickwit_searcher
  quickwit_index_s3_prefix       = local.quickwit_index_s3_prefix
}

resource "aws_service_discovery_service" "searcher" {
  name = "searcher"

  dns_config {
    namespace_id = aws_service_discovery_private_dns_namespace.quickwit_internal.id

    dns_records {
      ttl  = 10
      type = "A"
    }

    routing_policy = "MULTIVALUE"
  }
}


================================================
FILE: distribution/ecs/quickwit/rds.tf
================================================
resource "random_password" "quickwit_db" {
  count   = local.use_external_rds ? 0 : 1
  length  = 64
  special = false
}

module "quickwit_db" {
  count   = local.use_external_rds ? 0 : 1
  source  = "terraform-aws-modules/rds/aws"
  version = "6.5.2"

  identifier = "quickwit-metastore-${local.module_id}"

  engine               = "postgres"
  engine_version       = "16"
  family               = "postgres16" # DB parameter group
  major_engine_version = "16"         # DB option group

  instance_class    = var.rds_config.instance_class
  multi_az          = var.rds_config.multi_az
  allocated_storage = 5

  db_name  = "quickwit"
  username = "quickwit"
  password = random_password.quickwit_db[0].result

  port                                = "5432"
  publicly_accessible                 = false
  manage_master_user_password         = false
  iam_database_authentication_enabled = true
  vpc_security_group_ids              = [aws_security_group.quickwit_db[0].id]
  db_subnet_group_name                = aws_db_subnet_group.quickwit[0].name

  maintenance_window = "Mon:00:00-Mon:03:00"

  create_monitoring_role = true
  monitoring_interval    = "30"
  monitoring_role_name   = "RDSQuickwitMonitoringRole-${local.module_id}"

  deletion_protection = false
  skip_final_snapshot = true
}

resource "aws_security_group" "quickwit_db" {
  count       = local.use_external_rds ? 0 : 1
  name        = "quickwit-db-${local.module_id}"
  description = "Security group for the Quickwit Metastore DB"
  vpc_id      = var.vpc_id

  ingress {
    description     = "Connection from explicitly allowed resources"
    from_port       = 5432
    to_port         = 5432
    protocol        = "tcp"
    security_groups = [aws_security_group.quickwit_cluster_member_sg.id]
  }
}

resource "aws_db_subnet_group" "quickwit" {
  count       = local.use_external_rds ? 0 : 1
  name        = "quickwit-${local.module_id}"
  description = "Quickwit metastore"
  subnet_ids  = var.subnet_ids
}

resource "aws_ssm_parameter" "postgres_credential" {
  count = local.use_external_rds ? 0 : 1
  name  = "/quickwit/${local.module_id}/postgres"
  type  = "SecureString"
  value = "postgres://${module.quickwit_db[0].db_instance_username}:${random_password.quickwit_db[0].result}@${module.quickwit_db[0].db_instance_address}:${module.quickwit_db[0].db_instance_port}/${module.quickwit_db[0].db_instance_name}"
}


================================================
FILE: distribution/ecs/quickwit/s3.tf
================================================
data "aws_caller_identity" "current" {}

resource "aws_s3_bucket" "index" {
  count         = var.quickwit_index_s3_prefix == "" ? 1 : 0
  bucket        = "quickwit-ecs-index-${data.aws_caller_identity.current.account_id}-${local.s3_id}"
  force_destroy = true
}


================================================
FILE: distribution/ecs/quickwit/service/config.tf
================================================
locals {
  quickwit_data_dir = "/quickwit/qwdata"

  quickwit_common_environment = [
    {
      name  = "QW_ENABLED_SERVICES"
      value = var.service_name
    },
    {
      name  = "QW_PEER_SEEDS"
      value = join(",", var.quickwit_peer_list)
    },
    {
      name  = "NO_COLOR"
      value = "true"
    },
    {
      name  = "QW_CLUSTER_ID"
      value = "ecs-${var.module_id}"
    },
    {
      name  = "QW_LISTEN_ADDRESS"
      value = "0.0.0.0"
    },
    {
      name  = "QW_DATA_DIR"
      value = local.quickwit_data_dir
    },
    {
      name  = "QW_DEFAULT_INDEX_ROOT_URI"
      value = "s3://${var.quickwit_index_s3_prefix}"
    },
  ]

  nb_extra_policies             = length(var.service_config.extra_task_policy_arns)
  extra_tasks_iam_role_policies = { for i in range(local.nb_extra_policies) : "extra_policy_${i}" => var.service_config.extra_task_policy_arns[i] }
  tasks_iam_role_policies       = merge({ s3_access = var.s3_access_policy_arn }, local.extra_tasks_iam_role_policies)
}


================================================
FILE: distribution/ecs/quickwit/service/ecs.tf
================================================
module "quickwit_service" {
  source  = "terraform-aws-modules/ecs/aws//modules/service"
  version = "5.9.3"

  name        = "quickwit-${var.service_name}-${var.module_id}"
  cluster_arn = var.cluster_arn

  cpu    = var.service_config.cpu
  memory = var.service_config.memory
  ephemeral_storage = {
    size_in_gib = var.service_config.ephemeral_storage_gib
  }

  container_definitions = merge(var.sidecar_container_definitions, {
    quickwit = {
      cpu    = var.service_config.cpu
      memory = var.service_config.memory

      essential                 = true
      image                     = var.quickwit_image
      enable_cloudwatch_logging = var.enable_cloudwatch_logging

      command = ["run"]

      environment = local.quickwit_common_environment

      secrets = [
        {
          name      = "QW_METASTORE_URI"
          valueFrom = var.postgres_uri_secret_arn
        }
      ]

      port_mappings = [
        {
          name          = "rest"
          containerPort = 7280
          protocol      = "tcp"
        },
        {
          name          = "grpc"
          containerPort = 7281
          protocol      = "tcp"
        },
        {
          name          = "gossip"
          containerPort = 7280
          protocol      = "udp"
        }
      ]

      log_configuration = var.log_configuration

      mount_points = [
        {
          sourceVolume  = "quickwit-data-vol"
          containerPath = local.quickwit_data_dir
        },
        # A volume that can be used to inject secrets as files.
        {
          sourceVolume  = "quickwit-keys"
          containerPath = "/quickwit/keys"
        }
      ]

      stopTimeout = var.stop_timeout

      dependencies = var.sidecar_container_dependencies
    }
  })

  requires_compatibilities = ["FARGATE"]
  runtime_platform = {
    operating_system_family = "LINUX"
    cpu_architecture        = var.quickwit_cpu_architecture
  }

  service_registries = {
    registry_arn   = var.service_discovery_registry_arn
    container_name = "quickwit"
  }

  subnet_ids = var.subnet_ids
  security_group_rules = {
    ingress_internal = {
      type      = "ingress"
      from_port = 7280
      to_port   = 7281
      protocol  = "-1"

      source_security_group_id = var.quickwit_cluster_member_sg_id
    }
    ingress_external = {
      type      = "ingress"
      from_port = 7280
      to_port   = 7281
      protocol  = "-1"

      cidr_blocks = var.ingress_cidr_blocks
    }
    egress_all = {
      type      = "egress"
      from_port = 0
      to_port   = 0
      protocol  = "-1"

      cidr_blocks = ["0.0.0.0/0"]
    }
  }
  security_group_ids = [var.quickwit_cluster_member_sg_id]

  enable_autoscaling = false
  desired_count      = var.service_config.desired_count

  volume = [
    {
      name = "quickwit-data-vol"
    },
    {
      name = "quickwit-keys"
    }
  ]

  tasks_iam_role_policies = local.tasks_iam_role_policies

  task_exec_iam_role_policies = {
    policy = var.task_execution_policy_arn
  }

}


================================================
FILE: distribution/ecs/quickwit/service/variables.tf
================================================
variable "service_name" {
  description = "One of indexer, metastore, searcher, control_plane, janitor"
}

variable "service_discovery_registry_arn" {}

variable "sidecar_container_definitions" {}

variable "sidecar_container_dependencies" {
  type = list(object({
    containerName = string
    condition     = string
  }))
  default = []
}

variable "log_configuration" {}

variable "enable_cloudwatch_logging" {
  type = bool
}

variable "cluster_arn" {}

variable "ingress_cidr_blocks" {
  type = list(string)
}

variable "quickwit_cluster_member_sg_id" {}

variable "subnet_ids" {
  type = list(string)
}

variable "postgres_uri_secret_arn" {
  description = "ARN of the SSM parameter or Secret Manager secret containing the URI of a Postgres instance"
}

variable "quickwit_image" {}

variable "service_config" {
  type = object({
    desired_count          = optional(number, 1)
    memory                 = number
    cpu                    = number
    ephemeral_storage_gib  = optional(number, 21)
    extra_task_policy_arns = optional(list(string), [])
  })
}

variable "quickwit_index_s3_prefix" {}

variable "quickwit_peer_list" {
  type = list(string)
}

variable "s3_access_policy_arn" {}

variable "task_execution_policy_arn" {}

variable "quickwit_cpu_architecture" {}

variable "module_id" {}

variable "stop_timeout" {
  # between 1s and 120s on Fargate, 30s is the ECS default
  default = 30
}


================================================
FILE: distribution/ecs/quickwit/variables.tf
================================================
## REQUIRED VARIABLES

variable "vpc_id" {
  description = "VPC ID of the cluster"
}

variable "subnet_ids" {
  description = "Subnet(s) where quickwit will be deployed"
  type        = list(string)
}


## OPTIONAL VARIABLES

variable "module_id" {
  description = "Identifier for the module, e.g the stage. If not specified, a random string is generated."
  default     = ""
}

variable "quickwit_ingress_cidr_blocks" {
  description = "CIDR blocks (private) that should have access to the Quickwit cluster"
  type        = list(string)
  default     = []
}


variable "quickwit_index_s3_prefix" {
  description = "S3 bucket name and prefix for the Quickwit data, e.g. my-bucket-name/my-prefix. Quickwit will only have access to this S3 location. Leave empty to create a new bucket."
  default     = ""
}

variable "quickwit_domain" {
  description = "Local domain for quickwit service discovery"
  default     = "quickwit"
}

variable "quickwit_image" {
  description = "Quickwit docker image"
  default     = "quickwit/quickwit:latest"
}

variable "quickwit_cpu_architecture" {
  description = "One of X86_64 / ARM64. Must match the arch of the provided image (var.quickwit_image)."
  default     = "ARM64"
}

variable "sidecar_container_definitions" {
  description = "Sidecar containers to be attached to Quickwit tasks"
  default     = {}
}

variable "sidecar_container_dependencies" {
  description = "Specify the Quickwit container's dependencies on sidecars"
  type = list(object({
    containerName = string
    condition     = string
  }))
  default = []
}

variable "enable_cloudwatch_logging" {
  description = "Cloudwatch logging for Quickwit tasks. Usually disabled when using a custom log configuration."
  default     = true
}

variable "log_configuration" {
  description = "Custom log configuration for Quickwit tasks"
  default     = {}
}

variable "quickwit_indexer" {
  description = "Indexer service sizing configurations"
  type = object({
    desired_count          = optional(number, 1)
    memory                 = optional(number, 8192)
    cpu                    = optional(number, 2048)
    ephemeral_storage_gib  = optional(number, 21)
    extra_task_policy_arns = optional(list(string), [])
  })
  default = {}
}

variable "quickwit_metastore" {
  description = "Metastore service sizing configurations"
  type = object({
    desired_count = optional(number, 1)
    memory        = optional(number, 512)
    cpu           = optional(number, 256)
  })
  default = {}
}

variable "quickwit_searcher" {
  description = "Searcher service sizing configurations"
  type = object({
    desired_count         = optional(number, 1)
    memory                = optional(number, 4096)
    cpu                   = optional(number, 1024)
    ephemeral_storage_gib = optional(number, 21)
  })
  default = {}
}

variable "quickwit_control_plane" {
  description = "Control plane service sizing configurations"
  type = object({
    # only 1 task is necessary
    memory = optional(number, 512)
    cpu    = optional(number, 256)
  })
  default = {}
}

variable "quickwit_janitor" {
  description = "Janitor service sizing configurations"
  type = object({
    # only 1 task is necessary
    memory = optional(number, 512)
    cpu    = optional(number, 256)
  })
  default = {}
}

variable "rds_config" {
  description = "Configurations of the metastore RDS database. Enable multi_az to ensure high availability."
  type = object({
    instance_class = optional(string, "db.t4g.micro")
    multi_az       = optional(bool, false)
  })
  default = {}
}

variable "external_postgres_uri_secret_arn" {
  description = "ARN of the SSM parameter or Secret Manager secret containing the URI of a Postgres instance (postgres://{user}:{password}@{address}:{port}/{db_instance_name}). The Postgres instance should allow indbound connections from the subnets specified in `variable.subnet_ids`. If provided, the internal RDS will not be created and `var.rds_config` is ignored."
  default     = ""
}


================================================
FILE: distribution/kubernetes/README.md
================================================
# Quickwit on Kubernetes

To deploy Quickwit on Kubernetes, use the official Quickwit Helm chart available at [helm.quickwit.io](https://helm.quickwit.io/) and refer to our [documentation](https://quickwit.io/docs/deployment/kubernetes/helm) for more information.


================================================
FILE: docker-compose.yml
================================================
# By default, this docker compose script maps all services to localhost only.
# If you need to make services available outside of your machine, add
# appropriate service mappings to the .env file. See .env.example file for
# configuration example.
#
# Notes on image versions:
#  - For the key services such as postgres and pulsar we are trying to run
#    against the oldest supported version
#  - For kafka we use the oldest version that supports KRaft.
#  - For everything else we are trying to run against the latest version.
#
# To run against the latest image versions update .env file. See .env.example
# file for configuration examples. You might need to remove the old images
# first if they are already tagged latest and volumes if their content is
# incompatible with the latest version, as in case of postgres.

name: quickwit

networks:
  default:
    name: quickwit-network
    ipam:
      config:
      - subnet: 172.16.7.0/24
        gateway: 172.16.7.1

services:
  localstack:
    image: localstack/localstack:${LOCALSTACK_VERSION:-3.5.0}
    container_name: localstack
    ports:
      - "${MAP_HOST_LOCALSTACK:-127.0.0.1}:4566:4566"
      - "${MAP_HOST_LOCALSTACK:-127.0.0.1}:4571:4571"
      - "${MAP_HOST_LOCALSTACK:-127.0.0.1}:8080:8080"
    profiles:
      - all
      - localstack
    environment:
      SERVICES: kinesis,s3,sqs
      PERSISTENCE: 1
    volumes:
      - .localstack:/etc/localstack/init/ready.d
      - localstack_data:/var/lib/localstack
    healthcheck:
      test: ["CMD", "curl", "-k", "-f", "https://localhost:4566/quickwit-integration-tests"]
      interval: 1s
      timeout: 5s
      retries: 100

  postgres:
    # The oldest supported version. EOL November 14, 2024
    image: postgres:${POSTGRES_VERSION:-12.17-alpine}
    container_name: postgres
    ports:
      - "${MAP_HOST_POSTGRES:-127.0.0.1}:5432:5432"
    profiles:
      - all
      - postgres
    environment:
      PGDATA: /var/lib/postgresql/data/pgdata
      POSTGRES_USER: ${POSTGRES_USER:-quickwit-dev}
      POSTGRES_PASSWORD: ${POSTGRES_PASSWORD:-quickwit-dev}
      POSTGRES_DB: ${POSTGRES_DB:-quickwit-metastore-dev}
    volumes:
      - postgres_data:/var/lib/postgresql/data
    healthcheck:
      test: ["CMD", "pg_isready"]
      interval: 1s
      timeout: 5s
      retries: 100

  pulsar-broker:
    # The oldest version with arm64 docker images. EOL May 2 2025
    image: apachepulsar/pulsar:${PULSAR_VERSION:-3.0.0}
    container_name: pulsar-broker
    command: bin/pulsar standalone --no-functions-worker
    ports:
      - "${MAP_HOST_PULSAR:-127.0.0.1}:6650:6650"
      - "${MAP_HOST_PULSAR:-127.0.0.1}:8081:8080"
    environment:
      PULSAR_MEM: "-Xms384M -Xmx384M"
      # Disable functions worker to save memory/time
      PULSAR_PREFIX_functionsWorkerEnabled: "false"
    profiles:
      - all
      - pulsar

  kafka-broker:
    image: confluentinc/confluent-local:${CP_VERSION:-7.4.11}
    container_name: kafka-broker
    ports:
      - "${MAP_HOST_KAFKA:-127.0.0.1}:9092:9092"
      - "${MAP_HOST_KAFKA:-127.0.0.1}:9101:9101"
    profiles:
      - all
      - kafka

    environment:
          # Mode KRaft (Single Node)
          KAFKA_NODE_ID: 1
          KAFKA_PROCESS_ROLES: 'broker,controller'
          KAFKA_CONTROLLER_QUORUM_VOTERS: '1@localhost:9093'
          KAFKA_LOG4J_LOGGERS: "org.apache.kafka.image.loader.MetadataLoader=WARN"

          # Listeners
          KAFKA_LISTENER_SECURITY_PROTOCOL_MAP: 'CONTROLLER:PLAINTEXT,EXTERNAL:PLAINTEXT'
          KAFKA_LISTENERS: 'EXTERNAL://0.0.0.0:9092,CONTROLLER://0.0.0.0:9093'
          KAFKA_ADVERTISED_LISTENERS: 'EXTERNAL://localhost:9092'
          KAFKA_CONTROLLER_LISTENER_NAMES: 'CONTROLLER'
          KAFKA_INTER_BROKER_LISTENER_NAME: 'EXTERNAL'

          # Configuration simplifiée
          KAFKA_OFFSETS_TOPIC_REPLICATION_FACTOR: 1
          KAFKA_GROUP_INITIAL_REBALANCE_DELAY_MS: 0
          KAFKA_TRANSACTION_STATE_LOG_REPLICATION_FACTOR: 1
          KAFKA_TRANSACTION_STATE_LOG_MIN_ISR: 1

          # ID du Cluster (Nécessaire pour KRaft)
          CLUSTER_ID: 'MkU3OEVBNTcwNTJENDM2Qk'

          KAFKA_HEAP_OPTS: -Xms256M -Xmx256M
    healthcheck:
        # test: ["CMD-SHELL", "nc -z localhost 9092 || exit 1"]
        test: ["CMD", "ub", "kafka-ready", "-b", "localhost:9092", "1", "5"]
        start_period: 5s
        interval: 5s
        timeout: 10s
        retries: 100

  azurite:
    image: mcr.microsoft.com/azure-storage/azurite:${AZURITE_VERSION:-3.24.0}
    container_name: azurite
    ports:
        - "${MAP_HOST_AZURITE:-127.0.0.1}:10000:10000" # Blob store port
    profiles:
      - all
      - azurite
    volumes:
        - azurite_data:/data
    command: azurite --blobHost 0.0.0.0 --loose

  fake-gcs-server:
    image: fsouza/fake-gcs-server:${FAKE_GCS_SERVER_VERSION:-1.47.7}
    container_name: fake-gcs-server
    ports:
      - "${MAP_HOST_FAKE_GCS_SERVER:-127.0.0.1}:4443:4443" # Blob store port
    profiles:
      - all
      - fake-gcs-server
    volumes:
      - fake_gcs_server_data:/data
    command: -scheme http

  grafana:
    image: grafana/grafana-oss:${GRAFANA_VERSION:-10.4.1}
    container_name: grafana
    ports:
      - "${MAP_HOST_GRAFANA:-127.0.0.1}:3000:3000"
    profiles:
      - grafana
      - monitoring
    environment:
      GF_AUTH_DISABLE_LOGIN_FORM: "true"
      GF_AUTH_ANONYMOUS_ENABLED: "true"
      GF_AUTH_ANONYMOUS_ORG_ROLE: Admin
    volumes:
      - grafana_conf:/etc/grafana
      - grafana_data:/var/lib/grafana
      - ./monitoring/grafana/dashboards:/var/lib/grafana/dashboards
      - ./monitoring/grafana/provisioning:/etc/grafana/provisioning

  jaeger:
    image: jaegertracing/all-in-one:${JAEGER_VERSION:-1.48.0}
    container_name: jaeger
    ports:
      - "${MAP_HOST_JAEGER:-127.0.0.1}:16686:16686" # Frontend
    profiles:
      - jaeger
      - monitoring

  otel-collector:
    image: otel/opentelemetry-collector:${OTEL_VERSION:-0.84.0}
    container_name: otel-collector
    ports:
      - "${MAP_HOST_OTEL:-127.0.0.1}:1888:1888"   # pprof extension
      - "${MAP_HOST_OTEL:-127.0.0.1}:8888:8888"   # Prometheus metrics exposed by the collector
      - "${MAP_HOST_OTEL:-127.0.0.1}:8889:8889"   # Prometheus exporter metrics
      - "${MAP_HOST_OTEL:-127.0.0.1}:13133:13133" # health_check extension
      - "${MAP_HOST_OTEL:-127.0.0.1}:4317:4317"   # OTLP gRPC receiver
      - "${MAP_HOST_OTEL:-127.0.0.1}:4318:4318"   # OTLP http receiver
      - "${MAP_HOST_OTEL:-127.0.0.1}:55679:55679" # zpages extension
    profiles:
      - otel
      - monitoring
    volumes:
      - ./monitoring/otel-collector-config.yaml:/etc/otel-collector-config.yaml
    command: ["--config=/etc/otel-collector-config.yaml"]

  prometheus:
    image: prom/prometheus:${PROMETHEUS_VERSION:-v2.43.0}
    container_name: prometheus
    ports:
      - "${MAP_HOST_PROMETHEUS:-127.0.0.1}:9090:9090"
    profiles:
      - prometheus
      - monitoring
    volumes:
      - ./monitoring/prometheus.yaml:/etc/prometheus/prometheus.yml
    extra_hosts:
      - "host.docker.internal:host-gateway"

  gcp-pubsub-emulator:
    # It is not an official docker image
    # if we prefer we can build a docker from the official docker image (gcloud cli)
    # and install the pubsub emulator https://cloud.google.com/pubsub/docs/emulator
    image: thekevjames/gcloud-pubsub-emulator:${GCLOUD_EMULATOR:-550.0.0}
    container_name: gcp-pubsub-emulator
    ports:
      - "${MAP_HOST_GCLOUD_EMULATOR:-127.0.0.1}:8681:8681"
    environment:
      # create a fake gcp project and a topic / subscription
      - PUBSUB_PROJECT1=quickwit-emulator,emulator_topic:emulator_subscription
    profiles:
      - all
      - gcp-pubsub

volumes:
  azurite_data:
  fake_gcs_server_data:
  grafana_conf:
  grafana_data:
  localstack_data:
  postgres_data:


================================================
FILE: docs/assets/sqs-file-source.tf
================================================
terraform {
  required_version = "1.7.5"
  required_providers {
    aws = {
      source  = "hashicorp/aws"
      version = "~> 5.39.1"
    }
  }
}

provider "aws" {
  region = "us-east-1"
  default_tags {
    tags = {
      provisioner = "terraform"
      author      = "Quickwit"
    }
  }
}

locals {
  sqs_notification_queue_name = "qw-tuto-s3-event-notifications"
  source_bucket_name          = "qw-tuto-source-bucket"
}

resource "aws_s3_bucket" "file_source" {
  bucket_prefix = local.source_bucket_name
  force_destroy = true
}

data "aws_iam_policy_document" "sqs_notification" {
  statement {
    effect = "Allow"

    principals {
      type        = "*"
      identifiers = ["*"]
    }

    actions   = ["sqs:SendMessage"]
    resources = ["arn:aws:sqs:*:*:${local.sqs_notification_queue_name}"]

    condition {
      test     = "ArnEquals"
      variable = "aws:SourceArn"
      values   = [aws_s3_bucket.file_source.arn]
    }
  }
}


resource "aws_sqs_queue" "s3_events" {
  name   = local.sqs_notification_queue_name
  policy = data.aws_iam_policy_document.sqs_notification.json

  redrive_policy = jsonencode({
    deadLetterTargetArn = aws_sqs_queue.s3_events_deadletter.arn
    maxReceiveCount     = 5
  })
}

resource "aws_sqs_queue" "s3_events_deadletter" {
  name = "${locals.sqs_notification_queue_name}-deadletter"
}

resource "aws_sqs_queue_redrive_allow_policy" "s3_events_deadletter" {
  queue_url = aws_sqs_queue.s3_events_deadletter.id

  redrive_allow_policy = jsonencode({
    redrivePermission = "byQueue",
    sourceQueueArns   = [aws_sqs_queue.s3_events.arn]
  })
}

resource "aws_s3_bucket_notification" "bucket_notification" {
  bucket = aws_s3_bucket.file_source.id

  queue {
    queue_arn = aws_sqs_queue.s3_events.arn
    events    = ["s3:ObjectCreated:*"]
  }
}

data "aws_iam_policy_document" "quickwit_node" {
  statement {
    effect = "Allow"
    actions = [
      "sqs:ReceiveMessage",
      "sqs:DeleteMessage",
      "sqs:ChangeMessageVisibility",
      "sqs:GetQueueAttributes",
    ]
    resources = [aws_sqs_queue.s3_events.arn]
  }
  statement {
    effect    = "Allow"
    actions   = ["s3:GetObject"]
    resources = ["${aws_s3_bucket.file_source.arn}/*"]
  }
}

resource "aws_iam_user" "quickwit_node" {
  name = "quickwit-filesource-tutorial"
  path = "/system/"
}

resource "aws_iam_user_policy" "quickwit_node" {
  name   = "quickwit-filesource-tutorial"
  user   = aws_iam_user.quickwit_node.name
  policy = data.aws_iam_policy_document.quickwit_node.json
}

resource "aws_iam_access_key" "quickwit_node" {
  user = aws_iam_user.quickwit_node.name
}

output "source_bucket_name" {
  value = aws_s3_bucket.file_source.bucket

}

output "notification_queue_url" {
  value = aws_sqs_queue.s3_events.id
}

output "quickwit_node_access_key_id" {
  value     = aws_iam_access_key.quickwit_node.id
  sensitive = true
}

output "quickwit_node_secret_access_key" {
  value     = aws_iam_access_key.quickwit_node.secret
  sensitive = true
}


================================================
FILE: docs/configuration/_category_.yaml
================================================
label: 'Configuration'
position: 4
collapsed: true


================================================
FILE: docs/configuration/index-config.md
================================================
---
title: Index configuration
sidebar_position: 3
toc_max_heading_level: 4
---

This page describes how to configure an index.

In addition to the `index_id`, the index configuration lets you define five items:

- The **index-uri**: it defines where the index files should be stored.
- The **doc mapping**: it defines how a document and the fields it contains are stored and indexed for a given index.
- The **indexing settings**: it defines the timestamp field used for sharding, and some more advanced parameters like the merge policy.
- The **search settings**: it defines the default search fields `default_search_fields`, a list of fields that Quickwit will search into if the user query does not explicitly target a field.
- The **retention policy**: it defines how long Quickwit should keep the indexed data. If not specified, the data is stored forever.

Configuration is set at index creation and can be changed using the [update endpoint](../reference/rest-api.md) or the [CLI](../reference/cli.md).

## Config file format

The index configuration format is YAML. When a key is absent from the configuration file, the default value is used.
Here is a complete example suited for the HDFS logs dataset:

```yaml
version: 0.7 # File format version.

index_id: "hdfs"

index_uri: "s3://my-bucket/hdfs"

doc_mapping:
  mode: lenient
  field_mappings:
    - name: timestamp
      type: datetime
      input_formats:
        - unix_timestamp
      output_format: unix_timestamp_secs
      fast_precision: seconds
      fast: true
    - name: severity_text
      type: text
      tokenizer: raw
      fast:
        - tokenizer: lowercase
    - name: body
      type: text
      tokenizer: default
      record: position
    - name: resource
      type: object
      field_mappings:
        - name: service
          type: text
          tokenizer: raw
  tag_fields: ["resource.service"]
  timestamp_field: timestamp
  index_field_presence: true

search_settings:
  default_search_fields: [severity_text, body]

retention:
  period: 90 days
  schedule: daily
```

## Index ID

The index ID is a string that uniquely identifies the index within the metastore. It may only contain uppercase or lowercase ASCII letters, digits, hyphens (`-`), and underscores (`_`). Finally, it must start with a letter and contain at least 3 characters but no more than 255.

## Index uri

The index-uri defines where the index files (also called splits) should be stored.
This parameter expects a [storage uri](storage-config#storage-uris).

The `index-uri` parameter is optional.
By default, the `index-uri` will be computed by concatenating the `index-id` with the
`default_index_root_uri` defined in the [Quickwit's config](node-config).

:::caution
The file storage will not work when running quickwit in distributed mode. Instead, AWS S3, Azure Blob Storage, Google Cloud Storage (in s3 interoperability mode) or other S3-compatible storage systems including Scaleway Object Storage and Garage should be used as storage when running several searcher nodes.
:::

## Doc mapping

The doc mapping defines how a document and the fields it contains are stored and indexed for a given index. A document is a collection of named fields, each having its own data type (text, bytes, datetime, bool, i64, u64, f64, ip, json).

| Variable      | Description   | Default value |
| ------------- | ------------- | ------------- |
| `field_mappings` | Collection of field mapping, each having its own data type (text, binary, datetime, bool, i64, u64, f64, ip, json).   | `[]` |
| `mode`        | Defines how quickwit should handle document fields that are not present in the `field_mappings`. In particular, the "dynamic" mode makes it possible to use quickwit in a schemaless manner. (See [mode](#mode)) | `dynamic`
| `dynamic_mapping` | This parameter is only allowed when `mode` is set to `dynamic`. It then defines whether dynamically mapped fields should be indexed, stored, etc.  | (See [mode](#mode))
| `tag_fields` | Collection of fields* explicitly defined in `field_mappings` whose values will be stored as part of the `tags` metadata. Allowed types are: `text` (with raw tokenizer), `i64` and `u64`. [Learn more about tags](../overview/concepts/querying.md#tag-pruning). | `[]` |
| `store_source` | Whether or not the original JSON document is stored or not in the index.   | `false` |
| `timestamp_field`      | Timestamp field* used for sharding documents in splits. The field has to be of type `datetime`. [Learn more about time sharding](./../overview/architecture.md).  | `None` |
| `partition_key`   |  If set, quickwit will route documents into different splits depending on the field name declared as the `partition_key`. | `null` |
| `max_num_partitions`  | Limits the number of splits created through partitioning. (See [Partitioning](../overview/concepts/querying.md#partitioning))  |    `200` |
| `index_field_presence` | `exists` queries are enabled automatically for fast fields. To enable it for all other fields set this parameter to `true`. Enabling it can have a significant CPU-cost on indexing.  |  false |

*: tags fields and timestamp field are expressed as a path from the root of the JSON object to the given field. If a field name contains a `.` character, it needs to be escaped with a `\` character.

### Field types

Each field[^1] has a type that indicates the kind of data it contains, such as integer on 64 bits or text.
Quickwit supports the following raw types [`text`](#text-type), [`i64`](#numeric-types-i64-u64-and-f64-type), [`u64`](#numeric-types-i64-u64-and-f64-type), [`f64`](#numeric-types-i64-u64-and-f64-type), [`datetime`](#datetime-type), [`bool`](#bool-type), [`ip`](#ip-type), [`bytes`](#bytes-type), and [`json`](#json-type), and also supports composite types such as array and object. Behind the scenes, Quickwit is using tantivy field types, don't hesitate to look at [tantivy documentation](https://github.com/tantivy-search/tantivy) if you want to go into the details.

### Raw types

#### Text type

This field is a text field that will be analyzed and split into tokens before indexing.
This kind of field is tailored for full-text search.

Example of a mapping for a text field:

```yaml
name: body
description: Body of the document
type: text
tokenizer: default
record: position
fieldnorms: true
fast:
  normalizer: lowercase
```

**Parameters for text field**

| Variable      | Description   | Default value |
| ------------- | ------------- | ------------- |
| `description` | Optional description for the field. | `None` |
| `stored`    | Whether value is stored in the document store | `true` |
| `indexed`   | Whether value should be indexed so it can be searched | `true` |
| `tokenizer` | Name of the `Tokenizer`. ([See tokenizers](#description-of-available-tokenizers)) for a list of available tokenizers.  | `default` |
| `record`    | Describes the amount of information indexed, choices between `basic`, `freq` and `position` | `basic` |
| `fieldnorms` | Whether to store fieldnorms for the field. Fieldnorms are required to calculate the BM25 Score of the document. | `false` |
| `fast`     | Whether value is stored in a fast field. The fast field will contain the term ids and the dictionary. The default behaviour for `true` is to store the original text unchanged. The normalizers on the fast field is separately configured. It can be configured via `normalizer: lowercase`. ([See normalizers](#description-of-available-normalizers)) for a list of available normalizers. | `false` |

##### Description of available tokenizers

| Tokenizer     | Description   |
| ------------- | ------------- |
| `raw`         | Does not process nor tokenize text. Filters out tokens larger than 255 bytes. This is similar to the `keyword` type in Elasticsearch. |
| `raw_lowercase` | Does not tokenize text, but lowercase it. Filters out tokens larger than 255 bytes.  |
| `default`     | Chops the text on according to whitespace and punctuation, removes tokens that are too long, and converts to lowercase. Filters out tokens larger than 255 bytes. |
| `en_stem`     | Like `default`, but also applies stemming on the resulting tokens. Filters out tokens larger than 255 bytes.  |
| `whitespace`  | Chops the text on according to whitespace only. Doesn't remove long tokens or converts to lowercase. |
| `chinese_compatible` |  Chop between each CJK character in addition to what `default` does. Should be used with `record: position` to be able to properly search |
| `lowercase`   | Applies a lowercase transformation on the text. It does not tokenize the text. |

##### Description of available normalizers

| Normalizer     | Description   |
| ------------- | ------------- |
| `raw`         | Does not process nor tokenize text. Filters token larger than 255 bytes.  |
| `lowercase` |  Applies a lowercase transformation on the text. Filters token larger than 255 bytes. |

**Description of record options**

| Record option | Description   |
| ------------- | ------------- |
| `basic`       |  Records only the `DocId`s |
| `freq`        |  Records the document ids as well as the term frequency  |
| `position`    |  Records the document id, the term frequency and the positions of occurrences.  |

Indexing with position is required to run phrase queries.

#### Numeric types: `i64`, `u64` and `f64` type

Quickwit handles three numeric types: `i64`, `u64`, and `f64`.

Numeric values can be stored in a fast field (the equivalent of Lucene's `DocValues`), which is a column-oriented storage used for range queries and aggregations.

When querying negative numbers without precising a field (using `default_search_fields`), you should single-quote the number (for instance '-5'), otherwise it will be interpreted as wanting to match anything but that number.

Example of a mapping for an u64 field:

```yaml
name: rating
description: Score between 0 and 5
type: u64
stored: true
indexed: true
fast: true
```

**Parameters for i64, u64 and f64 field**

| Variable        | Description   | Default value |
| --------------- | ------------- | ------------- |
| `description`   | Optional description for the field. | `None` |
| `stored`        | Whether the field values are stored in the document store. | `true` |
| `indexed`       | Whether the field values are indexed. | `true` |
| `fast`          | Whether the field values are stored in a fast field. | `false` |
| `coerce`        | Whether to convert numbers passed as strings to integers or floats. | `true` |
| `output_format` | JSON type used to return numbers in search results. Possible values are `number` or `string`. | `number` |

#### `datetime` type

The `datetime` type handles dates and datetimes. Since JSON doesn’t have a date type, the `datetime` field support multiple input types and formats. The supported input types are:
- floating-point or integer numbers representing a Unix timestamp
- strings containing a formatted date, datetime, or Unix timestamp

The `input_formats` field parameter specifies the accepted date formats. The following input formats are natively supported:
- `iso8601`
- `rfc2822`
- `rfc3339`
- `strptime`
- `unix_timestamp`

**Input formats**

When specifying multiple input formats, the corresponding parsers are attempted in the order they are declared. The following formats are natively supported:
- `iso8601`, `rfc2822`, `rfc3339`: parse dates using standard ISO and RFC formats.
- `strptime`: parse dates using the Unix [strptime](https://man7.org/linux/man-pages/man3/strptime.3.html) format with some variations:
  - `strptime` format specifiers: `%C`, `%d`, `%D`, `%e`, `%F`, `%g`, `%G`, `%h`, `%H`, `%I`, `%j`, `%k`, `%l`, `%m`, `%M`, `%n`, `%R`, `%S`, `%t`, `%T`, `%u`, `%U`, `%V`, `%w`, `%W`, `%y`, `%Y`, `%%`.
  - `%f` for milliseconds precision support.
  - `%z` timezone offsets can be specified as `(+|-)hhmm` or `(+|-)hh:mm`.

:::warning
The timezone name format specifier (`%Z`) is not supported currently.
:::

- `unix_timestamp`: parse float and integer numbers to Unix timestamps. Floating-point values are converted to timestamps expressed in seconds. Integer values are converted to Unix timestamps whose precision, determined in `seconds`, `milliseconds`, `microseconds`, or `nanoseconds`, is inferred from the number of input digits. Internally, datetimes are converted to UTC (if the time zone is specified) and stored as *i64* integers. As a result, Quickwit only supports timestamp values ranging from `Apr 13, 1972 23:59:55` to `Mar 16, 2242 12:56:31`.

:::warning
Converting timestamps from float to integer values may occur with a loss of precision.
:::

When a `datetime` field is stored as a fast field, the `fast_precision` parameter indicates the precision used to truncate the values before encoding, which improves compression (truncation here means zeroing). The `fast_precision` parameter can take the following values: `seconds`, `milliseconds`, `microseconds`, or `nanoseconds`. It only affects what is stored in fast fields when a `datetime` field is marked as "fast". Finally, operations on `datetime` fast fields, e.g. via aggregations, need to be done at the nanosecond level.

:::info
Internally `datetime` is stored in `nanoseconds` in fast fields and in the docstore, and in `seconds` in the term dictionary.
:::

In addition, Quickwit supports the `output_format` field parameter to specify with which precision datetimes are deserialized. This parameter supports the same value as input formats except for `unix_timestamp` which is replaced by the following formats:
- `unix_timestamp_secs`: displays timestamps in seconds.
- `unix_timestamp_millis`: displays timestamps in milliseconds.
- `unix_timestamp_micros`: displays timestamps in microseconds.
- `unix_timestamp_nanos`: displays timestamps in nanoseconds.

Example of a mapping for a datetime field:

```yaml
name: timestamp
type: datetime
description: Time at which the event was emitted
input_formats:
  - rfc3339
  - unix_timestamp
  - "%Y %m %d %H:%M:%S.%f %z"
output_format: unix_timestamp_secs
stored: true
indexed: true
fast: true
fast_precision: milliseconds
```

**Parameters for datetime field**

| Variable      | Description   | Default value |
| ------------- | ------------- | ------------- |
| `input_formats` | Formats used to parse input dates | [`rfc3339`, `unix_timestamp`] |
| `output_format` | Format used to display dates in search results | `rfc3339` |
| `stored`        | Whether the field values are stored in the document store | `true` |
| `indexed`       | Whether the field values are indexed | `true` |
| `fast`          | Whether the field values are stored in a fast field | `false` |
| `fast_precision`     | The precision (`seconds`, `milliseconds`, `microseconds`, or `nanoseconds`) used to store the fast values. | `seconds` |

#### `bool` type

The `bool` type accepts boolean values.

Example of a mapping for a boolean field:

```yaml
name: is_active
description: Activation status
type: bool
stored: true
indexed: true
fast: true
```

**Parameters for bool field**

| Variable      | Description   | Default value |
| ------------- | ------------- | ------------- |
| `description` | Optional description for the field. | `None` |
| `stored`    | Whether value is stored in the document store | `true` |
| `indexed`   | Whether value is indexed | `true` |
| `fast`      | Whether value is stored in a fast field | `false` |

#### `ip` type

The `ip` type accepts IP address values, both IpV4 and IpV6 are supported. Internally IpV4 are converted to IpV6.

Example of a mapping for an IP field:

```yaml
name: host_ip
description: Host IP address
type: ip
fast: true
```

**Parameters for IP field**

| Variable      | Description   | Default value |
| ------------- | ------------- | ------------- |
| `description` | Optional description for the field. | `None` |
| `stored`    | Whether value is stored in the document store | `true` |
| `indexed`   | Whether value is indexed | `true` |
| `fast`      | Whether value is stored in a fast field | `false` |


#### `bytes` type
The `bytes` type accepts a binary value as a `Base64` encoded string.

Example of a mapping for a bytes field:

```yaml
name: binary
type: bytes
stored: true
indexed: true
fast: true
input_format: hex
output_format: hex
```

**Parameters for bytes field**

| Variable      | Description   | Default value |
| ------------- | ------------- | ------------- |
| `description` | Optional description for the field. | `None` |
| `stored`    | Whether value is stored in the document store | `true` |
| `indexed`   | Whether value is indexed | `true` |
| `fast`     | Whether value is stored in a fast field. Only on 1:1 cardinality, not supported on `array<bytes>` fields | `false` |
| `input_format`   | Encoding used to represent input bytes, either `hex` or `base64` | `base64` |
| `output_format`   |  Encoding used to represent bytes in search results, either `hex` or `base64` | `base64` |

#### `json` type

The `json` type accepts a JSON object.

Example of a mapping for a JSON field:

```yaml
name: parameters
type: json
stored: true
indexed: true
tokenizer: raw
expand_dots: false
fast:
  normalizer: lowercase
```

Stored primitive types are inferred from the JSON value types using the following rules:
- a boolean value `true` or `false` is stored as `bool`
- numeric values are cast to the first compatible format between `i64`, `u64` or
  `f64` (in this order)
- for string values (surrounded with quotes), Tantivy attempts to parse a date
  in `rfc3339` format. If the parsing fails, the value is stored as `text` using
  the configured tokenization rules

**Parameters for JSON field**

| Variable      | Description   | Default value |
| ------------- | ------------- | ------------- |
| `description` | Optional description for the field. | `None` |
| `stored`    | Whether value is stored in the document store | `true` |
| `indexed`   | Whether value is indexed | `true` |
| `fast`     | Whether value is stored in a fast field. The default behaviour for text in the JSON is to store the text unchanged. A normalizer can be configured via `normalizer: lowercase`. ([See normalizers](#description-of-available-normalizers)) for a list of available normalizers. | `false` |
| `tokenizer` | **Only affects strings in the json object**. Name of the `Tokenizer`, choices between `raw`, `default`, `en_stem` and `chinese_compatible` | `raw` |
| `record`    | **Only affects strings in the json object**. Describes the amount of information indexed, choices between `basic`, `freq` and `position` | `basic` |
| `expand_dots`    | If true, json keys containing a `.` should be expanded. For instance, if `expand_dots` is set to true, `{"k8s.node.id": "node-2"}` will be indexed as if it was `{"k8s": {"node": {"id": "node2"}}}`. The benefit is that escaping the `.` will not be required at query time. In other words, `k8s.node.id:node2` will match the document. This does not impact the way the document is stored.  | `true` |

Note that the `tokenizer` and the `record` have the same definition and the same effect as for the text field.

To search into a json object, one then needs to extend the field name with the path that will lead to the target value.

For instance, when indexing the following object:
```json
{
    "product_name": "droopy t-shirt",
    "attributes": {
        "color": ["red", "green", "white"],
        "size:": "L"
    }
}
```

Assuming `attributes` as been defined as a field mapping as follows:
```yaml
- type: json
  name: attributes
```

`attributes.color:red` is then a valid query.

If, in addition, `attributes` is set as a default search field, then `color:red` is a valid query.

### Composite types

#### array

Quickwit supports arrays for all raw types except for `object` types.

To declare an array type of `i64` in the index config, you just have to set the type to `array<i64>`.

#### object

Quickwit supports nested objects as long as it does not contain arrays of objects.

```yaml
name: resource
type: object
field_mappings:
  - name: service
    type: text
```

#### concatenate

Quickwit supports mapping the content of multiple fields to a single one. This can be more efficient at query time than
searching through dozens of `default_search_fields`. It also allows querying inside a json field without knowing the path
to the field being searched.

```yaml
name: my_default_field
type: concatenate
concatenate_fields:
  - text # things inside text, tokenized with the `default` tokenizer
  - resource.author # all fields in resource.author, assuming resource is an `object` field.
include_dynamic_fields: true
tokenizer: default
record: basic
```

Concatenate fields don't support fast fields, and are never stored. They uses their own tokenizer, independently of the
tokenizer configured on the individual fields.
At query time, concatenate fields don't support range queries.
Only the following types are supported inside a concatenate field: text, bool,
i64, u64, f64, json. Other types are rejected at index creation, or silently
discarded during indexation if they are found inside a json field. Unlike
regular JSON fields, JSON fields in a concatenate field don't store RFC3339
dates as Tantivy dates. This means you can still perform prefix queries,
e.g `my_default_field:"2025-12-12"*` to work around the lack of support for range
queries.
Adding an object field to a concatenate field doesn't automatically add its subfields (yet).
<!-- typing is made so it wouldn't be too hard to add, as well as things like params_* matching all fields which starts name with params_ , but the feature isn't implemented yet -->
It isn't possible to add subfields from a json field to a concatenate field. For instance if `attributes` is a json field, it's not possible to add only `attributes.color` to a concatenate field.

For json fields and dynamic fields, the path is not indexed, only values are. For instance, given the following document:
```json
{
  "421312": {
    "my-key": "my-value"
  }
}
```
It is possible to search for `my-value` despite not knowing the full path, but it isn't possible to search for all documents containing a key `my-key`.

<!--
when the features are supported, add these:
  - params_* # shortcut for all fields starting with `params_`
  - resource.author # all fields in resource.author, assuming resource is either of type `object` or `json`
---
Only the following types are supported inside a concatenate field: text, datetime, bool, i64, u64, ip, json. Other types are rejected
---
Datetime can only be queried in their RFC-3339 form, possibly omitting later components. # todo! will have to confirm this is achievable
---
plan:
- implement text/bool/i64/u64 (nothing to do on search side for it to work). all gets converted to strings
- add json
- add object
- add dynamic
-- you are here
- add wildcard
- add json sub-fields?
- add datetime (at index time, generate multiple tokens for yyyy, yyyy-MM... to yyyy-MM-ddThh:mm:ss; at search time, emit both tokenized and "raw" version of what may look like a datetime)
- check negative i64 works as intended for non-raw tokenizer, and leverage datetime code if it doesn't
- add ip (at index time, convert to single token; at search time, emit both tokenized and "raw" version of the ip)
- allow optionally indexing json path (how do we tokenize it? split at each dot, or not?)
-->

### Mode

The `mode` describes how Quickwit should behave when it receives a field that is not defined in the field mapping.

Quickwit offers you three different modes:
- `dynamic` (default value): unmapped fields are gathered by Quickwit and handled as defined in the `dynamic_mapping` parameter.
- `lenient`: unmapped fields are dismissed by Quickwit.
- `strict`: if a document contains a field that is not mapped, quickwit will dismiss it, and count it as an error.

#### Dynamic Mapping

`dynamic` mode makes it possible to operate Quickwit in a schemaless manner, or with a partial schema.
The configuration of `dynamic` mode can be set via the `dynamic_mapping` parameter.
`dynamic_mapping` offers the same configuration options as when configuring a `json` field. It defaults to:

```yaml
version: 0.7
index_id: my-dynamic-index
doc_mapping:
  mode: dynamic
  dynamic_mapping:
    indexed: true
    stored: true
    tokenizer: raw
    record: basic
    expand_dots: true
    fast: true
```

When the `dynamic_mapping` is set as indexed (default), fields mapped through
dynamic mode can be searched by targeting the path needed to access them from
the root of the JSON object.

For instance, in an entirely schemaless settings, a minimal index configuration could be:

```yaml
version: 0.7
index_id: my-dynamic-index
doc_mapping:
    # If you have a timestamp field, it is important to tell quickwit about it.
    timestamp_field: unix_timestamp
    # mode: dynamic #< Commented out, as dynamic is the default mode.
```

With such a simple configuration, we can index a complex document like the following:

```json
{
  "endpoint": "/admin",
  "query_params": {
    "ctk": "e42bb897d",
    "page": "eeb"
  },
  "src": {
    "ip": "8.8.8.8",
    "port": 53,
  },
  //...
}
```

The following queries are then valid, and match the document above.

```bash
// Fields can be searched simply.
endpoint:/admin

// Nested object can be queried by specifying a `.` separated
// path from the root of the json object to the given field.
query_params.ctk:e42bb897d

// numbers are searchable too
src.port:53

// and of course we can combine them with boolean operators.
src.port:53 AND query_params.ctk:e42bb897d
```

The stored primitive type inference is the [same as for JSON fields](#json-type).

### Field name validation rules

Currently Quickwit only accepts field name that matches the following regular expression:
`^[@$_\-a-zA-Z][@$_/\.\-a-zA-Z0-9]{0,254}$`

In plain language:
- it needs to have at least one character.
- it can only contain uppercase and lowercase ASCII letters `[a-zA-Z]`, digits `[0-9]`, `.`, hyphens `-`, underscores `_`, slash `/`, at `@` and dollar `$` signs.
- it must not start with a dot or a digit.
- it must be different from Quickwit's reserved field mapping names `_source`, `_dynamic`, `_field_presence`.

:::caution
For field names containing the `.` character, you will need to escape it when referencing them. Otherwise the `.` character will be interpreted as a JSON object property access. Because of this, it is recommended to avoid using field names containing the `.` character.
:::

### Behavior with null values or missing fields

Fields with `null` or missing fields in your JSON document will be silently ignored when indexing.

## Indexing settings

This section describes indexing settings for a given index.

| Variable      | Description   | Default value |
| ------------- | ------------- | ------------- |
| `commit_timeout_secs`      | Maximum number of seconds before committing a split since its creation.   | `60` |
| `split_num_docs_target` | Target number of docs per split.   | `10000000` |
| `merge_policy` | Describes the strategy used to trigger split merge operations (see [Merge policies](#merge-policies) section below). |
| `resources.heap_size`      | Indexer heap size per source per index.   | `2000000000` |
| `docstore_compression_level` | Level of compression used by zstd for the docstore. Lower values may increase ingest speed, at the cost of index size | `8` |
| `docstore_blocksize` | Size of blocks in the docstore, in bytes. Lower values may improve doc retrieval speed, at the cost of index size | `1000000` |

:::note

Choosing an appropriate commit timeout is critical. With a shorter commit timeout, ingested data is queryable faster. But the published splits will be smaller, increasing the overhead associated with [merges](#merge-policies). 

When decommissioning definitively an indexer node that received data through the ingest API (including the [Elastic bulk API](/docs/reference/es_compatible_api) and the OTEL [log](/docs/log-management/otel-service.md) and [trace](/docs/distributed-tracing/otel-service.md) services), we need to make sure that all the data that was persisted locally (Write Ahead Log) is indexed and committed. After receiving the termination signal, the Quickwit process waits for the indexing pipelines to finish processing this local data. This can take as long as the longest commit timeout of all indexes. Make sure that the termination grace period of the infrastructure supporting the Quickwit indexer nodes is long enough (e.g [`terminationGracePeriodSeconds`](https://kubernetes.io/docs/concepts/containers/container-lifecycle-hooks/) in Kubernetes or [`stopTimeout`](https://docs.aws.amazon.com/AmazonECS/latest/developerguide/task_definition_parameters.html) on AWS ECS).

:::

### Merge policies

Quickwit makes it possible to define the strategy used to decide which splits should be merged together and when.

Quickwit offers three different merge policies, each with their
own set of parameters.

#### "Stable log" merge policy

The stable log merge policy attempts to minimize write amplification AND keep time-pruning power as high as possible, by merging splits with a similar size, and with a close time span.

Quickwit's default merge policy is the `stable_log` merge policy
with the following parameters:

```yaml
version: 0.7
index_id: "hdfs"
# ...
indexing_settings:
  merge_policy:
    type: "stable_log"
    min_level_num_docs: 100000
    merge_factor: 10
    max_merge_factor: 12
    maturation_period: 48h
```


| Variable      | Description   | Default value |
| ------------- | ------------- | ------------- |
| `merge_factor`      | *(advanced)* Number of splits to merge together in a single merge operation.   | `10` |
| `max_merge_factor` | *(advanced)* Maximum number of splits that can be merged together in a single merge operation.  | `12` |
| `min_level_num_docs` |  *(advanced)* Number of docs below which all splits are considered as belonging to the same level.   | `100000` |
| `maturation_period` | Duration after which a split is considered mature, and won't be considered for merges anymore. May impact the completion time of pending delete tasks. | `48h` |

#### "Limit Merge" merge policy

*The limit merge policy is considered advanced*.

The limit merge policy simply limits write amplification by setting an upperbound
of the number of merge operation a split should undergo.


```yaml
version: 0.7
index_id: "hdfs"
# ...
indexing_settings:
  merge_policy:
    type: "limit_merge"
    max_merge_ops: 5
    merge_factor: 10
    max_merge_factor: 12
    maturation_period: 48h
```


| Variable      | Description   | Default value |
| ------------- | ------------- | ------------- |
| `max_merge_ops`   |  Maximum number of merges that a given split should undergo. | `4` |
| `merge_factor`      | *(advanced)* Number of splits to merge together in a single merge operation.   | `10` |
| `max_merge_factor` | *(advanced)* Maximum number of splits that can be merged together in a single merge operation.  | `12` |
| `maturation_period` | Duration after which a split is considered mature, and won't be considered for merges anymore. May impact the completion time of pending delete tasks. | `48h` |

#### No merge

The `no_merge` merge policy entirely disables merging.

:::caution
This setting is not recommended. Merges are necessary to reduce the number of splits, and hence improve search performances.
:::

```yaml
version: 0.7
index_id: "hdfs"
indexing_settings:
    merge_policy:
        type: "no_merge"
```


### Indexer memory usage

Indexer works with a default heap of 2 GiB of memory. This does not directly reflect the overall memory usage, but doubling this value should give a fair approximation.


## Search settings

This section describes search settings for a given index.

| Variable      | Description   | Default value |
| ------------- | ------------- | ------------- |
| `default_search_fields` | Default list of fields that will be used for search. The field names in this list may be declared explicitly in the schema, or may refer to a field captured by the dynamic mode. | `None` |

## Retention policy

This section describes how Quickwit manages data retention. In Quickwit, the retention policy manager drops data on a split basis as opposed to individually dropping documents. Splits are evaluated based on their `time_range` which is derived from the index timestamp field specified in the (`doc_mapping.timestamp_field`) settings. Using this setting, the retention policy will delete a split when `now() - split.time_range.end >= retention_policy.period`

```yaml
version: 0.7
index_id: hdfs
# ...
retention:
  period: 90 days
  schedule: daily
```

| Variable      | Description   | Default value |
| ------------- | ------------- | ------------- |
| `period`      | Duration after which splits are dropped, expressed in a human-readable way (`1 day`, `2 hours`, `a week`, ...). | required |
| `schedule`    | Frequency at which the retention policy is evaluated and applied, expressed as a cron expression (`0 0 * * * *`) or human-readable form (`hourly`, `daily`, `weekly`, `monthly`, `yearly`). | `hourly` |


`period` is specified as set of time spans. Each time span is an integer followed by a unit suffix like: `2 days 3h 24min`. The supported units are:
  - `nsec`, `ns` -- nanoseconds
  - `usec`, `us` -- microseconds
  - `msec`, `ms` -- milliseconds
  - `seconds`, `second`, `sec`, `s`
  - `minutes`, `minute`, `min`, `m`
  - `hours`, `hour`, `hr`, `h`
  - `days`, `day`, `d`
  - `weeks`, `week`, `w`
  - `months`, `month`, `M` -- a month is defined as `30.44 days`
  - `years`, `year`, `y` -- a year is defined as `365.25 days`


================================================
FILE: docs/configuration/index.md
================================================
---
title: Configuration Reference
---

import DocCardList from '@theme/DocCardList';

<DocCardList />


================================================
FILE: docs/configuration/lambda-config.md
================================================
---
title: Lambda configuration
sidebar_position: 6
---

Quickwit supports offloading leaf search operations to AWS Lambda for horizontal scaling. When the local search queue becomes saturated, overflow splits are automatically sent to Lambda functions for processing.

:::note
Lambda offloading is currently only supported on AWS.
:::

## How it works

Lambda offloading is **only active when a `lambda` configuration section is present** under `searcher` in your node configuration. When configured:

1. Quickwit monitors the local search queue depth
2. When pending searches exceed the `offload_threshold`, new splits are sent to Lambda instead of being queued locally
3. Lambda returns per-split search results that are cached and merged with local results

This allows Quickwit to handle traffic spikes without provisioning additional searcher nodes.

## Startup validation

When a `lambda` configuration is defined, Quickwit performs a **dry run invocation** at startup to verify that:
- The Lambda function exists
- The function version matches the embedded binary
- The invoker has permission to call the function

If this validation fails, **Quickwit will fail to start**. This ensures that Lambda offloading works correctly before the node begins serving traffic.

## Configuration

Add a `lambda` section under `searcher` in your node configuration:

```yaml
searcher:
  lambda:
    offload_threshold: 100
    auto_deploy:
      execution_role_arn: arn:aws:iam::123456789012:role/quickwit-lambda-role
      memory_size: 5 GiB
      invocation_timeout_secs: 15
```

### Lambda configuration options

| Property | Description | Default value |
| --- | --- | --- |
| `function_name` | Name of the AWS Lambda function to invoke. | `quickwit-lambda-search` |
| `max_splits_per_invocation` | Maximum number of splits to send in a single Lambda invocation. Must be at least 1. | `10` |
| `offload_threshold` | Number of pending local searches before offloading to Lambda. A value of `0` offloads everything to Lambda. | `100` |
| `auto_deploy` | Auto-deployment configuration. If set, Quickwit automatically deploys or updates the Lambda function at startup. | (none) |

### Auto-deploy configuration options

| Property | Description | Default value |
| --- | --- | --- |
| `execution_role_arn` | **Required.** IAM role ARN for the Lambda function's execution role. | |
| `memory_size` | Memory allocated to the Lambda function. More memory provides more CPU. | `5 GiB` |
| `invocation_timeout_secs` | Timeout for Lambda invocations in seconds. | `15` |

## Deployment options

### Automatic deployment (recommended)

With `auto_deploy` configured, Quickwit automatically:
1. Creates the Lambda function if it doesn't exist
2. Updates the function code if the embedded binary has changed
3. Publishes a new version with a unique identifier
4. Garbage collects old versions (keeps current + 5 most recent)

This is the recommended approach as it ensures the Lambda function always matches the Quickwit binary version.

### Manual deployment

You can deploy the Lambda function manually without `auto_deploy`:
1. Download the Lambda zip from [GitHub releases](https://github.com/quickwit-oss/quickwit/releases)
2. Create or update the Lambda function using AWS CLI, Terraform, or the AWS Console
3. Publish a version with description format `quickwit_{version}_{sha256}_{timeout}_{deploy_config}"` (e.g., `quickwit_0_8_0_fa940f44_5120_60s_6c3b2`)

The description must match the format Quickwit expects, or it won't find the function version.

## IAM permissions

### Permissions for the Quickwit node

The IAM role or user running Quickwit needs the following permissions to invoke Lambda:

```json
{
  "Version": "2012-10-17",
  "Statement": [
    {
      "Effect": "Allow",
      "Action": [
        "lambda:InvokeFunction"
      ],
      "Resource": "arn:aws:lambda:*:*:function:quickwit-lambda-search:*"
    }
  ]
}
```

If using `auto_deploy`, additional permissions are required for deployment:

```json
{
  "Version": "2012-10-17",
  "Statement": [
    {
      "Effect": "Allow",
      "Action": [
        "lambda:CreateFunction",
        "lambda:GetFunction",
        "lambda:UpdateFunctionCode",
        "lambda:PublishVersion",
        "lambda:ListVersionsByFunction",
        "lambda:DeleteFunction"
      ],
      "Resource": "arn:aws:lambda:*:*:function:quickwit-lambda-search"
    },
    {
      "Effect": "Allow",
      "Action": "iam:PassRole",
      "Resource": "arn:aws:iam::*:role/quickwit-lambda-role",
      "Condition": {
        "StringEquals": {
          "iam:PassedToService": "lambda.amazonaws.com"
        }
      }
    }
  ]
}
```

### Lambda execution role

The Lambda function requires an execution role with S3 read access to your index data.

Example policy:

```json
{
  "Version": "2012-10-17",
  "Statement": [
    {
      "Effect": "Allow",
      "Action": "s3:GetObject",
      "Resource": "arn:aws:s3:::your-index-bucket/*"
    }
  ]
}
```

The execution role must also have a trust policy allowing Lambda to assume it:

```json
{
  "Version": "2012-10-17",
  "Statement": [
    {
      "Effect": "Allow",
      "Principal": {
        "Service": "lambda.amazonaws.com"
      },
      "Action": "sts:AssumeRole"
    }
  ]
}
```

## CloudWatch logging

The Lambda function emits structured logs (JSON) to stdout. To have these logs captured by CloudWatch, add the following iam permissions to the Lambda execution role:

```json
{
  "Version": "2012-10-17",
  "Statement": [
    {
      "Effect": "Allow",
      "Action": [
        "logs:CreateLogGroup",
        "logs:CreateLogStream",
        "logs:PutLogEvents"
      ],
      "Resource": "arn:aws:logs:*:*:*"
    }
  ]
}
```

No additional configuration is needed on the Quickwit side.

## Versioning

Quickwit uses content-based versioning for Lambda:
- A SHA256 hash of the Lambda binary is computed at build time
- This hash is embedded in the Lambda function description as `quickwit:{version}-{sha256_short}`
- When Quickwit starts, it searches for a version matching this description
- Different Quickwit builds with the same Lambda binary share the same Lambda version
- Updating the Lambda binary automatically triggers a new deployment

## Example configuration


Minimal configuration (with auto-deployment):

```yaml
searcher:
  lambda:
    auto_deploy:
      execution_role_arn: arn:aws:iam::123456789012:role/quickwit-lambda-role
```


Full configuration (auto-deployment):

```yaml
searcher:
  lambda:
    function_name: quickwit-lambda-search
    max_splits_per_invocation: 10
    offload_threshold: 10
    auto_deploy:
      execution_role_arn: arn:aws:iam::123456789012:role/quickwit-lambda-role
      memory_size: 5 GiB
      invocation_timeout_secs: 15
```

Aggressive offloading (send everything to Lambda):

```yaml
searcher:
  lambda:
    function_name: quickwit-lambda-search
    offload_threshold: 0
    auto_deploy:
      execution_role_arn: arn:aws:iam::123456789012:role/quickwit-lambda-role
```


================================================
FILE: docs/configuration/metastore-config.md
================================================
---
title: Metastore configuration
sidebar_position: 4
---

Quickwit needs a place to store meta-information about its indexes.

For instance:

- The index configuration.
- Meta-information about its splits. For instance, their IDs, the number of documents they contain, their sizes, their min/max timestamp, and the set of tags present in the split.
- The different sources checkpoints.
- Some extra information such as the index creation time.

The metastore is entirely defined by a single URI. One can set it by editing the `metastore_uri` parameter of the [node configuration file](./node-config.md) (often named `quickwit.yaml`).

Currently, Quickwit offers two implementations:

- **PostgreSQL**: recommended for distributed usage.
- **File-backed implementation**.

# PostgreSQL Metastore

We recommend the PostgreSQL metastore for any distributed usage.

The PostgreSQL metastore can be configured by setting a PostgreSQL URI in the `metastore_uri` parameter of the Quickwit configuration file. The URI takes the following format:

```
postgres://[user]:[password]@[host]:[port]/[dbname]
```

Some of those parameters can be omitted. The following PostgreSQL URIs are for instance valid:

```
postgres://localhost/mydb
postgres://user@localhost
postgres://user:secret@localhost
```

The database has to be created in advance.

On its first execution, Quickwit will transparently create the necessary tables.

Likewise, if you upgrade Quickwit to a version that includes some changes in the PostgreSQL schema, Quickwit will transparently operate the migration startup.

# File-backed metastore

For convenience, Quickwit also makes it possible to store its metadata in files using a file-backed metastore. In that case, Quickwit will write one file per index.

The metastore is then configured by passing a [storage URI](storage-config#storage-uris) that will serve as the root of the metastore storage.

The metadata file associated with a given index will then be stored under

  `[storage_uri]/[index_id]/metastore.json`

For the moment, Quickwit supports two types of storage types:

- a local file system URI (e.g., `file:///opt/toto`). It is also valid to pass a file path directly (without file://). `/var/quickwit`. Relative paths will be resolved with respect to the current working directory.
- S3-compatible storage URI (e.g., `s3://my-bucket/some-path`). See the [storage config](storage-config) documentation to configure S3 or S3-compatible storage providers.

### Polling configuration

By default, the File-Backed Metastore is only read once when you start a Quickwit process (searcher, indexer, ...).

You can also configure it to poll the File-Backed Metastore periodically to keep a fresh view of it. This is useful for a Searcher instance that needs to be aware of new splits published by an Indexer running in parallel.

To configure the polling interval (in seconds), add a URI fragment to the storage URI as follows: `s3://quickwit/my-indexes#polling_interval=30s`

:::note
The polling interval can be configured in seconds only; other units, such as minutes or hours, are not supported.
:::

:::tip
Amazon S3 charges $0.0004 per 1000 GET requests. Polling a metastore every 30 seconds costs $0.04 per month and index.
:::

### Examples

The following file-backed metastore URIs for instance are valid:

```markdown
s3://my-indexes
s3://quickwit/my-indexes
s3://quickwit/my-indexes#polling_interval=30s
file:///local/indices
file:///local/indices#polling_interval=30s
/local/indices
./quickwit-metastores
```

:::caution
The file-backed metastore does not support multiple instances running at the same time because it does not implement any locking mechanism to prevent concurrent writes from overwriting each other. Ensure that only one file-backed metastore instance is running at all times.
:::


================================================
FILE: docs/configuration/node-config.md
================================================
---
title: Node configuration
sidebar_position: 1
---

The node configuration allows you to customize and optimize the settings for individual nodes in your cluster. It is divided into several sections:

- Common configuration settings: shared top-level properties
- Storage settings: defined in the [storage](#storage-configuration) section
- Metastore settings: defined in the [metastore](#metastore-configuration) section
- Ingest settings: defined in the [ingest_api](#ingest-api-configuration) section
- Indexer settings: defined in the [indexer](#indexer-configuration) section
- Searcher settings: defined in the [searcher](#searcher-configuration) section
- Jaeger settings: defined in the [jaeger](#jaeger-configuration) section

A commented example is available here: [quickwit.yaml](https://github.com/quickwit-oss/quickwit/blob/main/config/quickwit.yaml).

## Common configuration

| Property | Description | Env variable | Default value |
| --- | --- | --- | --- |
| `version` | Config file version. `0.7` is the only available value with a retro compatibility on `0.5` and `0.4`. | | |
| `cluster_id` | Unique identifier of the cluster the node will be joining. Clusters sharing the same network should use distinct cluster IDs.| `QW_CLUSTER_ID` | `quickwit-default-cluster` |
| `node_id` | Unique identifier of the node. It must be distinct from the node IDs of its cluster peers. Defaults to the instance's short hostname if not set. | `QW_NODE_ID` | short hostname |
| `enabled_services` | Enabled services (control_plane, indexer, janitor, metastore, searcher) | `QW_ENABLED_SERVICES` | all services |
| `listen_address` | The IP address or hostname that Quickwit service binds to for starting REST and GRPC server and connecting this node to other nodes. By default, Quickwit binds itself to 127.0.0.1 (localhost). This default is not valid when trying to form a cluster. | `QW_LISTEN_ADDRESS` | `127.0.0.1` |
| `advertise_address` | IP address advertised by the node, i.e. the IP address that peer nodes should use to connect to the node for RPCs. | `QW_ADVERTISE_ADDRESS` | `listen_address` |
| `gossip_listen_port` | The port which to listen for the Gossip cluster membership service (UDP). | `QW_GOSSIP_LISTEN_PORT` | `rest.listen_port` |
| `grpc_listen_port` | The port on which gRPC services listen for traffic. | `QW_GRPC_LISTEN_PORT` | `rest.listen_port + 1` |
| `peer_seeds` | List of IP addresses or hostnames used to bootstrap the cluster and discover the complete set of nodes. This list may contain the current node address and does not need to be exhaustive. If the list of peer seeds contains a host name, Quickwit will resolve it by querying the DNS every minute. On kubernetes for instance, it is a good practise to set it to a [headless service](https://kubernetes.io/docs/concepts/services-networking/service/#headless-services). | `QW_PEER_SEEDS` | |
| `data_dir` | Path to directory where data (tmp data, splits kept for caching purpose) is persisted. This is mostly used in indexing. | `QW_DATA_DIR` | `./qwdata` |
| `metastore_uri` | Metastore URI. Can be a local directory or `s3://my-bucket/indexes` or `postgres://username:password@localhost:5432/metastore`. [Learn more about the metastore configuration](metastore-config.md). | `QW_METASTORE_URI` | `{data_dir}/indexes` |
| `default_index_root_uri` | Default index root URI that defines the location where index data (splits) is stored. The index URI is built following the scheme: `{default_index_root_uri}/{index-id}` | `QW_DEFAULT_INDEX_ROOT_URI` | `{data_dir}/indexes` |
| environment variable only | Log level of Quickwit. Can be a direct log level, or a comma separated list of `module_name=level` | `RUST_LOG` | `info` |

## REST configuration

This section contains the REST API configuration options.

| Property | Description | Env variable | Default value |
| --- | --- | --- | --- |
| `listen_port` | The port on which the REST API listens for HTTP traffic. | `QW_REST_LISTEN_PORT` | `7280` |
| `cors_allow_origins` | Configure the CORS origins which are allowed to access the API. [Read more](#configuring-cors-cross-origin-resource-sharing) | |
| `extra_headers` | List of header names and values | | |

### Configuring CORS (Cross-origin resource sharing)

CORS (Cross-origin resource sharing) describes which address or origins can access the REST API from the browser.
By default, sharing resources cross-origin is not allowed.

A wildcard, single origin, or multiple origins can be specified as part of the `cors_allow_origins` parameter:


Example of a REST configuration:

```yaml
rest:
  listen_port: 1789
  extra_headers:
    x-header-1: header-value-1
    x-header-2: header-value-2
  cors_allow_origins: '*'

#   cors_allow_origins: https://my-hdfs-logs.domain.com   # Optionally we can specify one domain
#   cors_allow_origins:                                   # Or allow multiple origins
#     - https://my-hdfs-logs.domain.com
#     - https://my-hdfs.other-domain.com
```

## gRPC configuration

This section contains the configuration options for gRPC services and clients used for internal communication between nodes.

| Property | Description | Env variable | Default value |
| --- | --- | --- | --- |
| `max_message_size` | The maximum size (in bytes) of messages exchanged by internal gRPC clients and services. | | `20 MiB` |

Example of a gRPC configuration:

```yaml
grpc:
  max_message_size: 30 MiB
```

:::warning
We advise changing the default value of 20 MiB only if you encounter the following error:
`Error, message length too large: found 24732228 bytes, the limit is: 20971520 bytes.` In that case, increase `max_message_size` by increments of 10 MiB until the issue disappears. This is a temporary fix: the next version of Quickwit will rely exclusively on gRPC streaming endpoints and handle messages of any length.
:::

## Storage configuration

Please refer to the dedicated [storage configuration](storage-config) page to learn more about configuring Quickwit for various storage providers.

Here are also some minimal examples of how to configure Quickwit with Amazon S3 or Alibaba OSS:

```bash
AWS_ACCESS_KEY_ID=<your access key ID>
AWS_SECRET_ACCESS_KEY=<your secret access key>
```

*Amazon S3*

```yaml
storage:
  s3:
    region: us-east-1
```

*Alibaba*

```yaml
storage:
  s3:
    region: us-east-1
    endpoint: https://oss-us-east-1.aliyuncs.com
```

## Metastore configuration

This section may contain one configuration subsection per available metastore implementation. The specific configuration parameters for each implementation may vary. Currently, the available metastore implementations are:
- File-backed
- PostgreSQL

### File-backed metastore configuration

File-backed metastore doesn't have any node level configuration. You can configure the poll interval [at the index level](./metastore-config.md#polling-configuration).

### PostgreSQL metastore configuration

| Property | Description | Default value |
| --- | --- | --- |
| `min_connections` | Minimum number of connections to maintain in the pool at all times. | `0` |
| `max_connections` | Maximum number of connections to maintain in the pool. | `10` |
| `acquire_connection_timeout` | Maximum amount of time to spend waiting for an available connection before aborting a query. | `10s` |
| `idle_connection_timeout` | Maximum idle duration before closing individual connections. | `10min` |
| `max_connection_lifetime` | Maximum lifetime of individual connections. | `30min` |

Example of a metastore configuration for PostgreSQL in YAML format:

```yaml
metastore:
  postgres:
    min_connections: 10
    max_connections: 50
    acquire_connection_timeout: 30s
    idle_connection_timeout: 1h
    max_connection_lifetime: 1d
```

## Indexer configuration

This section contains the configuration options for an indexer. The split store is documented in the [indexing document](../overview/concepts/indexing.md#split-store).

| Property | Description | Default value |
| --- | --- | --- |
| `split_store_max_num_bytes` | Maximum size in bytes allowed in the split store. | `100G` |
| `split_store_max_num_splits` | Maximum number of files allowed in the split store. | `1000` |
| `max_concurrent_split_uploads` | Maximum number of concurrent split uploads allowed on the node. | `12` |
| `merge_concurrency` | Maximum number of merge operations that can be executed on the node at one point in time. | `(2 x num threads available) / 3` |
| `enable_otlp_endpoint` | If true, enables the OpenTelemetry exporter endpoint to ingest logs and traces via the OpenTelemetry Protocol (OTLP). | `false` |
| `cpu_capacity` | Advisory parameter used by the control plane. The value can expressed be in threads (e.g. `2`) or in term of millicpus (`2000m`). The control plane will attempt to schedule indexing pipelines on the different nodes proportionally to the cpu capacity advertised by the indexer. It is NOT used as a limit. All pipelines will be scheduled regardless of whether the cluster has sufficient capacity or not. The control plane does not attempt to spread the work equally when the load is well below the `cpu_capacity`. Users who need a balanced load on all of their indexer nodes can set the `cpu_capacity` to an arbitrarily low value as long as they keep it proportional to the number of threads available. | `num threads available` |
| `enable_cooperative_indexing` | Enable sharing resources more efficiently when the number of indexes actively written to is significantly higher than the number of cores but might decrease the overall indexing throughput. | `false` |

Example:

```yaml
indexer:
  split_store_max_num_bytes: 100G
  split_store_max_num_splits: 1000
  max_concurrent_split_uploads: 12
  enable_otlp_endpoint: true
```

## Ingest API configuration

| Property | Description | Default value |
| --- | --- | --- |
| `max_queue_memory_usage` | Maximum size in bytes of the in-memory Ingest queue. | `2GiB` |
| `max_queue_disk_usage` | Maximum disk-space in bytes taken by the Ingest queue. The minimum size is at least `256M` and be at least `max_queue_memory_usage`. | `4GiB` |
| `content_length_limit` | Maximum payload size uncompressed. Increasing this is discouraged, use a [file source](../ingest-data/sqs-files.md) instead. | `10MiB` |
| `grpc_compression_algorithm` | Compression algorithm (`gzip` or `zstd`) to use for gRPC traffic between nodes for the ingest service | `None` |

Example:

```yaml
ingest_api:
  max_queue_memory_usage: 2GiB
  max_queue_disk_usage: 4GiB
  content_length_limit: 10MiB
  grpc_compression_algorithm: zstd
```

## Searcher configuration

This section contains the configuration options for a Searcher.

| Property | Description | Default value |
| --- | --- | --- |
| `aggregation_memory_limit` | Controls the maximum amount of memory that can be used for aggregations before aborting. This limit is per searcher node. A node may run concurrent queries, which share the limit. The first query that will hit the limit will be aborted and frees its memory. It is used to prevent excessive memory usage during the aggregation phase, which can lead to performance degradation or crashes. | `500M`|
| `aggregation_bucket_limit` | Determines the maximum number of buckets returned to the client. | `65000` |
| `fast_field_cache_capacity` | Fast field in memory cache capacity on a Searcher. If your filter by dates, run aggregations, range queries, or even for tracing, it might worth increasing this parameter. The [metrics](../reference/metrics.md) starting by `quickwit_cache_fastfields_cache` can help you make an informed choice when setting this value. | `1G` |
| `split_footer_cache_capacity` | Split footer in memory cache (it is essentially the hotcache) capacity on a Searcher.| `500M` |
| `partial_request_cache_capacity` | Partial request in memory cache capacity on a Searcher. Cache intermediate state for a request, possibly making subsequent requests faster. It can be disabled by setting the size to `0`. | `64M` |
| `max_num_concurrent_split_searches` | Maximum number of concurrent split search requests running on a Searcher. | `100` |
| `split_cache` | Searcher split cache configuration options defined in the section below. Cache disabled if unspecified. | |
| `request_timeout_secs` | The time before a search request is cancelled. This should match the timeout of the stack calling into quickwit if there is one set.  | `30` |

### Searcher split cache configuration

This section contains the configuration options for the on-disk searcher split cache. Files are stored in the data directory under `searcher-split-cache/`.

| Property | Description | Default value |
| --- | --- | --- |
| `max_num_bytes` | Maximum disk size in bytes allowed in the split cache. Can be exceeded by the size of one split. | |
| `max_num_splits` | Maximum number of splits allowed in the split cache.   | `10000` |
| `num_concurrent_downloads` | Maximum number of concurrent download of splits. | `1` |


Example:

```yaml
searcher:
  fast_field_cache_capacity: 1G
  split_footer_cache_capacity: 500M
  partial_request_cache_capacity: 64M
  split_cache:
    max_num_bytes: 1G
    max_num_splits: 10000
    num_concurrent_downloads: 1
```

## Jaeger configuration

| Property | Description | Default value |
| --- | --- | --- |
| `enable_endpoint` | If true, enables the gRPC endpoint that allows the Jaeger Query Service to connect and retrieve traces. | `false` |

Example:

```yaml
jaeger:
  enable_endpoint: true
```


## Using environment variables in the configuration

You can use environment variable references in the config file to set values that need to be configurable during deployment. To do this, use:

`${VAR_NAME}`

where `VAR_NAME` is the name of the environment variable.

Each variable reference is replaced at startup by the value of the environment variable. The replacement is case-sensitive and occurs before the configuration file is parsed. Referencing undefined variables throws an error unless you specify a default value or custom error text.

To specify a default value, use:

`${VAR_NAME:-default_value}`

where `default_value` is the value to use if the environment variable is unset.

```
<config_field>: ${VAR_NAME}
or
<config_field>: ${VAR_NAME:-default value}
```

For example:

```bash
export QW_LISTEN_ADDRESS=0.0.0.0
```

```yaml
# config.yaml
version: 0.7
cluster_id: quickwit-cluster
node_id: my-unique-node-id
listen_address: ${QW_LISTEN_ADDRESS}
rest:
  listen_port: ${QW_LISTEN_PORT:-1111}
```

Will be interpreted by Quickwit as:

```yaml
version: 0.7
cluster_id: quickwit-cluster
node_id: my-unique-node-id
listen_address: 0.0.0.0
rest:
  listen_port: 1111
```


================================================
FILE: docs/configuration/ports-config.md
================================================
---
title: Ports configuration
sidebar_position: 6
---

When starting a quickwit search server, one important parameter that can be configured is
the `rest.listen_port` (defaults to :7280).

Internally, Quickwit will, in fact, use three sockets. The ports of these three sockets
cannot be configured independently at the moment.
The ports used are computed relative to the `rest.listen_port` port, as follows.


| Service                       | Port used                 | Protocol |  Default  |
|-------------------------------|---------------------------|----------|-----------|
| Http server with the rest api | `${rest.listen_port}`     |   TCP    | 7280      |
| Cluster membership            | `${rest.listen_port}`     |   UDP    | 7280      |
| GRPC service                  | `${rest.listen_port} + 1` |   TCP    | 7281      |

It is not possible for the moment to configure these ports independently.


In order to form a cluster, you will also need to define a `peer_seeds` parameter.
The following addresses are valid peer seed addresses:

| Type | Example without port | Example with port         |
|--------------|--------------|---------------------------|
| IPv4         | 172.1.0.12   | 172.1.0.12:7180           |
| IPv6         | 2001:0db8:85a3:0000:0000:8a2e:0370:7334  | [2001:0db8:85a3:0000:0000:8a2e:0370:7334:7180]:7280 |
| hostname     | node3        | node3:7180                |

If no port is specified in a peer node address, a Quickwit node will assume the peer is using the same port as itself.


================================================
FILE: docs/configuration/source-config.md
================================================
---
title: Source configuration
sidebar_position: 5
---

Quickwit can insert data into an index from one or multiple sources.
A source can be added after index creation using the [CLI command](../reference/cli.md#source) `quickwit source create`.
It can also be enabled or disabled with the `quickwit source enable/disable` subcommands.

A source is declared using an object called source config, which defines the source's settings. It consists of multiple parameters:

- source ID
- source type
- source parameters
- input_format
- maximum number of pipelines per indexer (optional)
- desired number of pipelines (optional)
- transform parameters (optional)

## Source ID

The source ID is a string that uniquely identifies the source within an index. It may only contain uppercase or lowercase ASCII letters, digits, hyphens (`-`), and underscores (`_`). Finally, it must start with a letter and contain at least 3 characters but no more than 255.

## Source type

The source type designates the kind of source being configured. As of version 0.5, available source types are `ingest-api`, `kafka`, `kinesis`, and `pulsar`. The `file` type is also supported but only for local ingestion from [the CLI](/docs/reference/cli.md#tool-local-ingest).

## Source parameters

The source parameters indicate how to connect to a data store and are specific to the source type.

### File source

A file source reads data from files containing JSON objects separated by newlines (NDJSON). Gzip compression is supported provided that the file name ends with the `.gz` suffix.

#### Ingest a single file (CLI only)

To ingest a specific file, run the indexing directly in an adhoc CLI process with:

```bash
./quickwit tool local-ingest --index <index> --input-path <input-path>
```

Both local and object files are supported, provided that the environment is configured with the appropriate permissions. A tutorial is available [here](/docs/ingest-data/ingest-local-file.md).

#### Notification based file ingestion (beta)

Quickwit can automatically ingest all new files that are uploaded to an S3 bucket. This requires creating and configuring an [SQS notification queue](https://docs.aws.amazon.com/AmazonS3/latest/userguide/ways-to-add-notification-config-to-bucket.html). A complete example can be found [in this tutorial](/docs/ingest-data/sqs-files.md).


The `notifications` parameter takes an array of notification settings. Currently one notifier can be configured per source and only the SQS notification `type` is supported.

Required fields for the SQS `notifications` parameter items:
- `type`: `sqs`
- `queue_url`: complete URL of the SQS queue (e.g `https://sqs.us-east-1.amazonaws.com/123456789012/queue-name`)
- `message_type`: format of the message payload, either
  - `s3_notification`: an [S3 event notification](https://docs.aws.amazon.com/AmazonS3/latest/userguide/EventNotifications.html)
  - `raw_uri`: a message containing just the file object URI (e.g. `s3://mybucket/mykey`)
  - `deduplication_window_duration_sec`: maximum duration for which ingested files checkpoints are kept (default 3600)
  - `deduplication_window_max_messages`: maximum number of ingested file checkpoints kept (default 100k)
  - `deduplication_cleanup_interval_secs`: frequency at which outdated file checkpoints are cleaned up

*Adding a file source with SQS notifications to an index with the [CLI](../reference/cli.md#source)*

```bash
cat << EOF > source-config.yaml
version: 0.8
source_id: my-sqs-file-source
source_type: file
num_pipelines: 2
params:
  notifications:
    - type: sqs
      queue_url: https://sqs.us-east-1.amazonaws.com/123456789012/queue-name
      message_type: s3_notification
EOF
./quickwit source create --index my-index --source-config source-config.yaml
```

:::note

- Quickwit does not automatically delete the source files after a successful ingestion. You can use [S3 object expiration](https://docs.aws.amazon.com/AmazonS3/latest/userguide/lifecycle-expire-general-considerations.html) to configure how long they should be retained in the bucket.
- Configure the notification to only forward events of type `s3:ObjectCreated:*`. Other events are acknowledged by the source without further processing and an warning is logged.
- We strongly recommend using a [dead letter queue](https://docs.aws.amazon.com/AWSSimpleQueueService/latest/SQSDeveloperGuide/sqs-dead-letter-queues.html) to receive all messages that couldn't be processed by the file source. A `maxReceiveCount` of 5 is a good default value. Here are some common situations where the notification message ends up in the dead letter queue:
  - the notification message could not be parsed (e.g it is not a valid S3 notification)
  - the file was not found
  - the file is corrupted (e.g unexpected compression)
- AWS S3 notifications and AWS SQS provide "at least once" delivery guaranties. To avoid duplicates, the file source includes a mechanism that prevents the same file from being ingested twice. It works by storing checkpoints in the metastore that track the indexing progress for each file. You can decrease `deduplication_window_*` or increase `deduplication_cleanup_interval_secs` to reduce the load on the metastore.

:::

### Ingest API source

An ingest API source reads data from the [Ingest API](/docs/reference/rest-api.md#ingest-data-into-an-index). This source is automatically created at the index creation and cannot be deleted nor disabled.

### Kafka source

A Kafka source reads data from a Kafka stream. Each message in the stream must hold a JSON object.

A tutorial is available [here](/docs/ingest-data/kafka.md).

#### Kafka source parameters

The Kafka source consumes a `topic` using the client library [librdkafka](https://github.com/edenhill/librdkafka) and forwards the key-value pairs carried by the parameter `client_params` to the underlying librdkafka consumer. Common `client_params` options are bootstrap servers (`bootstrap.servers`), or security protocol (`security.protocol`). Please, refer to [Kafka](https://kafka.apache.org/documentation/#consumerconfigs) and [librdkafka](https://github.com/edenhill/librdkafka/blob/master/CONFIGURATION.md) documentation pages for more advanced options.

| Property | Description | Default value |
| --- | --- | --- |
| `topic` | Name of the topic to consume. | required |
| `client_log_level` | librdkafka client log level. Possible values are: debug, info, warn, error. | `info` |
| `client_params` | librdkafka client configuration parameters. | `{}` |
| `enable_backfill_mode` | Backfill mode stops the source after reaching the end of the topic. | `false` |

**Kafka client parameters**

- `bootstrap.servers`
Comma-separated list of host and port pairs that are the addresses of a subset of the Kafka brokers in the Kafka cluster.

- `auto.offset.reset`
Defines the behavior of the source when consuming a partition for which there is no initial offset saved in the checkpoint. `earliest` consumes from the beginning of the partition, whereas `latest` (default) consumes from the end.

- `enable.auto.commit`
This setting is ignored because the Kafka source manages commit offsets internally using the [checkpoint API](../overview/concepts/indexing.md#checkpoint) and forces auto-commits to be disabled.

- `group.id`
Kafka-based distributed indexing relies on consumer groups. Unless overridden in the client parameters, the default group ID assigned to each consumer managed by the source is `quickwit-{index_uid}-{source_id}`.

- `max.poll.interval.ms`
Short max poll interval durations may cause a source to crash when back pressure from the indexer occurs. Therefore, Quickwit recommends using the default value of `300000` (5 minutes).

*Adding a Kafka source to an index with the [CLI](../reference/cli.md#source)*

```bash
cat << EOF > source-config.yaml
version: 0.8
source_id: my-kafka-source
source_type: kafka
num_pipelines: 2
params:
  topic: my-topic
  client_params:
    bootstrap.servers: localhost:9092
    security.protocol: SSL
EOF
./quickwit source create --index my-index --source-config source-config.yaml
```

### Kinesis source

A Kinesis source reads data from an [Amazon Kinesis](https://aws.amazon.com/kinesis/) stream. Each message in the stream must hold a JSON object.

A tutorial is available [here](/docs/ingest-data/kinesis.md).

**Kinesis source parameters**

The Kinesis source consumes a stream identified by a `stream_name` and a `region`.

| Property | Description | Default value |
| --- | --- | --- |
| `stream_name` | Name of the stream to consume. | required |
| `region` | The AWS region of the stream. Mutually exclusive with `endpoint`. | `us-east-1` |
| `endpoint` | Custom endpoint for use with AWS-compatible Kinesis service. Mutually exclusive with `region`. | optional |

If no region is specified, Quickwit will attempt to find one in multiple other locations and with the following order of precedence:

1. Environment variables (`AWS_REGION` then `AWS_DEFAULT_REGION`)

2. Config file, typically located at `~/.aws/config` or otherwise specified by the `AWS_CONFIG_FILE` environment variable if set and not empty.

3. Amazon EC2 instance metadata service determining the region of the currently running Amazon EC2 instance.

4. Default value: `us-east-1`

*Adding a Kinesis source to an index with the [CLI](../reference/cli.md#source)*

```bash
cat << EOF > source-config.yaml
version: 0.7
source_id: my-kinesis-source
source_type: kinesis
params:
  stream_name: my-stream
EOF
quickwit source create --index my-index --source-config source-config.yaml
```

### Pulsar source

A Puslar source reads data from one or several Pulsar topics. Each message in topic(s) must hold a JSON object.

A tutorial is available [here](/docs/ingest-data/pulsar.md).

**Pulsar source parameters**

The Pulsar source consumes `topics` using the client library [pulsar-rs](https://github.com/streamnative/pulsar-rs).

| Property | Description | Default value |
| --- | --- | --- |
| `topics` | List of topics to consume. | required |
| `address` | Pulsar URL (pulsar:// and pulsar+ssl://). | required |
| `consumer_name` | The consumer name to register with the pulsar source. | `quickwit` |

*Adding a Pulsar source to an index with the [CLI](../reference/cli.md#source)*

```bash
cat << EOF > source-config.yaml
version: 0.7
source_id: my-pulsar-source
source_type: pulsar
params:
  topics:
    - my-topic
  address: pulsar://localhost:6650
EOF
./quickwit source create --index my-index --source-config source-config.yaml
```

## Number of pipelines

The `num_pipelines` parameter is only available for distributed sources like Kafka, GCP PubSub, and Pulsar.

It defines the number of pipelines to run on a cluster for the source. The actual placement of these pipelines on the different indexer
will be decided by the control plane.

:::info

Note that distributing the indexing load of partitioned sources like Kafka is done by assigning the different partitions to different pipelines. As a result, it is important to ensure that the number of partitions is a multiple of `num_pipelines`.

Also, assuming you are only indexing a single Kafka source in your Quickwit cluster, you should set the number of pipelines to a multiple of the number of indexers. Finally, if your indexing throughput is high, you should provision between 2 and 4 vCPUs per pipeline.

For instance, assume you want to index a 60-partition topic, with each partition receiving a throughput of 10 MB/s. If you measured that Quickwit can index your data at a pace of 40MB/s per pipeline, a possible setting could be:
- 5 indexers with 8 vCPUs each
- 15 pipelines

Each indexer will then be in charge of 3 pipelines, and each pipeline will cover 4 partitions.
:::


## Transform parameters

For all source types but the `ingest-api`, ingested documents can be transformed before being indexed using [Vector Remap Language (VRL)](https://vector.dev/docs/reference/vrl/) scripts.

| Property | Description | Default value |
| --- | --- | --- |
| `script` | Source code of the VRL program executed to transform documents. | required |
| `timezone` | Timezone used in the VRL program for date and time manipulations. It must be a valid name in the [TZ database](https://en.wikipedia.org/wiki/List_of_tz_database_time_zones) | `UTC` |

```yaml
# Your source config here
# ...
transform:
  script: |
    .message = downcase(string!(.message))
    .timestamp = now()
    del(.username)
  timezone: local
```

## Input format

The `input_format` parameter specifies the expected data format of the source. The formats currently supported are:
- `json` (default)
- `otlp_logs_json`
- `otlp_logs_proto`
- `otlp_traces_json`
- `otlp_traces_proto`
- `plain_text`

*OTLP formats*

When ingesting OTLP data into an OTLP logs or traces index with a source other than the native OTEL endpoints, use this parameter to specify whether the exported logs or traces will be serialized in JSON or Protobuf. When possible, prefer the latter, which is a more compact encoding.

*Plaint text format*

Use this parameter for unstructured text data. Internally, Quickwit can only index JSON data. To allow the ingestion of plain text documents, Quickwit transform them on the fly into JSON objects of the following form: `{"plain_text": "<original plain text document>"}`. Then, they can be optionally transformed into more complex documents using a VRL script. (see [transform feature](#transform-parameters)).

The following is an example of how one could parse and transform a CSV dataset containing a list of users described by 3 attributes: first name, last name, and age.

```yaml
# Your source config here
# ...
input_format: plain_text
transform:
  script: |
    user = parse_csv!(.plain_text)
    .first_name = user[0]
    .last_name = user[1]
    .age = to_int!(user[2])
    del(.plain_text)
```

## Enabling/disabling a source from an index

A source can be enabled or disabled from an index using the [CLI command](../reference/cli.md) `quickwit source enable` or `quickwit source disable`:

```bash
quickwit source disable --index my-index --source my-source
```

A source is enabled by default. When disabling a source, the related indexing pipelines will be shut down on each relevant indexer and indexing for this source will be paused.

## Deleting a source from an index

A source can be removed from an index using the [CLI command](../reference/cli.md) `quickwit source delete`:

```bash
quickwit source delete --index my-index --source my-source
```

When deleting a source, the checkpoint associated with the source is also removed.


================================================
FILE: docs/configuration/storage-config.md
================================================
---
title: Storage configuration
sidebar_position: 2
---

## Supported Storage Providers

Quickwit currently supports four types of storage providers:
- Amazon S3 and S3-compatible (Garage, MinIO, ...)
- Azure Blob Storage
- Local file storage*
- Google Cloud Storage (native API)

## Storage URIs

Storage URIs refer to different storage providers identified by a URI "protocol" or "scheme". Quickwit supports the following storage URI protocols:
- `s3://` for Amazon S3 and S3-compatible
- `azure://` for Azure Blob Storage
- `file://` for local file systems
- `gs://` for Google Cloud Storage

In general, you can use a storage URI or a file path anywhere you would intuitively expect a file path. For instance:
- when setting the `index_uri` of an index to specify the storage provider and location;
- when setting the `metastore_uri` in a node config to set up a file-backed metastore;
- when passing a file path as a command line argument.

### Local file storage URIs

Quickwit interprets regular file paths as local file system URIs. Relative file paths are allowed and are resolved relatively to the current working directory (CWD). `~` can be used as a shortcut to refer to the user’s home directory. The following are valid local file system URIs:

```markdown
- /var/quickwit
- file:///var/quickwit
- /home/quickwit/data
- ~/data
- ./quickwit
```

:::caution
When using the `file://` protocol, a third `/` is necessary to express an absolute path. For instance, the following URI `file://home/quickwit/` is interpreted as `./home/quickwit`
:::

## Storage configuration

This section contains one configuration subsection per storage provider. If a storage configuration parameter is not explicitly set, Quickwit relies on the default values provided by the storage provider SDKs ([Azure SDK for Rust](https://github.com/Azure/azure-sdk-for-rust), [AWS SDK for Rust](https://github.com/awslabs/aws-sdk-rust)).

### S3 storage configuration

| Property | Description | Default value |
| --- | --- | --- |
| `flavor` |  The optional storage flavor to use. Available flavors are `digital_ocean`, `garage`, `gcs`, and `minio`. | |
| `access_key_id` | The AWS access key ID. | |
| `secret_access_key` | The AWS secret access key. | |
| `region` | The AWS region to send requests to. | `us-east-1` (SDK default) |
| `endpoint` | Custom endpoint for use with S3-compatible providers. | SDK default |
| `force_path_style_access` | Disables [virtual-hosted–style](https://docs.aws.amazon.com/AmazonS3/latest/userguide/VirtualHosting.html) requests. Required by some S3-compatible providers (Ceph, MinIO). | `false` |
| `disable_multi_object_delete` | Disables [Multi-Object Delete](https://docs.aws.amazon.com/AmazonS3/latest/API/API_DeleteObjects.html) requests. Required by some S3-compatible providers (GCS). | `false` |
| `disable_multipart_upload` | Disables [multipart upload](https://docs.aws.amazon.com/AmazonS3/latest/userguide/mpuoverview.html) of objects. Required by some S3-compatible providers (GCS). | `false` |

:::warning
Hardcoding credentials into configuration files is not secure and strongly discouraged. Prefer the alternative authentication methods that your storage backend may provide.
:::

#### Environment variables

| Env variable | Description |
| --- | --- |
| `QW_S3_ENDPOINT` | Custom S3 endpoint. |
| `QW_S3_MAX_CONCURRENCY` | Limit the number of concurrent requests to S3 |

#### Storage flavors

Storage flavors ensure that Quickwit works correctly with storage providers that deviate from the S3 API by automatically configuring the appropriate settings. The available flavors are:
- `digital_ocean`
- `garage`
- `gcs`
- `minio`

*Digital Ocean*

The Digital Ocean flavor (`digital_ocean`) forces path-style access and turns off multi-object delete requests.

*Garage flavor*

The Garage flavor (`garage`) overrides the `region` parameter to `garage` and forces path-style access.

*Google Cloud Storage*

The Google Cloud Storage flavor (`gcs`) turns off multi-object delete requests and multipart uploads.

*MinIO flavor*

The MinIO flavor (`minio`) overrides the `region` parameter to `minio` and forces path-style access.

Example of a storage configuration for Google Cloud Storage in YAML format:

```yaml
storage:
  s3:
    flavor: gcs
    region: us-east1
    endpoint: https://storage.googleapis.com
```

### Azure storage configuration

| Property | Description | Default value |
| --- | --- | --- |
| `account` | The Azure storage account name. | |
| `access_key` | The Azure storage account access key. | |

#### Environment variables

| Env variable | Description |
| --- | --- |
| `QW_AZURE_STORAGE_ACCOUNT` | Azure Blob Storage account name. |
| `QW_AZURE_STORAGE_ACCESS_KEY` | Azure Blob Storage account access key. |

Example of a storage configuration for Azure in YAML format:

```yaml
storage:
  azure:
    account: your-azure-account-name
    access_key: your-azure-access-key
```

## Storage configuration examples for various object storage providers

### Garage

[Garage](https://garagehq.deuxfleurs.fr/) is an open-source distributed object storage service tailored for self-hosting.

```yaml
storage:
  s3:
    flavor: garage
    endpoint: http://127.0.0.1:3900
```

### MinIO

[MinIO](https://min.io/) is a high-performance object storage.

```yaml
storage:
  s3:
    flavor: minio
    endpoint: http://127.0.0.1:9000
```

Note: `default_index_root_uri` or index URIs do not include the endpoint, you should set it as a typical S3 path such as `s3://indexes`.


================================================
FILE: docs/configuration/template-config.md
================================================
---
title: Index template configuration
sidebar_position: 7
toc_max_heading_level: 4
---

This page describes how to configure an index template.

Index templates let you dynamically create indexes according to predefined rules. Templates are used automatically when documents are received on the ingest API for an index that doesn't exist.

The index template configuration lets you define the following parameters:
- `template_id` (required)
- `description`
- `index_id_patterns` (required)
- `index_root_uri`
- `priority`

Besides, the following parameters can also be configured and are the same as those found in the [index configuration](../configuration/index-config.md):
- doc mapping (required)
- indexing settings
- search settings
- retention policy

You can manage templates using the [index template API](../reference/rest-api.md#index-template-api).

## Config file format

The index configuration format is YAML or JSON. When a key is absent from the configuration file, the default value is used.
Here is a complete example:

```yaml
version: 0.9 # File format version.

template_id: "hdfs-dev"

index_root_uri: "s3://my-bucket/hdfs-dev/"

description: "HDFS log management dev"

index_id_patterns:
    - hdfs-dev-*
    - hdfs-staging-*

priority: 100

doc_mapping:
  mode: lenient
  field_mappings:
    - name: timestamp
      type: datetime
      input_formats:
        - unix_timestamp
      output_format: unix_timestamp_secs
      fast_precision: seconds
      fast: true
    - name: severity_text
      type: text
      tokenizer: raw
      fast:
        - tokenizer: lowercase
    - name: body
      type: text
      tokenizer: default
      record: position
    - name: resource
      type: object
      field_mappings:
        - name: service
          type: text
          tokenizer: raw
  tag_fields: ["resource.service"]
  timestamp_field: timestamp
  index_field_presence: true

search_settings:
  default_search_fields: [severity_text, body]

retention:
  period: 90 days
  schedule: daily
```

## Template ID

The `template_id` is a string that uniquely identifies the index template within the metastore. It may only contain uppercase or lowercase ASCII letters, digits, hyphens (`-`), and underscores (`_`). It must start with a letter and contain at least 3 characters but no more than 255.

## Description

An optional string that describes what the index template is used for.

## Index root uri

The `index_root_uri` defines where the index files (also called splits) should be stored.
This parameter expects a [storage uri](storage-config#storage-uris).

The actual URI of the index is the path concatenation of the `index_root_uri` with the index id. 

If `index_root_uri` is not defined, the `default_index_root_uri` from [Quickwit's node config](node-config) will be used.

## Index ID patterns

`index_id_patterns` is a list of strings that define which indices should be created according to this template. Use [glob-like](https://en.wikipedia.org/wiki/Glob_(programming)) wildcard ( \* ) expressions to target indices that match a pattern: test\* or \*test or te\*t or \*test\*. You can also use negative patterns by prepending the hyphen `-` character.

Patterns must obey the following rules:
- It must follow the regex `^-?[a-zA-Z\*][a-zA-Z0-9-_\.\*]{0,254}$`.
- It cannot contain consecutive asterisks (`*`).
- If it does not contain an asterisk (`*`), the length must be greater than or equal to 3 characters.

## Priority

When multiple templates match a new index ID, the template with the highest `priority` is used to configure the index.


================================================
FILE: docs/deployment/_category_.yaml
================================================
label: 'Deployment'
position: 7
collapsed: true


================================================
FILE: docs/deployment/cluster-sizing.md
================================================
---
title: Cluster sizing
sidebar_position: 3
---

In this guide, we discuss how to size your Quickwit cluster and nodes. As shown
in the [architecture section](../overview/architecture.md), a Quickwit cluster
has 5 main components: the Indexers, Searchers, Control Plane,
Metastore and, Janitor. Each component has different resource requirements
and can be scaled independently. We will also discuss how to size the metastore
PostgreSQL database.

:::note

This guide provides general guidelines. The actual resource requirements depend
strongly on your workload. We recommend monitoring the resource usage and
adjusting the cluster size accordingly.

:::

## Quickwit services

### Indexers

Here are some high-level guidelines to size your Indexer nodes:
- Quickwit can index at around **7.5MB per second per core**
- For the general use case, configure 4GB of RAM per core
  - Workloads with a large number of indexes or data sources consume more RAM
    <!-- TODO: revisit this when cooperative indexing becomes the default -->
  - Don't use instances with less than 8GB of RAM
    <!-- Note: 2GB for the heap size (per pipeline) and 2GB for ingest queues -->
- Mount the data directory to a volume of at least 120GB to store:
  - the [split cache](../configuration/node-config.md#Indexer-configuration) (default 100GB)
  - the [ingest queue](../configuration/node-config.md#ingest-api-configuration) (default 4GiB)
  - a little extra for the indexes that are being built (first generation and merges)
- Local SSDs are preferred for deploying Indexers since they generally provide the best performance per dollar and save some network bandwidth. However, remote disks can also if they provide roughly 20 MB/s of write throughput per core when using the ingest API or 10 MB/s when relying on other sources. For Amazon EBS volumes, this is equivalent to 320 or 160 IOPS per core (assuming 64 KB IOPS).

:::note

To utilize all CPUs on Indexer nodes that have more than 4 cores, your indexing
workload needs to be broken down into multiple indexing pipelines. This can be
achieved by creating multiple indexes or by using a [partitioned data
source](../configuration/source-config.md#number-of-pipelines) such as
[Kafka](../configuration/source-config.md#kafka-source) or the [ingest API
(v2)](../ingest-data/ingest-api.md#ingest-api-versions).

:::


### Searchers

Search performance is highly dependent on the workload. For example, term queries
are usually cheaper than aggregations. A good starting point for dimensioning
Searcher nodes:
- Configure 8GB of RAM per core when using a high latency / low bandwidth object
  store like AWS S3
- Decrease the RAM / CPU ratio (e.g 4GB/core) when using a faster object store
- Provision more RAM if you expect many concurrent aggregation requests. By
  default, each request can use up to 500MB of RAM on each node.
- Avoid instances with less than 4GB of RAM
<!-- 1GB fast_field_cache_capacity + 0.5GB split_footer_cache_capacity + 0.5GB/req aggregation_memory_limit -->
- Searcher nodes don't use disk unless the [split
  cache](../configuration/node-config.md#Searcher-split-cache-configuration) is
  explicitly enabled

One strength of Quickwit is that its Searchers are stateless, which makes it
easy to scale them up and down based on the workload. Scale the number of
Searcher nodes based on:
- the number of concurrent requests expected
- aggregations that run on large amounts of data (without
  [time](../overview/concepts/querying.md#time-sharding) or
  [tag](../overview/concepts/querying.md#tag-pruning) pruning)

### Other services

The Control Plane, Metastore and, Janitor are lightweight components.

- **Control Plane**: A cluster must have only one Control Plane. It needs a
  single core and 2GB of RAM. It doesn't require any disk.

- **Metastore**: A cluster must have exactly one Metastore when using the
  [file-backed metastore](../configuration/metastore-config.md#file-backed-metastore).
  When using the [PostgreSQL metastore](#postgres-metastore-backend), you can
  run one or several Metastore pods for high availability (HA). The Metastore
  requires a single core and 2GB of RAM. For clusters handling hundreds of
  indexes, you may increase the size to 2 cores and 4GB of RAM. It doesn't
  write to disk (when using PostgreSQL, the database handles persistence).

- **Janitor**: A cluster must have only one Janitor. In general, it requires 1
  core and 2GB of RAM and doesn't use the disk. If you use the [delete
  API](https://quickwit.io/docs/overview/concepts/deletes), the Janitor should
  be dimensioned like an indexer.

### Single node deployments

For experimentations and small scale POCs, it is possible to deploy all the
services on a single node (see
[tutorial](../get-started/tutorials/tutorial-hdfs-logs.md)). We recommend at
least 2 cores and 8GB of RAM.

## Postgres Metastore backend

For most use cases, a PostgreSQL instance with 4GB of RAM and 1 core is
sufficient:
- with the AWS RDS managed service, use the t4g.medium instance type. Enable
  multi-AZ with one standby for high availability.


================================================
FILE: docs/deployment/deployment-modes.md
================================================
---
title: Deployment modes
sidebar_position: 1
---

As an application, Quickwit is built out of multiple services and is designed to run as a horizontally-scalable distributed system. Currently, Quickwit supports four core services (indexer, searcher, metastore, control plane) and one maintenance service (janitor):

- Indexers ingest documents from data sources and build indexes.
- Searchers execute search queries submitted via the REST API.
- The Metastore stores index metadata in a PostgreSQL-compatible database or cloud-hosted file.
- The Control Plane distributes and coordinates indexing workloads on indexers.
- The Janitor performs periodic maintenance tasks.

Quickwit is distributed as a single binary or Docker image. The behavior of that executable file or image is controlled with the `--service` option of the `quickwit run` command and defines which services run on a node. You may start one service, multiple, or all of them. Nodes always serve the REST API and the search and admin UI. In addition, they will redirect requests that they cannot satisfy to the appropriate nodes in the cluster. Finally, each service can run on one or several nodes depending on the expected load on the system.

## Standalone mode (single node)

This deployment mode is the simplest way to get started with Quickwit. Launch all the services with the `quickwit run` [command](../reference/cli.md), and you are now ready to ingest data and search your indexes.

## Cluster mode (multi-node)

You can deploy Quickwit on multiple nodes. We provide a [Helm chart](./kubernetes/helm.md) to help you deploy Quickwit on Kubernetes. In cluster mode, you must store your index data on a shared storage backend such as Amazon S3 or MinIO.

## One indexer, multiple searchers

One indexer running on a small instance (4 vCPUs) can ingest documents at a throughput of 20-40MB/s (1-3+ TB/day). A deployment with one indexer is thus an excellent place to start. However, you may need several searchers to handle large datasets or serve many resource-intensive requests such as aggregation queries.

## Multiple indexers, multiple searchers

Indexing a single [data source](../configuration/source-config.md) on several indexers is only possible with a [Kafka source](../configuration/source-config.md#kafka-source).
Support for native distributed indexing was added with Quickwit 0.9.

## File-backed metastore limitations

The file-backed metastore is a good fit for standalone and small deployments. However, it does not support multiple instances running at the same time. As long as you can guarantee that no more than one metastore is running at any given time, the file-backed metastore is safe to use. For heavy workloads, we recommend using a PostgreSQL metastore.


================================================
FILE: docs/deployment/kubernetes/_category_.yaml
================================================
label: 'Kubernetes'
position: 2
collapsed: true


================================================
FILE: docs/deployment/kubernetes/gke.md
================================================
---
title: Install Quickwit on Google GKE
sidebar_label: Google GKE
sidebar_position: 2
---

This guide will help you set up a Quickwit cluster with the correct GCS permissions.


## Set up

Before installing Quickwit with Helm, let's create a namespace for our playground.

```
export NS=quickwit-tutorial
kubectl create ns ${NS}
```

Quickwit stores its index on an object storage. We will use GCS, which is natively supported since the 0.7 version (for versions < 0.7, you should use an S3 interoperability key).

The following steps create a GCP and a GKE service account and bind them together.
We are going to create them, set the right permissions and bind them.

```bash
export PROJECT_ID={your-project-id}
export GCP_SERVICE_ACCOUNT=quickwit-tutorial
export GKE_SERVICE_ACCOUNT=quickwit-sa
export BUCKET=your-bucket

kubectl create serviceaccount ${GKE_SERVICE_ACCOUNT} -n ${NS}

gcloud iam service-accounts create ${GCP_SERVICE_ACCOUNT} --project=${PROJECT_ID}

gcloud storage buckets add-iam-policy-binding gs://${BUCKET} \
--member "serviceAccount:${GCP_SERVICE_ACCOUNT}@${PROJECT_ID}.iam.gserviceaccount.com" \
--role "roles/storage.objectAdmin"

# Notice that the member is related to a namespace.
gcloud iam service-accounts add-iam-policy-binding ${GCP_SERVICE_ACCOUNT}@${PROJECT_ID}.iam.gserviceaccount.com \
--role roles/iam.workloadIdentityUser \
--member "serviceAccount:${PROJECT_ID}.svc.id.goog[${NS}/${GKE_SERVICE_ACCOUNT}]"

# Now we can annotate our service account!
kubectl annotate serviceaccount ${GKE_SERVICE_ACCOUNT} \
iam.gke.io/gcp-service-account=${GCP_SERVICE_ACCOUNT}@${PROJECT_ID}.iam.gserviceaccount.com \
-n ${NS}
```

## Install Quickwit using Helm

We are now ready to install Quickwit on GKE. If you'd like to know more about Helm, consult our [comprehensive guide](./helm.md) for installing Quickwit on Kubernetes.

```bash
helm repo add quickwit https://helm.quickwit.io
helm repo update quickwit
```

Let's set Quickwit `values.yaml`:

```yaml
# We use the edge version here as we recently fixed
# a bug which prevents the metastore from running on GCS.
image:
    repository: quickwit/quickwit
    pullPolicy: Always
    tag: edge

serviceAccount:
  create: false
  name: quickwit-sa

config:
  default_index_root_uri: gs://{BUCKET}/qw-indexes
  metastore_uri: gs://{BUCKET}/qw-indexes

```

We're ready to deploy:

```bash
helm install <deployment name> quickwit/quickwit -f values.yaml
```

## Check that Quickwit is running

It should take a few seconds for the cluster to start. During the startup process, individual pods might restart themselves several times.

To access the UI, you can run the following command and then open your browser at [http://localhost:7280](http://localhost:7280):

```
kubectl port-forward svc/release-name-quickwit-searcher 7280:7280
```


## Uninstall the deployment

Run the following Helm command to uninstall the deployment

```bash
helm uninstall <deployment name>
```

And don't forget to clean your bucket, Quickwit should have stored 3 files in `gs://{BUCKET}/qw-indexes`.


================================================
FILE: docs/deployment/kubernetes/glasskube.md
================================================
---
title: Install Quickwit with Glasskube
sidebar_label: Glasskube
sidebar_position: 3
---

[Glasskube](https://glasskube.dev) is a package manager for Kubernetes that empowers you to effortlessly install, upgrade, configure, and manage your Kubernetes cluster packages, all while streamlining repetitive and cumbersome maintenance tasks.

## Requirements

To deploy Quickwit on Kubernetes, you will need:

- kubectl, compatible with your cluster (+/- 1 minor release from your cluster) (`kubectl version`)
- A Kubernetes cluster

1. Install `kubectl` and `glasskube` cli.

To install `kubectl` locally, you can refer to [this documentation](https://kubernetes.io/docs/tasks/tools/#install-kubectl).

To install `glasskube` cli locally, you can refer to [this documentation](https://glasskube.dev/docs/getting-started/install) and choose the right installation options according to your operating system.

For example, let's assume that you're on MacOS using homebrew and kind, this is what you'll have to do:

```shell
brew install glasskube/tap/glasskube # install the glasskube cli
kind create cluster # create a kind Kubernetes cluster
```

2. Install glasskube in your Kubernetes cluster:

```shell
glasskube bootstrap
```

3. Start and access to the Glasskube's GUI:

```shell
glasskube serve
```

You'll be able to access to the GUI of Glasskube here: http://localhost:8580

## Install Quickwit using Glasskube

`glasskube` will install Quickwit in the `quickwit` namespace. You can perform the Quickwit installation directly with the GUI:

![screenshot-glasskube-ui.png](../../assets/images/screenshot-glasskube-ui.png)

Or use the CLI instead:

```shell
glasskube install quickwit
```

In both, you'll have to set the value of those parameters:

* `defaultIndexRootUri`: the default index URI is a S3 compliant bucket which usually looks like this: `s3://<bucket-name>/<optional-base-path>`
* `metastoreUri`: if you're not using PostgreSQL and object storage, you can pick the same bucket and value you used for the `defaultIndexRootUri` parameter
* `s3Endpoint`: the http(s) URL of your object storage service which should looks like `https://s3.{region}.{your object storage domain}`
* `s3Flavor`: which can be one of the following: `do`, `garage`, `gcp`, `minio`. You can leave it empty if your object storage is compliant with AWS S3
* `s3Region`
* `s3AccessKeyId`
* `s3SecretAccessKey`

## Uninstall quickwit

```shell
glasskube uninstall quickwit
```


================================================
FILE: docs/deployment/kubernetes/helm.md
================================================
---
title: Install Quickwit with Helm
sidebar_label: Helm
sidebar_position: 1
---

[Helm](https://helm.sh) is a package manager for Kubernetes that allows you to configure, install, and upgrade containerized applications in a Kubernetes cluster in a version-controlled and reproducible way.

You can install Quickwit on Kubernetes with the official Quickwit Helm chart. If you encounter any problem with the chart, please, open an issue in our [GitHub repository](https://github.com/quickwit-oss/helm-charts).

## Requirements

To deploy Quickwit on Kubernetes, you will need:

- kubectl, compatible with your cluster (+/- 1 minor release from your cluster) (`kubectl version`)
- Helm v3 (`helm version`)
- A Kubernetes cluster

1. Install `kubectl` and `helm`

To install `kubectl` and `helm` locally, follow the [Kubernetes](https://kubernetes.io/docs/tasks/tools/#install-kubectl) and [Helm](https://helm.sh/docs/intro/install/) documentation pages.

2. Add the Quickwit Helm chart repository to Helm

```bash
helm repo add quickwit https://helm.quickwit.io
```

3. Update the repository

```bash
helm repo update quickwit
```

4. Create and customize your configuration file `values.yaml`

You can inspect the default configuration values of the chart using the following command:

```bash
helm show values quickwit/quickwit
```

Here is an example of a minimal configuration with a file-backed metastore:

```yaml
environment:
  QW_METASTORE_URI: s3://<my-bucket>/quickwit-indexes

config:
  default_index_root_uri: s3://<my-bucket>/quickwit-indexes
  storage:
    s3:
      region: eu-east-1
      # We recommend using IAM roles and permissions to access Amazon S3 resources,
      # but you can specify a pair of access and secret keys if necessary.
      access_key_id: <my access key>
      secret_access_key: <my secret key>
```

5. Deploy Quickwit

```bash
helm install <deployment name> quickwit/quickwit -f values.yaml
```

6. Check that Quickwit is running

It might take some time for the cluster to start. During the startup process individual pods might restart themselves several times. The command on the previous step will print the instructions on how to connect to the cluster. This endpoint can be used to access the quickwit search UI, as well execute standard API commands against.

## Using PostgreSQL as a metadata store

The file-backed metastore is mainly useful for testing purposes. Though a file-backed metastore might be easier to setup, we strongly encourage you to use a PostgreSQL metastore in production. For the quickwit installation to work with PostgreSQL metadata you need to provide connection PostgreSQL information instead of metastore URI:

```yaml
config:
  default_index_root_uri: s3://<my-bucket>/quickwit-indexes

  postgres:
    host: <postgres_host>
    port: 5432
    database: quickwit-metastore
    username: quickwit
    password: <my strong password> # This password will be stored as a Kubernetes Secret

  storage: {}
    s3:
      region: eu-east-1
      # We recommend using IAM roles and permissions to access Amazon S3 resources,
      # but you can specify a pair of access and secret keys if necessary.
      access_key_id: <my access key>
      secret_access_key: <my secret key>
```

## Uninstall the deployment

Run the following Helm command to uninstall the deployment

```bash
helm uninstall <deployment name>
```


================================================
FILE: docs/distributed-tracing/_category_.yaml
================================================
label: 'Distributed tracing'
position: 6
collapsed: true


================================================
FILE: docs/distributed-tracing/otel-service.md
================================================
---
title: OTEL service
sidebar_position: 5
---

Quickwit natively supports the [OpenTelemetry Protocol (OTLP)](https://opentelemetry.io/docs/reference/specification/protocol/otlp/) and provides a gRPC endpoint to receive spans from an OpenTelemetry collector, or from your application directly, via an exporter. This endpoint is enabled by default.

When enabled, Quickwit will start the gRPC service ready to receive spans from an OpenTelemetry collector. The spans are indexed in the `otel-trace-v0_7` index by default, and this index will be automatically created if not present. The index doc mapping is described in the next [section](#trace-and-span-data-model).

If for any reason, you want to disable this endpoint, you can:
- Set the `QW_ENABLE_OTLP_ENDPOINT` environment variable to `false` when starting Quickwit.
- Or [configure the node config](/docs/configuration/node-config.md) by setting the indexer setting `enable_otlp_endpoint` to `false`.

```yaml title=node-config.yaml
# ... Indexer configuration ...
indexer:
    enable_otlp_endpoint: false
```

## Sending spans in your own index

You can send spans in the index of your choice by setting the header `qw-otel-traces-index` of your gRPC request to the targeted index ID.


## Trace and span data model

A trace is a collection of spans that represents a single request. A span represents a single operation within a trace. OpenTelemetry collectors send spans, Quickwit then indexes them in the `otel-trace-v0_7` index by default that maps OpenTelemetry span model to an indexed document in Quickwit.

The span model is derived from the [OpenTelemetry specification](https://opentelemetry.io/docs/reference/specification/trace/api/).

Below is the doc mapping of the `otel-trace-v0_7` index:

```yaml

version: 0.7

index_id: otel-trace-v0_7

doc_mapping:
  mode: strict
  field_mappings:
    - name: trace_id
      type: bytes
      input_format: hex
      output_format: hex
      fast: true
    - name: trace_state
      type: text
      indexed: false
    - name: service_name
      type: text
      tokenizer: raw
      fast: true
    - name: resource_attributes
      type: json
      tokenizer: raw
    - name: resource_dropped_attributes_count
      type: u64
      indexed: false
    - name: scope_name
      type: text
      indexed: false
    - name: scope_version
      type: text
      indexed: false
    - name: scope_attributes
      type: json
      indexed: false
    - name: scope_dropped_attributes_count
      type: u64
      indexed: false
    - name: span_id
      type: bytes
      input_format: hex
      output_format: hex
    - name: span_kind
      type: u64
    - name: span_name
      type: text
      tokenizer: raw
      fast: true
    - name: span_fingerprint
      type: text
      tokenizer: raw
    - name: span_start_timestamp_nanos
      type: datetime
      input_formats: [unix_timestamp]
      output_format: unix_timestamp_nanos
      indexed: false
      fast: true
      fast_precision: milliseconds
    - name: span_end_timestamp_nanos
      type: datetime
      input_formats: [unix_timestamp]
      output_format: unix_timestamp_nanos
      indexed: false
      fast: false
    - name: span_duration_millis
      type: u64
      indexed: false
      fast: true
    - name: span_attributes
      type: json
      tokenizer: raw
      fast: true
    - name: span_dropped_attributes_count
      type: u64
      indexed: false
    - name: span_dropped_events_count
      type: u64
      indexed: false
    - name: span_dropped_links_count
      type: u64
      indexed: false
    - name: span_status
      type: json
      indexed: true
    - name: parent_span_id
      type: bytes
      input_format: hex
      output_format: hex
      indexed: false
    - name: events
      type: array<json>
      tokenizer: raw
      fast: true
    - name: event_names
      type: array<text>
      tokenizer: default
      record: position
      stored: false
    - name: links
      type: array<json>
      tokenizer: raw

  timestamp_field: span_start_timestamp_nanos

indexing_settings:
  commit_timeout_secs: 10

search_settings:
  default_search_fields: []
```

## Known limitations

There are a few limitations on the current distributed tracing setup in Quickwit 0.9:
- The OTLP gRPC service does not provide High-Durability. This will be fixed in 0.10.
- OTLP HTTP is only available with the Binary Protobuf Encoding. OTLP HTTP with JSON encoding is not planned yet, but this can be easily fixed in the next version. Please open an issue if you need this feature.

If you are interested in new features or discovered other limitations, please open an issue on [GitHub](https://github.com/quickwit-oss/quickwit).


================================================
FILE: docs/distributed-tracing/overview.md
================================================
---
title: Distributed Tracing with Quickwit
sidebar_label: Overview
sidebar_position: 1
---

Distributed Tracing is a process that tracks your application requests flowing through your different services: frontend, backend, databases and more. It's a powerful tool to understand how your application works and to debug performance issues.

Quickwit is a cloud-native engine to index and search unstructured data which makes it a perfect fit for a traces backend.

Moreover, Quickwit supports natively the [OpenTelemetry gRPC and HTTP (protobuf only) protocol](https://opentelemetry.io/docs/reference/specification/protocol/otlp/) and the [Jaeger gRPC API (SpanReader only)](https://www.jaegertracing.io/). **This means that you can use Quickwit to store your traces and to query them with Jaeger UI**.

![Quickwit Distributed Tracing](../assets/images/distributed-tracing-overview-light.png#gh-light-mode-only)![Quickwit Distributed Tracing](../assets/images/distributed-tracing-overview-dark.png#gh-dark-mode-only)

## Plug Quickwit to Jaeger

Quickwit implements a gRPC service compatible with Jaeger UI. All you need is to configure Jaeger with a (span) storage type `grpc`[^1] and you will be able to visualize your traces in Jaeger that are stored in any Quickwit's indexes matching the pattern `otel-traces-v0_*`.

We made a tutorial on [how to plug Quickwit to Jaeger UI](plug-quickwit-to-jaeger.md) that will guide you through the process.

[^1]: It was `grpc-plugin` until the version 1.58 of Jaeger.

## Send traces to Quickwit

- [Using OTEL collector](send-traces/using-otel-collector.md)
- [Using python OTEL SDK](send-traces/using-otel-sdk-python.md)


================================================
FILE: docs/distributed-tracing/plug-quickwit-to-jaeger.md
================================================
---
title: Plug Quickwit to Jaeger
description: A simple tutorial to use Jaeger with Quickwit backend.
icon_url: /img/tutorials/quickwit-logo.png
tags: [traces, ingestion]
sidebar_position: 2
---

In this tutorial, we will show you how Quickwit can eat its own dog food: we will send Quickwit traces into Jaeger and analyze them, which will generate new traces to analyze :)

## Start Quickwit

First, start a [Quickwit instance](../get-started/installation.md) with the OTLP service enabled:

```bash
QW_ENABLE_OPENTELEMETRY_OTLP_EXPORTER=true \
OTEL_EXPORTER_OTLP_ENDPOINT=http://127.0.0.1:7281 \
./quickwit run
```

We also set `QW_ENABLE_OPENTELEMETRY_OTLP_EXPORTER` and `OTEL_EXPORTER_OTLP_ENDPOINT` environment variables so that Quickwit will send its own traces to itself.

## Start Jaeger UI

Let's start a Jaeger UI instance with docker. Here we need to inform jaeger that it should use quickwit as its backend.

Due to some idiosyncrasy associated with networking with containers, we will have to use a different approach on MacOS & Windows on one side, and Linux on the other side.

### MacOS & Windows

We can rely on `host.docker.internal` to get the docker bridge ip address, pointing to our quickwit server.

```bash
docker run --rm --name jaeger-qw \
    -e SPAN_STORAGE_TYPE=grpc \
    -e GRPC_STORAGE_SERVER=host.docker.internal:7281 \
    -p 16686:16686 \
    jaegertracing/jaeger-query:1.60
```

### Linux

By default, Quickwit is listening to `127.0.0.1`, and will not respond to request directed
to the docker bridge (`172.17.0.1`). There are different ways to solve this problem.
The easiest is probably to use host network mode.

```bash
docker run --rm --name jaeger-qw  --network=host \
    -e SPAN_STORAGE_TYPE=grpc \
    -e GRPC_STORAGE_SERVER=127.0.0.1:7281 \
    -p 16686:16686 \
    jaegertracing/jaeger-query:1.60

```

## Search traces in Jaeger UI

As Quickwit is indexing its own traces, you should be able to see them in Jaeger UI after 5 seconds (the time it takes for Quickwit to do its first commit).

Open the Jaeger UI at [http://localhost:16686](http://localhost:16686) and search for traces! By executing search queries, you will then see Quickwit's own traces:

- `find_traces` is the endpoint called when you search for traces in Jaeger UI, it then calls `find_trace_ids`.
- `find_traces_ids` is doing an aggregation query on spans to get unique trace IDs.
- `root_search` is Quickwit search entry point. It calls search on each split (piece of index) in parallel, in a distributed manner, or just locally if there is only one node.
- `leaf_search` is the search entry point on each node. It calls `leaf_search_single_split` on each split.
- `leaf_search_single_split` is the search entry point on a split. It will call consecutively `warmup` and `tantivy_search`.
- `warmup` is the warmup phase of the search. It prefetches data needed to execute the search query.
- `tantivy_search` is the search phase of the search. It is executing the search query at horse speeds with the [Tantivy](https://github.com/quickwit-oss/tantivy).

![Quickwit trace in Jaeger UI](../assets/images/jaeger-ui-quickwit-trace-analysis.png)

## Next steps

You are now ready for the next step: instrumenting your application and sending its traces to Quickwit. You can do it:
- In [python](send-traces/using-otel-sdk-python.md).
- And in any other language that OpenTelemetry supports.


================================================
FILE: docs/distributed-tracing/send-traces/_category_.yaml
================================================
label: 'Sending traces'
position: 3
collapsed: false


================================================
FILE: docs/distributed-tracing/send-traces/using-otel-collector.md
================================================
---
title: Using OTEL Collector
description: Using OTEL Collector
tags: [otel, collector, traces]
sidebar_position: 1
---

import Tabs from '@theme/Tabs';
import TabItem from '@theme/TabItem';

If you already have your own OpenTelemetry Collector and want to export your traces to Quickwit, you need a new OLTP gRPC exporter in your config.yaml:

<Tabs>

<TabItem value="macOS_windows" label="macOS/Windows">

```yaml title="otel-collector-config.yaml"
receivers:
  otlp:
    protocols:
      grpc:
      http:

processors:
  batch:

exporters:
  otlp/quickwit:
    endpoint: host.docker.internal:7281
    tls:
      insecure: true
    # By default, traces are sent to the otel-traces-v0_7.
    # You can customize the index ID By setting this header.
    # headers:
    #   qw-otel-traces-index: otel-traces-v0_7

service:
  pipelines:
    traces:
      receivers: [otlp]
      processors: [batch]
      exporters: [otlp/quickwit]
```

</TabItem>

<TabItem value="linux" label="Linux">

```yaml title="otel-collector-config.yaml"
receivers:
  otlp:
    protocols:
      grpc:
      http:

processors:
  batch:

exporters:
  otlp/quickwit:
    endpoint: 127.0.0.1:7281
    tls:
      insecure: true

service:
  pipelines:
    traces:
      receivers: [otlp]
      processors: [batch]
      exporters: [otlp/quickwit]
```

</TabItem>

</Tabs>


## Test your OTEL configuration

1. [Install](../../get-started/installation.md) and start a Quickwit server:
   
```bash
./quickwit run
```

2. Start a collector with the previous config:

<Tabs>

<TabItem value="macOS_windows" label="macOS/Windows">

```bash
docker run -v ${PWD}/otel-collector-config.yaml:/etc/otelcol/config.yaml -p 4317:4317 -p 4318:4318 -p 7281:7281 otel/opentelemetry-collector
```

</TabItem>

<TabItem value="linux" label="Linux">

```bash
docker run -v ${PWD}/otel-collector-config.yaml:/etc/otelcol/config.yaml --network=host -p 4317:4317 -p 4318:4318 -p 7281:7281 otel/opentelemetry-collector
```

</TabItem>

</Tabs>

3. Send a trace to your collector with cURL:

```bash
curl -XPOST "http://localhost:4318/v1/traces" -H "Content-Type: application/json" \
--data-binary @- << EOF
{
 "resource_spans": [
   {
     "resource": {
       "attributes": [
         {
           "key": "service.name",
           "value": {
             "string_value": "test-with-curl"
           }
         }
       ]
     },
     "scope_spans": [
       {
         "scope": {
           "name": "manual-test"
         },
         "spans": [
           {
             "time_unix_nano": "1678974011000000000",
             "observed_time_unix_nano": "1678974011000000000",
             "start_time_unix_nano": "1678974011000000000",
             "end_time_unix_nano": "1678974021000000000",
             "trace_id": "3c191d03fa8be0653c191d03fa8be065",
             "span_id": "3c191d03fa8be065",
             "kind": 2,
             "events": [],
             "status": {
               "code": 1
             }
           }
         ]
       }
     ]
   }
 ]
}
EOF
```

You should see a log on the Quickwit server similar to the following:

```bash
2023-03-16T13:44:09.369Z  INFO quickwit_indexing::actors::indexer: new-split split_id="01GVNAKT5TQW0T2QGA245XCMTJ" partition_id=6444214793425557444
```

This means that Quickwit has received the trace and created a new split. Wait for the split to be published before searching for traces.

## Next step

Follow our tutorial on [how to send traces from your python app](using-otel-sdk-python.md).


================================================
FILE: docs/distributed-tracing/send-traces/using-otel-sdk-python.md
================================================
---
title: Using OTEL SDK - Python
description: A simple tutorial to send traces to Quickwit from a Python Flask app.
icon_url: /img/tutorials/python-logo.png
tags: [python, traces, ingestion]
sidebar_position: 2
---

import Tabs from '@theme/Tabs';
import TabItem from '@theme/TabItem';

In this tutorial, we will show you how to instrument a Python [Flask](https://flask.palletsprojects.com/en/2.2.x/) app with OpenTelemetry and send traces to Quickwit. This tutorial was inspired by the [Python OpenTelemetry](https://opentelemetry.io/docs/instrumentation/python/getting-started/) documentation, huge thanks to the OpenTelemetry team!

## Prerequisites

- Python3 installed
- Docker installed

## Start a Quickwit instance

[Install Quickwit](/docs/get-started/installation.md) and start a Quickwit instance:

```bash
./quickwit run
```

## Start Jaeger UI

Let's start a Jaeger UI instance with docker. Here we need to inform jaeger that it should use quickwit as its backend.

Due to some idiosyncrasy associated with networking with containers, we will have to use a different approach on MacOS & Windows on one side, and Linux on the other side.

### MacOS & Windows

We can rely on `host.docker.internal` to get the docker bridge ip address, pointing to our quickwit server.

```bash
docker run --rm --name jaeger-qw \
    -e SPAN_STORAGE_TYPE=grpc \
    -e GRPC_STORAGE_SERVER=host.docker.internal:7281 \
    -p 16686:16686 \
    jaegertracing/jaeger-query:1.60
```

### Linux

By default, quickwit is listening to `127.0.0.1`, and will not respond to request directed
to the docker bridge (`172.17.0.1`). There are different ways to solve this problem.
The easiest is probably to use host network mode.

```bash
docker run --rm --name jaeger-qw --network=host \
    -e SPAN_STORAGE_TYPE=grpc \
    -e GRPC_STORAGE_SERVER=127.0.0.1:7281 \
    -p 16686:16686 \
    jaegertracing/jaeger-query:1.60
```

## Run a simple Flask app

We will start a flask application that is doing three things on each HTTP call `http://localhost:5000/process-ip`:

- Fetching an IP address from [https://httpbin.org/ip](https://httpbin.org/ip).
- Parsing it and fake processing it with a random sleep.
- Displaying it with a random sleep.


Let's first install the dependencies:

```bash
pip install flask
pip install opentelemetry-distro
pip install opentelemetry-exporter-otlp
```

The opentelemetry-distro package installs the API, SDK, and the opentelemetry-bootstrap and opentelemetry-instrument tools that you’ll use.

Here is the code of our app:

```python title=my_app.py
import random
import time
import requests

from flask import Flask

app = Flask(__name__)

@app.route("/process-ip")
def process_ip():
    body = fetch()
    ip = parse(body)
    display(ip)
    return ip

def fetch():
    resp = requests.get('https://httpbin.org/ip')
    body = resp.json()
    return body

def parse(body):
    # Sleep for a random amount of time to make the span more visible.
    secs = random.randint(1, 100) / 1000
    time.sleep(secs)

    return body["origin"]

def display(ip):
    # Sleep for a random amount of time to make the span more visible.
    secs = random.randint(1, 100) / 1000
    time.sleep(secs)

    message = f"Your IP address is `{ip}`."
    print(message)

if __name__ == "__main__":
    app.run(port=5000)
```

## Auto-instrumentation

OpenTelemetry provides a tool called `opentelemetry-bootstrap` that automatically instruments your Python application.

```bash
opentelemetry-bootstrap -a install
```

And that's it, we are now ready to run the app:

```bash
# We don't need metrics.
OTEL_METRICS_EXPORTER=none \
OTEL_TRACES_EXPORTER=console \
OTEL_SERVICE_NAME=my_app \
python my_app.py
```

By hitting [http://localhost:5000/process-ip](http://localhost:5000/process-ip) you should see the corresponding trace in the console.

This is nice but it would be even better if we could have the time passed in each steps, get the status code of the HTTP request, and the content type of the response. Let's do that by manually instrumentating our app!

## Manual instrumentation

```python title=my_instrumented_app.py
import random
import time
import requests

from flask import Flask

from opentelemetry import trace

# Creates a tracer from the global tracer provider
tracer = trace.get_tracer(__name__)

app = Flask(__name__)

@app.route("/process-ip")
@tracer.start_as_current_span("process_ip")
def process_ip():
    body = fetch()
    ip = parse(body)
    display(ip)
    return ip

@tracer.start_as_current_span("fetch")
def fetch():
    resp = requests.get('https://httpbin.org/ip')
    body = resp.json()

    headers = resp.headers
    current_span = trace.get_current_span()
    current_span.set_attribute("status_code", resp.status_code)
    current_span.set_attribute("content_type", headers["Content-Type"])
    current_span.set_attribute("content_length", headers["Content-Length"])

    return body

@tracer.start_as_current_span("parse")
def parse(body):
    # Sleep for a random amount of time to make the span more visible.
    secs = random.randint(1, 100) / 1000
    time.sleep(secs)

    return body["origin"]

@tracer.start_as_current_span("display")
def display(ip):
    # Sleep for a random amount of time to make the span more visible.
    secs = random.randint(1, 100) / 1000
    time.sleep(secs)

    message = f"Your IP address is `{ip}`."
    print(message)

    current_span = trace.get_current_span()
    current_span.add_event(message)

if __name__ == "__main__":
    app.run(port=5000)

```

We can now start the new instrumented app:

```bash
OTEL_METRICS_EXPORTER=none \
OTEL_TRACES_EXPORTER=console \
OTEL_SERVICE_NAME=my_app \
opentelemetry-instrument python my_instrumented_app.py
```

If you hit again [http://localhost:5000/process-ip](http://localhost:5000/process-ip), you should see new spans with name `fetch`, `parse`, and `display` and with the corresponding custom attributes!


## Sending traces to Quickwit

To send traces to Quickwit, we need to use the OTLP exporter. This is a simple as this:

```bash
OTEL_METRICS_EXPORTER=none \ # We don't need metrics
OTEL_SERVICE_NAME=my_app \
OTEL_EXPORTER_OTLP_TRACES_ENDPOINT=http://localhost:7281 \
opentelemetry-instrument python my_instrumented_app.py
```

Now, if you hit [http://localhost:5000/process-ip](http://localhost:5000/process-ip), traces will be send to Quickwit, you just need to wait around 30 seconds before they are indexed. It's time for a coffee break!

30 seconds has passed, let's query the traces from our service:

```bash
curl -XPOST http://localhost:7280/api/v1/otel-trace-v0/search -H 'Content-Type: application/json' -d '{
    "query": "resource_attributes.service.name:my_app"
}'
```

And then open the Jaeger UI [localhost:16686](http://localhost:16686/) and play with it, you have now a Jaeger UI powered by a Quickwit storage backend!

![Flask trace analysis in Jaeger UI](../../assets/images/jaeger-ui-python-app-trace-analysis.png)

![Flask traces in Jaeger UI](../../assets/images/jaeger-ui-python-app-traces.png)

## Sending traces to your OpenTelemetry collector

Start a collector as described in the [OpenTelemetry collector tutorial](using-otel-collector.md) and execute the following command:

```bash
OTEL_METRICS_EXPORTER=none \ # We don't need metrics
OTEL_SERVICE_NAME=my_app \
opentelemetry-instrument python instrumented_app.py
```

Traces will be sent to your collector, and then to Quickwit.


## Wrap up

In this tutorial, we have seen how to instrument a Python application with OpenTelemetry and send traces to Quickwit. We have also seen how to use the Jaeger UI to analyze traces.

All the code snippets in our [tutorial repository](https://github.com/quickwit-oss/tutorials).

Please let us know what you think about this tutorial, and if you have any questions, feel free to reach out to us on [Discord](https://discord.gg/7eNYX4d) or [Twitter](https://twitter.com/quickwit_inc).


================================================
FILE: docs/get-started/_category_.yaml
================================================
label: 'Get started'
position: 2
collapsed: false


================================================
FILE: docs/get-started/installation.md
================================================
---
title: Installation
sidebar_position: 2
---

import Tabs from '@theme/Tabs';
import TabItem from '@theme/TabItem';
import { useDocsVersion } from '@docusaurus/theme-common/internal';

export const RenderIf = ({children, condition}) => (
    <>
        {condition && children}
    </>
);

Quickwit compiles to a single binary and we provide different methods to install it:

- Linux/MacOS binaries that you can [download manually](#download) or with the [install script](#install-script)
- [Docker image](#use-the-docker-image)
- [Helm chart](../deployment/kubernetes/helm.md)
- [Glasskube](../deployment/kubernetes/glasskube.md)

## Prerequisites

Quickwit is officially only supported for Linux. Freebsd and MacOS are not officially supported, but should work as well.

Quickwit supplies binaries for x86-64 and aarch64. No special instruction set is required, but on x86-64 SSE3 is recommended.
Support of aarch64 is currently experimental.

## Download

<RenderIf condition={useDocsVersion().version == 'current'}>

Version: nightly - 
License: [Apache 2.0](https://github.com/quickwit-oss/quickwit/blob/main/LICENSE) -
Downloads `.tar.gz`:
- [Linux ARM64](https://github.com/quickwit-oss/quickwit/releases/download/nightly/quickwit-nightly-aarch64-unknown-linux-gnu.tar.gz)
- [Linux x86_64](https://github.com/quickwit-oss/quickwit/releases/download/nightly/quickwit-nightly-x86_64-unknown-linux-gnu.tar.gz)
- [macOS aarch64](https://github.com/quickwit-oss/quickwit/releases/download/nightly/quickwit-nightly-aarch64-apple-darwin.tar.gz)
- [macOS x86_64](https://github.com/quickwit-oss/quickwit/releases/download/nightly/quickwit-nightly-x86_64-apple-darwin.tar.gz)

</RenderIf>

<!-- Bellow is the set of links to edit when a new version is released -->
<RenderIf condition={useDocsVersion().version != 'current'}>

version: 0.8.1 - [Release notes](https://github.com/quickwit-oss/quickwit/releases/tag/v0.8.1) - [Changelog](https://github.com/quickwit-oss/quickwit/blob/main/CHANGELOG.md)
License: [Apache 2.0](https://github.com/quickwit-oss/quickwit/blob/main/LICENSE)
Downloads `.tar.gz`:
- [Linux ARM64](https://github.com/quickwit-oss/quickwit/releases/download/v0.8.1/quickwit-v0.8.1-aarch64-unknown-linux-gnu.tar.gz)
- [Linux x86_64](https://github.com/quickwit-oss/quickwit/releases/download/v0.8.1/quickwit-v0.8.1-x86_64-unknown-linux-gnu.tar.gz)
- [macOS aarch64](https://github.com/quickwit-oss/quickwit/releases/download/v0.8.1/quickwit-v0.8.1-aarch64-apple-darwin.tar.gz)
- [macOS x86_64](https://github.com/quickwit-oss/quickwit/releases/download/v0.8.1/quickwit-v0.8.1-x86_64-apple-darwin.tar.gz)

</RenderIf>

Check out the available builds in greater detail on [GitHub](https://github.com/quickwit-oss/quickwit/releases)

### Note on external dependencies

Quickwit depends on the following external libraries to work correctly:
- `libssl`: the industry defacto cryptography library.
These libraries can be installed on your system using the native package manager.
You can install these dependencies using the following command:

<Tabs>

<TabItem value="ubuntu" label="Ubuntu">

```bash
apt-get -y update && apt-get -y install libssl
```

</TabItem>

<TabItem value="aws-linux" label="AWS Linux">

```bash
yum -y update && yum -y install openssl
```

</TabItem>

<TabItem value="arch-linux" label="Arch Linux">

```bash
pacman -S openssl
```

</TabItem>

</Tabs>

Additionally it requires a few more dependencies to compile it. These dependencies are not required on production system:
- `clang`: used to compile some dependencies.
- `protobuf-compiler`: used to compile protobuf definitions.
- `libssl-dev`: headers for libssl.
- `pkg-config`: used to locate libssl.
- `cmake`: used to build librdkafka, for kafka support.
These dependencies can be installed on your system using the native package manager.
You can install these dependencies using the following command:

<Tabs>

<TabItem value="ubuntu" label="Ubuntu">

```bash
apt install -y clang protobuf-compiler libssl-dev pkg-config cmake
```

</TabItem>

<TabItem value="aws-linux" label="AWS Linux">

```bash
yum -y update && yum -y install clang openssl-devel pkgconfig cmake3
# amazonlinux only has protobuf-compiler 2.5, we need something much more up to date.
wget https://github.com/protocolbuffers/protobuf/releases/download/v21.9/protoc-21.9-linux-x86_64.zip
sudo unzip protoc-21.9-linux-x86_64.zip -d /usr/local
# amazonlinux use cmake2 as cmake, we need cmake3
ln -s /usr/bin/cmake3 /usr/bin/cmake
```

</TabItem>

<TabItem value="arch-linux" label="Arch Linux">

```bash
pacman -S clang protobuf openssl pkg-config cmake make
```

</TabItem>

</Tabs>

## Install script

To easily install Quickwit on your machine, just run the command below from your preferred shell.
The script detects the architecture and then downloads the correct binary archive for the machine.

```bash
curl -L https://install.quickwit.io | sh
```

All this script does is download the correct binary archive for your machine and extracts it in the current working directory. This means you can download any desired archive from [github](https://github.com/quickwit-oss/quickwit/releases) that matches your OS architecture and manually extract it anywhere.

Once installed or extracted, all of Quickwit's installation files can be found in a directory named `quickwit-{version}` where `version` is the corresponding version of Quickwit. This directory has the following layout:

```bash
quickwit-{version}
    ├── config
    │   └── quickwit.yaml
    ├── LICENSE
    ├── quickwit
    └── qwdata
```

- `config/quickwit.yaml`: is the default configuration file.
- `LICENSE`: the license file.
- `quickwit`: the quickwit executable binary.
- `qwdata/`: the default data directory.


## Use the Docker image

If you use Docker, this might be one of the quickest way to get going.
The following command will pull the image from [Docker Hub](https://hub.docker.com/r/quickwit/quickwit)
and start a container ready to execute Quickwit commands.

```bash
docker run --rm quickwit/quickwit --version

# If you are using Apple silicon based macOS system you might need to specify the platform.
# You can also safely ignore jemalloc warnings.
docker run --rm --platform linux/amd64 quickwit/quickwit --version
```

To get the full gist of this, follow the [Quickstart guide](./quickstart.md).


================================================
FILE: docs/get-started/query-language-intro.md
================================================
---
title: Introduction to Quickwit's query language
sidebar_position: 3
---

Quickwit allows you to search on your indexed documents using a simple query language. Here's a quick overview.

## Clauses

The main concept of this language is a clause, which represents a simple condition that can be tested against documents. 

### Querying fields

A clause operates on fields of your document. It has the following syntax :
```
field:condition
```

For example, when searching documents where the field `app_name` contains the token `tantivy`, you would write the following clause:
```
app_name:tantivy
```

In many cases the field name can be omitted, quickwit will then use the `default_search_fields` configured for the index.

### Clauses Cheat Sheet

Quickwit support various types of clauses to express different kinds of conditions. Here's a quick overview of them:

| type | syntax | examples | description| `default_search_field`|
|-------------|--------|----------|------------|-----------------------|
| term | `field:token` | `app_name:tantivy` <br/> `process_id:1234` <br/> `word` | A term clause tests the existence of avalue in the field's tokens | yes |
| term prefix | `field:prefix*` | `app_name:tant*` <br/> `quick*` | A term clause tests the existence of a token starting with the provided value | yes |
| term set | `field:IN [token token ..]` |`severity:IN [error warn]` | A term set clause tests the existence of any of the provided value in the field's tokens| yes |
| phrase | `field:"sequence of tokens"` | `full_name:"john doe"` | A phrase clause tests the existence of the provided sequence of tokens | yes |
| phrase prefix | `field:"sequence of tokens"*` | `title:"how to m"*` | A phrase prefix clause tests the existence of a sequence of tokens, the last one used like in a prefix clause | yes |
| all | `*` | `*` | A match-all clause will match every document | no |
| exist | `field:*` | `error:*` | An exist clause tests the existence of any value for the field, it will match only if the field exists | no |
| range | `field:bounds` |`duration:[0 TO 1000}` <br/> `last_name:[banner TO miller]` | A term clause tests the existence of a token between the provided bounds | no |

## Queries

### Combining queries

Clauses can be combined using boolean operators `AND` and  `OR` to create more complex search expressions
An `AND` query will match only if conditions on both sides of the operator are met
```
type:rose AND color:red
```

An `OR` query will match if either or both conditions on each side of the operator are met
```
weekday:6 OR weekday:7
```

If no operator is provided, `AND` is implicitly assumed.

```
type:violet color:blue
```

### Grouping queries
You can build complex expressions by grouping clauses using parentheses.
```
(type:rose AND color:red) OR (type:violet AND color:blue)
```

When no parentheses are used, `AND` takes precedence over `OR`, meaning that the following query is equivalent to the one above.

```
type:rose AND color:red OR type:violet AND color:blue
```

### Negating queries

An expression can be negated either with the operator `NOT` or by prefixing the query with a dash `-`.

`NOT` and `-` take precedence over everything, such that `-a AND b` means `(-a) AND b`, not `-(a AND B)`.

```
NOT severity:debug
```

or

```
type:proposal -(status:rejected OR status:pending)
```


## Dive deeper

If you want to know more about the query language, head to the [Query Language Reference](../reference/query-language.md)


================================================
FILE: docs/get-started/quickstart.md
================================================
---
title: Quickstart
sidebar_position: 1
---

import Tabs from '@theme/Tabs';
import TabItem from '@theme/TabItem';

In this quick start guide, we will install Quickwit, create an index, add documents and finally execute search queries. All the Quickwit commands used in this guide are documented [in the CLI reference documentation](/docs/reference/cli.md).

## Install Quickwit using Quickwit installer

The Quickwit installer automatically picks the correct binary archive for your environment and then downloads and unpacks it in your working directory.
This method works only for [some OS/architectures](installation.md#download), and you will also need to install some [external dependencies](installation.md#note-on-external-dependencies).

```bash
curl -L https://install.quickwit.io | sh
```

```bash
cd ./quickwit-v*/
./quickwit --version
```

You can now move this executable directory wherever sensible for your environment and possibly add it to your `PATH` environment.

## Use Quickwit's Docker image

You can also pull and run the Quickwit binary in an isolated Docker container.

```bash
# Create first the data directory.
mkdir qwdata
docker run --rm quickwit/quickwit --version
```

If you are using Apple silicon based macOS system you might need to specify the platform. You can also safely ignore jemalloc warnings.

```bash
docker run --rm --platform linux/amd64 quickwit/quickwit --version
```

## Start Quickwit server

<Tabs>

<TabItem value="cli" label="CLI">

```bash
./quickwit run
```

</TabItem>

<TabItem value="docker" label="Docker">

```bash
docker run --rm -v $(pwd)/qwdata:/quickwit/qwdata -p 127.0.0.1:7280:7280 quickwit/quickwit run
```

</TabItem>

</Tabs>

Tips: you can use the environment variable `RUST_LOG` to control quickwit verbosity.

Check it's working by browsing the [UI at http://localhost:7280](http://localhost:7280) or do a simple GET with cURL:

```bash
curl http://localhost:7280/api/v1/version
```

## Create your first index

Before adding documents to Quickwit, you need to create an index configured with a YAML config file. This config file notably lets you define how to map your input documents to your index fields and whether these fields should be stored and indexed. See the [index config documentation](/docs/configuration/index-config.md).

Let's create an index configured to receive Stackoverflow posts (questions and answers).

```bash
# First, download the stackoverflow dataset config from Quickwit repository.
curl -o stackoverflow-index-config.yaml https://raw.githubusercontent.com/quickwit-oss/quickwit/main/config/tutorials/stackoverflow/index-config.yaml
```

The index config defines three fields: `title`, `body` and `creationDate`. `title` and `body` are [indexed and tokenized](../configuration/index-config.md#text-type), and they are also used as default search fields, which means they will be used for search if you do not target a specific field in your query. `creationDate` serves as the timestamp for each record. There are no more explicit field definitions as we can use the default dynamic [mode](/docs/configuration/index-config.md#mode): the undeclared fields will still be indexed, by default fast fields are enabled to enable aggregation queries. and the `raw` tokenizer is used for text. 

And here is the complete config:

```yaml title="stackoverflow-index-config.yaml"
#
# Index config file for stackoverflow dataset.
#
version: 0.7

index_id: stackoverflow

doc_mapping:
  field_mappings:
    - name: title
      type: text
      tokenizer: default
      record: position
      stored: true
    - name: body
      type: text
      tokenizer: default
      record: position
      stored: true
    - name: creationDate
      type: datetime
      fast: true
      input_formats:
        - rfc3339
      fast_precision: seconds
  timestamp_field: creationDate

search_settings:
  default_search_fields: [title, body]

indexing_settings:
  commit_timeout_secs: 30
```

Now we can create the index with the command:

<Tabs>

<TabItem value="cli" label="CLI">

```bash
./quickwit index create --index-config ./stackoverflow-index-config.yaml
```

</TabItem>

<TabItem value="curl" label="CURL">

```bash
curl -XPOST http://127.0.0.1:7280/api/v1/indexes --header "content-type: application/yaml" --data-binary @./stackoverflow-index-config.yaml
```

</TabItem>

</Tabs>

Check that a directory `./qwdata/indexes/stackoverflow` has been created, Quickwit will write index files here and a `metastore.json` which contains the [index metadata](../overview/architecture.md#index).
You're now ready to fill the index.


## Let's add some documents

Quickwit can index data from many [sources](/docs/configuration/source-config.md). We will use a new line delimited json [ndjson](http://ndjson.org/) datasets as our data source.
Let's download [a bunch of stackoverflow posts (10 000)](https://quickwit-datasets-public.s3.amazonaws.com/stackoverflow.posts.transformed-10000.json) in [ndjson](http://ndjson.org/) format and index it.

```bash
# Download the first 10_000 Stackoverflow posts articles.
curl -O https://quickwit-datasets-public.s3.amazonaws.com/stackoverflow.posts.transformed-10000.json
```

<Tabs>

<TabItem value="cli" label="CLI">

```bash
# Index our 10k documents.
./quickwit index ingest --index stackoverflow --input-path stackoverflow.posts.transformed-10000.json --force
```

</TabItem>

<TabItem value="curl" label="CURL">

```bash
# Index our 10k documents.
curl -XPOST "http://127.0.0.1:7280/api/v1/stackoverflow/ingest?commit=force" --data-binary @stackoverflow.posts.transformed-10000.json
```

</TabItem>

</Tabs>

As soon as the ingest command finishes you can start querying data by using the following `search` command:

<Tabs>

<TabItem value="cli" label="CLI">

```bash
./quickwit index search --index stackoverflow --query "search AND engine"
```

</TabItem>

<TabItem value="curl" label="CURL">

```bash
curl "http://127.0.0.1:7280/api/v1/stackoverflow/search?query=search+AND+engine"
```

</TabItem>

</Tabs>

It should return 10 hits. Now you're ready to play with the search API.


## Execute search queries


Let's start with a query on the field `title`: `title:search AND engine`:
```bash
curl "http://127.0.0.1:7280/api/v1/stackoverflow/search?query=title:search+AND+engine"
```

The same request can be expressed as a JSON query:
```bash
curl -XPOST "http://localhost:7280/api/v1/stackoverflow/search" -H 'Content-Type: application/json' -d '{
    "query": "title:search AND engine"
}'
```

This format is more verbose but it allows you to use more advanced features such as aggregations. The following query finds most popular tags used on the questions in this dataset:
```bash
curl -XPOST "http://localhost:7280/api/v1/stackoverflow/search" -H 'Content-Type: application/json' -d '{
    "query": "type:question",
    "max_hits": 0,
    "aggs": {
        "foo": {
            "terms":{
                "field":"tags",
                "size": 10
            }
        }
    }
}'
```

As you are experimenting with different queries check out the server logs to see what's happening.

:::note

Don't forget to encode correctly the query params to avoid bad request (status 400).

:::


## Clean

Let's do some cleanup by deleting the index:

<Tabs>

<TabItem value="cli" label="CLI">

```bash
./quickwit index delete --index stackoverflow
```

</TabItem>

<TabItem value="rest" label="REST">

```bash
curl -XDELETE http://127.0.0.1:7280/api/v1/indexes/stackoverflow
```

</TabItem>

</Tabs>

Congrats! You can level up with the following tutorials to discover all Quickwit features.


## TLDR

Run the following command from within Quickwit's installation directory.

```bash
curl -o stackoverflow-index-config.yaml https://raw.githubusercontent.com/quickwit-oss/quickwit/main/config/tutorials/stackoverflow/index-config.yaml
./quickwit index create --index-config ./stackoverflow-index-config.yaml
curl -O https://quickwit-datasets-public.s3.amazonaws.com/stackoverflow.posts.transformed-10000.json
./quickwit index ingest --index stackoverflow --input-path ./stackoverflow.posts.transformed-10000.json --force
./quickwit index search --index stackoverflow --query "search AND engine"
./quickwit index delete --index stackoverflow
```


## Next tutorials

- [Search on logs with timestamp pruning](/docs/get-started/tutorials/tutorial-hdfs-logs)
- [Setup a distributed search on AWS S3](/docs/get-started/tutorials/tutorial-hdfs-logs-distributed-search-aws-s3)


================================================
FILE: docs/get-started/tutorials/_category_.yaml
================================================
label: 'Tutorials'
position: 2
collapsed: false


================================================
FILE: docs/get-started/tutorials/prometheus-metrics.md
================================================
---
title: Metrics with Grafana and Prometheus
description: A simple tutorial to display Quickwit metrics with Grafana.
icon_url: /img/tutorials/quickwit-logo.png
tags: [grafana, prometheus, integration]
sidebar_position: 2
---

In this tutorial, you will learn how to set up Grafana to display Quickwit metrics using Prometheus. Grafana will visualize the metrics collected from Quickwit, allowing you to monitor its performance effectively.

## Step 1: Create a Docker Compose File

First, create a `docker-compose.yml` file in your project directory. This file will configure and run Quickwit, Prometheus, and Grafana as Docker services.

Here’s the complete Docker Compose configuration:

```yaml
services:
  quickwit:
    image: quickwit/quickwit
    environment:
      QW_ENABLE_OPENTELEMETRY_OTLP_EXPORTER: "true"
      OTEL_EXPORTER_OTLP_ENDPOINT: "http://localhost:7281"
    ports:
      - 7280:7280
    command: ["run"]

  grafana:
    image: grafana/grafana-oss
    container_name: grafana
    ports:
      - "${MAP_HOST_GRAFANA:-127.0.0.1}:3000:3000"
    environment:
      GF_INSTALL_PLUGINS: https://github.com/quickwit-oss/quickwit-datasource/releases/download/v0.4.6/quickwit-quickwit-datasource-0.4.6.zip;quickwit-quickwit-datasource
      GF_AUTH_DISABLE_LOGIN_FORM: "true"
      GF_AUTH_ANONYMOUS_ENABLED: "true"
      GF_AUTH_ANONYMOUS_ORG_ROLE: Admin

  prometheus:
    image: prom/prometheus:latest
    container_name: prometheus
    volumes:
      - ./prometheus.yml:/etc/prometheus/prometheus.yml  # Ensure prometheus.yml exists in the same directory
    ports:
      - 9090:9090
```

### Explanation of Services

- **Quickwit**: Runs the Quickwit service on port `7280`.
- **Grafana**: Queries and displays data from Prometheus.
- **Prometheus**: Collects metrics from Quickwit using the `/metrics` endpoint.

## Step 2: Configure Prometheus

Prometheus needs a configuration file to define how it scrapes metrics from Quickwit. Create a file named `prometheus.yml` in the same directory as your Docker Compose file with the following content:

```yaml
global:
  scrape_interval: 1s
  scrape_timeout: 1s

scrape_configs:
  - job_name: quickwit
    metrics_path: /metrics
    static_configs:
      - targets:
          - quickwit:7280
```

## Step 3: Start the Services

Run the following command in your terminal to start all services defined in the Docker Compose file:

```bash
docker compose up
```

This will launch Quickwit, Prometheus, and Grafana services.

## Step 4: Configure Grafana to Use Prometheus

1. Open Grafana in your browser at `http://localhost:3000`.
2. Navigate to **Configuration** > **Data Sources**.
3. Click **Add Data Source**, select **Prometheus**, and set the URL to `http://prometheus:9090`.
4. Click **Save & Test** to verify the connection.

## Step 5: Create or Use Pre-Configured Dashboards

Now that Grafana is set up with Prometheus as a data source, you can create custom dashboards or use Quickwit's pre-configured dashboards:

1. Go to the **Dashboards** section in Grafana.
2. Import or create a new dashboard to visualize metrics.
3. Alternatively, use one of Quickwit’s [pre-configured dashboards](../../operating/monitoring).


================================================
FILE: docs/get-started/tutorials/trace-analytics-with-grafana.md
================================================
---
title: Logs and Traces with Grafana
description: A simple tutorial to use Grafana with Quickwit's datasource plugin.
icon_url: /img/tutorials/quickwit-logo.png
tags: [grafana, integration]
sidebar_position: 2
---

In this tutorial, we will set up a Grafana Dashboard showing Quickwit traces using Docker Compose.

You only need a few minutes to get Grafana working with Quickwit and build meaningful dashboards.

## Create a Docker Compose recipe

First, create a `docker-compose.yml` file. This file will define the services needed to run Quickwit with OpenTelemetry and Grafana with the Quickwit Datasource plugin.

Below is the complete Docker Compose configuration:

```yaml
version: '3.0'
services:
  quickwit:
    image: quickwit/quickwit
    environment:
      QW_ENABLE_OPENTELEMETRY_OTLP_EXPORTER: "true"
      OTEL_EXPORTER_OTLP_ENDPOINT: "http://localhost:7281"
    ports:
      - 7280:7280
    command: ["run"]

  grafana:
    image: grafana/grafana-oss
    container_name: grafana
    ports:
      - "${MAP_HOST_GRAFANA:-127.0.0.1}:3000:3000"
    environment:
      GF_INSTALL_PLUGINS: https://github.com/quickwit-oss/quickwit-datasource/releases/download/v0.4.6/quickwit-quickwit-datasource-0.4.6.zip;quickwit-quickwit-datasource
      GF_AUTH_DISABLE_LOGIN_FORM: "true"
      GF_AUTH_ANONYMOUS_ENABLED: "true"
      GF_AUTH_ANONYMOUS_ORG_ROLE: Admin
```

The default Grafana port is 3000. If this port is already taken, you can modify the port mapping, for example, changing 3000:3000 to 3100:3000 or any other available port.

Save and run the recipe:

```bash
$ docker compose up
```

You should be able to access Quickwit's UI on `http://localhost:7280/` and Grafana's UI on `http://localhost:3000/`.

## Setting up the datasource

In Grafana, head to [Data Sources](http://localhost:3000/connections/datasources). If the plugin is installed correctly you should be able to find Quickwit in the list.

We're going to set up a new Quickwit data source looking at Quickwit's own OpenTelemetry traces, let's configure the datasource with the following parameters:

- URL : `http://quickwit:7280/api/v1` _This uses the docker service name as the host_
- Index ID : `otel-traces-v0_7`

Save and test, you should obtain a confirmation that the datasource is correctly set up.


![Quickwit Plugin configuration success](../../assets/images/grafana-ui-quickwit-datasource-plugin-success.png)


You can also set up a new Quickwit data source looking at Quickwit's own OpenTelemetry logs (or your own logs index), let's configure the datasource with the following parameters:

- URL : `http://quickwit:7280/api/v1` _This uses the docker service name as the host_
- Index ID : `otel-logs-v0_7`


## Creating a dashboard

You can then [create a new dashboard](http://localhost:3000/dashboard/new) and add a visualization : you should be able to choose the traces quickwit datasource here.

Quickwit sends itself its own traces, so you should already have data to display. Let's configure some panels !

- a Table counting span_names 
  - **Panel type** : Table
  - **Query**: _empty_
  - **Metric** : Count
  - **Group by** : Terms : `span_name` : order by Count
- a Bar Chart showing the amount of tantivy searches per hour :
  - **Panel type**: Time Series
  - **Query** : "span_name:tantivy_search"
  - **Metric**: Count
  - **Group by** : Date Histogram : `span_start_timestamp_nanos` : Interval 1h
- a Bar Chart showing the amount of ERROR logs per hour for the last 6 hours :
  - **Panel type**: Bar Chart
  - **Query**: "service_name:quickwit AND events.event_attributes.level:ERROR"
  - **Metric**: Count
  - **Group by** : Terms : `span_start_timestamp_nanos` : Interval 1h
- another query on the same Bar Chart for WARN logs

## The result

Here's what your first dashboard can look like :

![Quickwit Panel in Grafana Dashboard](../../assets/images/screenshot-grafana-tutorial-dashboard.png)


================================================
FILE: docs/get-started/tutorials/tutorial-hdfs-logs-distributed-search-aws-s3.md
================================================
---
title: Distributed search on AWS S3
description: Index log entries on AWS S3 using an EC2 instance and launch a distributed cluster.
tags: [aws, integration]
icon_url: /img/tutorials/aws-logo.png
sidebar_position: 6
---

In this guide, we will index about 40 million log entries (13 GB decompressed) on AWS S3 using an EC2 instance and launch a three-node distributed search cluster.

Example of a log entry:
```json
{
  "timestamp": 1460530013,
  "severity_text": "INFO",
  "body": "PacketResponder: BP-108841162-10.10.34.11-1440074360971:blk_1074072698_331874, type=HAS_DOWNSTREAM_IN_PIPELINE terminating",
  "resource": {
    "service": "datanode/01"
  },
  "attributes": {
    "class": "org.apache.hadoop.hdfs.server.datanode.DataNode"
  }
}
```

:::caution

Before using Quickwit with an object storage, check out our [advice](../../operating/aws-costs) for deploying on AWS S3 to avoid some bad surprises at the end of the month.

:::

First of all, let's create an EC2 instance, install a Quickwit binary, and [configure it](../../guides/aws-setup) to let Quickwit access your S3 buckets. This instance will be used for indexing our dataset (note that you can also index your dataset from your local machine if it has the rights to read/write on AWS S3).

## Install

```bash
curl -L https://install.quickwit.io | sh
cd quickwit-v*/
```

## Configure Quickwit with S3

Let's define the S3 path where we want to store our indexes.

```bash
export S3_PATH=s3://{path/to/bucket}/indexes
```

:::note
You'll want to include the necessary authorization for the given bucket, this can be done by setting the `AWS_ACCESS_KEY_ID` and `AWS_SECRET_ACCESS_KEY`
environment variables, or via the AWS credentials file. Usually located at `~/.aws/credentials`.

For more info check out [our AWS setup guide](https://quickwit.io/docs/guides/aws-setup)
:::

Now we can create a Quickwit config file.

```bash
# Create Quickwit config file.
echo "version: 0.7
node_id: searcher-1
listen_address: 0.0.0.0
metastore_uri: ${S3_PATH}
default_index_root_uri: ${S3_PATH}
" > config.yaml
```

> You can also pass environment variables directly:
> ```yaml
> # config.yaml
> node_id: searcher-1
> listen_address: 0.0.0.0
> version: 0.7
> metastore_uri: ${S3_PATH}
> default_index_root_uri: ${S3_PATH}
>```

We are now ready to start Quickwit.

```bash
./quickwit run --config config.yaml
```

## Create your index

```bash
# First, download the hdfs logs config from Quickwit repository.
curl -o hdfs_logs_index_config.yaml https://raw.githubusercontent.com/quickwit-oss/quickwit/main/config/tutorials/hdfs-logs/index-config.yaml
```

The index config defines five fields: `timestamp`, `tenant_id`, `severity_text`, `body`, and one JSON field
for the nested values `resource.service`, we could use an object field here and maintain a fixed schema, but for convenience we're going to use a JSON field.
It also sets the `default_search_fields`, the `tag_fields`, and the `timestamp_field`. The `timestamp_field` and `tag_fields` are
used by Quickwit for [splits pruning](../../overview/architecture) at query time to boost search speed. 
Check out the [index config docs](../../configuration/index-config) for more details.

```yaml title="hdfs_logs_index_config.yaml"
version: 0.7

index_id: hdfs-logs

doc_mapping:
  field_mappings:
    - name: timestamp
      type: datetime
      input_formats:
        - unix_timestamp
      output_format: unix_timestamp_secs
      fast_precision: seconds
      fast: true
    - name: tenant_id
      type: u64
    - name: severity_text
      type: text
      tokenizer: raw
    - name: body
      type: text
      tokenizer: default
      record: position
    - name: resource
      type: json
      tokenizer: raw
  tag_fields: [tenant_id]
  timestamp_field: timestamp

search_settings:
  default_search_fields: [severity_text, body]
```

We can now create the index with the `create` subcommand.

```bash
./quickwit index create --index-config hdfs_logs_index_config.yaml
```

:::note

This step can also be executed on your local machine. The `create` command creates the index locally and then uploads a 
json file `metastore.json` to your bucket at `s3://path-to-your-bucket/hdfs-logs/metastore.json`.

:::

## Index logs
The dataset is a compressed [NDJSON file](https://quickwit-datasets-public.s3.amazonaws.com/hdfs-logs-multitenants.json.gz). 
Instead of downloading and indexing the data in separate steps, we will use pipes to send a decompressed stream to Quickwit directly.

```bash
wget https://quickwit-datasets-public.s3.amazonaws.com/hdfs-logs-multitenants.json.gz
gunzip -c hdfs-logs-multitenants.json.gz | ./quickwit index ingest --index hdfs-logs
```

:::note

8GB of RAM is enough to index this dataset; an instance like `t4g.large` with 8GB and 2 vCPU indexed this dataset in less than 10 minutes 
(provided that you have some CPU credits).

This step can also be done on your local machine. 
The `ingest` subcommand generates locally [splits](../../overview/architecture) of 10 million documents and will upload 
them on your bucket. Concretely, each split is a bundle of index files and metadata files.

:::


You can check it's working by using `search` subcommand and look for `ERROR` in `severity_text` field:
```bash
./quickwit index search --index hdfs-logs --query "severity_text:ERROR"
```

which returns the json

```json
{
  "num_hits": 345,
  "hits": [
    {
      "attributes": {
        "class": "org.apache.hadoop.hdfs.server.datanode.DataNode"
      },
      "body": "RECEIVED SIGNAL 15: SIGTERM",
      "resource": {
        "service": "datanode/16"
      },
      "severity_text": "ERROR",
      "tenant_id": 51,
      "timestamp": 1469687755
    },
    ...
  ],
  "elapsed_time_micros": 522542
}
```

You can see that this query has 345 hits. In this case for the first run, the server responded in 523 milliseconds.
Subsequent runs use the cached metastore and can be resolved in under 100 milliseconds.

Now that we have indexed the logs and can search from one instance, it's time to configure and start two other instances to form a cluster.

## Start two more instances

Quickwit needs a port `rest.listen_port` for serving the HTTP rest API via TCP as well as maintaining the cluster formation via UDP. 
Also, it needs `{rest.listen_port} + 1` for gRPC communication between instances.

In AWS, you can create a security group to group these inbound rules. Check out the [network section](../../guides/aws-setup) of our AWS setup guide.

To make things easier, let's create a security group that opens the TCP/UDP port range [7200-7300]. 
Next, create three EC2 instances using the previously created security group. Take note of each instance's public IP address.

Now ssh into the first EC2 instance, install Quickwit, and [configure the environment](../../guides/aws-setup) to let Quickwit access the index S3 buckets.

Let's install Quickwit on the second and third EC2 instances.

```bash
curl -L https://install.quickwit.io | sh
cd quickwit-v*/
```

And configure the environment so instances can form a cluster:

```bash
export S3_PATH=s3://{path/to/bucket}/indexes
export IP_NODE_1={first-ec2-instance-public-ip}
```

```bash
# configuration for our second node
echo "version: 0.7
node_id: searcher-2
metastore_uri: ${S3_PATH}
default_index_root_uri: ${S3_PATH}
listen_address: 0.0.0.0
peer_seeds:
  - ${IP_NODE_1} # searcher-1
" > config.yaml

# Start a Quickwit searcher.
./quickwit run --service searcher --config config.yaml
```

```bash
# configuration for our third node
echo "version: 0.7
node_id: searcher-3
listen_address: 0.0.0.0
peer_seeds:
  - ${IP_NODE_1} # searcher-1
metastore_uri: ${S3_PATH}
default_index_root_uri: ${S3_PATH}
" > config.yaml

# Start a Quickwit searcher.
./quickwit run --service searcher --config config.yaml
```


You will see in the terminal the confirmation that the instance has joined the existing cluster. Example of such a log:

```
2023-03-19T16:44:56.918Z  INFO quickwit_cluster::cluster: Joining cluster. cluster_id=quickwit-default-cluster node_id=searcher-2 enabled_services={Searcher} gossip_listen_addr=0.0.0.0:7280 gossip_advertise_addr=172.31.30.168:7280 grpc_advertise_addr=172.31.30.168:7281 peer_seed_addrs=172.31.91.203:7280
```

Now we can query one of our instance directly by issuing http requests to one of the nodes rest API endpoint.

```
curl -v "http://0.0.0.0:7280/api/v1/hdfs-logs/search?query=severity_text:ERROR"
```

Check out the logs of all instances and you will see that all nodes are working.

## Load balancing incoming requests

Now that you have a search cluster, ideally, you will want to load balance external requests. 
This can quickly be done by adding an AWS load balancer to listen to incoming HTTP or HTTPS traffic and forward it to a target group.
You can now play with your cluster, kill processes randomly, add/remove new instances, and keep calm.

## Clean

Let's do some cleanup by deleting the index:

```bash
./quickwit index delete --index hdfs-logs
```

Also remember to remove the security group to protect your EC2 instances. You can just remove the instances if you don't need them.

Congratz! You finished this tutorial!

To continue your Quickwit journey, check out the [search REST API reference](/docs/reference/rest-api) or the [query language reference](/docs/reference/query-language).


================================================
FILE: docs/get-started/tutorials/tutorial-hdfs-logs.md
================================================
---
title: Index a logging dataset locally
description: Index log entries on a local machine.
tags: [self-hosted, setup]
icon_url: /img/quickwit-icon.svg
sidebar_position: 3
---

import Tabs from '@theme/Tabs';
import TabItem from '@theme/TabItem';

In this guide, we will index about 20 million log entries (7 GB decompressed) on a local machine. If you want to start a server with indexes on AWS S3 with several search nodes, check out the [tutorial for distributed search](tutorial-hdfs-logs-distributed-search-aws-s3.md).

Here is an example of a log entry:
```json
{
  "timestamp": 1460530013,
  "severity_text": "INFO",
  "body": "PacketResponder: BP-108841162-10.10.34.11-1440074360971:blk_1074072698_331874, type=HAS_DOWNSTREAM_IN_PIPELINE terminating",
  "resource": {
    "service": "datanode/01"
  },
  "attributes": {
    "class": "org.apache.hadoop.hdfs.server.datanode.DataNode"
  },
  "tenant_id": 58
}
```


## Install

Let's download and install Quickwit.

```bash
curl -L https://install.quickwit.io | sh
cd quickwit-v*/
```

Or pull and run the Quickwit binary in an isolated Docker container.

```bash
docker run quickwit/quickwit --version
```

## Start a Quickwit server

<Tabs>

<TabItem value="cli" label="CLI">

```bash
./quickwit run
```

</TabItem>

<TabItem value="docker" label="Docker">

```bash
docker run --rm -v $(pwd)/qwdata:/quickwit/qwdata -p 127.0.0.1:7280:7280 quickwit/quickwit run
```

You may need to specify the platform if you are using Apple silicon based macOS system with the `--platform linux/amd64` flag. You can also safely ignore jemalloc warnings.

</TabItem>

</Tabs>


## Create your index

Let's create an index configured to receive these logs.

```bash
# First, download the hdfs logs config from Quickwit repository.
curl -o hdfs_logs_index_config.yaml https://raw.githubusercontent.com/quickwit-oss/quickwit/main/config/tutorials/hdfs-logs/index-config.yaml
```

The index config defines five fields: `timestamp`, `tenant_id`, `severity_text`, `body`, and one JSON field
for the nested values `resource.service`, we could use an object field here and maintain a fixed schema, but for convenience we're going to use a JSON field.
It also sets the `default_search_fields`, the `tag_fields`, and the `timestamp_field`.
The `timestamp_field` and `tag_fields` are used by Quickwit for [splits pruning](../../overview/concepts/querying.md#time-sharding) at query time to boost search speed. 
Check out the [index config docs](../../configuration/index-config) for more details.

```yaml title="hdfs-logs-index.yaml"
version: 0.7

index_id: hdfs-logs

doc_mapping:
  field_mappings:
    - name: timestamp
      type: datetime
      input_formats:
        - unix_timestamp
      output_format: unix_timestamp_secs
      fast_precision: seconds
      fast: true
    - name: tenant_id
      type: u64
    - name: severity_text
      type: text
      tokenizer: raw
    - name: body
      type: text
      tokenizer: default
      record: position
    - name: resource
      type: json
      tokenizer: raw
  tag_fields: [tenant_id]
  timestamp_field: timestamp

search_settings:
  default_search_fields: [severity_text, body]
```

Now let's create the index with the `create` subcommand (assuming you are inside Quickwit install directory):

<Tabs>

<TabItem value="cli" label="CLI">

```bash
./quickwit index create --index-config hdfs_logs_index_config.yaml
```

</TabItem>

<TabItem value="curl" label="cURL">

```bash
curl -XPOST http://localhost:7280/api/v1/indexes -H "content-type: application/yaml" --data-binary @hdfs_logs_index_config.yaml
```

</TabItem>

</Tabs>


You're now ready to fill the index.

## Index logs
The dataset is a compressed [NDJSON file](https://quickwit-datasets-public.s3.amazonaws.com/hdfs-logs-multitenants.json.gz).
Instead of downloading it and then indexing the data, we will use pipes to directly send a decompressed stream to Quickwit.
This can take up to 10 minutes on a modern machine, the perfect time for a coffee break.

<Tabs>

<TabItem value="cli" label="CLI">

```bash
curl https://quickwit-datasets-public.s3.amazonaws.com/hdfs-logs-multitenants.json.gz | gunzip | ./quickwit index ingest --index hdfs-logs
```

</TabItem>

<TabItem value="docker" label="Docker">

```bash
curl https://quickwit-datasets-public.s3.amazonaws.com/hdfs-logs-multitenants.json.gz | gunzip | docker run -v $(pwd)/qwdata:/quickwit/qwdata -i quickwit/quickwit index ingest --index hdfs-logs
```

</TabItem>

</Tabs>


If you are in a hurry, use the sample dataset that contains 10 000 documents, we will use this dataset for the example queries:

<Tabs>

<TabItem value="cli" label="CLI">

```bash
curl https://quickwit-datasets-public.s3.amazonaws.com/hdfs-logs-multitenants-10000.json | ./quickwit index ingest --index hdfs-logs
```

</TabItem>

<TabItem value="docker" label="Docker">

On macOS or Windows:

```bash
curl https://quickwit-datasets-public.s3.amazonaws.com/hdfs-logs-multitenants-10000.json | docker run -v $(pwd)/qwdata:/quickwit/qwdata -i quickwit/quickwit index ingest --index hdfs-logs --endpoint http://host.docker.internal:7280
```

On linux:

```bash
curl https://quickwit-datasets-public.s3.amazonaws.com/hdfs-logs-multitenants-10000.json | docker run --network=host -v $(pwd)/qwdata:/quickwit/qwdata -i quickwit/quickwit index ingest --index hdfs-logs --endpoint http://127.0.0.1:7280
```

</TabItem>

<TabItem value="curl" label="cURL">

```bash
wget https://quickwit-datasets-public.s3.amazonaws.com/hdfs-logs-multitenants-10000.json
curl -XPOST http://localhost:7280/api/v1/hdfs-logs/ingest -H "content-type: application/json" --data-binary @hdfs-logs-multitenants-10000.json
```

</TabItem>

</Tabs>

You can check it's working by searching for `INFO` in `severity_text` field:

<Tabs>

<TabItem value="cli" label="CLI">

```bash
./quickwit index search --index hdfs-logs  --query "severity_text:INFO"
```

</TabItem>

<TabItem value="docker" label="Docker">

On macOS or Windows:

```bash
docker run -v $(pwd)/qwdata:/quickwit/qwdata quickwit/quickwit index search --index hdfs-logs  --query "severity_text:INFO" --endpoint http://host.docker.internal:7280
```

On linux:

```bash
docker run --network=host -v $(pwd)/qwdata:/quickwit/qwdata quickwit/quickwit index search --index hdfs-logs  --query "severity_text:INFO" --endpoint http://127.0.0.1:7280
```

</TabItem>

</Tabs>

:::note

The `ingest` subcommand generates [splits](../../overview/architecture) of 5 million documents. Each split is a small piece of index represented by a file in which index files and metadata files are saved.

:::


The query which returns the json:

```json
{
  "num_hits": 10000,
  "hits": [
    {
      "body": "Receiving BP-108841162-10.10.34.11-1440074360971:blk_1073836032_95208 src: /10.10.34.20:60300 dest: /10.10.34.13:50010",
      "resource": {
        "service": "datanode/03"
      },
      "severity_text": "INFO",
      "tenant_id": 58,
      "timestamp": 1440670490
    }
    ...
  ],
  "elapsed_time_micros": 2490
}
```

The index config shows that we can use the timestamp field parameters `start_timestamp` and `end_timestamp` and benefit from time pruning. 
Behind the scenes, Quickwit will only query [splits](../../overview/architecture) that have logs in this time range.

Let's use these parameters with the following query:

```bash
curl 'http://127.0.0.1:7280/api/v1/hdfs-logs/search?query=severity_text:INFO&start_timestamp=1440670490&end_timestamp=1450670490'
```

## Clean

Let's do some cleanup by deleting the index:

<Tabs>

<TabItem value="cli" label="CLI">

```bash
./quickwit index delete --index hdfs-logs
```

</TabItem>

<TabItem value="curl" label="cURL">

```bash
curl -XDELETE http://127.0.0.1:7280/api/v1/indexes/hdfs-logs
```

</TabItem>

</Tabs>

Congratz! You finished this tutorial!


To continue your Quickwit journey, check out the [tutorial for distributed search](tutorial-hdfs-logs-distributed-search-aws-s3.md) or dig into the [search REST API](/docs/reference/rest-api) or [query language](/docs/reference/query-language).


================================================
FILE: docs/get-started/tutorials/tutorial-jaeger.md
================================================
---
title: Traces with Jaeger
sidebar_position: 2
---

In this quick start guide, we will set up a Quickwit instance and analyze its own traces with Jaeger using Docker Compose.

You only need a minute to get Jaeger working with Quickwit storage backend.

## Start Quickwit and Jaeger

Let's use `docker compose` with the following configuration:

```yaml title="docker-compose.yaml"
version: "3"

services:
  quickwit:
    image: quickwit/quickwit:${QW_VERSION:-0.8.1}
    volumes:
      - ./qwdata:/quickwit/qwdata
    ports:
      - 7280:7280
    environment:
      - QW_ENABLE_OPENTELEMETRY_OTLP_EXPORTER=true
      - OTEL_EXPORTER_OTLP_ENDPOINT=http://localhost:7281
    command: ["run"]

  jaeger-query:
    image: jaegertracing/jaeger-query:1.60
    ports:
      - 16686:16686
    environment:
      - SPAN_STORAGE_TYPE=grpc
      - GRPC_STORAGE_SERVER=quickwit:7281
      - GRPC_STORAGE_TLS=false
```

As you can see in the docker compose file, Quickwit is configured to send its own traces `OTEL_EXPORTER_OTLP_ENDPOINT` to itself `http://localhost:7281`.
On the other side, Jaeger is configured to use a gRPC storage server `quickwit:7281`.

Save and run the recipe:

```bash
$ docker compose up
```

You should be able to access Quickwit's UI on `http://localhost:7280/` and Jager's UI on `http://localhost:16686/`.


## Searching and view traces in Jaeger

Quickwit generates many traces, let's take a look at some of them:
- `find_traces`: generated by the "Find traces" Jaeger button.
- `get_operations`: generated by Jaeger when it is fetching the list of operations.
- `get_services`: generated by Jaeger when it is fetching the list of services.
- `ingest-spans`: generated when Quickwit receives spans on the gRPC OTLP API.
- ...

Here are the screenshots of the search and trace view:

![Jaeger search view](../../assets/images/jaeger-ui-quickwit-search-traces.png)
![Jaeger trace view](../../assets/images/jaeger-ui-quickwit-trace-view.png)

## Searching traces with Quickwit UI

You can also use the Quickwit UI at [http://localhost:7280](http://localhost:7280) to search traces.

Here are a couple of query examples:
- `service_name:quickwit AND events.event_attributes.level:INFO`
- `span_duration_millis:>100`
- `resource_attributes.service.version:v0.8.1`
- `service_name:quickwit`

That's it! You can level up with the following tutorials to discover all Quickwit features.

## Next tutorials

- [Send traces using an OTEL collector](/docs/distributed-tracing/send-traces/using-otel-collector.md)
- [Send traces from a python web server](/docs/distributed-tracing/send-traces/using-otel-sdk-python.md)


================================================
FILE: docs/guides/_category_.yaml
================================================
label: 'Guides'
position: 8
collapsed: true


================================================
FILE: docs/guides/aws-setup.md
================================================
---
title: AWS cluster setup
sidebar_position: 3
---

Setting up a Quickwit cluster on AWS requires the configuration of three elements:
- AWS credentials
- AWS region
- Network configuration

## AWS credentials

When starting a node, Quickwit attempts to find AWS credentials using the credential provider chain implemented by [rusoto_core::ChainProvider](https://docs.rs/rusoto_credential/latest/rusoto_credential/struct.ChainProvider.html) and looks for credentials in this order:

1. Environment variables `AWS_ACCESS_KEY_ID`, `AWS_SECRET_ACCESS_KEY`, or `AWS_SESSION_TOKEN` (optional).

2. Credential profiles file, typically located at `~/.aws/credentials` or otherwise specified by the `AWS_SHARED_CREDENTIALS_FILE` and `AWS_PROFILE` environment variables if set and not empty.

3. Amazon ECS container credentials, loaded from the Amazon ECS container if the environment variable `AWS_CONTAINER_CREDENTIALS_RELATIVE_URI` is set.

4. Instance profile credentials, used on Amazon EC2 instances, and delivered through the Amazon EC2 metadata service.

An error is returned if no credentials are found in the chain.

## AWS region

Quickwit attempts to find an AWS region in multiple locations and with the following order of precedence:

1. Environment variables (`AWS_REGION` then `AWS_DEFAULT_REGION`)

2. Config file, typically located at `~/.aws/config` or otherwise specified by the `AWS_CONFIG_FILE` environment variable if set and not empty.

3. Amazon EC2 instance metadata service indicating the region of the currently running Amazon EC2 instance.

4. Default value: `us-east-1`

:::note

AWS credentials or region resolution may take a few seconds, especially if the Amazon EC2 instance metadata service is slow or unavailable.

:::

## IAM permissions

### Amazon S3

Required authorized actions:
- `ListBucket` (on the bucket directly)
- `GetObject`
- `PutObject`
- `DeleteObject`
- `ListMultipartUploadParts`
- `AbortMultipartUpload`

Here is an example of a bucket policy:
```json
{
  "Version": "2012-10-17",
  "Statement": [
    {
      "Effect": "Allow",
      "Action": [
        "s3:ListBucket"
      ],
      "Resource": [
        "arn:aws:s3:::my-bucket"
      ]
    },
    {
      "Effect": "Allow",
      "Action": [
        "s3:GetObject",
        "s3:PutObject",
        "s3:DeleteObject",
        "s3:ListMultipartUploadParts",
        "s3:AbortMultipartUpload"
      ],
      "Resource": [
        "arn:aws:s3:::my-bucket/*"
      ]
    }
  ]
}
```

You can run the following commands to verify that AWS credentials, region, and IAM permissions are properly configured for Amazon S3:

```bash
MY_BUCKET=<bucket name>
aws s3 ls $MY_BUCKET
echo "Hello, World!" | aws s3 cp - $MY_BUCKET/hello
aws s3 ls $MY_BUCKET/hello
aws s3 cp $MY_BUCKET/hello -
aws s3 rm $MY_BUCKET/hello
```

### Amazon Kinesis

- `GetRecords`
- `GetShardIterator`
- `ListShards`

You can run the following commands to verify that AWS credentials, region, and IAM permissions are properly configured for Amazon Kinesis:

```bash
MY_STREAM=<my stream name>

# List the shards in the stream and select the first one.
SHARD_ID=$(
    aws kinesis list-shards --stream-name $MY_STREAM \
    | jq -r .Shards[0].ShardId
)

# Get a shard iterator for the selected shard.
SHARD_ITERATOR=$(
    aws kinesis get-shard-iterator --stream-name $MY_STREAM \
                                   --shard-id $SHARD_ID \
                                   --shard-iterator-type TRIM_HORIZON \
    | jq -r .ShardIterator
)

# Fetch some records from the shard and display the first one.
aws kinesis get-records --shard-iterator $SHARD_ITERATOR | jq -r .Records[0]
```

## Network configuration

### Security groups

To communicate with each other, nodes must reside in security groups that allow inbound and outbound traffic on one UDP port and two TCP ports. Please, refer to the [ports configuration](/configuration/ports-config.md) page for more details.

## Common errors

If you set the wrong credentials, you will see this error message with `Unauthorized` in your terminal:

```bash
Command failed: Another error occurred. `Metastore error`. Cause: `StorageError(kind=Unauthorized, source=failed to fetch object: s3://quickwit-dev/my-hdfs/metastore.json)`
```

If you put the wrong region, you will see this one:

```bash
Command failed: Another error occurred. `Metastore error`. Cause: `StorageError(kind=Internal, source=failed to fetch object: s3://your-bucket/your-index/metastore.json)`.
```


================================================
FILE: docs/guides/schemaless.md
================================================
---
title: Schemaless
sidebar_position: 1
---

# Strict schema or schemaless?

Quickwit lets you place the cursor on how strict you would like your schema to be. In other words, it is possible to operate Quickwit with a very strict mapping, in an entirely schemaless manner, and anywhere in between. Let's see how this works!

:::note

To execute the CLI commands throughout this guide, [install](/docs/get-started/installation.md) Quickwit and start a server in a terminal with the following command:

```bash
./quickwit run
```

:::

## A strict mapping

That's the most straightforward approach.
As a user, you need to precisely define the list of fields to be ingested by Quickwit.

For instance, a reasonable mapping for an application log could be:

```yaml title=my_strict_index.yaml
version: 0.7

index_id: my_strict_index

doc_mapping:
  mode: strict # <--- The mode attribute
  field_mappings:
    - name: timestamp
      type: datetime
      input_formats:
        - unix_timestamp
      output_format: unix_timestamp_secs
      fast_precision: seconds
      fast: true
    - name: server
      type: text
      tokenizer: raw
    - name: message
      type: text
      record: position
    - name: severity
      tokenizer: raw
  timestamp_field: timestamp

search_settings:
  default_search_fields: [severity, message]

indexing_settings:
  commit_timeout_secs: 30
```

The `mode` attribute controls what should be done if an ingested document
contains a field that is not defined in the document mapping. By default, your index is in the `dynamic` mode. In `dynamic` mode, the fields that do not appear in the document mapping will be indexed in a schemaless fashion.
See details in the [dynamic mode section](#dynamic-mode).


If `mode` is set to `strict` on the other hand, documents containing fields
that are not defined in the mapping will be entirely discarded.

Finally the last possible value for `mode` is `lenient`. In lenient mode, fields that are not present in the field mapping will simply be ignored.

## The dynamic mode: schemaless with a partial schema {#dynamic-mode}

`mode` can take the value: `dynamic`.
When set to dynamic, all extra fields will actually be mapped using a catch-all configuration.

By default, this catch-all configuration indexes and stores all of these fields, but this can be configured by setting the [`dynamic_mapping` attribute](../configuration/index-config#mode).
A minimalist, yet perfectly valid and useful index configuration is then:

```yaml title=my_dynamic_index.yaml
version: 0.7
index_id: my_dynamic_index
doc_mapping:
  mode: dynamic
```

This configuration makes it possible to ingest any JSON object and search them.

However, the dynamic mode can also be used in conjunction with field mappings.
This combination is especially powerful for event logs which cannot be mapped to a single schema.

For instance, let's consider the following user event log:

```json file title=my_logs.json
{
    "timestamp": 1653021741,
    "user_id": "8705a7fak",
    "event_type": "login",
    "ab_groups": ["phoenix-red-ux"]
}
{
    "timestamp": 1653021746,
    "user_id": "7618fe06",
    "event_type": "order",
    "ab_groups": ["phoenix-red-ux", "new-ranker"],
    "cart": [
        {
            "product_id": 120391,
            "product_description": "Cherry Pi: A single-board computer that is compatible..."
        }
    ]
}
{
    "timestamp": 1653021748,
    "user_id": "8705a7fak",
    "event_type": "login",
    "ab_groups": ["phoenix-red-ux"]
}
```

Each event type comes with its own set of attributes. Declaring our mapping as the union of all of these event-specific mappings would be a tedious exercise.

Instead, we can cherry-pick the fields that are common to all of the logs, and rely on dynamic mode to handle the rest.

```yaml title=my_dynamic_index.yaml
version: 0.7
index_id: my_dynamic_index
doc_mapping:
  mode: dynamic
  field_mappings:
    - name: timestamp
      type: datetime
      input_formats:
        - unix_timestamp
      output_format: unix_timestamp_secs
      fast_precision: seconds
      fast: true
    - name: user_id
      type: text
      tokenizer: raw
    - name: event_type
      type: text
      tokenizer: raw
  timestamp_field: timestamp

indexing_settings:
  commit_timeout_secs: 30  # <--- Your document will be searchable ~30 seconds after you ingest them.
```

Our index is now ready to handle queries like this:

```
event_type:order AND cart.product_id:120391
```

Execute the following commands to create the index, ingest a few documents and search through them:

```bash
cat << EOF > my_dynamic_index.yaml
version: 0.7
index_id: my_dynamic_index
doc_mapping:
  mode: dynamic
  field_mappings:
    - name: timestamp
      type: datetime
      input_formats:
        - unix_timestamp
      output_format: unix_timestamp_secs
      fast_precision: seconds
      fast: true
    - name: user_id
      type: text
      tokenizer: raw
    - name: event_type
      type: text
      tokenizer: raw
  timestamp_field: timestamp

indexing_settings:
  commit_timeout_secs: 30
EOF

# Create index.
./quickwit index create --index-config ./my_dynamic_index.yaml --overwrite --yes

cat << EOF > my_logs.json
{"timestamp":1653021741,"user_id":"8705a7fak","event_type":"login","ab_groups":["phoenix-red-ux"]}
{"timestamp":1653021746,"user_id":"7618fe06","event_type":"order","ab_groups":["phoenix-red-ux","new-ranker"],"cart":[{"product_id":120391,"product_description":"Cherry Pi: A single-board computer that is compatible..."}]}
{"timestamp":1653021748,"user_id":"8705a7fak","event_type":"login","ab_groups":["phoenix-red-ux"]}
EOF

# Ingest documents.
./quickwit index ingest --index my_dynamic_index --input-path my_logs.json --force

# Execute search query.
./quickwit index search --index my_dynamic_index --query "event_type:order AND cart.product_id:120391

```

## A schema with schemaless pockets

Some logs are isolating these event-specific attributes in a
sub-field. For instance, let's have a look at an OpenTelemetry JSON log.

```json title=otel_logs.json
{
  "Timestamp": 1653028151,
  "Attributes": {
    "split_id": "28f897f2-0419-4d88-8abc-ada72b4b5256"
  },
  "Resource": {
    "service": "donut_shop",
    "k8s_pod_uid": "27413708-876b-4652-8ca4-50e8b4a5caa2"
  },
  "TraceId": "f4dbb3edd765f620",
  "SpanId": "43222c2d51a7abe3",
  "SeverityText": "INFO",
  "SeverityNumber": 9,
  "Body": "merge ended"
}
```

In this log, the `Attributes` and the `Resource` fields contain arbitrary key-values.

Quickwit 0.3 introduced a JSON field type to handle this use case.
A good index configuration here could be:

```yaml title=otel_logs.yaml
version: 0.7
index_id: otel_logs
doc_mapping:
  mode: dynamic
  field_mappings:
    - name: Timestamp
      type: datetime
      fast: true
      input_formats:
        - unix_timestamp
      output_format: unix_timestamp_secs
      fast_precision: seconds
      fast: true
    - name: Attributes
      type: json
      tokenizer: raw
    - name: Resource
      type: json
      tokenizer: raw
    - name: TraceId
      type: text
      tokenizer: raw
    - name: SpanId
      type: text
      tokenizer: raw
    - name: SeverityText
      type: text
      tokenizer: raw
      fast: true
    - name: Body
      type: text
  timestamp_field: Timestamp
  
search_settings:
  default_search_fields: [SeverityText, Body, Attributes, Resource]

indexing_settings:
  commit_timeout_secs: 10
```

We can now naturally search our logs with the following query:

```
merge AND service:donuts_shop
```

Let's execute the following commands to create the index, ingest a document and execute a search query:

```bash
# Create index.
./quickwit index create --index-config ./otel_logs.yaml --overwrite --yes

cat << EOF > otel_logs.json
{"Timestamp":1653028151,"Attributes":{"split_id":"28f897f2-0419-4d88-8abc-ada72b4b5256"},"Resource":{"service":"donut_shop","k8s_pod_uid":"27413708-876b-4652-8ca4-50e8b4a5caa2"},"TraceId":"f4dbb3edd765f620","SpanId":"43222c2d51a7abe3","SeverityText":"INFO","SeverityNumber":9,"Body":"merge ended"}
EOF

# Ingest documents.
./quickwit index ingest --index otel_logs --input-path otel_logs.json --force

# Execute search query.
./quickwit index search --index otel_logs --query "merge AND service:donut_shop"

```


================================================
FILE: docs/guides/storage-setup/_category_.yaml
================================================
label: 'Storage Setup'
position: 2
collapsed: true


================================================
FILE: docs/guides/storage-setup/aws-s3.md
================================================
---
title: AWS S3
sidebar_position: 1
---

In this guide, you will learn how to configure a Quickwit [storage](../../configuration/storage-config) for Amazon S3.

## Set your AWS credentials

A simple way to do it is to declare the environment variables `AWS_ACCESS_KEY_ID`, `AWS_SECRET_ACCESS_KEY`. For more details, read our guide on [AWS setup](../aws-setup).

## Set the Metastore URI and default index URI

Here is an example of how to set up your [node config file](../../configuration/node-config) with S3:

```yaml
metastore_uri: s3://{my-bucket}/indexes
default_index_uri: s3://{my-bucket}/indexes
```

## Set the Index URI

Here is an example of how to set up your index URI in the [index config file](../../configuration/index-config):
```yaml
index_uri: s3://{my-bucket}/indexes/{my-index-id}
```


================================================
FILE: docs/ingest-data/_category_.yaml
================================================
label: 'Ingest data'
position: 4
collapsed: true


================================================
FILE: docs/ingest-data/index.md
================================================
---
title: Ingest data from multiple sources
---

import DocCardList from '@theme/DocCardList';

<DocCardList />

It is possible to ingest data with log shippers like [OpenTelemetry](../log-management/overview.md#opentelemetry-agent), [Fluentbit](../log-management/send-logs/using-fluentbit.md), or [Vector](../log-management/send-logs/using-vector.md). It's also possible to send traces from your apps to the [OpenTelemetry Collector](../log-management/send-logs/using-otel-collector-with-helm.md) and then to Quickwit.


================================================
FILE: docs/ingest-data/ingest-api.md
================================================
---
title: Ingest API
description: A short tutorial describing how to send data in Quickwit using the ingest API
tags: [ingest-api, integration]
icon_url: /img/tutorials/quickwit-logo.svg
sidebar_position: 1
---

import Tabs from '@theme/Tabs';
import TabItem from '@theme/TabItem';

In this tutorial, we will describe how to send data to Quickwit using the ingest API.

You will need a [local Quickwit instance](../get-started/installation) up and running to follow this tutorial.

To start it, run `./quickwit run` in a terminal.

## Create an index

First, let's create a schemaless index.

```bash
# Create the index config file.
cat << EOF > stackoverflow-schemaless-config.yaml
version: 0.7
index_id: stackoverflow-schemaless
doc_mapping:
  mode: dynamic
  dynamic_mapping:
    tokenizer: default
indexing_settings:
  commit_timeout_secs: 30
EOF
# Use the CLI to create the index...
./quickwit index create --index-config stackoverflow-schemaless-config.yaml
# Or with cURL.
curl -XPOST -H 'Content-Type: application/yaml' 'http://localhost:7280/api/v1/indexes' --data-binary @stackoverflow-schemaless-config.yaml
```

Note that for this example, we configure the dynamic mapping to use the [default tokenizer](../configuration/index-config.md#description-of-available-tokenizers). This is necessary to enable full-text search on all text fields.

## Ingest data

Let's first download a sample of the [StackOverflow dataset](https://www.kaggle.com/stackoverflow/stacksample).

```bash
# Download the first 10_000 Stackoverflow posts articles.
curl -O https://quickwit-datasets-public.s3.amazonaws.com/stackoverflow.posts.transformed-10000.json
```

You can ingest data either with the CLI or with cURL. The CLI is more convenient for ingesting several GB as Quickwit may return `429` responses if the ingest queue is full. Quickwit CLI will automatically retry ingestion in this case.

```bash
# Ingest the first 10_000 Stackoverflow posts articles with the CLI...
./quickwit index ingest --index stackoverflow-schemaless --input-path stackoverflow.posts.transformed-10000.json --force

# OR with cURL.
curl -XPOST -H 'Content-Type: application/json' 'http://localhost:7280/api/v1/stackoverflow-schemaless/ingest?commit=force' --data-binary @stackoverflow.posts.transformed-10000.json
```

## Execute search queries

You can now search the index.

```bash
curl 'http://localhost:7280/api/v1/stackoverflow-schemaless/search?query=body:python'
```

## Tear down resources (optional)

```bash
curl -XDELETE 'http://localhost:7280/api/v1/indexes/stackoverflow-schemaless'
```

This concludes the tutorial. You can now move on to the [next tutorial](/docs/ingest-data/kafka.md) to learn how to ingest data from Kafka.

## Ingest API versions

In 0.9, Quickwit introduced a new version of the ingest API that enables distributing the indexing in the cluster regardless of the node that received the ingest request. This new ingestion service is often referred to as "Ingest V2" compared to the legacy ingestion (V1). In upcoming versions the new ingest API will also be capable of replicating the write ahead log in order to achieve higher durability.

By default, both ingestion services are enabled and ingest V2 is used. You can toggle this behavior with the following environment variables:

| Variable              | Description   | Default value |
| --------------------- | --------------|-------------- |
| `QW_ENABLE_INGEST_V2` | Start the V2 ingest service and use it by default. | true | 
| `QW_DISABLE_INGEST_V1`| V1 ingest will be used by the APIs only if V2 is disabled. Running V1 along V2 is necessary to migrate to V2 without loosing existing unindexed V1 logs. | false |

:::note

These configurations drive the ingest service used both by the `api/v1/<index-id>/ingest` endpoint and the [bulk API](../reference/es_compatible_api.md#_bulk--batch-ingestion-endpoint).

:::


================================================
FILE: docs/ingest-data/ingest-local-file.md
================================================
---
title: Local file
description: A short tutorial describing how to index a local file with the Quickiwt CLI 
tags: [local-ingest, integration]
icon_url: /img/tutorials/file-ndjson.svg
sidebar_position: 2
---

import Tabs from '@theme/Tabs';
import TabItem from '@theme/TabItem';

In this tutorial, we will describe how to index a local file with the Quickwit CLI.

You will need the [Quickwit binary](/docs/get-started/installation.md) to follow this tutorial.

## Create an index

First, let's create a schemaless index. We need to start a Quickwit server only for the creation so we will start it and shut it down afterwards.

Start the Quickwit server.

```bash
./quickwit run
```

And create the index in a separate terminal.

```bash
# Create the index config file.
cat << EOF > stackoverflow-schemaless-config.yaml
version: 0.7
index_id: stackoverflow-schemaless
doc_mapping:
  mode: dynamic
indexing_settings:
  commit_timeout_secs: 30
EOF

./quickwit index create --index-config stackoverflow-schemaless-config.yaml
```

You can now shutdown the server by pressing `Ctrl+C` in the first terminal.

## Ingest the file

To ingest a file, you just need to execute the following command:

```bash
./quickwit tool local-ingest --index stackoverflow-schemaless --input-path stackoverflow.posts.transformed-10000.json
```

After a few seconds you should see the following output:

```bash
❯ Ingesting documents locally...

---------------------------------------------------
 Connectivity checklist
 ✔ metastore
 ✔ storage
 ✔ _ingest-cli-source

 Num docs   10000 Parse errs     0 PublSplits   1 Input size     6MB Thrghput  3.34MB/s Time 00:00:02
 Num docs   10000 Parse errs     0 PublSplits   1 Input size     6MB Thrghput  2.23MB/s Time 00:00:03
 Num docs   10000 Parse errs     0 PublSplits   1 Input size     6MB Thrghput  1.67MB/s Time 00:00:04

Indexed 10,000 documents in 4s.
Now, you can query the index with the following command:
quickwit index search --index stackoverflow-schemaless --config ./config/quickwit.yaml --query "my query"
Clearing local cache directory...
✔ Local cache directory cleared.
✔ Documents successfully indexed.
```

:::tip

Object store URIs like `s3://mybucket/mykey.json` are also supported as `--input-path`, provided that your environment is configured with the appropriate permissions.

:::

## Tear down resources (optional)

That's it! You can now tear down the resources you created. You can do so by running the following command:

```bash
./quickwit run
```

And in a separate terminal:

```bash
./quickwit index delete --index-id stackoverflow-schemaless
```

This concludes the tutorial. You can now move on to the next tutorial.


================================================
FILE: docs/ingest-data/kafka.md
================================================
---
title: Kafka
description: A short tutorial describing how to set up Quickwit to ingest data from Kafka in a few minutes
tags: [kafka, integration]
icon_url: /img/tutorials/kafka.svg
sidebar_position: 2
---

In this tutorial, we will describe how to set up Quickwit to ingest data from Kafka in a few minutes. First, we will create an index and configure a Kafka source. Then, we will create a Kafka topic and load some events from the [GH Archive](https://www.gharchive.org/) into it. Finally, we will execute some search and aggregation queries to explore the freshly ingested data.

## Prerequisites

You will need the following to complete this tutorial:
- A running Kafka cluster (see Kafka [quickstart](https://kafka.apache.org/quickstart))
- A local Quickwit [installation](/docs/get-started/installation.md)

## Create index

First, let's create a new index. Here is the index config and doc mapping corresponding to the schema of the GH Archive events:

```yaml title="index-config.yaml"
#
# Index config file for gh-archive dataset.
#
version: 0.7

index_id: gh-archive

doc_mapping:
  field_mappings:
    - name: id
      type: text
      tokenizer: raw
    - name: type
      type: text
      fast: true
      tokenizer: raw
    - name: public
      type: bool
      fast: true
    - name: payload
      type: json
      tokenizer: default
    - name: org
      type: json
      tokenizer: default
    - name: repo
      type: json
      tokenizer: default
    - name: actor
      type: json
      tokenizer: default
    - name: other
      type: json
      tokenizer: default
    - name: created_at
      type: datetime
      fast: true
      input_formats:
        - rfc3339
      fast_precision: seconds
  timestamp_field: created_at

indexing_settings:
  commit_timeout_secs: 10
```

Execute these Bash commands to download the index config and create the `gh-archive` index:

```bash
# Download GH Archive index config.
wget -O gh-archive.yaml https://raw.githubusercontent.com/quickwit-oss/quickwit/main/config/tutorials/gh-archive/index-config.yaml

# Create index.
./quickwit index create --index-config gh-archive.yaml
```

## Create and populate Kafka topic

Now, let's create a Kafka topic and load some events into it.

```bash
# Create a topic named `gh-archive` with 3 partitions.
bin/kafka-topics.sh --create --topic gh-archive --partitions 3 --bootstrap-server localhost:9092

# Download a few GH Archive files.
wget https://data.gharchive.org/2022-05-12-{10..15}.json.gz

# Load the events into Kafka topic.
gunzip -c 2022-05-12*.json.gz | \
bin/kafka-console-producer.sh --topic gh-archive --bootstrap-server localhost:9092
```

## Create Kafka source

:::note
This tutorial assumes that the Kafka cluster is available locally on the default port (9092). If it's not the case, please, update the `bootstrap.servers` parameter accordingly.
:::

```yaml title="kafka-source.yaml"
#
# Kafka source config file.
#
version: 0.8
source_id: kafka-source
source_type: kafka
num_pipelines: 2
params:
  topic: gh-archive
  client_params:
    bootstrap.servers: localhost:9092
```

Run these commands to download the source config file and create the source.

```bash
# Download Kafka source config.
wget https://raw.githubusercontent.com/quickwit-oss/quickwit/main/config/tutorials/gh-archive/kafka-source.yaml

# Create source.
./quickwit source create --index gh-archive --source-config kafka-source.yaml
```
:::note

If you get the following error:

``` Command failed: Topic `gh-archive` has no partitions.```

It means the Kafka topic `gh-archive` was not properly created in the previous step.

:::


## Launch indexing and search services

Finally, execute this command to start Quickwit in server mode.

```bash
# Launch Quickwit services.
./quickwit run
```

Under the hood, this command spawns an indexer and a searcher. On startup, the indexer will connect to the Kafka topic specified by the source and start streaming and indexing events from the partitions composing the topic. With the default commit timeout value (see [indexing settings](../configuration/index-config#indexing-settings)), the indexer should publish the first split after approximately 60 seconds.

You can run this command (in another shell) to inspect the properties of the index and check the current number of published splits:

```bash
# Display some general information about the index.
./quickwit index describe --index gh-archive
```

Once the first split is published, you can start running search queries. For instance, we can find all the events for the Kubernetes [repository](https://github.com/kubernetes/kubernetes):

```bash
curl 'http://localhost:7280/api/v1/gh-archive/search?query=org.login:kubernetes%20AND%20repo.name:kubernetes'
```

It is also possible to access these results through the [Quickwit UI](http://localhost:7280/ui/search?query=org.login%3Akubernetes+AND+repo.name%3Akubernetes&index_id=gh-archive&max_hits=10).


We can also group these events by type and count them:

```
curl -XPOST -H 'Content-Type: application/json' 'http://localhost:7280/api/v1/gh-archive/search' -d '
{
  "query":"org.login:kubernetes AND repo.name:kubernetes",
  "max_hits":0,
  "aggs":{
    "count_by_event_type":{
      "terms":{
        "field":"type"
      }
    }
  }
}'
```


## Secured Kafka connection (optional)

The Quickwit Kafka source supports SSL and SASL authentication. This is
particularly useful when consuming data from an external Kafka service.

:::tip

The certificate and key files must be present on all Quickwit nodes for the
Kafka source to be created and for the indexing pipelines to run successfully.

:::

### SSL configuration

```yaml
version: 0.8
source_id: kafka-source-ssl
source_type: kafka
num_pipelines: 2
params:
  topic: gh-archive
  client_params:
    bootstrap.servers: your-kafka-broker.com
    security.protocol: SSL
    ssl.ca.location: /path/to/ca.pem
    ssl.certificate.location: /path/to/service.cert
    ssl.key.location: /path/to/service.key
```

### SASL configuration

```yaml
version: 0.8
source_id: kafka-source-sasl
source_type: kafka
num_pipelines: 2
params:
  topic: gh-archive
  client_params:
    bootstrap.servers: your-kafka-broker.com
    ssl.ca.location: /path/to/ca.pem
    security.protocol: SASL_SSL
    sasl.mechanisms: SCRAM-SHA-256
    sasl.username: your_sasl_username
    sasl.password: your_sasl_password
```

:::note

If you get the following error:

```Client creation error: ssl.ca.location failed: error:05880002:x509 certificate routines::system lib```

It usually means the path to the CA certificate is incorrect. Update the
`ssl.ca.location` parameter accordingly.

:::

## Tear down resources (optional)

Let's delete the files and resources created for the purpose of this tutorial.

```bash
# Delete Kafka topic.
bin/kafka-topics.sh --delete --topic gh-archive --bootstrap-server localhost:9092

# Delete index.
./quickwit index delete --index gh-archive

# Delete source config.
rm kafka-source.yaml
```

This concludes the tutorial. If you have any questions regarding Quickwit or encounter any issues, don't hesitate to ask a [question](https://github.com/quickwit-oss/quickwit/discussions) or open an [issue](https://github.com/quickwit-oss/quickwit/issues) on [GitHub](https://github.com/quickwit-oss/quickwit) or contact us directly on [Discord](https://discord.com/invite/MT27AG5EVE).


================================================
FILE: docs/ingest-data/kinesis.md
================================================
---
title: Kinesis
description: A short tutorial describing how to set up Quickwit to ingest data from Kinesis in a few minutes
tags: [aws, integration]
icon_url: /img/tutorials/aws-kinesis.svg
sidebar_position: 4
---

In this tutorial, we will describe how to set up Quickwit to ingest data from Kinesis in a few minutes. First, we will create an index and configure a Kinesis source. Then, we will create a Kinesis stream and load some events from the [GH Archive](https://www.gharchive.org/) into it. Finally, we will execute some search and aggregation queries to explore the freshly ingested data.

:::caution
You will incur some charges for using the Amazon Kinesis service during this tutorial.
:::

## Prerequisites

You will need the following to complete this tutorial:
- The AWS CLI version 2 (see [Getting started with the AWS CLI](https://docs.aws.amazon.com/cli/latest/userguide/getting-started-prereqs.html) for prerequisites and installation)
- A local Quickwit [installation](/docs/get-started/installation.md)
- [jq](https://stedolan.github.io/jq/download/)
- [GNU parallel](https://www.gnu.org/software/parallel/)

:::note
`jq` is required to reshape the events into records ingestable by the Amazon Kinesis API.
:::

### Create index

First, let's create a new index. Here is the index config and doc mapping corresponding to the schema of the GH Archive events:

```yaml title="index-config.yaml"
#
# Index config file for gh-archive dataset.
#
version: 0.7

index_id: gh-archive

doc_mapping:
  field_mappings:
    - name: id
      type: text
      tokenizer: raw
    - name: type
      type: text
      fast: true
      tokenizer: raw
    - name: public
      type: bool
      fast: true
    - name: payload
      type: json
      tokenizer: default
    - name: org
      type: json
      tokenizer: default
    - name: repo
      type: json
      tokenizer: default
    - name: actor
      type: json
      tokenizer: default
    - name: other
      type: json
      tokenizer: default
    - name: created_at
      type: datetime
      fast: true
      input_formats:
        - rfc3339
      fast_precision: seconds
  timestamp_field: created_at

indexing_settings:
  commit_timeout_secs: 10

```

Execute these Bash commands to download the index config and create the `gh-archive` index.

```bash
# Download GH Archive index config.
wget -O gh-archive.yaml https://raw.githubusercontent.com/quickwit-oss/quickwit/main/config/tutorials/gh-archive/index-config.yaml

# Create index.
./quickwit index create --index-config gh-archive.yaml
```


## Create and populate Kinesis stream

Now, let's create a Kinesis stream and load some events into it.

:::tip
This step may be fairly slow depending on how much bandwidth is available. The current command limits the volume of data to ingest by taking the first 10 000 lines of every single file downloaded from the GH Archive. If you have enough bandwidth, you can remove it to ingest the whole set of files. You can also speed things up by increasing the number of shards and/or the number of jobs launched by `parallel` (`-j` option).
:::

```bash
# Create a stream named `gh-archive` with 3 shards.
aws kinesis create-stream --stream-name gh-archive --shard-count 8

# Download a few GH Archive files.
wget https://data.gharchive.org/2022-05-12-{10..12}.json.gz

# Load the events into Kinesis stream
gunzip -c 2022-05-12*.json.gz | \
head -n 10000 | \
parallel --gnu -j8 -N 500 --pipe \
'jq --slurp -c "{\"Records\": [.[] | {\"Data\": (. | tostring), \"PartitionKey\": .id }], \"StreamName\": \"gh-archive\"}" > records-{%}.json && \
aws kinesis put-records --cli-input-json file://records-{%}.json --cli-binary-format raw-in-base64-out >> out.log'
```

## Create Kinesis source

```yaml title="kinesis-source.yaml"
#
# Kinesis source config file.
#
version: 0.7
source_id: kinesis-source
source_type: kinesis
params:
  stream_name: gh-archive
```

Run these commands to download the source config file and create the source.

```bash
# Download Kinesis source config.
wget https://raw.githubusercontent.com/quickwit-oss/quickwit/main/config/tutorials/gh-archive/kinesis-source.yaml

# Create source.
./quickwit source create --index gh-archive --source-config kinesis-source.yaml
```

:::note

If this command fails with the following error message:
```
Command failed: Stream gh-archive under account XXXXXXXXX not found.

Caused by:
    0: Stream gh-archive under account XXXXXXXX not found.
    1: Stream gh-archive under account XXXXXXXX not found.
```

it means the Kinesis stream was not properly created in the previous step.
:::

## Launch indexing and search services

Finally, execute this command to start Quickwit in server mode.

```bash
# Launch Quickwit services.
./quickwit run
```

Under the hood, this command spawns an indexer and a searcher. On startup, the indexer will connect to the Kinesis stream specified by the source and start streaming and indexing events from the shards composing the stream. With the default commit timeout value (see [indexing settings](../configuration/index-config#indexing-settings)), the indexer should publish the first split after approximately 60 seconds.

You can run this command (in another shell) to inspect the properties of the index and check the current number of published splits:

```bash
# Display some general information about the index.
./quickwit index describe --index gh-archive
```

It is also possible to get index information through the [Quickwit UI](http://localhost:7280/ui/indexes/gh-archive).

Once the first split is published, you can start running search queries. For instance, we can find all the events for the Kubernetes [repository](https://github.com/kubernetes/kubernetes):

```bash
curl 'http://localhost:7280/api/v1/gh-archive/search?query=org.login:kubernetes%20AND%20repo.name:kubernetes'
```

It is also possible to access these results through the [UI](http://localhost:7280/ui/search?query=org.login%3Akubernetes+AND+repo.name%3Akubernetes&index_id=gh-archive&max_hits=10).

We can also group these events by type and count them:

```
curl -XPOST -H 'Content-Type: application/json' 'http://localhost:7280/api/v1/gh-archive/search' -d '
{
  "query":"org.login:kubernetes AND repo.name:kubernetes",
  "max_hits":0,
  "aggs":{
    "count_by_event_type":{
      "terms":{
        "field":"type"
      }
    }
  }
}'
```

## Tear down resources (optional)

Let's delete the files and resources created for the purpose of this tutorial.

```bash
# Delete Kinesis stream.
aws kinesis delete-stream --stream-name gh-archive

# Delete index.
./quickwit index delete --index gh-archive

# Delete source config.
rm kinesis-source.yaml
```

This concludes the tutorial. If you have any questions regarding Quickwit or encounter any issues, don't hesitate to ask a [question](https://github.com/quickwit-oss/quickwit/discussions) or open an [issue](https://github.com/quickwit-oss/quickwit/issues) on [GitHub](https://github.com/quickwit-oss/quickwit) or contact us directly on [Discord](https://discord.com/invite/MT27AG5EVE).


================================================
FILE: docs/ingest-data/pulsar.md
================================================
---
title: Pulsar
description: A short tutorial describing how to set up Quickwit to ingest data from Pulsar in a few minutes
tags: [pulsar, integration]
icon_url: /img/tutorials/pulsar.svg
sidebar_position: 3
---

import Tabs from '@theme/Tabs';
import TabItem from '@theme/TabItem';

In this tutorial, we will describe how to set up Quickwit to ingest data from Pulsar in a few minutes. First, we will create an index and configure a Pulsar source. Then, we will create a Pulsar topic and load some events from the [Stack Overflow dataset](https://www.kaggle.com/stackoverflow/stacksample) into it. Finally, we will execute some searches.

## Prerequisites

You will need the following to complete this tutorial:
- A local running [Quickwit instance](/docs/get-started/installation.md)
- A local running [Pulsar instance](https://pulsar.apache.org/docs/next/getting-started-standalone/)

### Quickwit setup

[Download](/docs/get-started/installation.md) Quickwit and start a server. Then open a new terminal to execute CLI commands with the same binary. 

```bash
./quickwit run
```

Test that the cluster is running:

```bash
./quickwit index list
```

### Pulsar setup

<Tabs>

<TabItem value="Local" label="Local">

```bash
wget https://archive.apache.org/dist/pulsar/pulsar-2.11.0/apache-pulsar-2.11.0-bin.tar.gz
tar xvfz apache-pulsar-2.11.0-bin.tar.gz
cd apache-pulsar-2.11.0
bin/pulsar standalone
```

</TabItem>

<TabItem value="Docker" label="Docker">

```bash
docker run -it -p 6650:6650 -p 8080:8080 apachepulsar/pulsar:2.11.0 bin/pulsar standalone
```

See the details on the [official documentation](https://pulsar.apache.org/docs/next/getting-started-docker/).

</TabItem>

</Tabs>

## Prepare Quickwit

First, let's create a new index. Here is the index config and doc mapping corresponding to the schema of Stack Overflow posts:

```yaml title="index-config.yaml"
#
# Index config file for Stack Overflow dataset.
#
version: 0.7

index_id: stackoverflow

doc_mapping:
  field_mappings:
    - name: user
      type: text
      fast: true
      tokenizer: raw
    - name: tags
      type: array<text>
      fast: true
      tokenizer: raw
    - name: type
      type: text
      fast: true
      tokenizer: raw
    - name: title
      type: text
      tokenizer: default
      record: position
      stored: true
    - name: body
      type: text
      tokenizer: default
      record: position
      stored: true
    - name: questionId
      type: u64
    - name: answerId
      type: u64
    - name: acceptedAnswerId
      type: u64
    - name: creationDate
      type: datetime
      fast: true
      input_formats:
        - rfc3339
      fast_precision: seconds
  timestamp_field: creationDate

search_settings:
  default_search_fields: [title, body]

indexing_settings:
  commit_timeout_secs: 10
```

Execute these Bash commands to download the index config and create the `stackoverflow` index.

```bash
# Download stackoverflow index config.
wget -O stackoverflow.yaml https://raw.githubusercontent.com/quickwit-oss/quickwit/main/config/tutorials/stackoverflow/index-config.yaml

# Create index.
./quickwit index create --index-config stackoverflow.yaml
```

## Create the Pulsar source

A Pulsar source just needs to define the list of topics and the instance address.

```yaml title="pulsar-source.yaml"
#
# Pulsar source config file.
#
version: 0.7
source_id: pulsar-source
source_type: pulsar
params:
  topics:
    - stackoverflow
  address: pulsar://localhost:6650
```

Run these commands to download the source config file and create the source.

```bash
# Download Pulsar source config.
wget -O stackoverflow-pulsar-source.yaml https://raw.githubusercontent.com/quickwit-oss/quickwit/main/config/tutorials/stackoverflow/pulsar-source.yaml

# Create source.
./quickwit source create --index stackoverflow --source-config stackoverflow-pulsar-source.yaml
```

As soon as the Pulsar source is created, Quickwit control plane will ask an indexer to start a new indexing pipeline. You will see logs like below by looking on the indexer:

```bash
INFO spawn_pipeline{index=stackoverflow gen=0}:pulsar-consumer{subscription_name="quickwit-stackoverflow-pulsar-source" params=PulsarSourceParams { topics: ["stackoverflow"], address: "pulsar://localhost:6650", consumer_name: "quickwit", authentication: None } current_positions={}}: quickwit_indexing::source::pulsar_source: Seeking to last checkpoint positions. positions={}
```

## Create and populate a Pulsar topic

We will use the Pulsar's default tenant/namespace `public/default`. To populate the topic, we will use a python script:

```python title=send_messages_to_pulsar.py
import json
import pulsar

client = pulsar.Client('pulsar://localhost:6650')
producer = client.create_producer('public/default/stackoverflow')

with open('stackoverflow.posts.transformed-10000.json', encoding='utf8') as file:
   for i, line in enumerate(file):
       producer.send(line.encode('utf-8'))
       if i % 100 == 0:
           print(f"{i}/10000 messages sent.", i)

client.close()
```

Install locally the python client, more details on [documentation page](https://pulsar.apache.org/docs/2.11.x/client-libraries-python/):

```bash
# Download the first 10_000 Stackoverflow posts articles.
curl -O https://quickwit-datasets-public.s3.amazonaws.com/stackoverflow.posts.transformed-10000.json

# Install pulsar python client.
# Requires a python version < 3.11
pip3 install 'pulsar-client==2.10.1'
wget https://raw.githubusercontent.com/quickwit-oss/quickwit/main/config/tutorials/stackoverflow/send_messages_to_pulsar.py
python3 send_messages_to_pulsar.py
```

## Time to search!

You can run this command to inspect the properties of the index and check the current number of published splits and documents:

```bash
# Display some general information about the index.
./quickwit index describe --index stackoverflow
```

You will notably see the number of published documents.

You are now ready to execute some queries.

```bash
curl 'http://localhost:7280/api/v1/stackoverflow/search?query=search+AND+engine'
```

If your Quickwit server is local, you can access to the results through Quickwit UI on [localhost:7280](http://localhost:7280/ui/search?query=&index_id=stackoverflow&max_hits=10).


## Tear down resources (optional)

Let's delete the files and resources created for the purpose of this tutorial.

```bash
# Delete quickwit index.
./quickwit index delete --index stackoverflow --yes
# Delete Pulsar topic.
bin/pulsar-admin topics delete stackoverflow
```

This concludes the tutorial. If you have any questions regarding Quickwit or encounter any issues, don't hesitate to ask a [question](https://github.com/quickwit-oss/quickwit/discussions) or open an [issue](https://github.com/quickwit-oss/quickwit/issues) on [GitHub](https://github.com/quickwit-oss/quickwit) or contact us directly on [Discord](https://discord.com/invite/MT27AG5EVE).


================================================
FILE: docs/ingest-data/sqs-files.md
================================================
---
title: S3 with SQS notifications
description: A short tutorial describing how to set up Quickwit to ingest data from S3 files using an SQS notifier
tags: [s3, sqs, integration]
icon_url: /img/tutorials/file-ndjson.svg
sidebar_position: 5
---

In this tutorial, we describe how to set up Quickwit to ingest data from S3
with bucket notification events flowing through SQS. We will first create the
AWS resources (S3 bucket, SQS queue, notifications) using terraform. We will
then configure the Quickwit index and file source. Finally we will send some
data to the source bucket and verify that it gets indexed.

## AWS resources

The complete terraform script can be downloaded [here](../assets/sqs-file-source.tf).

First, create the bucket that will receive the source data files (NDJSON format):

```
resource "aws_s3_bucket" "file_source" {
  bucket_prefix = "qw-tuto-source-bucket"
}
```

Then setup the SQS queue that will carry the notifications when files are added
to the bucket. The queue is configured with a policy that allows the source
bucket to write the S3 notification messages to it. Also create a dead letter
queue (DLQ) to receive the messages that couldn't be processed by the file
source (e.g corrupted files). Messages are moved to the DLQ after 5 indexing
attempts. 

```
locals {
  sqs_notification_queue_name = "qw-tuto-s3-event-notifications"
}

data "aws_iam_policy_document" "sqs_notification" {
  statement {
    effect = "Allow"

    principals {
      type        = "*"
      identifiers = ["*"]
    }

    actions   = ["sqs:SendMessage"]
    resources = ["arn:aws:sqs:*:*:${local.sqs_notification_queue_name}"]

    condition {
      test     = "ArnEquals"
      variable = "aws:SourceArn"
      values   = [aws_s3_bucket.file_source.arn]
    }
  }
}

resource "aws_sqs_queue" "s3_events_deadletter" {
  name = "${locals.sqs_notification_queue_name}-deadletter"
}

resource "aws_sqs_queue" "s3_events" {
  name   = local.sqs_notification_queue_name
  policy = data.aws_iam_policy_document.sqs_notification.json

  redrive_policy = jsonencode({
    deadLetterTargetArn = aws_sqs_queue.s3_events_deadletter.arn
    maxReceiveCount     = 5
  })
}

resource "aws_sqs_queue_redrive_allow_policy" "s3_events_deadletter" {
  queue_url = aws_sqs_queue.s3_events_deadletter.id

  redrive_allow_policy = jsonencode({
    redrivePermission = "byQueue",
    sourceQueueArns   = [aws_sqs_queue.s3_events.arn]
  })
}
```

Configure the bucket notification that writes messages to SQS each time a new
file is created in the source bucket:

```
resource "aws_s3_bucket_notification" "bucket_notification" {
  bucket = aws_s3_bucket.file_source.id

  queue {
    queue_arn = aws_sqs_queue.s3_events.arn
    events    = ["s3:ObjectCreated:*"]
  }
}
```

:::note

Only events of type `s3:ObjectCreated:*` are supported. Other types (e.g.
`ObjectRemoved`) are acknowledged and a warning is logged.

:::

The source needs to have access to both the notification queue and the source
bucket. The following policy document contains the minimum permissions required
by the source:

```
data "aws_iam_policy_document" "quickwit_node" {
  statement {
    effect = "Allow"
    actions = [
      "sqs:ReceiveMessage",
      "sqs:DeleteMessage",
      "sqs:ChangeMessageVisibility",
      "sqs:GetQueueAttributes",
    ]
    resources = [aws_sqs_queue.s3_events.arn]
  }
  statement {
    effect    = "Allow"
    actions   = ["s3:GetObject"]
    resources = ["${aws_s3_bucket.file_source.arn}/*"]
  }
}
```

Create the IAM user and credentials that will be used to
associate this policy to your local Quickwit instance:

```
resource "aws_iam_user" "quickwit_node" {
  name = "quickwit-filesource-tutorial"
  path = "/system/"
}

resource "aws_iam_user_policy" "quickwit_node" {
  name   = "quickwit-filesource-tutorial"
  user   = aws_iam_user.quickwit_node.name
  policy = data.aws_iam_policy_document.quickwit_node.json
}

resource "aws_iam_access_key" "quickwit_node" {
  user = aws_iam_user.quickwit_node.name
}
```


:::warning

We don't recommend using IAM user credentials for running Quickwit nodes in
production. This is just a simplified setup for the sake of the tutorial. When
running on EC2/ECS, attach the policy document to an IAM roles instead.

:::

Download the [complete terraform script](../assets/sqs-file-source.tf) and
deploy it using `terraform init` and `terraform apply`. After a successful
execution, the outputs required to configure Quickwit will be listed. You can
display the values of the sensitive outputs (key id and secret key) with:


```bash
terraform output quickwit_node_access_key_id
terraform output quickwit_node_secret_access_key
```

## Run Quickwit

[Install Quickwit locally](/docs/get-started/installation), then in your install
directory, run Quickwit with the necessary access rights by replacing the
`<quickwit_node_access_key_id>` and `<quickwit_node_secret_access_key>` with the
matching Terraform output values:

```bash
AWS_ACCESS_KEY_ID=<quickwit_node_access_key_id> \
AWS_SECRET_ACCESS_KEY=<quickwit_node_secret_access_key> \
AWS_REGION=us-east-1 \
./quickwit run
```

## Configure the index and the source

In another terminal, in the Quickwit install directory, create an index:

```bash
cat << EOF > tutorial-sqs-file-index.yaml
version: 0.7
index_id: tutorial-sqs-file
doc_mapping:
  mode: dynamic
indexing_settings:
  commit_timeout_secs: 30
EOF

./quickwit index create --index-config tutorial-sqs-file-index.yaml
```

Replacing `<notification_queue_url>` with the corresponding Terraform output
value, create a file source for that index:

```bash
cat << EOF > tutorial-sqs-file-source.yaml
version: 0.8
source_id: sqs-filesource
source_type: file
num_pipelines: 2
params:
  notifications:
    - type: sqs
      queue_url: <notification_queue_url>
      message_type: s3_notification
EOF

./quickwit source create --index tutorial-sqs-file --source-config tutorial-sqs-file-source.yaml
```

:::tip

The `num_pipeline` configuration controls how many consumers will poll from the queue in parallel. Choose the number according to the indexer compute resources you want to dedicate to this source. As a rule of thumb, configure 1 pipeline for every 2 cores.

:::

## Ingest data

We can now ingest data into Quickwit by uploading files to S3. If you have the
AWS CLI installed, run the following command, replacing `<source_bucket_name>`
with the associated Terraform output:

```bash
curl https://quickwit-datasets-public.s3.amazonaws.com/hdfs-logs-multitenants-10000.json | \
    aws s3 cp - s3://<source_bucket_name>/hdfs-logs-multitenants-10000.json
```

If you prefer not to use the AWS CLI, you can also download the file and upload
it manually to the source bucket using the AWS console.

Wait approximately 1 minute and the data should appear in the index:

```bash
./quickwit index describe --index tutorial-sqs-file
```

## Tear down the resources

The AWS resources instantiated in this tutorial don't incur any fixed costs, but
we still recommend deleting them when you are done. In the directory with the
Terraform script, run `terraform destroy`.


================================================
FILE: docs/internals/backward-compatibility.md
================================================
# Backward compatibility in Quickwit.

If you are reading this, chances are you want to make a change to one of the resource
of Quickwit's meta/config.

There are basically 3 types of configuration:

Edited by the user and read back from file on startup:
- QuickwitConfig

Edited by the user then stored in the metastore:
- IndexConfig
- SourceConfig
- VersionedIndexTemplate

Assembled by Quickwit then stored in the metastore:
- IndexMetadata
- SplitMetadata
- FileBackedIndex (file backed metastore only)
- Manifest (file backed metastore only)

Quickwit currently manages the backward compatibility of all of these resources except the `QuickwitConfig`.

This document describes how to handle a change, and how to make test such a change, and spot eventual regression.

## How do I update `{IndexMetadata, SplitMetadata, FileBackedIndex, SourceConfig, IndexConfig, Manifest}`?

There are two types of upgrades:
- naturally backward compatible change
- change requiring a new version

### Naturally backward compatible change

Serde offers some attributes to make backward compatible changes to our model.
For instance, it is possible to add a new field to a struct and slap
a `serde(default)` attribute to it in order to handle older serialized version of the
struct.

If you want to avoid to generate any diff on the non-regression json files,
you can also avoid use `#[serde(skip_serializing_if)]`, although by default,
it is recommended to not use it.

It is also possible to rename a field in a backward compatible manner
by using the `#[serde(alias)]`.

For this type of change it is not required to update the serialization version.

Nevertheless, the regression tests will spot these changes. When that happens:
- modify your model with the help of the attributes above.
- modify the example for the model by editing its `TestableForRegression` trait implementation.
- run the backward compatibility tests (see below)
- check the diff between the `xxx.modified.json` files created and the matching `xxx.json` files. 
If the changes are acceptable, replace the content of the `xxx.json` files and commit them.

Be particularly careful to changes on files corresponding to the most recent version. If the 
changes are not compatible, create a new configuration version.

### Change requiring a new version

For changes requiring a new version, you will have to increment the configuration
version. You need to make sure that all of these resources share the same version number.

- update the resource struct you want to change.
- create a new item in the `VersionedXXXX` struct. It is usually located in a serialize.rs file
- `Serialize` is not needed for the previous serialized version. We just need `Deserialize`. We can 
remove the `Serialize` impl from the derive statement, and mark it a `skip_serializing` as follows.

e.g.
```
#[serde(tag = "version")]
pub(crate) enum VersionedXXXXXX {
    #[serde(rename = "0")]
    V0(#[serde(skip_serializing)] XXXX_V0),
    #[serde(rename = "1")]
    V1(XXXX_V1),
}
```
- complete the conversion `From<VersionedXXXX> for XXXX` and `From<XXXX> for VersionedXXXX`
- run the backward compatibility tests (see below)
- for older versions, check the diff between the `xxx.expected.modified.json` files created and the matching `xxx.expected.json` files. 
If the changes are acceptable, replace the content of the `xxx.expected.json` files and commit them.
- check the `yyyy.json` that was created for the new version and commit it along with the `yyyy.expected.json` file (identical).
- possibly update the generation of the default XXXX instance used for regression. It is in the function `TestableForRegression::sample_for_regression`.


## Backward compatibility tests

These tests are used to ensure the backward compatibility of Quickwit.
Right now, `SplitMetadata`, `IndexMetadata`, `Manifest` and `FileBackedIndex` are tested.

We want to be able to read all past versions of these files, but only write the most recent format.

The tests consist of pairs of JSON files, `XXXX.json` and `XXXX.expected.json`:
- `XXXX.json` is the first serialized value of a new version.
- `XXXX.expected.json` is the result of `serialize_new_version(deserialize(XXXX.json))`.

Format changes are automatically detected. There are two possible situations when a format changes.

#### Updating expected.json

We need to keep `*.expected.json` files up-to-date with the format changes.

This is done in a semi-automatic fashion.

Checks are performed in two steps:
- first pass, `deserialize(original_json) == deserialize(expectation_json)`
- second pass, `expectation_json = serialize(deserialize(expectation_json))`

When changing the json format, it is expected to see this test fail.
The unit test then updates automatically the `expected.json`. The developer just has to
check the diff of the result (in particular no information should be lost) and commit the 
updated expected.json files.

Adding this update operation within the unit test is a tad unexpected, but it has the merit of
integrating well with CI. If a developer forgets to update the expected.json file,
the CI will catch it.

#### Adding a new test case.

If the serialization format changes, a new version should be created and the unit test will
automatically add a new unit test generated from the sample tested objects.
Concretely, it will just write two files `XXXX.json` and `XXXX.expected.json` for each model.

The two files will be identical. This is expected as this is a unit test for the most recent 
version. The unit test will start making sense in future updates thanks to the update phase
described in the previous section.


================================================
FILE: docs/internals/date-time.md
================================================
# Datetime format

Quickwit's DateTime is a wrapper around Tantivy's provided DateTime type which is internally represented as an `i64` microseconds value. For optimization reasons, Tantivy stores the value differently at the following locations:
- DocStore: Dates are stored as they are received from the input document.
- TermDict: Dates are stored with `seconds` precision.
- FastField: Dates are stored using the DateTime type configured precision that can take of the following values: `seconds`, `milliseconds`, `microseconds`.


================================================
FILE: docs/internals/ingest-v2.md
================================================
# Ingest V2

Ingest V2 is the latest ingestion API that is designed to be more efficient and scalable for thousands of indexes than the previous version. It is the default since 0.9.

## Architecture

Just like ingest V1, the new ingest uses [`mrecordlog`](https://github.com/quickwit-oss/mrecordlog) to persist ingested documents that are waiting to be indexed. But unlike V1, which always persists the documents locally on the node that receives them, ingest V2 can dynamically distribute them into WAL units called _shards_. The assigned shard can be local or on another indexer. The control plane is in charge of distributing the shards to balance the indexing work as well as possible across all indexer nodes. The progress within each shard is not tracked as an index metadata checkpoint anymore but in a dedicated metastore `shards` table.

In the future, the shard based ingest will also be capable of writing a replica for each shard, thus ensuring a high durability of the documents that are waiting to be indexed (durability of the indexed documents is guarantied by the object store).

## Toggling between ingest V1 and V2

Variables driving the ingest configuration are documented [here](../ingest-data/ingest-api.md#ingest-api-versions).

With ingest V2, you can also activate the `enable_cooperative_indexing` option in the indexer configuration. This setting is useful for deployments with very large numbers (dozens) of actively written indexers, to limit the indexing workbench memory consumption. The indexer configuration is in the node configuration:

```yaml
version: 0.8
# [...]
indexer:
  enable_cooperative_indexing: true
```

See [full configuration example](https://github.com/quickwit-oss/quickwit/blob/main/config/quickwit.yaml).

## Differences between ingest V1 and V2

- V1 uses the `queues/` directory whereas V2 uses the `wal/` directory
- both V1 and V2 are configured with:
  - `ingest_api.max_queue_memory_usage` 
  - `ingest_api.max_queue_disk_usage` 
- but ingest V2 can also be configured with:
  - `ingest_api.replication_factor`, not working yet
- ingest V1 always writes to the WAL of the node receiving the request, V2 potentially forwards it to another node, dynamically assigned by the control plane to distribute the indexing work more evenly.
- ingest V2 parses and validates input documents synchronously. Schema and JSON formatting errors are returned in the ingest response (for ingest V1 those errors were available in the server logs only).


================================================
FILE: docs/internals/scroll.md
================================================
# Scroll API

The scroll API has been implemented to offer compatibility with ElasticSearch.
The API and the implementation are quirky and are detailed in this document.

## API description

You can find information about the scroll API here.
https://www.elastic.co/guide/en/elasticsearch/reference/current/paginate-search-results.html#scroll-search-results
https://www.elastic.co/guide/en/elasticsearch/reference/current/scroll-api.html

The user runs a regular search request with a `scroll` param.
The search result then contains the normal response, but a `_scroll` property is added to the search body.

That id is then meant to be sent to a scroll rest API.
This API successive calls will then return pages incrementally.

## Quirk and difficulty.

The scrolled results should be consistent with the state of the original index.
For this reason we need to capture the state of the index at the point of the original request.

If a network error happens between the client and the server at page N, there is no way for the client to ask the reemission of page N.
Page N+1 will be returned on the next call.

## Implementation

Server side, we store a replicated scroll context.

It contains:
- the detail about the original query (we need to be able to reemit paginated queries)
- the "point-in-time" list of split metadatas used for the query
- a cached list of partial docs (= not the doc content, just its address and its score) to avoid
performing search over and over.
- the total number of results, in order to append that information to our response.
searching at every single scroll requests.

We use a simple leaderless KV store to keep the state required to run the scroll API.
We generate a scroll ULID and use it to get a list of the servers with the best affinity according
to rendez vous hashing. We then go through them in order and attempt to put that key on up to 2 servers. Failures for these PUTs are silent.

For each call to scroll, one of two things can happen:
- the partial docs for the page requested is in the partial doc cache. We just run the fetch_docs phase, and update the context with the `start_offset`.
- the partial docs for the page request are not in the partial doc cache. We then run a new search query.

We attempt to fetch `SCROLL_BATCH_LEN` in order to fill the partial doc address cache for subsequent calls.

# A strange `scroll_id`.

The elasticsearch API is needlessly broken as it returns the same scroll_id most of the time.
The "page-change" mutation is something that happens on the server side.

In quickwit on the other hand, the scroll id is the concatenation of the
- ULID: used as the address for the search context.
- the start_offset.
- the number of hits per page
- a search_after key

We only mutate the state server side to update the cache whenever needed.

The idea here is that if that if the put request failed, we can still return the right results even if we have an obsolete version of the `ScrollContext`.

# Quickwit implementation (improvement, quirks and shortcuts)

We do not do explicitly protect the split from our store Point-In-Time information
from deletion. Instead we simply rely on the existing grace period mechanism (a split
only is effectively garbage collected 32mn after it is marked as deleted).

For this reason we limit the scroll period to 30mn and subsequent scroll calls do not
extend the scroll period.

Also thanks to this period, we do not add any extra replication repair mechanism.
Some scroll calls will end up being broken if we were to remove 2 servers within 30mn.

Quickwit caches partial hits in batches of 1000 results.
Querying page N leverages `search_after`, so that accessing further pages isn't more
costly than accessing the first ones.


================================================
FILE: docs/internals/searcher-split-cache.md
================================================

# Searcher split cache

Quickwit includes a split cache. It can be useful for specific workloads:
- to improve performance
- to reduce the cost associated with GET requests.

The split cache stores entire split files on disk.
It works under the following configurable constraints:
- number of concurrent downloads
- amount of disk space
- number of on-disk files.

Searcher get tipped by indexers about the existence of splits (for which they have the best affinity).
They also might learn about split existence, upon read requests.

The searcher is then in charge of maintaining an in-memory data structure with a bounded list of splits it knows about and their score.
The current strategy for admission/evicton is a simple LRU logic.

If the most recently accessed split not already in cache has been accessed, we consider downloading it.
If the limits have been reached, we only proceed to eviction if one of the split currently
in cache has been less recently accessed.


================================================
FILE: docs/internals/sorting.md
================================================
# Sorting

Quickwit can sort results based on fastfield values or score. This document discuss where and how
 it happens.
It also tries to describe optimizations that may be enabled (but are not necessarily implemented)
by this behavior.

## Behavior

Sorting is controlled by the `sort_by` query parameter. It accepts a comma separated list of fields
to use for sorting. Sorting is Descending by default. The sorting order can be reversed by prefixing
a field name with a hyphen `-`.
The special value `_score` means sorting by score, it is also Descending by default.

In case of equality between two documents, the GlobalDocId, composed of (SplitId, SegmentId, DocId)
is used as a tie breaker. It is used to sort in the same order as the first field being sorted by.
This means it is in Descending order by default.

If a document doesn't have a value for a sorting field, that document is considered to go after any
document which has a value, independently of sort order. That is, when sorting the value 1,2 and
None, ascending sort would give `[1, 2, None]`, and descending sort would give `[2, 1, None]`.

If a client does not request sorting, documents are sorted using (SplitId, SegmentId, DocId), on
Descending order. In other words, everything happens as if documents were sorted by a constant
value.

<!--
TODO we could also say "it's not sorted" and add a special `_doc_id` for that. See optimizations
-->

# Code

A new structure TopK is introduced which is used both for in-split sorting and for merging of
results. It reduces the risks of inconsistencies between in-split and between-split behavior.
`SortOrder` gets new `compare` and `compare_opt` method which can be used to compare two values with
 respect to the particular sort order required, and with proper handling of the `None` special case.

# Optimization permitted

Both orders allow an optimization when sorting by date (either direction), by leveraging splits
meta-data to know in advance if a split can, or not, contain better results. Changing the sorting
order for "not sorted" queries allows to leverage SplitId as a way to know whether a split can
contain or not better results (if its SplitId is more/less than the current worst best-hit, the
split does not need to be searched).

<!--
If we allow unsorted requests, we can go further and stop searching as soon as we have k hits
(even going as far as stopping mid collection), without even looking at other splits metadata.
Argument can be made in favor of this because GlobalDocId is not stable, and can change during
a merge, so order is not guaranteed anyway, at least not until Quickwit has support for a Point
In Time mechanism.
-->

These optimization have limited to no impact if we give an exact count of matching documents.
An option to request only a lower bound would be required for these optimizations to make sense.


================================================
FILE: docs/internals/split-format.md
================================================
# Split format

Quickwit's index are divided into small independent immutable piece of index called split.

For convenience, a split consists in a single file, with the extension `.split`.

In reality, this file hides an internal mini static filesystem,
with:
- the Tantivy index files (`.idx`, `.pos`, `.term`...)
- a Quickwit specific file with the list of fields, including those indexed as part of a JSON type. 
It contains the field name, type and capabilities.

The split file data layout looks like this:
- concatenation all of the files in the split
- a footer

The footer follows the following format.

- a json object called `BundleStorageFileOffsets` containing the `[start, end)` byte-offsets
of all files.
- the length of this json (8 bytes little endian)
- a hotcache, a small static cache that contains some important file sections.
- the length of this hotcache (8 bytes little endian)

This footer plays a key role a very important role in quickwit.
It packs in one read all of the information required to open a split.

When opening a file from a distant storage,  Quickwit's metastore stores the byte offsets of this footer to make this read possible.

If this footer offset information is not available, for instance if the split is just a file on the filesystem, it is still possible to open it by reading the last 8 bytes of the split (encoding the length of the hotcache), deducing the position of the meta information and unpacking this in turn.


================================================
FILE: docs/internals/template-index.md
================================================
# Index template API

Index templates are a way to create indexes automatically with some given configuration when Quickwit receives documents for an index that doesn't exist yet.

Example of templates: [https://github.com/quickwit-oss/quickwit/tree/main/config/templates](https://github.com/quickwit-oss/quickwit/tree/main/config/templates).

# Curl to run to use the REST API to create Stackoverflow template

```bash
curl -XPOST -H 'Content-Type: application/yaml' 'http://localhost:7280/api/v1/templates' --data-binary @config/templates/stackoverflow.yaml

# Lists templates.
curl 'http://localhost:7280/api/v1/templates'

# Update Stackoverflow template.
curl -XPUT -H 'Content-Type: application/yaml' 'http://localhost:7280/api/v1/templates/stackoverflow' --data-binary @config/templates/stackoverflow.yaml

# Download dataset.
curl -O https://quickwit-datasets-public.s3.amazonaws.com/stackoverflow.posts.transformed-10000.json

# Ingest 10k docs into `stackoverflow-foo` index.
curl -XPOST "http://127.0.0.1:7280/api/v1/stackoverflow-foo/ingest" --data-binary @stackoverflow.posts.transformed-10000.json

# Ingest 10k docs into `stackoverflow-bar` index.
curl -XPOST "http://127.0.0.1:7280/api/v1/stackoverflow-bar/ingest" --data-binary @stackoverflow.posts.transformed-10000.json

# Delete Stackoverflow template.
curl -XDELETE 'http://localhost:7280/api/v1/templates/stackoverflow'

```bash


================================================
FILE: docs/log-management/_category_.yaml
================================================
label: 'Log management'
position: 5
collapsed: true


================================================
FILE: docs/log-management/otel-service.md
================================================
---
title: OTEL service
sidebar_position: 4
---

Quickwit natively supports the [OpenTelemetry Protocol (OTLP)](https://opentelemetry.io/docs/reference/specification/protocol/otlp/) and provides a gRPC endpoint to receive spans from an OpenTelemetry collector. This endpoint is enabled by default.

When enabled, Quickwit will start the gRPC service ready to receive logs from an OpenTelemetry collector. The logs are indexed in the `otel-logs-v0_7` index by default, and this index will be automatically created if not present. The index doc mapping is described in the next [section](#trace-and-span-data-model).

If for any reason, you want to disable this endpoint, you can:
- Set the `QW_ENABLE_OTLP_ENDPOINT` environment variable to `false` when starting Quickwit.
- Or [configure the node config](/docs/configuration/node-config.md) by setting the indexer setting `enable_otlp_endpoint` to `false`.

```yaml title=node-config.yaml
# ... Indexer configuration ...
indexer:
    enable_otlp_endpoint: false
```

## Sending logs in your own index

You can send logs in the index of your choice by setting the header `qw-otel-logs-index` of your gRPC request to the targeted index ID.


## OpenTelemetry logs data model

Quickwit sends OpenTelemetry logs into the `otel-logs-v0_7` index by default which is automatically created if you enable the OpenTelemetry service.
The doc mapping of this index described below is derived from the [OpenTelemetry logs data model](https://opentelemetry.io/docs/reference/specification/logs/data-model/).

```yaml

version: 0.7

index_id: otel-logs-v0_7

doc_mapping:
  mode: strict
  field_mappings:
    - name: timestamp_nanos
      type: datetime
      input_formats: [unix_timestamp]
      output_format: unix_timestamp_nanos
      indexed: false
      fast: true
      fast_precision: milliseconds
    - name: observed_timestamp_nanos
      type: datetime
      input_formats: [unix_timestamp]
      output_format: unix_timestamp_nanos
    - name: service_name
      type: text
      tokenizer: raw
      fast: true
    - name: severity_text
      type: text
      tokenizer: raw
      fast: true
    - name: severity_number
      type: u64
      fast: true
    - name: body
      type: json
      tokenizer: default
    - name: attributes
      type: json
      tokenizer: raw
      fast: true
    - name: dropped_attributes_count
      type: u64
      indexed: false
    - name: trace_id
      type: bytes
      input_format: hex
      output_format: hex
    - name: span_id
      type: bytes
      input_format: hex
      output_format: hex
    - name: trace_flags
      type: u64
      indexed: false
    - name: resource_attributes
      type: json
      tokenizer: raw
      fast: true
    - name: resource_dropped_attributes_count
      type: u64
      indexed: false
    - name: scope_name
      type: text
      indexed: false
    - name: scope_version
      type: text
      indexed: false
    - name: scope_attributes
      type: json
      indexed: false
    - name: scope_dropped_attributes_count
      type: u64
      indexed: false

  timestamp_field: timestamp_nanos

indexing_settings:
  commit_timeout_secs: 10

search_settings:
  default_search_fields: [body.message]
```

## UI Integration

Currently, Quickwit provides a simplistic UI to get basic information from the cluster, indexes and search documents.
If a simple UI is not sufficient for you and you need additional features, Grafana and Elasticsearch query API support are planned for Q2 2023, stay tuned!

You can also send traces to Quickwit that you can visualize in Jaeger UI, as explained in the following [tutorial](../distributed-tracing/send-traces/using-otel-sdk-python.md).


## Known limitations

There are a few limitations on the log management setup in Quickwit 0.9:
- The ingest API does not provide High-Durability. This will be fixed in 0.10.
- OTLP HTTP is only available with the Binary Protobuf Encoding. OTLP HTTP with JSON encoding is not planned yet, but this can be easily fixed in the next version. Please open an issue if you need this feature.

If you are interested in new features or discover other limitations, please open an issue on [GitHub](https://github.com/quickwit-oss/quickwit).


================================================
FILE: docs/log-management/overview.md
================================================
---
title: Log management with Quickwit
sidebar_label: Overview
sidebar_position: 1
---

Quickwit is built from the ground up to [efficiently index unstructured data](../guides/schemaless.md), and search it effortlessly on cloud storage.
Moreover, Quickwit supports OpenTelemetry gRPC and HTTP (protobuf only) protocols out of the box and provides a REST API ready to ingest any JSON formatted logs.
**This makes Quickwit a perfect fit for logs!**.

![Quickwit Log Management](../assets/images/log-management-overview-light.svg#gh-light-mode-only)![Quickwit Log Management](../assets/images/log-management-overview-dark.svg#gh-dark-mode-only)

## Sending logs to Quickwit

- [Using OTEL collector](send-logs/using-otel-collector.md)
- [Using OTEL collector with Helm](send-logs/using-otel-collector-with-helm.md)
- [Using Fluentbit](send-logs/using-fluentbit.md)
- [Using Vector](send-logs/using-vector.md)


================================================
FILE: docs/log-management/send-logs/_category_.yaml
================================================
label: 'Sending logs'
position: 2
collapsed: false


================================================
FILE: docs/log-management/send-logs/send-docker-logs.md
================================================
---
title: Send docker logs into Quickwit
sidebar_label: Docker logs into Quickwit
description: Send docker logs into Quickwit
tags: [otel, docker, collector, log]
sidebar_position: 5
---

To send docker container logs into Quickwit, you just need to setup an OpenTelemetry Collector with the file logs receiver. In this tutorial, we will use `docker compose` to start the collector and Quickwit.

You only need a minute to get your Quickwit log UI!

![Quickwit UI Logs](../../assets/images/screenshot-quickwit-ui-docker-compose-logs.png)

## OTEL collector configuration

The following collector configuration will collect docker logs in `/var/lib/docker/containers/*/*-json.log` (depending on your system, log files can be at a different location), add a few attributes and send them to Quickwit through gRPC at `http://quickwit:7281`.


```yaml title="otel-collector-config.yaml"
receivers:
  filelog:
    include:
      - /var/lib/docker/containers/*/*-json.log
    operators:
     - id: parser-docker
       timestamp:
         layout: '%Y-%m-%dT%H:%M:%S.%LZ'
         parse_from: attributes.time
       type: json_parser
     - field: attributes.time
       type: remove
     - id: extract_metadata_from_docker_tag
       parse_from: attributes.attrs.tag
       regex: ^(?P<name>[^\|]+)\|(?P<image_name>[^\|]+)\|(?P<id>[^$]+)$
       type: regex_parser
       if: 'attributes?.attrs?.tag != nil'
     - from: attributes.name
       to: resource["docker.container.name"]
       type: move
       if: 'attributes?.name != nil'
     - from: attributes.image_name
       to: resource["docker.image.name"]
       type: move
       if: 'attributes?.image_name != nil'
     - from: attributes.id
       to: resource["docker.container.id"]
       type: move
       if: 'attributes?.id != nil'
     - from: attributes.log
       to: body
       type: move

processors:
  batch:
    timeout: 5s

exporters:
  otlp/qw:
    endpoint: quickwit:7281
    tls:
      insecure: true

service:
  pipelines:
    logs:
      receivers: [filelog]
      processors: [batch]
      exporters: [otlp/qw]
```

## Start the OTEL collector and a Quickwit instance

Let's use `docker compose` with the following configuration:

```yaml title="docker-compose.yaml"
version: "3"

x-default-logging: &logging
 driver: "json-file"
 options:
   max-size: "5m"
   max-file: "2"
   tag: "{{.Name}}|{{.ImageName}}|{{.ID}}"

services:
  quickwit:
    image: quickwit/quickwit:${QW_VERSION:-0.8.1}
    volumes:
      - ./qwdata:/quickwit/qwdata
    ports:
      - 7280:7280
    environment:
      - NO_COLOR=true
    command: ["run"]
    logging: *logging

  otel-collector:
    user: "0" # Needed to access the directory /var/lib/docker/containers/
    image: otel/opentelemetry-collector-contrib:${OTEL_VERSION:-0.87.0}
    volumes:
      - ./otel-collector-config.yaml:/etc/otel-collector-config.yaml
      - /var/lib/docker/containers:/var/lib/docker/containers:ro
    command: ["--config=/etc/otel-collector-config.yaml"] 
    logging: *logging
```


You will notice the custom `logging`, the OTEL collector will use that additional information to enrich the logs.

## Run it and search

Download the configuration files and start the containers:
   
```bash

mkdir qwdata
docker compose up
```

After a few seconds, you will see the logs in the Quickwit UI [http://localhost:7280](http://localhost:7280).


Here is what it should look like:

```json
{
  "attributes": {
    "log.file.name": "34ad1a84c71de1d29ad75f99b56d01205e2976440f2398734037151ba2bcde1a-json.log",
    "stream": "stdout"
  },
  "body": {
    "message": "2023-10-23T16:39:57.892  INFO --- [   asgi_gw_1] localstack.request.aws     : AWS s3.ListObjects => 200\n"
  },
  "observed_timestamp_nanos": 1698079197979435000,
  "service_name": "unknown_service",
  "severity_number": 0,
  "timestamp_nanos": 1698079197892726000,
  "trace_flags": 0
}
```


## Troubleshooting

It's possible that you get no logs in the UI. In this case, check the `docker compose` logs. The problem can typically come from a wrong configuration of the OTEL collector.


================================================
FILE: docs/log-management/send-logs/using-fluentbit.md
================================================
---
title: Send logs using Fluentbit
sidebar_label: Using Fluentbit
description: A simple tutorial to send logs from Fluentbit to Quickwit in a few minutes.
icon_url: /img/tutorials/fluentbit-logo.png
tags: [logs, ingestion]
sidebar_position: 4
---

import Tabs from '@theme/Tabs';
import TabItem from '@theme/TabItem';

[Fluent Bit](https://fluentbit.io/) is an open-source logging and metrics processor and forwarder to multiple destinations.

In this guide, we will show you how to connect it to Quickwit.

## Prerequisites

- [Install Quickwit](/docs/get-started/installation.md)
- Start a Quickwit instance with `./quickwit run`
- [Install Fluentbit](https://docs.fluentbit.io/manual/installation/getting-started-with-fluent-bit)


## Create a simple index for Fluentbit logs

Let's create a schemaless index with only one field `timestamp`. The mode `dynamic` indicates that Quickwit will index all fields even if they are not defined in the doc mapping.

```yaml title="index-config.yaml"
version: 0.7

index_id: fluentbit-logs

doc_mapping:
  mode: dynamic
  field_mappings:
    - name: timestamp
      type: datetime
      input_formats:
        - unix_timestamp
      output_format: unix_timestamp_secs
      fast: true
  timestamp_field: timestamp

indexing_settings:
  commit_timeout_secs: 10
```

```bash
curl -o fluentbit-logs.yaml https://raw.githubusercontent.com/quickwit-oss/quickwit/main/config/tutorials/fluentbit-logs/index-config.yaml
```

And then create the index with `cURL` or the `CLI`:

<Tabs>

<TabItem value="curl" label="cURL">

```bash
curl -XPOST http://localhost:7280/api/v1/indexes -H "content-type: application/yaml" --data-binary @fluentbit-logs.yaml
```

</TabItem>

<TabItem value="cli" label="CLI">

```bash
./quickwit index create --index-config fluentbit-logs.yaml
```

</TabItem>

</Tabs>


## Setup Fluentbit

Fluentbit configuration file is made of inputs and outputs. For this tutorial, we will use a dummy configuration:

``` title=fluent-bit.conf
[INPUT]
  Name   dummy
  Tag    dummy.log

[OUTPUT]
  Name http
  Match *
  URI   /api/v1/fluentbit-logs/ingest
  Host  localhost
  Port  7280
  tls   Off
  Format json_lines
  Json_date_key    timestamp
  Json_date_format epoch
```

Fluentbit will send `dummy` logs to Quickwit endpoint `/api/v1/fluentbit-logs/ingest`.

Let's start Fluentbit.

```bash
fluent-bit -c fluent-bit.conf
```

## Search logs

Quickwit is now ingesting logs coming from Fluentbit and you can search them either with `cURL` or by using the UI:
- `curl "http://127.0.0.1:7280/api/v1/fluentbit-logs/search?query=severity:DEBUG"`
- Open your browser at `http://127.0.0.1:7280/ui/search?query=severity:DEBUG&index_id=fluentbit-logs&max_hits=10`.


## Further improvements

You will soon be able to do aggregations on dynamic fields (planned for 0.7).


================================================
FILE: docs/log-management/send-logs/using-otel-collector-with-helm.md
================================================
---
title: Send K8s logs using OTEL collector
sidebar_label: Using OTEL with Helm
description: Send K8s logs with OTEL collectors and Helm to Quickwit in a few minutes.
tags: [k8s, helm]
icon_url: /img/tutorials/helm-otel-k8s-tutorial-illustation.jpg
sidebar_position: 2
---

This guide will help you to unlock log search on your k8s cluster logs. We will first deploy Quickwit and OTEL collectors with [Helm](https://helm.sh/) and then see how to index and search them.

## Prerequisites

You will need the following to complete this tutorial:
- A Kubernetes cluster.
- The command line tool [kubectl](https://kubernetes.io/docs/reference/kubectl/).
- The command line tool [Helm](https://helm.sh/).
- An access to an object storage like AWS S3, GCS, Azure blob storage, or Scaleway to store index data.


## Install with Helm

Let's first create a namespace to isolate our experiment and set it as the default namespace.

```bash
kubectl create namespace qw-tutorial
kubectl config set-context --current --namespace=qw-tutorial
```


Then let's add [Quickwit](https://github.com/quickwit-oss/helm-charts) and [Otel](https://github.com/open-telemetry/opentelemetry-helm-charts) helm repositories:

```bash
helm repo add quickwit https://helm.quickwit.io
helm repo add open-telemetry https://open-telemetry.github.io/opentelemetry-helm-charts
```

You should now see the two repos in helm:

```bash
helm repo list
NAME                	URL
quickwit            	https://helm.quickwit.io
open-telemetry      	https://open-telemetry.github.io/opentelemetry-helm-charts
```


### Deploy Quickwit

Let's create a basic chart configuration:

```bash
export AWS_REGION=us-east-1
export AWS_ACCESS_KEY_ID=XXXX
export AWS_SECRET_ACCESS_KEY=XXXX
export DEFAULT_INDEX_ROOT_URI=s3://your-bucket/indexes
```

```bash
# Create Quickwit config file.
echo "
searcher:
  replicaCount: 1
indexer:
  replicaCount: 1
metastore:
  replicaCount: 1
janitor:
  enabled: true
control_plane:
  enabled: true

environment:
  # Remove ANSI colors.
  NO_COLOR: 1

# Quickwit configuration
config:
  storage:
    s3:
      region: ${AWS_REGION}
      access_key_id: ${AWS_ACCESS_KEY_ID}
      secret_access_key: ${AWS_SECRET_ACCESS_KEY}
      # If you are not on AWS S3, you can define a flavor (gcs, minio, garage...)
      # and additional variables for your object storage.
      # flavor: gcs
      # endpoint: https://storage.googleapis.com

  # Metastore on S3.
  metastore_uri: ${DEFAULT_INDEX_ROOT_URI}

  default_index_root_uri: ${DEFAULT_INDEX_ROOT_URI}

  # Indexer settings
  indexer:
    # By activating the OTEL service, Quickwit will be able
    # to receive gRPC requests from OTEL collectors.
    enable_otlp_endpoint: true
" > qw-tutorial-values.yaml
```

Before installing Quickwit chart, make sure you have access to S3 and that you did not make a typo in the `default_index_root_uri`. This can be easily done with `aws` CLI with a simple `ls`:

```bash
aws s3 ls ${DEFAULT_INDEX_ROOT_URI}
```

If the CLI did not return an error, you are ready to install the chart:

```bash
helm install quickwit quickwit/quickwit -f qw-tutorial-values.yaml
```

In a few moments, you will see the pods running Quickwit services:

```bash
kubectl get pods
NAME                                      READY   STATUS    RESTARTS      AGE
quickwit-control-plane-7fc495f4c4-slqv4   1/1     Running   2 (84s ago)   87s
quickwit-indexer-0                        1/1     Running   2 (84s ago)   87s
quickwit-janitor-7f75f4bc8-jrfv6          1/1     Running   2 (84s ago)   87s
quickwit-metastore-6989978fc-9s82j        1/1     Running   2 (85s ago)   87s
quickwit-searcher-0                       1/1     Running   2 (84s ago)   87s
```

Let's check Quickwit is working:

```bash
kubectl port-forward svc/quickwit-searcher 7280
```

Then open your browser `http://localhost:7280/ui/indexes`. You should see the list of indexes. If everything is fine, keep the kubectl command running and open a new terminal.

### Deploy OTEL collectors

We need to configure a bit the collectors in order to:
- collect logs from k8s
- enrich the logs with k8s attributes
- export the logs to Quickwit indexer.

```bash
echo "
mode: daemonset
presets:
  logsCollection:
    enabled: true
  kubernetesAttributes:
    enabled: true
config:
  exporters:
    otlp:
      endpoint: quickwit-indexer.qw-tutorial.svc.cluster.local:7281
      tls:
        insecure: true
      # By default, logs are sent to the otel-logs-v0_7.
      # You can customize the index ID By setting this header.
      # headers:
      #   qw-otel-logs-index: otel-logs-v0_7
  service:
    pipelines:
      logs:
        exporters:
          - otlp
" > otel-values.yaml
```

```
helm install otel-collector open-telemetry/opentelemetry-collector -f otel-values.yaml
```

After a few seconds, you should see logs on your indexer that show indexing has started. It looks like this:
```
2022-11-30T18:27:37.628Z  INFO spawn_merge_pipeline{index=otel-log-v0 gen=0}: quickwit_indexing::actors::merge_pipeline: Spawning merge pipeline. index_id=otel-log-v0 source_id=_ingest-api-source pipeline_ord=0 root_dir=/quickwit/qwdata/indexing/otel-log-v0/_ingest-api-source merge_policy=StableLogMergePolicy { config: StableLogMergePolicyConfig { min_level_num_docs: 100000, merge_factor: 10, max_merge_factor: 12, maturation_period: 172800s }, split_num_docs_target: 10000000 }
2022-11-30T18:27:37.628Z  INFO quickwit_serve::grpc: Starting gRPC server. enabled_grpc_services={"otlp-log", "otlp-trace"} grpc_listen_addr=0.0.0.0:7281
2022-11-30T18:27:37.628Z  INFO quickwit_serve::rest: Starting REST server. rest_listen_addr=0.0.0.0:7280
2022-11-30T18:27:37.628Z  INFO quickwit_serve::rest: Searcher ready to accept requests at http://0.0.0.0:7280/
2022-11-30T18:27:42.654Z  INFO quickwit_indexing::actors::indexer: new-split split_id="01GK4WPTXK8GH3AGTRNBN9A8YG" partition_id=0
2022-11-30T18:27:52.643Z  INFO quickwit_indexing::actors::indexer: send-to-index-serializer commit_trigger=Timeout split_ids=01GK4WPTXK8GH3AGTRNBN9A8YG num_docs=22
2022-11-30T18:27:52.652Z  INFO index_batch{index_id=otel-log-v0 source_id=_ingest-api-source pipeline_ord=0}:packager: quickwit_indexing::actors::packager: start-packaging-splits split_ids=["01GK4WPTXK8GH3AGTRNBN9A8YG"]
2022-11-30T18:27:52.652Z  INFO index_batch{index_id=otel-log-v0 source_id=_ingest-api-source pipeline_ord=0}:packager: quickwit_indexing::actors::packager: create-packaged-split split_id="01GK4WPTXK8GH3AGTRNBN9A8YG"
2022-11-30T18:27:52.653Z  INFO index_batch{index_id=otel-log-v0 source_id=_ingest-api-source pipeline_ord=0}:uploader: quickwit_indexing::actors::uploader: start-stage-and-store-splits split_ids=["01GK4WPTXK8GH3AGTRNBN9A8YG"]
2022-11-30T18:27:52.733Z  INFO index_batch{index_id=otel-log-v0 source_id=_ingest-api-source pipeline_ord=0}:uploader:stage_and_upload{split=01GK4WPTXK8GH3AGTRNBN9A8YG}:store_split: quickwit_indexing::split_store::indexing_split_store: store-split-remote-success split_size_in_megabytes=0.018351 num_docs=22 elapsed_secs=0.07654519 throughput_mb_s=0.23974074 is_mature=false
```

If you see some errors there, it's probably coming from a misconfiguration of your object storage. If you need some help, please open an issue on [GitHub](https://github.com/quickwit-oss/quickwit) or come on our [discord server](https://discord.gg/MT27AG5EVE).


### Ready to search logs

You are now ready to search, wait 30 seconds and you will see the first indexed logs: just [open the UI](http://localhost:7280/ui/search?query=*&index_id=otel-logs-v0&max_hits=10&sort_by=-timestamp_secs) and play with it. Funny thing you will see quickwit logs in it :).

Example of queries:

- [body.message:quickwit](http://localhost:7280/ui/search?query=body.message:quickwit&index_id=otel-logs-v0&max_hits=10&sort_by=-timestamp_secs)
- [resource_attributes.k8s.container.name:quickwit](http://localhost:7280/ui/search?query=resource_attributes.k8s.container.name%3Aquickwit&index_id=otel-logs-v0&max_hits=10&sort_by=-timestamp_secs)
- [resource_attributes.k8s.container.restart_count:1](http://localhost:7280/ui/search?query=resource_attributes.k8s.container.restart_count%3A1&index_id=otel-logs-v0&max_hits=10&sort_by=-timestamp_secs)


![UI screenshot](../../assets/screenshot-ui-otel-logs.png)

That's all, folks!

### Clean up

Let's first delete the index and then uninstall the charts.

```bash
# Delete the index. The command will return the list of delete split files.
curl -XDELETE http://127.0.0.1:7280/api/v1/indexes/otel-logs-v0

# Uninstall charts
helm uninstall otel-collector
helm uninstall quickwit

# Delete namespace
kubectl delete namespace qw-tutorial
```

Finally, you need to delete three JSON files created by Quickwit on your object storage:

```bash
# if your version <= 0.7.1
aws s3 rm ${DEFAULT_INDEX_ROOT_URI}/indexes_states.json
# if your version > 0.7.1
aws s3 rm ${DEFAULT_INDEX_ROOT_URI}/manifest.json
# the metastore file of the logs index
aws s3 rm ${DEFAULT_INDEX_ROOT_URI}/otel-logs-v0_7/metastore.json
# the metastore file of the traces index
aws s3 rm ${DEFAULT_INDEX_ROOT_URI}/otel-traces-v0_7/metastore.json
```

## Next step

Follow our [tutorial](../../get-started/tutorials/trace-analytics-with-grafana.md) to install Quickwit Grafana plugin to explore your logs, create dashboards and alerts.


================================================
FILE: docs/log-management/send-logs/using-otel-collector.md
================================================
---
title: Send logs from OTEL Collector
sidebar_label: Using OTEL collector
description: Using OTEL Collector
tags: [otel, collector, log]
sidebar_position: 1
---

import Tabs from '@theme/Tabs';
import TabItem from '@theme/TabItem';

If you already have your own OpenTelemetry Collector and want to export your logs to Quickwit, you need a new OLTP gRPC exporter in your config.yaml:

<Tabs>

<TabItem value="macOS_windows" label="macOS/Windows">

```yaml title="otel-collector-config.yaml"
receivers:
  otlp:
    protocols:
      grpc:
      http:

processors:
  batch:

exporters:
  otlp/quickwit:
    endpoint: host.docker.internal:7281
    tls:
      insecure: true  
    # By default, logs are sent to the otel-logs-v0_7.
    # You can customize the index ID By setting this header.
    # headers:
    #   qw-otel-logs-index: otel-logs-v0_7
service:
  pipelines:
    logs:
      receivers: [otlp]
      processors: [batch]
      exporters: [otlp/quickwit]
```

</TabItem>

<TabItem value="linux" label="Linux">

```yaml title="otel-collector-config.yaml"
receivers:
  otlp:
    protocols:
      grpc:
      http:

processors:
  batch:

exporters:
  otlp/quickwit:
    endpoint: 127.0.0.1:7281
    tls:
      insecure: true
    # By default, logs are sent to the otel-logs-v0_7.
    # You can customize the index ID By setting this header.
    # headers:
    #   qw-otel-logs-index: otel-logs-v0_7

service:
  pipelines:
    logs:
      receivers: [otlp]
      processors: [batch]
      exporters: [otlp/quickwit]
```

</TabItem>

</Tabs>


## Test your OTEL configuration

1. [Install](../../get-started/installation.md) and start a Quickwit server:
   
```bash
./quickwit run
```

2. Start a collector with the previous config:

<Tabs>

<TabItem value="macOS_windows" label="macOS/Windows">

```bash
docker run -v ${PWD}/otel-collector-config.yaml:/etc/otelcol/config.yaml -p 4317:4317 -p 4318:4318 -p 7281:7281 otel/opentelemetry-collector
```

</TabItem>

<TabItem value="linux" label="Linux">

```bash
docker run -v ${PWD}/otel-collector-config.yaml:/etc/otelcol/config.yaml --network=host -p 4317:4317 -p 4318:4318 -p 7281:7281 otel/opentelemetry-collector
```

</TabItem>

</Tabs>

3. Send a log to your collector with cURL:

```bash
curl -XPOST "http://localhost:4318/v1/logs" -H "Content-Type: application/json" \
--data-binary @- << EOF
{
 "resource_logs": [
   {
     "resource": {
       "attributes": [
         {
           "key": "service.name",
           "value": {
             "stringValue": "test-with-curl"
           }
         }
       ]
     },
     "scope_logs": [
       {
         "scope": {
           "name": "manual-test"
         },
         "log_records": [
           {
             "time_unix_nano": "1678974011000000000",
             "observed_time_unix_nano": "1678974011000000000",
             "name": "test",
             "severity_text": "INFO"
           }
         ]
       }
     ]
   }
 ]
}
EOF
```

You should see a log on the Quickwit server similar to the following:

```bash
2023-03-16T13:44:09.369Z  INFO quickwit_indexing::actors::indexer: new-split split_id="01GVNAKT5TQW0T2QGA245XCMTJ" partition_id=6444214793425557444
```

This means that Quickwit has received the log and created a new split. Wait for the split to be published before searching for logs.


================================================
FILE: docs/log-management/send-logs/using-vector.md
================================================
---
title: Send logs from Vector
sidebar_label: Using Vector
description: A simple tutorial to send logs from Vector to Quickwit in a few minutes.
icon_url: /img/tutorials/vector-logo.png
tags: [logs, ingestion]
sidebar_position: 3
---

import Tabs from '@theme/Tabs';
import TabItem from '@theme/TabItem';

[Vector](https://vector.dev/) is an amazing piece of software (in Rust obviously) and brings a new fresh wind in the observability space,
it is well-known for collecting logs from every part of your infrastructure, transforming and aggregating them, and finally forwarding them to a sink.

In this guide, we will show you how to connect it to Quickwit.

## Start Quickwit server

<Tabs>

<TabItem value="cli" label="CLI">

```bash
# Create Quickwit data dir.
mkdir qwdata
./quickwit run
```

</TabItem>

<TabItem value="docker" label="Docker">

```bash
# Create Quickwit data dir.
mkdir qwdata
docker run --rm -v $(pwd)/qwdata:/quickwit/qwdata -p 7280:7280 quickwit/quickwit run
```

</TabItem>

</Tabs>

## Taking advantage of Quickwit's native support for logs

Let's embrace the OpenTelemetry standard and take advantage of Quickwit features. With the native support for OpenTelemetry standards, Quickwit already comes with an index called `otel-logs_v0_7` that is compatible with the OpenTelemetry [logs data model](https://github.com/open-telemetry/opentelemetry-specification/blob/main/specification/logs/data-model.md). This means we can start pushing log data without any prior usual index setup.

The OpenTelemetry index configuration can be found in the [quickwit-opentelemetry/src/otlp/logs.rs](https://github.com/quickwit-oss/quickwit/blob/main/quickwit/quickwit-opentelemetry/src/otlp/logs.rs) source file.

## Setup Vector

Our sink here will be Quickwit ingest API `http://127.0.0.1:7280/api/v1/otel-logs-v0_7/ingest`.
To keep it simple in this tutorial, we will use a log source called `demo_logs` that generates logs in a given format. Let's choose the common `syslog` format
(Vector does not generate logs in the OpenTelemetry format directly!) and use the transform feature to map the `syslog` format into the OpenTelemetry format.


```toml title=vector.toml
[sources.generate_syslog]
type = "demo_logs"
format = "syslog"
count = 100000
interval = 0.001

[transforms.remap_syslog]
inputs = [ "generate_syslog"]
type = "remap"
source = '''
  structured = parse_syslog!(.message)
  .timestamp_nanos = to_unix_timestamp!(structured.timestamp, unit: "nanoseconds")
  .body = structured
  .service_name = structured.appname
  .resource_attributes.source_type = .source_type
  .resource_attributes.host.hostname = structured.hostname
  .resource_attributes.service.name = structured.appname
  .attributes.syslog.procid = structured.procid
  .attributes.syslog.facility = structured.facility
  .attributes.syslog.version = structured.version
  .severity_text = if includes(["emerg", "err", "crit", "alert"], structured.severity) {
    "ERROR"
  } else if structured.severity == "warning" {
    "WARN"
  } else if structured.severity == "debug" {
    "DEBUG"
  } else if includes(["info", "notice"], structured.severity) {
    "INFO"
  } else {
   structured.severity
  }
  .scope_name = structured.msgid
  del(.message)
  del(.timestamp)
  del(.service)
  del(.source_type)
'''

# useful to see the logs in the terminal
# [sinks.emit_syslog]
# inputs = ["remap_syslog"]
# type = "console"
# encoding.codec = "json"

[sinks.quickwit_logs]
type = "http"
method = "post"
inputs = ["remap_syslog"]
encoding.codec = "json"
framing.method = "newline_delimited"
uri = "http://127.0.0.1:7280/api/v1/otel-logs-v0_7/ingest"
```
Download the above Vector config file.

```bash
curl -o vector.toml https://raw.githubusercontent.com/quickwit-oss/quickwit/main/config/tutorials/vector-otel-logs/vector.toml
```

Now let's start Vector so that we can start sending logs to Quickwit.

```bash
docker run -v $(pwd)/vector.toml:/etc/vector/vector.toml:ro -p 8383:8383 --net=host timberio/vector:0.25.0-distroless-libc
```

## Search logs

Quickwit is now ingesting logs coming from Vector and you can search them either with `curl` or by using the UI:
- `curl -XGET http://127.0.0.1:7280/api/v1/otel-logs-v0_7/search?query=severity_text:ERROR`
- Open your browser at `http://127.0.0.1:7280/ui/search?query=severity_text:ERROR&index_id=otel-logs-v0_7&max_hits=10` and play with it!

## Compute aggregation on severity_text

For aggregations, we can't use yet Quickwit UI but we can use cURL.

Let's craft a nice aggregation query to count how many `INFO`, `DEBUG`, `WARN`, and `ERROR` per minute (all datetime are stored in microseconds thus the interval of 60_000_000 microseconds) we have:

```json title=aggregation-query.json
{
  "query": "*",
  "max_hits": 0,
  "aggs": {
    "count_per_minute": {
      "histogram": {
          "field": "timestamp_nanos",
          "interval": 60000000
      },
      "aggs": {
        "severity_text_count": {
          "terms": {
            "field": "severity_text"
          }
        }
      }
    }
  }
}
```

```bash
curl -XPOST -H "Content-Type: application/json" http://127.0.0.1:7280/api/v1/otel-logs-v0_7/search --data @aggregation-query.json
```

## Going further

Now you can also deploy Grafana and connect to Quickwit as data source for query, dashboard, alerts and more!


================================================
FILE: docs/log-management/supported-agents.md
================================================
---
title: Supported agents
sidebar_position: 3
---

Quickwit is compatible with the following agents:

## OpenTelemetry agent

Before using an [OpenTelemetry collector](https://opentelemetry.io/docs/collector/), check that [Quickwit OpenTelemetry service](otel-service.md) is enabled.
Once started, Quickwit is then ready to receive and ingest OpenTelemetry gRPC requests.

Here is a configuration example of an OpenTelemetry agent that sends logs into Quickwit:

```yaml
mode: daemonset
presets:
  logsCollection:
    enabled: true
  kubernetesAttributes:
    enabled: true
config:
  exporters:
    otlp:
      # Replace quickwit-host with the hostname of your Quickwit node/service.
      # On k8s, it should be of the form `{quickwit-indexer-service-name}.{namespace}.svc.cluster.local:7281
      endpoint: quickwit-host:7281
      tls:
        insecure: true
  service:
    pipelines:
      logs:
        exporters:
          - otlp
```

Find more configuration details on the [OpenTelemetry documentation](https://opentelemetry.io/docs/collector/configuration/). You can also check out our [tutorial to send logs with OTEL collector](send-logs/using-otel-collector.md) to Quickwit.

## HTTP-based agents

It's also possible to use other agents that send HTTP requests to Quickwit Ingest API. Quickwit also partially supports Elasticseardch `_bulk` API. Thus, there is a good chance that your agent is already compatible with Quickwit.
Currently, we have tested the following HTTP-based agents:

- [Vector](send-logs/using-vector.md)
- [Fluentbit](send-logs/using-fluentbit.md)
- FluentD (tutorial coming soon)
- Logstash: Quickwit does not support the Elasticsearch output. However, it's possible to send logs with the HTTP output but with `json` [format](https://www.elastic.co/guide/en/logstash/current/plugins-outputs-http.html) only.

Quickwit natively supports the [OpenTelemetry Protocol (OTLP)](https://opentelemetry.io/docs/reference/specification/protocol/otlp/) and provides a gRPC endpoint to receive logs from an OpenTelemetry collector by default.

The logs received by this endpoint are indexed on  the `otel-logs-v0` index. This index will be automatically created if not present. The index doc mapping is described in this [section](#opentelemetry-logs-data-model).

You can also send your logs directly to this index by using the [ingest API](/docs/reference/rest-api.md#ingest-data-into-an-index).

## OpenTelemetry service

Quickwit natively supports the [OpenTelemetry Protocol (OTLP)](https://opentelemetry.io/docs/reference/specification/protocol/otlp/) and provides a gRPC endpoint to receive spans from an OpenTelemetry collector. This endpoint is enabled by default.

When enabled, Quickwit will start the gRPC service ready to receive spans from an OpenTelemetry collector. The spans are indexed in the `otel-trace-v0_7` index by default, and this index will be automatically created if not present. The index doc mapping is described in the next [section](#trace-and-span-data-model).

If for any reason, you want to disable this endpoint, you can:
- Set the `QW_ENABLE_OTLP_ENDPOINT` environment variable to `false` when starting Quickwit.
- Or [configure the node config](/docs/configuration/node-config.md) by setting the indexer setting `enable_otlp_endpoint` to `false`.

```yaml title=node-config.yaml
# ... Indexer configuration ...
indexer:
    enable_otlp_endpoint: false
```


================================================
FILE: docs/operating/_category_.yaml
================================================
label: 'Operating Quickwit'
position: 7
collapsed: true


================================================
FILE: docs/operating/aws-costs.md
================================================
---
title: AWS Cost Optimization
sidebar_position: 3
---

Quickwit has been tested on Amazon S3. This page sums up what we have learned from that experience.

## Real World Example
In this [blog post](https://quickwit.io/blog/benchmarking-quickwit-engine-on-an-adversarial-dataset#indexing-costs), we indexed 23 TB of data and evaluated performance and costs.
You may be able to deduce the costs of indexing and querying on your dataset.

## Data transfers costs and latency

Cloud providers charge for data transfers in and out of their networks. In addition, querying an index from a remote machine adds some extra latency.
For those reasons, we recommend that you test and use the Quickwit from an instance located within your cloud provider's network.

## Optimizing bandwidth with wisely chosen instances

We recommend picking instances with high network performance to allow faster downloads from Amazon S3. In our experience, `c5n.2xlarge` instances offer the best bang for your buck.

## Requests cost

A final note on object storage requests costs. These are [quite low](https://aws.amazon.com/s3/pricing/) actually, $0,0004 / 1000 requests for GET and $0.005 / 1000 requests for PUT on AWS S3.

### PUT requests

During indexing, Quickwit uploads new splits on Amazon S3 and progressively merges them until they reach 10 million documents that we call “mature splits”. Such splits have a typical size between 1GB and 10GB and will usually require 2 PUT requests to be uploaded (1 PUT request / 5GB).

With default indexing parameters `commit_timeout_secs` of 60 seconds and `merge_policy.merge_factor` of 10 and assuming you want to ingest 1 million documents every minute, this will cost you less than $1 / month.

### GET requests

When querying, Quickwit needs to make multiple GET requests:

```jsx
#num requests = #num splits * ((#num search fields * #num terms * 3) + (#num search fields with fieldnorms enabled) + 1 (timestamp fast field if present)) + #num docs returned
```

The above formula assumes that the hotcache is cached, which will be loaded after the first query for every split.
`#num splits` can be reduced with [pruning](../overview/concepts/querying.md).

When positions are not enabled, only 2 GET requests will be executed per term.

These requests costs could add up quickly if you have a high number of splits or QPS > 10.
Don't hesitate to [contact us](mailto:hello@quickwit.io) if this is the case :).


================================================
FILE: docs/operating/data-directory.md
================================================
---
title: Data directory
sidebar_position: 1
---

Quickwit operates on a local directory to store temporary files. By default, this working directory is named `qwdata` and placed right next to the Quickwit binary.

Let's have a look at how Quickwit organizes the data directory.

## Data directory layout

When operating Quickwit, you will end up with the following tree:

```bash
qwdata
├── cache
│   └── splits
|       ├── 03BSWV41QNGY5MZV9JYAE1DCGA.split
│       └── 01GSWV41QNGY5MZV9JYAE1DCB7.split
├── delete_task_service
│   └── wikipedia%01H13SVKDS03P%TpCfrA
├── indexing
│   ├── wikipedia%01H13SVKDS03P%_ingest-api-source%RbaOAI
│   └── wikipedia%01H13SVKDS03P%kafka-source%cNqQtI
├── wal
│   ├── wal-00000000000000000056
│   └── wal-00000000000000000057
└── queues
    ├── partition_id
    ├── wal-00000000000000000028
    └── wal-00000000000000000029
```

### `/queues` and `/wal` directories
 
These directories are created only if the ingest API service is running on your node. They contain write ahead log files of the ingest API to guard against data loss. The `/queues` directory is used by the legacy version of the ingest (sometimes referred to as ingest V1). It is meant to be phased out in upcoming versions of Quickwit. Learn more about ingest API versions [here](../ingest-data/ingest-api.md#ingest-api-versions).

The log file is truncated when Quickwit commits a split (piece of index), which means that the split is stored on the storage and its metadata are in the metastore.

You can configure `max_queue_memory_usage` and `max_queue_disk_usage` in the [node config file](../configuration/node-config.md#ingest-api-configuration) to limit the max disk usage.

### `/indexing` directory

This directory holds the local indexing directory of each indexing source of each index managed by Quickwit. In the above tree, you can see two directories corresponding to the `wikipedia` index, which means that index is currently handling two sources.


### `/delete_task_service` directory

This directory is used by the Janitor service to apply deletes on indexes. During this process, splits are downloaded, a new split is created while applying deletes and uploaded to the target storage. This directory gets created only on nodes running the Janitor service.

### `/cache` directory

This directory is used for caching splits that will undergo a merge operation to save disk IOPS. Splits are evicted if they are older than two days. If cache limits are reached, oldest splits are evicted.

You can [configure](../configuration/node-config#indexer-configuration) the number of splits the cache can hold with `split_store_max_num_splits` and limit the overall size in bytes of splits with `split_store_max_num_bytes`.

### `/searcher-split-cache` directory

This directory is used by searcher nodes to cache entire splits and reduce calls to the object store. It won't be created unless you set the `split_cache` fields in the [searcher configuration](../configuration/node-config.md#searcher-configuration).


## Setting the right splits cache limits

Caching splits saves disk IOPS when Quickwit needs to merge splits.

Setting the right limits will depend on your [merge policy](../configuration/index-config.md#merge-policies) and the number of partitions you are using. The default splits cache limits should fit most use cases.

### Splits cache with the default configuration

For a given index, Quickwit commits one split every minute and uses the "Stable log" [merge policy](../configuration/index-config.md#merge-policies). This merge policy by default merges splits by group of 10, 11, or 12 until splits have more than 10 millions of documents. A split will typically undergo 3 or 4 merges and after will be considered as mature and evicted from the cache.

The following table shows how many splits will be created after a given amount of time assuming a 20MB/s ingestion rate with a compression ratio of 0.5:

| Time (minutes) | Number of splits                       | Splits size (GB) |
| -------------- | -------------------------------------- | ----------- |
| 1              | 1                                      | 0.6 GB      |
| 2              | 2                                      | 1.2 GB      |
| 10             | 10                                     | 6 GB        |
| 11             | 1 + 1 (merged once)                    | 6.6 GB      |
| 21             | 1 + 2 (merged once)                    | 12.6 GB     |
| 91             | 1 + 9 (merged once)                    | 54.6 GB     |
| 101            | 1 + 1 (merged twice)                   | 60.6 GB     |
| 111            | 2 + 1 (merged once) + 1 (merged twice) | 66.6 GB     |
| 201            | 1 + 0 (merged once) + 2 (merged twice) | 120.6 GB    |
| ..             | ...                                    |             |

In this case, the default cache limits of 1000 splits and 100GB are good enough to avoid downloading splits from the storage for the first two merges. This is perfectly fine for a production use case. You may want to increase the splits cache size to avoid any split download.

You can monitor the download rate with our [indexers dashboard](monitoring.md).

### Splits cache with partitioning

When using [partitions](../overview/concepts/querying.md#partitioning), Quickwit will create one split per partition and the number of splits can add up very quickly.

Let's take a concrete example with the following assumptions:
- A [commit timeout](../configuration/index-config.md#indexing-settings) of 1 minute.
- A partitioning that has 100 partitions. Quickwit will create 100 splits per minute assuming a document of each partition is ingested in one minute.
- A merge policy that merges splits of same partition as soon as there is 10 splits.

The following table shows how many splits will be created after a given amount of time:

| Time (minutes) | Number of splits |
| ------------ | ---------------- |
| 1            | 100              |
| 2            | 200              |
| 10           | 1000             |
| 11           | 100 + 100 (merged once) |
| 21           | 100 + 200 (merged once) |
| 91           | 100 + 900 (merged once) |
| 100          | 1000 + 900 (merged once) |
| 101          | 100 + 0 (merge once) + 100 (merged twice) |
| 200          | 1000 + 900 (merged once) + 100 (merged twice) |
| 201          | 100 + 0 (merged once) + 200 (merged twice) |

With these assumptions, you have to set `split_store_max_num_splits` to at least 1000 to avoid downloading splits from the storage for the first merge operation. And as merging can take a bit of time, you should set `split_store_max_num_splits` to a value that can hold all the splits that are not yet merged plus the incoming splits, a value of 1100 splits should be enough. If you want to store split until the second merge, a limit of 2500 splits should be good enough.

## Troubleshooting with a huge number of local splits

When starting, Quickwit is scanning all the splits in the cache directory to know which split is present locally, this can take a few minutes if you have tens of thousands splits. On Kubernetes, as your pod can be restarted if it takes too long to start, you may want to clean up the data directory or increase the liveliness probe timeout.
Also please report such a behavior on [GitHub](https://github.com/quickwit-oss/quickwit) as we can certainly optimize this start phase.


================================================
FILE: docs/operating/monitoring.md
================================================
---
title: Monitoring with Grafana
sidebar_position: 2
---

You can monitor your Quickwit cluster with Grafana.
Follow the tutorial at [Quickwit Monitoring with Grafana](../get-started/tutorials/prometheus-metrics) on how to set it up.

We provide three Grafana dashboards to help you monitor:
- [indexers performance](https://github.com/quickwit-oss/quickwit/blob/main/monitoring/grafana/dashboards/indexers.json)
- [searchers performance](https://github.com/quickwit-oss/quickwit/blob/main/monitoring/grafana/dashboards/searchers.json)
- [metastore queries](https://github.com/quickwit-oss/quickwit/blob/main/monitoring/grafana/dashboards/metastore.json)

Dashboards rely on a prometheus datasource fed with [Quickwit metrics](../reference/metrics.md).

## Screenshots

![Indexers Grafana Dashboard](../assets/images/screenshot-indexers-grafana-dashboard.png)

![Searchers Grafana Dashboard](../assets/images/screenshot-searchers-grafana-dashboard.png)

![Metastore Grafana Dashboard](../assets/images/screenshot-metastore-grafana-dashboard.png)


================================================
FILE: docs/operating/upgrades.md
================================================
---
title: Version upgrade
sidebar_position: 4
---

## Migration from 0.6.x to 0.7.0

The format of the index and internal objects stored in the metastore of 0.7 is backward compatible with 0.6.

If you are using the OTEL indexes and ingesting data into indexes the `otel-logs-v0_6` and `otel-traces-v0_6`, you must stop indexing before upgrading. Indeed, the first time you start Quickwit 0.7, it will update the doc mapping fields of Trace ID and Span ID of those two indexes by changing their input/output formats from `base64` to `hex`. This is automatic: you don't have to perform any manual operation.

Quickwit 0.7 will also create the new index `otel-traces-v0_7`, which is now used by default when ingesting data with the OTEL gRPC and HTTP API. The Jaeger gRPC and HTTP APIs will query both `otel-traces-v0_6` and `otel-traces-v0_7` by default. It's possible to define the index ID you want to use for OTEL gRPC endpoints and Jaeger gRPC API by setting the request header `qw-otel-logs-index` or `qw-otel-traces-index` to the index ID you want to target.


## Migration from 0.7.0 to 0.7.1

Quickwit 0.7.1 will create the new index `otel-logs-v0_7` which is now used by default when ingesting data with the OTEL gRPC and HTTP API.

In the traces index `otel-traces-v0_7`, the `service_name` field is now `fast`. 
No migration is done if `otel-traces-v0_7` already exists. If you want `service_name` field to be `fast`, you have to delete first the existing `otel-traces-v0_7` index or you need to create your own index.

## Migration from 0.8 to 0.9

Quickwit 0.9 introduces a new ingestion service to to power the ingest and bulk APIs (v2). The new ingest is enabled and used by default, even though the legacy one (v1) remains enabled to finish indexing residual data in the legacy write ahead logs. Note that `ingest_api.max_queue_disk_usage` is enforced on both ingest versions separately, which means that the cumulated disk usage might be up to twice this limit.

When upgrading to 0.9, we recommend to perform a full cluster restart.

<!--
Reasons:
- Ingested data into previously existing indexes on upgraded indexer nodes will not be picked by the indexing pipelines until the control plane is upgraded.
- The indexing plan is computed differently in 0.9, all pipelines will be restarted when upgrading the control plane.
- If you intend to enable compression for the ingest service (`ingest_api.grpc_compression_algorithm`), you must do so in two steps: first, upgrade the indexer nodes with compression disabled, then update the node configuration to enable compression, and finally restart the indexer nodes.
- Obscure bug raised in https://github.com/quickwit-oss/quickwit/issues/5787#issuecomment-2979470315
-->

Shutdown order:
1) indexers, searchers and janitor
2) control plane
3) metastores

Start up order:
1) metastores
2) control plane
3) indexers, searchers and janitor


================================================
FILE: docs/overview/_category_.yaml
================================================
label: 'Introduction'
position: 1
collapsed: true


================================================
FILE: docs/overview/architecture.md
================================================
---
title: Architecture
sidebar_position: 2
---

Quickwit distributed search engine relies on 4 major services and one maintenance service:

- The Searchers for executing search queries from the REST API.
- The Indexers that index data from data sources.
- The Metastore that stores the index metadata in a PostgreSQL-like database or in a cloud storage file.
- The Control plane that schedules indexing tasks to the indexers.
- The Janitor that executes periodic maintenance tasks.

Moreover, Quickwit leverages existing infrastructure by relying on battled-tested technologies for index storage, metadata storage, and ingestion:

- Cloud storage like AWS S3, Google Cloud Storage, Azure Blob Storage or other S3 compatible storage for index storage.
- Postgresql for metadata storage.
- Distributed queues like Kafka and Pulsar for ingestion.

## Architecture diagram

The following diagram shows a Quickwit cluster with its four major components and the janitor whose role is to execute periodic maintenance tasks, see the [Janitor section](#janitor) for more details.

![Quickwit Architecture](../assets/images/quickwit-architecture-light.svg#gh-light-mode-only)![Quickwit Log Management](../assets/images/quickwit-architecture-dark.svg#gh-dark-mode-only)

## Index & splits

A Quickwit index stores documents and makes it possible to query them efficiently. The index organizes documents into a collection of smaller independent indexes called **splits**.

A document is a collection of fields. Fields can be stored in different data structures:

- an inverted index, which enables fast full-text search.
- a columnar storage called `fast field`. It is the equivalent of doc values in [Lucene](https://lucene.apache.org/). Fast fields are required to compute aggregates over the documents matching a query. They can also allow some advanced types of filtering.
- a row-storage called the doc store. It makes it possible to get the content of the matching documents.

You can configure your index to control how to map your JSON object to a Quickwit document and, for each field, define whether it should be stored, indexed, or be a fast field. [Learn how to configure your index](../configuration/index-config.md)

### Splits

A split is a small piece of an index identified by a UUID. For each split, Quickwit adds up a `hotcache` file along with index files. This **hotcache** is what makes it possible for Searchers to open a split in less than 60ms, even on high latency storage.

The Quickwit index is aware of its splits by keeping splits metadata, notably:

- the split state which indicates if the split is ready for search
- the min/max time range computed on the timestamp field if present.

This timestamp metadata can be handy at query time. If the user specifies a time range filter to their query, Quickwit will use it to **prune irrelevant splits**.

Index metadata needs to be accessible by every instance of the cluster. This is made possible thanks to the `metastore`.

### Index storage

Quickwit stores the indexes data (splits files) on cloud storage (AWS S3, Google Cloud Storage, Azure Blob Storage or other S3 compatible storage) and also on local disk for single-server deployment.

## Metastore

Quickwit gathers index metadata into a metastore to make them available across the cluster. 

On the write path, indexers push index data on the index storage and publish metadata to the metastore.

On the read path, for a given query on a given index, a search node will ask the metastore for the index metadata and then use it to do the query planning and finally execute the plan.

In a clustered deployment, the metastore is typically a traditional RDBMS like PostgreSQL which we only support today. In a single-server deployment, it’s also possible to rely on a local file or on Amazon S3.

## Quickwit cluster and services

### Cluster formation

Quickwit uses [chitchat](https://github.com/quickwit-oss/chitchat), a cluster membership protocol with failure detection implemented by Quickwit. The protocol is inspired by Scuttlebutt reconciliation and phi-accrual detection, ideas borrowed from Cassandra and DynamoDB.

[Learn more on chitchat](https://github.com/quickwit-oss/chitchat).

### Indexers

See [dedicated indexing doc page](./concepts/indexing.md).

### Searchers

Quickwit's search cluster has the following characteristics:

- It is composed of stateless nodes: any node can answer any query about any splits.
- A node can distribute search workload to other nodes.
- Load-balancing is made with rendezvous hashing to allow for efficient caching.

This design provides high availability while keeping the architecture simple.

**Workload distribution: root and leaf nodes**

Any search node can handle any search request. A node that receives a query will act as the root node for the span of the request. It will then process it in 3 steps:

- Get the index metadata from the metastore and identify the splits relevant to the query.
- Distributes the split workload among the nodes of the cluster. These nodes are assuming the role of leaf nodes.
- Waits for results from leaf nodes, merges them, and returns the aggregated results.

**Stateless nodes**

Quickwit cluster distributes search workloads while keeping nodes stateless.

Thanks to the hotcache, opening a split on Amazon S3 only takes 60ms. It makes it possible to remain totally stateless: a node does not need to know anything about the indexes. Adding or removing nodes takes seconds and does not require moving data around.

**Rendezvous hashing**

The root node uses [Rendezvous hashing](https://en.wikipedia.org/wiki/Rendezvous_hashing) to distribute the workload among leaf nodes. Rendez-vous hashing makes it possible to define a node/split affinity function with excellent stability properties when a node joins or leaves the cluster. This trick unlocks efficient caching.

Learn more about query internals on the [querying doc page](./concepts/querying.md).


### Control plane

The control plane service schedules indexing tasks to indexers. The scheduling is executed when the scheduler receives external or internal events and on certains conditions:

- The scheduler listens to metastore events: source create, delete, toggle, or index delete. On each of these events, it will schedule a new plan, named the `desired plan` and send indexing tasks to the indexers.
- On every `HEARTBEAT` (3 seconds), the scheduler controls if the `desired plan` and the indexing tasks running on indexers are in sync. If not, it will reapply the desired plan to indexers.
- Every minute, the scheduler rebuilds a plan with the latest metastore state, and if it differs from the last applied plan, it will apply the new one. This is necessary as the scheduler may have not received all metastore events due to network issues.

### Janitor

The Janitor service runs maintenance tasks on indexes: garbage collection, delete query tasks, and retention policy tasks.

## Data sources

Quickwit supports [multiple sources](../ingest-data/) to ingest data from.

A file is ideal for a one-time ingestion like an initial load, the ingest API or a message queue are ideal to continuously feed data into the system. 

Quickwit indexers connect directly to external message queues like Kafka, Pulsar or Kinesis and guarantee the exactly-once semantics. If you need support for other distributed queues, please vote for yours [here](https://github.com/quickwit-oss/quickwit/issues/1000).


================================================
FILE: docs/overview/concepts/_category_.yaml
================================================
label: 'Advanced concepts'
position: 3
collapsed: true


================================================
FILE: docs/overview/concepts/deletes.md
================================================
---
title: Deletes
sidebar_position: 3
---

Quickwit supports deletes thanks to the [delete API](../../reference/rest-api.md#delete-api). It's important to note that this feature is mainly intended to comply with GDPR (General Data Protection Regulation) and should be used parsimoniously as deletes are expensive: typically a few queries per hour or day is recommended.

## Delete tasks

A delete task on a given index is executed on all splits created before the delete task creation. This can be a long-running task that could last several hours if the delete query is matching documents present in many splits.

To track the progress of the execution, each delete task is given a unique and incremental identifier called "operation stamp" or `opstamp`. All existing splits will undergo a delete operation and, after its success, each split metadata will be updated with the corresponding operation stamp.

All splits created after the creation of a delete tasks will have a `opstamp` greater or equal to the `opstamp` of the delete task (greater if other delete tasks have been created at the same moment).

Quickwit batches delete operations on a given split: for example, if a split has it delete `opstamp = n` and the last created delete task has a `opstamp = n + 10`, ten (10) delete queries will be executed at once on the split.

## Delete API

Delete tasks are created through the [Delete REST API](../../reference/rest-api.md#delete-api).

## Pitfalls

### Immature splits

Delete operations are applied only to “mature” splits, that is splits that will no longer undergo merges. Whether a split is mature depends on the [merge policy](../../configuration/index-config.md#merge-policies). It is possible to define `maturation_period` after which a split will be mature. Thus, a delete request created at `t0` will first apply deletes to mature splits and, in the worst case, will wait the `t0 + maturation_period` for immature splits to become mature.


### Monitoring and dev XP

It's currently not possible to monitor delete operations. An [issue](https://github.com/quickwit-oss/quickwit/issues/2494) is opened to improve the dev experience, don't hesitate to add your comments it and follow its progress.


================================================
FILE: docs/overview/concepts/indexing.md
================================================
---
title: Indexing
sidebar_position: 1
---

## Supported data formats

Quickwit ingests JSON records and refers to them as "documents" or "docs". Each document must be a JSON object. When ingesting files, documents must be separated by a newline.

Quickwit does not yet support file formats such as `Avro` or `CSV`. Compression formats such as `bzip2` or `gzip` are also not supported yet.

## Data model

Quickwit supports both schemaless indexes and fixed schemas. The "document mapping" of an index, also commonly called "doc mapping", is a list of field names and types that declares the schema of an index. For a schemaless or mixed fixed schema and schemaless indexing, follow our [guide on schemaless indexing](../../guides/schemaless.md). Additionally, a doc mapping specifies how documents are indexed (tokenizers) and stored (column-oriented vs. row-oriented).


## Merge process and merge policy

An index is broken into immutable splits. The size of a split is defined by the number of documents it carries. A split is considered "mature" when its size reaches a threshold defined in the index config as `split_num_docs_target`.

An indexer buffers incoming documents and produces a new split when the size of the buffer reaches `split_num_docs_target` or `commit_timeout_secs` seconds have passed since the first document has been enqueued, depending on which event occurs first. In the latter case, the indexer generates immature splits. The merge process designates the iterative procedure that groups and merges immature splits together to produce mature splits.

The merge policy controls the merge algorithm, which is mainly driven by the two parameters `split_num_docs_target` and `merge_factor`. Each time a new split is published, the merge policy examines the list of immature splits and attempts to merge `merge_factor` splits together in order to produce larger splits. The merge policy may also decide to merge fewer or more splits together if deemed necessary. Finally, the merge algorithm never merges more than `max_merge_factor` splits together.

### Split store

The split store is a cache that keeps recently published and immature splits on disk to speed up the merge process. After a successful merge phase, the split store evicts dangling splits.

The disk space allocated to the split store is controlled by the config parameters `split_store_max_num_splits` and `split_store_max_num_bytes`.

## Data sources

A data source designates the location and set of parameters that allow to connect to and ingest data from an external data store, which can be a file, a stream, or a database. Often, Quickwit simply refers to data sources as "sources". The indexing engine supports local adhoc file ingests using [the CLI](/docs/reference/cli#tool-local-ingest) and streaming sources (e.g. the Kafka source). Quickwit can insert data into an index from one or multiple sources. More details can be found [in the source configuration page](https://quickwit.io/docs/configuration/source-config).

## Checkpoint

Quickwit achieves exactly-once processing using checkpoints. For each source, a "source checkpoint" records up to which point documents have been processed in the target file or stream. Checkpoints are stored in the metastore and updated atomically each time a new split is published. When an indexing error occurs, the indexing process is resumed right after the last successfully published checkpoint. Internally, a source checkpoint is represented as an object mapping from absolute paths or partition IDs to offsets or sequence numbers.


================================================
FILE: docs/overview/concepts/querying.md
================================================
---
title: Querying
sidebar_position: 2
---

A search query received by a searcher will be executed using a map-reduce approach following these steps:

1. The Searcher identifies relevant splits based on the request’s [timestamp interval](#time-sharding) and [tags](#tag-pruning).
2. It distributes the splits workload among other searchers available in the cluster using *[rendez-vous hashing](https://en.wikipedia.org/wiki/Rendezvous_hashing)* to optimize caching and load.
3. It finally waits for all results, merges them, and returns them to the client.

A search stream query follows the same execution path as for a search query except for the last step: instead of waiting for each Searcher's result, the searcher streams the results as soon as it starts receiving some from a searcher.

### **Time sharding**

On datasets with a time component, Quickwit will shard data into timestamp-aware splits. With this feature, Quickwit is capable of filtering out most splits before they can make it to the query processing stage, thus reducing drastically the amount of data needed to process the query.

The following query parameters are available to apply timestamped pruning to your query:

- `startTimestamp`: restricts search to documents with a `timestamp >= start_timestamp`
- `endTimestamp`: restricts search to documents with a `timestamp < end_timestamp`

### Tag pruning

Quickwit also provides pruning on a second dimension called `tags`. By [setting a field as tagged](../../configuration/index-config.md) Quickwit will generate split metadata at indexing in order to filter splits that match requested tags at query time. Note that this metadata is only generated when the cardinality of the field is less than 1,000.

Tag pruning is notably useful on multi-tenant datasets.

### Partitioning

Quickwit makes it possible to route documents into different splits based on a partitioning key.

This feature is especially useful in a context where documents with different
tags are all mixed together in the same source (usually a Kafka topic).

In that case, simply marking the field as tag will have no positive effect on search, as all produced splits will contain almost all tags.

The `partition_key` attributes (defined in the doc mapping) lets you configure the logic used by Quickwit to route documents into isolated splits.
Quickwit will also enforce this isolation during merges. This functionality is, in a sense, similar to sharding.

Quickwit supports a simple DSL for partitioning described in the next section.

Partition & tags are often used to:

- separate `tenants` in a multi-tenant application
- separate `team` or `application` in an observation logging case.

Emitting many splits can heavily stress an `indexer`. For this reason,
another parameter of the doc mapping called `max_num_partitions` acts as a safety valve. If the number of partitions is
about to exceed `max_num_partitions`, a single extra partition is created
and all extra partitions will be grouped together into this special partition.

If you are expecting 20 partitions, we strongly recommend you to not set
`max_num_partitions` to 20, but instead use a larger value (200 for instance).
Quickwit should handle that number of partitions smoothly, and it will avoid documents belonging to different partitions from being grouped together due to
a few faulty documents.

### Partition key DSL

Quickwit allows you to configure how document are routed with a simple DSL. Here are some sample expression with a short description of their result:

- `tenant_id`: create one partition per tenant\_id
- `tenant_id,app_id`: create one partition per unique combination of tenant\_id and app\_id
- `tenant_id,hash_mod(app_id, 8)`: for each tenant, create up to 8 partitions containing each data related to some applications
- `hash_mod((tenant_id,app_id), 50)`: create 50 partition in total, containing some combination of tenant and apps.


The partition key DSL is generated by this grammar:
```
RoutingExpr := RoutingSubExpr [ , RoutingExpr ]
RougingSubExpr := Identifier [ \( Arguments \) ]
Identifier := FieldChar [ Identifier ]
FieldChar := { a..z | A..Z | 0..9 | _ }
Arguments := Argument [ , Arguments ]
Argument := { \( RoutingExpr \) | RoutingSubExpr | DirectValue }
# We may want other DirectValue in the future
DirectValue := Number
Number := { 0..9 } [ Number ]
```
Supported functions are currently:
- `hash_mod(RoutingExpr, Number)`: hash `RoutingExpr` and divide the result by `Number`, keeping only the reminder.

When using `hash_mod` with a tuple of key like in `hash_mod((tenant_id,app_id), 50)`, beware it might route together documents which would make tags less effective.
For instance, if tenant\_1,app\_1 and tenant\_2,app\_2 are both sent to partition one, but tenant\_1,app\_2 is sent to partition two, a query for tenant\_1,app\_2 will
still search inside the 1st partition as it will be tagged with tenant\_1,tenant\_2,app\_1 and app\_2. You should therefore prefer a partition key such as
`hash_mod(tenant_id, 10),hash_mod(app_id, 5)` which will generate as many splits, but with better tags.

### Caching

Quickwit does caching in many places to deliver a highly performing query engine.

In memory:

- Hotcache caching: A static cache that holds information about a split file internal representation. It helps speed up the opening of a split file. Its size can be defined via the `split_footer_cache_capacity` configuration parameter.
- Fast field caching: Fast fields tend to be accessed very frequently by users especially for stream requests. They are cached in a RAM whose size can be limited by the `fast_field_cache_capacity` configuration value.
- Partial request caching: In some cases, like when using dashboards, some very similar requests might be issued, with only timestamp bounds changing. Some partial results can be cached to make these requests faster and issue less requests to the storage. They are cached in a RAM whose size can be limited by the `partial_request_cache_capacity` configuration value.

On disk:

- The split cache stores entire splits on disk. It can be enabled by setting the `split_cache` configuration fields. This cache can help reduce object store costs and load. Searchers populate this cache when splits are created or queried and evict them with a simple LRU strategy.

Learn more about cache parameters in the [searcher configuration docs](../../configuration/node-config.md#searcher-configuration).

### Scoring

Quickwit supports sorting docs by their BM25 scores. In order to query by score, [fieldnorms](../../configuration/index-config.md#text-type) must be enabled for the field. By default, BM25 scoring is disabled to improve query latencies but it can be opt-in by setting the `sort_by` option to `_score` in queries.

### Document ID

Each document in Quickwit is assigned a unique document ID, which is a combination of the split ID and the Tantivy DocId within the split. This implies that you cannot assign a custom ID and that the ID changes when splits undergo merges. This ID is used for every search query as sort order (after the explicitly specified sort values) to make the results deterministic.


================================================
FILE: docs/overview/index.md
================================================
---
title: Quickwit documentation
slug: /
sidebar_position: 1
---

import CallToAction from '@theme/CallToAction';

Quickwit is the first engine to execute complex search and analytics queries directly on cloud storage with sub-second latency. Powered by Rust and its decoupled compute and storage architecture, it is designed to be resource-efficient, easy to operate, and scale to petabytes of data.

Quickwit is a great fit for log management, distributed tracing, and generally immutable data such as conversational data (emails, texts, messaging platforms) and event-based analytics.

<CallToAction
heading='Get started with Quickwit'
description='Get up and running in minutes and start harnessing the power of Quickwit today!'
buttontext='GET STARTED'
to='/docs/main-branch/get-started/quickstart'>
</CallToAction>

## Use cases

- [Log management](../log-management/overview.md)
- [Distributed Tracing](../distributed-tracing/overview.md)

## Key concepts

- [Architecture](architecture.md)
- [Indexing](concepts/indexing.md)
- [Querying](concepts/querying.md)

## Reference

- [Configuration](../configuration/index.md)
- [REST API](../reference/rest-api.md)
- [CLI](../reference/cli.md)


================================================
FILE: docs/overview/introduction.md
================================================
---
title: What is Quickwit?
sidebar_position: 1
---

Quickwit is the first engine to execute complex search and analytics queries directly on cloud storage with sub-second latency. Powered by Rust and its decoupled compute and storage architecture, it is designed to be resource-efficient, easy to operate, and scale to petabytes of data.

Quickwit is a great fit for log management, distributed tracing, and generally immutable data such as conversational data (emails, texts, messaging platforms) and event-based analytics.


## Why Quickwit is different from other search engines?

Quickwit is designed for sub-second search straight from object storage allowing true decoupled compute and storage. And it means a lot for your infrastructure:

- You store once for all your data on cheap, safe and unlimited storage.
- You scale out your cluster in seconds, no need to move data around.
- Indexing and search workloads are decoupled, you can scale them independently.
- Your tenants are easily isolated and you can charge them for their usage.

Quickwit is also designed to index and search semi-structured data. Its schemaless indexing allows you to index JSON document with an arbitrary amount of field without heavily impacting your performance. Aggregation are not yet supported but we are working on it, stay tuned!

## When to use Quickwit

Quickwit is a great fit for log management, distributed tracing, and generally immutable data such as conversational data (emails, texts, messaging platforms), event-based analytics,  audit logs, security logs, and more.

Check out our guides to see how you can use Quickwit:

- [Log management](../log-management/overview.md)
- [Distributed Tracing](../distributed-tracing/overview.md)


## Key features

- Full-text search and aggregation queries
- Elasticsearch query language support
- Sub-second search on cloud storage (Amazon S3, Azure Blob Storage, …)
- Decoupled compute and storage, stateless indexers & searchers
- [Schemaless](https://quickwit.io/docs/guides/schemaless) or strict schema indexing
- Schemaless analytics
- [Grafana data source](https://github.com/quickwit-oss/quickwit-datasource)
- [Jaeger-native](https://quickwit.io/docs/distributed-tracing/plug-quickwit-to-jaeger)
- OTEL-native for [logs](https://quickwit.io/docs/log-management/overview) and [traces](https://quickwit.io/docs/distributed-tracing/overview)
- Kubernetes ready - See our [helm-chart](https://quickwit.io/docs/deployment/kubernetes)
- RESTful API

### Enterprise-grade features

- Multiple [data sources](../ingest-data/index.md) Kafka / Kinesis / Pulsar native
- Multi-tenancy: indexing with many indexes and partitioning
- Retention policies
- Delete tasks (for GRPR use cases)
- Distributed and highly available* engine that scales out in seconds (HA indexing only with Kafka)

## When not to use Quickwit

Use cases where you would likely *not* want to use Quickwit include:

- You need a low-latency search for e-commerce websites.
- Your data is mutable.

## Time to discover Quickwit

- [Quickstart](../get-started/quickstart.md)
- [Concepts](architecture.md)
- [Last release blog post](https://quickwit.io/blog/quickwit-0.7)


================================================
FILE: docs/reference/_category_.yaml
================================================
label: 'Reference'
position: 11
collapsed: true


================================================
FILE: docs/reference/aggregation.md
================================================
---
title: Aggregations API
sidebar_position: 30
---

An aggregation summarizes your data as statistics on buckets or metrics.

Aggregations can provide answers to questions like:

- What is the average price of all sold articles?
- How many errors with status code 500 do we have per day?
- What is the average listing price of cars grouped by color?

There are two categories: [Metrics](#metric-aggregations) and [Buckets](#bucket-aggregations).

#### Prerequisite

To be able to use aggregations on a field, the field needs to have a fast field index created. A fast field index is a columnar storage,
where documents values are extracted and stored.

Example to create a fast field on text for term aggregations.
```yaml
name: category
type: text
tokenizer: raw
record: basic
fast: true
```

See the [index configuration](../configuration/index-config.md) page for more details and examples.

#### API Endpoint

The endpoints for aggregations are the search endpoints:
- Quickwit API: `api/v1/<index id>/search`
- Elasticsearch API: `api/v1/_elastic/<index_id>/_search`.

#### Format

The aggregation request and result de/serialize into elasticsearch compatible JSON.
If not documented otherwise you should be able to drop in your elasticsearch aggregation queries.

In some examples below is not the full request shown, but only the payload for `aggregations`.

#### Example

Request
```json skip
{
    "query": "*",
    "max_hits": 0,
    "aggs": {
        "sites_and_aqi": {
            "terms": {
                "field": "County",
                "size": 2,
                "order": { "average_aqi": "asc" }
            },
            "aggs": {
                "average_aqi": {
                    "avg": { "field": "AQI" }
                }
            }
        }
    }
}
```


Response
```json
...
"aggregations": {
    "sites_and_aqi": {
      "buckets": [
        {
          "average_aqi": {
            "value": 32.62267569707098
          },
          "doc_count": 56845,
          "key": "臺東縣"
        },
        {
          "average_aqi": {
            "value": 35.97893635571055
          },
          "doc_count": 28675,
          "key": "花蓮縣"
        }
      ],
      "sum_other_doc_count": 1872055
    }
}
```

### Supported Aggregations

 - Bucket
    - [Histogram](#histogram)
    - [DateHistogram](#date-histogram)
    - [Range](#range)
    - [Terms](#terms)
- Metric
    - [Average](#average)
    - [Count](#count)
    - [Max](#max)
    - [Min](#min)
    - [Stats](#stats)
    - [Sum](#sum)
    - [Percentiles](#percentiles)
    - [Cardinality](#cardinality)


## Bucket Aggregations

BucketAggregations create buckets of documents. Each bucket is associated with a rule which determines whether or not a document falls into it.
In other words, the buckets effectively define document sets. Buckets are not necessarily disjunct, therefore a document can fall into multiple buckets.
In addition to the buckets themselves, the bucket aggregations also compute and return the number of documents for each bucket.
Bucket aggregations, as opposed to metric aggregations, can hold sub-aggregations.
These sub-aggregations will be aggregated for the buckets created by their “parent” bucket aggregation.
There are different bucket aggregators, each with a different “bucketing” strategy.
Some define a single bucket, some define a fixed number of multiple buckets, and others dynamically create the buckets during the aggregation process.


### Histogram

A histogram is a type of bucket aggregation where documents are grouped into buckets based on a fixed interval. Each document's value is "rounded down" to the nearest bucket boundary.

E.g. if we have a price 18 and an interval of 5, the document will fall into the bucket with the key 15. The formula used for this is: `((val - offset) / interval).floor() * interval + offset`.

#### Histogram on datetime fields

See [`DateHistogram`](#date-histogram) for more convenient API for `datetime` fields.

Fields of type `datetime` are handled the same way as any numeric field. However, all values in the requests such as intervals, offsets, bounds, and range boundaries need to be expressed in milliseconds.

Histogram with one bucket per day on a `datetime` field. `interval` needs to be provided in milliseconds.
In the following example, we grouped documents per day (`1 day = 86400000 milliseconds`).
The returned format is currently fixed at `RFC3339`.

##### Request
```json skip
{
  "query": "*",
  "max_hits": 0,
  "aggs": {
    "count_per_day":{
      "histogram":{
        "field": "datetime",
        "interval": 86400000
      }
    }
  }
}
```
##### Response

```json skip
{
  ...
  "aggregations": {
    "count_per_day": {
      "buckets": [
        {
          "doc_count": 1,
          "key": 1546300800000000.0,
          "key_as_string": "2019-01-01T00:00:00Z"
        },
        {
          "doc_count": 2,
          "key": 1546560000000000.0,
          "key_as_string": "2019-01-04T00:00:00Z"
        }
      ]
    }
  }
}
```


#### Returned Buckets

By default buckets are returned between the min and max value of the documents, including empty buckets. Setting `min_doc_count > 0` will filter empty buckets.

The value range of the buckets can be extended via [`extended_bounds`](#extended_bounds) or limit the range via [`hard_bounds`](#hard_bounds).

#### Example

```json
{
    "query": "*",
    "max_hits": 0,
    "aggs": {
        "prices": {
            "histogram": {
                "field": "price",
                "interval": 10
            }
        }
    }
}
```

#### Parameters

###### **field**

The field to aggregate on.

Currently this aggregation only works on fast fields of type `u64`, `f64`, `i64`, and `datetime`.

###### **keyed**

Change response format from an array to a hashmap, `key` in the bucket will be the `key` in the hashmap.

###### **interval**

The interval to chunk your data range. Each bucket spans a value range of [0..interval). Must be larger than 0.

###### **offset**

Intervals implicitly defines an absolute grid of buckets `[interval * k, interval * (k + 1))`.
Offset makes it possible to shift this grid into `[offset + interval * k, offset + interval (k + 1))`. Offset has to be in the range [0, interval).

As an example, if there are two documents with value 8 and 12 and interval 10.0, they would fall into the buckets with the key 0 and 10. With offset 5 and interval 10, they would both fall into the bucket with the key 5 and the range [5..15)

```json
{
    "query": "*",
    "max_hits": 0,
    "aggs": {
        "prices": {
            "histogram": {
                "field": "price",
                "interval": 10,
                "offset": 2.5
            }
        }
    }
}
```


###### **min_doc_count**

The minimum number of documents in a bucket to be returned. Defaults to 0.

###### **hard_bounds**

Limits the data range to [min, max] closed interval.
This can be used to filter values if they are not in the data range.
hard_bounds only limits the buckets, to force a range set both `extended_bounds` and `hard_bounds` to the same range.

```json
{
    "query": "*",
    "max_hits": 0,
    "aggs": {
        "prices": {
            "histogram": {
                "field": "price",
                "interval": 10,
                "hard_bounds": {
                    "min": 0,
                    "max": 100
                }
            }
        }
    }
}
```

###### **extended_bounds**

Can be set to extend your bounds. The range of the buckets is by default defined by the data range of the values of the documents. As the name suggests, this can only be used to extend the value range. If the bounds for min or max are not extending the range, the value has no effect on the returned buckets.
Cannot be set in conjunction with `min_doc_count` > 0, since the empty buckets from extended bounds would not be returned.

```json
{
    "query": "*",
    "max_hits": 0,
    "aggs": {
        "prices": {
            "histogram": {
                "field": "price",
                "interval": 10,
                "extended_bounds": {
                    "min": 0,
                    "max": 100
                }
            }
        }
    }
}
```

### Date Histogram

`DateHistogram` is similar to `Histogram`, but it can only be used with [datetime type](../configuration/index-config#datetime-type) and provides a more convenient API to define intervals.

Like the histogram, values are rounded down to the closest bucket.

The returned format is currently fixed at `Rfc3339`.

##### Limitations
Only fixed time intervals via the `fixed_interval` parameter are supported.
The parameters `interval` and `calendar_interval` are unsupported.

##### Request
```json skip
{
    "query": "*",
    "max_hits": 0,
    "aggs": {
        "sales_over_time": {
            "date_histogram": {
                "field": "sold_at",
                "fixed_interval": "30d"
                "offset": "-4d"
            }
        }
    }
}
```
##### Response

```json skip
{
    ...
    "aggregations": {
        "sales_over_time" : {
            "buckets" : [{
                "key_as_string" : "2015-01-01T00:00:00Z",
                "key" : 1420070400000,
                "doc_count" : 4
            }]
        }
    }
}
```


#### Parameters

###### **field**

The field to aggregate on.

Currently this aggregation only works on fast fields of type `datetime`.

###### **keyed**

Change response format from an array to a hashmap, `key` in the bucket will be the `key` in the hashmap.

###### **interval**

The interval to chunk your data range. Each bucket spans a value range of [0..interval). Must be larger than 0.

Fixed intervals are configured with the `fixed_interval` parameter.
Fixed intervals are a fixed number of SI units and
never deviate, regardless of where they fall on the calendar. One second is always
composed of 1000ms. This allows fixed intervals to be specified in any multiple of the
supported units. However, it means fixed intervals cannot express other units such as
months, since the duration of a month is not a fixed quantity. Attempting to specify a
calendar interval like month or quarter will return an Error.

The accepted units for fixed intervals are:
* `ms`: milliseconds
* `s`: seconds. Defined as 1000 milliseconds each.
* `m`: minutes. Defined as 60 seconds each (60_000 milliseconds).
* `h`: hours. Defined as 60 minutes each (3_600_000 milliseconds).
* `d`: days. Defined as 24 hours (86_400_000 milliseconds).

Fractional time values are not supported, but this can be addressed by shifting to another
time unit (e.g., `1.5h` could instead be specified as `90m`).

###### **offset**

Intervals implicitly define an absolute grid of buckets `[interval * k, interval * (k + 1))`.
Offset makes it possible to shift this grid into `[offset + interval * k, offset + interval (k + 1))`. Offset has to be in the range [0, interval).

This is especially useful when using `fixed_interval`, to shift the first bucket e.g. at the start of the year.

The `offset` parameter has the same syntax as the `fixed_interval` parameter, but also allows for negative values.

###### **min_doc_count**

The minimum number of documents in a bucket to be returned. Defaults to 0.

###### **hard_bounds**
Same as in [`Histogram`](#hard_bounds) but `min` and `max` parameters need to be set as timestamp with milliseconds precision.

###### **extended_bounds**
Same as in [`Histogram`](#extended_bounds) but `min` and `max` parameters need to be set as timestamp with milliseconds precision.

### Range

Provide user-defined buckets to aggregate on. Two special buckets will automatically be created to cover the whole range of values.
The provided buckets have to be continuous. During the aggregation, the values extracted from the fast_field field will be checked against each bucket range.
Note that this aggregation includes the from value and excludes the to value for each range.

#### Limitations/Compatibility

Overlapping ranges are not yet supported.

##### Request
```json skip
{
    "query": "*",
    "max_hits": 0,
    "aggs": {
        "my_scores": {
            "range": {
                "field": "score",
                "ranges": [
                    { "to": 3.0, "key": "low" },
                    { "from": 3.0, "to": 7.0, "key": "medium-low" },
                    { "from": 7.0, "to": 20.0, "key": "medium-high" },
                    { "from": 20.0, "key": "high" }
                ]
            }
        }
    }
}
```

##### Response

```json skip
{
    ...
    "aggregations": {
        "my_scores" : {
            "buckets": [
                {"key": "low", "doc_count": 0, "to": 3.0},
                {"key": "medium-low", "doc_count": 10, "from": 3.0, "to": 7.0},
                {"key": "medium-high", "doc_count": 10, "from": 7.0, "to": 20.0},
                {"key": "high", "doc_count": 80, "from": 20.0}
            ]
        }
    }
}
```

#### Parameters

###### **keyed**

Change response format from an array to a hashmap, the serialized range will be the `key` in the hashmap.
If a custom `key` is provided, it will be used instead.

###### **field**

The field to aggregate on.

Currently this aggregation only works on fast fields of type `u64`, `f64`, `i64`, and `datetime`.

###### **ranges**

The list of buckets, with `from` and `to` values.
The `from` value is inclusive in the range.
The `to` value is not inclusive in the range.
`key` is optional, and will be used as the bucket key in the response.

The first bucket can omit the `from` value, and the last bucket the `to` value.
Note that this aggregation includes the `from` value and excludes the `to` value for each range. Extra buckets will be created until the first `to`, and last `from`, if necessary.

### Terms

Creates a bucket for every unique term and counts the number of occurrences.

Request
```json skip
{
    "query": "*",
    "max_hits": 0,
    "aggs": {
        "genres": {
            "terms": { "field": "genre" }
        }
    }
}
```

Response
```json
...
"aggregations": {
    "genres": {
        "doc_count_error_upper_bound": 0,
        "sum_other_doc_count": 0,
        "buckets": [
            { "key": "drumnbass", "doc_count": 6 },
            { "key": "raggae", "doc_count": 4 },
            { "key": "jazz", "doc_count": 2 }
        ]
    }
}
```


#### Document count error
In Quickwit, we have one segment per split. Therefore the results returned from a split, is equivalent to results returned from a segment.
To improve performance, results from one split are cut off at `shard_size`.
When combining results of multiple splits, terms that
don't make it in the top n of a result from a split increase the theoretical upper bound error by lowest
term-count.

Even with a larger `shard_size` value, doc_count values for a terms aggregation may be
approximate. As a result, any sub-aggregations on the terms aggregation may also be approximate.
`sum_other_doc_count` is the number of documents that didn’t make it into the top size
terms. If this is greater than 0, the terms agg had to throw away some
buckets, either because they didn’t fit into `size` on the root node or they didn’t fit into
`shard_size` on the leaf node.

#### Per bucket document count error
If you set the `show_term_doc_count_error` parameter to true, the terms aggregation will include
doc_count_error_upper_bound, which is an upper bound to the error on the doc_count returned by
each split. It’s the sum of the size of the largest bucket on each split that didn’t fit
into `shard_size`.

#### Parameters

###### **field**

The field to aggregate on.

Currently term aggregation only works on fast fields of type `text`, `f64`, `i64` and `u64`.

###### **size**

By default, the top 10 terms with the most documents are returned. Larger values for size are more expensive.

###### **shard_size**

To obtain more accurate results, we fetch more than the `size` from each segment/split.

Increasing this value will enhance accuracy but will also increase CPU/memory usage. 
Refer to the [`document count error`](#document-count-error) section for more information on how `shard_size` impacts accuracy.

`shard_size` represents the number of terms that are returned from one split. 
For example, if there are 100 splits and `shard_size` is set to 1000, the root node may receive up to 100_000 terms to merge. 
Assuming an average cost of 50 bytes per term, this would require up to 5MB of memory. 
The actual number of terms sent to the root depends on the number of splits handled by one node and how the intermediate results can be merged (e.g., the cardinality of the terms).

Note on differences between Quickwit and Elasticsearch:
* Unlike Elasticsearch, Quickwit does not use global ordinals, so serialized terms need to be sent to the root node.
* The concept of shards in Elasticsearch differs from splits in Quickwit. In Elasticsearch, a shard contains up to 200M documents and is a collection of segments. In contrast, a Quickwit split comprises a single segment, typically with 5M documents. Therefore, `shard_size` in Elasticsearch applies to a group of segments, whereas in Quickwit, it applies to a single segment.

Defaults to `size * 10`.

###### **show_term_doc_count_error**

If you set the show_term_doc_count_error parameter to true, the terms aggregation will include doc_count_error_upper_bound, which is an upper bound to the error on the doc_count returned by each split.
It’s the sum of the size of the largest bucket on each split that didn’t fit into `shard_size`.

Defaults to true when ordering by count desc.


###### **min_doc_count**

Filter all terms that are lower than `min_doc_count`. Defaults to 1.

_Expensive_ : When set to 0, this will return all terms in the field.

###### **missing**

The `missing` parameter defines how documents that are missing a value should be treated.
By default they will be ignored but it is also possible to treat them as if they had a value.
```json skip
{ "field": "genre", "missing": "NO_DATA" }
```

###### **order**

Set the order. String is here a target, which is either “_count”, “_key”, or the name of a metric sub_aggregation.
Single value metrics like average can be addressed by its name. Multi value metrics like stats are required to address their field by name e.g. “stats.avg”.
_Limitation_ : Ordering is only supported by one property currently. Passing an array for `order` is _not_ supported `"order": [{ "average_price": "asc" }, { "_key": "asc" }]`.

Order alphabetically
```json skip
{
    "query": "*",
    "max_hits": 0,
    "aggs": {
        "genres": {
            "terms": {
                "field": "genre",
                "order": { "_key": "asc" }
            }
        }
    }
}
```


Order by sub_aggregation

```json skip
{
    "query": "*",
    "max_hits": 0,
    "aggs": {
        "articles_by_price": {
            "terms": {
                "field": "article_name",
                "order": { "average_price": "asc" }
            },
            "aggs": {
                "average_price": {
                    "avg": { "field": "price" }
                }
            }
        }
    }
}
```


## Metric Aggregations

The aggregations in this family compute metrics based on values extracted from the documents that are being aggregated.
Values are extracted from the fast field of the document. Some aggregations output a single numeric metric (e.g. Average)
and are called single-value numeric metrics aggregation, others generate multiple metrics (e.g. Stats) and are called multi-value numeric metrics aggregation.

In contrast to bucket aggregations, metrics don't allow sub-aggregations, since there is no document set to aggregate on.

### Average

A single-value metric aggregation that computes the average of numeric values that are extracted from the aggregated documents.
Supported field types are `u64`, `f64`, `i64`, and `datetime`.

**Request**
```json skip
{
    "query": "*",
    "max_hits": 0,
    "aggs": {
        "average_price": {
            "avg": { "field": "price" }
        }
    }
}
```

**Response**
```json
{
    "num_hits": 9582098,
    "hits": [],
    "elapsed_time_micros": 101942,
    "errors": [],
    "aggregations": {
        "average_price": {
            "value": 133.7
        }
    }
}
```

#### Parameters

###### **missing**
The `missing` parameter defines how documents that are missing a value should be treated.
By default they will be ignored but it is also possible to treat them as if they had a value.
```json skip
{ "field": "price", "missing": "10.0" }
```

### Count

A single-value metric aggregation that counts the number of values that are extracted from the aggregated documents.
Supported field types are `u64`, `f64`, `i64`, and `datetime`.

**Request**
```json skip
{
    "query": "*",
    "max_hits": 0,
    "aggs": {
        "price_count": {
            "value_count": { "field": "price" }
        }
    }
}
```

**Response**
```json
{
    "num_hits": 9582098,
    "hits": [],
    "elapsed_time_micros": 102956,
    "errors": [],
    "aggregations": {
        "price_count": {
            "value": 9582098
        }
    }
}
```
#### Parameters

###### **missing**
The `missing` parameter defines how documents that are missing a value should be treated.
By default they will be ignored but it is also possible to treat them as if they had a value.
```json skip
{ "field": "price", "missing": "10.0" }
```

### Max

A single-value metric aggregation that computes the maximum of numeric values that are that are extracted from the aggregated documents.
Supported field types are `u64`, `f64`, `i64`, and `datetime`.

**Request**
```json skip
{
    "query": "*",
    "max_hits": 0,
    "aggs": {
        "max_price": {
            "max": { "field": "price" }
        }
    }
}
```

**Response**
```json
{
    "num_hits": 9582098,
    "hits": [],
    "elapsed_time_micros": 101543,
    "errors": [],
    "aggregations": {
        "max_price": {
            "value": 1353.23
        }
    }
}
```
#### Parameters

###### **missing**
The `missing` parameter defines how documents that are missing a value should be treated.
By default they will be ignored but it is also possible to treat them as if they had a value.
```json skip
{ "field": "price", "missing": "10.0" }
```

### Min

A single-value metric aggregation that computes the minimum of numeric values that are that are extracted from the aggregated documents.
Supported field types are `u64`, `f64`, `i64`, and `datetime`.

**Request**
```json skip
{
    "query": "*",
    "max_hits": 0,
    "aggs": {
        "min_price": {
            "min": { "field": "price" }
        }
    }
}
```

**Response**
```json
{
    "num_hits": 9582098,
    "hits": [],
    "elapsed_time_micros": 102342,
    "errors": [],
    "aggregations": {
        "min_price": {
            "value": 0.01
        }
    }
}
```
#### Parameters

###### **missing**
The `missing` parameter defines how documents that are missing a value should be treated.
By default they will be ignored but it is also possible to treat them as if they had a value.
```json skip
{ "field": "price", "missing": "10.0" }
```

### Stats

A multi-value metric aggregation that computes stats (average, count, min, max, standard deviation, and sum) of numeric values that are extracted from the aggregated documents.
Supported field types are `u64`, `f64`, `i64`, and `datetime`.

**Request**
```json skip
{
    "query": "*",
    "max_hits": 0,
    "aggs": {
        "timestamp_stats": {
            "stats": { "field": "timestamp" }
        }
    }
}
```


**Response**
```json
{
    "num_hits": 10000783,
    "hits": [],
    "elapsed_time_micros": 65297,
    "errors": [],
    "aggregations": {
        "timestamp_stats": {
            "avg": 1462320207.9803998,
            "count": 10000783,
            "max": 1475669670.0,
            "min": 1440670432.0,
            "standard_deviation": 11867304.28681695,
            "sum": 1.4624347076526848e16
        }
    }
}
```
#### Parameters

###### **missing**
The `missing` parameter defines how documents that are missing a value should be treated.
By default they will be ignored but it is also possible to treat them as if they had a value.
```json skip
{ "field": "price", "missing": "10.0" }
```

### Extended Stats

Extended stats is the same as `stats`, but with following additional metrics: `sum_of_squares`, `variance`, `std_deviation`, and `std_deviation_bounds`.
Supported field types are `u64`, `f64`, `i64`, and `datetime`.

**Request**
```json
{
    "query": "*",
    "max_hits": 0,
    "aggs": {
        "response_extended_stats": {
            "extended_stats": { "field": "response" }
        }
    }
}
```

**Response**
```json
{
    ..
    "aggregations": {
        "response_extended_stats": {
            "avg": 65.55555555555556,
            "count": 9,
            "max": 130.0,
            "min": 20.0,
            "std_deviation": 42.97573245736381,
            "std_deviation_bounds": {
                "lower": -20.395909359172062,
                "lower_population": -20.395909359172062,
                "lower_sampling": -25.60973998562673,
                "upper": 151.50702047028318,
                "upper_population": 151.50702047028318,
                "upper_sampling": 156.72085109673785
            },
            "std_deviation_population": 42.97573245736381,
            "std_deviation_sampling": 45.582647770591144,
            "sum": 590.0,
            "sum_of_squares": 55300.0,
            "variance": 1846.9135802469136,
            "variance_population": 1846.9135802469136,
            "variance_sampling": 2077.777777777778
        }
    }
}
```

#### Parameters

###### **missing**
The `missing` parameter defines how documents that are missing a value should be treated.
By default they will be ignored but it is also possible to treat them as if they had a value.
```json skip
{ "field": "price", "missing": "10.0" }
```

###### **sigma**

The sigma parameter controls how many standard deviations +/- from the mean should be displayed.
The default value is 2.
```json skip
{ "field": "price", "sigma": "3.0" }
```

### Sum

A single-value metric aggregation that sums up numeric values that are that are extracted from the aggregated documents.
Supported field types are `u64`, `f64`, `i64`, and `datetime`.

**Request**
```json skip
{
    "query": "*",
    "max_hits": 0,
    "aggs": {
        "total_price": {
            "sum": { "field": "price" }
        }
    }
}
```

**Response**
```json
{
    "num_hits": 9582098,
    "hits": [],
    "elapsed_time_micros": 101142,
    "errors": [],
    "aggregations": {
        "total_price": {
            "value": 12966782476.54
        }
    }
}
```

#### Parameters

###### **missing**
The `missing` parameter defines how documents that are missing a value should be treated.
By default they will be ignored but it is also possible to treat them as if they had a value.
```json skip
{ "field": "price", "missing": "10.0" }
```


### Percentiles
The percentiles aggregation is a useful tool for understanding the distribution of a data set.
It calculates the values below which a given percentage of the data falls.
For instance, the 95th percentile indicates the value below which 95% of the data points can be found.

This aggregation can be particularly interesting for analyzing website or service response times.
For example, if the 95th percentile website load time is significantly higher than the median, this indicates
that a small percentage of users are experiencing much slower load times than the majority.

To use the percentiles aggregation, you'll need to provide a field to aggregate on.
In the case of website load times, this would typically be a field containing the duration of time it takes for the site to load.

**Request**
```json skip
{
    "query": "*",
    "max_hits": 0,
    "aggs": {
        "loading_times": {
            "percentiles": {
                "field": "load_time"
                "percents": [90, 95, 99]
            }
        }
    }
}
```

**Response**
```JSON
{
    "num_hits": 9582098,
    "hits": [],
    "elapsed_time_micros": 101142,
    "errors": [],
    "aggregations": {
        "loading_times": {
            "values": {
                "90.0": 33.4,
                "95.0": 83.4,
                "99.0": 230.3
            }
        }
    }
}
```

`percents` may be omitted, it will default to `[1, 5, 25, 50 (median), 75, 95, and 99]`.

#### Estimating Percentiles

While percentiles provide valuable insights into the distribution of data, it's important to understand that they are often estimates.
This is because calculating exact percentiles for large data sets can be computationally expensive and time-consuming.

#### Parameters

###### **missing**
The `missing` parameter defines how documents that are missing a value should be treated.
By default they will be ignored but it is also possible to treat them as if they had a value.
```json skip
{ "field": "price", "missing": "10.0" }
```


### Cardinality
The cardinality aggregation is used to approximate the count of distinct values in a field. 
Cardinality aggregations are essential when working with large datasets where computing the exact count of distinct values would be computationally expensive. 

The cardinality aggregation can be useful to e.g. to count the number of unique users visiting a website or to determine the number of unique IP addresses that have logged into a server over a certain period.

The algorithm behind the cardinality aggregation is based on HyperLogLog++, which provides an approximate count over the hashed values.

To use the cardinality aggregation, you need to specify the field on which to perform the aggregation.

**Request**
```json
{
    "query": "*",
    "max_hits": 0,
    "aggs": {
        "unique_users": {
            "cardinality": {
                "field": "user_id"
            }
        }
    }
}
```

**Response**
```json
{
    "num_hits": 9582098,
    "hits": [],
    "elapsed_time_micros": 101142,
    "errors": [],
    "aggregations": {
        "unique_users": {
            "value": 345672
        }
    }
}
```


#### Parameters

###### **missing**
The `missing` parameter defines how documents that are missing a value should be treated.
By default they will be ignored but it is also possible to treat them as if they had a value.
```json skip
{ "field": "price", "missing": "10.0" }
```

#### Performance

The cardinality aggregation on text fields is computationally expensive for datasets with a large amount of unique values. 
This is because the aggregation computes the hash for each unique term in the field. 
In order to do this, Quickwit will for each split first collect the term ids and then fetch the compressed terms for those term ids from the dictionary.
Decompressing the terms is comparatively expensive and keeping the term ids increases the memory usage.

For numeric fields, the cardinality aggregation is much more efficient as it directly computes the hash of the numeric values and adds them to HLL++.

##### Limitations
The parameter `precision_threshold` is ignored currently. Normally it allows to set the threshold until the aggregation is exact.


================================================
FILE: docs/reference/cli.md
================================================
---
title: Command-line options
sidebar_position: 50
---

Quickwit command line tool lets you start a Quickwit server and manage indexes (create, delete, ingest), splits and sources (create, delete, toggle). To start a server, `quickwit` needs a [node config file path](../configuration/node-config.md) that you can specify with `QW_CONFIG` environment variable: `export QW_CONFIG=./config/quickwit.yaml`.

This page documents all the available commands, related options, and environment variables.

### Common Options

To manage indexes, splits and sources on a remote cluster you might need to specify the connection to a Quickwit node. The following options are supported:

| Option              | Description                 | Default                 |
|---------------------|-----------------------------|------------------------:|
| `--endpoint`        | The url of a Quickwit node. | `http://127.0.0.1:7280` |
| `--timeout`         | Command timeout.            | *See below*             |
| `--connect-timeout` | Connect timeout.            | `5s`                    |

The default timeouts are command specific:
- **search** - 1 minute
- **ingest** (without force or wait) - 1 minute
- **ingest** (with force or wait) - 30 minute
- all other operations - 10 seconds

The timeout can be expressed as in seconds, minutes, hours or days. For example:

- `10s` - 10 seconds timeout
- `1m` - 1 minute timeout
- `2h` - 2 hours timeout
- `1d` - 1 day timeout
- `none` - no timeout is applied.

:::caution

Before using Quickwit with object storage, consult our [guidelines](../operating/aws-costs.md) for deploying on AWS S3 to avoid surprises on your next bill.

:::


## Commands

[Command-line synopsis syntax](https://developers.google.com/style/code-syntax)

### Help

`quickwit` or `quickwit --help` displays the list of available commands.

`quickwit <command name> --help` displays the documentation for the command and a usage example.

### Version

`quickwit --version` displays the version. It is helpful for reporting bugs.


### Syntax

The CLI is structured into high-level commands with subcommands.
`quickwit [command] [subcommand] [args]`.

* `command`: `run`, `index`, `split`, `source` and `tool`.


<!--
    Insert auto-generated CLI docs here...
-->
## run
Starts a Quickwit node with all services enabled by default: `indexer`, `searcher`, `metastore`, `control-plane`, and `janitor`.


### Indexer service

The indexer service runs indexing pipelines assigned by the control plane.

### Searcher service 
Starts a web server at `rest_listing_address:rest_list_port` that exposes the [Quickwit REST API](rest-api.md)
where `rest_listing_address` and `rest_list_port` are defined in Quickwit config file (quickwit.yaml).
The node can optionally join a cluster using the `peer_seeds` parameter.
This list of node addresses is used to discover the remaining peer nodes in the cluster through a gossip protocol, see [chitchat](https://github.com/quickwit-oss/chitchat).

### Metastore service

The metastore service exposes Quickwit metastore over the network. This is a core internal service that is needed to operate Quickwit. As such, at least one running instance of this service is required for other services to work.

### Control plane service

The control plane service schedules indexing tasks to indexers. It listens to metastore events such as
an source create, delete, toggle, or index delete and reacts accordingly to update the indexing plan.

### Janitor service

The Janitor service runs maintenance tasks on indexes: garbage collection, documents delete, and retention policy tasks.

:::note
Quickwit needs to open the following port for cluster formation and workload distribution:

    TCP port (default is 7280) for REST API
    TCP and UDP port (default is 7280) for cluster membership protocol
    TCP port + 1 (default is 7281) for gRPC address for the distributed search

If ports are already taken, the serve command will fail.
:::
  
`quickwit  run [args]`

*Synopsis*

```bash
quickwit run
    [--config <config>]
    [--service <service>]
```

*Options*

| Option | Description | Default |
|-----------------|-------------|--------:|
| `--config` | Config file location | `config/quickwit.yaml` |
| `--service` | Services (`indexer`, `searcher`, `metastore`, `control-plane`, or `janitor`) to run. If unspecified, all the supported services are started. |  |

*Examples*

*Starts an indexer and a metastore services*
```bash
quickwit run --service indexer --service metastore --endpoint=http://127.0.0.1:7280
```

*Start a control plane, metastore and janitor services*
```bash
quickwit run --service control_plane --service metastore --service janitor --config=./config/quickwit.yaml
```

*Make a search request on a wikipedia index*
```bash
# To create wikipedia index and ingest data, go to our tutorials https://quickwit.io/docs/get-started/.
# Start a searcher.
quickwit run --service searcher --service metastore --config=./config/quickwit.yaml
# Make a request.
curl "http://127.0.0.1:7280/api/v1/wikipedia/search?query=barack+obama"

```

## index
Manages indexes: creates, updates, deletes, ingests, searches, describes...

### index create

Creates an index of ID `index` at `index-uri` configured by a [YAML config file](../configuration/index-config.md) located at `index-config`.
The index config lets you define the mapping of your document on the index and how each field is stored and indexed.
If `index-uri` is omitted, `index-uri` will be set to `{default_index_root_uri}/{index}`, more info on [Quickwit config docs](../configuration/node-config.md).
The command fails if an index already exists unless `overwrite` is passed.
When `overwrite` is enabled, the command deletes all the files stored at `index-uri` before creating a new index.
  
`quickwit index create [args]`

*Synopsis*

```bash
quickwit index create
    --index-config <index-config>
    [--overwrite]
```

*Options*

| Option | Description |
|-----------------|-------------|
| `--index-config` | Location of the index config file. |
| `--overwrite` | Overwrites pre-existing index. This will delete all existing data stored at `index-uri` before creating a new index. |

*Examples*

*Create a new index.*
```bash
# Start a Quickwit server.
quickwit run --config=./config/quickwit.yaml
# Open a new terminal and run:
curl -o wikipedia_index_config.yaml https://raw.githubusercontent.com/quickwit-oss/quickwit/main/config/tutorials/wikipedia/index-config.yaml
quickwit index create --endpoint=http://127.0.0.1:7280 --index-config wikipedia_index_config.yaml

```

### index update

Updates an index using an index config file.  
`quickwit index update [args]`

*Synopsis*

```bash
quickwit index update
    --index <index>
    --index-config <index-config>
```

*Options*

| Option | Description |
|-----------------|-------------|
| `--index` | ID of the target index |
| `--index-config` | Location of the index config file. |
| `--create` | Create the index if it doesn't exist. |
### index clear

Clears an index: deletes all splits and resets checkpoint.  
`quickwit index clear [args]`
`quickwit index clr [args]`

*Synopsis*

```bash
quickwit index clear
    --index <index>
```

*Options*

| Option | Description |
|-----------------|-------------|
| `--index` | Index ID |
### index delete

Deletes an index.  
`quickwit index delete [args]`
`quickwit index del [args]`

*Synopsis*

```bash
quickwit index delete
    --index <index>
    [--dry-run]
```

*Options*

| Option | Description |
|-----------------|-------------|
| `--index` | ID of the target index |
| `--dry-run` | Executes the command in dry run mode and only displays the list of splits candidates for deletion. |

*Examples*

*Delete your index*
```bash
# Start a Quickwit server.
quickwit run --service metastore --config=./config/quickwit.yaml
# Open a new terminal and run:
quickwit index delete --index wikipedia --endpoint=http://127.0.0.1:7280

```

### index describe

Displays descriptive statistics of an index.  
`quickwit index describe [args]`

*Synopsis*

```bash
quickwit index describe
    --index <index>
```

*Options*

| Option | Description |
|-----------------|-------------|
| `--index` | ID of the target index |

*Examples*

*Displays descriptive statistics of your index*
```bash
# Start a Quickwit server.
quickwit run --service metastore --config=./config/quickwit.yaml
# Open a new terminal and run:
quickwit index describe --endpoint=http://127.0.0.1:7280 --index wikipedia

1. General infos
===============================================================================
Index id:                           wikipedia
Index uri:                          file:///home/quickwit-indices/qwdata/indexes/wikipedia
Number of published splits:         1
Number of published documents:      300000
Size of published splits:           448 MB

2. Statistics on splits
===============================================================================
Document count stats:
Mean ± σ in [min … max]:            300000 ± 0 in [300000 … 300000]
Quantiles [1%, 25%, 50%, 75%, 99%]: [300000, 300000, 300000, 300000, 300000]

Size in MB stats:
Mean ± σ in [min … max]:            448 ± 0 in [448 … 448]
Quantiles [1%, 25%, 50%, 75%, 99%]: [448, 448, 448, 448, 448]

```

### index list

List indexes.  
`quickwit index list [args]`
`quickwit index ls [args]`

*Examples*

*List indexes*
```bash
# Start a Quickwit server.
quickwit run --config=./config/quickwit.yaml
# Open a new terminal and run:
quickwit index list --endpoint=http://127.0.0.1:7280
# Or with alias.
quickwit index ls --endpoint=http://127.0.0.1:7280

                                    Indexes                                     
+-----------+--------------------------------------------------------+
| Index ID  |                       Index URI                        |
+-----------+--------------------------------------------------------+
| hdfs-logs | file:///home/quickwit-indices/qwdata/indexes/hdfs-logs |
+-----------+--------------------------------------------------------+
| wikipedia | file:///home/quickwit-indices/qwdata/indexes/wikipedia |
+-----------+--------------------------------------------------------+


```

### index ingest

Indexes a dataset consisting of newline-delimited JSON objects located at `input-path` or read from *stdin*.
The data is appended to the target index of ID `index` unless `overwrite` is passed. `input-path` can be a file or another command output piped into stdin.
Currently, only local datasets are supported.
By default, Quickwit's indexer will work with a heap of 2 GiB of memory. Learn how to change `heap-size` in the [index config doc page](../configuration/index-config.md).
  
`quickwit index ingest [args]`

*Synopsis*

```bash
quickwit index ingest
    --index <index>
    [--input-path <input-path>]
    [--batch-size-limit <batch-size-limit>]
    [--wait]
    [--detailed-response]
    [--force]
    [--commit-timeout <commit-timeout>]
```

*Options*

| Option | Description |
|-----------------|-------------|
| `--index` | ID of the target index |
| `--input-path` | Location of the input file. |
| `--batch-size-limit` | Size limit of each submitted document batch. |
| `--wait` | Wait for all documents to be committed and available for search before exiting. Applies only to the last batch, see [#5417](https://github.com/quickwit-oss/quickwit/issues/5417). |
| `--detailed-response` | Print detailed errors. Enabling might impact performance negatively. |
| `--force` | Force a commit after the last document is sent, and wait for all documents to be committed and available for search before exiting. Applies only to the last batch, see [#5417](https://github.com/quickwit-oss/quickwit/issues/5417). |
| `--commit-timeout` | Timeout for ingest operations that require waiting for the final commit (`--wait` or `--force`). This is different from the `commit_timeout_secs` indexing setting, which sets the maximum time before committing splits after their creation. |

*Examples*

*Indexing a dataset from a file*
```bash
# Start a Quickwit server.
quickwit run --config=./config/quickwit.yaml
# Open a new terminal and run:
curl -o wiki-articles-10000.json https://quickwit-datasets-public.s3.amazonaws.com/wiki-articles-10000.json
quickwit index ingest --endpoint=http://127.0.0.1:7280 --index wikipedia --input-path wiki-articles-10000.json

```

*Indexing a dataset from stdin*
```bash
# Start a Quickwit server.
quickwit run --config=./config/quickwit.yaml
# Open a new terminal and run:
cat wiki-articles-10000.json | quickwit index ingest --endpoint=http://127.0.0.1:7280 --index wikipedia

```

### index search

Searches an index with ID `--index` and returns the documents matching the query specified with `--query`.
More details on the [query language page](query-language.md).
The offset of the first hit returned and the number of hits returned can be set with the `start-offset` and `max-hits` options.
It's possible to override the default search fields `search-fields` option to define the list of fields that Quickwit will search into if 
the user query does not explicitly target a field in the query. Quickwit will return snippets of the matching content when requested via the `snippet-fields` options.
Search can also be limited to a time range using the `start-timestamp` and `end-timestamp` options.
These timestamp options are useful for boosting query performance when using a time series dataset.

:::warning
The `start_timestamp` and `end_timestamp` should be specified in seconds regardless of the timestamp field precision. The timestamp field precision only affects the way it's stored as fast-fields, whereas the document filtering is always performed in seconds.
:::
  
`quickwit index search [args]`

*Synopsis*

```bash
quickwit index search
    --index <index>
    --query <query>
    [--aggregation <aggregation>]
    [--max-hits <max-hits>]
    [--start-offset <start-offset>]
    [--search-fields <search-fields>]
    [--snippet-fields <snippet-fields>]
    [--start-timestamp <start-timestamp>]
    [--end-timestamp <end-timestamp>]
    [--sort-by-score]
```

*Options*

| Option | Description | Default |
|-----------------|-------------|--------:|
| `--index` | ID of the target index |  |
| `--query` | Query expressed in natural query language ((barack AND obama) OR "president of united states"). Learn more on https://quickwit.io/docs/reference/search-language. |  |
| `--aggregation` | JSON serialized aggregation request in tantivy/elasticsearch format. |  |
| `--max-hits` | Maximum number of hits returned. | `20` |
| `--start-offset` | Offset in the global result set of the first hit returned. | `0` |
| `--search-fields` | List of fields that Quickwit will search into if the user query does not explicitly target a field in the query. It overrides the default search fields defined in the index config. Space-separated list, e.g. "field1 field2".  |  |
| `--snippet-fields` | List of fields that Quickwit will return snippet highlight on. Space-separated list, e.g. "field1 field2".  |  |
| `--start-timestamp` | Filters out documents before that timestamp (time-series indexes only). |  |
| `--end-timestamp` | Filters out documents after that timestamp (time-series indexes only). |  |
| `--sort-by-score` | Sorts documents by their BM25 score. |  |

*Examples*

*Searching a index*
```bash
# Start a Quickwit server.
quickwit run --config=./config/quickwit.yaml
# Open a new terminal and run:
quickwit index search --endpoint=http://127.0.0.1:7280 --index wikipedia --query "Barack Obama"
# If you have jq installed.
quickwit index search --endpoint=http://127.0.0.1:7280 --index wikipedia --query "Barack Obama" | jq '.hits[].title'

```

*Sorting documents by their BM25 score*
```bash
# Start a Quickwit server.
quickwit run --config=./config/quickwit.yaml
# Open a new terminal and run:
quickwit index search --endpoint=http://127.0.0.1:7280 --index wikipedia --query "obama" --sort-by-score

```

*Limiting the result set to 50 hits*
```bash
# Start a Quickwit server.
quickwit run --config=./config/quickwit.yaml
# Open a new terminal and run:
quickwit index search --endpoint=http://127.0.0.1:7280 --index wikipedia --query "Barack Obama" --max-hits 50
# If you have jq installed.
quickwit index search --endpoint=http://127.0.0.1:7280 --index wikipedia --query "Barack Obama" --max-hits 50 | jq '.num_hits'

```

*Looking for matches in the title only*
```bash
# Start a Quickwit server.
quickwit run --config=./config/quickwit.yaml
# Open a new terminal and run:
quickwit index search --endpoint=http://127.0.0.1:7280 --index wikipedia --query "obama" --search-fields body
# If you have jq installed.
quickwit index search --endpoint=http://127.0.0.1:7280 --index wikipedia --query "obama" --search-fields body | jq '.hits[].title'

```

## source
Manages sources: creates, updates, deletes sources...

### source create

Adds a new source to an index.  
`quickwit source create [args]`

*Synopsis*

```bash
quickwit source create
    --index <index>
    --source-config <source-config>
```

*Options*

| Option | Description |
|-----------------|-------------|
| `--index` | ID of the target index |
| `--source-config` | Path to source config file. Please, refer to the documentation for more details. |
### source update

Update an existing source.  
`quickwit source update [args]`

*Synopsis*

```bash
quickwit source update
    --index <index>
    --source <source>
    --source-config <source-config>
```

*Options*

| Option | Description |
|-----------------|-------------|
| `--index` | ID of the target index |
| `--source` | ID of the source |
| `--source-config` | Path to source config file. Please, refer to the documentation for more details. |
| `--create` | Create the source if it doesn't exist. |
### source enable

Enables a source for an index.  
`quickwit source enable [args]`

*Synopsis*

```bash
quickwit source enable
    --index <index>
    --source <source>
```

*Options*

| Option | Description |
|-----------------|-------------|
| `--index` | ID of the target index |
| `--source` | ID of the source. |
### source disable

Disables a source for an index.  
`quickwit source disable [args]`

*Synopsis*

```bash
quickwit source disable
    --index <index>
    --source <source>
```

*Options*

| Option | Description |
|-----------------|-------------|
| `--index` | ID of the target index |
| `--source` | ID of the source. |
### source ingest-api

Enables/disables the ingest API of an index.  
`quickwit source ingest-api [args]`

*Synopsis*

```bash
quickwit source ingest-api
    --index <index>
    [--enable]
    [--disable]
```

*Options*

| Option | Description |
|-----------------|-------------|
| `--index` | ID of the target index |
| `--enable` | Enables the ingest API. |
| `--disable` | Disables the ingest API. |
### source delete

Deletes a source from an index.  
`quickwit source delete [args]`
`quickwit source del [args]`

*Synopsis*

```bash
quickwit source delete
    --index <index>
    --source <source>
```

*Options*

| Option | Description |
|-----------------|-------------|
| `--index` | ID of the target index |
| `--source` | ID of the source. |

*Examples*

*Delete a `wikipedia-source` source*
```bash
# Start a Quickwit server.
quickwit run --service metastore --config=./config/quickwit.yaml
# Open a new terminal and run:
quickwit source delete --endpoint=http://127.0.0.1:7280 --index wikipedia --source wikipedia-source

```

### source describe

Describes a source.  
`quickwit source describe [args]`
`quickwit source desc [args]`

*Synopsis*

```bash
quickwit source describe
    --index <index>
    --source <source>
```

*Options*

| Option | Description |
|-----------------|-------------|
| `--index` | ID of the target index |
| `--source` | ID of the source. |
### source list

Lists the sources of an index.  
`quickwit source list [args]`
`quickwit source ls [args]`

*Synopsis*

```bash
quickwit source list
    --index <index>
```

*Options*

| Option | Description |
|-----------------|-------------|
| `--index` | ID of the target index |

*Examples*

*List `wikipedia` index sources*
```bash
# Start a Quickwit server.
quickwit run --service metastore --config=./config/quickwit.yaml
# Open a new terminal and run:
quickwit source list --endpoint=http://127.0.0.1:7280 --index wikipedia

```

### source reset-checkpoint

Resets a source checkpoint.  
`quickwit source reset-checkpoint [args]`
`quickwit source reset [args]`

*Synopsis*

```bash
quickwit source reset-checkpoint
    --index <index>
    --source <source>
```

*Options*

| Option | Description |
|-----------------|-------------|
| `--index` | Index ID |
| `--source` | Source ID |
## split
Manages splits: lists, describes, marks for deletion...

### split list

Lists the splits of an index.  
`quickwit split list [args]`
`quickwit split ls [args]`

*Synopsis*

```bash
quickwit split list
    --index <index>
    [--offset <offset>]
    [--limit <limit>]
    [--states <states>]
    [--create-date <create-date>]
    [--start-date <start-date>]
    [--end-date <end-date>]
    [--output-format <output-format>]
```

*Options*

| Option | Description |
|-----------------|-------------|
| `--index` | Target index ID |
| `--offset` | Number of splits to skip. |
| `--limit` | Maximum number of splits to retrieve. |
| `--states` | Selects the splits whose states are included in this comma-separated list of states. Possible values are `staged`, `published`, and `marked`. |
| `--create-date` | Selects the splits whose creation dates are before this date. |
| `--start-date` | Selects the splits that contain documents after this date (time-series indexes only). |
| `--end-date` | Selects the splits that contain documents before this date (time-series indexes only). |
| `--output-format` | Output format. Possible values are `table`, `json`, and `pretty-json`. |
### split describe

Displays metadata about a split.  
`quickwit split describe [args]`
`quickwit split desc [args]`

*Synopsis*

```bash
quickwit split describe
    --index <index>
    --split <split>
    [--verbose]
```

*Options*

| Option | Description |
|-----------------|-------------|
| `--index` | ID of the target index |
| `--split` | ID of the target split |
| `--verbose` | Displays additional metadata about the hotcache. |
### split mark-for-deletion

Marks one or multiple splits of an index for deletion.  
`quickwit split mark-for-deletion [args]`
`quickwit split mark [args]`

*Synopsis*

```bash
quickwit split mark-for-deletion
    --index <index>
    --splits <splits>
    [--yes]
```

*Options*

| Option | Description |
|-----------------|-------------|
| `--index` | Target index ID |
| `--splits` | Comma-separated list of split IDs |
| `--yes` | Assume "yes" as an answer to all prompts and run non-interactively. |
## tool
Performs utility operations. Requires a node config.

### tool local-ingest

Indexes NDJSON documents locally.  
`quickwit tool local-ingest [args]`

*Synopsis*

```bash
quickwit tool local-ingest
    --index <index>
    [--input-path <input-path>]
    [--input-format <input-format>]
    [--overwrite]
    [--transform-script <transform-script>]
    [--keep-cache]
```

*Options*

| Option | Description | Default |
|-----------------|-------------|--------:|
| `--index` | ID of the target index |  |
| `--input-path` | Location of the input file. |  |
| `--input-format` | Format of the input data. | `json` |
| `--overwrite` | Overwrites pre-existing index. |  |
| `--transform-script` | VRL program to transform docs before ingesting. |  |
| `--keep-cache` | Does not clear local cache directory upon completion. |  |
### tool extract-split

Downloads and extracts a split to a directory.  
`quickwit tool extract-split [args]`

*Synopsis*

```bash
quickwit tool extract-split
    --index <index>
    --split <split>
    [--target-dir <target-dir>]
```

*Options*

| Option | Description |
|-----------------|-------------|
| `--index` | ID of the target index |
| `--split` | ID of the target split |
| `--target-dir` | Directory to extract the split to. |
### tool gc

Garbage collects stale staged splits and splits marked for deletion.  
:::note
Intermediate files are created while executing Quickwit commands.
These intermediate files are always cleaned at the end of each successfully executed command.
However, failed or interrupted commands can leave behind intermediate files that need to be removed.
Also, note that using a very short grace period (like seconds) can cause the removal of intermediate files being operated on, especially when using Quickwit concurrently on the same index.
In practice, you can settle with the default value (1 hour) and only specify a lower value if you really know what you are doing.

:::
`quickwit tool gc [args]`

*Synopsis*

```bash
quickwit tool gc
    --index <index>
    [--grace-period <grace-period>]
    [--dry-run]
```

*Options*

| Option | Description | Default |
|-----------------|-------------|--------:|
| `--index` | ID of the target index |  |
| `--grace-period` | Threshold period after which stale staged splits are garbage collected. | `1h` |
| `--dry-run` | Executes the command in dry run mode and only displays the list of splits candidates for garbage collection. |  |

<!--
    End of auto-generated CLI docs
-->

## Environment Variables

### QW_CLUSTER_ENDPOINT

Specifies the address of the cluster to connect to. Management commands `index`, `split` and `source` require the `cluster_endpoint`, which you can set once and for all with the `QW_CLUSTER_ENDPOINT` environment variable.

### QW_CONFIG

Specifies the path to the [quickwit config](../configuration/node-config.md). Commands `run` and `tools` require the `config`, which you can set once and for all with the `QW_CONFIG` environment variable.

*Example*

`export QW_CONFIG=config/quickwit.yaml`

### QW_DISABLE_TELEMETRY

Disables [telemetry](../telemetry.md) when set to any non-empty value.

*Example*

`QW_DISABLE_TELEMETRY=1 quickwit help`

### QW_POSTGRES_SKIP_MIGRATIONS

Don't run database migrations (but verify that migrations were run successfully before, and no that unknown migration was run).

### QW_POSTGRES_SKIP_MIGRATION_LOCKING

Don't lock the database during migration. This may increase compatibility with alternative databases using the PostgreSQL wire protocol. However, it
is dangerous to use this if you can't guarantee that only one node will run the migrations.

### RUST_LOG

Configure quickwit log level.

*Examples*

```
# run with higher verbosity
RUST_LOG=debug quickwit run
# run with log level info, except for indexing related logs
RUST_LOG=info,quickwit_indexing=debug quickwit run
```


================================================
FILE: docs/reference/es_compatible_api.md
================================================
---
title: Elasticsearch compatible API
sidebar_position: 20
---


In order to facilitate migrations and integrations with existing tools,
Quickwit offers an Elasticsearch/Opensearch compatible API.
This API is incomplete. This page lists the available features and endpoints.

## Supported endpoints

All the API endpoints start with the `api/v1/_elastic/` prefix.

### `_bulk` &nbsp; Batch ingestion endpoint

```
POST api/v1/_elastic/_bulk
```
```
POST api/v1/_elastic/<index>/_bulk
```

The _bulk ingestion API makes it possible to index a batch of documents, possibly targeting several indices in the same request.

#### Request Body example

```json
{ "create" : { "_index" : "wikipedia", "_id" : "1" } }
{"url":"https://en.wikipedia.org/wiki?id=1","title":"foo","body":"foo"}
{ "create" : { "_index" : "wikipedia", "_id" : "2" } }
{"url":"https://en.wikipedia.org/wiki?id=2","title":"bar","body":"bar"}
{ "create" : { "_index" : "wikipedia", "_id" : "3" } }
{"url":"https://en.wikipedia.org/wiki?id=3","title":"baz","body":"baz"}'
```

Ingest a batch of documents to make them searchable using the [Elasticsearch](https://www.elastic.co/guide/en/elasticsearch/reference/current/docs-bulk.html) bulk API. This endpoint provides compatibility with tools or systems that already send data to Elasticsearch for indexing. Currently, only the `create` action of the bulk API is supported, all other actions such as `delete` or `update` are ignored.

If an index is specified via the url path, it will act as a default value
for the `_index` properties.

The [`refresh`](https://www.elastic.co/guide/en/elasticsearch/reference/current/docs-refresh.html) parameter is supported.

:::caution
The quickwit API will not report errors, you need to check the server logs.

In Elasticsearch, the `create` action has a specific behavior when the ingested documents contain an identifier (the `_id` field). It only inserts such a document if it was not inserted before. This is extremely handy to achieve At-Most-Once indexing.
Quickwit does not have any notion of document id and does not support this feature.
:::

:::info
The payload size is limited to 10MB as this endpoint is intended to receive documents in batch.
:::

#### Query parameter

| Variable  | Type     | Description                                                      | Default value |
| --------- | -------- | ---------------------------------------------------------------- | ------------- |
| `refresh` | `String` | The commit behavior: blank string, `true`, `wait_for` or `false` | `false`       |

#### Response

The response is a JSON object, and the content type is `application/json; charset=UTF-8.`

| Field                     | Description                                                                                                                                                              |   Type   |
| ------------------------- | ------------------------------------------------------------------------------------------------------------------------------------------------------------------------ | :------: |
| `num_docs_for_processing` | Total number of documents ingested for processing. The documents may not have been processed. The API will not return indexing errors, check the server logs for errors. | `number` |


### `_search` &nbsp; Index search endpoint

```
POST api/v1/_elastic/<index_id>/_search
```
```
GET api/v1/_elastic/<index_id>/_search
```

#### Request Body example

```json
{
  "size": 10,
  "query": {
    "bool": {
      "must": [
        {
          "query_string": {
            "query": "bitpacking"
          }
        },
        {
          "term": {
            "actor.login": {
              "value": "fulmicoton"
            }
          }
        }
      ]
    }
  },
  "sort": [
    {
      "actor.id": {
        "order": null
      }
    }
  ],
  "aggs": {
    "event_types": {
      "terms": {
        "field": "type",
        "size": 5
      }
    }
  }
}
```

Search into a specific index using the [Elasticsearch search API](https://www.elastic.co/guide/en/elasticsearch/reference/8.8/search-search.html).

Some of the parameter can be passed as query string parameter, and some via JSON payload.
If a parameter appears both as a query string parameter and in the JSON payload, the query string parameter value will take priority.

#### Supported Query string parameters


| Variable           | Type          | Description                                                                      | Default value |
| ------------------ | ------------- | -------------------------------------------------------------------------------- | ------------- |
| `default_operator` | `AND` or `OR` | The default operator used to combine search terms. It should be `AND` or `OR`.   | `OR`          |
| `from`             | `Integer`     | The rank of the first hit to return. This is useful for pagination.              | 0             |
| `q`                | `String`      | The search query.                                                                | (Optional)    |
| `size`             | `Integer`     | Number of hits to return.                                                        | 10            |
| `sort`             | `String`      | Describes how documents should be ranked. See [Sort order](#sort-order)          | (Optional)    |
| `scroll`           | `Duration`    | Creates a scroll context for "time to live". See [Scroll](#_searchscroll--scroll-api). | (Optional)    |
| `allow_partial_search_results` | `Boolean` | Returns a partial response if some (but not all) of the split searches were unsuccessful. | `true` |

#### Supported Request Body parameters

| Variable           | Type              | Description                                                                    | Default value |
| ------------------ | ----------------- | ------------------------------------------------------------------------------ | ------------- |
| `default_operator` | `"AND"` or `"OR"` | The default operator used to combine search terms. It should be `AND` or `OR`. | `OR`          |
| `from`             | `Integer`         | The rank of the first hit to return. This is useful for pagination.            | 0             |
| `query`            | `Json object`     | Describe the search query. See [Query DSL](#query-dsl)                         | (Optional)    |
| `size`             | `Integer`         | Number of hits to return.                                                      | 10            |
| `sort`             | `JsonObject[]`    | Describes how documents should be ranked. See [Sort order](#sort-order)        | `[]`          |
| `search_after`     | `Any[]`           | Ignore documents with a SortingValue preceding or equal to the parameter       | (Optional)    |
| `aggs`             | `Json object`     | Aggregation definition. See [Aggregations](aggregation.md).                    | `{}`          |


#### Sort order

You can define up to two criteria on which to apply sort.
The second criterion will only be used in presence of a tie for the first criterion.

A given criterion can either be
- the name of a fast field (explicitly defined in the schema or captured by the dynamic mode)
- `_score` to sort by BM25.

By default, the sort order is `ascending` for fast fields and descending for `_score`.

When sorting by a fast field and this field contains several values in a single document, only the first value is used for sorting.

The sort order can be set as descending/ascending using the
following syntax.

```json
{
  // ...
  "sort" : [
    { "timestamp" : {"order" : "asc"}},
    { "serial_number" : "desc" }
  ]
  // ...
}

```

It is also possible to not supply an order and rely on the default order using the following syntax.

```json
{ //...
  "sort" : ["_score", "timestamp"]
  // ...
}
```

If no format is provided for timestamps, timestamps are returned with milliseconds precision.

If you need nanosecond precision, you can use the `epoch_nanos_int` format. Beware this means the resulting
JSON may contain high numbers for which there is loss of precision when using languages where all numbers are
floats, such as JavaScript.

```json
{
  // ...
  "sort" : [
    { "timestamp" : {"format": "epoch_nanos_int","order" : "asc"}},
    { "serial_number" : "desc" }
  ]
  // ...
}

#### Search after

When sorting results, the answer looks like the following

```json
{
  // ...
  "hits": {
    // ...
    "hits": [
      // ...
      {
        // ...
        "sort": [
          1701962929199
        ]
      }
    ]
  }
}
```

You can pass the `sort` value of the last hit in a subsequent request where other fields are kept unchanged:
```json
{
  // keep all fields from the original request
  "search_after": [
    1701962929199
  ]
}
```

This allows you to paginate your results.

### `_msearch` &nbsp; Multi search API

```
POST api/v1/_elastic/_msearch
```

#### Request Body example

```json
{"index": "gharchive" }
{"query" : {"match" : { "author.login": "fulmicoton"}}}
{"index": "gharchive"}
{"query" : {"match_all" : {}}}
```

[Multi search endpoint ES API reference](https://www.elastic.co/guide/en/elasticsearch/reference/8.8/search-multi-search.html)

Runs several search requests at once.

The payload is expected to alternate:
- a `header` json object, containing the targeted index id.
- a `search request body` as defined in the [`_search` endpoint section].


### `_search/scroll` &nbsp; Scroll API

```
GET api/v1/_elastic/_search/scroll
```

#### Supported Request Body parameters

| Variable    | Type                                        | Description | Default value |
| ----------- | ------------------------------------------- | ----------- | ------------- |
| `scroll_id` | Scroll id (obtained from a search response) | Required    |               |


The `_search/scroll` endpoint, in combination with the `_search` API makes it possible to request successive pages of search results.
First, the client needs to call the `search api` with a `scroll` query parameter, and then pass the `scroll_id` returned in the response payload to  `_search/scroll` endpoint.

Each subsequent call to the `_search/scroll` endpoint will return a new `scroll_id` pointing to the next page.

:::tip

Using `_search` and then `_search/scroll` is somewhat similar to using `_search` with the `search_after` parameter, except that it creates a lightweight snapshot view of the dataset during the initial call to `_search`. Further calls to `_search/scroll` only return results from that view, thus ensuring more consistent results.

:::

### `_cat` &nbsp; Cat API

```
GET api/v1/_elastic/_cat/indices/<index>
```
```
GET api/v1/_elastic/_cat/indices
```

#### Supported Query string parameters

| Variable | Type       | Description                                                                                            | Default value |
|----------|------------|--------------------------------------------------------------------------------------------------------|---------------|
| `format` | `String`   | Format for response. Only JSON supported for now.                                                      |               |
| `h`      | `String[]` | Comma-separated list of column names to display.                                                       | (Optional)    |
| `health` | `String`   | Filter for health: `green`, `yellow`, or `red`.                                                        | (Optional)    |
| `bytes`  | `String`   | Unit used to display byte values. Unsupported for now.                                                 | (Optional)    |
| `s`      | `String`   | Comma-separated list of column names or column aliases used to sort the response. Unsupported for now. | (Optional)    |
| `v`      | `Boolean`  | If true, the response includes column headings. Unsupported for now.                                   | (Optional)    |

Use the [cat indices API](https://www.elastic.co/guide/en/elasticsearch/reference/current/cat-indices.html) to get the following information for each index in a cluster:
* Shard count
* Document count
* Deleted document count
* Primary store size
* Total store size

#### Response

The response is a JSON object, and the content type is `application/json; charset=UTF-8.`

| Field            | Description                                      |   Type   |
|------------------|--------------------------------------------------|:--------:|
| `uuid`           | Index uuid                                       | `String` |
| `index`          | Index name                                       | `String` |
| `health`         | Health of the index `green`, `yellow`, or `red`. | `String` |
| `status`         | Status of the index `open`.                      | `String` |
| `rep`            | Replication factor.                              | `Number` |
| `pri`            | Number of primary shards                         | `Number` |
| `pri.store.size` | Stored size of primary shard.                    | `String` |
| `store.size`     | Stored size of index.                            | `String` |
| `dataset.size`   | Indexed data size.                               | `String` |
| `docs.count`     | Number of records in index.                      | `Number` |
| `docs.deleted`   | Number of deleted records in index.              | `Number` |

Example response:

```json
[
  {
    "dataset.size": "0b",
    "docs.count": "0",
    "docs.deleted": "0",
    "health": "green",
    "index": "otel-traces-v0_7",
    "pri": "1",
    "pri.store.size": "0b",
    "rep": "1",
    "status": "open",
    "store.size": "0b",
    "uuid": "otel-traces-v0_7:01HTJC6TQDGM07KBDQZ2KDHW53"
  },
  {
    "dataset.size": "387.5gb",
    "docs.count": "224453081",
    "docs.deleted": "0",
    "health": "green",
    "index": "otel-logs-v0_7",
    "pri": "1",
    "pri.store.size": "37.5gb",
    "rep": "1",
    "status": "open",
    "store.size": "37.5gb",
    "uuid": "otel-logs-v0_7:01HTJC6TME1JGXBFERHZ0FJ860"
  }
]
```

[HTTP accept header]: https://www.w3.org/Protocols/rfc2616/rfc2616-sec14.html


### `_field_caps` &nbsp; Field capabilities API

```
GET api/v1/_elastic/<index>/_field_caps
```
```
POST api/v1/_elastic/<index>/_field_caps
```
```
GET api/v1/_elastic/_field_caps
```
```
POST api/v1/_elastic/_field_caps
```

The [field capabilities API](https://www.elastic.co/guide/en/elasticsearch/reference/current/search-field-caps.html) returns information about the capabilities of fields among multiple indices.

#### Supported Query string parameters

| Variable              | Type       | Description                                                                    | Default value |
| --------------------- | ---------- | ------------------------------------------------------------------------------ | ------------- |
| `fields`              | `String`   | Comma-separated list of fields to retrieve capabilities for. Supports wildcards (`*`). | (Optional) |
| `allow_no_indices`    | `Boolean`  | If `true`, missing or closed indices are not an error.                          | (Optional)    |
| `expand_wildcards`    | `String`   | Controls what kind of indices that wildcard patterns can match.                 | (Optional)    |
| `ignore_unavailable`  | `Boolean`  | If `true`, unavailable indices are ignored.                                    | (Optional)    |
| `start_timestamp`     | `Integer`  | *(Quickwit-specific)* If set, restricts splits to documents with a timestamp range start >= `start_timestamp` (seconds since epoch). | (Optional) |
| `end_timestamp`       | `Integer`  | *(Quickwit-specific)* If set, restricts splits to documents with a timestamp range end < `end_timestamp` (seconds since epoch). | (Optional) |

#### Supported Request Body parameters

| Variable           | Type          | Description                                                                 | Default value |
| ------------------ | ------------- | --------------------------------------------------------------------------- | ------------- |
| `index_filter`     | `Json object` | A query to filter indices. If provided, only fields from indices that can potentially match the filter are returned. See [index_filter](#index_filter). | (Optional) |
| `runtime_mappings`  | `Json object` | Accepted but not supported.                                                 | (Optional)    |

#### `index_filter`

The `index_filter` parameter allows you to filter which indices contribute to the field capabilities response. When provided, Quickwit uses the filter query to prune indices (splits) that cannot match the filter, and only returns field capabilities for the remaining ones.

Like Elasticsearch, this is a **best-effort** approach: Quickwit may return field capabilities from indices that do not actually contain any matching documents. In Quickwit, the filtering is limited to the existing split-pruning based on metadata:

- **Time pruning**: Range queries on the timestamp field can eliminate splits whose time range does not overlap with the filter.
- **Tag pruning**: Term queries on [tag fields](../configuration/index-config.md#tag-fields) can eliminate splits that do not contain the requested tag value.

Other filter types (e.g. full-text queries or term queries on non-tag fields) are accepted but will not prune any splits — all indices will be returned as if no filter was specified. In particular, Quickwit does not check whether terms are present in the term dictionary.

#### Request Body example

```json
{
  "index_filter": {
    "range": {
      "timestamp": {
        "gte": "2024-01-01T00:00:00Z",
        "lt": "2024-02-01T00:00:00Z"
      }
    }
  }
}
```

```json
{
  "index_filter": {
    "term": {
      "status": "active"
    }
  }
}
```


## Query DSL

[Elasticsearch Query DSL reference](https://www.elastic.co/guide/en/elasticsearch/reference/8.8/query-dsl.html).

The following query types are supported.

### `query_string`

[Elasticsearch reference documentation](https://www.elastic.co/guide/en/elasticsearch/reference/8.8/query-dsl-query-string-query.html)


#### Example

```json
{
  "query": {
    "query_string": {
      "query": "bitpacking AND author.login:fulmicoton",
      "fields": [
        "payload.description"
      ]
    }
  }
}
```

#### Supported parameters

| Variable           | Type                  | Description                                                                                                                 | Default value |
| ------------------ | --------------------- | --------------------------------------------------------------------------------------------------------------------------- | ------------- |
| `query`            | `String`              | Query meant to be parsed.                                                                                                   | -             |
| `fields`           | `String[]` (Optional) | Default search target fields.                                                                                               | -             |
| `default_operator` | `"AND"` or `"OR"`     | In the absence of boolean operator defines whether terms should be combined as a conjunction (`AND`) or disjunction (`OR`). | `OR`          |
| `boost`            | `Number`              | Multiplier boost for score computation.                                                                                     | 1.0           |
| `lenient`          | `Boolean`             | [See note](#about-the-lenient-argument).                                                                                    | false         |


### `bool`

[Elasticsearch reference documentation](https://www.elastic.co/guide/en/elasticsearch/reference/8.8/query-dsl-term-query.html)

#### Example

```json
{
  "query": {
    "bool": {
      "must": [
        {
          "query_string": {
            "query": "bitpacking"
          }
        }
      ],
      "must_not": {
        "term": {
          "type": {
            "value": "CommitEvent"
          }
        }
      }
    }
  }
}
```

#### Supported parameters

| Variable   | Type                      | Description                                                       | Default value |
| ---------- | ------------------------- | ----------------------------------------------------------------- | ------------- |
| `must`     | `JsonObject[]` (Optional) | Sub-queries required to match the document.                       | []            |
| `must_not` | `JsonObject[]` (Optional) | Sub-queries required to not match the document.                   | []            |
| `should`   | `JsonObject[]` (Optional) | Sub-queries that should match the documents.                      | []            |
| `filter`   | `JsonObject[]`            | Like must queries, but the match does not influence the `_score`. | []            |
| `boost`    | `Number`                  | Multiplier boost for score computation.                           | 1.0           |
| `minimum_should_match`    | `Number` or `Str` | If present, quickwit will only match documents for which at least `minimum_should_match` should clauses are matching. `2`, `-1`, `"10%"` and `"-10%"` are supported. |  |

### `range`

[Elasticsearch reference documentation](https://www.elastic.co/guide/en/elasticsearch/reference/8.8/query-dsl-range-query.html)

#### Example

```json
{
  "query": {
    "range": {
      "my_date_field": {
        "lt": "2015-02-01T00:00:13Z",
        "gte": "2015-02-01T00:00:10Z"
      }
    }
  }
}

```

#### Supported parameters

| Variable | Type                            | Description                            | Default value |
| -------- | ------------------------------- | -------------------------------------- | ------------- |
| `gt`     | bool, string, Number (Optional) | Greater than                           | None          |
| `gte`    | bool, string, Number (Optional) | Greater than or equal                  | None          |
| `lt`     | bool, string, Number (Optional) | Less than                              | None          |
| `lte`    | bool, string, Number (Optional) | Less than or equal                     | None          |
| `boost`  | `Number`                        | Multiplier boost for score computation | 1.0           |


### `match`

[Elasticsearch reference documentation](https://www.elastic.co/guide/en/elasticsearch/reference/8.8/query-dsl-match-query.html)

#### Example

```json
{
  "query": {
    "match": {
        "type": {
            "query": "CommitEvent",
            "zero_terms_query": "all"
        }
    }
  }
}
```

#### Supported Parameters

| Variable           | Type              | Description                                                                                                                    | Default |
| ------------------ | ----------------- | ------------------------------------------------------------------------------------------------------------------------------ | ------- |
| `query`            | String            | Full-text search query.                                                                                                        | -       |
| `operator`         | `"AND"` or `"OR"` | Defines whether all terms should be present (`AND`) or if at least one term is sufficient to match (`OR`).                     | OR      |
| `zero_terms_query` | `all` or `none`   | Defines if all (`all`) or no documents (`none`) should be returned if the query does not contain any terms after tokenization. | `none`  |
| `boost`            | `Number`          | Multiplier boost for score computation                                                                                         | 1.0     |
| `lenient`          | `Boolean`         | [See note](#about-the-lenient-argument).                                                                                       | false   |


### `match_phrase`

[Elasticsearch reference documentation](https://www.elastic.co/guide/en/elasticsearch/reference/8.8/query-dsl-match-query-phrase.html)

#### Example

```json
{
  "query": {
    "match_phrase": {
      "title": "search keywords",
      "analyzer": "default"
    }
  }
}
```


### `match_phrase_prefix`

[Elasticsearch reference documentation](https://www.elastic.co/guide/en/elasticsearch/reference/current/query-dsl-match-query-phrase-prefix.html)

#### Example

```json
{
  "query": {
    "match_phrase_prefix": {
      "payload.commits.message": {
        "query": "automated comm" // This will match "automated commit" for instance.
      }
    }
  }
}
```

#### Supported Parameters

| Variable           | Type            | Description                                                                                                                    | Default                     |
| ------------------ | --------------- | ------------------------------------------------------------------------------------------------------------------------------ | --------------------------- |
| `query`            | String          | Full-text search query. The last token will be prefix-matched                                                                  | -                           |
| `zero_terms_query` | `all` or `none` | Defines if all (`all`) or no documents (`none`) should be returned if the query does not contain any terms after tokenization. | `none`                      |
| `max_expansions`   | `Integer`       | Number of terms to be match by the prefix matching.                                                                            | 50                          |
| `slop`             | `Integer`       | Allows extra tokens between the query tokens.                                                                                  | 0                           |
| `analyzer`         | String          | Analyzer meant to cut the query into terms. It is recommended to NOT use this parameter.                                       | The actual field tokenizer. |


### `match_bool_prefix`

[Elasticsearch reference documentation](https://www.elastic.co/guide/en/elasticsearch/reference/current/query-dsl-match-query-phrase-prefix.html)

#### Example

```json
{
  "query": {
    "match_bool_prefix": {
      "payload.commits.message": {
        "query": "automated comm" // This will match "automated commit" for instance.
      }
    }
  }
}
```

Contrary to ES/Opensearch, in Quickwit, at most 50 terms will be considered when searching the last term of the query as a prefix `match_bool_prefix`.

#### Supported Parameters

| Variable           | Type              | Description                                                                                                                    | Default |
| ------------------ | ----------------- | ------------------------------------------------------------------------------------------------------------------------------ | ------- |
| `query`            | String            | Full-text search query. The last token will be prefix-matched                                                                  | -       |
| `operator`         | `"AND"` or `"OR"` | Defines whether all terms should be present (`AND`) or if at least one term is sufficient to match (`OR`).                     | OR      |
| `zero_terms_query` | `all` or `none`   | Defines if all (`all`) or no documents (`none`) should be returned if the query does not contain any terms after tokenization. | `none`  |


### `Multi-match`

[Elasticsearch reference documentation](https://www.elastic.co/guide/en/elasticsearch/reference/8.8/query-dsl-multi-match-query.html)

#### Example
```json
{
  "query": {
    "multi_match": {
      "query": "search keywords",
      "fields": [
        "title",
        "body"
      ]
    }
  }
}
```

```json
{
  "query": {
    "multi_match": {
      "query": "search keywords",
      "type": "most_fields",
      "fields": [
        "title",
        "body"
      ]
    }
  }
}
```

```json
{
  "query": {
    "multi_match": {
      "query": "search keywords",
      "type": "phrase",
      "fields": [
        "title",
        "body"
      ]
    }
  }
}
```

```json
{
  "query": {
    "multi_match" : {
      "query":      "search key",
      "type":       "phrase_prefix",
      "fields":     [ "title", "body" ]
    }
  }
}
```

#### Supported parameters

| Variable           | Type                  | Description                                  | Default value |
| ------------------ | --------------------- | ---------------------------------------------| ------------- |
| `type`             | `String`              | See supported types below                    | `most_fields` |
| `fields`           | `String[]` (Optional) | Default search target fields.                | -             |
| `lenient`          | `Boolean`             | [See note](#about-the-lenient-argument).     | false         |

Supported types:

| `type` value    | Description                                                                                 |
| --------------- | ------------------------------------------------------------------------------------------- |
| `most_fields`   | Finds documents matching any field and combines the `_score` from each field (default).  |
| `phrase`        | Runs a `match_phrase` query on each field.       |
| `phrase_prefix` | Runs a `match_phrase_prefix` query on each field. |
| `bool_prefix`   | Runs a `match_bool_prefix` query on each field. |

:::warning

In `phrase`, `phrase_prefix` and `bool_prefix` modes, Quickwit sums the score of the different fields instead of returning their max.

Moreover, while Quickwit does not support `best_fields` or `cross_fields`, it will not return an error when presented a `best_fields` or `cross_fields` type. For compatibilility reasons, Quickwit silently accepts these parameters and interprets them as a `most_fields` type.

:::

### `term`

[Elasticsearch reference documentation](https://www.elastic.co/guide/en/elasticsearch/reference/8.8/query-dsl-term-query.html)

:::note

When working on text, it is recommended to only use `term` queries on fields configured with `tokenizer: raw`. This is the Quickwit equivalent of the Elasticsearch `keyword` type.

:::

#### Example

```json
{
  "query": {
    "term": {
      "payload.commits.message": {
        "value": "automated",
        "boost": 2.0
      }
    }
  }
}
```

#### Supported Parameters

| Variable           | Type    | Description                                                                  | Default |
| ------------------ | ------- | ---------------------------------------------------------------------------- | ------- |
| `value`            | String  | Term value. This is the string representation of a token after tokenization. | -       |
| `boost`            | Number  | Multiplier boost for score computation                                       | 1.0     |
| `case_insensitive` | Boolean | Allows ASCII case insensitive matching of the value.                         | false   |


### `match_all` / `match_none`

[Elasticsearch reference documentation](https://www.elastic.co/guide/en/elasticsearch/reference/current/query-dsl-match-all-query.html)

#### Example

```json
{"match_all": {}}
```
```json
{"match_none": {}}
```


### `exists`

[Elasticsearch reference documentation](https://www.elastic.co/guide/en/elasticsearch/reference/8.8/query-dsl-exists-query.html)

Query matching only documents containing a non-null value for a given field.

#### Example

```json
{
  "query": {
    "exists": {
      "field": "author.login"
    }
  }
}
```

#### Supported Parameters

| Variable | Type   | Description                                             | Default |
| -------- | ------ | ------------------------------------------------------- | ------- |
| `field`  | String | Only documents with a value for field will be returned. | -       |

### `prefix`

[Elasticsearch reference documentation](https://www.elastic.co/guide/en/elasticsearch/reference/8.8/query-dsl-prefix-query.html)

Returns documents that contain a specific prefix in a provided field.

#### Example

```json
{
  "query": {
    "prefix": {
      "author.login" {
        "value": "adm",
      }
    }
  }
}
```

#### Supported Parameters

| Variable           | Type    | Description                                          | Default |
| ------------------ | ------- | ---------------------------------------------------- | ------- |
| `value`            | String  | Beginning characters of terms you wish to find.      | -       |
| `case_insensitive` | Boolean | Allows ASCII case insensitive matching of the value. | false   |

### `wildcard`

[Elasticsearch reference documentation](https://www.elastic.co/guide/en/elasticsearch/reference/8.8/query-dsl-wildcard-query.html)

Returns documents that contain terms matching a wildcard pattern:
* `?` replaces one and only one term character
* `*` replaces any number of term characters or an empty string

#### Example

```json
{
  "query": {
    "wildcard": {
      "author.login" {
        "value": "adm?n*",
      }
    }
  }
}
```

#### Supported Parameters

| Variable           | Type    | Description                                          | Default |
| ------------------ | ------- | ---------------------------------------------------- | ------- |
| `value`            | String  | Wildcard pattern for terms you wish to find.         | -       |
| `boost`            | Number  | Multiplier boost for score computation.              | 1.0     |
| `case_insensitive` | Boolean | Allows ASCII case insensitive matching of the value. | false   |


### `regexp`

[Elasticsearch reference documentation](https://www.elastic.co/guide/en/elasticsearch/reference/8.8/query-dsl-regexp-query.html)

Returns documents that contain terms matching a regular expression.

#### Example

```json
{
  "query": {
    "regexp": {
      "author.login" {
        "value": "adm.*n",
      }
    }
  }
}
```

#### Supported Parameters

| Variable           | Type    | Description                                          | Default |
| ------------------ | ------- | ---------------------------------------------------- | ------- |
| `value`            | String  | Wildcard pattern for terms you wish to find.         | -       |
| `case_insensitive` | Boolean | Allows ASCII case insensitive matching of the value. | false   |


### About the `lenient` argument

Quickwit and Elasticsearch have different interpretations of the `lenient` setting:
- In Quickwit, lenient mode allows ignoring parts of the query that reference non-existing columns. This is a behavior that Elasticsearch supports by default.
- In Elasticsearch, lenient mode primarily addresses type errors (such as searching for text in an integer field). Quickwit always supports this behavior, regardless of the `lenient` setting.

## Search multiple indices

Search APIs that accept <index_id> requests path parameter also support multi-target syntax.

### Multi-target syntax

In multi-target syntax, you can use a comma or its URL encoded version '%2C' separated list to run a request on multiple indices: test1,test2,test3. You can also sue [glob-like](https://en.wikipedia.org/wiki/Glob_(programming)) wildcard ( \* ) expressions to target indices that match a pattern: test\* or \*test or te\*t or \*test\*.

The multi-target expression has the following constraints:

    - It must follow the regex `^[a-zA-Z\*][a-zA-Z0-9-_\.\*]{0,254}$`.
    - It cannot contain consecutive asterisks (`*`).
    - If it does not contain an asterisk (`*`), the length must be greater than or equal to 3 characters.

### Examples
```
GET api/v1/_elastic/stackoverflow-000001,stackoverflow-000002/_search
{
  "query": {
    "query_string": {
      "query": "search AND engine",
      "fields": [
        "title",
        "body"
      ]
    }
  }
}
```

```
GET api/v1/_elastic/stackoverflow*/_search
{
  "query": {
    "query_string": {
      "query": "search AND engine",
      "fields": [
        "title",
        "body"
      ]
    }
  }
}
```


================================================
FILE: docs/reference/metrics.md
================================================
---
title: Metrics
sidebar_position: 70
---

Quickwit exposes key metrics in the [Prometheus](https://prometheus.io/) format on the `/metrics` endpoint. You can use any front-end that supports Prometheus to examine the behavior of Quickwit visually.

## Cache Metrics

Currently Quickwit exposes metrics for three caches: `fastfields`, `shortlived`, `splitfooter`. These metrics share the same structure.

| Namespace | Metric Name | Description | Type |
| --------- | ----------- | ----------- | ---- |
| `quickwit_cache_{cache_name}` | `in_cache_count` | Count of {cache_name} in cache | `gauge` |
| `quickwit_cache_{cache_name}` | `in_cache_num_bytes` | Number of {cache_name} bytes in cache | `gauge` |
| `quickwit_cache_{cache_name}` | `cache_hit_total` | Number of {cache_name} cache hits | `counter` |
| `quickwit_cache_{cache_name}` | `cache_hits_bytes` | Number of {cache_name} cache hits in bytes | `counter` |
| `quickwit_cache_{cache_name}` | `cache_miss_total` | Number of {cache_name} cache hits | `counter` |

## CLI Metrics

| Namespace | Metric Name | Description | Type |
| --------- | ----------- | ----------- | ---- |
| `quickwit` | `allocated_num_bytes` | Number of bytes allocated memory, as reported by jemalloc. | `gauge` |

## Common Metrics

| Namespace | Metric Name | Description | Labels | Type |
| --------- | ----------- | ----------- | ------ | ---- |
| `quickwit` | `write_bytes`| Number of bytes written by a given component in [`indexer`, `merger`, `deleter`, `split_downloader_{merge,delete}`] | [`index`, `component`] | `counter` |

## Indexing Metrics

| Namespace | Metric Name | Description | Labels | Type |
| --------- | ----------- | ----------- | ------ | ---- |
| `quickwit_indexing` | `processed_docs_total`| Number of processed docs by index, source and processed status in [`valid`, `schema_error`, `parse_error`, `transform_error`] | [`index`, `source`, `docs_processed_status`] | `counter` |
| `quickwit_indexing` | `processed_bytes`| Number of processed bytes by index, source and processed status in [`valid`, `schema_error`, `parse_error`, `transform_error`] | [`index`, `source`, `docs_processed_status`] | `counter` |
| `quickwit_indexing` | `available_concurrent_upload_permits`| Number of available concurrent upload permits by component in [`merger`, `indexer`] | [`component`] | `gauge` |
| `quickwit_indexing` | `ongoing_merge_operations`| Number of available concurrent upload permits by component in [`merger`, `indexer`]. | [`index`, `source`] | `gauge` |

## Ingest Metrics

| Namespace | Metric Name | Description | Type |
| --------- | ----------- | ----------- | ---- |
| `quickwit_ingest` | `docs_bytes_total` | Total size of the docs ingested, measured in ingester's leader, after validation and before persistence/replication | `counter` |
| `quickwit_ingest` | `docs_total` | Total number of the docs ingested, measured in ingester's leader, after validation and before persistence/replication | `counter` |
| `quickwit_ingest` | `queue_count` | Number of queues currently active | `counter` |

## Metastore Metrics

All metastore methods are monitored by the 3 metrics:

| Namespace | Metric Name | Description | Labels | Type |
| --------- | ----------- | ----------- | ------ | ---- |
| `quickwit_metastore` | `requests_total` | Number of requests | [`operation`, `index`] | `counter` |
| `quickwit_metastore` | `request_errors_total` | Number of failed requests | [`operation`, `index`] | `counter` |
| `quickwit_metastore` | `request_duration_seconds` | Duration of requests | [`operation`, `index`, `error`] | `histogram` |

Examples of operation names: `create_index`, `index_metadata`, `delete_index`, `stage_splits`, `publish_splits`, `list_splits`, `add_source`, ...

## Rest API Metrics

| Namespace | Metric Name | Description | Type |
| --------- | ----------- | ----------- | ---- |
| `quickwit` | `http_requests_total` | Total number of HTTP requests received | `counter` |

## Search Metrics

| Namespace | Metric Name | Description | Type |
| --------- | ----------- | ----------- | ---- |
| `quickwit_search` | `leaf_searches_splits_total` | Number of leaf searches (count of splits) started | `counter` |
| `quickwit_search` | `leaf_search_split_duration_secs` | Number of seconds required to run a leaf search over a single split. The timer starts after the semaphore is obtained | `histogram` |
| `quickwit_search` | `active_search_threads_count` | Number of threads in use in the CPU thread pool | `gauge` |

## Storage Metrics

| Namespace | Metric Name | Description | Type |
| --------- | ----------- | ----------- | ---- |
| `quickwit_storage` | `object_storage_gets_total` | Number of objects fetched | `counter` |
| `quickwit_storage` | `object_storage_puts_total` | Number of objects uploaded. May differ from object_storage_requests_parts due to multipart upload | `counter` |
| `quickwit_storage` | `object_storage_puts_parts` | Number of object parts uploaded | `counter` |
| `quickwit_storage` | `object_storage_download_num_bytes` | Amount of data downloaded from an object storage | `counter` |


================================================
FILE: docs/reference/query-language.md
================================================
---
title: Query Language Reference
sidebar_position: 40
---

## Pseudo-grammar

```
query = '(' query ')'
      | query operator query
      | unary_operator query
      | query query
      | clause

operator = 'AND' | 'OR'

unary_operator = 'NOT' | '-'

clause = field_name ':' field_clause
       | defaultable_clause
       | '*'

field_clause = term | term_prefix | term_set | phrase | phrase_prefix | range | '*'
defaultable_clause = term | term_prefix | term_set | phrase | phrase_prefix
```
---
## Writing Queries
### Escaping Special Characters

Some characters need to be escaped in non quoted terms because they are syntactically significant otherwise: special reserved characters are: `+` , `^`, `` ` ``, `:`, `{`, `}`, `"`, `[`, `]`, `(`, `)`, `~`, `!`, `\\`, `*`, `SPACE`. If such such characters appear in query terms, they need to be escaped by prefixing them with an anti-slash `\`.

In quoted terms, the quote character in use `'` or `"` needs to be escaped.

###### Allowed characters in field names

See the [Field name validation rules](https://quickwit.io/docs/configuration/index-config#field-name-validation-rules) in the index config documentation.

### Addressing nested structures

Data stored deep inside nested data structures like `object` or `json` fields can be addressed using dots as separators in the field name.
For instance, the document `{"product": {"attributes": {color": "red"}}}` is matched by
```
product.attributes.color:red
```

If the keys of your object contain dots, the above syntax has some ambiguity : by default `{"k8s.component.name": "quickwit"}` will be matched by 
```k8s.component.name:quickwit```

It is possible to remove the ambiguity by setting expand_dots in the json field configuration. 
In that case, it will be necessary to escape the `.` in the query to match this document like this :
```
k8s\.component\.name:quickwit
```

---

## Structured data
### Datetime
Datetime values must be provided in rfc3339 format, such as `1970-01-01T00:00:00Z`

### IP addresses
IP addresses can be provided as IPv4 or IPv6. It is recommended to search with the format used when indexing documents.
There is no support for searching for a range of IP using CIDR notation, but you can use normal range queries.

---

## Types of clauses

### Term `field:term`
```
term = term_char+
```

Matches documents if the targeted field contains a token equal to the provided term. 

`field:value` will match any document where the field 'field' has a token 'value'.

### Wildcard `field:wil?car*d`
```
wildcard = [term_char\*\?]+
```

Matches documents if the targeted field contains a token that matches the wildcard:
- `?` replaces one and only one term character
- `*` replaces any number of term characters or an empty string

Examples:
- `field:quick*` will match any document where the field 'field' has a token like `quickwit` or `quickstart`, but not `qui` or `abcd`.
- `field:h?llo` will match any document where the field 'field' has a token like `hello` or `hallo`, but not `heillo` or `hllo`.

Queries with prefixes (`field:qui*`) are much more efficient than queries starting with a wildcard (`field:*wit`)


### Term set `field:IN [a b c]`
```
term_set = 'IN' '[' term_list ']'
term_list = term_list term
          | term
```
Matches if the document contains any of the tokens provided. 

###### Examples
`field:IN [ab cd]` will match 'ab' or 'cd', but nothing else.

###### Performance Note
This is a lot like writing `field:ab OR field:cd`. When there are only a handful of terms to search for, using ORs is usually faster.
When there are many values to match, a term set query can become more efficient.

<!-- previously a field was required. It looks like it may no longer be the case -->

### Phrase `field:"sequence of words"`
```
phrase = phrase_string
       | phrase_string slop
phrase_string = '"' phrase_char '"'
slop = '~' [01-9]+

```

Matches if the field contains the sequence of token provided:
- `field:"looks good to me"` will match any document containing that sequence of tokens.
- `field:"look* good to me"` with the default tokenizer is equivalent to `field:"look good to me"`, i.e. the '*' character is pruned by the tokenizer and not interpreted as a wildcard.

:::info

The field must have been configured with `record: position` when indexing.

:::

###### Slop operator
Is is also possible to add a slop, which allow matching a sequence with some distance. For instance `"looks to me"~1` will match "looks good to me", but not "looks very good to me".
Transposition costs 2, e.g. `"A B"~1` will not match `"B A"` but it would with `"A B"~2`.
Transposition is not a special case, in the example above A is moved 1 position and B is moved 1 position, so the slop is 2.

### Phrase Prefix `field:"finish this phr"*`
```
phrase_prefix = phrase '*'
```

Matches if the field contains the sequence of token provided, where the last token in the query may be only a prefix of the token in the document.

The field must have been configured with `record: position` when indexing.

There is no slop for phrase prefix queries.

###### Examples
 `field:"thanks for your contrib"*` will match 'thanks for your contribution'.

###### Limitation

Quickwit may trim some results matched by this clause in some cases.  If you search for `"thanks for your co"*`, it will enumerate the first 50 tokens which start with "co" (in their storage order), and search for any documents where "thanks for your" is followed by any of these tokens.

If there are many tokens starting with "co", "contribution" might not be one of the 50 selected tokens, and the query won't match a document containing "thanks for your contribution". Normal prefix queries don't suffer from this issue.

### Range `field:[low_bound TO high_bound}`
```
range = explicit_range | comparison_half_range

explicit_range = left_bound_char bounds right_bound_char
left_bound_char = '[' | '{' 
right_bound_char = '}' | ']'
bounds = term TO term
       | term TO '*'
       | '*' TO term

comparison_range = comparison_operator term
comparison_operator = '<' | '>' | '<=' | '>='
```

Matches if the document contains a token between the provided bounds for that field.
For range queries, you must provide a field. Quickwit won't use `default_search_fields` automatically.

###### Order
For text fields, the ranges are defined by lexicographic order on uft-8 encoded byte arrays. It means for a text field, 100 is between 1 and 2.
<!-- TODO: Build a more comprehensive example set to showcase how wharacters are sorted -->

When using ranges on integers, it behaves naturally.

###### Inclusive and exclusive bounds
Inclusive bounds are represented by square brackets `[]`. They will match tokens equal to the bound term.
Exclusive bounds are represented by curly brackets `{}`. They will not match tokens equal to the bound term.

###### Half-Open bounds
You can make an half open range by using `*` as one of the bounds. `field:[b TO *]` will match 'bb' and 'zz', but not 'ab'.
You can also use a comparison based syntax:`field:<b`, `field:>b`, `field:<=b` or `field:>=b`.

<!-- NOTE : empty values likely not indexed -->

###### Examples
- Inclusive Range: `ip:[127.0.0.1 TO 127.0.0.50]`
- Exclusive Range: `ip:{127.0.0.1 TO 127.0.0.50}`
- Unbounded Inclusive Range: `ip:[127.0.0.1 TO *] or ip:>=127.0.0.1`
- Unbounded Exclusive Range: `ip:{127.0.0.1 TO *] or ip:>127.0.0.1`


### Exists `field:*`

Matches documents where the field is set. You have to specify a field for this query, Quickwit won't use `default_search_fields` automatically.

### Match All `*`

Matches every document. You can't put a field in front. It is simply written as `*`.

---

## Building Queries
Most queries are composed of more than one clause. When doing so, you may add operators between clauses.

Implicitly if no operator is provided, 'AND' is assumed.

### Conjunction `AND`
An `AND` query will match only if both sides match.

<!-- TODO: Formal example ?*-->

### Disjunction `OR`
An `OR` query will match if either (or both) sides match.

<!-- TODO: Formal example ?*-->

### Negation `NOT` or `-`
A `NOT` query will match if the clause it is applied to does not match.
The `-` prefix is equivalent to the `NOT` operator.

### Grouping `()`
Parentheses are used to force the order of evaluation of operators.
For instance, if a query should match if 'field1' is 'one' or 'two', and 'field2' is 'three', you can use `(field1:one OR field1:two) AND field2:three`.

### Operator Precedence
Without parentheses, `AND` takes precedence over `OR`. That is, `a AND b OR c` is interpreted as `(a AND b) or c`.

`NOT` and `-` takes precedence over everything, such that `-a AND b` means `(-a) AND b`, not `-(a AND B)`.


---

## Other considerations 

### Default Search Fields
In many case it is possible to omit the field you search if it was configured in the `default_search_fields` array of the index configuration. If more than one field is configured as default, the resulting implicit clauses are combined using a conjunction ('OR').

### Tokenization
Note that the result of a query can depend on the tokenizer used for the field getting searched. Hence this document always speaks of tokens, which may be the exact value the document contain (in case of the raw tokenizer), or a subset of it (for instance any tokenizer cutting on spaces).

<!-- NOTE : should dig deeper ? -->


================================================
FILE: docs/reference/rest-api.md
================================================
---
title: REST API
sidebar_position: 10
---

## API version

All the API endpoints start with the `api/v1/` prefix. `v1` indicates that we are currently using version 1 of the API.


## OpenAPI specification

The OpenAPI specification of the REST API is available at `/openapi.json` and a Swagger UI version is available at `/ui/api-playground`.

## Parameters

Parameters passed in the URL must be properly URL-encoded, using the UTF-8 encoding for non-ASCII characters.

```
GET [..]/search?query=barack%20obama
```

## Error handling

Successful requests return a 2xx HTTP status code.

Failed requests return a 4xx HTTP status code. The response body of failed requests holds a JSON object containing a `message` field that describes the error.

```json
{
 "message": "Failed to parse query"
}
```

## Search API

### Search in an index

Search for documents matching a query in the given index `api/v1/<index id>/search`. This endpoint is available as long as you have at least one node running a searcher service in the cluster.
The search endpoint accepts `GET` and `POST` requests. The [parameters](#get-parameters) are URL parameters for `GET` requests or JSON key-value pairs for `POST` requests.

```
GET api/v1/<index id>/search?query=searchterm
```

```
POST api/v1/<index id>/search
{
  "query": searchterm
}
```

#### Path variable

| Variable      | Description   |
| ------------- | ------------- |
| `index id`  | The index id  |

#### Parameters

| Variable            | Type       | Description     | Default value   |
|---------------------|------------|-----------------|-----------------|
| `query`           | `String`   | Query text. See the [query language doc](query-language.md) | _required_ |
| `start_timestamp` | `i64`      | If set, restrict search to documents with a `timestamp >= start_timestamp`, taking advantage of potential time pruning opportunities. The value must be in seconds. | |
| `end_timestamp`   | `i64`      | If set, restrict search to documents with a `timestamp < end_timestamp`, taking advantage of potential time pruning opportunities. The value must be in seconds.    | |
| `start_offset`    | `Integer`  | Number of documents to skip | `0` |
| `max_hits`        | `Integer`  | Maximum number of hits to return (by default 20) | `20` |
| `search_field`    | `[String]` | Fields to search on if no field name is specified in the query. Comma-separated list, e.g. "field1,field2"  | index_config.search_settings.default_search_fields |
| `snippet_fields`  | `[String]` | Fields to extract snippet on. Comma-separated list, e.g. "field1,field2"  | |
| `sort_by`         | `[String]` | Fields to sort the query results on. You can sort by one or two fast fields or by BM25 `_score` (requires fieldnorms). By default, hits are sorted in reverse order of their [document ID](/docs/overview/concepts/querying.md#document-id) (to show recent events first). | |
| `format`          | `Enum`     | The output format. Allowed values are "json" or "pretty_json" | `pretty_json` |
| `aggs`            | `JSON`     | The aggregations request. See the [aggregations doc](aggregation.md) for supported aggregations. | |

:::info
The `start_timestamp` and `end_timestamp` should be specified in seconds regardless of the timestamp field precision.
:::

#### Response

The response is a JSON object, and the content type is `application/json; charset=UTF-8.`

| Field                   | Description                    | Type       |
| --------------------    | ------------------------------ | :--------: |
| `hits`                | Results of the query           | `[hit]`    |
| `num_hits`            | Total number of matches        | `number`   |
| `elapsed_time_micros` | Processing time of the query   | `number`   |

### Search multiple indices
Search APIs that accept `index id` requests path parameter also support multi-target syntax.

#### Multi-target syntax

In multi-target syntax, you can use a comma or its URL encoded version '%2C' separated list to run a request on multiple indices: test1,test2,test3. You can also use [glob-like](https://en.wikipedia.org/wiki/Glob_(programming)) wildcard ( \* ) expressions to target indices that match a pattern: test\* or \*test or te\*t or \*test\*.

The following are some constrains about the multi-target expression.

    - It must follow the regex `^[a-zA-Z\*][a-zA-Z0-9-_\.\*]{0,254}$`.
    - It cannot contain consecutive asterisks (`*`).
    - If it does not contain an asterisk (`*`), the length must be greater than or equal to 3 characters.

#### Examples
```
GET api/v1/stackoverflow-000001,stackoverflow-000002/search
{
    "query": "search AND engine",
}
```

```
GET api/v1/stackoverflow*/search
{
    "query": "search AND engine",
}
```

## Ingest API

### Ingest data into an index

```
POST api/v1/<index id>/ingest -d \
'{"url":"https://en.wikipedia.org/wiki?id=1","title":"foo","body":"foo"}
{"url":"https://en.wikipedia.org/wiki?id=2","title":"bar","body":"bar"}
{"url":"https://en.wikipedia.org/wiki?id=3","title":"baz","body":"baz"}'
```

Ingest a batch of documents to make them searchable in a given `<index id>`. Currently, NDJSON is the only accepted payload format. This endpoint is only available on a node that is running an indexer service.

#### Controlling when the indexed documents will be available for search

Newly added documents will not appear in the search results until they are added to a split and that split is committed. This process is automatic and is controlled by `split_num_docs_target` and `commit_timeout_secs` parameters. By default, the ingest command exits as soon as the records are added to the indexing queue, which means that the new documents will not appear in the search results at this moment. This behavior can be changed by adding `commit=wait_for` or `commit=force` parameters to the query. The `wait_for` parameter will cause the command to wait for the documents to be committed according to the standard time or number of documents rules. The `force` parameter will trigger a commit after all documents in the request are processed. It will also wait for this commit to finish before returning. Please note that the `force` option may have a significant performance cost especially if it is used on small batches.

```
POST api/v1/<index id>/ingest?commit=wait_for -d \
'{"url":"https://en.wikipedia.org/wiki?id=1","title":"foo","body":"foo"}
{"url":"https://en.wikipedia.org/wiki?id=2","title":"bar","body":"bar"}
{"url":"https://en.wikipedia.org/wiki?id=3","title":"baz","body":"baz"}'
```

:::info

The payload size is limited to 10MB [by default](../configuration/node-config.md#ingest-api-configuration) since this endpoint is intended to receive documents in batches.

:::

#### Path variable

| Variable      | Description   |
| ------------- | ------------- |
| `index id`  | The index id  |

#### Query parameters

| Variable            | Type       | Description                                        | Default value |
|---------------------|------------|----------------------------------------------------|---------------|
| `commit`            | `String`   | The commit behavior: `auto`, `wait_for` or `force` | `auto`        |
| `detailed_response` | `bool`     | Enable `parse_failures` in the response. Setting to `true` might impact performances negatively. | `false`        |

#### Response

The response is a JSON object, and the content type is `application/json; charset=UTF-8.`

| Field                       | Description                                                                                                                                                              |   Type   |
|-----------------------------|--------------------------------------------------------------------------------------------------------------------------------------------------------------------------|:--------:|
| `num_docs_for_processing` | Total number of documents submitted for processing. The documents may not have been processed. | `number` |
| `num_ingested_docs`       | Number of documents successfully persisted in the write ahead log | `number` |
| `num_rejected_docs`       | Number of documents that couldn't be parsed (invalid json, bad schema...) | `number` |
| `parse_failures`          | List detailing parsing failures. Only available if `detailed_response` is set to `true`. | `list(object)` |

The parse failure objects contain the following fields:
- `message`: a detailed message explaining the error
- `reason`: one of `invalid_json`, `invalid_schema` or `unspecified`
- `document`: the utf-8 decoded string of the document byte chunk that generated the error


## Index API

### Create an index

```
POST api/v1/indexes
```

Create an index by posting an `IndexConfig` payload. The API accepts JSON with `content-type: application/json` and YAML with `content-type: application/yaml`.

#### POST payload

| Variable            | Type               | Description                                                                                                           | Default value                         |
|---------------------|--------------------|-----------------------------------------------------------------------------------------------------------------------|---------------------------------------|
| `version`           | `String`           | Config format version, use the same as your Quickwit version.                                                         | _required_                            |
| `index_id`          | `String`           | Index ID, see its [validation rules](../configuration/index-config.md#index-id) on identifiers.                       | _required_                            |
| `index_uri`         | `String`           | Defines where the index files are stored. This parameter expects a [storage URI](../configuration/storage-config.md#storage-uris).           | `{default_index_root_uri}/{index_id}` |
| `doc_mapping`       | `DocMapping`       | Doc mapping object as specified in the [index config docs](../configuration/index-config.md#doc-mapping).             | _required_                            |
| `indexing_settings` | `IndexingSettings` | Indexing settings object as specified in the [index config docs](../configuration/index-config.md#indexing-settings). |                                       |
| `search_settings`   | `SearchSettings`   | Search settings object as specified in the [index config docs](../configuration/index-config.md#search-settings).     |                                       |
| `retention`         | `Retention`        | Retention policy object as specified in the [index config docs](../configuration/index-config.md#retention-policy).   |                                       |


**Payload Example**

curl -XPOST http://localhost:7280/api/v1/indexes --data @index_config.json -H "Content-Type: application/json"

```json title="index_config.json
{
    "version": "0.8",
    "index_id": "hdfs-logs",
    "doc_mapping": {
        "field_mappings": [
            {
                "name": "tenant_id",
                "type": "u64",
                "fast": true
            },
            {
                "name": "app_id",
                "type": "u64",
                "fast": true
            },
            {
                "name": "timestamp",
                "type": "datetime",
                "input_formats": ["unix_timestamp"],
                "fast_precision": "seconds",
                "fast": true
            },
            {
                "name": "body",
                "type": "text",
                "record": "position"
            }
        ],
        "partition_key": "tenant_id",
        "max_num_partitions": 200,
        "tag_fields": ["tenant_id"],
        "timestamp_field": "timestamp"
    },
    "search_settings": {
        "default_search_fields": ["body"]
    },
    "indexing_settings": {
        "merge_policy": {
            "type": "limit_merge",
            "max_merge_ops": 3,
            "merge_factor": 10,
            "max_merge_factor": 12
        }
    },
    "retention": {
        "period": "7 days",
        "schedule": "@daily"
    }
}
```

#### Response

The response is the index metadata of the created index, and the content type is `application/json; charset=UTF-8.`

| Field                | Description                                   |         Type          |
|----------------------|-----------------------------------------------|:---------------------:|
| `version`          | The current index configuration format version. |       `string`        |
| `index_uid`        | The server-generated index UID.                 |       `string`        |
| `index_config`     | The posted index config.                        |     `IndexConfig`     |
| `checkpoint`       | Map of checkpoints by source.                   |   `IndexCheckpoint`   |
| `create_timestamp` | Index creation timestamp                        |       `number`        |
| `sources`          | List of the index sources configurations.       | `Array<SourceConfig>` |


### Update an index

```
PUT api/v1/indexes/<index id>
```

#### Path variable

| Variable      | Description   |
| ------------- | ------------- |
| `index id`    | The index id  |

#### Query parameters

| Variable  | Type   | Description                                   | Default value |
|-----------|--------|-----------------------------------------------|---------------|
| `create`  | `bool` | Create the index if it doesn't already exists | `false`       |

Update the configurations of an index. This endpoint follows PUT semantics, which means that all the fields of the current configuration are replaced by the values specified in this request or the associated defaults. In particular, if the field is optional (e.g. `retention_policy`), omitting it will delete the associated configuration. If the new configuration file contains updates that cannot be applied, the request fails, and none of the updates are applied. The API accepts JSON with `content-type: application/json` and YAML with `content-type: application/yaml`.

- The retention policy update is automatically picked up by the janitor service on its next state refresh.
- The search settings update is automatically picked up by searcher nodes when the next query is executed.
- The indexing settings update is automatically picked up by the indexer nodes once the control plane emits a new indexing plan.
- The doc mapping update is automatically picked up by the indexer nodes once the control plane emit a new indexing plan.

:::warning

If you use the ingest or ES bulk API (V2), the old doc mapping will still be used to validate new documents that end up being persisted on existing shards (see [#5738](https://github.com/quickwit-oss/quickwit/issues/5738)).

:::

Updating the doc mapping doesn't reindex existing data. Queries and results are mapped on a best-effort basis when querying older splits. For more details, check [the reference](updating-mapper.md) out.

#### PUT payload

| Variable            | Type               | Description                                                                                                           | Default value                         |
|---------------------|--------------------|-----------------------------------------------------------------------------------------------------------------------|---------------------------------------|
| `version`           | `String`           | Config format version, use the same as your Quickwit version.                                                         | _required_                            |
| `index_id`          | `String`           | Index ID, must be the same index as in the request URI.                                                               | _required_                            |
| `index_uri`         | `String`           | Defines where the index files are stored. Cannot be updated.                                                          | `{default_index_root_uri}/{index_id}`                 |
| `doc_mapping`       | `DocMapping`       | Doc mapping object as specified in the [index config docs](../configuration/index-config.md#doc-mapping).             | _required_                            |
| `indexing_settings` | `IndexingSettings` | Indexing settings object as specified in the [index config docs](../configuration/index-config.md#indexing-settings). |                                       |
| `search_settings`   | `SearchSettings`   | Search settings object as specified in the [index config docs](../configuration/index-config.md#search-settings).     |                                       |
| `retention`         | `Retention`        | Retention policy object as specified in the [index config docs](../configuration/index-config.md#retention-policy).   |                                       |


**Payload Example**

curl -XPUT http://localhost:7280/api/v1/indexes/hdfs-logs --data @updated_index_update.json -H "Content-Type: application/json"

```json title="updated_index_update.json
{
    "version": "0.8",
    "index_id": "hdfs-logs",
    "doc_mapping": {
        "field_mappings": [
            {
                "name": "tenant_id",
                "type": "u64",
                "fast": true
            },
            {
                "name": "app_id",
                "type": "u64",
                "fast": true
            },
            {
                "name": "timestamp",
                "type": "datetime",
                "input_formats": ["unix_timestamp"],
                "fast_precision": "seconds",
                "fast": true
            },
            {
                "name": "body",
                "type": "text",
                "record": "position"
            }
        ],
        "partition_key": "tenant_id",
        "max_num_partitions": 200,
        "tag_fields": ["tenant_id"],
        "timestamp_field": "timestamp"
    },
    "search_settings": {
        "default_search_fields": ["body"]
    },
    "indexing_settings": {
        "merge_policy": {
            "type": "limit_merge",
            "max_merge_ops": 3,
            "merge_factor": 10,
            "max_merge_factor": 12
        }
    },
    "retention": {
        "period": "30 days",
        "schedule": "@daily"
    }
}
```

#### Response

The response is the index metadata of the updated index, and the content type is `application/json; charset=UTF-8.`

| Field                | Description                             |         Type          |
|----------------------|-----------------------------------------|:---------------------:|
| `version`          | The current server configuration version. |       `string`        |
| `index_uid`        | The server-generated index UID.            |       `string`        |
| `index_config`     | The posted index config.                  |     `IndexConfig`     |
| `checkpoint`       | Map of checkpoints by source.             |   `IndexCheckpoint`   |
| `create_timestamp` | Index creation timestamp                  |       `number`        |
| `sources`          | List of the index sources configurations. | `Array<SourceConfig>` |


### Get an index metadata

```
GET api/v1/indexes/<index id>
```

Get the index metadata of ID `index id`.

#### Response

The response is the index metadata of the requested index, and the content type is `application/json; charset=UTF-8.`

| Field                | Description                               |         Type          |
|----------------------|-------------------------------------------|:---------------------:|
| `version`          | The current server configuration version. |       `string`        |
| `index_uid`        | The server-generated index UID.            |       `string`        |
| `index_config`     | The posted index config.                  |     `IndexConfig`     |
| `checkpoint`       | Map of checkpoints by source.             |   `IndexCheckpoint`   |
| `create_timestamp` | Index creation timestamp.                 |       `number`        |
| `sources`          | List of the index sources configurations. | `Array<SourceConfig>` |


### Describe an index

```
GET api/v1/indexes/<index id>/describe
```
Describes an index of ID `index id`.

#### Response

The response is the stats about the requested index, and the content type is `application/json; charset=UTF-8.`

| Field                               | Description                                              |         Type          |
|-------------------------------------|----------------------------------------------------------|:---------------------:|
| `index_id`                          | Index ID of index.                                       |       `String`        |
| `index_uri`                         | Uri of index                                             |       `String`        |
| `num_published_splits`              | Number of published splits.                              |       `number`        |
| `size_published_splits`             | Size of published splits.                                |       `number`        |
| `num_published_docs`                | Number of published documents.                           |       `number`        |
| `size_published_docs_uncompressed`  | Size of the published documents in bytes (uncompressed). |       `number`        |
| `timestamp_field_name`              | Name of timestamp field.                                       |       `String`        |
| `min_timestamp`                     | Starting time of timestamp.                              |       `number`        |
| `max_timestamp`                     | Ending time of timestamp.                                |       `number`        |


### Get splits

```
GET api/v1/indexes/<index id>/splits
```
Get splits belongs to an index of ID `index id`.

#### Path variable

| Variable      | Description   |
| ------------- | ------------- |
| `index id`  | The index id  |

#### Get parameters

| Variable            | Type       | Description                                                                                                      |
|---------------------|------------|------------------------------------------------------------------------------------------------------------------|
| `offset`           | `number`   | If set, restrict the number of splits to skip|
| `limit `           | `number`   | If set, restrict maximum number of splits to retrieve|
| `split_states`           | `usize`   | If set, specific split state(s) to filter by|
| `start_timestamp`           | `number`   | If set, restrict splits to documents with a `timestamp >= start_timestamp|
| `end_timestamp`           | `number`   | If set, restrict splits to documents with a `timestamp < end_timestamp|
| `end_create_timestamp`           | `number`   | If set, restrict splits whose creation dates are before this date|


#### Response

The response is the stats about the requested index, and the content type is `application/json; charset=UTF-8.`

| Field                               | Description                                              |         Type          |
|-------------------------------------|----------------------------------------------------------|:---------------------:|
| `offset`                          | Index ID of index.                                       |       `String`        |
| `size`                         | Uri of index                                             |       `String`        |
| `splits`              | Number of published splits.                              |       `List`        |

#### Examples
```
GET /api/v1/indexes/stackoverflow/splits?offset=0&limit=10
```
```json
{
  "offset": 0,
  "size": 1,
  "splits": [
    {
      "split_state": "Published",
      "update_timestamp": 1695642901,
      "publish_timestamp": 1695642901,
      "version": "0.7",
      "split_id": "01HB632HD8W6WHNM7CZFH3KG1X",
      "index_uid": "stackoverflow:01HB6321TDT3SP58D4EZP14KSX",
      "partition_id": 0,
      "source_id": "_ingest-api-source",
      "node_id": "jerry",
      "num_docs": 10000,
      "uncompressed_docs_size_in_bytes": 6674940,
      "time_range": {
        "start": 1217540572,
        "end": 1219335682
      },
      "create_timestamp": 1695642900,
      "maturity": {
        "type": "immature",
        "maturation_period_millis": 172800000
      },
      "tags": [],
      "footer_offsets": {
        "start": 4714989,
        "end": 4719999
      },
      "delete_opstamp": 0,
      "num_merge_ops": 0
    }
  ]
}
```


### Clears an index

```
PUT api/v1/indexes/<index id>/clear
```

Clears index of ID `index id`: all splits will be deleted (metastore + storage) and all source checkpoints will be reset.

It returns an empty body.


### Delete an index

```
DELETE api/v1/indexes/<index id>
```

Delete index of ID `index id`.

#### Response

The response is the list of deleted split files; the content type is `application/json; charset=UTF-8.`

```json
[
    {
        "split_id": "01GK1XNAECH7P14850S9VV6P94",
        "num_docs": 1337,
        "uncompressed_docs_size_bytes": 23933408,
        "file_name": "01GK1XNAECH7P14850S9VV6P94.split",
        "file_size_bytes": 2991676
    }
]
```

### Get all indexes metadata

```
GET api/v1/indexes
```

Retrieve the metadata of all indexes present in the metastore.

#### Response

The response is an array of `IndexMetadata`, and the content type is `application/json; charset=UTF-8.`


### Create a source

```
POST api/v1/indexes/<index id>/sources
```

Create source by posting a source config JSON payload.

#### POST payload

| Variable          | Type     | Description                                                                            | Default value |
|-------------------|----------|----------------------------------------------------------------------------------------|---------------|
| `version**       | `String` | Config format version, put your current Quickwit version.                               | _required_    |
| `source_id`     | `String` | Source ID. See ID [validation rules](../configuration/source-config.md).                 | _required_    |
| `source_type`   | `String` | Source type: `kafka`, `kinesis` or `pulsar`.                                             | _required_    |
| `num_pipelines` | `usize`  | Number of running indexing pipelines per node for this source.                           | `1`           |
| `transform`     | `object` | A [VRL](https://vector.dev/docs/reference/vrl/) transformation applied to incoming documents, as defined in [source config docs](../configuration/source-config.md#transform-parameters).                          | `null`         |
| `params`        | `object` | Source parameters as defined in [source config docs](../configuration/source-config.md). | _required_    |


**Payload Example**

curl -XPOST http://localhost:7280/api/v1/indexes/my-index/sources --data @source_config.json -H "Content-Type: application/json"

```json title="source_config.json
{
    "version": "0.8",
    "source_id": "kafka-source",
    "source_type": "kafka",
    "params": {
        "topic": "quickwit-fts-staging",
        "client_params": {
            "bootstrap.servers": "kafka-quickwit-server:9092"
        }
    }
}
```

#### Response

The response is the created source config, and the content type is `application/json; charset=UTF-8.`

### Update a source

```
PUT api/v1/indexes/<index id>/sources/<source id>
```

#### Path variable

| Variable      | Description   |
| ------------- | ------------- |
| `index id`    | The index id  |
| `source id`   | The source id  |

#### Query parameters

| Variable  | Type   | Description                                   | Default value |
|-----------|--------|-----------------------------------------------|---------------|
| `create`  | `bool` | Create the index if it doesn't already exists | `false`       |

Update a source by posting a source config JSON payload.

#### PUT payload

| Variable          | Type     | Description                                                                            | Default value |
|-------------------|----------|----------------------------------------------------------------------------------------|---------------|
| `version**       | `String` | Config format version, put your current Quickwit version.                               | _required_    |
| `source_id`     | `String` | Source ID, must be the same source as in the request URL.                                | _required_    |
| `source_type`   | `String` | Source type: `kafka`, `kinesis` or `pulsar`. Cannot be updated.                          | _required_    |
| `num_pipelines` | `usize`  | Number of running indexing pipelines per node for this source.                           | `1`           |
| `transform`     | `object` | A [VRL](https://vector.dev/docs/reference/vrl/) transformation applied to incoming documents, as defined in [source config docs](../configuration/source-config.md#transform-parameters).                          | `null`         |
| `params`        | `object` | Source parameters as defined in [source config docs](../configuration/source-config.md). | _required_    |

:::warning

While updating `num_pipelines` and `transform` is generally safe and reversible, updating `params` has consequences specific to the source type and might have side effects such as loosing the source's checkpoints. Perform such updates with great care. 

:::

**Payload Example**

curl -XPOST http://localhost:7280/api/v1/indexes/my-index/sources --data @source_config.json -H "Content-Type: application/json"

```json title="source_config.json
{
    "version": "0.8",
    "source_id": "kafka-source",
    "source_type": "kafka",
    "params": {
        "topic": "quickwit-fts-staging",
        "client_params": {
            "bootstrap.servers": "kafka-quickwit-server:9092"
        }
    }
}
```

#### Response

The response is the created source config, and the content type is `application/json; charset=UTF-8.`

### Toggle source

```
PUT api/v1/indexes/<index id>/sources/<source id>/toggle
```

Toggle (enable/disable) source `source id` of index ID `index id`.

It returns an empty body.

#### PUT payload

| Variable          | Type     | Description                                                                                          |
|-------------------|----------|------------------------------------------------------------------------------------------------------|
| `enable`       | `bool` | If `true` enable the source, else disable it.                                |

### Reset source checkpoint

```
PUT api/v1/indexes/<index id>/sources/<source id>/reset-checkpoint
```

Resets checkpoints of source `source id` of index ID `index id`.

It returns an empty body.

### Delete a source

```
DELETE api/v1/indexes/<index id>/sources/<source id>
```

Delete source of ID `<source id>`.


## Cluster API

This endpoint lets you check the state of the cluster from the point of view of the node handling the request.

```
GET api/v1/cluster?format=pretty_json
```

#### Parameters

Name | Type | Description | Default value
--- | --- | --- | ---
`format` | `String` | The output format requested for the response: `json` or `pretty_json` | `pretty_json`


## Delete API

The delete API enables to delete documents matching a query.

### Create a delete task

```
POST api/v1/<index id>/delete-tasks
```

Create a delete task that will delete all documents matching the provided query in the given index `<index id>`.
The endpoint simply appends your delete task to the delete task queue in the metastore. The deletion will eventually be executed.

#### Path variable

| Variable      | Description   |
| ------------- | ------------- |
| `index id`  | The index id  |


#### POST payload `DeleteQuery`


| Variable            | Type       | Description                                                                                             | Default value                                      |
|---------------------|------------|---------------------------------------------------------------------------------------------------------|----------------------------------------------------|
| `query`           | `String`   | Query text. See the [query language doc](query-language.md)                                               | _required_                                         |
| `search_field`    | `[String]` | Fields to search on. Comma-separated list, e.g. "field1,field2"                                           | index_config.search_settings.default_search_fields |
| `start_timestamp` | `i64`      | If set, restrict search to documents with a `timestamp >= start_timestamp`. The value must be in seconds. |                                                    |
| `end_timestamp`   | `i64`      | If set, restrict search to documents with a `timestamp < end_timestamp`. The value must be in seconds.    |                                                    |


**Example**

```json
{
    "query": "body:trash",
    "start_timestamp": "1669738645",
    "end_timestamp": "1669825046",
}
```

#### Response

The response is the created delete task represented in JSON, `DeleteTask`, the content type is `application/json; charset=UTF-8.`

| Field                | Description                                            |     Type      |
|----------------------|--------------------------------------------------------|:-------------:|
| `create_timestamp` | Create timestamp of the delete query in seconds        |     `i64`     |
| `opstamp`          | Unique operation stamp associated with the delete task |     `u64`     |
| `delete_query`     | The posted delete query                                | `DeleteQuery` |


### List delete queries

```
GET api/v1/<index id>/delete-tasks
```

Get the list of delete tasks for a given `index_id`.


#### Response

The response is an array of `DeleteTask`.


## Index template API

This API manages index template resources. Templates are higher level configuration objects used to automatically create indexes according to predefined rules. See [index template configuration](../configuration/template-config.md).

### Create a template

```
POST api/v1/templates
```

#### POST payload

Create an index template by posting a [template configuration](../configuration/template-config.md) payload. The API accepts JSON with the header `content-type: application/json` and YAML with `content-type: application/yaml`.

**Example**

```yaml
version: 0.9 # File format version.

template_id: "all-logs"

index_root_uri: "s3://my-bucket/logs/"

description: "All my logs"

index_id_patterns:
    - logs-*

priority: 100

doc_mapping:
  mode: dynamic
  field_mappings:
    - name: timestamp
      type: datetime
      input_formats:
        - unix_timestamp
      output_format: unix_timestamp_secs
      fast: true
  timestamp_field: timestamp
```

#### Response

The created index template configuration as JSON.


### Update a template

```
PUT api/v1/templates/<template id>
```

#### Path variable

| Variable      | Description   |
| ------------- | ------------- |
| `template id` | The template id  |


#### POST payload

Update an index template by posting an [template configuration](../configuration/template-config.md) payload. The API accepts JSON with the header `content-type: application/json` and YAML with `content-type: application/yaml`.

**Example**

See [create endpoint](#create-a-template).

#### Response

The updated template configuration as JSON.

### List the templates

```
GET api/v1/templates
```

#### Response

An array with all the existing index template configurations as JSON.

### Get a template

```
GET api/v1/templates/<template id>
```

#### Path variable

| Variable      | Description   |
| ------------- | ------------- |
| `template id` | The template id  |

#### Response

The requested index template configuration as JSON.

### Delete a template

```
DELETE api/v1/templates/<template id>
```

#### Path variable

| Variable      | Description   |
| ------------- | ------------- |
| `template id` | The template id  |

#### Response

Empty response.


================================================
FILE: docs/reference/updating-mapper.md
================================================
# Updating the doc mapping of an index

Quickwit allows updating the mapping it uses to add more fields to an existing index or change how they are indexed. In doing so, it does not reindex existing data but still lets you search through older documents where possible.

## Indexing

When you update a doc mapping for an index, Quickwit will restart indexing pipelines to take the changes into account. As both this operation and the document ingestion are asynchronous, there is no strict happens-before relationship between ingestion and update. This means a document ingested just before the update may be indexed according to the newer doc mapper, and document ingested just after the update may be indexed with the older doc mapper.

:::warning

If you use the ingest or ES bulk API (V2), the old doc mapping will still be used to validate new documents that end up being persisted on existing shards (see [#5738](https://github.com/quickwit-oss/quickwit/issues/5738)).

:::

## Querying

Quickwit always validate queries against the most recent mapping.
If a query was valid under a previous mapping but is not compatible with the newer mapping, that query will be rejected.
For instance if a field which was indexed no longer is, any query that uses it will become invalid.
On the other hand, if a query was not valid for a previous doc mapping, but is valid under the new doc mapping, Quickwit will process the query.
When querying newer splits, it will behave normally, when querying older splits, it will try to execute the query as correctly as possible.
If you find yourself in a situation where older splits causes a valid request to return an error, please open a bug report.
See examples 1 and 2 below for clarification.

Change in tokenizer affect only newer splits, older splits keep using the tokenizers they were created with.

Document retrieved are mapped from Quickwit internal format to JSON based on the latest doc mapping. This means if fields are deleted,
they will stop appearing (see also Reversibility below) unless mapper mode is Dynamic. If the type of some field changed, it will be converted on a best-effort basis:
integers will get turned into text, text will get turned into string when it is possible, otherwise, the field is omited.
See example 3 for clarification.

## Reversibility

Quickwit does not modify existing data when receiving a new doc mapping. If you realize that you updated the mapping in a wrong way, you can re-update your index using the previous mapping. Documents indexed while the mapping was wrong will be impacted, but any document that was committed before the change will be queryable as if nothing happened.

## Type update reference

Conversion from a type to itself is omitted. Conversions that never succeed and always omit the field are omitted, too.

<!-- this is extracted from `quickwit_doc_mapper::::default_doc_mapper::value_to_json()` -->
| type before | type after | behavior |
|-------------|------------|
| u64/i64/f64 | text | convert to decimal string |
| date | text | convert to rfc3339 textual representation |
| ip | text | convert to IPv6 representation. For IPv4, convert to IPv4-mapped IPv6 address (`::ffff:1.2.3.4`) |
| bool | text | convert to "true" or false" |
| u64/i64/f64 | bool | convert 0/0.0 to false and 1/1.0 to true, otherwise omit |
| text | bool | convert if "true" or "false" (lowercase), otherwise omit |
| text | ip | convert if valid IPv4 or IPv6, otherwise omit |
| text | f64 | convert if valid floating point number, otherwise omit |
| u64/i64 | f64 | convert, possibly with loss of precision |
| bool | f64 | convert to 0.0 for false, and 1.0 for true |
| text | u64 | convert is valid integer in range 0..2\*\*64, otherwise omit |
| i64 | u64 | convert if in range 0..2\*\*63, otherwise omit |
| f64 | u64 | convert if in range 0..2\*\*64, possibly with loss of precision, otherwise omit |
| text | i64 | convert is valid integer in range -2\*\*63..2\*\*63, otherwise omit |
| u64 | i64 | convert if in range 0..2\*\*63, otherwise omit |
| f64 | i64 | convert if in range -2\*\*63..2\*\*63, possibly with loss of precision, otherwise omit |
| bool | i64 | convert to 0 for false, and 1 for true |
| text | datetime | parse according to current input\_format, otherwise omit |
| u64 | datetime | parse according to current input\_format, otherwise omit |
| i64 | datetime | parse according to current input\_format, otherwise omit |
| f64 | datetime | parse according to current input\_format, otherwise omit |
| array\<T\> | array\<U\> | convert individual elements, skipping over those which can't be converted |
| T | array\<U\> | convert element, emiting array of a single element, or empty array if it can't be converted |
| array\<T\> | U | convert individual elements, keeping the first which can be converted |
| json | object | try convert individual elements if they exists inside object, omit individual elements which can't be |
| object | json | convert individual elements. Previous lists of one element are converted to a single element not in an array.

## Examples

In the below examples, fields which are not relevant are removed for conciseness, you will not be able to use these index config as is.

### Example 1

before:
```yaml
doc_mapping:
  field_mappings:
    - name: field1
      type: text
      tokenizer: raw
```

after:
```yaml
doc_mapping:
  field_mappings:
    - name: field1
      type: text
      indexed: false
```

A field changed from being indexed to not being indexed.
A query such as `field1:my_value` was valid, but is now rejected.

### Example 2

before:
```yaml
doc_mapping:
  field_mappings:
    - name: field1
      type: text
      indexed: false
    - name: field2
      type: text
      tokenizer: raw

```

after:
```yaml
doc_mapping:
  field_mappings:
    - name: field1
      type: text
      tokenizer: raw
    - name: field2
      type: text
      tokenizer: raw
```

A field changed from being not indexed to being indexed.
A query such as `field1:my_value` was invalid before, and is now valid. When querying older splits, it won't return a match, but won't return an error either.
A query such as `field1:my_value OR field2:my_value` is now valid too. For old splits, it will return the same results as `field2:my_value` as field1 wasn't indexed before. For newer splits, it will return the expected results.
A query such as `NOT field1:my_value` would return all documents for old splits, and only documents where `field1` is not `my_value` for newer splits.


### Example 3

# show cast (trivial, valid and invalid)
# show array to single

before:
```yaml
doc_mapping:
  field_mappings:
    - name: field1
      type: text
    - name: field2
      type: u64
    - name: field3
      type: array<text>
```
document presents before update:
```json
{
  "field1": "123",
  "field2": 456,
  "field3": ["abc", "def"]
}
{
  "field1": "message",
  "field2": 987,
  "field3": ["ghi"]
}
```

after:
```yaml
doc_mapping:
  field_mappings:
    - name: field1
      type: u64
    - name: field2
      type: text
    - name: field3
      type: text
```

When querying this index, the documents returned would become:
```json
{
  "field1": 123,
  "field2": "456",
  "field3": "abc"
}
{
  // field1 is missing because "message" can't be converted to int
  "field2": "987",
  "field3": "ghi"
}
```


================================================
FILE: docs/telemetry.md
================================================
---
title: Telemetry
sidebar_position: 12
---

Quickwit, Inc. collects anonymous data regarding general usage to help us drive our development. Privacy and transparency are at the heart of Quickwit values and we only collect the minimal useful data and don't use any third party tool for the collection.

## Disabling data collection

Data collection are opt-out. To disable them, just set the environment variable `QW_DISABLE_TELEMETRY` to whatever value.

```bash
export QW_DISABLE_TELEMETRY=1
```

Look at `--help` command output to check whether telemetry is enabled or not:
```bash
quickwit --help
Quickwit 0.7
Sub-second search & analytics engine on cloud storage.
  Find more information at https://quickwit.io/docs

Telemetry enabled
```

The line `Telemetry enabled` disappears when you disable it.

## Which data are collected?

We collect the minimum amount of information to respect privacy. Here are the data collected:
- type of events among create, index, delete and serve events
- client information:
  - session uuid: uuid generated on the fly
  - quickwit version
  - os (linux, macos, freebsd, android...)
  - architecture of the CPU
  - md5 hash of host and username
  - a boolean to know if `KUBERNETES_SERVICE_HOST` is set.

All data are sent to `telemetry.quickwit.io`.

## No third party

We did not want to add any untrusted third party tool in the collection so we decided to implement and host our own metric collection server.


================================================
FILE: install.sh
================================================
#!/bin/bash

# installer.sh
#
# This is just a little script that can be downloaded from the internet to
# install Quickwit.
# It just does platform detection, fetches the latest appropriate release version from github
# and execute the appropriate commands to download the binary.
#
# Heavily inspired by the Vector & Meilisearch installation scripts

set -u

# If PACKAGE_ROOT is unset or empty, default it.
PACKAGE_ROOT="${PACKAGE_ROOT:-"https://github.com/quickwit-oss/quickwit/releases/download"}"
PACKAGE_RELEASE_API="${PACKAGE_RELEASE_API:-"https://api.github.com/repos/quickwit-oss/quickwit/releases"}"
PACKAGE_NAME="quickwit"
_divider="--------------------------------------------------------------------------------"
_prompt=">>>"
_indent="   "

header() {
    cat 1>&2 <<EOF

                                   Q U I C K W I T
                                      Installer

$_divider
Website: https://quickwit.io/
Docs: https://quickwit.io/docs/
$_divider

EOF
}

usage() {
    cat 1>&2 <<EOF
quickwit-install
The installer for Quickwit (https://quickwit.io/)

USAGE:
    quickwit-install [FLAGS] [OPTIONS]

FLAGS:
    -h, --help              Prints help information
EOF
}

main() {
    downloader --check
    header
    install_from_archive "${1:-""}"
}

install_from_archive() {
    need_cmd cp
    need_cmd mv
    need_cmd rm
    need_cmd tar
    need_cmd gzip
    need_cmd chmod
    need_cmd grep
    need_cmd head
    need_cmd sed
    need_cmd curl

    get_architecture || return 1
    local _arch="$RETVAL"
    assert_nz "$_arch" "arch"

    local _binary_arch=""
    case "$_arch" in
        aarch64-apple-darwin)
            _binary_arch=$_arch
            ;;
        x86_64-apple-darwin)
            _binary_arch=$_arch
            ;;
        x86_64-*linux*-gnu)
            _binary_arch="x86_64-unknown-linux-gnu"
            ;;
        aarch64-*linux*-gnu)
            _binary_arch="aarch64-unknown-linux-gnu"
            ;;
        *)
            printf "%s A pre-built package is not available for your OS architecture: %s" "$_prompt" "$_arch"
            printf "\n"
            err "You can easily build it from source following the docs: https://quickwit.io/docs"
            ;;
    esac

    local _version=$(get_latest_version "$1")
    local _archive_content_file="quickwit-${_version}-${_binary_arch}"
    local _file="${_archive_content_file}.tar.gz"
    local _url="${PACKAGE_ROOT}/${_version}/${_file}"

    printf "%s Downloading Quickwit via %s" "$_prompt" "$_url"
    ensure downloader "$_url" "$_file"
    printf "\n"

    printf "%s Unpacking archive ..." "$_prompt"
    ensure tar -xzf "$_file"
    chmod 744 "./quickwit-${_version}/quickwit"
    ensure rm "$_file"
    printf "\n"

    printf "\n"
    printf "%s Install succeeded!\n" "$_prompt"
    printf "%s To start using Quickwit:\n" "$_prompt"
    printf "\n"
    printf "%s ./quickwit-${_version}/quickwit --version \n" "$_indent"
    printf "\n"
    printf "%s More information at https://quickwit.io/docs/\n" "$_prompt"

    local _retval=$?

    return "$_retval"
}

# ------------------------------------------------------------------------------
# semverParseInto and semverLT from https://github.com/cloudflare/semver_bash/blob/master/semver.sh
#
# usage: semverParseInto version major minor patch special
# version: the string version
# major, minor, patch, special: will be assigned by the function
# ------------------------------------------------------------------------------

semverParseInto() {
    local RE='[^0-9]*\([0-9]*\)[.]\([0-9]*\)[.]\([0-9]*\)\([0-9A-Za-z-]*\)'
    #MAJOR
    eval $2=`echo $1 | sed -e "s#$RE#\1#"`
    #MINOR
    eval $3=`echo $1 | sed -e "s#$RE#\2#"`
    #PATCH
    eval $4=`echo $1 | sed -e "s#$RE#\3#"`
    #SPECIAL
    eval $5=`echo $1 | sed -e "s#$RE#\4#"`
}

# usage: semverLT version1 version2
semverLT() {
    local MAJOR_A=0
    local MINOR_A=0
    local PATCH_A=0
    local SPECIAL_A=0

    local MAJOR_B=0
    local MINOR_B=0
    local PATCH_B=0
    local SPECIAL_B=0

    semverParseInto $1 MAJOR_A MINOR_A PATCH_A SPECIAL_A
    semverParseInto $2 MAJOR_B MINOR_B PATCH_B SPECIAL_B

    if [ $MAJOR_A -lt $MAJOR_B ]; then
        return 0
    fi
    if [ $MAJOR_A -le $MAJOR_B ] && [ $MINOR_A -lt $MINOR_B ]; then
        return 0
    fi
    if [ $MAJOR_A -le $MAJOR_B ] && [ $MINOR_A -le $MINOR_B ] && [ $PATCH_A -lt $PATCH_B ]; then
        return 0
    fi
    if [ "_$SPECIAL_A"  == "_" ] && [ "_$SPECIAL_B"  == "_" ] ; then
        return 1
    fi
    if [ "_$SPECIAL_A"  == "_" ] && [ "_$SPECIAL_B"  != "_" ] ; then
        return 1
    fi
    if [ "_$SPECIAL_A"  != "_" ] && [ "_$SPECIAL_B"  == "_" ] ; then
        return 0
    fi
    if [ "_$SPECIAL_A" < "_$SPECIAL_B" ]; then
        return 0
    fi

    return 1
}

# Returns the tag of the latest stable release (in terms of semver and not of release date)
get_latest_version() {
    GREP_SEMVER_REGEXP='v\([0-9]*\)[.]\([0-9]*\)[.]\([0-9]*\)$' # i.e. v[number].[number].[number]
    temp_file='temp_file' # temp_file needed because the grep would start before the download is over
    curl -s "${PACKAGE_RELEASE_API}" > "$temp_file" || return 1
    releases=$(cat "$temp_file" | \
        grep -E "tag_name|draft|prerelease" \
        | tr -d ',"' | cut -d ':' -f2 | tr -d ' ')
        # Returns a list of [tag_name draft_boolean prerelease_boolean ...]
        # Ex: v0.10.1 false false v0.9.1-rc.1 false true v0.9.0 false false...

    # clean up early
    rm -f "$temp_file"

    if [ "$1" = "--allow-any-latest-version" ]; then
        local first_release=$(echo $releases | { read first rest; echo $first; })
        echo $first_release
        return
    fi

    i=0
    latest=""
    current_tag=""
    for release_info in $releases; do
        if [ $i -eq 0 ]; then # Checking tag_name
            if echo "$release_info" | grep -q "$GREP_SEMVER_REGEXP"; then # If it's not an alpha or beta release
                current_tag=$release_info
            else
                current_tag=""
            fi
            i=1
        elif [ $i -eq 1 ]; then # Checking draft boolean
            if [ "$release_info" = "true" ]; then
                current_tag=""
            fi
            i=2
        elif [ $i -eq 2 ]; then # Checking prerelease boolean
            if [ "$release_info" = "true" ]; then
                current_tag=""
            fi
            i=0
            if [ "$current_tag" != "" ]; then # If the current_tag is valid
                if [ "$latest" = "" ]; then # If there is no latest yet
                    latest="$current_tag"
                else
                    semverLT $current_tag $latest # Comparing latest and the current tag
                    if [ $? -eq 1 ]; then
                        latest="$current_tag"
                    fi
                fi
            fi
        fi
    done

    echo $latest
}

# ------------------------------------------------------------------------------
# All code below here was copied from https://sh.rustup.rs and can safely
# be updated if necessary.
# ------------------------------------------------------------------------------

get_gnu_musl_glibc() {
  need_cmd ldd
  need_cmd bc
  need_cmd awk
  # Detect both gnu and musl
  local _ldd_version
  local _glibc_version
  _ldd_version=$(ldd --version)
  if ldd --version 2>&1 | grep -Eq 'GNU'; then
    _glibc_version=$(echo "$_ldd_version" | awk '/ldd/{print $NF}')
    if [ 1 -eq "$(echo "${_glibc_version} < 2.18" | bc)" ]; then
      echo "musl"
    else
      echo "gnu"
    fi
  elif ldd --version 2>&1 | grep -Eq "musl"; then
    echo "musl"
  else
    err "Warning: Unable to detect architecture from ldd (using gnu-unknown)"
  fi
}

get_bitness() {
    need_cmd head
    # Architecture detection without dependencies beyond coreutils.
    # ELF files start out "\x7fELF", and the following byte is
    #   0x01 for 32-bit and
    #   0x02 for 64-bit.
    # The printf builtin on some shells like dash only supports octal
    # escape sequences, so we use those.
    local _current_exe_head
    _current_exe_head=$(head -c 5 /proc/self/exe )
    if [ "$_current_exe_head" = "$(printf '\177ELF\001')" ]; then
        echo 32
    elif [ "$_current_exe_head" = "$(printf '\177ELF\002')" ]; then
        echo 64
    else
        err "unknown platform bitness"
    fi
}

get_endianness() {
    local cputype=$1
    local suffix_eb=$2
    local suffix_el=$3

    # detect endianness without od/hexdump, like get_bitness() does.
    need_cmd head
    need_cmd tail

    local _current_exe_endianness
    _current_exe_endianness="$(head -c 6 /proc/self/exe | tail -c 1)"
    if [ "$_current_exe_endianness" = "$(printf '\001')" ]; then
        echo "${cputype}${suffix_el}"
    elif [ "$_current_exe_endianness" = "$(printf '\002')" ]; then
        echo "${cputype}${suffix_eb}"
    else
        err "unknown platform endianness"
    fi
}

get_architecture() {
    local _ostype _cputype _bitness _arch
    _ostype="$(uname -s)"
    _cputype="$(uname -m)"

    if [ "$_ostype" = Linux ]; then
        if [ "$(uname -o)" = Android ]; then
            _ostype=Android
        fi
    fi

    if [ "$_ostype" = Darwin ] && [ "$_cputype" = i386 ]; then
        # Darwin `uname -m` lies
        if sysctl hw.optional.x86_64 | grep -q ': 1'; then
            _cputype=x86_64
        fi
    fi

    case "$_ostype" in

        Android)
            _ostype=linux-android
            ;;

        Linux)
            case $(get_gnu_musl_glibc) in
              "musl")
                _ostype=unknown-linux-musl
                ;;
              "gnu")
                _ostype=unknown-linux-gnu
                ;;
              # Fallback
              *)
                _ostype=unknown-linux-gnu
                ;;
            esac
            _bitness=$(get_bitness)
            ;;

        FreeBSD)
            _ostype=unknown-freebsd
            ;;

        NetBSD)
            _ostype=unknown-netbsd
            ;;

        DragonFly)
            _ostype=unknown-dragonfly
            ;;

        Darwin)
            _ostype=apple-darwin
            ;;

        MINGW* | MSYS* | CYGWIN*)
            _ostype=pc-windows-gnu
            ;;

        *)
            err "unrecognized OS type: $_ostype"
            ;;

    esac

    case "$_cputype" in

        i386 | i486 | i686 | i786 | x86)
            _cputype=i686
            ;;

        xscale | arm)
            _cputype=arm
            if [ "$_ostype" = "linux-android" ]; then
                _ostype=linux-androideabi
            fi
            ;;

        armv6l)
            _cputype=arm
            if [ "$_ostype" = "linux-android" ]; then
                _ostype=linux-androideabi
            else
                _ostype="${_ostype}eabihf"
            fi
            ;;

        armv7l | armv8l)
            _cputype=armv7
            if [ "$_ostype" = "linux-android" ]; then
                _ostype=linux-androideabi
            else
                _ostype="${_ostype}eabihf"
            fi
            ;;

        aarch64 | arm64)
            _cputype=aarch64
            ;;

        x86_64 | x86-64 | x64 | amd64)
            _cputype=x86_64
            ;;

        mips)
            _cputype=$(get_endianness mips '' el)
            ;;

        mips64)
            if [ "$_bitness" -eq 64 ]; then
                # only n64 ABI is supported for now
                _ostype="${_ostype}abi64"
                _cputype=$(get_endianness mips64 '' el)
            fi
            ;;

        ppc)
            _cputype=powerpc
            ;;

        ppc64)
            _cputype=powerpc64
            ;;

        ppc64le)
            _cputype=powerpc64le
            ;;

        s390x)
            _cputype=s390x
            ;;

        *)
            err "unknown CPU type: $_cputype"

    esac

    # Detect 64-bit linux with 32-bit userland
    if [ "${_ostype}" = unknown-linux-gnu ] && [ "${_bitness}" -eq 32 ]; then
        case $_cputype in
            x86_64)
                _cputype=i686
                ;;
            mips64)
                _cputype=$(get_endianness mips '' el)
                ;;
            powerpc64)
                _cputype=powerpc
                ;;
            aarch64)
                _cputype=armv7
                if [ "$_ostype" = "linux-android" ]; then
                    _ostype=linux-androideabi
                else
                    _ostype="${_ostype}eabihf"
                fi
                ;;
        esac
    fi

    # Detect armv7 but without the CPU features Rust needs in that build,
    # and fall back to arm.
    # See https://github.com/rust-lang/rustup.rs/issues/587.
    if [ "$_ostype" = "unknown-linux-gnueabihf" ] && [ "$_cputype" = armv7 ]; then
        if ensure grep '^Features' /proc/cpuinfo | grep -q -v neon; then
            # At least one processor does not have NEON.
            _cputype=arm
        fi
    fi

    _arch="${_cputype}-${_ostype}"

    RETVAL="$_arch"
}

err() {
    echo "$_prompt $1" >&2
    exit 1
}

need_cmd() {
    if ! check_cmd "$1"; then
        err "Error: the install script failed because the command '$1' was not found"
    fi
}

check_cmd() {
    command -v "$1" > /dev/null 2>&1
}

assert_nz() {
    if [ -z "$1" ]; then err "assert_nz $2"; fi
}

# Run a command that should never fail. If the command fails execution
# will immediately terminate with an error showing the failing
# command.
ensure() {
    local output
    output="$("$@" 2>&1 > /dev/null)"

    if [ "$output" ]; then
        echo ""
        echo "$_prompt command failed: $*"
        echo ""
        echo "$_divider"
        echo ""
        echo "$output" >&2
        exit 1
    fi
}

# This is just for indicating that commands' results are being
# intentionally ignored. Usually, because it's being executed
# as part of error handling.
ignore() {
    "$@"
}

# This wraps curl or wget. Try curl first, if not installed,
# use wget instead.
downloader() {
    if [ "$1" = --check ]; then
        need_cmd curl
    else
        if ! check_help_for curl --proto --tlsv1.2; then
            echo "Warning: Not forcing TLS v1.2, this is potentially less secure"
            curl --silent --show-error --fail --location "$1" --output "$2"
        else
            curl --proto '=https' --tlsv1.2 --silent --show-error --fail --location "$1" --output "$2"
        fi
    fi
}

check_help_for() {
    local _cmd
    local _arg
    local _ok
    _cmd="$1"
    _ok="y"
    shift

    # If we're running on OS-X, older than 10.13, then we always
    # fail to find these options to force fallback
    if check_cmd sw_vers; then
        if [ "$(sw_vers -productVersion | cut -d. -f2)" -lt 13 ]; then
            # Older than 10.13
            echo "Warning: Detected OS X platform older than 10.13"
            _ok="n"
        fi
    fi

    for _arg in "$@"; do
        if ! "$_cmd" --help | grep -q -- "$_arg"; then
            _ok="n"
        fi
    done

    test "$_ok" = "y"
}

main "$@" || exit 1


================================================
FILE: monitoring/grafana/README.md
================================================
# Grafana dashboards for monitoring Quickwit

The list of featured dashboards:
- [x] Metastore
- [x] Indexers
- [x] Searchers
- [ ] Janitor


================================================
FILE: monitoring/grafana/dashboards/indexers.json
================================================
{
  "annotations": {
    "list": [
      {
        "builtIn": 1,
        "datasource": {
          "type": "grafana",
          "uid": "-- Grafana --"
        },
        "enable": true,
        "hide": true,
        "iconColor": "rgba(0, 211, 255, 1)",
        "name": "Annotations & Alerts",
        "target": {
          "limit": 100,
          "matchAny": false,
          "tags": [],
          "type": "dashboard"
        },
        "type": "dashboard"
      }
    ]
  },
  "description": "",
  "editable": true,
  "fiscalYearStartMonth": 0,
  "graphTooltip": 0,
  "links": [],
  "liveNow": false,
  "panels": [
    {
      "datasource": {
        "type": "prometheus",
        "uid": "${datasource}"
      },
      "fieldConfig": {
        "defaults": {
          "color": {
            "mode": "palette-classic"
          },
          "mappings": [],
          "thresholds": {
            "mode": "absolute",
            "steps": [
              {
                "color": "green",
                "value": null
              },
              {
                "color": "red",
                "value": 80
              }
            ]
          },
          "unit": "Bps"
        },
        "overrides": []
      },
      "gridPos": {
        "h": 8,
        "w": 6,
        "x": 0,
        "y": 0
      },
      "id": 10,
      "options": {
        "colorMode": "value",
        "graphMode": "none",
        "justifyMode": "auto",
        "orientation": "auto",
        "reduceOptions": {
          "calcs": [
            "lastNotNull"
          ],
          "fields": "",
          "values": false
        },
        "showPercentChange": false,
        "textMode": "auto",
        "wideLayout": true
      },
      "pluginVersion": "10.4.1",
      "targets": [
        {
          "datasource": {
            "type": "prometheus",
            "uid": "${datasource}"
          },
          "editorMode": "builder",
          "expr": "sum by(docs_processed_status) (rate(quickwit_indexing_processed_bytes{instance=~\"$instance\"}[$__rate_interval]))",
          "legendFormat": "{{docs_processed_status}}",
          "range": true,
          "refId": "A"
        }
      ],
      "title": "Indexing throughput",
      "type": "stat"
    },
    {
      "datasource": {
        "type": "prometheus",
        "uid": "${datasource}"
      },
      "fieldConfig": {
        "defaults": {
          "color": {
            "mode": "palette-classic"
          },
          "mappings": [],
          "thresholds": {
            "mode": "absolute",
            "steps": [
              {
                "color": "green",
                "value": null
              },
              {
                "color": "red",
                "value": 80
              }
            ]
          },
          "unit": "suffix: docs/s"
        },
        "overrides": []
      },
      "gridPos": {
        "h": 8,
        "w": 6,
        "x": 6,
        "y": 0
      },
      "id": 11,
      "options": {
        "colorMode": "value",
        "graphMode": "none",
        "justifyMode": "auto",
        "orientation": "auto",
        "reduceOptions": {
          "calcs": [
            "lastNotNull"
          ],
          "fields": "",
          "values": false
        },
        "showPercentChange": false,
        "textMode": "auto",
        "wideLayout": true
      },
      "pluginVersion": "10.4.1",
      "targets": [
        {
          "datasource": {
            "type": "prometheus",
            "uid": "${datasource}"
          },
          "editorMode": "builder",
          "expr": "sum by(docs_processed_status) (rate(quickwit_indexing_processed_docs_total{instance=~\"$pod|$instance\"}[$__rate_interval]))",
          "legendFormat": "{{docs_processed_status}}",
          "range": true,
          "refId": "A"
        }
      ],
      "title": "Documents throughput",
      "type": "stat"
    },
    {
      "datasource": {
        "type": "prometheus",
        "uid": "${datasource}"
      },
      "fieldConfig": {
        "defaults": {
          "color": {
            "mode": "palette-classic"
          },
          "custom": {
            "axisBorderShow": false,
            "axisCenteredZero": false,
            "axisColorMode": "text",
            "axisLabel": "",
            "axisPlacement": "left",
            "axisSoftMax": -4,
            "axisSoftMin": 8,
            "barAlignment": 0,
            "drawStyle": "line",
            "fillOpacity": 8,
            "gradientMode": "none",
            "hideFrom": {
              "legend": false,
              "tooltip": false,
              "viz": false
            },
            "insertNulls": false,
            "lineInterpolation": "linear",
            "lineWidth": 1,
            "pointSize": 5,
            "scaleDistribution": {
              "type": "linear"
            },
            "showPoints": "auto",
            "spanNulls": false,
            "stacking": {
              "group": "A",
              "mode": "none"
            },
            "thresholdsStyle": {
              "mode": "off"
            }
          },
          "mappings": [],
          "thresholds": {
            "mode": "absolute",
            "steps": [
              {
                "color": "green",
                "value": null
              },
              {
                "color": "red",
                "value": 80
              }
            ]
          },
          "unit": "Bps"
        },
        "overrides": [
          {
            "matcher": {
              "id": "byName",
              "options": "valid"
            },
            "properties": [
              {
                "id": "color",
                "value": {
                  "mode": "continuous-GrYlRd",
                  "seriesBy": "last"
                }
              }
            ]
          },
          {
            "matcher": {
              "id": "byName",
              "options": "parsing_error"
            },
            "properties": [
              {
                "id": "color",
                "value": {
                  "mode": "continuous-RdYlGr"
                }
              }
            ]
          }
        ]
      },
      "gridPos": {
        "h": 8,
        "w": 12,
        "x": 12,
        "y": 0
      },
      "id": 2,
      "options": {
        "legend": {
          "calcs": [
            "min",
            "max",
            "mean"
          ],
          "displayMode": "table",
          "placement": "bottom",
          "showLegend": true
        },
        "tooltip": {
          "mode": "single",
          "sort": "none"
        }
      },
      "targets": [
        {
          "datasource": {
            "type": "prometheus",
            "uid": "${datasource}"
          },
          "editorMode": "builder",
          "exemplar": false,
          "expr": "sum by(docs_processed_status, index) (rate(quickwit_indexing_processed_bytes{instance=~\"$instance\"}[$__rate_interval]))",
          "format": "time_series",
          "instant": false,
          "interval": "",
          "legendFormat": "{{docs_processed_status}}-{{index}}",
          "range": true,
          "refId": "Indexing bytes rate"
        }
      ],
      "title": "Indexing throughput",
      "type": "timeseries"
    },
    {
      "datasource": {
        "type": "prometheus",
        "uid": "${datasource}"
      },
      "description": "",
      "fieldConfig": {
        "defaults": {
          "color": {
            "mode": "palette-classic"
          },
          "custom": {
            "axisBorderShow": false,
            "axisCenteredZero": false,
            "axisColorMode": "text",
            "axisLabel": "",
            "axisPlacement": "auto",
            "barAlignment": 0,
            "drawStyle": "line",
            "fillOpacity": 0,
            "gradientMode": "none",
            "hideFrom": {
              "legend": false,
              "tooltip": false,
              "viz": false
            },
            "insertNulls": false,
            "lineInterpolation": "linear",
            "lineWidth": 1,
            "pointSize": 5,
            "scaleDistribution": {
              "type": "linear"
            },
            "showPoints": "auto",
            "spanNulls": false,
            "stacking": {
              "group": "A",
              "mode": "none"
            },
            "thresholdsStyle": {
              "mode": "off"
            }
          },
          "decimals": 1,
          "mappings": [],
          "thresholds": {
            "mode": "absolute",
            "steps": [
              {
                "color": "green",
                "value": null
              },
              {
                "color": "red",
                "value": 80
              }
            ]
          },
          "unit": "Bps"
        },
        "overrides": []
      },
      "gridPos": {
        "h": 8,
        "w": 12,
        "x": 0,
        "y": 8
      },
      "id": 6,
      "options": {
        "legend": {
          "calcs": [],
          "displayMode": "list",
          "placement": "bottom",
          "showLegend": true
        },
        "tooltip": {
          "mode": "single",
          "sort": "none"
        }
      },
      "targets": [
        {
          "datasource": {
            "type": "prometheus",
            "uid": "${datasource}"
          },
          "editorMode": "builder",
          "exemplar": false,
          "expr": "rate(quickwit_write_bytes{instance=~\"$instance\"}[$__rate_interval])",
          "hide": false,
          "instant": false,
          "legendFormat": "{{instance}} {{component}}",
          "range": true,
          "refId": "Writes"
        }
      ],
      "title": "Writes rate",
      "type": "timeseries"
    },
    {
      "datasource": {
        "type": "prometheus",
        "uid": "${datasource}"
      },
      "fieldConfig": {
        "defaults": {
          "color": {
            "mode": "palette-classic"
          },
          "custom": {
            "axisBorderShow": false,
            "axisCenteredZero": false,
            "axisColorMode": "text",
            "axisLabel": "",
            "axisPlacement": "auto",
            "barAlignment": 0,
            "drawStyle": "line",
            "fillOpacity": 12,
            "gradientMode": "none",
            "hideFrom": {
              "legend": false,
              "tooltip": false,
              "viz": false
            },
            "insertNulls": false,
            "lineInterpolation": "linear",
            "lineWidth": 1,
            "pointSize": 5,
            "scaleDistribution": {
              "type": "linear"
            },
            "showPoints": "auto",
            "spanNulls": false,
            "stacking": {
              "group": "A",
              "mode": "none"
            },
            "thresholdsStyle": {
              "mode": "off"
            }
          },
          "mappings": [],
          "thresholds": {
            "mode": "absolute",
            "steps": [
              {
                "color": "green",
                "value": null
              },
              {
                "color": "red",
                "value": 80
              }
            ]
          },
          "unit": "decbytes"
        },
        "overrides": []
      },
      "gridPos": {
        "h": 8,
        "w": 12,
        "x": 12,
        "y": 8
      },
      "id": 8,
      "options": {
        "legend": {
          "calcs": [
            "min",
            "max",
            "mean"
          ],
          "displayMode": "table",
          "placement": "bottom",
          "showLegend": true
        },
        "tooltip": {
          "mode": "single",
          "sort": "none"
        }
      },
      "pluginVersion": "9.2.1",
      "targets": [
        {
          "datasource": {
            "type": "prometheus",
            "uid": "${datasource}"
          },
          "editorMode": "builder",
          "expr": "quickwit_memory_allocated_bytes{instance=~\"$instance\"}",
          "legendFormat": "{{instance}} allocated",
          "range": true,
          "refId": "A"
        },
        {
          "datasource": {
            "type": "prometheus",
            "uid": "${datasource}"
          },
          "editorMode": "builder",
          "expr": "quickwit_memory_resident_bytes{instance=~\"$instance\"}",
          "hide": false,
          "legendFormat": "{{instance}} RSS",
          "range": true,
          "refId": "C"
        }
      ],
      "title": "Memory usage (allocated and RSS)",
      "type": "timeseries"
    },
    {
      "datasource": {
        "type": "prometheus",
        "uid": "${datasource}"
      },
      "fieldConfig": {
        "defaults": {
          "color": {
            "mode": "palette-classic"
          },
          "custom": {
            "axisBorderShow": false,
            "axisCenteredZero": false,
            "axisColorMode": "text",
            "axisLabel": "",
            "axisPlacement": "auto",
            "barAlignment": 0,
            "drawStyle": "line",
            "fillOpacity": 14,
            "gradientMode": "hue",
            "hideFrom": {
              "legend": false,
              "tooltip": false,
              "viz": false
            },
            "insertNulls": false,
            "lineInterpolation": "linear",
            "lineStyle": {
              "fill": "solid"
            },
            "lineWidth": 1,
            "pointSize": 5,
            "scaleDistribution": {
              "type": "linear"
            },
            "showPoints": "auto",
            "spanNulls": false,
            "stacking": {
              "group": "A",
              "mode": "none"
            },
            "thresholdsStyle": {
              "mode": "off"
            }
          },
          "decimals": 1,
          "mappings": [],
          "thresholds": {
            "mode": "absolute",
            "steps": [
              {
                "color": "green",
                "value": null
              },
              {
                "color": "red",
                "value": 80
              }
            ]
          },
          "unit": "none"
        },
        "overrides": []
      },
      "gridPos": {
        "h": 8,
        "w": 12,
        "x": 0,
        "y": 16
      },
      "id": 13,
      "options": {
        "legend": {
          "calcs": [
            "min",
            "max",
            "mean"
          ],
          "displayMode": "table",
          "placement": "bottom",
          "showLegend": true
        },
        "tooltip": {
          "mode": "single",
          "sort": "none"
        }
      },
      "targets": [
        {
          "datasource": {
            "type": "prometheus",
            "uid": "${datasource}"
          },
          "editorMode": "builder",
          "expr": "quickwit_indexing_ongoing_merge_operations{instance=~\"$instance\"}",
          "hide": false,
          "legendFormat": "{{instance}} ongoing",
          "range": true,
          "refId": "Processed docs"
        },
        {
          "datasource": {
            "type": "prometheus",
            "uid": "${datasource}"
          },
          "editorMode": "builder",
          "expr": "quickwit_indexing_pending_merge_operations{instance=~\"$instance\"}",
          "hide": false,
          "legendFormat": "{{instance}} pending",
          "range": true,
          "refId": "A"
        }
      ],
      "title": "Merge operations (ongoing and pending)",
      "type": "timeseries"
    },
    {
      "datasource": {
        "type": "prometheus",
        "uid": "${datasource}"
      },
      "fieldConfig": {
        "defaults": {
          "color": {
            "mode": "palette-classic"
          },
          "custom": {
            "axisBorderShow": false,
            "axisCenteredZero": false,
            "axisColorMode": "text",
            "axisLabel": "",
            "axisPlacement": "auto",
            "barAlignment": 0,
            "drawStyle": "line",
            "fillOpacity": 7,
            "gradientMode": "none",
            "hideFrom": {
              "legend": false,
              "tooltip": false,
              "viz": false
            },
            "insertNulls": false,
            "lineInterpolation": "linear",
            "lineStyle": {
              "fill": "solid"
            },
            "lineWidth": 1,
            "pointSize": 4,
            "scaleDistribution": {
              "type": "linear"
            },
            "showPoints": "auto",
            "spanNulls": false,
            "stacking": {
              "group": "A",
              "mode": "none"
            },
            "thresholdsStyle": {
              "mode": "off"
            }
          },
          "decimals": 1,
          "mappings": [],
          "thresholds": {
            "mode": "absolute",
            "steps": [
              {
                "color": "green",
                "value": null
              },
              {
                "color": "red",
                "value": 80
              }
            ]
          },
          "unit": "Bps"
        },
        "overrides": [
          {
            "matcher": {
              "id": "byName",
              "options": "Upload bytes / sec"
            },
            "properties": [
              {
                "id": "custom.transform",
                "value": "negative-Y"
              }
            ]
          }
        ]
      },
      "gridPos": {
        "h": 8,
        "w": 12,
        "x": 12,
        "y": 16
      },
      "id": 4,
      "options": {
        "legend": {
          "calcs": [
            "min",
            "max",
            "mean"
          ],
          "displayMode": "table",
          "placement": "bottom",
          "showLegend": true
        },
        "tooltip": {
          "mode": "single",
          "sort": "none"
        }
      },
      "targets": [
        {
          "datasource": {
            "type": "prometheus",
            "uid": "${datasource}"
          },
          "editorMode": "builder",
          "expr": "sum by(pod) (rate(quickwit_storage_object_storage_download_num_bytes{instance=~\"$instance\"}[$__rate_interval]))",
          "legendFormat": "Download bytes / sec - {{pod}}",
          "range": true,
          "refId": "Download"
        },
        {
          "datasource": {
            "type": "prometheus",
            "uid": "${datasource}"
          },
          "editorMode": "builder",
          "expr": "sum by(pod) (rate(quickwit_storage_object_storage_upload_num_bytes{namespace=\"$namespace\", pod=~\"$pod\", instance=~\"$instance\"}[$__rate_interval]))",
          "hide": false,
          "legendFormat": "Upload bytes / sec - {{pod}}",
          "range": true,
          "refId": "Upload"
        }
      ],
      "title": "Object storage transfer rate",
      "type": "timeseries"
    },
    {
      "datasource": {
        "type": "prometheus",
        "uid": "${datasource}"
      },
      "fieldConfig": {
        "defaults": {
          "color": {
            "mode": "palette-classic"
          },
          "custom": {
            "axisBorderShow": false,
            "axisCenteredZero": false,
            "axisColorMode": "text",
            "axisLabel": "",
            "axisPlacement": "auto",
            "barAlignment": 0,
            "drawStyle": "line",
            "fillOpacity": 14,
            "gradientMode": "hue",
            "hideFrom": {
              "legend": false,
              "tooltip": false,
              "viz": false
            },
            "insertNulls": false,
            "lineInterpolation": "linear",
            "lineStyle": {
              "fill": "solid"
            },
            "lineWidth": 1,
            "pointSize": 5,
            "scaleDistribution": {
              "type": "linear"
            },
            "showPoints": "auto",
            "spanNulls": false,
            "stacking": {
              "group": "A",
              "mode": "none"
            },
            "thresholdsStyle": {
              "mode": "off"
            }
          },
          "decimals": 1,
          "mappings": [],
          "thresholds": {
            "mode": "absolute",
            "steps": [
              {
                "color": "green",
                "value": null
              },
              {
                "color": "red",
                "value": 80
              }
            ]
          },
          "unit": "none"
        },
        "overrides": []
      },
      "gridPos": {
        "h": 8,
        "w": 12,
        "x": 0,
        "y": 24
      },
      "id": 5,
      "options": {
        "legend": {
          "calcs": [
            "min",
            "max",
            "mean"
          ],
          "displayMode": "table",
          "placement": "bottom",
          "showLegend": true
        },
        "tooltip": {
          "mode": "single",
          "sort": "none"
        }
      },
      "targets": [
        {
          "datasource": {
            "type": "prometheus",
            "uid": "${datasource}"
          },
          "editorMode": "builder",
          "expr": "sum by(docs_processed_status, index) (rate(quickwit_indexing_processed_docs_total{instance=~\"$instance\"}[$__rate_interval]))",
          "hide": false,
          "legendFormat": "{{docs_processed_status}}-{{index}}",
          "range": true,
          "refId": "Processed docs"
        }
      ],
      "title": "Indexed documents rate",
      "type": "timeseries"
    },
    {
      "datasource": {
        "type": "prometheus",
        "uid": "${datasource}"
      },
      "fieldConfig": {
        "defaults": {
          "color": {
            "mode": "palette-classic"
          },
          "custom": {
            "axisBorderShow": false,
            "axisCenteredZero": false,
            "axisColorMode": "text",
            "axisLabel": "",
            "axisPlacement": "auto",
            "barAlignment": 0,
            "drawStyle": "line",
            "fillOpacity": 7,
            "gradientMode": "none",
            "hideFrom": {
              "legend": false,
              "tooltip": false,
              "viz": false
            },
            "insertNulls": false,
            "lineInterpolation": "linear",
            "lineStyle": {
              "fill": "solid"
            },
            "lineWidth": 1,
            "pointSize": 4,
            "scaleDistribution": {
              "type": "linear"
            },
            "showPoints": "auto",
            "spanNulls": false,
            "stacking": {
              "group": "A",
              "mode": "none"
            },
            "thresholdsStyle": {
              "mode": "off"
            }
          },
          "decimals": 1,
          "mappings": [],
          "thresholds": {
            "mode": "absolute",
            "steps": [
              {
                "color": "green",
                "value": null
              },
              {
                "color": "red",
                "value": 80
              }
            ]
          },
          "unit": "none"
        },
        "overrides": [
          {
            "matcher": {
              "id": "byName",
              "options": "Upload bytes / sec"
            },
            "properties": [
              {
                "id": "custom.transform",
                "value": "negative-Y"
              }
            ]
          }
        ]
      },
      "gridPos": {
        "h": 8,
        "w": 12,
        "x": 12,
        "y": 24
      },
      "id": 14,
      "options": {
        "legend": {
          "calcs": [
            "min",
            "max",
            "mean"
          ],
          "displayMode": "table",
          "placement": "bottom",
          "showLegend": true
        },
        "tooltip": {
          "mode": "single",
          "sort": "none"
        }
      },
      "targets": [
        {
          "datasource": {
            "type": "prometheus",
            "uid": "${datasource}"
          },
          "editorMode": "builder",
          "expr": "sum(rate(quickwit_storage_object_storage_gets_total{instance=~\"$instance\"}[$__rate_interval]))",
          "legendFormat": "GET req/sec",
          "range": true,
          "refId": "Download"
        },
        {
          "datasource": {
            "type": "prometheus",
            "uid": "${datasource}"
          },
          "editorMode": "builder",
          "expr": "sum(rate(quickwit_storage_object_storage_puts_total{namespace=\"$namespace\", pod=~\"$pod\", instance=~\"$instance\"}[$__rate_interval]))",
          "hide": false,
          "legendFormat": "PUT req/sec",
          "range": true,
          "refId": "Upload"
        }
      ],
      "title": "Requests on object storage",
      "type": "timeseries"
    },
    {
      "datasource": {
        "type": "prometheus",
        "uid": "${datasource}"
      },
      "fieldConfig": {
        "defaults": {
          "color": {
            "mode": "palette-classic"
          },
          "custom": {
            "axisBorderShow": false,
            "axisCenteredZero": false,
            "axisColorMode": "text",
            "axisLabel": "",
            "axisPlacement": "auto",
            "barAlignment": 0,
            "drawStyle": "line",
            "fillOpacity": 0,
            "gradientMode": "none",
            "hideFrom": {
              "legend": false,
              "tooltip": false,
              "viz": false
            },
            "insertNulls": false,
            "lineInterpolation": "linear",
            "lineWidth": 1,
            "pointSize": 5,
            "scaleDistribution": {
              "type": "linear"
            },
            "showPoints": "auto",
            "spanNulls": false,
            "stacking": {
              "group": "A",
              "mode": "none"
            },
            "thresholdsStyle": {
              "mode": "off"
            }
          },
          "mappings": [],
          "thresholds": {
            "mode": "absolute",
            "steps": [
              {
                "color": "green",
                "value": null
              },
              {
                "color": "red",
                "value": 80
              }
            ]
          },
          "unit": "µs"
        },
        "overrides": []
      },
      "gridPos": {
        "h": 8,
        "w": 12,
        "x": 0,
        "y": 32
      },
      "id": 15,
      "options": {
        "legend": {
          "calcs": [],
          "displayMode": "list",
          "placement": "bottom",
          "showLegend": true
        },
        "tooltip": {
          "mode": "single",
          "sort": "none"
        }
      },
      "targets": [
        {
          "datasource": {
            "type": "prometheus",
            "uid": "${datasource}"
          },
          "editorMode": "builder",
          "expr": "histogram_quantile(0.75, rate(quickwit_cli_thread_unpark_duration_microseconds_bucket{instance=~\"$instance\"}[$__rate_interval]))",
          "instant": false,
          "legendFormat": "{{pod}}",
          "range": true,
          "refId": "A"
        }
      ],
      "title": "Thread unpark duration",
      "type": "timeseries"
    },
    {
      "datasource": {
        "type": "prometheus",
        "uid": "${datasource}"
      },
      "fieldConfig": {
        "defaults": {
          "color": {
            "mode": "palette-classic"
          },
          "custom": {
            "axisBorderShow": false,
            "axisCenteredZero": false,
            "axisColorMode": "text",
            "axisLabel": "",
            "axisPlacement": "auto",
            "barAlignment": 0,
            "drawStyle": "line",
            "fillOpacity": 12,
            "gradientMode": "none",
            "hideFrom": {
              "legend": false,
              "tooltip": false,
              "viz": false
            },
            "insertNulls": false,
            "lineInterpolation": "linear",
            "lineWidth": 1,
            "pointSize": 5,
            "scaleDistribution": {
              "type": "linear"
            },
            "showPoints": "auto",
            "spanNulls": false,
            "stacking": {
              "group": "A",
              "mode": "none"
            },
            "thresholdsStyle": {
              "mode": "off"
            }
          },
          "mappings": [],
          "thresholds": {
            "mode": "absolute",
            "steps": [
              {
                "color": "green",
                "value": null
              },
              {
                "color": "red",
                "value": 80
              }
            ]
          },
          "unit": "µs"
        },
        "overrides": []
      },
      "gridPos": {
        "h": 8,
        "w": 12,
        "x": 12,
        "y": 32
      },
      "id": 12,
      "options": {
        "legend": {
          "calcs": [],
          "displayMode": "list",
          "placement": "bottom",
          "showLegend": true
        },
        "tooltip": {
          "mode": "single",
          "sort": "none"
        }
      },
      "pluginVersion": "9.2.1",
      "targets": [
        {
          "datasource": {
            "type": "prometheus",
            "uid": "${datasource}"
          },
          "editorMode": "builder",
          "expr": "rate(quickwit_indexing_backpressure_micros{instance=~\"$instance\"}[$__rate_interval])",
          "legendFormat": "{{actor_name}}-{{pod}}",
          "range": true,
          "refId": "A"
        }
      ],
      "title": "Backpressure",
      "type": "timeseries"
    }
  ],
  "refresh": "30s",
  "revision": 1,
  "schemaVersion": 39,
  "tags": [
    "quickwit",
    "indexer"
  ],
  "templating": {
    "list": [
      {
        "current": {
          "selected": true,
          "text": "Prometheus",
          "value": "PBFA97CFB590B2093"
        },
        "hide": 0,
        "includeAll": false,
        "label": "Datasource",
        "multi": false,
        "name": "datasource",
        "options": [],
        "query": "prometheus",
        "queryValue": "",
        "refresh": 1,
        "regex": "",
        "skipUrlSync": false,
        "type": "datasource"
      },
      {
        "current": {
          "selected": false,
          "text": "All",
          "value": "$__all"
        },
        "datasource": {
          "type": "prometheus",
          "uid": "${datasource}"
        },
        "definition": "label_values(quickwit_memory_in_flight_data_bytes, instance)",
        "hide": 0,
        "includeAll": true,
        "label": "Instance",
        "multi": false,
        "name": "instance",
        "options": [],
        "query": {
          "query": "label_values(quickwit_memory_in_flight_data_bytes, instance)",
          "refId": "StandardVariableQuery"
        },
        "refresh": 1,
        "regex": "",
        "skipUrlSync": false,
        "sort": 0,
        "type": "query"
      }
    ]
  },
  "time": {
    "from": "now-1h",
    "to": "now"
  },
  "timepicker": {},
  "timezone": "",
  "title": "Quickwit Indexers",
  "uid": "quickwit-indexers",
  "version": 2,
  "weekStart": ""
}


================================================
FILE: monitoring/grafana/dashboards/ingesters.json
================================================
{
  "annotations": {
    "list": [
      {
        "builtIn": 1,
        "datasource": {
          "type": "grafana",
          "uid": "-- Grafana --"
        },
        "enable": true,
        "hide": true,
        "iconColor": "rgba(0, 211, 255, 1)",
        "name": "Annotations & Alerts",
        "target": {
          "limit": 100,
          "matchAny": false,
          "tags": [],
          "type": "dashboard"
        },
        "type": "dashboard"
      }
    ]
  },
  "editable": true,
  "fiscalYearStartMonth": 0,
  "graphTooltip": 0,
  "links": [],
  "liveNow": false,
  "panels": [
    {
      "datasource": {
        "type": "prometheus",
        "uid": "${datasource}"
      },
      "fieldConfig": {
        "defaults": {
          "color": {
            "mode": "palette-classic"
          },
          "custom": {
            "axisBorderShow": false,
            "axisCenteredZero": false,
            "axisColorMode": "text",
            "axisLabel": "",
            "axisPlacement": "auto",
            "barAlignment": 0,
            "drawStyle": "line",
            "fillOpacity": 0,
            "gradientMode": "none",
            "hideFrom": {
              "legend": false,
              "tooltip": false,
              "viz": false
            },
            "insertNulls": false,
            "lineInterpolation": "linear",
            "lineWidth": 1,
            "pointSize": 5,
            "scaleDistribution": {
              "type": "linear"
            },
            "showPoints": "auto",
            "spanNulls": false,
            "stacking": {
              "group": "A",
              "mode": "none"
            },
            "thresholdsStyle": {
              "mode": "off"
            }
          },
          "mappings": [],
          "thresholds": {
            "mode": "absolute",
            "steps": [
              {
                "color": "green",
                "value": null
              },
              {
                "color": "red",
                "value": 80
              }
            ]
          }
        },
        "overrides": [
          {
            "__systemRef": "hideSeriesFrom",
            "matcher": {
              "id": "byNames",
              "options": {
                "mode": "exclude",
                "names": [
                  "{component=\"ingester\", instance=\"host.docker.internal:7280\", job=\"quickwit\", kind=\"server\", operation=\"truncate_shards\", status=\"success\"}"
                ],
                "prefix": "All except:",
                "readOnly": true
              }
            },
            "properties": [
              {
                "id": "custom.hideFrom",
                "value": {
                  "legend": false,
                  "tooltip": false,
                  "viz": true
                }
              }
            ]
          }
        ]
      },
      "gridPos": {
        "h": 8,
        "w": 12,
        "x": 0,
        "y": 0
      },
      "id": 2,
      "options": {
        "legend": {
          "calcs": [],
          "displayMode": "list",
          "placement": "bottom",
          "showLegend": true
        },
        "tooltip": {
          "mode": "single",
          "sort": "none"
        }
      },
      "targets": [
        {
          "datasource": {
            "type": "prometheus",
            "uid": "${datasource}"
          },
          "disableTextWrap": false,
          "editorMode": "code",
          "expr": "rate(quickwit_ingest_grpc_requests_total{kind=\"server\", instance=~\"$instance\"}[$__rate_interval])",
          "fullMetaSearch": false,
          "includeNullMetadata": true,
          "legendFormat": "__auto",
          "range": true,
          "refId": "A",
          "useBackend": false
        }
      ],
      "title": "gRPC server request rate",
      "type": "timeseries"
    },
    {
      "datasource": {
        "type": "prometheus",
        "uid": "${datasource}"
      },
      "fieldConfig": {
        "defaults": {
          "color": {
            "mode": "palette-classic"
          },
          "custom": {
            "axisBorderShow": false,
            "axisCenteredZero": false,
            "axisColorMode": "text",
            "axisLabel": "",
            "axisPlacement": "auto",
            "barAlignment": 0,
            "drawStyle": "line",
            "fillOpacity": 0,
            "gradientMode": "none",
            "hideFrom": {
              "legend": false,
              "tooltip": false,
              "viz": false
            },
            "insertNulls": false,
            "lineInterpolation": "linear",
            "lineWidth": 1,
            "pointSize": 5,
            "scaleDistribution": {
              "type": "linear"
            },
            "showPoints": "auto",
            "spanNulls": false,
            "stacking": {
              "group": "A",
              "mode": "none"
            },
            "thresholdsStyle": {
              "mode": "off"
            }
          },
          "mappings": [],
          "thresholds": {
            "mode": "absolute",
            "steps": [
              {
                "color": "green",
                "value": null
              },
              {
                "color": "red",
                "value": 80
              }
            ]
          }
        },
        "overrides": []
      },
      "gridPos": {
        "h": 8,
        "w": 12,
        "x": 12,
        "y": 0
      },
      "id": 10,
      "options": {
        "legend": {
          "calcs": [],
          "displayMode": "list",
          "placement": "bottom",
          "showLegend": true
        },
        "tooltip": {
          "mode": "single",
          "sort": "none"
        }
      },
      "targets": [
        {
          "datasource": {
            "type": "prometheus",
            "uid": "${datasource}"
          },
          "disableTextWrap": false,
          "editorMode": "code",
          "expr": "histogram_quantile(0.95, sum by(le, rpc) (rate(quickwit_ingest_grpc_request_duration_seconds_bucket{kind=\"server\", instance=~\"$instance\"}[$__rate_interval])))",
          "fullMetaSearch": false,
          "includeNullMetadata": true,
          "legendFormat": "__auto",
          "range": true,
          "refId": "A",
          "useBackend": false
        }
      ],
      "title": "gRPC server request latencies",
      "type": "timeseries"
    },
    {
      "datasource": {
        "type": "prometheus",
        "uid": "${datasource}"
      },
      "fieldConfig": {
        "defaults": {
          "color": {
            "mode": "palette-classic"
          },
          "custom": {
            "axisBorderShow": false,
            "axisCenteredZero": false,
            "axisColorMode": "text",
            "axisLabel": "",
            "axisPlacement": "auto",
            "barAlignment": 0,
            "drawStyle": "line",
            "fillOpacity": 0,
            "gradientMode": "none",
            "hideFrom": {
              "legend": false,
              "tooltip": false,
              "viz": false
            },
            "insertNulls": false,
            "lineInterpolation": "linear",
            "lineWidth": 1,
            "pointSize": 5,
            "scaleDistribution": {
              "type": "linear"
            },
            "showPoints": "auto",
            "spanNulls": false,
            "stacking": {
              "group": "A",
              "mode": "none"
            },
            "thresholdsStyle": {
              "mode": "off"
            }
          },
          "mappings": [],
          "thresholds": {
            "mode": "absolute",
            "steps": [
              {
                "color": "green",
                "value": null
              },
              {
                "color": "red",
                "value": 80
              }
            ]
          }
        },
        "overrides": []
      },
      "gridPos": {
        "h": 8,
        "w": 12,
        "x": 0,
        "y": 8
      },
      "id": 9,
      "options": {
        "legend": {
          "calcs": [],
          "displayMode": "list",
          "placement": "bottom",
          "showLegend": true
        },
        "tooltip": {
          "mode": "single",
          "sort": "none"
        }
      },
      "targets": [
        {
          "datasource": {
            "type": "prometheus",
            "uid": "${datasource}"
          },
          "disableTextWrap": false,
          "editorMode": "builder",
          "expr": "quickwit_ingest_grpc_requests_in_flight{kind=\"server\", instance=~\"$instance\"}",
          "fullMetaSearch": false,
          "includeNullMetadata": true,
          "legendFormat": "__auto",
          "range": true,
          "refId": "A",
          "useBackend": false
        }
      ],
      "title": "gRPC server in-flight requests",
      "type": "timeseries"
    },
    {
      "datasource": {
        "type": "prometheus",
        "uid": "${datasource}"
      },
      "fieldConfig": {
        "defaults": {
          "color": {
            "mode": "palette-classic"
          },
          "custom": {
            "axisBorderShow": false,
            "axisCenteredZero": false,
            "axisColorMode": "text",
            "axisLabel": "",
            "axisPlacement": "auto",
            "barAlignment": 0,
            "drawStyle": "line",
            "fillOpacity": 0,
            "gradientMode": "none",
            "hideFrom": {
              "legend": false,
              "tooltip": false,
              "viz": false
            },
            "insertNulls": false,
            "lineInterpolation": "linear",
            "lineWidth": 1,
            "pointSize": 5,
            "scaleDistribution": {
              "type": "linear"
            },
            "showPoints": "auto",
            "spanNulls": false,
            "stacking": {
              "group": "A",
              "mode": "none"
            },
            "thresholdsStyle": {
              "mode": "off"
            }
          },
          "mappings": [],
          "thresholds": {
            "mode": "absolute",
            "steps": [
              {
                "color": "green",
                "value": null
              },
              {
                "color": "red",
                "value": 80
              }
            ]
          }
        },
        "overrides": []
      },
      "gridPos": {
        "h": 8,
        "w": 12,
        "x": 12,
        "y": 8
      },
      "id": 8,
      "options": {
        "legend": {
          "calcs": [],
          "displayMode": "list",
          "placement": "bottom",
          "showLegend": true
        },
        "tooltip": {
          "mode": "single",
          "sort": "none"
        }
      },
      "targets": [
        {
          "datasource": {
            "type": "prometheus",
            "uid": "${datasource}"
          },
          "disableTextWrap": false,
          "editorMode": "builder",
          "expr": "sum(quickwit_ingest_shards{state=\"open\", instance=~\"$instance\"})",
          "fullMetaSearch": false,
          "includeNullMetadata": true,
          "legendFormat": "Open shards",
          "range": true,
          "refId": "A",
          "useBackend": false
        },
        {
          "datasource": {
            "type": "prometheus",
            "uid": "${datasource}"
          },
          "disableTextWrap": false,
          "editorMode": "builder",
          "expr": "sum(quickwit_ingest_shards{state=\"closed\", instance=~\"$instance\"})",
          "fullMetaSearch": false,
          "hide": false,
          "includeNullMetadata": true,
          "legendFormat": "Closed shards",
          "range": true,
          "refId": "B",
          "useBackend": false
        }
      ],
      "title": "Shard status",
      "type": "timeseries"
    },
    {
      "datasource": {
        "type": "prometheus",
        "uid": "${datasource}"
      },
      "fieldConfig": {
        "defaults": {
          "color": {
            "mode": "palette-classic"
          },
          "custom": {
            "axisBorderShow": false,
            "axisCenteredZero": false,
            "axisColorMode": "text",
            "axisLabel": "",
            "axisPlacement": "auto",
            "barAlignment": 0,
            "drawStyle": "line",
            "fillOpacity": 0,
            "gradientMode": "none",
            "hideFrom": {
              "legend": false,
              "tooltip": false,
              "viz": false
            },
            "insertNulls": false,
            "lineInterpolation": "linear",
            "lineWidth": 1,
            "pointSize": 5,
            "scaleDistribution": {
              "type": "linear"
            },
            "showPoints": "auto",
            "spanNulls": false,
            "stacking": {
              "group": "A",
              "mode": "none"
            },
            "thresholdsStyle": {
              "mode": "off"
            }
          },
          "mappings": [],
          "thresholds": {
            "mode": "absolute",
            "steps": [
              {
                "color": "green",
                "value": null
              },
              {
                "color": "red",
                "value": 80
              }
            ]
          },
          "unit": "bytes"
        },
        "overrides": []
      },
      "gridPos": {
        "h": 8,
        "w": 12,
        "x": 0,
        "y": 16
      },
      "id": 4,
      "options": {
        "legend": {
          "calcs": [],
          "displayMode": "list",
          "placement": "bottom",
          "showLegend": true
        },
        "tooltip": {
          "mode": "single",
          "sort": "none"
        }
      },
      "targets": [
        {
          "datasource": {
            "type": "prometheus",
            "uid": "${datasource}"
          },
          "disableTextWrap": false,
          "editorMode": "builder",
          "expr": "quickwit_ingest_wal_disk_used_bytes{instance=~\"$instance\"}",
          "fullMetaSearch": false,
          "includeNullMetadata": true,
          "legendFormat": "__auto",
          "range": true,
          "refId": "A",
          "useBackend": false
        },
        {
          "datasource": {
            "type": "prometheus",
            "uid": "${datasource}"
          },
          "disableTextWrap": false,
          "editorMode": "builder",
          "expr": "quickwit_ingest_wal_memory_used_bytes{instance=~\"$instance\"}",
          "fullMetaSearch": false,
          "hide": false,
          "includeNullMetadata": true,
          "legendFormat": "__auto",
          "range": true,
          "refId": "B",
          "useBackend": false
        }
      ],
      "title": "WAL usage",
      "type": "timeseries"
    }
  ],
  "refresh": "30s",
  "revision": 1,
  "schemaVersion": 39,
  "tags": [
    "quickwit"
  ],
  "templating": {
    "list": [
      {
        "current": {
          "selected": false,
          "text": "Prometheus",
          "value": "PBFA97CFB590B2093"
        },
        "hide": 0,
        "includeAll": false,
        "label": "Datasource",
        "multi": false,
        "name": "datasource",
        "options": [],
        "query": "prometheus",
        "refresh": 1,
        "regex": "",
        "skipUrlSync": false,
        "type": "datasource"
      },
      {
        "current": {
          "selected": true,
          "text": "All",
          "value": "$__all"
        },
        "datasource": {
          "type": "prometheus",
          "uid": "PBFA97CFB590B2093"
        },
        "definition": "label_values(quickwit_ingest_shards,instance)",
        "hide": 0,
        "includeAll": true,
        "label": "Instance",
        "multi": false,
        "name": "instance",
        "options": [],
        "query": {
          "qryType": 1,
          "query": "label_values(quickwit_ingest_shards,instance)",
          "refId": "PrometheusVariableQueryEditor-VariableQuery"
        },
        "refresh": 1,
        "regex": "",
        "skipUrlSync": false,
        "sort": 0,
        "type": "query"
      }
    ]
  },
  "time": {
    "from": "now-1h",
    "to": "now"
  },
  "timepicker": {},
  "timezone": "",
  "title": "Quickwit Ingesters",
  "uid": "DjSPsTvSz",
  "version": 1,
  "weekStart": ""
}


================================================
FILE: monitoring/grafana/dashboards/metastore.json
================================================
{
  "annotations": {
    "list": [
      {
        "builtIn": 1,
        "datasource": {
          "type": "grafana",
          "uid": "-- Grafana --"
        },
        "enable": true,
        "hide": true,
        "iconColor": "rgba(0, 211, 255, 1)",
        "name": "Annotations & Alerts",
        "target": {
          "limit": 100,
          "matchAny": false,
          "tags": [],
          "type": "dashboard"
        },
        "type": "dashboard"
      }
    ]
  },
  "editable": true,
  "fiscalYearStartMonth": 0,
  "graphTooltip": 0,
  "links": [],
  "liveNow": false,
  "panels": [
    {
      "datasource": {
        "type": "prometheus",
        "uid": "${datasource}"
      },
      "description": "",
      "fieldConfig": {
        "defaults": {
          "color": {
            "mode": "palette-classic"
          },
          "custom": {
            "axisBorderShow": false,
            "axisCenteredZero": false,
            "axisColorMode": "text",
            "axisLabel": "",
            "axisPlacement": "auto",
            "barAlignment": 0,
            "drawStyle": "line",
            "fillOpacity": 0,
            "gradientMode": "none",
            "hideFrom": {
              "legend": false,
              "tooltip": false,
              "viz": false
            },
            "insertNulls": false,
            "lineInterpolation": "linear",
            "lineWidth": 1,
            "pointSize": 5,
            "scaleDistribution": {
              "type": "linear"
            },
            "showPoints": "auto",
            "spanNulls": false,
            "stacking": {
              "group": "A",
              "mode": "none"
            },
            "thresholdsStyle": {
              "mode": "off"
            }
          },
          "mappings": [],
          "thresholds": {
            "mode": "absolute",
            "steps": [
              {
                "color": "green",
                "value": null
              },
              {
                "color": "red",
                "value": 80
              }
            ]
          }
        },
        "overrides": []
      },
      "gridPos": {
        "h": 13,
        "w": 12,
        "x": 0,
        "y": 0
      },
      "id": 2,
      "options": {
        "legend": {
          "calcs": [],
          "displayMode": "list",
          "placement": "bottom",
          "showLegend": true
        },
        "tooltip": {
          "mode": "single",
          "sort": "none"
        }
      },
      "targets": [
        {
          "datasource": {
            "type": "prometheus",
            "uid": "${datasource}"
          },
          "disableTextWrap": false,
          "editorMode": "builder",
          "expr": "sum by(rpc) (rate(quickwit_metastore_grpc_requests_total{kind=\"server\", instance=~\"$instance\"}[$__rate_interval]))",
          "fullMetaSearch": false,
          "includeNullMetadata": true,
          "legendFormat": "{{operation}}",
          "range": true,
          "refId": "A",
          "useBackend": false
        }
      ],
      "title": "Metastore requests rate",
      "type": "timeseries"
    },
    {
      "datasource": {
        "type": "prometheus",
        "uid": "${datasource}"
      },
      "description": "Duration in seconds",
      "fieldConfig": {
        "defaults": {
          "color": {
            "mode": "palette-classic"
          },
          "custom": {
            "axisBorderShow": false,
            "axisCenteredZero": false,
            "axisColorMode": "text",
            "axisLabel": "",
            "axisPlacement": "auto",
            "barAlignment": 0,
            "drawStyle": "line",
            "fillOpacity": 0,
            "gradientMode": "none",
            "hideFrom": {
              "legend": false,
              "tooltip": false,
              "viz": false
            },
            "insertNulls": false,
            "lineInterpolation": "linear",
            "lineWidth": 1,
            "pointSize": 5,
            "scaleDistribution": {
              "type": "linear"
            },
            "showPoints": "auto",
            "spanNulls": false,
            "stacking": {
              "group": "A",
              "mode": "none"
            },
            "thresholdsStyle": {
              "mode": "off"
            }
          },
          "mappings": [],
          "thresholds": {
            "mode": "absolute",
            "steps": [
              {
                "color": "green",
                "value": null
              },
              {
                "color": "red",
                "value": 80
              }
            ]
          }
        },
        "overrides": []
      },
      "gridPos": {
        "h": 13,
        "w": 12,
        "x": 12,
        "y": 0
      },
      "id": 3,
      "options": {
        "legend": {
          "calcs": [],
          "displayMode": "list",
          "placement": "bottom",
          "showLegend": true
        },
        "tooltip": {
          "mode": "single",
          "sort": "none"
        }
      },
      "targets": [
        {
          "datasource": {
            "type": "prometheus",
            "uid": "${datasource}"
          },
          "disableTextWrap": false,
          "editorMode": "builder",
          "expr": "histogram_quantile(0.95, sum by(le, rpc) (rate(quickwit_metastore_grpc_request_duration_seconds_bucket{kind=\"server\", instance=~\"$instance\"}[$__rate_interval])))",
          "fullMetaSearch": false,
          "includeNullMetadata": true,
          "legendFormat": "{{rpc}}",
          "range": true,
          "refId": "A",
          "useBackend": false
        }
      ],
      "title": "Metastore requests duration (p95)",
      "type": "timeseries"
    },
    {
      "datasource": {
        "type": "prometheus",
        "uid": "${datasource}"
      },
      "description": "",
      "fieldConfig": {
        "defaults": {
          "color": {
            "mode": "palette-classic"
          },
          "custom": {
            "axisBorderShow": false,
            "axisCenteredZero": false,
            "axisColorMode": "text",
            "axisLabel": "",
            "axisPlacement": "auto",
            "barAlignment": 0,
            "drawStyle": "line",
            "fillOpacity": 0,
            "gradientMode": "none",
            "hideFrom": {
              "legend": false,
              "tooltip": false,
              "viz": false
            },
            "insertNulls": false,
            "lineInterpolation": "linear",
            "lineWidth": 1,
            "pointSize": 5,
            "scaleDistribution": {
              "type": "linear"
            },
            "showPoints": "auto",
            "spanNulls": false,
            "stacking": {
              "group": "A",
              "mode": "none"
            },
            "thresholdsStyle": {
              "mode": "off"
            }
          },
          "mappings": [],
          "thresholds": {
            "mode": "absolute",
            "steps": [
              {
                "color": "green",
                "value": null
              },
              {
                "color": "red",
                "value": 80
              }
            ]
          }
        },
        "overrides": []
      },
      "gridPos": {
        "h": 13,
        "w": 12,
        "x": 0,
        "y": 13
      },
      "id": 4,
      "options": {
        "legend": {
          "calcs": [],
          "displayMode": "list",
          "placement": "bottom",
          "showLegend": true
        },
        "tooltip": {
          "mode": "single",
          "sort": "none"
        }
      },
      "targets": [
        {
          "datasource": {
            "type": "prometheus",
            "uid": "${datasource}"
          },
          "disableTextWrap": false,
          "editorMode": "builder",
          "expr": "sum by(rpc) (rate(quickwit_metastore_grpc_requests_total{kind=\"server\", status=\"error\", instance=~\"$instance\"}[$__rate_interval]))",
          "fullMetaSearch": false,
          "includeNullMetadata": true,
          "legendFormat": "{{rpc}}",
          "range": true,
          "refId": "A",
          "useBackend": false
        }
      ],
      "title": "Metastore requests error rate",
      "type": "timeseries"
    }
  ],
  "refresh": "30s",
  "schemaVersion": 39,
  "tags": [
    "quickwit",
    "metastore"
  ],
  "templating": {
    "list": [
      {
        "current": {
          "selected": true,
          "text": "Prometheus",
          "value": "PBFA97CFB590B2093"
        },
        "hide": 0,
        "includeAll": false,
        "label": "Datasource",
        "multi": false,
        "name": "datasource",
        "options": [],
        "query": "prometheus",
        "queryValue": "",
        "refresh": 1,
        "regex": "",
        "skipUrlSync": false,
        "type": "datasource"
      },
      {
        "allValue": "",
        "current": {
          "selected": true,
          "text": "All",
          "value": "$__all"
        },
        "definition": "label_values(quickwit_metastore_grpc_requests_total{kind=\"server\"},instance)",
        "hide": 0,
        "includeAll": true,
        "label": "Instance",
        "multi": false,
        "name": "instance",
        "options": [],
        "query": {
          "qryType": 1,
          "query": "label_values(quickwit_metastore_grpc_requests_total{kind=\"server\"},instance)",
          "refId": "PrometheusVariableQueryEditor-VariableQuery"
        },
        "refresh": 1,
        "regex": "",
        "skipUrlSync": false,
        "sort": 0,
        "type": "query"
      }
    ]
  },
  "time": {
    "from": "now-1h",
    "to": "now"
  },
  "timepicker": {},
  "timezone": "",
  "title": "Quickwit Metastore",
  "uid": "quickwit-metastore",
  "version": 1,
  "weekStart": ""
}


================================================
FILE: monitoring/grafana/dashboards/searchers.json
================================================
{
  "annotations": {
    "list": [
      {
        "builtIn": 1,
        "datasource": {
          "type": "grafana",
          "uid": "-- Grafana --"
        },
        "enable": true,
        "hide": true,
        "iconColor": "rgba(0, 211, 255, 1)",
        "name": "Annotations & Alerts",
        "type": "dashboard"
      }
    ]
  },
  "editable": true,
  "fiscalYearStartMonth": 0,
  "graphTooltip": 0,
  "id": 2,
  "links": [],
  "liveNow": false,
  "panels": [
    {
      "datasource": {
        "type": "prometheus",
        "uid": "${datasource}"
      },
      "fieldConfig": {
        "defaults": {
          "color": {
            "mode": "palette-classic"
          },
          "custom": {
            "axisBorderShow": false,
            "axisCenteredZero": false,
            "axisColorMode": "text",
            "axisLabel": "",
            "axisPlacement": "auto",
            "barAlignment": 0,
            "drawStyle": "line",
            "fillOpacity": 0,
            "gradientMode": "none",
            "hideFrom": {
              "legend": false,
              "tooltip": false,
              "viz": false
            },
            "insertNulls": false,
            "lineInterpolation": "linear",
            "lineWidth": 1,
            "pointSize": 5,
            "scaleDistribution": {
              "type": "linear"
            },
            "showPoints": "auto",
            "spanNulls": false,
            "stacking": {
              "group": "A",
              "mode": "none"
            },
            "thresholdsStyle": {
              "mode": "off"
            }
          },
          "mappings": [],
          "thresholds": {
            "mode": "absolute",
            "steps": [
              {
                "color": "green",
                "value": null
              },
              {
                "color": "red",
                "value": 80
              }
            ]
          }
        },
        "overrides": []
      },
      "gridPos": {
        "h": 8,
        "w": 12,
        "x": 0,
        "y": 0
      },
      "id": 1,
      "options": {
        "legend": {
          "calcs": [],
          "displayMode": "list",
          "placement": "bottom",
          "showLegend": true
        },
        "tooltip": {
          "mode": "single",
          "sort": "none"
        }
      },
      "targets": [
        {
          "datasource": {
            "type": "prometheus",
            "uid": "${datasource}"
          },
          "disableTextWrap": false,
          "editorMode": "builder",
          "expr": "quickwit_search_leaf_searches_splits_total{instance=~\"$instance\"}",
          "fullMetaSearch": false,
          "includeNullMetadata": true,
          "instant": false,
          "legendFormat": "{{instance}}",
          "range": true,
          "refId": "A",
          "useBackend": false
        }
      ],
      "title": "Leaf search splits",
      "type": "timeseries"
    },
    {
      "datasource": {
        "type": "prometheus",
        "uid": "${datasource}"
      },
      "fieldConfig": {
        "defaults": {
          "color": {
            "mode": "palette-classic"
          },
          "custom": {
            "axisBorderShow": false,
            "axisCenteredZero": false,
            "axisColorMode": "text",
            "axisLabel": "",
            "axisPlacement": "auto",
            "barAlignment": 0,
            "drawStyle": "line",
            "fillOpacity": 0,
            "gradientMode": "none",
            "hideFrom": {
              "legend": false,
              "tooltip": false,
              "viz": false
            },
            "insertNulls": false,
            "lineInterpolation": "linear",
            "lineWidth": 1,
            "pointSize": 5,
            "scaleDistribution": {
              "type": "linear"
            },
            "showPoints": "auto",
            "spanNulls": false,
            "stacking": {
              "group": "A",
              "mode": "none"
            },
            "thresholdsStyle": {
              "mode": "off"
            }
          },
          "mappings": [],
          "thresholds": {
            "mode": "absolute",
            "steps": [
              {
                "color": "green",
                "value": null
              },
              {
                "color": "red",
                "value": 80
              }
            ]
          },
          "unit": "decbytes"
        },
        "overrides": []
      },
      "gridPos": {
        "h": 8,
        "w": 12,
        "x": 12,
        "y": 0
      },
      "id": 4,
      "options": {
        "legend": {
          "calcs": [],
          "displayMode": "list",
          "placement": "bottom",
          "showLegend": true
        },
        "tooltip": {
          "mode": "single",
          "sort": "none"
        }
      },
      "targets": [
        {
          "datasource": {
            "type": "prometheus",
            "uid": "${datasource}"
          },
          "disableTextWrap": false,
          "editorMode": "builder",
          "expr": "quickwit_memory_resident_bytes{instance=~\"$instance\"}",
          "fullMetaSearch": false,
          "hide": false,
          "includeNullMetadata": true,
          "instant": false,
          "legendFormat": "{{instance}}",
          "range": true,
          "refId": "B",
          "useBackend": false
        }
      ],
      "title": "Memory usage (bytes)",
      "type": "timeseries"
    },
    {
      "datasource": {
        "type": "prometheus",
        "uid": "${datasource}"
      },
      "fieldConfig": {
        "defaults": {
          "color": {
            "mode": "palette-classic"
          },
          "custom": {
            "axisBorderShow": false,
            "axisCenteredZero": false,
            "axisColorMode": "text",
            "axisLabel": "",
            "axisPlacement": "auto",
            "barAlignment": 0,
            "drawStyle": "line",
            "fillOpacity": 0,
            "gradientMode": "none",
            "hideFrom": {
              "legend": false,
              "tooltip": false,
              "viz": false
            },
            "insertNulls": false,
            "lineInterpolation": "linear",
            "lineWidth": 1,
            "pointSize": 5,
            "scaleDistribution": {
              "type": "linear"
            },
            "showPoints": "auto",
            "spanNulls": false,
            "stacking": {
              "group": "A",
              "mode": "none"
            },
            "thresholdsStyle": {
              "mode": "off"
            }
          },
          "mappings": [],
          "thresholds": {
            "mode": "absolute",
            "steps": [
              {
                "color": "green",
                "value": null
              },
              {
                "color": "red",
                "value": 80
              }
            ]
          }
        },
        "overrides": []
      },
      "gridPos": {
        "h": 8,
        "w": 12,
        "x": 0,
        "y": 8
      },
      "id": 2,
      "options": {
        "legend": {
          "calcs": [],
          "displayMode": "list",
          "placement": "bottom",
          "showLegend": true
        },
        "tooltip": {
          "mode": "single",
          "sort": "none"
        }
      },
      "targets": [
        {
          "datasource": {
            "type": "prometheus",
            "uid": "${datasource}"
          },
          "disableTextWrap": false,
          "editorMode": "builder",
          "expr": "rate(quickwit_storage_object_storage_gets_total{instance=~\"$instance\"}[$__rate_interval])",
          "fullMetaSearch": false,
          "includeNullMetadata": false,
          "instant": false,
          "legendFormat": "Total",
          "range": true,
          "refId": "A",
          "useBackend": false
        }
      ],
      "title": "Number of GET requests",
      "type": "timeseries"
    },
    {
      "datasource": {
        "type": "prometheus",
        "uid": "${datasource}"
      },
      "fieldConfig": {
        "defaults": {
          "color": {
            "mode": "palette-classic"
          },
          "custom": {
            "axisBorderShow": false,
            "axisCenteredZero": false,
            "axisColorMode": "text",
            "axisLabel": "",
            "axisPlacement": "auto",
            "barAlignment": 0,
            "drawStyle": "line",
            "fillOpacity": 0,
            "gradientMode": "none",
            "hideFrom": {
              "legend": false,
              "tooltip": false,
              "viz": false
            },
            "insertNulls": false,
            "lineInterpolation": "linear",
            "lineWidth": 1,
            "pointSize": 5,
            "scaleDistribution": {
              "type": "linear"
            },
            "showPoints": "auto",
            "spanNulls": false,
            "stacking": {
              "group": "A",
              "mode": "none"
            },
            "thresholdsStyle": {
              "mode": "off"
            }
          },
          "mappings": [],
          "thresholds": {
            "mode": "absolute",
            "steps": [
              {
                "color": "green",
                "value": null
              },
              {
                "color": "red",
                "value": 80
              }
            ]
          },
          "unit": "decbytes"
        },
        "overrides": []
      },
      "gridPos": {
        "h": 8,
        "w": 12,
        "x": 12,
        "y": 8
      },
      "id": 22,
      "options": {
        "legend": {
          "calcs": [],
          "displayMode": "list",
          "placement": "bottom",
          "showLegend": true
        },
        "tooltip": {
          "mode": "single",
          "sort": "none"
        }
      },
      "targets": [
        {
          "datasource": {
            "type": "prometheus",
            "uid": "${datasource}"
          },
          "disableTextWrap": false,
          "editorMode": "builder",
          "expr": "quickwit_storage_object_storage_download_num_bytes{instance=~\"$instance\"}",
          "fullMetaSearch": false,
          "includeNullMetadata": true,
          "instant": false,
          "legendFormat": "Downloaded bytes",
          "range": true,
          "refId": "A",
          "useBackend": false
        }
      ],
      "title": "Size of GET requests (bytes)",
      "type": "timeseries"
    },
    {
      "datasource": {
        "type": "prometheus",
        "uid": "${datasource}"
      },
      "fieldConfig": {
        "defaults": {
          "color": {
            "mode": "palette-classic"
          },
          "custom": {
            "axisBorderShow": false,
            "axisCenteredZero": false,
            "axisColorMode": "text",
            "axisLabel": "",
            "axisPlacement": "auto",
            "barAlignment": 0,
            "drawStyle": "line",
            "fillOpacity": 0,
            "gradientMode": "none",
            "hideFrom": {
              "legend": false,
              "tooltip": false,
              "viz": false
            },
            "insertNulls": false,
            "lineInterpolation": "linear",
            "lineWidth": 1,
            "pointSize": 5,
            "scaleDistribution": {
              "type": "linear"
            },
            "showPoints": "auto",
            "spanNulls": false,
            "stacking": {
              "group": "A",
              "mode": "none"
            },
            "thresholdsStyle": {
              "mode": "off"
            }
          },
          "mappings": [],
          "thresholds": {
            "mode": "absolute",
            "steps": [
              {
                "color": "green",
                "value": null
              },
              {
                "color": "red",
                "value": 80
              }
            ]
          }
        },
        "overrides": []
      },
      "gridPos": {
        "h": 8,
        "w": 12,
        "x": 0,
        "y": 16
      },
      "id": 9,
      "options": {
        "legend": {
          "calcs": [],
          "displayMode": "list",
          "placement": "bottom",
          "showLegend": true
        },
        "tooltip": {
          "mode": "single",
          "sort": "none"
        }
      },
      "targets": [
        {
          "datasource": {
            "type": "prometheus",
            "uid": "${datasource}"
          },
          "disableTextWrap": false,
          "editorMode": "builder",
          "expr": "rate(quickwit_cache_cache_hits_total{instance=~\"$instance\"}[$__rate_interval])",
          "fullMetaSearch": false,
          "includeNullMetadata": true,
          "instant": false,
          "legendFormat": "{{component_name}}",
          "range": true,
          "refId": "A",
          "useBackend": false
        }
      ],
      "title": "Cache hits",
      "type": "timeseries"
    },
    {
      "datasource": {
        "type": "prometheus",
        "uid": "${datasource}"
      },
      "fieldConfig": {
        "defaults": {
          "color": {
            "mode": "palette-classic"
          },
          "custom": {
            "axisBorderShow": false,
            "axisCenteredZero": false,
            "axisColorMode": "text",
            "axisLabel": "",
            "axisPlacement": "auto",
            "barAlignment": 0,
            "drawStyle": "line",
            "fillOpacity": 0,
            "gradientMode": "none",
            "hideFrom": {
              "legend": false,
              "tooltip": false,
              "viz": false
            },
            "insertNulls": false,
            "lineInterpolation": "linear",
            "lineWidth": 1,
            "pointSize": 5,
            "scaleDistribution": {
              "type": "linear"
            },
            "showPoints": "auto",
            "spanNulls": false,
            "stacking": {
              "group": "A",
              "mode": "none"
            },
            "thresholdsStyle": {
              "mode": "off"
            }
          },
          "mappings": [],
          "thresholds": {
            "mode": "absolute",
            "steps": [
              {
                "color": "green",
                "value": null
              },
              {
                "color": "red",
                "value": 80
              }
            ]
          }
        },
        "overrides": []
      },
      "gridPos": {
        "h": 8,
        "w": 12,
        "x": 12,
        "y": 16
      },
      "id": 23,
      "options": {
        "legend": {
          "calcs": [],
          "displayMode": "list",
          "placement": "bottom",
          "showLegend": true
        },
        "tooltip": {
          "mode": "single",
          "sort": "none"
        }
      },
      "targets": [
        {
          "datasource": {
            "type": "prometheus",
            "uid": "${datasource}"
          },
          "disableTextWrap": false,
          "editorMode": "builder",
          "expr": "rate(quickwit_cache_cache_misses_total{instance=~\"$instance\"}[$__rate_interval])",
          "fullMetaSearch": false,
          "includeNullMetadata": true,
          "instant": false,
          "legendFormat": "{{component_name}}",
          "range": true,
          "refId": "A",
          "useBackend": false
        }
      ],
      "title": "Cache misses",
      "type": "timeseries"
    },
    {
      "datasource": {
        "type": "prometheus",
        "uid": "${datasource}"
      },
      "fieldConfig": {
        "defaults": {
          "color": {
            "mode": "palette-classic"
          },
          "custom": {
            "axisBorderShow": false,
            "axisCenteredZero": false,
            "axisColorMode": "text",
            "axisLabel": "",
            "axisPlacement": "auto",
            "barAlignment": 0,
            "drawStyle": "line",
            "fillOpacity": 0,
            "gradientMode": "none",
            "hideFrom": {
              "legend": false,
              "tooltip": false,
              "viz": false
            },
            "insertNulls": false,
            "lineInterpolation": "linear",
            "lineWidth": 1,
            "pointSize": 5,
            "scaleDistribution": {
              "type": "linear"
            },
            "showPoints": "auto",
            "spanNulls": false,
            "stacking": {
              "group": "A",
              "mode": "none"
            },
            "thresholdsStyle": {
              "mode": "off"
            }
          },
          "mappings": [],
          "thresholds": {
            "mode": "absolute",
            "steps": [
              {
                "color": "green",
                "value": null
              },
              {
                "color": "red",
                "value": 80
              }
            ]
          },
          "unit": "none"
        },
        "overrides": []
      },
      "gridPos": {
        "h": 8,
        "w": 12,
        "x": 0,
        "y": 24
      },
      "id": 24,
      "options": {
        "legend": {
          "calcs": [],
          "displayMode": "list",
          "placement": "bottom",
          "showLegend": true
        },
        "tooltip": {
          "mode": "single",
          "sort": "none"
        }
      },
      "targets": [
        {
          "datasource": {
            "type": "prometheus",
            "uid": "${datasource}"
          },
          "disableTextWrap": false,
          "editorMode": "builder",
          "expr": "quickwit_cache_in_cache_count{instance=~\"$instance\"}",
          "fullMetaSearch": false,
          "includeNullMetadata": true,
          "instant": false,
          "legendFormat": "Split footer",
          "range": true,
          "refId": "A",
          "useBackend": false
        }
      ],
      "title": "Number of cached objects",
      "type": "timeseries"
    },
    {
      "datasource": {
        "type": "prometheus",
        "uid": "${datasource}"
      },
      "fieldConfig": {
        "defaults": {
          "color": {
            "mode": "palette-classic"
          },
          "custom": {
            "axisBorderShow": false,
            "axisCenteredZero": false,
            "axisColorMode": "text",
            "axisLabel": "",
            "axisPlacement": "auto",
            "barAlignment": 0,
            "drawStyle": "line",
            "fillOpacity": 0,
            "gradientMode": "none",
            "hideFrom": {
              "legend": false,
              "tooltip": false,
              "viz": false
            },
            "insertNulls": false,
            "lineInterpolation": "linear",
            "lineWidth": 1,
            "pointSize": 5,
            "scaleDistribution": {
              "type": "linear"
            },
            "showPoints": "auto",
            "spanNulls": false,
            "stacking": {
              "group": "A",
              "mode": "none"
            },
            "thresholdsStyle": {
              "mode": "off"
            }
          },
          "mappings": [],
          "thresholds": {
            "mode": "absolute",
            "steps": [
              {
                "color": "green",
                "value": null
              },
              {
                "color": "red",
                "value": 80
              }
            ]
          },
          "unit": "decbytes"
        },
        "overrides": []
      },
      "gridPos": {
        "h": 8,
        "w": 12,
        "x": 12,
        "y": 24
      },
      "id": 11,
      "options": {
        "legend": {
          "calcs": [],
          "displayMode": "list",
          "placement": "bottom",
          "showLegend": true
        },
        "tooltip": {
          "mode": "single",
          "sort": "none"
        }
      },
      "targets": [
        {
          "datasource": {
            "type": "prometheus",
            "uid": "${datasource}"
          },
          "disableTextWrap": false,
          "editorMode": "code",
          "expr": "quickwit_cache_in_cache_num_bytes{instance=~\"$instance\"}",
          "fullMetaSearch": false,
          "includeNullMetadata": true,
          "instant": false,
          "legendFormat": "Split footer",
          "range": true,
          "refId": "A",
          "useBackend": false
        }
      ],
      "title": "Size of cached objects (bytes)",
      "type": "timeseries"
    }
  ],
  "refresh": "30s",
  "schemaVersion": 39,
  "tags": [
    "quickwit",
    "searcher"
  ],
  "templating": {
    "list": [
      {
        "current": {
          "selected": false,
          "text": "Prometheus",
          "value": "PBFA97CFB590B2093"
        },
        "hide": 0,
        "includeAll": false,
        "label": "Datasource",
        "multi": false,
        "name": "datasource",
        "options": [],
        "query": "prometheus",
        "queryValue": "",
        "refresh": 1,
        "regex": "",
        "skipUrlSync": false,
        "type": "datasource"
      },
      {
        "current": {
          "selected": false,
          "text": "All",
          "value": "$__all"
        },
        "datasource": {
          "type": "prometheus",
          "uid": "${datasource}"
        },
        "definition": "label_values(quickwit_search_leaf_searches_splits_total,instance)",
        "hide": 0,
        "includeAll": true,
        "label": "Instance",
        "multi": false,
        "name": "instance",
        "options": [],
        "query": {
          "query": "label_values(quickwit_search_leaf_searches_splits_total,instance)",
          "refId": "StandardVariableQuery"
        },
        "refresh": 1,
        "regex": "",
        "skipUrlSync": false,
        "sort": 0,
        "type": "query"
      }

    ]
  },
  "time": {
    "from": "now-1h",
    "to": "now"
  },
  "timepicker": {},
  "timezone": "",
  "title": "Quickwit Searchers",
  "uid": "quickwit-searchers",
  "version": 1,
  "weekStart": ""
}


================================================
FILE: monitoring/grafana/provisioning/dashboards/default.yaml
================================================
apiVersion: 1

providers:
  - name: Default
    folder: Quickwit
    allowUiUpdates: true
    options:
      path: /var/lib/grafana/dashboards
      foldersFromFilesStructure: true


================================================
FILE: monitoring/grafana/provisioning/datasources/default.yaml
================================================
apiVersion: 1

datasources:
  - id: 1
    name: Prometheus
    type: prometheus
    typeName: Prometheus
    access: proxy
    url: http://prometheus:9090
    isDefault: true
    jsonData:
      httpMethod: POST
      timeInterval: 5s
    readOnly: false

  - id: 2
    name: Jaeger
    type: jaeger
    typeName: Jaeger
    access: proxy
    url: http://jaeger:16686
    isDefault: false
    jsonData:
      httpMethod: POST
    readOnly: false


================================================
FILE: monitoring/otel-collector-config.yaml
================================================
receivers:
  jaeger:
    protocols:
      grpc:
      thrift_binary:
      thrift_compact:
      thrift_http:

  otlp:
    protocols:
      grpc:
      http:

processors:
  batch:

exporters:
  jaeger:
    endpoint: jaeger:14250
    tls:
      insecure: true

  kafka:
    brokers:
      - kafka-broker:29092

  otlp/qw:
    endpoint: host.docker.internal:7281
    tls:
      insecure: true

extensions:
  health_check:
  pprof:
  zpages:

service:
  extensions: [health_check, pprof, zpages]
  pipelines:
    traces:
      receivers: [jaeger, otlp]
      processors: [batch]
      exporters: [jaeger, kafka, otlp/qw]
    # metrics:
    #   receivers: [otlp]
    #   processors: [batch]
    #   exporters: [otlp]
    logs:
      receivers: [otlp]
      processors: [batch]
      exporters: [kafka, otlp/qw]


================================================
FILE: monitoring/prometheus.yaml
================================================
global:
  scrape_interval: 1s
  scrape_timeout: 1s

scrape_configs:
  - job_name: quickwit
    metrics_path: /metrics
    static_configs:
      - targets:
          - host.docker.internal:7280


================================================
FILE: quickwit/.cargo/config.toml
================================================
[build]
rustflags = ["--cfg", "tokio_unstable"]


================================================
FILE: quickwit/.cargo-dev/config.toml
================================================
# This configuration makes it possible to use mold
# as the linker for rustc.
#
# I recommended it for development as it really improves performance. 
# 
# To enable
# - install clang
# - install mold https://github.com/rui314/mold into /usr/local/bin/mold
# - add a symbolic link from .cargo -> .cargo-dev 
# via `ln -s .cargo-dev .cargo`.
#
# If there is an issue, reverting is as simple as deleting .cargo.

[target.x86_64-unknown-linux-gnu]
linker = "/usr/bin/clang"
rustflags = ["-C", "link-arg=-fuse-ld=/usr/local/bin/mold"]


================================================
FILE: quickwit/.config/nextest.toml
================================================
[profile.default]
slow-timeout = "10s"

[profile.ci]
# Print out output for failing tests as soon as they fail, and also at the end
# of the run (for easy scrollability).
failure-output = "immediate-final"
# Do not cancel the test run on the first failure.
fail-fast = false

================================================
FILE: quickwit/.license_header.txt
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.


================================================
FILE: quickwit/CLAUDE.md
================================================
## Build & Test Commands

### Formatting & Linting
- **`make fmt`** — Format and validate code (requires nightly toolchain: `rustup toolchain install nightly`):
  1. Runs `cargo +nightly fmt`
  2. Checks license headers on `.rs`, `.ts`, `.proto` files
  3. Enforces log format policy: no trailing punctuation, no uppercase first character in log and error messages
- **`make fix`** — Runs clippy with `--fix`, then `make fmt`, then `make unused-deps`
- **`make unused-deps`** — Detects unused dependencies via `cargo-machete`

Log messages (`info!`, `warn!`, `error!`, `debug!`) must:
- Start with a **lowercase** letter
- Have **no trailing punctuation**

### Testing
- **Single crate test**: `cargo nextest run -p quickwit-search my_test_name`
- **Single test**: `cargo test -p quickwit-common my_test_name`
- **`make test-all`** — Starts Docker services (LocalStack S3, PostgreSQL, Pub/Sub emulator) and runs the full test suite with `cargo nextest run --all-features --retries 5`
- **`make test-failpoints`** — Runs failpoint tests only: `cargo nextest run --test failpoints --features fail/failpoints`
- Docker services: `make docker-compose-up` / `make docker-compose-down` (subset: `DOCKER_SERVICES=kafka,postgres`)

### Building
- **`make doc`** — Generates docs with `cargo doc --all-features` (warnings as errors)
- Rust toolchain: **1.93**

## Code Conventions

### Clippy Disallowed Methods
These methods are banned (see `clippy.toml`):
- `Path::exists` — (use try_exists)
- `Option::is_some_and`, `Option::is_none_or`, `Option::xor`
- `Option::map_or`, `Option::map_or_else` — use `.map(..).unwrap_or(..)` or `let Some(..) else {..}` instead

### Formatting Shortcut
Use `/fmt` to automatically run format checks.

## Architecture Overview

Quickwit is a cloud-native distributed search engine for observability data (logs, traces). It's organized as a ~38-crate Rust workspace.

### Key Layers

**Protocol & Types** — `quickwit-proto` defines all gRPC service contracts and message types via protobuf. Service traits are auto-generated.

**Actor System** — `quickwit-actors` is a custom lightweight actor framework. The indexing pipeline is fully actor-based:
```
Source → DocProcessor → Indexer → IndexSerializer → Packager → Uploader → Sequencer → Publisher
```
A parallel merge pipeline runs alongside.

**Search** — `quickwit-search` implements a root-leaf pattern: root servers parse queries and coordinate, leaf servers search their assigned splits in parallel, leaf results are merged at root.

**Storage** — `quickwit-storage` abstracts cloud storage (S3, Azure, GCS, local file, RAM) behind a `Storage` trait.

**Metastore** — `quickwit-metastore` manages index metadata with file-backed (dev) and PostgreSQL (production) backends.

**Cluster** — `quickwit-cluster` uses Chitchat gossip protocol for membership. `quickwit-control-plane` handles indexing task scheduling and placement.

**API Surface** — `quickwit-serve` hosts both REST and gRPC endpoints over the same service traits, plus serves the embedded React UI.

### Core Crates
| Crate | Purpose |
|-------|---------|
| `quickwit-cli` | CLI entry point and binary |
| `quickwit-serve` | REST/gRPC server |
| `quickwit-search` | Distributed search orchestration |
| `quickwit-indexing` | Actor-based indexing pipeline |
| `quickwit-ingest` | Distributed ingestion with replication |
| `quickwit-metastore` | Index metadata storage |
| `quickwit-storage` | Multi-cloud storage abstraction |
| `quickwit-config` | Configuration parsing/validation |
| `quickwit-doc-mapper` | Index schema and document mapping |
| `quickwit-query` | Query DSL parsing (ES-compatible) |
| `quickwit-cluster` | Cluster membership (Chitchat) |
| `quickwit-control-plane` | Indexing task scheduling |
| `quickwit-actors` | Actor framework |
| `quickwit-proto` | Protobuf definitions and gRPC traits |
| `quickwit-common` | Shared utilities and metrics |
| `quickwit-lambda-server` | AWS Lambda leaf search handler |
| `quickwit-lambda-client` | Lambda invocation with auto-deployment |

quickwit-common contains shared utilities about metrics, rate limited logging, reading from environment variables, etc.
It also contains the `run_cpu_intensive` that should be use to run CPU-intensive tasks from tokio tasks.

When the client is unlikely to match on an error, you can rely on the crate level Error or anyhow::Error. If you need to introduce a new Error type, use thiserror.

### Design Patterns
- **Trait-based services**: `SearchService`, `MetastoreService`, etc. — enables mocking and multiple implementations
- **Feature gates**: Cloud backends (`azure`, `gcs`), message sources (`kafka`, `kinesis`, `pulsar`, `sqs`, `gcp-pubsub`), `postgres` metastore, `multilang` tokenizers
- **Metrics**: `once_cell::sync::Lazy` statics with `quickwit_common::metrics::*` factories

### Key Dependencies
- **Tantivy**: Search engine library (custom fork)
- **Tonic/Prost**: gRPC framework and protobuf
- **Tokio**: Async runtime
- **SQLx**: PostgreSQL metastore

# Quickwit Claude Guidelines

When adding a new dependency, update license by running `make update-licenses`.
Prefer referring to the crate in workspace. 
Make sure to keep features minimal.

In other words, prefer
zip = { workspace = true, default-features = false, features=["deflate"] }
to
zip = "2"

## Code Formatting
### Quick Fix

Use `/fmt` to automatically run format checks and see issues.

## Coding Style
- Avoid single-letter variable names except for indices (i, j, k)
- Document all "hidden contracts" (implicit assumptions, invariants, preconditions)
- Try to avoid deep nesting. In particular, prefer early return style
- Avoid abusing iterator chaining with complex constructs like `.transpose()`
- Write type names explicitly when it aids readability
- Use `with_capacity` to hint container capacity when size is known


================================================
FILE: quickwit/Cargo.toml
================================================
[workspace]
resolver = "2"
members = [
  "quickwit-actors",
  "quickwit-aws",
  "quickwit-cli",
  "quickwit-cluster",
  "quickwit-codegen",
  "quickwit-codegen/example",
  "quickwit-common",
  "quickwit-config",
  "quickwit-control-plane",
  "quickwit-datetime",
  "quickwit-directories",
  "quickwit-doc-mapper",
  "quickwit-index-management",
  "quickwit-indexing",
  "quickwit-ingest",
  "quickwit-integration-tests",
  "quickwit-jaeger",
  "quickwit-janitor",
  "quickwit-lambda-client",
  "quickwit-lambda-server",
  "quickwit-macros",
  "quickwit-metastore",

  # Disabling metastore-utils from the quickwit projects to ease build/deps.
  # We can reenable it when we need it.
  # "quickwit-metastore-utils",
  "quickwit-opentelemetry",
  "quickwit-proto",
  "quickwit-query",
  "quickwit-rest-client",
  "quickwit-search",
  "quickwit-serve",
  "quickwit-storage",
  "quickwit-telemetry",
]

# The following list excludes `quickwit-metastore-utils`
# from the default member to ease build/deps.
default-members = [
  "quickwit-actors",
  "quickwit-aws",
  "quickwit-cli",
  "quickwit-cluster",
  "quickwit-codegen",
  "quickwit-codegen/example",
  "quickwit-common",
  "quickwit-config",
  "quickwit-control-plane",
  "quickwit-datetime",
  "quickwit-directories",
  "quickwit-doc-mapper",
  "quickwit-index-management",
  "quickwit-indexing",
  "quickwit-ingest",
  "quickwit-integration-tests",
  "quickwit-jaeger",
  "quickwit-janitor",
  "quickwit-lambda-client",
  "quickwit-lambda-server",
  "quickwit-macros",
  "quickwit-metastore",
  "quickwit-opentelemetry",
  "quickwit-proto",
  "quickwit-query",
  "quickwit-rest-client",
  "quickwit-search",
  "quickwit-serve",
  "quickwit-storage",
  "quickwit-telemetry",
]

[workspace.package]
version = "0.8.0"
edition = "2024"
homepage = "https://quickwit.io/"
documentation = "https://quickwit.io/docs/"
repository = "https://github.com/quickwit-oss/quickwit"
authors = ["Quickwit, Inc. <hello@quickwit.io>"]
license = "Apache-2.0"

[workspace.dependencies]
anyhow = "1"
arc-swap = "1.8"
assert-json-diff = "2"
async-compression = { version = "0.4", features = ["tokio", "gzip"] }
async-speed-limit = "0.4"
async-trait = "0.1"
backtrace = "0.3"
base64 = "0.22"
binggan = { version = "0.15" }
bitpacking = "0.9.3"
bytes = { version = "1", features = ["serde"] }
bytesize = { version = "2.3.1", features = ["serde"] }
bytestring = "1.5"
chitchat = "0.10.0"
chrono = { version = "0.4", default-features = false, features = [
  "clock",
  "std",
] }
clap = { version = "4.5", features = ["env", "string"] }
coarsetime = "0.1"
colored = "3.0"
console-subscriber = "0.5"
criterion = { version = "0.8", features = ["async_tokio"] }
cron = "0.15"
dialoguer = { version = "0.12", default-features = false }
dotenvy = "0.15"
dyn-clone = "1.0"
enum-iterator = "2.3"
env_logger = { version = "0.11", default-features = false, features = ["auto-color"] }
fail = "0.5"
flate2 = "1.1"
flume = "0.12"
fnv = "1"
futures = "0.3"
futures-util = { version = "0.3", default-features = false }
glob = "0.3"
# We can't directly update google-cloud-auth to 1.3 and google-cloud-gax to 1.4, because the latest version
# of google-cloud-pubsub is "0.30" which explicitly depends on: google-cloud-auth ^0.17 and google-cloud-gax ^0.19.
google-cloud-auth = "0.17.2"
google-cloud-gax = "0.19.2"
google-cloud-googleapis = { version = "0.16", features = ["pubsub"] }
google-cloud-pubsub = "0.30"
governor = "0.10.4"
heck = "0.5"
hex = "0.4"
home = "0.5"
hostname = "0.4"
http = "1.4"
http-body = "1.0"
http-body-util = "0.1"
http-serde = "2.1"
humantime = "2.3"
hyper = { version = "1.8", features = ["client", "http1", "http2", "server"] }
hyper-rustls = "0.27"
hyper-util = { version = "0.1", default-features = false, features = [
  "client-legacy",
  "server-auto",
  "server-graceful",
  "service",
  "tokio",
] }
indexmap = { version = "2.12", features = ["serde"] }
indicatif = "0.18"
itertools = "0.14"
lambda_runtime = "0.13"
json_comments = "0.2"
libz-sys = "1.1"
lru = "0.16"
matches = "0.1"
md5 = "0.8"
mime_guess = "2.0"
mini-moka = "0.10.3"
mockall = "0.14"
mrecordlog = { git = "https://github.com/quickwit-oss/mrecordlog", rev = "306c0a7" }
new_string_template = "1.5"
nom = "8.0"
numfmt = "1.2"
once_cell = "1"
oneshot = "0.1"
openssl = { version = "0.10", default-features = false }
openssl-probe = "0.1"
opentelemetry = "0.31"
opentelemetry-appender-tracing = "0.31"
opentelemetry_sdk = { version = "0.31", features = ["rt-tokio"] }
opentelemetry-otlp = { version = "0.31", features = ["grpc-tonic"] }
ouroboros = "0.18"
percent-encoding = "2.3"
pin-project = "1.1"
pnet = { version = "0.35", features = ["std"] }
postcard = { version = "1.1", features = [
  "use-std",
], default-features = false }
pprof = { version = "0.15", features = ["flamegraph"] }
predicates = "3"
prettyplease = "0.2"
proc-macro2 = "1.0"
prometheus = { version = "0.14", default-features = false, features = ["process"] }
proptest = "1"
prost = { version = "0.14", default-features = false, features = [
  "derive",
] }
prost-build = "0.14"
prost-types = "0.14"
pulsar = { version = "6.6", default-features = false, features = [
  "auth-oauth2",
  "compression",
  "tokio-runtime",
] }
quick_cache = "0.6.18"
quote = "1.0"
rand = "0.9"
rand_distr = "0.5"
rayon = "1.11"
rdkafka = { version = "0.38", default-features = false, features = [
  "cmake-build",
  "libz",
  "ssl",
  "tokio",
  "zstd",
] }
regex = "1.12"
regex-syntax = "0.8"
reqwest = { version = "0.12", default-features = false, features = [
  "json",
  "rustls-tls",
] }
reqwest-middleware = "0.4"
reqwest-retry = "0.8"
rust-embed = "8.9"
rustc-hash = "2.1"
rustls = "0.23"
rustls-pemfile = "2.2"
sea-query = { version = "0.32" }
sea-query-binder = { version = "0.7", features = [
  "runtime-tokio-rustls",
  "sqlx-postgres",
] }
# ^1.0.184 due to serde-rs/serde#2538
serde = { version = "1.0.228", features = ["derive", "rc"] }
serde_json = "1.0"
serde_json_borrow = "0.9"
serde_qs = { version = "0.15" }
serde_with = "3.16"
serde_yaml = "0.9"
serial_test = { version = "3.2", features = ["file_locks"] }
sha2 = "0.10"
siphasher = "1.0"
smallvec = "1"
sqlx = { version = "0.8", features = [
  "migrate",
  "postgres",
  "runtime-tokio-rustls",
  "time",
] }
syn = { version = "2.0", features = ["extra-traits", "full", "parsing"] }
sync_wrapper = "1"
sysinfo = { version = "0.37", default-features = false, features = ["disk"] }
tabled = { version = "0.20", features = ["ansi"] }
tempfile = "3"
thiserror = "2"
thousands = "0.2"
tikv-jemalloc-ctl = { version = "0.6", features = ["stats"] }
tikv-jemallocator = "0.6"
time = { version = "0.3", features = ["std", "formatting", "macros"] }
tokio = { version = "1.48", features = ["full"] }
tokio-metrics = { version = "0.4", features = ["rt"] }
tokio-rustls = { version = "0.26", default-features = false }
tokio-stream = { version = "0.1", features = ["sync"] }
tokio-util = { version = "0.7", default-features = false, features = [
  "compat",
  "io-util",
] }
toml = "0.9"
tonic = { version = "0.14", features = [
  "_tls-any",
  "gzip",
  "tls-native-roots",
  "zstd",
] }
tonic-build = "0.14"
tonic-health = "0.14"
tonic-prost = "0.14"
tonic-prost-build = "0.14"
tonic-reflection = "0.14"
tower = { version = "0.5", features = [
  "balance",
  "buffer",
  "load",
  "retry",
  "util",
] }
# legacy version because of warp
tower-http = { version = "0.6", features = [
  "compression-gzip",
  "compression-zstd",
  "cors",
] }
tracing = "0.1"
tracing-opentelemetry = "0.32"
tracing-subscriber = { version = "0.3", features = [
  "env-filter",
  "json",
  "std",
  "time",
] }
ttl_cache = "0.5"
typetag = "0.2"
ulid = "1.2"
ureq = "3"
username = "0.2"
# We cannot upgrade to utoipa 5.0+ due to significant breaking changes:
# 1. The `OpenApi` struct structure changed (fields are private), breaking our manual merging logic in openapi.rs
# in `quickwit-serve`. This code is fundamentally incompatible with version 5.x.
utoipa = { version = "4.2", features = ["time", "ulid"] }
uuid = { version = "1.19", features = ["v4", "serde"] }
vrl = { version = "0.29", default-features = false, features = [
  "compiler",
  "diagnostic",
  "stdlib",
  "value",
] }
warp = { version = "0.4", features = ["server", "test"] }
wiremock = "0.6"
zstd = { version = "0.13", default-features = false }

aws-config = "1.8"
aws-credential-types = { version = "1.2", features = ["hardcoded-credentials"] }
aws-runtime = "1.5"
aws-sdk-kinesis = "1.97"
aws-sdk-s3 = "=1.62"
aws-sdk-lambda = "1"
aws-sdk-sqs = "1.91"
aws-smithy-async = "1.2"
aws-smithy-mocks = "0.2"
aws-smithy-http-client = { version = "1.1", features = ["default-client"] }
aws-smithy-runtime = "1.9"
aws-smithy-types = { version = "1.3", features = [
  "byte-stream-poll-next",
  "http-body-1-x",
] }
aws-types = "1.3"

azure_core = { version = "0.21", features = ["hmac_rust", "enable_reqwest_rustls"] }
azure_identity = { version = "0.21" }
azure_storage = { version = "0.21", default-features = false, features = [
  "enable_reqwest_rustls",
] }
azure_storage_blobs = { version = "0.21", default-features = false, features = [
  "enable_reqwest_rustls",
] }

opendal = { version = "0.55", default-features = false }
reqsign = { version = "0.18", default-features = false, features = ["google", "default-context"] }

quickwit-actors = { path = "quickwit-actors" }
quickwit-aws = { path = "quickwit-aws" }
quickwit-cli = { path = "quickwit-cli" }
quickwit-cluster = { path = "quickwit-cluster" }
quickwit-codegen = { path = "quickwit-codegen" }
quickwit-codegen-example = { path = "quickwit-codegen/example" }
quickwit-common = { path = "quickwit-common" }
quickwit-config = { path = "quickwit-config" }
quickwit-control-plane = { path = "quickwit-control-plane" }
quickwit-datetime = { path = "quickwit-datetime" }
quickwit-directories = { path = "quickwit-directories" }
quickwit-doc-mapper = { path = "quickwit-doc-mapper" }
quickwit-index-management = { path = "quickwit-index-management" }
quickwit-indexing = { path = "quickwit-indexing" }
quickwit-ingest = { path = "quickwit-ingest" }
quickwit-integration-tests = { path = "quickwit-integration-tests" }
quickwit-jaeger = { path = "quickwit-jaeger" }
quickwit-janitor = { path = "quickwit-janitor" }
quickwit-lambda-client = { path = "quickwit-lambda-client" }
quickwit-lambda-server = { path = "quickwit-lambda-server" }
quickwit-macros = { path = "quickwit-macros" }
quickwit-metastore = { path = "quickwit-metastore" }
quickwit-opentelemetry = { path = "quickwit-opentelemetry" }
quickwit-proto = { path = "quickwit-proto" }
quickwit-query = { path = "quickwit-query" }
quickwit-rest-client = { path = "quickwit-rest-client" }
quickwit-search = { path = "quickwit-search" }
quickwit-serve = { path = "quickwit-serve" }
quickwit-storage = { path = "quickwit-storage" }
quickwit-telemetry = { path = "quickwit-telemetry" }

tantivy = { git = "https://github.com/quickwit-oss/tantivy/", rev = "98ebbf9", default-features = false, features = [
  "lz4-compression",
  "mmap",
  "quickwit",
  "zstd-compression",
  "columnar-zstd-compression",
] }
tantivy-fst = "0.5"

# This is actually not used directly the goal is to fix the version
# used by reqwest.
encoding_rs = "=0.8.35"

[patch.crates-io]
sasl2-sys = { git = "https://github.com/quickwit-oss/rust-sasl/", rev = "085a4c7" }

## this patched version of tracing helps better understand what happens inside futures (when are
## they polled, how long does poll take...)
#tracing = { git = "https://github.com/trinity-1686a/tracing.git", rev = "6806cac3" }
#tracing-attributes = { git = "https://github.com/trinity-1686a/tracing.git", rev = "6806cac3" }
#tracing-core = { git = "https://github.com/trinity-1686a/tracing.git", rev = "6806cac3" }
#tracing-futures = { git = "https://github.com/trinity-1686a/tracing.git", rev = "6806cac3" }
#tracing-log = { git = "https://github.com/trinity-1686a/tracing.git", rev = "6806cac3" }
#tracing-opentelemetry = { git = "https://github.com/trinity-1686a/tracing.git", rev = "6806cac3" }
#tracing-subscriber = { git = "https://github.com/trinity-1686a/tracing.git", rev = "6806cac3" }

[profile.dev]
debug = false

[profile.release]
lto = "thin"


================================================
FILE: quickwit/Cross.toml
================================================
[build.env]
passthrough = [
    "QW_COMMIT_DATE",
    "QW_COMMIT_HASH",
    "QW_COMMIT_TAGS",
]

[target.x86_64-unknown-linux-gnu]
image = "quickwit/cross:x86_64-unknown-linux-gnu"

[target.x86_64-unknown-linux-musl]
image = "quickwit/cross:x86_64-unknown-linux-musl"

[target.aarch64-unknown-linux-gnu]
image = "quickwit/cross:aarch64-unknown-linux-gnu"

[target.aarch64-unknown-linux-gnu.env]
# Fix build for transitive dependency rdkafka -> rdkafka-sys -> sasl2-sys -> krb5-src
# Introduced by https://github.com/MaterializeInc/rust-krb5-src/pull/27
passthrough = [
    "krb5_cv_attr_constructor_destructor=yes",
    "ac_cv_func_regcomp=yes",
    "ac_cv_printf_positional=yes",
]

[target.aarch64-unknown-linux-musl]
image = "quickwit/cross:aarch64-unknown-linux-musl"


================================================
FILE: quickwit/Makefile
================================================
help:
	@grep '^[^\.#[:space:]].*:' Makefile

doc:
	@echo "Running cargo doc"
	@RUSTDOCFLAGS='-Dwarnings -Arustdoc::private_intra_doc_links' cargo doc --all-features

fmt:
	@echo "Formatting Rust files"
	@(rustup toolchain list | ( ! grep -q nightly && echo "Toolchain 'nightly' is not installed. Please install using 'rustup toolchain install nightly'.") ) || cargo +nightly fmt
	@echo "Checking license headers"
	@bash scripts/check_license_headers.sh
	@echo "Checking log format"
	@bash scripts/check_log_format.sh

dependency-licenses.html: Cargo.lock scripts/about.hbs scripts/about.toml
	@echo "Checking dependency licenses"
	@cargo about generate -c scripts/about.toml scripts/about.hbs -o dependency-licenses.html --workspace

fix:
	@echo "Running cargo clippy --fix"
	@cargo clippy --workspace --all-features --tests --fix --allow-dirty --allow-staged
	@$(MAKE) fmt
	@$(MAKE) unused-deps

unused-deps:
	@echo "Checking for unused dependencies"
	@(command -v cargo-machete >/dev/null || cargo --list | grep -q machete || (echo "cargo-machete is not installed. Please install using 'cargo install cargo-machete'." && exit 1))
	@cargo machete

# Usage:
# `make test-all` starts the Docker services and runs all the tests.
# `make -k test-all docker-compose-down`, tears down the Docker services after running all the tests.
test-all:
	AWS_ACCESS_KEY_ID=ignored \
	AWS_SECRET_ACCESS_KEY=ignored \
	AWS_REGION=us-east-1 \
	PUBSUB_EMULATOR_HOST=localhost:8681 \
	QW_S3_ENDPOINT=http://localhost:4566 \
	QW_S3_FORCE_PATH_STYLE_ACCESS=1 \
	QW_TEST_DATABASE_URL=postgres://quickwit-dev:quickwit-dev@localhost:5432/quickwit-metastore-dev \
	RUST_MIN_STACK=67108864 \
	cargo nextest run --all-features --retries 5
	cargo nextest run --test failpoints --features fail/failpoints

test-failpoints:
	cargo nextest run --test failpoints --features fail/failpoints

# TODO: to be replaced by https://github.com/quickwit-oss/quickwit/issues/237
TARGET ?= x86_64-unknown-linux-gnu
.PHONY: build
build: build-ui
	@echo "Building binary for target=${TARGET}"
	@which cross > /dev/null 2>&1 || (echo "Cross is not installed. Please install using 'cargo install cross'." && exit 1)
	@case "${TARGET}" in \
		*musl ) \
			cross build --release --features release-feature-set --target ${TARGET}; \
		;; \
		* ) \
			cross build --release --features release-feature-vendored-set --target ${TARGET}; \
		;; \
	esac

workspace-deps-tree:
	cargo tree --all-features --workspace -f "{p}" --prefix depth | cut -f 1 -d ' ' | python3 scripts/dep-tree.py

.PHONY: build-rustdoc
build-rustdoc:
	RUSTDOCFLAGS="-Dwarnings -Arustdoc::private_intra_doc_links" cargo doc --no-deps --all-features --document-private-items

.PHONY: build-ui
build-ui:
	NODE_ENV=production cd quickwit-ui && $(MAKE) install build

rm-postgres:
	rm -fr /tmp/quickwit/services/postgres

update-licenses:
	 dd-rust-license-tool --config license-tool.toml write
	 mv LICENSE-3rdparty.csv ../LICENSE-3rdparty.csv


================================================
FILE: quickwit/NOTICE
================================================
Datadog Quickwit
Copyright 2021-Present Datadog, Inc.
This product includes software developed at Datadog (<https://www.datadoghq.com/).>


================================================
FILE: quickwit/clippy.toml
================================================
disallowed-methods = [
    # This function is not sound because it does not return a Result
    "std::path::Path::exists",
    # These functions hurt readability (according to Paul)
    "std::option::Option::is_some_and",
    "std::option::Option::is_none_or",
    "std::option::Option::xor",
    # "std::option::Option::and_then",
    # .map(..).unwrap_or(..) or let Some(..) else {..}
    "std::option::Option::map_or",
    # .map(..).unwrap_or_else(..) or let Some(..) else {..}
    "std::option::Option::map_or_else",
]

ignore-interior-mutability = [
    "bytes::Bytes",
    "bytestring::ByteString",
    "quickwit_ingest::ShardInfo",
    "quickwit_ingest::ShardInfos",
    "quickwit_proto::types::ShardId",
]


================================================
FILE: quickwit/deny.toml
================================================
# This template contains all of the possible sections and their default values

# Note that all fields that take a lint level have these possible values:
# * deny - An error will be produced and the check will fail
# * warn - A warning will be produced, but the check will not fail
# * allow - No warning or error will be produced, though in some cases a note
# will be

# The values provided in this template are the default values that will be used
# when any section or field is not specified in your own configuration

[graph]
# If 1 or more target triples (and optionally, target_features) are specified,
# only the specified targets will be checked when running `cargo deny check`.
# This means, if a particular package is only ever used as a target specific
# dependency, such as, for example, the `nix` crate only being used via the
# `target_family = "unix"` configuration, that only having windows targets in
# this list would mean the nix crate, as well as any of its exclusive
# dependencies not shared by any other crates, would be ignored, as the target
# list here is effectively saying which targets you are building for.
targets = [
    # The triple can be any string, but only the target triples built in to
    # rustc (as of 1.40) can be checked against actual config expressions
    #{ triple = "x86_64-unknown-linux-musl" },
    # You can also specify which target_features you promise are enabled for a
    # particular target. target_features are currently not validated against
    # the actual valid features supported by the target architecture.
    #{ triple = "wasm32-unknown-unknown", features = ["atomics"] },
]

# This section is considered when running `cargo deny check advisories`
# More documentation for the advisories section can be found here:
# https://embarkstudios.github.io/cargo-deny/checks/advisories/cfg.html
[advisories]
version = 2
# The path where the advisory database is cloned/fetched into
db-path = "~/.cargo/advisory-db"
# The url(s) of the advisory databases to use
db-urls = ["https://github.com/rustsec/advisory-db"]
# A list of advisory IDs to ignore. Note that ignored advisories will still
# output a note when they are encountered.
ignore = [
    "RUSTSEC-2021-0153", # `encoding` is unmaintained, it's used in lindera
]

# This section is considered when running `cargo deny check licenses`
# More documentation for the licenses section can be found here:
# https://embarkstudios.github.io/cargo-deny/checks/licenses/cfg.html
[licenses]
version = 2
# List of explicitly allowed licenses
# See https://spdx.org/licenses/ for list of possible licenses
# [possible values: any SPDX 3.11 short identifier (+ optional exception)].
allow = [
    # "Apache-2.0 WITH LLVM-exception",
    "0BSD",
    "Apache-2.0",
    "BSD-2-Clause",
    "BSD-3-Clause",
    "CC0-1.0",
    "CDLA-Permissive-2.0",
    "ISC",
    "MIT",
    "MPL-2.0",
    "OpenSSL",
    "Unicode-3.0",
    "Unlicense",
    "Zlib",
    "zlib-acknowledgement",
]
# The confidence threshold for detecting a license from license text.
# The higher the value, the more closely the license text must be to the
# canonical license text of a valid SPDX license file.
# [possible values: any between 0.0 and 1.0].
confidence-threshold = 0.8
# Allow 1 or more licenses on a per-crate basis, so that particular licenses
# aren't accepted for every possible crate as with the normal allow list
exceptions = []

# Some crates don't have (easily) machine readable licensing information,
# adding a clarification entry for it allows you to manually specify the
# licensing information
[[licenses.clarify]]
# The name of the crate the clarification applies to
name = "ring"
# The optional version constraint for the crate
version = "*"
# The SPDX expression for the license requirements of the crate
expression = "OpenSSL"
# One or more files in the crate's source used as the "source of truth" for
# the license expression. If the contents match, the clarification will be used
# when running the license check, otherwise the clarification will be ignored
# and the crate will be checked normally, which may produce warnings or errors
# depending on the rest of your configuration
license-files = [
    # Each entry is a crate relative path, and the (opaque) hash of its contents
    { path = "LICENSE", hash = 0xbd0eed23 }
]

[licenses.private]
# If true, ignores workspace crates that aren't published, or are only
# published to private registries
ignore = false
# One or more private registries that you might publish crates to, if a crate
# is only published to private registries, and ignore is true, the crate will
# not have its license(s) checked
registries = [
    #"https://sekretz.com/registry
]

# This section is considered when running `cargo deny check bans`.
# More documentation about the 'bans' section can be found here:
# https://embarkstudios.github.io/cargo-deny/checks/bans/cfg.html
[bans]
# Lint level for when multiple versions of the same crate are detected
multiple-versions = "warn"
# Lint level for when a crate version requirement is `*`
wildcards = "allow"
# The graph highlighting used when creating dotgraphs for crates
# with multiple versions
# * lowest-version - The path to the lowest versioned duplicate is highlighted
# * simplest-path - The path to the version with the fewest edges is highlighted
# * all - Both lowest-version and simplest-path are used
highlight = "all"
# List of crates that are allowed. Use with care!
allow = [
    #{ name = "ansi_term", version = "=0.11.0" },
]
# List of crates to deny
deny = [
    # Each entry the name of a crate and a version range. If version is
    # not specified, all versions will be matched.
    #{ name = "ansi_term", version = "=0.11.0" },
    #
    # Wrapper crates can optionally be specified to allow the crate when it
    # is a direct dependency of the otherwise banned crate
    #{ name = "ansi_term", version = "=0.11.0", wrappers = [] },
]
# Certain crates/versions that will be skipped when doing duplicate detection.
skip = [
    #{ name = "ansi_term", version = "=0.11.0" },
]
# Similarly to `skip` allows you to skip certain crates during duplicate
# detection. Unlike skip, it also includes the entire tree of transitive
# dependencies starting at the specified crate, up to a certain depth, which is
# by default infinite
skip-tree = [
    #{ name = "ansi_term", version = "=0.11.0", depth = 20 },
]

# This section is considered when running `cargo deny check sources`.
# More documentation about the 'sources' section can be found here:
# https://embarkstudios.github.io/cargo-deny/checks/sources/cfg.html
[sources]
# Lint level for what to happen when a crate from a crate registry that is not
# in the allow list is encountered
unknown-registry = "warn"
# Lint level for what to happen when a crate from a git repository that is not
# in the allow list is encountered
unknown-git = "warn"
# List of URLs for allowed crate registries. Defaults to the crates.io index
# if not specified. If it is specified but empty, no registries are allowed.
allow-registry = ["https://github.com/rust-lang/crates.io-index"]
# List of URLs for allowed Git repositories
allow-git = []

[sources.allow-org]
# 1 or more github.com organizations to allow git sources for
github = ["quickwit-oss"]
# 1 or more gitlab.com organizations to allow git sources for
gitlab = []
# 1 or more bitbucket.org organizations to allow git sources for
bitbucket = []


================================================
FILE: quickwit/dependency-licenses.html
================================================
<html>

<head>
    <style>
        @media (prefers-color-scheme: dark) {
            body {
                background: #333;
                color: white;
            }
            a {
                color: skyblue;
            }
        }
        .container {
            font-family: sans-serif;
            max-width: 800px;
            margin: 0 auto;
        }
        .intro {
            text-align: center;
        }
        .licenses-list {
            list-style-type: none;
            margin: 0;
            padding: 0;
        }
        .license-used-by {
            margin-top: -10px;
        }
        .license-text {
            max-height: 200px;
            overflow-y: scroll;
            white-space: pre-wrap;
        }
    </style>
</head>

<body>
    <main class="container">
        <div class="intro">
            <h1>Third Party Licenses</h1>
            <p>This page lists the licenses of the projects used in cargo-about.</p>
        </div>
    
        <h2>Overview of licenses:</h2>
        <ul class="licenses-overview">
            <li><a href="#Apache-2.0">Apache License 2.0</a> (424)</li>
            <li><a href="#MIT">MIT License</a> (168)</li>
            <li><a href="#AGPL-3.0">GNU Affero General Public License v3.0</a> (29)</li>
            <li><a href="#CC0-1.0">Creative Commons Zero v1.0 Universal</a> (7)</li>
            <li><a href="#BSD-3-Clause">BSD 3-Clause &quot;New&quot; or &quot;Revised&quot; License</a> (5)</li>
            <li><a href="#ISC">ISC License</a> (5)</li>
            <li><a href="#0BSD">BSD Zero Clause License</a> (2)</li>
            <li><a href="#MPL-2.0">Mozilla Public License 2.0</a> (2)</li>
            <li><a href="#Zlib">zlib License</a> (2)</li>
            <li><a href="#OpenSSL">OpenSSL License</a> (1)</li>
            <li><a href="#Unicode-DFS-2016">Unicode License Agreement - Data Files and Software (2016)</a> (1)</li>
            <li><a href="#zlib-acknowledgement">zlib/libpng License with Acknowledgement</a> (1)</li>
        </ul>

        <h2>All license text:</h2>
        <ul class="licenses-list">
            <li class="license">
                <h3 id="0BSD">BSD Zero Clause License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/stephaneyfx/enum-iterator.git ">enum-iterator-derive 1.4.0</a></li>
                </ul>
                <pre class="license-text">BSD Zero Clause License

Copyright (c) 2018 Stephane Raux

Permission to use, copy, modify, and/or distribute this software for any
purpose with or without fee is hereby granted.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot; AND THE AUTHOR DISCLAIMS ALL WARRANTIES WITH
REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF MERCHANTABILITY
AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY SPECIAL, DIRECT,
INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES WHATSOEVER RESULTING FROM
LOSS OF USE, DATA OR PROFITS, WHETHER IN AN ACTION OF CONTRACT, NEGLIGENCE OR
OTHER TORTIOUS ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE OR
PERFORMANCE OF THIS SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="0BSD">BSD Zero Clause License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/oyvindln/adler2 ">adler2 2.0.0</a></li>
                </ul>
                <pre class="license-text">Copyright (C) Jonas Schievink &lt;jonasschievink@gmail.com&gt;

Permission to use, copy, modify, and/or distribute this software for
any purpose with or without fee is hereby granted.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot; AND THE AUTHOR DISCLAIMS ALL WARRANTIES
WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN
AN ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT
OF OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="AGPL-3.0">GNU Affero General Public License v3.0</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/quickwit-oss/quickwit ">quickwit-actors 0.8.0</a></li>
                    <li><a href=" https://github.com/quickwit-oss/quickwit ">quickwit-aws 0.8.0</a></li>
                    <li><a href=" https://github.com/quickwit-oss/quickwit ">quickwit-cli 0.8.0</a></li>
                    <li><a href=" https://github.com/quickwit-oss/quickwit ">quickwit-cluster 0.8.0</a></li>
                    <li><a href=" https://github.com/quickwit-oss/quickwit ">quickwit-codegen 0.8.0</a></li>
                    <li><a href=" https://github.com/quickwit-oss/quickwit ">quickwit-codegen-example 0.8.0</a></li>
                    <li><a href=" https://github.com/quickwit-oss/quickwit ">quickwit-common 0.8.0</a></li>
                    <li><a href=" https://github.com/quickwit-oss/quickwit ">quickwit-config 0.8.0</a></li>
                    <li><a href=" https://github.com/quickwit-oss/quickwit ">quickwit-control-plane 0.8.0</a></li>
                    <li><a href=" https://github.com/quickwit-oss/quickwit ">quickwit-datetime 0.8.0</a></li>
                    <li><a href=" https://github.com/quickwit-oss/quickwit ">quickwit-directories 0.8.0</a></li>
                    <li><a href=" https://github.com/quickwit-oss/quickwit ">quickwit-doc-mapper 0.8.0</a></li>
                    <li><a href=" https://github.com/quickwit-oss/quickwit ">quickwit-index-management 0.8.0</a></li>
                    <li><a href=" https://github.com/quickwit-oss/quickwit ">quickwit-indexing 0.8.0</a></li>
                    <li><a href=" https://github.com/quickwit-oss/quickwit ">quickwit-ingest 0.8.0</a></li>
                    <li><a href=" https://github.com/quickwit-oss/quickwit ">quickwit-integration-tests 0.8.0</a></li>
                    <li><a href=" https://github.com/quickwit-oss/quickwit ">quickwit-jaeger 0.8.0</a></li>
                    <li><a href=" https://github.com/quickwit-oss/quickwit ">quickwit-janitor 0.8.0</a></li>
                    <li><a href=" https://github.com/quickwit-oss/quickwit ">quickwit-lambda 0.8.0</a></li>
                    <li><a href=" https://github.com/quickwit-oss/quickwit ">quickwit-macros 0.8.0</a></li>
                    <li><a href=" https://github.com/quickwit-oss/quickwit ">quickwit-metastore 0.8.0</a></li>
                    <li><a href=" https://github.com/quickwit-oss/quickwit ">quickwit-opentelemetry 0.8.0</a></li>
                    <li><a href=" https://github.com/quickwit-oss/quickwit ">quickwit-proto 0.8.0</a></li>
                    <li><a href=" https://github.com/quickwit-oss/quickwit ">quickwit-query 0.8.0</a></li>
                    <li><a href=" https://github.com/quickwit-oss/quickwit ">quickwit-rest-client 0.8.0</a></li>
                    <li><a href=" https://github.com/quickwit-oss/quickwit ">quickwit-search 0.8.0</a></li>
                    <li><a href=" https://github.com/quickwit-oss/quickwit ">quickwit-serve 0.8.0</a></li>
                    <li><a href=" https://github.com/quickwit-oss/quickwit ">quickwit-storage 0.8.0</a></li>
                    <li><a href=" https://github.com/quickwit-oss/quickwit ">quickwit-telemetry 0.8.0</a></li>
                </ul>
                <pre class="license-text">GNU AFFERO GENERAL PUBLIC LICENSE
Version 3, 19 November 2007

Copyright (C) 2007 Free Software Foundation, Inc. &lt;http://fsf.org/&gt;

Everyone is permitted to copy and distribute verbatim copies of this license document, but changing it is not allowed.

                            Preamble

The GNU Affero General Public License is a free, copyleft license for software and other kinds of works, specifically designed to ensure cooperation with the community in the case of network server software.

The licenses for most software and other practical works are designed to take away your freedom to share and change the works.  By contrast, our General Public Licenses are intended to guarantee your freedom to share and change all versions of a program--to make sure it remains free software for all its users.

When we speak of free software, we are referring to freedom, not price.  Our General Public Licenses are designed to make sure that you have the freedom to distribute copies of free software (and charge for them if you wish), that you receive source code or can get it if you want it, that you can change the software or use pieces of it in new free programs, and that you know you can do these things.

Developers that use our General Public Licenses protect your rights with two steps: (1) assert copyright on the software, and (2) offer you this License which gives you legal permission to copy, distribute and/or modify the software.

A secondary benefit of defending all users&#x27; freedom is that improvements made in alternate versions of the program, if they receive widespread use, become available for other developers to incorporate.  Many developers of free software are heartened and encouraged by the resulting cooperation.  However, in the case of software used on network servers, this result may fail to come about. The GNU General Public License permits making a modified version and letting the public access it on a server without ever releasing its source code to the public.

The GNU Affero General Public License is designed specifically to ensure that, in such cases, the modified source code becomes available to the community.  It requires the operator of a network server to provide the source code of the modified version running there to the users of that server.  Therefore, public use of a modified version, on a publicly accessible server, gives the public access to the source code of the modified version.

An older license, called the Affero General Public License and published by Affero, was designed to accomplish similar goals.  This is a different license, not a version of the Affero GPL, but Affero has released a new version of the Affero GPL which permits relicensing under this license.

The precise terms and conditions for copying, distribution and modification follow.

                       TERMS AND CONDITIONS

0. Definitions.

&quot;This License&quot; refers to version 3 of the GNU Affero General Public License.

&quot;Copyright&quot; also means copyright-like laws that apply to other kinds of works, such as semiconductor masks.

&quot;The Program&quot; refers to any copyrightable work licensed under this License.  Each licensee is addressed as &quot;you&quot;.  &quot;Licensees&quot; and &quot;recipients&quot; may be individuals or organizations.

To &quot;modify&quot; a work means to copy from or adapt all or part of the work in a fashion requiring copyright permission, other than the making of an exact copy.  The resulting work is called a &quot;modified version&quot; of the earlier work or a work &quot;based on&quot; the earlier work.

A &quot;covered work&quot; means either the unmodified Program or a work based on the Program.

To &quot;propagate&quot; a work means to do anything with it that, without permission, would make you directly or secondarily liable for infringement under applicable copyright law, except executing it on a computer or modifying a private copy.  Propagation includes copying, distribution (with or without modification), making available to the public, and in some countries other activities as well.

To &quot;convey&quot; a work means any kind of propagation that enables other parties to make or receive copies.  Mere interaction with a user through a computer network, with no transfer of a copy, is not conveying.

An interactive user interface displays &quot;Appropriate Legal Notices&quot; to the extent that it includes a convenient and prominently visible feature that (1) displays an appropriate copyright notice, and (2) tells the user that there is no warranty for the work (except to the extent that warranties are provided), that licensees may convey the work under this License, and how to view a copy of this License.  If the interface presents a list of user commands or options, such as a menu, a prominent item in the list meets this criterion.

1. Source Code.
The &quot;source code&quot; for a work means the preferred form of the work for making modifications to it.  &quot;Object code&quot; means any non-source form of a work.

A &quot;Standard Interface&quot; means an interface that either is an official standard defined by a recognized standards body, or, in the case of interfaces specified for a particular programming language, one that is widely used among developers working in that language.

The &quot;System Libraries&quot; of an executable work include anything, other than the work as a whole, that (a) is included in the normal form of packaging a Major Component, but which is not part of that Major Component, and (b) serves only to enable use of the work with that Major Component, or to implement a Standard Interface for which an implementation is available to the public in source code form.  A &quot;Major Component&quot;, in this context, means a major essential component (kernel, window system, and so on) of the specific operating system (if any) on which the executable work runs, or a compiler used to produce the work, or an object code interpreter used to run it.

The &quot;Corresponding Source&quot; for a work in object code form means all the source code needed to generate, install, and (for an executable work) run the object code and to modify the work, including scripts to control those activities.  However, it does not include the work&#x27;s System Libraries, or general-purpose tools or generally available free programs which are used unmodified in performing those activities but which are not part of the work.  For example, Corresponding Source includes interface definition files associated with source files for the work, and the source code for shared libraries and dynamically linked subprograms that the work is specifically designed to require, such as by intimate data communication or control flow between those
subprograms and other parts of the work.

The Corresponding Source need not include anything that users can regenerate automatically from other parts of the Corresponding Source.

The Corresponding Source for a work in source code form is that same work.

2. Basic Permissions.
All rights granted under this License are granted for the term of copyright on the Program, and are irrevocable provided the stated conditions are met.  This License explicitly affirms your unlimited permission to run the unmodified Program.  The output from running a covered work is covered by this License only if the output, given its content, constitutes a covered work.  This License acknowledges your rights of fair use or other equivalent, as provided by copyright law.

You may make, run and propagate covered works that you do not convey, without conditions so long as your license otherwise remains in force.  You may convey covered works to others for the sole purpose of having them make modifications exclusively for you, or provide you with facilities for running those works, provided that you comply with the terms of this License in conveying all material for which you do not control copyright.  Those thus making or running the covered works for you must do so exclusively on your behalf, under your direction and control, on terms that prohibit them from making any copies of your copyrighted material outside their relationship with you.

Conveying under any other circumstances is permitted solely under the conditions stated below.  Sublicensing is not allowed; section 10 makes it unnecessary.

3. Protecting Users&#x27; Legal Rights From Anti-Circumvention Law.
No covered work shall be deemed part of an effective technological measure under any applicable law fulfilling obligations under article 11 of the WIPO copyright treaty adopted on 20 December 1996, or similar laws prohibiting or restricting circumvention of such measures.

When you convey a covered work, you waive any legal power to forbid circumvention of technological measures to the extent such circumvention is effected by exercising rights under this License with respect to the covered work, and you disclaim any intention to limit operation or modification of the work as a means of enforcing, against the work&#x27;s users, your or third parties&#x27; legal rights to forbid circumvention of technological measures.

4. Conveying Verbatim Copies.
You may convey verbatim copies of the Program&#x27;s source code as you receive it, in any medium, provided that you conspicuously and appropriately publish on each copy an appropriate copyright notice; keep intact all notices stating that this License and any non-permissive terms added in accord with section 7 apply to the code; keep intact all notices of the absence of any warranty; and give all recipients a copy of this License along with the Program.

You may charge any price or no price for each copy that you convey, and you may offer support or warranty protection for a fee.

5. Conveying Modified Source Versions.
You may convey a work based on the Program, or the modifications to produce it from the Program, in the form of source code under the terms of section 4, provided that you also meet all of these conditions:

    a) The work must carry prominent notices stating that you modified it, and giving a relevant date.

    b) The work must carry prominent notices stating that it is released under this License and any conditions added under section 7.  This requirement modifies the requirement in section 4 to &quot;keep intact all notices&quot;.

    c) You must license the entire work, as a whole, under this License to anyone who comes into possession of a copy.  This License will therefore apply, along with any applicable section 7 additional terms, to the whole of the work, and all its parts, regardless of how they are packaged.  This License gives no permission to license the work in any other way, but it does not invalidate such permission if you have separately received it.

    d) If the work has interactive user interfaces, each must display Appropriate Legal Notices; however, if the Program has interactive interfaces that do not display Appropriate Legal Notices, your work need not make them do so.

A compilation of a covered work with other separate and independent works, which are not by their nature extensions of the covered work, and which are not combined with it such as to form a larger program, in or on a volume of a storage or distribution medium, is called an &quot;aggregate&quot; if the compilation and its resulting copyright are not used to limit the access or legal rights of the compilation&#x27;s users beyond what the individual works permit.  Inclusion of a covered work in an aggregate does not cause this License to apply to the other parts of the aggregate.

6. Conveying Non-Source Forms.
You may convey a covered work in object code form under the terms of sections 4 and 5, provided that you also convey the machine-readable Corresponding Source under the terms of this License, in one of these ways:

    a) Convey the object code in, or embodied in, a physical product (including a physical distribution medium), accompanied by the Corresponding Source fixed on a durable physical medium customarily used for software interchange.

    b) Convey the object code in, or embodied in, a physical product (including a physical distribution medium), accompanied by a written offer, valid for at least three years and valid for as long as you offer spare parts or customer support for that product model, to give anyone who possesses the object code either (1) a copy of the Corresponding Source for all the software in the product that is covered by this License, on a durable physical medium customarily used for software interchange, for a price no more than your reasonable cost of physically performing this conveying of source, or (2) access to copy the Corresponding Source from a network server at no charge.

    c) Convey individual copies of the object code with a copy of the written offer to provide the Corresponding Source.  This alternative is allowed only occasionally and noncommercially, and only if you received the object code with such an offer, in accord with subsection 6b.

    d) Convey the object code by offering access from a designated place (gratis or for a charge), and offer equivalent access to the Corresponding Source in the same way through the same place at no further charge.  You need not require recipients to copy the Corresponding Source along with the object code.  If the place to copy the object code is a network server, the Corresponding Source may be on a different server (operated by you or a third party) that supports equivalent copying facilities, provided you maintain clear directions next to the object code saying where to find the Corresponding Source.  Regardless of what server hosts the Corresponding Source, you remain obligated to ensure that it is available for as long as needed to satisfy these requirements.

    e) Convey the object code using peer-to-peer transmission, provided you inform other peers where the object code and Corresponding Source of the work are being offered to the general public at no charge under subsection 6d.

A separable portion of the object code, whose source code is excluded from the Corresponding Source as a System Library, need not be included in conveying the object code work.

A &quot;User Product&quot; is either (1) a &quot;consumer product&quot;, which means any tangible personal property which is normally used for personal, family, or household purposes, or (2) anything designed or sold for incorporation into a dwelling.  In determining whether a product is a consumer product, doubtful cases shall be resolved in favor of coverage.  For a particular product received by a particular user, &quot;normally used&quot; refers to a typical or common use of that class of product, regardless of the status of the particular user or of the way in which the particular user actually uses, or expects or is expected to use, the product.  A product is a consumer product regardless of whether the product has substantial commercial, industrial or non-consumer uses, unless such uses represent the only significant mode of use of the product.

&quot;Installation Information&quot; for a User Product means any methods, procedures, authorization keys, or other information required to install and execute modified versions of a covered work in that User Product from a modified version of its Corresponding Source.  The information must suffice to ensure that the continued functioning of the modified object code is in no case prevented or interfered with solely because modification has been made.

If you convey an object code work under this section in, or with, or specifically for use in, a User Product, and the conveying occurs as part of a transaction in which the right of possession and use of the User Product is transferred to the recipient in perpetuity or for a fixed term (regardless of how the transaction is characterized), the Corresponding Source conveyed under this section must be accompanied by the Installation Information.  But this requirement does not apply if neither you nor any third party retains the ability to install modified object code on the User Product (for example, the work has been installed in ROM).

The requirement to provide Installation Information does not include a requirement to continue to provide support service, warranty, or updates for a work that has been modified or installed by the recipient, or for the User Product in which it has been modified or installed.  Access to a network may be denied when the modification itself materially and adversely affects the operation of the network or violates the rules and protocols for communication across the network.

Corresponding Source conveyed, and Installation Information provided, in accord with this section must be in a format that is publicly documented (and with an implementation available to the public in source code form), and must require no special password or key for unpacking, reading or copying.

7. Additional Terms.
&quot;Additional permissions&quot; are terms that supplement the terms of this License by making exceptions from one or more of its conditions. Additional permissions that are applicable to the entire Program shall be treated as though they were included in this License, to the extent that they are valid under applicable law.  If additional permissions apply only to part of the Program, that part may be used separately under those permissions, but the entire Program remains governed by this License without regard to the additional permissions.

When you convey a copy of a covered work, you may at your option remove any additional permissions from that copy, or from any part of it.  (Additional permissions may be written to require their own removal in certain cases when you modify the work.)  You may place additional permissions on material, added by you to a covered work, for which you have or can give appropriate copyright permission.

Notwithstanding any other provision of this License, for material you add to a covered work, you may (if authorized by the copyright holders of that material) supplement the terms of this License with terms:

    a) Disclaiming warranty or limiting liability differently from the terms of sections 15 and 16 of this License; or

    b) Requiring preservation of specified reasonable legal notices or author attributions in that material or in the Appropriate Legal Notices displayed by works containing it; or

    c) Prohibiting misrepresentation of the origin of that material, or requiring that modified versions of such material be marked in reasonable ways as different from the original version; or

    d) Limiting the use for publicity purposes of names of licensors or authors of the material; or

    e) Declining to grant rights under trademark law for use of some trade names, trademarks, or service marks; or

    f) Requiring indemnification of licensors and authors of that material by anyone who conveys the material (or modified versions of it) with contractual assumptions of liability to the recipient, for any liability that these contractual assumptions directly impose on those licensors and authors.

All other non-permissive additional terms are considered &quot;further restrictions&quot; within the meaning of section 10.  If the Program as you received it, or any part of it, contains a notice stating that it is governed by this License along with a term that is a further restriction, you may remove that term.  If a license document contains a further restriction but permits relicensing or conveying under this License, you may add to a covered work material governed by the terms of that license document, provided that the further restriction does not survive such relicensing or conveying.

If you add terms to a covered work in accord with this section, you must place, in the relevant source files, a statement of the additional terms that apply to those files, or a notice indicating where to find the applicable terms.

Additional terms, permissive or non-permissive, may be stated in the form of a separately written license, or stated as exceptions; the above requirements apply either way.

8. Termination.

You may not propagate or modify a covered work except as expressly provided under this License.  Any attempt otherwise to propagate or modify it is void, and will automatically terminate your rights under this License (including any patent licenses granted under the third paragraph of section 11).

However, if you cease all violation of this License, then your license from a particular copyright holder is reinstated (a) provisionally, unless and until the copyright holder explicitly and finally terminates your license, and (b) permanently, if the copyright holder fails to notify you of the violation by some reasonable means prior to 60 days after the cessation.

Moreover, your license from a particular copyright holder is reinstated permanently if the copyright holder notifies you of the violation by some reasonable means, this is the first time you have received notice of violation of this License (for any work) from that copyright holder, and you cure the violation prior to 30 days after your receipt of the notice.

Termination of your rights under this section does not terminate the licenses of parties who have received copies or rights from you under this License.  If your rights have been terminated and not permanently reinstated, you do not qualify to receive new licenses for the same material under section 10.

9. Acceptance Not Required for Having Copies.

You are not required to accept this License in order to receive or run a copy of the Program.  Ancillary propagation of a covered work occurring solely as a consequence of using peer-to-peer transmission to receive a copy likewise does not require acceptance.  However, nothing other than this License grants you permission to propagate or modify any covered work.  These actions infringe copyright if you do not accept this License.  Therefore, by modifying or propagating a covered work, you indicate your acceptance of this License to do so.

10. Automatic Licensing of Downstream Recipients.

Each time you convey a covered work, the recipient automatically receives a license from the original licensors, to run, modify and propagate that work, subject to this License.  You are not responsible for enforcing compliance by third parties with this License.

An &quot;entity transaction&quot; is a transaction transferring control of an organization, or substantially all assets of one, or subdividing an organization, or merging organizations.  If propagation of a covered work results from an entity transaction, each party to that transaction who receives a copy of the work also receives whatever licenses to the work the party&#x27;s predecessor in interest had or could give under the previous paragraph, plus a right to possession of the Corresponding Source of the work from the predecessor in interest, if the predecessor has it or can get it with reasonable efforts.

You may not impose any further restrictions on the exercise of the rights granted or affirmed under this License.  For example, you may not impose a license fee, royalty, or other charge for exercise of rights granted under this License, and you may not initiate litigation (including a cross-claim or counterclaim in a lawsuit) alleging that any patent claim is infringed by making, using, selling, offering for sale, or importing the Program or any portion of it.

11. Patents.

A &quot;contributor&quot; is a copyright holder who authorizes use under this License of the Program or a work on which the Program is based.  The work thus licensed is called the contributor&#x27;s &quot;contributor version&quot;.

A contributor&#x27;s &quot;essential patent claims&quot; are all patent claims owned or controlled by the contributor, whether already acquired or hereafter acquired, that would be infringed by some manner, permitted by this License, of making, using, or selling its contributor version, but do not include claims that would be infringed only as a consequence of further modification of the contributor version.  For purposes of this definition, &quot;control&quot; includes the right to grant patent sublicenses in a manner consistent with the requirements of this License.

Each contributor grants you a non-exclusive, worldwide, royalty-free patent license under the contributor&#x27;s essential patent claims, to make, use, sell, offer for sale, import and otherwise run, modify and propagate the contents of its contributor version.

In the following three paragraphs, a &quot;patent license&quot; is any express agreement or commitment, however denominated, not to enforce a patent (such as an express permission to practice a patent or covenant not to sue for patent infringement).  To &quot;grant&quot; such a patent license to a party means to make such an agreement or commitment not to enforce a patent against the party.

If you convey a covered work, knowingly relying on a patent license, and the Corresponding Source of the work is not available for anyone to copy, free of charge and under the terms of this License, through a publicly available network server or other readily accessible means, then you must either (1) cause the Corresponding Source to be so available, or (2) arrange to deprive yourself of the benefit of the patent license for this particular work, or (3) arrange, in a manner consistent with the requirements of this License, to extend the patent
license to downstream recipients.  &quot;Knowingly relying&quot; means you have actual knowledge that, but for the patent license, your conveying the covered work in a country, or your recipient&#x27;s use of the covered work in a country, would infringe one or more identifiable patents in that country that you have reason to believe are valid.

If, pursuant to or in connection with a single transaction or arrangement, you convey, or propagate by procuring conveyance of, a covered work, and grant a patent license to some of the parties receiving the covered work authorizing them to use, propagate, modify or convey a specific copy of the covered work, then the patent license you grant is automatically extended to all recipients of the covered work and works based on it.

A patent license is &quot;discriminatory&quot; if it does not include within the scope of its coverage, prohibits the exercise of, or is conditioned on the non-exercise of one or more of the rights that are specifically granted under this License.  You may not convey a covered work if you are a party to an arrangement with a third party that is in the business of distributing software, under which you make payment to the third party based on the extent of your activity of conveying the work, and under which the third party grants, to any of the parties who would receive the covered work from you, a discriminatory patent license (a) in connection with copies of the covered work conveyed by you (or copies made from those copies), or (b) primarily for and in connection with specific products or compilations that contain the covered work, unless you entered into that arrangement, or that patent license was granted, prior to 28 March 2007.

Nothing in this License shall be construed as excluding or limiting any implied license or other defenses to infringement that may otherwise be available to you under applicable patent law.

12. No Surrender of Others&#x27; Freedom.

If conditions are imposed on you (whether by court order, agreement or otherwise) that contradict the conditions of this License, they do not excuse you from the conditions of this License.  If you cannot convey a covered work so as to satisfy simultaneously your obligations under this License and any other pertinent obligations, then as a consequence you may
not convey it at all.  For example, if you agree to terms that obligate you to collect a royalty for further conveying from those to whom you convey the Program, the only way you could satisfy both those terms and this License would be to refrain entirely from conveying the Program.

13. Remote Network Interaction; Use with the GNU General Public License.

Notwithstanding any other provision of this License, if you modify the Program, your modified version must prominently offer all users interacting with it remotely through a computer network (if your version supports such interaction) an opportunity to receive the Corresponding Source of your version by providing access to the Corresponding Source from a network server at no charge, through some standard or customary means of facilitating copying of software.  This Corresponding Source shall include the Corresponding Source for any work covered by version 3 of the GNU General Public License that is incorporated pursuant to the following paragraph.

Notwithstanding any other provision of this License, you have permission to link or combine any covered work with a work licensed under version 3 of the GNU General Public License into a single combined work, and to convey the resulting work.  The terms of this License will continue to apply to the part which is the covered work, but the work with which it is combined will remain governed by version 3 of the GNU General Public License.

14. Revised Versions of this License.

The Free Software Foundation may publish revised and/or new versions of the GNU Affero General Public License from time to time.  Such new versions will be similar in spirit to the present version, but may differ in detail to address new problems or concerns.

Each version is given a distinguishing version number.  If the Program specifies that a certain numbered version of the GNU Affero General Public License &quot;or any later version&quot; applies to it, you have the option of following the terms and conditions either of that numbered version or of any later version published by the Free Software Foundation.  If the Program does not specify a version number of the GNU Affero General Public License, you may choose any version ever published by the Free Software Foundation.

If the Program specifies that a proxy can decide which future versions of the GNU Affero General Public License can be used, that proxy&#x27;s public statement of acceptance of a version permanently authorizes you to choose that version for the Program.

Later license versions may give you additional or different permissions.  However, no additional obligations are imposed on any author or copyright holder as a result of your choosing to follow a later version.

15. Disclaimer of Warranty.

THERE IS NO WARRANTY FOR THE PROGRAM, TO THE EXTENT PERMITTED BY APPLICABLE LAW.  EXCEPT WHEN OTHERWISE STATED IN WRITING THE COPYRIGHT HOLDERS AND/OR OTHER PARTIES PROVIDE THE PROGRAM &quot;AS IS&quot; WITHOUT WARRANTY OF ANY KIND, EITHER EXPRESSED OR IMPLIED, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE.  THE ENTIRE RISK AS TO THE QUALITY AND PERFORMANCE OF THE PROGRAM IS WITH YOU.  SHOULD THE PROGRAM PROVE DEFECTIVE, YOU ASSUME THE COST OF ALL NECESSARY SERVICING, REPAIR OR CORRECTION.

16. Limitation of Liability.

IN NO EVENT UNLESS REQUIRED BY APPLICABLE LAW OR AGREED TO IN WRITING WILL ANY COPYRIGHT HOLDER, OR ANY OTHER PARTY WHO MODIFIES AND/OR CONVEYS THE PROGRAM AS PERMITTED ABOVE, BE LIABLE TO YOU FOR DAMAGES, INCLUDING ANY GENERAL, SPECIAL, INCIDENTAL OR CONSEQUENTIAL DAMAGES ARISING OUT OF THE USE OR INABILITY TO USE THE PROGRAM (INCLUDING BUT NOT LIMITED TO LOSS OF DATA OR DATA BEING RENDERED INACCURATE OR LOSSES SUSTAINED BY YOU OR THIRD PARTIES OR A FAILURE OF THE PROGRAM TO OPERATE WITH ANY OTHER PROGRAMS), EVEN IF SUCH HOLDER OR OTHER PARTY HAS BEEN ADVISED OF THE POSSIBILITY OF SUCH DAMAGES.

17. Interpretation of Sections 15 and 16.

If the disclaimer of warranty and limitation of liability provided above cannot be given local legal effect according to their terms, reviewing courts shall apply local law that most closely approximates an absolute waiver of all civil liability in connection with the Program, unless a warranty or assumption of liability accompanies a copy of the Program in return for a fee.

END OF TERMS AND CONDITIONS

            How to Apply These Terms to Your New Programs

If you develop a new program, and you want it to be of the greatest possible use to the public, the best way to achieve this is to make it free software which everyone can redistribute and change under these terms.

To do so, attach the following notices to the program.  It is safest to attach them to the start of each source file to most effectively state the exclusion of warranty; and each file should have at least the &quot;copyright&quot; line and a pointer to where the full notice is found.

     &lt;one line to give the program&#x27;s name and a brief idea of what it does.&gt;
     Copyright (C) &lt;year&gt;  &lt;name of author&gt;

     This program is free software: you can redistribute it and/or modify it under the terms of the GNU Affero General Public License as published by the Free Software Foundation, either version 3 of the License, or (at your option) any later version.

     This program is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU Affero General Public License for more details.

     You should have received a copy of the GNU Affero General Public License along with this program.  If not, see &lt;http://www.gnu.org/licenses/&gt;.

Also add information on how to contact you by electronic and paper mail.

If your software can interact with users remotely through a computer network, you should also make sure that it provides a way for users to get its source.  For example, if your program is a web application, its interface could display a &quot;Source&quot; link that leads users to an archive of the code.  There are many ways you could offer source, and different solutions will be better for different programs; see section 13 for the specific requirements.

You should also get your employer (if you work as a programmer) or school, if any, to sign a &quot;copyright disclaimer&quot; for the program, if necessary. For more information on this, and how to apply and follow the GNU AGPL, see &lt;http://www.gnu.org/licenses/&gt;.
</pre>
            </li>
            <li class="license">
                <h3 id="Apache-2.0">Apache License 2.0</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/smithy-lang/smithy-rs ">aws-config 1.5.8</a></li>
                    <li><a href=" https://github.com/smithy-lang/smithy-rs ">aws-credential-types 1.2.1</a></li>
                    <li><a href=" https://github.com/smithy-lang/smithy-rs ">aws-runtime 1.4.3</a></li>
                    <li><a href=" https://github.com/smithy-lang/smithy-rs ">aws-smithy-async 1.2.1</a></li>
                    <li><a href=" https://github.com/smithy-lang/smithy-rs ">aws-smithy-checksums 0.60.12</a></li>
                    <li><a href=" https://github.com/smithy-lang/smithy-rs ">aws-smithy-eventstream 0.60.5</a></li>
                    <li><a href=" https://github.com/smithy-lang/smithy-rs ">aws-smithy-http 0.60.11</a></li>
                    <li><a href=" https://github.com/smithy-lang/smithy-rs ">aws-smithy-json 0.60.7</a></li>
                    <li><a href=" https://github.com/smithy-lang/smithy-rs ">aws-smithy-protocol-test 0.63.0</a></li>
                    <li><a href=" https://github.com/smithy-lang/smithy-rs ">aws-smithy-query 0.60.7</a></li>
                    <li><a href=" https://github.com/smithy-lang/smithy-rs ">aws-smithy-runtime-api 1.7.2</a></li>
                    <li><a href=" https://github.com/smithy-lang/smithy-rs ">aws-smithy-runtime 1.7.2</a></li>
                    <li><a href=" https://github.com/smithy-lang/smithy-rs ">aws-smithy-types 1.2.7</a></li>
                    <li><a href=" https://github.com/smithy-lang/smithy-rs ">aws-smithy-xml 0.60.9</a></li>
                    <li><a href=" https://github.com/smithy-lang/smithy-rs ">aws-types 1.3.3</a></li>
                </ul>
                <pre class="license-text">
                                 Apache License
                           Version 2.0, January 2004
                        http://www.apache.org/licenses/

   TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION

   1. Definitions.

      &quot;License&quot; shall mean the terms and conditions for use, reproduction,
      and distribution as defined by Sections 1 through 9 of this document.

      &quot;Licensor&quot; shall mean the copyright owner or entity authorized by
      the copyright owner that is granting the License.

      &quot;Legal Entity&quot; shall mean the union of the acting entity and all
      other entities that control, are controlled by, or are under common
      control with that entity. For the purposes of this definition,
      &quot;control&quot; means (i) the power, direct or indirect, to cause the
      direction or management of such entity, whether by contract or
      otherwise, or (ii) ownership of fifty percent (50%) or more of the
      outstanding shares, or (iii) beneficial ownership of such entity.

      &quot;You&quot; (or &quot;Your&quot;) shall mean an individual or Legal Entity
      exercising permissions granted by this License.

      &quot;Source&quot; form shall mean the preferred form for making modifications,
      including but not limited to software source code, documentation
      source, and configuration files.

      &quot;Object&quot; form shall mean any form resulting from mechanical
      transformation or translation of a Source form, including but
      not limited to compiled object code, generated documentation,
      and conversions to other media types.

      &quot;Work&quot; shall mean the work of authorship, whether in Source or
      Object form, made available under the License, as indicated by a
      copyright notice that is included in or attached to the work
      (an example is provided in the Appendix below).

      &quot;Derivative Works&quot; shall mean any work, whether in Source or Object
      form, that is based on (or derived from) the Work and for which the
      editorial revisions, annotations, elaborations, or other modifications
      represent, as a whole, an original work of authorship. For the purposes
      of this License, Derivative Works shall not include works that remain
      separable from, or merely link (or bind by name) to the interfaces of,
      the Work and Derivative Works thereof.

      &quot;Contribution&quot; shall mean any work of authorship, including
      the original version of the Work and any modifications or additions
      to that Work or Derivative Works thereof, that is intentionally
      submitted to Licensor for inclusion in the Work by the copyright owner
      or by an individual or Legal Entity authorized to submit on behalf of
      the copyright owner. For the purposes of this definition, &quot;submitted&quot;
      means any form of electronic, verbal, or written communication sent
      to the Licensor or its representatives, including but not limited to
      communication on electronic mailing lists, source code control systems,
      and issue tracking systems that are managed by, or on behalf of, the
      Licensor for the purpose of discussing and improving the Work, but
      excluding communication that is conspicuously marked or otherwise
      designated in writing by the copyright owner as &quot;Not a Contribution.&quot;

      &quot;Contributor&quot; shall mean Licensor and any individual or Legal Entity
      on behalf of whom a Contribution has been received by Licensor and
      subsequently incorporated within the Work.

   2. Grant of Copyright License. Subject to the terms and conditions of
      this License, each Contributor hereby grants to You a perpetual,
      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
      copyright license to reproduce, prepare Derivative Works of,
      publicly display, publicly perform, sublicense, and distribute the
      Work and such Derivative Works in Source or Object form.

   3. Grant of Patent License. Subject to the terms and conditions of
      this License, each Contributor hereby grants to You a perpetual,
      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
      (except as stated in this section) patent license to make, have made,
      use, offer to sell, sell, import, and otherwise transfer the Work,
      where such license applies only to those patent claims licensable
      by such Contributor that are necessarily infringed by their
      Contribution(s) alone or by combination of their Contribution(s)
      with the Work to which such Contribution(s) was submitted. If You
      institute patent litigation against any entity (including a
      cross-claim or counterclaim in a lawsuit) alleging that the Work
      or a Contribution incorporated within the Work constitutes direct
      or contributory patent infringement, then any patent licenses
      granted to You under this License for that Work shall terminate
      as of the date such litigation is filed.

   4. Redistribution. You may reproduce and distribute copies of the
      Work or Derivative Works thereof in any medium, with or without
      modifications, and in Source or Object form, provided that You
      meet the following conditions:

      (a) You must give any other recipients of the Work or
          Derivative Works a copy of this License; and

      (b) You must cause any modified files to carry prominent notices
          stating that You changed the files; and

      (c) You must retain, in the Source form of any Derivative Works
          that You distribute, all copyright, patent, trademark, and
          attribution notices from the Source form of the Work,
          excluding those notices that do not pertain to any part of
          the Derivative Works; and

      (d) If the Work includes a &quot;NOTICE&quot; text file as part of its
          distribution, then any Derivative Works that You distribute must
          include a readable copy of the attribution notices contained
          within such NOTICE file, excluding those notices that do not
          pertain to any part of the Derivative Works, in at least one
          of the following places: within a NOTICE text file distributed
          as part of the Derivative Works; within the Source form or
          documentation, if provided along with the Derivative Works; or,
          within a display generated by the Derivative Works, if and
          wherever such third-party notices normally appear. The contents
          of the NOTICE file are for informational purposes only and
          do not modify the License. You may add Your own attribution
          notices within Derivative Works that You distribute, alongside
          or as an addendum to the NOTICE text from the Work, provided
          that such additional attribution notices cannot be construed
          as modifying the License.

      You may add Your own copyright statement to Your modifications and
      may provide additional or different license terms and conditions
      for use, reproduction, or distribution of Your modifications, or
      for any such Derivative Works as a whole, provided Your use,
      reproduction, and distribution of the Work otherwise complies with
      the conditions stated in this License.

   5. Submission of Contributions. Unless You explicitly state otherwise,
      any Contribution intentionally submitted for inclusion in the Work
      by You to the Licensor shall be under the terms and conditions of
      this License, without any additional terms or conditions.
      Notwithstanding the above, nothing herein shall supersede or modify
      the terms of any separate license agreement you may have executed
      with Licensor regarding such Contributions.

   6. Trademarks. This License does not grant permission to use the trade
      names, trademarks, service marks, or product names of the Licensor,
      except as required for reasonable and customary use in describing the
      origin of the Work and reproducing the content of the NOTICE file.

   7. Disclaimer of Warranty. Unless required by applicable law or
      agreed to in writing, Licensor provides the Work (and each
      Contributor provides its Contributions) on an &quot;AS IS&quot; BASIS,
      WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
      implied, including, without limitation, any warranties or conditions
      of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
      PARTICULAR PURPOSE. You are solely responsible for determining the
      appropriateness of using or redistributing the Work and assume any
      risks associated with Your exercise of permissions under this License.

   8. Limitation of Liability. In no event and under no legal theory,
      whether in tort (including negligence), contract, or otherwise,
      unless required by applicable law (such as deliberate and grossly
      negligent acts) or agreed to in writing, shall any Contributor be
      liable to You for damages, including any direct, indirect, special,
      incidental, or consequential damages of any character arising as a
      result of this License or out of the use or inability to use the
      Work (including but not limited to damages for loss of goodwill,
      work stoppage, computer failure or malfunction, or any and all
      other commercial damages or losses), even if such Contributor
      has been advised of the possibility of such damages.

   9. Accepting Warranty or Additional Liability. While redistributing
      the Work or Derivative Works thereof, You may choose to offer,
      and charge a fee for, acceptance of support, warranty, indemnity,
      or other liability obligations and/or rights consistent with this
      License. However, in accepting such obligations, You may act only
      on Your own behalf and on Your sole responsibility, not on behalf
      of any other Contributor, and only if You agree to indemnify,
      defend, and hold each Contributor harmless for any liability
      incurred by, or claims asserted against, such Contributor by reason
      of your accepting any such warranty or additional liability.
</pre>
            </li>
            <li class="license">
                <h3 id="Apache-2.0">Apache License 2.0</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/Frommi/miniz_oxide/tree/master/miniz_oxide ">miniz_oxide 0.8.0</a></li>
                    <li><a href=" https://github.com/taiki-e/pin-project ">pin-project-internal 1.1.6</a></li>
                    <li><a href=" https://github.com/taiki-e/pin-project-lite ">pin-project-lite 0.2.14</a></li>
                    <li><a href=" https://github.com/taiki-e/pin-project ">pin-project 1.1.6</a></li>
                    <li><a href=" https://github.com/taiki-e/portable-atomic ">portable-atomic 1.9.0</a></li>
                    <li><a href=" https://github.com/Actyx/sync_wrapper ">sync_wrapper 0.1.2</a></li>
                    <li><a href=" https://github.com/gyscos/zstd-rs ">zstd-safe 5.0.2+zstd.1.5.2</a></li>
                    <li><a href=" https://github.com/gyscos/zstd-rs ">zstd-safe 7.2.1</a></li>
                    <li><a href=" https://github.com/gyscos/zstd-rs ">zstd-sys 2.0.13+zstd.1.5.6</a></li>
                </ul>
                <pre class="license-text">
                                 Apache License
                           Version 2.0, January 2004
                        http://www.apache.org/licenses/

   TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION

   1. Definitions.

      &quot;License&quot; shall mean the terms and conditions for use, reproduction,
      and distribution as defined by Sections 1 through 9 of this document.

      &quot;Licensor&quot; shall mean the copyright owner or entity authorized by
      the copyright owner that is granting the License.

      &quot;Legal Entity&quot; shall mean the union of the acting entity and all
      other entities that control, are controlled by, or are under common
      control with that entity. For the purposes of this definition,
      &quot;control&quot; means (i) the power, direct or indirect, to cause the
      direction or management of such entity, whether by contract or
      otherwise, or (ii) ownership of fifty percent (50%) or more of the
      outstanding shares, or (iii) beneficial ownership of such entity.

      &quot;You&quot; (or &quot;Your&quot;) shall mean an individual or Legal Entity
      exercising permissions granted by this License.

      &quot;Source&quot; form shall mean the preferred form for making modifications,
      including but not limited to software source code, documentation
      source, and configuration files.

      &quot;Object&quot; form shall mean any form resulting from mechanical
      transformation or translation of a Source form, including but
      not limited to compiled object code, generated documentation,
      and conversions to other media types.

      &quot;Work&quot; shall mean the work of authorship, whether in Source or
      Object form, made available under the License, as indicated by a
      copyright notice that is included in or attached to the work
      (an example is provided in the Appendix below).

      &quot;Derivative Works&quot; shall mean any work, whether in Source or Object
      form, that is based on (or derived from) the Work and for which the
      editorial revisions, annotations, elaborations, or other modifications
      represent, as a whole, an original work of authorship. For the purposes
      of this License, Derivative Works shall not include works that remain
      separable from, or merely link (or bind by name) to the interfaces of,
      the Work and Derivative Works thereof.

      &quot;Contribution&quot; shall mean any work of authorship, including
      the original version of the Work and any modifications or additions
      to that Work or Derivative Works thereof, that is intentionally
      submitted to Licensor for inclusion in the Work by the copyright owner
      or by an individual or Legal Entity authorized to submit on behalf of
      the copyright owner. For the purposes of this definition, &quot;submitted&quot;
      means any form of electronic, verbal, or written communication sent
      to the Licensor or its representatives, including but not limited to
      communication on electronic mailing lists, source code control systems,
      and issue tracking systems that are managed by, or on behalf of, the
      Licensor for the purpose of discussing and improving the Work, but
      excluding communication that is conspicuously marked or otherwise
      designated in writing by the copyright owner as &quot;Not a Contribution.&quot;

      &quot;Contributor&quot; shall mean Licensor and any individual or Legal Entity
      on behalf of whom a Contribution has been received by Licensor and
      subsequently incorporated within the Work.

   2. Grant of Copyright License. Subject to the terms and conditions of
      this License, each Contributor hereby grants to You a perpetual,
      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
      copyright license to reproduce, prepare Derivative Works of,
      publicly display, publicly perform, sublicense, and distribute the
      Work and such Derivative Works in Source or Object form.

   3. Grant of Patent License. Subject to the terms and conditions of
      this License, each Contributor hereby grants to You a perpetual,
      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
      (except as stated in this section) patent license to make, have made,
      use, offer to sell, sell, import, and otherwise transfer the Work,
      where such license applies only to those patent claims licensable
      by such Contributor that are necessarily infringed by their
      Contribution(s) alone or by combination of their Contribution(s)
      with the Work to which such Contribution(s) was submitted. If You
      institute patent litigation against any entity (including a
      cross-claim or counterclaim in a lawsuit) alleging that the Work
      or a Contribution incorporated within the Work constitutes direct
      or contributory patent infringement, then any patent licenses
      granted to You under this License for that Work shall terminate
      as of the date such litigation is filed.

   4. Redistribution. You may reproduce and distribute copies of the
      Work or Derivative Works thereof in any medium, with or without
      modifications, and in Source or Object form, provided that You
      meet the following conditions:

      (a) You must give any other recipients of the Work or
          Derivative Works a copy of this License; and

      (b) You must cause any modified files to carry prominent notices
          stating that You changed the files; and

      (c) You must retain, in the Source form of any Derivative Works
          that You distribute, all copyright, patent, trademark, and
          attribution notices from the Source form of the Work,
          excluding those notices that do not pertain to any part of
          the Derivative Works; and

      (d) If the Work includes a &quot;NOTICE&quot; text file as part of its
          distribution, then any Derivative Works that You distribute must
          include a readable copy of the attribution notices contained
          within such NOTICE file, excluding those notices that do not
          pertain to any part of the Derivative Works, in at least one
          of the following places: within a NOTICE text file distributed
          as part of the Derivative Works; within the Source form or
          documentation, if provided along with the Derivative Works; or,
          within a display generated by the Derivative Works, if and
          wherever such third-party notices normally appear. The contents
          of the NOTICE file are for informational purposes only and
          do not modify the License. You may add Your own attribution
          notices within Derivative Works that You distribute, alongside
          or as an addendum to the NOTICE text from the Work, provided
          that such additional attribution notices cannot be construed
          as modifying the License.

      You may add Your own copyright statement to Your modifications and
      may provide additional or different license terms and conditions
      for use, reproduction, or distribution of Your modifications, or
      for any such Derivative Works as a whole, provided Your use,
      reproduction, and distribution of the Work otherwise complies with
      the conditions stated in this License.

   5. Submission of Contributions. Unless You explicitly state otherwise,
      any Contribution intentionally submitted for inclusion in the Work
      by You to the Licensor shall be under the terms and conditions of
      this License, without any additional terms or conditions.
      Notwithstanding the above, nothing herein shall supersede or modify
      the terms of any separate license agreement you may have executed
      with Licensor regarding such Contributions.

   6. Trademarks. This License does not grant permission to use the trade
      names, trademarks, service marks, or product names of the Licensor,
      except as required for reasonable and customary use in describing the
      origin of the Work and reproducing the content of the NOTICE file.

   7. Disclaimer of Warranty. Unless required by applicable law or
      agreed to in writing, Licensor provides the Work (and each
      Contributor provides its Contributions) on an &quot;AS IS&quot; BASIS,
      WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
      implied, including, without limitation, any warranties or conditions
      of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
      PARTICULAR PURPOSE. You are solely responsible for determining the
      appropriateness of using or redistributing the Work and assume any
      risks associated with Your exercise of permissions under this License.

   8. Limitation of Liability. In no event and under no legal theory,
      whether in tort (including negligence), contract, or otherwise,
      unless required by applicable law (such as deliberate and grossly
      negligent acts) or agreed to in writing, shall any Contributor be
      liable to You for damages, including any direct, indirect, special,
      incidental, or consequential damages of any character arising as a
      result of this License or out of the use or inability to use the
      Work (including but not limited to damages for loss of goodwill,
      work stoppage, computer failure or malfunction, or any and all
      other commercial damages or losses), even if such Contributor
      has been advised of the possibility of such damages.

   9. Accepting Warranty or Additional Liability. While redistributing
      the Work or Derivative Works thereof, You may choose to offer,
      and charge a fee for, acceptance of support, warranty, indemnity,
      or other liability obligations and/or rights consistent with this
      License. However, in accepting such obligations, You may act only
      on Your own behalf and on Your sole responsibility, not on behalf
      of any other Contributor, and only if You agree to indemnify,
      defend, and hold each Contributor harmless for any liability
      incurred by, or claims asserted against, such Contributor by reason
      of your accepting any such warranty or additional liability.

   END OF TERMS AND CONDITIONS
</pre>
            </li>
            <li class="license">
                <h3 id="Apache-2.0">Apache License 2.0</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/jhpratt/deranged ">deranged 0.3.11</a></li>
                    <li><a href=" https://github.com/time-rs/time ">time-core 0.1.2</a></li>
                </ul>
                <pre class="license-text">
                                 Apache License
                           Version 2.0, January 2004
                        http://www.apache.org/licenses/

   TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION

   1. Definitions.

      &quot;License&quot; shall mean the terms and conditions for use, reproduction,
      and distribution as defined by Sections 1 through 9 of this document.

      &quot;Licensor&quot; shall mean the copyright owner or entity authorized by
      the copyright owner that is granting the License.

      &quot;Legal Entity&quot; shall mean the union of the acting entity and all
      other entities that control, are controlled by, or are under common
      control with that entity. For the purposes of this definition,
      &quot;control&quot; means (i) the power, direct or indirect, to cause the
      direction or management of such entity, whether by contract or
      otherwise, or (ii) ownership of fifty percent (50%) or more of the
      outstanding shares, or (iii) beneficial ownership of such entity.

      &quot;You&quot; (or &quot;Your&quot;) shall mean an individual or Legal Entity
      exercising permissions granted by this License.

      &quot;Source&quot; form shall mean the preferred form for making modifications,
      including but not limited to software source code, documentation
      source, and configuration files.

      &quot;Object&quot; form shall mean any form resulting from mechanical
      transformation or translation of a Source form, including but
      not limited to compiled object code, generated documentation,
      and conversions to other media types.

      &quot;Work&quot; shall mean the work of authorship, whether in Source or
      Object form, made available under the License, as indicated by a
      copyright notice that is included in or attached to the work
      (an example is provided in the Appendix below).

      &quot;Derivative Works&quot; shall mean any work, whether in Source or Object
      form, that is based on (or derived from) the Work and for which the
      editorial revisions, annotations, elaborations, or other modifications
      represent, as a whole, an original work of authorship. For the purposes
      of this License, Derivative Works shall not include works that remain
      separable from, or merely link (or bind by name) to the interfaces of,
      the Work and Derivative Works thereof.

      &quot;Contribution&quot; shall mean any work of authorship, including
      the original version of the Work and any modifications or additions
      to that Work or Derivative Works thereof, that is intentionally
      submitted to Licensor for inclusion in the Work by the copyright owner
      or by an individual or Legal Entity authorized to submit on behalf of
      the copyright owner. For the purposes of this definition, &quot;submitted&quot;
      means any form of electronic, verbal, or written communication sent
      to the Licensor or its representatives, including but not limited to
      communication on electronic mailing lists, source code control systems,
      and issue tracking systems that are managed by, or on behalf of, the
      Licensor for the purpose of discussing and improving the Work, but
      excluding communication that is conspicuously marked or otherwise
      designated in writing by the copyright owner as &quot;Not a Contribution.&quot;

      &quot;Contributor&quot; shall mean Licensor and any individual or Legal Entity
      on behalf of whom a Contribution has been received by Licensor and
      subsequently incorporated within the Work.

   2. Grant of Copyright License. Subject to the terms and conditions of
      this License, each Contributor hereby grants to You a perpetual,
      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
      copyright license to reproduce, prepare Derivative Works of,
      publicly display, publicly perform, sublicense, and distribute the
      Work and such Derivative Works in Source or Object form.

   3. Grant of Patent License. Subject to the terms and conditions of
      this License, each Contributor hereby grants to You a perpetual,
      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
      (except as stated in this section) patent license to make, have made,
      use, offer to sell, sell, import, and otherwise transfer the Work,
      where such license applies only to those patent claims licensable
      by such Contributor that are necessarily infringed by their
      Contribution(s) alone or by combination of their Contribution(s)
      with the Work to which such Contribution(s) was submitted. If You
      institute patent litigation against any entity (including a
      cross-claim or counterclaim in a lawsuit) alleging that the Work
      or a Contribution incorporated within the Work constitutes direct
      or contributory patent infringement, then any patent licenses
      granted to You under this License for that Work shall terminate
      as of the date such litigation is filed.

   4. Redistribution. You may reproduce and distribute copies of the
      Work or Derivative Works thereof in any medium, with or without
      modifications, and in Source or Object form, provided that You
      meet the following conditions:

      (a) You must give any other recipients of the Work or
          Derivative Works a copy of this License; and

      (b) You must cause any modified files to carry prominent notices
          stating that You changed the files; and

      (c) You must retain, in the Source form of any Derivative Works
          that You distribute, all copyright, patent, trademark, and
          attribution notices from the Source form of the Work,
          excluding those notices that do not pertain to any part of
          the Derivative Works; and

      (d) If the Work includes a &quot;NOTICE&quot; text file as part of its
          distribution, then any Derivative Works that You distribute must
          include a readable copy of the attribution notices contained
          within such NOTICE file, excluding those notices that do not
          pertain to any part of the Derivative Works, in at least one
          of the following places: within a NOTICE text file distributed
          as part of the Derivative Works; within the Source form or
          documentation, if provided along with the Derivative Works; or,
          within a display generated by the Derivative Works, if and
          wherever such third-party notices normally appear. The contents
          of the NOTICE file are for informational purposes only and
          do not modify the License. You may add Your own attribution
          notices within Derivative Works that You distribute, alongside
          or as an addendum to the NOTICE text from the Work, provided
          that such additional attribution notices cannot be construed
          as modifying the License.

      You may add Your own copyright statement to Your modifications and
      may provide additional or different license terms and conditions
      for use, reproduction, or distribution of Your modifications, or
      for any such Derivative Works as a whole, provided Your use,
      reproduction, and distribution of the Work otherwise complies with
      the conditions stated in this License.

   5. Submission of Contributions. Unless You explicitly state otherwise,
      any Contribution intentionally submitted for inclusion in the Work
      by You to the Licensor shall be under the terms and conditions of
      this License, without any additional terms or conditions.
      Notwithstanding the above, nothing herein shall supersede or modify
      the terms of any separate license agreement you may have executed
      with Licensor regarding such Contributions.

   6. Trademarks. This License does not grant permission to use the trade
      names, trademarks, service marks, or product names of the Licensor,
      except as required for reasonable and customary use in describing the
      origin of the Work and reproducing the content of the NOTICE file.

   7. Disclaimer of Warranty. Unless required by applicable law or
      agreed to in writing, Licensor provides the Work (and each
      Contributor provides its Contributions) on an &quot;AS IS&quot; BASIS,
      WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
      implied, including, without limitation, any warranties or conditions
      of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
      PARTICULAR PURPOSE. You are solely responsible for determining the
      appropriateness of using or redistributing the Work and assume any
      risks associated with Your exercise of permissions under this License.

   8. Limitation of Liability. In no event and under no legal theory,
      whether in tort (including negligence), contract, or otherwise,
      unless required by applicable law (such as deliberate and grossly
      negligent acts) or agreed to in writing, shall any Contributor be
      liable to You for damages, including any direct, indirect, special,
      incidental, or consequential damages of any character arising as a
      result of this License or out of the use or inability to use the
      Work (including but not limited to damages for loss of goodwill,
      work stoppage, computer failure or malfunction, or any and all
      other commercial damages or losses), even if such Contributor
      has been advised of the possibility of such damages.

   9. Accepting Warranty or Additional Liability. While redistributing
      the Work or Derivative Works thereof, You may choose to offer,
      and charge a fee for, acceptance of support, warranty, indemnity,
      or other liability obligations and/or rights consistent with this
      License. However, in accepting such obligations, You may act only
      on Your own behalf and on Your sole responsibility, not on behalf
      of any other Contributor, and only if You agree to indemnify,
      defend, and hold each Contributor harmless for any liability
      incurred by, or claims asserted against, such Contributor by reason
      of your accepting any such warranty or additional liability.

   END OF TERMS AND CONDITIONS

   APPENDIX: How to apply the Apache License to your work.

      To apply the Apache License to your work, attach the following
      boilerplate notice, with the fields enclosed by brackets &quot;[]&quot;
      replaced with your own identifying information. (Don&#x27;t include
      the brackets!)  The text should be enclosed in the appropriate
      comment syntax for the file format. We also recommend that a
      file or class name and description of purpose be included on the
      same &quot;printed page&quot; as the copyright notice for easier
      identification within third-party archives.

   Copyright 2022 Jacob Pratt et al.

   Licensed under the Apache License, Version 2.0 (the &quot;License&quot;);
   you may not use this file except in compliance with the License.
   You may obtain a copy of the License at

       http://www.apache.org/licenses/LICENSE-2.0

   Unless required by applicable law or agreed to in writing, software
   distributed under the License is distributed on an &quot;AS IS&quot; BASIS,
   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
   See the License for the specific language governing permissions and
   limitations under the License.
</pre>
            </li>
            <li class="license">
                <h3 id="Apache-2.0">Apache License 2.0</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/jhpratt/num-conv ">num-conv 0.1.0</a></li>
                </ul>
                <pre class="license-text">
                                 Apache License
                           Version 2.0, January 2004
                        http://www.apache.org/licenses/

   TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION

   1. Definitions.

      &quot;License&quot; shall mean the terms and conditions for use, reproduction,
      and distribution as defined by Sections 1 through 9 of this document.

      &quot;Licensor&quot; shall mean the copyright owner or entity authorized by
      the copyright owner that is granting the License.

      &quot;Legal Entity&quot; shall mean the union of the acting entity and all
      other entities that control, are controlled by, or are under common
      control with that entity. For the purposes of this definition,
      &quot;control&quot; means (i) the power, direct or indirect, to cause the
      direction or management of such entity, whether by contract or
      otherwise, or (ii) ownership of fifty percent (50%) or more of the
      outstanding shares, or (iii) beneficial ownership of such entity.

      &quot;You&quot; (or &quot;Your&quot;) shall mean an individual or Legal Entity
      exercising permissions granted by this License.

      &quot;Source&quot; form shall mean the preferred form for making modifications,
      including but not limited to software source code, documentation
      source, and configuration files.

      &quot;Object&quot; form shall mean any form resulting from mechanical
      transformation or translation of a Source form, including but
      not limited to compiled object code, generated documentation,
      and conversions to other media types.

      &quot;Work&quot; shall mean the work of authorship, whether in Source or
      Object form, made available under the License, as indicated by a
      copyright notice that is included in or attached to the work
      (an example is provided in the Appendix below).

      &quot;Derivative Works&quot; shall mean any work, whether in Source or Object
      form, that is based on (or derived from) the Work and for which the
      editorial revisions, annotations, elaborations, or other modifications
      represent, as a whole, an original work of authorship. For the purposes
      of this License, Derivative Works shall not include works that remain
      separable from, or merely link (or bind by name) to the interfaces of,
      the Work and Derivative Works thereof.

      &quot;Contribution&quot; shall mean any work of authorship, including
      the original version of the Work and any modifications or additions
      to that Work or Derivative Works thereof, that is intentionally
      submitted to Licensor for inclusion in the Work by the copyright owner
      or by an individual or Legal Entity authorized to submit on behalf of
      the copyright owner. For the purposes of this definition, &quot;submitted&quot;
      means any form of electronic, verbal, or written communication sent
      to the Licensor or its representatives, including but not limited to
      communication on electronic mailing lists, source code control systems,
      and issue tracking systems that are managed by, or on behalf of, the
      Licensor for the purpose of discussing and improving the Work, but
      excluding communication that is conspicuously marked or otherwise
      designated in writing by the copyright owner as &quot;Not a Contribution.&quot;

      &quot;Contributor&quot; shall mean Licensor and any individual or Legal Entity
      on behalf of whom a Contribution has been received by Licensor and
      subsequently incorporated within the Work.

   2. Grant of Copyright License. Subject to the terms and conditions of
      this License, each Contributor hereby grants to You a perpetual,
      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
      copyright license to reproduce, prepare Derivative Works of,
      publicly display, publicly perform, sublicense, and distribute the
      Work and such Derivative Works in Source or Object form.

   3. Grant of Patent License. Subject to the terms and conditions of
      this License, each Contributor hereby grants to You a perpetual,
      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
      (except as stated in this section) patent license to make, have made,
      use, offer to sell, sell, import, and otherwise transfer the Work,
      where such license applies only to those patent claims licensable
      by such Contributor that are necessarily infringed by their
      Contribution(s) alone or by combination of their Contribution(s)
      with the Work to which such Contribution(s) was submitted. If You
      institute patent litigation against any entity (including a
      cross-claim or counterclaim in a lawsuit) alleging that the Work
      or a Contribution incorporated within the Work constitutes direct
      or contributory patent infringement, then any patent licenses
      granted to You under this License for that Work shall terminate
      as of the date such litigation is filed.

   4. Redistribution. You may reproduce and distribute copies of the
      Work or Derivative Works thereof in any medium, with or without
      modifications, and in Source or Object form, provided that You
      meet the following conditions:

      (a) You must give any other recipients of the Work or
          Derivative Works a copy of this License; and

      (b) You must cause any modified files to carry prominent notices
          stating that You changed the files; and

      (c) You must retain, in the Source form of any Derivative Works
          that You distribute, all copyright, patent, trademark, and
          attribution notices from the Source form of the Work,
          excluding those notices that do not pertain to any part of
          the Derivative Works; and

      (d) If the Work includes a &quot;NOTICE&quot; text file as part of its
          distribution, then any Derivative Works that You distribute must
          include a readable copy of the attribution notices contained
          within such NOTICE file, excluding those notices that do not
          pertain to any part of the Derivative Works, in at least one
          of the following places: within a NOTICE text file distributed
          as part of the Derivative Works; within the Source form or
          documentation, if provided along with the Derivative Works; or,
          within a display generated by the Derivative Works, if and
          wherever such third-party notices normally appear. The contents
          of the NOTICE file are for informational purposes only and
          do not modify the License. You may add Your own attribution
          notices within Derivative Works that You distribute, alongside
          or as an addendum to the NOTICE text from the Work, provided
          that such additional attribution notices cannot be construed
          as modifying the License.

      You may add Your own copyright statement to Your modifications and
      may provide additional or different license terms and conditions
      for use, reproduction, or distribution of Your modifications, or
      for any such Derivative Works as a whole, provided Your use,
      reproduction, and distribution of the Work otherwise complies with
      the conditions stated in this License.

   5. Submission of Contributions. Unless You explicitly state otherwise,
      any Contribution intentionally submitted for inclusion in the Work
      by You to the Licensor shall be under the terms and conditions of
      this License, without any additional terms or conditions.
      Notwithstanding the above, nothing herein shall supersede or modify
      the terms of any separate license agreement you may have executed
      with Licensor regarding such Contributions.

   6. Trademarks. This License does not grant permission to use the trade
      names, trademarks, service marks, or product names of the Licensor,
      except as required for reasonable and customary use in describing the
      origin of the Work and reproducing the content of the NOTICE file.

   7. Disclaimer of Warranty. Unless required by applicable law or
      agreed to in writing, Licensor provides the Work (and each
      Contributor provides its Contributions) on an &quot;AS IS&quot; BASIS,
      WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
      implied, including, without limitation, any warranties or conditions
      of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
      PARTICULAR PURPOSE. You are solely responsible for determining the
      appropriateness of using or redistributing the Work and assume any
      risks associated with Your exercise of permissions under this License.

   8. Limitation of Liability. In no event and under no legal theory,
      whether in tort (including negligence), contract, or otherwise,
      unless required by applicable law (such as deliberate and grossly
      negligent acts) or agreed to in writing, shall any Contributor be
      liable to You for damages, including any direct, indirect, special,
      incidental, or consequential damages of any character arising as a
      result of this License or out of the use or inability to use the
      Work (including but not limited to damages for loss of goodwill,
      work stoppage, computer failure or malfunction, or any and all
      other commercial damages or losses), even if such Contributor
      has been advised of the possibility of such damages.

   9. Accepting Warranty or Additional Liability. While redistributing
      the Work or Derivative Works thereof, You may choose to offer,
      and charge a fee for, acceptance of support, warranty, indemnity,
      or other liability obligations and/or rights consistent with this
      License. However, in accepting such obligations, You may act only
      on Your own behalf and on Your sole responsibility, not on behalf
      of any other Contributor, and only if You agree to indemnify,
      defend, and hold each Contributor harmless for any liability
      incurred by, or claims asserted against, such Contributor by reason
      of your accepting any such warranty or additional liability.

   END OF TERMS AND CONDITIONS

   APPENDIX: How to apply the Apache License to your work.

      To apply the Apache License to your work, attach the following
      boilerplate notice, with the fields enclosed by brackets &quot;[]&quot;
      replaced with your own identifying information. (Don&#x27;t include
      the brackets!)  The text should be enclosed in the appropriate
      comment syntax for the file format. We also recommend that a
      file or class name and description of purpose be included on the
      same &quot;printed page&quot; as the copyright notice for easier
      identification within third-party archives.

   Copyright 2023 Jacob Pratt

   Licensed under the Apache License, Version 2.0 (the &quot;License&quot;);
   you may not use this file except in compliance with the License.
   You may obtain a copy of the License at

       http://www.apache.org/licenses/LICENSE-2.0

   Unless required by applicable law or agreed to in writing, software
   distributed under the License is distributed on an &quot;AS IS&quot; BASIS,
   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
   See the License for the specific language governing permissions and
   limitations under the License.
</pre>
            </li>
            <li class="license">
                <h3 id="Apache-2.0">Apache License 2.0</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/jhpratt/powerfmt ">powerfmt 0.2.0</a></li>
                </ul>
                <pre class="license-text">
                                 Apache License
                           Version 2.0, January 2004
                        http://www.apache.org/licenses/

   TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION

   1. Definitions.

      &quot;License&quot; shall mean the terms and conditions for use, reproduction,
      and distribution as defined by Sections 1 through 9 of this document.

      &quot;Licensor&quot; shall mean the copyright owner or entity authorized by
      the copyright owner that is granting the License.

      &quot;Legal Entity&quot; shall mean the union of the acting entity and all
      other entities that control, are controlled by, or are under common
      control with that entity. For the purposes of this definition,
      &quot;control&quot; means (i) the power, direct or indirect, to cause the
      direction or management of such entity, whether by contract or
      otherwise, or (ii) ownership of fifty percent (50%) or more of the
      outstanding shares, or (iii) beneficial ownership of such entity.

      &quot;You&quot; (or &quot;Your&quot;) shall mean an individual or Legal Entity
      exercising permissions granted by this License.

      &quot;Source&quot; form shall mean the preferred form for making modifications,
      including but not limited to software source code, documentation
      source, and configuration files.

      &quot;Object&quot; form shall mean any form resulting from mechanical
      transformation or translation of a Source form, including but
      not limited to compiled object code, generated documentation,
      and conversions to other media types.

      &quot;Work&quot; shall mean the work of authorship, whether in Source or
      Object form, made available under the License, as indicated by a
      copyright notice that is included in or attached to the work
      (an example is provided in the Appendix below).

      &quot;Derivative Works&quot; shall mean any work, whether in Source or Object
      form, that is based on (or derived from) the Work and for which the
      editorial revisions, annotations, elaborations, or other modifications
      represent, as a whole, an original work of authorship. For the purposes
      of this License, Derivative Works shall not include works that remain
      separable from, or merely link (or bind by name) to the interfaces of,
      the Work and Derivative Works thereof.

      &quot;Contribution&quot; shall mean any work of authorship, including
      the original version of the Work and any modifications or additions
      to that Work or Derivative Works thereof, that is intentionally
      submitted to Licensor for inclusion in the Work by the copyright owner
      or by an individual or Legal Entity authorized to submit on behalf of
      the copyright owner. For the purposes of this definition, &quot;submitted&quot;
      means any form of electronic, verbal, or written communication sent
      to the Licensor or its representatives, including but not limited to
      communication on electronic mailing lists, source code control systems,
      and issue tracking systems that are managed by, or on behalf of, the
      Licensor for the purpose of discussing and improving the Work, but
      excluding communication that is conspicuously marked or otherwise
      designated in writing by the copyright owner as &quot;Not a Contribution.&quot;

      &quot;Contributor&quot; shall mean Licensor and any individual or Legal Entity
      on behalf of whom a Contribution has been received by Licensor and
      subsequently incorporated within the Work.

   2. Grant of Copyright License. Subject to the terms and conditions of
      this License, each Contributor hereby grants to You a perpetual,
      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
      copyright license to reproduce, prepare Derivative Works of,
      publicly display, publicly perform, sublicense, and distribute the
      Work and such Derivative Works in Source or Object form.

   3. Grant of Patent License. Subject to the terms and conditions of
      this License, each Contributor hereby grants to You a perpetual,
      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
      (except as stated in this section) patent license to make, have made,
      use, offer to sell, sell, import, and otherwise transfer the Work,
      where such license applies only to those patent claims licensable
      by such Contributor that are necessarily infringed by their
      Contribution(s) alone or by combination of their Contribution(s)
      with the Work to which such Contribution(s) was submitted. If You
      institute patent litigation against any entity (including a
      cross-claim or counterclaim in a lawsuit) alleging that the Work
      or a Contribution incorporated within the Work constitutes direct
      or contributory patent infringement, then any patent licenses
      granted to You under this License for that Work shall terminate
      as of the date such litigation is filed.

   4. Redistribution. You may reproduce and distribute copies of the
      Work or Derivative Works thereof in any medium, with or without
      modifications, and in Source or Object form, provided that You
      meet the following conditions:

      (a) You must give any other recipients of the Work or
          Derivative Works a copy of this License; and

      (b) You must cause any modified files to carry prominent notices
          stating that You changed the files; and

      (c) You must retain, in the Source form of any Derivative Works
          that You distribute, all copyright, patent, trademark, and
          attribution notices from the Source form of the Work,
          excluding those notices that do not pertain to any part of
          the Derivative Works; and

      (d) If the Work includes a &quot;NOTICE&quot; text file as part of its
          distribution, then any Derivative Works that You distribute must
          include a readable copy of the attribution notices contained
          within such NOTICE file, excluding those notices that do not
          pertain to any part of the Derivative Works, in at least one
          of the following places: within a NOTICE text file distributed
          as part of the Derivative Works; within the Source form or
          documentation, if provided along with the Derivative Works; or,
          within a display generated by the Derivative Works, if and
          wherever such third-party notices normally appear. The contents
          of the NOTICE file are for informational purposes only and
          do not modify the License. You may add Your own attribution
          notices within Derivative Works that You distribute, alongside
          or as an addendum to the NOTICE text from the Work, provided
          that such additional attribution notices cannot be construed
          as modifying the License.

      You may add Your own copyright statement to Your modifications and
      may provide additional or different license terms and conditions
      for use, reproduction, or distribution of Your modifications, or
      for any such Derivative Works as a whole, provided Your use,
      reproduction, and distribution of the Work otherwise complies with
      the conditions stated in this License.

   5. Submission of Contributions. Unless You explicitly state otherwise,
      any Contribution intentionally submitted for inclusion in the Work
      by You to the Licensor shall be under the terms and conditions of
      this License, without any additional terms or conditions.
      Notwithstanding the above, nothing herein shall supersede or modify
      the terms of any separate license agreement you may have executed
      with Licensor regarding such Contributions.

   6. Trademarks. This License does not grant permission to use the trade
      names, trademarks, service marks, or product names of the Licensor,
      except as required for reasonable and customary use in describing the
      origin of the Work and reproducing the content of the NOTICE file.

   7. Disclaimer of Warranty. Unless required by applicable law or
      agreed to in writing, Licensor provides the Work (and each
      Contributor provides its Contributions) on an &quot;AS IS&quot; BASIS,
      WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
      implied, including, without limitation, any warranties or conditions
      of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
      PARTICULAR PURPOSE. You are solely responsible for determining the
      appropriateness of using or redistributing the Work and assume any
      risks associated with Your exercise of permissions under this License.

   8. Limitation of Liability. In no event and under no legal theory,
      whether in tort (including negligence), contract, or otherwise,
      unless required by applicable law (such as deliberate and grossly
      negligent acts) or agreed to in writing, shall any Contributor be
      liable to You for damages, including any direct, indirect, special,
      incidental, or consequential damages of any character arising as a
      result of this License or out of the use or inability to use the
      Work (including but not limited to damages for loss of goodwill,
      work stoppage, computer failure or malfunction, or any and all
      other commercial damages or losses), even if such Contributor
      has been advised of the possibility of such damages.

   9. Accepting Warranty or Additional Liability. While redistributing
      the Work or Derivative Works thereof, You may choose to offer,
      and charge a fee for, acceptance of support, warranty, indemnity,
      or other liability obligations and/or rights consistent with this
      License. However, in accepting such obligations, You may act only
      on Your own behalf and on Your sole responsibility, not on behalf
      of any other Contributor, and only if You agree to indemnify,
      defend, and hold each Contributor harmless for any liability
      incurred by, or claims asserted against, such Contributor by reason
      of your accepting any such warranty or additional liability.

   END OF TERMS AND CONDITIONS

   APPENDIX: How to apply the Apache License to your work.

      To apply the Apache License to your work, attach the following
      boilerplate notice, with the fields enclosed by brackets &quot;[]&quot;
      replaced with your own identifying information. (Don&#x27;t include
      the brackets!)  The text should be enclosed in the appropriate
      comment syntax for the file format. We also recommend that a
      file or class name and description of purpose be included on the
      same &quot;printed page&quot; as the copyright notice for easier
      identification within third-party archives.

   Copyright 2023 Jacob Pratt et al.

   Licensed under the Apache License, Version 2.0 (the &quot;License&quot;);
   you may not use this file except in compliance with the License.
   You may obtain a copy of the License at

       http://www.apache.org/licenses/LICENSE-2.0

   Unless required by applicable law or agreed to in writing, software
   distributed under the License is distributed on an &quot;AS IS&quot; BASIS,
   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
   See the License for the specific language governing permissions and
   limitations under the License.
</pre>
            </li>
            <li class="license">
                <h3 id="Apache-2.0">Apache License 2.0</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/time-rs/time ">time-macros 0.2.18</a></li>
                    <li><a href=" https://github.com/time-rs/time ">time 0.3.36</a></li>
                </ul>
                <pre class="license-text">
                                 Apache License
                           Version 2.0, January 2004
                        http://www.apache.org/licenses/

   TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION

   1. Definitions.

      &quot;License&quot; shall mean the terms and conditions for use, reproduction,
      and distribution as defined by Sections 1 through 9 of this document.

      &quot;Licensor&quot; shall mean the copyright owner or entity authorized by
      the copyright owner that is granting the License.

      &quot;Legal Entity&quot; shall mean the union of the acting entity and all
      other entities that control, are controlled by, or are under common
      control with that entity. For the purposes of this definition,
      &quot;control&quot; means (i) the power, direct or indirect, to cause the
      direction or management of such entity, whether by contract or
      otherwise, or (ii) ownership of fifty percent (50%) or more of the
      outstanding shares, or (iii) beneficial ownership of such entity.

      &quot;You&quot; (or &quot;Your&quot;) shall mean an individual or Legal Entity
      exercising permissions granted by this License.

      &quot;Source&quot; form shall mean the preferred form for making modifications,
      including but not limited to software source code, documentation
      source, and configuration files.

      &quot;Object&quot; form shall mean any form resulting from mechanical
      transformation or translation of a Source form, including but
      not limited to compiled object code, generated documentation,
      and conversions to other media types.

      &quot;Work&quot; shall mean the work of authorship, whether in Source or
      Object form, made available under the License, as indicated by a
      copyright notice that is included in or attached to the work
      (an example is provided in the Appendix below).

      &quot;Derivative Works&quot; shall mean any work, whether in Source or Object
      form, that is based on (or derived from) the Work and for which the
      editorial revisions, annotations, elaborations, or other modifications
      represent, as a whole, an original work of authorship. For the purposes
      of this License, Derivative Works shall not include works that remain
      separable from, or merely link (or bind by name) to the interfaces of,
      the Work and Derivative Works thereof.

      &quot;Contribution&quot; shall mean any work of authorship, including
      the original version of the Work and any modifications or additions
      to that Work or Derivative Works thereof, that is intentionally
      submitted to Licensor for inclusion in the Work by the copyright owner
      or by an individual or Legal Entity authorized to submit on behalf of
      the copyright owner. For the purposes of this definition, &quot;submitted&quot;
      means any form of electronic, verbal, or written communication sent
      to the Licensor or its representatives, including but not limited to
      communication on electronic mailing lists, source code control systems,
      and issue tracking systems that are managed by, or on behalf of, the
      Licensor for the purpose of discussing and improving the Work, but
      excluding communication that is conspicuously marked or otherwise
      designated in writing by the copyright owner as &quot;Not a Contribution.&quot;

      &quot;Contributor&quot; shall mean Licensor and any individual or Legal Entity
      on behalf of whom a Contribution has been received by Licensor and
      subsequently incorporated within the Work.

   2. Grant of Copyright License. Subject to the terms and conditions of
      this License, each Contributor hereby grants to You a perpetual,
      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
      copyright license to reproduce, prepare Derivative Works of,
      publicly display, publicly perform, sublicense, and distribute the
      Work and such Derivative Works in Source or Object form.

   3. Grant of Patent License. Subject to the terms and conditions of
      this License, each Contributor hereby grants to You a perpetual,
      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
      (except as stated in this section) patent license to make, have made,
      use, offer to sell, sell, import, and otherwise transfer the Work,
      where such license applies only to those patent claims licensable
      by such Contributor that are necessarily infringed by their
      Contribution(s) alone or by combination of their Contribution(s)
      with the Work to which such Contribution(s) was submitted. If You
      institute patent litigation against any entity (including a
      cross-claim or counterclaim in a lawsuit) alleging that the Work
      or a Contribution incorporated within the Work constitutes direct
      or contributory patent infringement, then any patent licenses
      granted to You under this License for that Work shall terminate
      as of the date such litigation is filed.

   4. Redistribution. You may reproduce and distribute copies of the
      Work or Derivative Works thereof in any medium, with or without
      modifications, and in Source or Object form, provided that You
      meet the following conditions:

      (a) You must give any other recipients of the Work or
          Derivative Works a copy of this License; and

      (b) You must cause any modified files to carry prominent notices
          stating that You changed the files; and

      (c) You must retain, in the Source form of any Derivative Works
          that You distribute, all copyright, patent, trademark, and
          attribution notices from the Source form of the Work,
          excluding those notices that do not pertain to any part of
          the Derivative Works; and

      (d) If the Work includes a &quot;NOTICE&quot; text file as part of its
          distribution, then any Derivative Works that You distribute must
          include a readable copy of the attribution notices contained
          within such NOTICE file, excluding those notices that do not
          pertain to any part of the Derivative Works, in at least one
          of the following places: within a NOTICE text file distributed
          as part of the Derivative Works; within the Source form or
          documentation, if provided along with the Derivative Works; or,
          within a display generated by the Derivative Works, if and
          wherever such third-party notices normally appear. The contents
          of the NOTICE file are for informational purposes only and
          do not modify the License. You may add Your own attribution
          notices within Derivative Works that You distribute, alongside
          or as an addendum to the NOTICE text from the Work, provided
          that such additional attribution notices cannot be construed
          as modifying the License.

      You may add Your own copyright statement to Your modifications and
      may provide additional or different license terms and conditions
      for use, reproduction, or distribution of Your modifications, or
      for any such Derivative Works as a whole, provided Your use,
      reproduction, and distribution of the Work otherwise complies with
      the conditions stated in this License.

   5. Submission of Contributions. Unless You explicitly state otherwise,
      any Contribution intentionally submitted for inclusion in the Work
      by You to the Licensor shall be under the terms and conditions of
      this License, without any additional terms or conditions.
      Notwithstanding the above, nothing herein shall supersede or modify
      the terms of any separate license agreement you may have executed
      with Licensor regarding such Contributions.

   6. Trademarks. This License does not grant permission to use the trade
      names, trademarks, service marks, or product names of the Licensor,
      except as required for reasonable and customary use in describing the
      origin of the Work and reproducing the content of the NOTICE file.

   7. Disclaimer of Warranty. Unless required by applicable law or
      agreed to in writing, Licensor provides the Work (and each
      Contributor provides its Contributions) on an &quot;AS IS&quot; BASIS,
      WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
      implied, including, without limitation, any warranties or conditions
      of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
      PARTICULAR PURPOSE. You are solely responsible for determining the
      appropriateness of using or redistributing the Work and assume any
      risks associated with Your exercise of permissions under this License.

   8. Limitation of Liability. In no event and under no legal theory,
      whether in tort (including negligence), contract, or otherwise,
      unless required by applicable law (such as deliberate and grossly
      negligent acts) or agreed to in writing, shall any Contributor be
      liable to You for damages, including any direct, indirect, special,
      incidental, or consequential damages of any character arising as a
      result of this License or out of the use or inability to use the
      Work (including but not limited to damages for loss of goodwill,
      work stoppage, computer failure or malfunction, or any and all
      other commercial damages or losses), even if such Contributor
      has been advised of the possibility of such damages.

   9. Accepting Warranty or Additional Liability. While redistributing
      the Work or Derivative Works thereof, You may choose to offer,
      and charge a fee for, acceptance of support, warranty, indemnity,
      or other liability obligations and/or rights consistent with this
      License. However, in accepting such obligations, You may act only
      on Your own behalf and on Your sole responsibility, not on behalf
      of any other Contributor, and only if You agree to indemnify,
      defend, and hold each Contributor harmless for any liability
      incurred by, or claims asserted against, such Contributor by reason
      of your accepting any such warranty or additional liability.

   END OF TERMS AND CONDITIONS

   APPENDIX: How to apply the Apache License to your work.

      To apply the Apache License to your work, attach the following
      boilerplate notice, with the fields enclosed by brackets &quot;[]&quot;
      replaced with your own identifying information. (Don&#x27;t include
      the brackets!)  The text should be enclosed in the appropriate
      comment syntax for the file format. We also recommend that a
      file or class name and description of purpose be included on the
      same &quot;printed page&quot; as the copyright notice for easier
      identification within third-party archives.

   Copyright 2024 Jacob Pratt et al.

   Licensed under the Apache License, Version 2.0 (the &quot;License&quot;);
   you may not use this file except in compliance with the License.
   You may obtain a copy of the License at

       http://www.apache.org/licenses/LICENSE-2.0

   Unless required by applicable law or agreed to in writing, software
   distributed under the License is distributed on an &quot;AS IS&quot; BASIS,
   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
   See the License for the specific language governing permissions and
   limitations under the License.
</pre>
            </li>
            <li class="license">
                <h3 id="Apache-2.0">Apache License 2.0</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/smithy-lang/smithy-rs ">aws-sigv4 1.2.4</a></li>
                    <li><a href=" https://github.com/tormol/encode_unicode ">encode_unicode 0.3.6</a></li>
                    <li><a href=" https://github.com/hsivonen/encoding_rs ">encoding_rs 0.8.32</a></li>
                    <li><a href=" https://github.com/mitsuhiko/fragile ">fragile 2.0.0</a></li>
                    <li><a href=" https://github.com/nvzqz/static-assertions-rs ">static_assertions 1.1.0</a></li>
                    <li><a href=" https://github.com/Lokathor/tinyvec ">tinyvec 1.8.0</a></li>
                    <li><a href=" https://github.com/RustCrypto/utils/tree/master/zeroize ">zeroize 1.8.1</a></li>
                </ul>
                <pre class="license-text">
                                 Apache License
                           Version 2.0, January 2004
                        http://www.apache.org/licenses/

   TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION

   1. Definitions.

      &quot;License&quot; shall mean the terms and conditions for use, reproduction,
      and distribution as defined by Sections 1 through 9 of this document.

      &quot;Licensor&quot; shall mean the copyright owner or entity authorized by
      the copyright owner that is granting the License.

      &quot;Legal Entity&quot; shall mean the union of the acting entity and all
      other entities that control, are controlled by, or are under common
      control with that entity. For the purposes of this definition,
      &quot;control&quot; means (i) the power, direct or indirect, to cause the
      direction or management of such entity, whether by contract or
      otherwise, or (ii) ownership of fifty percent (50%) or more of the
      outstanding shares, or (iii) beneficial ownership of such entity.

      &quot;You&quot; (or &quot;Your&quot;) shall mean an individual or Legal Entity
      exercising permissions granted by this License.

      &quot;Source&quot; form shall mean the preferred form for making modifications,
      including but not limited to software source code, documentation
      source, and configuration files.

      &quot;Object&quot; form shall mean any form resulting from mechanical
      transformation or translation of a Source form, including but
      not limited to compiled object code, generated documentation,
      and conversions to other media types.

      &quot;Work&quot; shall mean the work of authorship, whether in Source or
      Object form, made available under the License, as indicated by a
      copyright notice that is included in or attached to the work
      (an example is provided in the Appendix below).

      &quot;Derivative Works&quot; shall mean any work, whether in Source or Object
      form, that is based on (or derived from) the Work and for which the
      editorial revisions, annotations, elaborations, or other modifications
      represent, as a whole, an original work of authorship. For the purposes
      of this License, Derivative Works shall not include works that remain
      separable from, or merely link (or bind by name) to the interfaces of,
      the Work and Derivative Works thereof.

      &quot;Contribution&quot; shall mean any work of authorship, including
      the original version of the Work and any modifications or additions
      to that Work or Derivative Works thereof, that is intentionally
      submitted to Licensor for inclusion in the Work by the copyright owner
      or by an individual or Legal Entity authorized to submit on behalf of
      the copyright owner. For the purposes of this definition, &quot;submitted&quot;
      means any form of electronic, verbal, or written communication sent
      to the Licensor or its representatives, including but not limited to
      communication on electronic mailing lists, source code control systems,
      and issue tracking systems that are managed by, or on behalf of, the
      Licensor for the purpose of discussing and improving the Work, but
      excluding communication that is conspicuously marked or otherwise
      designated in writing by the copyright owner as &quot;Not a Contribution.&quot;

      &quot;Contributor&quot; shall mean Licensor and any individual or Legal Entity
      on behalf of whom a Contribution has been received by Licensor and
      subsequently incorporated within the Work.

   2. Grant of Copyright License. Subject to the terms and conditions of
      this License, each Contributor hereby grants to You a perpetual,
      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
      copyright license to reproduce, prepare Derivative Works of,
      publicly display, publicly perform, sublicense, and distribute the
      Work and such Derivative Works in Source or Object form.

   3. Grant of Patent License. Subject to the terms and conditions of
      this License, each Contributor hereby grants to You a perpetual,
      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
      (except as stated in this section) patent license to make, have made,
      use, offer to sell, sell, import, and otherwise transfer the Work,
      where such license applies only to those patent claims licensable
      by such Contributor that are necessarily infringed by their
      Contribution(s) alone or by combination of their Contribution(s)
      with the Work to which such Contribution(s) was submitted. If You
      institute patent litigation against any entity (including a
      cross-claim or counterclaim in a lawsuit) alleging that the Work
      or a Contribution incorporated within the Work constitutes direct
      or contributory patent infringement, then any patent licenses
      granted to You under this License for that Work shall terminate
      as of the date such litigation is filed.

   4. Redistribution. You may reproduce and distribute copies of the
      Work or Derivative Works thereof in any medium, with or without
      modifications, and in Source or Object form, provided that You
      meet the following conditions:

      (a) You must give any other recipients of the Work or
          Derivative Works a copy of this License; and

      (b) You must cause any modified files to carry prominent notices
          stating that You changed the files; and

      (c) You must retain, in the Source form of any Derivative Works
          that You distribute, all copyright, patent, trademark, and
          attribution notices from the Source form of the Work,
          excluding those notices that do not pertain to any part of
          the Derivative Works; and

      (d) If the Work includes a &quot;NOTICE&quot; text file as part of its
          distribution, then any Derivative Works that You distribute must
          include a readable copy of the attribution notices contained
          within such NOTICE file, excluding those notices that do not
          pertain to any part of the Derivative Works, in at least one
          of the following places: within a NOTICE text file distributed
          as part of the Derivative Works; within the Source form or
          documentation, if provided along with the Derivative Works; or,
          within a display generated by the Derivative Works, if and
          wherever such third-party notices normally appear. The contents
          of the NOTICE file are for informational purposes only and
          do not modify the License. You may add Your own attribution
          notices within Derivative Works that You distribute, alongside
          or as an addendum to the NOTICE text from the Work, provided
          that such additional attribution notices cannot be construed
          as modifying the License.

      You may add Your own copyright statement to Your modifications and
      may provide additional or different license terms and conditions
      for use, reproduction, or distribution of Your modifications, or
      for any such Derivative Works as a whole, provided Your use,
      reproduction, and distribution of the Work otherwise complies with
      the conditions stated in this License.

   5. Submission of Contributions. Unless You explicitly state otherwise,
      any Contribution intentionally submitted for inclusion in the Work
      by You to the Licensor shall be under the terms and conditions of
      this License, without any additional terms or conditions.
      Notwithstanding the above, nothing herein shall supersede or modify
      the terms of any separate license agreement you may have executed
      with Licensor regarding such Contributions.

   6. Trademarks. This License does not grant permission to use the trade
      names, trademarks, service marks, or product names of the Licensor,
      except as required for reasonable and customary use in describing the
      origin of the Work and reproducing the content of the NOTICE file.

   7. Disclaimer of Warranty. Unless required by applicable law or
      agreed to in writing, Licensor provides the Work (and each
      Contributor provides its Contributions) on an &quot;AS IS&quot; BASIS,
      WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
      implied, including, without limitation, any warranties or conditions
      of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
      PARTICULAR PURPOSE. You are solely responsible for determining the
      appropriateness of using or redistributing the Work and assume any
      risks associated with Your exercise of permissions under this License.

   8. Limitation of Liability. In no event and under no legal theory,
      whether in tort (including negligence), contract, or otherwise,
      unless required by applicable law (such as deliberate and grossly
      negligent acts) or agreed to in writing, shall any Contributor be
      liable to You for damages, including any direct, indirect, special,
      incidental, or consequential damages of any character arising as a
      result of this License or out of the use or inability to use the
      Work (including but not limited to damages for loss of goodwill,
      work stoppage, computer failure or malfunction, or any and all
      other commercial damages or losses), even if such Contributor
      has been advised of the possibility of such damages.

   9. Accepting Warranty or Additional Liability. While redistributing
      the Work or Derivative Works thereof, You may choose to offer,
      and charge a fee for, acceptance of support, warranty, indemnity,
      or other liability obligations and/or rights consistent with this
      License. However, in accepting such obligations, You may act only
      on Your own behalf and on Your sole responsibility, not on behalf
      of any other Contributor, and only if You agree to indemnify,
      defend, and hold each Contributor harmless for any liability
      incurred by, or claims asserted against, such Contributor by reason
      of your accepting any such warranty or additional liability.

   END OF TERMS AND CONDITIONS

   APPENDIX: How to apply the Apache License to your work.

      To apply the Apache License to your work, attach the following
      boilerplate notice, with the fields enclosed by brackets &quot;[]&quot;
      replaced with your own identifying information. (Don&#x27;t include
      the brackets!)  The text should be enclosed in the appropriate
      comment syntax for the file format. We also recommend that a
      file or class name and description of purpose be included on the
      same &quot;printed page&quot; as the copyright notice for easier
      identification within third-party archives.

   Copyright [yyyy] [name of copyright owner]

   Licensed under the Apache License, Version 2.0 (the &quot;License&quot;);
   you may not use this file except in compliance with the License.
   You may obtain a copy of the License at

       http://www.apache.org/licenses/LICENSE-2.0

   Unless required by applicable law or agreed to in writing, software
   distributed under the License is distributed on an &quot;AS IS&quot; BASIS,
   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
   See the License for the specific language governing permissions and
   limitations under the License.
</pre>
            </li>
            <li class="license">
                <h3 id="Apache-2.0">Apache License 2.0</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/wvwwvwwv/scalable-delayed-dealloc/ ">sdd 3.0.3</a></li>
                </ul>
                <pre class="license-text">                                 Apache License
                           Version 2.0, April 2004
                        http://www.apache.org/licenses/

   TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION

   1. Definitions.

      &quot;License&quot; shall mean the terms and conditions for use, reproduction,
      and distribution as defined by Sections 1 through 9 of this document.

      &quot;Licensor&quot; shall mean the copyright owner or entity authorized by
      the copyright owner that is granting the License.

      &quot;Legal Entity&quot; shall mean the union of the acting entity and all
      other entities that control, are controlled by, or are under common
      control with that entity. For the purposes of this definition,
      &quot;control&quot; means (i) the power, direct or indirect, to cause the
      direction or management of such entity, whether by contract or
      otherwise, or (ii) ownership of fifty percent (50%) or more of the
      outstanding shares, or (iii) beneficial ownership of such entity.

      &quot;You&quot; (or &quot;Your&quot;) shall mean an individual or Legal Entity
      exercising permissions granted by this License.

      &quot;Source&quot; form shall mean the preferred form for making modifications,
      including but not limited to software source code, documentation
      source, and configuration files.

      &quot;Object&quot; form shall mean any form resulting from mechanical
      transformation or translation of a Source form, including but
      not limited to compiled object code, generated documentation,
      and conversions to other media types.

      &quot;Work&quot; shall mean the work of authorship, whether in Source or
      Object form, made available under the License, as indicated by a
      copyright notice that is included in or attached to the work
      (an example is provided in the Appendix below).

      &quot;Derivative Works&quot; shall mean any work, whether in Source or Object
      form, that is based on (or derived from) the Work and for which the
      editorial revisions, annotations, elaborations, or other modifications
      represent, as a whole, an original work of authorship. For the purposes
      of this License, Derivative Works shall not include works that remain
      separable from, or merely link (or bind by name) to the interfaces of,
      the Work and Derivative Works thereof.

      &quot;Contribution&quot; shall mean any work of authorship, including
      the original version of the Work and any modifications or additions
      to that Work or Derivative Works thereof, that is intentionally
      submitted to Licensor for inclusion in the Work by the copyright owner
      or by an individual or Legal Entity authorized to submit on behalf of
      the copyright owner. For the purposes of this definition, &quot;submitted&quot;
      means any form of electronic, verbal, or written communication sent
      to the Licensor or its representatives, including but not limited to
      communication on electronic mailing lists, source code control systems,
      and issue tracking systems that are managed by, or on behalf of, the
      Licensor for the purpose of discussing and improving the Work, but
      excluding communication that is conspicuously marked or otherwise
      designated in writing by the copyright owner as &quot;Not a Contribution.&quot;

      &quot;Contributor&quot; shall mean Licensor and any individual or Legal Entity
      on behalf of whom a Contribution has been received by Licensor and
      subsequently incorporated within the Work.

   2. Grant of Copyright License. Subject to the terms and conditions of
      this License, each Contributor hereby grants to You a perpetual,
      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
      copyright license to reproduce, prepare Derivative Works of,
      publicly display, publicly perform, sublicense, and distribute the
      Work and such Derivative Works in Source or Object form.

   3. Grant of Patent License. Subject to the terms and conditions of
      this License, each Contributor hereby grants to You a perpetual,
      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
      (except as stated in this section) patent license to make, have made,
      use, offer to sell, sell, import, and otherwise transfer the Work,
      where such license applies only to those patent claims licensable
      by such Contributor that are necessarily infringed by their
      Contribution(s) alone or by combination of their Contribution(s)
      with the Work to which such Contribution(s) was submitted. If You
      institute patent litigation against any entity (including a
      cross-claim or counterclaim in a lawsuit) alleging that the Work
      or a Contribution incorporated within the Work constitutes direct
      or contributory patent infringement, then any patent licenses
      granted to You under this License for that Work shall terminate
      as of the date such litigation is filed.

   4. Redistribution. You may reproduce and distribute copies of the
      Work or Derivative Works thereof in any medium, with or without
      modifications, and in Source or Object form, provided that You
      meet the following conditions:

      (a) You must give any other recipients of the Work or
          Derivative Works a copy of this License; and

      (b) You must cause any modified files to carry prominent notices
          stating that You changed the files; and

      (c) You must retain, in the Source form of any Derivative Works
          that You distribute, all copyright, patent, trademark, and
          attribution notices from the Source form of the Work,
          excluding those notices that do not pertain to any part of
          the Derivative Works; and

      (d) If the Work includes a &quot;NOTICE&quot; text file as part of its
          distribution, then any Derivative Works that You distribute must
          include a readable copy of the attribution notices contained
          within such NOTICE file, excluding those notices that do not
          pertain to any part of the Derivative Works, in at least one
          of the following places: within a NOTICE text file distributed
          as part of the Derivative Works; within the Source form or
          documentation, if provided along with the Derivative Works; or,
          within a display generated by the Derivative Works, if and
          wherever such third-party notices normally appear. The contents
          of the NOTICE file are for informational purposes only and
          do not modify the License. You may add Your own attribution
          notices within Derivative Works that You distribute, alongside
          or as an addendum to the NOTICE text from the Work, provided
          that such additional attribution notices cannot be construed
          as modifying the License.

      You may add Your own copyright statement to Your modifications and
      may provide additional or different license terms and conditions
      for use, reproduction, or distribution of Your modifications, or
      for any such Derivative Works as a whole, provided Your use,
      reproduction, and distribution of the Work otherwise complies with
      the conditions stated in this License.

   5. Submission of Contributions. Unless You explicitly state otherwise,
      any Contribution intentionally submitted for inclusion in the Work
      by You to the Licensor shall be under the terms and conditions of
      this License, without any additional terms or conditions.
      Notwithstanding the above, nothing herein shall supersede or modify
      the terms of any separate license agreement you may have executed
      with Licensor regarding such Contributions.

   6. Trademarks. This License does not grant permission to use the trade
      names, trademarks, service marks, or product names of the Licensor,
      except as required for reasonable and customary use in describing the
      origin of the Work and reproducing the content of the NOTICE file.

   7. Disclaimer of Warranty. Unless required by applicable law or
      agreed to in writing, Licensor provides the Work (and each
      Contributor provides its Contributions) on an &quot;AS IS&quot; BASIS,
      WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
      implied, including, without limitation, any warranties or conditions
      of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
      PARTICULAR PURPOSE. You are solely responsible for determining the
      appropriateness of using or redistributing the Work and assume any
      risks associated with Your exercise of permissions under this License.

   8. Limitation of Liability. In no event and under no legal theory,
      whether in tort (including negligence), contract, or otherwise,
      unless required by applicable law (such as deliberate and grossly
      negligent acts) or agreed to in writing, shall any Contributor be
      liable to You for damages, including any direct, indirect, special,
      incidental, or consequential damages of any character arising as a
      result of this License or out of the use or inability to use the
      Work (including but not limited to damages for loss of goodwill,
      work stoppage, computer failure or malfunction, or any and all
      other commercial damages or losses), even if such Contributor
      has been advised of the possibility of such damages.

   9. Accepting Warranty or Additional Liability. While redistributing
      the Work or Derivative Works thereof, You may choose to offer,
      and charge a fee for, acceptance of support, warranty, indemnity,
      or other liability obligations and/or rights consistent with this
      License. However, in accepting such obligations, You may act only
      on Your own behalf and on Your sole responsibility, not on behalf
      of any other Contributor, and only if You agree to indemnify,
      defend, and hold each Contributor harmless for any liability
      incurred by, or claims asserted against, such Contributor by reason
      of your accepting any such warranty or additional liability.

   END OF TERMS AND CONDITIONS

   Copyright 2024-present Changgyoo Park

   Licensed under the Apache License, Version 2.0 (the &quot;License&quot;);
   you may not use this file except in compliance with the License.
   You may obtain a copy of the License at

       http://www.apache.org/licenses/LICENSE-2.0

   Unless required by applicable law or agreed to in writing, software
   distributed under the License is distributed on an &quot;AS IS&quot; BASIS,
   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
   See the License for the specific language governing permissions and
   limitations under the License.
</pre>
            </li>
            <li class="license">
                <h3 id="Apache-2.0">Apache License 2.0</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/assert-rs/predicates-rs ">predicates 2.1.5</a></li>
                </ul>
                <pre class="license-text">                                 Apache License
                           Version 2.0, January 2004
                        http://www.apache.org/licenses/

   TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION

   1. Definitions.

      &quot;License&quot; shall mean the terms and conditions for use, reproduction,
      and distribution as defined by Sections 1 through 9 of this document.

      &quot;Licensor&quot; shall mean the copyright owner or entity authorized by
      the copyright owner that is granting the License.

      &quot;Legal Entity&quot; shall mean the union of the acting entity and all
      other entities that control, are controlled by, or are under common
      control with that entity. For the purposes of this definition,
      &quot;control&quot; means (i) the power, direct or indirect, to cause the
      direction or management of such entity, whether by contract or
      otherwise, or (ii) ownership of fifty percent (50%) or more of the
      outstanding shares, or (iii) beneficial ownership of such entity.

      &quot;You&quot; (or &quot;Your&quot;) shall mean an individual or Legal Entity
      exercising permissions granted by this License.

      &quot;Source&quot; form shall mean the preferred form for making modifications,
      including but not limited to software source code, documentation
      source, and configuration files.

      &quot;Object&quot; form shall mean any form resulting from mechanical
      transformation or translation of a Source form, including but
      not limited to compiled object code, generated documentation,
      and conversions to other media types.

      &quot;Work&quot; shall mean the work of authorship, whether in Source or
      Object form, made available under the License, as indicated by a
      copyright notice that is included in or attached to the work
      (an example is provided in the Appendix below).

      &quot;Derivative Works&quot; shall mean any work, whether in Source or Object
      form, that is based on (or derived from) the Work and for which the
      editorial revisions, annotations, elaborations, or other modifications
      represent, as a whole, an original work of authorship. For the purposes
      of this License, Derivative Works shall not include works that remain
      separable from, or merely link (or bind by name) to the interfaces of,
      the Work and Derivative Works thereof.

      &quot;Contribution&quot; shall mean any work of authorship, including
      the original version of the Work and any modifications or additions
      to that Work or Derivative Works thereof, that is intentionally
      submitted to Licensor for inclusion in the Work by the copyright owner
      or by an individual or Legal Entity authorized to submit on behalf of
      the copyright owner. For the purposes of this definition, &quot;submitted&quot;
      means any form of electronic, verbal, or written communication sent
      to the Licensor or its representatives, including but not limited to
      communication on electronic mailing lists, source code control systems,
      and issue tracking systems that are managed by, or on behalf of, the
      Licensor for the purpose of discussing and improving the Work, but
      excluding communication that is conspicuously marked or otherwise
      designated in writing by the copyright owner as &quot;Not a Contribution.&quot;

      &quot;Contributor&quot; shall mean Licensor and any individual or Legal Entity
      on behalf of whom a Contribution has been received by Licensor and
      subsequently incorporated within the Work.

   2. Grant of Copyright License. Subject to the terms and conditions of
      this License, each Contributor hereby grants to You a perpetual,
      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
      copyright license to reproduce, prepare Derivative Works of,
      publicly display, publicly perform, sublicense, and distribute the
      Work and such Derivative Works in Source or Object form.

   3. Grant of Patent License. Subject to the terms and conditions of
      this License, each Contributor hereby grants to You a perpetual,
      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
      (except as stated in this section) patent license to make, have made,
      use, offer to sell, sell, import, and otherwise transfer the Work,
      where such license applies only to those patent claims licensable
      by such Contributor that are necessarily infringed by their
      Contribution(s) alone or by combination of their Contribution(s)
      with the Work to which such Contribution(s) was submitted. If You
      institute patent litigation against any entity (including a
      cross-claim or counterclaim in a lawsuit) alleging that the Work
      or a Contribution incorporated within the Work constitutes direct
      or contributory patent infringement, then any patent licenses
      granted to You under this License for that Work shall terminate
      as of the date such litigation is filed.

   4. Redistribution. You may reproduce and distribute copies of the
      Work or Derivative Works thereof in any medium, with or without
      modifications, and in Source or Object form, provided that You
      meet the following conditions:

      (a) You must give any other recipients of the Work or
          Derivative Works a copy of this License; and

      (b) You must cause any modified files to carry prominent notices
          stating that You changed the files; and

      (c) You must retain, in the Source form of any Derivative Works
          that You distribute, all copyright, patent, trademark, and
          attribution notices from the Source form of the Work,
          excluding those notices that do not pertain to any part of
          the Derivative Works; and

      (d) If the Work includes a &quot;NOTICE&quot; text file as part of its
          distribution, then any Derivative Works that You distribute must
          include a readable copy of the attribution notices contained
          within such NOTICE file, excluding those notices that do not
          pertain to any part of the Derivative Works, in at least one
          of the following places: within a NOTICE text file distributed
          as part of the Derivative Works; within the Source form or
          documentation, if provided along with the Derivative Works; or,
          within a display generated by the Derivative Works, if and
          wherever such third-party notices normally appear. The contents
          of the NOTICE file are for informational purposes only and
          do not modify the License. You may add Your own attribution
          notices within Derivative Works that You distribute, alongside
          or as an addendum to the NOTICE text from the Work, provided
          that such additional attribution notices cannot be construed
          as modifying the License.

      You may add Your own copyright statement to Your modifications and
      may provide additional or different license terms and conditions
      for use, reproduction, or distribution of Your modifications, or
      for any such Derivative Works as a whole, provided Your use,
      reproduction, and distribution of the Work otherwise complies with
      the conditions stated in this License.

   5. Submission of Contributions. Unless You explicitly state otherwise,
      any Contribution intentionally submitted for inclusion in the Work
      by You to the Licensor shall be under the terms and conditions of
      this License, without any additional terms or conditions.
      Notwithstanding the above, nothing herein shall supersede or modify
      the terms of any separate license agreement you may have executed
      with Licensor regarding such Contributions.

   6. Trademarks. This License does not grant permission to use the trade
      names, trademarks, service marks, or product names of the Licensor,
      except as required for reasonable and customary use in describing the
      origin of the Work and reproducing the content of the NOTICE file.

   7. Disclaimer of Warranty. Unless required by applicable law or
      agreed to in writing, Licensor provides the Work (and each
      Contributor provides its Contributions) on an &quot;AS IS&quot; BASIS,
      WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
      implied, including, without limitation, any warranties or conditions
      of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
      PARTICULAR PURPOSE. You are solely responsible for determining the
      appropriateness of using or redistributing the Work and assume any
      risks associated with Your exercise of permissions under this License.

   8. Limitation of Liability. In no event and under no legal theory,
      whether in tort (including negligence), contract, or otherwise,
      unless required by applicable law (such as deliberate and grossly
      negligent acts) or agreed to in writing, shall any Contributor be
      liable to You for damages, including any direct, indirect, special,
      incidental, or consequential damages of any character arising as a
      result of this License or out of the use or inability to use the
      Work (including but not limited to damages for loss of goodwill,
      work stoppage, computer failure or malfunction, or any and all
      other commercial damages or losses), even if such Contributor
      has been advised of the possibility of such damages.

   9. Accepting Warranty or Additional Liability. While redistributing
      the Work or Derivative Works thereof, You may choose to offer,
      and charge a fee for, acceptance of support, warranty, indemnity,
      or other liability obligations and/or rights consistent with this
      License. However, in accepting such obligations, You may act only
      on Your own behalf and on Your sole responsibility, not on behalf
      of any other Contributor, and only if You agree to indemnify,
      defend, and hold each Contributor harmless for any liability
      incurred by, or claims asserted against, such Contributor by reason
      of your accepting any such warranty or additional liability.

   END OF TERMS AND CONDITIONS
</pre>
            </li>
            <li class="license">
                <h3 id="Apache-2.0">Apache License 2.0</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/microsoft/windows-rs ">windows-core 0.52.0</a></li>
                    <li><a href=" https://github.com/microsoft/windows-rs ">windows-sys 0.48.0</a></li>
                    <li><a href=" https://github.com/microsoft/windows-rs ">windows-sys 0.52.0</a></li>
                    <li><a href=" https://github.com/microsoft/windows-rs ">windows-sys 0.59.0</a></li>
                    <li><a href=" https://github.com/microsoft/windows-rs ">windows-targets 0.48.5</a></li>
                    <li><a href=" https://github.com/microsoft/windows-rs ">windows-targets 0.52.6</a></li>
                    <li><a href=" https://github.com/microsoft/windows-rs ">windows_aarch64_gnullvm 0.48.5</a></li>
                    <li><a href=" https://github.com/microsoft/windows-rs ">windows_aarch64_gnullvm 0.52.6</a></li>
                    <li><a href=" https://github.com/microsoft/windows-rs ">windows_aarch64_msvc 0.48.5</a></li>
                    <li><a href=" https://github.com/microsoft/windows-rs ">windows_aarch64_msvc 0.52.6</a></li>
                    <li><a href=" https://github.com/microsoft/windows-rs ">windows_i686_gnu 0.48.5</a></li>
                    <li><a href=" https://github.com/microsoft/windows-rs ">windows_i686_gnu 0.52.6</a></li>
                    <li><a href=" https://github.com/microsoft/windows-rs ">windows_i686_gnullvm 0.52.6</a></li>
                    <li><a href=" https://github.com/microsoft/windows-rs ">windows_i686_msvc 0.48.5</a></li>
                    <li><a href=" https://github.com/microsoft/windows-rs ">windows_i686_msvc 0.52.6</a></li>
                    <li><a href=" https://github.com/microsoft/windows-rs ">windows_x86_64_gnu 0.48.5</a></li>
                    <li><a href=" https://github.com/microsoft/windows-rs ">windows_x86_64_gnu 0.52.6</a></li>
                    <li><a href=" https://github.com/microsoft/windows-rs ">windows_x86_64_gnullvm 0.48.5</a></li>
                    <li><a href=" https://github.com/microsoft/windows-rs ">windows_x86_64_gnullvm 0.52.6</a></li>
                    <li><a href=" https://github.com/microsoft/windows-rs ">windows_x86_64_msvc 0.48.5</a></li>
                    <li><a href=" https://github.com/microsoft/windows-rs ">windows_x86_64_msvc 0.52.6</a></li>
                </ul>
                <pre class="license-text">                                 Apache License
                           Version 2.0, January 2004
                        http://www.apache.org/licenses/

   TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION

   1. Definitions.

      &quot;License&quot; shall mean the terms and conditions for use, reproduction,
      and distribution as defined by Sections 1 through 9 of this document.

      &quot;Licensor&quot; shall mean the copyright owner or entity authorized by
      the copyright owner that is granting the License.

      &quot;Legal Entity&quot; shall mean the union of the acting entity and all
      other entities that control, are controlled by, or are under common
      control with that entity. For the purposes of this definition,
      &quot;control&quot; means (i) the power, direct or indirect, to cause the
      direction or management of such entity, whether by contract or
      otherwise, or (ii) ownership of fifty percent (50%) or more of the
      outstanding shares, or (iii) beneficial ownership of such entity.

      &quot;You&quot; (or &quot;Your&quot;) shall mean an individual or Legal Entity
      exercising permissions granted by this License.

      &quot;Source&quot; form shall mean the preferred form for making modifications,
      including but not limited to software source code, documentation
      source, and configuration files.

      &quot;Object&quot; form shall mean any form resulting from mechanical
      transformation or translation of a Source form, including but
      not limited to compiled object code, generated documentation,
      and conversions to other media types.

      &quot;Work&quot; shall mean the work of authorship, whether in Source or
      Object form, made available under the License, as indicated by a
      copyright notice that is included in or attached to the work
      (an example is provided in the Appendix below).

      &quot;Derivative Works&quot; shall mean any work, whether in Source or Object
      form, that is based on (or derived from) the Work and for which the
      editorial revisions, annotations, elaborations, or other modifications
      represent, as a whole, an original work of authorship. For the purposes
      of this License, Derivative Works shall not include works that remain
      separable from, or merely link (or bind by name) to the interfaces of,
      the Work and Derivative Works thereof.

      &quot;Contribution&quot; shall mean any work of authorship, including
      the original version of the Work and any modifications or additions
      to that Work or Derivative Works thereof, that is intentionally
      submitted to Licensor for inclusion in the Work by the copyright owner
      or by an individual or Legal Entity authorized to submit on behalf of
      the copyright owner. For the purposes of this definition, &quot;submitted&quot;
      means any form of electronic, verbal, or written communication sent
      to the Licensor or its representatives, including but not limited to
      communication on electronic mailing lists, source code control systems,
      and issue tracking systems that are managed by, or on behalf of, the
      Licensor for the purpose of discussing and improving the Work, but
      excluding communication that is conspicuously marked or otherwise
      designated in writing by the copyright owner as &quot;Not a Contribution.&quot;

      &quot;Contributor&quot; shall mean Licensor and any individual or Legal Entity
      on behalf of whom a Contribution has been received by Licensor and
      subsequently incorporated within the Work.

   2. Grant of Copyright License. Subject to the terms and conditions of
      this License, each Contributor hereby grants to You a perpetual,
      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
      copyright license to reproduce, prepare Derivative Works of,
      publicly display, publicly perform, sublicense, and distribute the
      Work and such Derivative Works in Source or Object form.

   3. Grant of Patent License. Subject to the terms and conditions of
      this License, each Contributor hereby grants to You a perpetual,
      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
      (except as stated in this section) patent license to make, have made,
      use, offer to sell, sell, import, and otherwise transfer the Work,
      where such license applies only to those patent claims licensable
      by such Contributor that are necessarily infringed by their
      Contribution(s) alone or by combination of their Contribution(s)
      with the Work to which such Contribution(s) was submitted. If You
      institute patent litigation against any entity (including a
      cross-claim or counterclaim in a lawsuit) alleging that the Work
      or a Contribution incorporated within the Work constitutes direct
      or contributory patent infringement, then any patent licenses
      granted to You under this License for that Work shall terminate
      as of the date such litigation is filed.

   4. Redistribution. You may reproduce and distribute copies of the
      Work or Derivative Works thereof in any medium, with or without
      modifications, and in Source or Object form, provided that You
      meet the following conditions:

      (a) You must give any other recipients of the Work or
          Derivative Works a copy of this License; and

      (b) You must cause any modified files to carry prominent notices
          stating that You changed the files; and

      (c) You must retain, in the Source form of any Derivative Works
          that You distribute, all copyright, patent, trademark, and
          attribution notices from the Source form of the Work,
          excluding those notices that do not pertain to any part of
          the Derivative Works; and

      (d) If the Work includes a &quot;NOTICE&quot; text file as part of its
          distribution, then any Derivative Works that You distribute must
          include a readable copy of the attribution notices contained
          within such NOTICE file, excluding those notices that do not
          pertain to any part of the Derivative Works, in at least one
          of the following places: within a NOTICE text file distributed
          as part of the Derivative Works; within the Source form or
          documentation, if provided along with the Derivative Works; or,
          within a display generated by the Derivative Works, if and
          wherever such third-party notices normally appear. The contents
          of the NOTICE file are for informational purposes only and
          do not modify the License. You may add Your own attribution
          notices within Derivative Works that You distribute, alongside
          or as an addendum to the NOTICE text from the Work, provided
          that such additional attribution notices cannot be construed
          as modifying the License.

      You may add Your own copyright statement to Your modifications and
      may provide additional or different license terms and conditions
      for use, reproduction, or distribution of Your modifications, or
      for any such Derivative Works as a whole, provided Your use,
      reproduction, and distribution of the Work otherwise complies with
      the conditions stated in this License.

   5. Submission of Contributions. Unless You explicitly state otherwise,
      any Contribution intentionally submitted for inclusion in the Work
      by You to the Licensor shall be under the terms and conditions of
      this License, without any additional terms or conditions.
      Notwithstanding the above, nothing herein shall supersede or modify
      the terms of any separate license agreement you may have executed
      with Licensor regarding such Contributions.

   6. Trademarks. This License does not grant permission to use the trade
      names, trademarks, service marks, or product names of the Licensor,
      except as required for reasonable and customary use in describing the
      origin of the Work and reproducing the content of the NOTICE file.

   7. Disclaimer of Warranty. Unless required by applicable law or
      agreed to in writing, Licensor provides the Work (and each
      Contributor provides its Contributions) on an &quot;AS IS&quot; BASIS,
      WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
      implied, including, without limitation, any warranties or conditions
      of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
      PARTICULAR PURPOSE. You are solely responsible for determining the
      appropriateness of using or redistributing the Work and assume any
      risks associated with Your exercise of permissions under this License.

   8. Limitation of Liability. In no event and under no legal theory,
      whether in tort (including negligence), contract, or otherwise,
      unless required by applicable law (such as deliberate and grossly
      negligent acts) or agreed to in writing, shall any Contributor be
      liable to You for damages, including any direct, indirect, special,
      incidental, or consequential damages of any character arising as a
      result of this License or out of the use or inability to use the
      Work (including but not limited to damages for loss of goodwill,
      work stoppage, computer failure or malfunction, or any and all
      other commercial damages or losses), even if such Contributor
      has been advised of the possibility of such damages.

   9. Accepting Warranty or Additional Liability. While redistributing
      the Work or Derivative Works thereof, You may choose to offer,
      and charge a fee for, acceptance of support, warranty, indemnity,
      or other liability obligations and/or rights consistent with this
      License. However, in accepting such obligations, You may act only
      on Your own behalf and on Your sole responsibility, not on behalf
      of any other Contributor, and only if You agree to indemnify,
      defend, and hold each Contributor harmless for any liability
      incurred by, or claims asserted against, such Contributor by reason
      of your accepting any such warranty or additional liability.

   END OF TERMS AND CONDITIONS

   APPENDIX: How to apply the Apache License to your work.

      To apply the Apache License to your work, attach the following
      boilerplate notice, with the fields enclosed by brackets &quot;[]&quot;
      replaced with your own identifying information. (Don&#x27;t include
      the brackets!)  The text should be enclosed in the appropriate
      comment syntax for the file format. We also recommend that a
      file or class name and description of purpose be included on the
      same &quot;printed page&quot; as the copyright notice for easier
      identification within third-party archives.

   Copyright (c) Microsoft Corporation.

   Licensed under the Apache License, Version 2.0 (the &quot;License&quot;);
   you may not use this file except in compliance with the License.
   You may obtain a copy of the License at

       http://www.apache.org/licenses/LICENSE-2.0

   Unless required by applicable law or agreed to in writing, software
   distributed under the License is distributed on an &quot;AS IS&quot; BASIS,
   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
   See the License for the specific language governing permissions and
   limitations under the License.
</pre>
            </li>
            <li class="license">
                <h3 id="Apache-2.0">Apache License 2.0</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/Soveu/tinyvec_macros ">tinyvec_macros 0.1.1</a></li>
                </ul>
                <pre class="license-text">                                 Apache License
                           Version 2.0, January 2004
                        http://www.apache.org/licenses/

   TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION

   1. Definitions.

      &quot;License&quot; shall mean the terms and conditions for use, reproduction,
      and distribution as defined by Sections 1 through 9 of this document.

      &quot;Licensor&quot; shall mean the copyright owner or entity authorized by
      the copyright owner that is granting the License.

      &quot;Legal Entity&quot; shall mean the union of the acting entity and all
      other entities that control, are controlled by, or are under common
      control with that entity. For the purposes of this definition,
      &quot;control&quot; means (i) the power, direct or indirect, to cause the
      direction or management of such entity, whether by contract or
      otherwise, or (ii) ownership of fifty percent (50%) or more of the
      outstanding shares, or (iii) beneficial ownership of such entity.

      &quot;You&quot; (or &quot;Your&quot;) shall mean an individual or Legal Entity
      exercising permissions granted by this License.

      &quot;Source&quot; form shall mean the preferred form for making modifications,
      including but not limited to software source code, documentation
      source, and configuration files.

      &quot;Object&quot; form shall mean any form resulting from mechanical
      transformation or translation of a Source form, including but
      not limited to compiled object code, generated documentation,
      and conversions to other media types.

      &quot;Work&quot; shall mean the work of authorship, whether in Source or
      Object form, made available under the License, as indicated by a
      copyright notice that is included in or attached to the work
      (an example is provided in the Appendix below).

      &quot;Derivative Works&quot; shall mean any work, whether in Source or Object
      form, that is based on (or derived from) the Work and for which the
      editorial revisions, annotations, elaborations, or other modifications
      represent, as a whole, an original work of authorship. For the purposes
      of this License, Derivative Works shall not include works that remain
      separable from, or merely link (or bind by name) to the interfaces of,
      the Work and Derivative Works thereof.

      &quot;Contribution&quot; shall mean any work of authorship, including
      the original version of the Work and any modifications or additions
      to that Work or Derivative Works thereof, that is intentionally
      submitted to Licensor for inclusion in the Work by the copyright owner
      or by an individual or Legal Entity authorized to submit on behalf of
      the copyright owner. For the purposes of this definition, &quot;submitted&quot;
      means any form of electronic, verbal, or written communication sent
      to the Licensor or its representatives, including but not limited to
      communication on electronic mailing lists, source code control systems,
      and issue tracking systems that are managed by, or on behalf of, the
      Licensor for the purpose of discussing and improving the Work, but
      excluding communication that is conspicuously marked or otherwise
      designated in writing by the copyright owner as &quot;Not a Contribution.&quot;

      &quot;Contributor&quot; shall mean Licensor and any individual or Legal Entity
      on behalf of whom a Contribution has been received by Licensor and
      subsequently incorporated within the Work.

   2. Grant of Copyright License. Subject to the terms and conditions of
      this License, each Contributor hereby grants to You a perpetual,
      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
      copyright license to reproduce, prepare Derivative Works of,
      publicly display, publicly perform, sublicense, and distribute the
      Work and such Derivative Works in Source or Object form.

   3. Grant of Patent License. Subject to the terms and conditions of
      this License, each Contributor hereby grants to You a perpetual,
      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
      (except as stated in this section) patent license to make, have made,
      use, offer to sell, sell, import, and otherwise transfer the Work,
      where such license applies only to those patent claims licensable
      by such Contributor that are necessarily infringed by their
      Contribution(s) alone or by combination of their Contribution(s)
      with the Work to which such Contribution(s) was submitted. If You
      institute patent litigation against any entity (including a
      cross-claim or counterclaim in a lawsuit) alleging that the Work
      or a Contribution incorporated within the Work constitutes direct
      or contributory patent infringement, then any patent licenses
      granted to You under this License for that Work shall terminate
      as of the date such litigation is filed.

   4. Redistribution. You may reproduce and distribute copies of the
      Work or Derivative Works thereof in any medium, with or without
      modifications, and in Source or Object form, provided that You
      meet the following conditions:

      (a) You must give any other recipients of the Work or
          Derivative Works a copy of this License; and

      (b) You must cause any modified files to carry prominent notices
          stating that You changed the files; and

      (c) You must retain, in the Source form of any Derivative Works
          that You distribute, all copyright, patent, trademark, and
          attribution notices from the Source form of the Work,
          excluding those notices that do not pertain to any part of
          the Derivative Works; and

      (d) If the Work includes a &quot;NOTICE&quot; text file as part of its
          distribution, then any Derivative Works that You distribute must
          include a readable copy of the attribution notices contained
          within such NOTICE file, excluding those notices that do not
          pertain to any part of the Derivative Works, in at least one
          of the following places: within a NOTICE text file distributed
          as part of the Derivative Works; within the Source form or
          documentation, if provided along with the Derivative Works; or,
          within a display generated by the Derivative Works, if and
          wherever such third-party notices normally appear. The contents
          of the NOTICE file are for informational purposes only and
          do not modify the License. You may add Your own attribution
          notices within Derivative Works that You distribute, alongside
          or as an addendum to the NOTICE text from the Work, provided
          that such additional attribution notices cannot be construed
          as modifying the License.

      You may add Your own copyright statement to Your modifications and
      may provide additional or different license terms and conditions
      for use, reproduction, or distribution of Your modifications, or
      for any such Derivative Works as a whole, provided Your use,
      reproduction, and distribution of the Work otherwise complies with
      the conditions stated in this License.

   5. Submission of Contributions. Unless You explicitly state otherwise,
      any Contribution intentionally submitted for inclusion in the Work
      by You to the Licensor shall be under the terms and conditions of
      this License, without any additional terms or conditions.
      Notwithstanding the above, nothing herein shall supersede or modify
      the terms of any separate license agreement you may have executed
      with Licensor regarding such Contributions.

   6. Trademarks. This License does not grant permission to use the trade
      names, trademarks, service marks, or product names of the Licensor,
      except as required for reasonable and customary use in describing the
      origin of the Work and reproducing the content of the NOTICE file.

   7. Disclaimer of Warranty. Unless required by applicable law or
      agreed to in writing, Licensor provides the Work (and each
      Contributor provides its Contributions) on an &quot;AS IS&quot; BASIS,
      WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
      implied, including, without limitation, any warranties or conditions
      of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
      PARTICULAR PURPOSE. You are solely responsible for determining the
      appropriateness of using or redistributing the Work and assume any
      risks associated with Your exercise of permissions under this License.

   8. Limitation of Liability. In no event and under no legal theory,
      whether in tort (including negligence), contract, or otherwise,
      unless required by applicable law (such as deliberate and grossly
      negligent acts) or agreed to in writing, shall any Contributor be
      liable to You for damages, including any direct, indirect, special,
      incidental, or consequential damages of any character arising as a
      result of this License or out of the use or inability to use the
      Work (including but not limited to damages for loss of goodwill,
      work stoppage, computer failure or malfunction, or any and all
      other commercial damages or losses), even if such Contributor
      has been advised of the possibility of such damages.

   9. Accepting Warranty or Additional Liability. While redistributing
      the Work or Derivative Works thereof, You may choose to offer,
      and charge a fee for, acceptance of support, warranty, indemnity,
      or other liability obligations and/or rights consistent with this
      License. However, in accepting such obligations, You may act only
      on Your own behalf and on Your sole responsibility, not on behalf
      of any other Contributor, and only if You agree to indemnify,
      defend, and hold each Contributor harmless for any liability
      incurred by, or claims asserted against, such Contributor by reason
      of your accepting any such warranty or additional liability.

   END OF TERMS AND CONDITIONS

   APPENDIX: How to apply the Apache License to your work.

      To apply the Apache License to your work, attach the following
      boilerplate notice, with the fields enclosed by brackets &quot;[]&quot;
      replaced with your own identifying information. (Don&#x27;t include
      the brackets!)  The text should be enclosed in the appropriate
      comment syntax for the file format. We also recommend that a
      file or class name and description of purpose be included on the
      same &quot;printed page&quot; as the copyright notice for easier
      identification within third-party archives.

   Copyright 2020 Tomasz &quot;Soveu&quot; Marx

   Licensed under the Apache License, Version 2.0 (the &quot;License&quot;);
   you may not use this file except in compliance with the License.
   You may obtain a copy of the License at

       http://www.apache.org/licenses/LICENSE-2.0

   Unless required by applicable law or agreed to in writing, software
   distributed under the License is distributed on an &quot;AS IS&quot; BASIS,
   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
   See the License for the specific language governing permissions and
   limitations under the License.

</pre>
            </li>
            <li class="license">
                <h3 id="Apache-2.0">Apache License 2.0</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/google/zerocopy ">zerocopy-derive 0.7.35</a></li>
                    <li><a href=" https://github.com/google/zerocopy ">zerocopy 0.7.35</a></li>
                </ul>
                <pre class="license-text">                                 Apache License
                           Version 2.0, January 2004
                        http://www.apache.org/licenses/

   TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION

   1. Definitions.

      &quot;License&quot; shall mean the terms and conditions for use, reproduction,
      and distribution as defined by Sections 1 through 9 of this document.

      &quot;Licensor&quot; shall mean the copyright owner or entity authorized by
      the copyright owner that is granting the License.

      &quot;Legal Entity&quot; shall mean the union of the acting entity and all
      other entities that control, are controlled by, or are under common
      control with that entity. For the purposes of this definition,
      &quot;control&quot; means (i) the power, direct or indirect, to cause the
      direction or management of such entity, whether by contract or
      otherwise, or (ii) ownership of fifty percent (50%) or more of the
      outstanding shares, or (iii) beneficial ownership of such entity.

      &quot;You&quot; (or &quot;Your&quot;) shall mean an individual or Legal Entity
      exercising permissions granted by this License.

      &quot;Source&quot; form shall mean the preferred form for making modifications,
      including but not limited to software source code, documentation
      source, and configuration files.

      &quot;Object&quot; form shall mean any form resulting from mechanical
      transformation or translation of a Source form, including but
      not limited to compiled object code, generated documentation,
      and conversions to other media types.

      &quot;Work&quot; shall mean the work of authorship, whether in Source or
      Object form, made available under the License, as indicated by a
      copyright notice that is included in or attached to the work
      (an example is provided in the Appendix below).

      &quot;Derivative Works&quot; shall mean any work, whether in Source or Object
      form, that is based on (or derived from) the Work and for which the
      editorial revisions, annotations, elaborations, or other modifications
      represent, as a whole, an original work of authorship. For the purposes
      of this License, Derivative Works shall not include works that remain
      separable from, or merely link (or bind by name) to the interfaces of,
      the Work and Derivative Works thereof.

      &quot;Contribution&quot; shall mean any work of authorship, including
      the original version of the Work and any modifications or additions
      to that Work or Derivative Works thereof, that is intentionally
      submitted to Licensor for inclusion in the Work by the copyright owner
      or by an individual or Legal Entity authorized to submit on behalf of
      the copyright owner. For the purposes of this definition, &quot;submitted&quot;
      means any form of electronic, verbal, or written communication sent
      to the Licensor or its representatives, including but not limited to
      communication on electronic mailing lists, source code control systems,
      and issue tracking systems that are managed by, or on behalf of, the
      Licensor for the purpose of discussing and improving the Work, but
      excluding communication that is conspicuously marked or otherwise
      designated in writing by the copyright owner as &quot;Not a Contribution.&quot;

      &quot;Contributor&quot; shall mean Licensor and any individual or Legal Entity
      on behalf of whom a Contribution has been received by Licensor and
      subsequently incorporated within the Work.

   2. Grant of Copyright License. Subject to the terms and conditions of
      this License, each Contributor hereby grants to You a perpetual,
      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
      copyright license to reproduce, prepare Derivative Works of,
      publicly display, publicly perform, sublicense, and distribute the
      Work and such Derivative Works in Source or Object form.

   3. Grant of Patent License. Subject to the terms and conditions of
      this License, each Contributor hereby grants to You a perpetual,
      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
      (except as stated in this section) patent license to make, have made,
      use, offer to sell, sell, import, and otherwise transfer the Work,
      where such license applies only to those patent claims licensable
      by such Contributor that are necessarily infringed by their
      Contribution(s) alone or by combination of their Contribution(s)
      with the Work to which such Contribution(s) was submitted. If You
      institute patent litigation against any entity (including a
      cross-claim or counterclaim in a lawsuit) alleging that the Work
      or a Contribution incorporated within the Work constitutes direct
      or contributory patent infringement, then any patent licenses
      granted to You under this License for that Work shall terminate
      as of the date such litigation is filed.

   4. Redistribution. You may reproduce and distribute copies of the
      Work or Derivative Works thereof in any medium, with or without
      modifications, and in Source or Object form, provided that You
      meet the following conditions:

      (a) You must give any other recipients of the Work or
          Derivative Works a copy of this License; and

      (b) You must cause any modified files to carry prominent notices
          stating that You changed the files; and

      (c) You must retain, in the Source form of any Derivative Works
          that You distribute, all copyright, patent, trademark, and
          attribution notices from the Source form of the Work,
          excluding those notices that do not pertain to any part of
          the Derivative Works; and

      (d) If the Work includes a &quot;NOTICE&quot; text file as part of its
          distribution, then any Derivative Works that You distribute must
          include a readable copy of the attribution notices contained
          within such NOTICE file, excluding those notices that do not
          pertain to any part of the Derivative Works, in at least one
          of the following places: within a NOTICE text file distributed
          as part of the Derivative Works; within the Source form or
          documentation, if provided along with the Derivative Works; or,
          within a display generated by the Derivative Works, if and
          wherever such third-party notices normally appear. The contents
          of the NOTICE file are for informational purposes only and
          do not modify the License. You may add Your own attribution
          notices within Derivative Works that You distribute, alongside
          or as an addendum to the NOTICE text from the Work, provided
          that such additional attribution notices cannot be construed
          as modifying the License.

      You may add Your own copyright statement to Your modifications and
      may provide additional or different license terms and conditions
      for use, reproduction, or distribution of Your modifications, or
      for any such Derivative Works as a whole, provided Your use,
      reproduction, and distribution of the Work otherwise complies with
      the conditions stated in this License.

   5. Submission of Contributions. Unless You explicitly state otherwise,
      any Contribution intentionally submitted for inclusion in the Work
      by You to the Licensor shall be under the terms and conditions of
      this License, without any additional terms or conditions.
      Notwithstanding the above, nothing herein shall supersede or modify
      the terms of any separate license agreement you may have executed
      with Licensor regarding such Contributions.

   6. Trademarks. This License does not grant permission to use the trade
      names, trademarks, service marks, or product names of the Licensor,
      except as required for reasonable and customary use in describing the
      origin of the Work and reproducing the content of the NOTICE file.

   7. Disclaimer of Warranty. Unless required by applicable law or
      agreed to in writing, Licensor provides the Work (and each
      Contributor provides its Contributions) on an &quot;AS IS&quot; BASIS,
      WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
      implied, including, without limitation, any warranties or conditions
      of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
      PARTICULAR PURPOSE. You are solely responsible for determining the
      appropriateness of using or redistributing the Work and assume any
      risks associated with Your exercise of permissions under this License.

   8. Limitation of Liability. In no event and under no legal theory,
      whether in tort (including negligence), contract, or otherwise,
      unless required by applicable law (such as deliberate and grossly
      negligent acts) or agreed to in writing, shall any Contributor be
      liable to You for damages, including any direct, indirect, special,
      incidental, or consequential damages of any character arising as a
      result of this License or out of the use or inability to use the
      Work (including but not limited to damages for loss of goodwill,
      work stoppage, computer failure or malfunction, or any and all
      other commercial damages or losses), even if such Contributor
      has been advised of the possibility of such damages.

   9. Accepting Warranty or Additional Liability. While redistributing
      the Work or Derivative Works thereof, You may choose to offer,
      and charge a fee for, acceptance of support, warranty, indemnity,
      or other liability obligations and/or rights consistent with this
      License. However, in accepting such obligations, You may act only
      on Your own behalf and on Your sole responsibility, not on behalf
      of any other Contributor, and only if You agree to indemnify,
      defend, and hold each Contributor harmless for any liability
      incurred by, or claims asserted against, such Contributor by reason
      of your accepting any such warranty or additional liability.

   END OF TERMS AND CONDITIONS

   APPENDIX: How to apply the Apache License to your work.

      To apply the Apache License to your work, attach the following
      boilerplate notice, with the fields enclosed by brackets &quot;[]&quot;
      replaced with your own identifying information. (Don&#x27;t include
      the brackets!)  The text should be enclosed in the appropriate
      comment syntax for the file format. We also recommend that a
      file or class name and description of purpose be included on the
      same &quot;printed page&quot; as the copyright notice for easier
      identification within third-party archives.

   Copyright 2023 The Fuchsia Authors

   Licensed under the Apache License, Version 2.0 (the &quot;License&quot;);
   you may not use this file except in compliance with the License.
   You may obtain a copy of the License at

       http://www.apache.org/licenses/LICENSE-2.0

   Unless required by applicable law or agreed to in writing, software
   distributed under the License is distributed on an &quot;AS IS&quot; BASIS,
   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
   See the License for the specific language governing permissions and
   limitations under the License.

</pre>
            </li>
            <li class="license">
                <h3 id="Apache-2.0">Apache License 2.0</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/open-telemetry/opentelemetry-rust ">opentelemetry-http 0.9.0</a></li>
                    <li><a href=" https://github.com/open-telemetry/opentelemetry-rust/tree/main/opentelemetry-otlp ">opentelemetry-otlp 0.13.0</a></li>
                    <li><a href=" https://github.com/open-telemetry/opentelemetry-rust/tree/main/opentelemetry-proto ">opentelemetry-proto 0.3.0</a></li>
                    <li><a href=" https://github.com/open-telemetry/opentelemetry-rust/tree/main/opentelemetry-semantic-conventions ">opentelemetry-semantic-conventions 0.12.0</a></li>
                    <li><a href=" https://github.com/open-telemetry/opentelemetry-rust ">opentelemetry 0.20.0</a></li>
                    <li><a href=" https://github.com/open-telemetry/opentelemetry-rust ">opentelemetry_api 0.20.0</a></li>
                    <li><a href=" https://github.com/open-telemetry/opentelemetry-rust ">opentelemetry_sdk 0.20.0</a></li>
                </ul>
                <pre class="license-text">                                 Apache License
                           Version 2.0, January 2004
                        http://www.apache.org/licenses/

   TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION

   1. Definitions.

      &quot;License&quot; shall mean the terms and conditions for use, reproduction,
      and distribution as defined by Sections 1 through 9 of this document.

      &quot;Licensor&quot; shall mean the copyright owner or entity authorized by
      the copyright owner that is granting the License.

      &quot;Legal Entity&quot; shall mean the union of the acting entity and all
      other entities that control, are controlled by, or are under common
      control with that entity. For the purposes of this definition,
      &quot;control&quot; means (i) the power, direct or indirect, to cause the
      direction or management of such entity, whether by contract or
      otherwise, or (ii) ownership of fifty percent (50%) or more of the
      outstanding shares, or (iii) beneficial ownership of such entity.

      &quot;You&quot; (or &quot;Your&quot;) shall mean an individual or Legal Entity
      exercising permissions granted by this License.

      &quot;Source&quot; form shall mean the preferred form for making modifications,
      including but not limited to software source code, documentation
      source, and configuration files.

      &quot;Object&quot; form shall mean any form resulting from mechanical
      transformation or translation of a Source form, including but
      not limited to compiled object code, generated documentation,
      and conversions to other media types.

      &quot;Work&quot; shall mean the work of authorship, whether in Source or
      Object form, made available under the License, as indicated by a
      copyright notice that is included in or attached to the work
      (an example is provided in the Appendix below).

      &quot;Derivative Works&quot; shall mean any work, whether in Source or Object
      form, that is based on (or derived from) the Work and for which the
      editorial revisions, annotations, elaborations, or other modifications
      represent, as a whole, an original work of authorship. For the purposes
      of this License, Derivative Works shall not include works that remain
      separable from, or merely link (or bind by name) to the interfaces of,
      the Work and Derivative Works thereof.

      &quot;Contribution&quot; shall mean any work of authorship, including
      the original version of the Work and any modifications or additions
      to that Work or Derivative Works thereof, that is intentionally
      submitted to Licensor for inclusion in the Work by the copyright owner
      or by an individual or Legal Entity authorized to submit on behalf of
      the copyright owner. For the purposes of this definition, &quot;submitted&quot;
      means any form of electronic, verbal, or written communication sent
      to the Licensor or its representatives, including but not limited to
      communication on electronic mailing lists, source code control systems,
      and issue tracking systems that are managed by, or on behalf of, the
      Licensor for the purpose of discussing and improving the Work, but
      excluding communication that is conspicuously marked or otherwise
      designated in writing by the copyright owner as &quot;Not a Contribution.&quot;

      &quot;Contributor&quot; shall mean Licensor and any individual or Legal Entity
      on behalf of whom a Contribution has been received by Licensor and
      subsequently incorporated within the Work.

   2. Grant of Copyright License. Subject to the terms and conditions of
      this License, each Contributor hereby grants to You a perpetual,
      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
      copyright license to reproduce, prepare Derivative Works of,
      publicly display, publicly perform, sublicense, and distribute the
      Work and such Derivative Works in Source or Object form.

   3. Grant of Patent License. Subject to the terms and conditions of
      this License, each Contributor hereby grants to You a perpetual,
      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
      (except as stated in this section) patent license to make, have made,
      use, offer to sell, sell, import, and otherwise transfer the Work,
      where such license applies only to those patent claims licensable
      by such Contributor that are necessarily infringed by their
      Contribution(s) alone or by combination of their Contribution(s)
      with the Work to which such Contribution(s) was submitted. If You
      institute patent litigation against any entity (including a
      cross-claim or counterclaim in a lawsuit) alleging that the Work
      or a Contribution incorporated within the Work constitutes direct
      or contributory patent infringement, then any patent licenses
      granted to You under this License for that Work shall terminate
      as of the date such litigation is filed.

   4. Redistribution. You may reproduce and distribute copies of the
      Work or Derivative Works thereof in any medium, with or without
      modifications, and in Source or Object form, provided that You
      meet the following conditions:

      (a) You must give any other recipients of the Work or
          Derivative Works a copy of this License; and

      (b) You must cause any modified files to carry prominent notices
          stating that You changed the files; and

      (c) You must retain, in the Source form of any Derivative Works
          that You distribute, all copyright, patent, trademark, and
          attribution notices from the Source form of the Work,
          excluding those notices that do not pertain to any part of
          the Derivative Works; and

      (d) If the Work includes a &quot;NOTICE&quot; text file as part of its
          distribution, then any Derivative Works that You distribute must
          include a readable copy of the attribution notices contained
          within such NOTICE file, excluding those notices that do not
          pertain to any part of the Derivative Works, in at least one
          of the following places: within a NOTICE text file distributed
          as part of the Derivative Works; within the Source form or
          documentation, if provided along with the Derivative Works; or,
          within a display generated by the Derivative Works, if and
          wherever such third-party notices normally appear. The contents
          of the NOTICE file are for informational purposes only and
          do not modify the License. You may add Your own attribution
          notices within Derivative Works that You distribute, alongside
          or as an addendum to the NOTICE text from the Work, provided
          that such additional attribution notices cannot be construed
          as modifying the License.

      You may add Your own copyright statement to Your modifications and
      may provide additional or different license terms and conditions
      for use, reproduction, or distribution of Your modifications, or
      for any such Derivative Works as a whole, provided Your use,
      reproduction, and distribution of the Work otherwise complies with
      the conditions stated in this License.

   5. Submission of Contributions. Unless You explicitly state otherwise,
      any Contribution intentionally submitted for inclusion in the Work
      by You to the Licensor shall be under the terms and conditions of
      this License, without any additional terms or conditions.
      Notwithstanding the above, nothing herein shall supersede or modify
      the terms of any separate license agreement you may have executed
      with Licensor regarding such Contributions.

   6. Trademarks. This License does not grant permission to use the trade
      names, trademarks, service marks, or product names of the Licensor,
      except as required for reasonable and customary use in describing the
      origin of the Work and reproducing the content of the NOTICE file.

   7. Disclaimer of Warranty. Unless required by applicable law or
      agreed to in writing, Licensor provides the Work (and each
      Contributor provides its Contributions) on an &quot;AS IS&quot; BASIS,
      WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
      implied, including, without limitation, any warranties or conditions
      of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
      PARTICULAR PURPOSE. You are solely responsible for determining the
      appropriateness of using or redistributing the Work and assume any
      risks associated with Your exercise of permissions under this License.

   8. Limitation of Liability. In no event and under no legal theory,
      whether in tort (including negligence), contract, or otherwise,
      unless required by applicable law (such as deliberate and grossly
      negligent acts) or agreed to in writing, shall any Contributor be
      liable to You for damages, including any direct, indirect, special,
      incidental, or consequential damages of any character arising as a
      result of this License or out of the use or inability to use the
      Work (including but not limited to damages for loss of goodwill,
      work stoppage, computer failure or malfunction, or any and all
      other commercial damages or losses), even if such Contributor
      has been advised of the possibility of such damages.

   9. Accepting Warranty or Additional Liability. While redistributing
      the Work or Derivative Works thereof, You may choose to offer,
      and charge a fee for, acceptance of support, warranty, indemnity,
      or other liability obligations and/or rights consistent with this
      License. However, in accepting such obligations, You may act only
      on Your own behalf and on Your sole responsibility, not on behalf
      of any other Contributor, and only if You agree to indemnify,
      defend, and hold each Contributor harmless for any liability
      incurred by, or claims asserted against, such Contributor by reason
      of your accepting any such warranty or additional liability.

   END OF TERMS AND CONDITIONS

   APPENDIX: How to apply the Apache License to your work.

      To apply the Apache License to your work, attach the following
      boilerplate notice, with the fields enclosed by brackets &quot;[]&quot;
      replaced with your own identifying information. (Don&#x27;t include
      the brackets!)  The text should be enclosed in the appropriate
      comment syntax for the file format. We also recommend that a
      file or class name and description of purpose be included on the
      same &quot;printed page&quot; as the copyright notice for easier
      identification within third-party archives.

   Copyright 2023 The OpenTelemetry Authors

   Licensed under the Apache License, Version 2.0 (the &quot;License&quot;);
   you may not use this file except in compliance with the License.
   You may obtain a copy of the License at

       http://www.apache.org/licenses/LICENSE-2.0

   Unless required by applicable law or agreed to in writing, software
   distributed under the License is distributed on an &quot;AS IS&quot; BASIS,
   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
   See the License for the specific language governing permissions and
   limitations under the License.
</pre>
            </li>
            <li class="license">
                <h3 id="Apache-2.0">Apache License 2.0</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/daxpedda/web-time ">web-time 1.1.0</a></li>
                </ul>
                <pre class="license-text">                                 Apache License
                           Version 2.0, January 2004
                        http://www.apache.org/licenses/

   TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION

   1. Definitions.

      &quot;License&quot; shall mean the terms and conditions for use, reproduction,
      and distribution as defined by Sections 1 through 9 of this document.

      &quot;Licensor&quot; shall mean the copyright owner or entity authorized by
      the copyright owner that is granting the License.

      &quot;Legal Entity&quot; shall mean the union of the acting entity and all
      other entities that control, are controlled by, or are under common
      control with that entity. For the purposes of this definition,
      &quot;control&quot; means (i) the power, direct or indirect, to cause the
      direction or management of such entity, whether by contract or
      otherwise, or (ii) ownership of fifty percent (50%) or more of the
      outstanding shares, or (iii) beneficial ownership of such entity.

      &quot;You&quot; (or &quot;Your&quot;) shall mean an individual or Legal Entity
      exercising permissions granted by this License.

      &quot;Source&quot; form shall mean the preferred form for making modifications,
      including but not limited to software source code, documentation
      source, and configuration files.

      &quot;Object&quot; form shall mean any form resulting from mechanical
      transformation or translation of a Source form, including but
      not limited to compiled object code, generated documentation,
      and conversions to other media types.

      &quot;Work&quot; shall mean the work of authorship, whether in Source or
      Object form, made available under the License, as indicated by a
      copyright notice that is included in or attached to the work
      (an example is provided in the Appendix below).

      &quot;Derivative Works&quot; shall mean any work, whether in Source or Object
      form, that is based on (or derived from) the Work and for which the
      editorial revisions, annotations, elaborations, or other modifications
      represent, as a whole, an original work of authorship. For the purposes
      of this License, Derivative Works shall not include works that remain
      separable from, or merely link (or bind by name) to the interfaces of,
      the Work and Derivative Works thereof.

      &quot;Contribution&quot; shall mean any work of authorship, including
      the original version of the Work and any modifications or additions
      to that Work or Derivative Works thereof, that is intentionally
      submitted to Licensor for inclusion in the Work by the copyright owner
      or by an individual or Legal Entity authorized to submit on behalf of
      the copyright owner. For the purposes of this definition, &quot;submitted&quot;
      means any form of electronic, verbal, or written communication sent
      to the Licensor or its representatives, including but not limited to
      communication on electronic mailing lists, source code control systems,
      and issue tracking systems that are managed by, or on behalf of, the
      Licensor for the purpose of discussing and improving the Work, but
      excluding communication that is conspicuously marked or otherwise
      designated in writing by the copyright owner as &quot;Not a Contribution.&quot;

      &quot;Contributor&quot; shall mean Licensor and any individual or Legal Entity
      on behalf of whom a Contribution has been received by Licensor and
      subsequently incorporated within the Work.

   2. Grant of Copyright License. Subject to the terms and conditions of
      this License, each Contributor hereby grants to You a perpetual,
      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
      copyright license to reproduce, prepare Derivative Works of,
      publicly display, publicly perform, sublicense, and distribute the
      Work and such Derivative Works in Source or Object form.

   3. Grant of Patent License. Subject to the terms and conditions of
      this License, each Contributor hereby grants to You a perpetual,
      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
      (except as stated in this section) patent license to make, have made,
      use, offer to sell, sell, import, and otherwise transfer the Work,
      where such license applies only to those patent claims licensable
      by such Contributor that are necessarily infringed by their
      Contribution(s) alone or by combination of their Contribution(s)
      with the Work to which such Contribution(s) was submitted. If You
      institute patent litigation against any entity (including a
      cross-claim or counterclaim in a lawsuit) alleging that the Work
      or a Contribution incorporated within the Work constitutes direct
      or contributory patent infringement, then any patent licenses
      granted to You under this License for that Work shall terminate
      as of the date such litigation is filed.

   4. Redistribution. You may reproduce and distribute copies of the
      Work or Derivative Works thereof in any medium, with or without
      modifications, and in Source or Object form, provided that You
      meet the following conditions:

      (a) You must give any other recipients of the Work or
          Derivative Works a copy of this License; and

      (b) You must cause any modified files to carry prominent notices
          stating that You changed the files; and

      (c) You must retain, in the Source form of any Derivative Works
          that You distribute, all copyright, patent, trademark, and
          attribution notices from the Source form of the Work,
          excluding those notices that do not pertain to any part of
          the Derivative Works; and

      (d) If the Work includes a &quot;NOTICE&quot; text file as part of its
          distribution, then any Derivative Works that You distribute must
          include a readable copy of the attribution notices contained
          within such NOTICE file, excluding those notices that do not
          pertain to any part of the Derivative Works, in at least one
          of the following places: within a NOTICE text file distributed
          as part of the Derivative Works; within the Source form or
          documentation, if provided along with the Derivative Works; or,
          within a display generated by the Derivative Works, if and
          wherever such third-party notices normally appear. The contents
          of the NOTICE file are for informational purposes only and
          do not modify the License. You may add Your own attribution
          notices within Derivative Works that You distribute, alongside
          or as an addendum to the NOTICE text from the Work, provided
          that such additional attribution notices cannot be construed
          as modifying the License.

      You may add Your own copyright statement to Your modifications and
      may provide additional or different license terms and conditions
      for use, reproduction, or distribution of Your modifications, or
      for any such Derivative Works as a whole, provided Your use,
      reproduction, and distribution of the Work otherwise complies with
      the conditions stated in this License.

   5. Submission of Contributions. Unless You explicitly state otherwise,
      any Contribution intentionally submitted for inclusion in the Work
      by You to the Licensor shall be under the terms and conditions of
      this License, without any additional terms or conditions.
      Notwithstanding the above, nothing herein shall supersede or modify
      the terms of any separate license agreement you may have executed
      with Licensor regarding such Contributions.

   6. Trademarks. This License does not grant permission to use the trade
      names, trademarks, service marks, or product names of the Licensor,
      except as required for reasonable and customary use in describing the
      origin of the Work and reproducing the content of the NOTICE file.

   7. Disclaimer of Warranty. Unless required by applicable law or
      agreed to in writing, Licensor provides the Work (and each
      Contributor provides its Contributions) on an &quot;AS IS&quot; BASIS,
      WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
      implied, including, without limitation, any warranties or conditions
      of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
      PARTICULAR PURPOSE. You are solely responsible for determining the
      appropriateness of using or redistributing the Work and assume any
      risks associated with Your exercise of permissions under this License.

   8. Limitation of Liability. In no event and under no legal theory,
      whether in tort (including negligence), contract, or otherwise,
      unless required by applicable law (such as deliberate and grossly
      negligent acts) or agreed to in writing, shall any Contributor be
      liable to You for damages, including any direct, indirect, special,
      incidental, or consequential damages of any character arising as a
      result of this License or out of the use or inability to use the
      Work (including but not limited to damages for loss of goodwill,
      work stoppage, computer failure or malfunction, or any and all
      other commercial damages or losses), even if such Contributor
      has been advised of the possibility of such damages.

   9. Accepting Warranty or Additional Liability. While redistributing
      the Work or Derivative Works thereof, You may choose to offer,
      and charge a fee for, acceptance of support, warranty, indemnity,
      or other liability obligations and/or rights consistent with this
      License. However, in accepting such obligations, You may act only
      on Your own behalf and on Your sole responsibility, not on behalf
      of any other Contributor, and only if You agree to indemnify,
      defend, and hold each Contributor harmless for any liability
      incurred by, or claims asserted against, such Contributor by reason
      of your accepting any such warranty or additional liability.

   END OF TERMS AND CONDITIONS

   APPENDIX: How to apply the Apache License to your work.

      To apply the Apache License to your work, attach the following
      boilerplate notice, with the fields enclosed by brackets &quot;[]&quot;
      replaced with your own identifying information. (Don&#x27;t include
      the brackets!)  The text should be enclosed in the appropriate
      comment syntax for the file format. We also recommend that a
      file or class name and description of purpose be included on the
      same &quot;printed page&quot; as the copyright notice for easier
      identification within third-party archives.

   Copyright 2023 dAxpeDDa

   Licensed under the Apache License, Version 2.0 (the &quot;License&quot;);
   you may not use this file except in compliance with the License.
   You may obtain a copy of the License at

       http://www.apache.org/licenses/LICENSE-2.0

   Unless required by applicable law or agreed to in writing, software
   distributed under the License is distributed on an &quot;AS IS&quot; BASIS,
   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
   See the License for the specific language governing permissions and
   limitations under the License.
</pre>
            </li>
            <li class="license">
                <h3 id="Apache-2.0">Apache License 2.0</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/mheffner/rust-sketches-ddsketch ">sketches-ddsketch 0.3.0</a></li>
                </ul>
                <pre class="license-text">                                 Apache License
                           Version 2.0, January 2004
                        http://www.apache.org/licenses/

   TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION

   1. Definitions.

      &quot;License&quot; shall mean the terms and conditions for use, reproduction,
      and distribution as defined by Sections 1 through 9 of this document.

      &quot;Licensor&quot; shall mean the copyright owner or entity authorized by
      the copyright owner that is granting the License.

      &quot;Legal Entity&quot; shall mean the union of the acting entity and all
      other entities that control, are controlled by, or are under common
      control with that entity. For the purposes of this definition,
      &quot;control&quot; means (i) the power, direct or indirect, to cause the
      direction or management of such entity, whether by contract or
      otherwise, or (ii) ownership of fifty percent (50%) or more of the
      outstanding shares, or (iii) beneficial ownership of such entity.

      &quot;You&quot; (or &quot;Your&quot;) shall mean an individual or Legal Entity
      exercising permissions granted by this License.

      &quot;Source&quot; form shall mean the preferred form for making modifications,
      including but not limited to software source code, documentation
      source, and configuration files.

      &quot;Object&quot; form shall mean any form resulting from mechanical
      transformation or translation of a Source form, including but
      not limited to compiled object code, generated documentation,
      and conversions to other media types.

      &quot;Work&quot; shall mean the work of authorship, whether in Source or
      Object form, made available under the License, as indicated by a
      copyright notice that is included in or attached to the work
      (an example is provided in the Appendix below).

      &quot;Derivative Works&quot; shall mean any work, whether in Source or Object
      form, that is based on (or derived from) the Work and for which the
      editorial revisions, annotations, elaborations, or other modifications
      represent, as a whole, an original work of authorship. For the purposes
      of this License, Derivative Works shall not include works that remain
      separable from, or merely link (or bind by name) to the interfaces of,
      the Work and Derivative Works thereof.

      &quot;Contribution&quot; shall mean any work of authorship, including
      the original version of the Work and any modifications or additions
      to that Work or Derivative Works thereof, that is intentionally
      submitted to Licensor for inclusion in the Work by the copyright owner
      or by an individual or Legal Entity authorized to submit on behalf of
      the copyright owner. For the purposes of this definition, &quot;submitted&quot;
      means any form of electronic, verbal, or written communication sent
      to the Licensor or its representatives, including but not limited to
      communication on electronic mailing lists, source code control systems,
      and issue tracking systems that are managed by, or on behalf of, the
      Licensor for the purpose of discussing and improving the Work, but
      excluding communication that is conspicuously marked or otherwise
      designated in writing by the copyright owner as &quot;Not a Contribution.&quot;

      &quot;Contributor&quot; shall mean Licensor and any individual or Legal Entity
      on behalf of whom a Contribution has been received by Licensor and
      subsequently incorporated within the Work.

   2. Grant of Copyright License. Subject to the terms and conditions of
      this License, each Contributor hereby grants to You a perpetual,
      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
      copyright license to reproduce, prepare Derivative Works of,
      publicly display, publicly perform, sublicense, and distribute the
      Work and such Derivative Works in Source or Object form.

   3. Grant of Patent License. Subject to the terms and conditions of
      this License, each Contributor hereby grants to You a perpetual,
      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
      (except as stated in this section) patent license to make, have made,
      use, offer to sell, sell, import, and otherwise transfer the Work,
      where such license applies only to those patent claims licensable
      by such Contributor that are necessarily infringed by their
      Contribution(s) alone or by combination of their Contribution(s)
      with the Work to which such Contribution(s) was submitted. If You
      institute patent litigation against any entity (including a
      cross-claim or counterclaim in a lawsuit) alleging that the Work
      or a Contribution incorporated within the Work constitutes direct
      or contributory patent infringement, then any patent licenses
      granted to You under this License for that Work shall terminate
      as of the date such litigation is filed.

   4. Redistribution. You may reproduce and distribute copies of the
      Work or Derivative Works thereof in any medium, with or without
      modifications, and in Source or Object form, provided that You
      meet the following conditions:

      (a) You must give any other recipients of the Work or
          Derivative Works a copy of this License; and

      (b) You must cause any modified files to carry prominent notices
          stating that You changed the files; and

      (c) You must retain, in the Source form of any Derivative Works
          that You distribute, all copyright, patent, trademark, and
          attribution notices from the Source form of the Work,
          excluding those notices that do not pertain to any part of
          the Derivative Works; and

      (d) If the Work includes a &quot;NOTICE&quot; text file as part of its
          distribution, then any Derivative Works that You distribute must
          include a readable copy of the attribution notices contained
          within such NOTICE file, excluding those notices that do not
          pertain to any part of the Derivative Works, in at least one
          of the following places: within a NOTICE text file distributed
          as part of the Derivative Works; within the Source form or
          documentation, if provided along with the Derivative Works; or,
          within a display generated by the Derivative Works, if and
          wherever such third-party notices normally appear. The contents
          of the NOTICE file are for informational purposes only and
          do not modify the License. You may add Your own attribution
          notices within Derivative Works that You distribute, alongside
          or as an addendum to the NOTICE text from the Work, provided
          that such additional attribution notices cannot be construed
          as modifying the License.

      You may add Your own copyright statement to Your modifications and
      may provide additional or different license terms and conditions
      for use, reproduction, or distribution of Your modifications, or
      for any such Derivative Works as a whole, provided Your use,
      reproduction, and distribution of the Work otherwise complies with
      the conditions stated in this License.

   5. Submission of Contributions. Unless You explicitly state otherwise,
      any Contribution intentionally submitted for inclusion in the Work
      by You to the Licensor shall be under the terms and conditions of
      this License, without any additional terms or conditions.
      Notwithstanding the above, nothing herein shall supersede or modify
      the terms of any separate license agreement you may have executed
      with Licensor regarding such Contributions.

   6. Trademarks. This License does not grant permission to use the trade
      names, trademarks, service marks, or product names of the Licensor,
      except as required for reasonable and customary use in describing the
      origin of the Work and reproducing the content of the NOTICE file.

   7. Disclaimer of Warranty. Unless required by applicable law or
      agreed to in writing, Licensor provides the Work (and each
      Contributor provides its Contributions) on an &quot;AS IS&quot; BASIS,
      WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
      implied, including, without limitation, any warranties or conditions
      of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
      PARTICULAR PURPOSE. You are solely responsible for determining the
      appropriateness of using or redistributing the Work and assume any
      risks associated with Your exercise of permissions under this License.

   8. Limitation of Liability. In no event and under no legal theory,
      whether in tort (including negligence), contract, or otherwise,
      unless required by applicable law (such as deliberate and grossly
      negligent acts) or agreed to in writing, shall any Contributor be
      liable to You for damages, including any direct, indirect, special,
      incidental, or consequential damages of any character arising as a
      result of this License or out of the use or inability to use the
      Work (including but not limited to damages for loss of goodwill,
      work stoppage, computer failure or malfunction, or any and all
      other commercial damages or losses), even if such Contributor
      has been advised of the possibility of such damages.

   9. Accepting Warranty or Additional Liability. While redistributing
      the Work or Derivative Works thereof, You may choose to offer,
      and charge a fee for, acceptance of support, warranty, indemnity,
      or other liability obligations and/or rights consistent with this
      License. However, in accepting such obligations, You may act only
      on Your own behalf and on Your sole responsibility, not on behalf
      of any other Contributor, and only if You agree to indemnify,
      defend, and hold each Contributor harmless for any liability
      incurred by, or claims asserted against, such Contributor by reason
      of your accepting any such warranty or additional liability.

   END OF TERMS AND CONDITIONS

   APPENDIX: How to apply the Apache License to your work.

      To apply the Apache License to your work, attach the following
      boilerplate notice, with the fields enclosed by brackets &quot;[]&quot;
      replaced with your own identifying information. (Don&#x27;t include
      the brackets!)  The text should be enclosed in the appropriate
      comment syntax for the file format. We also recommend that a
      file or class name and description of purpose be included on the
      same &quot;printed page&quot; as the copyright notice for easier
      identification within third-party archives.

   Copyright [2019] [Mike Heffner]

   Licensed under the Apache License, Version 2.0 (the &quot;License&quot;);
   you may not use this file except in compliance with the License.
   You may obtain a copy of the License at

       http://www.apache.org/licenses/LICENSE-2.0

   Unless required by applicable law or agreed to in writing, software
   distributed under the License is distributed on an &quot;AS IS&quot; BASIS,
   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
   See the License for the specific language governing permissions and
   limitations under the License.
</pre>
            </li>
            <li class="license">
                <h3 id="Apache-2.0">Apache License 2.0</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/juhaku/utoipa ">utoipa-gen 4.3.1</a></li>
                    <li><a href=" https://github.com/juhaku/utoipa ">utoipa 4.2.3</a></li>
                </ul>
                <pre class="license-text">                                 Apache License
                           Version 2.0, January 2004
                        http://www.apache.org/licenses/

   TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION

   1. Definitions.

      &quot;License&quot; shall mean the terms and conditions for use, reproduction,
      and distribution as defined by Sections 1 through 9 of this document.

      &quot;Licensor&quot; shall mean the copyright owner or entity authorized by
      the copyright owner that is granting the License.

      &quot;Legal Entity&quot; shall mean the union of the acting entity and all
      other entities that control, are controlled by, or are under common
      control with that entity. For the purposes of this definition,
      &quot;control&quot; means (i) the power, direct or indirect, to cause the
      direction or management of such entity, whether by contract or
      otherwise, or (ii) ownership of fifty percent (50%) or more of the
      outstanding shares, or (iii) beneficial ownership of such entity.

      &quot;You&quot; (or &quot;Your&quot;) shall mean an individual or Legal Entity
      exercising permissions granted by this License.

      &quot;Source&quot; form shall mean the preferred form for making modifications,
      including but not limited to software source code, documentation
      source, and configuration files.

      &quot;Object&quot; form shall mean any form resulting from mechanical
      transformation or translation of a Source form, including but
      not limited to compiled object code, generated documentation,
      and conversions to other media types.

      &quot;Work&quot; shall mean the work of authorship, whether in Source or
      Object form, made available under the License, as indicated by a
      copyright notice that is included in or attached to the work
      (an example is provided in the Appendix below).

      &quot;Derivative Works&quot; shall mean any work, whether in Source or Object
      form, that is based on (or derived from) the Work and for which the
      editorial revisions, annotations, elaborations, or other modifications
      represent, as a whole, an original work of authorship. For the purposes
      of this License, Derivative Works shall not include works that remain
      separable from, or merely link (or bind by name) to the interfaces of,
      the Work and Derivative Works thereof.

      &quot;Contribution&quot; shall mean any work of authorship, including
      the original version of the Work and any modifications or additions
      to that Work or Derivative Works thereof, that is intentionally
      submitted to Licensor for inclusion in the Work by the copyright owner
      or by an individual or Legal Entity authorized to submit on behalf of
      the copyright owner. For the purposes of this definition, &quot;submitted&quot;
      means any form of electronic, verbal, or written communication sent
      to the Licensor or its representatives, including but not limited to
      communication on electronic mailing lists, source code control systems,
      and issue tracking systems that are managed by, or on behalf of, the
      Licensor for the purpose of discussing and improving the Work, but
      excluding communication that is conspicuously marked or otherwise
      designated in writing by the copyright owner as &quot;Not a Contribution.&quot;

      &quot;Contributor&quot; shall mean Licensor and any individual or Legal Entity
      on behalf of whom a Contribution has been received by Licensor and
      subsequently incorporated within the Work.

   2. Grant of Copyright License. Subject to the terms and conditions of
      this License, each Contributor hereby grants to You a perpetual,
      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
      copyright license to reproduce, prepare Derivative Works of,
      publicly display, publicly perform, sublicense, and distribute the
      Work and such Derivative Works in Source or Object form.

   3. Grant of Patent License. Subject to the terms and conditions of
      this License, each Contributor hereby grants to You a perpetual,
      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
      (except as stated in this section) patent license to make, have made,
      use, offer to sell, sell, import, and otherwise transfer the Work,
      where such license applies only to those patent claims licensable
      by such Contributor that are necessarily infringed by their
      Contribution(s) alone or by combination of their Contribution(s)
      with the Work to which such Contribution(s) was submitted. If You
      institute patent litigation against any entity (including a
      cross-claim or counterclaim in a lawsuit) alleging that the Work
      or a Contribution incorporated within the Work constitutes direct
      or contributory patent infringement, then any patent licenses
      granted to You under this License for that Work shall terminate
      as of the date such litigation is filed.

   4. Redistribution. You may reproduce and distribute copies of the
      Work or Derivative Works thereof in any medium, with or without
      modifications, and in Source or Object form, provided that You
      meet the following conditions:

      (a) You must give any other recipients of the Work or
          Derivative Works a copy of this License; and

      (b) You must cause any modified files to carry prominent notices
          stating that You changed the files; and

      (c) You must retain, in the Source form of any Derivative Works
          that You distribute, all copyright, patent, trademark, and
          attribution notices from the Source form of the Work,
          excluding those notices that do not pertain to any part of
          the Derivative Works; and

      (d) If the Work includes a &quot;NOTICE&quot; text file as part of its
          distribution, then any Derivative Works that You distribute must
          include a readable copy of the attribution notices contained
          within such NOTICE file, excluding those notices that do not
          pertain to any part of the Derivative Works, in at least one
          of the following places: within a NOTICE text file distributed
          as part of the Derivative Works; within the Source form or
          documentation, if provided along with the Derivative Works; or,
          within a display generated by the Derivative Works, if and
          wherever such third-party notices normally appear. The contents
          of the NOTICE file are for informational purposes only and
          do not modify the License. You may add Your own attribution
          notices within Derivative Works that You distribute, alongside
          or as an addendum to the NOTICE text from the Work, provided
          that such additional attribution notices cannot be construed
          as modifying the License.

      You may add Your own copyright statement to Your modifications and
      may provide additional or different license terms and conditions
      for use, reproduction, or distribution of Your modifications, or
      for any such Derivative Works as a whole, provided Your use,
      reproduction, and distribution of the Work otherwise complies with
      the conditions stated in this License.

   5. Submission of Contributions. Unless You explicitly state otherwise,
      any Contribution intentionally submitted for inclusion in the Work
      by You to the Licensor shall be under the terms and conditions of
      this License, without any additional terms or conditions.
      Notwithstanding the above, nothing herein shall supersede or modify
      the terms of any separate license agreement you may have executed
      with Licensor regarding such Contributions.

   6. Trademarks. This License does not grant permission to use the trade
      names, trademarks, service marks, or product names of the Licensor,
      except as required for reasonable and customary use in describing the
      origin of the Work and reproducing the content of the NOTICE file.

   7. Disclaimer of Warranty. Unless required by applicable law or
      agreed to in writing, Licensor provides the Work (and each
      Contributor provides its Contributions) on an &quot;AS IS&quot; BASIS,
      WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
      implied, including, without limitation, any warranties or conditions
      of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
      PARTICULAR PURPOSE. You are solely responsible for determining the
      appropriateness of using or redistributing the Work and assume any
      risks associated with Your exercise of permissions under this License.

   8. Limitation of Liability. In no event and under no legal theory,
      whether in tort (including negligence), contract, or otherwise,
      unless required by applicable law (such as deliberate and grossly
      negligent acts) or agreed to in writing, shall any Contributor be
      liable to You for damages, including any direct, indirect, special,
      incidental, or consequential damages of any character arising as a
      result of this License or out of the use or inability to use the
      Work (including but not limited to damages for loss of goodwill,
      work stoppage, computer failure or malfunction, or any and all
      other commercial damages or losses), even if such Contributor
      has been advised of the possibility of such damages.

   9. Accepting Warranty or Additional Liability. While redistributing
      the Work or Derivative Works thereof, You may choose to offer,
      and charge a fee for, acceptance of support, warranty, indemnity,
      or other liability obligations and/or rights consistent with this
      License. However, in accepting such obligations, You may act only
      on Your own behalf and on Your sole responsibility, not on behalf
      of any other Contributor, and only if You agree to indemnify,
      defend, and hold each Contributor harmless for any liability
      incurred by, or claims asserted against, such Contributor by reason
      of your accepting any such warranty or additional liability.

   END OF TERMS AND CONDITIONS

   APPENDIX: How to apply the Apache License to your work.

      To apply the Apache License to your work, attach the following
      boilerplate notice, with the fields enclosed by brackets &quot;[]&quot;
      replaced with your own identifying information. (Don&#x27;t include
      the brackets!)  The text should be enclosed in the appropriate
      comment syntax for the file format. We also recommend that a
      file or class name and description of purpose be included on the
      same &quot;printed page&quot; as the copyright notice for easier
      identification within third-party archives.

   Copyright [yyyy] [name of copyright owner]

   Licensed under the Apache License, Version 2.0 (the &quot;License&quot;);
   you may not use this file except in compliance with the License.
   You may obtain a copy of the License at

       http://www.apache.org/licenses/LICENSE-2.0

   Unless required by applicable law or agreed to in writing, software
   distributed under the License is distributed on an &quot;AS IS&quot; BASIS,
   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
   See the License for the specific language governing permissions and
   limitations under the License.</pre>
            </li>
            <li class="license">
                <h3 id="Apache-2.0">Apache License 2.0</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/enarx/ciborium ">ciborium-io 0.2.2</a></li>
                    <li><a href=" https://github.com/enarx/ciborium ">ciborium-ll 0.2.2</a></li>
                    <li><a href=" https://github.com/enarx/ciborium ">ciborium 0.2.2</a></li>
                    <li><a href=" https://github.com/clap-rs/clap ">clap_builder 4.5.20</a></li>
                    <li><a href=" https://github.com/clap-rs/clap ">clap_lex 0.7.2</a></li>
                    <li><a href=" https://github.com/vinted/elasticsearch-dsl-rs ">elasticsearch-dsl 0.4.22</a></li>
                    <li><a href=" https://github.com/tmccombs/json-comments-rs ">json_comments 0.2.2</a></li>
                    <li><a href=" https://github.com/MiSawa/time-fmt ">time-fmt 0.3.8</a></li>
                    <li><a href=" https://github.com/cameron1024/unarray ">unarray 0.1.4</a></li>
                </ul>
                <pre class="license-text">                                 Apache License
                           Version 2.0, January 2004
                        http://www.apache.org/licenses/

   TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION

   1. Definitions.

      &quot;License&quot; shall mean the terms and conditions for use, reproduction,
      and distribution as defined by Sections 1 through 9 of this document.

      &quot;Licensor&quot; shall mean the copyright owner or entity authorized by
      the copyright owner that is granting the License.

      &quot;Legal Entity&quot; shall mean the union of the acting entity and all
      other entities that control, are controlled by, or are under common
      control with that entity. For the purposes of this definition,
      &quot;control&quot; means (i) the power, direct or indirect, to cause the
      direction or management of such entity, whether by contract or
      otherwise, or (ii) ownership of fifty percent (50%) or more of the
      outstanding shares, or (iii) beneficial ownership of such entity.

      &quot;You&quot; (or &quot;Your&quot;) shall mean an individual or Legal Entity
      exercising permissions granted by this License.

      &quot;Source&quot; form shall mean the preferred form for making modifications,
      including but not limited to software source code, documentation
      source, and configuration files.

      &quot;Object&quot; form shall mean any form resulting from mechanical
      transformation or translation of a Source form, including but
      not limited to compiled object code, generated documentation,
      and conversions to other media types.

      &quot;Work&quot; shall mean the work of authorship, whether in Source or
      Object form, made available under the License, as indicated by a
      copyright notice that is included in or attached to the work
      (an example is provided in the Appendix below).

      &quot;Derivative Works&quot; shall mean any work, whether in Source or Object
      form, that is based on (or derived from) the Work and for which the
      editorial revisions, annotations, elaborations, or other modifications
      represent, as a whole, an original work of authorship. For the purposes
      of this License, Derivative Works shall not include works that remain
      separable from, or merely link (or bind by name) to the interfaces of,
      the Work and Derivative Works thereof.

      &quot;Contribution&quot; shall mean any work of authorship, including
      the original version of the Work and any modifications or additions
      to that Work or Derivative Works thereof, that is intentionally
      submitted to Licensor for inclusion in the Work by the copyright owner
      or by an individual or Legal Entity authorized to submit on behalf of
      the copyright owner. For the purposes of this definition, &quot;submitted&quot;
      means any form of electronic, verbal, or written communication sent
      to the Licensor or its representatives, including but not limited to
      communication on electronic mailing lists, source code control systems,
      and issue tracking systems that are managed by, or on behalf of, the
      Licensor for the purpose of discussing and improving the Work, but
      excluding communication that is conspicuously marked or otherwise
      designated in writing by the copyright owner as &quot;Not a Contribution.&quot;

      &quot;Contributor&quot; shall mean Licensor and any individual or Legal Entity
      on behalf of whom a Contribution has been received by Licensor and
      subsequently incorporated within the Work.

   2. Grant of Copyright License. Subject to the terms and conditions of
      this License, each Contributor hereby grants to You a perpetual,
      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
      copyright license to reproduce, prepare Derivative Works of,
      publicly display, publicly perform, sublicense, and distribute the
      Work and such Derivative Works in Source or Object form.

   3. Grant of Patent License. Subject to the terms and conditions of
      this License, each Contributor hereby grants to You a perpetual,
      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
      (except as stated in this section) patent license to make, have made,
      use, offer to sell, sell, import, and otherwise transfer the Work,
      where such license applies only to those patent claims licensable
      by such Contributor that are necessarily infringed by their
      Contribution(s) alone or by combination of their Contribution(s)
      with the Work to which such Contribution(s) was submitted. If You
      institute patent litigation against any entity (including a
      cross-claim or counterclaim in a lawsuit) alleging that the Work
      or a Contribution incorporated within the Work constitutes direct
      or contributory patent infringement, then any patent licenses
      granted to You under this License for that Work shall terminate
      as of the date such litigation is filed.

   4. Redistribution. You may reproduce and distribute copies of the
      Work or Derivative Works thereof in any medium, with or without
      modifications, and in Source or Object form, provided that You
      meet the following conditions:

      (a) You must give any other recipients of the Work or
          Derivative Works a copy of this License; and

      (b) You must cause any modified files to carry prominent notices
          stating that You changed the files; and

      (c) You must retain, in the Source form of any Derivative Works
          that You distribute, all copyright, patent, trademark, and
          attribution notices from the Source form of the Work,
          excluding those notices that do not pertain to any part of
          the Derivative Works; and

      (d) If the Work includes a &quot;NOTICE&quot; text file as part of its
          distribution, then any Derivative Works that You distribute must
          include a readable copy of the attribution notices contained
          within such NOTICE file, excluding those notices that do not
          pertain to any part of the Derivative Works, in at least one
          of the following places: within a NOTICE text file distributed
          as part of the Derivative Works; within the Source form or
          documentation, if provided along with the Derivative Works; or,
          within a display generated by the Derivative Works, if and
          wherever such third-party notices normally appear. The contents
          of the NOTICE file are for informational purposes only and
          do not modify the License. You may add Your own attribution
          notices within Derivative Works that You distribute, alongside
          or as an addendum to the NOTICE text from the Work, provided
          that such additional attribution notices cannot be construed
          as modifying the License.

      You may add Your own copyright statement to Your modifications and
      may provide additional or different license terms and conditions
      for use, reproduction, or distribution of Your modifications, or
      for any such Derivative Works as a whole, provided Your use,
      reproduction, and distribution of the Work otherwise complies with
      the conditions stated in this License.

   5. Submission of Contributions. Unless You explicitly state otherwise,
      any Contribution intentionally submitted for inclusion in the Work
      by You to the Licensor shall be under the terms and conditions of
      this License, without any additional terms or conditions.
      Notwithstanding the above, nothing herein shall supersede or modify
      the terms of any separate license agreement you may have executed
      with Licensor regarding such Contributions.

   6. Trademarks. This License does not grant permission to use the trade
      names, trademarks, service marks, or product names of the Licensor,
      except as required for reasonable and customary use in describing the
      origin of the Work and reproducing the content of the NOTICE file.

   7. Disclaimer of Warranty. Unless required by applicable law or
      agreed to in writing, Licensor provides the Work (and each
      Contributor provides its Contributions) on an &quot;AS IS&quot; BASIS,
      WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
      implied, including, without limitation, any warranties or conditions
      of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
      PARTICULAR PURPOSE. You are solely responsible for determining the
      appropriateness of using or redistributing the Work and assume any
      risks associated with Your exercise of permissions under this License.

   8. Limitation of Liability. In no event and under no legal theory,
      whether in tort (including negligence), contract, or otherwise,
      unless required by applicable law (such as deliberate and grossly
      negligent acts) or agreed to in writing, shall any Contributor be
      liable to You for damages, including any direct, indirect, special,
      incidental, or consequential damages of any character arising as a
      result of this License or out of the use or inability to use the
      Work (including but not limited to damages for loss of goodwill,
      work stoppage, computer failure or malfunction, or any and all
      other commercial damages or losses), even if such Contributor
      has been advised of the possibility of such damages.

   9. Accepting Warranty or Additional Liability. While redistributing
      the Work or Derivative Works thereof, You may choose to offer,
      and charge a fee for, acceptance of support, warranty, indemnity,
      or other liability obligations and/or rights consistent with this
      License. However, in accepting such obligations, You may act only
      on Your own behalf and on Your sole responsibility, not on behalf
      of any other Contributor, and only if You agree to indemnify,
      defend, and hold each Contributor harmless for any liability
      incurred by, or claims asserted against, such Contributor by reason
      of your accepting any such warranty or additional liability.

   END OF TERMS AND CONDITIONS

   APPENDIX: How to apply the Apache License to your work.

      To apply the Apache License to your work, attach the following
      boilerplate notice, with the fields enclosed by brackets &quot;[]&quot;
      replaced with your own identifying information. (Don&#x27;t include
      the brackets!)  The text should be enclosed in the appropriate
      comment syntax for the file format. We also recommend that a
      file or class name and description of purpose be included on the
      same &quot;printed page&quot; as the copyright notice for easier
      identification within third-party archives.

   Copyright [yyyy] [name of copyright owner]

   Licensed under the Apache License, Version 2.0 (the &quot;License&quot;);
   you may not use this file except in compliance with the License.
   You may obtain a copy of the License at

       http://www.apache.org/licenses/LICENSE-2.0

   Unless required by applicable law or agreed to in writing, software
   distributed under the License is distributed on an &quot;AS IS&quot; BASIS,
   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
   See the License for the specific language governing permissions and
   limitations under the License.
</pre>
            </li>
            <li class="license">
                <h3 id="Apache-2.0">Apache License 2.0</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/krisprice/ipnet ">ipnet 2.10.1</a></li>
                </ul>
                <pre class="license-text">                                 Apache License
                           Version 2.0, January 2004
                        http://www.apache.org/licenses/

   TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION

   1. Definitions.

      &quot;License&quot; shall mean the terms and conditions for use, reproduction,
      and distribution as defined by Sections 1 through 9 of this document.

      &quot;Licensor&quot; shall mean the copyright owner or entity authorized by
      the copyright owner that is granting the License.

      &quot;Legal Entity&quot; shall mean the union of the acting entity and all
      other entities that control, are controlled by, or are under common
      control with that entity. For the purposes of this definition,
      &quot;control&quot; means (i) the power, direct or indirect, to cause the
      direction or management of such entity, whether by contract or
      otherwise, or (ii) ownership of fifty percent (50%) or more of the
      outstanding shares, or (iii) beneficial ownership of such entity.

      &quot;You&quot; (or &quot;Your&quot;) shall mean an individual or Legal Entity
      exercising permissions granted by this License.

      &quot;Source&quot; form shall mean the preferred form for making modifications,
      including but not limited to software source code, documentation
      source, and configuration files.

      &quot;Object&quot; form shall mean any form resulting from mechanical
      transformation or translation of a Source form, including but
      not limited to compiled object code, generated documentation,
      and conversions to other media types.

      &quot;Work&quot; shall mean the work of authorship, whether in Source or
      Object form, made available under the License, as indicated by a
      copyright notice that is included in or attached to the work
      (an example is provided in the Appendix below).

      &quot;Derivative Works&quot; shall mean any work, whether in Source or Object
      form, that is based on (or derived from) the Work and for which the
      editorial revisions, annotations, elaborations, or other modifications
      represent, as a whole, an original work of authorship. For the purposes
      of this License, Derivative Works shall not include works that remain
      separable from, or merely link (or bind by name) to the interfaces of,
      the Work and Derivative Works thereof.

      &quot;Contribution&quot; shall mean any work of authorship, including
      the original version of the Work and any modifications or additions
      to that Work or Derivative Works thereof, that is intentionally
      submitted to Licensor for inclusion in the Work by the copyright owner
      or by an individual or Legal Entity authorized to submit on behalf of
      the copyright owner. For the purposes of this definition, &quot;submitted&quot;
      means any form of electronic, verbal, or written communication sent
      to the Licensor or its representatives, including but not limited to
      communication on electronic mailing lists, source code control systems,
      and issue tracking systems that are managed by, or on behalf of, the
      Licensor for the purpose of discussing and improving the Work, but
      excluding communication that is conspicuously marked or otherwise
      designated in writing by the copyright owner as &quot;Not a Contribution.&quot;

      &quot;Contributor&quot; shall mean Licensor and any individual or Legal Entity
      on behalf of whom a Contribution has been received by Licensor and
      subsequently incorporated within the Work.

   2. Grant of Copyright License. Subject to the terms and conditions of
      this License, each Contributor hereby grants to You a perpetual,
      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
      copyright license to reproduce, prepare Derivative Works of,
      publicly display, publicly perform, sublicense, and distribute the
      Work and such Derivative Works in Source or Object form.

   3. Grant of Patent License. Subject to the terms and conditions of
      this License, each Contributor hereby grants to You a perpetual,
      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
      (except as stated in this section) patent license to make, have made,
      use, offer to sell, sell, import, and otherwise transfer the Work,
      where such license applies only to those patent claims licensable
      by such Contributor that are necessarily infringed by their
      Contribution(s) alone or by combination of their Contribution(s)
      with the Work to which such Contribution(s) was submitted. If You
      institute patent litigation against any entity (including a
      cross-claim or counterclaim in a lawsuit) alleging that the Work
      or a Contribution incorporated within the Work constitutes direct
      or contributory patent infringement, then any patent licenses
      granted to You under this License for that Work shall terminate
      as of the date such litigation is filed.

   4. Redistribution. You may reproduce and distribute copies of the
      Work or Derivative Works thereof in any medium, with or without
      modifications, and in Source or Object form, provided that You
      meet the following conditions:

      (a) You must give any other recipients of the Work or
          Derivative Works a copy of this License; and

      (b) You must cause any modified files to carry prominent notices
          stating that You changed the files; and

      (c) You must retain, in the Source form of any Derivative Works
          that You distribute, all copyright, patent, trademark, and
          attribution notices from the Source form of the Work,
          excluding those notices that do not pertain to any part of
          the Derivative Works; and

      (d) If the Work includes a &quot;NOTICE&quot; text file as part of its
          distribution, then any Derivative Works that You distribute must
          include a readable copy of the attribution notices contained
          within such NOTICE file, excluding those notices that do not
          pertain to any part of the Derivative Works, in at least one
          of the following places: within a NOTICE text file distributed
          as part of the Derivative Works; within the Source form or
          documentation, if provided along with the Derivative Works; or,
          within a display generated by the Derivative Works, if and
          wherever such third-party notices normally appear. The contents
          of the NOTICE file are for informational purposes only and
          do not modify the License. You may add Your own attribution
          notices within Derivative Works that You distribute, alongside
          or as an addendum to the NOTICE text from the Work, provided
          that such additional attribution notices cannot be construed
          as modifying the License.

      You may add Your own copyright statement to Your modifications and
      may provide additional or different license terms and conditions
      for use, reproduction, or distribution of Your modifications, or
      for any such Derivative Works as a whole, provided Your use,
      reproduction, and distribution of the Work otherwise complies with
      the conditions stated in this License.

   5. Submission of Contributions. Unless You explicitly state otherwise,
      any Contribution intentionally submitted for inclusion in the Work
      by You to the Licensor shall be under the terms and conditions of
      this License, without any additional terms or conditions.
      Notwithstanding the above, nothing herein shall supersede or modify
      the terms of any separate license agreement you may have executed
      with Licensor regarding such Contributions.

   6. Trademarks. This License does not grant permission to use the trade
      names, trademarks, service marks, or product names of the Licensor,
      except as required for reasonable and customary use in describing the
      origin of the Work and reproducing the content of the NOTICE file.

   7. Disclaimer of Warranty. Unless required by applicable law or
      agreed to in writing, Licensor provides the Work (and each
      Contributor provides its Contributions) on an &quot;AS IS&quot; BASIS,
      WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
      implied, including, without limitation, any warranties or conditions
      of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
      PARTICULAR PURPOSE. You are solely responsible for determining the
      appropriateness of using or redistributing the Work and assume any
      risks associated with Your exercise of permissions under this License.

   8. Limitation of Liability. In no event and under no legal theory,
      whether in tort (including negligence), contract, or otherwise,
      unless required by applicable law (such as deliberate and grossly
      negligent acts) or agreed to in writing, shall any Contributor be
      liable to You for damages, including any direct, indirect, special,
      incidental, or consequential damages of any character arising as a
      result of this License or out of the use or inability to use the
      Work (including but not limited to damages for loss of goodwill,
      work stoppage, computer failure or malfunction, or any and all
      other commercial damages or losses), even if such Contributor
      has been advised of the possibility of such damages.

   9. Accepting Warranty or Additional Liability. While redistributing
      the Work or Derivative Works thereof, You may choose to offer,
      and charge a fee for, acceptance of support, warranty, indemnity,
      or other liability obligations and/or rights consistent with this
      License. However, in accepting such obligations, You may act only
      on Your own behalf and on Your sole responsibility, not on behalf
      of any other Contributor, and only if You agree to indemnify,
      defend, and hold each Contributor harmless for any liability
      incurred by, or claims asserted against, such Contributor by reason
      of your accepting any such warranty or additional liability.

   END OF TERMS AND CONDITIONS

   APPENDIX: How to apply the Apache License to your work.

      To apply the Apache License to your work, attach the following
      boilerplate notice, with the fields enclosed by brackets &quot;{}&quot;
      replaced with your own identifying information. (Don&#x27;t include
      the brackets!)  The text should be enclosed in the appropriate
      comment syntax for the file format. We also recommend that a
      file or class name and description of purpose be included on the
      same &quot;printed page&quot; as the copyright notice for easier
      identification within third-party archives.

   Copyright 2017 Juniper Networks, Inc.

   Licensed under the Apache License, Version 2.0 (the &quot;License&quot;);
   you may not use this file except in compliance with the License.
   You may obtain a copy of the License at

       http://www.apache.org/licenses/LICENSE-2.0

   Unless required by applicable law or agreed to in writing, software
   distributed under the License is distributed on an &quot;AS IS&quot; BASIS,
   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
   See the License for the specific language governing permissions and
   limitations under the License.
</pre>
            </li>
            <li class="license">
                <h3 id="Apache-2.0">Apache License 2.0</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/actix/actix-net.git ">bytestring 1.3.1</a></li>
                </ul>
                <pre class="license-text">                                 Apache License
                           Version 2.0, January 2004
                        http://www.apache.org/licenses/

   TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION

   1. Definitions.

      &quot;License&quot; shall mean the terms and conditions for use, reproduction,
      and distribution as defined by Sections 1 through 9 of this document.

      &quot;Licensor&quot; shall mean the copyright owner or entity authorized by
      the copyright owner that is granting the License.

      &quot;Legal Entity&quot; shall mean the union of the acting entity and all
      other entities that control, are controlled by, or are under common
      control with that entity. For the purposes of this definition,
      &quot;control&quot; means (i) the power, direct or indirect, to cause the
      direction or management of such entity, whether by contract or
      otherwise, or (ii) ownership of fifty percent (50%) or more of the
      outstanding shares, or (iii) beneficial ownership of such entity.

      &quot;You&quot; (or &quot;Your&quot;) shall mean an individual or Legal Entity
      exercising permissions granted by this License.

      &quot;Source&quot; form shall mean the preferred form for making modifications,
      including but not limited to software source code, documentation
      source, and configuration files.

      &quot;Object&quot; form shall mean any form resulting from mechanical
      transformation or translation of a Source form, including but
      not limited to compiled object code, generated documentation,
      and conversions to other media types.

      &quot;Work&quot; shall mean the work of authorship, whether in Source or
      Object form, made available under the License, as indicated by a
      copyright notice that is included in or attached to the work
      (an example is provided in the Appendix below).

      &quot;Derivative Works&quot; shall mean any work, whether in Source or Object
      form, that is based on (or derived from) the Work and for which the
      editorial revisions, annotations, elaborations, or other modifications
      represent, as a whole, an original work of authorship. For the purposes
      of this License, Derivative Works shall not include works that remain
      separable from, or merely link (or bind by name) to the interfaces of,
      the Work and Derivative Works thereof.

      &quot;Contribution&quot; shall mean any work of authorship, including
      the original version of the Work and any modifications or additions
      to that Work or Derivative Works thereof, that is intentionally
      submitted to Licensor for inclusion in the Work by the copyright owner
      or by an individual or Legal Entity authorized to submit on behalf of
      the copyright owner. For the purposes of this definition, &quot;submitted&quot;
      means any form of electronic, verbal, or written communication sent
      to the Licensor or its representatives, including but not limited to
      communication on electronic mailing lists, source code control systems,
      and issue tracking systems that are managed by, or on behalf of, the
      Licensor for the purpose of discussing and improving the Work, but
      excluding communication that is conspicuously marked or otherwise
      designated in writing by the copyright owner as &quot;Not a Contribution.&quot;

      &quot;Contributor&quot; shall mean Licensor and any individual or Legal Entity
      on behalf of whom a Contribution has been received by Licensor and
      subsequently incorporated within the Work.

   2. Grant of Copyright License. Subject to the terms and conditions of
      this License, each Contributor hereby grants to You a perpetual,
      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
      copyright license to reproduce, prepare Derivative Works of,
      publicly display, publicly perform, sublicense, and distribute the
      Work and such Derivative Works in Source or Object form.

   3. Grant of Patent License. Subject to the terms and conditions of
      this License, each Contributor hereby grants to You a perpetual,
      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
      (except as stated in this section) patent license to make, have made,
      use, offer to sell, sell, import, and otherwise transfer the Work,
      where such license applies only to those patent claims licensable
      by such Contributor that are necessarily infringed by their
      Contribution(s) alone or by combination of their Contribution(s)
      with the Work to which such Contribution(s) was submitted. If You
      institute patent litigation against any entity (including a
      cross-claim or counterclaim in a lawsuit) alleging that the Work
      or a Contribution incorporated within the Work constitutes direct
      or contributory patent infringement, then any patent licenses
      granted to You under this License for that Work shall terminate
      as of the date such litigation is filed.

   4. Redistribution. You may reproduce and distribute copies of the
      Work or Derivative Works thereof in any medium, with or without
      modifications, and in Source or Object form, provided that You
      meet the following conditions:

      (a) You must give any other recipients of the Work or
          Derivative Works a copy of this License; and

      (b) You must cause any modified files to carry prominent notices
          stating that You changed the files; and

      (c) You must retain, in the Source form of any Derivative Works
          that You distribute, all copyright, patent, trademark, and
          attribution notices from the Source form of the Work,
          excluding those notices that do not pertain to any part of
          the Derivative Works; and

      (d) If the Work includes a &quot;NOTICE&quot; text file as part of its
          distribution, then any Derivative Works that You distribute must
          include a readable copy of the attribution notices contained
          within such NOTICE file, excluding those notices that do not
          pertain to any part of the Derivative Works, in at least one
          of the following places: within a NOTICE text file distributed
          as part of the Derivative Works; within the Source form or
          documentation, if provided along with the Derivative Works; or,
          within a display generated by the Derivative Works, if and
          wherever such third-party notices normally appear. The contents
          of the NOTICE file are for informational purposes only and
          do not modify the License. You may add Your own attribution
          notices within Derivative Works that You distribute, alongside
          or as an addendum to the NOTICE text from the Work, provided
          that such additional attribution notices cannot be construed
          as modifying the License.

      You may add Your own copyright statement to Your modifications and
      may provide additional or different license terms and conditions
      for use, reproduction, or distribution of Your modifications, or
      for any such Derivative Works as a whole, provided Your use,
      reproduction, and distribution of the Work otherwise complies with
      the conditions stated in this License.

   5. Submission of Contributions. Unless You explicitly state otherwise,
      any Contribution intentionally submitted for inclusion in the Work
      by You to the Licensor shall be under the terms and conditions of
      this License, without any additional terms or conditions.
      Notwithstanding the above, nothing herein shall supersede or modify
      the terms of any separate license agreement you may have executed
      with Licensor regarding such Contributions.

   6. Trademarks. This License does not grant permission to use the trade
      names, trademarks, service marks, or product names of the Licensor,
      except as required for reasonable and customary use in describing the
      origin of the Work and reproducing the content of the NOTICE file.

   7. Disclaimer of Warranty. Unless required by applicable law or
      agreed to in writing, Licensor provides the Work (and each
      Contributor provides its Contributions) on an &quot;AS IS&quot; BASIS,
      WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
      implied, including, without limitation, any warranties or conditions
      of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
      PARTICULAR PURPOSE. You are solely responsible for determining the
      appropriateness of using or redistributing the Work and assume any
      risks associated with Your exercise of permissions under this License.

   8. Limitation of Liability. In no event and under no legal theory,
      whether in tort (including negligence), contract, or otherwise,
      unless required by applicable law (such as deliberate and grossly
      negligent acts) or agreed to in writing, shall any Contributor be
      liable to You for damages, including any direct, indirect, special,
      incidental, or consequential damages of any character arising as a
      result of this License or out of the use or inability to use the
      Work (including but not limited to damages for loss of goodwill,
      work stoppage, computer failure or malfunction, or any and all
      other commercial damages or losses), even if such Contributor
      has been advised of the possibility of such damages.

   9. Accepting Warranty or Additional Liability. While redistributing
      the Work or Derivative Works thereof, You may choose to offer,
      and charge a fee for, acceptance of support, warranty, indemnity,
      or other liability obligations and/or rights consistent with this
      License. However, in accepting such obligations, You may act only
      on Your own behalf and on Your sole responsibility, not on behalf
      of any other Contributor, and only if You agree to indemnify,
      defend, and hold each Contributor harmless for any liability
      incurred by, or claims asserted against, such Contributor by reason
      of your accepting any such warranty or additional liability.

   END OF TERMS AND CONDITIONS

   APPENDIX: How to apply the Apache License to your work.

      To apply the Apache License to your work, attach the following
      boilerplate notice, with the fields enclosed by brackets &quot;{}&quot;
      replaced with your own identifying information. (Don&#x27;t include
      the brackets!)  The text should be enclosed in the appropriate
      comment syntax for the file format. We also recommend that a
      file or class name and description of purpose be included on the
      same &quot;printed page&quot; as the copyright notice for easier
      identification within third-party archives.

   Copyright 2017-NOW Actix Team

   Licensed under the Apache License, Version 2.0 (the &quot;License&quot;);
   you may not use this file except in compliance with the License.
   You may obtain a copy of the License at

       http://www.apache.org/licenses/LICENSE-2.0

   Unless required by applicable law or agreed to in writing, software
   distributed under the License is distributed on an &quot;AS IS&quot; BASIS,
   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
   See the License for the specific language governing permissions and
   limitations under the License.
</pre>
            </li>
            <li class="license">
                <h3 id="Apache-2.0">Apache License 2.0</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/bikeshedder/deadpool ">deadpool-runtime 0.1.4</a></li>
                    <li><a href=" https://github.com/bikeshedder/deadpool ">deadpool 0.9.5</a></li>
                </ul>
                <pre class="license-text">                                 Apache License
                           Version 2.0, January 2004
                        http://www.apache.org/licenses/

   TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION

   1. Definitions.

      &quot;License&quot; shall mean the terms and conditions for use, reproduction,
      and distribution as defined by Sections 1 through 9 of this document.

      &quot;Licensor&quot; shall mean the copyright owner or entity authorized by
      the copyright owner that is granting the License.

      &quot;Legal Entity&quot; shall mean the union of the acting entity and all
      other entities that control, are controlled by, or are under common
      control with that entity. For the purposes of this definition,
      &quot;control&quot; means (i) the power, direct or indirect, to cause the
      direction or management of such entity, whether by contract or
      otherwise, or (ii) ownership of fifty percent (50%) or more of the
      outstanding shares, or (iii) beneficial ownership of such entity.

      &quot;You&quot; (or &quot;Your&quot;) shall mean an individual or Legal Entity
      exercising permissions granted by this License.

      &quot;Source&quot; form shall mean the preferred form for making modifications,
      including but not limited to software source code, documentation
      source, and configuration files.

      &quot;Object&quot; form shall mean any form resulting from mechanical
      transformation or translation of a Source form, including but
      not limited to compiled object code, generated documentation,
      and conversions to other media types.

      &quot;Work&quot; shall mean the work of authorship, whether in Source or
      Object form, made available under the License, as indicated by a
      copyright notice that is included in or attached to the work
      (an example is provided in the Appendix below).

      &quot;Derivative Works&quot; shall mean any work, whether in Source or Object
      form, that is based on (or derived from) the Work and for which the
      editorial revisions, annotations, elaborations, or other modifications
      represent, as a whole, an original work of authorship. For the purposes
      of this License, Derivative Works shall not include works that remain
      separable from, or merely link (or bind by name) to the interfaces of,
      the Work and Derivative Works thereof.

      &quot;Contribution&quot; shall mean any work of authorship, including
      the original version of the Work and any modifications or additions
      to that Work or Derivative Works thereof, that is intentionally
      submitted to Licensor for inclusion in the Work by the copyright owner
      or by an individual or Legal Entity authorized to submit on behalf of
      the copyright owner. For the purposes of this definition, &quot;submitted&quot;
      means any form of electronic, verbal, or written communication sent
      to the Licensor or its representatives, including but not limited to
      communication on electronic mailing lists, source code control systems,
      and issue tracking systems that are managed by, or on behalf of, the
      Licensor for the purpose of discussing and improving the Work, but
      excluding communication that is conspicuously marked or otherwise
      designated in writing by the copyright owner as &quot;Not a Contribution.&quot;

      &quot;Contributor&quot; shall mean Licensor and any individual or Legal Entity
      on behalf of whom a Contribution has been received by Licensor and
      subsequently incorporated within the Work.

   2. Grant of Copyright License. Subject to the terms and conditions of
      this License, each Contributor hereby grants to You a perpetual,
      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
      copyright license to reproduce, prepare Derivative Works of,
      publicly display, publicly perform, sublicense, and distribute the
      Work and such Derivative Works in Source or Object form.

   3. Grant of Patent License. Subject to the terms and conditions of
      this License, each Contributor hereby grants to You a perpetual,
      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
      (except as stated in this section) patent license to make, have made,
      use, offer to sell, sell, import, and otherwise transfer the Work,
      where such license applies only to those patent claims licensable
      by such Contributor that are necessarily infringed by their
      Contribution(s) alone or by combination of their Contribution(s)
      with the Work to which such Contribution(s) was submitted. If You
      institute patent litigation against any entity (including a
      cross-claim or counterclaim in a lawsuit) alleging that the Work
      or a Contribution incorporated within the Work constitutes direct
      or contributory patent infringement, then any patent licenses
      granted to You under this License for that Work shall terminate
      as of the date such litigation is filed.

   4. Redistribution. You may reproduce and distribute copies of the
      Work or Derivative Works thereof in any medium, with or without
      modifications, and in Source or Object form, provided that You
      meet the following conditions:

      (a) You must give any other recipients of the Work or
          Derivative Works a copy of this License; and

      (b) You must cause any modified files to carry prominent notices
          stating that You changed the files; and

      (c) You must retain, in the Source form of any Derivative Works
          that You distribute, all copyright, patent, trademark, and
          attribution notices from the Source form of the Work,
          excluding those notices that do not pertain to any part of
          the Derivative Works; and

      (d) If the Work includes a &quot;NOTICE&quot; text file as part of its
          distribution, then any Derivative Works that You distribute must
          include a readable copy of the attribution notices contained
          within such NOTICE file, excluding those notices that do not
          pertain to any part of the Derivative Works, in at least one
          of the following places: within a NOTICE text file distributed
          as part of the Derivative Works; within the Source form or
          documentation, if provided along with the Derivative Works; or,
          within a display generated by the Derivative Works, if and
          wherever such third-party notices normally appear. The contents
          of the NOTICE file are for informational purposes only and
          do not modify the License. You may add Your own attribution
          notices within Derivative Works that You distribute, alongside
          or as an addendum to the NOTICE text from the Work, provided
          that such additional attribution notices cannot be construed
          as modifying the License.

      You may add Your own copyright statement to Your modifications and
      may provide additional or different license terms and conditions
      for use, reproduction, or distribution of Your modifications, or
      for any such Derivative Works as a whole, provided Your use,
      reproduction, and distribution of the Work otherwise complies with
      the conditions stated in this License.

   5. Submission of Contributions. Unless You explicitly state otherwise,
      any Contribution intentionally submitted for inclusion in the Work
      by You to the Licensor shall be under the terms and conditions of
      this License, without any additional terms or conditions.
      Notwithstanding the above, nothing herein shall supersede or modify
      the terms of any separate license agreement you may have executed
      with Licensor regarding such Contributions.

   6. Trademarks. This License does not grant permission to use the trade
      names, trademarks, service marks, or product names of the Licensor,
      except as required for reasonable and customary use in describing the
      origin of the Work and reproducing the content of the NOTICE file.

   7. Disclaimer of Warranty. Unless required by applicable law or
      agreed to in writing, Licensor provides the Work (and each
      Contributor provides its Contributions) on an &quot;AS IS&quot; BASIS,
      WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
      implied, including, without limitation, any warranties or conditions
      of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
      PARTICULAR PURPOSE. You are solely responsible for determining the
      appropriateness of using or redistributing the Work and assume any
      risks associated with Your exercise of permissions under this License.

   8. Limitation of Liability. In no event and under no legal theory,
      whether in tort (including negligence), contract, or otherwise,
      unless required by applicable law (such as deliberate and grossly
      negligent acts) or agreed to in writing, shall any Contributor be
      liable to You for damages, including any direct, indirect, special,
      incidental, or consequential damages of any character arising as a
      result of this License or out of the use or inability to use the
      Work (including but not limited to damages for loss of goodwill,
      work stoppage, computer failure or malfunction, or any and all
      other commercial damages or losses), even if such Contributor
      has been advised of the possibility of such damages.

   9. Accepting Warranty or Additional Liability. While redistributing
      the Work or Derivative Works thereof, You may choose to offer,
      and charge a fee for, acceptance of support, warranty, indemnity,
      or other liability obligations and/or rights consistent with this
      License. However, in accepting such obligations, You may act only
      on Your own behalf and on Your sole responsibility, not on behalf
      of any other Contributor, and only if You agree to indemnify,
      defend, and hold each Contributor harmless for any liability
      incurred by, or claims asserted against, such Contributor by reason
      of your accepting any such warranty or additional liability.

   END OF TERMS AND CONDITIONS

   APPENDIX: How to apply the Apache License to your work.

      To apply the Apache License to your work, attach the following
      boilerplate notice, with the fields enclosed by brackets &quot;{}&quot;
      replaced with your own identifying information. (Don&#x27;t include
      the brackets!)  The text should be enclosed in the appropriate
      comment syntax for the file format. We also recommend that a
      file or class name and description of purpose be included on the
      same &quot;printed page&quot; as the copyright notice for easier
      identification within third-party archives.

   Copyright 2019 Michael P. Jung

   Licensed under the Apache License, Version 2.0 (the &quot;License&quot;);
   you may not use this file except in compliance with the License.
   You may obtain a copy of the License at

       http://www.apache.org/licenses/LICENSE-2.0

   Unless required by applicable law or agreed to in writing, software
   distributed under the License is distributed on an &quot;AS IS&quot; BASIS,
   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
   See the License for the specific language governing permissions and
   limitations under the License.

</pre>
            </li>
            <li class="license">
                <h3 id="Apache-2.0">Apache License 2.0</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/tikv/fail-rs ">fail 0.5.1</a></li>
                    <li><a href=" https://github.com/tikv/rust-prometheus ">prometheus 0.13.4</a></li>
                </ul>
                <pre class="license-text">                                 Apache License
                           Version 2.0, January 2004
                        http://www.apache.org/licenses/

   TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION

   1. Definitions.

      &quot;License&quot; shall mean the terms and conditions for use, reproduction,
      and distribution as defined by Sections 1 through 9 of this document.

      &quot;Licensor&quot; shall mean the copyright owner or entity authorized by
      the copyright owner that is granting the License.

      &quot;Legal Entity&quot; shall mean the union of the acting entity and all
      other entities that control, are controlled by, or are under common
      control with that entity. For the purposes of this definition,
      &quot;control&quot; means (i) the power, direct or indirect, to cause the
      direction or management of such entity, whether by contract or
      otherwise, or (ii) ownership of fifty percent (50%) or more of the
      outstanding shares, or (iii) beneficial ownership of such entity.

      &quot;You&quot; (or &quot;Your&quot;) shall mean an individual or Legal Entity
      exercising permissions granted by this License.

      &quot;Source&quot; form shall mean the preferred form for making modifications,
      including but not limited to software source code, documentation
      source, and configuration files.

      &quot;Object&quot; form shall mean any form resulting from mechanical
      transformation or translation of a Source form, including but
      not limited to compiled object code, generated documentation,
      and conversions to other media types.

      &quot;Work&quot; shall mean the work of authorship, whether in Source or
      Object form, made available under the License, as indicated by a
      copyright notice that is included in or attached to the work
      (an example is provided in the Appendix below).

      &quot;Derivative Works&quot; shall mean any work, whether in Source or Object
      form, that is based on (or derived from) the Work and for which the
      editorial revisions, annotations, elaborations, or other modifications
      represent, as a whole, an original work of authorship. For the purposes
      of this License, Derivative Works shall not include works that remain
      separable from, or merely link (or bind by name) to the interfaces of,
      the Work and Derivative Works thereof.

      &quot;Contribution&quot; shall mean any work of authorship, including
      the original version of the Work and any modifications or additions
      to that Work or Derivative Works thereof, that is intentionally
      submitted to Licensor for inclusion in the Work by the copyright owner
      or by an individual or Legal Entity authorized to submit on behalf of
      the copyright owner. For the purposes of this definition, &quot;submitted&quot;
      means any form of electronic, verbal, or written communication sent
      to the Licensor or its representatives, including but not limited to
      communication on electronic mailing lists, source code control systems,
      and issue tracking systems that are managed by, or on behalf of, the
      Licensor for the purpose of discussing and improving the Work, but
      excluding communication that is conspicuously marked or otherwise
      designated in writing by the copyright owner as &quot;Not a Contribution.&quot;

      &quot;Contributor&quot; shall mean Licensor and any individual or Legal Entity
      on behalf of whom a Contribution has been received by Licensor and
      subsequently incorporated within the Work.

   2. Grant of Copyright License. Subject to the terms and conditions of
      this License, each Contributor hereby grants to You a perpetual,
      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
      copyright license to reproduce, prepare Derivative Works of,
      publicly display, publicly perform, sublicense, and distribute the
      Work and such Derivative Works in Source or Object form.

   3. Grant of Patent License. Subject to the terms and conditions of
      this License, each Contributor hereby grants to You a perpetual,
      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
      (except as stated in this section) patent license to make, have made,
      use, offer to sell, sell, import, and otherwise transfer the Work,
      where such license applies only to those patent claims licensable
      by such Contributor that are necessarily infringed by their
      Contribution(s) alone or by combination of their Contribution(s)
      with the Work to which such Contribution(s) was submitted. If You
      institute patent litigation against any entity (including a
      cross-claim or counterclaim in a lawsuit) alleging that the Work
      or a Contribution incorporated within the Work constitutes direct
      or contributory patent infringement, then any patent licenses
      granted to You under this License for that Work shall terminate
      as of the date such litigation is filed.

   4. Redistribution. You may reproduce and distribute copies of the
      Work or Derivative Works thereof in any medium, with or without
      modifications, and in Source or Object form, provided that You
      meet the following conditions:

      (a) You must give any other recipients of the Work or
          Derivative Works a copy of this License; and

      (b) You must cause any modified files to carry prominent notices
          stating that You changed the files; and

      (c) You must retain, in the Source form of any Derivative Works
          that You distribute, all copyright, patent, trademark, and
          attribution notices from the Source form of the Work,
          excluding those notices that do not pertain to any part of
          the Derivative Works; and

      (d) If the Work includes a &quot;NOTICE&quot; text file as part of its
          distribution, then any Derivative Works that You distribute must
          include a readable copy of the attribution notices contained
          within such NOTICE file, excluding those notices that do not
          pertain to any part of the Derivative Works, in at least one
          of the following places: within a NOTICE text file distributed
          as part of the Derivative Works; within the Source form or
          documentation, if provided along with the Derivative Works; or,
          within a display generated by the Derivative Works, if and
          wherever such third-party notices normally appear. The contents
          of the NOTICE file are for informational purposes only and
          do not modify the License. You may add Your own attribution
          notices within Derivative Works that You distribute, alongside
          or as an addendum to the NOTICE text from the Work, provided
          that such additional attribution notices cannot be construed
          as modifying the License.

      You may add Your own copyright statement to Your modifications and
      may provide additional or different license terms and conditions
      for use, reproduction, or distribution of Your modifications, or
      for any such Derivative Works as a whole, provided Your use,
      reproduction, and distribution of the Work otherwise complies with
      the conditions stated in this License.

   5. Submission of Contributions. Unless You explicitly state otherwise,
      any Contribution intentionally submitted for inclusion in the Work
      by You to the Licensor shall be under the terms and conditions of
      this License, without any additional terms or conditions.
      Notwithstanding the above, nothing herein shall supersede or modify
      the terms of any separate license agreement you may have executed
      with Licensor regarding such Contributions.

   6. Trademarks. This License does not grant permission to use the trade
      names, trademarks, service marks, or product names of the Licensor,
      except as required for reasonable and customary use in describing the
      origin of the Work and reproducing the content of the NOTICE file.

   7. Disclaimer of Warranty. Unless required by applicable law or
      agreed to in writing, Licensor provides the Work (and each
      Contributor provides its Contributions) on an &quot;AS IS&quot; BASIS,
      WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
      implied, including, without limitation, any warranties or conditions
      of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
      PARTICULAR PURPOSE. You are solely responsible for determining the
      appropriateness of using or redistributing the Work and assume any
      risks associated with Your exercise of permissions under this License.

   8. Limitation of Liability. In no event and under no legal theory,
      whether in tort (including negligence), contract, or otherwise,
      unless required by applicable law (such as deliberate and grossly
      negligent acts) or agreed to in writing, shall any Contributor be
      liable to You for damages, including any direct, indirect, special,
      incidental, or consequential damages of any character arising as a
      result of this License or out of the use or inability to use the
      Work (including but not limited to damages for loss of goodwill,
      work stoppage, computer failure or malfunction, or any and all
      other commercial damages or losses), even if such Contributor
      has been advised of the possibility of such damages.

   9. Accepting Warranty or Additional Liability. While redistributing
      the Work or Derivative Works thereof, You may choose to offer,
      and charge a fee for, acceptance of support, warranty, indemnity,
      or other liability obligations and/or rights consistent with this
      License. However, in accepting such obligations, You may act only
      on Your own behalf and on Your sole responsibility, not on behalf
      of any other Contributor, and only if You agree to indemnify,
      defend, and hold each Contributor harmless for any liability
      incurred by, or claims asserted against, such Contributor by reason
      of your accepting any such warranty or additional liability.

   END OF TERMS AND CONDITIONS

   APPENDIX: How to apply the Apache License to your work.

      To apply the Apache License to your work, attach the following
      boilerplate notice, with the fields enclosed by brackets &quot;{}&quot;
      replaced with your own identifying information. (Don&#x27;t include
      the brackets!)  The text should be enclosed in the appropriate
      comment syntax for the file format. We also recommend that a
      file or class name and description of purpose be included on the
      same &quot;printed page&quot; as the copyright notice for easier
      identification within third-party archives.

   Copyright 2019 TiKV Project Authors.

   Licensed under the Apache License, Version 2.0 (the &quot;License&quot;);
   you may not use this file except in compliance with the License.
   You may obtain a copy of the License at

       http://www.apache.org/licenses/LICENSE-2.0

   Unless required by applicable law or agreed to in writing, software
   distributed under the License is distributed on an &quot;AS IS&quot; BASIS,
   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
   See the License for the specific language governing permissions and
   limitations under the License.
</pre>
            </li>
            <li class="license">
                <h3 id="Apache-2.0">Apache License 2.0</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/rust-cli/anstyle.git ">anstyle-parse 0.2.5</a></li>
                    <li><a href=" https://github.com/llogiq/bytecount ">bytecount 0.6.8</a></li>
                    <li><a href=" https://github.com/utkarshkukreti/diff.rs ">diff 0.1.13</a></li>
                    <li><a href=" https://github.com/achanda/ipnetwork ">ipnetwork 0.20.0</a></li>
                    <li><a href=" https://github.com/derekdreery/normalize-line-endings ">normalize-line-endings 0.3.0</a></li>
                    <li><a href=" https://github.com/assert-rs/predicates-rs/tree/master/crates/core ">predicates-core 1.0.8</a></li>
                    <li><a href=" https://github.com/assert-rs/predicates-rs/tree/master/crates/tree ">predicates-tree 1.0.11</a></li>
                    <li><a href=" https://github.com/assert-rs/predicates-rs ">predicates 3.1.2</a></li>
                    <li><a href=" https://github.com/retep998/winapi-rs ">winapi 0.3.9</a></li>
                </ul>
                <pre class="license-text">                                 Apache License
                           Version 2.0, January 2004
                        http://www.apache.org/licenses/

   TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION

   1. Definitions.

      &quot;License&quot; shall mean the terms and conditions for use, reproduction,
      and distribution as defined by Sections 1 through 9 of this document.

      &quot;Licensor&quot; shall mean the copyright owner or entity authorized by
      the copyright owner that is granting the License.

      &quot;Legal Entity&quot; shall mean the union of the acting entity and all
      other entities that control, are controlled by, or are under common
      control with that entity. For the purposes of this definition,
      &quot;control&quot; means (i) the power, direct or indirect, to cause the
      direction or management of such entity, whether by contract or
      otherwise, or (ii) ownership of fifty percent (50%) or more of the
      outstanding shares, or (iii) beneficial ownership of such entity.

      &quot;You&quot; (or &quot;Your&quot;) shall mean an individual or Legal Entity
      exercising permissions granted by this License.

      &quot;Source&quot; form shall mean the preferred form for making modifications,
      including but not limited to software source code, documentation
      source, and configuration files.

      &quot;Object&quot; form shall mean any form resulting from mechanical
      transformation or translation of a Source form, including but
      not limited to compiled object code, generated documentation,
      and conversions to other media types.

      &quot;Work&quot; shall mean the work of authorship, whether in Source or
      Object form, made available under the License, as indicated by a
      copyright notice that is included in or attached to the work
      (an example is provided in the Appendix below).

      &quot;Derivative Works&quot; shall mean any work, whether in Source or Object
      form, that is based on (or derived from) the Work and for which the
      editorial revisions, annotations, elaborations, or other modifications
      represent, as a whole, an original work of authorship. For the purposes
      of this License, Derivative Works shall not include works that remain
      separable from, or merely link (or bind by name) to the interfaces of,
      the Work and Derivative Works thereof.

      &quot;Contribution&quot; shall mean any work of authorship, including
      the original version of the Work and any modifications or additions
      to that Work or Derivative Works thereof, that is intentionally
      submitted to Licensor for inclusion in the Work by the copyright owner
      or by an individual or Legal Entity authorized to submit on behalf of
      the copyright owner. For the purposes of this definition, &quot;submitted&quot;
      means any form of electronic, verbal, or written communication sent
      to the Licensor or its representatives, including but not limited to
      communication on electronic mailing lists, source code control systems,
      and issue tracking systems that are managed by, or on behalf of, the
      Licensor for the purpose of discussing and improving the Work, but
      excluding communication that is conspicuously marked or otherwise
      designated in writing by the copyright owner as &quot;Not a Contribution.&quot;

      &quot;Contributor&quot; shall mean Licensor and any individual or Legal Entity
      on behalf of whom a Contribution has been received by Licensor and
      subsequently incorporated within the Work.

   2. Grant of Copyright License. Subject to the terms and conditions of
      this License, each Contributor hereby grants to You a perpetual,
      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
      copyright license to reproduce, prepare Derivative Works of,
      publicly display, publicly perform, sublicense, and distribute the
      Work and such Derivative Works in Source or Object form.

   3. Grant of Patent License. Subject to the terms and conditions of
      this License, each Contributor hereby grants to You a perpetual,
      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
      (except as stated in this section) patent license to make, have made,
      use, offer to sell, sell, import, and otherwise transfer the Work,
      where such license applies only to those patent claims licensable
      by such Contributor that are necessarily infringed by their
      Contribution(s) alone or by combination of their Contribution(s)
      with the Work to which such Contribution(s) was submitted. If You
      institute patent litigation against any entity (including a
      cross-claim or counterclaim in a lawsuit) alleging that the Work
      or a Contribution incorporated within the Work constitutes direct
      or contributory patent infringement, then any patent licenses
      granted to You under this License for that Work shall terminate
      as of the date such litigation is filed.

   4. Redistribution. You may reproduce and distribute copies of the
      Work or Derivative Works thereof in any medium, with or without
      modifications, and in Source or Object form, provided that You
      meet the following conditions:

      (a) You must give any other recipients of the Work or
          Derivative Works a copy of this License; and

      (b) You must cause any modified files to carry prominent notices
          stating that You changed the files; and

      (c) You must retain, in the Source form of any Derivative Works
          that You distribute, all copyright, patent, trademark, and
          attribution notices from the Source form of the Work,
          excluding those notices that do not pertain to any part of
          the Derivative Works; and

      (d) If the Work includes a &quot;NOTICE&quot; text file as part of its
          distribution, then any Derivative Works that You distribute must
          include a readable copy of the attribution notices contained
          within such NOTICE file, excluding those notices that do not
          pertain to any part of the Derivative Works, in at least one
          of the following places: within a NOTICE text file distributed
          as part of the Derivative Works; within the Source form or
          documentation, if provided along with the Derivative Works; or,
          within a display generated by the Derivative Works, if and
          wherever such third-party notices normally appear. The contents
          of the NOTICE file are for informational purposes only and
          do not modify the License. You may add Your own attribution
          notices within Derivative Works that You distribute, alongside
          or as an addendum to the NOTICE text from the Work, provided
          that such additional attribution notices cannot be construed
          as modifying the License.

      You may add Your own copyright statement to Your modifications and
      may provide additional or different license terms and conditions
      for use, reproduction, or distribution of Your modifications, or
      for any such Derivative Works as a whole, provided Your use,
      reproduction, and distribution of the Work otherwise complies with
      the conditions stated in this License.

   5. Submission of Contributions. Unless You explicitly state otherwise,
      any Contribution intentionally submitted for inclusion in the Work
      by You to the Licensor shall be under the terms and conditions of
      this License, without any additional terms or conditions.
      Notwithstanding the above, nothing herein shall supersede or modify
      the terms of any separate license agreement you may have executed
      with Licensor regarding such Contributions.

   6. Trademarks. This License does not grant permission to use the trade
      names, trademarks, service marks, or product names of the Licensor,
      except as required for reasonable and customary use in describing the
      origin of the Work and reproducing the content of the NOTICE file.

   7. Disclaimer of Warranty. Unless required by applicable law or
      agreed to in writing, Licensor provides the Work (and each
      Contributor provides its Contributions) on an &quot;AS IS&quot; BASIS,
      WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
      implied, including, without limitation, any warranties or conditions
      of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
      PARTICULAR PURPOSE. You are solely responsible for determining the
      appropriateness of using or redistributing the Work and assume any
      risks associated with Your exercise of permissions under this License.

   8. Limitation of Liability. In no event and under no legal theory,
      whether in tort (including negligence), contract, or otherwise,
      unless required by applicable law (such as deliberate and grossly
      negligent acts) or agreed to in writing, shall any Contributor be
      liable to You for damages, including any direct, indirect, special,
      incidental, or consequential damages of any character arising as a
      result of this License or out of the use or inability to use the
      Work (including but not limited to damages for loss of goodwill,
      work stoppage, computer failure or malfunction, or any and all
      other commercial damages or losses), even if such Contributor
      has been advised of the possibility of such damages.

   9. Accepting Warranty or Additional Liability. While redistributing
      the Work or Derivative Works thereof, You may choose to offer,
      and charge a fee for, acceptance of support, warranty, indemnity,
      or other liability obligations and/or rights consistent with this
      License. However, in accepting such obligations, You may act only
      on Your own behalf and on Your sole responsibility, not on behalf
      of any other Contributor, and only if You agree to indemnify,
      defend, and hold each Contributor harmless for any liability
      incurred by, or claims asserted against, such Contributor by reason
      of your accepting any such warranty or additional liability.

   END OF TERMS AND CONDITIONS

   APPENDIX: How to apply the Apache License to your work.

      To apply the Apache License to your work, attach the following
      boilerplate notice, with the fields enclosed by brackets &quot;{}&quot;
      replaced with your own identifying information. (Don&#x27;t include
      the brackets!)  The text should be enclosed in the appropriate
      comment syntax for the file format. We also recommend that a
      file or class name and description of purpose be included on the
      same &quot;printed page&quot; as the copyright notice for easier
      identification within third-party archives.

   Copyright {yyyy} {name of copyright owner}

   Licensed under the Apache License, Version 2.0 (the &quot;License&quot;);
   you may not use this file except in compliance with the License.
   You may obtain a copy of the License at

       http://www.apache.org/licenses/LICENSE-2.0

   Unless required by applicable law or agreed to in writing, software
   distributed under the License is distributed on an &quot;AS IS&quot; BASIS,
   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
   See the License for the specific language governing permissions and
   limitations under the License.
</pre>
            </li>
            <li class="license">
                <h3 id="Apache-2.0">Apache License 2.0</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/rust-cli/anstyle.git ">anstream 0.6.15</a></li>
                    <li><a href=" https://github.com/rust-cli/anstyle ">anstyle-query 1.1.1</a></li>
                    <li><a href=" https://github.com/rust-cli/anstyle.git ">anstyle-wincon 3.0.4</a></li>
                    <li><a href=" https://github.com/rust-cli/anstyle.git ">anstyle 1.0.8</a></li>
                    <li><a href=" https://github.com/hyunsik/bytesize/ ">bytesize 1.3.0</a></li>
                    <li><a href=" https://github.com/clap-rs/clap ">clap 4.5.20</a></li>
                    <li><a href=" https://github.com/jamesmunns/cobs.rs ">cobs 0.2.3</a></li>
                    <li><a href=" https://github.com/rust-cli/anstyle ">colorchoice 1.0.2</a></li>
                    <li><a href=" https://github.com/srijs/rust-crc32fast ">crc32fast 1.4.2</a></li>
                    <li><a href=" https://github.com/rust-cli/env_logger ">env_logger 0.10.2</a></li>
                    <li><a href=" https://github.com/KokaKiwi/rust-hex ">hex 0.4.3</a></li>
                    <li><a href=" https://github.com/tailhook/humantime ">humantime 2.1.0</a></li>
                    <li><a href=" https://github.com/polyfill-rs/is_terminal_polyfill ">is_terminal_polyfill 1.70.1</a></li>
                    <li><a href=" https://github.com/rust-pretty-assertions/rust-pretty-assertions ">pretty_assertions 1.4.1</a></li>
                    <li><a href=" http://github.com/tailhook/quick-error ">quick-error 1.2.3</a></li>
                    <li><a href=" https://github.com/toml-rs/toml ">serde_spanned 0.6.8</a></li>
                    <li><a href=" https://github.com/sfackler/tokio-io-timeout ">tokio-io-timeout 1.2.0</a></li>
                    <li><a href=" https://github.com/toml-rs/toml ">toml 0.7.8</a></li>
                    <li><a href=" https://github.com/toml-rs/toml ">toml_datetime 0.6.8</a></li>
                    <li><a href=" https://github.com/toml-rs/toml ">toml_edit 0.19.15</a></li>
                    <li><a href=" https://github.com/stusmall/ttl_cache ">ttl_cache 0.5.1</a></li>
                </ul>
                <pre class="license-text">                                 Apache License
                           Version 2.0, January 2004
                        http://www.apache.org/licenses/

   TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION

   1. Definitions.

      &quot;License&quot; shall mean the terms and conditions for use, reproduction,
      and distribution as defined by Sections 1 through 9 of this document.

      &quot;Licensor&quot; shall mean the copyright owner or entity authorized by
      the copyright owner that is granting the License.

      &quot;Legal Entity&quot; shall mean the union of the acting entity and all
      other entities that control, are controlled by, or are under common
      control with that entity. For the purposes of this definition,
      &quot;control&quot; means (i) the power, direct or indirect, to cause the
      direction or management of such entity, whether by contract or
      otherwise, or (ii) ownership of fifty percent (50%) or more of the
      outstanding shares, or (iii) beneficial ownership of such entity.

      &quot;You&quot; (or &quot;Your&quot;) shall mean an individual or Legal Entity
      exercising permissions granted by this License.

      &quot;Source&quot; form shall mean the preferred form for making modifications,
      including but not limited to software source code, documentation
      source, and configuration files.

      &quot;Object&quot; form shall mean any form resulting from mechanical
      transformation or translation of a Source form, including but
      not limited to compiled object code, generated documentation,
      and conversions to other media types.

      &quot;Work&quot; shall mean the work of authorship, whether in Source or
      Object form, made available under the License, as indicated by a
      copyright notice that is included in or attached to the work
      (an example is provided in the Appendix below).

      &quot;Derivative Works&quot; shall mean any work, whether in Source or Object
      form, that is based on (or derived from) the Work and for which the
      editorial revisions, annotations, elaborations, or other modifications
      represent, as a whole, an original work of authorship. For the purposes
      of this License, Derivative Works shall not include works that remain
      separable from, or merely link (or bind by name) to the interfaces of,
      the Work and Derivative Works thereof.

      &quot;Contribution&quot; shall mean any work of authorship, including
      the original version of the Work and any modifications or additions
      to that Work or Derivative Works thereof, that is intentionally
      submitted to Licensor for inclusion in the Work by the copyright owner
      or by an individual or Legal Entity authorized to submit on behalf of
      the copyright owner. For the purposes of this definition, &quot;submitted&quot;
      means any form of electronic, verbal, or written communication sent
      to the Licensor or its representatives, including but not limited to
      communication on electronic mailing lists, source code control systems,
      and issue tracking systems that are managed by, or on behalf of, the
      Licensor for the purpose of discussing and improving the Work, but
      excluding communication that is conspicuously marked or otherwise
      designated in writing by the copyright owner as &quot;Not a Contribution.&quot;

      &quot;Contributor&quot; shall mean Licensor and any individual or Legal Entity
      on behalf of whom a Contribution has been received by Licensor and
      subsequently incorporated within the Work.

   2. Grant of Copyright License. Subject to the terms and conditions of
      this License, each Contributor hereby grants to You a perpetual,
      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
      copyright license to reproduce, prepare Derivative Works of,
      publicly display, publicly perform, sublicense, and distribute the
      Work and such Derivative Works in Source or Object form.

   3. Grant of Patent License. Subject to the terms and conditions of
      this License, each Contributor hereby grants to You a perpetual,
      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
      (except as stated in this section) patent license to make, have made,
      use, offer to sell, sell, import, and otherwise transfer the Work,
      where such license applies only to those patent claims licensable
      by such Contributor that are necessarily infringed by their
      Contribution(s) alone or by combination of their Contribution(s)
      with the Work to which such Contribution(s) was submitted. If You
      institute patent litigation against any entity (including a
      cross-claim or counterclaim in a lawsuit) alleging that the Work
      or a Contribution incorporated within the Work constitutes direct
      or contributory patent infringement, then any patent licenses
      granted to You under this License for that Work shall terminate
      as of the date such litigation is filed.

   4. Redistribution. You may reproduce and distribute copies of the
      Work or Derivative Works thereof in any medium, with or without
      modifications, and in Source or Object form, provided that You
      meet the following conditions:

      (a) You must give any other recipients of the Work or
          Derivative Works a copy of this License; and

      (b) You must cause any modified files to carry prominent notices
          stating that You changed the files; and

      (c) You must retain, in the Source form of any Derivative Works
          that You distribute, all copyright, patent, trademark, and
          attribution notices from the Source form of the Work,
          excluding those notices that do not pertain to any part of
          the Derivative Works; and

      (d) If the Work includes a &quot;NOTICE&quot; text file as part of its
          distribution, then any Derivative Works that You distribute must
          include a readable copy of the attribution notices contained
          within such NOTICE file, excluding those notices that do not
          pertain to any part of the Derivative Works, in at least one
          of the following places: within a NOTICE text file distributed
          as part of the Derivative Works; within the Source form or
          documentation, if provided along with the Derivative Works; or,
          within a display generated by the Derivative Works, if and
          wherever such third-party notices normally appear. The contents
          of the NOTICE file are for informational purposes only and
          do not modify the License. You may add Your own attribution
          notices within Derivative Works that You distribute, alongside
          or as an addendum to the NOTICE text from the Work, provided
          that such additional attribution notices cannot be construed
          as modifying the License.

      You may add Your own copyright statement to Your modifications and
      may provide additional or different license terms and conditions
      for use, reproduction, or distribution of Your modifications, or
      for any such Derivative Works as a whole, provided Your use,
      reproduction, and distribution of the Work otherwise complies with
      the conditions stated in this License.

   5. Submission of Contributions. Unless You explicitly state otherwise,
      any Contribution intentionally submitted for inclusion in the Work
      by You to the Licensor shall be under the terms and conditions of
      this License, without any additional terms or conditions.
      Notwithstanding the above, nothing herein shall supersede or modify
      the terms of any separate license agreement you may have executed
      with Licensor regarding such Contributions.

   6. Trademarks. This License does not grant permission to use the trade
      names, trademarks, service marks, or product names of the Licensor,
      except as required for reasonable and customary use in describing the
      origin of the Work and reproducing the content of the NOTICE file.

   7. Disclaimer of Warranty. Unless required by applicable law or
      agreed to in writing, Licensor provides the Work (and each
      Contributor provides its Contributions) on an &quot;AS IS&quot; BASIS,
      WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
      implied, including, without limitation, any warranties or conditions
      of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
      PARTICULAR PURPOSE. You are solely responsible for determining the
      appropriateness of using or redistributing the Work and assume any
      risks associated with Your exercise of permissions under this License.

   8. Limitation of Liability. In no event and under no legal theory,
      whether in tort (including negligence), contract, or otherwise,
      unless required by applicable law (such as deliberate and grossly
      negligent acts) or agreed to in writing, shall any Contributor be
      liable to You for damages, including any direct, indirect, special,
      incidental, or consequential damages of any character arising as a
      result of this License or out of the use or inability to use the
      Work (including but not limited to damages for loss of goodwill,
      work stoppage, computer failure or malfunction, or any and all
      other commercial damages or losses), even if such Contributor
      has been advised of the possibility of such damages.

   9. Accepting Warranty or Additional Liability. While redistributing
      the Work or Derivative Works thereof, You may choose to offer,
      and charge a fee for, acceptance of support, warranty, indemnity,
      or other liability obligations and/or rights consistent with this
      License. However, in accepting such obligations, You may act only
      on Your own behalf and on Your sole responsibility, not on behalf
      of any other Contributor, and only if You agree to indemnify,
      defend, and hold each Contributor harmless for any liability
      incurred by, or claims asserted against, such Contributor by reason
      of your accepting any such warranty or additional liability.

   END OF TERMS AND CONDITIONS

   APPENDIX: How to apply the Apache License to your work.

      To apply the Apache License to your work, attach the following
      boilerplate notice, with the fields enclosed by brackets &quot;{}&quot;
      replaced with your own identifying information. (Don&#x27;t include
      the brackets!)  The text should be enclosed in the appropriate
      comment syntax for the file format. We also recommend that a
      file or class name and description of purpose be included on the
      same &quot;printed page&quot; as the copyright notice for easier
      identification within third-party archives.

   Copyright {yyyy} {name of copyright owner}

   Licensed under the Apache License, Version 2.0 (the &quot;License&quot;);
   you may not use this file except in compliance with the License.
   You may obtain a copy of the License at

       http://www.apache.org/licenses/LICENSE-2.0

   Unless required by applicable law or agreed to in writing, software
   distributed under the License is distributed on an &quot;AS IS&quot; BASIS,
   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
   See the License for the specific language governing permissions and
   limitations under the License.

</pre>
            </li>
            <li class="license">
                <h3 id="Apache-2.0">Apache License 2.0</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/http-rs/http-types ">http-types 2.12.0</a></li>
                </ul>
                <pre class="license-text">                                 Apache License
                           Version 2.0, January 2004
                        http://www.apache.org/licenses/

   TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION

   1. Definitions.

      &quot;License&quot; shall mean the terms and conditions for use, reproduction,
      and distribution as defined by Sections 1 through 9 of this document.

      &quot;Licensor&quot; shall mean the copyright owner or entity authorized by
      the copyright owner that is granting the License.

      &quot;Legal Entity&quot; shall mean the union of the acting entity and all
      other entities that control, are controlled by, or are under common
      control with that entity. For the purposes of this definition,
      &quot;control&quot; means (i) the power, direct or indirect, to cause the
      direction or management of such entity, whether by contract or
      otherwise, or (ii) ownership of fifty percent (50%) or more of the
      outstanding shares, or (iii) beneficial ownership of such entity.

      &quot;You&quot; (or &quot;Your&quot;) shall mean an individual or Legal Entity
      exercising permissions granted by this License.

      &quot;Source&quot; form shall mean the preferred form for making modifications,
      including but not limited to software source code, documentation
      source, and configuration files.

      &quot;Object&quot; form shall mean any form resulting from mechanical
      transformation or translation of a Source form, including but
      not limited to compiled object code, generated documentation,
      and conversions to other media types.

      &quot;Work&quot; shall mean the work of authorship, whether in Source or
      Object form, made available under the License, as indicated by a
      copyright notice that is included in or attached to the work
      (an example is provided in the Appendix below).

      &quot;Derivative Works&quot; shall mean any work, whether in Source or Object
      form, that is based on (or derived from) the Work and for which the
      editorial revisions, annotations, elaborations, or other modifications
      represent, as a whole, an original work of authorship. For the purposes
      of this License, Derivative Works shall not include works that remain
      separable from, or merely link (or bind by name) to the interfaces of,
      the Work and Derivative Works thereof.

      &quot;Contribution&quot; shall mean any work of authorship, including
      the original version of the Work and any modifications or additions
      to that Work or Derivative Works thereof, that is intentionally
      submitted to Licensor for inclusion in the Work by the copyright owner
      or by an individual or Legal Entity authorized to submit on behalf of
      the copyright owner. For the purposes of this definition, &quot;submitted&quot;
      means any form of electronic, verbal, or written communication sent
      to the Licensor or its representatives, including but not limited to
      communication on electronic mailing lists, source code control systems,
      and issue tracking systems that are managed by, or on behalf of, the
      Licensor for the purpose of discussing and improving the Work, but
      excluding communication that is conspicuously marked or otherwise
      designated in writing by the copyright owner as &quot;Not a Contribution.&quot;

      &quot;Contributor&quot; shall mean Licensor and any individual or Legal Entity
      on behalf of whom a Contribution has been received by Licensor and
      subsequently incorporated within the Work.

   2. Grant of Copyright License. Subject to the terms and conditions of
      this License, each Contributor hereby grants to You a perpetual,
      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
      copyright license to reproduce, prepare Derivative Works of,
      publicly display, publicly perform, sublicense, and distribute the
      Work and such Derivative Works in Source or Object form.

   3. Grant of Patent License. Subject to the terms and conditions of
      this License, each Contributor hereby grants to You a perpetual,
      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
      (except as stated in this section) patent license to make, have made,
      use, offer to sell, sell, import, and otherwise transfer the Work,
      where such license applies only to those patent claims licensable
      by such Contributor that are necessarily infringed by their
      Contribution(s) alone or by combination of their Contribution(s)
      with the Work to which such Contribution(s) was submitted. If You
      institute patent litigation against any entity (including a
      cross-claim or counterclaim in a lawsuit) alleging that the Work
      or a Contribution incorporated within the Work constitutes direct
      or contributory patent infringement, then any patent licenses
      granted to You under this License for that Work shall terminate
      as of the date such litigation is filed.

   4. Redistribution. You may reproduce and distribute copies of the
      Work or Derivative Works thereof in any medium, with or without
      modifications, and in Source or Object form, provided that You
      meet the following conditions:

      (a) You must give any other recipients of the Work or
          Derivative Works a copy of this License; and

      (b) You must cause any modified files to carry prominent notices
          stating that You changed the files; and

      (c) You must retain, in the Source form of any Derivative Works
          that You distribute, all copyright, patent, trademark, and
          attribution notices from the Source form of the Work,
          excluding those notices that do not pertain to any part of
          the Derivative Works; and

      (d) If the Work includes a &quot;NOTICE&quot; text file as part of its
          distribution, then any Derivative Works that You distribute must
          include a readable copy of the attribution notices contained
          within such NOTICE file, excluding those notices that do not
          pertain to any part of the Derivative Works, in at least one
          of the following places: within a NOTICE text file distributed
          as part of the Derivative Works; within the Source form or
          documentation, if provided along with the Derivative Works; or,
          within a display generated by the Derivative Works, if and
          wherever such third-party notices normally appear. The contents
          of the NOTICE file are for informational purposes only and
          do not modify the License. You may add Your own attribution
          notices within Derivative Works that You distribute, alongside
          or as an addendum to the NOTICE text from the Work, provided
          that such additional attribution notices cannot be construed
          as modifying the License.

      You may add Your own copyright statement to Your modifications and
      may provide additional or different license terms and conditions
      for use, reproduction, or distribution of Your modifications, or
      for any such Derivative Works as a whole, provided Your use,
      reproduction, and distribution of the Work otherwise complies with
      the conditions stated in this License.

   5. Submission of Contributions. Unless You explicitly state otherwise,
      any Contribution intentionally submitted for inclusion in the Work
      by You to the Licensor shall be under the terms and conditions of
      this License, without any additional terms or conditions.
      Notwithstanding the above, nothing herein shall supersede or modify
      the terms of any separate license agreement you may have executed
      with Licensor regarding such Contributions.

   6. Trademarks. This License does not grant permission to use the trade
      names, trademarks, service marks, or product names of the Licensor,
      except as required for reasonable and customary use in describing the
      origin of the Work and reproducing the content of the NOTICE file.

   7. Disclaimer of Warranty. Unless required by applicable law or
      agreed to in writing, Licensor provides the Work (and each
      Contributor provides its Contributions) on an &quot;AS IS&quot; BASIS,
      WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
      implied, including, without limitation, any warranties or conditions
      of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
      PARTICULAR PURPOSE. You are solely responsible for determining the
      appropriateness of using or redistributing the Work and assume any
      risks associated with Your exercise of permissions under this License.

   8. Limitation of Liability. In no event and under no legal theory,
      whether in tort (including negligence), contract, or otherwise,
      unless required by applicable law (such as deliberate and grossly
      negligent acts) or agreed to in writing, shall any Contributor be
      liable to You for damages, including any direct, indirect, special,
      incidental, or consequential damages of any character arising as a
      result of this License or out of the use or inability to use the
      Work (including but not limited to damages for loss of goodwill,
      work stoppage, computer failure or malfunction, or any and all
      other commercial damages or losses), even if such Contributor
      has been advised of the possibility of such damages.

   9. Accepting Warranty or Additional Liability. While redistributing
      the Work or Derivative Works thereof, You may choose to offer,
      and charge a fee for, acceptance of support, warranty, indemnity,
      or other liability obligations and/or rights consistent with this
      License. However, in accepting such obligations, You may act only
      on Your own behalf and on Your sole responsibility, not on behalf
      of any other Contributor, and only if You agree to indemnify,
      defend, and hold each Contributor harmless for any liability
      incurred by, or claims asserted against, such Contributor by reason
      of your accepting any such warranty or additional liability.

   END OF TERMS AND CONDITIONS

   Copyright 2019 Yoshua Wuyts
   Copyright 2016-2018 Michael Tilli (Pyfisch) &amp; &#x60;httpdate&#x60; contributors

   Licensed under the Apache License, Version 2.0 (the &quot;License&quot;);
   you may not use this file except in compliance with the License.
   You may obtain a copy of the License at

       http://www.apache.org/licenses/LICENSE-2.0

   Unless required by applicable law or agreed to in writing, software
   distributed under the License is distributed on an &quot;AS IS&quot; BASIS,
   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
   See the License for the specific language governing permissions and
   limitations under the License.
</pre>
            </li>
            <li class="license">
                <h3 id="Apache-2.0">Apache License 2.0</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/wvwwvwwv/scalable-concurrent-containers/ ">scc 2.2.0</a></li>
                </ul>
                <pre class="license-text">                                 Apache License
                           Version 2.0, January 2004
                        http://www.apache.org/licenses/

   TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION

   1. Definitions.

      &quot;License&quot; shall mean the terms and conditions for use, reproduction,
      and distribution as defined by Sections 1 through 9 of this document.

      &quot;Licensor&quot; shall mean the copyright owner or entity authorized by
      the copyright owner that is granting the License.

      &quot;Legal Entity&quot; shall mean the union of the acting entity and all
      other entities that control, are controlled by, or are under common
      control with that entity. For the purposes of this definition,
      &quot;control&quot; means (i) the power, direct or indirect, to cause the
      direction or management of such entity, whether by contract or
      otherwise, or (ii) ownership of fifty percent (50%) or more of the
      outstanding shares, or (iii) beneficial ownership of such entity.

      &quot;You&quot; (or &quot;Your&quot;) shall mean an individual or Legal Entity
      exercising permissions granted by this License.

      &quot;Source&quot; form shall mean the preferred form for making modifications,
      including but not limited to software source code, documentation
      source, and configuration files.

      &quot;Object&quot; form shall mean any form resulting from mechanical
      transformation or translation of a Source form, including but
      not limited to compiled object code, generated documentation,
      and conversions to other media types.

      &quot;Work&quot; shall mean the work of authorship, whether in Source or
      Object form, made available under the License, as indicated by a
      copyright notice that is included in or attached to the work
      (an example is provided in the Appendix below).

      &quot;Derivative Works&quot; shall mean any work, whether in Source or Object
      form, that is based on (or derived from) the Work and for which the
      editorial revisions, annotations, elaborations, or other modifications
      represent, as a whole, an original work of authorship. For the purposes
      of this License, Derivative Works shall not include works that remain
      separable from, or merely link (or bind by name) to the interfaces of,
      the Work and Derivative Works thereof.

      &quot;Contribution&quot; shall mean any work of authorship, including
      the original version of the Work and any modifications or additions
      to that Work or Derivative Works thereof, that is intentionally
      submitted to Licensor for inclusion in the Work by the copyright owner
      or by an individual or Legal Entity authorized to submit on behalf of
      the copyright owner. For the purposes of this definition, &quot;submitted&quot;
      means any form of electronic, verbal, or written communication sent
      to the Licensor or its representatives, including but not limited to
      communication on electronic mailing lists, source code control systems,
      and issue tracking systems that are managed by, or on behalf of, the
      Licensor for the purpose of discussing and improving the Work, but
      excluding communication that is conspicuously marked or otherwise
      designated in writing by the copyright owner as &quot;Not a Contribution.&quot;

      &quot;Contributor&quot; shall mean Licensor and any individual or Legal Entity
      on behalf of whom a Contribution has been received by Licensor and
      subsequently incorporated within the Work.

   2. Grant of Copyright License. Subject to the terms and conditions of
      this License, each Contributor hereby grants to You a perpetual,
      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
      copyright license to reproduce, prepare Derivative Works of,
      publicly display, publicly perform, sublicense, and distribute the
      Work and such Derivative Works in Source or Object form.

   3. Grant of Patent License. Subject to the terms and conditions of
      this License, each Contributor hereby grants to You a perpetual,
      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
      (except as stated in this section) patent license to make, have made,
      use, offer to sell, sell, import, and otherwise transfer the Work,
      where such license applies only to those patent claims licensable
      by such Contributor that are necessarily infringed by their
      Contribution(s) alone or by combination of their Contribution(s)
      with the Work to which such Contribution(s) was submitted. If You
      institute patent litigation against any entity (including a
      cross-claim or counterclaim in a lawsuit) alleging that the Work
      or a Contribution incorporated within the Work constitutes direct
      or contributory patent infringement, then any patent licenses
      granted to You under this License for that Work shall terminate
      as of the date such litigation is filed.

   4. Redistribution. You may reproduce and distribute copies of the
      Work or Derivative Works thereof in any medium, with or without
      modifications, and in Source or Object form, provided that You
      meet the following conditions:

      (a) You must give any other recipients of the Work or
          Derivative Works a copy of this License; and

      (b) You must cause any modified files to carry prominent notices
          stating that You changed the files; and

      (c) You must retain, in the Source form of any Derivative Works
          that You distribute, all copyright, patent, trademark, and
          attribution notices from the Source form of the Work,
          excluding those notices that do not pertain to any part of
          the Derivative Works; and

      (d) If the Work includes a &quot;NOTICE&quot; text file as part of its
          distribution, then any Derivative Works that You distribute must
          include a readable copy of the attribution notices contained
          within such NOTICE file, excluding those notices that do not
          pertain to any part of the Derivative Works, in at least one
          of the following places: within a NOTICE text file distributed
          as part of the Derivative Works; within the Source form or
          documentation, if provided along with the Derivative Works; or,
          within a display generated by the Derivative Works, if and
          wherever such third-party notices normally appear. The contents
          of the NOTICE file are for informational purposes only and
          do not modify the License. You may add Your own attribution
          notices within Derivative Works that You distribute, alongside
          or as an addendum to the NOTICE text from the Work, provided
          that such additional attribution notices cannot be construed
          as modifying the License.

      You may add Your own copyright statement to Your modifications and
      may provide additional or different license terms and conditions
      for use, reproduction, or distribution of Your modifications, or
      for any such Derivative Works as a whole, provided Your use,
      reproduction, and distribution of the Work otherwise complies with
      the conditions stated in this License.

   5. Submission of Contributions. Unless You explicitly state otherwise,
      any Contribution intentionally submitted for inclusion in the Work
      by You to the Licensor shall be under the terms and conditions of
      this License, without any additional terms or conditions.
      Notwithstanding the above, nothing herein shall supersede or modify
      the terms of any separate license agreement you may have executed
      with Licensor regarding such Contributions.

   6. Trademarks. This License does not grant permission to use the trade
      names, trademarks, service marks, or product names of the Licensor,
      except as required for reasonable and customary use in describing the
      origin of the Work and reproducing the content of the NOTICE file.

   7. Disclaimer of Warranty. Unless required by applicable law or
      agreed to in writing, Licensor provides the Work (and each
      Contributor provides its Contributions) on an &quot;AS IS&quot; BASIS,
      WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
      implied, including, without limitation, any warranties or conditions
      of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
      PARTICULAR PURPOSE. You are solely responsible for determining the
      appropriateness of using or redistributing the Work and assume any
      risks associated with Your exercise of permissions under this License.

   8. Limitation of Liability. In no event and under no legal theory,
      whether in tort (including negligence), contract, or otherwise,
      unless required by applicable law (such as deliberate and grossly
      negligent acts) or agreed to in writing, shall any Contributor be
      liable to You for damages, including any direct, indirect, special,
      incidental, or consequential damages of any character arising as a
      result of this License or out of the use or inability to use the
      Work (including but not limited to damages for loss of goodwill,
      work stoppage, computer failure or malfunction, or any and all
      other commercial damages or losses), even if such Contributor
      has been advised of the possibility of such damages.

   9. Accepting Warranty or Additional Liability. While redistributing
      the Work or Derivative Works thereof, You may choose to offer,
      and charge a fee for, acceptance of support, warranty, indemnity,
      or other liability obligations and/or rights consistent with this
      License. However, in accepting such obligations, You may act only
      on Your own behalf and on Your sole responsibility, not on behalf
      of any other Contributor, and only if You agree to indemnify,
      defend, and hold each Contributor harmless for any liability
      incurred by, or claims asserted against, such Contributor by reason
      of your accepting any such warranty or additional liability.

   END OF TERMS AND CONDITIONS

   Copyright 2020-2024 Changgyoo Park

   Licensed under the Apache License, Version 2.0 (the &quot;License&quot;);
   you may not use this file except in compliance with the License.
   You may obtain a copy of the License at

       http://www.apache.org/licenses/LICENSE-2.0

   Unless required by applicable law or agreed to in writing, software
   distributed under the License is distributed on an &quot;AS IS&quot; BASIS,
   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
   See the License for the specific language governing permissions and
   limitations under the License.
</pre>
            </li>
            <li class="license">
                <h3 id="Apache-2.0">Apache License 2.0</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/RumovZ/android-tzdata ">android-tzdata 0.1.1</a></li>
                </ul>
                <pre class="license-text">                                 Apache License
                           Version 2.0, January 2004
                        http://www.apache.org/licenses/

TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION

1.  Definitions.

    &quot;License&quot; shall mean the terms and conditions for use, reproduction,
    and distribution as defined by Sections 1 through 9 of this document.

    &quot;Licensor&quot; shall mean the copyright owner or entity authorized by
    the copyright owner that is granting the License.

    &quot;Legal Entity&quot; shall mean the union of the acting entity and all
    other entities that control, are controlled by, or are under common
    control with that entity. For the purposes of this definition,
    &quot;control&quot; means (i) the power, direct or indirect, to cause the
    direction or management of such entity, whether by contract or
    otherwise, or (ii) ownership of fifty percent (50%) or more of the
    outstanding shares, or (iii) beneficial ownership of such entity.

    &quot;You&quot; (or &quot;Your&quot;) shall mean an individual or Legal Entity
    exercising permissions granted by this License.

    &quot;Source&quot; form shall mean the preferred form for making modifications,
    including but not limited to software source code, documentation
    source, and configuration files.

    &quot;Object&quot; form shall mean any form resulting from mechanical
    transformation or translation of a Source form, including but
    not limited to compiled object code, generated documentation,
    and conversions to other media types.

    &quot;Work&quot; shall mean the work of authorship, whether in Source or
    Object form, made available under the License, as indicated by a
    copyright notice that is included in or attached to the work
    (an example is provided in the Appendix below).

    &quot;Derivative Works&quot; shall mean any work, whether in Source or Object
    form, that is based on (or derived from) the Work and for which the
    editorial revisions, annotations, elaborations, or other modifications
    represent, as a whole, an original work of authorship. For the purposes
    of this License, Derivative Works shall not include works that remain
    separable from, or merely link (or bind by name) to the interfaces of,
    the Work and Derivative Works thereof.

    &quot;Contribution&quot; shall mean any work of authorship, including
    the original version of the Work and any modifications or additions
    to that Work or Derivative Works thereof, that is intentionally
    submitted to Licensor for inclusion in the Work by the copyright owner
    or by an individual or Legal Entity authorized to submit on behalf of
    the copyright owner. For the purposes of this definition, &quot;submitted&quot;
    means any form of electronic, verbal, or written communication sent
    to the Licensor or its representatives, including but not limited to
    communication on electronic mailing lists, source code control systems,
    and issue tracking systems that are managed by, or on behalf of, the
    Licensor for the purpose of discussing and improving the Work, but
    excluding communication that is conspicuously marked or otherwise
    designated in writing by the copyright owner as &quot;Not a Contribution.&quot;

    &quot;Contributor&quot; shall mean Licensor and any individual or Legal Entity
    on behalf of whom a Contribution has been received by Licensor and
    subsequently incorporated within the Work.

2.  Grant of Copyright License. Subject to the terms and conditions of
    this License, each Contributor hereby grants to You a perpetual,
    worldwide, non-exclusive, no-charge, royalty-free, irrevocable
    copyright license to reproduce, prepare Derivative Works of,
    publicly display, publicly perform, sublicense, and distribute the
    Work and such Derivative Works in Source or Object form.

3.  Grant of Patent License. Subject to the terms and conditions of
    this License, each Contributor hereby grants to You a perpetual,
    worldwide, non-exclusive, no-charge, royalty-free, irrevocable
    (except as stated in this section) patent license to make, have made,
    use, offer to sell, sell, import, and otherwise transfer the Work,
    where such license applies only to those patent claims licensable
    by such Contributor that are necessarily infringed by their
    Contribution(s) alone or by combination of their Contribution(s)
    with the Work to which such Contribution(s) was submitted. If You
    institute patent litigation against any entity (including a
    cross-claim or counterclaim in a lawsuit) alleging that the Work
    or a Contribution incorporated within the Work constitutes direct
    or contributory patent infringement, then any patent licenses
    granted to You under this License for that Work shall terminate
    as of the date such litigation is filed.

4.  Redistribution. You may reproduce and distribute copies of the
    Work or Derivative Works thereof in any medium, with or without
    modifications, and in Source or Object form, provided that You
    meet the following conditions:

    (a) You must give any other recipients of the Work or
    Derivative Works a copy of this License; and

    (b) You must cause any modified files to carry prominent notices
    stating that You changed the files; and

    (c) You must retain, in the Source form of any Derivative Works
    that You distribute, all copyright, patent, trademark, and
    attribution notices from the Source form of the Work,
    excluding those notices that do not pertain to any part of
    the Derivative Works; and

    (d) If the Work includes a &quot;NOTICE&quot; text file as part of its
    distribution, then any Derivative Works that You distribute must
    include a readable copy of the attribution notices contained
    within such NOTICE file, excluding those notices that do not
    pertain to any part of the Derivative Works, in at least one
    of the following places: within a NOTICE text file distributed
    as part of the Derivative Works; within the Source form or
    documentation, if provided along with the Derivative Works; or,
    within a display generated by the Derivative Works, if and
    wherever such third-party notices normally appear. The contents
    of the NOTICE file are for informational purposes only and
    do not modify the License. You may add Your own attribution
    notices within Derivative Works that You distribute, alongside
    or as an addendum to the NOTICE text from the Work, provided
    that such additional attribution notices cannot be construed
    as modifying the License.

    You may add Your own copyright statement to Your modifications and
    may provide additional or different license terms and conditions
    for use, reproduction, or distribution of Your modifications, or
    for any such Derivative Works as a whole, provided Your use,
    reproduction, and distribution of the Work otherwise complies with
    the conditions stated in this License.

5.  Submission of Contributions. Unless You explicitly state otherwise,
    any Contribution intentionally submitted for inclusion in the Work
    by You to the Licensor shall be under the terms and conditions of
    this License, without any additional terms or conditions.
    Notwithstanding the above, nothing herein shall supersede or modify
    the terms of any separate license agreement you may have executed
    with Licensor regarding such Contributions.

6.  Trademarks. This License does not grant permission to use the trade
    names, trademarks, service marks, or product names of the Licensor,
    except as required for reasonable and customary use in describing the
    origin of the Work and reproducing the content of the NOTICE file.

7.  Disclaimer of Warranty. Unless required by applicable law or
    agreed to in writing, Licensor provides the Work (and each
    Contributor provides its Contributions) on an &quot;AS IS&quot; BASIS,
    WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
    implied, including, without limitation, any warranties or conditions
    of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
    PARTICULAR PURPOSE. You are solely responsible for determining the
    appropriateness of using or redistributing the Work and assume any
    risks associated with Your exercise of permissions under this License.

8.  Limitation of Liability. In no event and under no legal theory,
    whether in tort (including negligence), contract, or otherwise,
    unless required by applicable law (such as deliberate and grossly
    negligent acts) or agreed to in writing, shall any Contributor be
    liable to You for damages, including any direct, indirect, special,
    incidental, or consequential damages of any character arising as a
    result of this License or out of the use or inability to use the
    Work (including but not limited to damages for loss of goodwill,
    work stoppage, computer failure or malfunction, or any and all
    other commercial damages or losses), even if such Contributor
    has been advised of the possibility of such damages.

9.  Accepting Warranty or Additional Liability. While redistributing
    the Work or Derivative Works thereof, You may choose to offer,
    and charge a fee for, acceptance of support, warranty, indemnity,
    or other liability obligations and/or rights consistent with this
    License. However, in accepting such obligations, You may act only
    on Your own behalf and on Your sole responsibility, not on behalf
    of any other Contributor, and only if You agree to indemnify,
    defend, and hold each Contributor harmless for any liability
    incurred by, or claims asserted against, such Contributor by reason
    of your accepting any such warranty or additional liability.

END OF TERMS AND CONDITIONS

APPENDIX: How to apply the Apache License to your work.

      To apply the Apache License to your work, attach the following
      boilerplate notice, with the fields enclosed by brackets &quot;[]&quot;
      replaced with your own identifying information. (Don&#x27;t include
      the brackets!)  The text should be enclosed in the appropriate
      comment syntax for the file format. We also recommend that a
      file or class name and description of purpose be included on the
      same &quot;printed page&quot; as the copyright notice for easier
      identification within third-party archives.

Copyright [yyyy] [name of copyright owner]

Licensed under the Apache License, Version 2.0 (the &quot;License&quot;);
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

       http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an &quot;AS IS&quot; BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
</pre>
            </li>
            <li class="license">
                <h3 id="Apache-2.0">Apache License 2.0</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/awslabs/aws-sdk-rust ">aws-sdk-s3 1.54.0</a></li>
                    <li><a href=" https://github.com/awslabs/aws-sdk-rust ">aws-sdk-sqs 1.45.0</a></li>
                    <li><a href=" https://github.com/awslabs/aws-sdk-rust ">aws-sdk-sso 1.45.0</a></li>
                    <li><a href=" https://github.com/awslabs/aws-sdk-rust ">aws-sdk-ssooidc 1.46.0</a></li>
                    <li><a href=" https://github.com/awslabs/aws-sdk-rust ">aws-sdk-sts 1.45.0</a></li>
                </ul>
                <pre class="license-text">                                Apache License
                           Version 2.0, January 2004
                        http://www.apache.org/licenses/

   TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION

   1. Definitions.

      &quot;License&quot; shall mean the terms and conditions for use, reproduction,
      and distribution as defined by Sections 1 through 9 of this document.

      &quot;Licensor&quot; shall mean the copyright owner or entity authorized by
      the copyright owner that is granting the License.

      &quot;Legal Entity&quot; shall mean the union of the acting entity and all
      other entities that control, are controlled by, or are under common
      control with that entity. For the purposes of this definition,
      &quot;control&quot; means (i) the power, direct or indirect, to cause the
      direction or management of such entity, whether by contract or
      otherwise, or (ii) ownership of fifty percent (50%) or more of the
      outstanding shares, or (iii) beneficial ownership of such entity.

      &quot;You&quot; (or &quot;Your&quot;) shall mean an individual or Legal Entity
      exercising permissions granted by this License.

      &quot;Source&quot; form shall mean the preferred form for making modifications,
      including but not limited to software source code, documentation
      source, and configuration files.

      &quot;Object&quot; form shall mean any form resulting from mechanical
      transformation or translation of a Source form, including but
      not limited to compiled object code, generated documentation,
      and conversions to other media types.

      &quot;Work&quot; shall mean the work of authorship, whether in Source or
      Object form, made available under the License, as indicated by a
      copyright notice that is included in or attached to the work
      (an example is provided in the Appendix below).

      &quot;Derivative Works&quot; shall mean any work, whether in Source or Object
      form, that is based on (or derived from) the Work and for which the
      editorial revisions, annotations, elaborations, or other modifications
      represent, as a whole, an original work of authorship. For the purposes
      of this License, Derivative Works shall not include works that remain
      separable from, or merely link (or bind by name) to the interfaces of,
      the Work and Derivative Works thereof.

      &quot;Contribution&quot; shall mean any work of authorship, including
      the original version of the Work and any modifications or additions
      to that Work or Derivative Works thereof, that is intentionally
      submitted to Licensor for inclusion in the Work by the copyright owner
      or by an individual or Legal Entity authorized to submit on behalf of
      the copyright owner. For the purposes of this definition, &quot;submitted&quot;
      means any form of electronic, verbal, or written communication sent
      to the Licensor or its representatives, including but not limited to
      communication on electronic mailing lists, source code control systems,
      and issue tracking systems that are managed by, or on behalf of, the
      Licensor for the purpose of discussing and improving the Work, but
      excluding communication that is conspicuously marked or otherwise
      designated in writing by the copyright owner as &quot;Not a Contribution.&quot;

      &quot;Contributor&quot; shall mean Licensor and any individual or Legal Entity
      on behalf of whom a Contribution has been received by Licensor and
      subsequently incorporated within the Work.

   2. Grant of Copyright License. Subject to the terms and conditions of
      this License, each Contributor hereby grants to You a perpetual,
      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
      copyright license to reproduce, prepare Derivative Works of,
      publicly display, publicly perform, sublicense, and distribute the
      Work and such Derivative Works in Source or Object form.

   3. Grant of Patent License. Subject to the terms and conditions of
      this License, each Contributor hereby grants to You a perpetual,
      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
      (except as stated in this section) patent license to make, have made,
      use, offer to sell, sell, import, and otherwise transfer the Work,
      where such license applies only to those patent claims licensable
      by such Contributor that are necessarily infringed by their
      Contribution(s) alone or by combination of their Contribution(s)
      with the Work to which such Contribution(s) was submitted. If You
      institute patent litigation against any entity (including a
      cross-claim or counterclaim in a lawsuit) alleging that the Work
      or a Contribution incorporated within the Work constitutes direct
      or contributory patent infringement, then any patent licenses
      granted to You under this License for that Work shall terminate
      as of the date such litigation is filed.

   4. Redistribution. You may reproduce and distribute copies of the
      Work or Derivative Works thereof in any medium, with or without
      modifications, and in Source or Object form, provided that You
      meet the following conditions:

      (a) You must give any other recipients of the Work or
          Derivative Works a copy of this License; and

      (b) You must cause any modified files to carry prominent notices
          stating that You changed the files; and

      (c) You must retain, in the Source form of any Derivative Works
          that You distribute, all copyright, patent, trademark, and
          attribution notices from the Source form of the Work,
          excluding those notices that do not pertain to any part of
          the Derivative Works; and

      (d) If the Work includes a &quot;NOTICE&quot; text file as part of its
          distribution, then any Derivative Works that You distribute must
          include a readable copy of the attribution notices contained
          within such NOTICE file, excluding those notices that do not
          pertain to any part of the Derivative Works, in at least one
          of the following places: within a NOTICE text file distributed
          as part of the Derivative Works; within the Source form or
          documentation, if provided along with the Derivative Works; or,
          within a display generated by the Derivative Works, if and
          wherever such third-party notices normally appear. The contents
          of the NOTICE file are for informational purposes only and
          do not modify the License. You may add Your own attribution
          notices within Derivative Works that You distribute, alongside
          or as an addendum to the NOTICE text from the Work, provided
          that such additional attribution notices cannot be construed
          as modifying the License.

      You may add Your own copyright statement to Your modifications and
      may provide additional or different license terms and conditions
      for use, reproduction, or distribution of Your modifications, or
      for any such Derivative Works as a whole, provided Your use,
      reproduction, and distribution of the Work otherwise complies with
      the conditions stated in this License.

   5. Submission of Contributions. Unless You explicitly state otherwise,
      any Contribution intentionally submitted for inclusion in the Work
      by You to the Licensor shall be under the terms and conditions of
      this License, without any additional terms or conditions.
      Notwithstanding the above, nothing herein shall supersede or modify
      the terms of any separate license agreement you may have executed
      with Licensor regarding such Contributions.

   6. Trademarks. This License does not grant permission to use the trade
      names, trademarks, service marks, or product names of the Licensor,
      except as required for reasonable and customary use in describing the
      origin of the Work and reproducing the content of the NOTICE file.

   7. Disclaimer of Warranty. Unless required by applicable law or
      agreed to in writing, Licensor provides the Work (and each
      Contributor provides its Contributions) on an &quot;AS IS&quot; BASIS,
      WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
      implied, including, without limitation, any warranties or conditions
      of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
      PARTICULAR PURPOSE. You are solely responsible for determining the
      appropriateness of using or redistributing the Work and assume any
      risks associated with Your exercise of permissions under this License.

   8. Limitation of Liability. In no event and under no legal theory,
      whether in tort (including negligence), contract, or otherwise,
      unless required by applicable law (such as deliberate and grossly
      negligent acts) or agreed to in writing, shall any Contributor be
      liable to You for damages, including any direct, indirect, special,
      incidental, or consequential damages of any character arising as a
      result of this License or out of the use or inability to use the
      Work (including but not limited to damages for loss of goodwill,
      work stoppage, computer failure or malfunction, or any and all
      other commercial damages or losses), even if such Contributor
      has been advised of the possibility of such damages.

   9. Accepting Warranty or Additional Liability. While redistributing
      the Work or Derivative Works thereof, You may choose to offer,
      and charge a fee for, acceptance of support, warranty, indemnity,
      or other liability obligations and/or rights consistent with this
      License. However, in accepting such obligations, You may act only
      on Your own behalf and on Your sole responsibility, not on behalf
      of any other Contributor, and only if You agree to indemnify,
      defend, and hold each Contributor harmless for any liability
      incurred by, or claims asserted against, such Contributor by reason
      of your accepting any such warranty or additional liability.

   END OF TERMS AND CONDITIONS

   APPENDIX: How to apply the Apache License to your work.

      To apply the Apache License to your work, attach the following
      boilerplate notice, with the fields enclosed by brackets &quot;{}&quot;
      replaced with your own identifying information. (Don&#x27;t include
      the brackets!)  The text should be enclosed in the appropriate
      comment syntax for the file format. We also recommend that a
      file or class name and description of purpose be included on the
      same &quot;printed page&quot; as the copyright notice for easier
      identification within third-party archives.

   Copyright 2018-2020 Amazon.com, Inc. or its affiliates. All Rights Reserved.

   Licensed under the Apache License, Version 2.0 (the &quot;License&quot;);
   you may not use this file except in compliance with the License.
   You may obtain a copy of the License at

       http://www.apache.org/licenses/LICENSE-2.0

   Unless required by applicable law or agreed to in writing, software
   distributed under the License is distributed on an &quot;AS IS&quot; BASIS,
   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
   See the License for the specific language governing permissions and
   limitations under the License.

</pre>
            </li>
            <li class="license">
                <h3 id="Apache-2.0">Apache License 2.0</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/tmiasko/shell-words ">shell-words 1.1.0</a></li>
                </ul>
                <pre class="license-text">                               Apache License
                         Version 2.0, January 2004
                      http://www.apache.org/licenses/

TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION

1. Definitions.

  &quot;License&quot; shall mean the terms and conditions for use, reproduction,
  and distribution as defined by Sections 1 through 9 of this document.

  &quot;Licensor&quot; shall mean the copyright owner or entity authorized by
  the copyright owner that is granting the License.

  &quot;Legal Entity&quot; shall mean the union of the acting entity and all
  other entities that control, are controlled by, or are under common
  control with that entity. For the purposes of this definition,
  &quot;control&quot; means (i) the power, direct or indirect, to cause the
  direction or management of such entity, whether by contract or
  otherwise, or (ii) ownership of fifty percent (50%) or more of the
  outstanding shares, or (iii) beneficial ownership of such entity.

  &quot;You&quot; (or &quot;Your&quot;) shall mean an individual or Legal Entity
  exercising permissions granted by this License.

  &quot;Source&quot; form shall mean the preferred form for making modifications,
  including but not limited to software source code, documentation
  source, and configuration files.

  &quot;Object&quot; form shall mean any form resulting from mechanical
  transformation or translation of a Source form, including but
  not limited to compiled object code, generated documentation,
  and conversions to other media types.

  &quot;Work&quot; shall mean the work of authorship, whether in Source or
  Object form, made available under the License, as indicated by a
  copyright notice that is included in or attached to the work
  (an example is provided in the Appendix below).

  &quot;Derivative Works&quot; shall mean any work, whether in Source or Object
  form, that is based on (or derived from) the Work and for which the
  editorial revisions, annotations, elaborations, or other modifications
  represent, as a whole, an original work of authorship. For the purposes
  of this License, Derivative Works shall not include works that remain
  separable from, or merely link (or bind by name) to the interfaces of,
  the Work and Derivative Works thereof.

  &quot;Contribution&quot; shall mean any work of authorship, including
  the original version of the Work and any modifications or additions
  to that Work or Derivative Works thereof, that is intentionally
  submitted to Licensor for inclusion in the Work by the copyright owner
  or by an individual or Legal Entity authorized to submit on behalf of
  the copyright owner. For the purposes of this definition, &quot;submitted&quot;
  means any form of electronic, verbal, or written communication sent
  to the Licensor or its representatives, including but not limited to
  communication on electronic mailing lists, source code control systems,
  and issue tracking systems that are managed by, or on behalf of, the
  Licensor for the purpose of discussing and improving the Work, but
  excluding communication that is conspicuously marked or otherwise
  designated in writing by the copyright owner as &quot;Not a Contribution.&quot;

  &quot;Contributor&quot; shall mean Licensor and any individual or Legal Entity
  on behalf of whom a Contribution has been received by Licensor and
  subsequently incorporated within the Work.

2. Grant of Copyright License. Subject to the terms and conditions of
  this License, each Contributor hereby grants to You a perpetual,
  worldwide, non-exclusive, no-charge, royalty-free, irrevocable
  copyright license to reproduce, prepare Derivative Works of,
  publicly display, publicly perform, sublicense, and distribute the
  Work and such Derivative Works in Source or Object form.

3. Grant of Patent License. Subject to the terms and conditions of
  this License, each Contributor hereby grants to You a perpetual,
  worldwide, non-exclusive, no-charge, royalty-free, irrevocable
  (except as stated in this section) patent license to make, have made,
  use, offer to sell, sell, import, and otherwise transfer the Work,
  where such license applies only to those patent claims licensable
  by such Contributor that are necessarily infringed by their
  Contribution(s) alone or by combination of their Contribution(s)
  with the Work to which such Contribution(s) was submitted. If You
  institute patent litigation against any entity (including a
  cross-claim or counterclaim in a lawsuit) alleging that the Work
  or a Contribution incorporated within the Work constitutes direct
  or contributory patent infringement, then any patent licenses
  granted to You under this License for that Work shall terminate
  as of the date such litigation is filed.

4. Redistribution. You may reproduce and distribute copies of the
  Work or Derivative Works thereof in any medium, with or without
  modifications, and in Source or Object form, provided that You
  meet the following conditions:

  (a) You must give any other recipients of the Work or
      Derivative Works a copy of this License; and

  (b) You must cause any modified files to carry prominent notices
      stating that You changed the files; and

  (c) You must retain, in the Source form of any Derivative Works
      that You distribute, all copyright, patent, trademark, and
      attribution notices from the Source form of the Work,
      excluding those notices that do not pertain to any part of
      the Derivative Works; and

  (d) If the Work includes a &quot;NOTICE&quot; text file as part of its
      distribution, then any Derivative Works that You distribute must
      include a readable copy of the attribution notices contained
      within such NOTICE file, excluding those notices that do not
      pertain to any part of the Derivative Works, in at least one
      of the following places: within a NOTICE text file distributed
      as part of the Derivative Works; within the Source form or
      documentation, if provided along with the Derivative Works; or,
      within a display generated by the Derivative Works, if and
      wherever such third-party notices normally appear. The contents
      of the NOTICE file are for informational purposes only and
      do not modify the License. You may add Your own attribution
      notices within Derivative Works that You distribute, alongside
      or as an addendum to the NOTICE text from the Work, provided
      that such additional attribution notices cannot be construed
      as modifying the License.

  You may add Your own copyright statement to Your modifications and
  may provide additional or different license terms and conditions
  for use, reproduction, or distribution of Your modifications, or
  for any such Derivative Works as a whole, provided Your use,
  reproduction, and distribution of the Work otherwise complies with
  the conditions stated in this License.

5. Submission of Contributions. Unless You explicitly state otherwise,
  any Contribution intentionally submitted for inclusion in the Work
  by You to the Licensor shall be under the terms and conditions of
  this License, without any additional terms or conditions.
  Notwithstanding the above, nothing herein shall supersede or modify
  the terms of any separate license agreement you may have executed
  with Licensor regarding such Contributions.

6. Trademarks. This License does not grant permission to use the trade
  names, trademarks, service marks, or product names of the Licensor,
  except as required for reasonable and customary use in describing the
  origin of the Work and reproducing the content of the NOTICE file.

7. Disclaimer of Warranty. Unless required by applicable law or
  agreed to in writing, Licensor provides the Work (and each
  Contributor provides its Contributions) on an &quot;AS IS&quot; BASIS,
  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
  implied, including, without limitation, any warranties or conditions
  of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
  PARTICULAR PURPOSE. You are solely responsible for determining the
  appropriateness of using or redistributing the Work and assume any
  risks associated with Your exercise of permissions under this License.

8. Limitation of Liability. In no event and under no legal theory,
  whether in tort (including negligence), contract, or otherwise,
  unless required by applicable law (such as deliberate and grossly
  negligent acts) or agreed to in writing, shall any Contributor be
  liable to You for damages, including any direct, indirect, special,
  incidental, or consequential damages of any character arising as a
  result of this License or out of the use or inability to use the
  Work (including but not limited to damages for loss of goodwill,
  work stoppage, computer failure or malfunction, or any and all
  other commercial damages or losses), even if such Contributor
  has been advised of the possibility of such damages.

9. Accepting Warranty or Additional Liability. While redistributing
  the Work or Derivative Works thereof, You may choose to offer,
  and charge a fee for, acceptance of support, warranty, indemnity,
  or other liability obligations and/or rights consistent with this
  License. However, in accepting such obligations, You may act only
  on Your own behalf and on Your sole responsibility, not on behalf
  of any other Contributor, and only if You agree to indemnify,
  defend, and hold each Contributor harmless for any liability
  incurred by, or claims asserted against, such Contributor by reason
  of your accepting any such warranty or additional liability.

END OF TERMS AND CONDITIONS

APPENDIX: How to apply the Apache License to your work.

  To apply the Apache License to your work, attach the following
  boilerplate notice, with the fields enclosed by brackets &quot;[]&quot;
  replaced with your own identifying information. (Don&#x27;t include
  the brackets!)  The text should be enclosed in the appropriate
  comment syntax for the file format. We also recommend that a
  file or class name and description of purpose be included on the
  same &quot;printed page&quot; as the copyright notice for easier
  identification within third-party archives.

Copyright [yyyy] [name of copyright owner]

Licensed under the Apache License, Version 2.0 (the &quot;License&quot;);
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

   http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an &quot;AS IS&quot; BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
</pre>
            </li>
            <li class="license">
                <h3 id="Apache-2.0">Apache License 2.0</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/takuyaa/yada ">yada 0.5.1</a></li>
                </ul>
                <pre class="license-text">                              Apache License
                        Version 2.0, January 2004
                     http://www.apache.org/licenses/

TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION

1. Definitions.

   &quot;License&quot; shall mean the terms and conditions for use, reproduction,
   and distribution as defined by Sections 1 through 9 of this document.

   &quot;Licensor&quot; shall mean the copyright owner or entity authorized by
   the copyright owner that is granting the License.

   &quot;Legal Entity&quot; shall mean the union of the acting entity and all
   other entities that control, are controlled by, or are under common
   control with that entity. For the purposes of this definition,
   &quot;control&quot; means (i) the power, direct or indirect, to cause the
   direction or management of such entity, whether by contract or
   otherwise, or (ii) ownership of fifty percent (50%) or more of the
   outstanding shares, or (iii) beneficial ownership of such entity.

   &quot;You&quot; (or &quot;Your&quot;) shall mean an individual or Legal Entity
   exercising permissions granted by this License.

   &quot;Source&quot; form shall mean the preferred form for making modifications,
   including but not limited to software source code, documentation
   source, and configuration files.

   &quot;Object&quot; form shall mean any form resulting from mechanical
   transformation or translation of a Source form, including but
   not limited to compiled object code, generated documentation,
   and conversions to other media types.

   &quot;Work&quot; shall mean the work of authorship, whether in Source or
   Object form, made available under the License, as indicated by a
   copyright notice that is included in or attached to the work
   (an example is provided in the Appendix below).

   &quot;Derivative Works&quot; shall mean any work, whether in Source or Object
   form, that is based on (or derived from) the Work and for which the
   editorial revisions, annotations, elaborations, or other modifications
   represent, as a whole, an original work of authorship. For the purposes
   of this License, Derivative Works shall not include works that remain
   separable from, or merely link (or bind by name) to the interfaces of,
   the Work and Derivative Works thereof.

   &quot;Contribution&quot; shall mean any work of authorship, including
   the original version of the Work and any modifications or additions
   to that Work or Derivative Works thereof, that is intentionally
   submitted to Licensor for inclusion in the Work by the copyright owner
   or by an individual or Legal Entity authorized to submit on behalf of
   the copyright owner. For the purposes of this definition, &quot;submitted&quot;
   means any form of electronic, verbal, or written communication sent
   to the Licensor or its representatives, including but not limited to
   communication on electronic mailing lists, source code control systems,
   and issue tracking systems that are managed by, or on behalf of, the
   Licensor for the purpose of discussing and improving the Work, but
   excluding communication that is conspicuously marked or otherwise
   designated in writing by the copyright owner as &quot;Not a Contribution.&quot;

   &quot;Contributor&quot; shall mean Licensor and any individual or Legal Entity
   on behalf of whom a Contribution has been received by Licensor and
   subsequently incorporated within the Work.

2. Grant of Copyright License. Subject to the terms and conditions of
   this License, each Contributor hereby grants to You a perpetual,
   worldwide, non-exclusive, no-charge, royalty-free, irrevocable
   copyright license to reproduce, prepare Derivative Works of,
   publicly display, publicly perform, sublicense, and distribute the
   Work and such Derivative Works in Source or Object form.

3. Grant of Patent License. Subject to the terms and conditions of
   this License, each Contributor hereby grants to You a perpetual,
   worldwide, non-exclusive, no-charge, royalty-free, irrevocable
   (except as stated in this section) patent license to make, have made,
   use, offer to sell, sell, import, and otherwise transfer the Work,
   where such license applies only to those patent claims licensable
   by such Contributor that are necessarily infringed by their
   Contribution(s) alone or by combination of their Contribution(s)
   with the Work to which such Contribution(s) was submitted. If You
   institute patent litigation against any entity (including a
   cross-claim or counterclaim in a lawsuit) alleging that the Work
   or a Contribution incorporated within the Work constitutes direct
   or contributory patent infringement, then any patent licenses
   granted to You under this License for that Work shall terminate
   as of the date such litigation is filed.

4. Redistribution. You may reproduce and distribute copies of the
   Work or Derivative Works thereof in any medium, with or without
   modifications, and in Source or Object form, provided that You
   meet the following conditions:

   (a) You must give any other recipients of the Work or
       Derivative Works a copy of this License; and

   (b) You must cause any modified files to carry prominent notices
       stating that You changed the files; and

   (c) You must retain, in the Source form of any Derivative Works
       that You distribute, all copyright, patent, trademark, and
       attribution notices from the Source form of the Work,
       excluding those notices that do not pertain to any part of
       the Derivative Works; and

   (d) If the Work includes a &quot;NOTICE&quot; text file as part of its
       distribution, then any Derivative Works that You distribute must
       include a readable copy of the attribution notices contained
       within such NOTICE file, excluding those notices that do not
       pertain to any part of the Derivative Works, in at least one
       of the following places: within a NOTICE text file distributed
       as part of the Derivative Works; within the Source form or
       documentation, if provided along with the Derivative Works; or,
       within a display generated by the Derivative Works, if and
       wherever such third-party notices normally appear. The contents
       of the NOTICE file are for informational purposes only and
       do not modify the License. You may add Your own attribution
       notices within Derivative Works that You distribute, alongside
       or as an addendum to the NOTICE text from the Work, provided
       that such additional attribution notices cannot be construed
       as modifying the License.

   You may add Your own copyright statement to Your modifications and
   may provide additional or different license terms and conditions
   for use, reproduction, or distribution of Your modifications, or
   for any such Derivative Works as a whole, provided Your use,
   reproduction, and distribution of the Work otherwise complies with
   the conditions stated in this License.

5. Submission of Contributions. Unless You explicitly state otherwise,
   any Contribution intentionally submitted for inclusion in the Work
   by You to the Licensor shall be under the terms and conditions of
   this License, without any additional terms or conditions.
   Notwithstanding the above, nothing herein shall supersede or modify
   the terms of any separate license agreement you may have executed
   with Licensor regarding such Contributions.

6. Trademarks. This License does not grant permission to use the trade
   names, trademarks, service marks, or product names of the Licensor,
   except as required for reasonable and customary use in describing the
   origin of the Work and reproducing the content of the NOTICE file.

7. Disclaimer of Warranty. Unless required by applicable law or
   agreed to in writing, Licensor provides the Work (and each
   Contributor provides its Contributions) on an &quot;AS IS&quot; BASIS,
   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
   implied, including, without limitation, any warranties or conditions
   of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
   PARTICULAR PURPOSE. You are solely responsible for determining the
   appropriateness of using or redistributing the Work and assume any
   risks associated with Your exercise of permissions under this License.

8. Limitation of Liability. In no event and under no legal theory,
   whether in tort (including negligence), contract, or otherwise,
   unless required by applicable law (such as deliberate and grossly
   negligent acts) or agreed to in writing, shall any Contributor be
   liable to You for damages, including any direct, indirect, special,
   incidental, or consequential damages of any character arising as a
   result of this License or out of the use or inability to use the
   Work (including but not limited to damages for loss of goodwill,
   work stoppage, computer failure or malfunction, or any and all
   other commercial damages or losses), even if such Contributor
   has been advised of the possibility of such damages.

9. Accepting Warranty or Additional Liability. While redistributing
   the Work or Derivative Works thereof, You may choose to offer,
   and charge a fee for, acceptance of support, warranty, indemnity,
   or other liability obligations and/or rights consistent with this
   License. However, in accepting such obligations, You may act only
   on Your own behalf and on Your sole responsibility, not on behalf
   of any other Contributor, and only if You agree to indemnify,
   defend, and hold each Contributor harmless for any liability
   incurred by, or claims asserted against, such Contributor by reason
   of your accepting any such warranty or additional liability.

END OF TERMS AND CONDITIONS</pre>
            </li>
            <li class="license">
                <h3 id="Apache-2.0">Apache License 2.0</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/dtolnay/anyhow ">anyhow 1.0.89</a></li>
                    <li><a href=" https://github.com/dtolnay/async-trait ">async-trait 0.1.83</a></li>
                    <li><a href=" https://github.com/zslayton/cron ">cron 0.12.1</a></li>
                    <li><a href=" https://github.com/dtolnay/dtoa ">dtoa 1.0.9</a></li>
                    <li><a href=" https://github.com/dtolnay/dyn-clone ">dyn-clone 1.0.17</a></li>
                    <li><a href=" https://github.com/dtolnay/erased-serde ">erased-serde 0.4.5</a></li>
                    <li><a href=" https://github.com/dtolnay/inventory ">inventory 0.3.15</a></li>
                    <li><a href=" https://github.com/dtolnay/itoa ">itoa 1.0.11</a></li>
                    <li><a href=" https://github.com/rust-lang/libc ">libc 0.2.159</a></li>
                    <li><a href=" https://github.com/dtolnay/prettyplease ">prettyplease 0.1.25</a></li>
                    <li><a href=" https://github.com/dtolnay/prettyplease ">prettyplease 0.2.22</a></li>
                    <li><a href=" https://github.com/SergioBenitez/proc-macro2-diagnostics ">proc-macro2-diagnostics 0.10.1</a></li>
                    <li><a href=" https://github.com/dtolnay/proc-macro2 ">proc-macro2 1.0.87</a></li>
                    <li><a href=" https://github.com/dtolnay/quote ">quote 1.0.37</a></li>
                    <li><a href=" https://github.com/dtolnay/rustversion ">rustversion 1.0.17</a></li>
                    <li><a href=" https://github.com/dtolnay/ryu ">ryu 1.0.18</a></li>
                    <li><a href=" https://github.com/dtolnay/semver ">semver 1.0.23</a></li>
                    <li><a href=" https://github.com/serde-rs/serde ">serde 1.0.210</a></li>
                    <li><a href=" https://github.com/serde-rs/serde ">serde_derive 1.0.210</a></li>
                    <li><a href=" https://github.com/serde-rs/json ">serde_json 1.0.112</a></li>
                    <li><a href=" https://github.com/dtolnay/path-to-error ">serde_path_to_error 0.1.16</a></li>
                    <li><a href=" https://github.com/samscott89/serde_qs ">serde_qs 0.12.0</a></li>
                    <li><a href=" https://github.com/samscott89/serde_qs ">serde_qs 0.8.5</a></li>
                    <li><a href=" https://github.com/nox/serde_urlencoded ">serde_urlencoded 0.7.1</a></li>
                    <li><a href=" https://github.com/dtolnay/serde-yaml ">serde_yaml 0.9.30</a></li>
                    <li><a href=" https://github.com/dtolnay/syn ">syn 2.0.79</a></li>
                    <li><a href=" https://github.com/dtolnay/thiserror ">thiserror-impl 1.0.64</a></li>
                    <li><a href=" https://github.com/dtolnay/thiserror ">thiserror 1.0.64</a></li>
                    <li><a href=" https://github.com/dtolnay/typeid ">typeid 1.0.2</a></li>
                    <li><a href=" https://github.com/dtolnay/typetag ">typetag-impl 0.2.18</a></li>
                    <li><a href=" https://github.com/dtolnay/typetag ">typetag 0.2.18</a></li>
                    <li><a href=" https://github.com/dtolnay/unicode-ident ">unicode-ident 1.0.13</a></li>
                    <li><a href=" https://github.com/SimonSapin/rust-utf8 ">utf-8 0.7.6</a></li>
                    <li><a href=" https://github.com/alacritty/vte ">utf8parse 0.2.2</a></li>
                    <li><a href=" https://github.com/alacritty/vte ">vte 0.10.1</a></li>
                    <li><a href=" https://github.com/alacritty/vte ">vte_generate_state_changes 0.1.2</a></li>
                </ul>
                <pre class="license-text">                              Apache License
                        Version 2.0, January 2004
                     http://www.apache.org/licenses/

TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION

1. Definitions.

   &quot;License&quot; shall mean the terms and conditions for use, reproduction,
   and distribution as defined by Sections 1 through 9 of this document.

   &quot;Licensor&quot; shall mean the copyright owner or entity authorized by
   the copyright owner that is granting the License.

   &quot;Legal Entity&quot; shall mean the union of the acting entity and all
   other entities that control, are controlled by, or are under common
   control with that entity. For the purposes of this definition,
   &quot;control&quot; means (i) the power, direct or indirect, to cause the
   direction or management of such entity, whether by contract or
   otherwise, or (ii) ownership of fifty percent (50%) or more of the
   outstanding shares, or (iii) beneficial ownership of such entity.

   &quot;You&quot; (or &quot;Your&quot;) shall mean an individual or Legal Entity
   exercising permissions granted by this License.

   &quot;Source&quot; form shall mean the preferred form for making modifications,
   including but not limited to software source code, documentation
   source, and configuration files.

   &quot;Object&quot; form shall mean any form resulting from mechanical
   transformation or translation of a Source form, including but
   not limited to compiled object code, generated documentation,
   and conversions to other media types.

   &quot;Work&quot; shall mean the work of authorship, whether in Source or
   Object form, made available under the License, as indicated by a
   copyright notice that is included in or attached to the work
   (an example is provided in the Appendix below).

   &quot;Derivative Works&quot; shall mean any work, whether in Source or Object
   form, that is based on (or derived from) the Work and for which the
   editorial revisions, annotations, elaborations, or other modifications
   represent, as a whole, an original work of authorship. For the purposes
   of this License, Derivative Works shall not include works that remain
   separable from, or merely link (or bind by name) to the interfaces of,
   the Work and Derivative Works thereof.

   &quot;Contribution&quot; shall mean any work of authorship, including
   the original version of the Work and any modifications or additions
   to that Work or Derivative Works thereof, that is intentionally
   submitted to Licensor for inclusion in the Work by the copyright owner
   or by an individual or Legal Entity authorized to submit on behalf of
   the copyright owner. For the purposes of this definition, &quot;submitted&quot;
   means any form of electronic, verbal, or written communication sent
   to the Licensor or its representatives, including but not limited to
   communication on electronic mailing lists, source code control systems,
   and issue tracking systems that are managed by, or on behalf of, the
   Licensor for the purpose of discussing and improving the Work, but
   excluding communication that is conspicuously marked or otherwise
   designated in writing by the copyright owner as &quot;Not a Contribution.&quot;

   &quot;Contributor&quot; shall mean Licensor and any individual or Legal Entity
   on behalf of whom a Contribution has been received by Licensor and
   subsequently incorporated within the Work.

2. Grant of Copyright License. Subject to the terms and conditions of
   this License, each Contributor hereby grants to You a perpetual,
   worldwide, non-exclusive, no-charge, royalty-free, irrevocable
   copyright license to reproduce, prepare Derivative Works of,
   publicly display, publicly perform, sublicense, and distribute the
   Work and such Derivative Works in Source or Object form.

3. Grant of Patent License. Subject to the terms and conditions of
   this License, each Contributor hereby grants to You a perpetual,
   worldwide, non-exclusive, no-charge, royalty-free, irrevocable
   (except as stated in this section) patent license to make, have made,
   use, offer to sell, sell, import, and otherwise transfer the Work,
   where such license applies only to those patent claims licensable
   by such Contributor that are necessarily infringed by their
   Contribution(s) alone or by combination of their Contribution(s)
   with the Work to which such Contribution(s) was submitted. If You
   institute patent litigation against any entity (including a
   cross-claim or counterclaim in a lawsuit) alleging that the Work
   or a Contribution incorporated within the Work constitutes direct
   or contributory patent infringement, then any patent licenses
   granted to You under this License for that Work shall terminate
   as of the date such litigation is filed.

4. Redistribution. You may reproduce and distribute copies of the
   Work or Derivative Works thereof in any medium, with or without
   modifications, and in Source or Object form, provided that You
   meet the following conditions:

   (a) You must give any other recipients of the Work or
       Derivative Works a copy of this License; and

   (b) You must cause any modified files to carry prominent notices
       stating that You changed the files; and

   (c) You must retain, in the Source form of any Derivative Works
       that You distribute, all copyright, patent, trademark, and
       attribution notices from the Source form of the Work,
       excluding those notices that do not pertain to any part of
       the Derivative Works; and

   (d) If the Work includes a &quot;NOTICE&quot; text file as part of its
       distribution, then any Derivative Works that You distribute must
       include a readable copy of the attribution notices contained
       within such NOTICE file, excluding those notices that do not
       pertain to any part of the Derivative Works, in at least one
       of the following places: within a NOTICE text file distributed
       as part of the Derivative Works; within the Source form or
       documentation, if provided along with the Derivative Works; or,
       within a display generated by the Derivative Works, if and
       wherever such third-party notices normally appear. The contents
       of the NOTICE file are for informational purposes only and
       do not modify the License. You may add Your own attribution
       notices within Derivative Works that You distribute, alongside
       or as an addendum to the NOTICE text from the Work, provided
       that such additional attribution notices cannot be construed
       as modifying the License.

   You may add Your own copyright statement to Your modifications and
   may provide additional or different license terms and conditions
   for use, reproduction, or distribution of Your modifications, or
   for any such Derivative Works as a whole, provided Your use,
   reproduction, and distribution of the Work otherwise complies with
   the conditions stated in this License.

5. Submission of Contributions. Unless You explicitly state otherwise,
   any Contribution intentionally submitted for inclusion in the Work
   by You to the Licensor shall be under the terms and conditions of
   this License, without any additional terms or conditions.
   Notwithstanding the above, nothing herein shall supersede or modify
   the terms of any separate license agreement you may have executed
   with Licensor regarding such Contributions.

6. Trademarks. This License does not grant permission to use the trade
   names, trademarks, service marks, or product names of the Licensor,
   except as required for reasonable and customary use in describing the
   origin of the Work and reproducing the content of the NOTICE file.

7. Disclaimer of Warranty. Unless required by applicable law or
   agreed to in writing, Licensor provides the Work (and each
   Contributor provides its Contributions) on an &quot;AS IS&quot; BASIS,
   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
   implied, including, without limitation, any warranties or conditions
   of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
   PARTICULAR PURPOSE. You are solely responsible for determining the
   appropriateness of using or redistributing the Work and assume any
   risks associated with Your exercise of permissions under this License.

8. Limitation of Liability. In no event and under no legal theory,
   whether in tort (including negligence), contract, or otherwise,
   unless required by applicable law (such as deliberate and grossly
   negligent acts) or agreed to in writing, shall any Contributor be
   liable to You for damages, including any direct, indirect, special,
   incidental, or consequential damages of any character arising as a
   result of this License or out of the use or inability to use the
   Work (including but not limited to damages for loss of goodwill,
   work stoppage, computer failure or malfunction, or any and all
   other commercial damages or losses), even if such Contributor
   has been advised of the possibility of such damages.

9. Accepting Warranty or Additional Liability. While redistributing
   the Work or Derivative Works thereof, You may choose to offer,
   and charge a fee for, acceptance of support, warranty, indemnity,
   or other liability obligations and/or rights consistent with this
   License. However, in accepting such obligations, You may act only
   on Your own behalf and on Your sole responsibility, not on behalf
   of any other Contributor, and only if You agree to indemnify,
   defend, and hold each Contributor harmless for any liability
   incurred by, or claims asserted against, such Contributor by reason
   of your accepting any such warranty or additional liability.

END OF TERMS AND CONDITIONS
</pre>
            </li>
            <li class="license">
                <h3 id="Apache-2.0">Apache License 2.0</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/rust-lang/futures-rs ">futures-channel 0.3.31</a></li>
                    <li><a href=" https://github.com/rust-lang/futures-rs ">futures-core 0.3.31</a></li>
                    <li><a href=" https://github.com/rust-lang/futures-rs ">futures-executor 0.3.31</a></li>
                    <li><a href=" https://github.com/rust-lang/futures-rs ">futures-io 0.3.31</a></li>
                    <li><a href=" https://github.com/rust-lang/futures-rs ">futures-macro 0.3.31</a></li>
                    <li><a href=" https://github.com/rust-lang/futures-rs ">futures-sink 0.3.31</a></li>
                    <li><a href=" https://github.com/rust-lang/futures-rs ">futures-task 0.3.31</a></li>
                    <li><a href=" https://github.com/rust-lang/futures-rs ">futures-util 0.3.31</a></li>
                    <li><a href=" https://github.com/rust-lang/futures-rs ">futures 0.3.31</a></li>
                </ul>
                <pre class="license-text">                              Apache License
                        Version 2.0, January 2004
                     http://www.apache.org/licenses/

TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION

1. Definitions.

   &quot;License&quot; shall mean the terms and conditions for use, reproduction,
   and distribution as defined by Sections 1 through 9 of this document.

   &quot;Licensor&quot; shall mean the copyright owner or entity authorized by
   the copyright owner that is granting the License.

   &quot;Legal Entity&quot; shall mean the union of the acting entity and all
   other entities that control, are controlled by, or are under common
   control with that entity. For the purposes of this definition,
   &quot;control&quot; means (i) the power, direct or indirect, to cause the
   direction or management of such entity, whether by contract or
   otherwise, or (ii) ownership of fifty percent (50%) or more of the
   outstanding shares, or (iii) beneficial ownership of such entity.

   &quot;You&quot; (or &quot;Your&quot;) shall mean an individual or Legal Entity
   exercising permissions granted by this License.

   &quot;Source&quot; form shall mean the preferred form for making modifications,
   including but not limited to software source code, documentation
   source, and configuration files.

   &quot;Object&quot; form shall mean any form resulting from mechanical
   transformation or translation of a Source form, including but
   not limited to compiled object code, generated documentation,
   and conversions to other media types.

   &quot;Work&quot; shall mean the work of authorship, whether in Source or
   Object form, made available under the License, as indicated by a
   copyright notice that is included in or attached to the work
   (an example is provided in the Appendix below).

   &quot;Derivative Works&quot; shall mean any work, whether in Source or Object
   form, that is based on (or derived from) the Work and for which the
   editorial revisions, annotations, elaborations, or other modifications
   represent, as a whole, an original work of authorship. For the purposes
   of this License, Derivative Works shall not include works that remain
   separable from, or merely link (or bind by name) to the interfaces of,
   the Work and Derivative Works thereof.

   &quot;Contribution&quot; shall mean any work of authorship, including
   the original version of the Work and any modifications or additions
   to that Work or Derivative Works thereof, that is intentionally
   submitted to Licensor for inclusion in the Work by the copyright owner
   or by an individual or Legal Entity authorized to submit on behalf of
   the copyright owner. For the purposes of this definition, &quot;submitted&quot;
   means any form of electronic, verbal, or written communication sent
   to the Licensor or its representatives, including but not limited to
   communication on electronic mailing lists, source code control systems,
   and issue tracking systems that are managed by, or on behalf of, the
   Licensor for the purpose of discussing and improving the Work, but
   excluding communication that is conspicuously marked or otherwise
   designated in writing by the copyright owner as &quot;Not a Contribution.&quot;

   &quot;Contributor&quot; shall mean Licensor and any individual or Legal Entity
   on behalf of whom a Contribution has been received by Licensor and
   subsequently incorporated within the Work.

2. Grant of Copyright License. Subject to the terms and conditions of
   this License, each Contributor hereby grants to You a perpetual,
   worldwide, non-exclusive, no-charge, royalty-free, irrevocable
   copyright license to reproduce, prepare Derivative Works of,
   publicly display, publicly perform, sublicense, and distribute the
   Work and such Derivative Works in Source or Object form.

3. Grant of Patent License. Subject to the terms and conditions of
   this License, each Contributor hereby grants to You a perpetual,
   worldwide, non-exclusive, no-charge, royalty-free, irrevocable
   (except as stated in this section) patent license to make, have made,
   use, offer to sell, sell, import, and otherwise transfer the Work,
   where such license applies only to those patent claims licensable
   by such Contributor that are necessarily infringed by their
   Contribution(s) alone or by combination of their Contribution(s)
   with the Work to which such Contribution(s) was submitted. If You
   institute patent litigation against any entity (including a
   cross-claim or counterclaim in a lawsuit) alleging that the Work
   or a Contribution incorporated within the Work constitutes direct
   or contributory patent infringement, then any patent licenses
   granted to You under this License for that Work shall terminate
   as of the date such litigation is filed.

4. Redistribution. You may reproduce and distribute copies of the
   Work or Derivative Works thereof in any medium, with or without
   modifications, and in Source or Object form, provided that You
   meet the following conditions:

   (a) You must give any other recipients of the Work or
       Derivative Works a copy of this License; and

   (b) You must cause any modified files to carry prominent notices
       stating that You changed the files; and

   (c) You must retain, in the Source form of any Derivative Works
       that You distribute, all copyright, patent, trademark, and
       attribution notices from the Source form of the Work,
       excluding those notices that do not pertain to any part of
       the Derivative Works; and

   (d) If the Work includes a &quot;NOTICE&quot; text file as part of its
       distribution, then any Derivative Works that You distribute must
       include a readable copy of the attribution notices contained
       within such NOTICE file, excluding those notices that do not
       pertain to any part of the Derivative Works, in at least one
       of the following places: within a NOTICE text file distributed
       as part of the Derivative Works; within the Source form or
       documentation, if provided along with the Derivative Works; or,
       within a display generated by the Derivative Works, if and
       wherever such third-party notices normally appear. The contents
       of the NOTICE file are for informational purposes only and
       do not modify the License. You may add Your own attribution
       notices within Derivative Works that You distribute, alongside
       or as an addendum to the NOTICE text from the Work, provided
       that such additional attribution notices cannot be construed
       as modifying the License.

   You may add Your own copyright statement to Your modifications and
   may provide additional or different license terms and conditions
   for use, reproduction, or distribution of Your modifications, or
   for any such Derivative Works as a whole, provided Your use,
   reproduction, and distribution of the Work otherwise complies with
   the conditions stated in this License.

5. Submission of Contributions. Unless You explicitly state otherwise,
   any Contribution intentionally submitted for inclusion in the Work
   by You to the Licensor shall be under the terms and conditions of
   this License, without any additional terms or conditions.
   Notwithstanding the above, nothing herein shall supersede or modify
   the terms of any separate license agreement you may have executed
   with Licensor regarding such Contributions.

6. Trademarks. This License does not grant permission to use the trade
   names, trademarks, service marks, or product names of the Licensor,
   except as required for reasonable and customary use in describing the
   origin of the Work and reproducing the content of the NOTICE file.

7. Disclaimer of Warranty. Unless required by applicable law or
   agreed to in writing, Licensor provides the Work (and each
   Contributor provides its Contributions) on an &quot;AS IS&quot; BASIS,
   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
   implied, including, without limitation, any warranties or conditions
   of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
   PARTICULAR PURPOSE. You are solely responsible for determining the
   appropriateness of using or redistributing the Work and assume any
   risks associated with Your exercise of permissions under this License.

8. Limitation of Liability. In no event and under no legal theory,
   whether in tort (including negligence), contract, or otherwise,
   unless required by applicable law (such as deliberate and grossly
   negligent acts) or agreed to in writing, shall any Contributor be
   liable to You for damages, including any direct, indirect, special,
   incidental, or consequential damages of any character arising as a
   result of this License or out of the use or inability to use the
   Work (including but not limited to damages for loss of goodwill,
   work stoppage, computer failure or malfunction, or any and all
   other commercial damages or losses), even if such Contributor
   has been advised of the possibility of such damages.

9. Accepting Warranty or Additional Liability. While redistributing
   the Work or Derivative Works thereof, You may choose to offer,
   and charge a fee for, acceptance of support, warranty, indemnity,
   or other liability obligations and/or rights consistent with this
   License. However, in accepting such obligations, You may act only
   on Your own behalf and on Your sole responsibility, not on behalf
   of any other Contributor, and only if You agree to indemnify,
   defend, and hold each Contributor harmless for any liability
   incurred by, or claims asserted against, such Contributor by reason
   of your accepting any such warranty or additional liability.

END OF TERMS AND CONDITIONS

APPENDIX: How to apply the Apache License to your work.

   To apply the Apache License to your work, attach the following
   boilerplate notice, with the fields enclosed by brackets &quot;[]&quot;
   replaced with your own identifying information. (Don&#x27;t include
   the brackets!)  The text should be enclosed in the appropriate
   comment syntax for the file format. We also recommend that a
   file or class name and description of purpose be included on the
   same &quot;printed page&quot; as the copyright notice for easier
   identification within third-party archives.

Copyright (c) 2016 Alex Crichton
Copyright (c) 2017 The Tokio Authors

Licensed under the Apache License, Version 2.0 (the &quot;License&quot;);
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

	http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an &quot;AS IS&quot; BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
</pre>
            </li>
            <li class="license">
                <h3 id="Apache-2.0">Apache License 2.0</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/paholg/typenum ">typenum 1.17.0</a></li>
                </ul>
                <pre class="license-text">                              Apache License
                        Version 2.0, January 2004
                     http://www.apache.org/licenses/

TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION

1. Definitions.

   &quot;License&quot; shall mean the terms and conditions for use, reproduction,
   and distribution as defined by Sections 1 through 9 of this document.

   &quot;Licensor&quot; shall mean the copyright owner or entity authorized by
   the copyright owner that is granting the License.

   &quot;Legal Entity&quot; shall mean the union of the acting entity and all
   other entities that control, are controlled by, or are under common
   control with that entity. For the purposes of this definition,
   &quot;control&quot; means (i) the power, direct or indirect, to cause the
   direction or management of such entity, whether by contract or
   otherwise, or (ii) ownership of fifty percent (50%) or more of the
   outstanding shares, or (iii) beneficial ownership of such entity.

   &quot;You&quot; (or &quot;Your&quot;) shall mean an individual or Legal Entity
   exercising permissions granted by this License.

   &quot;Source&quot; form shall mean the preferred form for making modifications,
   including but not limited to software source code, documentation
   source, and configuration files.

   &quot;Object&quot; form shall mean any form resulting from mechanical
   transformation or translation of a Source form, including but
   not limited to compiled object code, generated documentation,
   and conversions to other media types.

   &quot;Work&quot; shall mean the work of authorship, whether in Source or
   Object form, made available under the License, as indicated by a
   copyright notice that is included in or attached to the work
   (an example is provided in the Appendix below).

   &quot;Derivative Works&quot; shall mean any work, whether in Source or Object
   form, that is based on (or derived from) the Work and for which the
   editorial revisions, annotations, elaborations, or other modifications
   represent, as a whole, an original work of authorship. For the purposes
   of this License, Derivative Works shall not include works that remain
   separable from, or merely link (or bind by name) to the interfaces of,
   the Work and Derivative Works thereof.

   &quot;Contribution&quot; shall mean any work of authorship, including
   the original version of the Work and any modifications or additions
   to that Work or Derivative Works thereof, that is intentionally
   submitted to Licensor for inclusion in the Work by the copyright owner
   or by an individual or Legal Entity authorized to submit on behalf of
   the copyright owner. For the purposes of this definition, &quot;submitted&quot;
   means any form of electronic, verbal, or written communication sent
   to the Licensor or its representatives, including but not limited to
   communication on electronic mailing lists, source code control systems,
   and issue tracking systems that are managed by, or on behalf of, the
   Licensor for the purpose of discussing and improving the Work, but
   excluding communication that is conspicuously marked or otherwise
   designated in writing by the copyright owner as &quot;Not a Contribution.&quot;

   &quot;Contributor&quot; shall mean Licensor and any individual or Legal Entity
   on behalf of whom a Contribution has been received by Licensor and
   subsequently incorporated within the Work.

2. Grant of Copyright License. Subject to the terms and conditions of
   this License, each Contributor hereby grants to You a perpetual,
   worldwide, non-exclusive, no-charge, royalty-free, irrevocable
   copyright license to reproduce, prepare Derivative Works of,
   publicly display, publicly perform, sublicense, and distribute the
   Work and such Derivative Works in Source or Object form.

3. Grant of Patent License. Subject to the terms and conditions of
   this License, each Contributor hereby grants to You a perpetual,
   worldwide, non-exclusive, no-charge, royalty-free, irrevocable
   (except as stated in this section) patent license to make, have made,
   use, offer to sell, sell, import, and otherwise transfer the Work,
   where such license applies only to those patent claims licensable
   by such Contributor that are necessarily infringed by their
   Contribution(s) alone or by combination of their Contribution(s)
   with the Work to which such Contribution(s) was submitted. If You
   institute patent litigation against any entity (including a
   cross-claim or counterclaim in a lawsuit) alleging that the Work
   or a Contribution incorporated within the Work constitutes direct
   or contributory patent infringement, then any patent licenses
   granted to You under this License for that Work shall terminate
   as of the date such litigation is filed.

4. Redistribution. You may reproduce and distribute copies of the
   Work or Derivative Works thereof in any medium, with or without
   modifications, and in Source or Object form, provided that You
   meet the following conditions:

   (a) You must give any other recipients of the Work or
       Derivative Works a copy of this License; and

   (b) You must cause any modified files to carry prominent notices
       stating that You changed the files; and

   (c) You must retain, in the Source form of any Derivative Works
       that You distribute, all copyright, patent, trademark, and
       attribution notices from the Source form of the Work,
       excluding those notices that do not pertain to any part of
       the Derivative Works; and

   (d) If the Work includes a &quot;NOTICE&quot; text file as part of its
       distribution, then any Derivative Works that You distribute must
       include a readable copy of the attribution notices contained
       within such NOTICE file, excluding those notices that do not
       pertain to any part of the Derivative Works, in at least one
       of the following places: within a NOTICE text file distributed
       as part of the Derivative Works; within the Source form or
       documentation, if provided along with the Derivative Works; or,
       within a display generated by the Derivative Works, if and
       wherever such third-party notices normally appear. The contents
       of the NOTICE file are for informational purposes only and
       do not modify the License. You may add Your own attribution
       notices within Derivative Works that You distribute, alongside
       or as an addendum to the NOTICE text from the Work, provided
       that such additional attribution notices cannot be construed
       as modifying the License.

   You may add Your own copyright statement to Your modifications and
   may provide additional or different license terms and conditions
   for use, reproduction, or distribution of Your modifications, or
   for any such Derivative Works as a whole, provided Your use,
   reproduction, and distribution of the Work otherwise complies with
   the conditions stated in this License.

5. Submission of Contributions. Unless You explicitly state otherwise,
   any Contribution intentionally submitted for inclusion in the Work
   by You to the Licensor shall be under the terms and conditions of
   this License, without any additional terms or conditions.
   Notwithstanding the above, nothing herein shall supersede or modify
   the terms of any separate license agreement you may have executed
   with Licensor regarding such Contributions.

6. Trademarks. This License does not grant permission to use the trade
   names, trademarks, service marks, or product names of the Licensor,
   except as required for reasonable and customary use in describing the
   origin of the Work and reproducing the content of the NOTICE file.

7. Disclaimer of Warranty. Unless required by applicable law or
   agreed to in writing, Licensor provides the Work (and each
   Contributor provides its Contributions) on an &quot;AS IS&quot; BASIS,
   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
   implied, including, without limitation, any warranties or conditions
   of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
   PARTICULAR PURPOSE. You are solely responsible for determining the
   appropriateness of using or redistributing the Work and assume any
   risks associated with Your exercise of permissions under this License.

8. Limitation of Liability. In no event and under no legal theory,
   whether in tort (including negligence), contract, or otherwise,
   unless required by applicable law (such as deliberate and grossly
   negligent acts) or agreed to in writing, shall any Contributor be
   liable to You for damages, including any direct, indirect, special,
   incidental, or consequential damages of any character arising as a
   result of this License or out of the use or inability to use the
   Work (including but not limited to damages for loss of goodwill,
   work stoppage, computer failure or malfunction, or any and all
   other commercial damages or losses), even if such Contributor
   has been advised of the possibility of such damages.

9. Accepting Warranty or Additional Liability. While redistributing
   the Work or Derivative Works thereof, You may choose to offer,
   and charge a fee for, acceptance of support, warranty, indemnity,
   or other liability obligations and/or rights consistent with this
   License. However, in accepting such obligations, You may act only
   on Your own behalf and on Your sole responsibility, not on behalf
   of any other Contributor, and only if You agree to indemnify,
   defend, and hold each Contributor harmless for any liability
   incurred by, or claims asserted against, such Contributor by reason
   of your accepting any such warranty or additional liability.

END OF TERMS AND CONDITIONS

APPENDIX: How to apply the Apache License to your work.

   To apply the Apache License to your work, attach the following
   boilerplate notice, with the fields enclosed by brackets &quot;[]&quot;
   replaced with your own identifying information. (Don&#x27;t include
   the brackets!)  The text should be enclosed in the appropriate
   comment syntax for the file format. We also recommend that a
   file or class name and description of purpose be included on the
   same &quot;printed page&quot; as the copyright notice for easier
   identification within third-party archives.

Copyright 2014 Paho Lurie-Gregg

Licensed under the Apache License, Version 2.0 (the &quot;License&quot;);
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

	http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an &quot;AS IS&quot; BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.</pre>
            </li>
            <li class="license">
                <h3 id="Apache-2.0">Apache License 2.0</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/seanmonstar/reqwest ">reqwest 0.11.27</a></li>
                </ul>
                <pre class="license-text">                              Apache License
                        Version 2.0, January 2004
                     http://www.apache.org/licenses/

TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION

1. Definitions.

   &quot;License&quot; shall mean the terms and conditions for use, reproduction,
   and distribution as defined by Sections 1 through 9 of this document.

   &quot;Licensor&quot; shall mean the copyright owner or entity authorized by
   the copyright owner that is granting the License.

   &quot;Legal Entity&quot; shall mean the union of the acting entity and all
   other entities that control, are controlled by, or are under common
   control with that entity. For the purposes of this definition,
   &quot;control&quot; means (i) the power, direct or indirect, to cause the
   direction or management of such entity, whether by contract or
   otherwise, or (ii) ownership of fifty percent (50%) or more of the
   outstanding shares, or (iii) beneficial ownership of such entity.

   &quot;You&quot; (or &quot;Your&quot;) shall mean an individual or Legal Entity
   exercising permissions granted by this License.

   &quot;Source&quot; form shall mean the preferred form for making modifications,
   including but not limited to software source code, documentation
   source, and configuration files.

   &quot;Object&quot; form shall mean any form resulting from mechanical
   transformation or translation of a Source form, including but
   not limited to compiled object code, generated documentation,
   and conversions to other media types.

   &quot;Work&quot; shall mean the work of authorship, whether in Source or
   Object form, made available under the License, as indicated by a
   copyright notice that is included in or attached to the work
   (an example is provided in the Appendix below).

   &quot;Derivative Works&quot; shall mean any work, whether in Source or Object
   form, that is based on (or derived from) the Work and for which the
   editorial revisions, annotations, elaborations, or other modifications
   represent, as a whole, an original work of authorship. For the purposes
   of this License, Derivative Works shall not include works that remain
   separable from, or merely link (or bind by name) to the interfaces of,
   the Work and Derivative Works thereof.

   &quot;Contribution&quot; shall mean any work of authorship, including
   the original version of the Work and any modifications or additions
   to that Work or Derivative Works thereof, that is intentionally
   submitted to Licensor for inclusion in the Work by the copyright owner
   or by an individual or Legal Entity authorized to submit on behalf of
   the copyright owner. For the purposes of this definition, &quot;submitted&quot;
   means any form of electronic, verbal, or written communication sent
   to the Licensor or its representatives, including but not limited to
   communication on electronic mailing lists, source code control systems,
   and issue tracking systems that are managed by, or on behalf of, the
   Licensor for the purpose of discussing and improving the Work, but
   excluding communication that is conspicuously marked or otherwise
   designated in writing by the copyright owner as &quot;Not a Contribution.&quot;

   &quot;Contributor&quot; shall mean Licensor and any individual or Legal Entity
   on behalf of whom a Contribution has been received by Licensor and
   subsequently incorporated within the Work.

2. Grant of Copyright License. Subject to the terms and conditions of
   this License, each Contributor hereby grants to You a perpetual,
   worldwide, non-exclusive, no-charge, royalty-free, irrevocable
   copyright license to reproduce, prepare Derivative Works of,
   publicly display, publicly perform, sublicense, and distribute the
   Work and such Derivative Works in Source or Object form.

3. Grant of Patent License. Subject to the terms and conditions of
   this License, each Contributor hereby grants to You a perpetual,
   worldwide, non-exclusive, no-charge, royalty-free, irrevocable
   (except as stated in this section) patent license to make, have made,
   use, offer to sell, sell, import, and otherwise transfer the Work,
   where such license applies only to those patent claims licensable
   by such Contributor that are necessarily infringed by their
   Contribution(s) alone or by combination of their Contribution(s)
   with the Work to which such Contribution(s) was submitted. If You
   institute patent litigation against any entity (including a
   cross-claim or counterclaim in a lawsuit) alleging that the Work
   or a Contribution incorporated within the Work constitutes direct
   or contributory patent infringement, then any patent licenses
   granted to You under this License for that Work shall terminate
   as of the date such litigation is filed.

4. Redistribution. You may reproduce and distribute copies of the
   Work or Derivative Works thereof in any medium, with or without
   modifications, and in Source or Object form, provided that You
   meet the following conditions:

   (a) You must give any other recipients of the Work or
       Derivative Works a copy of this License; and

   (b) You must cause any modified files to carry prominent notices
       stating that You changed the files; and

   (c) You must retain, in the Source form of any Derivative Works
       that You distribute, all copyright, patent, trademark, and
       attribution notices from the Source form of the Work,
       excluding those notices that do not pertain to any part of
       the Derivative Works; and

   (d) If the Work includes a &quot;NOTICE&quot; text file as part of its
       distribution, then any Derivative Works that You distribute must
       include a readable copy of the attribution notices contained
       within such NOTICE file, excluding those notices that do not
       pertain to any part of the Derivative Works, in at least one
       of the following places: within a NOTICE text file distributed
       as part of the Derivative Works; within the Source form or
       documentation, if provided along with the Derivative Works; or,
       within a display generated by the Derivative Works, if and
       wherever such third-party notices normally appear. The contents
       of the NOTICE file are for informational purposes only and
       do not modify the License. You may add Your own attribution
       notices within Derivative Works that You distribute, alongside
       or as an addendum to the NOTICE text from the Work, provided
       that such additional attribution notices cannot be construed
       as modifying the License.

   You may add Your own copyright statement to Your modifications and
   may provide additional or different license terms and conditions
   for use, reproduction, or distribution of Your modifications, or
   for any such Derivative Works as a whole, provided Your use,
   reproduction, and distribution of the Work otherwise complies with
   the conditions stated in this License.

5. Submission of Contributions. Unless You explicitly state otherwise,
   any Contribution intentionally submitted for inclusion in the Work
   by You to the Licensor shall be under the terms and conditions of
   this License, without any additional terms or conditions.
   Notwithstanding the above, nothing herein shall supersede or modify
   the terms of any separate license agreement you may have executed
   with Licensor regarding such Contributions.

6. Trademarks. This License does not grant permission to use the trade
   names, trademarks, service marks, or product names of the Licensor,
   except as required for reasonable and customary use in describing the
   origin of the Work and reproducing the content of the NOTICE file.

7. Disclaimer of Warranty. Unless required by applicable law or
   agreed to in writing, Licensor provides the Work (and each
   Contributor provides its Contributions) on an &quot;AS IS&quot; BASIS,
   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
   implied, including, without limitation, any warranties or conditions
   of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
   PARTICULAR PURPOSE. You are solely responsible for determining the
   appropriateness of using or redistributing the Work and assume any
   risks associated with Your exercise of permissions under this License.

8. Limitation of Liability. In no event and under no legal theory,
   whether in tort (including negligence), contract, or otherwise,
   unless required by applicable law (such as deliberate and grossly
   negligent acts) or agreed to in writing, shall any Contributor be
   liable to You for damages, including any direct, indirect, special,
   incidental, or consequential damages of any character arising as a
   result of this License or out of the use or inability to use the
   Work (including but not limited to damages for loss of goodwill,
   work stoppage, computer failure or malfunction, or any and all
   other commercial damages or losses), even if such Contributor
   has been advised of the possibility of such damages.

9. Accepting Warranty or Additional Liability. While redistributing
   the Work or Derivative Works thereof, You may choose to offer,
   and charge a fee for, acceptance of support, warranty, indemnity,
   or other liability obligations and/or rights consistent with this
   License. However, in accepting such obligations, You may act only
   on Your own behalf and on Your sole responsibility, not on behalf
   of any other Contributor, and only if You agree to indemnify,
   defend, and hold each Contributor harmless for any liability
   incurred by, or claims asserted against, such Contributor by reason
   of your accepting any such warranty or additional liability.

END OF TERMS AND CONDITIONS

APPENDIX: How to apply the Apache License to your work.

   To apply the Apache License to your work, attach the following
   boilerplate notice, with the fields enclosed by brackets &quot;[]&quot;
   replaced with your own identifying information. (Don&#x27;t include
   the brackets!)  The text should be enclosed in the appropriate
   comment syntax for the file format. We also recommend that a
   file or class name and description of purpose be included on the
   same &quot;printed page&quot; as the copyright notice for easier
   identification within third-party archives.

Copyright 2016 Sean McArthur

Licensed under the Apache License, Version 2.0 (the &quot;License&quot;);
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

	http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an &quot;AS IS&quot; BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
</pre>
            </li>
            <li class="license">
                <h3 id="Apache-2.0">Apache License 2.0</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/SergioBenitez/yansi ">yansi 1.0.1</a></li>
                </ul>
                <pre class="license-text">                              Apache License
                        Version 2.0, January 2004
                     http://www.apache.org/licenses/

TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION

1. Definitions.

   &quot;License&quot; shall mean the terms and conditions for use, reproduction,
   and distribution as defined by Sections 1 through 9 of this document.

   &quot;Licensor&quot; shall mean the copyright owner or entity authorized by
   the copyright owner that is granting the License.

   &quot;Legal Entity&quot; shall mean the union of the acting entity and all
   other entities that control, are controlled by, or are under common
   control with that entity. For the purposes of this definition,
   &quot;control&quot; means (i) the power, direct or indirect, to cause the
   direction or management of such entity, whether by contract or
   otherwise, or (ii) ownership of fifty percent (50%) or more of the
   outstanding shares, or (iii) beneficial ownership of such entity.

   &quot;You&quot; (or &quot;Your&quot;) shall mean an individual or Legal Entity
   exercising permissions granted by this License.

   &quot;Source&quot; form shall mean the preferred form for making modifications,
   including but not limited to software source code, documentation
   source, and configuration files.

   &quot;Object&quot; form shall mean any form resulting from mechanical
   transformation or translation of a Source form, including but
   not limited to compiled object code, generated documentation,
   and conversions to other media types.

   &quot;Work&quot; shall mean the work of authorship, whether in Source or
   Object form, made available under the License, as indicated by a
   copyright notice that is included in or attached to the work
   (an example is provided in the Appendix below).

   &quot;Derivative Works&quot; shall mean any work, whether in Source or Object
   form, that is based on (or derived from) the Work and for which the
   editorial revisions, annotations, elaborations, or other modifications
   represent, as a whole, an original work of authorship. For the purposes
   of this License, Derivative Works shall not include works that remain
   separable from, or merely link (or bind by name) to the interfaces of,
   the Work and Derivative Works thereof.

   &quot;Contribution&quot; shall mean any work of authorship, including
   the original version of the Work and any modifications or additions
   to that Work or Derivative Works thereof, that is intentionally
   submitted to Licensor for inclusion in the Work by the copyright owner
   or by an individual or Legal Entity authorized to submit on behalf of
   the copyright owner. For the purposes of this definition, &quot;submitted&quot;
   means any form of electronic, verbal, or written communication sent
   to the Licensor or its representatives, including but not limited to
   communication on electronic mailing lists, source code control systems,
   and issue tracking systems that are managed by, or on behalf of, the
   Licensor for the purpose of discussing and improving the Work, but
   excluding communication that is conspicuously marked or otherwise
   designated in writing by the copyright owner as &quot;Not a Contribution.&quot;

   &quot;Contributor&quot; shall mean Licensor and any individual or Legal Entity
   on behalf of whom a Contribution has been received by Licensor and
   subsequently incorporated within the Work.

2. Grant of Copyright License. Subject to the terms and conditions of
   this License, each Contributor hereby grants to You a perpetual,
   worldwide, non-exclusive, no-charge, royalty-free, irrevocable
   copyright license to reproduce, prepare Derivative Works of,
   publicly display, publicly perform, sublicense, and distribute the
   Work and such Derivative Works in Source or Object form.

3. Grant of Patent License. Subject to the terms and conditions of
   this License, each Contributor hereby grants to You a perpetual,
   worldwide, non-exclusive, no-charge, royalty-free, irrevocable
   (except as stated in this section) patent license to make, have made,
   use, offer to sell, sell, import, and otherwise transfer the Work,
   where such license applies only to those patent claims licensable
   by such Contributor that are necessarily infringed by their
   Contribution(s) alone or by combination of their Contribution(s)
   with the Work to which such Contribution(s) was submitted. If You
   institute patent litigation against any entity (including a
   cross-claim or counterclaim in a lawsuit) alleging that the Work
   or a Contribution incorporated within the Work constitutes direct
   or contributory patent infringement, then any patent licenses
   granted to You under this License for that Work shall terminate
   as of the date such litigation is filed.

4. Redistribution. You may reproduce and distribute copies of the
   Work or Derivative Works thereof in any medium, with or without
   modifications, and in Source or Object form, provided that You
   meet the following conditions:

   (a) You must give any other recipients of the Work or
       Derivative Works a copy of this License; and

   (b) You must cause any modified files to carry prominent notices
       stating that You changed the files; and

   (c) You must retain, in the Source form of any Derivative Works
       that You distribute, all copyright, patent, trademark, and
       attribution notices from the Source form of the Work,
       excluding those notices that do not pertain to any part of
       the Derivative Works; and

   (d) If the Work includes a &quot;NOTICE&quot; text file as part of its
       distribution, then any Derivative Works that You distribute must
       include a readable copy of the attribution notices contained
       within such NOTICE file, excluding those notices that do not
       pertain to any part of the Derivative Works, in at least one
       of the following places: within a NOTICE text file distributed
       as part of the Derivative Works; within the Source form or
       documentation, if provided along with the Derivative Works; or,
       within a display generated by the Derivative Works, if and
       wherever such third-party notices normally appear. The contents
       of the NOTICE file are for informational purposes only and
       do not modify the License. You may add Your own attribution
       notices within Derivative Works that You distribute, alongside
       or as an addendum to the NOTICE text from the Work, provided
       that such additional attribution notices cannot be construed
       as modifying the License.

   You may add Your own copyright statement to Your modifications and
   may provide additional or different license terms and conditions
   for use, reproduction, or distribution of Your modifications, or
   for any such Derivative Works as a whole, provided Your use,
   reproduction, and distribution of the Work otherwise complies with
   the conditions stated in this License.

5. Submission of Contributions. Unless You explicitly state otherwise,
   any Contribution intentionally submitted for inclusion in the Work
   by You to the Licensor shall be under the terms and conditions of
   this License, without any additional terms or conditions.
   Notwithstanding the above, nothing herein shall supersede or modify
   the terms of any separate license agreement you may have executed
   with Licensor regarding such Contributions.

6. Trademarks. This License does not grant permission to use the trade
   names, trademarks, service marks, or product names of the Licensor,
   except as required for reasonable and customary use in describing the
   origin of the Work and reproducing the content of the NOTICE file.

7. Disclaimer of Warranty. Unless required by applicable law or
   agreed to in writing, Licensor provides the Work (and each
   Contributor provides its Contributions) on an &quot;AS IS&quot; BASIS,
   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
   implied, including, without limitation, any warranties or conditions
   of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
   PARTICULAR PURPOSE. You are solely responsible for determining the
   appropriateness of using or redistributing the Work and assume any
   risks associated with Your exercise of permissions under this License.

8. Limitation of Liability. In no event and under no legal theory,
   whether in tort (including negligence), contract, or otherwise,
   unless required by applicable law (such as deliberate and grossly
   negligent acts) or agreed to in writing, shall any Contributor be
   liable to You for damages, including any direct, indirect, special,
   incidental, or consequential damages of any character arising as a
   result of this License or out of the use or inability to use the
   Work (including but not limited to damages for loss of goodwill,
   work stoppage, computer failure or malfunction, or any and all
   other commercial damages or losses), even if such Contributor
   has been advised of the possibility of such damages.

9. Accepting Warranty or Additional Liability. While redistributing
   the Work or Derivative Works thereof, You may choose to offer,
   and charge a fee for, acceptance of support, warranty, indemnity,
   or other liability obligations and/or rights consistent with this
   License. However, in accepting such obligations, You may act only
   on Your own behalf and on Your sole responsibility, not on behalf
   of any other Contributor, and only if You agree to indemnify,
   defend, and hold each Contributor harmless for any liability
   incurred by, or claims asserted against, such Contributor by reason
   of your accepting any such warranty or additional liability.

END OF TERMS AND CONDITIONS

APPENDIX: How to apply the Apache License to your work.

   To apply the Apache License to your work, attach the following
   boilerplate notice, with the fields enclosed by brackets &quot;[]&quot;
   replaced with your own identifying information. (Don&#x27;t include
   the brackets!)  The text should be enclosed in the appropriate
   comment syntax for the file format. We also recommend that a
   file or class name and description of purpose be included on the
   same &quot;printed page&quot; as the copyright notice for easier
   identification within third-party archives.

Copyright 2017 Sergio Benitez

Licensed under the Apache License, Version 2.0 (the &quot;License&quot;);
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

	http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an &quot;AS IS&quot; BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
</pre>
            </li>
            <li class="license">
                <h3 id="Apache-2.0">Apache License 2.0</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/hyperium/http ">http 0.2.12</a></li>
                    <li><a href=" https://github.com/hyperium/http ">http 1.1.0</a></li>
                </ul>
                <pre class="license-text">                              Apache License
                        Version 2.0, January 2004
                     http://www.apache.org/licenses/

TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION

1. Definitions.

   &quot;License&quot; shall mean the terms and conditions for use, reproduction,
   and distribution as defined by Sections 1 through 9 of this document.

   &quot;Licensor&quot; shall mean the copyright owner or entity authorized by
   the copyright owner that is granting the License.

   &quot;Legal Entity&quot; shall mean the union of the acting entity and all
   other entities that control, are controlled by, or are under common
   control with that entity. For the purposes of this definition,
   &quot;control&quot; means (i) the power, direct or indirect, to cause the
   direction or management of such entity, whether by contract or
   otherwise, or (ii) ownership of fifty percent (50%) or more of the
   outstanding shares, or (iii) beneficial ownership of such entity.

   &quot;You&quot; (or &quot;Your&quot;) shall mean an individual or Legal Entity
   exercising permissions granted by this License.

   &quot;Source&quot; form shall mean the preferred form for making modifications,
   including but not limited to software source code, documentation
   source, and configuration files.

   &quot;Object&quot; form shall mean any form resulting from mechanical
   transformation or translation of a Source form, including but
   not limited to compiled object code, generated documentation,
   and conversions to other media types.

   &quot;Work&quot; shall mean the work of authorship, whether in Source or
   Object form, made available under the License, as indicated by a
   copyright notice that is included in or attached to the work
   (an example is provided in the Appendix below).

   &quot;Derivative Works&quot; shall mean any work, whether in Source or Object
   form, that is based on (or derived from) the Work and for which the
   editorial revisions, annotations, elaborations, or other modifications
   represent, as a whole, an original work of authorship. For the purposes
   of this License, Derivative Works shall not include works that remain
   separable from, or merely link (or bind by name) to the interfaces of,
   the Work and Derivative Works thereof.

   &quot;Contribution&quot; shall mean any work of authorship, including
   the original version of the Work and any modifications or additions
   to that Work or Derivative Works thereof, that is intentionally
   submitted to Licensor for inclusion in the Work by the copyright owner
   or by an individual or Legal Entity authorized to submit on behalf of
   the copyright owner. For the purposes of this definition, &quot;submitted&quot;
   means any form of electronic, verbal, or written communication sent
   to the Licensor or its representatives, including but not limited to
   communication on electronic mailing lists, source code control systems,
   and issue tracking systems that are managed by, or on behalf of, the
   Licensor for the purpose of discussing and improving the Work, but
   excluding communication that is conspicuously marked or otherwise
   designated in writing by the copyright owner as &quot;Not a Contribution.&quot;

   &quot;Contributor&quot; shall mean Licensor and any individual or Legal Entity
   on behalf of whom a Contribution has been received by Licensor and
   subsequently incorporated within the Work.

2. Grant of Copyright License. Subject to the terms and conditions of
   this License, each Contributor hereby grants to You a perpetual,
   worldwide, non-exclusive, no-charge, royalty-free, irrevocable
   copyright license to reproduce, prepare Derivative Works of,
   publicly display, publicly perform, sublicense, and distribute the
   Work and such Derivative Works in Source or Object form.

3. Grant of Patent License. Subject to the terms and conditions of
   this License, each Contributor hereby grants to You a perpetual,
   worldwide, non-exclusive, no-charge, royalty-free, irrevocable
   (except as stated in this section) patent license to make, have made,
   use, offer to sell, sell, import, and otherwise transfer the Work,
   where such license applies only to those patent claims licensable
   by such Contributor that are necessarily infringed by their
   Contribution(s) alone or by combination of their Contribution(s)
   with the Work to which such Contribution(s) was submitted. If You
   institute patent litigation against any entity (including a
   cross-claim or counterclaim in a lawsuit) alleging that the Work
   or a Contribution incorporated within the Work constitutes direct
   or contributory patent infringement, then any patent licenses
   granted to You under this License for that Work shall terminate
   as of the date such litigation is filed.

4. Redistribution. You may reproduce and distribute copies of the
   Work or Derivative Works thereof in any medium, with or without
   modifications, and in Source or Object form, provided that You
   meet the following conditions:

   (a) You must give any other recipients of the Work or
       Derivative Works a copy of this License; and

   (b) You must cause any modified files to carry prominent notices
       stating that You changed the files; and

   (c) You must retain, in the Source form of any Derivative Works
       that You distribute, all copyright, patent, trademark, and
       attribution notices from the Source form of the Work,
       excluding those notices that do not pertain to any part of
       the Derivative Works; and

   (d) If the Work includes a &quot;NOTICE&quot; text file as part of its
       distribution, then any Derivative Works that You distribute must
       include a readable copy of the attribution notices contained
       within such NOTICE file, excluding those notices that do not
       pertain to any part of the Derivative Works, in at least one
       of the following places: within a NOTICE text file distributed
       as part of the Derivative Works; within the Source form or
       documentation, if provided along with the Derivative Works; or,
       within a display generated by the Derivative Works, if and
       wherever such third-party notices normally appear. The contents
       of the NOTICE file are for informational purposes only and
       do not modify the License. You may add Your own attribution
       notices within Derivative Works that You distribute, alongside
       or as an addendum to the NOTICE text from the Work, provided
       that such additional attribution notices cannot be construed
       as modifying the License.

   You may add Your own copyright statement to Your modifications and
   may provide additional or different license terms and conditions
   for use, reproduction, or distribution of Your modifications, or
   for any such Derivative Works as a whole, provided Your use,
   reproduction, and distribution of the Work otherwise complies with
   the conditions stated in this License.

5. Submission of Contributions. Unless You explicitly state otherwise,
   any Contribution intentionally submitted for inclusion in the Work
   by You to the Licensor shall be under the terms and conditions of
   this License, without any additional terms or conditions.
   Notwithstanding the above, nothing herein shall supersede or modify
   the terms of any separate license agreement you may have executed
   with Licensor regarding such Contributions.

6. Trademarks. This License does not grant permission to use the trade
   names, trademarks, service marks, or product names of the Licensor,
   except as required for reasonable and customary use in describing the
   origin of the Work and reproducing the content of the NOTICE file.

7. Disclaimer of Warranty. Unless required by applicable law or
   agreed to in writing, Licensor provides the Work (and each
   Contributor provides its Contributions) on an &quot;AS IS&quot; BASIS,
   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
   implied, including, without limitation, any warranties or conditions
   of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
   PARTICULAR PURPOSE. You are solely responsible for determining the
   appropriateness of using or redistributing the Work and assume any
   risks associated with Your exercise of permissions under this License.

8. Limitation of Liability. In no event and under no legal theory,
   whether in tort (including negligence), contract, or otherwise,
   unless required by applicable law (such as deliberate and grossly
   negligent acts) or agreed to in writing, shall any Contributor be
   liable to You for damages, including any direct, indirect, special,
   incidental, or consequential damages of any character arising as a
   result of this License or out of the use or inability to use the
   Work (including but not limited to damages for loss of goodwill,
   work stoppage, computer failure or malfunction, or any and all
   other commercial damages or losses), even if such Contributor
   has been advised of the possibility of such damages.

9. Accepting Warranty or Additional Liability. While redistributing
   the Work or Derivative Works thereof, You may choose to offer,
   and charge a fee for, acceptance of support, warranty, indemnity,
   or other liability obligations and/or rights consistent with this
   License. However, in accepting such obligations, You may act only
   on Your own behalf and on Your sole responsibility, not on behalf
   of any other Contributor, and only if You agree to indemnify,
   defend, and hold each Contributor harmless for any liability
   incurred by, or claims asserted against, such Contributor by reason
   of your accepting any such warranty or additional liability.

END OF TERMS AND CONDITIONS

APPENDIX: How to apply the Apache License to your work.

   To apply the Apache License to your work, attach the following
   boilerplate notice, with the fields enclosed by brackets &quot;[]&quot;
   replaced with your own identifying information. (Don&#x27;t include
   the brackets!)  The text should be enclosed in the appropriate
   comment syntax for the file format. We also recommend that a
   file or class name and description of purpose be included on the
   same &quot;printed page&quot; as the copyright notice for easier
   identification within third-party archives.

Copyright 2017 http-rs authors

Licensed under the Apache License, Version 2.0 (the &quot;License&quot;);
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

	http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an &quot;AS IS&quot; BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
</pre>
            </li>
            <li class="license">
                <h3 id="Apache-2.0">Apache License 2.0</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/rustls/tokio-rustls ">tokio-rustls 0.24.1</a></li>
                </ul>
                <pre class="license-text">                              Apache License
                        Version 2.0, January 2004
                     http://www.apache.org/licenses/

TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION

1. Definitions.

   &quot;License&quot; shall mean the terms and conditions for use, reproduction,
   and distribution as defined by Sections 1 through 9 of this document.

   &quot;Licensor&quot; shall mean the copyright owner or entity authorized by
   the copyright owner that is granting the License.

   &quot;Legal Entity&quot; shall mean the union of the acting entity and all
   other entities that control, are controlled by, or are under common
   control with that entity. For the purposes of this definition,
   &quot;control&quot; means (i) the power, direct or indirect, to cause the
   direction or management of such entity, whether by contract or
   otherwise, or (ii) ownership of fifty percent (50%) or more of the
   outstanding shares, or (iii) beneficial ownership of such entity.

   &quot;You&quot; (or &quot;Your&quot;) shall mean an individual or Legal Entity
   exercising permissions granted by this License.

   &quot;Source&quot; form shall mean the preferred form for making modifications,
   including but not limited to software source code, documentation
   source, and configuration files.

   &quot;Object&quot; form shall mean any form resulting from mechanical
   transformation or translation of a Source form, including but
   not limited to compiled object code, generated documentation,
   and conversions to other media types.

   &quot;Work&quot; shall mean the work of authorship, whether in Source or
   Object form, made available under the License, as indicated by a
   copyright notice that is included in or attached to the work
   (an example is provided in the Appendix below).

   &quot;Derivative Works&quot; shall mean any work, whether in Source or Object
   form, that is based on (or derived from) the Work and for which the
   editorial revisions, annotations, elaborations, or other modifications
   represent, as a whole, an original work of authorship. For the purposes
   of this License, Derivative Works shall not include works that remain
   separable from, or merely link (or bind by name) to the interfaces of,
   the Work and Derivative Works thereof.

   &quot;Contribution&quot; shall mean any work of authorship, including
   the original version of the Work and any modifications or additions
   to that Work or Derivative Works thereof, that is intentionally
   submitted to Licensor for inclusion in the Work by the copyright owner
   or by an individual or Legal Entity authorized to submit on behalf of
   the copyright owner. For the purposes of this definition, &quot;submitted&quot;
   means any form of electronic, verbal, or written communication sent
   to the Licensor or its representatives, including but not limited to
   communication on electronic mailing lists, source code control systems,
   and issue tracking systems that are managed by, or on behalf of, the
   Licensor for the purpose of discussing and improving the Work, but
   excluding communication that is conspicuously marked or otherwise
   designated in writing by the copyright owner as &quot;Not a Contribution.&quot;

   &quot;Contributor&quot; shall mean Licensor and any individual or Legal Entity
   on behalf of whom a Contribution has been received by Licensor and
   subsequently incorporated within the Work.

2. Grant of Copyright License. Subject to the terms and conditions of
   this License, each Contributor hereby grants to You a perpetual,
   worldwide, non-exclusive, no-charge, royalty-free, irrevocable
   copyright license to reproduce, prepare Derivative Works of,
   publicly display, publicly perform, sublicense, and distribute the
   Work and such Derivative Works in Source or Object form.

3. Grant of Patent License. Subject to the terms and conditions of
   this License, each Contributor hereby grants to You a perpetual,
   worldwide, non-exclusive, no-charge, royalty-free, irrevocable
   (except as stated in this section) patent license to make, have made,
   use, offer to sell, sell, import, and otherwise transfer the Work,
   where such license applies only to those patent claims licensable
   by such Contributor that are necessarily infringed by their
   Contribution(s) alone or by combination of their Contribution(s)
   with the Work to which such Contribution(s) was submitted. If You
   institute patent litigation against any entity (including a
   cross-claim or counterclaim in a lawsuit) alleging that the Work
   or a Contribution incorporated within the Work constitutes direct
   or contributory patent infringement, then any patent licenses
   granted to You under this License for that Work shall terminate
   as of the date such litigation is filed.

4. Redistribution. You may reproduce and distribute copies of the
   Work or Derivative Works thereof in any medium, with or without
   modifications, and in Source or Object form, provided that You
   meet the following conditions:

   (a) You must give any other recipients of the Work or
       Derivative Works a copy of this License; and

   (b) You must cause any modified files to carry prominent notices
       stating that You changed the files; and

   (c) You must retain, in the Source form of any Derivative Works
       that You distribute, all copyright, patent, trademark, and
       attribution notices from the Source form of the Work,
       excluding those notices that do not pertain to any part of
       the Derivative Works; and

   (d) If the Work includes a &quot;NOTICE&quot; text file as part of its
       distribution, then any Derivative Works that You distribute must
       include a readable copy of the attribution notices contained
       within such NOTICE file, excluding those notices that do not
       pertain to any part of the Derivative Works, in at least one
       of the following places: within a NOTICE text file distributed
       as part of the Derivative Works; within the Source form or
       documentation, if provided along with the Derivative Works; or,
       within a display generated by the Derivative Works, if and
       wherever such third-party notices normally appear. The contents
       of the NOTICE file are for informational purposes only and
       do not modify the License. You may add Your own attribution
       notices within Derivative Works that You distribute, alongside
       or as an addendum to the NOTICE text from the Work, provided
       that such additional attribution notices cannot be construed
       as modifying the License.

   You may add Your own copyright statement to Your modifications and
   may provide additional or different license terms and conditions
   for use, reproduction, or distribution of Your modifications, or
   for any such Derivative Works as a whole, provided Your use,
   reproduction, and distribution of the Work otherwise complies with
   the conditions stated in this License.

5. Submission of Contributions. Unless You explicitly state otherwise,
   any Contribution intentionally submitted for inclusion in the Work
   by You to the Licensor shall be under the terms and conditions of
   this License, without any additional terms or conditions.
   Notwithstanding the above, nothing herein shall supersede or modify
   the terms of any separate license agreement you may have executed
   with Licensor regarding such Contributions.

6. Trademarks. This License does not grant permission to use the trade
   names, trademarks, service marks, or product names of the Licensor,
   except as required for reasonable and customary use in describing the
   origin of the Work and reproducing the content of the NOTICE file.

7. Disclaimer of Warranty. Unless required by applicable law or
   agreed to in writing, Licensor provides the Work (and each
   Contributor provides its Contributions) on an &quot;AS IS&quot; BASIS,
   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
   implied, including, without limitation, any warranties or conditions
   of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
   PARTICULAR PURPOSE. You are solely responsible for determining the
   appropriateness of using or redistributing the Work and assume any
   risks associated with Your exercise of permissions under this License.

8. Limitation of Liability. In no event and under no legal theory,
   whether in tort (including negligence), contract, or otherwise,
   unless required by applicable law (such as deliberate and grossly
   negligent acts) or agreed to in writing, shall any Contributor be
   liable to You for damages, including any direct, indirect, special,
   incidental, or consequential damages of any character arising as a
   result of this License or out of the use or inability to use the
   Work (including but not limited to damages for loss of goodwill,
   work stoppage, computer failure or malfunction, or any and all
   other commercial damages or losses), even if such Contributor
   has been advised of the possibility of such damages.

9. Accepting Warranty or Additional Liability. While redistributing
   the Work or Derivative Works thereof, You may choose to offer,
   and charge a fee for, acceptance of support, warranty, indemnity,
   or other liability obligations and/or rights consistent with this
   License. However, in accepting such obligations, You may act only
   on Your own behalf and on Your sole responsibility, not on behalf
   of any other Contributor, and only if You agree to indemnify,
   defend, and hold each Contributor harmless for any liability
   incurred by, or claims asserted against, such Contributor by reason
   of your accepting any such warranty or additional liability.

END OF TERMS AND CONDITIONS

APPENDIX: How to apply the Apache License to your work.

   To apply the Apache License to your work, attach the following
   boilerplate notice, with the fields enclosed by brackets &quot;[]&quot;
   replaced with your own identifying information. (Don&#x27;t include
   the brackets!)  The text should be enclosed in the appropriate
   comment syntax for the file format. We also recommend that a
   file or class name and description of purpose be included on the
   same &quot;printed page&quot; as the copyright notice for easier
   identification within third-party archives.

Copyright 2017 quininer kel

Licensed under the Apache License, Version 2.0 (the &quot;License&quot;);
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

	http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an &quot;AS IS&quot; BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
</pre>
            </li>
            <li class="license">
                <h3 id="Apache-2.0">Apache License 2.0</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/rust-lang-nursery/pin-utils ">pin-utils 0.1.0</a></li>
                </ul>
                <pre class="license-text">                              Apache License
                        Version 2.0, January 2004
                     http://www.apache.org/licenses/

TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION

1. Definitions.

   &quot;License&quot; shall mean the terms and conditions for use, reproduction,
   and distribution as defined by Sections 1 through 9 of this document.

   &quot;Licensor&quot; shall mean the copyright owner or entity authorized by
   the copyright owner that is granting the License.

   &quot;Legal Entity&quot; shall mean the union of the acting entity and all
   other entities that control, are controlled by, or are under common
   control with that entity. For the purposes of this definition,
   &quot;control&quot; means (i) the power, direct or indirect, to cause the
   direction or management of such entity, whether by contract or
   otherwise, or (ii) ownership of fifty percent (50%) or more of the
   outstanding shares, or (iii) beneficial ownership of such entity.

   &quot;You&quot; (or &quot;Your&quot;) shall mean an individual or Legal Entity
   exercising permissions granted by this License.

   &quot;Source&quot; form shall mean the preferred form for making modifications,
   including but not limited to software source code, documentation
   source, and configuration files.

   &quot;Object&quot; form shall mean any form resulting from mechanical
   transformation or translation of a Source form, including but
   not limited to compiled object code, generated documentation,
   and conversions to other media types.

   &quot;Work&quot; shall mean the work of authorship, whether in Source or
   Object form, made available under the License, as indicated by a
   copyright notice that is included in or attached to the work
   (an example is provided in the Appendix below).

   &quot;Derivative Works&quot; shall mean any work, whether in Source or Object
   form, that is based on (or derived from) the Work and for which the
   editorial revisions, annotations, elaborations, or other modifications
   represent, as a whole, an original work of authorship. For the purposes
   of this License, Derivative Works shall not include works that remain
   separable from, or merely link (or bind by name) to the interfaces of,
   the Work and Derivative Works thereof.

   &quot;Contribution&quot; shall mean any work of authorship, including
   the original version of the Work and any modifications or additions
   to that Work or Derivative Works thereof, that is intentionally
   submitted to Licensor for inclusion in the Work by the copyright owner
   or by an individual or Legal Entity authorized to submit on behalf of
   the copyright owner. For the purposes of this definition, &quot;submitted&quot;
   means any form of electronic, verbal, or written communication sent
   to the Licensor or its representatives, including but not limited to
   communication on electronic mailing lists, source code control systems,
   and issue tracking systems that are managed by, or on behalf of, the
   Licensor for the purpose of discussing and improving the Work, but
   excluding communication that is conspicuously marked or otherwise
   designated in writing by the copyright owner as &quot;Not a Contribution.&quot;

   &quot;Contributor&quot; shall mean Licensor and any individual or Legal Entity
   on behalf of whom a Contribution has been received by Licensor and
   subsequently incorporated within the Work.

2. Grant of Copyright License. Subject to the terms and conditions of
   this License, each Contributor hereby grants to You a perpetual,
   worldwide, non-exclusive, no-charge, royalty-free, irrevocable
   copyright license to reproduce, prepare Derivative Works of,
   publicly display, publicly perform, sublicense, and distribute the
   Work and such Derivative Works in Source or Object form.

3. Grant of Patent License. Subject to the terms and conditions of
   this License, each Contributor hereby grants to You a perpetual,
   worldwide, non-exclusive, no-charge, royalty-free, irrevocable
   (except as stated in this section) patent license to make, have made,
   use, offer to sell, sell, import, and otherwise transfer the Work,
   where such license applies only to those patent claims licensable
   by such Contributor that are necessarily infringed by their
   Contribution(s) alone or by combination of their Contribution(s)
   with the Work to which such Contribution(s) was submitted. If You
   institute patent litigation against any entity (including a
   cross-claim or counterclaim in a lawsuit) alleging that the Work
   or a Contribution incorporated within the Work constitutes direct
   or contributory patent infringement, then any patent licenses
   granted to You under this License for that Work shall terminate
   as of the date such litigation is filed.

4. Redistribution. You may reproduce and distribute copies of the
   Work or Derivative Works thereof in any medium, with or without
   modifications, and in Source or Object form, provided that You
   meet the following conditions:

   (a) You must give any other recipients of the Work or
       Derivative Works a copy of this License; and

   (b) You must cause any modified files to carry prominent notices
       stating that You changed the files; and

   (c) You must retain, in the Source form of any Derivative Works
       that You distribute, all copyright, patent, trademark, and
       attribution notices from the Source form of the Work,
       excluding those notices that do not pertain to any part of
       the Derivative Works; and

   (d) If the Work includes a &quot;NOTICE&quot; text file as part of its
       distribution, then any Derivative Works that You distribute must
       include a readable copy of the attribution notices contained
       within such NOTICE file, excluding those notices that do not
       pertain to any part of the Derivative Works, in at least one
       of the following places: within a NOTICE text file distributed
       as part of the Derivative Works; within the Source form or
       documentation, if provided along with the Derivative Works; or,
       within a display generated by the Derivative Works, if and
       wherever such third-party notices normally appear. The contents
       of the NOTICE file are for informational purposes only and
       do not modify the License. You may add Your own attribution
       notices within Derivative Works that You distribute, alongside
       or as an addendum to the NOTICE text from the Work, provided
       that such additional attribution notices cannot be construed
       as modifying the License.

   You may add Your own copyright statement to Your modifications and
   may provide additional or different license terms and conditions
   for use, reproduction, or distribution of Your modifications, or
   for any such Derivative Works as a whole, provided Your use,
   reproduction, and distribution of the Work otherwise complies with
   the conditions stated in this License.

5. Submission of Contributions. Unless You explicitly state otherwise,
   any Contribution intentionally submitted for inclusion in the Work
   by You to the Licensor shall be under the terms and conditions of
   this License, without any additional terms or conditions.
   Notwithstanding the above, nothing herein shall supersede or modify
   the terms of any separate license agreement you may have executed
   with Licensor regarding such Contributions.

6. Trademarks. This License does not grant permission to use the trade
   names, trademarks, service marks, or product names of the Licensor,
   except as required for reasonable and customary use in describing the
   origin of the Work and reproducing the content of the NOTICE file.

7. Disclaimer of Warranty. Unless required by applicable law or
   agreed to in writing, Licensor provides the Work (and each
   Contributor provides its Contributions) on an &quot;AS IS&quot; BASIS,
   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
   implied, including, without limitation, any warranties or conditions
   of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
   PARTICULAR PURPOSE. You are solely responsible for determining the
   appropriateness of using or redistributing the Work and assume any
   risks associated with Your exercise of permissions under this License.

8. Limitation of Liability. In no event and under no legal theory,
   whether in tort (including negligence), contract, or otherwise,
   unless required by applicable law (such as deliberate and grossly
   negligent acts) or agreed to in writing, shall any Contributor be
   liable to You for damages, including any direct, indirect, special,
   incidental, or consequential damages of any character arising as a
   result of this License or out of the use or inability to use the
   Work (including but not limited to damages for loss of goodwill,
   work stoppage, computer failure or malfunction, or any and all
   other commercial damages or losses), even if such Contributor
   has been advised of the possibility of such damages.

9. Accepting Warranty or Additional Liability. While redistributing
   the Work or Derivative Works thereof, You may choose to offer,
   and charge a fee for, acceptance of support, warranty, indemnity,
   or other liability obligations and/or rights consistent with this
   License. However, in accepting such obligations, You may act only
   on Your own behalf and on Your sole responsibility, not on behalf
   of any other Contributor, and only if You agree to indemnify,
   defend, and hold each Contributor harmless for any liability
   incurred by, or claims asserted against, such Contributor by reason
   of your accepting any such warranty or additional liability.

END OF TERMS AND CONDITIONS

APPENDIX: How to apply the Apache License to your work.

   To apply the Apache License to your work, attach the following
   boilerplate notice, with the fields enclosed by brackets &quot;[]&quot;
   replaced with your own identifying information. (Don&#x27;t include
   the brackets!)  The text should be enclosed in the appropriate
   comment syntax for the file format. We also recommend that a
   file or class name and description of purpose be included on the
   same &quot;printed page&quot; as the copyright notice for easier
   identification within third-party archives.

Copyright 2018 The pin-utils authors

Licensed under the Apache License, Version 2.0 (the &quot;License&quot;);
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

	http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an &quot;AS IS&quot; BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
</pre>
            </li>
            <li class="license">
                <h3 id="Apache-2.0">Apache License 2.0</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/RustCrypto/signatures/tree/master/ecdsa ">ecdsa 0.14.8</a></li>
                    <li><a href=" https://github.com/RustCrypto/signatures/tree/master/rfc6979 ">rfc6979 0.3.1</a></li>
                </ul>
                <pre class="license-text">                              Apache License
                        Version 2.0, January 2004
                     http://www.apache.org/licenses/

TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION

1. Definitions.

   &quot;License&quot; shall mean the terms and conditions for use, reproduction,
   and distribution as defined by Sections 1 through 9 of this document.

   &quot;Licensor&quot; shall mean the copyright owner or entity authorized by
   the copyright owner that is granting the License.

   &quot;Legal Entity&quot; shall mean the union of the acting entity and all
   other entities that control, are controlled by, or are under common
   control with that entity. For the purposes of this definition,
   &quot;control&quot; means (i) the power, direct or indirect, to cause the
   direction or management of such entity, whether by contract or
   otherwise, or (ii) ownership of fifty percent (50%) or more of the
   outstanding shares, or (iii) beneficial ownership of such entity.

   &quot;You&quot; (or &quot;Your&quot;) shall mean an individual or Legal Entity
   exercising permissions granted by this License.

   &quot;Source&quot; form shall mean the preferred form for making modifications,
   including but not limited to software source code, documentation
   source, and configuration files.

   &quot;Object&quot; form shall mean any form resulting from mechanical
   transformation or translation of a Source form, including but
   not limited to compiled object code, generated documentation,
   and conversions to other media types.

   &quot;Work&quot; shall mean the work of authorship, whether in Source or
   Object form, made available under the License, as indicated by a
   copyright notice that is included in or attached to the work
   (an example is provided in the Appendix below).

   &quot;Derivative Works&quot; shall mean any work, whether in Source or Object
   form, that is based on (or derived from) the Work and for which the
   editorial revisions, annotations, elaborations, or other modifications
   represent, as a whole, an original work of authorship. For the purposes
   of this License, Derivative Works shall not include works that remain
   separable from, or merely link (or bind by name) to the interfaces of,
   the Work and Derivative Works thereof.

   &quot;Contribution&quot; shall mean any work of authorship, including
   the original version of the Work and any modifications or additions
   to that Work or Derivative Works thereof, that is intentionally
   submitted to Licensor for inclusion in the Work by the copyright owner
   or by an individual or Legal Entity authorized to submit on behalf of
   the copyright owner. For the purposes of this definition, &quot;submitted&quot;
   means any form of electronic, verbal, or written communication sent
   to the Licensor or its representatives, including but not limited to
   communication on electronic mailing lists, source code control systems,
   and issue tracking systems that are managed by, or on behalf of, the
   Licensor for the purpose of discussing and improving the Work, but
   excluding communication that is conspicuously marked or otherwise
   designated in writing by the copyright owner as &quot;Not a Contribution.&quot;

   &quot;Contributor&quot; shall mean Licensor and any individual or Legal Entity
   on behalf of whom a Contribution has been received by Licensor and
   subsequently incorporated within the Work.

2. Grant of Copyright License. Subject to the terms and conditions of
   this License, each Contributor hereby grants to You a perpetual,
   worldwide, non-exclusive, no-charge, royalty-free, irrevocable
   copyright license to reproduce, prepare Derivative Works of,
   publicly display, publicly perform, sublicense, and distribute the
   Work and such Derivative Works in Source or Object form.

3. Grant of Patent License. Subject to the terms and conditions of
   this License, each Contributor hereby grants to You a perpetual,
   worldwide, non-exclusive, no-charge, royalty-free, irrevocable
   (except as stated in this section) patent license to make, have made,
   use, offer to sell, sell, import, and otherwise transfer the Work,
   where such license applies only to those patent claims licensable
   by such Contributor that are necessarily infringed by their
   Contribution(s) alone or by combination of their Contribution(s)
   with the Work to which such Contribution(s) was submitted. If You
   institute patent litigation against any entity (including a
   cross-claim or counterclaim in a lawsuit) alleging that the Work
   or a Contribution incorporated within the Work constitutes direct
   or contributory patent infringement, then any patent licenses
   granted to You under this License for that Work shall terminate
   as of the date such litigation is filed.

4. Redistribution. You may reproduce and distribute copies of the
   Work or Derivative Works thereof in any medium, with or without
   modifications, and in Source or Object form, provided that You
   meet the following conditions:

   (a) You must give any other recipients of the Work or
       Derivative Works a copy of this License; and

   (b) You must cause any modified files to carry prominent notices
       stating that You changed the files; and

   (c) You must retain, in the Source form of any Derivative Works
       that You distribute, all copyright, patent, trademark, and
       attribution notices from the Source form of the Work,
       excluding those notices that do not pertain to any part of
       the Derivative Works; and

   (d) If the Work includes a &quot;NOTICE&quot; text file as part of its
       distribution, then any Derivative Works that You distribute must
       include a readable copy of the attribution notices contained
       within such NOTICE file, excluding those notices that do not
       pertain to any part of the Derivative Works, in at least one
       of the following places: within a NOTICE text file distributed
       as part of the Derivative Works; within the Source form or
       documentation, if provided along with the Derivative Works; or,
       within a display generated by the Derivative Works, if and
       wherever such third-party notices normally appear. The contents
       of the NOTICE file are for informational purposes only and
       do not modify the License. You may add Your own attribution
       notices within Derivative Works that You distribute, alongside
       or as an addendum to the NOTICE text from the Work, provided
       that such additional attribution notices cannot be construed
       as modifying the License.

   You may add Your own copyright statement to Your modifications and
   may provide additional or different license terms and conditions
   for use, reproduction, or distribution of Your modifications, or
   for any such Derivative Works as a whole, provided Your use,
   reproduction, and distribution of the Work otherwise complies with
   the conditions stated in this License.

5. Submission of Contributions. Unless You explicitly state otherwise,
   any Contribution intentionally submitted for inclusion in the Work
   by You to the Licensor shall be under the terms and conditions of
   this License, without any additional terms or conditions.
   Notwithstanding the above, nothing herein shall supersede or modify
   the terms of any separate license agreement you may have executed
   with Licensor regarding such Contributions.

6. Trademarks. This License does not grant permission to use the trade
   names, trademarks, service marks, or product names of the Licensor,
   except as required for reasonable and customary use in describing the
   origin of the Work and reproducing the content of the NOTICE file.

7. Disclaimer of Warranty. Unless required by applicable law or
   agreed to in writing, Licensor provides the Work (and each
   Contributor provides its Contributions) on an &quot;AS IS&quot; BASIS,
   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
   implied, including, without limitation, any warranties or conditions
   of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
   PARTICULAR PURPOSE. You are solely responsible for determining the
   appropriateness of using or redistributing the Work and assume any
   risks associated with Your exercise of permissions under this License.

8. Limitation of Liability. In no event and under no legal theory,
   whether in tort (including negligence), contract, or otherwise,
   unless required by applicable law (such as deliberate and grossly
   negligent acts) or agreed to in writing, shall any Contributor be
   liable to You for damages, including any direct, indirect, special,
   incidental, or consequential damages of any character arising as a
   result of this License or out of the use or inability to use the
   Work (including but not limited to damages for loss of goodwill,
   work stoppage, computer failure or malfunction, or any and all
   other commercial damages or losses), even if such Contributor
   has been advised of the possibility of such damages.

9. Accepting Warranty or Additional Liability. While redistributing
   the Work or Derivative Works thereof, You may choose to offer,
   and charge a fee for, acceptance of support, warranty, indemnity,
   or other liability obligations and/or rights consistent with this
   License. However, in accepting such obligations, You may act only
   on Your own behalf and on Your sole responsibility, not on behalf
   of any other Contributor, and only if You agree to indemnify,
   defend, and hold each Contributor harmless for any liability
   incurred by, or claims asserted against, such Contributor by reason
   of your accepting any such warranty or additional liability.

END OF TERMS AND CONDITIONS

APPENDIX: How to apply the Apache License to your work.

   To apply the Apache License to your work, attach the following
   boilerplate notice, with the fields enclosed by brackets &quot;[]&quot;
   replaced with your own identifying information. (Don&#x27;t include
   the brackets!)  The text should be enclosed in the appropriate
   comment syntax for the file format. We also recommend that a
   file or class name and description of purpose be included on the
   same &quot;printed page&quot; as the copyright notice for easier
   identification within third-party archives.

Copyright 2018-2022 RustCrypto Developers

Licensed under the Apache License, Version 2.0 (the &quot;License&quot;);
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

	http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an &quot;AS IS&quot; BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
</pre>
            </li>
            <li class="license">
                <h3 id="Apache-2.0">Apache License 2.0</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/cryptocorrosion/cryptocorrosion ">ppv-lite86 0.2.20</a></li>
                </ul>
                <pre class="license-text">                              Apache License
                        Version 2.0, January 2004
                     http://www.apache.org/licenses/

TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION

1. Definitions.

   &quot;License&quot; shall mean the terms and conditions for use, reproduction,
   and distribution as defined by Sections 1 through 9 of this document.

   &quot;Licensor&quot; shall mean the copyright owner or entity authorized by
   the copyright owner that is granting the License.

   &quot;Legal Entity&quot; shall mean the union of the acting entity and all
   other entities that control, are controlled by, or are under common
   control with that entity. For the purposes of this definition,
   &quot;control&quot; means (i) the power, direct or indirect, to cause the
   direction or management of such entity, whether by contract or
   otherwise, or (ii) ownership of fifty percent (50%) or more of the
   outstanding shares, or (iii) beneficial ownership of such entity.

   &quot;You&quot; (or &quot;Your&quot;) shall mean an individual or Legal Entity
   exercising permissions granted by this License.

   &quot;Source&quot; form shall mean the preferred form for making modifications,
   including but not limited to software source code, documentation
   source, and configuration files.

   &quot;Object&quot; form shall mean any form resulting from mechanical
   transformation or translation of a Source form, including but
   not limited to compiled object code, generated documentation,
   and conversions to other media types.

   &quot;Work&quot; shall mean the work of authorship, whether in Source or
   Object form, made available under the License, as indicated by a
   copyright notice that is included in or attached to the work
   (an example is provided in the Appendix below).

   &quot;Derivative Works&quot; shall mean any work, whether in Source or Object
   form, that is based on (or derived from) the Work and for which the
   editorial revisions, annotations, elaborations, or other modifications
   represent, as a whole, an original work of authorship. For the purposes
   of this License, Derivative Works shall not include works that remain
   separable from, or merely link (or bind by name) to the interfaces of,
   the Work and Derivative Works thereof.

   &quot;Contribution&quot; shall mean any work of authorship, including
   the original version of the Work and any modifications or additions
   to that Work or Derivative Works thereof, that is intentionally
   submitted to Licensor for inclusion in the Work by the copyright owner
   or by an individual or Legal Entity authorized to submit on behalf of
   the copyright owner. For the purposes of this definition, &quot;submitted&quot;
   means any form of electronic, verbal, or written communication sent
   to the Licensor or its representatives, including but not limited to
   communication on electronic mailing lists, source code control systems,
   and issue tracking systems that are managed by, or on behalf of, the
   Licensor for the purpose of discussing and improving the Work, but
   excluding communication that is conspicuously marked or otherwise
   designated in writing by the copyright owner as &quot;Not a Contribution.&quot;

   &quot;Contributor&quot; shall mean Licensor and any individual or Legal Entity
   on behalf of whom a Contribution has been received by Licensor and
   subsequently incorporated within the Work.

2. Grant of Copyright License. Subject to the terms and conditions of
   this License, each Contributor hereby grants to You a perpetual,
   worldwide, non-exclusive, no-charge, royalty-free, irrevocable
   copyright license to reproduce, prepare Derivative Works of,
   publicly display, publicly perform, sublicense, and distribute the
   Work and such Derivative Works in Source or Object form.

3. Grant of Patent License. Subject to the terms and conditions of
   this License, each Contributor hereby grants to You a perpetual,
   worldwide, non-exclusive, no-charge, royalty-free, irrevocable
   (except as stated in this section) patent license to make, have made,
   use, offer to sell, sell, import, and otherwise transfer the Work,
   where such license applies only to those patent claims licensable
   by such Contributor that are necessarily infringed by their
   Contribution(s) alone or by combination of their Contribution(s)
   with the Work to which such Contribution(s) was submitted. If You
   institute patent litigation against any entity (including a
   cross-claim or counterclaim in a lawsuit) alleging that the Work
   or a Contribution incorporated within the Work constitutes direct
   or contributory patent infringement, then any patent licenses
   granted to You under this License for that Work shall terminate
   as of the date such litigation is filed.

4. Redistribution. You may reproduce and distribute copies of the
   Work or Derivative Works thereof in any medium, with or without
   modifications, and in Source or Object form, provided that You
   meet the following conditions:

   (a) You must give any other recipients of the Work or
       Derivative Works a copy of this License; and

   (b) You must cause any modified files to carry prominent notices
       stating that You changed the files; and

   (c) You must retain, in the Source form of any Derivative Works
       that You distribute, all copyright, patent, trademark, and
       attribution notices from the Source form of the Work,
       excluding those notices that do not pertain to any part of
       the Derivative Works; and

   (d) If the Work includes a &quot;NOTICE&quot; text file as part of its
       distribution, then any Derivative Works that You distribute must
       include a readable copy of the attribution notices contained
       within such NOTICE file, excluding those notices that do not
       pertain to any part of the Derivative Works, in at least one
       of the following places: within a NOTICE text file distributed
       as part of the Derivative Works; within the Source form or
       documentation, if provided along with the Derivative Works; or,
       within a display generated by the Derivative Works, if and
       wherever such third-party notices normally appear. The contents
       of the NOTICE file are for informational purposes only and
       do not modify the License. You may add Your own attribution
       notices within Derivative Works that You distribute, alongside
       or as an addendum to the NOTICE text from the Work, provided
       that such additional attribution notices cannot be construed
       as modifying the License.

   You may add Your own copyright statement to Your modifications and
   may provide additional or different license terms and conditions
   for use, reproduction, or distribution of Your modifications, or
   for any such Derivative Works as a whole, provided Your use,
   reproduction, and distribution of the Work otherwise complies with
   the conditions stated in this License.

5. Submission of Contributions. Unless You explicitly state otherwise,
   any Contribution intentionally submitted for inclusion in the Work
   by You to the Licensor shall be under the terms and conditions of
   this License, without any additional terms or conditions.
   Notwithstanding the above, nothing herein shall supersede or modify
   the terms of any separate license agreement you may have executed
   with Licensor regarding such Contributions.

6. Trademarks. This License does not grant permission to use the trade
   names, trademarks, service marks, or product names of the Licensor,
   except as required for reasonable and customary use in describing the
   origin of the Work and reproducing the content of the NOTICE file.

7. Disclaimer of Warranty. Unless required by applicable law or
   agreed to in writing, Licensor provides the Work (and each
   Contributor provides its Contributions) on an &quot;AS IS&quot; BASIS,
   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
   implied, including, without limitation, any warranties or conditions
   of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
   PARTICULAR PURPOSE. You are solely responsible for determining the
   appropriateness of using or redistributing the Work and assume any
   risks associated with Your exercise of permissions under this License.

8. Limitation of Liability. In no event and under no legal theory,
   whether in tort (including negligence), contract, or otherwise,
   unless required by applicable law (such as deliberate and grossly
   negligent acts) or agreed to in writing, shall any Contributor be
   liable to You for damages, including any direct, indirect, special,
   incidental, or consequential damages of any character arising as a
   result of this License or out of the use or inability to use the
   Work (including but not limited to damages for loss of goodwill,
   work stoppage, computer failure or malfunction, or any and all
   other commercial damages or losses), even if such Contributor
   has been advised of the possibility of such damages.

9. Accepting Warranty or Additional Liability. While redistributing
   the Work or Derivative Works thereof, You may choose to offer,
   and charge a fee for, acceptance of support, warranty, indemnity,
   or other liability obligations and/or rights consistent with this
   License. However, in accepting such obligations, You may act only
   on Your own behalf and on Your sole responsibility, not on behalf
   of any other Contributor, and only if You agree to indemnify,
   defend, and hold each Contributor harmless for any liability
   incurred by, or claims asserted against, such Contributor by reason
   of your accepting any such warranty or additional liability.

END OF TERMS AND CONDITIONS

APPENDIX: How to apply the Apache License to your work.

   To apply the Apache License to your work, attach the following
   boilerplate notice, with the fields enclosed by brackets &quot;[]&quot;
   replaced with your own identifying information. (Don&#x27;t include
   the brackets!)  The text should be enclosed in the appropriate
   comment syntax for the file format. We also recommend that a
   file or class name and description of purpose be included on the
   same &quot;printed page&quot; as the copyright notice for easier
   identification within third-party archives.

Copyright 2019 The CryptoCorrosion Contributors

Licensed under the Apache License, Version 2.0 (the &quot;License&quot;);
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

   http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an &quot;AS IS&quot; BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
</pre>
            </li>
            <li class="license">
                <h3 id="Apache-2.0">Apache License 2.0</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://gitlab.com/CreepySkeleton/proc-macro-error ">proc-macro-error-attr 1.0.4</a></li>
                </ul>
                <pre class="license-text">                              Apache License
                        Version 2.0, January 2004
                     http://www.apache.org/licenses/

TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION

1. Definitions.

   &quot;License&quot; shall mean the terms and conditions for use, reproduction,
   and distribution as defined by Sections 1 through 9 of this document.

   &quot;Licensor&quot; shall mean the copyright owner or entity authorized by
   the copyright owner that is granting the License.

   &quot;Legal Entity&quot; shall mean the union of the acting entity and all
   other entities that control, are controlled by, or are under common
   control with that entity. For the purposes of this definition,
   &quot;control&quot; means (i) the power, direct or indirect, to cause the
   direction or management of such entity, whether by contract or
   otherwise, or (ii) ownership of fifty percent (50%) or more of the
   outstanding shares, or (iii) beneficial ownership of such entity.

   &quot;You&quot; (or &quot;Your&quot;) shall mean an individual or Legal Entity
   exercising permissions granted by this License.

   &quot;Source&quot; form shall mean the preferred form for making modifications,
   including but not limited to software source code, documentation
   source, and configuration files.

   &quot;Object&quot; form shall mean any form resulting from mechanical
   transformation or translation of a Source form, including but
   not limited to compiled object code, generated documentation,
   and conversions to other media types.

   &quot;Work&quot; shall mean the work of authorship, whether in Source or
   Object form, made available under the License, as indicated by a
   copyright notice that is included in or attached to the work
   (an example is provided in the Appendix below).

   &quot;Derivative Works&quot; shall mean any work, whether in Source or Object
   form, that is based on (or derived from) the Work and for which the
   editorial revisions, annotations, elaborations, or other modifications
   represent, as a whole, an original work of authorship. For the purposes
   of this License, Derivative Works shall not include works that remain
   separable from, or merely link (or bind by name) to the interfaces of,
   the Work and Derivative Works thereof.

   &quot;Contribution&quot; shall mean any work of authorship, including
   the original version of the Work and any modifications or additions
   to that Work or Derivative Works thereof, that is intentionally
   submitted to Licensor for inclusion in the Work by the copyright owner
   or by an individual or Legal Entity authorized to submit on behalf of
   the copyright owner. For the purposes of this definition, &quot;submitted&quot;
   means any form of electronic, verbal, or written communication sent
   to the Licensor or its representatives, including but not limited to
   communication on electronic mailing lists, source code control systems,
   and issue tracking systems that are managed by, or on behalf of, the
   Licensor for the purpose of discussing and improving the Work, but
   excluding communication that is conspicuously marked or otherwise
   designated in writing by the copyright owner as &quot;Not a Contribution.&quot;

   &quot;Contributor&quot; shall mean Licensor and any individual or Legal Entity
   on behalf of whom a Contribution has been received by Licensor and
   subsequently incorporated within the Work.

2. Grant of Copyright License. Subject to the terms and conditions of
   this License, each Contributor hereby grants to You a perpetual,
   worldwide, non-exclusive, no-charge, royalty-free, irrevocable
   copyright license to reproduce, prepare Derivative Works of,
   publicly display, publicly perform, sublicense, and distribute the
   Work and such Derivative Works in Source or Object form.

3. Grant of Patent License. Subject to the terms and conditions of
   this License, each Contributor hereby grants to You a perpetual,
   worldwide, non-exclusive, no-charge, royalty-free, irrevocable
   (except as stated in this section) patent license to make, have made,
   use, offer to sell, sell, import, and otherwise transfer the Work,
   where such license applies only to those patent claims licensable
   by such Contributor that are necessarily infringed by their
   Contribution(s) alone or by combination of their Contribution(s)
   with the Work to which such Contribution(s) was submitted. If You
   institute patent litigation against any entity (including a
   cross-claim or counterclaim in a lawsuit) alleging that the Work
   or a Contribution incorporated within the Work constitutes direct
   or contributory patent infringement, then any patent licenses
   granted to You under this License for that Work shall terminate
   as of the date such litigation is filed.

4. Redistribution. You may reproduce and distribute copies of the
   Work or Derivative Works thereof in any medium, with or without
   modifications, and in Source or Object form, provided that You
   meet the following conditions:

   (a) You must give any other recipients of the Work or
       Derivative Works a copy of this License; and

   (b) You must cause any modified files to carry prominent notices
       stating that You changed the files; and

   (c) You must retain, in the Source form of any Derivative Works
       that You distribute, all copyright, patent, trademark, and
       attribution notices from the Source form of the Work,
       excluding those notices that do not pertain to any part of
       the Derivative Works; and

   (d) If the Work includes a &quot;NOTICE&quot; text file as part of its
       distribution, then any Derivative Works that You distribute must
       include a readable copy of the attribution notices contained
       within such NOTICE file, excluding those notices that do not
       pertain to any part of the Derivative Works, in at least one
       of the following places: within a NOTICE text file distributed
       as part of the Derivative Works; within the Source form or
       documentation, if provided along with the Derivative Works; or,
       within a display generated by the Derivative Works, if and
       wherever such third-party notices normally appear. The contents
       of the NOTICE file are for informational purposes only and
       do not modify the License. You may add Your own attribution
       notices within Derivative Works that You distribute, alongside
       or as an addendum to the NOTICE text from the Work, provided
       that such additional attribution notices cannot be construed
       as modifying the License.

   You may add Your own copyright statement to Your modifications and
   may provide additional or different license terms and conditions
   for use, reproduction, or distribution of Your modifications, or
   for any such Derivative Works as a whole, provided Your use,
   reproduction, and distribution of the Work otherwise complies with
   the conditions stated in this License.

5. Submission of Contributions. Unless You explicitly state otherwise,
   any Contribution intentionally submitted for inclusion in the Work
   by You to the Licensor shall be under the terms and conditions of
   this License, without any additional terms or conditions.
   Notwithstanding the above, nothing herein shall supersede or modify
   the terms of any separate license agreement you may have executed
   with Licensor regarding such Contributions.

6. Trademarks. This License does not grant permission to use the trade
   names, trademarks, service marks, or product names of the Licensor,
   except as required for reasonable and customary use in describing the
   origin of the Work and reproducing the content of the NOTICE file.

7. Disclaimer of Warranty. Unless required by applicable law or
   agreed to in writing, Licensor provides the Work (and each
   Contributor provides its Contributions) on an &quot;AS IS&quot; BASIS,
   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
   implied, including, without limitation, any warranties or conditions
   of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
   PARTICULAR PURPOSE. You are solely responsible for determining the
   appropriateness of using or redistributing the Work and assume any
   risks associated with Your exercise of permissions under this License.

8. Limitation of Liability. In no event and under no legal theory,
   whether in tort (including negligence), contract, or otherwise,
   unless required by applicable law (such as deliberate and grossly
   negligent acts) or agreed to in writing, shall any Contributor be
   liable to You for damages, including any direct, indirect, special,
   incidental, or consequential damages of any character arising as a
   result of this License or out of the use or inability to use the
   Work (including but not limited to damages for loss of goodwill,
   work stoppage, computer failure or malfunction, or any and all
   other commercial damages or losses), even if such Contributor
   has been advised of the possibility of such damages.

9. Accepting Warranty or Additional Liability. While redistributing
   the Work or Derivative Works thereof, You may choose to offer,
   and charge a fee for, acceptance of support, warranty, indemnity,
   or other liability obligations and/or rights consistent with this
   License. However, in accepting such obligations, You may act only
   on Your own behalf and on Your sole responsibility, not on behalf
   of any other Contributor, and only if You agree to indemnify,
   defend, and hold each Contributor harmless for any liability
   incurred by, or claims asserted against, such Contributor by reason
   of your accepting any such warranty or additional liability.

END OF TERMS AND CONDITIONS

APPENDIX: How to apply the Apache License to your work.

   To apply the Apache License to your work, attach the following
   boilerplate notice, with the fields enclosed by brackets &quot;[]&quot;
   replaced with your own identifying information. (Don&#x27;t include
   the brackets!)  The text should be enclosed in the appropriate
   comment syntax for the file format. We also recommend that a
   file or class name and description of purpose be included on the
   same &quot;printed page&quot; as the copyright notice for easier
   identification within third-party archives.

Copyright 2019-2020 CreepySkeleton &lt;creepy-skeleton@yandex.ru&gt;

Licensed under the Apache License, Version 2.0 (the &quot;License&quot;);
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

    http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an &quot;AS IS&quot; BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
</pre>
            </li>
            <li class="license">
                <h3 id="Apache-2.0">Apache License 2.0</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/strawlab/iana-time-zone ">iana-time-zone-haiku 0.1.2</a></li>
                    <li><a href=" https://github.com/strawlab/iana-time-zone ">iana-time-zone 0.1.61</a></li>
                </ul>
                <pre class="license-text">                              Apache License
                        Version 2.0, January 2004
                     http://www.apache.org/licenses/

TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION

1. Definitions.

   &quot;License&quot; shall mean the terms and conditions for use, reproduction,
   and distribution as defined by Sections 1 through 9 of this document.

   &quot;Licensor&quot; shall mean the copyright owner or entity authorized by
   the copyright owner that is granting the License.

   &quot;Legal Entity&quot; shall mean the union of the acting entity and all
   other entities that control, are controlled by, or are under common
   control with that entity. For the purposes of this definition,
   &quot;control&quot; means (i) the power, direct or indirect, to cause the
   direction or management of such entity, whether by contract or
   otherwise, or (ii) ownership of fifty percent (50%) or more of the
   outstanding shares, or (iii) beneficial ownership of such entity.

   &quot;You&quot; (or &quot;Your&quot;) shall mean an individual or Legal Entity
   exercising permissions granted by this License.

   &quot;Source&quot; form shall mean the preferred form for making modifications,
   including but not limited to software source code, documentation
   source, and configuration files.

   &quot;Object&quot; form shall mean any form resulting from mechanical
   transformation or translation of a Source form, including but
   not limited to compiled object code, generated documentation,
   and conversions to other media types.

   &quot;Work&quot; shall mean the work of authorship, whether in Source or
   Object form, made available under the License, as indicated by a
   copyright notice that is included in or attached to the work
   (an example is provided in the Appendix below).

   &quot;Derivative Works&quot; shall mean any work, whether in Source or Object
   form, that is based on (or derived from) the Work and for which the
   editorial revisions, annotations, elaborations, or other modifications
   represent, as a whole, an original work of authorship. For the purposes
   of this License, Derivative Works shall not include works that remain
   separable from, or merely link (or bind by name) to the interfaces of,
   the Work and Derivative Works thereof.

   &quot;Contribution&quot; shall mean any work of authorship, including
   the original version of the Work and any modifications or additions
   to that Work or Derivative Works thereof, that is intentionally
   submitted to Licensor for inclusion in the Work by the copyright owner
   or by an individual or Legal Entity authorized to submit on behalf of
   the copyright owner. For the purposes of this definition, &quot;submitted&quot;
   means any form of electronic, verbal, or written communication sent
   to the Licensor or its representatives, including but not limited to
   communication on electronic mailing lists, source code control systems,
   and issue tracking systems that are managed by, or on behalf of, the
   Licensor for the purpose of discussing and improving the Work, but
   excluding communication that is conspicuously marked or otherwise
   designated in writing by the copyright owner as &quot;Not a Contribution.&quot;

   &quot;Contributor&quot; shall mean Licensor and any individual or Legal Entity
   on behalf of whom a Contribution has been received by Licensor and
   subsequently incorporated within the Work.

2. Grant of Copyright License. Subject to the terms and conditions of
   this License, each Contributor hereby grants to You a perpetual,
   worldwide, non-exclusive, no-charge, royalty-free, irrevocable
   copyright license to reproduce, prepare Derivative Works of,
   publicly display, publicly perform, sublicense, and distribute the
   Work and such Derivative Works in Source or Object form.

3. Grant of Patent License. Subject to the terms and conditions of
   this License, each Contributor hereby grants to You a perpetual,
   worldwide, non-exclusive, no-charge, royalty-free, irrevocable
   (except as stated in this section) patent license to make, have made,
   use, offer to sell, sell, import, and otherwise transfer the Work,
   where such license applies only to those patent claims licensable
   by such Contributor that are necessarily infringed by their
   Contribution(s) alone or by combination of their Contribution(s)
   with the Work to which such Contribution(s) was submitted. If You
   institute patent litigation against any entity (including a
   cross-claim or counterclaim in a lawsuit) alleging that the Work
   or a Contribution incorporated within the Work constitutes direct
   or contributory patent infringement, then any patent licenses
   granted to You under this License for that Work shall terminate
   as of the date such litigation is filed.

4. Redistribution. You may reproduce and distribute copies of the
   Work or Derivative Works thereof in any medium, with or without
   modifications, and in Source or Object form, provided that You
   meet the following conditions:

   (a) You must give any other recipients of the Work or
       Derivative Works a copy of this License; and

   (b) You must cause any modified files to carry prominent notices
       stating that You changed the files; and

   (c) You must retain, in the Source form of any Derivative Works
       that You distribute, all copyright, patent, trademark, and
       attribution notices from the Source form of the Work,
       excluding those notices that do not pertain to any part of
       the Derivative Works; and

   (d) If the Work includes a &quot;NOTICE&quot; text file as part of its
       distribution, then any Derivative Works that You distribute must
       include a readable copy of the attribution notices contained
       within such NOTICE file, excluding those notices that do not
       pertain to any part of the Derivative Works, in at least one
       of the following places: within a NOTICE text file distributed
       as part of the Derivative Works; within the Source form or
       documentation, if provided along with the Derivative Works; or,
       within a display generated by the Derivative Works, if and
       wherever such third-party notices normally appear. The contents
       of the NOTICE file are for informational purposes only and
       do not modify the License. You may add Your own attribution
       notices within Derivative Works that You distribute, alongside
       or as an addendum to the NOTICE text from the Work, provided
       that such additional attribution notices cannot be construed
       as modifying the License.

   You may add Your own copyright statement to Your modifications and
   may provide additional or different license terms and conditions
   for use, reproduction, or distribution of Your modifications, or
   for any such Derivative Works as a whole, provided Your use,
   reproduction, and distribution of the Work otherwise complies with
   the conditions stated in this License.

5. Submission of Contributions. Unless You explicitly state otherwise,
   any Contribution intentionally submitted for inclusion in the Work
   by You to the Licensor shall be under the terms and conditions of
   this License, without any additional terms or conditions.
   Notwithstanding the above, nothing herein shall supersede or modify
   the terms of any separate license agreement you may have executed
   with Licensor regarding such Contributions.

6. Trademarks. This License does not grant permission to use the trade
   names, trademarks, service marks, or product names of the Licensor,
   except as required for reasonable and customary use in describing the
   origin of the Work and reproducing the content of the NOTICE file.

7. Disclaimer of Warranty. Unless required by applicable law or
   agreed to in writing, Licensor provides the Work (and each
   Contributor provides its Contributions) on an &quot;AS IS&quot; BASIS,
   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
   implied, including, without limitation, any warranties or conditions
   of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
   PARTICULAR PURPOSE. You are solely responsible for determining the
   appropriateness of using or redistributing the Work and assume any
   risks associated with Your exercise of permissions under this License.

8. Limitation of Liability. In no event and under no legal theory,
   whether in tort (including negligence), contract, or otherwise,
   unless required by applicable law (such as deliberate and grossly
   negligent acts) or agreed to in writing, shall any Contributor be
   liable to You for damages, including any direct, indirect, special,
   incidental, or consequential damages of any character arising as a
   result of this License or out of the use or inability to use the
   Work (including but not limited to damages for loss of goodwill,
   work stoppage, computer failure or malfunction, or any and all
   other commercial damages or losses), even if such Contributor
   has been advised of the possibility of such damages.

9. Accepting Warranty or Additional Liability. While redistributing
   the Work or Derivative Works thereof, You may choose to offer,
   and charge a fee for, acceptance of support, warranty, indemnity,
   or other liability obligations and/or rights consistent with this
   License. However, in accepting such obligations, You may act only
   on Your own behalf and on Your sole responsibility, not on behalf
   of any other Contributor, and only if You agree to indemnify,
   defend, and hold each Contributor harmless for any liability
   incurred by, or claims asserted against, such Contributor by reason
   of your accepting any such warranty or additional liability.

END OF TERMS AND CONDITIONS

APPENDIX: How to apply the Apache License to your work.

   To apply the Apache License to your work, attach the following
   boilerplate notice, with the fields enclosed by brackets &quot;[]&quot;
   replaced with your own identifying information. (Don&#x27;t include
   the brackets!)  The text should be enclosed in the appropriate
   comment syntax for the file format. We also recommend that a
   file or class name and description of purpose be included on the
   same &quot;printed page&quot; as the copyright notice for easier
   identification within third-party archives.

Copyright 2020 Andrew Straw

Licensed under the Apache License, Version 2.0 (the &quot;License&quot;);
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

	http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an &quot;AS IS&quot; BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
</pre>
            </li>
            <li class="license">
                <h3 id="Apache-2.0">Apache License 2.0</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/RazrFalcon/memmap2-rs ">memmap2 0.9.5</a></li>
                </ul>
                <pre class="license-text">                              Apache License
                        Version 2.0, January 2004
                     http://www.apache.org/licenses/

TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION

1. Definitions.

   &quot;License&quot; shall mean the terms and conditions for use, reproduction,
   and distribution as defined by Sections 1 through 9 of this document.

   &quot;Licensor&quot; shall mean the copyright owner or entity authorized by
   the copyright owner that is granting the License.

   &quot;Legal Entity&quot; shall mean the union of the acting entity and all
   other entities that control, are controlled by, or are under common
   control with that entity. For the purposes of this definition,
   &quot;control&quot; means (i) the power, direct or indirect, to cause the
   direction or management of such entity, whether by contract or
   otherwise, or (ii) ownership of fifty percent (50%) or more of the
   outstanding shares, or (iii) beneficial ownership of such entity.

   &quot;You&quot; (or &quot;Your&quot;) shall mean an individual or Legal Entity
   exercising permissions granted by this License.

   &quot;Source&quot; form shall mean the preferred form for making modifications,
   including but not limited to software source code, documentation
   source, and configuration files.

   &quot;Object&quot; form shall mean any form resulting from mechanical
   transformation or translation of a Source form, including but
   not limited to compiled object code, generated documentation,
   and conversions to other media types.

   &quot;Work&quot; shall mean the work of authorship, whether in Source or
   Object form, made available under the License, as indicated by a
   copyright notice that is included in or attached to the work
   (an example is provided in the Appendix below).

   &quot;Derivative Works&quot; shall mean any work, whether in Source or Object
   form, that is based on (or derived from) the Work and for which the
   editorial revisions, annotations, elaborations, or other modifications
   represent, as a whole, an original work of authorship. For the purposes
   of this License, Derivative Works shall not include works that remain
   separable from, or merely link (or bind by name) to the interfaces of,
   the Work and Derivative Works thereof.

   &quot;Contribution&quot; shall mean any work of authorship, including
   the original version of the Work and any modifications or additions
   to that Work or Derivative Works thereof, that is intentionally
   submitted to Licensor for inclusion in the Work by the copyright owner
   or by an individual or Legal Entity authorized to submit on behalf of
   the copyright owner. For the purposes of this definition, &quot;submitted&quot;
   means any form of electronic, verbal, or written communication sent
   to the Licensor or its representatives, including but not limited to
   communication on electronic mailing lists, source code control systems,
   and issue tracking systems that are managed by, or on behalf of, the
   Licensor for the purpose of discussing and improving the Work, but
   excluding communication that is conspicuously marked or otherwise
   designated in writing by the copyright owner as &quot;Not a Contribution.&quot;

   &quot;Contributor&quot; shall mean Licensor and any individual or Legal Entity
   on behalf of whom a Contribution has been received by Licensor and
   subsequently incorporated within the Work.

2. Grant of Copyright License. Subject to the terms and conditions of
   this License, each Contributor hereby grants to You a perpetual,
   worldwide, non-exclusive, no-charge, royalty-free, irrevocable
   copyright license to reproduce, prepare Derivative Works of,
   publicly display, publicly perform, sublicense, and distribute the
   Work and such Derivative Works in Source or Object form.

3. Grant of Patent License. Subject to the terms and conditions of
   this License, each Contributor hereby grants to You a perpetual,
   worldwide, non-exclusive, no-charge, royalty-free, irrevocable
   (except as stated in this section) patent license to make, have made,
   use, offer to sell, sell, import, and otherwise transfer the Work,
   where such license applies only to those patent claims licensable
   by such Contributor that are necessarily infringed by their
   Contribution(s) alone or by combination of their Contribution(s)
   with the Work to which such Contribution(s) was submitted. If You
   institute patent litigation against any entity (including a
   cross-claim or counterclaim in a lawsuit) alleging that the Work
   or a Contribution incorporated within the Work constitutes direct
   or contributory patent infringement, then any patent licenses
   granted to You under this License for that Work shall terminate
   as of the date such litigation is filed.

4. Redistribution. You may reproduce and distribute copies of the
   Work or Derivative Works thereof in any medium, with or without
   modifications, and in Source or Object form, provided that You
   meet the following conditions:

   (a) You must give any other recipients of the Work or
       Derivative Works a copy of this License; and

   (b) You must cause any modified files to carry prominent notices
       stating that You changed the files; and

   (c) You must retain, in the Source form of any Derivative Works
       that You distribute, all copyright, patent, trademark, and
       attribution notices from the Source form of the Work,
       excluding those notices that do not pertain to any part of
       the Derivative Works; and

   (d) If the Work includes a &quot;NOTICE&quot; text file as part of its
       distribution, then any Derivative Works that You distribute must
       include a readable copy of the attribution notices contained
       within such NOTICE file, excluding those notices that do not
       pertain to any part of the Derivative Works, in at least one
       of the following places: within a NOTICE text file distributed
       as part of the Derivative Works; within the Source form or
       documentation, if provided along with the Derivative Works; or,
       within a display generated by the Derivative Works, if and
       wherever such third-party notices normally appear. The contents
       of the NOTICE file are for informational purposes only and
       do not modify the License. You may add Your own attribution
       notices within Derivative Works that You distribute, alongside
       or as an addendum to the NOTICE text from the Work, provided
       that such additional attribution notices cannot be construed
       as modifying the License.

   You may add Your own copyright statement to Your modifications and
   may provide additional or different license terms and conditions
   for use, reproduction, or distribution of Your modifications, or
   for any such Derivative Works as a whole, provided Your use,
   reproduction, and distribution of the Work otherwise complies with
   the conditions stated in this License.

5. Submission of Contributions. Unless You explicitly state otherwise,
   any Contribution intentionally submitted for inclusion in the Work
   by You to the Licensor shall be under the terms and conditions of
   this License, without any additional terms or conditions.
   Notwithstanding the above, nothing herein shall supersede or modify
   the terms of any separate license agreement you may have executed
   with Licensor regarding such Contributions.

6. Trademarks. This License does not grant permission to use the trade
   names, trademarks, service marks, or product names of the Licensor,
   except as required for reasonable and customary use in describing the
   origin of the Work and reproducing the content of the NOTICE file.

7. Disclaimer of Warranty. Unless required by applicable law or
   agreed to in writing, Licensor provides the Work (and each
   Contributor provides its Contributions) on an &quot;AS IS&quot; BASIS,
   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
   implied, including, without limitation, any warranties or conditions
   of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
   PARTICULAR PURPOSE. You are solely responsible for determining the
   appropriateness of using or redistributing the Work and assume any
   risks associated with Your exercise of permissions under this License.

8. Limitation of Liability. In no event and under no legal theory,
   whether in tort (including negligence), contract, or otherwise,
   unless required by applicable law (such as deliberate and grossly
   negligent acts) or agreed to in writing, shall any Contributor be
   liable to You for damages, including any direct, indirect, special,
   incidental, or consequential damages of any character arising as a
   result of this License or out of the use or inability to use the
   Work (including but not limited to damages for loss of goodwill,
   work stoppage, computer failure or malfunction, or any and all
   other commercial damages or losses), even if such Contributor
   has been advised of the possibility of such damages.

9. Accepting Warranty or Additional Liability. While redistributing
   the Work or Derivative Works thereof, You may choose to offer,
   and charge a fee for, acceptance of support, warranty, indemnity,
   or other liability obligations and/or rights consistent with this
   License. However, in accepting such obligations, You may act only
   on Your own behalf and on Your sole responsibility, not on behalf
   of any other Contributor, and only if You agree to indemnify,
   defend, and hold each Contributor harmless for any liability
   incurred by, or claims asserted against, such Contributor by reason
   of your accepting any such warranty or additional liability.

END OF TERMS AND CONDITIONS

APPENDIX: How to apply the Apache License to your work.

   To apply the Apache License to your work, attach the following
   boilerplate notice, with the fields enclosed by brackets &quot;[]&quot;
   replaced with your own identifying information. (Don&#x27;t include
   the brackets!)  The text should be enclosed in the appropriate
   comment syntax for the file format. We also recommend that a
   file or class name and description of purpose be included on the
   same &quot;printed page&quot; as the copyright notice for easier
   identification within third-party archives.

Copyright [2015] [Dan Burkert]

Licensed under the Apache License, Version 2.0 (the &quot;License&quot;);
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

	http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an &quot;AS IS&quot; BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
</pre>
            </li>
            <li class="license">
                <h3 id="Apache-2.0">Apache License 2.0</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/gimli-rs/addr2line ">addr2line 0.24.2</a></li>
                    <li><a href=" https://github.com/tkaitchuck/ahash ">ahash 0.8.11</a></li>
                    <li><a href=" https://github.com/vorner/arc-swap ">arc-swap 1.7.1</a></li>
                    <li><a href=" https://github.com/bluss/arrayvec ">arrayvec 0.5.2</a></li>
                    <li><a href=" https://github.com/smol-rs/async-channel ">async-channel 1.9.0</a></li>
                    <li><a href=" https://github.com/Nullus157/async-compression ">async-compression 0.4.13</a></li>
                    <li><a href=" https://github.com/cuviper/autocfg ">autocfg 1.4.0</a></li>
                    <li><a href=" https://github.com/rust-lang/backtrace-rs ">backtrace 0.3.74</a></li>
                    <li><a href=" https://github.com/marshallpierce/rust-base64 ">base64 0.13.1</a></li>
                    <li><a href=" https://github.com/marshallpierce/rust-base64 ">base64 0.20.0</a></li>
                    <li><a href=" https://github.com/marshallpierce/rust-base64 ">base64 0.21.7</a></li>
                    <li><a href=" https://github.com/marshallpierce/rust-base64 ">base64 0.22.1</a></li>
                    <li><a href=" https://github.com/bitflags/bitflags ">bitflags 1.3.2</a></li>
                    <li><a href=" https://github.com/bitflags/bitflags ">bitflags 2.6.0</a></li>
                    <li><a href=" https://github.com/Nullus157/bs58-rs ">bs58 0.5.1</a></li>
                    <li><a href=" https://github.com/fitzgen/bumpalo ">bumpalo 3.16.0</a></li>
                    <li><a href=" https://github.com/vorner/bytes-utils ">bytes-utils 0.1.4</a></li>
                    <li><a href=" https://github.com/alexcrichton/bzip2-rs ">bzip2-sys 0.1.11+1.0.8</a></li>
                    <li><a href=" https://github.com/alexcrichton/bzip2-rs ">bzip2 0.4.4</a></li>
                    <li><a href=" https://github.com/japaric/cast.rs ">cast 0.3.0</a></li>
                    <li><a href=" https://github.com/Nullus157/cbor-diag-rs ">cbor-diag 0.1.12</a></li>
                    <li><a href=" https://github.com/rust-lang/cc-rs ">cc 1.1.28</a></li>
                    <li><a href=" https://github.com/alexcrichton/cfg-if ">cfg-if 1.0.0</a></li>
                    <li><a href=" https://github.com/smol-rs/concurrent-queue ">concurrent-queue 2.5.0</a></li>
                    <li><a href=" https://github.com/servo/core-foundation-rs ">core-foundation-sys 0.8.7</a></li>
                    <li><a href=" https://github.com/servo/core-foundation-rs ">core-foundation 0.9.4</a></li>
                    <li><a href=" https://github.com/bheisler/criterion.rs ">criterion-plot 0.5.0</a></li>
                    <li><a href=" https://github.com/bheisler/criterion.rs ">criterion 0.5.1</a></li>
                    <li><a href=" https://github.com/crossbeam-rs/crossbeam ">crossbeam-channel 0.5.13</a></li>
                    <li><a href=" https://github.com/crossbeam-rs/crossbeam ">crossbeam-deque 0.8.5</a></li>
                    <li><a href=" https://github.com/crossbeam-rs/crossbeam ">crossbeam-epoch 0.9.18</a></li>
                    <li><a href=" https://github.com/crossbeam-rs/crossbeam ">crossbeam-utils 0.8.20</a></li>
                    <li><a href=" https://github.com/rayon-rs/either ">either 1.13.0</a></li>
                    <li><a href=" https://github.com/BurntSushi/encoding_rs_io ">encoding_rs_io 0.1.7</a></li>
                    <li><a href=" https://github.com/cuviper/equivalent ">equivalent 1.0.1</a></li>
                    <li><a href=" https://github.com/lambda-fairy/rust-errno ">errno 0.3.9</a></li>
                    <li><a href=" https://github.com/smol-rs/event-listener ">event-listener 2.5.3</a></li>
                    <li><a href=" https://github.com/smol-rs/fastrand ">fastrand 1.9.0</a></li>
                    <li><a href=" https://github.com/smol-rs/fastrand ">fastrand 2.1.1</a></li>
                    <li><a href=" https://github.com/alexcrichton/filetime ">filetime 0.2.25</a></li>
                    <li><a href=" https://github.com/petgraph/fixedbitset ">fixedbitset 0.4.2</a></li>
                    <li><a href=" https://github.com/rust-lang/flate2-rs ">flate2 1.0.34</a></li>
                    <li><a href=" https://github.com/servo/rust-fnv ">fnv 1.0.7</a></li>
                    <li><a href=" https://github.com/servo/rust-url ">form_urlencoded 1.2.1</a></li>
                    <li><a href=" https://github.com/al8n/fs4-rs ">fs4 0.8.4</a></li>
                    <li><a href=" https://github.com/smol-rs/futures-lite ">futures-lite 1.13.0</a></li>
                    <li><a href=" https://github.com/async-rs/futures-timer ">futures-timer 3.0.3</a></li>
                    <li><a href=" https://github.com/gimli-rs/gimli ">gimli 0.31.1</a></li>
                    <li><a href=" https://github.com/rust-lang/glob ">glob 0.3.1</a></li>
                    <li><a href=" https://github.com/zkcrypto/group ">group 0.12.1</a></li>
                    <li><a href=" https://github.com/rust-lang/hashbrown ">hashbrown 0.12.3</a></li>
                    <li><a href=" https://github.com/rust-lang/hashbrown ">hashbrown 0.14.5</a></li>
                    <li><a href=" https://github.com/rust-lang/hashbrown ">hashbrown 0.15.0</a></li>
                    <li><a href=" https://github.com/withoutboats/heck ">heck 0.4.1</a></li>
                    <li><a href=" https://github.com/hermit-os/hermit-rs ">hermit-abi 0.3.9</a></li>
                    <li><a href=" https://github.com/hermit-os/hermit-rs ">hermit-abi 0.4.0</a></li>
                    <li><a href=" https://github.com/seanmonstar/httparse ">httparse 1.9.5</a></li>
                    <li><a href=" https://github.com/rustls/hyper-rustls ">hyper-rustls 0.24.2</a></li>
                    <li><a href=" https://github.com/hjr3/hyper-timeout ">hyper-timeout 0.4.1</a></li>
                    <li><a href=" https://github.com/servo/rust-url/ ">idna 0.5.0</a></li>
                    <li><a href=" https://github.com/bluss/indexmap ">indexmap 1.9.3</a></li>
                    <li><a href=" https://github.com/bluss/indexmap ">indexmap 2.1.0</a></li>
                    <li><a href=" https://github.com/rust-itertools/itertools ">itertools 0.10.5</a></li>
                    <li><a href=" https://github.com/rust-itertools/itertools ">itertools 0.12.1</a></li>
                    <li><a href=" https://github.com/rust-itertools/itertools ">itertools 0.13.0</a></li>
                    <li><a href=" https://github.com/rust-lang/jobserver-rs ">jobserver 0.1.32</a></li>
                    <li><a href=" https://github.com/rustwasm/wasm-bindgen/tree/master/crates/js-sys ">js-sys 0.3.71</a></li>
                    <li><a href=" https://github.com/rust-lang-nursery/lazy-static.rs ">lazy_static 1.5.0</a></li>
                    <li><a href=" https://github.com/rust-lang/libm ">libm 0.2.8</a></li>
                    <li><a href=" https://github.com/sunfishcode/linux-raw-sys ">linux-raw-sys 0.4.14</a></li>
                    <li><a href=" https://github.com/Amanieu/parking_lot ">lock_api 0.4.12</a></li>
                    <li><a href=" https://github.com/rust-lang/log ">log 0.4.22</a></li>
                    <li><a href=" https://github.com/gnzlbg/match_cfg ">match_cfg 0.1.0</a></li>
                    <li><a href=" https://github.com/hyperium/mime ">mime 0.3.17</a></li>
                    <li><a href=" https://github.com/asomers/mockall ">mockall 0.11.4</a></li>
                    <li><a href=" https://github.com/asomers/mockall ">mockall_derive 0.11.4</a></li>
                    <li><a href=" https://github.com/havarnov/multimap ">multimap 0.8.3</a></li>
                    <li><a href=" https://github.com/rust-num/num-bigint ">num-bigint 0.4.6</a></li>
                    <li><a href=" https://github.com/rust-num/num-integer ">num-integer 0.1.46</a></li>
                    <li><a href=" https://github.com/rust-num/num-rational ">num-rational 0.4.2</a></li>
                    <li><a href=" https://github.com/rust-num/num-traits ">num-traits 0.2.19</a></li>
                    <li><a href=" https://github.com/seanmonstar/num_cpus ">num_cpus 1.16.0</a></li>
                    <li><a href=" https://github.com/gimli-rs/object ">object 0.36.5</a></li>
                    <li><a href=" https://github.com/matklad/once_cell ">once_cell 1.20.2</a></li>
                    <li><a href=" https://github.com/alexcrichton/openssl-probe ">openssl-probe 0.1.5</a></li>
                    <li><a href=" https://github.com/smol-rs/parking ">parking 2.2.1</a></li>
                    <li><a href=" https://github.com/Amanieu/parking_lot ">parking_lot 0.12.3</a></li>
                    <li><a href=" https://github.com/Amanieu/parking_lot ">parking_lot_core 0.9.10</a></li>
                    <li><a href=" https://github.com/servo/rust-url/ ">percent-encoding 2.3.1</a></li>
                    <li><a href=" https://github.com/petgraph/petgraph ">petgraph 0.6.5</a></li>
                    <li><a href=" https://github.com/rust-lang/pkg-config-rs ">pkg-config 0.3.31</a></li>
                    <li><a href=" https://github.com/libpnet/libpnet ">pnet 0.33.0</a></li>
                    <li><a href=" https://github.com/libpnet/libpnet ">pnet_base 0.33.0</a></li>
                    <li><a href=" https://github.com/libpnet/libpnet ">pnet_datalink 0.33.0</a></li>
                    <li><a href=" https://github.com/libpnet/libpnet ">pnet_macros 0.33.0</a></li>
                    <li><a href=" https://github.com/libpnet/libpnet ">pnet_macros_support 0.33.0</a></li>
                    <li><a href=" https://github.com/libpnet/libpnet ">pnet_packet 0.33.0</a></li>
                    <li><a href=" https://github.com/libpnet/libpnet ">pnet_sys 0.33.0</a></li>
                    <li><a href=" https://github.com/libpnet/libpnet ">pnet_transport 0.33.0</a></li>
                    <li><a href=" https://github.com/proptest-rs/proptest ">proptest 1.5.0</a></li>
                    <li><a href=" https://github.com/tokio-rs/prost ">prost-build 0.11.9</a></li>
                    <li><a href=" https://github.com/tokio-rs/prost ">prost-derive 0.11.9</a></li>
                    <li><a href=" https://github.com/tokio-rs/prost ">prost-types 0.11.9</a></li>
                    <li><a href=" https://github.com/tokio-rs/prost ">prost 0.11.9</a></li>
                    <li><a href=" https://github.com/rayon-rs/rayon ">rayon-core 1.12.1</a></li>
                    <li><a href=" https://github.com/rayon-rs/rayon ">rayon 1.10.0</a></li>
                    <li><a href=" https://github.com/rust-lang/regex/tree/master/regex-automata ">regex-automata 0.4.8</a></li>
                    <li><a href=" https://github.com/rust-lang/regex/tree/master/regex-lite ">regex-lite 0.1.6</a></li>
                    <li><a href=" https://github.com/rust-lang/regex ">regex-syntax 0.6.29</a></li>
                    <li><a href=" https://github.com/rust-lang/regex/tree/master/regex-syntax ">regex-syntax 0.8.5</a></li>
                    <li><a href=" https://github.com/rust-lang/regex ">regex 1.11.0</a></li>
                    <li><a href=" https://github.com/RazrFalcon/roxmltree ">roxmltree 0.14.1</a></li>
                    <li><a href=" https://github.com/rust-lang/rustc-demangle ">rustc-demangle 0.1.24</a></li>
                    <li><a href=" https://github.com/rust-lang-nursery/rustc-hash ">rustc-hash 1.1.0</a></li>
                    <li><a href=" https://github.com/djc/rustc-version-rs ">rustc_version 0.4.1</a></li>
                    <li><a href=" https://github.com/bytecodealliance/rustix ">rustix 0.38.37</a></li>
                    <li><a href=" https://github.com/ctz/rustls-native-certs ">rustls-native-certs 0.6.3</a></li>
                    <li><a href=" https://github.com/rustls/pemfile ">rustls-pemfile 1.0.4</a></li>
                    <li><a href=" https://github.com/rustls/rustls ">rustls 0.21.12</a></li>
                    <li><a href=" https://github.com/altsysrq/rusty-fork ">rusty-fork 0.3.0</a></li>
                    <li><a href=" https://github.com/alexcrichton/scoped-tls ">scoped-tls 1.0.1</a></li>
                    <li><a href=" https://github.com/bluss/scopeguard ">scopeguard 1.2.0</a></li>
                    <li><a href=" https://github.com/rustls/sct.rs ">sct 0.7.1</a></li>
                    <li><a href=" https://github.com/kornelski/rust-security-framework ">security-framework-sys 2.12.0</a></li>
                    <li><a href=" https://github.com/kornelski/rust-security-framework ">security-framework 2.11.1</a></li>
                    <li><a href=" https://github.com/jonasbb/serde_with/ ">serde_with 3.11.0</a></li>
                    <li><a href=" https://github.com/jonasbb/serde_with/ ">serde_with_macros 3.11.0</a></li>
                    <li><a href=" https://github.com/vorner/signal-hook ">signal-hook-registry 1.4.2</a></li>
                    <li><a href=" https://github.com/servo/rust-smallvec ">smallvec 1.13.2</a></li>
                    <li><a href=" https://github.com/rust-lang/socket2 ">socket2 0.5.7</a></li>
                    <li><a href=" https://github.com/storyyeller/stable_deref_trait ">stable_deref_trait 1.2.0</a></li>
                    <li><a href=" https://github.com/dtolnay/syn ">syn 1.0.109</a></li>
                    <li><a href=" https://github.com/alexcrichton/tar-rs ">tar 0.4.42</a></li>
                    <li><a href=" https://github.com/Stebalien/tempfile ">tempfile 3.13.0</a></li>
                    <li><a href=" https://github.com/tov/thousands-rs ">thousands 0.2.0</a></li>
                    <li><a href=" https://github.com/Amanieu/thread_local-rs ">thread_local 1.1.8</a></li>
                    <li><a href=" https://github.com/bheisler/TinyTemplate ">tinytemplate 1.2.1</a></li>
                    <li><a href=" https://github.com/snapview/tungstenite-rs ">tungstenite 0.21.0</a></li>
                    <li><a href=" https://github.com/seanmonstar/unicase ">unicase 2.7.0</a></li>
                    <li><a href=" https://github.com/servo/unicode-bidi ">unicode-bidi 0.3.17</a></li>
                    <li><a href=" https://github.com/unicode-rs/unicode-normalization ">unicode-normalization 0.1.24</a></li>
                    <li><a href=" https://github.com/unicode-rs/unicode-width ">unicode-width 0.1.14</a></li>
                    <li><a href=" https://github.com/servo/rust-url ">url 2.5.2</a></li>
                    <li><a href=" https://github.com/uuid-rs/uuid ">uuid 1.10.0</a></li>
                    <li><a href=" https://github.com/SergioBenitez/version_check ">version_check 0.9.5</a></li>
                    <li><a href=" https://github.com/alexcrichton/wait-timeout ">wait-timeout 0.2.0</a></li>
                    <li><a href=" https://github.com/smol-rs/waker-fn ">waker-fn 1.2.0</a></li>
                    <li><a href=" https://github.com/bytecodealliance/wasi ">wasi 0.11.0+wasi-snapshot-preview1</a></li>
                    <li><a href=" https://github.com/bytecodealliance/wasi ">wasi 0.9.0+wasi-snapshot-preview1</a></li>
                    <li><a href=" https://github.com/wasix-org/wasix-abi-rust ">wasix 0.12.21</a></li>
                    <li><a href=" https://github.com/rustwasm/wasm-bindgen/tree/master/crates/backend ">wasm-bindgen-backend 0.2.94</a></li>
                    <li><a href=" https://github.com/rustwasm/wasm-bindgen/tree/master/crates/futures ">wasm-bindgen-futures 0.4.44</a></li>
                    <li><a href=" https://github.com/rustwasm/wasm-bindgen/tree/master/crates/macro-support ">wasm-bindgen-macro-support 0.2.94</a></li>
                    <li><a href=" https://github.com/rustwasm/wasm-bindgen/tree/master/crates/macro ">wasm-bindgen-macro 0.2.94</a></li>
                    <li><a href=" https://github.com/rustwasm/wasm-bindgen/tree/master/crates/shared ">wasm-bindgen-shared 0.2.94</a></li>
                    <li><a href=" https://github.com/rustwasm/wasm-bindgen ">wasm-bindgen 0.2.94</a></li>
                    <li><a href=" https://github.com/rustwasm/wasm-bindgen/tree/master/crates/web-sys ">web-sys 0.3.71</a></li>
                    <li><a href=" https://github.com/LukeMathWalker/wiremock-rs ">wiremock 0.5.22</a></li>
                    <li><a href=" https://github.com/Stebalien/xattr ">xattr 1.3.1</a></li>
                    <li><a href=" https://github.com/RazrFalcon/xmlparser ">xmlparser 0.13.6</a></li>
                </ul>
                <pre class="license-text">                              Apache License
                        Version 2.0, January 2004
                     http://www.apache.org/licenses/

TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION

1. Definitions.

   &quot;License&quot; shall mean the terms and conditions for use, reproduction,
   and distribution as defined by Sections 1 through 9 of this document.

   &quot;Licensor&quot; shall mean the copyright owner or entity authorized by
   the copyright owner that is granting the License.

   &quot;Legal Entity&quot; shall mean the union of the acting entity and all
   other entities that control, are controlled by, or are under common
   control with that entity. For the purposes of this definition,
   &quot;control&quot; means (i) the power, direct or indirect, to cause the
   direction or management of such entity, whether by contract or
   otherwise, or (ii) ownership of fifty percent (50%) or more of the
   outstanding shares, or (iii) beneficial ownership of such entity.

   &quot;You&quot; (or &quot;Your&quot;) shall mean an individual or Legal Entity
   exercising permissions granted by this License.

   &quot;Source&quot; form shall mean the preferred form for making modifications,
   including but not limited to software source code, documentation
   source, and configuration files.

   &quot;Object&quot; form shall mean any form resulting from mechanical
   transformation or translation of a Source form, including but
   not limited to compiled object code, generated documentation,
   and conversions to other media types.

   &quot;Work&quot; shall mean the work of authorship, whether in Source or
   Object form, made available under the License, as indicated by a
   copyright notice that is included in or attached to the work
   (an example is provided in the Appendix below).

   &quot;Derivative Works&quot; shall mean any work, whether in Source or Object
   form, that is based on (or derived from) the Work and for which the
   editorial revisions, annotations, elaborations, or other modifications
   represent, as a whole, an original work of authorship. For the purposes
   of this License, Derivative Works shall not include works that remain
   separable from, or merely link (or bind by name) to the interfaces of,
   the Work and Derivative Works thereof.

   &quot;Contribution&quot; shall mean any work of authorship, including
   the original version of the Work and any modifications or additions
   to that Work or Derivative Works thereof, that is intentionally
   submitted to Licensor for inclusion in the Work by the copyright owner
   or by an individual or Legal Entity authorized to submit on behalf of
   the copyright owner. For the purposes of this definition, &quot;submitted&quot;
   means any form of electronic, verbal, or written communication sent
   to the Licensor or its representatives, including but not limited to
   communication on electronic mailing lists, source code control systems,
   and issue tracking systems that are managed by, or on behalf of, the
   Licensor for the purpose of discussing and improving the Work, but
   excluding communication that is conspicuously marked or otherwise
   designated in writing by the copyright owner as &quot;Not a Contribution.&quot;

   &quot;Contributor&quot; shall mean Licensor and any individual or Legal Entity
   on behalf of whom a Contribution has been received by Licensor and
   subsequently incorporated within the Work.

2. Grant of Copyright License. Subject to the terms and conditions of
   this License, each Contributor hereby grants to You a perpetual,
   worldwide, non-exclusive, no-charge, royalty-free, irrevocable
   copyright license to reproduce, prepare Derivative Works of,
   publicly display, publicly perform, sublicense, and distribute the
   Work and such Derivative Works in Source or Object form.

3. Grant of Patent License. Subject to the terms and conditions of
   this License, each Contributor hereby grants to You a perpetual,
   worldwide, non-exclusive, no-charge, royalty-free, irrevocable
   (except as stated in this section) patent license to make, have made,
   use, offer to sell, sell, import, and otherwise transfer the Work,
   where such license applies only to those patent claims licensable
   by such Contributor that are necessarily infringed by their
   Contribution(s) alone or by combination of their Contribution(s)
   with the Work to which such Contribution(s) was submitted. If You
   institute patent litigation against any entity (including a
   cross-claim or counterclaim in a lawsuit) alleging that the Work
   or a Contribution incorporated within the Work constitutes direct
   or contributory patent infringement, then any patent licenses
   granted to You under this License for that Work shall terminate
   as of the date such litigation is filed.

4. Redistribution. You may reproduce and distribute copies of the
   Work or Derivative Works thereof in any medium, with or without
   modifications, and in Source or Object form, provided that You
   meet the following conditions:

   (a) You must give any other recipients of the Work or
       Derivative Works a copy of this License; and

   (b) You must cause any modified files to carry prominent notices
       stating that You changed the files; and

   (c) You must retain, in the Source form of any Derivative Works
       that You distribute, all copyright, patent, trademark, and
       attribution notices from the Source form of the Work,
       excluding those notices that do not pertain to any part of
       the Derivative Works; and

   (d) If the Work includes a &quot;NOTICE&quot; text file as part of its
       distribution, then any Derivative Works that You distribute must
       include a readable copy of the attribution notices contained
       within such NOTICE file, excluding those notices that do not
       pertain to any part of the Derivative Works, in at least one
       of the following places: within a NOTICE text file distributed
       as part of the Derivative Works; within the Source form or
       documentation, if provided along with the Derivative Works; or,
       within a display generated by the Derivative Works, if and
       wherever such third-party notices normally appear. The contents
       of the NOTICE file are for informational purposes only and
       do not modify the License. You may add Your own attribution
       notices within Derivative Works that You distribute, alongside
       or as an addendum to the NOTICE text from the Work, provided
       that such additional attribution notices cannot be construed
       as modifying the License.

   You may add Your own copyright statement to Your modifications and
   may provide additional or different license terms and conditions
   for use, reproduction, or distribution of Your modifications, or
   for any such Derivative Works as a whole, provided Your use,
   reproduction, and distribution of the Work otherwise complies with
   the conditions stated in this License.

5. Submission of Contributions. Unless You explicitly state otherwise,
   any Contribution intentionally submitted for inclusion in the Work
   by You to the Licensor shall be under the terms and conditions of
   this License, without any additional terms or conditions.
   Notwithstanding the above, nothing herein shall supersede or modify
   the terms of any separate license agreement you may have executed
   with Licensor regarding such Contributions.

6. Trademarks. This License does not grant permission to use the trade
   names, trademarks, service marks, or product names of the Licensor,
   except as required for reasonable and customary use in describing the
   origin of the Work and reproducing the content of the NOTICE file.

7. Disclaimer of Warranty. Unless required by applicable law or
   agreed to in writing, Licensor provides the Work (and each
   Contributor provides its Contributions) on an &quot;AS IS&quot; BASIS,
   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
   implied, including, without limitation, any warranties or conditions
   of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
   PARTICULAR PURPOSE. You are solely responsible for determining the
   appropriateness of using or redistributing the Work and assume any
   risks associated with Your exercise of permissions under this License.

8. Limitation of Liability. In no event and under no legal theory,
   whether in tort (including negligence), contract, or otherwise,
   unless required by applicable law (such as deliberate and grossly
   negligent acts) or agreed to in writing, shall any Contributor be
   liable to You for damages, including any direct, indirect, special,
   incidental, or consequential damages of any character arising as a
   result of this License or out of the use or inability to use the
   Work (including but not limited to damages for loss of goodwill,
   work stoppage, computer failure or malfunction, or any and all
   other commercial damages or losses), even if such Contributor
   has been advised of the possibility of such damages.

9. Accepting Warranty or Additional Liability. While redistributing
   the Work or Derivative Works thereof, You may choose to offer,
   and charge a fee for, acceptance of support, warranty, indemnity,
   or other liability obligations and/or rights consistent with this
   License. However, in accepting such obligations, You may act only
   on Your own behalf and on Your sole responsibility, not on behalf
   of any other Contributor, and only if You agree to indemnify,
   defend, and hold each Contributor harmless for any liability
   incurred by, or claims asserted against, such Contributor by reason
   of your accepting any such warranty or additional liability.

END OF TERMS AND CONDITIONS

APPENDIX: How to apply the Apache License to your work.

   To apply the Apache License to your work, attach the following
   boilerplate notice, with the fields enclosed by brackets &quot;[]&quot;
   replaced with your own identifying information. (Don&#x27;t include
   the brackets!)  The text should be enclosed in the appropriate
   comment syntax for the file format. We also recommend that a
   file or class name and description of purpose be included on the
   same &quot;printed page&quot; as the copyright notice for easier
   identification within third-party archives.

Copyright [yyyy] [name of copyright owner]

Licensed under the Apache License, Version 2.0 (the &quot;License&quot;);
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

	http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an &quot;AS IS&quot; BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
</pre>
            </li>
            <li class="license">
                <h3 id="Apache-2.0">Apache License 2.0</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/zkcrypto/ff ">ff 0.12.1</a></li>
                </ul>
                <pre class="license-text">                              Apache License
                        Version 2.0, January 2004
                     http://www.apache.org/licenses/

TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION

1. Definitions.

   &quot;License&quot; shall mean the terms and conditions for use, reproduction,
   and distribution as defined by Sections 1 through 9 of this document.

   &quot;Licensor&quot; shall mean the copyright owner or entity authorized by
   the copyright owner that is granting the License.

   &quot;Legal Entity&quot; shall mean the union of the acting entity and all
   other entities that control, are controlled by, or are under common
   control with that entity. For the purposes of this definition,
   &quot;control&quot; means (i) the power, direct or indirect, to cause the
   direction or management of such entity, whether by contract or
   otherwise, or (ii) ownership of fifty percent (50%) or more of the
   outstanding shares, or (iii) beneficial ownership of such entity.

   &quot;You&quot; (or &quot;Your&quot;) shall mean an individual or Legal Entity
   exercising permissions granted by this License.

   &quot;Source&quot; form shall mean the preferred form for making modifications,
   including but not limited to software source code, documentation
   source, and configuration files.

   &quot;Object&quot; form shall mean any form resulting from mechanical
   transformation or translation of a Source form, including but
   not limited to compiled object code, generated documentation,
   and conversions to other media types.

   &quot;Work&quot; shall mean the work of authorship, whether in Source or
   Object form, made available under the License, as indicated by a
   copyright notice that is included in or attached to the work
   (an example is provided in the Appendix below).

   &quot;Derivative Works&quot; shall mean any work, whether in Source or Object
   form, that is based on (or derived from) the Work and for which the
   editorial revisions, annotations, elaborations, or other modifications
   represent, as a whole, an original work of authorship. For the purposes
   of this License, Derivative Works shall not include works that remain
   separable from, or merely link (or bind by name) to the interfaces of,
   the Work and Derivative Works thereof.

   &quot;Contribution&quot; shall mean any work of authorship, including
   the original version of the Work and any modifications or additions
   to that Work or Derivative Works thereof, that is intentionally
   submitted to Licensor for inclusion in the Work by the copyright owner
   or by an individual or Legal Entity authorized to submit on behalf of
   the copyright owner. For the purposes of this definition, &quot;submitted&quot;
   means any form of electronic, verbal, or written communication sent
   to the Licensor or its representatives, including but not limited to
   communication on electronic mailing lists, source code control systems,
   and issue tracking systems that are managed by, or on behalf of, the
   Licensor for the purpose of discussing and improving the Work, but
   excluding communication that is conspicuously marked or otherwise
   designated in writing by the copyright owner as &quot;Not a Contribution.&quot;

   &quot;Contributor&quot; shall mean Licensor and any individual or Legal Entity
   on behalf of whom a Contribution has been received by Licensor and
   subsequently incorporated within the Work.

2. Grant of Copyright License. Subject to the terms and conditions of
   this License, each Contributor hereby grants to You a perpetual,
   worldwide, non-exclusive, no-charge, royalty-free, irrevocable
   copyright license to reproduce, prepare Derivative Works of,
   publicly display, publicly perform, sublicense, and distribute the
   Work and such Derivative Works in Source or Object form.

3. Grant of Patent License. Subject to the terms and conditions of
   this License, each Contributor hereby grants to You a perpetual,
   worldwide, non-exclusive, no-charge, royalty-free, irrevocable
   (except as stated in this section) patent license to make, have made,
   use, offer to sell, sell, import, and otherwise transfer the Work,
   where such license applies only to those patent claims licensable
   by such Contributor that are necessarily infringed by their
   Contribution(s) alone or by combination of their Contribution(s)
   with the Work to which such Contribution(s) was submitted. If You
   institute patent litigation against any entity (including a
   cross-claim or counterclaim in a lawsuit) alleging that the Work
   or a Contribution incorporated within the Work constitutes direct
   or contributory patent infringement, then any patent licenses
   granted to You under this License for that Work shall terminate
   as of the date such litigation is filed.

4. Redistribution. You may reproduce and distribute copies of the
   Work or Derivative Works thereof in any medium, with or without
   modifications, and in Source or Object form, provided that You
   meet the following conditions:

   (a) You must give any other recipients of the Work or
       Derivative Works a copy of this License; and

   (b) You must cause any modified files to carry prominent notices
       stating that You changed the files; and

   (c) You must retain, in the Source form of any Derivative Works
       that You distribute, all copyright, patent, trademark, and
       attribution notices from the Source form of the Work,
       excluding those notices that do not pertain to any part of
       the Derivative Works; and

   (d) If the Work includes a &quot;NOTICE&quot; text file as part of its
       distribution, then any Derivative Works that You distribute must
       include a readable copy of the attribution notices contained
       within such NOTICE file, excluding those notices that do not
       pertain to any part of the Derivative Works, in at least one
       of the following places: within a NOTICE text file distributed
       as part of the Derivative Works; within the Source form or
       documentation, if provided along with the Derivative Works; or,
       within a display generated by the Derivative Works, if and
       wherever such third-party notices normally appear. The contents
       of the NOTICE file are for informational purposes only and
       do not modify the License. You may add Your own attribution
       notices within Derivative Works that You distribute, alongside
       or as an addendum to the NOTICE text from the Work, provided
       that such additional attribution notices cannot be construed
       as modifying the License.

   You may add Your own copyright statement to Your modifications and
   may provide additional or different license terms and conditions
   for use, reproduction, or distribution of Your modifications, or
   for any such Derivative Works as a whole, provided Your use,
   reproduction, and distribution of the Work otherwise complies with
   the conditions stated in this License.

5. Submission of Contributions. Unless You explicitly state otherwise,
   any Contribution intentionally submitted for inclusion in the Work
   by You to the Licensor shall be under the terms and conditions of
   this License, without any additional terms or conditions.
   Notwithstanding the above, nothing herein shall supersede or modify
   the terms of any separate license agreement you may have executed
   with Licensor regarding such Contributions.

6. Trademarks. This License does not grant permission to use the trade
   names, trademarks, service marks, or product names of the Licensor,
   except as required for reasonable and customary use in describing the
   origin of the Work and reproducing the content of the NOTICE file.

7. Disclaimer of Warranty. Unless required by applicable law or
   agreed to in writing, Licensor provides the Work (and each
   Contributor provides its Contributions) on an &quot;AS IS&quot; BASIS,
   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
   implied, including, without limitation, any warranties or conditions
   of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
   PARTICULAR PURPOSE. You are solely responsible for determining the
   appropriateness of using or redistributing the Work and assume any
   risks associated with Your exercise of permissions under this License.

8. Limitation of Liability. In no event and under no legal theory,
   whether in tort (including negligence), contract, or otherwise,
   unless required by applicable law (such as deliberate and grossly
   negligent acts) or agreed to in writing, shall any Contributor be
   liable to You for damages, including any direct, indirect, special,
   incidental, or consequential damages of any character arising as a
   result of this License or out of the use or inability to use the
   Work (including but not limited to damages for loss of goodwill,
   work stoppage, computer failure or malfunction, or any and all
   other commercial damages or losses), even if such Contributor
   has been advised of the possibility of such damages.

9. Accepting Warranty or Additional Liability. While redistributing
   the Work or Derivative Works thereof, You may choose to offer,
   and charge a fee for, acceptance of support, warranty, indemnity,
   or other liability obligations and/or rights consistent with this
   License. However, in accepting such obligations, You may act only
   on Your own behalf and on Your sole responsibility, not on behalf
   of any other Contributor, and only if You agree to indemnify,
   defend, and hold each Contributor harmless for any liability
   incurred by, or claims asserted against, such Contributor by reason
   of your accepting any such warranty or additional liability.

END OF TERMS AND CONDITIONS

APPENDIX: How to apply the Apache License to your work.

   To apply the Apache License to your work, attach the following
   boilerplate notice, with the fields enclosed by brackets &quot;[]&quot;
   replaced with your own identifying information. (Don&#x27;t include
   the brackets!)  The text should be enclosed in the appropriate
   comment syntax for the file format. We also recommend that a
   file or class name and description of purpose be included on the
   same &quot;printed page&quot; as the copyright notice for easier
   identification within third-party archives.

Copyright [yyyy] [name of copyright owner]

Licensed under the Apache License, Version 2.0 (the &quot;License&quot;);
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

	http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an &quot;AS IS&quot; BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.

</pre>
            </li>
            <li class="license">
                <h3 id="Apache-2.0">Apache License 2.0</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/contain-rs/bit-set ">bit-set 0.5.3</a></li>
                    <li><a href=" https://github.com/contain-rs/bit-vec ">bit-vec 0.6.3</a></li>
                    <li><a href=" https://github.com/marcianx/downcast-rs ">downcast-rs 1.2.1</a></li>
                    <li><a href=" https://github.com/contain-rs/linked-hash-map ">linked-hash-map 0.5.6</a></li>
                    <li><a href=" https://github.com/Alexhuszagh/minimal-lexical ">minimal-lexical 0.2.1</a></li>
                </ul>
                <pre class="license-text">                              Apache License
                        Version 2.0, January 2004
                     http://www.apache.org/licenses/

TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION

1. Definitions.

   &quot;License&quot; shall mean the terms and conditions for use, reproduction,
   and distribution as defined by Sections 1 through 9 of this document.

   &quot;Licensor&quot; shall mean the copyright owner or entity authorized by
   the copyright owner that is granting the License.

   &quot;Legal Entity&quot; shall mean the union of the acting entity and all
   other entities that control, are controlled by, or are under common
   control with that entity. For the purposes of this definition,
   &quot;control&quot; means (i) the power, direct or indirect, to cause the
   direction or management of such entity, whether by contract or
   otherwise, or (ii) ownership of fifty percent (50%) or more of the
   outstanding shares, or (iii) beneficial ownership of such entity.

   &quot;You&quot; (or &quot;Your&quot;) shall mean an individual or Legal Entity
   exercising permissions granted by this License.

   &quot;Source&quot; form shall mean the preferred form for making modifications,
   including but not limited to software source code, documentation
   source, and configuration files.

   &quot;Object&quot; form shall mean any form resulting from mechanical
   transformation or translation of a Source form, including but
   not limited to compiled object code, generated documentation,
   and conversions to other media types.

   &quot;Work&quot; shall mean the work of authorship, whether in Source or
   Object form, made available under the License, as indicated by a
   copyright notice that is included in or attached to the work
   (an example is provided in the Appendix below).

   &quot;Derivative Works&quot; shall mean any work, whether in Source or Object
   form, that is based on (or derived from) the Work and for which the
   editorial revisions, annotations, elaborations, or other modifications
   represent, as a whole, an original work of authorship. For the purposes
   of this License, Derivative Works shall not include works that remain
   separable from, or merely link (or bind by name) to the interfaces of,
   the Work and Derivative Works thereof.

   &quot;Contribution&quot; shall mean any work of authorship, including
   the original version of the Work and any modifications or additions
   to that Work or Derivative Works thereof, that is intentionally
   submitted to Licensor for inclusion in the Work by the copyright owner
   or by an individual or Legal Entity authorized to submit on behalf of
   the copyright owner. For the purposes of this definition, &quot;submitted&quot;
   means any form of electronic, verbal, or written communication sent
   to the Licensor or its representatives, including but not limited to
   communication on electronic mailing lists, source code control systems,
   and issue tracking systems that are managed by, or on behalf of, the
   Licensor for the purpose of discussing and improving the Work, but
   excluding communication that is conspicuously marked or otherwise
   designated in writing by the copyright owner as &quot;Not a Contribution.&quot;

   &quot;Contributor&quot; shall mean Licensor and any individual or Legal Entity
   on behalf of whom a Contribution has been received by Licensor and
   subsequently incorporated within the Work.

2. Grant of Copyright License. Subject to the terms and conditions of
   this License, each Contributor hereby grants to You a perpetual,
   worldwide, non-exclusive, no-charge, royalty-free, irrevocable
   copyright license to reproduce, prepare Derivative Works of,
   publicly display, publicly perform, sublicense, and distribute the
   Work and such Derivative Works in Source or Object form.

3. Grant of Patent License. Subject to the terms and conditions of
   this License, each Contributor hereby grants to You a perpetual,
   worldwide, non-exclusive, no-charge, royalty-free, irrevocable
   (except as stated in this section) patent license to make, have made,
   use, offer to sell, sell, import, and otherwise transfer the Work,
   where such license applies only to those patent claims licensable
   by such Contributor that are necessarily infringed by their
   Contribution(s) alone or by combination of their Contribution(s)
   with the Work to which such Contribution(s) was submitted. If You
   institute patent litigation against any entity (including a
   cross-claim or counterclaim in a lawsuit) alleging that the Work
   or a Contribution incorporated within the Work constitutes direct
   or contributory patent infringement, then any patent licenses
   granted to You under this License for that Work shall terminate
   as of the date such litigation is filed.

4. Redistribution. You may reproduce and distribute copies of the
   Work or Derivative Works thereof in any medium, with or without
   modifications, and in Source or Object form, provided that You
   meet the following conditions:

   (a) You must give any other recipients of the Work or
       Derivative Works a copy of this License; and

   (b) You must cause any modified files to carry prominent notices
       stating that You changed the files; and

   (c) You must retain, in the Source form of any Derivative Works
       that You distribute, all copyright, patent, trademark, and
       attribution notices from the Source form of the Work,
       excluding those notices that do not pertain to any part of
       the Derivative Works; and

   (d) If the Work includes a &quot;NOTICE&quot; text file as part of its
       distribution, then any Derivative Works that You distribute must
       include a readable copy of the attribution notices contained
       within such NOTICE file, excluding those notices that do not
       pertain to any part of the Derivative Works, in at least one
       of the following places: within a NOTICE text file distributed
       as part of the Derivative Works; within the Source form or
       documentation, if provided along with the Derivative Works; or,
       within a display generated by the Derivative Works, if and
       wherever such third-party notices normally appear. The contents
       of the NOTICE file are for informational purposes only and
       do not modify the License. You may add Your own attribution
       notices within Derivative Works that You distribute, alongside
       or as an addendum to the NOTICE text from the Work, provided
       that such additional attribution notices cannot be construed
       as modifying the License.

   You may add Your own copyright statement to Your modifications and
   may provide additional or different license terms and conditions
   for use, reproduction, or distribution of Your modifications, or
   for any such Derivative Works as a whole, provided Your use,
   reproduction, and distribution of the Work otherwise complies with
   the conditions stated in this License.

5. Submission of Contributions. Unless You explicitly state otherwise,
   any Contribution intentionally submitted for inclusion in the Work
   by You to the Licensor shall be under the terms and conditions of
   this License, without any additional terms or conditions.
   Notwithstanding the above, nothing herein shall supersede or modify
   the terms of any separate license agreement you may have executed
   with Licensor regarding such Contributions.

6. Trademarks. This License does not grant permission to use the trade
   names, trademarks, service marks, or product names of the Licensor,
   except as required for reasonable and customary use in describing the
   origin of the Work and reproducing the content of the NOTICE file.

7. Disclaimer of Warranty. Unless required by applicable law or
   agreed to in writing, Licensor provides the Work (and each
   Contributor provides its Contributions) on an &quot;AS IS&quot; BASIS,
   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
   implied, including, without limitation, any warranties or conditions
   of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
   PARTICULAR PURPOSE. You are solely responsible for determining the
   appropriateness of using or redistributing the Work and assume any
   risks associated with Your exercise of permissions under this License.

8. Limitation of Liability. In no event and under no legal theory,
   whether in tort (including negligence), contract, or otherwise,
   unless required by applicable law (such as deliberate and grossly
   negligent acts) or agreed to in writing, shall any Contributor be
   liable to You for damages, including any direct, indirect, special,
   incidental, or consequential damages of any character arising as a
   result of this License or out of the use or inability to use the
   Work (including but not limited to damages for loss of goodwill,
   work stoppage, computer failure or malfunction, or any and all
   other commercial damages or losses), even if such Contributor
   has been advised of the possibility of such damages.

9. Accepting Warranty or Additional Liability. While redistributing
   the Work or Derivative Works thereof, You may choose to offer,
   and charge a fee for, acceptance of support, warranty, indemnity,
   or other liability obligations and/or rights consistent with this
   License. However, in accepting such obligations, You may act only
   on Your own behalf and on Your sole responsibility, not on behalf
   of any other Contributor, and only if You agree to indemnify,
   defend, and hold each Contributor harmless for any liability
   incurred by, or claims asserted against, such Contributor by reason
   of your accepting any such warranty or additional liability.

END OF TERMS AND CONDITIONS

APPENDIX: How to apply the Apache License to your work.

   To apply the Apache License to your work, attach the following
   boilerplate notice, with the fields enclosed by brackets &quot;[]&quot;
   replaced with your own identifying information. (Don&#x27;t include
   the brackets!)  The text should be enclosed in the appropriate
   comment syntax for the file format. We also recommend that a
   file or class name and description of purpose be included on the
   same &quot;printed page&quot; as the copyright notice for easier
   identification within third-party archives.

Copyright [yyyy] [name of copyright owner]

Licensed under the Apache License, Version 2.0 (the &quot;License&quot;);
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

    http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an &quot;AS IS&quot; BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
</pre>
            </li>
            <li class="license">
                <h3 id="Apache-2.0">Apache License 2.0</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/RustCrypto/block-ciphers ">aes 0.8.4</a></li>
                    <li><a href=" https://github.com/RustCrypto/formats/tree/master/base16ct ">base16ct 0.1.1</a></li>
                    <li><a href=" https://github.com/RustCrypto/formats/tree/master/base64ct ">base64ct 1.6.0</a></li>
                    <li><a href=" https://github.com/RustCrypto/utils ">block-buffer 0.10.4</a></li>
                    <li><a href=" https://github.com/RustCrypto/traits ">cipher 0.4.4</a></li>
                    <li><a href=" https://github.com/RustCrypto/formats/tree/master/const-oid ">const-oid 0.9.6</a></li>
                    <li><a href=" https://github.com/RustCrypto/utils ">cpufeatures 0.2.14</a></li>
                    <li><a href=" https://github.com/RustCrypto/crypto-bigint ">crypto-bigint 0.4.9</a></li>
                    <li><a href=" https://github.com/RustCrypto/crypto-bigint ">crypto-bigint 0.5.5</a></li>
                    <li><a href=" https://github.com/RustCrypto/traits ">crypto-common 0.1.6</a></li>
                    <li><a href=" https://github.com/RustCrypto/formats/tree/master/der ">der 0.6.1</a></li>
                    <li><a href=" https://github.com/RustCrypto/traits ">digest 0.10.7</a></li>
                    <li><a href=" https://github.com/RustCrypto/traits/tree/master/elliptic-curve ">elliptic-curve 0.12.3</a></li>
                    <li><a href=" https://github.com/RustCrypto/MACs ">hmac 0.12.1</a></li>
                    <li><a href=" https://github.com/RustCrypto/utils ">inout 0.1.3</a></li>
                    <li><a href=" https://github.com/RustCrypto/hashes ">md-5 0.10.6</a></li>
                    <li><a href=" https://github.com/RustCrypto/elliptic-curves/tree/master/p256 ">p256 0.11.1</a></li>
                    <li><a href=" https://github.com/RustCrypto/traits/tree/master/password-hash ">password-hash 0.4.2</a></li>
                    <li><a href=" https://github.com/RustCrypto/password-hashes/tree/master/pbkdf2 ">pbkdf2 0.11.0</a></li>
                    <li><a href=" https://github.com/RustCrypto/formats/tree/master/pkcs8 ">pkcs8 0.9.0</a></li>
                    <li><a href=" https://github.com/RustCrypto/formats/tree/master/sec1 ">sec1 0.3.0</a></li>
                    <li><a href=" https://github.com/RustCrypto/hashes ">sha1 0.10.6</a></li>
                    <li><a href=" https://github.com/RustCrypto/hashes ">sha2 0.10.8</a></li>
                    <li><a href=" https://github.com/RustCrypto/traits/tree/master/signature ">signature 1.6.4</a></li>
                    <li><a href=" https://github.com/RustCrypto/formats/tree/master/spki ">spki 0.6.0</a></li>
                </ul>
                <pre class="license-text">                              Apache License
                        Version 2.0, January 2004
                     http://www.apache.org/licenses/

TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION

1. Definitions.

   &quot;License&quot; shall mean the terms and conditions for use, reproduction,
   and distribution as defined by Sections 1 through 9 of this document.

   &quot;Licensor&quot; shall mean the copyright owner or entity authorized by
   the copyright owner that is granting the License.

   &quot;Legal Entity&quot; shall mean the union of the acting entity and all
   other entities that control, are controlled by, or are under common
   control with that entity. For the purposes of this definition,
   &quot;control&quot; means (i) the power, direct or indirect, to cause the
   direction or management of such entity, whether by contract or
   otherwise, or (ii) ownership of fifty percent (50%) or more of the
   outstanding shares, or (iii) beneficial ownership of such entity.

   &quot;You&quot; (or &quot;Your&quot;) shall mean an individual or Legal Entity
   exercising permissions granted by this License.

   &quot;Source&quot; form shall mean the preferred form for making modifications,
   including but not limited to software source code, documentation
   source, and configuration files.

   &quot;Object&quot; form shall mean any form resulting from mechanical
   transformation or translation of a Source form, including but
   not limited to compiled object code, generated documentation,
   and conversions to other media types.

   &quot;Work&quot; shall mean the work of authorship, whether in Source or
   Object form, made available under the License, as indicated by a
   copyright notice that is included in or attached to the work
   (an example is provided in the Appendix below).

   &quot;Derivative Works&quot; shall mean any work, whether in Source or Object
   form, that is based on (or derived from) the Work and for which the
   editorial revisions, annotations, elaborations, or other modifications
   represent, as a whole, an original work of authorship. For the purposes
   of this License, Derivative Works shall not include works that remain
   separable from, or merely link (or bind by name) to the interfaces of,
   the Work and Derivative Works thereof.

   &quot;Contribution&quot; shall mean any work of authorship, including
   the original version of the Work and any modifications or additions
   to that Work or Derivative Works thereof, that is intentionally
   submitted to Licensor for inclusion in the Work by the copyright owner
   or by an individual or Legal Entity authorized to submit on behalf of
   the copyright owner. For the purposes of this definition, &quot;submitted&quot;
   means any form of electronic, verbal, or written communication sent
   to the Licensor or its representatives, including but not limited to
   communication on electronic mailing lists, source code control systems,
   and issue tracking systems that are managed by, or on behalf of, the
   Licensor for the purpose of discussing and improving the Work, but
   excluding communication that is conspicuously marked or otherwise
   designated in writing by the copyright owner as &quot;Not a Contribution.&quot;

   &quot;Contributor&quot; shall mean Licensor and any individual or Legal Entity
   on behalf of whom a Contribution has been received by Licensor and
   subsequently incorporated within the Work.

2. Grant of Copyright License. Subject to the terms and conditions of
   this License, each Contributor hereby grants to You a perpetual,
   worldwide, non-exclusive, no-charge, royalty-free, irrevocable
   copyright license to reproduce, prepare Derivative Works of,
   publicly display, publicly perform, sublicense, and distribute the
   Work and such Derivative Works in Source or Object form.

3. Grant of Patent License. Subject to the terms and conditions of
   this License, each Contributor hereby grants to You a perpetual,
   worldwide, non-exclusive, no-charge, royalty-free, irrevocable
   (except as stated in this section) patent license to make, have made,
   use, offer to sell, sell, import, and otherwise transfer the Work,
   where such license applies only to those patent claims licensable
   by such Contributor that are necessarily infringed by their
   Contribution(s) alone or by combination of their Contribution(s)
   with the Work to which such Contribution(s) was submitted. If You
   institute patent litigation against any entity (including a
   cross-claim or counterclaim in a lawsuit) alleging that the Work
   or a Contribution incorporated within the Work constitutes direct
   or contributory patent infringement, then any patent licenses
   granted to You under this License for that Work shall terminate
   as of the date such litigation is filed.

4. Redistribution. You may reproduce and distribute copies of the
   Work or Derivative Works thereof in any medium, with or without
   modifications, and in Source or Object form, provided that You
   meet the following conditions:

   (a) You must give any other recipients of the Work or
       Derivative Works a copy of this License; and

   (b) You must cause any modified files to carry prominent notices
       stating that You changed the files; and

   (c) You must retain, in the Source form of any Derivative Works
       that You distribute, all copyright, patent, trademark, and
       attribution notices from the Source form of the Work,
       excluding those notices that do not pertain to any part of
       the Derivative Works; and

   (d) If the Work includes a &quot;NOTICE&quot; text file as part of its
       distribution, then any Derivative Works that You distribute must
       include a readable copy of the attribution notices contained
       within such NOTICE file, excluding those notices that do not
       pertain to any part of the Derivative Works, in at least one
       of the following places: within a NOTICE text file distributed
       as part of the Derivative Works; within the Source form or
       documentation, if provided along with the Derivative Works; or,
       within a display generated by the Derivative Works, if and
       wherever such third-party notices normally appear. The contents
       of the NOTICE file are for informational purposes only and
       do not modify the License. You may add Your own attribution
       notices within Derivative Works that You distribute, alongside
       or as an addendum to the NOTICE text from the Work, provided
       that such additional attribution notices cannot be construed
       as modifying the License.

   You may add Your own copyright statement to Your modifications and
   may provide additional or different license terms and conditions
   for use, reproduction, or distribution of Your modifications, or
   for any such Derivative Works as a whole, provided Your use,
   reproduction, and distribution of the Work otherwise complies with
   the conditions stated in this License.

5. Submission of Contributions. Unless You explicitly state otherwise,
   any Contribution intentionally submitted for inclusion in the Work
   by You to the Licensor shall be under the terms and conditions of
   this License, without any additional terms or conditions.
   Notwithstanding the above, nothing herein shall supersede or modify
   the terms of any separate license agreement you may have executed
   with Licensor regarding such Contributions.

6. Trademarks. This License does not grant permission to use the trade
   names, trademarks, service marks, or product names of the Licensor,
   except as required for reasonable and customary use in describing the
   origin of the Work and reproducing the content of the NOTICE file.

7. Disclaimer of Warranty. Unless required by applicable law or
   agreed to in writing, Licensor provides the Work (and each
   Contributor provides its Contributions) on an &quot;AS IS&quot; BASIS,
   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
   implied, including, without limitation, any warranties or conditions
   of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
   PARTICULAR PURPOSE. You are solely responsible for determining the
   appropriateness of using or redistributing the Work and assume any
   risks associated with Your exercise of permissions under this License.

8. Limitation of Liability. In no event and under no legal theory,
   whether in tort (including negligence), contract, or otherwise,
   unless required by applicable law (such as deliberate and grossly
   negligent acts) or agreed to in writing, shall any Contributor be
   liable to You for damages, including any direct, indirect, special,
   incidental, or consequential damages of any character arising as a
   result of this License or out of the use or inability to use the
   Work (including but not limited to damages for loss of goodwill,
   work stoppage, computer failure or malfunction, or any and all
   other commercial damages or losses), even if such Contributor
   has been advised of the possibility of such damages.

9. Accepting Warranty or Additional Liability. While redistributing
   the Work or Derivative Works thereof, You may choose to offer,
   and charge a fee for, acceptance of support, warranty, indemnity,
   or other liability obligations and/or rights consistent with this
   License. However, in accepting such obligations, You may act only
   on Your own behalf and on Your sole responsibility, not on behalf
   of any other Contributor, and only if You agree to indemnify,
   defend, and hold each Contributor harmless for any liability
   incurred by, or claims asserted against, such Contributor by reason
   of your accepting any such warranty or additional liability.

END OF TERMS AND CONDITIONS

APPENDIX: How to apply the Apache License to your work.

   To apply the Apache License to your work, attach the following
   boilerplate notice, with the fields enclosed by brackets &quot;[]&quot;
   replaced with your own identifying information. (Don&#x27;t include
   the brackets!)  The text should be enclosed in the appropriate
   comment syntax for the file format. We also recommend that a
   file or class name and description of purpose be included on the
   same &quot;printed page&quot; as the copyright notice for easier
   identification within third-party archives.

Copyright [yyyy] [name of copyright owner]

Licensed under the Apache License, Version 2.0 (the &quot;License&quot;);
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

   http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an &quot;AS IS&quot; BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
</pre>
            </li>
            <li class="license">
                <h3 id="Apache-2.0">Apache License 2.0</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/rust-random/rand ">rand 0.8.5</a></li>
                </ul>
                <pre class="license-text">                              Apache License
                        Version 2.0, January 2004
                     https://www.apache.org/licenses/

TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION

1. Definitions.

   &quot;License&quot; shall mean the terms and conditions for use, reproduction,
   and distribution as defined by Sections 1 through 9 of this document.

   &quot;Licensor&quot; shall mean the copyright owner or entity authorized by
   the copyright owner that is granting the License.

   &quot;Legal Entity&quot; shall mean the union of the acting entity and all
   other entities that control, are controlled by, or are under common
   control with that entity. For the purposes of this definition,
   &quot;control&quot; means (i) the power, direct or indirect, to cause the
   direction or management of such entity, whether by contract or
   otherwise, or (ii) ownership of fifty percent (50%) or more of the
   outstanding shares, or (iii) beneficial ownership of such entity.

   &quot;You&quot; (or &quot;Your&quot;) shall mean an individual or Legal Entity
   exercising permissions granted by this License.

   &quot;Source&quot; form shall mean the preferred form for making modifications,
   including but not limited to software source code, documentation
   source, and configuration files.

   &quot;Object&quot; form shall mean any form resulting from mechanical
   transformation or translation of a Source form, including but
   not limited to compiled object code, generated documentation,
   and conversions to other media types.

   &quot;Work&quot; shall mean the work of authorship, whether in Source or
   Object form, made available under the License, as indicated by a
   copyright notice that is included in or attached to the work
   (an example is provided in the Appendix below).

   &quot;Derivative Works&quot; shall mean any work, whether in Source or Object
   form, that is based on (or derived from) the Work and for which the
   editorial revisions, annotations, elaborations, or other modifications
   represent, as a whole, an original work of authorship. For the purposes
   of this License, Derivative Works shall not include works that remain
   separable from, or merely link (or bind by name) to the interfaces of,
   the Work and Derivative Works thereof.

   &quot;Contribution&quot; shall mean any work of authorship, including
   the original version of the Work and any modifications or additions
   to that Work or Derivative Works thereof, that is intentionally
   submitted to Licensor for inclusion in the Work by the copyright owner
   or by an individual or Legal Entity authorized to submit on behalf of
   the copyright owner. For the purposes of this definition, &quot;submitted&quot;
   means any form of electronic, verbal, or written communication sent
   to the Licensor or its representatives, including but not limited to
   communication on electronic mailing lists, source code control systems,
   and issue tracking systems that are managed by, or on behalf of, the
   Licensor for the purpose of discussing and improving the Work, but
   excluding communication that is conspicuously marked or otherwise
   designated in writing by the copyright owner as &quot;Not a Contribution.&quot;

   &quot;Contributor&quot; shall mean Licensor and any individual or Legal Entity
   on behalf of whom a Contribution has been received by Licensor and
   subsequently incorporated within the Work.

2. Grant of Copyright License. Subject to the terms and conditions of
   this License, each Contributor hereby grants to You a perpetual,
   worldwide, non-exclusive, no-charge, royalty-free, irrevocable
   copyright license to reproduce, prepare Derivative Works of,
   publicly display, publicly perform, sublicense, and distribute the
   Work and such Derivative Works in Source or Object form.

3. Grant of Patent License. Subject to the terms and conditions of
   this License, each Contributor hereby grants to You a perpetual,
   worldwide, non-exclusive, no-charge, royalty-free, irrevocable
   (except as stated in this section) patent license to make, have made,
   use, offer to sell, sell, import, and otherwise transfer the Work,
   where such license applies only to those patent claims licensable
   by such Contributor that are necessarily infringed by their
   Contribution(s) alone or by combination of their Contribution(s)
   with the Work to which such Contribution(s) was submitted. If You
   institute patent litigation against any entity (including a
   cross-claim or counterclaim in a lawsuit) alleging that the Work
   or a Contribution incorporated within the Work constitutes direct
   or contributory patent infringement, then any patent licenses
   granted to You under this License for that Work shall terminate
   as of the date such litigation is filed.

4. Redistribution. You may reproduce and distribute copies of the
   Work or Derivative Works thereof in any medium, with or without
   modifications, and in Source or Object form, provided that You
   meet the following conditions:

   (a) You must give any other recipients of the Work or
       Derivative Works a copy of this License; and

   (b) You must cause any modified files to carry prominent notices
       stating that You changed the files; and

   (c) You must retain, in the Source form of any Derivative Works
       that You distribute, all copyright, patent, trademark, and
       attribution notices from the Source form of the Work,
       excluding those notices that do not pertain to any part of
       the Derivative Works; and

   (d) If the Work includes a &quot;NOTICE&quot; text file as part of its
       distribution, then any Derivative Works that You distribute must
       include a readable copy of the attribution notices contained
       within such NOTICE file, excluding those notices that do not
       pertain to any part of the Derivative Works, in at least one
       of the following places: within a NOTICE text file distributed
       as part of the Derivative Works; within the Source form or
       documentation, if provided along with the Derivative Works; or,
       within a display generated by the Derivative Works, if and
       wherever such third-party notices normally appear. The contents
       of the NOTICE file are for informational purposes only and
       do not modify the License. You may add Your own attribution
       notices within Derivative Works that You distribute, alongside
       or as an addendum to the NOTICE text from the Work, provided
       that such additional attribution notices cannot be construed
       as modifying the License.

   You may add Your own copyright statement to Your modifications and
   may provide additional or different license terms and conditions
   for use, reproduction, or distribution of Your modifications, or
   for any such Derivative Works as a whole, provided Your use,
   reproduction, and distribution of the Work otherwise complies with
   the conditions stated in this License.

5. Submission of Contributions. Unless You explicitly state otherwise,
   any Contribution intentionally submitted for inclusion in the Work
   by You to the Licensor shall be under the terms and conditions of
   this License, without any additional terms or conditions.
   Notwithstanding the above, nothing herein shall supersede or modify
   the terms of any separate license agreement you may have executed
   with Licensor regarding such Contributions.

6. Trademarks. This License does not grant permission to use the trade
   names, trademarks, service marks, or product names of the Licensor,
   except as required for reasonable and customary use in describing the
   origin of the Work and reproducing the content of the NOTICE file.

7. Disclaimer of Warranty. Unless required by applicable law or
   agreed to in writing, Licensor provides the Work (and each
   Contributor provides its Contributions) on an &quot;AS IS&quot; BASIS,
   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
   implied, including, without limitation, any warranties or conditions
   of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
   PARTICULAR PURPOSE. You are solely responsible for determining the
   appropriateness of using or redistributing the Work and assume any
   risks associated with Your exercise of permissions under this License.

8. Limitation of Liability. In no event and under no legal theory,
   whether in tort (including negligence), contract, or otherwise,
   unless required by applicable law (such as deliberate and grossly
   negligent acts) or agreed to in writing, shall any Contributor be
   liable to You for damages, including any direct, indirect, special,
   incidental, or consequential damages of any character arising as a
   result of this License or out of the use or inability to use the
   Work (including but not limited to damages for loss of goodwill,
   work stoppage, computer failure or malfunction, or any and all
   other commercial damages or losses), even if such Contributor
   has been advised of the possibility of such damages.

9. Accepting Warranty or Additional Liability. While redistributing
   the Work or Derivative Works thereof, You may choose to offer,
   and charge a fee for, acceptance of support, warranty, indemnity,
   or other liability obligations and/or rights consistent with this
   License. However, in accepting such obligations, You may act only
   on Your own behalf and on Your sole responsibility, not on behalf
   of any other Contributor, and only if You agree to indemnify,
   defend, and hold each Contributor harmless for any liability
   incurred by, or claims asserted against, such Contributor by reason
   of your accepting any such warranty or additional liability.

END OF TERMS AND CONDITIONS
</pre>
            </li>
            <li class="license">
                <h3 id="Apache-2.0">Apache License 2.0</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/rust-random/rand ">rand_core 0.6.4</a></li>
                    <li><a href=" https://github.com/rust-random/rand ">rand_distr 0.4.3</a></li>
                </ul>
                <pre class="license-text">                              Apache License
                        Version 2.0, January 2004
                     https://www.apache.org/licenses/

TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION

1. Definitions.

   &quot;License&quot; shall mean the terms and conditions for use, reproduction,
   and distribution as defined by Sections 1 through 9 of this document.

   &quot;Licensor&quot; shall mean the copyright owner or entity authorized by
   the copyright owner that is granting the License.

   &quot;Legal Entity&quot; shall mean the union of the acting entity and all
   other entities that control, are controlled by, or are under common
   control with that entity. For the purposes of this definition,
   &quot;control&quot; means (i) the power, direct or indirect, to cause the
   direction or management of such entity, whether by contract or
   otherwise, or (ii) ownership of fifty percent (50%) or more of the
   outstanding shares, or (iii) beneficial ownership of such entity.

   &quot;You&quot; (or &quot;Your&quot;) shall mean an individual or Legal Entity
   exercising permissions granted by this License.

   &quot;Source&quot; form shall mean the preferred form for making modifications,
   including but not limited to software source code, documentation
   source, and configuration files.

   &quot;Object&quot; form shall mean any form resulting from mechanical
   transformation or translation of a Source form, including but
   not limited to compiled object code, generated documentation,
   and conversions to other media types.

   &quot;Work&quot; shall mean the work of authorship, whether in Source or
   Object form, made available under the License, as indicated by a
   copyright notice that is included in or attached to the work
   (an example is provided in the Appendix below).

   &quot;Derivative Works&quot; shall mean any work, whether in Source or Object
   form, that is based on (or derived from) the Work and for which the
   editorial revisions, annotations, elaborations, or other modifications
   represent, as a whole, an original work of authorship. For the purposes
   of this License, Derivative Works shall not include works that remain
   separable from, or merely link (or bind by name) to the interfaces of,
   the Work and Derivative Works thereof.

   &quot;Contribution&quot; shall mean any work of authorship, including
   the original version of the Work and any modifications or additions
   to that Work or Derivative Works thereof, that is intentionally
   submitted to Licensor for inclusion in the Work by the copyright owner
   or by an individual or Legal Entity authorized to submit on behalf of
   the copyright owner. For the purposes of this definition, &quot;submitted&quot;
   means any form of electronic, verbal, or written communication sent
   to the Licensor or its representatives, including but not limited to
   communication on electronic mailing lists, source code control systems,
   and issue tracking systems that are managed by, or on behalf of, the
   Licensor for the purpose of discussing and improving the Work, but
   excluding communication that is conspicuously marked or otherwise
   designated in writing by the copyright owner as &quot;Not a Contribution.&quot;

   &quot;Contributor&quot; shall mean Licensor and any individual or Legal Entity
   on behalf of whom a Contribution has been received by Licensor and
   subsequently incorporated within the Work.

2. Grant of Copyright License. Subject to the terms and conditions of
   this License, each Contributor hereby grants to You a perpetual,
   worldwide, non-exclusive, no-charge, royalty-free, irrevocable
   copyright license to reproduce, prepare Derivative Works of,
   publicly display, publicly perform, sublicense, and distribute the
   Work and such Derivative Works in Source or Object form.

3. Grant of Patent License. Subject to the terms and conditions of
   this License, each Contributor hereby grants to You a perpetual,
   worldwide, non-exclusive, no-charge, royalty-free, irrevocable
   (except as stated in this section) patent license to make, have made,
   use, offer to sell, sell, import, and otherwise transfer the Work,
   where such license applies only to those patent claims licensable
   by such Contributor that are necessarily infringed by their
   Contribution(s) alone or by combination of their Contribution(s)
   with the Work to which such Contribution(s) was submitted. If You
   institute patent litigation against any entity (including a
   cross-claim or counterclaim in a lawsuit) alleging that the Work
   or a Contribution incorporated within the Work constitutes direct
   or contributory patent infringement, then any patent licenses
   granted to You under this License for that Work shall terminate
   as of the date such litigation is filed.

4. Redistribution. You may reproduce and distribute copies of the
   Work or Derivative Works thereof in any medium, with or without
   modifications, and in Source or Object form, provided that You
   meet the following conditions:

   (a) You must give any other recipients of the Work or
       Derivative Works a copy of this License; and

   (b) You must cause any modified files to carry prominent notices
       stating that You changed the files; and

   (c) You must retain, in the Source form of any Derivative Works
       that You distribute, all copyright, patent, trademark, and
       attribution notices from the Source form of the Work,
       excluding those notices that do not pertain to any part of
       the Derivative Works; and

   (d) If the Work includes a &quot;NOTICE&quot; text file as part of its
       distribution, then any Derivative Works that You distribute must
       include a readable copy of the attribution notices contained
       within such NOTICE file, excluding those notices that do not
       pertain to any part of the Derivative Works, in at least one
       of the following places: within a NOTICE text file distributed
       as part of the Derivative Works; within the Source form or
       documentation, if provided along with the Derivative Works; or,
       within a display generated by the Derivative Works, if and
       wherever such third-party notices normally appear. The contents
       of the NOTICE file are for informational purposes only and
       do not modify the License. You may add Your own attribution
       notices within Derivative Works that You distribute, alongside
       or as an addendum to the NOTICE text from the Work, provided
       that such additional attribution notices cannot be construed
       as modifying the License.

   You may add Your own copyright statement to Your modifications and
   may provide additional or different license terms and conditions
   for use, reproduction, or distribution of Your modifications, or
   for any such Derivative Works as a whole, provided Your use,
   reproduction, and distribution of the Work otherwise complies with
   the conditions stated in this License.

5. Submission of Contributions. Unless You explicitly state otherwise,
   any Contribution intentionally submitted for inclusion in the Work
   by You to the Licensor shall be under the terms and conditions of
   this License, without any additional terms or conditions.
   Notwithstanding the above, nothing herein shall supersede or modify
   the terms of any separate license agreement you may have executed
   with Licensor regarding such Contributions.

6. Trademarks. This License does not grant permission to use the trade
   names, trademarks, service marks, or product names of the Licensor,
   except as required for reasonable and customary use in describing the
   origin of the Work and reproducing the content of the NOTICE file.

7. Disclaimer of Warranty. Unless required by applicable law or
   agreed to in writing, Licensor provides the Work (and each
   Contributor provides its Contributions) on an &quot;AS IS&quot; BASIS,
   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
   implied, including, without limitation, any warranties or conditions
   of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
   PARTICULAR PURPOSE. You are solely responsible for determining the
   appropriateness of using or redistributing the Work and assume any
   risks associated with Your exercise of permissions under this License.

8. Limitation of Liability. In no event and under no legal theory,
   whether in tort (including negligence), contract, or otherwise,
   unless required by applicable law (such as deliberate and grossly
   negligent acts) or agreed to in writing, shall any Contributor be
   liable to You for damages, including any direct, indirect, special,
   incidental, or consequential damages of any character arising as a
   result of this License or out of the use or inability to use the
   Work (including but not limited to damages for loss of goodwill,
   work stoppage, computer failure or malfunction, or any and all
   other commercial damages or losses), even if such Contributor
   has been advised of the possibility of such damages.

9. Accepting Warranty or Additional Liability. While redistributing
   the Work or Derivative Works thereof, You may choose to offer,
   and charge a fee for, acceptance of support, warranty, indemnity,
   or other liability obligations and/or rights consistent with this
   License. However, in accepting such obligations, You may act only
   on Your own behalf and on Your sole responsibility, not on behalf
   of any other Contributor, and only if You agree to indemnify,
   defend, and hold each Contributor harmless for any liability
   incurred by, or claims asserted against, such Contributor by reason
   of your accepting any such warranty or additional liability.

END OF TERMS AND CONDITIONS

APPENDIX: How to apply the Apache License to your work.

   To apply the Apache License to your work, attach the following
   boilerplate notice, with the fields enclosed by brackets &quot;[]&quot;
   replaced with your own identifying information. (Don&#x27;t include
   the brackets!)  The text should be enclosed in the appropriate
   comment syntax for the file format. We also recommend that a
   file or class name and description of purpose be included on the
   same &quot;printed page&quot; as the copyright notice for easier
   identification within third-party archives.
</pre>
            </li>
            <li class="license">
                <h3 id="Apache-2.0">Apache License 2.0</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/rust-random/getrandom ">getrandom 0.1.16</a></li>
                    <li><a href=" https://github.com/rust-random/getrandom ">getrandom 0.2.15</a></li>
                    <li><a href=" https://github.com/rust-random/rand ">rand 0.7.3</a></li>
                    <li><a href=" https://github.com/rust-random/rand ">rand_chacha 0.2.2</a></li>
                    <li><a href=" https://github.com/rust-random/rand ">rand_chacha 0.3.1</a></li>
                    <li><a href=" https://github.com/rust-random/rand ">rand_core 0.5.1</a></li>
                    <li><a href=" https://github.com/rust-random/rand ">rand_hc 0.2.0</a></li>
                    <li><a href=" https://github.com/rust-random/rngs ">rand_xorshift 0.3.0</a></li>
                </ul>
                <pre class="license-text">                              Apache License
                        Version 2.0, January 2004
                     https://www.apache.org/licenses/

TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION

1. Definitions.

   &quot;License&quot; shall mean the terms and conditions for use, reproduction,
   and distribution as defined by Sections 1 through 9 of this document.

   &quot;Licensor&quot; shall mean the copyright owner or entity authorized by
   the copyright owner that is granting the License.

   &quot;Legal Entity&quot; shall mean the union of the acting entity and all
   other entities that control, are controlled by, or are under common
   control with that entity. For the purposes of this definition,
   &quot;control&quot; means (i) the power, direct or indirect, to cause the
   direction or management of such entity, whether by contract or
   otherwise, or (ii) ownership of fifty percent (50%) or more of the
   outstanding shares, or (iii) beneficial ownership of such entity.

   &quot;You&quot; (or &quot;Your&quot;) shall mean an individual or Legal Entity
   exercising permissions granted by this License.

   &quot;Source&quot; form shall mean the preferred form for making modifications,
   including but not limited to software source code, documentation
   source, and configuration files.

   &quot;Object&quot; form shall mean any form resulting from mechanical
   transformation or translation of a Source form, including but
   not limited to compiled object code, generated documentation,
   and conversions to other media types.

   &quot;Work&quot; shall mean the work of authorship, whether in Source or
   Object form, made available under the License, as indicated by a
   copyright notice that is included in or attached to the work
   (an example is provided in the Appendix below).

   &quot;Derivative Works&quot; shall mean any work, whether in Source or Object
   form, that is based on (or derived from) the Work and for which the
   editorial revisions, annotations, elaborations, or other modifications
   represent, as a whole, an original work of authorship. For the purposes
   of this License, Derivative Works shall not include works that remain
   separable from, or merely link (or bind by name) to the interfaces of,
   the Work and Derivative Works thereof.

   &quot;Contribution&quot; shall mean any work of authorship, including
   the original version of the Work and any modifications or additions
   to that Work or Derivative Works thereof, that is intentionally
   submitted to Licensor for inclusion in the Work by the copyright owner
   or by an individual or Legal Entity authorized to submit on behalf of
   the copyright owner. For the purposes of this definition, &quot;submitted&quot;
   means any form of electronic, verbal, or written communication sent
   to the Licensor or its representatives, including but not limited to
   communication on electronic mailing lists, source code control systems,
   and issue tracking systems that are managed by, or on behalf of, the
   Licensor for the purpose of discussing and improving the Work, but
   excluding communication that is conspicuously marked or otherwise
   designated in writing by the copyright owner as &quot;Not a Contribution.&quot;

   &quot;Contributor&quot; shall mean Licensor and any individual or Legal Entity
   on behalf of whom a Contribution has been received by Licensor and
   subsequently incorporated within the Work.

2. Grant of Copyright License. Subject to the terms and conditions of
   this License, each Contributor hereby grants to You a perpetual,
   worldwide, non-exclusive, no-charge, royalty-free, irrevocable
   copyright license to reproduce, prepare Derivative Works of,
   publicly display, publicly perform, sublicense, and distribute the
   Work and such Derivative Works in Source or Object form.

3. Grant of Patent License. Subject to the terms and conditions of
   this License, each Contributor hereby grants to You a perpetual,
   worldwide, non-exclusive, no-charge, royalty-free, irrevocable
   (except as stated in this section) patent license to make, have made,
   use, offer to sell, sell, import, and otherwise transfer the Work,
   where such license applies only to those patent claims licensable
   by such Contributor that are necessarily infringed by their
   Contribution(s) alone or by combination of their Contribution(s)
   with the Work to which such Contribution(s) was submitted. If You
   institute patent litigation against any entity (including a
   cross-claim or counterclaim in a lawsuit) alleging that the Work
   or a Contribution incorporated within the Work constitutes direct
   or contributory patent infringement, then any patent licenses
   granted to You under this License for that Work shall terminate
   as of the date such litigation is filed.

4. Redistribution. You may reproduce and distribute copies of the
   Work or Derivative Works thereof in any medium, with or without
   modifications, and in Source or Object form, provided that You
   meet the following conditions:

   (a) You must give any other recipients of the Work or
       Derivative Works a copy of this License; and

   (b) You must cause any modified files to carry prominent notices
       stating that You changed the files; and

   (c) You must retain, in the Source form of any Derivative Works
       that You distribute, all copyright, patent, trademark, and
       attribution notices from the Source form of the Work,
       excluding those notices that do not pertain to any part of
       the Derivative Works; and

   (d) If the Work includes a &quot;NOTICE&quot; text file as part of its
       distribution, then any Derivative Works that You distribute must
       include a readable copy of the attribution notices contained
       within such NOTICE file, excluding those notices that do not
       pertain to any part of the Derivative Works, in at least one
       of the following places: within a NOTICE text file distributed
       as part of the Derivative Works; within the Source form or
       documentation, if provided along with the Derivative Works; or,
       within a display generated by the Derivative Works, if and
       wherever such third-party notices normally appear. The contents
       of the NOTICE file are for informational purposes only and
       do not modify the License. You may add Your own attribution
       notices within Derivative Works that You distribute, alongside
       or as an addendum to the NOTICE text from the Work, provided
       that such additional attribution notices cannot be construed
       as modifying the License.

   You may add Your own copyright statement to Your modifications and
   may provide additional or different license terms and conditions
   for use, reproduction, or distribution of Your modifications, or
   for any such Derivative Works as a whole, provided Your use,
   reproduction, and distribution of the Work otherwise complies with
   the conditions stated in this License.

5. Submission of Contributions. Unless You explicitly state otherwise,
   any Contribution intentionally submitted for inclusion in the Work
   by You to the Licensor shall be under the terms and conditions of
   this License, without any additional terms or conditions.
   Notwithstanding the above, nothing herein shall supersede or modify
   the terms of any separate license agreement you may have executed
   with Licensor regarding such Contributions.

6. Trademarks. This License does not grant permission to use the trade
   names, trademarks, service marks, or product names of the Licensor,
   except as required for reasonable and customary use in describing the
   origin of the Work and reproducing the content of the NOTICE file.

7. Disclaimer of Warranty. Unless required by applicable law or
   agreed to in writing, Licensor provides the Work (and each
   Contributor provides its Contributions) on an &quot;AS IS&quot; BASIS,
   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
   implied, including, without limitation, any warranties or conditions
   of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
   PARTICULAR PURPOSE. You are solely responsible for determining the
   appropriateness of using or redistributing the Work and assume any
   risks associated with Your exercise of permissions under this License.

8. Limitation of Liability. In no event and under no legal theory,
   whether in tort (including negligence), contract, or otherwise,
   unless required by applicable law (such as deliberate and grossly
   negligent acts) or agreed to in writing, shall any Contributor be
   liable to You for damages, including any direct, indirect, special,
   incidental, or consequential damages of any character arising as a
   result of this License or out of the use or inability to use the
   Work (including but not limited to damages for loss of goodwill,
   work stoppage, computer failure or malfunction, or any and all
   other commercial damages or losses), even if such Contributor
   has been advised of the possibility of such damages.

9. Accepting Warranty or Additional Liability. While redistributing
   the Work or Derivative Works thereof, You may choose to offer,
   and charge a fee for, acceptance of support, warranty, indemnity,
   or other liability obligations and/or rights consistent with this
   License. However, in accepting such obligations, You may act only
   on Your own behalf and on Your sole responsibility, not on behalf
   of any other Contributor, and only if You agree to indemnify,
   defend, and hold each Contributor harmless for any liability
   incurred by, or claims asserted against, such Contributor by reason
   of your accepting any such warranty or additional liability.

END OF TERMS AND CONDITIONS

APPENDIX: How to apply the Apache License to your work.

   To apply the Apache License to your work, attach the following
   boilerplate notice, with the fields enclosed by brackets &quot;[]&quot;
   replaced with your own identifying information. (Don&#x27;t include
   the brackets!)  The text should be enclosed in the appropriate
   comment syntax for the file format. We also recommend that a
   file or class name and description of purpose be included on the
   same &quot;printed page&quot; as the copyright notice for easier
   identification within third-party archives.

Copyright [yyyy] [name of copyright owner]

Licensed under the Apache License, Version 2.0 (the &quot;License&quot;);
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

	https://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an &quot;AS IS&quot; BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
</pre>
            </li>
            <li class="license">
                <h3 id="Apache-2.0">Apache License 2.0</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/rust-lang/cargo ">home 0.5.9</a></li>
                </ul>
                <pre class="license-text">                              Apache License
                        Version 2.0, January 2004
                     https://www.apache.org/licenses/LICENSE-2.0

TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION

1. Definitions.

   &quot;License&quot; shall mean the terms and conditions for use, reproduction,
   and distribution as defined by Sections 1 through 9 of this document.

   &quot;Licensor&quot; shall mean the copyright owner or entity authorized by
   the copyright owner that is granting the License.

   &quot;Legal Entity&quot; shall mean the union of the acting entity and all
   other entities that control, are controlled by, or are under common
   control with that entity. For the purposes of this definition,
   &quot;control&quot; means (i) the power, direct or indirect, to cause the
   direction or management of such entity, whether by contract or
   otherwise, or (ii) ownership of fifty percent (50%) or more of the
   outstanding shares, or (iii) beneficial ownership of such entity.

   &quot;You&quot; (or &quot;Your&quot;) shall mean an individual or Legal Entity
   exercising permissions granted by this License.

   &quot;Source&quot; form shall mean the preferred form for making modifications,
   including but not limited to software source code, documentation
   source, and configuration files.

   &quot;Object&quot; form shall mean any form resulting from mechanical
   transformation or translation of a Source form, including but
   not limited to compiled object code, generated documentation,
   and conversions to other media types.

   &quot;Work&quot; shall mean the work of authorship, whether in Source or
   Object form, made available under the License, as indicated by a
   copyright notice that is included in or attached to the work
   (an example is provided in the Appendix below).

   &quot;Derivative Works&quot; shall mean any work, whether in Source or Object
   form, that is based on (or derived from) the Work and for which the
   editorial revisions, annotations, elaborations, or other modifications
   represent, as a whole, an original work of authorship. For the purposes
   of this License, Derivative Works shall not include works that remain
   separable from, or merely link (or bind by name) to the interfaces of,
   the Work and Derivative Works thereof.

   &quot;Contribution&quot; shall mean any work of authorship, including
   the original version of the Work and any modifications or additions
   to that Work or Derivative Works thereof, that is intentionally
   submitted to Licensor for inclusion in the Work by the copyright owner
   or by an individual or Legal Entity authorized to submit on behalf of
   the copyright owner. For the purposes of this definition, &quot;submitted&quot;
   means any form of electronic, verbal, or written communication sent
   to the Licensor or its representatives, including but not limited to
   communication on electronic mailing lists, source code control systems,
   and issue tracking systems that are managed by, or on behalf of, the
   Licensor for the purpose of discussing and improving the Work, but
   excluding communication that is conspicuously marked or otherwise
   designated in writing by the copyright owner as &quot;Not a Contribution.&quot;

   &quot;Contributor&quot; shall mean Licensor and any individual or Legal Entity
   on behalf of whom a Contribution has been received by Licensor and
   subsequently incorporated within the Work.

2. Grant of Copyright License. Subject to the terms and conditions of
   this License, each Contributor hereby grants to You a perpetual,
   worldwide, non-exclusive, no-charge, royalty-free, irrevocable
   copyright license to reproduce, prepare Derivative Works of,
   publicly display, publicly perform, sublicense, and distribute the
   Work and such Derivative Works in Source or Object form.

3. Grant of Patent License. Subject to the terms and conditions of
   this License, each Contributor hereby grants to You a perpetual,
   worldwide, non-exclusive, no-charge, royalty-free, irrevocable
   (except as stated in this section) patent license to make, have made,
   use, offer to sell, sell, import, and otherwise transfer the Work,
   where such license applies only to those patent claims licensable
   by such Contributor that are necessarily infringed by their
   Contribution(s) alone or by combination of their Contribution(s)
   with the Work to which such Contribution(s) was submitted. If You
   institute patent litigation against any entity (including a
   cross-claim or counterclaim in a lawsuit) alleging that the Work
   or a Contribution incorporated within the Work constitutes direct
   or contributory patent infringement, then any patent licenses
   granted to You under this License for that Work shall terminate
   as of the date such litigation is filed.

4. Redistribution. You may reproduce and distribute copies of the
   Work or Derivative Works thereof in any medium, with or without
   modifications, and in Source or Object form, provided that You
   meet the following conditions:

   (a) You must give any other recipients of the Work or
       Derivative Works a copy of this License; and

   (b) You must cause any modified files to carry prominent notices
       stating that You changed the files; and

   (c) You must retain, in the Source form of any Derivative Works
       that You distribute, all copyright, patent, trademark, and
       attribution notices from the Source form of the Work,
       excluding those notices that do not pertain to any part of
       the Derivative Works; and

   (d) If the Work includes a &quot;NOTICE&quot; text file as part of its
       distribution, then any Derivative Works that You distribute must
       include a readable copy of the attribution notices contained
       within such NOTICE file, excluding those notices that do not
       pertain to any part of the Derivative Works, in at least one
       of the following places: within a NOTICE text file distributed
       as part of the Derivative Works; within the Source form or
       documentation, if provided along with the Derivative Works; or,
       within a display generated by the Derivative Works, if and
       wherever such third-party notices normally appear. The contents
       of the NOTICE file are for informational purposes only and
       do not modify the License. You may add Your own attribution
       notices within Derivative Works that You distribute, alongside
       or as an addendum to the NOTICE text from the Work, provided
       that such additional attribution notices cannot be construed
       as modifying the License.

   You may add Your own copyright statement to Your modifications and
   may provide additional or different license terms and conditions
   for use, reproduction, or distribution of Your modifications, or
   for any such Derivative Works as a whole, provided Your use,
   reproduction, and distribution of the Work otherwise complies with
   the conditions stated in this License.

5. Submission of Contributions. Unless You explicitly state otherwise,
   any Contribution intentionally submitted for inclusion in the Work
   by You to the Licensor shall be under the terms and conditions of
   this License, without any additional terms or conditions.
   Notwithstanding the above, nothing herein shall supersede or modify
   the terms of any separate license agreement you may have executed
   with Licensor regarding such Contributions.

6. Trademarks. This License does not grant permission to use the trade
   names, trademarks, service marks, or product names of the Licensor,
   except as required for reasonable and customary use in describing the
   origin of the Work and reproducing the content of the NOTICE file.

7. Disclaimer of Warranty. Unless required by applicable law or
   agreed to in writing, Licensor provides the Work (and each
   Contributor provides its Contributions) on an &quot;AS IS&quot; BASIS,
   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
   implied, including, without limitation, any warranties or conditions
   of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
   PARTICULAR PURPOSE. You are solely responsible for determining the
   appropriateness of using or redistributing the Work and assume any
   risks associated with Your exercise of permissions under this License.

8. Limitation of Liability. In no event and under no legal theory,
   whether in tort (including negligence), contract, or otherwise,
   unless required by applicable law (such as deliberate and grossly
   negligent acts) or agreed to in writing, shall any Contributor be
   liable to You for damages, including any direct, indirect, special,
   incidental, or consequential damages of any character arising as a
   result of this License or out of the use or inability to use the
   Work (including but not limited to damages for loss of goodwill,
   work stoppage, computer failure or malfunction, or any and all
   other commercial damages or losses), even if such Contributor
   has been advised of the possibility of such damages.

9. Accepting Warranty or Additional Liability. While redistributing
   the Work or Derivative Works thereof, You may choose to offer,
   and charge a fee for, acceptance of support, warranty, indemnity,
   or other liability obligations and/or rights consistent with this
   License. However, in accepting such obligations, You may act only
   on Your own behalf and on Your sole responsibility, not on behalf
   of any other Contributor, and only if You agree to indemnify,
   defend, and hold each Contributor harmless for any liability
   incurred by, or claims asserted against, such Contributor by reason
   of your accepting any such warranty or additional liability.

END OF TERMS AND CONDITIONS

APPENDIX: How to apply the Apache License to your work.

   To apply the Apache License to your work, attach the following
   boilerplate notice, with the fields enclosed by brackets &quot;[]&quot;
   replaced with your own identifying information. (Don&#x27;t include
   the brackets!)  The text should be enclosed in the appropriate
   comment syntax for the file format. We also recommend that a
   file or class name and description of purpose be included on the
   same &quot;printed page&quot; as the copyright notice for easier
   identification within third-party archives.

Copyright [yyyy] [name of copyright owner]

Licensed under the Apache License, Version 2.0 (the &quot;License&quot;);
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

	https://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an &quot;AS IS&quot; BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
</pre>
            </li>
            <li class="license">
                <h3 id="Apache-2.0">Apache License 2.0</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/zakarumych/allocator-api2 ">allocator-api2 0.2.18</a></li>
                </ul>
                <pre class="license-text">                              Apache License
                        Version 2.0, January 2004
                     http://www.apache.org/licenses/

TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION

1. Definitions.

   &quot;License&quot; shall mean the terms and conditions for use, reproduction,
   and distribution as defined by Sections 1 through 9 of this document.

   &quot;Licensor&quot; shall mean the copyright owner or entity authorized by
   the copyright owner that is granting the License.

   &quot;Legal Entity&quot; shall mean the union of the acting entity and all
   other entities that control, are controlled by, or are under common
   control with that entity. For the purposes of this definition,
   &quot;control&quot; means (i) the power, direct or indirect, to cause the
   direction or management of such entity, whether by contract or
   otherwise, or (ii) ownership of fifty percent (50%) or more of the
   outstanding shares, or (iii) beneficial ownership of such entity.

   &quot;You&quot; (or &quot;Your&quot;) shall mean an individual or Legal Entity
   exercising permissions granted by this License.

   &quot;Source&quot; form shall mean the preferred form for making modifications,
   including but not limited to software source code, documentation
   source, and configuration files.

   &quot;Object&quot; form shall mean any form resulting from mechanical
   transformation or translation of a Source form, including but
   not limited to compiled object code, generated documentation,
   and conversions to other media types.

   &quot;Work&quot; shall mean the work of authorship, whether in Source or
   Object form, made available under the License, as indicated by a
   copyright notice that is included in or attached to the work
   (an example is provided in the Appendix below).

   &quot;Derivative Works&quot; shall mean any work, whether in Source or Object
   form, that is based on (or derived from) the Work and for which the
   editorial revisions, annotations, elaborations, or other modifications
   represent, as a whole, an original work of authorship. For the purposes
   of this License, Derivative Works shall not include works that remain
   separable from, or merely link (or bind by name) to the interfaces of,
   the Work and Derivative Works thereof.

   &quot;Contribution&quot; shall mean any work of authorship, including
   the original version of the Work and any modifications or additions
   to that Work or Derivative Works thereof, that is intentionally
   submitted to Licensor for inclusion in the Work by the copyright owner
   or by an individual or Legal Entity authorized to submit on behalf of
   the copyright owner. For the purposes of this definition, &quot;submitted&quot;
   means any form of electronic, verbal, or written communication sent
   to the Licensor or its representatives, including but not limited to
   communication on electronic mailing lists, source code control systems,
   and issue tracking systems that are managed by, or on behalf of, the
   Licensor for the purpose of discussing and improving the Work, but
   excluding communication that is conspicuously marked or otherwise
   designated in writing by the copyright owner as &quot;Not a Contribution.&quot;

   &quot;Contributor&quot; shall mean Licensor and any individual or Legal Entity
   on behalf of whom a Contribution has been received by Licensor and
   subsequently incorporated within the Work.

2. Grant of Copyright License. Subject to the terms and conditions of
   this License, each Contributor hereby grants to You a perpetual,
   worldwide, non-exclusive, no-charge, royalty-free, irrevocable
   copyright license to reproduce, prepare Derivative Works of,
   publicly display, publicly perform, sublicense, and distribute the
   Work and such Derivative Works in Source or Object form.

3. Grant of Patent License. Subject to the terms and conditions of
   this License, each Contributor hereby grants to You a perpetual,
   worldwide, non-exclusive, no-charge, royalty-free, irrevocable
   (except as stated in this section) patent license to make, have made,
   use, offer to sell, sell, import, and otherwise transfer the Work,
   where such license applies only to those patent claims licensable
   by such Contributor that are necessarily infringed by their
   Contribution(s) alone or by combination of their Contribution(s)
   with the Work to which such Contribution(s) was submitted. If You
   institute patent litigation against any entity (including a
   cross-claim or counterclaim in a lawsuit) alleging that the Work
   or a Contribution incorporated within the Work constitutes direct
   or contributory patent infringement, then any patent licenses
   granted to You under this License for that Work shall terminate
   as of the date such litigation is filed.

4. Redistribution. You may reproduce and distribute copies of the
   Work or Derivative Works thereof in any medium, with or without
   modifications, and in Source or Object form, provided that You
   meet the following conditions:

   (a) You must give any other recipients of the Work or
       Derivative Works a copy of this License; and

   (b) You must cause any modified files to carry prominent notices
       stating that You changed the files; and

   (c) You must retain, in the Source form of any Derivative Works
       that You distribute, all copyright, patent, trademark, and
       attribution notices from the Source form of the Work,
       excluding those notices that do not pertain to any part of
       the Derivative Works; and

   (d) If the Work includes a &quot;NOTICE&quot; text file as part of its
       distribution, then any Derivative Works that You distribute must
       include a readable copy of the attribution notices contained
       within such NOTICE file, excluding those notices that do not
       pertain to any part of the Derivative Works, in at least one
       of the following places: within a NOTICE text file distributed
       as part of the Derivative Works; within the Source form or
       documentation, if provided along with the Derivative Works; or,
       within a display generated by the Derivative Works, if and
       wherever such third-party notices normally appear. The contents
       of the NOTICE file are for informational purposes only and
       do not modify the License. You may add Your own attribution
       notices within Derivative Works that You distribute, alongside
       or as an addendum to the NOTICE text from the Work, provided
       that such additional attribution notices cannot be construed
       as modifying the License.

   You may add Your own copyright statement to Your modifications and
   may provide additional or different license terms and conditions
   for use, reproduction, or distribution of Your modifications, or
   for any such Derivative Works as a whole, provided Your use,
   reproduction, and distribution of the Work otherwise complies with
   the conditions stated in this License.

5. Submission of Contributions. Unless You explicitly state otherwise,
   any Contribution intentionally submitted for inclusion in the Work
   by You to the Licensor shall be under the terms and conditions of
   this License, without any additional terms or conditions.
   Notwithstanding the above, nothing herein shall supersede or modify
   the terms of any separate license agreement you may have executed
   with Licensor regarding such Contributions.

6. Trademarks. This License does not grant permission to use the trade
   names, trademarks, service marks, or product names of the Licensor,
   except as required for reasonable and customary use in describing the
   origin of the Work and reproducing the content of the NOTICE file.

7. Disclaimer of Warranty. Unless required by applicable law or
   agreed to in writing, Licensor provides the Work (and each
   Contributor provides its Contributions) on an &quot;AS IS&quot; BASIS,
   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
   implied, including, without limitation, any warranties or conditions
   of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
   PARTICULAR PURPOSE. You are solely responsible for determining the
   appropriateness of using or redistributing the Work and assume any
   risks associated with Your exercise of permissions under this License.

8. Limitation of Liability. In no event and under no legal theory,
   whether in tort (including negligence), contract, or otherwise,
   unless required by applicable law (such as deliberate and grossly
   negligent acts) or agreed to in writing, shall any Contributor be
   liable to You for damages, including any direct, indirect, special,
   incidental, or consequential damages of any character arising as a
   result of this License or out of the use or inability to use the
   Work (including but not limited to damages for loss of goodwill,
   work stoppage, computer failure or malfunction, or any and all
   other commercial damages or losses), even if such Contributor
   has been advised of the possibility of such damages.

9. Accepting Warranty or Additional Liability. While redistributing
   the Work or Derivative Works thereof, You may choose to offer,
   and charge a fee for, acceptance of support, warranty, indemnity,
   or other liability obligations and/or rights consistent with this
   License. However, in accepting such obligations, You may act only
   on Your own behalf and on Your sole responsibility, not on behalf
   of any other Contributor, and only if You agree to indemnify,
   defend, and hold each Contributor harmless for any liability
   incurred by, or claims asserted against, such Contributor by reason
   of your accepting any such warranty or additional liability.

END OF TERMS AND CONDITIONS
</pre>
            </li>
            <li class="license">
                <h3 id="Apache-2.0">Apache License 2.0</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://gitlab.com/CreepySkeleton/proc-macro-error ">proc-macro-error 1.0.4</a></li>
                </ul>
                <pre class="license-text">                              Apache License
                        Version 2.0, January 2004
                     http://www.apache.org/licenses/

TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION

1. Definitions.

   &quot;License&quot; shall mean the terms and conditions for use, reproduction,
   and distribution as defined by Sections 1 through 9 of this document.

   &quot;Licensor&quot; shall mean the copyright owner or entity authorized by
   the copyright owner that is granting the License.

   &quot;Legal Entity&quot; shall mean the union of the acting entity and all
   other entities that control, are controlled by, or are under common
   control with that entity. For the purposes of this definition,
   &quot;control&quot; means (i) the power, direct or indirect, to cause the
   direction or management of such entity, whether by contract or
   otherwise, or (ii) ownership of fifty percent (50%) or more of the
   outstanding shares, or (iii) beneficial ownership of such entity.

   &quot;You&quot; (or &quot;Your&quot;) shall mean an individual or Legal Entity
   exercising permissions granted by this License.

   &quot;Source&quot; form shall mean the preferred form for making modifications,
   including but not limited to software source code, documentation
   source, and configuration files.

   &quot;Object&quot; form shall mean any form resulting from mechanical
   transformation or translation of a Source form, including but
   not limited to compiled object code, generated documentation,
   and conversions to other media types.

   &quot;Work&quot; shall mean the work of authorship, whether in Source or
   Object form, made available under the License, as indicated by a
   copyright notice that is included in or attached to the work
   (an example is provided in the Appendix below).

   &quot;Derivative Works&quot; shall mean any work, whether in Source or Object
   form, that is based on (or derived from) the Work and for which the
   editorial revisions, annotations, elaborations, or other modifications
   represent, as a whole, an original work of authorship. For the purposes
   of this License, Derivative Works shall not include works that remain
   separable from, or merely link (or bind by name) to the interfaces of,
   the Work and Derivative Works thereof.

   &quot;Contribution&quot; shall mean any work of authorship, including
   the original version of the Work and any modifications or additions
   to that Work or Derivative Works thereof, that is intentionally
   submitted to Licensor for inclusion in the Work by the copyright owner
   or by an individual or Legal Entity authorized to submit on behalf of
   the copyright owner. For the purposes of this definition, &quot;submitted&quot;
   means any form of electronic, verbal, or written communication sent
   to the Licensor or its representatives, including but not limited to
   communication on electronic mailing lists, source code control systems,
   and issue tracking systems that are managed by, or on behalf of, the
   Licensor for the purpose of discussing and improving the Work, but
   excluding communication that is conspicuously marked or otherwise
   designated in writing by the copyright owner as &quot;Not a Contribution.&quot;

   &quot;Contributor&quot; shall mean Licensor and any individual or Legal Entity
   on behalf of whom a Contribution has been received by Licensor and
   subsequently incorporated within the Work.

2. Grant of Copyright License. Subject to the terms and conditions of
   this License, each Contributor hereby grants to You a perpetual,
   worldwide, non-exclusive, no-charge, royalty-free, irrevocable
   copyright license to reproduce, prepare Derivative Works of,
   publicly display, publicly perform, sublicense, and distribute the
   Work and such Derivative Works in Source or Object form.

3. Grant of Patent License. Subject to the terms and conditions of
   this License, each Contributor hereby grants to You a perpetual,
   worldwide, non-exclusive, no-charge, royalty-free, irrevocable
   (except as stated in this section) patent license to make, have made,
   use, offer to sell, sell, import, and otherwise transfer the Work,
   where such license applies only to those patent claims licensable
   by such Contributor that are necessarily infringed by their
   Contribution(s) alone or by combination of their Contribution(s)
   with the Work to which such Contribution(s) was submitted. If You
   institute patent litigation against any entity (including a
   cross-claim or counterclaim in a lawsuit) alleging that the Work
   or a Contribution incorporated within the Work constitutes direct
   or contributory patent infringement, then any patent licenses
   granted to You under this License for that Work shall terminate
   as of the date such litigation is filed.

4. Redistribution. You may reproduce and distribute copies of the
   Work or Derivative Works thereof in any medium, with or without
   modifications, and in Source or Object form, provided that You
   meet the following conditions:

   (a) You must give any other recipients of the Work or
       Derivative Works a copy of this License; and

   (b) You must cause any modified files to carry prominent notices
       stating that You changed the files; and

   (c) You must retain, in the Source form of any Derivative Works
       that You distribute, all copyright, patent, trademark, and
       attribution notices from the Source form of the Work,
       excluding those notices that do not pertain to any part of
       the Derivative Works; and

   (d) If the Work includes a &quot;NOTICE&quot; text file as part of its
       distribution, then any Derivative Works that You distribute must
       include a readable copy of the attribution notices contained
       within such NOTICE file, excluding those notices that do not
       pertain to any part of the Derivative Works, in at least one
       of the following places: within a NOTICE text file distributed
       as part of the Derivative Works; within the Source form or
       documentation, if provided along with the Derivative Works; or,
       within a display generated by the Derivative Works, if and
       wherever such third-party notices normally appear. The contents
       of the NOTICE file are for informational purposes only and
       do not modify the License. You may add Your own attribution
       notices within Derivative Works that You distribute, alongside
       or as an addendum to the NOTICE text from the Work, provided
       that such additional attribution notices cannot be construed
       as modifying the License.

   You may add Your own copyright statement to Your modifications and
   may provide additional or different license terms and conditions
   for use, reproduction, or distribution of Your modifications, or
   for any such Derivative Works as a whole, provided Your use,
   reproduction, and distribution of the Work otherwise complies with
   the conditions stated in this License.

5. Submission of Contributions. Unless You explicitly state otherwise,
   any Contribution intentionally submitted for inclusion in the Work
   by You to the Licensor shall be under the terms and conditions of
   this License, without any additional terms or conditions.
   Notwithstanding the above, nothing herein shall supersede or modify
   the terms of any separate license agreement you may have executed
   with Licensor regarding such Contributions.

6. Trademarks. This License does not grant permission to use the trade
   names, trademarks, service marks, or product names of the Licensor,
   except as required for reasonable and customary use in describing the
   origin of the Work and reproducing the content of the NOTICE file.

7. Disclaimer of Warranty. Unless required by applicable law or
   agreed to in writing, Licensor provides the Work (and each
   Contributor provides its Contributions) on an &quot;AS IS&quot; BASIS,
   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
   implied, including, without limitation, any warranties or conditions
   of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
   PARTICULAR PURPOSE. You are solely responsible for determining the
   appropriateness of using or redistributing the Work and assume any
   risks associated with Your exercise of permissions under this License.

8. Limitation of Liability. In no event and under no legal theory,
   whether in tort (including negligence), contract, or otherwise,
   unless required by applicable law (such as deliberate and grossly
   negligent acts) or agreed to in writing, shall any Contributor be
   liable to You for damages, including any direct, indirect, special,
   incidental, or consequential damages of any character arising as a
   result of this License or out of the use or inability to use the
   Work (including but not limited to damages for loss of goodwill,
   work stoppage, computer failure or malfunction, or any and all
   other commercial damages or losses), even if such Contributor
   has been advised of the possibility of such damages.

9. Accepting Warranty or Additional Liability. While redistributing
   the Work or Derivative Works thereof, You may choose to offer,
   and charge a fee for, acceptance of support, warranty, indemnity,
   or other liability obligations and/or rights consistent with this
   License. However, in accepting such obligations, You may act only
   on Your own behalf and on Your sole responsibility, not on behalf
   of any other Contributor, and only if You agree to indemnify,
   defend, and hold each Contributor harmless for any liability
   incurred by, or claims asserted against, such Contributor by reason
   of your accepting any such warranty or additional liability.

END OF TERMS AND CONDITIONS

APPENDIX: How to apply the Apache License to your work.

   To apply the Apache License to your work, attach the following
   boilerplate notice, with the fields enclosed by brackets &quot;[]&quot;
   replaced with your own identifying information. (Don&#x27;t include
   the brackets!)  The text should be enclosed in the appropriate
   comment syntax for the file format. We also recommend that a
   file or class name and description of purpose be included on the
   same &quot;printed page&quot; as the copyright notice for easier
   identification within third-party archives.

Copyright 2019-2020 CreepySkeleton &lt;creepy-skeleton@yandex.ru&gt;

Licensed under the Apache License, Version 2.0 (the &quot;License&quot;);
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

    http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an &quot;AS IS&quot; BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
</pre>
            </li>
            <li class="license">
                <h3 id="Apache-2.0">Apache License 2.0</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/zesterer/flume ">flume 0.11.0</a></li>
                </ul>
                <pre class="license-text">   Apache License
                           Version 2.0, January 2004
                        http://www.apache.org/licenses/

   TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION

   1. Definitions.

      &quot;License&quot; shall mean the terms and conditions for use, reproduction,
      and distribution as defined by Sections 1 through 9 of this document.

      &quot;Licensor&quot; shall mean the copyright owner or entity authorized by
      the copyright owner that is granting the License.

      &quot;Legal Entity&quot; shall mean the union of the acting entity and all
      other entities that control, are controlled by, or are under common
      control with that entity. For the purposes of this definition,
      &quot;control&quot; means (i) the power, direct or indirect, to cause the
      direction or management of such entity, whether by contract or
      otherwise, or (ii) ownership of fifty percent (50%) or more of the
      outstanding shares, or (iii) beneficial ownership of such entity.

      &quot;You&quot; (or &quot;Your&quot;) shall mean an individual or Legal Entity
      exercising permissions granted by this License.

      &quot;Source&quot; form shall mean the preferred form for making modifications,
      including but not limited to software source code, documentation
      source, and configuration files.

      &quot;Object&quot; form shall mean any form resulting from mechanical
      transformation or translation of a Source form, including but
      not limited to compiled object code, generated documentation,
      and conversions to other media types.

      &quot;Work&quot; shall mean the work of authorship, whether in Source or
      Object form, made available under the License, as indicated by a
      copyright notice that is included in or attached to the work
      (an example is provided in the Appendix below).

      &quot;Derivative Works&quot; shall mean any work, whether in Source or Object
      form, that is based on (or derived from) the Work and for which the
      editorial revisions, annotations, elaborations, or other modifications
      represent, as a whole, an original work of authorship. For the purposes
      of this License, Derivative Works shall not include works that remain
      separable from, or merely link (or bind by name) to the interfaces of,
      the Work and Derivative Works thereof.

      &quot;Contribution&quot; shall mean any work of authorship, including
      the original version of the Work and any modifications or additions
      to that Work or Derivative Works thereof, that is intentionally
      submitted to Licensor for inclusion in the Work by the copyright owner
      or by an individual or Legal Entity authorized to submit on behalf of
      the copyright owner. For the purposes of this definition, &quot;submitted&quot;
      means any form of electronic, verbal, or written communication sent
      to the Licensor or its representatives, including but not limited to
      communication on electronic mailing lists, source code control systems,
      and issue tracking systems that are managed by, or on behalf of, the
      Licensor for the purpose of discussing and improving the Work, but
      excluding communication that is conspicuously marked or otherwise
      designated in writing by the copyright owner as &quot;Not a Contribution.&quot;

      &quot;Contributor&quot; shall mean Licensor and any individual or Legal Entity
      on behalf of whom a Contribution has been received by Licensor and
      subsequently incorporated within the Work.

   2. Grant of Copyright License. Subject to the terms and conditions of
      this License, each Contributor hereby grants to You a perpetual,
      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
      copyright license to reproduce, prepare Derivative Works of,
      publicly display, publicly perform, sublicense, and distribute the
      Work and such Derivative Works in Source or Object form.

   3. Grant of Patent License. Subject to the terms and conditions of
      this License, each Contributor hereby grants to You a perpetual,
      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
      (except as stated in this section) patent license to make, have made,
      use, offer to sell, sell, import, and otherwise transfer the Work,
      where such license applies only to those patent claims licensable
      by such Contributor that are necessarily infringed by their
      Contribution(s) alone or by combination of their Contribution(s)
      with the Work to which such Contribution(s) was submitted. If You
      institute patent litigation against any entity (including a
      cross-claim or counterclaim in a lawsuit) alleging that the Work
      or a Contribution incorporated within the Work constitutes direct
      or contributory patent infringement, then any patent licenses
      granted to You under this License for that Work shall terminate
      as of the date such litigation is filed.

   4. Redistribution. You may reproduce and distribute copies of the
      Work or Derivative Works thereof in any medium, with or without
      modifications, and in Source or Object form, provided that You
      meet the following conditions:

      (a) You must give any other recipients of the Work or
          Derivative Works a copy of this License; and

      (b) You must cause any modified files to carry prominent notices
          stating that You changed the files; and

      (c) You must retain, in the Source form of any Derivative Works
          that You distribute, all copyright, patent, trademark, and
          attribution notices from the Source form of the Work,
          excluding those notices that do not pertain to any part of
          the Derivative Works; and

      (d) If the Work includes a &quot;NOTICE&quot; text file as part of its
          distribution, then any Derivative Works that You distribute must
          include a readable copy of the attribution notices contained
          within such NOTICE file, excluding those notices that do not
          pertain to any part of the Derivative Works, in at least one
          of the following places: within a NOTICE text file distributed
          as part of the Derivative Works; within the Source form or
          documentation, if provided along with the Derivative Works; or,
          within a display generated by the Derivative Works, if and
          wherever such third-party notices normally appear. The contents
          of the NOTICE file are for informational purposes only and
          do not modify the License. You may add Your own attribution
          notices within Derivative Works that You distribute, alongside
          or as an addendum to the NOTICE text from the Work, provided
          that such additional attribution notices cannot be construed
          as modifying the License.

      You may add Your own copyright statement to Your modifications and
      may provide additional or different license terms and conditions
      for use, reproduction, or distribution of Your modifications, or
      for any such Derivative Works as a whole, provided Your use,
      reproduction, and distribution of the Work otherwise complies with
      the conditions stated in this License.

   5. Submission of Contributions. Unless You explicitly state otherwise,
      any Contribution intentionally submitted for inclusion in the Work
      by You to the Licensor shall be under the terms and conditions of
      this License, without any additional terms or conditions.
      Notwithstanding the above, nothing herein shall supersede or modify
      the terms of any separate license agreement you may have executed
      with Licensor regarding such Contributions.

   6. Trademarks. This License does not grant permission to use the trade
      names, trademarks, service marks, or product names of the Licensor,
      except as required for reasonable and customary use in describing the
      origin of the Work and reproducing the content of the NOTICE file.

   7. Disclaimer of Warranty. Unless required by applicable law or
      agreed to in writing, Licensor provides the Work (and each
      Contributor provides its Contributions) on an &quot;AS IS&quot; BASIS,
      WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
      implied, including, without limitation, any warranties or conditions
      of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
      PARTICULAR PURPOSE. You are solely responsible for determining the
      appropriateness of using or redistributing the Work and assume any
      risks associated with Your exercise of permissions under this License.

   8. Limitation of Liability. In no event and under no legal theory,
      whether in tort (including negligence), contract, or otherwise,
      unless required by applicable law (such as deliberate and grossly
      negligent acts) or agreed to in writing, shall any Contributor be
      liable to You for damages, including any direct, indirect, special,
      incidental, or consequential damages of any character arising as a
      result of this License or out of the use or inability to use the
      Work (including but not limited to damages for loss of goodwill,
      work stoppage, computer failure or malfunction, or any and all
      other commercial damages or losses), even if such Contributor
      has been advised of the possibility of such damages.

   9. Accepting Warranty or Additional Liability. While redistributing
      the Work or Derivative Works thereof, You may choose to offer,
      and charge a fee for, acceptance of support, warranty, indemnity,
      or other liability obligations and/or rights consistent with this
      License. However, in accepting such obligations, You may act only
      on Your own behalf and on Your sole responsibility, not on behalf
      of any other Contributor, and only if You agree to indemnify,
      defend, and hold each Contributor harmless for any liability
      incurred by, or claims asserted against, such Contributor by reason
      of your accepting any such warranty or additional liability.

   END OF TERMS AND CONDITIONS

   APPENDIX: How to apply the Apache License to your work.

      To apply the Apache License to your work, attach the following
      boilerplate notice, with the fields enclosed by brackets &quot;[]&quot;
      replaced with your own identifying information. (Don&#x27;t include
      the brackets!)  The text should be enclosed in the appropriate
      comment syntax for the file format. We also recommend that a
      file or class name and description of purpose be included on the
      same &quot;printed page&quot; as the copyright notice for easier
      identification within third-party archives.

   Copyright [yyyy] [name of copyright owner]

   Licensed under the Apache License, Version 2.0 (the &quot;License&quot;);
   you may not use this file except in compliance with the License.
   You may obtain a copy of the License at

       http://www.apache.org/licenses/LICENSE-2.0

   Unless required by applicable law or agreed to in writing, software
   distributed under the License is distributed on an &quot;AS IS&quot; BASIS,
   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
   See the License for the specific language governing permissions and
   limitations under the License.</pre>
            </li>
            <li class="license">
                <h3 id="Apache-2.0">Apache License 2.0</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/tikv/async-speed-limit ">async-speed-limit 0.4.2</a></li>
                </ul>
                <pre class="license-text">Apache License
                           Version 2.0, January 2004
                        http://www.apache.org/licenses/

   TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION

   1. Definitions.

      &quot;License&quot; shall mean the terms and conditions for use, reproduction,
      and distribution as defined by Sections 1 through 9 of this document.

      &quot;Licensor&quot; shall mean the copyright owner or entity authorized by
      the copyright owner that is granting the License.

      &quot;Legal Entity&quot; shall mean the union of the acting entity and all
      other entities that control, are controlled by, or are under common
      control with that entity. For the purposes of this definition,
      &quot;control&quot; means (i) the power, direct or indirect, to cause the
      direction or management of such entity, whether by contract or
      otherwise, or (ii) ownership of fifty percent (50%) or more of the
      outstanding shares, or (iii) beneficial ownership of such entity.

      &quot;You&quot; (or &quot;Your&quot;) shall mean an individual or Legal Entity
      exercising permissions granted by this License.

      &quot;Source&quot; form shall mean the preferred form for making modifications,
      including but not limited to software source code, documentation
      source, and configuration files.

      &quot;Object&quot; form shall mean any form resulting from mechanical
      transformation or translation of a Source form, including but
      not limited to compiled object code, generated documentation,
      and conversions to other media types.

      &quot;Work&quot; shall mean the work of authorship, whether in Source or
      Object form, made available under the License, as indicated by a
      copyright notice that is included in or attached to the work
      (an example is provided in the Appendix below).

      &quot;Derivative Works&quot; shall mean any work, whether in Source or Object
      form, that is based on (or derived from) the Work and for which the
      editorial revisions, annotations, elaborations, or other modifications
      represent, as a whole, an original work of authorship. For the purposes
      of this License, Derivative Works shall not include works that remain
      separable from, or merely link (or bind by name) to the interfaces of,
      the Work and Derivative Works thereof.

      &quot;Contribution&quot; shall mean any work of authorship, including
      the original version of the Work and any modifications or additions
      to that Work or Derivative Works thereof, that is intentionally
      submitted to Licensor for inclusion in the Work by the copyright owner
      or by an individual or Legal Entity authorized to submit on behalf of
      the copyright owner. For the purposes of this definition, &quot;submitted&quot;
      means any form of electronic, verbal, or written communication sent
      to the Licensor or its representatives, including but not limited to
      communication on electronic mailing lists, source code control systems,
      and issue tracking systems that are managed by, or on behalf of, the
      Licensor for the purpose of discussing and improving the Work, but
      excluding communication that is conspicuously marked or otherwise
      designated in writing by the copyright owner as &quot;Not a Contribution.&quot;

      &quot;Contributor&quot; shall mean Licensor and any individual or Legal Entity
      on behalf of whom a Contribution has been received by Licensor and
      subsequently incorporated within the Work.

   2. Grant of Copyright License. Subject to the terms and conditions of
      this License, each Contributor hereby grants to You a perpetual,
      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
      copyright license to reproduce, prepare Derivative Works of,
      publicly display, publicly perform, sublicense, and distribute the
      Work and such Derivative Works in Source or Object form.

   3. Grant of Patent License. Subject to the terms and conditions of
      this License, each Contributor hereby grants to You a perpetual,
      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
      (except as stated in this section) patent license to make, have made,
      use, offer to sell, sell, import, and otherwise transfer the Work,
      where such license applies only to those patent claims licensable
      by such Contributor that are necessarily infringed by their
      Contribution(s) alone or by combination of their Contribution(s)
      with the Work to which such Contribution(s) was submitted. If You
      institute patent litigation against any entity (including a
      cross-claim or counterclaim in a lawsuit) alleging that the Work
      or a Contribution incorporated within the Work constitutes direct
      or contributory patent infringement, then any patent licenses
      granted to You under this License for that Work shall terminate
      as of the date such litigation is filed.

   4. Redistribution. You may reproduce and distribute copies of the
      Work or Derivative Works thereof in any medium, with or without
      modifications, and in Source or Object form, provided that You
      meet the following conditions:

      (a) You must give any other recipients of the Work or
          Derivative Works a copy of this License; and

      (b) You must cause any modified files to carry prominent notices
          stating that You changed the files; and

      (c) You must retain, in the Source form of any Derivative Works
          that You distribute, all copyright, patent, trademark, and
          attribution notices from the Source form of the Work,
          excluding those notices that do not pertain to any part of
          the Derivative Works; and

      (d) If the Work includes a &quot;NOTICE&quot; text file as part of its
          distribution, then any Derivative Works that You distribute must
          include a readable copy of the attribution notices contained
          within such NOTICE file, excluding those notices that do not
          pertain to any part of the Derivative Works, in at least one
          of the following places: within a NOTICE text file distributed
          as part of the Derivative Works; within the Source form or
          documentation, if provided along with the Derivative Works; or,
          within a display generated by the Derivative Works, if and
          wherever such third-party notices normally appear. The contents
          of the NOTICE file are for informational purposes only and
          do not modify the License. You may add Your own attribution
          notices within Derivative Works that You distribute, alongside
          or as an addendum to the NOTICE text from the Work, provided
          that such additional attribution notices cannot be construed
          as modifying the License.

      You may add Your own copyright statement to Your modifications and
      may provide additional or different license terms and conditions
      for use, reproduction, or distribution of Your modifications, or
      for any such Derivative Works as a whole, provided Your use,
      reproduction, and distribution of the Work otherwise complies with
      the conditions stated in this License.

   5. Submission of Contributions. Unless You explicitly state otherwise,
      any Contribution intentionally submitted for inclusion in the Work
      by You to the Licensor shall be under the terms and conditions of
      this License, without any additional terms or conditions.
      Notwithstanding the above, nothing herein shall supersede or modify
      the terms of any separate license agreement you may have executed
      with Licensor regarding such Contributions.

   6. Trademarks. This License does not grant permission to use the trade
      names, trademarks, service marks, or product names of the Licensor,
      except as required for reasonable and customary use in describing the
      origin of the Work and reproducing the content of the NOTICE file.

   7. Disclaimer of Warranty. Unless required by applicable law or
      agreed to in writing, Licensor provides the Work (and each
      Contributor provides its Contributions) on an &quot;AS IS&quot; BASIS,
      WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
      implied, including, without limitation, any warranties or conditions
      of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
      PARTICULAR PURPOSE. You are solely responsible for determining the
      appropriateness of using or redistributing the Work and assume any
      risks associated with Your exercise of permissions under this License.

   8. Limitation of Liability. In no event and under no legal theory,
      whether in tort (including negligence), contract, or otherwise,
      unless required by applicable law (such as deliberate and grossly
      negligent acts) or agreed to in writing, shall any Contributor be
      liable to You for damages, including any direct, indirect, special,
      incidental, or consequential damages of any character arising as a
      result of this License or out of the use or inability to use the
      Work (including but not limited to damages for loss of goodwill,
      work stoppage, computer failure or malfunction, or any and all
      other commercial damages or losses), even if such Contributor
      has been advised of the possibility of such damages.

   9. Accepting Warranty or Additional Liability. While redistributing
      the Work or Derivative Works thereof, You may choose to offer,
      and charge a fee for, acceptance of support, warranty, indemnity,
      or other liability obligations and/or rights consistent with this
      License. However, in accepting such obligations, You may act only
      on Your own behalf and on Your sole responsibility, not on behalf
      of any other Contributor, and only if You agree to indemnify,
      defend, and hold each Contributor harmless for any liability
      incurred by, or claims asserted against, such Contributor by reason
      of your accepting any such warranty or additional liability.

   END OF TERMS AND CONDITIONS

   APPENDIX: How to apply the Apache License to your work.

      To apply the Apache License to your work, attach the following
      boilerplate notice, with the fields enclosed by brackets &quot;{}&quot;
      replaced with your own identifying information. (Don&#x27;t include
      the brackets!)  The text should be enclosed in the appropriate
      comment syntax for the file format. We also recommend that a
      file or class name and description of purpose be included on the
      same &quot;printed page&quot; as the copyright notice for easier
      identification within third-party archives.

   Copyright {}

   Licensed under the Apache License, Version 2.0 (the &quot;License&quot;);
   you may not use this file except in compliance with the License.
   You may obtain a copy of the License at

       http://www.apache.org/licenses/LICENSE-2.0

   Unless required by applicable law or agreed to in writing, software
   distributed under the License is distributed on an &quot;AS IS&quot; BASIS,
   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
   See the License for the specific language governing permissions and
   limitations under the License.
</pre>
            </li>
            <li class="license">
                <h3 id="Apache-2.0">Apache License 2.0</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/pyfisch/httpdate ">httpdate 1.0.3</a></li>
                </ul>
                <pre class="license-text">Apache License
Version 2.0, January 2004
http://www.apache.org/licenses/

TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION

1. Definitions.

&quot;License&quot; shall mean the terms and conditions for use, reproduction,
and distribution as defined by Sections 1 through 9 of this document.

&quot;Licensor&quot; shall mean the copyright owner or entity authorized by
the copyright owner that is granting the License.

&quot;Legal Entity&quot; shall mean the union of the acting entity and all
other entities that control, are controlled by, or are under common
control with that entity. For the purposes of this definition,
&quot;control&quot; means (i) the power, direct or indirect, to cause the
direction or management of such entity, whether by contract or
otherwise, or (ii) ownership of fifty percent (50%) or more of the
outstanding shares, or (iii) beneficial ownership of such entity.

&quot;You&quot; (or &quot;Your&quot;) shall mean an individual or Legal Entity
exercising permissions granted by this License.

&quot;Source&quot; form shall mean the preferred form for making modifications,
including but not limited to software source code, documentation
source, and configuration files.

&quot;Object&quot; form shall mean any form resulting from mechanical
transformation or translation of a Source form, including but
not limited to compiled object code, generated documentation,
and conversions to other media types.

&quot;Work&quot; shall mean the work of authorship, whether in Source or
Object form, made available under the License, as indicated by a
copyright notice that is included in or attached to the work
(an example is provided in the Appendix below).

&quot;Derivative Works&quot; shall mean any work, whether in Source or Object
form, that is based on (or derived from) the Work and for which the
editorial revisions, annotations, elaborations, or other modifications
represent, as a whole, an original work of authorship. For the purposes
of this License, Derivative Works shall not include works that remain
separable from, or merely link (or bind by name) to the interfaces of,
the Work and Derivative Works thereof.

&quot;Contribution&quot; shall mean any work of authorship, including
the original version of the Work and any modifications or additions
to that Work or Derivative Works thereof, that is intentionally
submitted to Licensor for inclusion in the Work by the copyright owner
or by an individual or Legal Entity authorized to submit on behalf of
the copyright owner. For the purposes of this definition, &quot;submitted&quot;
means any form of electronic, verbal, or written communication sent
to the Licensor or its representatives, including but not limited to
communication on electronic mailing lists, source code control systems,
and issue tracking systems that are managed by, or on behalf of, the
Licensor for the purpose of discussing and improving the Work, but
excluding communication that is conspicuously marked or otherwise
designated in writing by the copyright owner as &quot;Not a Contribution.&quot;

&quot;Contributor&quot; shall mean Licensor and any individual or Legal Entity
on behalf of whom a Contribution has been received by Licensor and
subsequently incorporated within the Work.

2. Grant of Copyright License. Subject to the terms and conditions of
this License, each Contributor hereby grants to You a perpetual,
worldwide, non-exclusive, no-charge, royalty-free, irrevocable
copyright license to reproduce, prepare Derivative Works of,
publicly display, publicly perform, sublicense, and distribute the
Work and such Derivative Works in Source or Object form.

3. Grant of Patent License. Subject to the terms and conditions of
this License, each Contributor hereby grants to You a perpetual,
worldwide, non-exclusive, no-charge, royalty-free, irrevocable
(except as stated in this section) patent license to make, have made,
use, offer to sell, sell, import, and otherwise transfer the Work,
where such license applies only to those patent claims licensable
by such Contributor that are necessarily infringed by their
Contribution(s) alone or by combination of their Contribution(s)
with the Work to which such Contribution(s) was submitted. If You
institute patent litigation against any entity (including a
cross-claim or counterclaim in a lawsuit) alleging that the Work
or a Contribution incorporated within the Work constitutes direct
or contributory patent infringement, then any patent licenses
granted to You under this License for that Work shall terminate
as of the date such litigation is filed.

4. Redistribution. You may reproduce and distribute copies of the
Work or Derivative Works thereof in any medium, with or without
modifications, and in Source or Object form, provided that You
meet the following conditions:

(a) You must give any other recipients of the Work or
Derivative Works a copy of this License; and

(b) You must cause any modified files to carry prominent notices
stating that You changed the files; and

(c) You must retain, in the Source form of any Derivative Works
that You distribute, all copyright, patent, trademark, and
attribution notices from the Source form of the Work,
excluding those notices that do not pertain to any part of
the Derivative Works; and

(d) If the Work includes a &quot;NOTICE&quot; text file as part of its
distribution, then any Derivative Works that You distribute must
include a readable copy of the attribution notices contained
within such NOTICE file, excluding those notices that do not
pertain to any part of the Derivative Works, in at least one
of the following places: within a NOTICE text file distributed
as part of the Derivative Works; within the Source form or
documentation, if provided along with the Derivative Works; or,
within a display generated by the Derivative Works, if and
wherever such third-party notices normally appear. The contents
of the NOTICE file are for informational purposes only and
do not modify the License. You may add Your own attribution
notices within Derivative Works that You distribute, alongside
or as an addendum to the NOTICE text from the Work, provided
that such additional attribution notices cannot be construed
as modifying the License.

You may add Your own copyright statement to Your modifications and
may provide additional or different license terms and conditions
for use, reproduction, or distribution of Your modifications, or
for any such Derivative Works as a whole, provided Your use,
reproduction, and distribution of the Work otherwise complies with
the conditions stated in this License.

5. Submission of Contributions. Unless You explicitly state otherwise,
any Contribution intentionally submitted for inclusion in the Work
by You to the Licensor shall be under the terms and conditions of
this License, without any additional terms or conditions.
Notwithstanding the above, nothing herein shall supersede or modify
the terms of any separate license agreement you may have executed
with Licensor regarding such Contributions.

6. Trademarks. This License does not grant permission to use the trade
names, trademarks, service marks, or product names of the Licensor,
except as required for reasonable and customary use in describing the
origin of the Work and reproducing the content of the NOTICE file.

7. Disclaimer of Warranty. Unless required by applicable law or
agreed to in writing, Licensor provides the Work (and each
Contributor provides its Contributions) on an &quot;AS IS&quot; BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
implied, including, without limitation, any warranties or conditions
of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
PARTICULAR PURPOSE. You are solely responsible for determining the
appropriateness of using or redistributing the Work and assume any
risks associated with Your exercise of permissions under this License.

8. Limitation of Liability. In no event and under no legal theory,
whether in tort (including negligence), contract, or otherwise,
unless required by applicable law (such as deliberate and grossly
negligent acts) or agreed to in writing, shall any Contributor be
liable to You for damages, including any direct, indirect, special,
incidental, or consequential damages of any character arising as a
result of this License or out of the use or inability to use the
Work (including but not limited to damages for loss of goodwill,
work stoppage, computer failure or malfunction, or any and all
other commercial damages or losses), even if such Contributor
has been advised of the possibility of such damages.

9. Accepting Warranty or Additional Liability. While redistributing
the Work or Derivative Works thereof, You may choose to offer,
and charge a fee for, acceptance of support, warranty, indemnity,
or other liability obligations and/or rights consistent with this
License. However, in accepting such obligations, You may act only
on Your own behalf and on Your sole responsibility, not on behalf
of any other Contributor, and only if You agree to indemnify,
defend, and hold each Contributor harmless for any liability
incurred by, or claims asserted against, such Contributor by reason
of your accepting any such warranty or additional liability.

END OF TERMS AND CONDITIONS

APPENDIX: How to apply the Apache License to your work.

To apply the Apache License to your work, attach the following
boilerplate notice, with the fields enclosed by brackets &quot;[]&quot;
replaced with your own identifying information. (Don&#x27;t include
the brackets!)  The text should be enclosed in the appropriate
comment syntax for the file format. We also recommend that a
file or class name and description of purpose be included on the
same &quot;printed page&quot; as the copyright notice for easier
identification within third-party archives.

Copyright [yyyy] [name of copyright owner]

Licensed under the Apache License, Version 2.0 (the &quot;License&quot;);
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an &quot;AS IS&quot; BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
</pre>
            </li>
            <li class="license">
                <h3 id="Apache-2.0">Apache License 2.0</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/nical/android_system_properties ">android_system_properties 0.1.5</a></li>
                    <li><a href=" https://github.com/zrzka/anes-rs ">anes 0.1.6</a></li>
                    <li><a href=" https://github.com/zowens/crc32c ">crc32c 0.6.8</a></li>
                    <li><a href=" https://github.com/starkat99/half-rs ">half 2.4.1</a></li>
                    <li><a href=" https://github.com/veddan/rust-htmlescape ">htmlescape 0.3.1</a></li>
                    <li><a href=" https://gitlab.com/kornelski/http-serde ">http-serde 1.1.3</a></li>
                    <li><a href=" https://gitlab.com/kornelski/http-serde ">http-serde 2.1.1</a></li>
                    <li><a href=" https://github.com/TedDriggs/ident_case ">ident_case 1.0.1</a></li>
                    <li><a href=" https://github.com/awslabs/aws-lambda-rust-runtime ">lambda_http 0.8.3</a></li>
                    <li><a href=" https://github.com/awslabs/aws-lambda-rust-runtime ">lambda_runtime 0.13.0</a></li>
                    <li><a href=" https://github.com/awslabs/aws-lambda-rust-runtime ">lambda_runtime 0.8.3</a></li>
                    <li><a href=" https://github.com/awslabs/aws-lambda-rust-runtime ">lambda_runtime_api_client 0.11.1</a></li>
                    <li><a href=" https://github.com/awslabs/aws-lambda-rust-runtime ">lambda_runtime_api_client 0.8.0</a></li>
                    <li><a href=" https://github.com/stainless-steel/md5 ">md5 0.7.0</a></li>
                    <li><a href=" https://github.com/faern/oneshot ">oneshot 0.1.8</a></li>
                    <li><a href=" https://github.com/someguynamedjosh/ouroboros ">ouroboros 0.18.4</a></li>
                    <li><a href=" https://github.com/someguynamedjosh/ouroboros ">ouroboros_macro 0.18.4</a></li>
                    <li><a href=" https://github.com/jamesmunns/postcard ">postcard 1.0.10</a></li>
                    <li><a href=" https://github.com/eminence/procfs ">procfs-core 0.16.0</a></li>
                    <li><a href=" https://github.com/eminence/procfs ">procfs 0.16.0</a></li>
                    <li><a href=" https://github.com/comex/rust-shlex ">shlex 1.3.0</a></li>
                    <li><a href=" https://github.com/jedisct1/rust-siphash ">siphasher 0.3.11</a></li>
                    <li><a href=" https://github.com/mullvad/system-configuration-rs ">system-configuration-sys 0.5.0</a></li>
                    <li><a href=" https://github.com/mullvad/system-configuration-rs ">system-configuration 0.5.1</a></li>
                    <li><a href=" https://pijul.org/darcs/user ">username 0.2.0</a></li>
                    <li><a href=" https://github.com/retep998/winapi-rs ">winapi-i686-pc-windows-gnu 0.4.0</a></li>
                    <li><a href=" https://github.com/retep998/winapi-rs ">winapi-x86_64-pc-windows-gnu 0.4.0</a></li>
                </ul>
                <pre class="license-text">Apache License
Version 2.0, January 2004
http://www.apache.org/licenses/

TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION

1. Definitions.

&quot;License&quot; shall mean the terms and conditions for use, reproduction, and distribution as defined by Sections 1 through 9 of this document.

&quot;Licensor&quot; shall mean the copyright owner or entity authorized by the copyright owner that is granting the License.

&quot;Legal Entity&quot; shall mean the union of the acting entity and all other entities that control, are controlled by, or are under common control with that entity. For the purposes of this definition, &quot;control&quot; means (i) the power, direct or indirect, to cause the direction or management of such entity, whether by contract or otherwise, or (ii) ownership of fifty percent (50%) or more of the outstanding shares, or (iii) beneficial ownership of such entity.

&quot;You&quot; (or &quot;Your&quot;) shall mean an individual or Legal Entity exercising permissions granted by this License.

&quot;Source&quot; form shall mean the preferred form for making modifications, including but not limited to software source code, documentation source, and configuration files.

&quot;Object&quot; form shall mean any form resulting from mechanical transformation or translation of a Source form, including but not limited to compiled object code, generated documentation, and conversions to other media types.

&quot;Work&quot; shall mean the work of authorship, whether in Source or Object form, made available under the License, as indicated by a copyright notice that is included in or attached to the work (an example is provided in the Appendix below).

&quot;Derivative Works&quot; shall mean any work, whether in Source or Object form, that is based on (or derived from) the Work and for which the editorial revisions, annotations, elaborations, or other modifications represent, as a whole, an original work of authorship. For the purposes of this License, Derivative Works shall not include works that remain separable from, or merely link (or bind by name) to the interfaces of, the Work and Derivative Works thereof.

&quot;Contribution&quot; shall mean any work of authorship, including the original version of the Work and any modifications or additions to that Work or Derivative Works thereof, that is intentionally submitted to Licensor for inclusion in the Work by the copyright owner or by an individual or Legal Entity authorized to submit on behalf of the copyright owner. For the purposes of this definition, &quot;submitted&quot; means any form of electronic, verbal, or written communication sent to the Licensor or its representatives, including but not limited to communication on electronic mailing lists, source code control systems, and issue tracking systems that are managed by, or on behalf of, the Licensor for the purpose of discussing and improving the Work, but excluding communication that is conspicuously marked or otherwise designated in writing by the copyright owner as &quot;Not a Contribution.&quot;

&quot;Contributor&quot; shall mean Licensor and any individual or Legal Entity on behalf of whom a Contribution has been received by Licensor and subsequently incorporated within the Work.

2. Grant of Copyright License. Subject to the terms and conditions of this License, each Contributor hereby grants to You a perpetual, worldwide, non-exclusive, no-charge, royalty-free, irrevocable copyright license to reproduce, prepare Derivative Works of, publicly display, publicly perform, sublicense, and distribute the Work and such Derivative Works in Source or Object form.

3. Grant of Patent License. Subject to the terms and conditions of this License, each Contributor hereby grants to You a perpetual, worldwide, non-exclusive, no-charge, royalty-free, irrevocable (except as stated in this section) patent license to make, have made, use, offer to sell, sell, import, and otherwise transfer the Work, where such license applies only to those patent claims licensable by such Contributor that are necessarily infringed by their Contribution(s) alone or by combination of their Contribution(s) with the Work to which such Contribution(s) was submitted. If You institute patent litigation against any entity (including a cross-claim or counterclaim in a lawsuit) alleging that the Work or a Contribution incorporated within the Work constitutes direct or contributory patent infringement, then any patent licenses granted to You under this License for that Work shall terminate as of the date such litigation is filed.

4. Redistribution. You may reproduce and distribute copies of the Work or Derivative Works thereof in any medium, with or without modifications, and in Source or Object form, provided that You meet the following conditions:

     (a) You must give any other recipients of the Work or Derivative Works a copy of this License; and

     (b) You must cause any modified files to carry prominent notices stating that You changed the files; and

     (c) You must retain, in the Source form of any Derivative Works that You distribute, all copyright, patent, trademark, and attribution notices from the Source form of the Work, excluding those notices that do not pertain to any part of the Derivative Works; and

     (d) If the Work includes a &quot;NOTICE&quot; text file as part of its distribution, then any Derivative Works that You distribute must include a readable copy of the attribution notices contained within such NOTICE file, excluding those notices that do not pertain to any part of the Derivative Works, in at least one of the following places: within a NOTICE text file distributed as part of the Derivative Works; within the Source form or documentation, if provided along with the Derivative Works; or, within a display generated by the Derivative Works, if and wherever such third-party notices normally appear. The contents of the NOTICE file are for informational purposes only and do not modify the License. You may add Your own attribution notices within Derivative Works that You distribute, alongside or as an addendum to the NOTICE text from the Work, provided that such additional attribution notices cannot be construed as modifying the License.

     You may add Your own copyright statement to Your modifications and may provide additional or different license terms and conditions for use, reproduction, or distribution of Your modifications, or for any such Derivative Works as a whole, provided Your use, reproduction, and distribution of the Work otherwise complies with the conditions stated in this License.

5. Submission of Contributions. Unless You explicitly state otherwise, any Contribution intentionally submitted for inclusion in the Work by You to the Licensor shall be under the terms and conditions of this License, without any additional terms or conditions. Notwithstanding the above, nothing herein shall supersede or modify the terms of any separate license agreement you may have executed with Licensor regarding such Contributions.

6. Trademarks. This License does not grant permission to use the trade names, trademarks, service marks, or product names of the Licensor, except as required for reasonable and customary use in describing the origin of the Work and reproducing the content of the NOTICE file.

7. Disclaimer of Warranty. Unless required by applicable law or agreed to in writing, Licensor provides the Work (and each Contributor provides its Contributions) on an &quot;AS IS&quot; BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied, including, without limitation, any warranties or conditions of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A PARTICULAR PURPOSE. You are solely responsible for determining the appropriateness of using or redistributing the Work and assume any risks associated with Your exercise of permissions under this License.

8. Limitation of Liability. In no event and under no legal theory, whether in tort (including negligence), contract, or otherwise, unless required by applicable law (such as deliberate and grossly negligent acts) or agreed to in writing, shall any Contributor be liable to You for damages, including any direct, indirect, special, incidental, or consequential damages of any character arising as a result of this License or out of the use or inability to use the Work (including but not limited to damages for loss of goodwill, work stoppage, computer failure or malfunction, or any and all other commercial damages or losses), even if such Contributor has been advised of the possibility of such damages.

9. Accepting Warranty or Additional Liability. While redistributing the Work or Derivative Works thereof, You may choose to offer, and charge a fee for, acceptance of support, warranty, indemnity, or other liability obligations and/or rights consistent with this License. However, in accepting such obligations, You may act only on Your own behalf and on Your sole responsibility, not on behalf of any other Contributor, and only if You agree to indemnify, defend, and hold each Contributor harmless for any liability incurred by, or claims asserted against, such Contributor by reason of your accepting any such warranty or additional liability.

END OF TERMS AND CONDITIONS

APPENDIX: How to apply the Apache License to your work.

To apply the Apache License to your work, attach the following boilerplate notice, with the fields enclosed by brackets &quot;[]&quot; replaced with your own identifying information. (Don&#x27;t include the brackets!)  The text should be enclosed in the appropriate comment syntax for the file format. We also recommend that a file or class name and description of purpose be included on the same &quot;printed page&quot; as the copyright notice for easier identification within third-party archives.

Copyright [yyyy] [name of copyright owner]

Licensed under the Apache License, Version 2.0 (the &quot;License&quot;);
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an &quot;AS IS&quot; BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
</pre>
            </li>
            <li class="license">
                <h3 id="Apache-2.0">Apache License 2.0</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/chronotope/chrono ">chrono 0.4.38</a></li>
                </ul>
                <pre class="license-text">Rust-chrono is dual-licensed under The MIT License [1] and
Apache 2.0 License [2]. Copyright (c) 2014--2017, Kang Seonghoon and
contributors.

Nota Bene: This is same as the Rust Project&#x27;s own license.


[1]: &lt;http://opensource.org/licenses/MIT&gt;, which is reproduced below:

~~~~
The MIT License (MIT)

Copyright (c) 2014, Kang Seonghoon.

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the &quot;Software&quot;), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in
all copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
THE SOFTWARE.
~~~~


[2]: &lt;http://www.apache.org/licenses/LICENSE-2.0&gt;, which is reproduced below:

~~~~
                              Apache License
                        Version 2.0, January 2004
                     http://www.apache.org/licenses/

TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION

1. Definitions.

   &quot;License&quot; shall mean the terms and conditions for use, reproduction,
   and distribution as defined by Sections 1 through 9 of this document.

   &quot;Licensor&quot; shall mean the copyright owner or entity authorized by
   the copyright owner that is granting the License.

   &quot;Legal Entity&quot; shall mean the union of the acting entity and all
   other entities that control, are controlled by, or are under common
   control with that entity. For the purposes of this definition,
   &quot;control&quot; means (i) the power, direct or indirect, to cause the
   direction or management of such entity, whether by contract or
   otherwise, or (ii) ownership of fifty percent (50%) or more of the
   outstanding shares, or (iii) beneficial ownership of such entity.

   &quot;You&quot; (or &quot;Your&quot;) shall mean an individual or Legal Entity
   exercising permissions granted by this License.

   &quot;Source&quot; form shall mean the preferred form for making modifications,
   including but not limited to software source code, documentation
   source, and configuration files.

   &quot;Object&quot; form shall mean any form resulting from mechanical
   transformation or translation of a Source form, including but
   not limited to compiled object code, generated documentation,
   and conversions to other media types.

   &quot;Work&quot; shall mean the work of authorship, whether in Source or
   Object form, made available under the License, as indicated by a
   copyright notice that is included in or attached to the work
   (an example is provided in the Appendix below).

   &quot;Derivative Works&quot; shall mean any work, whether in Source or Object
   form, that is based on (or derived from) the Work and for which the
   editorial revisions, annotations, elaborations, or other modifications
   represent, as a whole, an original work of authorship. For the purposes
   of this License, Derivative Works shall not include works that remain
   separable from, or merely link (or bind by name) to the interfaces of,
   the Work and Derivative Works thereof.

   &quot;Contribution&quot; shall mean any work of authorship, including
   the original version of the Work and any modifications or additions
   to that Work or Derivative Works thereof, that is intentionally
   submitted to Licensor for inclusion in the Work by the copyright owner
   or by an individual or Legal Entity authorized to submit on behalf of
   the copyright owner. For the purposes of this definition, &quot;submitted&quot;
   means any form of electronic, verbal, or written communication sent
   to the Licensor or its representatives, including but not limited to
   communication on electronic mailing lists, source code control systems,
   and issue tracking systems that are managed by, or on behalf of, the
   Licensor for the purpose of discussing and improving the Work, but
   excluding communication that is conspicuously marked or otherwise
   designated in writing by the copyright owner as &quot;Not a Contribution.&quot;

   &quot;Contributor&quot; shall mean Licensor and any individual or Legal Entity
   on behalf of whom a Contribution has been received by Licensor and
   subsequently incorporated within the Work.

2. Grant of Copyright License. Subject to the terms and conditions of
   this License, each Contributor hereby grants to You a perpetual,
   worldwide, non-exclusive, no-charge, royalty-free, irrevocable
   copyright license to reproduce, prepare Derivative Works of,
   publicly display, publicly perform, sublicense, and distribute the
   Work and such Derivative Works in Source or Object form.

3. Grant of Patent License. Subject to the terms and conditions of
   this License, each Contributor hereby grants to You a perpetual,
   worldwide, non-exclusive, no-charge, royalty-free, irrevocable
   (except as stated in this section) patent license to make, have made,
   use, offer to sell, sell, import, and otherwise transfer the Work,
   where such license applies only to those patent claims licensable
   by such Contributor that are necessarily infringed by their
   Contribution(s) alone or by combination of their Contribution(s)
   with the Work to which such Contribution(s) was submitted. If You
   institute patent litigation against any entity (including a
   cross-claim or counterclaim in a lawsuit) alleging that the Work
   or a Contribution incorporated within the Work constitutes direct
   or contributory patent infringement, then any patent licenses
   granted to You under this License for that Work shall terminate
   as of the date such litigation is filed.

4. Redistribution. You may reproduce and distribute copies of the
   Work or Derivative Works thereof in any medium, with or without
   modifications, and in Source or Object form, provided that You
   meet the following conditions:

   (a) You must give any other recipients of the Work or
       Derivative Works a copy of this License; and

   (b) You must cause any modified files to carry prominent notices
       stating that You changed the files; and

   (c) You must retain, in the Source form of any Derivative Works
       that You distribute, all copyright, patent, trademark, and
       attribution notices from the Source form of the Work,
       excluding those notices that do not pertain to any part of
       the Derivative Works; and

   (d) If the Work includes a &quot;NOTICE&quot; text file as part of its
       distribution, then any Derivative Works that You distribute must
       include a readable copy of the attribution notices contained
       within such NOTICE file, excluding those notices that do not
       pertain to any part of the Derivative Works, in at least one
       of the following places: within a NOTICE text file distributed
       as part of the Derivative Works; within the Source form or
       documentation, if provided along with the Derivative Works; or,
       within a display generated by the Derivative Works, if and
       wherever such third-party notices normally appear. The contents
       of the NOTICE file are for informational purposes only and
       do not modify the License. You may add Your own attribution
       notices within Derivative Works that You distribute, alongside
       or as an addendum to the NOTICE text from the Work, provided
       that such additional attribution notices cannot be construed
       as modifying the License.

   You may add Your own copyright statement to Your modifications and
   may provide additional or different license terms and conditions
   for use, reproduction, or distribution of Your modifications, or
   for any such Derivative Works as a whole, provided Your use,
   reproduction, and distribution of the Work otherwise complies with
   the conditions stated in this License.

5. Submission of Contributions. Unless You explicitly state otherwise,
   any Contribution intentionally submitted for inclusion in the Work
   by You to the Licensor shall be under the terms and conditions of
   this License, without any additional terms or conditions.
   Notwithstanding the above, nothing herein shall supersede or modify
   the terms of any separate license agreement you may have executed
   with Licensor regarding such Contributions.

6. Trademarks. This License does not grant permission to use the trade
   names, trademarks, service marks, or product names of the Licensor,
   except as required for reasonable and customary use in describing the
   origin of the Work and reproducing the content of the NOTICE file.

7. Disclaimer of Warranty. Unless required by applicable law or
   agreed to in writing, Licensor provides the Work (and each
   Contributor provides its Contributions) on an &quot;AS IS&quot; BASIS,
   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
   implied, including, without limitation, any warranties or conditions
   of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
   PARTICULAR PURPOSE. You are solely responsible for determining the
   appropriateness of using or redistributing the Work and assume any
   risks associated with Your exercise of permissions under this License.

8. Limitation of Liability. In no event and under no legal theory,
   whether in tort (including negligence), contract, or otherwise,
   unless required by applicable law (such as deliberate and grossly
   negligent acts) or agreed to in writing, shall any Contributor be
   liable to You for damages, including any direct, indirect, special,
   incidental, or consequential damages of any character arising as a
   result of this License or out of the use or inability to use the
   Work (including but not limited to damages for loss of goodwill,
   work stoppage, computer failure or malfunction, or any and all
   other commercial damages or losses), even if such Contributor
   has been advised of the possibility of such damages.

9. Accepting Warranty or Additional Liability. While redistributing
   the Work or Derivative Works thereof, You may choose to offer,
   and charge a fee for, acceptance of support, warranty, indemnity,
   or other liability obligations and/or rights consistent with this
   License. However, in accepting such obligations, You may act only
   on Your own behalf and on Your sole responsibility, not on behalf
   of any other Contributor, and only if You agree to indemnify,
   defend, and hold each Contributor harmless for any liability
   incurred by, or claims asserted against, such Contributor by reason
   of your accepting any such warranty or additional liability.

END OF TERMS AND CONDITIONS

APPENDIX: How to apply the Apache License to your work.

   To apply the Apache License to your work, attach the following
   boilerplate notice, with the fields enclosed by brackets &quot;[]&quot;
   replaced with your own identifying information. (Don&#x27;t include
   the brackets!)  The text should be enclosed in the appropriate
   comment syntax for the file format. We also recommend that a
   file or class name and description of purpose be included on the
   same &quot;printed page&quot; as the copyright notice for easier
   identification within third-party archives.

Copyright [yyyy] [name of copyright owner]

Licensed under the Apache License, Version 2.0 (the &quot;License&quot;);
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

	http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an &quot;AS IS&quot; BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
~~~~

</pre>
            </li>
            <li class="license">
                <h3 id="BSD-3-Clause">BSD 3-Clause &quot;New&quot; or &quot;Revised&quot; License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/ibraheemdev/matchit ">matchit 0.7.3</a></li>
                </ul>
                <pre class="license-text">BSD 3-Clause License

Copyright (c) 2013, Julien Schmidt
All rights reserved.

Redistribution and use in source and binary forms, with or without
modification, are permitted provided that the following conditions are met:

1. Redistributions of source code must retain the above copyright notice, this
   list of conditions and the following disclaimer.

2. Redistributions in binary form must reproduce the above copyright notice,
   this list of conditions and the following disclaimer in the documentation
   and/or other materials provided with the distribution.

3. Neither the name of the copyright holder nor the names of its
   contributors may be used to endorse or promote products derived from
   this software without specific prior written permission.

THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS &quot;AS IS&quot;
AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE
FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
</pre>
            </li>
            <li class="license">
                <h3 id="BSD-3-Clause">BSD 3-Clause &quot;New&quot; or &quot;Revised&quot; License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/CurrySoftware/rust-stemmers ">rust-stemmers 1.2.0</a></li>
                </ul>
                <pre class="license-text">Copyright (c) 2001, Dr Martin Porter
Copyright (c) 2004,2005, Richard Boulton
All rights reserved.

Redistribution and use in source and binary forms, with or without
modification, are permitted provided that the following conditions
are met:

  1. Redistributions of source code must retain the above copyright notice,
     this list of conditions and the following disclaimer.
  2. Redistributions in binary form must reproduce the above copyright notice,
     this list of conditions and the following disclaimer in the documentation
     and/or other materials provided with the distribution.
  3. Neither the name of the Snowball project nor the names of its contributors
     may be used to endorse or promote products derived from this software
     without specific prior written permission.

THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS &quot;AS IS&quot; AND
ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR
ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
(INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON
ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
(INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.</pre>
            </li>
            <li class="license">
                <h3 id="BSD-3-Clause">BSD 3-Clause &quot;New&quot; or &quot;Revised&quot; License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/dalek-cryptography/subtle ">subtle 2.6.1</a></li>
                </ul>
                <pre class="license-text">Copyright (c) 2016-2017 Isis Agora Lovecruft, Henry de Valence. All rights reserved.
Copyright (c) 2016-2024 Isis Agora Lovecruft. All rights reserved.

Redistribution and use in source and binary forms, with or without
modification, are permitted provided that the following conditions are
met:

1. Redistributions of source code must retain the above copyright
notice, this list of conditions and the following disclaimer.

2. Redistributions in binary form must reproduce the above copyright
notice, this list of conditions and the following disclaimer in the
documentation and/or other materials provided with the distribution.

3. Neither the name of the copyright holder nor the names of its
contributors may be used to endorse or promote products derived from
this software without specific prior written permission.

THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS &quot;AS
IS&quot; AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A
PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
HOLDER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED
TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 
</pre>
            </li>
            <li class="license">
                <h3 id="BSD-3-Clause">BSD 3-Clause &quot;New&quot; or &quot;Revised&quot; License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/sebcrozet/instant ">instant 0.1.13</a></li>
                </ul>
                <pre class="license-text">Copyright (c) 2019, Sébastien Crozet
All rights reserved.

Redistribution and use in source and binary forms, with or without
modification, are permitted provided that the following conditions are met:

1. Redistributions of source code must retain the above copyright notice, this
   list of conditions and the following disclaimer.

2. Redistributions in binary form must reproduce the above copyright notice,
   this list of conditions and the following disclaimer in the documentation
   and/or other materials provided with the distribution.

3. Neither the name of the author nor the names of its contributors may be used
   to endorse or promote products derived from this software without specific
   prior written permission.

THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS &quot;AS IS&quot; AND
ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE
FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
</pre>
            </li>
            <li class="license">
                <h3 id="BSD-3-Clause">BSD 3-Clause &quot;New&quot; or &quot;Revised&quot; License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/hsivonen/encoding_rs ">encoding_rs 0.8.32</a></li>
                </ul>
                <pre class="license-text">Copyright © WHATWG (Apple, Google, Mozilla, Microsoft).

Redistribution and use in source and binary forms, with or without
modification, are permitted provided that the following conditions are met:

1. Redistributions of source code must retain the above copyright notice, this
   list of conditions and the following disclaimer.

2. Redistributions in binary form must reproduce the above copyright notice,
   this list of conditions and the following disclaimer in the documentation
   and/or other materials provided with the distribution.

3. Neither the name of the copyright holder nor the names of its
   contributors may be used to endorse or promote products derived from
   this software without specific prior written permission.

THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS &quot;AS IS&quot;
AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE
FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
</pre>
            </li>
            <li class="license">
                <h3 id="CC0-1.0">Creative Commons Zero v1.0 Universal</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/cesarb/constant_time_eq ">constant_time_eq 0.1.5</a></li>
                    <li><a href=" https://crates.io/crates/encoding-index-japanese ">encoding-index-japanese 1.20141219.5</a></li>
                    <li><a href=" https://crates.io/crates/encoding-index-korean ">encoding-index-korean 1.20141219.5</a></li>
                    <li><a href=" https://crates.io/crates/encoding-index-simpchinese ">encoding-index-simpchinese 1.20141219.5</a></li>
                    <li><a href=" https://crates.io/crates/encoding-index-singlebyte ">encoding-index-singlebyte 1.20141219.5</a></li>
                    <li><a href=" https://crates.io/crates/encoding-index-tradchinese ">encoding-index-tradchinese 1.20141219.5</a></li>
                    <li><a href=" https://crates.io/crates/encoding_index_tests ">encoding_index_tests 0.1.4</a></li>
                </ul>
                <pre class="license-text">Creative Commons Legal Code

CC0 1.0 Universal

    CREATIVE COMMONS CORPORATION IS NOT A LAW FIRM AND DOES NOT PROVIDE
    LEGAL SERVICES. DISTRIBUTION OF THIS DOCUMENT DOES NOT CREATE AN
    ATTORNEY-CLIENT RELATIONSHIP. CREATIVE COMMONS PROVIDES THIS
    INFORMATION ON AN &quot;AS-IS&quot; BASIS. CREATIVE COMMONS MAKES NO WARRANTIES
    REGARDING THE USE OF THIS DOCUMENT OR THE INFORMATION OR WORKS
    PROVIDED HEREUNDER, AND DISCLAIMS LIABILITY FOR DAMAGES RESULTING FROM
    THE USE OF THIS DOCUMENT OR THE INFORMATION OR WORKS PROVIDED
    HEREUNDER.

Statement of Purpose

The laws of most jurisdictions throughout the world automatically confer
exclusive Copyright and Related Rights (defined below) upon the creator
and subsequent owner(s) (each and all, an &quot;owner&quot;) of an original work of
authorship and/or a database (each, a &quot;Work&quot;).

Certain owners wish to permanently relinquish those rights to a Work for
the purpose of contributing to a commons of creative, cultural and
scientific works (&quot;Commons&quot;) that the public can reliably and without fear
of later claims of infringement build upon, modify, incorporate in other
works, reuse and redistribute as freely as possible in any form whatsoever
and for any purposes, including without limitation commercial purposes.
These owners may contribute to the Commons to promote the ideal of a free
culture and the further production of creative, cultural and scientific
works, or to gain reputation or greater distribution for their Work in
part through the use and efforts of others.

For these and/or other purposes and motivations, and without any
expectation of additional consideration or compensation, the person
associating CC0 with a Work (the &quot;Affirmer&quot;), to the extent that he or she
is an owner of Copyright and Related Rights in the Work, voluntarily
elects to apply CC0 to the Work and publicly distribute the Work under its
terms, with knowledge of his or her Copyright and Related Rights in the
Work and the meaning and intended legal effect of CC0 on those rights.

1. Copyright and Related Rights. A Work made available under CC0 may be
protected by copyright and related or neighboring rights (&quot;Copyright and
Related Rights&quot;). Copyright and Related Rights include, but are not
limited to, the following:

  i. the right to reproduce, adapt, distribute, perform, display,
     communicate, and translate a Work;
 ii. moral rights retained by the original author(s) and/or performer(s);
iii. publicity and privacy rights pertaining to a person&#x27;s image or
     likeness depicted in a Work;
 iv. rights protecting against unfair competition in regards to a Work,
     subject to the limitations in paragraph 4(a), below;
  v. rights protecting the extraction, dissemination, use and reuse of data
     in a Work;
 vi. database rights (such as those arising under Directive 96/9/EC of the
     European Parliament and of the Council of 11 March 1996 on the legal
     protection of databases, and under any national implementation
     thereof, including any amended or successor version of such
     directive); and
vii. other similar, equivalent or corresponding rights throughout the
     world based on applicable law or treaty, and any national
     implementations thereof.

2. Waiver. To the greatest extent permitted by, but not in contravention
of, applicable law, Affirmer hereby overtly, fully, permanently,
irrevocably and unconditionally waives, abandons, and surrenders all of
Affirmer&#x27;s Copyright and Related Rights and associated claims and causes
of action, whether now known or unknown (including existing as well as
future claims and causes of action), in the Work (i) in all territories
worldwide, (ii) for the maximum duration provided by applicable law or
treaty (including future time extensions), (iii) in any current or future
medium and for any number of copies, and (iv) for any purpose whatsoever,
including without limitation commercial, advertising or promotional
purposes (the &quot;Waiver&quot;). Affirmer makes the Waiver for the benefit of each
member of the public at large and to the detriment of Affirmer&#x27;s heirs and
successors, fully intending that such Waiver shall not be subject to
revocation, rescission, cancellation, termination, or any other legal or
equitable action to disrupt the quiet enjoyment of the Work by the public
as contemplated by Affirmer&#x27;s express Statement of Purpose.

3. Public License Fallback. Should any part of the Waiver for any reason
be judged legally invalid or ineffective under applicable law, then the
Waiver shall be preserved to the maximum extent permitted taking into
account Affirmer&#x27;s express Statement of Purpose. In addition, to the
extent the Waiver is so judged Affirmer hereby grants to each affected
person a royalty-free, non transferable, non sublicensable, non exclusive,
irrevocable and unconditional license to exercise Affirmer&#x27;s Copyright and
Related Rights in the Work (i) in all territories worldwide, (ii) for the
maximum duration provided by applicable law or treaty (including future
time extensions), (iii) in any current or future medium and for any number
of copies, and (iv) for any purpose whatsoever, including without
limitation commercial, advertising or promotional purposes (the
&quot;License&quot;). The License shall be deemed effective as of the date CC0 was
applied by Affirmer to the Work. Should any part of the License for any
reason be judged legally invalid or ineffective under applicable law, such
partial invalidity or ineffectiveness shall not invalidate the remainder
of the License, and in such case Affirmer hereby affirms that he or she
will not (i) exercise any of his or her remaining Copyright and Related
Rights in the Work or (ii) assert any associated claims and causes of
action with respect to the Work, in either case contrary to Affirmer&#x27;s
express Statement of Purpose.

4. Limitations and Disclaimers.

 a. No trademark or patent rights held by Affirmer are waived, abandoned,
    surrendered, licensed or otherwise affected by this document.
 b. Affirmer offers the Work as-is and makes no representations or
    warranties of any kind concerning the Work, express, implied,
    statutory or otherwise, including without limitation warranties of
    title, merchantability, fitness for a particular purpose, non
    infringement, or the absence of latent or other defects, accuracy, or
    the present or absence of errors, whether or not discoverable, all to
    the greatest extent permissible under applicable law.
 c. Affirmer disclaims responsibility for clearing rights of other persons
    that may apply to the Work or any use thereof, including without
    limitation any person&#x27;s Copyright and Related Rights in the Work.
    Further, Affirmer disclaims responsibility for obtaining any necessary
    consents, permissions or other rights required for any use of the
    Work.
 d. Affirmer understands and acknowledges that Creative Commons is not a
    party to this document and has no duty or obligation with respect to
    this CC0 or use of the Work.
</pre>
            </li>
            <li class="license">
                <h3 id="ISC">ISC License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/briansmith/ring ">ring 0.17.8</a></li>
                </ul>
                <pre class="license-text">   Copyright 2015-2016 Brian Smith.

   Permission to use, copy, modify, and/or distribute this software for any
   purpose with or without fee is hereby granted, provided that the above
   copyright notice and this permission notice appear in all copies.

   THE SOFTWARE IS PROVIDED &quot;AS IS&quot; AND THE AUTHORS DISCLAIM ALL WARRANTIES
   WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
   MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHORS BE LIABLE FOR ANY
   SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
   WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN ACTION
   OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF OR IN
   CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.</pre>
            </li>
            <li class="license">
                <h3 id="ISC">ISC License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/briansmith/ring ">ring 0.17.8</a></li>
                </ul>
                <pre class="license-text">/* Copyright (c) 2015, Google Inc.
 *
 * Permission to use, copy, modify, and/or distribute this software for any
 * purpose with or without fee is hereby granted, provided that the above
 * copyright notice and this permission notice appear in all copies.
 *
 * THE SOFTWARE IS PROVIDED &quot;AS IS&quot; AND THE AUTHOR DISCLAIMS ALL WARRANTIES
 * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
 * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY
 * SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
 * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN ACTION
 * OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF OR IN
 * CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE. */
</pre>
            </li>
            <li class="license">
                <h3 id="ISC">ISC License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/briansmith/untrusted ">untrusted 0.9.0</a></li>
                </ul>
                <pre class="license-text">// Copyright 2015-2016 Brian Smith.
//
// Permission to use, copy, modify, and/or distribute this software for any
// purpose with or without fee is hereby granted, provided that the above
// copyright notice and this permission notice appear in all copies.
//
// THE SOFTWARE IS PROVIDED &quot;AS IS&quot; AND THE AUTHORS DISCLAIM ALL WARRANTIES
// WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
// MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHORS BE LIABLE FOR
// ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
// WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
// ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
// OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="ISC">ISC License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/rustls/webpki ">rustls-webpki 0.101.7</a></li>
                </ul>
                <pre class="license-text">// Copyright 2021 Brian Smith.
//
// Permission to use, copy, modify, and/or distribute this software for any
// purpose with or without fee is hereby granted, provided that the above
// copyright notice and this permission notice appear in all copies.
//
// THE SOFTWARE IS PROVIDED &quot;AS IS&quot; AND THE AUTHORS DISCLAIM ALL WARRANTIES
// WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
// MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHORS BE LIABLE FOR
// ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
// WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
// ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
// OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.

#[test]
fn cert_without_extensions_test() {
    // Check the certificate is valid with
    // &#x60;openssl x509 -in cert_without_extensions.der -inform DER -text -noout&#x60;
    const CERT_WITHOUT_EXTENSIONS_DER: &amp;[u8] &#x3D; include_bytes!(&quot;cert_without_extensions.der&quot;);

    assert!(webpki::EndEntityCert::try_from(CERT_WITHOUT_EXTENSIONS_DER).is_ok());
}
</pre>
            </li>
            <li class="license">
                <h3 id="ISC">ISC License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/jedisct1/rust-coarsetime ">coarsetime 0.1.34</a></li>
                </ul>
                <pre class="license-text">ISC License:

Copyright (c) 2004-2010 by Internet Systems Consortium, Inc. (&quot;ISC&quot;)
Copyright (c) 1995-2003 by Internet Software Consortium

Permission to use, copy, modify, and/or distribute this software for any purpose with or without fee is hereby granted, provided that the above copyright notice and this permission notice appear in all copies.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot; AND ISC DISCLAIMS ALL WARRANTIES WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL ISC BE LIABLE FOR ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/allan2/dotenvy ">dotenvy 0.15.7</a></li>
                </ul>
                <pre class="license-text"># The MIT License (MIT)

Copyright (c) 2014 Santiago Lapresta and contributors

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the &quot;Software&quot;), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in
all copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
THE SOFTWARE.</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/tokio-rs/mio ">mio 1.0.2</a></li>
                </ul>
                <pre class="license-text">Copyright (c) 2014 Carl Lerche and other MIO contributors

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the &quot;Software&quot;), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in
all copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
THE SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/SimonSapin/rust-std-candidates ">matches 0.1.10</a></li>
                </ul>
                <pre class="license-text">Copyright (c) 2014-2016 Simon Sapin

Permission is hereby granted, free of charge, to any
person obtaining a copy of this software and associated
documentation files (the &quot;Software&quot;), to deal in the
Software without restriction, including without
limitation the rights to use, copy, modify, merge,
publish, distribute, sublicense, and/or sell copies of
the Software, and to permit persons to whom the Software
is furnished to do so, subject to the following
conditions:

The above copyright notice and this permission notice
shall be included in all copies or substantial portions
of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF
ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED
TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A
PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT
SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY
CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR
IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
DEALINGS IN THE SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/Geal/nom ">nom 7.1.3</a></li>
                </ul>
                <pre class="license-text">Copyright (c) 2014-2019 Geoffroy Couprie

Permission is hereby granted, free of charge, to any person obtaining
a copy of this software and associated documentation files (the
&quot;Software&quot;), to deal in the Software without restriction, including
without limitation the rights to use, copy, modify, merge, publish,
distribute, sublicense, and/or sell copies of the Software, and to
permit persons to whom the Software is furnished to do so, subject to
the following conditions:

The above copyright notice and this permission notice shall be
included in all copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND,
EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE
LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/hyperium/headers ">headers-core 0.2.0</a></li>
                    <li><a href=" https://github.com/hyperium/headers ">headers 0.3.9</a></li>
                </ul>
                <pre class="license-text">Copyright (c) 2014-2019 Sean McArthur

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the &quot;Software&quot;), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in
all copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
THE SOFTWARE.

</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/mikedilger/float-cmp ">float-cmp 0.9.0</a></li>
                </ul>
                <pre class="license-text">Copyright (c) 2014-2020 Optimal Computing (NZ) Ltd

Permission is hereby granted, free of charge, to any person obtaining a copy of
this software and associated documentation files (the &quot;Software&quot;), to deal in
the Software without restriction, including without limitation the rights to
use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies
of the Software, and to permit persons to whom the Software is furnished to do
so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all
copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
IN THE SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/hyperium/hyper ">hyper 0.14.30</a></li>
                    <li><a href=" https://github.com/hyperium/hyper ">hyper 1.4.1</a></li>
                </ul>
                <pre class="license-text">Copyright (c) 2014-2021 Sean McArthur

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the &quot;Software&quot;), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in
all copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
THE SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/gentoo90/winreg-rs ">winreg 0.50.0</a></li>
                </ul>
                <pre class="license-text">Copyright (c) 2015 Igor Shaula

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the &quot;Software&quot;), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in
all copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
THE SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/reem/rust-ordered-float ">ordered-float 3.9.2</a></li>
                </ul>
                <pre class="license-text">Copyright (c) 2015 Jonathan Reem

Permission is hereby granted, free of charge, to any
person obtaining a copy of this software and associated
documentation files (the &quot;Software&quot;), to deal in the
Software without restriction, including without
limitation the rights to use, copy, modify, merge,
publish, distribute, sublicense, and/or sell copies of
the Software, and to permit persons to whom the Software
is furnished to do so, subject to the following
conditions:

The above copyright notice and this permission notice
shall be included in all copies or substantial portions
of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF
ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED
TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A
PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT
SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY
CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR
IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
DEALINGS IN THE SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/harryfei/which-rs.git ">which 4.4.2</a></li>
                </ul>
                <pre class="license-text">Copyright (c) 2015 fangyuanziti

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the &quot;Software&quot;), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in
all copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
THE SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/steffengy/schannel-rs ">schannel 0.1.26</a></li>
                </ul>
                <pre class="license-text">Copyright (c) 2015 steffengy

Permission is hereby granted, free of charge, to any person obtaining a copy of this software and associated documentation files (the &quot;Software&quot;), to deal in the Software without restriction, including without limitation the rights to use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies of the Software, and to permit persons to whom the Software is furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/briansmith/ring ">ring 0.17.8</a></li>
                </ul>
                <pre class="license-text">Copyright (c) 2015-2016 the fiat-crypto authors (see
https://github.com/mit-plv/fiat-crypto/blob/master/AUTHORS).

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the &quot;Software&quot;), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all
copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/quickwit-oss/bitpacking ">bitpacking 0.9.2</a></li>
                </ul>
                <pre class="license-text">Copyright (c) 2016 Paul Masurel

Permission is hereby granted, free of charge, to any person obtaining a copy of this software and associated documentation files (the &quot;Software&quot;), to deal in the Software without restriction, including without limitation the rights to use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies of the Software, and to permit persons to whom the Software is furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/snapview/tokio-tungstenite ">tokio-tungstenite 0.21.0</a></li>
                </ul>
                <pre class="license-text">Copyright (c) 2017 Daniel Abramov
Copyright (c) 2017 Alexey Galakhov

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the &quot;Software&quot;), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in
all copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
THE SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/rust-cli/termtree ">termtree 0.4.1</a></li>
                </ul>
                <pre class="license-text">Copyright (c) 2017 Doug Tangren

Permission is hereby granted, free of charge, to any person obtaining
a copy of this software and associated documentation files (the
&quot;Software&quot;), to deal in the Software without restriction, including
without limitation the rights to use, copy, modify, merge, publish,
distribute, sublicense, and/or sell copies of the Software, and to
permit persons to whom the Software is furnished to do so, subject to
the following conditions:

The above copyright notice and this permission notice shall be
included in all copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND,
EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE
LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://gitlab.redox-os.org/redox-os/syscall ">redox_syscall 0.5.7</a></li>
                </ul>
                <pre class="license-text">Copyright (c) 2017 Redox OS Developers

MIT License

Permission is hereby granted, free of charge, to any person obtaining
a copy of this software and associated documentation files (the
&quot;Software&quot;), to deal in the Software without restriction, including
without limitation the rights to use, copy, modify, merge, publish,
distribute, sublicense, and/or sell copies of the Software, and to
permit persons to whom the Software is furnished to do so, subject to
the following conditions:

The above copyright notice and this permission notice shall be
included in all copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND,
EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE
LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/hyperium/h2 ">h2 0.3.26</a></li>
                </ul>
                <pre class="license-text">Copyright (c) 2017 h2 authors

Permission is hereby granted, free of charge, to any
person obtaining a copy of this software and associated
documentation files (the &quot;Software&quot;), to deal in the
Software without restriction, including without
limitation the rights to use, copy, modify, merge,
publish, distribute, sublicense, and/or sell copies of
the Software, and to permit persons to whom the Software
is furnished to do so, subject to the following
conditions:

The above copyright notice and this permission notice
shall be included in all copies or substantial portions
of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF
ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED
TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A
PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT
SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY
CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR
IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
DEALINGS IN THE SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/tokio-rs/bytes ">bytes 1.7.2</a></li>
                </ul>
                <pre class="license-text">Copyright (c) 2018 Carl Lerche

Permission is hereby granted, free of charge, to any
person obtaining a copy of this software and associated
documentation files (the &quot;Software&quot;), to deal in the
Software without restriction, including without
limitation the rights to use, copy, modify, merge,
publish, distribute, sublicense, and/or sell copies of
the Software, and to permit persons to whom the Software
is furnished to do so, subject to the following
conditions:

The above copyright notice and this permission notice
shall be included in all copies or substantial portions
of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF
ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED
TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A
PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT
SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY
CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR
IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
DEALINGS IN THE SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/tantivy-search/levenshtein-automata ">levenshtein_automata 0.2.1</a></li>
                </ul>
                <pre class="license-text">Copyright (c) 2018 Paul Masurel

Permission is hereby granted, free of charge, to any person obtaining a copy of this software and associated documentation files (the &quot;Software&quot;), to deal in the Software without restriction, including without limitation the rights to use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies of the Software, and to permit persons to whom the Software is furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/palfrey/serial_test/ ">serial_test 3.1.1</a></li>
                    <li><a href=" https://github.com/palfrey/serial_test/ ">serial_test_derive 3.1.1</a></li>
                </ul>
                <pre class="license-text">Copyright (c) 2018 Tom Parker-Shemilt

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the &quot;Software&quot;), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all
copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
SOFTWARE.</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/quickwit-inc/census ">census 0.4.2</a></li>
                </ul>
                <pre class="license-text">Copyright (c) 2018 by Quickwit, Inc. 

Permission is hereby granted, free of charge, to any person obtaining a copy of this software and associated documentation files (the &quot;Software&quot;), to deal in the Software without restriction, including without limitation the rights to use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies of the Software, and to permit persons to whom the Software is furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/quickwit-oss/tantivy ">tantivy 0.23.0</a></li>
                </ul>
                <pre class="license-text">Copyright (c) 2018 by the project authors, as listed in the AUTHORS file. 

Permission is hereby granted, free of charge, to any person obtaining a copy of this software and associated documentation files (the &quot;Software&quot;), to deal in the Software without restriction, including without limitation the rights to use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies of the Software, and to permit persons to whom the Software is furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/seanmonstar/want ">want 0.3.1</a></li>
                </ul>
                <pre class="license-text">Copyright (c) 2018-2019 Sean McArthur

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the &quot;Software&quot;), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in
all copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
THE SOFTWARE.

</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/seanmonstar/warp ">warp 0.3.7</a></li>
                </ul>
                <pre class="license-text">Copyright (c) 2018-2020 Sean McArthur

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the &quot;Software&quot;), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in
all copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
THE SOFTWARE.

</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/seanmonstar/try-lock ">try-lock 0.2.5</a></li>
                </ul>
                <pre class="license-text">Copyright (c) 2018-2023 Sean McArthur
Copyright (c) 2016 Alex Crichton

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the &quot;Software&quot;), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in
all copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
THE SOFTWARE.

</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/tokio-rs/axum ">axum 0.6.20</a></li>
                </ul>
                <pre class="license-text">Copyright (c) 2019 Axum Contributors

Permission is hereby granted, free of charge, to any
person obtaining a copy of this software and associated
documentation files (the &quot;Software&quot;), to deal in the
Software without restriction, including without
limitation the rights to use, copy, modify, merge,
publish, distribute, sublicense, and/or sell copies of
the Software, and to permit persons to whom the Software
is furnished to do so, subject to the following
conditions:

The above copyright notice and this permission notice
shall be included in all copies or substantial portions
of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF
ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED
TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A
PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT
SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY
CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR
IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
DEALINGS IN THE SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/tokio-rs/slab ">slab 0.4.9</a></li>
                </ul>
                <pre class="license-text">Copyright (c) 2019 Carl Lerche

Permission is hereby granted, free of charge, to any
person obtaining a copy of this software and associated
documentation files (the &quot;Software&quot;), to deal in the
Software without restriction, including without
limitation the rights to use, copy, modify, merge,
publish, distribute, sublicense, and/or sell copies of
the Software, and to permit persons to whom the Software
is furnished to do so, subject to the following
conditions:

The above copyright notice and this permission notice
shall be included in all copies or substantial portions
of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF
ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED
TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A
PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT
SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY
CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR
IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
DEALINGS IN THE SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/davidpdrsn/assert-json-diff.git ">assert-json-diff 1.1.0</a></li>
                    <li><a href=" https://github.com/davidpdrsn/assert-json-diff.git ">assert-json-diff 2.0.2</a></li>
                </ul>
                <pre class="license-text">Copyright (c) 2019 David Pedersen

Permission is hereby granted, free of charge, to any person obtaining a copy of this software and associated documentation files (the &quot;Software&quot;), to deal in the Software without restriction, including without limitation the rights to use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies of the Software, and to permit persons to whom the Software is furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/hawkw/sharded-slab ">sharded-slab 0.1.7</a></li>
                </ul>
                <pre class="license-text">Copyright (c) 2019 Eliza Weisman

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the &quot;Software&quot;), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in
all copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
THE SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/hawkw/matchers ">matchers 0.1.0</a></li>
                </ul>
                <pre class="license-text">Copyright (c) 2019 Eliza Weisman

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the &quot;Software&quot;), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all
copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/hyperium/http-body ">http-body-util 0.1.2</a></li>
                    <li><a href=" https://github.com/hyperium/http-body ">http-body 0.4.6</a></li>
                </ul>
                <pre class="license-text">Copyright (c) 2019 Hyper Contributors

Permission is hereby granted, free of charge, to any
person obtaining a copy of this software and associated
documentation files (the &quot;Software&quot;), to deal in the
Software without restriction, including without
limitation the rights to use, copy, modify, merge,
publish, distribute, sublicense, and/or sell copies of
the Software, and to permit persons to whom the Software
is furnished to do so, subject to the following
conditions:

The above copyright notice and this permission notice
shall be included in all copies or substantial portions
of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF
ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED
TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A
PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT
SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY
CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR
IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
DEALINGS IN THE SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/stepancheg/rust-protobuf/ ">protobuf 2.28.0</a></li>
                </ul>
                <pre class="license-text">Copyright (c) 2019 Stepan Koltsov

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the &quot;Software&quot;), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all
copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND,
EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM,
DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE
OR OTHER DEALINGS IN THE SOFTWARE.</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/tokio-rs/tracing ">tracing-attributes 0.1.27</a></li>
                    <li><a href=" https://github.com/tokio-rs/tracing ">tracing-core 0.1.32</a></li>
                    <li><a href=" https://github.com/tokio-rs/tracing ">tracing-log 0.1.4</a></li>
                    <li><a href=" https://github.com/tokio-rs/tracing ">tracing-log 0.2.0</a></li>
                    <li><a href=" https://github.com/tokio-rs/tracing-opentelemetry ">tracing-opentelemetry 0.20.0</a></li>
                    <li><a href=" https://github.com/tokio-rs/tracing ">tracing-serde 0.1.3</a></li>
                    <li><a href=" https://github.com/tokio-rs/tracing ">tracing-subscriber 0.3.18</a></li>
                    <li><a href=" https://github.com/tokio-rs/tracing ">tracing 0.1.40</a></li>
                </ul>
                <pre class="license-text">Copyright (c) 2019 Tokio Contributors

Permission is hereby granted, free of charge, to any
person obtaining a copy of this software and associated
documentation files (the &quot;Software&quot;), to deal in the
Software without restriction, including without
limitation the rights to use, copy, modify, merge,
publish, distribute, sublicense, and/or sell copies of
the Software, and to permit persons to whom the Software
is furnished to do so, subject to the following
conditions:

The above copyright notice and this permission notice
shall be included in all copies or substantial portions
of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF
ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED
TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A
PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT
SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY
CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR
IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
DEALINGS IN THE SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/tower-rs/tower ">tower-layer 0.3.3</a></li>
                    <li><a href=" https://github.com/tower-rs/tower ">tower-service 0.3.3</a></li>
                    <li><a href=" https://github.com/tower-rs/tower ">tower 0.4.13</a></li>
                </ul>
                <pre class="license-text">Copyright (c) 2019 Tower Contributors

Permission is hereby granted, free of charge, to any
person obtaining a copy of this software and associated
documentation files (the &quot;Software&quot;), to deal in the
Software without restriction, including without
limitation the rights to use, copy, modify, merge,
publish, distribute, sublicense, and/or sell copies of
the Software, and to permit persons to whom the Software
is furnished to do so, subject to the following
conditions:

The above copyright notice and this permission notice
shall be included in all copies or substantial portions
of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF
ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED
TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A
PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT
SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY
CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR
IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
DEALINGS IN THE SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/tower-rs/tower-http ">tower-http 0.4.4</a></li>
                </ul>
                <pre class="license-text">Copyright (c) 2019-2021 Tower Contributors

Permission is hereby granted, free of charge, to any
person obtaining a copy of this software and associated
documentation files (the &quot;Software&quot;), to deal in the
Software without restriction, including without
limitation the rights to use, copy, modify, merge,
publish, distribute, sublicense, and/or sell copies of
the Software, and to permit persons to whom the Software
is furnished to do so, subject to the following
conditions:

The above copyright notice and this permission notice
shall be included in all copies or substantial portions
of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF
ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED
TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A
PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT
SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY
CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR
IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
DEALINGS IN THE SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/hyperium/http-body ">http-body 1.0.1</a></li>
                </ul>
                <pre class="license-text">Copyright (c) 2019-2024 Sean McArthur &amp; Hyper Contributors

Permission is hereby granted, free of charge, to any
person obtaining a copy of this software and associated
documentation files (the &quot;Software&quot;), to deal in the
Software without restriction, including without
limitation the rights to use, copy, modify, merge,
publish, distribute, sublicense, and/or sell copies of
the Software, and to permit persons to whom the Software
is furnished to do so, subject to the following
conditions:

The above copyright notice and this permission notice
shall be included in all copies or substantial portions
of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF
ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED
TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A
PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT
SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY
CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR
IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
DEALINGS IN THE SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/hyperium/tonic ">tonic-build 0.9.2</a></li>
                    <li><a href=" https://github.com/hyperium/tonic ">tonic 0.9.2</a></li>
                </ul>
                <pre class="license-text">Copyright (c) 2020 Lucio Franco

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the &quot;Software&quot;), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in
all copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
THE SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/calavera/query-map-rs ">query_map 0.7.0</a></li>
                </ul>
                <pre class="license-text">Copyright (c) 2021 David Calavera &lt;david.calavera@gmail.com&gt;

MIT License

Permission is hereby granted, free of charge, to any person obtaining
a copy of this software and associated documentation files (the
&quot;Software&quot;), to deal in the Software without restriction, including
without limitation the rights to use, copy, modify, merge, publish,
distribute, sublicense, and/or sell copies of the Software, and to
permit persons to whom the Software is furnished to do so, subject to
the following conditions:

The above copyright notice and this permission notice shall be
included in all copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND,
EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE
LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/tokio-rs/tokio-metrics ">tokio-metrics 0.3.1</a></li>
                </ul>
                <pre class="license-text">Copyright (c) 2022 Tokio Contributors

Permission is hereby granted, free of charge, to any
person obtaining a copy of this software and associated
documentation files (the &quot;Software&quot;), to deal in the
Software without restriction, including without
limitation the rights to use, copy, modify, merge,
publish, distribute, sublicense, and/or sell copies of
the Software, and to permit persons to whom the Software
is furnished to do so, subject to the following
conditions:

The above copyright notice and this permission notice
shall be included in all copies or substantial portions
of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF
ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED
TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A
PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT
SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY
CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR
IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
DEALINGS IN THE SOFTWARE.</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://crates.io/crates/mrecordlog ">mrecordlog 0.4.0</a></li>
                </ul>
                <pre class="license-text">Copyright (c) 2022 by Quickwit, Inc.

Permission is hereby granted, free of charge, to any person obtaining a copy of this software and associated documentation files (the &quot;Software&quot;), to deal in the Software without restriction, including without limitation the rights to use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies of the Software, and to permit persons to whom the Software is furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/hyperium/hyper-util ">hyper-util 0.1.9</a></li>
                </ul>
                <pre class="license-text">Copyright (c) 2023 Sean McArthur

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the &quot;Software&quot;), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in
all copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
THE SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://crates.io/crates/whichlang ">whichlang 0.1.0</a></li>
                </ul>
                <pre class="license-text">Copyright (c) 2023 by Quickwit Inc.

Permission is hereby granted, free of charge, to any person obtaining a copy of this software and associated documentation files (the &quot;Software&quot;), to deal in the Software without restriction, including without limitation the rights to use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies of the Software, and to permit persons to whom the Software is furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/quickwit-inc/murmurhash32 ">murmurhash32 0.3.1</a></li>
                </ul>
                <pre class="license-text">Copyright (c) 2024 by Quickwit Inc.

Permission is hereby granted, free of charge, to any person obtaining a copy of this software and associated documentation files (the &quot;Software&quot;), to deal in the Software without restriction, including without limitation the rights to use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies of the Software, and to permit persons to whom the Software is furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/tokio-rs/axum ">axum-core 0.3.4</a></li>
                </ul>
                <pre class="license-text">Copyright 2021 Axum Contributors

Permission is hereby granted, free of charge, to any person obtaining a copy of this software and associated documentation files (the &quot;Software&quot;), to deal in the Software without restriction, including without limitation the rights to use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies of the Software, and to permit persons to whom the Software is furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/PSeitz/rust_measure_time ">measure_time 0.8.3</a></li>
                </ul>
                <pre class="license-text">Includes portions of humantime
Copyright (c) 2016 The humantime Developers

Permission is hereby granted, free of charge, to any person obtaining a copy of this software and associated documentation files (the &quot;Software&quot;), to deal in the Software without restriction, including without limitation the rights to use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies of the Software, and to permit persons to whom the Software is furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.


</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/jeromefroe/lru-rs.git ">lru 0.12.5</a></li>
                </ul>
                <pre class="license-text">MIT License

Copyright (c) 2016 Jerome Froelich

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the &quot;Software&quot;), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all
copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
SOFTWARE.</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/svartalf/hostname ">hostname 0.3.1</a></li>
                </ul>
                <pre class="license-text">MIT License

Copyright (c) 2016 fengcen
Copyright (c) 2019 svartalf

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the &quot;Software&quot;), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all
copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/dylanhart/ulid-rs ">ulid 1.1.3</a></li>
                </ul>
                <pre class="license-text">MIT License

Copyright (c) 2017 Dylan Hart

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the &quot;Software&quot;), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all
copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/TedDriggs/darling ">darling 0.20.10</a></li>
                    <li><a href=" https://github.com/TedDriggs/darling ">darling_core 0.20.10</a></li>
                    <li><a href=" https://github.com/TedDriggs/darling ">darling_macro 0.20.10</a></li>
                </ul>
                <pre class="license-text">MIT License

Copyright (c) 2017 Ted Driggs

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the &quot;Software&quot;), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all
copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/dunmatt/no-std-net ">no-std-net 0.6.0</a></li>
                </ul>
                <pre class="license-text">MIT License

Copyright (c) 2018 M@

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the &quot;Software&quot;), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all
copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/awslabs/aws-lambda-rust-runtime ">aws_lambda_events 0.12.1</a></li>
                    <li><a href=" https://github.com/awslabs/aws-lambda-rust-runtime ">aws_lambda_events 0.15.1</a></li>
                </ul>
                <pre class="license-text">MIT License

Copyright (c) 2018 Sam Rijs and Christian Legnitto
Copyright 2023 Amazon.com, Inc. or its affiliates


Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the &quot;Software&quot;), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all
copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/bojand/infer ">infer 0.2.3</a></li>
                </ul>
                <pre class="license-text">MIT License

Copyright (c) 2019 Bojan

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the &quot;Software&quot;), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all
copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/tokio-rs/tokio ">tokio-macros 2.4.0</a></li>
                </ul>
                <pre class="license-text">MIT License

Copyright (c) 2019 Yoshua Wuyts
Copyright (c) Tokio Contributors

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the &quot;Software&quot;), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all
copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/brunoczim/fslock ">fslock 0.2.1</a></li>
                </ul>
                <pre class="license-text">MIT License

Copyright (c) 2019 brunoczim

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the &quot;Software&quot;), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all
copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/tabac/hyperloglog.rs ">hyperloglogplus 0.4.1</a></li>
                </ul>
                <pre class="license-text">MIT License

Copyright (c) 2020 Anastasios Bakogiannis

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the &quot;Software&quot;), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all
copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/rousan/multer-rs ">multer 2.1.0</a></li>
                </ul>
                <pre class="license-text">MIT License

Copyright (c) 2020 Rousan Ali

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the &quot;Software&quot;), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all
copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/zenlist/serde_dynamo ">serde_dynamo 4.2.14</a></li>
                </ul>
                <pre class="license-text">MIT License

Copyright (c) 2020 Zenlist

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the &quot;Software&quot;), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all
copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/MarcusGrass/parse-range-headers ">http-range-header 0.3.1</a></li>
                </ul>
                <pre class="license-text">MIT License

Copyright (c) 2021 MarcusGrass

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the &quot;Software&quot;), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all
copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/zhiburt/tabled ">papergrid 0.10.0</a></li>
                    <li><a href=" https://github.com/zhiburt/tabled ">tabled 0.14.0</a></li>
                    <li><a href=" https://github.com/zhiburt/tabled ">tabled_derive 0.6.0</a></li>
                </ul>
                <pre class="license-text">MIT License

Copyright (c) 2021 Maxim Zhiburt

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the &quot;Software&quot;), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all
copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/ibraheemdev/matchit ">matchit 0.7.3</a></li>
                </ul>
                <pre class="license-text">MIT License

Copyright (c) 2022 Ibraheem Ahmed

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the &quot;Software&quot;), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all
copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/zhiburt/ansi-str ">ansi-str 0.8.0</a></li>
                    <li><a href=" https://gitlab.com/zhiburt/ansitok ">ansitok 0.2.0</a></li>
                </ul>
                <pre class="license-text">MIT License

Copyright (c) 2022 Maxim Zhiburt

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the &quot;Software&quot;), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all
copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/Nugine/outref ">outref 0.5.1</a></li>
                </ul>
                <pre class="license-text">MIT License

Copyright (c) 2022 Nugine

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the &quot;Software&quot;), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all
copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
SOFTWARE.</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://gitlab.redox-os.org/redox-os/libredox.git ">libredox 0.1.3</a></li>
                </ul>
                <pre class="license-text">MIT License

Copyright (c) 2023 4lDO2

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the &quot;Software&quot;), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all
copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/kdr-aus/numfmt ">numfmt 1.1.1</a></li>
                </ul>
                <pre class="license-text">MIT License

Copyright (c) 2023 kurtlawrence

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the &quot;Software&quot;), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all
copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/quickwit-oss/chitchat ">chitchat 0.8.0</a></li>
                    <li><a href=" https://github.com/quickwit-oss/tantivy ">ownedbytes 0.7.0</a></li>
                    <li><a href=" https://github.com/quickwit-oss/tantivy ">tantivy-bitpacker 0.6.0</a></li>
                    <li><a href=" https://github.com/quickwit-oss/tantivy ">tantivy-columnar 0.3.0</a></li>
                    <li><a href=" https://github.com/quickwit-oss/tantivy ">tantivy-common 0.7.0</a></li>
                    <li><a href=" https://github.com/quickwit-oss/tantivy ">tantivy-query-grammar 0.22.0</a></li>
                    <li><a href=" https://github.com/quickwit-oss/tantivy ">tantivy-sstable 0.3.0</a></li>
                    <li><a href=" https://github.com/quickwit-oss/tantivy ">tantivy-stacker 0.3.0</a></li>
                    <li><a href=" https://github.com/quickwit-oss/tantivy ">tantivy-tokenizer-api 0.3.0</a></li>
                    <li><a href=" https://github.com/retep998/winapi-rs ">advapi32-sys 0.2.0</a></li>
                    <li><a href=" https://github.com/tokio-rs/async-stream ">async-stream-impl 0.3.6</a></li>
                    <li><a href=" https://github.com/tokio-rs/async-stream ">async-stream 0.3.6</a></li>
                    <li><a href=" https://github.com/Nugine/simd ">base64-simd 0.8.0</a></li>
                    <li><a href=" https://crates.io/crates/crunchy ">crunchy 0.2.2</a></li>
                    <li><a href=" https://github.com/DimaKudosh/difflib ">difflib 0.4.0</a></li>
                    <li><a href=" https://github.com/stephaneyfx/enum-iterator.git ">enum-iterator 1.5.0</a></li>
                    <li><a href=" https://github.com/lindera-morphology/lindera ">lindera-cc-cedict-builder 0.27.2</a></li>
                    <li><a href=" https://github.com/lindera-morphology/lindera ">lindera-cc-cedict 0.27.2</a></li>
                    <li><a href=" https://github.com/lindera-morphology/lindera ">lindera-compress 0.27.2</a></li>
                    <li><a href=" https://github.com/lindera-morphology/lindera ">lindera-core 0.27.2</a></li>
                    <li><a href=" https://github.com/lindera-morphology/lindera ">lindera-decompress 0.27.2</a></li>
                    <li><a href=" https://github.com/lindera-morphology/lindera ">lindera-dictionary 0.27.2</a></li>
                    <li><a href=" https://github.com/lindera-morphology/lindera ">lindera-ipadic-builder 0.27.2</a></li>
                    <li><a href=" https://github.com/lindera-morphology/lindera ">lindera-ipadic-neologd-builder 0.27.2</a></li>
                    <li><a href=" https://github.com/lindera-morphology/lindera ">lindera-ipadic 0.27.2</a></li>
                    <li><a href=" https://github.com/lindera-morphology/lindera ">lindera-ko-dic-builder 0.27.2</a></li>
                    <li><a href=" https://github.com/lindera-morphology/lindera ">lindera-ko-dic 0.27.2</a></li>
                    <li><a href=" https://github.com/lindera-morphology/lindera ">lindera-tokenizer 0.27.2</a></li>
                    <li><a href=" https://github.com/lindera-morphology/lindera ">lindera-unidic-builder 0.27.2</a></li>
                    <li><a href=" https://github.com/hasezoey/new_string_template ">new_string_template 1.5.3</a></li>
                    <li><a href=" https://github.com/ogham/rust-number-prefix ">number_prefix 0.4.0</a></li>
                    <li><a href=" https://github.com/plotters-rs/plotters ">plotters-backend 0.3.7</a></li>
                    <li><a href=" https://github.com/plotters-rs/plotters.git ">plotters-svg 0.3.7</a></li>
                    <li><a href=" https://github.com/plotters-rs/plotters ">plotters 0.3.7</a></li>
                    <li><a href=" https://github.com/tokio-rs/valuable ">valuable 0.1.0</a></li>
                    <li><a href=" https://github.com/Nugine/simd ">vsimd 0.8.0</a></li>
                    <li><a href=" https://github.com/retep998/winapi-rs ">winapi-build 0.1.1</a></li>
                </ul>
                <pre class="license-text">MIT License

Copyright (c) &lt;year&gt; &lt;copyright holders&gt;

Permission is hereby granted, free of charge, to any person obtaining a copy of this software and associated documentation files (the &quot;Software&quot;), to deal in the Software without restriction, including without limitation the rights to use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies of the Software, and to permit persons to whom the Software is furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/tokio-rs/tokio ">tokio-stream 0.1.16</a></li>
                    <li><a href=" https://github.com/tokio-rs/tokio ">tokio-util 0.7.12</a></li>
                    <li><a href=" https://github.com/tokio-rs/tokio ">tokio 1.40.0</a></li>
                </ul>
                <pre class="license-text">MIT License

Copyright (c) Tokio Contributors

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the &quot;Software&quot;), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all
copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/danaugrs/overload ">overload 0.1.1</a></li>
                </ul>
                <pre class="license-text">MIT License

Copyright (c) 2019 Daniel Augusto Rizzi Salvadori

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the &quot;Software&quot;), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all
copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
SOFTWARE.</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/fkoep/downcast-rs ">downcast 0.11.0</a></li>
                </ul>
                <pre class="license-text">MIT License (MIT)

Copyright (c) 2017 Felix Köpge

Permission is hereby granted, free of charge, to any person obtaining a copy of this software and associated documentation files (the &quot;Software&quot;), to deal in the Software without restriction, including without limitation the rights to use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies of the Software, and to permit persons to whom the Software is furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/davidpdrsn/ext.git ">extend 0.1.2</a></li>
                </ul>
                <pre class="license-text">MIT License Copyright (c) 2020 David Pedersen

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the &quot;Software&quot;), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is furnished
to do so, subject to the following conditions:

The above copyright notice and this permission notice (including the next
paragraph) shall be included in all copies or substantial portions of the
Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS
FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS
OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY,
WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF
OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/sunfishcode/is-terminal ">is-terminal 0.4.13</a></li>
                    <li><a href=" https://github.com/upsuper/retain_mut ">retain_mut 0.1.9</a></li>
                    <li><a href=" https://github.com/PSeitz/serde_json_borrow ">serde_json_borrow 0.5.1</a></li>
                    <li><a href=" https://github.com/dtolnay/unsafe-libyaml ">unsafe-libyaml 0.2.11</a></li>
                </ul>
                <pre class="license-text">Permission is hereby granted, free of charge, to any
person obtaining a copy of this software and associated
documentation files (the &quot;Software&quot;), to deal in the
Software without restriction, including without
limitation the rights to use, copy, modify, merge,
publish, distribute, sublicense, and/or sell copies of
the Software, and to permit persons to whom the Software
is furnished to do so, subject to the following
conditions:

The above copyright notice and this permission notice
shall be included in all copies or substantial portions
of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF
ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED
TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A
PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT
SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY
CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR
IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
DEALINGS IN THE SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/winnow-rs/winnow ">winnow 0.5.40</a></li>
                </ul>
                <pre class="license-text">Permission is hereby granted, free of charge, to any person obtaining
a copy of this software and associated documentation files (the
&quot;Software&quot;), to deal in the Software without restriction, including
without limitation the rights to use, copy, modify, merge, publish,
distribute, sublicense, and/or sell copies of the Software, and to
permit persons to whom the Software is furnished to do so, subject to
the following conditions:

The above copyright notice and this permission notice shall be
included in all copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND,
EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE
LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/lifthrasiir/rust-encoding ">encoding 0.2.33</a></li>
                </ul>
                <pre class="license-text">The MIT License (MIT)

Copyright (c) 2013, Kang Seonghoon.

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the &quot;Software&quot;), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in
all copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
THE SOFTWARE.

</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/nushell/nu-ansi-term ">nu-ansi-term 0.46.0</a></li>
                </ul>
                <pre class="license-text">The MIT License (MIT)

Copyright (c) 2014 Benjamin Sago
Copyright (c) 2021-2022 The Nushell Project Developers

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the &quot;Software&quot;), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all
copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/mvdnes/spin-rs.git ">spin 0.9.8</a></li>
                    <li><a href=" https://github.com/zip-rs/zip.git ">zip 0.6.6</a></li>
                </ul>
                <pre class="license-text">The MIT License (MIT)

Copyright (c) 2014 Mathijs van de Nes

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the &quot;Software&quot;), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all
copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
SOFTWARE.</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/BurntSushi/aho-corasick ">aho-corasick 1.1.3</a></li>
                    <li><a href=" https://github.com/BurntSushi/byteorder ">byteorder 1.5.0</a></li>
                    <li><a href=" https://github.com/BurntSushi/rust-csv ">csv-core 0.1.11</a></li>
                    <li><a href=" https://github.com/BurntSushi/rust-csv ">csv 1.3.0</a></li>
                    <li><a href=" https://github.com/BurntSushi/memchr ">memchr 2.7.4</a></li>
                    <li><a href=" https://github.com/BurntSushi/regex-automata ">regex-automata 0.1.10</a></li>
                    <li><a href=" https://github.com/BurntSushi/termcolor ">termcolor 1.4.1</a></li>
                    <li><a href=" https://github.com/BurntSushi/utf8-ranges ">utf8-ranges 1.0.5</a></li>
                    <li><a href=" https://github.com/BurntSushi/walkdir ">walkdir 2.5.0</a></li>
                </ul>
                <pre class="license-text">The MIT License (MIT)

Copyright (c) 2015 Andrew Gallant

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the &quot;Software&quot;), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in
all copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
THE SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/quickwit-inc/fst ">tantivy-fst 0.5.0</a></li>
                </ul>
                <pre class="license-text">The MIT License (MIT)

Copyright (c) 2015 Andrew Gallant
Copyright (c) 2019 Paul Masurel

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the &quot;Software&quot;), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in
all copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
THE SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/rapidfuzz/strsim-rs ">strsim 0.11.1</a></li>
                </ul>
                <pre class="license-text">The MIT License (MIT)

Copyright (c) 2015 Danny Guo
Copyright (c) 2016 Titus Wormer &lt;tituswormer@gmail.com&gt;
Copyright (c) 2018 Akash Kurdekar

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the &quot;Software&quot;), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all
copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/retep998/winapi-rs ">winapi 0.2.8</a></li>
                </ul>
                <pre class="license-text">The MIT License (MIT)

Copyright (c) 2015 Peter Atashian

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the &quot;Software&quot;), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in
all copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
THE SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/saghm/rust-separator ">separator 0.4.1</a></li>
                </ul>
                <pre class="license-text">The MIT License (MIT)

Copyright (c) 2015 Saghm Rossi

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the &quot;Software&quot;), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all
copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
SOFTWARE.

</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/ia0/data-encoding ">data-encoding 2.6.0</a></li>
                </ul>
                <pre class="license-text">The MIT License (MIT)

Copyright (c) 2015-2020 Julien Cretin
Copyright (c) 2017-2020 Google Inc.

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the &quot;Software&quot;), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all
copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/BurntSushi/same-file ">same-file 1.0.6</a></li>
                    <li><a href=" https://github.com/BurntSushi/winapi-util ">winapi-util 0.1.9</a></li>
                </ul>
                <pre class="license-text">The MIT License (MIT)

Copyright (c) 2017 Andrew Gallant

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the &quot;Software&quot;), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in
all copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
THE SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/console-rs/console ">console 0.15.8</a></li>
                    <li><a href=" https://github.com/mitsuhiko/dialoguer ">dialoguer 0.10.4</a></li>
                    <li><a href=" https://github.com/console-rs/indicatif ">indicatif 0.17.8</a></li>
                </ul>
                <pre class="license-text">The MIT License (MIT)

Copyright (c) 2017 Armin Ronacher &lt;armin.ronacher@active-4.com&gt;

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the &quot;Software&quot;), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all
copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
SOFTWARE.

</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/pyros2097/rust-embed ">rust-embed-impl 6.8.1</a></li>
                    <li><a href=" https://github.com/pyros2097/rust-embed ">rust-embed-utils 7.8.1</a></li>
                    <li><a href=" https://github.com/pyros2097/rust-embed ">rust-embed 6.8.1</a></li>
                </ul>
                <pre class="license-text">The MIT License (MIT)

Copyright (c) 2018 pyros2097

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the &quot;Software&quot;), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all
copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
SOFTWARE.

</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://hg.sr.ht/~icefox/oorandom ">oorandom 11.1.4</a></li>
                </ul>
                <pre class="license-text">The MIT License (MIT)

Copyright (c) 2019 Simon Heath

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the &quot;Software&quot;), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all
copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
SOFTWARE.</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/avitex/rust-aliasable ">aliasable 0.1.3</a></li>
                </ul>
                <pre class="license-text">The MIT License (MIT)

Copyright (c) 2020 James Dyson &lt;avitex@wfxlabs.com&gt;

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the &quot;Software&quot;), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all
copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/pseitz/lz4_flex ">lz4_flex 0.11.3</a></li>
                </ul>
                <pre class="license-text">The MIT License (MIT)

Copyright (c) 2020 Pascal Seitz

Permission is hereby granted, free of charge, to any person obtaining a copy of
this software and associated documentation files (the &quot;Software&quot;), to deal in
the Software without restriction, including without limitation the rights to
use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies of
the Software, and to permit persons to whom the Software is furnished to do so,
subject to the following conditions:

The above copyright notice and this permission notice shall be included in all
copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS
FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR
COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER
IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/gyscos/zstd-rs ">zstd 0.11.2+zstd.1.5.2</a></li>
                    <li><a href=" https://github.com/gyscos/zstd-rs ">zstd 0.13.2</a></li>
                </ul>
                <pre class="license-text">The MIT License (MIT)
Copyright (c) 2016 Alexandre Bury

Permission is hereby granted, free of charge, to any person obtaining a copy of this software and associated documentation files (the &quot;Software&quot;), to deal in the Software without restriction, including without limitation the rights to use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies of the Software, and to permit persons to whom the Software is furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/servo/bincode ">bincode 1.3.3</a></li>
                </ul>
                <pre class="license-text">The MIT License (MIT)

Copyright (c) 2014 Ty Overby

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the &quot;Software&quot;), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all
copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/abonander/mime_guess ">mime_guess 2.0.5</a></li>
                </ul>
                <pre class="license-text">The MIT License (MIT)

Copyright (c) 2015 Austin Bonander

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the &quot;Software&quot;), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all
copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
SOFTWARE.

</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/fizyk20/generic-array.git ">generic-array 0.14.7</a></li>
                </ul>
                <pre class="license-text">The MIT License (MIT)

Copyright (c) 2015 Bartłomiej Kamiński

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the &quot;Software&quot;), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all
copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
SOFTWARE.</pre>
            </li>
            <li class="license">
                <h3 id="MIT">MIT License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/kornelski/rust_urlencoding ">urlencoding 2.1.3</a></li>
                </ul>
                <pre class="license-text">© 2016 Bertram Truong
© 2021 Kornel Lesiński

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the &quot;Software&quot;), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in
all copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
THE SOFTWARE.
</pre>
            </li>
            <li class="license">
                <h3 id="MPL-2.0">Mozilla Public License 2.0</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/mackwic/colored ">colored 2.1.0</a></li>
                </ul>
                <pre class="license-text">Mozilla Public License Version 2.0
&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;

1. Definitions
--------------

1.1. &quot;Contributor&quot;
    means each individual or legal entity that creates, contributes to
    the creation of, or owns Covered Software.

1.2. &quot;Contributor Version&quot;
    means the combination of the Contributions of others (if any) used
    by a Contributor and that particular Contributor&#x27;s Contribution.

1.3. &quot;Contribution&quot;
    means Covered Software of a particular Contributor.

1.4. &quot;Covered Software&quot;
    means Source Code Form to which the initial Contributor has attached
    the notice in Exhibit A, the Executable Form of such Source Code
    Form, and Modifications of such Source Code Form, in each case
    including portions thereof.

1.5. &quot;Incompatible With Secondary Licenses&quot;
    means

    (a) that the initial Contributor has attached the notice described
        in Exhibit B to the Covered Software; or

    (b) that the Covered Software was made available under the terms of
        version 1.1 or earlier of the License, but not also under the
        terms of a Secondary License.

1.6. &quot;Executable Form&quot;
    means any form of the work other than Source Code Form.

1.7. &quot;Larger Work&quot;
    means a work that combines Covered Software with other material, in 
    a separate file or files, that is not Covered Software.

1.8. &quot;License&quot;
    means this document.

1.9. &quot;Licensable&quot;
    means having the right to grant, to the maximum extent possible,
    whether at the time of the initial grant or subsequently, any and
    all of the rights conveyed by this License.

1.10. &quot;Modifications&quot;
    means any of the following:

    (a) any file in Source Code Form that results from an addition to,
        deletion from, or modification of the contents of Covered
        Software; or

    (b) any new file in Source Code Form that contains any Covered
        Software.

1.11. &quot;Patent Claims&quot; of a Contributor
    means any patent claim(s), including without limitation, method,
    process, and apparatus claims, in any patent Licensable by such
    Contributor that would be infringed, but for the grant of the
    License, by the making, using, selling, offering for sale, having
    made, import, or transfer of either its Contributions or its
    Contributor Version.

1.12. &quot;Secondary License&quot;
    means either the GNU General Public License, Version 2.0, the GNU
    Lesser General Public License, Version 2.1, the GNU Affero General
    Public License, Version 3.0, or any later versions of those
    licenses.

1.13. &quot;Source Code Form&quot;
    means the form of the work preferred for making modifications.

1.14. &quot;You&quot; (or &quot;Your&quot;)
    means an individual or a legal entity exercising rights under this
    License. For legal entities, &quot;You&quot; includes any entity that
    controls, is controlled by, or is under common control with You. For
    purposes of this definition, &quot;control&quot; means (a) the power, direct
    or indirect, to cause the direction or management of such entity,
    whether by contract or otherwise, or (b) ownership of more than
    fifty percent (50%) of the outstanding shares or beneficial
    ownership of such entity.

2. License Grants and Conditions
--------------------------------

2.1. Grants

Each Contributor hereby grants You a world-wide, royalty-free,
non-exclusive license:

(a) under intellectual property rights (other than patent or trademark)
    Licensable by such Contributor to use, reproduce, make available,
    modify, display, perform, distribute, and otherwise exploit its
    Contributions, either on an unmodified basis, with Modifications, or
    as part of a Larger Work; and

(b) under Patent Claims of such Contributor to make, use, sell, offer
    for sale, have made, import, and otherwise transfer either its
    Contributions or its Contributor Version.

2.2. Effective Date

The licenses granted in Section 2.1 with respect to any Contribution
become effective for each Contribution on the date the Contributor first
distributes such Contribution.

2.3. Limitations on Grant Scope

The licenses granted in this Section 2 are the only rights granted under
this License. No additional rights or licenses will be implied from the
distribution or licensing of Covered Software under this License.
Notwithstanding Section 2.1(b) above, no patent license is granted by a
Contributor:

(a) for any code that a Contributor has removed from Covered Software;
    or

(b) for infringements caused by: (i) Your and any other third party&#x27;s
    modifications of Covered Software, or (ii) the combination of its
    Contributions with other software (except as part of its Contributor
    Version); or

(c) under Patent Claims infringed by Covered Software in the absence of
    its Contributions.

This License does not grant any rights in the trademarks, service marks,
or logos of any Contributor (except as may be necessary to comply with
the notice requirements in Section 3.4).

2.4. Subsequent Licenses

No Contributor makes additional grants as a result of Your choice to
distribute the Covered Software under a subsequent version of this
License (see Section 10.2) or under the terms of a Secondary License (if
permitted under the terms of Section 3.3).

2.5. Representation

Each Contributor represents that the Contributor believes its
Contributions are its original creation(s) or it has sufficient rights
to grant the rights to its Contributions conveyed by this License.

2.6. Fair Use

This License is not intended to limit any rights You have under
applicable copyright doctrines of fair use, fair dealing, or other
equivalents.

2.7. Conditions

Sections 3.1, 3.2, 3.3, and 3.4 are conditions of the licenses granted
in Section 2.1.

3. Responsibilities
-------------------

3.1. Distribution of Source Form

All distribution of Covered Software in Source Code Form, including any
Modifications that You create or to which You contribute, must be under
the terms of this License. You must inform recipients that the Source
Code Form of the Covered Software is governed by the terms of this
License, and how they can obtain a copy of this License. You may not
attempt to alter or restrict the recipients&#x27; rights in the Source Code
Form.

3.2. Distribution of Executable Form

If You distribute Covered Software in Executable Form then:

(a) such Covered Software must also be made available in Source Code
    Form, as described in Section 3.1, and You must inform recipients of
    the Executable Form how they can obtain a copy of such Source Code
    Form by reasonable means in a timely manner, at a charge no more
    than the cost of distribution to the recipient; and

(b) You may distribute such Executable Form under the terms of this
    License, or sublicense it under different terms, provided that the
    license for the Executable Form does not attempt to limit or alter
    the recipients&#x27; rights in the Source Code Form under this License.

3.3. Distribution of a Larger Work

You may create and distribute a Larger Work under terms of Your choice,
provided that You also comply with the requirements of this License for
the Covered Software. If the Larger Work is a combination of Covered
Software with a work governed by one or more Secondary Licenses, and the
Covered Software is not Incompatible With Secondary Licenses, this
License permits You to additionally distribute such Covered Software
under the terms of such Secondary License(s), so that the recipient of
the Larger Work may, at their option, further distribute the Covered
Software under the terms of either this License or such Secondary
License(s).

3.4. Notices

You may not remove or alter the substance of any license notices
(including copyright notices, patent notices, disclaimers of warranty,
or limitations of liability) contained within the Source Code Form of
the Covered Software, except that You may alter any license notices to
the extent required to remedy known factual inaccuracies.

3.5. Application of Additional Terms

You may choose to offer, and to charge a fee for, warranty, support,
indemnity or liability obligations to one or more recipients of Covered
Software. However, You may do so only on Your own behalf, and not on
behalf of any Contributor. You must make it absolutely clear that any
such warranty, support, indemnity, or liability obligation is offered by
You alone, and You hereby agree to indemnify every Contributor for any
liability incurred by such Contributor as a result of warranty, support,
indemnity or liability terms You offer. You may include additional
disclaimers of warranty and limitations of liability specific to any
jurisdiction.

4. Inability to Comply Due to Statute or Regulation
---------------------------------------------------

If it is impossible for You to comply with any of the terms of this
License with respect to some or all of the Covered Software due to
statute, judicial order, or regulation then You must: (a) comply with
the terms of this License to the maximum extent possible; and (b)
describe the limitations and the code they affect. Such description must
be placed in a text file included with all distributions of the Covered
Software under this License. Except to the extent prohibited by statute
or regulation, such description must be sufficiently detailed for a
recipient of ordinary skill to be able to understand it.

5. Termination
--------------

5.1. The rights granted under this License will terminate automatically
if You fail to comply with any of its terms. However, if You become
compliant, then the rights granted under this License from a particular
Contributor are reinstated (a) provisionally, unless and until such
Contributor explicitly and finally terminates Your grants, and (b) on an
ongoing basis, if such Contributor fails to notify You of the
non-compliance by some reasonable means prior to 60 days after You have
come back into compliance. Moreover, Your grants from a particular
Contributor are reinstated on an ongoing basis if such Contributor
notifies You of the non-compliance by some reasonable means, this is the
first time You have received notice of non-compliance with this License
from such Contributor, and You become compliant prior to 30 days after
Your receipt of the notice.

5.2. If You initiate litigation against any entity by asserting a patent
infringement claim (excluding declaratory judgment actions,
counter-claims, and cross-claims) alleging that a Contributor Version
directly or indirectly infringes any patent, then the rights granted to
You by any and all Contributors for the Covered Software under Section
2.1 of this License shall terminate.

5.3. In the event of termination under Sections 5.1 or 5.2 above, all
end user license agreements (excluding distributors and resellers) which
have been validly granted by You or Your distributors under this License
prior to termination shall survive termination.

************************************************************************
*                                                                      *
*  6. Disclaimer of Warranty                                           *
*  -------------------------                                           *
*                                                                      *
*  Covered Software is provided under this License on an &quot;as is&quot;       *
*  basis, without warranty of any kind, either expressed, implied, or  *
*  statutory, including, without limitation, warranties that the       *
*  Covered Software is free of defects, merchantable, fit for a        *
*  particular purpose or non-infringing. The entire risk as to the     *
*  quality and performance of the Covered Software is with You.        *
*  Should any Covered Software prove defective in any respect, You     *
*  (not any Contributor) assume the cost of any necessary servicing,   *
*  repair, or correction. This disclaimer of warranty constitutes an   *
*  essential part of this License. No use of any Covered Software is   *
*  authorized under this License except under this disclaimer.         *
*                                                                      *
************************************************************************

************************************************************************
*                                                                      *
*  7. Limitation of Liability                                          *
*  --------------------------                                          *
*                                                                      *
*  Under no circumstances and under no legal theory, whether tort      *
*  (including negligence), contract, or otherwise, shall any           *
*  Contributor, or anyone who distributes Covered Software as          *
*  permitted above, be liable to You for any direct, indirect,         *
*  special, incidental, or consequential damages of any character      *
*  including, without limitation, damages for lost profits, loss of    *
*  goodwill, work stoppage, computer failure or malfunction, or any    *
*  and all other commercial damages or losses, even if such party      *
*  shall have been informed of the possibility of such damages. This   *
*  limitation of liability shall not apply to liability for death or   *
*  personal injury resulting from such party&#x27;s negligence to the       *
*  extent applicable law prohibits such limitation. Some               *
*  jurisdictions do not allow the exclusion or limitation of           *
*  incidental or consequential damages, so this exclusion and          *
*  limitation may not apply to You.                                    *
*                                                                      *
************************************************************************

8. Litigation
-------------

Any litigation relating to this License may be brought only in the
courts of a jurisdiction where the defendant maintains its principal
place of business and such litigation shall be governed by laws of that
jurisdiction, without reference to its conflict-of-law provisions.
Nothing in this Section shall prevent a party&#x27;s ability to bring
cross-claims or counter-claims.

9. Miscellaneous
----------------

This License represents the complete agreement concerning the subject
matter hereof. If any provision of this License is held to be
unenforceable, such provision shall be reformed only to the extent
necessary to make it enforceable. Any law or regulation which provides
that the language of a contract shall be construed against the drafter
shall not be used to construe this License against a Contributor.

10. Versions of the License
---------------------------

10.1. New Versions

Mozilla Foundation is the license steward. Except as provided in Section
10.3, no one other than the license steward has the right to modify or
publish new versions of this License. Each version will be given a
distinguishing version number.

10.2. Effect of New Versions

You may distribute the Covered Software under the terms of the version
of the License under which You originally received the Covered Software,
or under the terms of any subsequent version published by the license
steward.

10.3. Modified Versions

If you create software not governed by this License, and you want to
create a new license for such software, you may create and use a
modified version of this License if you rename the license and remove
any references to the name of the license steward (except to note that
such modified license differs from this License).

10.4. Distributing Source Code Form that is Incompatible With Secondary
Licenses

If You choose to distribute Source Code Form that is Incompatible With
Secondary Licenses under the terms of this version of the License, the
notice described in Exhibit B of this License must be attached.

Exhibit A - Source Code Form License Notice
-------------------------------------------

  This Source Code Form is subject to the terms of the Mozilla Public
  License, v. 2.0. If a copy of the MPL was not distributed with this
  file, You can obtain one at http://mozilla.org/MPL/2.0/.

If it is not possible or desirable to put the notice in a particular
file, then You may include the notice in a location (such as a LICENSE
file in a relevant directory) where a recipient would be likely to look
for such a notice.

You may add additional accurate notices of copyright ownership.

Exhibit B - &quot;Incompatible With Secondary Licenses&quot; Notice
---------------------------------------------------------

  This Source Code Form is &quot;Incompatible With Secondary Licenses&quot;, as
  defined by the Mozilla Public License, v. 2.0.
</pre>
            </li>
            <li class="license">
                <h3 id="MPL-2.0">Mozilla Public License 2.0</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/rustls/webpki-roots ">webpki-roots 0.25.4</a></li>
                </ul>
                <pre class="license-text">Mozilla Public License Version 2.0
&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;

1. Definitions
--------------

1.1. &quot;Contributor&quot;
    means each individual or legal entity that creates, contributes to
    the creation of, or owns Covered Software.

1.2. &quot;Contributor Version&quot;
    means the combination of the Contributions of others (if any) used
    by a Contributor and that particular Contributor&#x27;s Contribution.

1.3. &quot;Contribution&quot;
    means Covered Software of a particular Contributor.

1.4. &quot;Covered Software&quot;
    means Source Code Form to which the initial Contributor has attached
    the notice in Exhibit A, the Executable Form of such Source Code
    Form, and Modifications of such Source Code Form, in each case
    including portions thereof.

1.5. &quot;Incompatible With Secondary Licenses&quot;
    means

    (a) that the initial Contributor has attached the notice described
        in Exhibit B to the Covered Software; or

    (b) that the Covered Software was made available under the terms of
        version 1.1 or earlier of the License, but not also under the
        terms of a Secondary License.

1.6. &quot;Executable Form&quot;
    means any form of the work other than Source Code Form.

1.7. &quot;Larger Work&quot;
    means a work that combines Covered Software with other material, in 
    a separate file or files, that is not Covered Software.

1.8. &quot;License&quot;
    means this document.

1.9. &quot;Licensable&quot;
    means having the right to grant, to the maximum extent possible,
    whether at the time of the initial grant or subsequently, any and
    all of the rights conveyed by this License.

1.10. &quot;Modifications&quot;
    means any of the following:

    (a) any file in Source Code Form that results from an addition to,
        deletion from, or modification of the contents of Covered
        Software; or

    (b) any new file in Source Code Form that contains any Covered
        Software.

1.11. &quot;Patent Claims&quot; of a Contributor
    means any patent claim(s), including without limitation, method,
    process, and apparatus claims, in any patent Licensable by such
    Contributor that would be infringed, but for the grant of the
    License, by the making, using, selling, offering for sale, having
    made, import, or transfer of either its Contributions or its
    Contributor Version.

1.12. &quot;Secondary License&quot;
    means either the GNU General Public License, Version 2.0, the GNU
    Lesser General Public License, Version 2.1, the GNU Affero General
    Public License, Version 3.0, or any later versions of those
    licenses.

1.13. &quot;Source Code Form&quot;
    means the form of the work preferred for making modifications.

1.14. &quot;You&quot; (or &quot;Your&quot;)
    means an individual or a legal entity exercising rights under this
    License. For legal entities, &quot;You&quot; includes any entity that
    controls, is controlled by, or is under common control with You. For
    purposes of this definition, &quot;control&quot; means (a) the power, direct
    or indirect, to cause the direction or management of such entity,
    whether by contract or otherwise, or (b) ownership of more than
    fifty percent (50%) of the outstanding shares or beneficial
    ownership of such entity.

2. License Grants and Conditions
--------------------------------

2.1. Grants

Each Contributor hereby grants You a world-wide, royalty-free,
non-exclusive license:

(a) under intellectual property rights (other than patent or trademark)
    Licensable by such Contributor to use, reproduce, make available,
    modify, display, perform, distribute, and otherwise exploit its
    Contributions, either on an unmodified basis, with Modifications, or
    as part of a Larger Work; and

(b) under Patent Claims of such Contributor to make, use, sell, offer
    for sale, have made, import, and otherwise transfer either its
    Contributions or its Contributor Version.

2.2. Effective Date

The licenses granted in Section 2.1 with respect to any Contribution
become effective for each Contribution on the date the Contributor first
distributes such Contribution.

2.3. Limitations on Grant Scope

The licenses granted in this Section 2 are the only rights granted under
this License. No additional rights or licenses will be implied from the
distribution or licensing of Covered Software under this License.
Notwithstanding Section 2.1(b) above, no patent license is granted by a
Contributor:

(a) for any code that a Contributor has removed from Covered Software;
    or

(b) for infringements caused by: (i) Your and any other third party&#x27;s
    modifications of Covered Software, or (ii) the combination of its
    Contributions with other software (except as part of its Contributor
    Version); or

(c) under Patent Claims infringed by Covered Software in the absence of
    its Contributions.

This License does not grant any rights in the trademarks, service marks,
or logos of any Contributor (except as may be necessary to comply with
the notice requirements in Section 3.4).

2.4. Subsequent Licenses

No Contributor makes additional grants as a result of Your choice to
distribute the Covered Software under a subsequent version of this
License (see Section 10.2) or under the terms of a Secondary License (if
permitted under the terms of Section 3.3).

2.5. Representation

Each Contributor represents that the Contributor believes its
Contributions are its original creation(s) or it has sufficient rights
to grant the rights to its Contributions conveyed by this License.

2.6. Fair Use

This License is not intended to limit any rights You have under
applicable copyright doctrines of fair use, fair dealing, or other
equivalents.

2.7. Conditions

Sections 3.1, 3.2, 3.3, and 3.4 are conditions of the licenses granted
in Section 2.1.

3. Responsibilities
-------------------

3.1. Distribution of Source Form

All distribution of Covered Software in Source Code Form, including any
Modifications that You create or to which You contribute, must be under
the terms of this License. You must inform recipients that the Source
Code Form of the Covered Software is governed by the terms of this
License, and how they can obtain a copy of this License. You may not
attempt to alter or restrict the recipients&#x27; rights in the Source Code
Form.

3.2. Distribution of Executable Form

If You distribute Covered Software in Executable Form then:

(a) such Covered Software must also be made available in Source Code
    Form, as described in Section 3.1, and You must inform recipients of
    the Executable Form how they can obtain a copy of such Source Code
    Form by reasonable means in a timely manner, at a charge no more
    than the cost of distribution to the recipient; and

(b) You may distribute such Executable Form under the terms of this
    License, or sublicense it under different terms, provided that the
    license for the Executable Form does not attempt to limit or alter
    the recipients&#x27; rights in the Source Code Form under this License.

3.3. Distribution of a Larger Work

You may create and distribute a Larger Work under terms of Your choice,
provided that You also comply with the requirements of this License for
the Covered Software. If the Larger Work is a combination of Covered
Software with a work governed by one or more Secondary Licenses, and the
Covered Software is not Incompatible With Secondary Licenses, this
License permits You to additionally distribute such Covered Software
under the terms of such Secondary License(s), so that the recipient of
the Larger Work may, at their option, further distribute the Covered
Software under the terms of either this License or such Secondary
License(s).

3.4. Notices

You may not remove or alter the substance of any license notices
(including copyright notices, patent notices, disclaimers of warranty,
or limitations of liability) contained within the Source Code Form of
the Covered Software, except that You may alter any license notices to
the extent required to remedy known factual inaccuracies.

3.5. Application of Additional Terms

You may choose to offer, and to charge a fee for, warranty, support,
indemnity or liability obligations to one or more recipients of Covered
Software. However, You may do so only on Your own behalf, and not on
behalf of any Contributor. You must make it absolutely clear that any
such warranty, support, indemnity, or liability obligation is offered by
You alone, and You hereby agree to indemnify every Contributor for any
liability incurred by such Contributor as a result of warranty, support,
indemnity or liability terms You offer. You may include additional
disclaimers of warranty and limitations of liability specific to any
jurisdiction.

4. Inability to Comply Due to Statute or Regulation
---------------------------------------------------

If it is impossible for You to comply with any of the terms of this
License with respect to some or all of the Covered Software due to
statute, judicial order, or regulation then You must: (a) comply with
the terms of this License to the maximum extent possible; and (b)
describe the limitations and the code they affect. Such description must
be placed in a text file included with all distributions of the Covered
Software under this License. Except to the extent prohibited by statute
or regulation, such description must be sufficiently detailed for a
recipient of ordinary skill to be able to understand it.

5. Termination
--------------

5.1. The rights granted under this License will terminate automatically
if You fail to comply with any of its terms. However, if You become
compliant, then the rights granted under this License from a particular
Contributor are reinstated (a) provisionally, unless and until such
Contributor explicitly and finally terminates Your grants, and (b) on an
ongoing basis, if such Contributor fails to notify You of the
non-compliance by some reasonable means prior to 60 days after You have
come back into compliance. Moreover, Your grants from a particular
Contributor are reinstated on an ongoing basis if such Contributor
notifies You of the non-compliance by some reasonable means, this is the
first time You have received notice of non-compliance with this License
from such Contributor, and You become compliant prior to 30 days after
Your receipt of the notice.

5.2. If You initiate litigation against any entity by asserting a patent
infringement claim (excluding declaratory judgment actions,
counter-claims, and cross-claims) alleging that a Contributor Version
directly or indirectly infringes any patent, then the rights granted to
You by any and all Contributors for the Covered Software under Section
2.1 of this License shall terminate.

5.3. In the event of termination under Sections 5.1 or 5.2 above, all
end user license agreements (excluding distributors and resellers) which
have been validly granted by You or Your distributors under this License
prior to termination shall survive termination.

************************************************************************
*                                                                      *
*  6. Disclaimer of Warranty                                           *
*  -------------------------                                           *
*                                                                      *
*  Covered Software is provided under this License on an &quot;as is&quot;       *
*  basis, without warranty of any kind, either expressed, implied, or  *
*  statutory, including, without limitation, warranties that the       *
*  Covered Software is free of defects, merchantable, fit for a        *
*  particular purpose or non-infringing. The entire risk as to the     *
*  quality and performance of the Covered Software is with You.        *
*  Should any Covered Software prove defective in any respect, You     *
*  (not any Contributor) assume the cost of any necessary servicing,   *
*  repair, or correction. This disclaimer of warranty constitutes an   *
*  essential part of this License. No use of any Covered Software is   *
*  authorized under this License except under this disclaimer.         *
*                                                                      *
************************************************************************

************************************************************************
*                                                                      *
*  7. Limitation of Liability                                          *
*  --------------------------                                          *
*                                                                      *
*  Under no circumstances and under no legal theory, whether tort      *
*  (including negligence), contract, or otherwise, shall any           *
*  Contributor, or anyone who distributes Covered Software as          *
*  permitted above, be liable to You for any direct, indirect,         *
*  special, incidental, or consequential damages of any character      *
*  including, without limitation, damages for lost profits, loss of    *
*  goodwill, work stoppage, computer failure or malfunction, or any    *
*  and all other commercial damages or losses, even if such party      *
*  shall have been informed of the possibility of such damages. This   *
*  limitation of liability shall not apply to liability for death or   *
*  personal injury resulting from such party&#x27;s negligence to the       *
*  extent applicable law prohibits such limitation. Some               *
*  jurisdictions do not allow the exclusion or limitation of           *
*  incidental or consequential damages, so this exclusion and          *
*  limitation may not apply to You.                                    *
*                                                                      *
************************************************************************

8. Litigation
-------------

Any litigation relating to this License may be brought only in the
courts of a jurisdiction where the defendant maintains its principal
place of business and such litigation shall be governed by laws of that
jurisdiction, without reference to its conflict-of-law provisions.
Nothing in this Section shall prevent a party&#x27;s ability to bring
cross-claims or counter-claims.

9. Miscellaneous
----------------

This License represents the complete agreement concerning the subject
matter hereof. If any provision of this License is held to be
unenforceable, such provision shall be reformed only to the extent
necessary to make it enforceable. Any law or regulation which provides
that the language of a contract shall be construed against the drafter
shall not be used to construe this License against a Contributor.

10. Versions of the License
---------------------------

10.1. New Versions

Mozilla Foundation is the license steward. Except as provided in Section
10.3, no one other than the license steward has the right to modify or
publish new versions of this License. Each version will be given a
distinguishing version number.

10.2. Effect of New Versions

You may distribute the Covered Software under the terms of the version
of the License under which You originally received the Covered Software,
or under the terms of any subsequent version published by the license
steward.

10.3. Modified Versions

If you create software not governed by this License, and you want to
create a new license for such software, you may create and use a
modified version of this License if you rename the license and remove
any references to the name of the license steward (except to note that
such modified license differs from this License).

10.4. Distributing Source Code Form that is Incompatible With Secondary
Licenses

If You choose to distribute Source Code Form that is Incompatible With
Secondary Licenses under the terms of this version of the License, the
notice described in Exhibit B of this License must be attached.

Exhibit A - Source Code Form License Notice
-------------------------------------------

  This Source Code Form is subject to the terms of the Mozilla Public
  License, v. 2.0. If a copy of the MPL was not distributed with this
  file, You can obtain one at https://mozilla.org/MPL/2.0/.

If it is not possible or desirable to put the notice in a particular
file, then You may include the notice in a location (such as a LICENSE
file in a relevant directory) where a recipient would be likely to look
for such a notice.

You may add additional accurate notices of copyright ownership.

Exhibit B - &quot;Incompatible With Secondary Licenses&quot; Notice
---------------------------------------------------------

  This Source Code Form is &quot;Incompatible With Secondary Licenses&quot;, as
  defined by the Mozilla Public License, v. 2.0.
</pre>
            </li>
            <li class="license">
                <h3 id="OpenSSL">OpenSSL License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/briansmith/ring ">ring 0.17.8</a></li>
                </ul>
                <pre class="license-text">/* &#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;
 * Copyright (c) 1998-2011 The OpenSSL Project.  All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 *
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer. 
 *
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in
 *    the documentation and/or other materials provided with the
 *    distribution.
 *
 * 3. All advertising materials mentioning features or use of this
 *    software must display the following acknowledgment:
 *    &quot;This product includes software developed by the OpenSSL Project
 *    for use in the OpenSSL Toolkit. (http://www.openssl.org/)&quot;
 *
 * 4. The names &quot;OpenSSL Toolkit&quot; and &quot;OpenSSL Project&quot; must not be used to
 *    endorse or promote products derived from this software without
 *    prior written permission. For written permission, please contact
 *    openssl-core@openssl.org.
 *
 * 5. Products derived from this software may not be called &quot;OpenSSL&quot;
 *    nor may &quot;OpenSSL&quot; appear in their names without prior written
 *    permission of the OpenSSL Project.
 *
 * 6. Redistributions of any form whatsoever must retain the following
 *    acknowledgment:
 *    &quot;This product includes software developed by the OpenSSL Project
 *    for use in the OpenSSL Toolkit (http://www.openssl.org/)&quot;
 *
 * THIS SOFTWARE IS PROVIDED BY THE OpenSSL PROJECT &#x60;&#x60;AS IS&#x27;&#x27; AND ANY
 * EXPRESSED OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
 * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE OpenSSL PROJECT OR
 * ITS CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
 * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
 * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,
 * STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED
 * OF THE POSSIBILITY OF SUCH DAMAGE.
 * &#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;
 *
 * This product includes cryptographic software written by Eric Young
 * (eay@cryptsoft.com).  This product includes software written by Tim
 * Hudson (tjh@cryptsoft.com).
 *
 */</pre>
            </li>
            <li class="license">
                <h3 id="Unicode-DFS-2016">Unicode License Agreement - Data Files and Software (2016)</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/dtolnay/unicode-ident ">unicode-ident 1.0.13</a></li>
                </ul>
                <pre class="license-text">UNICODE, INC. LICENSE AGREEMENT - DATA FILES AND SOFTWARE

See Terms of Use &lt;https://www.unicode.org/copyright.html&gt;
for definitions of Unicode Inc.’s Data Files and Software.

NOTICE TO USER: Carefully read the following legal agreement.
BY DOWNLOADING, INSTALLING, COPYING OR OTHERWISE USING UNICODE INC.&#x27;S
DATA FILES (&quot;DATA FILES&quot;), AND/OR SOFTWARE (&quot;SOFTWARE&quot;),
YOU UNEQUIVOCALLY ACCEPT, AND AGREE TO BE BOUND BY, ALL OF THE
TERMS AND CONDITIONS OF THIS AGREEMENT.
IF YOU DO NOT AGREE, DO NOT DOWNLOAD, INSTALL, COPY, DISTRIBUTE OR USE
THE DATA FILES OR SOFTWARE.

COPYRIGHT AND PERMISSION NOTICE

Copyright © 1991-2022 Unicode, Inc. All rights reserved.
Distributed under the Terms of Use in https://www.unicode.org/copyright.html.

Permission is hereby granted, free of charge, to any person obtaining
a copy of the Unicode data files and any associated documentation
(the &quot;Data Files&quot;) or Unicode software and any associated documentation
(the &quot;Software&quot;) to deal in the Data Files or Software
without restriction, including without limitation the rights to use,
copy, modify, merge, publish, distribute, and/or sell copies of
the Data Files or Software, and to permit persons to whom the Data Files
or Software are furnished to do so, provided that either
(a) this copyright and permission notice appear with all copies
of the Data Files or Software, or
(b) this copyright and permission notice appear in associated
Documentation.

THE DATA FILES AND SOFTWARE ARE PROVIDED &quot;AS IS&quot;, WITHOUT WARRANTY OF
ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE
WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
NONINFRINGEMENT OF THIRD PARTY RIGHTS.
IN NO EVENT SHALL THE COPYRIGHT HOLDER OR HOLDERS INCLUDED IN THIS
NOTICE BE LIABLE FOR ANY CLAIM, OR ANY SPECIAL INDIRECT OR CONSEQUENTIAL
DAMAGES, OR ANY DAMAGES WHATSOEVER RESULTING FROM LOSS OF USE,
DATA OR PROFITS, WHETHER IN AN ACTION OF CONTRACT, NEGLIGENCE OR OTHER
TORTIOUS ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE OR
PERFORMANCE OF THE DATA FILES OR SOFTWARE.

Except as contained in this notice, the name of a copyright holder
shall not be used in advertising or otherwise to promote the sale,
use or other dealings in these Data Files or Software without prior
written authorization of the copyright holder.
</pre>
            </li>
            <li class="license">
                <h3 id="Zlib">zlib License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/orlp/foldhash ">foldhash 0.1.3</a></li>
                </ul>
                <pre class="license-text">Copyright (c) 2024 Orson Peters

This software is provided &#x27;as-is&#x27;, without any express or implied warranty. In
no event will the authors be held liable for any damages arising from the use of
this software.

Permission is granted to anyone to use this software for any purpose, including
commercial applications, and to alter it and redistribute it freely, subject to
the following restrictions:

1. The origin of this software must not be misrepresented; you must not claim
    that you wrote the original software. If you use this software in a product,
    an acknowledgment in the product documentation would be appreciated but is
    not required.

2. Altered source versions must be plainly marked as such, and must not be
    misrepresented as being the original software.

3. This notice may not be removed or altered from any source distribution.</pre>
            </li>
            <li class="license">
                <h3 id="Zlib">zlib License</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/Absolucy/nanorand-rs ">nanorand 0.7.0</a></li>
                </ul>
                <pre class="license-text">The zlib/libpng License
&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;&#x3D;

Copyright (c) 2021 lucy

This software is provided &#x27;as-is&#x27;, without any express or implied warranty. In
no event will the authors be held liable for any damages arising from the use of
this software.

Permission is granted to anyone to use this software for any purpose, including
commercial applications, and to alter it and redistribute it freely, subject to
the following restrictions:

1.  The origin of this software must not be misrepresented; you must not claim
    that you wrote the original software. If you use this software in a product,
    an acknowledgment in the product documentation would be appreciated but is
    not required.

2.  Altered source versions must be plainly marked as such, and must not be
    misrepresented as being the original software.

3.  This notice may not be removed or altered from any source distribution.
</pre>
            </li>
            <li class="license">
                <h3 id="zlib-acknowledgement">zlib/libpng License with Acknowledgement</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    <li><a href=" https://github.com/fulmicoton/fastdivide ">fastdivide 0.4.1</a></li>
                </ul>
                <pre class="license-text">Copyright (c) 2002-2007 Charlie Poole
Copyright (c) 2002-2004 James W. Newkirk, Michael C. Two, Alexei A. Vorontsov
Copyright (c) 2000-2002 Philip A. Craig

This software is provided &#x27;as-is&#x27;, without any express or implied warranty. In no event will the authors be held liable for any damages arising from the use of this software.

Permission is granted to anyone to use this software for any purpose, including commercial applications, and to alter it and redistribute it freely, subject to the following restrictions:

1. The origin of this software must not be misrepresented; you must not claim that you wrote the original software. If you use this software in a product, an acknowledgment (see the following) in the product documentation is required.

     Portions Copyright (c) 2002-2007 Charlie Poole or Copyright (c) 2002-2004 James W. Newkirk, Michael C. Two, Alexei A. Vorontsov or Copyright (c) 2000-2002 Philip A. Craig

2. Altered source versions must be plainly marked as such, and must not be misrepresented as being the original software.

3. This notice may not be removed or altered from any source distribution.
</pre>
            </li>
        </ul>
    </main>
</body>

</html>


================================================
FILE: quickwit/license-tool.toml
================================================
[overrides]
# rust-license-tool can't find the license for crunchy-0.2.2, but it's MIT
# according to the crate's Cargo.toml.
"crunchy-0.2.2" = { license = "MIT", origin = "https://github.com/eira-fransham/crunchy" }

# `ring` has a custom license that is mostly "ISC-style" but parts of it also fall under OpenSSL licensing.
"ring-0.17.8" = { license = "ISC AND Custom" }


================================================
FILE: quickwit/quickwit-actors/Cargo.toml
================================================
[package]
name = "quickwit-actors"
description = "Actor framework powering Quickwit services"

version.workspace = true
edition.workspace = true
homepage.workspace = true
documentation.workspace = true
repository.workspace = true
authors.workspace = true
license.workspace = true

[dependencies]
anyhow = { workspace = true }
async-trait = { workspace = true }
flume = { workspace = true }
futures = { workspace = true }
once_cell = { workspace = true }
serde = { workspace = true }
serde_json = { workspace = true }
sync_wrapper = { workspace = true }
thiserror = { workspace = true }
tokio = { workspace = true }
tracing = { workspace = true }

quickwit-common = { workspace = true }

[features]
testsuite = []

[dev-dependencies]
rand = { workspace = true }
criterion = { workspace = true }

[[bench]]
name = "bench"
harness = false


================================================
FILE: quickwit/quickwit-actors/LICENSE
================================================
The files under the quickwit-actors/ subdirectory are published under the MIT license.

Copyright (c) 2023 by Quickwit Inc.

Permission is hereby granted, free of charge, to any person obtaining a copy of this software and associated documentation files (the "Software"), to deal in the Software without restriction, including without limitation the rights to use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies of the Software, and to permit persons to whom the Software is furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.


================================================
FILE: quickwit/quickwit-actors/README.md
================================================
# Quickwit actors

Yet another actor crate for rust.
This crate exists specifically to answer quickwit needs.
The API may change in the future.

## Objective

- Producing easy-to-reason with code: Quickwit's indexing pipeline is complex as it is.
- Easy to test actors.
- Control over the runtime.

## Non-objective

- High number of message throughput. Most of message exchanged in quickwit
are "large". For instance, it can hold a temp directory with gigabytes worth of data.
The actor dealing with the highest number of messages are the indexer and sources.
One message then typically holds a batch of records.

# Features

- Actor message box
- The framework is meant to run asynchronous actors by default, but it can also run actors that are blocking for long amount of time. The message handler methods are technically asynchronous in both case, but the `Actor::runner` method makes it possible to run an actor with blocking code on a dedicated thread.
- A scheduler actor that makes it possible to mock simulate time.

# Example

```rust
use std::time::Duration;
use async_trait::async_trait;
use quickwit_actors::{Handler, Actor, Universe, ActorContext, ActorExitStatus, Mailbox};

#[derive(Default)]
struct PingReceiver;

impl Actor for PingReceiver {
    type ObservableState = ();
    fn observable_state(&self) -> Self::ObservableState {}
}

#[async_trait]
impl Handler<Ping> for PingReceiver {
    type Reply = String;
    async fn handle(
        &mut self,
        _msg: Ping,
        _ctx: &ActorContext<Self>,
    ) -> Result<String, ActorExitStatus> {
        Ok("Pong".to_string())
    }
}

struct PingSender {
    peer: Mailbox<PingReceiver>,
}

#[derive(Debug)]
struct Loop;

#[derive(Debug)]
struct Ping;

#[async_trait]
impl Actor for PingSender {
    type ObservableState = ();
    fn observable_state(&self) -> Self::ObservableState {}

    async fn initialize(&mut self, ctx: &ActorContext<Self>) -> Result<(),ActorExitStatus> {
        ctx.send_self_message(Loop).await?;
        Ok(())
    }
}

#[async_trait]
impl Handler<Loop> for PingSender {
    type Reply = ();

    async fn handle(
        &mut self,
        _: Loop,
        ctx: &ActorContext<Self>,
    ) -> Result<(), ActorExitStatus> {
        let reply_msg = ctx.ask(&self.peer, Ping).await.unwrap();
        println!("{reply_msg}");
        ctx.schedule_self_msg(Duration::from_secs(1), Loop).await;
        Ok(())
    }
}

#[tokio::main]
async fn main() {
    let universe = Universe::new();

    let (recv_mailbox, _) =
        universe.spawn_actor(PingReceiver::default()).spawn();

    let ping_sender = PingSender { peer: recv_mailbox };
    let (_, ping_sender_handler) = universe.spawn_actor(ping_sender).spawn();

    ping_sender_handler.join().await;
}
```


================================================
FILE: quickwit/quickwit-actors/benches/bench.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use async_trait::async_trait;
use criterion::{BenchmarkId, Criterion, criterion_group, criterion_main};
use quickwit_actors::{Actor, ActorContext, ActorExitStatus, Handler, Universe};

#[derive(Default)]
struct DoNothingActor<const YIELD_AFTER_EACH_MESSAGE: bool>(u64);

#[async_trait]
impl<const YIELD_AFTER_EACH_MESSAGE: bool> Actor for DoNothingActor<YIELD_AFTER_EACH_MESSAGE> {
    type ObservableState = u64;

    fn observable_state(&self) -> u64 {
        self.0
    }

    fn yield_after_each_message(&self) -> bool {
        YIELD_AFTER_EACH_MESSAGE
    }
}

#[derive(Debug)]
struct AddMessage(u64);

#[async_trait]
impl<const YIELD_AFTER_EACH_MESSAGE: bool> Handler<AddMessage>
    for DoNothingActor<YIELD_AFTER_EACH_MESSAGE>
{
    type Reply = ();

    async fn handle(
        &mut self,
        msg: AddMessage,
        _ctx: &ActorContext<Self>,
    ) -> Result<(), ActorExitStatus> {
        self.0 += msg.0;
        Ok(())
    }
}

async fn actor_bench_code<const YIELD_AFTER_EACH_MESSAGE: bool>(num_messages: usize) {
    let universe = Universe::default();
    let actor: DoNothingActor<YIELD_AFTER_EACH_MESSAGE> = DoNothingActor::default();
    let (mailbox, handle) = universe.spawn_builder().spawn(actor);
    for _ in 0..num_messages {
        mailbox.send_message(AddMessage(1)).await.unwrap();
    }
    drop(mailbox);
    let (_, total) = handle.join().await;
    assert_eq!(total, num_messages as u64);
}

async fn flume_bench_code(num_messages: usize) {
    let (tx, rx) = flume::unbounded::<AddMessage>();
    for _ in 0..num_messages {
        tx.send_async(AddMessage(1)).await.unwrap();
    }
    let join = tokio::task::spawn(async move {
        let mut sum = 0;
        while rx.recv_async().await.is_ok() {
            sum += 1;
        }
        sum
    });
    drop(tx);
    let total = join.await.unwrap();
    assert_eq!(total, num_messages as u64);
}

async fn chan_with_priority_bench_code(num_messages: usize) {
    let (tx, rx) =
        quickwit_actors::channel_with_priority::channel(quickwit_actors::QueueCapacity::Unbounded);
    for _ in 0..num_messages {
        tx.send_low_priority(AddMessage(1)).await.unwrap();
    }
    let join = tokio::task::spawn(async move {
        let mut sum = 0;
        while rx.recv().await.is_ok() {
            sum += 1;
        }
        sum
    });
    drop(tx);
    let total = join.await.unwrap();
    assert_eq!(total, num_messages as u64);
}

fn message_throughput(c: &mut Criterion) {
    let num_messages = [10_000]; // [1, 1_000, 10_000]
    for num_messages in num_messages {
        c.bench_with_input(
            BenchmarkId::new(
                "unlimited_capacity_actors_yield_after_each_message",
                num_messages,
            ),
            &num_messages,
            |b, &num_messages| {
                // Insert a call to `to_async` to convert the bencher to async mode.
                // The timing loops are the same as with the normal bencher.
                let runtime = tokio::runtime::Builder::new_multi_thread()
                    .enable_all()
                    .build()
                    .unwrap();
                b.to_async(runtime)
                    .iter(|| actor_bench_code::<true>(num_messages));
            },
        );
        c.bench_with_input(
            BenchmarkId::new(
                "unlimited_capacity_actors_no_yield_after_each_message",
                num_messages,
            ),
            &num_messages,
            |b, &num_messages| {
                // Insert a call to `to_async` to convert the bencher to async mode.
                // The timing loops are the same as with the normal bencher.
                let runtime = tokio::runtime::Builder::new_multi_thread()
                    .enable_all()
                    .build()
                    .unwrap();
                b.to_async(runtime)
                    .iter(|| actor_bench_code::<false>(num_messages));
            },
        );
        c.bench_with_input(
            BenchmarkId::new("unlimited_capacity_flume", num_messages),
            &num_messages,
            |b, &num_messages| {
                // Insert a call to `to_async` to convert the bencher to async mode.
                // The timing loops are the same as with the normal bencher.
                let runtime = tokio::runtime::Builder::new_multi_thread()
                    .enable_all()
                    .build()
                    .unwrap();
                b.to_async(runtime).iter(|| flume_bench_code(num_messages));
            },
        );
        c.bench_with_input(
            BenchmarkId::new("unlimited_capacity_chan_with_priority", num_messages),
            &num_messages,
            |b, &num_messages| {
                // Insert a call to `to_async` to convert the bencher to async mode.
                // The timing loops are the same as with the normal bencher.
                let runtime = tokio::runtime::Builder::new_multi_thread()
                    .enable_all()
                    .build()
                    .unwrap();
                b.to_async(runtime)
                    .iter(|| chan_with_priority_bench_code(num_messages));
            },
        );
    }
}

criterion_group!(benches, message_throughput);
criterion_main!(benches);


================================================
FILE: quickwit/quickwit-actors/examples/ping_actor.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::time::Duration;

use async_trait::async_trait;
use quickwit_actors::{Actor, ActorContext, ActorExitStatus, Handler, Mailbox, Universe};
use rand::prelude::IteratorRandom;

struct PingReceiver {
    name: &'static str,
    num_ping_received: usize,
}

impl PingReceiver {
    pub fn with_name(name: &'static str) -> Self {
        PingReceiver {
            name,
            num_ping_received: 0,
        }
    }
}

impl Actor for PingReceiver {
    type ObservableState = usize;

    fn observable_state(&self) -> Self::ObservableState {
        self.num_ping_received
    }
}

#[async_trait]
impl Handler<Ping> for PingReceiver {
    type Reply = String;
    async fn handle(
        &mut self,
        _msg: Ping,
        _ctx: &ActorContext<Self>,
    ) -> Result<String, ActorExitStatus> {
        self.num_ping_received += 1;
        Ok(format!(
            "Actor `{}` received {} pings",
            self.name, self.num_ping_received
        ))
    }
}

// ------------------

#[derive(Default)]
struct PingSender {
    peers: Vec<Mailbox<PingReceiver>>,
    num_ping_emitted: usize,
}

#[derive(Debug)]
struct Loop;

#[derive(Debug)]
struct Ping;

#[derive(Debug)]
pub struct AddPeer(Mailbox<PingReceiver>);

#[async_trait]
impl Actor for PingSender {
    type ObservableState = ();
    fn observable_state(&self) -> Self::ObservableState {}

    async fn initialize(&mut self, ctx: &ActorContext<Self>) -> Result<(), ActorExitStatus> {
        ctx.send_self_message(Loop).await?;
        Ok(())
    }
}

#[async_trait]
impl Handler<Loop> for PingSender {
    type Reply = ();

    async fn handle(&mut self, _: Loop, ctx: &ActorContext<Self>) -> Result<(), ActorExitStatus> {
        let random_peer_id_opt = (0..self.peers.len()).choose(&mut rand::rng());
        if let Some(random_peer_id) = random_peer_id_opt {
            match ctx.ask(&self.peers[random_peer_id], Ping).await {
                Ok(reply_msg) => {
                    println!("{reply_msg}");
                }
                Err(_send_error) => {
                    self.peers.swap_remove(random_peer_id);
                }
            }
        }
        self.num_ping_emitted += 1;
        if self.num_ping_emitted == 10 {
            return Err(ActorExitStatus::Success);
        }
        ctx.schedule_self_msg(Duration::from_secs(1), Loop);
        Ok(())
    }
}

#[async_trait]
impl Handler<AddPeer> for PingSender {
    type Reply = ();

    async fn handle(
        &mut self,
        add_peer_msg: AddPeer,
        _ctx: &ActorContext<Self>,
    ) -> Result<(), ActorExitStatus> {
        let AddPeer(peer_mailbox) = add_peer_msg;
        self.peers.push(peer_mailbox);
        Ok(())
    }
}

#[tokio::main]
async fn main() {
    let universe = Universe::new();

    let (roger_mailbox, _) = universe
        .spawn_builder()
        .spawn(PingReceiver::with_name("Roger"));

    let (myriam_mailbox, _) = universe
        .spawn_builder()
        .spawn(PingReceiver::with_name("Myriam"));

    let (ping_sender_mailbox, ping_sender_handler) =
        universe.spawn_builder().spawn(PingSender::default());

    ping_sender_mailbox
        .send_message(AddPeer(roger_mailbox))
        .await
        .unwrap();
    ping_sender_mailbox
        .send_message(AddPeer(myriam_mailbox))
        .await
        .unwrap();

    ping_sender_handler.join().await;
}


================================================
FILE: quickwit/quickwit-actors/src/actor.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::any::type_name;
use std::fmt;
use std::sync::Arc;

use async_trait::async_trait;
use thiserror::Error;

use crate::{ActorContext, QueueCapacity, SendError};

/// The actor exit status represents the outcome of the execution of an actor,
/// after the end of the execution.
///
/// It is in many ways, similar to the exit status code of a program.
#[derive(Clone, Debug, Error)]
pub enum ActorExitStatus {
    /// The actor successfully exited.
    ///
    /// It happens either because:
    /// - all of the existing mailboxes were dropped and the actor message queue was exhausted. No
    ///   new message could ever arrive to the actor. (This exit is triggered by the framework.) or
    /// - the actor `process_message` method returned `Err(ExitStatusCode::Success)`. (This exit is
    ///   triggered by the actor implementer.)
    ///
    /// (This is equivalent to exit status code 0.)
    /// Note that this is not really an error.
    #[error("success")]
    Success,

    /// The actor was asked to gracefully shutdown.
    ///
    /// (Semantically equivalent to exit status code 130, triggered by SIGINT aka Ctrl-C, or
    /// SIGQUIT)
    #[error("quit")]
    Quit,

    /// The actor tried to send a message to a dowstream actor and failed.
    /// The logic ruled that the actor should be killed.
    ///
    /// (Semantically equivalent to exit status code 141, triggered by SIGPIPE)
    #[error("downstream actor exited")]
    DownstreamClosed,

    /// The actor was killed.
    ///
    /// It can happen because:
    /// - it received `Command::Kill`.
    /// - its kill switch was activated.
    ///
    /// (Semantically equivalent to exit status code 137, triggered by SIGKILL)
    #[error("killed")]
    Killed,

    /// An unexpected error happened while processing a message.
    #[error("failure(cause={0:?})")]
    Failure(Arc<anyhow::Error>),

    /// The thread or the task executing the actor loop panicked.
    #[error("panicked")]
    Panicked,
}

impl From<anyhow::Error> for ActorExitStatus {
    fn from(err: anyhow::Error) -> Self {
        ActorExitStatus::Failure(Arc::new(err))
    }
}

impl ActorExitStatus {
    pub fn is_success(&self) -> bool {
        matches!(self, ActorExitStatus::Success)
    }
}

impl From<SendError> for ActorExitStatus {
    fn from(_: SendError) -> Self {
        ActorExitStatus::DownstreamClosed
    }
}

/// An actor has an internal state and processes a stream of messages.
/// Each actor has a mailbox where the messages are enqueued before being processed.
///
/// While processing a message, the actor typically
/// - update its state;
/// - emits one or more messages to other actors.
#[async_trait]
pub trait Actor: Send + Sized + 'static {
    /// Piece of state that can be copied for assert in unit test, admin, etc.
    type ObservableState: fmt::Debug + serde::Serialize + Send + Sync + Clone;
    /// A name identifying the type of actor.
    ///
    /// Ideally respect the `CamelCase` convention.
    ///
    /// It does not need to be "instance-unique", and can be the name of
    /// the actor implementation.
    fn name(&self) -> String {
        type_name::<Self>().to_string()
    }

    /// The runner method makes it possible to decide the environment
    /// of execution of the Actor.
    ///
    /// Actor with a handler that may block for more than 50 microseconds
    /// should use the `ActorRunner::DedicatedThread`.
    fn runtime_handle(&self) -> tokio::runtime::Handle {
        tokio::runtime::Handle::current()
    }

    /// If set to true, the actor will yield after every single
    /// message.
    ///
    /// For actors that are calling `.await` regularly,
    /// returning `false` can yield better performance.
    fn yield_after_each_message(&self) -> bool {
        true
    }

    /// The Actor's incoming mailbox queue capacity. It is set when the actor is spawned.
    fn queue_capacity(&self) -> QueueCapacity {
        QueueCapacity::Unbounded
    }

    /// Extracts an observable state. Useful for unit tests, and admin UI.
    ///
    /// This function should return quickly.
    fn observable_state(&self) -> Self::ObservableState;

    /// Initialize is called before running the actor.
    ///
    /// This function is useful for instance to schedule an initial message in a looping
    /// actor.
    ///
    /// It can be compared just to an implicit Initial message.
    ///
    /// Returning an ActorExitStatus will therefore have the same effect as if it
    /// was in `process_message` (e.g. the actor will stop, the finalize method will be called.
    /// the kill switch may be activated etc.)
    async fn initialize(&mut self, _ctx: &ActorContext<Self>) -> Result<(), ActorExitStatus> {
        Ok(())
    }

    /// This function is called after a series of one, or several messages have been processed and
    /// no more message is available.
    ///
    /// It is a great place to have the actor "sleep".
    ///
    /// Quickwit's Indexer actor for instance use `on_drained_messages` to
    /// schedule indexing in such a way that an indexer drains all of its
    /// available messages and sleeps for some amount of time.
    async fn on_drained_messages(
        &mut self,
        _ctx: &ActorContext<Self>,
    ) -> Result<(), ActorExitStatus> {
        Ok(())
    }

    /// Hook  that can be set up to define what should happen upon actor exit.
    /// This hook is called only once.
    ///
    /// It is always called regardless of the reason why the actor exited.
    /// The exit status is passed as an argument to make it possible to act conditionally
    /// upon it.
    /// For instance, it is often better to do as little work as possible on a killed actor.
    /// It can be done by checking the `exit_status` and performing an early-exit if it is
    /// equal to `ActorExitStatus::Killed`.
    async fn finalize(
        &mut self,
        _exit_status: &ActorExitStatus,
        _ctx: &ActorContext<Self>,
    ) -> anyhow::Result<()> {
        Ok(())
    }
}

/// Message handler that allows actor to defer the reply
#[async_trait::async_trait]
pub trait DeferableReplyHandler<M>: Actor {
    type Reply: Send + 'static;

    async fn handle_message(
        &mut self,
        message: M,
        reply: impl FnOnce(Self::Reply) + Send + Sync + 'static,
        ctx: &ActorContext<Self>,
    ) -> Result<(), ActorExitStatus>
    where
        M: Send + 'static;
}

/// Message handler that requires actor to provide immediate response
#[async_trait::async_trait]
pub trait Handler<M>: Actor {
    type Reply: Send + 'static;

    /// Processes a message.
    ///
    /// If an exit status is returned as an error, the actor will exit.
    /// It will stop processing more message, the finalize method will be called,
    /// and its exit status will be the one defined in the error.
    async fn handle(
        &mut self,
        message: M,
        ctx: &ActorContext<Self>,
    ) -> Result<Self::Reply, ActorExitStatus>;
}

#[async_trait::async_trait]
impl<H, M> DeferableReplyHandler<M> for H
where H: Handler<M>
{
    type Reply = H::Reply;

    async fn handle_message(
        &mut self,
        message: M,
        reply: impl FnOnce(Self::Reply) + Send + 'static,
        ctx: &ActorContext<Self>,
    ) -> Result<(), ActorExitStatus>
    where
        M: Send + 'static,
    {
        self.handle(message, ctx).await.map(reply)
    }
}


================================================
FILE: quickwit/quickwit-actors/src/actor_context.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::convert::Infallible;
use std::fmt;
use std::future::Future;
use std::ops::Deref;
use std::sync::Arc;
use std::sync::atomic::{AtomicBool, Ordering};
use std::time::Duration;

use quickwit_common::metrics::IntCounter;
use quickwit_common::{KillSwitch, Progress, ProtectedZoneGuard};
use tokio::sync::{oneshot, watch};
use tracing::{debug, error};

#[cfg(any(test, feature = "testsuite"))]
use crate::Universe;
use crate::actor_state::AtomicState;
use crate::registry::ActorRegistry;
use crate::spawn_builder::{SpawnBuilder, SpawnContext};
use crate::{
    Actor, ActorExitStatus, ActorState, AskError, Command, DeferableReplyHandler, Mailbox,
    SendError, TrySendError,
};

// TODO hide all of this public stuff
pub struct ActorContext<A: Actor> {
    inner: Arc<ActorContextInner<A>>,
}

impl<A: Actor> Clone for ActorContext<A> {
    fn clone(&self) -> Self {
        ActorContext {
            inner: self.inner.clone(),
        }
    }
}

impl<A: Actor> Deref for ActorContext<A> {
    type Target = ActorContextInner<A>;

    fn deref(&self) -> &Self::Target {
        self.inner.as_ref()
    }
}

pub struct ActorContextInner<A: Actor> {
    spawn_ctx: SpawnContext,
    self_mailbox: Mailbox<A>,
    progress: Progress,
    actor_state: AtomicState,
    backpressure_micros_counter_opt: Option<IntCounter>,
    observable_state_tx: watch::Sender<A::ObservableState>,
    // Boolean marking the presence of an observe message in the actor's high priority queue.
    observe_enqueued: AtomicBool,
}

impl<A: Actor> ActorContext<A> {
    pub(crate) fn new(
        self_mailbox: Mailbox<A>,
        spawn_ctx: SpawnContext,
        observable_state_tx: watch::Sender<A::ObservableState>,
        backpressure_micros_counter_opt: Option<IntCounter>,
    ) -> Self {
        ActorContext {
            inner: ActorContextInner {
                self_mailbox,
                spawn_ctx,
                progress: Progress::default(),
                actor_state: AtomicState::default(),
                observable_state_tx,
                backpressure_micros_counter_opt,
                observe_enqueued: AtomicBool::new(false),
            }
            .into(),
        }
    }

    pub fn spawn_ctx(&self) -> &SpawnContext {
        &self.spawn_ctx
    }

    /// Sleeps for a given amount of time.
    ///
    /// That sleep is measured by the universe scheduler, which means that it can be
    /// shortened if `Universe::simulate_sleep(..)` is used.
    ///
    /// While sleeping, an actor is NOT protected from its supervisor.
    /// It is up to the user to call `ActorContext::protect_future(..)`.
    pub async fn sleep(&self, duration: Duration) {
        let scheduler_client = &self.spawn_ctx().scheduler_client;
        scheduler_client.dec_no_advance_time();
        scheduler_client.sleep(duration).await;
        scheduler_client.inc_no_advance_time();
    }

    #[cfg(any(test, feature = "testsuite"))]
    pub fn for_test(
        universe: &Universe,
        actor_mailbox: Mailbox<A>,
        observable_state_tx: watch::Sender<A::ObservableState>,
    ) -> Self {
        Self::new(
            actor_mailbox,
            universe.spawn_ctx.clone(),
            observable_state_tx,
            None,
        )
    }

    pub fn mailbox(&self) -> &Mailbox<A> {
        &self.self_mailbox
    }

    pub(crate) fn registry(&self) -> &ActorRegistry {
        &self.spawn_ctx.registry
    }

    pub fn actor_instance_id(&self) -> &str {
        self.mailbox().actor_instance_id()
    }

    /// This function returns a guard that prevents any supervisor from identifying the
    /// actor as dead.
    /// The protection ends when the `ProtectZoneGuard` is dropped.
    ///
    /// In an ideal world, you should never need to call this function.
    /// It is only useful in some corner cases, like calling a long blocking
    /// from an external library that you trust.
    pub fn protect_zone(&self) -> ProtectedZoneGuard {
        self.progress.protect_zone()
    }

    /// Executes a future in a protected zone.
    pub async fn protect_future<Fut, T>(&self, future: Fut) -> T
    where Fut: Future<Output = T> {
        let _guard = self.protect_zone();
        future.await
    }

    /// Cooperatively yields, while keeping the actor protected.
    pub async fn yield_now(&self) {
        self.protect_future(tokio::task::yield_now()).await;
    }

    /// Gets a copy of the actor kill switch.
    /// This should rarely be used.
    ///
    /// For instance, when quitting from the process_message function, prefer simply
    /// returning `Error(ActorExitStatus::Failure(..))`
    pub fn kill_switch(&self) -> &KillSwitch {
        &self.spawn_ctx.kill_switch
    }

    #[must_use]
    pub fn progress(&self) -> &Progress {
        &self.progress
    }

    pub fn spawn_actor<SpawnedActor: Actor>(&self) -> SpawnBuilder<SpawnedActor> {
        self.spawn_ctx.clone().spawn_builder()
    }

    /// Records some progress.
    /// This function is only useful when implementing actors that may take more than
    /// `HEARTBEAT` to process a single message.
    /// In that case, you can call this function in the middle of the process_message method
    /// to prevent the actor from being identified as blocked or dead.
    pub fn record_progress(&self) {
        self.progress.record_progress();
    }

    pub(crate) fn state(&self) -> ActorState {
        self.actor_state.get_state()
    }

    pub fn pause(&self) {
        self.actor_state.pause();
    }

    pub(crate) fn resume(&self) {
        self.actor_state.resume();
    }

    /// Sets the queue as observed and returns the previous value.
    /// This method is used to make sure we do not have Observe messages
    /// stacking up in the observe queue.
    pub(crate) fn set_observe_enqueued_and_return_previous(&self) -> bool {
        self.observe_enqueued.swap(true, Ordering::Relaxed)
    }

    /// Updates the observable state of the actor.
    pub fn observe(&self, actor: &mut A) -> A::ObservableState {
        let obs_state = actor.observable_state();
        self.inner.observe_enqueued.store(false, Ordering::Relaxed);
        let _ = self.observable_state_tx.send(obs_state.clone());
        obs_state
    }

    pub(crate) fn exit(&self, exit_status: &ActorExitStatus) {
        self.actor_state.exit(exit_status.is_success());
        if should_activate_kill_switch(exit_status) {
            error!(actor=%self.actor_instance_id(), exit_status=?exit_status, "exit activating-kill-switch");
            self.kill_switch().kill();
        }
    }

    /// Posts a message in an actor's mailbox.
    ///
    /// This method does not wait for the message to be handled by the
    /// target actor. However, it returns a oneshot receiver that the caller
    /// that makes it possible to `.await` it.
    /// If the reply is important, chances are the `.ask(...)` method is
    /// more indicated.
    ///
    /// Dropping the receiver channel will not cancel the
    /// processing of the message. It is a very common usage.
    /// In fact most actors are expected to send message in a
    /// fire-and-forget fashion.
    ///
    /// Regular messages (as opposed to commands) are queued and guaranteed
    /// to be processed in FIFO order.
    ///
    /// This method hides logic to prevent an actor from being identified
    /// as frozen if the destination actor channel is saturated, and we
    /// are simply experiencing back pressure.
    pub async fn send_message<DestActor, M>(
        &self,
        mailbox: &Mailbox<DestActor>,
        msg: M,
    ) -> Result<oneshot::Receiver<DestActor::Reply>, SendError>
    where
        DestActor: DeferableReplyHandler<M>,
        M: fmt::Debug + Send + 'static,
    {
        let _guard = self.protect_zone();
        debug!(from=%self.self_mailbox.actor_instance_id(), send=%mailbox.actor_instance_id(), msg=?msg);
        mailbox
            .send_message_with_backpressure_counter(
                msg,
                self.backpressure_micros_counter_opt.as_ref(),
            )
            .await
    }

    pub async fn ask<DestActor, M, T>(
        &self,
        mailbox: &Mailbox<DestActor>,
        msg: M,
    ) -> Result<T, AskError<Infallible>>
    where
        DestActor: DeferableReplyHandler<M, Reply = T>,
        M: fmt::Debug + Send + 'static,
    {
        let _guard = self.protect_zone();
        debug!(from=%self.self_mailbox.actor_instance_id(), send=%mailbox.actor_instance_id(), msg=?msg, "ask");
        mailbox
            .ask_with_backpressure_counter(msg, self.backpressure_micros_counter_opt.as_ref())
            .await
    }

    /// Similar to `send_message`, except this method
    /// waits asynchronously for the actor reply.
    pub async fn ask_for_res<DestActor, M, T, E>(
        &self,
        mailbox: &Mailbox<DestActor>,
        msg: M,
    ) -> Result<T, AskError<E>>
    where
        DestActor: DeferableReplyHandler<M, Reply = Result<T, E>>,
        M: fmt::Debug + Send + Sync + 'static,
        E: fmt::Debug,
    {
        let _guard = self.protect_zone();
        debug!(from=%self.self_mailbox.actor_instance_id(), send=%mailbox.actor_instance_id(), msg=?msg, "ask");
        mailbox.ask_for_res(msg).await
    }

    /// Send the Success message to terminate the destination actor with the Success exit status.
    ///
    /// The message is queued like any regular message, so that pending messages will be processed
    /// first.
    pub async fn send_exit_with_success<Dest: Actor>(
        &self,
        mailbox: &Mailbox<Dest>,
    ) -> Result<(), SendError> {
        let _guard = self.protect_zone();
        debug!(from=%self.self_mailbox.actor_instance_id(), to=%mailbox.actor_instance_id(), "success");
        mailbox.send_message(Command::ExitWithSuccess).await?;
        Ok(())
    }

    /// Sends a message to an actor's own mailbox.
    ///
    /// Warning: This method is dangerous as it can very easily
    /// cause a deadlock.
    pub async fn send_self_message<M>(
        &self,
        msg: M,
    ) -> Result<oneshot::Receiver<A::Reply>, SendError>
    where
        A: DeferableReplyHandler<M>,
        M: 'static + Sync + Send + fmt::Debug,
    {
        debug!(self=%self.self_mailbox.actor_instance_id(), msg=?msg, "self_send");
        self.self_mailbox.send_message(msg).await
    }

    /// Attempts to send a message to itself.
    /// The message will be queue to self's low_priority queue.
    ///
    /// Warning: This method will always fail if
    /// an actor has a capacity of 0.
    pub fn try_send_self_message<M>(
        &self,
        msg: M,
    ) -> Result<oneshot::Receiver<A::Reply>, TrySendError<M>>
    where
        A: DeferableReplyHandler<M>,
        M: 'static + Sync + Send + fmt::Debug,
    {
        self.self_mailbox.try_send_message(msg)
    }

    /// Schedules a message that will be sent to the high-priority queue of the
    /// actor Mailbox once `after_duration` has elapsed.
    ///
    /// Note that this holds a reference to the actor mailbox until the message
    /// is actually sent.
    pub fn schedule_self_msg<M>(&self, after_duration: Duration, message: M)
    where
        A: DeferableReplyHandler<M>,
        M: Sync + Send + std::fmt::Debug + 'static,
    {
        let self_mailbox = self.mailbox().clone();
        let callback = move || {
            let _ = self_mailbox.send_message_with_high_priority(message);
        };
        self.spawn_ctx().schedule_event(callback, after_duration);
    }
}

/// If an actor exits in an unexpected manner, its kill
/// switch will be activated, and all other actors under the same
/// kill switch will be killed.
fn should_activate_kill_switch(exit_status: &ActorExitStatus) -> bool {
    match exit_status {
        ActorExitStatus::DownstreamClosed => true,
        ActorExitStatus::Failure(_) => true,
        ActorExitStatus::Panicked => true,
        ActorExitStatus::Success => false,
        ActorExitStatus::Quit => false,
        ActorExitStatus::Killed => false,
    }
}


================================================
FILE: quickwit/quickwit-actors/src/actor_handle.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::fmt;
use std::ops::Deref;

use serde::Serialize;
use tokio::sync::{oneshot, watch};
use tracing::error;

use crate::actor_state::ActorState;
use crate::command::Observe;
use crate::mailbox::Priority;
use crate::observation::ObservationType;
use crate::registry::ActorJoinHandle;
use crate::{Actor, ActorContext, ActorExitStatus, Command, Mailbox, Observation};

/// An Actor Handle serves as an address to communicate with an actor.
pub struct ActorHandle<A: Actor> {
    actor_context: ActorContext<A>,
    last_state: watch::Receiver<A::ObservableState>,
    join_handle: ActorJoinHandle,
}

/// Describes the health of a given actor.
#[derive(Clone, Eq, PartialEq, Debug, Hash, Serialize)]
pub enum Health {
    /// The actor is running and behaving as expected.
    Healthy,
    /// No progress was registered, or the process terminated with an error
    FailureOrUnhealthy,
    /// The actor terminated successfully.
    Success,
}

/// Message received by health probe handlers.
#[derive(Clone, Debug)]
pub struct Healthz;

impl<A: Actor> fmt::Debug for ActorHandle<A> {
    fn fmt(&self, formatter: &mut fmt::Formatter) -> fmt::Result {
        formatter
            .debug_struct("ActorHandle")
            .field("name", &self.actor_context.actor_instance_id())
            .finish()
    }
}

pub trait Supervisable {
    fn name(&self) -> &str;

    /// Check for the ActorState (has it terminated?), and provided `check_for_progress`
    /// is set to `true`, it will also check for the progress of the actor.
    fn check_health(&self, check_for_progress: bool) -> Health;

    fn state(&self) -> ActorState;
}

impl<A: Actor> Supervisable for ActorHandle<A> {
    fn name(&self) -> &str {
        self.actor_context.actor_instance_id()
    }

    fn state(&self) -> ActorState {
        self.actor_context.state()
    }

    /// Harvests the health of the actor by checking its state (see [`ActorState`]) and,
    /// provided `check_for_progress` is set to true, it will check its progress too
    /// (see `Progress`).
    ///
    /// When `check_for_progress` is set to true, calling this method resets its progress state
    /// to "no update" (see `ProgressState`). As a consequence, only one supervisor or probe
    /// should periodically invoke this method during the lifetime of the actor.
    fn check_health(&self, check_for_progress: bool) -> Health {
        let actor_state = self.state();
        if actor_state == ActorState::Success {
            return Health::Success;
        }
        if actor_state == ActorState::Failure {
            error!(actor = self.name(), "actor-exit-without-success");
            return Health::FailureOrUnhealthy;
        }
        if !check_for_progress
            || self
                .actor_context
                .progress()
                .registered_activity_since_last_call()
        {
            Health::Healthy
        } else {
            error!(actor = self.name(), "actor-timeout");
            Health::FailureOrUnhealthy
        }
    }
}

impl<A: Actor> ActorHandle<A> {
    pub(crate) fn new(
        last_state: watch::Receiver<A::ObservableState>,
        join_handle: ActorJoinHandle,
        actor_context: ActorContext<A>,
    ) -> Self {
        ActorHandle {
            actor_context,
            last_state,
            join_handle,
        }
    }

    pub fn state(&self) -> ActorState {
        self.actor_context.state()
    }

    /// Process all of the pending messages, and returns a snapshot of
    /// the observable state of the actor after this.
    ///
    /// This method is mostly useful for tests.
    ///
    /// To actually observe the state of an actor for ops purpose,
    /// prefer using the `.observe()` method.
    ///
    /// This method timeout if reaching the end of the message takes more than an HEARTBEAT.
    pub async fn process_pending_and_observe(&self) -> Observation<A::ObservableState> {
        self.observe_with_priority(Priority::Low).await
    }

    /// Observe the current state.
    ///
    /// The observation will be scheduled as a high priority message, therefore it will be executed
    /// after the current active message and the current command queue have been processed.
    ///
    /// This method does not do anything to avoid Observe messages from stacking up.
    /// In supervisors, prefer using `refresh_observation`.
    pub async fn observe(&self) -> Observation<A::ObservableState> {
        self.observe_with_priority(Priority::High).await
    }

    /// Triggers an observation.
    /// It is scheduled as a high priority
    /// message, and will hence be executed as soon as possible.
    ///
    /// This method does not enqueue an Observe request if there is already one in
    /// the queue.
    ///
    /// The resulting observation can eventually be accessible using the
    /// observation watch channel.
    ///
    /// This function returning does NOT mean that the observation was executed.
    pub fn refresh_observe(&self) {
        let observation_already_enqueued = self
            .actor_context
            .set_observe_enqueued_and_return_previous();
        if !observation_already_enqueued {
            let _ = self
                .actor_context
                .mailbox()
                .send_message_with_high_priority(Observe);
        }
    }

    async fn observe_with_priority(&self, priority: Priority) -> Observation<A::ObservableState> {
        if !self.actor_context.state().is_exit() {
            if let Ok(oneshot_rx) = self
                .actor_context
                .mailbox()
                .send_message_with_priority(Observe, priority)
                .await
            {
                // The timeout is required here. If the actor fails, its inbox is properly dropped
                // but the send channel might actually prevent the onechannel
                // Receiver from being dropped.
                return self.wait_for_observable_state_callback(oneshot_rx).await;
            } else {
                error!(
                    actor_id=%self.actor_context.actor_instance_id(),
                    "Failed to send observe message"
                );
            }
        }
        let state = self.last_observation().clone();
        Observation {
            obs_type: ObservationType::PostMortem,
            state,
        }
    }

    /// Pauses the actor. The actor will stop processing messages from the low priority
    /// channel, but its work can be resumed by calling the method `.resume()`.
    pub fn pause(&self) {
        let _ = self
            .actor_context
            .mailbox()
            .send_message_with_high_priority(Command::Pause);
    }

    /// Resumes a paused actor.
    pub fn resume(&self) {
        let _ = self
            .actor_context
            .mailbox()
            .send_message_with_high_priority(Command::Resume);
    }

    /// Kills the actor. Its finalize function will still be called.
    ///
    /// This function also actionnates the actor kill switch.
    ///
    /// The other difference with quit is the exit status. It is important,
    /// as the finalize logic may behave differently depending on the exit status.
    pub async fn kill(self) -> (ActorExitStatus, A::ObservableState) {
        self.actor_context.kill_switch().kill();
        let _ = self
            .actor_context
            .mailbox()
            .send_message_with_high_priority(Command::Nudge);
        self.join().await
    }

    /// Gracefully quit the actor, regardless of whether there are pending messages or not.
    /// Its finalize function will be called.
    ///
    /// The kill switch is not actionated.
    ///
    /// The other difference with kill is the exit status. It is important,
    /// as the finalize logic may behave differently depending on the exit status.
    pub async fn quit(self) -> (ActorExitStatus, A::ObservableState) {
        let _ = self
            .actor_context
            .mailbox()
            .send_message_with_high_priority(Command::Quit);
        self.join().await
    }

    /// Waits until the actor exits by itself. This is the equivalent of `Thread::join`.
    pub async fn join(self) -> (ActorExitStatus, A::ObservableState) {
        let exit_status = self.join_handle.join().await;
        let observation = self.last_state.borrow().clone();
        (exit_status, observation)
    }

    pub fn last_observation(&self) -> impl Deref<Target = A::ObservableState> + '_ {
        self.last_state.borrow()
    }

    async fn wait_for_observable_state_callback(
        &self,
        rx: oneshot::Receiver<A::ObservableState>,
    ) -> Observation<A::ObservableState> {
        let scheduler_client = &self.actor_context.spawn_ctx().scheduler_client;
        let observable_state_or_timeout =
            scheduler_client.timeout(crate::OBSERVE_TIMEOUT, rx).await;
        match observable_state_or_timeout {
            Ok(Ok(state)) => {
                let obs_type = ObservationType::Alive;
                Observation { obs_type, state }
            }
            Ok(Err(_)) => {
                let state = self.last_observation().clone();
                let obs_type = ObservationType::PostMortem;
                Observation { obs_type, state }
            }
            Err(_) => {
                let state = self.last_observation().clone();
                let obs_type = if self.actor_context.state().is_exit() {
                    ObservationType::PostMortem
                } else {
                    ObservationType::Timeout
                };
                Observation { obs_type, state }
            }
        }
    }

    pub fn mailbox(&self) -> &Mailbox<A> {
        self.actor_context.mailbox()
    }
}

#[cfg(test)]
mod tests {
    use std::sync::atomic::{AtomicU32, Ordering};
    use std::time::Duration;

    use async_trait::async_trait;

    use super::*;
    use crate::{Handler, Universe};

    #[derive(Default)]
    struct PanickingActor {
        count: usize,
    }

    impl Actor for PanickingActor {
        type ObservableState = usize;
        fn observable_state(&self) -> usize {
            self.count
        }
    }

    #[derive(Debug)]
    struct Panic;

    #[async_trait]
    impl Handler<Panic> for PanickingActor {
        type Reply = ();
        async fn handle(
            &mut self,
            _message: Panic,
            _ctx: &ActorContext<Self>,
        ) -> Result<(), ActorExitStatus> {
            self.count += 1;
            panic!("Oops");
        }
    }

    #[derive(Default)]
    struct ExitActor {
        count: usize,
    }

    impl Actor for ExitActor {
        type ObservableState = usize;
        fn observable_state(&self) -> usize {
            self.count
        }
    }

    #[derive(Debug)]
    struct Exit;

    #[async_trait]
    impl Handler<Exit> for ExitActor {
        type Reply = ();

        async fn handle(
            &mut self,
            _msg: Exit,
            _ctx: &ActorContext<Self>,
        ) -> Result<(), ActorExitStatus> {
            self.count += 1;
            Err(ActorExitStatus::DownstreamClosed)
        }
    }

    #[tokio::test]
    async fn test_panic_in_actor() -> anyhow::Result<()> {
        let universe = Universe::with_accelerated_time();
        let (mailbox, handle) = universe.spawn_builder().spawn(PanickingActor::default());
        mailbox.send_message(Panic).await?;
        let (exit_status, count) = handle.join().await;
        assert!(matches!(exit_status, ActorExitStatus::Panicked));
        assert!(matches!(count, 1)); //< Upon panick we cannot get a post mortem state.
        Ok(())
    }

    #[tokio::test]
    async fn test_exit() -> anyhow::Result<()> {
        let universe = Universe::with_accelerated_time();
        let (mailbox, handle) = universe.spawn_builder().spawn(ExitActor::default());
        mailbox.send_message(Exit).await?;
        let (exit_status, count) = handle.join().await;
        assert!(matches!(exit_status, ActorExitStatus::DownstreamClosed));
        assert!(matches!(count, 1)); //< Upon panick we cannot get a post mortem state.
        Ok(())
    }

    #[derive(Default)]
    struct ObserveActor {
        observe: AtomicU32,
    }

    #[async_trait]
    impl Actor for ObserveActor {
        type ObservableState = u32;

        fn observable_state(&self) -> u32 {
            self.observe.fetch_add(1, Ordering::Relaxed)
        }

        async fn initialize(&mut self, ctx: &ActorContext<Self>) -> Result<(), ActorExitStatus> {
            ctx.send_self_message(YieldLoop).await?;
            Ok(())
        }
    }

    #[derive(Debug)]
    struct YieldLoop;

    #[async_trait]
    impl Handler<YieldLoop> for ObserveActor {
        type Reply = ();
        async fn handle(
            &mut self,
            _: YieldLoop,
            ctx: &ActorContext<Self>,
        ) -> Result<Self::Reply, ActorExitStatus> {
            ctx.sleep(Duration::from_millis(25)).await; // OBSERVE_TIMEOUT.mul_f32(10.0f32)).await;
            ctx.send_self_message(YieldLoop).await?;
            Ok(())
        }
    }

    #[tokio::test]
    async fn test_observation_debounce() {
        // TODO investigate why Universe::with_accelerated_time() does not work here.
        let universe = Universe::new();
        let (_, actor_handle) = universe.spawn_builder().spawn(ObserveActor::default());
        for _ in 0..10 {
            actor_handle.refresh_observe();
            universe.sleep(Duration::from_millis(10)).await;
        }
        let (_last_obs, num_obs) = actor_handle.quit().await;
        assert!(num_obs < 8);
        universe.assert_quit().await;
    }
}


================================================
FILE: quickwit/quickwit-actors/src/actor_state.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::sync::atomic::{AtomicU32, Ordering};

#[repr(u32)]
#[derive(Clone, Copy, Debug, Eq, PartialEq)]
pub enum ActorState {
    /// Running means that the actor consumes and processes both low priority messages (regular
    /// message) and high priority message commands.
    Running = 0,
    /// Pause means that the actor only consumes and processes high priority messages. Typically
    /// commands as well as scheduled messages.
    Paused = 1,
    /// Success means that the actor exited and cannot return to any other states.
    Success = 2,
    /// Failure means that the actor exited with a failure or panicked.
    Failure = 3,
}

impl From<u32> for ActorState {
    fn from(actor_state_u32: u32) -> Self {
        match actor_state_u32 {
            0 => ActorState::Running,
            1 => ActorState::Paused,
            2 => ActorState::Success,
            3 => ActorState::Failure,
            _ => {
                panic!(
                    "Found forbidden u32 value for ActorState `{actor_state_u32}`. This should \
                     never happen."
                );
            }
        }
    }
}

impl From<ActorState> for AtomicState {
    fn from(state: ActorState) -> Self {
        AtomicState(AtomicU32::from(state as u32))
    }
}

impl ActorState {
    pub fn is_running(&self) -> bool {
        *self == ActorState::Running
    }

    pub fn is_exit(&self) -> bool {
        match self {
            ActorState::Running | ActorState::Paused => false,
            ActorState::Success | ActorState::Failure => true,
        }
    }
}

pub(crate) struct AtomicState(AtomicU32);

impl Default for AtomicState {
    fn default() -> Self {
        AtomicState(AtomicU32::new(ActorState::Running as u32))
    }
}

impl AtomicState {
    pub(crate) fn pause(&self) {
        let _ = self
            .0
            .fetch_update(Ordering::SeqCst, Ordering::SeqCst, |state| {
                if ActorState::from(state).is_running() {
                    return Some(ActorState::Paused as u32);
                }
                None
            });
    }

    pub(crate) fn resume(&self) {
        let _ = self.0.compare_exchange(
            ActorState::Paused as u32,
            ActorState::Running as u32,
            Ordering::SeqCst,
            Ordering::SeqCst,
        );
    }

    pub(crate) fn exit(&self, success: bool) {
        let new_state = if success {
            ActorState::Success
        } else {
            ActorState::Failure
        };
        self.0.fetch_max(new_state as u32, Ordering::Release);
    }

    pub fn get_state(&self) -> ActorState {
        ActorState::from(self.0.load(Ordering::Acquire))
    }
}

#[cfg(test)]
mod tests {
    use super::*;

    enum Operation {
        Pause,
        Resume,
        ExitSuccess,
        ExitFailure,
    }

    impl Operation {
        fn apply(&self, state: &AtomicState) {
            match self {
                Operation::Pause => {
                    state.pause();
                }
                Operation::Resume => state.resume(),
                Operation::ExitSuccess => state.exit(true),
                Operation::ExitFailure => state.exit(false),
            }
        }
    }

    #[track_caller]
    fn test_transition(from_state: ActorState, op: Operation, expected_state: ActorState) {
        let state = AtomicState::from(from_state);
        op.apply(&state);
        assert_eq!(state.get_state(), expected_state);
    }

    #[test]
    fn test_atomic_state_from_running() {
        test_transition(ActorState::Running, Operation::Pause, ActorState::Paused);
        test_transition(ActorState::Running, Operation::Resume, ActorState::Running);
        test_transition(
            ActorState::Running,
            Operation::ExitSuccess,
            ActorState::Success,
        );
        test_transition(ActorState::Paused, Operation::Pause, ActorState::Paused);
        test_transition(ActorState::Paused, Operation::Resume, ActorState::Running);
        test_transition(
            ActorState::Paused,
            Operation::ExitSuccess,
            ActorState::Success,
        );
        test_transition(
            ActorState::Success,
            Operation::ExitFailure,
            ActorState::Failure,
        );

        test_transition(ActorState::Success, Operation::Pause, ActorState::Success);
        test_transition(ActorState::Success, Operation::Resume, ActorState::Success);
        test_transition(
            ActorState::Success,
            Operation::ExitSuccess,
            ActorState::Success,
        );

        test_transition(ActorState::Failure, Operation::Pause, ActorState::Failure);
        test_transition(ActorState::Failure, Operation::Resume, ActorState::Failure);
        test_transition(
            ActorState::Failure,
            Operation::ExitSuccess,
            ActorState::Failure,
        );
        test_transition(
            ActorState::Failure,
            Operation::ExitFailure,
            ActorState::Failure,
        );
    }
}


================================================
FILE: quickwit/quickwit-actors/src/channel_with_priority.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::sync::Mutex;
use std::sync::atomic::{AtomicBool, Ordering};

use flume::TryRecvError;
use thiserror::Error;

#[derive(Default)]
struct LockedOption<T> {
    opt: Mutex<Option<T>>,
    has_val: AtomicBool,
}

impl<T> LockedOption<T> {
    pub fn none() -> Self {
        LockedOption {
            opt: Mutex::new(None),
            has_val: AtomicBool::new(false),
        }
    }

    pub fn is_some(&self) -> bool {
        self.has_val.load(Ordering::Acquire)
    }

    pub fn is_none(&self) -> bool {
        !self.is_some()
    }

    pub fn take(&self) -> Option<T> {
        if !self.has_val.load(Ordering::Acquire) {
            return None;
        }
        let mut lock = self.opt.lock().unwrap();
        let val_opt = lock.take();
        self.has_val.store(false, Ordering::Release);
        val_opt
    }

    pub fn place(&self, val: T) {
        let mut lock = self.opt.lock().unwrap();
        self.has_val.store(true, Ordering::Release);
        *lock = Some(val);
    }
}

#[derive(Debug, Error)]
pub enum SendError {
    #[error("the channel is closed")]
    Disconnected,
    #[error("the channel is full")]
    Full,
}

#[derive(Debug, Error)]
pub enum TrySendError<M> {
    #[error("the channel is closed")]
    Disconnected,
    #[error("the channel is full")]
    Full(M),
}

impl<M> From<flume::TrySendError<M>> for TrySendError<M> {
    fn from(err: flume::TrySendError<M>) -> Self {
        match err {
            flume::TrySendError::Full(msg) => TrySendError::Full(msg),
            flume::TrySendError::Disconnected(_) => TrySendError::Disconnected,
        }
    }
}

#[derive(Clone, Copy, Debug, Error, Eq, PartialEq)]
pub enum RecvError {
    #[error("no message are currently available")]
    NoMessageAvailable,
    #[error("all senders were dropped and no pending messages are in the channel")]
    Disconnected,
}

impl From<flume::RecvTimeoutError> for RecvError {
    fn from(flume_err: flume::RecvTimeoutError) -> Self {
        match flume_err {
            flume::RecvTimeoutError::Timeout => Self::NoMessageAvailable,
            flume::RecvTimeoutError::Disconnected => Self::Disconnected,
        }
    }
}

impl<T> From<flume::SendError<T>> for SendError {
    fn from(_send_error: flume::SendError<T>) -> Self {
        SendError::Disconnected
    }
}

impl<T> From<flume::TrySendError<T>> for SendError {
    fn from(try_send_error: flume::TrySendError<T>) -> Self {
        match try_send_error {
            flume::TrySendError::Full(_) => SendError::Full,
            flume::TrySendError::Disconnected(_) => SendError::Disconnected,
        }
    }
}

#[derive(Clone, Copy, Debug)]
pub enum QueueCapacity {
    Bounded(usize),
    Unbounded,
}

/// Creates a channel with the ability to send high priority messages.
///
/// A high priority message is guaranteed to be consumed before any
/// low priority message sent after it.
pub fn channel<T>(queue_capacity: QueueCapacity) -> (Sender<T>, Receiver<T>) {
    let (high_priority_tx, high_priority_rx) = flume::unbounded();
    let (low_priority_tx, low_priority_rx) = match queue_capacity {
        QueueCapacity::Bounded(cap) => flume::bounded(cap),
        QueueCapacity::Unbounded => flume::unbounded(),
    };
    let receiver = Receiver {
        low_priority_rx,
        high_priority_rx,
        _high_priority_tx: high_priority_tx.clone(),
        pending_low_priority_message: LockedOption::none(),
        _clone_is_forbidden: CloneIsForbidden,
    };
    let sender = Sender {
        low_priority_tx,
        high_priority_tx,
    };
    (sender, receiver)
}

pub struct Sender<T> {
    low_priority_tx: flume::Sender<T>,
    high_priority_tx: flume::Sender<T>,
}

impl<T> Sender<T> {
    pub fn is_disconnected(&self) -> bool {
        self.low_priority_tx.is_disconnected()
    }

    pub fn try_send_low_priority(&self, msg: T) -> Result<(), TrySendError<T>> {
        self.low_priority_tx.try_send(msg)?;
        Ok(())
    }

    pub async fn send_low_priority(&self, msg: T) -> Result<(), SendError> {
        self.low_priority_tx.send_async(msg).await?;
        Ok(())
    }

    pub fn send_high_priority(&self, msg: T) -> Result<(), SendError> {
        self.high_priority_tx.send(msg)?;
        Ok(())
    }
}

// Message to future generations. I created this flag to prevent you
// from naively making a struct cloneable.
// The drop implementation drains the elements in the channel.
struct CloneIsForbidden;

pub struct Receiver<T> {
    low_priority_rx: flume::Receiver<T>,
    high_priority_rx: flume::Receiver<T>,
    _high_priority_tx: flume::Sender<T>,
    pending_low_priority_message: LockedOption<T>,
    _clone_is_forbidden: CloneIsForbidden,
}

impl<T> Drop for Receiver<T> {
    fn drop(&mut self) {
        // Flume strangely (tokio::mpsc does not behave like this for instance)
        // does not drop the message in the channel when all receiver are dropped.
        //
        // They are only dropped when both the receivers AND the sender are dropped.
        // We fix this behavior by drainng the channel upon drop.
        self.high_priority_rx.drain();
        self.low_priority_rx.drain();
    }
}

impl<T> Receiver<T> {
    pub fn is_empty(&self) -> bool {
        self.low_priority_rx.is_empty()
            && self.pending_low_priority_message.is_none()
            && self.high_priority_rx.is_empty()
    }

    pub fn try_recv_high_priority_message(&self) -> Result<T, RecvError> {
        match self.high_priority_rx.try_recv() {
            Ok(msg) => Ok(msg),
            Err(TryRecvError::Disconnected) => {
                unreachable!(
                    "This can never happen, as the high priority Sender is owned by the Receiver."
                );
            }
            Err(TryRecvError::Empty) => {
                if self.low_priority_rx.is_disconnected() {
                    // We check that no new high priority message were sent
                    // in between.
                    if let Ok(msg) = self.high_priority_rx.try_recv() {
                        Ok(msg)
                    } else {
                        Err(RecvError::Disconnected)
                    }
                } else {
                    Err(RecvError::NoMessageAvailable)
                }
            }
        }
    }

    pub fn try_recv(&self) -> Result<T, RecvError> {
        if let Ok(msg) = self.high_priority_rx.try_recv() {
            return Ok(msg);
        }
        if let Some(pending_msg) = self.pending_low_priority_message.take() {
            return Ok(pending_msg);
        }
        match self.low_priority_rx.try_recv() {
            Ok(low_msg) => {
                if let Ok(high_msg) = self.high_priority_rx.try_recv() {
                    self.pending_low_priority_message.place(low_msg);
                    Ok(high_msg)
                } else {
                    Ok(low_msg)
                }
            }
            Err(TryRecvError::Disconnected) => {
                if let Ok(high_msg) = self.high_priority_rx.try_recv() {
                    Ok(high_msg)
                } else {
                    Err(RecvError::Disconnected)
                }
            }
            Err(TryRecvError::Empty) => Err(RecvError::NoMessageAvailable),
        }
    }

    pub async fn recv_high_priority(&self) -> T {
        self.high_priority_rx
            .recv_async()
            .await
            .expect("The Receiver owns the high priority Sender to avoid any disconnection.")
    }

    pub async fn recv(&self) -> Result<T, RecvError> {
        if let Ok(msg) = self.try_recv_high_priority_message() {
            return Ok(msg);
        }
        if let Some(pending_msg) = self.pending_low_priority_message.take() {
            return Ok(pending_msg);
        }
        tokio::select! {
            // We don't really care about fairness here.
            // We will double check if there is a command or not anyway.
            biased;
            high_priority_msg_res = self.high_priority_rx.recv_async() => {
                match high_priority_msg_res {
                    Ok(high_priority_msg) => {
                        Ok(high_priority_msg)
                    },
                    Err(_) => {
                        unreachable!("The Receiver owns the high priority Sender to avoid any disconnection.")
                    },
                }
            }
            low_priority_msg_res = self.low_priority_rx.recv_async() => {
                match low_priority_msg_res {
                    Ok(low_priority_msg) => {
                        if let Ok(high_priority_msg) = self.try_recv_high_priority_message() {
                            self.pending_low_priority_message.place(low_priority_msg);
                            Ok(high_priority_msg)
                        } else {
                            Ok(low_priority_msg)
                        }
                    },
                    Err(flume::RecvError::Disconnected) => {
                        if let Ok(high_priority_msg) = self.try_recv_high_priority_message() {
                            Ok(high_priority_msg)
                        } else {
                            Err(RecvError::Disconnected)
                        }
                    }
                }
           }
        }
    }

    /// Drain all of the pending low priority messages and return them.
    pub fn drain_low_priority(&self) -> Vec<T> {
        let mut messages = Vec::new();
        while let Ok(msg) = self.low_priority_rx.try_recv() {
            messages.push(msg);
        }
        messages
    }
}

#[cfg(test)]
mod tests {
    use std::sync::Arc;
    use std::time::Duration;

    use super::*;

    #[tokio::test]
    async fn test_channel_with_priority_drop_receiver_drop_messages() {
        let arc_high = Arc::new(());
        let arc_low = Arc::new(());
        let (tx, rx) = super::channel(QueueCapacity::Bounded(2));
        tx.send_high_priority(arc_high.clone()).unwrap();
        tx.send_low_priority(arc_low.clone()).await.unwrap();
        assert_eq!(Arc::strong_count(&arc_high), 2);
        assert_eq!(Arc::strong_count(&arc_low), 2);
        drop(rx);
        assert_eq!(Arc::strong_count(&arc_high), 1);
        assert_eq!(Arc::strong_count(&arc_low), 1);
    }

    #[test]
    fn test_locked_option_new_empty() {
        let locked_option: LockedOption<usize> = LockedOption::none();
        assert_eq!(locked_option.take(), None);
    }

    #[test]
    fn test_locked_option_place() {
        let locked_option = LockedOption::none();
        locked_option.place(1);
        assert_eq!(locked_option.take(), Some(1));
    }

    #[test]
    fn test_locked_option_place_twice_keep_last() {
        let locked_option = LockedOption::none();
        locked_option.place(1);
        locked_option.place(2);
        assert_eq!(locked_option.take(), Some(2));
    }

    #[test]
    fn test_locked_option_place_take_twice() {
        let locked_option = LockedOption::none();
        locked_option.place(1);
        assert_eq!(locked_option.take(), Some(1));
        assert_eq!(locked_option.take(), None);
    }

    #[tokio::test]
    async fn test_recv_priority() -> anyhow::Result<()> {
        let (sender, receiver) = super::channel::<usize>(QueueCapacity::Unbounded);
        sender.send_low_priority(1).await?;
        sender.send_high_priority(2)?;
        assert_eq!(receiver.recv().await, Ok(2));
        assert_eq!(receiver.recv().await, Ok(1));
        assert!(
            tokio::time::timeout(Duration::from_millis(50), receiver.recv())
                .await
                .is_err()
        );
        Ok(())
    }

    #[tokio::test]
    async fn test_try_recv() -> anyhow::Result<()> {
        let (sender, receiver) = super::channel::<usize>(QueueCapacity::Unbounded);
        sender.send_low_priority(1).await?;
        assert_eq!(receiver.try_recv(), Ok(1));
        assert_eq!(receiver.try_recv(), Err(RecvError::NoMessageAvailable));
        Ok(())
    }

    #[tokio::test]
    async fn test_try_recv_high_priority() -> anyhow::Result<()> {
        let (sender, receiver) = super::channel::<usize>(QueueCapacity::Unbounded);
        sender.send_low_priority(1).await?;
        assert_eq!(
            receiver.try_recv_high_priority_message(),
            Err(RecvError::NoMessageAvailable)
        );
        Ok(())
    }

    #[tokio::test]
    async fn test_recv_high_priority_ignore_disconnection() -> anyhow::Result<()> {
        let (sender, receiver) = super::channel::<usize>(QueueCapacity::Unbounded);
        std::mem::drop(sender);
        assert!(
            tokio::time::timeout(Duration::from_millis(100), receiver.recv_high_priority())
                .await
                .is_err()
        );
        Ok(())
    }

    #[tokio::test]
    async fn test_recv_disconnect() -> anyhow::Result<()> {
        let (sender, receiver) = super::channel::<usize>(QueueCapacity::Unbounded);
        std::mem::drop(sender);
        assert_eq!(receiver.recv().await, Err(RecvError::Disconnected));
        Ok(())
    }

    #[tokio::test]
    async fn test_recv_timeout_simple() -> anyhow::Result<()> {
        let (_sender, receiver) = super::channel::<usize>(QueueCapacity::Unbounded);
        assert!(matches!(
            receiver.try_recv(),
            Err(RecvError::NoMessageAvailable)
        ));
        Ok(())
    }

    #[tokio::test]
    async fn test_try_recv_priority_corner_case() -> anyhow::Result<()> {
        let (sender, receiver) = super::channel::<usize>(QueueCapacity::Unbounded);
        tokio::task::spawn(async move {
            tokio::time::sleep(Duration::from_millis(10)).await;
            sender.send_high_priority(1)?;
            sender.send_low_priority(2).await?;
            Result::<(), SendError>::Ok(())
        });
        assert_eq!(receiver.recv().await, Ok(1));
        assert_eq!(receiver.try_recv(), Ok(2));
        assert!(matches!(receiver.try_recv(), Err(RecvError::Disconnected)));
        Ok(())
    }

    #[tokio::test]
    async fn test_try_recv_high_low() {
        let (tx, rx) = super::channel::<usize>(QueueCapacity::Unbounded);
        tx.send_low_priority(1).await.unwrap();
        tx.send_high_priority(2).unwrap();
        assert_eq!(rx.try_recv(), Ok(2));
        assert_eq!(rx.try_recv(), Ok(1));
        assert_eq!(rx.try_recv(), Err(RecvError::NoMessageAvailable));
    }

    #[tokio::test]
    async fn test_try_recv_high() {
        let (tx, rx) = super::channel::<usize>(QueueCapacity::Unbounded);
        tx.send_low_priority(1).await.unwrap();
        tx.send_high_priority(2).unwrap();
        assert_eq!(rx.try_recv_high_priority_message(), Ok(2));
        assert_eq!(
            rx.try_recv_high_priority_message(),
            Err(RecvError::NoMessageAvailable)
        );
        assert_eq!(rx.try_recv(), Ok(1));
        assert_eq!(rx.try_recv(), Err(RecvError::NoMessageAvailable));
    }
}


================================================
FILE: quickwit/quickwit-actors/src/command.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use async_trait::async_trait;

use crate::{Actor, ActorContext, ActorExitStatus, Handler};

/// Commands are messages that can be send to control the behavior of an actor.
///
/// They are similar to UNIX signals.
///
/// They are treated with a higher priority than regular actor messages.
#[derive(Debug)]
pub enum Command {
    /// Temporarily pauses the actor. A paused actor only checks
    /// on its high priority channel and still shows "progress". It appears as
    /// healthy to the supervisor.
    ///
    /// Scheduled message are still processed.
    ///
    /// Semantically, it is similar to SIGSTOP.
    Pause,

    /// Resume a paused actor. If the actor was not paused this command
    /// has no effects.
    ///
    /// Semantically, it is similar to SIGCONT.
    Resume,

    /// Stops the actor with a success exit status code.
    ///
    /// Upstream `actors` that terminates should send the `ExitWithSuccess`
    /// command to downstream actors to inform them that there are no more
    /// incoming messages.
    ///
    /// It is similar to `Quit`, except for the resulting exit status.
    ExitWithSuccess,

    /// Asks the actor to gracefully shutdown.
    ///
    /// The actor will stop processing messages and its finalize function will
    /// be called.
    ///
    /// The exit status is then `ActorExitStatus::Quit`.
    ///
    /// This is the equivalent of sending SIGINT/Ctrl-C to a process.
    Quit,

    /// Nudging is a No-op message.
    ///
    /// Its only effect is to wake-up actors that are stuck waiting
    /// for a message.
    ///
    /// This is useful to kill actors properly or for tests.
    /// Actors stuck waiting for a message do not have any timeout to
    /// check for their killswitch signal.
    ///
    ///
    /// Note: Historically, actors used to have a timeout, then
    /// the wake up logic worked using a Kill command.
    /// However, after the introduction of supervision, it became common
    /// to recycle a mailbox.
    ///
    /// After a panic for instance, the supervisor of an actor might kill
    /// it by activating its killswitch and sending a Kill message.
    ///
    /// The respawned actor would receive its predecessor mailbox and
    /// possibly end up process a Kill message as its first message.
    Nudge,
}

#[async_trait]
impl<A: Actor> Handler<Command> for A {
    type Reply = ();

    /// and its exit status will be the one defined in the error.
    async fn handle(
        &mut self,
        command: Command,
        ctx: &ActorContext<Self>,
    ) -> Result<Self::Reply, ActorExitStatus> {
        match command {
            Command::Pause => {
                ctx.pause();
                Ok(())
            }
            Command::ExitWithSuccess => Err(ActorExitStatus::Success),
            Command::Quit => Err(ActorExitStatus::Quit),
            Command::Nudge => Ok(()),
            Command::Resume => {
                ctx.resume();
                Ok(())
            }
        }
    }
}

/// Asks the actor to update its ObservableState.
///
/// The observation is then available using the `ActorHandler::last_observation()`
/// method.
#[derive(Debug)]
pub struct Observe;

#[async_trait]
impl<A: Actor> Handler<Observe> for A {
    type Reply = A::ObservableState;

    async fn handle(
        &mut self,
        _observe: Observe,
        ctx: &ActorContext<Self>,
    ) -> Result<A::ObservableState, ActorExitStatus> {
        Ok(ctx.observe(self))
    }
}


================================================
FILE: quickwit/quickwit-actors/src/envelope.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::any::Any;
use std::fmt;

use async_trait::async_trait;
use tokio::sync::oneshot;

use crate::actor::DeferableReplyHandler;
use crate::scheduler::NoAdvanceTimeGuard;
use crate::{Actor, ActorContext, ActorExitStatus};

/// An `Envelope` is just a way to capture the handler
/// of a message and hide its type.
///
/// Messages can have different types but somehow need to be pushed to a
/// queue with a single type.
/// Before appending, we capture the right handler implementation
/// in the form of a `Box<dyn Envelope>`, and append that to the queue.
pub struct Envelope<A> {
    handler_envelope: Box<dyn EnvelopeT<A>>,
    _no_advance_time_guard: Option<NoAdvanceTimeGuard>,
}

impl<A: Actor> Envelope<A> {
    /// Returns the message as a boxed any.
    ///
    /// This method is only useful in unit tests.
    pub fn message(&mut self) -> Box<dyn Any> {
        self.handler_envelope.message()
    }

    pub fn message_typed<M: 'static>(&mut self) -> Option<M> {
        if let Ok(boxed_msg) = self.handler_envelope.message().downcast::<M>() {
            Some(*boxed_msg)
        } else {
            None
        }
    }

    /// Executes the captured handle function.
    ///
    /// When exiting, also returns the message type name.
    pub async fn handle_message(
        &mut self,
        actor: &mut A,
        ctx: &ActorContext<A>,
    ) -> Result<(), (ActorExitStatus, &'static str)> {
        let handling_res = self.handler_envelope.handle_message(actor, ctx).await;
        if let Err(exit_status) = handling_res {
            return Err((exit_status, self.handler_envelope.message_type_name()));
        }
        Ok(())
    }
}

impl<A: Actor> fmt::Debug for Envelope<A> {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        let msg_str = self.handler_envelope.debug_msg();
        f.debug_tuple("Envelope").field(&msg_str).finish()
    }
}

#[async_trait]
trait EnvelopeT<A: Actor>: Send {
    fn message_type_name(&self) -> &'static str;

    fn debug_msg(&self) -> String;

    /// Returns the message as a boxed any.
    ///
    /// This method is only useful in unit tests.
    fn message(&mut self) -> Box<dyn Any>;

    /// Execute the captured handle function.
    async fn handle_message(
        &mut self,
        actor: &mut A,
        ctx: &ActorContext<A>,
    ) -> Result<(), ActorExitStatus>;
}

#[async_trait]
impl<A, M> EnvelopeT<A> for Option<(oneshot::Sender<A::Reply>, M)>
where
    A: DeferableReplyHandler<M>,
    M: fmt::Debug + Send + 'static,
{
    fn message_type_name(&self) -> &'static str {
        std::any::type_name::<M>()
    }

    fn debug_msg(&self) -> String {
        #[allow(clippy::needless_option_take)]
        if let Some((_response_tx, msg)) = self.as_ref().take() {
            format!("{msg:?}")
        } else {
            "<consumed>".to_string()
        }
    }

    fn message(&mut self) -> Box<dyn Any> {
        if let Some((_, message)) = self.take() {
            Box::new(message)
        } else {
            Box::new(())
        }
    }

    async fn handle_message(
        &mut self,
        actor: &mut A,
        ctx: &ActorContext<A>,
    ) -> Result<(), ActorExitStatus> {
        let (response_tx, msg) = self
            .take()
            .expect("handle_message should never be called twice.");
        actor
            .handle_message(
                msg,
                |response| {
                    // A SendError is fine here. The caller just did not wait
                    // for our response and dropped its Receiver channel.
                    let _ = response_tx.send(response);
                },
                ctx,
            )
            .await?;
        Ok(())
    }
}

pub(crate) fn wrap_in_envelope<A, M>(
    msg: M,
    no_advance_time_guard: Option<NoAdvanceTimeGuard>,
) -> (Envelope<A>, oneshot::Receiver<A::Reply>)
where
    A: DeferableReplyHandler<M>,
    M: fmt::Debug + Send + 'static,
{
    let (response_tx, response_rx) = oneshot::channel();
    let handler_envelope = Some((response_tx, msg));
    let envelope = Envelope {
        handler_envelope: Box::new(handler_envelope),
        _no_advance_time_guard: no_advance_time_guard,
    };
    (envelope, response_rx)
}


================================================
FILE: quickwit/quickwit-actors/src/lib.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#![deny(clippy::disallowed_methods)]

//! quickwit-actors is a simplified actor framework for quickwit.
//!
//! It solves the following problem:
//! - have sync and async tasks communicate together.
//! - make these task observable
//! - make these task modular and testable
//! - detect when some task is stuck and does not progress anymore

use std::fmt;
use std::num::NonZeroU64;

use once_cell::sync::Lazy;
use tokio::time::Duration;
mod actor;
mod actor_context;
mod actor_handle;
mod actor_state;
#[doc(hidden)]
pub mod channel_with_priority;
mod command;
mod envelope;
mod mailbox;
mod observation;
mod registry;
pub(crate) mod scheduler;
mod spawn_builder;
mod supervisor;

pub use scheduler::{SchedulerClient, start_scheduler};

#[cfg(test)]
pub(crate) mod tests;
mod universe;

pub use actor::{Actor, ActorExitStatus, DeferableReplyHandler, Handler};
pub use actor_handle::{ActorHandle, Health, Healthz, Supervisable};
pub use command::{Command, Observe};
pub use observation::{Observation, ObservationType};
use quickwit_common::KillSwitch;
pub use spawn_builder::SpawnContext;
use thiserror::Error;
use tracing::{info, warn};
pub use universe::Universe;

pub use self::actor_context::ActorContext;
pub use self::actor_state::ActorState;
pub use self::channel_with_priority::{QueueCapacity, RecvError, SendError, TrySendError};
pub use self::mailbox::{Inbox, Mailbox, WeakMailbox};
pub use self::registry::ActorObservation;
pub use self::supervisor::{Supervisor, SupervisorMetrics, SupervisorState};

/// Heartbeat used to verify that actors are progressing.
///
/// If an actor does not advertise a progress within an interval of duration `HEARTBEAT`,
/// its supervisor will consider it as blocked and will proceed to kill it, as well
/// as all of the actors all the actors that share the killswitch.
pub static HEARTBEAT: Lazy<Duration> = Lazy::new(heartbeat_from_env_or_default);

/// Returns the actor's heartbeat duration:
/// - Derived from `QW_ACTOR_HEARTBEAT_SECS` if set and valid.
/// - Defaults to 30 seconds or 500ms for tests.
fn heartbeat_from_env_or_default() -> Duration {
    if cfg!(any(test, feature = "testsuite")) {
        // Right now some unit test end when we detect that a
        // pipeline has terminated, which can require waiting
        // for a heartbeat.
        //
        // We use a shorter heartbeat to reduce the time running unit tests.
        return Duration::from_millis(500);
    }
    match std::env::var("QW_ACTOR_HEARTBEAT_SECS") {
        Ok(actor_heartbeat_secs_str) => {
            if let Ok(actor_heartbeat_secs) = actor_heartbeat_secs_str.parse::<NonZeroU64>() {
                info!("set the actor heartbeat to {actor_heartbeat_secs} seconds");
                return Duration::from_secs(actor_heartbeat_secs.get());
            } else {
                warn!(
                    "failed to parse `QW_ACTOR_HEARTBEAT_SECS={actor_heartbeat_secs_str}` in \
                     seconds > 0, using default heartbeat (30 seconds)"
                );
            };
        }
        Err(std::env::VarError::NotUnicode(os_str)) => {
            warn!(
                "failed to parse `QW_ACTOR_HEARTBEAT_SECS={os_str:?}` in a valid unicode string, \
                 using default heartbeat (30 seconds)"
            );
        }
        Err(std::env::VarError::NotPresent) => {}
    }
    Duration::from_secs(30)
}

/// Time we accept to wait for a new observation.
///
/// Once this time is elapsed, we just return the last observation.
const OBSERVE_TIMEOUT: Duration = Duration::from_secs(3);

/// Error that occurred while calling `ActorContext::ask(..)` or `Universe::ask`
#[derive(Error, Debug)]
pub enum AskError<E: fmt::Debug> {
    #[error("message could not be delivered")]
    MessageNotDelivered,
    #[error("error while the message was being processed")]
    ProcessMessageError,
    #[error("the handler returned an error: `{0:?}`")]
    ErrorReply(#[from] E),
}


================================================
FILE: quickwit/quickwit-actors/src/mailbox.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::any::Any;
use std::convert::Infallible;
use std::fmt;
use std::sync::atomic::{AtomicUsize, Ordering};
use std::sync::{Arc, OnceLock, Weak};
use std::time::Instant;

use quickwit_common::metrics::{GaugeGuard, IntCounter, IntGauge};
use tokio::sync::oneshot;

use crate::channel_with_priority::{Receiver, Sender, TrySendError};
use crate::envelope::{Envelope, wrap_in_envelope};
use crate::scheduler::SchedulerClient;
use crate::{Actor, AskError, Command, DeferableReplyHandler, QueueCapacity, RecvError, SendError};

/// A mailbox is the object that makes it possible to send a message
/// to an actor.
///
/// It is lightweight to clone.
///
/// The actor holds its `Inbox` counterpart.
///
/// The mailbox can receive high priority and low priority messages.
/// Commands are typically sent as high priority messages, whereas regular
/// actor messages are sent to the low priority channel.
///
/// Whenever a high priority message is available, it is processed
/// before low priority messages.
///
/// If all mailboxes are dropped, the actor will process all of the pending messages
/// and gracefully exit with [`crate::actor::ActorExitStatus::Success`].
pub struct Mailbox<A: Actor> {
    inner: Arc<Inner<A>>,
    // We do not rely on the `Arc:strong_count` here to avoid an intricate
    // race condition. We want to make sure the processing of the `Nudge`
    // message happens AFTER we decrement the refcount.
    ref_count: Arc<AtomicUsize>,
}

impl<A: Actor> Mailbox<A> {
    pub fn downgrade(&self) -> WeakMailbox<A> {
        WeakMailbox {
            inner: Arc::downgrade(&self.inner),
            ref_count: Arc::downgrade(&self.ref_count),
        }
    }
}

impl<A: Actor> Drop for Mailbox<A> {
    fn drop(&mut self) {
        let old_val = self.ref_count.fetch_sub(1, Ordering::SeqCst);
        if old_val == 2 {
            // This was the last mailbox.
            // `ref_count == 1` means that only the mailbox in the ActorContext
            // is remaining.
            let _ = self.send_message_with_high_priority(Command::Nudge);
        }
    }
}

#[derive(Copy, Clone)]
pub(crate) enum Priority {
    High,
    Low,
}

impl<A: Actor> Clone for Mailbox<A> {
    fn clone(&self) -> Self {
        self.ref_count.fetch_add(1, Ordering::SeqCst);
        Mailbox {
            inner: self.inner.clone(),
            ref_count: self.ref_count.clone(),
        }
    }
}

impl<A: Actor> Mailbox<A> {
    pub(crate) fn is_last_mailbox(&self) -> bool {
        self.ref_count.load(Ordering::SeqCst) == 1
    }

    pub fn id(&self) -> &str {
        &self.inner.instance_id
    }

    pub(crate) fn scheduler_client(&self) -> Option<&SchedulerClient> {
        self.inner.scheduler_client_opt.as_ref()
    }
}

struct Inner<A: Actor> {
    pub(crate) tx: Sender<Envelope<A>>,
    scheduler_client_opt: Option<SchedulerClient>,
    instance_id: String,
}

impl<A: Actor> fmt::Debug for Mailbox<A> {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        f.debug_tuple("Mailbox")
            .field(&self.actor_instance_id())
            .finish()
    }
}

impl<A: Actor> Mailbox<A> {
    pub fn actor_instance_id(&self) -> &str {
        &self.inner.instance_id
    }

    pub fn is_disconnected(&self) -> bool {
        self.inner.tx.is_disconnected()
    }

    /// Sends a message to the actor owning the associated inbox.
    ///
    /// From an actor context, use the `ActorContext::send_message` method instead.
    ///
    /// SendError is returned if the actor has already exited.
    pub async fn send_message<M>(
        &self,
        message: M,
    ) -> Result<oneshot::Receiver<A::Reply>, SendError>
    where
        A: DeferableReplyHandler<M>,
        M: fmt::Debug + Send + 'static,
    {
        self.send_message_with_backpressure_counter(message, None)
            .await
    }

    /// Attempts to queue a message in the low priority channel of the mailbox.
    ///
    /// If sending the message would block, the method simply returns `TrySendError::Full(message)`.
    pub fn try_send_message<M>(
        &self,
        message: M,
    ) -> Result<oneshot::Receiver<A::Reply>, TrySendError<M>>
    where
        A: DeferableReplyHandler<M>,
        M: fmt::Debug + Send + 'static,
    {
        let (envelope, response_rx) = self.wrap_in_envelope(message);
        self.inner
            .tx
            .try_send_low_priority(envelope)
            .map_err(|err| {
                match err {
                    TrySendError::Disconnected => TrySendError::Disconnected,
                    TrySendError::Full(mut envelope) => {
                        // We need to un pack the envelope.
                        let message: M = envelope.message_typed().unwrap();
                        TrySendError::Full(message)
                    }
                }
            })?;
        Ok(response_rx)
    }

    fn wrap_in_envelope<M>(&self, message: M) -> (Envelope<A>, oneshot::Receiver<A::Reply>)
    where
        A: DeferableReplyHandler<M>,
        M: fmt::Debug + Send + 'static,
    {
        let guard = self
            .inner
            .scheduler_client_opt
            .as_ref()
            .map(|scheduler_client| scheduler_client.no_advance_time_guard());
        wrap_in_envelope(message, guard)
    }

    /// Sends a message to the actor owning the associated inbox.
    ///
    /// If the actor experiences some backpressure, then
    /// `backpressure_micros` will be increased by the amount of
    /// microseconds of backpressure experienced.
    pub async fn send_message_with_backpressure_counter<M>(
        &self,
        message: M,
        backpressure_micros_counter_opt: Option<&IntCounter>,
    ) -> Result<oneshot::Receiver<A::Reply>, SendError>
    where
        A: DeferableReplyHandler<M>,
        M: fmt::Debug + Send + 'static,
    {
        let (envelope, response_rx) = self.wrap_in_envelope(message);
        match self.inner.tx.try_send_low_priority(envelope) {
            Ok(()) => Ok(response_rx),
            Err(TrySendError::Full(envelope)) => {
                if let Some(backpressure_micros_counter) = backpressure_micros_counter_opt {
                    let now = Instant::now();
                    self.inner.tx.send_low_priority(envelope).await?;
                    let elapsed = now.elapsed();
                    backpressure_micros_counter.inc_by(elapsed.as_micros() as u64);
                } else {
                    self.inner.tx.send_low_priority(envelope).await?;
                }
                Ok(response_rx)
            }
            Err(TrySendError::Disconnected) => Err(SendError::Disconnected),
        }
    }

    pub fn send_message_with_high_priority<M>(
        &self,
        message: M,
    ) -> Result<oneshot::Receiver<A::Reply>, SendError>
    where
        A: DeferableReplyHandler<M>,
        M: fmt::Debug + Send + 'static,
    {
        let (envelope, response_rx) = self.wrap_in_envelope(message);
        self.inner.tx.send_high_priority(envelope)?;
        Ok(response_rx)
    }

    pub(crate) async fn send_message_with_priority<M>(
        &self,
        message: M,
        priority: Priority,
    ) -> Result<oneshot::Receiver<A::Reply>, SendError>
    where
        A: DeferableReplyHandler<M>,
        M: fmt::Debug + Send + 'static,
    {
        let (envelope, response_rx) = self.wrap_in_envelope(message);
        match priority {
            Priority::High => self.inner.tx.send_high_priority(envelope)?,
            Priority::Low => {
                self.inner.tx.send_low_priority(envelope).await?;
            }
        }
        Ok(response_rx)
    }

    /// Similar to `send_message`, except this method
    /// waits asynchronously for the actor reply.
    ///
    /// From an actor context, use the `ActorContext::ask` method instead.
    pub async fn ask<M, T>(&self, message: M) -> Result<T, AskError<Infallible>>
    where
        A: DeferableReplyHandler<M, Reply = T>,
        M: fmt::Debug + Send + 'static,
    {
        self.ask_with_backpressure_counter(message, None).await
    }

    /// Similar to `ask`, but if a backpressure counter is passed,
    /// it increments the amount of time spent in the backpressure.
    ///
    /// The backpressure duration only includes the amount of time
    /// it took to `queue` the request into the actor pipeline.
    ///
    /// It does not include
    /// - the amount spent waiting in the queue,
    /// - the amount spent processing the message.
    ///
    /// From an actor context, use the `ActorContext::ask` method instead.
    pub async fn ask_with_backpressure_counter<M, T>(
        &self,
        message: M,
        backpressure_micros_counter_opt: Option<&IntCounter>,
    ) -> Result<T, AskError<Infallible>>
    where
        A: DeferableReplyHandler<M, Reply = T>,
        M: fmt::Debug + Send + 'static,
    {
        let resp = self
            .send_message_with_backpressure_counter(message, backpressure_micros_counter_opt)
            .await;
        resp.map_err(|_send_error| AskError::MessageNotDelivered)?
            .await
            .map_err(|_| AskError::ProcessMessageError)
    }

    /// Similar to `send_message`, except this method
    /// waits asynchronously for the actor reply.
    ///
    /// From an actor context, use the `ActorContext::ask` method instead.
    pub async fn ask_for_res<M, T, E>(&self, message: M) -> Result<T, AskError<E>>
    where
        A: DeferableReplyHandler<M, Reply = Result<T, E>>,
        M: fmt::Debug + Send + 'static,
        E: fmt::Debug,
    {
        self.send_message(message)
            .await
            .map_err(|_send_error| AskError::MessageNotDelivered)?
            .await
            .map_err(|_| AskError::ProcessMessageError)?
            .map_err(AskError::from)
    }
}

struct InboxInner<A: Actor> {
    rx: Receiver<Envelope<A>>,
    _inboxes_count_gauge_guard: GaugeGuard<'static>,
}

pub struct Inbox<A: Actor> {
    inner: Arc<InboxInner<A>>,
}

impl<A: Actor> Clone for Inbox<A> {
    fn clone(&self) -> Self {
        Inbox {
            inner: self.inner.clone(),
        }
    }
}

impl<A: Actor> Inbox<A> {
    pub(crate) fn is_empty(&self) -> bool {
        self.inner.rx.is_empty()
    }

    pub(crate) async fn recv(&self) -> Result<Envelope<A>, RecvError> {
        self.inner.rx.recv().await
    }

    pub(crate) async fn recv_cmd_and_scheduled_msg_only(&self) -> Envelope<A> {
        self.inner.rx.recv_high_priority().await
    }

    pub(crate) fn try_recv(&self) -> Result<Envelope<A>, RecvError> {
        self.inner.rx.try_recv()
    }

    #[cfg(any(test, feature = "testsuite"))]
    pub async fn recv_typed_message<M: 'static>(&self) -> Result<M, RecvError> {
        loop {
            match self.inner.rx.recv().await {
                Ok(mut envelope) => {
                    if let Some(msg) = envelope.message_typed() {
                        return Ok(msg);
                    }
                }
                Err(err) => {
                    return Err(err);
                }
            }
        }
    }

    /// Destroys the inbox and returns the list of pending messages or commands
    /// in the low priority channel.
    ///
    /// Warning this iterator might never be exhausted if there is a living
    /// mailbox associated to it.
    pub fn drain_for_test(&self) -> Vec<Box<dyn Any>> {
        self.inner
            .rx
            .drain_low_priority()
            .into_iter()
            .map(|mut envelope| envelope.message())
            .collect()
    }

    /// Destroys the inbox and returns the list of pending messages or commands
    /// in the low priority channel.
    ///
    /// Warning this iterator might never be exhausted if there is a living
    /// mailbox associated to it.
    pub fn drain_for_test_typed<M: 'static>(&self) -> Vec<M> {
        self.inner
            .rx
            .drain_low_priority()
            .into_iter()
            .flat_map(|mut envelope| envelope.message_typed())
            .collect()
    }
}

fn get_actor_inboxes_count_gauge_guard() -> GaugeGuard<'static> {
    static INBOX_GAUGE: std::sync::OnceLock<IntGauge> = OnceLock::new();
    let gauge = INBOX_GAUGE.get_or_init(|| {
        quickwit_common::metrics::new_gauge(
            "inboxes_count",
            "overall count of actors",
            "actor",
            &[],
        )
    });
    let mut gauge_guard = GaugeGuard::from_gauge(gauge);
    gauge_guard.add(1);
    gauge_guard
}

pub(crate) fn create_mailbox<A: Actor>(
    actor_name: String,
    queue_capacity: QueueCapacity,
    scheduler_client_opt: Option<SchedulerClient>,
) -> (Mailbox<A>, Inbox<A>) {
    let (tx, rx) = crate::channel_with_priority::channel(queue_capacity);
    let ref_count = Arc::new(AtomicUsize::new(1));
    let mailbox = Mailbox {
        inner: Arc::new(Inner {
            tx,
            instance_id: quickwit_common::new_coolid(&actor_name),
            scheduler_client_opt,
        }),
        ref_count,
    };
    let inner = InboxInner {
        rx,
        _inboxes_count_gauge_guard: get_actor_inboxes_count_gauge_guard(),
    };
    let inbox = Inbox {
        inner: Arc::new(inner),
    };
    (mailbox, inbox)
}

pub struct WeakMailbox<A: Actor> {
    inner: Weak<Inner<A>>,
    ref_count: Weak<AtomicUsize>,
}

impl<A: Actor> Clone for WeakMailbox<A> {
    fn clone(&self) -> Self {
        Self {
            inner: self.inner.clone(),
            ref_count: self.ref_count.clone(),
        }
    }
}

impl<A: Actor> WeakMailbox<A> {
    pub fn upgrade(&self) -> Option<Mailbox<A>> {
        let inner = self.inner.upgrade()?;
        let ref_count = self.ref_count.upgrade()?;
        ref_count.fetch_add(1, Ordering::SeqCst);
        Some(Mailbox { inner, ref_count })
    }
}

#[cfg(test)]
mod tests {
    use std::mem;
    use std::time::Duration;

    use super::*;
    use crate::tests::{Ping, PingReceiverActor};
    use crate::{ActorContext, ActorExitStatus, Handler, Universe};

    #[tokio::test]
    async fn test_weak_mailbox_downgrade_upgrade() {
        let universe = Universe::with_accelerated_time();
        let (mailbox, _inbox) = universe.create_test_mailbox::<PingReceiverActor>();
        let weak_mailbox = mailbox.downgrade();
        assert!(weak_mailbox.upgrade().is_some());
    }

    #[tokio::test]
    async fn test_weak_mailbox_failing_upgrade() {
        let universe = Universe::with_accelerated_time();
        let (mailbox, _inbox) = universe.create_test_mailbox::<PingReceiverActor>();
        let weak_mailbox = mailbox.downgrade();
        drop(mailbox);
        assert!(weak_mailbox.upgrade().is_none());
    }

    struct BackPressureActor;

    impl Actor for BackPressureActor {
        type ObservableState = ();

        fn observable_state(&self) -> Self::ObservableState {}

        fn queue_capacity(&self) -> QueueCapacity {
            QueueCapacity::Bounded(0)
        }

        fn yield_after_each_message(&self) -> bool {
            false
        }
    }

    use async_trait::async_trait;

    #[async_trait]
    impl Handler<Duration> for BackPressureActor {
        type Reply = ();

        async fn handle(
            &mut self,
            sleep_duration: Duration,
            _ctx: &ActorContext<Self>,
        ) -> Result<(), ActorExitStatus> {
            if !sleep_duration.is_zero() {
                tokio::time::sleep(sleep_duration).await;
            }
            Ok(())
        }
    }

    #[tokio::test]
    async fn test_mailbox_send_with_backpressure_counter_low_backpressure() {
        let universe = Universe::with_accelerated_time();
        let back_pressure_actor = BackPressureActor;
        let (mailbox, _handle) = universe.spawn_builder().spawn(back_pressure_actor);
        // We send a first message to make sure the actor has been properly spawned and is listening
        // for new messages.
        mailbox
            .ask_with_backpressure_counter(Duration::default(), None)
            .await
            .unwrap();
        // At this point the actor was started and even processed a message entirely.
        let backpressure_micros_counter =
            IntCounter::new("test_counter", "help for test_counter").unwrap();
        let wait_duration = Duration::from_millis(1);
        let processed = mailbox
            .send_message_with_backpressure_counter(
                wait_duration,
                Some(&backpressure_micros_counter),
            )
            .await
            .unwrap();
        assert!(backpressure_micros_counter.get() < 500);
        processed.await.unwrap();
        assert!(backpressure_micros_counter.get() < 500);
        universe.assert_quit().await;
    }

    #[tokio::test]
    async fn test_mailbox_send_with_backpressure_counter_backpressure() {
        let universe = Universe::with_accelerated_time();
        let back_pressure_actor = BackPressureActor;
        let (mailbox, _handle) = universe.spawn_builder().spawn(back_pressure_actor);
        // We send a first message to make sure the actor has been properly spawned and is listening
        // for new messages.
        mailbox
            .ask_with_backpressure_counter(Duration::default(), None)
            .await
            .unwrap();
        let backpressure_micros_counter =
            IntCounter::new("test_counter", "help for test_counter").unwrap();
        let wait_duration = Duration::from_millis(1);
        mailbox
            .send_message_with_backpressure_counter(
                wait_duration,
                Some(&backpressure_micros_counter),
            )
            .await
            .unwrap();
        // That second message will present some backpressure, since the capacity is 0 and
        // the first message will take 1000 micros to be processed.
        mailbox
            .send_message_with_backpressure_counter(
                Duration::default(),
                Some(&backpressure_micros_counter),
            )
            .await
            .unwrap();
        assert!(backpressure_micros_counter.get() > 1_000u64);
        universe.assert_quit().await;
    }

    #[tokio::test]
    async fn test_mailbox_waiting_for_processing_does_not_counter_as_backpressure() {
        let universe = Universe::with_accelerated_time();
        let back_pressure_actor = BackPressureActor;
        let (mailbox, _handle) = universe.spawn_builder().spawn(back_pressure_actor);
        mailbox
            .ask_with_backpressure_counter(Duration::default(), None)
            .await
            .unwrap();
        let backpressure_micros_counter =
            IntCounter::new("test_counter", "help for test_counter").unwrap();
        let start = Instant::now();
        mailbox
            .ask_with_backpressure_counter(Duration::from_millis(1), None)
            .await
            .unwrap();
        let elapsed = start.elapsed();
        assert!(elapsed.as_micros() > 1000);
        assert_eq!(backpressure_micros_counter.get(), 0);
        universe.assert_quit().await;
    }

    #[tokio::test]
    async fn test_try_send() {
        let universe = Universe::with_accelerated_time();
        let (mailbox, _inbox) = universe
            .create_mailbox::<PingReceiverActor>("hello".to_string(), QueueCapacity::Bounded(1));
        assert!(mailbox.try_send_message(Ping).is_ok());
        assert!(matches!(
            mailbox.try_send_message(Ping).unwrap_err(),
            TrySendError::Full(Ping)
        ));
    }

    #[tokio::test]
    async fn test_try_send_disconnect() {
        let universe = Universe::with_accelerated_time();
        let (mailbox, inbox) = universe
            .create_mailbox::<PingReceiverActor>("hello".to_string(), QueueCapacity::Bounded(1));
        assert!(mailbox.try_send_message(Ping).is_ok());
        mem::drop(inbox);
        assert!(matches!(
            mailbox.try_send_message(Ping).unwrap_err(),
            TrySendError::Disconnected
        ));
    }

    #[tokio::test]
    async fn test_weak_mailbox_ref_count() {
        let universe = Universe::with_accelerated_time();
        let (mailbox, _inbox) = universe
            .create_mailbox::<PingReceiverActor>("hello".to_string(), QueueCapacity::Bounded(1));
        assert!(mailbox.is_last_mailbox());
        let weak_mailbox = mailbox.downgrade();
        let second_mailbox = weak_mailbox.upgrade().unwrap();
        assert!(!mailbox.is_last_mailbox());
        drop(second_mailbox);
        assert!(mailbox.is_last_mailbox());
    }
}


================================================
FILE: quickwit/quickwit-actors/src/observation.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::fmt;
use std::ops::Deref;

#[derive(Debug)]
pub struct Observation<ObservableState> {
    pub obs_type: ObservationType,
    pub state: ObservableState,
}

impl<ObservableState> Deref for Observation<ObservableState> {
    type Target = ObservableState;

    fn deref(&self) -> &Self::Target {
        &self.state
    }
}

// Describes the actual outcome of observation.
#[derive(Clone, Copy, Debug, Eq, PartialEq)]
pub enum ObservationType {
    /// The actor is alive and was able to snapshot its state within `HEARTBEAT`
    Alive,
    /// An observation could not be made with HEARTBEAT, because
    /// the actor had too much work. In that case, in a best effort fashion, the
    /// last observed state is returned. The actor will still update its state,
    /// as soon as it has finished processing the current message.
    Timeout,
    /// The actor has exited. The post-mortem state is joined.
    PostMortem,
}

impl<State: fmt::Debug + PartialEq> PartialEq for Observation<State> {
    fn eq(&self, other: &Self) -> bool {
        self.obs_type.eq(&other.obs_type) && self.state.eq(&other.state)
    }
}

impl<State: fmt::Debug + PartialEq + Eq> Eq for Observation<State> {}


================================================
FILE: quickwit/quickwit-actors/src/registry.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::any::{Any, TypeId};
use std::collections::HashMap;
use std::pin::Pin;
use std::sync::{Arc, RwLock};
use std::time::Duration;

use async_trait::async_trait;
use futures::future::{self, Shared};
use futures::{Future, FutureExt};
use serde::Serialize;
use serde_json::Value as JsonValue;
use tokio::task::JoinHandle;

use crate::command::Observe;
use crate::mailbox::WeakMailbox;
use crate::{Actor, ActorExitStatus, Command, Mailbox};

struct TypedJsonObservable<A: Actor> {
    actor_instance_id: String,
    weak_mailbox: WeakMailbox<A>,
    join_handle: ActorJoinHandle,
}

#[async_trait]
trait JsonObservable: Sync + Send {
    fn is_disconnected(&self) -> bool;
    fn any(&self) -> &dyn Any;
    fn actor_instance_id(&self) -> &str;
    async fn observe(&self) -> Option<JsonValue>;
    async fn quit(&self) -> ActorExitStatus;
    async fn join(&self) -> ActorExitStatus;
}

#[async_trait]
impl<A: Actor> JsonObservable for TypedJsonObservable<A> {
    fn is_disconnected(&self) -> bool {
        self.weak_mailbox
            .upgrade()
            .map(|mailbox| mailbox.is_disconnected())
            .unwrap_or(true)
    }
    fn any(&self) -> &dyn Any {
        &self.weak_mailbox
    }
    fn actor_instance_id(&self) -> &str {
        self.actor_instance_id.as_str()
    }
    async fn observe(&self) -> Option<JsonValue> {
        let mailbox = self.weak_mailbox.upgrade()?;
        let oneshot_rx = mailbox.send_message_with_high_priority(Observe).ok()?;
        let state: <A as Actor>::ObservableState = oneshot_rx.await.ok()?;
        serde_json::to_value(&state).ok()
    }

    async fn quit(&self) -> ActorExitStatus {
        if let Some(mailbox) = self.weak_mailbox.upgrade() {
            let _ = mailbox.send_message_with_high_priority(Command::Quit);
        }
        self.join().await
    }

    async fn join(&self) -> ActorExitStatus {
        self.join_handle.join().await
    }
}

#[derive(Default, Clone)]
pub(crate) struct ActorRegistry {
    actors: Arc<RwLock<HashMap<TypeId, ActorRegistryForSpecificType>>>,
}

struct ActorRegistryForSpecificType {
    type_name: &'static str,
    observables: Vec<Arc<dyn JsonObservable>>,
}

impl ActorRegistryForSpecificType {
    fn for_type<A>() -> ActorRegistryForSpecificType {
        ActorRegistryForSpecificType {
            type_name: std::any::type_name::<A>(),
            observables: Vec::new(),
        }
    }

    fn gc(&mut self) {
        let mut i = 0;
        while i < self.observables.len() {
            if self.observables[i].is_disconnected() {
                self.observables.swap_remove(i);
            } else {
                i += 1;
            }
        }
    }
}

#[derive(Serialize, Debug)]
pub struct ActorObservation {
    pub type_name: &'static str,
    pub instance_id: String,
    pub obs: Option<JsonValue>,
}

impl ActorRegistry {
    pub fn register<A: Actor>(&self, mailbox: &Mailbox<A>, join_handle: ActorJoinHandle) {
        let typed_id = TypeId::of::<A>();
        let actor_instance_id = mailbox.actor_instance_id().to_string();
        let weak_mailbox = mailbox.downgrade();
        self.actors
            .write()
            .unwrap()
            .entry(typed_id)
            .or_insert_with(|| ActorRegistryForSpecificType::for_type::<A>())
            .observables
            .push(Arc::new(TypedJsonObservable {
                weak_mailbox,
                actor_instance_id,
                join_handle,
            }));
    }

    pub async fn observe(&self, timeout: Duration) -> Vec<ActorObservation> {
        self.gc();
        let mut obs_futures = Vec::new();
        for registry_for_type in self.actors.read().unwrap().values() {
            for obs in &registry_for_type.observables {
                if obs.is_disconnected() {
                    continue;
                }
                let obs_clone = obs.clone();
                let type_name = registry_for_type.type_name;
                let instance_id = obs.actor_instance_id().to_string();
                obs_futures.push(async move {
                    let obs = tokio::time::timeout(timeout, obs_clone.observe())
                        .await
                        .unwrap_or(None);
                    ActorObservation {
                        type_name,
                        instance_id,
                        obs,
                    }
                });
            }
        }
        future::join_all(obs_futures.into_iter()).await
    }

    pub fn get<A: Actor>(&self) -> Vec<Mailbox<A>> {
        let mut lock = self.actors.write().unwrap();
        get_iter::<A>(&mut lock).collect()
    }

    pub fn get_one<A: Actor>(&self) -> Option<Mailbox<A>> {
        let mut lock = self.actors.write().unwrap();
        get_iter::<A>(&mut lock).next()
    }

    fn gc(&self) {
        for registry_for_type in self.actors.write().unwrap().values_mut() {
            registry_for_type.gc();
        }
    }

    pub async fn quit(&self) -> HashMap<String, ActorExitStatus> {
        let mut obs_futures = Vec::new();
        let mut actor_ids = Vec::new();
        for registry_for_type in self.actors.read().unwrap().values() {
            for obs in &registry_for_type.observables {
                let obs_clone = obs.clone();
                obs_futures.push(async move { obs_clone.quit().await });
                actor_ids.push(obs.actor_instance_id().to_string());
            }
        }
        let res = future::join_all(obs_futures).await;
        actor_ids.into_iter().zip(res).collect()
    }

    pub fn is_empty(&self) -> bool {
        self.actors
            .read()
            .unwrap()
            .values()
            .all(|registry_for_type| {
                registry_for_type
                    .observables
                    .iter()
                    .all(|obs| obs.is_disconnected())
            })
    }
}

fn get_iter<A: Actor>(
    actors: &mut HashMap<TypeId, ActorRegistryForSpecificType>,
) -> impl Iterator<Item = Mailbox<A>> + '_ {
    let typed_id = TypeId::of::<A>();
    actors
        .get(&typed_id)
        .into_iter()
        .flat_map(|registry_for_type| {
            registry_for_type
                .observables
                .iter()
                .flat_map(|box_any| box_any.any().downcast_ref::<WeakMailbox<A>>())
                .flat_map(|weak_mailbox| weak_mailbox.upgrade())
        })
        .filter(|mailbox| !mailbox.is_disconnected())
}

/// This structure contains an optional exit handle. The handle is present
/// until the join() method is called.
#[derive(Clone)]
pub(crate) struct ActorJoinHandle {
    holder: Shared<Pin<Box<dyn Future<Output = ActorExitStatus> + Send>>>,
}

impl ActorJoinHandle {
    pub(crate) fn new(join_handle: JoinHandle<ActorExitStatus>) -> Self {
        ActorJoinHandle {
            holder: Self::inner_join(join_handle).boxed().shared(),
        }
    }

    async fn inner_join(join_handle: JoinHandle<ActorExitStatus>) -> ActorExitStatus {
        join_handle.await.unwrap_or_else(|join_err| {
            if join_err.is_panic() {
                ActorExitStatus::Panicked
            } else {
                ActorExitStatus::Killed
            }
        })
    }

    /// Joins the actor and returns its exit status on the first invocation.
    /// Returns None afterwards.
    pub(crate) async fn join(&self) -> ActorExitStatus {
        self.holder.clone().await
    }
}

#[cfg(test)]
mod tests {
    use std::time::Duration;

    use crate::Universe;
    use crate::tests::PingReceiverActor;

    #[tokio::test]
    async fn test_registry() {
        let test_actor = PingReceiverActor::default();
        let universe = Universe::with_accelerated_time();
        let (_mailbox, _handle) = universe.spawn_builder().spawn(test_actor);
        let _actor_mailbox = universe.get_one::<PingReceiverActor>().unwrap();
        universe.assert_quit().await;
    }

    #[tokio::test]
    async fn test_registry_killed_actor() {
        let test_actor = PingReceiverActor::default();
        let universe = Universe::with_accelerated_time();
        let (_mailbox, handle) = universe.spawn_builder().spawn(test_actor);
        handle.kill().await;
        assert!(universe.get_one::<PingReceiverActor>().is_none());
    }

    #[tokio::test]
    async fn test_registry_last_mailbox_dropped_actor() {
        let test_actor = PingReceiverActor::default();
        let universe = Universe::with_accelerated_time();
        let (mailbox, handle) = universe.spawn_builder().spawn(test_actor);
        drop(mailbox);
        handle.join().await;
        assert!(universe.get_one::<PingReceiverActor>().is_none());
    }

    #[tokio::test]
    async fn test_get_actor_states() {
        let test_actor = PingReceiverActor::default();
        let universe = Universe::with_accelerated_time();
        let (_mailbox, _handle) = universe.spawn_builder().spawn(test_actor);
        let obs = universe.observe(Duration::from_millis(1000)).await;
        assert_eq!(obs.len(), 1);
        universe.assert_quit().await;
    }
}


================================================
FILE: quickwit/quickwit-actors/src/scheduler.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::cmp::Reverse;
use std::collections::BinaryHeap;
use std::collections::binary_heap::PeekMut;
use std::future::Future;
use std::sync::atomic::{AtomicBool, AtomicUsize, Ordering};
use std::sync::{Arc, Weak};
use std::time::{Duration, Instant};

use quickwit_common::spawn_named_task;
use tokio::sync::oneshot;
use tokio::task::JoinHandle;

type Callback = Box<dyn FnOnce() + Sync + Send + 'static>;

struct TimeoutEvent {
    deadline: Instant,
    event_id: u64, //< only useful to break ties in a deterministic way.
    callback: Callback,
}

impl PartialEq for TimeoutEvent {
    fn eq(&self, other: &Self) -> bool {
        self.event_id == other.event_id
    }
}

impl Eq for TimeoutEvent {}

impl PartialOrd for TimeoutEvent {
    fn partial_cmp(&self, other: &Self) -> Option<std::cmp::Ordering> {
        Some(self.cmp(other))
    }
}

impl Ord for TimeoutEvent {
    fn cmp(&self, other: &Self) -> std::cmp::Ordering {
        self.deadline
            .cmp(&other.deadline)
            .then_with(|| self.event_id.cmp(&other.event_id))
    }
}

enum SchedulerMessage {
    ProcessTime,
    Schedule {
        callback: Callback,
        timeout: Duration,
    },
}

#[derive(Clone)]
pub struct SchedulerClient {
    inner: Arc<SchedulerClientInner>,
}

struct SchedulerClientInner {
    no_advance_time_guard_count: AtomicUsize,
    accelerate_time: AtomicBool,
    tx: flume::Sender<SchedulerMessage>,
}

impl SchedulerClient {
    /// Returns true if someone asked for the time to be accelerated.
    fn time_is_accelerated(&self) -> bool {
        self.inner.accelerate_time.load(Ordering::Relaxed)
    }

    /// Returns true if something is preventing for accelerating the time.
    fn is_advance_time_forbidden(&self) -> bool {
        self.inner
            .no_advance_time_guard_count
            .load(Ordering::SeqCst)
            > 0
    }

    /// Schedules a new event.
    /// Once `timeout` is elapsed, the future `fut` is
    /// executed.
    ///
    /// `fut` will be executed in the scheduler task, so it is
    /// required to be short.
    pub fn schedule_event<F: FnOnce() + Send + Sync + 'static>(
        &self,
        callback: F,
        timeout: Duration,
    ) {
        let _ = self.inner.tx.send(SchedulerMessage::Schedule {
            callback: Box::new(callback),
            timeout,
        });
    }

    // Increases the number of reasons to not simulate advance time.
    pub(crate) fn inc_no_advance_time(&self) {
        self.inner
            .no_advance_time_guard_count
            .fetch_add(1, Ordering::SeqCst);
    }

    // Decrease the number of reasons to not simulate advance time.
    //
    // If the number reaches 0, we trigger a `timeout`.
    pub(crate) fn dec_no_advance_time(&self) {
        let previous_count = self
            .inner
            .no_advance_time_guard_count
            .fetch_sub(1, Ordering::SeqCst);
        if previous_count == 1 {
            self.process_time();
        }
    }

    /// Switch accelerated time mode for the scheduler.
    ///
    /// The scheduler will jump in time whenever there are no more `NoAdvanceInTimeGuard`.
    pub fn accelerate_time(&self) {
        self.inner.accelerate_time.store(true, Ordering::Relaxed);
        self.process_time();
    }

    pub async fn sleep(&self, duration: Duration) {
        let (oneshot_tx, oneshot_rx) = oneshot::channel();
        self.schedule_event(
            move || {
                let _ = oneshot_tx.send(());
            },
            duration,
        );
        let _ = oneshot_rx.await;
    }

    pub async fn timeout<O>(
        &self,
        duration: Duration,
        fut: impl Future<Output = O>,
    ) -> Result<O, ()> {
        tokio::select! {
            _ = self.sleep(duration) => {
                Err(())
            },
            future_output = fut => {
                Ok(future_output)
            }
        }
    }

    // Triggers an event, telling the Scheduler to process time,
    // checks whether some scheduled events have timed out, or whether we should
    // jump forward in time.
    pub(crate) fn process_time(&self) {
        let _ = self.inner.tx.send(SchedulerMessage::ProcessTime);
    }

    /// Returns a `NoAdvanceTimeGuard` which calls `inc_no_advance_time`
    /// on `NoAdvanceTimeGuard::new` and `dec_no_advance_time` when dropped.
    pub fn no_advance_time_guard(&self) -> NoAdvanceTimeGuard {
        NoAdvanceTimeGuard::new(self.clone())
    }
}

pub struct NoAdvanceTimeGuard {
    scheduler_client: SchedulerClient,
}

impl NoAdvanceTimeGuard {
    fn new(scheduler_client: SchedulerClient) -> Self {
        scheduler_client.inc_no_advance_time();
        NoAdvanceTimeGuard { scheduler_client }
    }
}

impl Drop for NoAdvanceTimeGuard {
    fn drop(&mut self) {
        self.scheduler_client.dec_no_advance_time();
    }
}

pub fn start_scheduler() -> SchedulerClient {
    let (tx, rx) = flume::unbounded::<SchedulerMessage>();
    let scheduler_client = SchedulerClient {
        inner: Arc::new(SchedulerClientInner {
            no_advance_time_guard_count: AtomicUsize::default(),
            accelerate_time: Default::default(),
            tx,
        }),
    };
    let mut scheduler = Scheduler::new(&scheduler_client);
    spawn_named_task(
        async move {
            while let Ok(scheduler_message) = rx.recv_async().await {
                match scheduler_message {
                    SchedulerMessage::ProcessTime => scheduler.process_time(),
                    SchedulerMessage::Schedule { callback, timeout } => {
                        scheduler.process_schedule(callback, timeout);
                    }
                }
            }
        },
        "scheduler",
    );
    scheduler_client
}

struct Scheduler {
    // We attribute an event_id to all event just to break ties
    // if two events are scheduled on the same time.
    event_id_generator: u64,
    // Simulated time shift which defines the scheduler time reference as `simulated_time =
    // Instant::now() + simulated_time_shift`. By default `simulated_time_shift` is set to 0
    // but it can be shifted when the scheduler has to process a simulate sleep event`.
    simulated_time_shift: Duration,
    future_events: BinaryHeap<Reverse<TimeoutEvent>>,
    next_timeout: Option<JoinHandle<()>>,
    weak_scheduler_client: Weak<SchedulerClientInner>,
}

impl Scheduler {
    /// Processes "time".
    ///
    /// This :
    /// - identifies all events that are elapsed and execute their callback,
    /// - advance time if necessary
    /// - schedule a message to make sure process_time is called in time for the next event.
    fn process_time(&mut self) {
        let now = self.simulated_now();
        // Pops all elapsed events and executes the associated callback.
        while let Some(next_event_peek) = self.future_events.peek_mut() {
            if next_event_peek.0.deadline > now {
                // The next event is out of scope.
                break;
            }
            let next_event = PeekMut::pop(next_event_peek);
            (next_event.0.callback)();
        }

        // If the condition to accelerate time are met, we can
        // advance time and jump straight to the next timeout.
        self.advance_time_if_necessary();
        self.schedule_next_timeout();
    }

    /// Schedules a new event.
    fn process_schedule(&mut self, callback: Callback, timeout: Duration) {
        let new_evt_deadline = self.simulated_now() + timeout;
        let timeout_event = self.timeout_event(new_evt_deadline, callback);
        self.future_events.push(Reverse(timeout_event));
        self.process_time();
    }

    fn scheduler_client(&self) -> Option<SchedulerClient> {
        let scheduler_client = SchedulerClient {
            inner: self.weak_scheduler_client.upgrade()?,
        };
        Some(scheduler_client)
    }

    /// Schedules a Timeout event callback if necessary.
    fn schedule_next_timeout(&mut self) {
        let Some(scheduler_client) = self.scheduler_client() else {
            return;
        };
        let simulated_now = self.simulated_now();
        let Some(next_deadline) = self.next_event_deadline() else {
            return;
        };
        let timeout: Duration = if next_deadline <= simulated_now {
            // This should almost never happen, because we supposedly triggered
            // all pending events.
            //
            // But time has advanced as we were calling the different callbacks
            // so it is actually possible.
            Duration::default()
        } else {
            next_deadline - simulated_now
        };
        if let Some(previous_join_handle) = self.next_timeout.take() {
            // The next event timeout is about to change. Let's cancel the previous
            // scheduled event.
            previous_join_handle.abort();
        }
        let new_join_handle: JoinHandle<()> = tokio::task::spawn(async move {
            if timeout.is_zero() {
                tokio::task::yield_now().await;
            } else {
                tokio::time::sleep(timeout).await;
            }
            scheduler_client.process_time();
        });
        self.next_timeout = Some(new_join_handle);
    }
}

impl Scheduler {
    pub fn new(scheduler_client: &SchedulerClient) -> Self {
        Scheduler {
            event_id_generator: 0u64,
            simulated_time_shift: Duration::default(),
            future_events: Default::default(),
            next_timeout: None,
            weak_scheduler_client: Arc::downgrade(&scheduler_client.inner),
        }
    }

    /// Updates the simulated time shift, if appropriate.
    ///
    /// We advance time if:
    /// - someone is actually requesting for a simulated fast forward in time. (if
    ///   Universe::simulate_time_shift(..) has been called).
    /// - no message is queued for processing, no initialize or no finalize is being processed.
    fn advance_time_if_necessary(&mut self) {
        let Some(scheduler_client) = self.scheduler_client() else {
            return;
        };
        if !scheduler_client.time_is_accelerated() {
            return;
        }
        if scheduler_client.is_advance_time_forbidden() {
            return;
        }
        let Some(advance_to_instant) = self.next_event_deadline() else {
            return;
        };
        let now = self.simulated_now();
        if let Some(time_shift) = advance_to_instant.checked_duration_since(now) {
            self.simulated_time_shift += time_shift;
        }
    }

    fn next_event_deadline(&self) -> Option<Instant> {
        self.future_events.peek().map(|rev| rev.0.deadline)
    }

    fn simulated_now(&self) -> Instant {
        Instant::now() + self.simulated_time_shift
    }

    fn timeout_event(&mut self, deadline: Instant, callback: Callback) -> TimeoutEvent {
        let event_id = self.event_id_generator;
        self.event_id_generator += 1;
        TimeoutEvent {
            deadline,
            event_id,
            callback,
        }
    }
}

#[cfg(test)]
mod tests {
    use std::sync::Arc;
    use std::sync::atomic::{AtomicUsize, Ordering};
    use std::time::{Duration, Instant};

    use async_trait::async_trait;

    use crate::{Actor, ActorContext, ActorExitStatus, Handler, Universe};

    struct ClockActor {
        count: Arc<AtomicUsize>,
    }

    #[derive(Debug)]
    struct Tick;

    #[async_trait]
    impl Actor for ClockActor {
        type ObservableState = ();
        fn observable_state(&self) -> Self::ObservableState {}

        async fn initialize(&mut self, ctx: &ActorContext<Self>) -> Result<(), ActorExitStatus> {
            self.handle(Tick, ctx).await
        }
    }

    #[async_trait]
    impl Handler<Tick> for ClockActor {
        type Reply = ();

        async fn handle(
            &mut self,
            _tick: Tick,
            ctx: &ActorContext<Self>,
        ) -> Result<(), ActorExitStatus> {
            self.count.fetch_add(1, Ordering::SeqCst);
            ctx.schedule_self_msg(Duration::from_secs(1), Tick);
            Ok(())
        }
    }

    #[tokio::test]
    async fn test_scheduler_advance_time_fast_forward_initialize() {
        quickwit_common::setup_logging_for_tests();
        let count: Arc<AtomicUsize> = Default::default();
        let simple_actor = ClockActor {
            count: count.clone(),
        };
        let universe = Universe::with_accelerated_time();
        universe.spawn_builder().spawn(simple_actor);
        assert_eq!(count.load(Ordering::SeqCst), 0);
        universe.sleep(Duration::from_millis(15)).await;
        assert_eq!(count.load(Ordering::SeqCst), 1);
        universe.assert_quit().await;
    }

    #[tokio::test]
    async fn test_scheduler_advance_time_fast_forward_scheduled_message() {
        let start = Instant::now();
        quickwit_common::setup_logging_for_tests();
        let count: Arc<AtomicUsize> = Default::default();
        let simple_actor = ClockActor {
            count: count.clone(),
        };
        let universe = Universe::with_accelerated_time();
        universe.spawn_builder().spawn(simple_actor);
        assert_eq!(count.load(Ordering::SeqCst), 0);
        universe.sleep(Duration::from_secs(10)).await;
        assert_eq!(count.load(Ordering::SeqCst), 10);
        let elapsed = start.elapsed();
        // The whole point is to accelerate time.
        assert!(elapsed.as_millis() < 50);
        universe.assert_quit().await;
    }
}


================================================
FILE: quickwit/quickwit-actors/src/spawn_builder.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::fmt;
use std::time::Duration;

use anyhow::Context;
use quickwit_common::metrics::IntCounter;
use sync_wrapper::SyncWrapper;
use tokio::sync::watch;
use tracing::{debug, error, info};

use crate::envelope::Envelope;
use crate::mailbox::{Inbox, create_mailbox};
use crate::registry::{ActorJoinHandle, ActorRegistry};
use crate::scheduler::{NoAdvanceTimeGuard, SchedulerClient};
use crate::supervisor::Supervisor;
use crate::{
    Actor, ActorContext, ActorExitStatus, ActorHandle, KillSwitch, Mailbox, QueueCapacity,
};

#[derive(Clone)]
pub struct SpawnContext {
    pub(crate) scheduler_client: SchedulerClient,
    pub(crate) kill_switch: KillSwitch,
    pub(crate) registry: ActorRegistry,
}

impl SpawnContext {
    pub fn new(scheduler_client: SchedulerClient) -> Self {
        SpawnContext {
            scheduler_client,
            kill_switch: Default::default(),
            registry: ActorRegistry::default(),
        }
    }

    pub fn spawn_builder<A: Actor>(&self) -> SpawnBuilder<A> {
        SpawnBuilder::new(self.child_context())
    }

    pub fn create_mailbox<A: Actor>(
        &self,
        actor_name: impl ToString,
        queue_capacity: QueueCapacity,
    ) -> (Mailbox<A>, Inbox<A>) {
        create_mailbox(
            actor_name.to_string(),
            queue_capacity,
            Some(self.scheduler_client.clone()),
        )
    }

    pub fn child_context(&self) -> SpawnContext {
        SpawnContext {
            scheduler_client: self.scheduler_client.clone(),
            kill_switch: self.kill_switch.child(),
            registry: self.registry.clone(),
        }
    }

    /// Schedules a new event.
    /// Once `timeout` is elapsed, the future `fut` is
    /// executed.
    ///
    /// `fut` will be executed in the scheduler task, so it is
    /// required to be short.
    pub fn schedule_event<F: FnOnce() + Send + Sync + 'static>(
        &self,
        callback: F,
        timeout: Duration,
    ) {
        self.scheduler_client.schedule_event(callback, timeout)
    }
}

/// `SpawnBuilder` makes it possible to configure misc parameters before spawning an actor.
#[derive(Clone)]
pub struct SpawnBuilder<A: Actor> {
    spawn_ctx: SpawnContext,
    #[allow(clippy::type_complexity)]
    mailboxes: Option<(Mailbox<A>, Inbox<A>)>,
    backpressure_micros_counter_opt: Option<IntCounter>,
}

impl<A: Actor> SpawnBuilder<A> {
    pub(crate) fn new(spawn_ctx: SpawnContext) -> Self {
        SpawnBuilder {
            spawn_ctx,
            mailboxes: None,
            backpressure_micros_counter_opt: None,
        }
    }

    /// Sets a specific kill switch for the actor.
    ///
    /// By default, the kill switch is inherited from the context that was used to
    /// spawn the actor.
    pub fn set_kill_switch(mut self, kill_switch: KillSwitch) -> Self {
        self.spawn_ctx.kill_switch = kill_switch;
        self
    }

    /// Sets a specific set of mailbox.
    ///
    /// By default, a brand new set of mailboxes will be created
    /// when the actor is spawned.
    ///
    /// This function makes it possible to create non-DAG networks
    /// of actors.
    pub fn set_mailboxes(mut self, mailbox: Mailbox<A>, inbox: Inbox<A>) -> Self {
        self.mailboxes = Some((mailbox, inbox));
        self
    }

    /// Adds a counter to track the amount of time the actor is
    /// spending in "backpressure".
    ///
    /// When using `.ask` the amount of time counted may be misleading.
    /// (See `Mailbox::ask_with_backpressure_counter` for more details)
    pub fn set_backpressure_micros_counter(
        mut self,
        backpressure_micros_counter: IntCounter,
    ) -> Self {
        self.backpressure_micros_counter_opt = Some(backpressure_micros_counter);
        self
    }

    fn take_or_create_mailboxes(&mut self, actor: &A) -> (Mailbox<A>, Inbox<A>) {
        if let Some((mailbox, inbox)) = self.mailboxes.take() {
            return (mailbox, inbox);
        }
        let actor_name = actor.name();
        let queue_capacity = actor.queue_capacity();
        self.spawn_ctx.create_mailbox(actor_name, queue_capacity)
    }

    fn create_actor_context_and_inbox(
        mut self,
        actor: &A,
    ) -> (
        ActorContext<A>,
        Inbox<A>,
        watch::Receiver<A::ObservableState>,
    ) {
        let (mailbox, inbox) = self.take_or_create_mailboxes(actor);
        let obs_state = actor.observable_state();
        let (state_tx, state_rx) = watch::channel(obs_state);
        let ctx = ActorContext::new(
            mailbox,
            self.spawn_ctx.clone(),
            state_tx,
            self.backpressure_micros_counter_opt,
        );
        (ctx, inbox, state_rx)
    }

    /// Spawns an async actor.
    pub fn spawn(self, actor: A) -> (Mailbox<A>, ActorHandle<A>) {
        // We prevent fast forward of the scheduler during  initialization.
        let no_advance_time_guard = self.spawn_ctx.scheduler_client.no_advance_time_guard();
        let runtime_handle = actor.runtime_handle();
        let (ctx, inbox, state_rx) = self.create_actor_context_and_inbox(&actor);
        debug!(actor_id = %ctx.actor_instance_id(), "spawn-actor");
        let mailbox = ctx.mailbox().clone();
        let ctx_clone = ctx.clone();
        let loop_async_actor_future =
            async move { actor_loop(actor, inbox, no_advance_time_guard, ctx).await };
        let join_handle = ActorJoinHandle::new(quickwit_common::spawn_named_task_on(
            loop_async_actor_future,
            std::any::type_name::<A>(),
            &runtime_handle,
        ));
        ctx_clone.registry().register(&mailbox, join_handle.clone());
        let actor_handle = ActorHandle::new(state_rx, join_handle, ctx_clone);
        (mailbox, actor_handle)
    }

    pub fn supervise_fn<F: Fn() -> A + Send + 'static>(
        mut self,
        actor_factory: F,
    ) -> (Mailbox<A>, ActorHandle<Supervisor<A>>) {
        let actor = actor_factory();
        let actor_name = actor.name();
        let (mailbox, inbox) = self.take_or_create_mailboxes(&actor);
        self.mailboxes = Some((mailbox, inbox.clone()));
        let child_ctx = self.spawn_ctx.child_context();
        let parent_spawn_ctx = std::mem::replace(&mut self.spawn_ctx, child_ctx);
        let (mailbox, actor_handle) = self.spawn(actor);
        let supervisor = Supervisor::new(actor_name, Box::new(actor_factory), inbox, actor_handle);
        let (_supervisor_mailbox, supervisor_handle) =
            parent_spawn_ctx.spawn_builder().spawn(supervisor);
        (mailbox, supervisor_handle)
    }
}

impl<A: Actor + Clone> SpawnBuilder<A> {
    pub fn supervise(self, actor: A) -> (Mailbox<A>, ActorHandle<Supervisor<A>>) {
        self.supervise_fn(move || actor.clone())
    }
}

impl<A: Actor + Default> SpawnBuilder<A> {
    pub fn supervise_default(self) -> (Mailbox<A>, ActorHandle<Supervisor<A>>) {
        self.supervise_fn(Default::default)
    }
}

enum ActorExitPhase {
    Initializing,
    Handling { message: &'static str },
    Running,
    OnDrainedMessaged,
    Completed,
}

impl fmt::Debug for ActorExitPhase {
    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
        match self {
            ActorExitPhase::Initializing => write!(f, "initializing"),
            ActorExitPhase::Handling { message } => write!(f, "handling({message})"),
            ActorExitPhase::Running => write!(f, "running"),
            ActorExitPhase::OnDrainedMessaged => write!(f, "on_drained_messages"),
            ActorExitPhase::Completed => write!(f, "completed"),
        }
    }
}

/// Receives an envelope from either the high priority queue or the low priority queue.
///
/// In the paused state, the actor will only attempt to receive high priority messages.
///
/// If no message is available, this function will yield until a message arrives.
/// If a high priority message is arrives first it is guaranteed to be processed first.
/// This other way around is however not guaranteed.
async fn recv_envelope<A: Actor>(inbox: &mut Inbox<A>, ctx: &ActorContext<A>) -> Envelope<A> {
    if ctx.state().is_running() {
        ctx.protect_future(inbox.recv()).await.expect(
            "Disconnection should be impossible because the ActorContext holds a Mailbox too",
        )
    } else {
        // The actor is paused. We only process command and scheduled message.
        ctx.protect_future(inbox.recv_cmd_and_scheduled_msg_only())
            .await
    }
}

fn try_recv_envelope<A: Actor>(inbox: &mut Inbox<A>) -> Option<Envelope<A>> {
    inbox.try_recv().ok()
}

struct ActorExecutionEnv<A: Actor> {
    actor: SyncWrapper<A>,
    inbox: Inbox<A>,
    ctx: ActorContext<A>,
}

impl<A: Actor> ActorExecutionEnv<A> {
    async fn initialize(&mut self) -> Result<(), ActorExitStatus> {
        self.actor.get_mut().initialize(&self.ctx).await
    }

    async fn process_messages(&mut self) -> (ActorExitStatus, ActorExitPhase) {
        loop {
            if let Err((exit_status, exit_phase)) = self.process_all_available_messages().await {
                return (exit_status, exit_phase);
            }
        }
    }

    async fn process_one_message(
        &mut self,
        mut envelope: Envelope<A>,
    ) -> Result<(), (ActorExitStatus, ActorExitPhase)> {
        self.yield_and_check_if_killed().await?;
        envelope
            .handle_message(self.actor.get_mut(), &self.ctx)
            .await
            .map_err(|(exit_status, message)| {
                (exit_status, ActorExitPhase::Handling { message })
            })?;
        Ok(())
    }

    async fn yield_and_check_if_killed(&mut self) -> Result<(), (ActorExitStatus, ActorExitPhase)> {
        if self.ctx.kill_switch().is_dead() {
            return Err((ActorExitStatus::Killed, ActorExitPhase::Running));
        }
        if self.actor.get_mut().yield_after_each_message() {
            self.ctx.yield_now().await;
            if self.ctx.kill_switch().is_dead() {
                return Err((ActorExitStatus::Killed, ActorExitPhase::Running));
            }
        } else {
            self.ctx.record_progress();
        }
        Ok(())
    }

    async fn process_all_available_messages(
        &mut self,
    ) -> Result<(), (ActorExitStatus, ActorExitPhase)> {
        self.yield_and_check_if_killed().await?;
        let envelope = recv_envelope(&mut self.inbox, &self.ctx).await;
        self.process_one_message(envelope).await?;
        // If the actor is Running (not Paused), we consume all the messages in the mailbox
        // and call `on_drained_message`.
        if self.ctx.state().is_running() {
            loop {
                while let Some(envelope) = try_recv_envelope(&mut self.inbox) {
                    self.process_one_message(envelope).await?;
                }
                // We have reached the last message.
                // Let's still yield and see if we have more messages:
                // an upstream actor might have experienced backpressure, and is now waiting for our
                // mailbox to have some room.
                self.ctx.yield_now().await;
                if self.inbox.is_empty() {
                    break;
                }
            }
            self.actor
                .get_mut()
                .on_drained_messages(&self.ctx)
                .await
                .map_err(|exit_status| (exit_status, ActorExitPhase::OnDrainedMessaged))?;
        }
        if self.ctx.mailbox().is_last_mailbox() {
            // We double check here that the mailbox does not contain any messages,
            // as someone on different runtime thread could have added a last message
            // and dropped the last mailbox right before this block.
            // See #4248
            if self.inbox.is_empty() {
                // No one will be able to send us more messages.
                // We can exit the actor.
                return Err((ActorExitStatus::Success, ActorExitPhase::Completed));
            }
        }

        Ok(())
    }

    async fn finalize(&mut self, exit_status: ActorExitStatus) -> ActorExitStatus {
        let _no_advance_time_guard = self
            .ctx
            .mailbox()
            .scheduler_client()
            .map(|scheduler_client| scheduler_client.no_advance_time_guard());
        if let Err(finalize_error) = self
            .actor
            .get_mut()
            .finalize(&exit_status, &self.ctx)
            .await
            .with_context(|| format!("finalization of actor {}", self.actor.get_mut().name()))
        {
            error!(error=?finalize_error, "finalizing failed, set exit status to panicked");
            return ActorExitStatus::Panicked;
        }
        exit_status
    }
}

impl<A: Actor> Drop for ActorExecutionEnv<A> {
    // We rely on this object internally to fetch a post-mortem state,
    // even in case of a panic.
    fn drop(&mut self) {
        self.ctx.observe(self.actor.get_mut());
    }
}

async fn actor_loop<A: Actor>(
    actor: A,
    inbox: Inbox<A>,
    no_advance_time_guard: NoAdvanceTimeGuard,
    ctx: ActorContext<A>,
) -> ActorExitStatus {
    let mut actor_env = ActorExecutionEnv {
        actor: SyncWrapper::new(actor),
        inbox,
        ctx,
    };

    let initialize_exit_status_res: Result<(), ActorExitStatus> = actor_env.initialize().await;
    drop(no_advance_time_guard);

    let (after_process_exit_status, exit_phase) =
        if let Err(initialize_exit_status) = initialize_exit_status_res {
            // We do not process messages if initialize yield an error.
            // We still call finalize however!
            (initialize_exit_status, ActorExitPhase::Initializing)
        } else {
            actor_env.process_messages().await
        };

    let actor_id = actor_env.ctx.actor_instance_id();
    match after_process_exit_status {
        ActorExitStatus::Success
        | ActorExitStatus::Quit
        | ActorExitStatus::DownstreamClosed
        | ActorExitStatus::Killed => {
            info!(actor_id, phase = ?exit_phase, exit_status = ?after_process_exit_status, "actor-exit");
        }
        ActorExitStatus::Failure(_) | ActorExitStatus::Panicked => {
            error!(actor_id, phase = ?exit_phase, exit_status = ?after_process_exit_status, "actor-exit");
        }
    };

    // TODO the no advance time guard for finalize has a race condition. Ideally we would
    // like to have the guard before we drop the last envelope.
    let final_exit_status = actor_env.finalize(after_process_exit_status).await;
    // The last observation is collected on `ActorExecutionEnv::Drop`.
    actor_env.ctx.exit(&final_exit_status);
    final_exit_status
}


================================================
FILE: quickwit/quickwit-actors/src/supervisor.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use async_trait::async_trait;
use serde::Serialize;
use tracing::{info, warn};

use crate::mailbox::Inbox;
use crate::{Actor, ActorContext, ActorExitStatus, ActorHandle, Handler, Health, Supervisable};

#[derive(Debug, Clone, Copy, Default, Eq, PartialEq, Serialize)]
pub struct SupervisorMetrics {
    pub num_panics: usize,
    pub num_errors: usize,
    pub num_kills: usize,
}

#[derive(Debug, Clone, Eq, PartialEq, Serialize)]
pub struct SupervisorState<S> {
    pub metrics: SupervisorMetrics,
    pub state_opt: Option<S>,
}

impl<S> Default for SupervisorState<S> {
    fn default() -> Self {
        SupervisorState {
            metrics: Default::default(),
            state_opt: None,
        }
    }
}

pub struct Supervisor<A: Actor> {
    actor_name: String,
    actor_factory: Box<dyn Fn() -> A + Send>,
    inbox: Inbox<A>,
    handle_opt: Option<ActorHandle<A>>,
    metrics: SupervisorMetrics,
}

#[derive(Debug, Copy, Clone)]
struct SuperviseLoop;

#[async_trait]
impl<A: Actor> Actor for Supervisor<A> {
    type ObservableState = SupervisorState<A::ObservableState>;

    fn observable_state(&self) -> Self::ObservableState {
        let state_opt: Option<A::ObservableState> = self
            .handle_opt
            .as_ref()
            .map(|handle| handle.last_observation().clone());
        SupervisorState {
            metrics: self.metrics,
            state_opt,
        }
    }

    fn name(&self) -> String {
        format!("Supervisor({})", self.actor_name)
    }

    fn queue_capacity(&self) -> crate::QueueCapacity {
        crate::QueueCapacity::Unbounded
    }

    async fn initialize(&mut self, ctx: &ActorContext<Self>) -> Result<(), ActorExitStatus> {
        ctx.schedule_self_msg(*crate::HEARTBEAT, SuperviseLoop);
        Ok(())
    }

    async fn finalize(
        &mut self,
        exit_status: &ActorExitStatus,
        _ctx: &ActorContext<Self>,
    ) -> anyhow::Result<()> {
        match exit_status {
            ActorExitStatus::Quit => {
                if let Some(handle) = self.handle_opt.take() {
                    handle.quit().await;
                }
            }
            ActorExitStatus::Killed => {
                if let Some(handle) = self.handle_opt.take() {
                    handle.kill().await;
                }
            }
            ActorExitStatus::Failure(_)
            | ActorExitStatus::Success
            | ActorExitStatus::DownstreamClosed => {}
            ActorExitStatus::Panicked => {}
        }

        Ok(())
    }
}

impl<A: Actor> Supervisor<A> {
    pub(crate) fn new(
        actor_name: String,
        actor_factory: Box<dyn Fn() -> A + Send>,
        inbox: Inbox<A>,
        handle: ActorHandle<A>,
    ) -> Self {
        Supervisor {
            actor_name,
            actor_factory,
            inbox,
            handle_opt: Some(handle),
            metrics: Default::default(),
        }
    }

    async fn supervise(
        &mut self,
        ctx: &ActorContext<Supervisor<A>>,
    ) -> Result<(), ActorExitStatus> {
        let handle_ref = self
            .handle_opt
            .as_ref()
            .expect("The actor handle should always be set.");
        match handle_ref.check_health(true) {
            Health::Healthy => {
                handle_ref.refresh_observe();
                return Ok(());
            }
            Health::FailureOrUnhealthy => {}
            Health::Success => {
                return Err(ActorExitStatus::Success);
            }
        }
        warn!("unhealthy-actor");
        // The actor is failing we need to restart it.
        let actor_handle = self.handle_opt.take().unwrap();
        let actor_mailbox = actor_handle.mailbox().clone();
        let (actor_exit_status, _last_state) = if !actor_handle.state().is_exit() {
            // The actor is probably frozen.
            // Let's kill it.
            warn!("killing");
            actor_handle.kill().await
        } else {
            actor_handle.join().await
        };
        match actor_exit_status {
            ActorExitStatus::Success => {
                return Err(ActorExitStatus::Success);
            }
            ActorExitStatus::Quit => {
                return Err(ActorExitStatus::Quit);
            }
            ActorExitStatus::DownstreamClosed => {
                return Err(ActorExitStatus::DownstreamClosed);
            }
            ActorExitStatus::Killed => {
                self.metrics.num_kills += 1;
            }
            ActorExitStatus::Failure(_err) => {
                self.metrics.num_errors += 1;
            }
            ActorExitStatus::Panicked => {
                self.metrics.num_panics += 1;
            }
        }
        info!("respawning-actor");
        let (_, actor_handle) = ctx
            .spawn_actor()
            .set_mailboxes(actor_mailbox, self.inbox.clone())
            .set_kill_switch(ctx.kill_switch().child())
            .spawn((*self.actor_factory)());
        self.handle_opt = Some(actor_handle);
        Ok(())
    }
}

#[async_trait]
impl<A: Actor> Handler<SuperviseLoop> for Supervisor<A> {
    type Reply = ();

    async fn handle(
        &mut self,
        _msg: SuperviseLoop,
        ctx: &ActorContext<Self>,
    ) -> Result<Self::Reply, ActorExitStatus> {
        self.supervise(ctx).await?;
        ctx.schedule_self_msg(*crate::HEARTBEAT, SuperviseLoop);
        Ok(())
    }
}

#[cfg(test)]
mod tests {
    use std::time::Duration;

    use async_trait::async_trait;
    use tracing::info;

    use crate::supervisor::SupervisorMetrics;
    use crate::tests::{Ping, PingReceiverActor};
    use crate::{Actor, ActorContext, ActorExitStatus, AskError, Handler, Observe, Universe};

    #[derive(Copy, Clone, Debug)]
    enum FailingActorMessage {
        Panic,
        ReturnError,
        Increment,
        Freeze(Duration),
    }

    #[derive(Default, Clone)]
    struct FailingActor {
        counter: usize,
    }

    #[async_trait]
    impl Actor for FailingActor {
        type ObservableState = usize;

        fn name(&self) -> String {
            "FailingActor".to_string()
        }

        fn observable_state(&self) -> Self::ObservableState {
            self.counter
        }

        async fn finalize(
            &mut self,
            _exit_status: &ActorExitStatus,
            _ctx: &ActorContext<Self>,
        ) -> anyhow::Result<()> {
            info!("finalize-failing-actor");
            Ok(())
        }
    }

    #[async_trait]
    impl Handler<FailingActorMessage> for FailingActor {
        type Reply = usize;

        async fn handle(
            &mut self,
            msg: FailingActorMessage,
            ctx: &ActorContext<Self>,
        ) -> Result<Self::Reply, ActorExitStatus> {
            match msg {
                FailingActorMessage::Panic => {
                    panic!("Failing actor panicked");
                }
                FailingActorMessage::ReturnError => {
                    return Err(ActorExitStatus::from(anyhow::anyhow!(
                        "failing actor error"
                    )));
                }
                FailingActorMessage::Increment => {
                    self.counter += 1;
                }
                FailingActorMessage::Freeze(wait_duration) => {
                    ctx.sleep(wait_duration).await;
                }
            }
            Ok(self.counter)
        }
    }

    #[tokio::test]
    async fn test_supervisor_restart_on_panic() {
        quickwit_common::setup_logging_for_tests();
        let universe = Universe::with_accelerated_time();
        let actor = FailingActor::default();
        let (mailbox, supervisor_handle) = universe.spawn_builder().supervise(actor);
        assert_eq!(
            mailbox.ask(FailingActorMessage::Increment).await.unwrap(),
            1
        );
        assert_eq!(
            mailbox.ask(FailingActorMessage::Increment).await.unwrap(),
            2
        );
        assert!(mailbox.ask(FailingActorMessage::Panic).await.is_err());
        assert_eq!(
            mailbox.ask(FailingActorMessage::Increment).await.unwrap(),
            1
        );
        assert_eq!(
            supervisor_handle.observe().await.metrics,
            SupervisorMetrics {
                num_panics: 1,
                num_errors: 0,
                num_kills: 0
            }
        );
        assert!(!matches!(
            supervisor_handle.quit().await.0,
            ActorExitStatus::Panicked
        ));
    }

    #[tokio::test]
    async fn test_supervisor_restart_on_error() {
        let universe = Universe::with_accelerated_time();
        let actor = FailingActor::default();
        let (mailbox, supervisor_handle) = universe.spawn_builder().supervise(actor);
        assert_eq!(
            mailbox.ask(FailingActorMessage::Increment).await.unwrap(),
            1
        );
        assert_eq!(
            mailbox.ask(FailingActorMessage::Increment).await.unwrap(),
            2
        );
        assert!(mailbox.ask(FailingActorMessage::ReturnError).await.is_err());
        assert_eq!(
            mailbox.ask(FailingActorMessage::Increment).await.unwrap(),
            1
        );
        assert_eq!(
            supervisor_handle.observe().await.metrics,
            SupervisorMetrics {
                num_panics: 0,
                num_errors: 1,
                num_kills: 0
            }
        );
        assert!(!matches!(
            supervisor_handle.quit().await.0,
            ActorExitStatus::Panicked
        ));
    }

    #[tokio::test]
    async fn test_supervisor_kills_and_restart_frozen_actor() {
        let universe = Universe::with_accelerated_time();
        let actor = FailingActor::default();
        let (mailbox, supervisor_handle) = universe.spawn_builder().supervise(actor);
        assert_eq!(
            mailbox.ask(FailingActorMessage::Increment).await.unwrap(),
            1
        );
        assert_eq!(
            mailbox.ask(FailingActorMessage::Increment).await.unwrap(),
            2
        );
        assert_eq!(
            supervisor_handle.observe().await.metrics,
            SupervisorMetrics {
                num_panics: 0,
                num_errors: 0,
                num_kills: 0
            }
        );
        mailbox
            .send_message(FailingActorMessage::Freeze(
                crate::HEARTBEAT.mul_f32(3.0f32),
            ))
            .await
            .unwrap();
        assert_eq!(
            mailbox.ask(FailingActorMessage::Increment).await.unwrap(),
            1
        );
        assert_eq!(
            supervisor_handle.observe().await.metrics,
            SupervisorMetrics {
                num_panics: 0,
                num_errors: 0,
                num_kills: 1
            }
        );
        assert!(!matches!(
            supervisor_handle.quit().await.0,
            ActorExitStatus::Panicked
        ));
    }

    #[tokio::test]
    async fn test_supervisor_forwards_quit_commands() {
        let universe = Universe::with_accelerated_time();
        let actor = FailingActor::default();
        let (mailbox, supervisor_handle) = universe.spawn_builder().supervise(actor);
        assert_eq!(
            mailbox.ask(FailingActorMessage::Increment).await.unwrap(),
            1
        );
        let (exit_status, _state) = supervisor_handle.quit().await;
        assert!(matches!(
            mailbox
                .ask(FailingActorMessage::Increment)
                .await
                .unwrap_err(),
            AskError::MessageNotDelivered
        ));
        assert!(matches!(exit_status, ActorExitStatus::Quit));
    }

    #[tokio::test]
    async fn test_supervisor_forwards_kill_command() {
        quickwit_common::setup_logging_for_tests();
        let universe = Universe::with_accelerated_time();
        let actor = FailingActor::default();
        let (mailbox, supervisor_handle) = universe.spawn_builder().supervise(actor);
        assert_eq!(
            mailbox.ask(FailingActorMessage::Increment).await.unwrap(),
            1
        );
        let (exit_status, _state) = supervisor_handle.kill().await;
        assert!(mailbox.ask(FailingActorMessage::Increment).await.is_err());
        assert!(matches!(
            mailbox
                .ask(FailingActorMessage::Increment)
                .await
                .unwrap_err(),
            AskError::MessageNotDelivered
        ));
        assert!(matches!(exit_status, ActorExitStatus::Killed));
    }

    #[tokio::test]
    async fn test_supervisor_exits_successfully_when_supervised_actor_mailbox_is_dropped() {
        quickwit_common::setup_logging_for_tests();
        let universe = Universe::with_accelerated_time();
        let actor = FailingActor::default();
        let (_, supervisor_handle) = universe.spawn_builder().supervise(actor);
        let (exit_status, _state) = supervisor_handle.join().await;
        assert!(matches!(exit_status, ActorExitStatus::Success));
        universe.assert_quit().await;
    }

    #[tokio::test]
    async fn test_supervisor_state() {
        quickwit_common::setup_logging_for_tests();
        let universe = Universe::with_accelerated_time();
        let ping_actor = PingReceiverActor::default();
        let (mailbox, handler) = universe.spawn_builder().supervise(ping_actor);
        let obs = handler.observe().await;
        assert_eq!(obs.state.state_opt, Some(0));
        let _ = mailbox.ask(Ping).await;
        assert_eq!(mailbox.ask(Observe).await.unwrap(), 1);
        universe.sleep(Duration::from_secs(60)).await;
        let obs = handler.observe().await;
        assert_eq!(obs.state.state_opt, Some(1));
        handler.quit().await;
        universe.assert_quit().await;
    }
}


================================================
FILE: quickwit/quickwit-actors/src/tests.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::cell::Cell;
use std::collections::HashMap;
use std::ops::Mul;
use std::time::Duration;

use async_trait::async_trait;
use quickwit_common::new_coolid;
use serde::Serialize;

use crate::observation::ObservationType;
use crate::{
    Actor, ActorContext, ActorExitStatus, ActorHandle, ActorState, Command, Handler, Health,
    Mailbox, Observation, Supervisable, Universe,
};

// An actor that receives ping messages.
#[derive(Default, Clone)]
pub struct PingReceiverActor {
    ping_count: usize,
}

impl Actor for PingReceiverActor {
    type ObservableState = usize;

    fn name(&self) -> String {
        "Ping".to_string()
    }

    fn observable_state(&self) -> Self::ObservableState {
        self.ping_count
    }
}

#[derive(Debug)]
pub struct Ping;

#[async_trait]
impl Handler<Ping> for PingReceiverActor {
    type Reply = ();

    async fn handle(
        &mut self,
        _message: Ping,
        ctx: &ActorContext<Self>,
    ) -> Result<(), ActorExitStatus> {
        self.ping_count += 1;
        assert_eq!(ctx.state(), ActorState::Running);
        Ok(())
    }
}

#[derive(Default)]
pub struct PingerSenderActor {
    count: usize,
    peers: HashMap<String, Mailbox<PingReceiverActor>>,
}

#[derive(Clone, Debug, Eq, PartialEq, Serialize)]
pub struct SenderState {
    pub count: usize,
    pub num_peers: usize,
}

#[derive(Clone, Debug)]
pub struct AddPeer(Mailbox<PingReceiverActor>);

impl Actor for PingerSenderActor {
    type ObservableState = SenderState;

    fn name(&self) -> String {
        "PingSender".to_string()
    }

    fn observable_state(&self) -> Self::ObservableState {
        SenderState {
            count: self.count,
            num_peers: self.peers.len(),
        }
    }
}

#[async_trait]
impl Handler<Ping> for PingerSenderActor {
    type Reply = ();

    async fn handle(
        &mut self,
        _message: Ping,
        _ctx: &ActorContext<Self>,
    ) -> Result<(), ActorExitStatus> {
        self.count += 1;
        for peer in self.peers.values() {
            let _ = peer.send_message(Ping).await;
        }
        Ok(())
    }
}

#[async_trait]
impl Handler<AddPeer> for PingerSenderActor {
    type Reply = ();

    async fn handle(
        &mut self,
        message: AddPeer,
        _ctx: &ActorContext<Self>,
    ) -> Result<(), ActorExitStatus> {
        let AddPeer(peer) = message;
        let peer_id = peer.actor_instance_id().to_string();
        self.peers.insert(peer_id, peer);
        Ok(())
    }
}

#[tokio::test]
async fn test_actor_stops_when_last_mailbox_is_dropped() {
    quickwit_common::setup_logging_for_tests();
    let universe = Universe::with_accelerated_time();
    let (ping_recv_mailbox, ping_recv_handle) =
        universe.spawn_builder().spawn(PingReceiverActor::default());
    drop(ping_recv_mailbox);
    let (exit_status, _) = ping_recv_handle.join().await;
    assert!(exit_status.is_success());
}

#[tokio::test]
async fn test_ping_actor() {
    quickwit_common::setup_logging_for_tests();
    let universe = Universe::with_accelerated_time();
    let (ping_recv_mailbox, ping_recv_handle) =
        universe.spawn_builder().spawn(PingReceiverActor::default());
    let (ping_sender_mailbox, ping_sender_handle) =
        universe.spawn_builder().spawn(PingerSenderActor::default());
    assert_eq!(
        ping_recv_handle.observe().await,
        Observation {
            obs_type: ObservationType::Alive,
            state: 0
        }
    );
    // No peers. This one will have no impact.
    let ping_recv_mailbox = ping_recv_mailbox.clone();
    assert!(ping_sender_mailbox.send_message(Ping).await.is_ok());
    assert!(
        ping_sender_mailbox
            .send_message(AddPeer(ping_recv_mailbox.clone()))
            .await
            .is_ok()
    );
    assert_eq!(
        ping_sender_handle.process_pending_and_observe().await,
        Observation {
            obs_type: ObservationType::Alive,
            state: SenderState {
                num_peers: 1,
                count: 1
            }
        }
    );
    assert!(ping_sender_mailbox.send_message(Ping).await.is_ok());
    assert!(ping_sender_mailbox.send_message(Ping).await.is_ok());
    assert_eq!(
        ping_sender_handle.process_pending_and_observe().await,
        Observation {
            obs_type: ObservationType::Alive,
            state: SenderState {
                num_peers: 1,
                count: 3
            }
        }
    );
    assert_eq!(
        ping_recv_handle.process_pending_and_observe().await,
        Observation {
            obs_type: ObservationType::Alive,
            state: 2
        }
    );
    universe.kill();
    assert_eq!(
        ping_recv_handle.process_pending_and_observe().await,
        Observation {
            obs_type: ObservationType::PostMortem,
            state: 2
        }
    );
    assert_eq!(
        ping_sender_handle.process_pending_and_observe().await,
        Observation {
            obs_type: ObservationType::PostMortem,
            state: SenderState {
                num_peers: 1,
                count: 3
            }
        }
    );
    ping_sender_handle.join().await;
    assert!(ping_sender_mailbox.send_message(Ping).await.is_err());
}

struct BuggyActor;

#[derive(Clone, Debug)]
struct DoNothing;

#[derive(Clone, Debug)]
struct Block;

impl Actor for BuggyActor {
    type ObservableState = ();

    fn name(&self) -> String {
        "BuggyActor".to_string()
    }

    fn observable_state(&self) {}
}

#[async_trait]
impl Handler<DoNothing> for BuggyActor {
    type Reply = ();

    async fn handle(
        &mut self,
        _message: DoNothing,
        _ctx: &ActorContext<Self>,
    ) -> Result<(), ActorExitStatus> {
        Ok(())
    }
}

#[async_trait]
impl Handler<Block> for BuggyActor {
    type Reply = ();

    async fn handle(
        &mut self,
        _message: Block,
        ctx: &ActorContext<Self>,
    ) -> Result<(), ActorExitStatus> {
        while ctx.kill_switch().is_alive() {
            tokio::task::yield_now().await;
        }
        Ok(())
    }
}

#[tokio::test]
async fn test_timeouting_actor() {
    let universe = Universe::with_accelerated_time();
    let (buggy_mailbox, buggy_handle) = universe.spawn_builder().spawn(BuggyActor);
    let buggy_mailbox = buggy_mailbox;
    assert_eq!(
        buggy_handle.observe().await.obs_type,
        ObservationType::Alive
    );
    assert!(buggy_mailbox.send_message(DoNothing).await.is_ok());
    assert_eq!(
        buggy_handle.observe().await.obs_type,
        ObservationType::Alive
    );
    assert!(buggy_mailbox.send_message(Block).await.is_ok());

    assert_eq!(buggy_handle.check_health(true), Health::Healthy);
    assert_eq!(
        buggy_handle.process_pending_and_observe().await.obs_type,
        ObservationType::Timeout
    );
    assert_eq!(buggy_handle.check_health(true), Health::Healthy);
    universe.sleep(crate::HEARTBEAT.mul(2)).await;
    assert_eq!(buggy_handle.check_health(true), Health::FailureOrUnhealthy);
    buggy_handle.kill().await;
}

#[tokio::test]
async fn test_pause_actor() {
    quickwit_common::setup_logging_for_tests();
    let universe = Universe::with_accelerated_time();
    let (ping_mailbox, ping_handle) = universe.spawn_builder().spawn(PingReceiverActor::default());
    for _ in 0u32..1000u32 {
        assert!(ping_mailbox.send_message(Ping).await.is_ok());
    }
    assert!(
        ping_mailbox
            .send_message_with_high_priority(Command::Pause)
            .is_ok()
    );
    let first_state = ping_handle.observe().await.state;
    assert!(first_state < 1000);
    let second_state = ping_handle.observe().await.state;
    assert_eq!(first_state, second_state);
    assert!(
        ping_mailbox
            .send_message_with_high_priority(Command::Resume)
            .is_ok()
    );
    let end_state = ping_handle.process_pending_and_observe().await.state;
    assert_eq!(end_state, 1000);
    universe.assert_quit().await;
}

#[tokio::test]
async fn test_actor_running_states() {
    quickwit_common::setup_logging_for_tests();
    let universe = Universe::with_accelerated_time();
    let (ping_mailbox, ping_handle) = universe.spawn_builder().spawn(PingReceiverActor::default());
    assert_eq!(ping_handle.state(), ActorState::Running);
    for _ in 0u32..10u32 {
        assert!(ping_mailbox.send_message(Ping).await.is_ok());
    }
    let obs = ping_handle.process_pending_and_observe().await;
    assert_eq!(*obs, 10);
    universe.sleep(Duration::from_millis(1)).await;
    assert_eq!(ping_handle.state(), ActorState::Running);
    universe.assert_quit().await;
}

#[derive(Clone, Debug, Default, Serialize)]
struct LoopingActor {
    pub loop_count: usize,
    pub single_shot_count: usize,
}

#[derive(Debug)]
struct Loop;

#[derive(Debug)]
struct SingleShot;

#[async_trait]
impl Actor for LoopingActor {
    type ObservableState = Self;

    fn observable_state(&self) -> Self::ObservableState {
        self.clone()
    }

    fn yield_after_each_message(&self) -> bool {
        false
    }

    async fn initialize(&mut self, ctx: &ActorContext<Self>) -> Result<(), ActorExitStatus> {
        self.handle(Loop, ctx).await
    }
}

#[async_trait]
impl Handler<Loop> for LoopingActor {
    type Reply = ();
    async fn handle(
        &mut self,
        _msg: Loop,
        ctx: &ActorContext<Self>,
    ) -> Result<(), ActorExitStatus> {
        self.loop_count += 1;
        ctx.send_self_message(Loop).await?;
        Ok(())
    }
}

#[async_trait]
impl Handler<SingleShot> for LoopingActor {
    type Reply = ();

    async fn handle(
        &mut self,
        _msg: SingleShot,
        _ctx: &ActorContext<Self>,
    ) -> Result<(), ActorExitStatus> {
        self.single_shot_count += 1;
        Ok(())
    }
}

#[tokio::test(flavor = "multi_thread")]
async fn test_looping() -> anyhow::Result<()> {
    let universe = Universe::with_accelerated_time();
    let looping_actor = LoopingActor::default();
    let (looping_actor_mailbox, looping_actor_handle) =
        universe.spawn_builder().spawn(looping_actor);
    assert!(looping_actor_mailbox.send_message(SingleShot).await.is_ok());
    looping_actor_handle.process_pending_and_observe().await;
    let (exit_status, state) = looping_actor_handle.quit().await;
    assert!(matches!(exit_status, ActorExitStatus::Quit));
    assert_eq!(state.single_shot_count, 1);
    assert!(state.loop_count > 0);
    Ok(())
}

#[derive(Default)]
struct SummingActor {
    sum: u64,
}

#[async_trait]
impl Handler<u64> for SummingActor {
    type Reply = ();

    async fn handle(&mut self, add: u64, _ctx: &ActorContext<Self>) -> Result<(), ActorExitStatus> {
        self.sum += add;
        Ok(())
    }
}

impl Actor for SummingActor {
    type ObservableState = u64;

    fn observable_state(&self) -> Self::ObservableState {
        self.sum
    }
}

#[derive(Default)]
struct SpawningActor {
    res: u64,
    handle_opt: Option<(Mailbox<SummingActor>, ActorHandle<SummingActor>)>,
}

#[async_trait]
impl Actor for SpawningActor {
    type ObservableState = u64;

    fn observable_state(&self) -> Self::ObservableState {
        self.res
    }

    async fn finalize(
        &mut self,
        _exit_status: &ActorExitStatus,
        _ctx: &ActorContext<Self>,
    ) -> anyhow::Result<()> {
        if let Some((_, child_handler)) = self.handle_opt.take() {
            self.res = child_handler.process_pending_and_observe().await.state;
            child_handler.kill().await;
        }
        Ok(())
    }
}

#[async_trait]
impl Handler<u64> for SpawningActor {
    type Reply = ();

    async fn handle(
        &mut self,
        message: u64,
        ctx: &ActorContext<Self>,
    ) -> Result<(), ActorExitStatus> {
        let (mailbox, _) = self
            .handle_opt
            .get_or_insert_with(|| ctx.spawn_actor().spawn(SummingActor::default()));
        ctx.send_message(mailbox, message).await?;
        Ok(())
    }
}

#[tokio::test]
async fn test_actor_spawning_actor() -> anyhow::Result<()> {
    let universe = Universe::with_accelerated_time();
    let (mailbox, handle) = universe.spawn_builder().spawn(SpawningActor::default());
    mailbox.send_message(1).await?;
    mailbox.send_message(2).await?;
    mailbox.send_message(3).await?;
    drop(mailbox);
    let (exit, result) = handle.join().await;
    assert!(matches!(exit, ActorExitStatus::Success));
    assert_eq!(result, 6);
    Ok(())
}

struct BuggyFinalizeActor;

#[async_trait]
impl Actor for BuggyFinalizeActor {
    type ObservableState = ();

    fn name(&self) -> String {
        "BuggyFinalizeActor".to_string()
    }

    fn observable_state(&self) {}

    async fn finalize(
        &mut self,
        _exit_status: &ActorExitStatus,
        _: &ActorContext<Self>,
    ) -> anyhow::Result<()> {
        anyhow::bail!("finalize error")
    }
}

#[tokio::test]
async fn test_actor_finalize_error_set_exit_status_to_panicked() -> anyhow::Result<()> {
    let universe = Universe::with_accelerated_time();
    let (mailbox, handle) = universe.spawn_builder().spawn(BuggyFinalizeActor);
    assert!(matches!(handle.state(), ActorState::Running));
    drop(mailbox);
    let (exit, _) = handle.join().await;
    assert!(matches!(exit, ActorExitStatus::Panicked));
    Ok(())
}

#[derive(Default)]
struct Adder(u64);

impl Actor for Adder {
    type ObservableState = u64;

    fn yield_after_each_message(&self) -> bool {
        false
    }

    fn observable_state(&self) -> Self::ObservableState {
        self.0
    }
}

#[derive(Debug)]
struct AddOperand(u64);

#[async_trait]
impl Handler<AddOperand> for Adder {
    type Reply = u64;

    async fn handle(
        &mut self,
        add_op: AddOperand,
        _ctx: &ActorContext<Self>,
    ) -> Result<u64, ActorExitStatus> {
        self.0 += add_op.0;
        Ok(self.0)
    }
}

#[tokio::test]
async fn test_actor_return_response() -> anyhow::Result<()> {
    let universe = Universe::with_accelerated_time();
    let adder = Adder::default();
    let (mailbox, _handle) = universe.spawn_builder().spawn(adder);
    let plus_two = mailbox.send_message(AddOperand(2)).await?;
    let plus_two_plus_four = mailbox.send_message(AddOperand(4)).await?;
    assert_eq!(plus_two.await.unwrap(), 2);
    assert_eq!(plus_two_plus_four.await.unwrap(), 6);
    universe.assert_quit().await;
    Ok(())
}

#[derive(Default)]
struct TestActorWithDrain {
    counts: ProcessAndDrainCounts,
}

#[derive(Clone, Copy, Debug, Default, Eq, PartialEq, Serialize)]
struct ProcessAndDrainCounts {
    process_calls_count: usize,
    drain_calls_count: usize,
}

#[async_trait]
impl Actor for TestActorWithDrain {
    type ObservableState = ProcessAndDrainCounts;

    fn observable_state(&self) -> ProcessAndDrainCounts {
        self.counts
    }

    async fn on_drained_messages(
        &mut self,
        _ctx: &ActorContext<Self>,
    ) -> Result<(), ActorExitStatus> {
        self.counts.drain_calls_count += 1;
        Ok(())
    }
}

#[async_trait]
impl Handler<()> for TestActorWithDrain {
    type Reply = ();

    async fn handle(
        &mut self,
        _message: (),
        _ctx: &ActorContext<Self>,
    ) -> Result<Self::Reply, ActorExitStatus> {
        self.counts.process_calls_count += 1;
        Ok(())
    }
}

#[tokio::test]
async fn test_drain_is_called() {
    quickwit_common::setup_logging_for_tests();
    let universe = Universe::with_accelerated_time();
    let test_actor_with_drain = TestActorWithDrain::default();
    let (mailbox, handle) = universe.spawn_builder().spawn(test_actor_with_drain);
    assert_eq!(
        *handle.process_pending_and_observe().await,
        ProcessAndDrainCounts {
            process_calls_count: 0,
            drain_calls_count: 0
        }
    );
    handle.pause();
    mailbox.send_message(()).await.unwrap();
    mailbox.send_message(()).await.unwrap();
    mailbox.send_message(()).await.unwrap();
    handle.resume();
    universe.sleep(Duration::from_millis(1)).await;
    assert_eq!(
        *handle.process_pending_and_observe().await,
        ProcessAndDrainCounts {
            process_calls_count: 3,
            drain_calls_count: 1
        }
    );
    mailbox.send_message(()).await.unwrap();
    universe.sleep(Duration::from_millis(1)).await;
    assert_eq!(
        *handle.process_pending_and_observe().await,
        ProcessAndDrainCounts {
            process_calls_count: 4,
            drain_calls_count: 2
        }
    );
    universe.assert_quit().await;
}

#[tokio::test]
async fn test_unsync_actor() {
    #[derive(Default)]
    struct UnsyncActor(Cell<u64>);

    impl Actor for UnsyncActor {
        type ObservableState = u64;

        fn observable_state(&self) -> Self::ObservableState {
            self.0.get()
        }
    }

    #[async_trait]
    impl Handler<u64> for UnsyncActor {
        type Reply = u64;

        async fn handle(
            &mut self,
            number: u64,
            _ctx: &ActorContext<Self>,
        ) -> Result<u64, ActorExitStatus> {
            *self.0.get_mut() += number;
            Ok(self.0.get())
        }
    }
    let universe = Universe::with_accelerated_time();
    let unsync_message_actor = UnsyncActor::default();
    let (mailbox, _handle) = universe.spawn_builder().spawn(unsync_message_actor);

    let response = mailbox.ask(1).await.unwrap();
    assert_eq!(response, 1);

    universe.assert_quit().await;
}

#[tokio::test]
async fn test_unsync_actor_message() {
    #[derive(Default)]
    struct UnsyncMessageActor(u64);

    impl Actor for UnsyncMessageActor {
        type ObservableState = u64;

        fn observable_state(&self) -> Self::ObservableState {
            self.0
        }
    }

    #[async_trait]
    impl Handler<Cell<u64>> for UnsyncMessageActor {
        type Reply = anyhow::Result<u64>;

        async fn handle(
            &mut self,
            number: Cell<u64>,
            _ctx: &ActorContext<Self>,
        ) -> Result<anyhow::Result<u64>, ActorExitStatus> {
            self.0 += number.get();
            Ok(Ok(self.0))
        }
    }
    let universe = Universe::with_accelerated_time();
    let unsync_message_actor = UnsyncMessageActor::default();
    let (mailbox, _handle) = universe.spawn_builder().spawn(unsync_message_actor);

    let response_rx = mailbox.send_message(Cell::new(1)).await.unwrap();
    assert_eq!(response_rx.await.unwrap().unwrap(), 1);

    let response = mailbox.ask(Cell::new(1)).await.unwrap().unwrap();
    assert_eq!(response, 2);

    let response = mailbox.ask_for_res(Cell::new(1)).await.unwrap();
    assert_eq!(response, 3);

    let response_rx = mailbox
        .send_message_with_high_priority(Cell::new(1))
        .unwrap();
    assert_eq!(response_rx.await.unwrap().unwrap(), 4);

    let response_rx = mailbox.try_send_message(Cell::new(1)).unwrap();
    assert_eq!(response_rx.await.unwrap().unwrap(), 5);

    universe.assert_quit().await;
}

struct FakeActorService {
    // We use a cool id to make sure in the test that we get twice the same instance.
    cool_id: String,
}

#[derive(Debug)]
struct GetCoolId;

impl Actor for FakeActorService {
    type ObservableState = ();

    fn observable_state(&self) {}
}

#[async_trait]
impl Handler<GetCoolId> for FakeActorService {
    type Reply = String;

    async fn handle(
        &mut self,
        _: GetCoolId,
        _ctx: &ActorContext<Self>,
    ) -> Result<Self::Reply, ActorExitStatus> {
        Ok(self.cool_id.clone())
    }
}

impl Default for FakeActorService {
    fn default() -> Self {
        FakeActorService {
            cool_id: new_coolid("fake-actor"),
        }
    }
}

#[tokio::test]
async fn test_get_or_spawn() {
    let universe = Universe::new();
    let mailbox1: Mailbox<FakeActorService> = universe.get_or_spawn_one();
    let id1 = mailbox1.ask(GetCoolId).await.unwrap();
    let mailbox2: Mailbox<FakeActorService> = universe.get_or_spawn_one();
    let id2 = mailbox2.ask(GetCoolId).await.unwrap();
    assert_eq!(id1, id2);
    universe.assert_quit().await;
}


================================================
FILE: quickwit/quickwit-actors/src/universe.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::HashMap;
use std::thread;
use std::time::Duration;

use crate::mailbox::create_mailbox;
use crate::registry::ActorObservation;
use crate::scheduler::start_scheduler;
use crate::spawn_builder::{SpawnBuilder, SpawnContext};
use crate::{Actor, ActorExitStatus, Command, Inbox, Mailbox, QueueCapacity};

/// Universe serves as the top-level context in which Actor can be spawned.
///
/// It is *not* a singleton. A typical application will usually have only one universe hosting all
/// of the actors but it is not a requirement.
///
/// In particular, unit test all have their own universe and hence can be executed in parallel.
pub struct Universe {
    pub(crate) spawn_ctx: SpawnContext,
}

impl Default for Universe {
    fn default() -> Universe {
        Universe::new()
    }
}

impl Universe {
    /// Creates a new universe.
    pub fn new() -> Universe {
        let scheduler_client = start_scheduler();
        Universe {
            spawn_ctx: SpawnContext::new(scheduler_client),
        }
    }

    /// Creates a universe were time is accelerated.
    ///
    /// Time is accelerated in a way to exhibit a behavior as close as possible
    /// to what would have happened with normal time but faster.
    ///
    /// The time "jumps" only happen when no actor is processing any message,
    /// running initialization or finalize.
    #[cfg(any(test, feature = "testsuite"))]
    pub fn with_accelerated_time() -> Universe {
        let universe = Universe::new();
        universe.spawn_ctx().scheduler_client.accelerate_time();
        universe
    }

    pub fn spawn_ctx(&self) -> &SpawnContext {
        &self.spawn_ctx
    }

    pub fn create_test_mailbox<A: Actor>(&self) -> (Mailbox<A>, Inbox<A>) {
        create_mailbox("test-mailbox".to_string(), QueueCapacity::Unbounded, None)
    }

    pub fn create_mailbox<A: Actor>(
        &self,
        actor_name: impl ToString,
        queue_capacity: QueueCapacity,
    ) -> (Mailbox<A>, Inbox<A>) {
        self.spawn_ctx.create_mailbox(actor_name, queue_capacity)
    }

    pub fn get<A: Actor>(&self) -> Vec<Mailbox<A>> {
        self.spawn_ctx.registry.get::<A>()
    }

    pub fn get_one<A: Actor>(&self) -> Option<Mailbox<A>> {
        self.spawn_ctx.registry.get_one::<A>()
    }

    pub fn get_or_spawn_one<A: Actor + Default>(&self) -> Mailbox<A> {
        if let Some(actor_mailbox) = self.spawn_ctx.registry.get_one::<A>() {
            actor_mailbox
        } else {
            let actor_default = A::default();
            let (mailbox, _handler) = self.spawn_builder().spawn(actor_default);
            mailbox
        }
    }

    pub async fn observe(&self, timeout: Duration) -> Vec<ActorObservation> {
        self.spawn_ctx.registry.observe(timeout).await
    }

    pub fn kill(&self) {
        self.spawn_ctx.kill_switch.kill();
    }

    /// This function acts as a drop-in replacement of
    /// `tokio::time::sleep`.
    ///
    /// It can however be accelerated when using a time-accelerated
    /// universe.
    pub async fn sleep(&self, duration: Duration) {
        self.spawn_ctx.scheduler_client.sleep(duration).await;
    }

    pub fn spawn_builder<A: Actor>(&self) -> SpawnBuilder<A> {
        self.spawn_ctx.spawn_builder()
    }

    /// Inform an actor to process pending message and then stop processing new messages
    /// and exit successfully.
    pub async fn send_exit_with_success<A: Actor>(
        &self,
        mailbox: &Mailbox<A>,
    ) -> Result<(), crate::SendError> {
        mailbox.send_message(Command::ExitWithSuccess).await?;
        Ok(())
    }

    /// Gracefully quits all registered actors.
    pub async fn quit(&self) -> HashMap<String, ActorExitStatus> {
        self.spawn_ctx.registry.quit().await
    }

    /// Gracefully quits all registered actors and asserts that none of them panicked.
    ///
    /// This is useful for testing purposes to detect failed asserts in actors.
    #[cfg(any(test, feature = "testsuite"))]
    pub async fn assert_quit(self) {
        assert!(
            !self
                .quit()
                .await
                .values()
                .any(|status| matches!(status, ActorExitStatus::Panicked))
        );
    }
}

impl Drop for Universe {
    fn drop(&mut self) {
        if cfg!(any(test, feature = "testsuite"))
            && !self.spawn_ctx.registry.is_empty()
            && !thread::panicking()
        {
            panic!(
                "There are still running actors at the end of the test. Did you call \
                 universe.assert_quit()?"
            );
        }
        self.spawn_ctx.kill_switch.kill();
    }
}

#[cfg(test)]
mod tests {
    use core::panic;
    use std::time::Duration;

    use async_trait::async_trait;

    use crate::{Actor, ActorContext, ActorExitStatus, Handler, Universe};

    #[derive(Default)]
    pub struct CountingMinutesActor {
        count: usize,
    }

    #[async_trait]
    impl Actor for CountingMinutesActor {
        type ObservableState = usize;

        fn observable_state(&self) -> usize {
            self.count
        }

        async fn initialize(&mut self, ctx: &ActorContext<Self>) -> Result<(), ActorExitStatus> {
            self.handle(Loop, ctx).await
        }
    }

    #[derive(Debug)]
    struct Loop;

    #[async_trait]
    impl Handler<Loop> for CountingMinutesActor {
        type Reply = ();
        async fn handle(
            &mut self,
            _msg: Loop,
            ctx: &ActorContext<Self>,
        ) -> Result<(), ActorExitStatus> {
            self.count += 1;
            ctx.schedule_self_msg(Duration::from_secs(60), Loop);
            Ok(())
        }
    }

    #[derive(Default)]
    pub struct ExitPanickingActor {}

    #[async_trait]
    impl Actor for ExitPanickingActor {
        type ObservableState = ();

        fn observable_state(&self) -> Self::ObservableState {}
    }

    impl Drop for ExitPanickingActor {
        fn drop(&mut self) {
            panic!("Panicking on drop")
        }
    }

    #[tokio::test]
    async fn test_schedule_for_actor() {
        let universe = Universe::with_accelerated_time();
        let actor_with_schedule = CountingMinutesActor::default();
        let (_mailbox, handler) = universe.spawn_builder().spawn(actor_with_schedule);
        let count_after_initialization = handler.process_pending_and_observe().await.state;
        assert_eq!(count_after_initialization, 1);
        universe.sleep(Duration::from_secs(200)).await;
        let count_after_advance_time = handler.process_pending_and_observe().await.state;
        assert_eq!(count_after_advance_time, 4);
        universe.assert_quit().await;
    }

    #[tokio::test]
    async fn test_actor_quit_after_universe_quit() {
        let universe = Universe::with_accelerated_time();
        let actor_with_schedule = CountingMinutesActor::default();
        let (_mailbox, handler) = universe.spawn_builder().spawn(actor_with_schedule);
        universe.sleep(Duration::from_secs(200)).await;
        let res = universe.quit().await;
        assert_eq!(res.len(), 1);
        assert!(matches!(
            res.values().next().unwrap(),
            ActorExitStatus::Quit
        ));
        assert!(matches!(handler.quit().await, (ActorExitStatus::Quit, 4)));
    }

    #[tokio::test]
    async fn test_universe_join_after_actor_quit() {
        let universe = Universe::default();
        let actor_with_schedule = CountingMinutesActor::default();
        let (_mailbox, handler) = universe.spawn_builder().spawn(actor_with_schedule);
        assert!(matches!(handler.quit().await, (ActorExitStatus::Quit, 1)));
        assert!(
            !universe
                .quit()
                .await
                .values()
                .any(|status| matches!(status, ActorExitStatus::Panicked))
        );
    }

    #[tokio::test]
    async fn test_universe_quit_with_panicking_actor() {
        let universe = Universe::default();
        let panicking_actor = ExitPanickingActor::default();
        let actor_with_schedule = CountingMinutesActor::default();
        let (_mailbox, _handler) = universe.spawn_builder().spawn(panicking_actor);
        let (_mailbox, _handler) = universe.spawn_builder().spawn(actor_with_schedule);
        assert!(
            universe
                .quit()
                .await
                .values()
                .any(|status| matches!(status, ActorExitStatus::Panicked))
        );
    }

    #[tokio::test]
    #[should_panic(
        expected = "There are still running actors at the end of the test. Did you call \
                    universe.assert_quit()?"
    )]
    async fn test_enforce_universe_assert_quit_calls() {
        let universe = Universe::with_accelerated_time();
        let actor_with_schedule = CountingMinutesActor::default();
        let _ = universe.spawn_builder().spawn(actor_with_schedule);
    }
}


================================================
FILE: quickwit/quickwit-aws/Cargo.toml
================================================
[package]
name = "quickwit-aws"
description = "Set up AWS config and clients"

version.workspace = true
edition.workspace = true
homepage.workspace = true
documentation.workspace = true
repository.workspace = true
authors.workspace = true
license.workspace = true

[dependencies]
aws-config = { workspace = true }
aws-runtime = { workspace = true }
aws-sdk-kinesis = { workspace = true, optional = true }
aws-sdk-s3 = { workspace = true }
aws-sdk-sqs = { workspace = true, optional = true }
aws-smithy-async = { workspace = true }
futures = { workspace = true }
tokio = { workspace = true }

quickwit-common = { workspace = true }

[features]
kinesis = ["aws-sdk-kinesis"]
sqs = ["aws-sdk-sqs"]


================================================
FILE: quickwit/quickwit-aws/src/error.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#![allow(clippy::match_like_matches_macro)]

use aws_runtime::retries::classifiers::{THROTTLING_ERRORS, TRANSIENT_ERRORS};
use aws_sdk_s3::error::SdkError;
use aws_sdk_s3::operation::abort_multipart_upload::AbortMultipartUploadError;
use aws_sdk_s3::operation::complete_multipart_upload::CompleteMultipartUploadError;
use aws_sdk_s3::operation::create_multipart_upload::CreateMultipartUploadError;
use aws_sdk_s3::operation::delete_object::DeleteObjectError;
use aws_sdk_s3::operation::delete_objects::DeleteObjectsError;
use aws_sdk_s3::operation::get_object::GetObjectError;
use aws_sdk_s3::operation::head_object::HeadObjectError;
use aws_sdk_s3::operation::put_object::PutObjectError;
use aws_sdk_s3::operation::upload_part::UploadPartError;

use crate::retry::AwsRetryable;

impl<E> AwsRetryable for SdkError<E>
where E: AwsRetryable
{
    fn is_retryable(&self) -> bool {
        match self {
            SdkError::ConstructionFailure(_) => false,
            SdkError::TimeoutError(_) => true,
            SdkError::DispatchFailure(_) => false,
            SdkError::ResponseError(_) => true,
            SdkError::ServiceError(error) => error.err().is_retryable(),
            _ => false,
        }
    }
}

fn is_retryable(meta: &aws_sdk_s3::error::ErrorMetadata) -> bool {
    if let Some(code) = meta.code() {
        THROTTLING_ERRORS.contains(&code)
            || TRANSIENT_ERRORS.contains(&code)
            || code == "InternalError" // this is somehow not considered transient, despite the
    // associated error message containing "Please try again."
    } else {
        false
    }
}

impl AwsRetryable for GetObjectError {
    fn is_retryable(&self) -> bool {
        is_retryable(self.meta())
    }
}

impl AwsRetryable for DeleteObjectError {
    fn is_retryable(&self) -> bool {
        is_retryable(self.meta())
    }
}

impl AwsRetryable for DeleteObjectsError {
    fn is_retryable(&self) -> bool {
        is_retryable(self.meta())
    }
}

impl AwsRetryable for UploadPartError {
    fn is_retryable(&self) -> bool {
        is_retryable(self.meta())
    }
}

impl AwsRetryable for CompleteMultipartUploadError {
    fn is_retryable(&self) -> bool {
        is_retryable(self.meta())
    }
}

impl AwsRetryable for AbortMultipartUploadError {
    fn is_retryable(&self) -> bool {
        is_retryable(self.meta())
    }
}

impl AwsRetryable for CreateMultipartUploadError {
    fn is_retryable(&self) -> bool {
        is_retryable(self.meta())
    }
}

impl AwsRetryable for PutObjectError {
    fn is_retryable(&self) -> bool {
        is_retryable(self.meta())
    }
}

impl AwsRetryable for HeadObjectError {
    fn is_retryable(&self) -> bool {
        is_retryable(self.meta())
    }
}

#[cfg(feature = "kinesis")]
mod kinesis {
    use aws_sdk_kinesis::operation::create_stream::CreateStreamError;
    use aws_sdk_kinesis::operation::delete_stream::DeleteStreamError;
    use aws_sdk_kinesis::operation::describe_stream::DescribeStreamError;
    use aws_sdk_kinesis::operation::get_records::GetRecordsError;
    use aws_sdk_kinesis::operation::get_shard_iterator::GetShardIteratorError;
    use aws_sdk_kinesis::operation::list_shards::ListShardsError;
    use aws_sdk_kinesis::operation::list_streams::ListStreamsError;
    use aws_sdk_kinesis::operation::merge_shards::MergeShardsError;
    use aws_sdk_kinesis::operation::split_shard::SplitShardError;

    use super::*;

    impl AwsRetryable for GetRecordsError {
        fn is_retryable(&self) -> bool {
            match self {
                GetRecordsError::KmsThrottlingException(_) => true,
                GetRecordsError::ProvisionedThroughputExceededException(_) => true,
                _ => false,
            }
        }
    }

    impl AwsRetryable for GetShardIteratorError {
        fn is_retryable(&self) -> bool {
            matches!(
                self,
                GetShardIteratorError::ProvisionedThroughputExceededException(_)
            )
        }
    }

    impl AwsRetryable for ListShardsError {
        fn is_retryable(&self) -> bool {
            matches!(
                self,
                ListShardsError::ResourceInUseException(_)
                    | ListShardsError::LimitExceededException(_)
            )
        }
    }

    impl AwsRetryable for CreateStreamError {
        fn is_retryable(&self) -> bool {
            matches!(
                self,
                CreateStreamError::ResourceInUseException(_)
                    | CreateStreamError::LimitExceededException(_)
            )
        }
    }

    impl AwsRetryable for DeleteStreamError {
        fn is_retryable(&self) -> bool {
            matches!(
                self,
                DeleteStreamError::ResourceInUseException(_)
                    | DeleteStreamError::LimitExceededException(_)
            )
        }
    }

    impl AwsRetryable for DescribeStreamError {
        fn is_retryable(&self) -> bool {
            matches!(self, DescribeStreamError::LimitExceededException(_))
        }
    }

    impl AwsRetryable for ListStreamsError {
        fn is_retryable(&self) -> bool {
            matches!(self, ListStreamsError::LimitExceededException(_))
        }
    }

    impl AwsRetryable for MergeShardsError {
        fn is_retryable(&self) -> bool {
            matches!(
                self,
                MergeShardsError::ResourceInUseException(_)
                    | MergeShardsError::LimitExceededException(_)
            )
        }
    }

    impl AwsRetryable for SplitShardError {
        fn is_retryable(&self) -> bool {
            matches!(
                self,
                SplitShardError::ResourceInUseException(_)
                    | SplitShardError::LimitExceededException(_)
            )
        }
    }
}

#[cfg(feature = "sqs")]
mod sqs {
    use aws_sdk_sqs::operation::change_message_visibility::ChangeMessageVisibilityError;
    use aws_sdk_sqs::operation::delete_message_batch::DeleteMessageBatchError;
    use aws_sdk_sqs::operation::receive_message::ReceiveMessageError;

    use super::*;

    impl AwsRetryable for ReceiveMessageError {
        fn is_retryable(&self) -> bool {
            false
        }
    }

    impl AwsRetryable for DeleteMessageBatchError {
        fn is_retryable(&self) -> bool {
            false
        }
    }

    impl AwsRetryable for ChangeMessageVisibilityError {
        fn is_retryable(&self) -> bool {
            false
        }
    }
}


================================================
FILE: quickwit/quickwit-aws/src/lib.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use aws_config::retry::RetryConfig;
use aws_config::stalled_stream_protection::StalledStreamProtectionConfig;
use aws_config::{BehaviorVersion, Region};
pub use aws_smithy_async::rt::sleep::TokioSleep;
use tokio::sync::OnceCell;

pub mod error;
pub mod retry;

pub const DEFAULT_AWS_REGION: Region = Region::from_static("us-east-1");

/// Initialises and returns the AWS config.
pub async fn get_aws_config() -> &'static aws_config::SdkConfig {
    static SDK_CONFIG: OnceCell<aws_config::SdkConfig> = OnceCell::const_new();

    SDK_CONFIG
        .get_or_init(|| async {
            aws_config::defaults(aws_behavior_version())
                .stalled_stream_protection(StalledStreamProtectionConfig::enabled().build())
                // Currently handle this ourselves so probably best for now to leave it as is.
                .retry_config(RetryConfig::disabled())
                .sleep_impl(TokioSleep::default())
                .load()
                .await
        })
        .await
}

/// Returns the AWS behavior version.
pub fn aws_behavior_version() -> BehaviorVersion {
    BehaviorVersion::v2026_01_12()
}


================================================
FILE: quickwit/quickwit-aws/src/retry.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::fmt::Debug;

use futures::{Future, TryFutureExt};
use quickwit_common::retry::{
    Retry, RetryParams, Retryable, TokioSleep, retry_with_mockable_sleep,
};

pub trait AwsRetryable {
    fn is_retryable(&self) -> bool {
        false
    }
}

impl<E> AwsRetryable for Retry<E> {
    fn is_retryable(&self) -> bool {
        match self {
            Retry::Transient(_) => true,
            Retry::Permanent(_) => false,
        }
    }
}

#[derive(Debug)]
struct AwsRetryableWrapper<E>(E);

impl<E> Retryable for AwsRetryableWrapper<E>
where E: AwsRetryable
{
    fn is_retryable(&self) -> bool {
        self.0.is_retryable()
    }
}

pub async fn aws_retry<U, E, Fut>(retry_params: &RetryParams, f: impl Fn() -> Fut) -> Result<U, E>
where
    Fut: Future<Output = Result<U, E>>,
    E: AwsRetryable + Debug + 'static,
{
    retry_with_mockable_sleep(
        retry_params,
        || f().map_err(AwsRetryableWrapper),
        TokioSleep,
    )
    .await
    .map_err(|error| error.0)
}


================================================
FILE: quickwit/quickwit-cli/Cargo.toml
================================================
[package]
name = "quickwit-cli"
description = "Command line interface for launching and managing Quickwit clusters"

version.workspace = true
edition.workspace = true
homepage.workspace = true
documentation.workspace = true
repository.workspace = true
authors.workspace = true
license.workspace = true

default-run = "quickwit"

[[bin]]
name = "quickwit"
path = "src/main.rs"

[[bin]]
name = "generate_markdown"
path = "src/generate_markdown.rs"

[dependencies]
anyhow = { workspace = true }
backtrace = { workspace = true, optional = true }
bytesize = { workspace = true }
chrono = { workspace = true }
clap = { workspace = true }
colored = { workspace = true }
console-subscriber = { workspace = true, optional = true }
dialoguer = { workspace = true }
futures = { workspace = true }
humantime = { workspace = true }
indicatif = { workspace = true }
itertools = { workspace = true }
numfmt = { workspace = true }
once_cell = { workspace = true }
openssl-probe = { workspace = true, optional = true }
opentelemetry = { workspace = true }
opentelemetry-appender-tracing = { workspace = true }
opentelemetry_sdk = { workspace = true }
opentelemetry-otlp = { workspace = true }
reqwest = { workspace = true }
rustls = { workspace = true }
serde_json = { workspace = true }
tabled = { workspace = true }
tempfile = { workspace = true }
thiserror = { workspace = true }
thousands = { workspace = true }
tikv-jemalloc-ctl = { workspace = true, optional = true }
tikv-jemallocator = { workspace = true, optional = true }
time = { workspace = true }
tokio = { workspace = true }
toml = { workspace = true }
tracing = { workspace = true }
tracing-opentelemetry = { workspace = true }
tracing-subscriber = { workspace = true }

quickwit-actors = { workspace = true }
quickwit-cluster = { workspace = true }
quickwit-common = { workspace = true }
quickwit-config = { workspace = true }
quickwit-index-management = { workspace = true }
quickwit-indexing = { workspace = true }
quickwit-ingest = { workspace = true }
quickwit-metastore = { workspace = true }
quickwit-proto = { workspace = true }
quickwit-rest-client = { workspace = true }
quickwit-search = { workspace = true }
quickwit-serve = { workspace = true }
quickwit-storage = { workspace = true }
quickwit-telemetry = { workspace = true }

[dev-dependencies]
predicates = { workspace = true }
reqwest = { workspace = true }

quickwit-actors = { workspace = true, features = ["testsuite"] }
quickwit-common = { workspace = true, features = ["testsuite"] }
quickwit-config = { workspace = true, features = ["testsuite"] }
quickwit-metastore = { workspace = true, features = ["testsuite"] }
quickwit-storage = { workspace = true, features = ["testsuite"] }

[features]
jemalloc = ["dep:tikv-jemalloc-ctl", "dep:tikv-jemallocator"]
jemalloc-profiled = [
  "dep:backtrace",
  "quickwit-common/jemalloc-profiled",
  "quickwit-serve/jemalloc-profiled"
]
ci-test = []
pprof = ["quickwit-serve/pprof"]
openssl-support = ["openssl-probe"]
# Requires to enable tokio unstable via RUSTFLAGS="--cfg tokio_unstable"
tokio-console = ["console-subscriber", "quickwit-common/named_tasks"]
release-feature-set = [
  "jemalloc",
  "openssl-support",
  "pprof",
  "quickwit-indexing/kafka",
  "quickwit-indexing/kinesis",
  "quickwit-indexing/pulsar",
  "quickwit-indexing/sqs",
  "quickwit-indexing/vrl",
  "quickwit-serve/lambda",
  "quickwit-storage/azure",
  "quickwit-storage/gcs",
  "quickwit-metastore/postgres",
]
release-feature-vendored-set = [
  "jemalloc",
  "openssl-support",
  "pprof",
  "quickwit-indexing/kinesis",
  "quickwit-indexing/pulsar",
  "quickwit-indexing/sqs",
  "quickwit-indexing/vrl",
  "quickwit-indexing/vendored-kafka",
  "quickwit-serve/lambda",
  "quickwit-storage/azure",
  "quickwit-storage/gcs",
  "quickwit-metastore/postgres",
]
release-macos-feature-vendored-set = [
  "jemalloc",
  "openssl-support",
  "quickwit-indexing/kinesis",
  "quickwit-indexing/pulsar",
  "quickwit-indexing/sqs",
  "quickwit-indexing/vrl",
  "quickwit-indexing/vendored-kafka-macos",
  "quickwit-serve/lambda",
  "quickwit-storage/azure",
  "quickwit-storage/gcs",
  "quickwit-metastore/postgres",
]
release-jemalloc-profiled = [
  "release-feature-set",
  "jemalloc-profiled",
]


================================================
FILE: quickwit/quickwit-cli/src/checklist.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::fmt::Display;

use colored::{Color, Colorize};
use itertools::Itertools;
use thiserror::Error;

/// Quickwit main colors slightly adapted to be readable on a terminal.
pub const BLUE_COLOR: Color = Color::TrueColor {
    r: 22,
    g: 74,
    b: 209,
};

pub const GREEN_COLOR: Color = Color::Green;
pub const WHITE_COLOR: Color = Color::TrueColor {
    r: 255,
    g: 255,
    b: 255,
};
pub const RED_COLOR: Color = Color::TrueColor {
    r: 230,
    g: 0,
    b: 34,
};

pub fn print_checklist(check_list_results: &[(&str, anyhow::Result<()>)]) {
    eprintln!(
        "\n{}\n{}",
        "---------------------------------------------------".color(GREEN_COLOR),
        " Connectivity checklist "
            .color(WHITE_COLOR)
            .on_color(GREEN_COLOR)
    );
    let mut errors = Vec::new();
    for (check_item_name, check_item_result) in check_list_results {
        let outcome_symbol = if check_item_result.is_ok() {
            "✔".color(GREEN_COLOR) // '✓'
        } else {
            "✖".color(RED_COLOR) //𐄂
        };
        eprintln!(" {outcome_symbol} {check_item_name}");
        if let Err(check_item_err) = check_item_result {
            errors.push((check_item_name, check_item_err));
        }
    }
    if errors.is_empty() {
        println!();
        return;
    }
    eprintln!(
        "{}\n{}",
        "---------------------------------------------------".color(RED_COLOR),
        " Error Details ".color(WHITE_COLOR).on_color(RED_COLOR)
    );
    for (check_item_name, check_item_err) in errors {
        eprintln!(
            "\n{}\n{:?}",
            format!(" ✖ {check_item_name}").color(RED_COLOR),
            check_item_err
        );
    }
    eprintln!("\n\n");
}

/// Run a checklist and print out its successes and failures on stdout.
///
/// If an error is encountered, the process will exit with exit code 1.
pub fn run_checklist(checks: Vec<(&str, anyhow::Result<()>)>) -> Result<(), ChecklistError> {
    print_checklist(&checks);
    if !checks
        .iter()
        .all(|(_, check_items_res)| check_items_res.is_ok())
    {
        return Err(ChecklistError::from_results(checks));
    }

    Ok(())
}

#[derive(Error, Debug)]
pub struct ChecklistError {
    pub errors: Vec<(String, anyhow::Result<()>)>,
}

impl ChecklistError {
    pub fn from_results(results: Vec<(&str, anyhow::Result<()>)>) -> Self {
        let errors = results
            .into_iter()
            .filter(|(_, check_res)| check_res.is_err())
            .map(|(check_elem, check_res)| (check_elem.to_string(), check_res))
            .collect();
        ChecklistError { errors }
    }
}

impl Display for ChecklistError {
    fn fmt(&self, f: &mut std::fmt::Formatter) -> std::fmt::Result {
        let err_string = self
            .errors
            .iter()
            .map(|(check_item, check_item_err)| {
                format!(
                    "\n{}: {}",
                    check_item,
                    check_item_err
                        .as_ref()
                        .expect_err("ChecklistError can't contain success results")
                )
            })
            .join("");
        write!(f, "{err_string}")
    }
}


================================================
FILE: quickwit/quickwit-cli/src/cli.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use anyhow::{Context, bail};
use clap::{Arg, ArgAction, ArgMatches, Command, arg};
use quickwit_serve::EnvFilterReloadFn;
use tracing::Level;

use crate::index::{IndexCliCommand, build_index_command};
use crate::service::{RunCliCommand, build_run_command};
use crate::source::{SourceCliCommand, build_source_command};
use crate::split::{SplitCliCommand, build_split_command};
use crate::tool::{ToolCliCommand, build_tool_command};

pub fn build_cli() -> Command {
    Command::new("Quickwit")
        .arg(
            // Following https://no-color.org/
            Arg::new("no-color")
                .long("no-color")
                .help(
                    "Disable ANSI terminal codes (colors, etc...) being injected into the logging \
                     output",
                )
                .env("NO_COLOR")
                .value_parser(clap::builder::FalseyValueParser::new())
                .global(true)
                .action(ArgAction::SetTrue),
        )
        .arg(arg!(-y --"yes" "Assume \"yes\" as an answer to all prompts and run non-interactively.")
            .global(true)
            .required(false)
        )
        .subcommand(build_run_command().display_order(1))
        .subcommand(build_index_command().display_order(2))
        .subcommand(build_source_command().display_order(3))
        .subcommand(build_split_command().display_order(4))
        .subcommand(build_tool_command().display_order(5))
        .arg_required_else_help(true)
        .disable_help_subcommand(true)
        .subcommand_required(true)
}

#[derive(Debug, PartialEq)]
pub enum CliCommand {
    Run(RunCliCommand),
    Index(IndexCliCommand),
    Split(SplitCliCommand),
    Source(SourceCliCommand),
    Tool(ToolCliCommand),
}

impl CliCommand {
    pub fn default_log_level(&self) -> Level {
        match self {
            CliCommand::Run(_) => Level::INFO,
            CliCommand::Index(subcommand) => subcommand.default_log_level(),
            CliCommand::Source(_) => Level::ERROR,
            CliCommand::Split(_) => Level::ERROR,
            CliCommand::Tool(_) => Level::ERROR,
        }
    }

    pub fn parse_cli_args(mut matches: ArgMatches) -> anyhow::Result<Self> {
        let (subcommand, submatches) = matches
            .remove_subcommand()
            .context("failed to parse command")?;
        match subcommand.as_str() {
            "index" => IndexCliCommand::parse_cli_args(submatches).map(CliCommand::Index),
            "run" => RunCliCommand::parse_cli_args(submatches).map(CliCommand::Run),
            "source" => SourceCliCommand::parse_cli_args(submatches).map(CliCommand::Source),
            "split" => SplitCliCommand::parse_cli_args(submatches).map(CliCommand::Split),
            "tool" => ToolCliCommand::parse_cli_args(submatches).map(CliCommand::Tool),
            _ => bail!("unknown command `{subcommand}`"),
        }
    }

    pub async fn execute(self, env_filter_reload_fn: EnvFilterReloadFn) -> anyhow::Result<()> {
        match self {
            CliCommand::Index(subcommand) => subcommand.execute().await,
            CliCommand::Run(subcommand) => subcommand.execute(env_filter_reload_fn).await,
            CliCommand::Source(subcommand) => subcommand.execute().await,
            CliCommand::Split(subcommand) => subcommand.execute().await,
            CliCommand::Tool(subcommand) => subcommand.execute().await,
        }
    }
}


================================================
FILE: quickwit/quickwit-cli/src/cli_doc_ext.toml
================================================
[index.create]
long_about = """
Creates an index of ID `index` at `index-uri` configured by a [YAML config file](../configuration/index-config.md) located at `index-config`.
The index config lets you define the mapping of your document on the index and how each field is stored and indexed.
If `index-uri` is omitted, `index-uri` will be set to `{default_index_root_uri}/{index}`, more info on [Quickwit config docs](../configuration/node-config.md).
The command fails if an index already exists unless `overwrite` is passed.
When `overwrite` is enabled, the command deletes all the files stored at `index-uri` before creating a new index.
"""

[[index.create.examples]]
name= "Create a new index."
command = '''
# Start a Quickwit server.
quickwit run --config=./config/quickwit.yaml
# Open a new terminal and run:
curl -o wikipedia_index_config.yaml https://raw.githubusercontent.com/quickwit-oss/quickwit/main/config/tutorials/wikipedia/index-config.yaml
quickwit index create --endpoint=http://127.0.0.1:7280 --index-config wikipedia_index_config.yaml
'''

[index.ingest]
long_about = """
Indexes a dataset consisting of newline-delimited JSON objects located at `input-path` or read from *stdin*.
The data is appended to the target index of ID `index` unless `overwrite` is passed. `input-path` can be a file or another command output piped into stdin.
Currently, only local datasets are supported.
By default, Quickwit's indexer will work with a heap of 2 GiB of memory. Learn how to change `heap-size` in the [index config doc page](../configuration/index-config.md).
"""

[[index.ingest.examples]]
name = "Indexing a dataset from a file"
command = '''
# Start a Quickwit server.
quickwit run --config=./config/quickwit.yaml
# Open a new terminal and run:
curl -o wiki-articles-10000.json https://quickwit-datasets-public.s3.amazonaws.com/wiki-articles-10000.json
quickwit index ingest --endpoint=http://127.0.0.1:7280 --index wikipedia --input-path wiki-articles-10000.json
'''

[[index.ingest.examples]]
name = "Indexing a dataset from stdin"
command = '''
# Start a Quickwit server.
quickwit run --config=./config/quickwit.yaml
# Open a new terminal and run:
cat wiki-articles-10000.json | quickwit index ingest --endpoint=http://127.0.0.1:7280 --index wikipedia
'''

[tool.gc]
note = """
Intermediate files are created while executing Quickwit commands.
These intermediate files are always cleaned at the end of each successfully executed command.
However, failed or interrupted commands can leave behind intermediate files that need to be removed.
Also, note that using a very short grace period (like seconds) can cause the removal of intermediate files being operated on, especially when using Quickwit concurrently on the same index.
In practice, you can settle with the default value (1 hour) and only specify a lower value if you really know what you are doing.
"""

[index.search]
long_about = """
Searches an index with ID `--index` and returns the documents matching the query specified with `--query`.
More details on the [query language page](query-language.md).
The offset of the first hit returned and the number of hits returned can be set with the `start-offset` and `max-hits` options.
It's possible to override the default search fields `search-fields` option to define the list of fields that Quickwit will search into if 
the user query does not explicitly target a field in the query. Quickwit will return snippets of the matching content when requested via the `snippet-fields` options.
Search can also be limited to a time range using the `start-timestamp` and `end-timestamp` options.
These timestamp options are useful for boosting query performance when using a time series dataset.

:::warning
The `start_timestamp` and `end_timestamp` should be specified in seconds regardless of the timestamp field precision. The timestamp field precision only affects the way it's stored as fast-fields, whereas the document filtering is always performed in seconds.
:::
"""

[[index.search.examples]]
name = "Searching a index"
command = '''
# Start a Quickwit server.
quickwit run --config=./config/quickwit.yaml
# Open a new terminal and run:
quickwit index search --endpoint=http://127.0.0.1:7280 --index wikipedia --query "Barack Obama"
# If you have jq installed.
quickwit index search --endpoint=http://127.0.0.1:7280 --index wikipedia --query "Barack Obama" | jq '.hits[].title'
'''

[[index.search.examples]]
name = "Sorting documents by their BM25 score"
command = '''
# Start a Quickwit server.
quickwit run --config=./config/quickwit.yaml
# Open a new terminal and run:
quickwit index search --endpoint=http://127.0.0.1:7280 --index wikipedia --query "obama" --sort-by-score
'''

[[index.search.examples]]
name = "Limiting the result set to 50 hits"
command = '''
# Start a Quickwit server.
quickwit run --config=./config/quickwit.yaml
# Open a new terminal and run:
quickwit index search --endpoint=http://127.0.0.1:7280 --index wikipedia --query "Barack Obama" --max-hits 50
# If you have jq installed.
quickwit index search --endpoint=http://127.0.0.1:7280 --index wikipedia --query "Barack Obama" --max-hits 50 | jq '.num_hits'
'''

[[index.search.examples]]
name = "Looking for matches in the title only"
command = '''
# Start a Quickwit server.
quickwit run --config=./config/quickwit.yaml
# Open a new terminal and run:
quickwit index search --endpoint=http://127.0.0.1:7280 --index wikipedia --query "obama" --search-fields body
# If you have jq installed.
quickwit index search --endpoint=http://127.0.0.1:7280 --index wikipedia --query "obama" --search-fields body | jq '.hits[].title'
'''

[[index.list.examples]]
name = "List indexes"
command = '''
# Start a Quickwit server.
quickwit run --config=./config/quickwit.yaml
# Open a new terminal and run:
quickwit index list --endpoint=http://127.0.0.1:7280
# Or with alias.
quickwit index ls --endpoint=http://127.0.0.1:7280

                                    Indexes                                     
+-----------+--------------------------------------------------------+
| Index ID  |                       Index URI                        |
+-----------+--------------------------------------------------------+
| hdfs-logs | file:///home/quickwit-indices/qwdata/indexes/hdfs-logs |
+-----------+--------------------------------------------------------+
| wikipedia | file:///home/quickwit-indices/qwdata/indexes/wikipedia |
+-----------+--------------------------------------------------------+

'''


[[index.describe.examples]]
name = "Displays descriptive statistics of your index"
command = '''
# Start a Quickwit server.
quickwit run --service metastore --config=./config/quickwit.yaml
# Open a new terminal and run:
quickwit index describe --endpoint=http://127.0.0.1:7280 --index wikipedia

1. General infos
===============================================================================
Index id:                           wikipedia
Index uri:                          file:///home/quickwit-indices/qwdata/indexes/wikipedia
Number of published splits:         1
Number of published documents:      300000
Size of published splits:           448 MB

2. Statistics on splits
===============================================================================
Document count stats:
Mean ± σ in [min … max]:            300000 ± 0 in [300000 … 300000]
Quantiles [1%, 25%, 50%, 75%, 99%]: [300000, 300000, 300000, 300000, 300000]

Size in MB stats:
Mean ± σ in [min … max]:            448 ± 0 in [448 … 448]
Quantiles [1%, 25%, 50%, 75%, 99%]: [448, 448, 448, 448, 448]
'''

[[index.delete.examples]]
name = "Delete your index"
command = '''
# Start a Quickwit server.
quickwit run --service metastore --config=./config/quickwit.yaml
# Open a new terminal and run:
quickwit index delete --index wikipedia --endpoint=http://127.0.0.1:7280
'''


[run]
long_about = """

### Indexer service

The indexer service runs indexing pipelines assigned by the control plane.

### Searcher service 
Starts a web server at `rest_listing_address:rest_list_port` that exposes the [Quickwit REST API](rest-api.md)
where `rest_listing_address` and `rest_list_port` are defined in Quickwit config file (quickwit.yaml).
The node can optionally join a cluster using the `peer_seeds` parameter.
This list of node addresses is used to discover the remaining peer nodes in the cluster through a gossip protocol, see [chitchat](https://github.com/quickwit-oss/chitchat).

### Metastore service

The metastore service exposes Quickwit metastore over the network. This is a core internal service that is needed to operate Quickwit. As such, at least one running instance of this service is required for other services to work.

### Control plane service

The control plane service schedules indexing tasks to indexers. It listens to metastore events such as
an source create, delete, toggle, or index delete and reacts accordingly to update the indexing plan.

### Janitor service

The Janitor service runs maintenance tasks on indexes: garbage collection, documents delete, and retention policy tasks.

:::note
Quickwit needs to open the following port for cluster formation and workload distribution:

    TCP port (default is 7280) for REST API
    TCP and UDP port (default is 7280) for cluster membership protocol
    TCP port + 1 (default is 7281) for gRPC address for the distributed search

If ports are already taken, the serve command will fail.
:::
"""

[[run.examples]]
name = "Starts an indexer and a metastore services"
command = "quickwit run --service indexer --service metastore --endpoint=http://127.0.0.1:7280"

[[run.examples]]
name = "Start a control plane, metastore and janitor services"
command = "quickwit run --service control_plane --service metastore --service janitor --config=./config/quickwit.yaml"

[[run.examples]]
name = "Make a search request on a wikipedia index"
command = '''
# To create wikipedia index and ingest data, go to our tutorials https://quickwit.io/docs/get-started/.
# Start a searcher.
quickwit run --service searcher --service metastore --config=./config/quickwit.yaml
# Make a request.
curl "http://127.0.0.1:7280/api/v1/wikipedia/search?query=barack+obama"
'''

[[source.examples]]
name = "Add a Kafka source to `wikipedia` index"
command = '''
# Start a Quickwit server.
quickwit run --service metastore --config=./config/quickwit.yaml
# Open a new terminal and run:
cat << EOF > wikipedia-kafka-source.json
{
  "version": "0.7",
  "source_id": "kafka-source",
  "source_type": "kafka",
  "params": {
    "topic": "wikipedia",
      "client_params": {
        "bootstrap.servers": "localhost:9092",
        "group.id": "my-group-id",
        "security.protocol": "SSL"
      }
  }
}
EOF
quickwit source create --endpoint=http://127.0.0.1:7280 --index wikipedia --config-file wikipedia-kafka-source.json
'''

[[source.list.examples]]
name = "List `wikipedia` index sources"
command = '''
# Start a Quickwit server.
quickwit run --service metastore --config=./config/quickwit.yaml
# Open a new terminal and run:
quickwit source list --endpoint=http://127.0.0.1:7280 --index wikipedia
'''


[[source.delete.examples]]
name = "Delete a `wikipedia-source` source"
command = '''
# Start a Quickwit server.
quickwit run --service metastore --config=./config/quickwit.yaml
# Open a new terminal and run:
quickwit source delete --endpoint=http://127.0.0.1:7280 --index wikipedia --source wikipedia-source
'''


================================================
FILE: quickwit/quickwit-cli/src/generate_markdown.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use clap::Command;
use quickwit_cli::cli::build_cli;
use quickwit_serve::BuildInfo;
use toml::Value;

#[tokio::main]
async fn main() -> anyhow::Result<()> {
    let version_text = BuildInfo::get_version_text();
    let app = build_cli()
        .version(version_text)
        .disable_help_subcommand(true);

    generate_markdown_from_clap(&app);
    Ok(())
}

fn markdown_for_command(command: &Command, doc_extensions: &toml::Value) {
    let command_name = command.get_name();
    let command_ext: Option<&Value> = doc_extensions.get(command_name.to_string());
    markdown_for_command_helper(command, command_ext, command_name.to_string(), Vec::new());
}

fn markdown_for_subcommand(
    subcommand: &Command,
    command_group: Vec<String>,
    doc_extensions: &toml::Value,
    level: usize,
) {
    let subcommand_name = subcommand.get_name();

    let command_name = format!("{} {}", command_group.join(" "), subcommand_name);
    let header_level = "#".repeat(level);
    println!("{header_level} {command_name}\n");

    let subcommand_ext: Option<&Value> = {
        let mut val_opt: Option<&Value> = doc_extensions.get(command_group[0].to_string());
        for command in command_group
            .iter()
            .skip(1)
            .chain(&[subcommand_name.to_string()])
        {
            if let Some(val) = val_opt {
                val_opt = val.get(command);
            }
        }
        val_opt
    };
    markdown_for_command_helper(subcommand, subcommand_ext, command_name, command_group);
}

fn markdown_for_command_helper(
    subcommand: &Command,
    subcommand_ext: Option<&Value>,
    command_name: String,
    command_group: Vec<String>,
) {
    let long_about_opt: Option<&str> =
        subcommand_ext.and_then(|el| el.get("long_about").and_then(|el| el.as_str()));

    let note: Option<&str> =
        subcommand_ext.and_then(|el| el.get("note").and_then(|el| el.as_str()));

    let examples_opt: Option<&Vec<Value>> =
        subcommand_ext.and_then(|el| el.get("examples").and_then(|el| el.as_array()));

    if let Some(about) = long_about_opt {
        if !about.trim().is_empty() {
            println!("{about}  ");
        }
    } else if let Some(about) = subcommand.get_about()
        && !about.to_string().trim().is_empty()
    {
        println!("{about}  ");
    }

    if let Some(note) = note {
        println!(":::note");
        println!("{note}");
        println!(":::");
    }

    println!(
        "`quickwit {} {} [args]`",
        command_group.join(" "),
        subcommand.get_name()
    );
    for alias in subcommand.get_all_aliases() {
        println!("`quickwit {} {} [args]`", command_group.join(" "), alias);
    }

    let arguments = subcommand
        .get_arguments()
        .filter(|arg| !(arg.get_id() == "help" || arg.get_id() == "version"))
        .collect::<Vec<_>>();
    if !arguments.is_empty() {
        println!("\n*Synopsis*\n");

        println!("```bash");
        println!("quickwit {command_name}");
        for arg in &arguments {
            let is_required = arg.is_required_set();
            let is_bool = !arg.get_action().takes_values();

            let mut commando = format!("--{}", arg.get_id());
            if !is_bool {
                commando = format!("{} <{}>", commando, arg.get_id());
            }
            if !is_required {
                commando = format!("[{commando}]");
            }
            println!("    {commando}");
        }
        println!("```");
        println!("\n*Options*\n");

        // Check if any options have defaults to know if the "Default" column is needed
        let has_defaults = arguments
            .iter()
            .any(|arg| !arg.get_default_values().is_empty());

        if has_defaults {
            println!("| Option | Description | Default |");
            println!("|-----------------|-------------|--------:|");
            for arg in arguments {
                let default = if let Some(val) = arg.get_default_values().first() {
                    format!("`{}`", val.to_str().unwrap())
                } else {
                    "".to_string()
                };
                println!(
                    "| `--{}` | {} | {} |",
                    arg.get_id(),
                    arg.get_help().unwrap_or_default(),
                    default
                );
            }
        } else {
            println!("| Option | Description |");
            println!("|-----------------|-------------|");
            for arg in arguments {
                println!(
                    "| `--{}` | {} |",
                    arg.get_id(),
                    arg.get_help().unwrap_or_default()
                );
            }
        }
    }

    if let Some(examples) = examples_opt {
        println!("\n*Examples*\n");
        for example in examples {
            println!("*{}*", example.get("name").unwrap().as_str().unwrap());
            println!(
                "```bash\n{}\n```\n",
                example.get("command").unwrap().as_str().unwrap()
            );
        }
    }
}

fn generate_markdown_from_clap(command: &Command) {
    let ext_toml = include_str!("cli_doc_ext.toml");
    let doc_extensions: Value = ext_toml.parse::<Value>().unwrap();

    let commands = command.get_subcommands();
    for command in commands {
        let command_name = command.get_name(); // index, split, source
        println!("## {command_name}");
        if let Some(about) = command.get_long_about().or_else(|| command.get_about())
            && !about.to_string().trim().is_empty()
        {
            println!("{about}\n");
        }

        if command.get_subcommands().count() == 0 {
            markdown_for_command(command, &doc_extensions);
            continue;
        }

        let excluded_doc_commands = ["merge", "local-search"];
        for subcommand in command
            .get_subcommands()
            .filter(|subcommand| !excluded_doc_commands.contains(&subcommand.get_name()))
        {
            let commands = vec![command.get_name().to_string()];
            markdown_for_subcommand(subcommand, commands, &doc_extensions, 3);

            for subsubcommand in subcommand.get_subcommands() {
                let commands = vec![
                    command.get_name().to_string(),
                    subcommand.get_name().to_string(),
                ];
                markdown_for_subcommand(subsubcommand, commands, &doc_extensions, 4);
            }
        }
    }
    std::process::exit(0);
}


================================================
FILE: quickwit/quickwit-cli/src/index.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::borrow::Cow;
use std::fmt::Display;
use std::num::NonZeroUsize;
use std::ops::Div;
use std::path::PathBuf;
use std::str::FromStr;
use std::time::{Duration, Instant};

use anyhow::{Context, anyhow, bail};
use bytesize::ByteSize;
use clap::{Arg, ArgAction, ArgMatches, Command, arg};
use colored::Colorize;
use indicatif::{ProgressBar, ProgressStyle};
use itertools::Itertools;
use numfmt::{Formatter, Scales};
use quickwit_common::tower::{Rate, RateEstimator, SmaRateEstimator};
use quickwit_common::uri::Uri;
use quickwit_config::{ConfigFormat, IndexConfig};
use quickwit_metastore::{IndexMetadata, Split, SplitState};
use quickwit_proto::search::{CountHits, SortField, SortOrder};
use quickwit_proto::types::IndexId;
use quickwit_rest_client::models::{IngestSource, SearchResponseRestClient};
use quickwit_rest_client::rest_client::{CommitType, IngestEvent};
use quickwit_serve::{ListSplitsQueryParams, SearchRequestQueryString, SortBy};
use quickwit_storage::{StorageResolver, load_file};
use tabled::settings::object::{FirstRow, Rows, Segment};
use tabled::settings::panel::Footer;
use tabled::settings::{Alignment, Format, Modify, Panel, Remove, Rotate, Style};
use tabled::{Table, Tabled};
use tracing::{Level, debug};

use crate::checklist::{GREEN_COLOR, RED_COLOR};
use crate::stats::{mean, percentile, std_deviation};
use crate::{ClientArgs, client_args, make_table, prompt_confirmation};

pub fn build_index_command() -> Command {
    Command::new("index")
        .about("Manages indexes: creates, updates, deletes, ingests, searches, describes...")
        .args(client_args())
        .subcommand(
            Command::new("create")
                .display_order(1)
                .about("Creates an index from an index config file.")
                .args(&[
                    arg!(--"index-config" <INDEX_CONFIG> "Location of the index config file.")
                        .display_order(1)
                        .required(true),
                    arg!(--overwrite "Overwrites pre-existing index. This will delete all existing data stored at `index-uri` before creating a new index.")
                        .display_order(2)
                        .required(false),
                ])
            )
        .subcommand(
            Command::new("update")
            .display_order(1)
            .about("Updates an index using an index config file.")
            .long_about("This command follows PUT semantics, which means that all the fields of the current configuration are replaced by the values specified in this request or the associated defaults. In particular, if the field is optional (e.g. `retention_policy`), omitting it will delete the associated configuration. If the new configuration file contains updates that cannot be applied, the request fails, and none of the updates are applied.")
            .args(&[
                arg!(--index <INDEX> "ID of the target index")
                    .display_order(1)
                    .required(true),
                arg!(--"index-config" <INDEX_CONFIG> "Location of the index config file.")
                    .display_order(2)
                    .required(true),
                arg!(--"create" "Create the index if it does not already exists.")
                    .display_order(3)
                    .required(false),
            ])
        )
        .subcommand(
            Command::new("clear")
                .display_order(3)
                .alias("clr")
                .about("Clears an index: deletes all splits and resets checkpoint.")
                .long_about("Deletes all its splits and resets its checkpoint. This operation is destructive and cannot be undone, proceed with caution.")
                .args(&[
                    arg!(--index <INDEX> "Index ID")
                        .display_order(1)
                        .required(true),
                ])
            )
        .subcommand(
            Command::new("delete")
                .display_order(4)
                .alias("del")
                .about("Deletes an index.")
                .long_about("Deletes an index. This operation is destructive and cannot be undone, proceed with caution.")
                .args(&[
                    arg!(--index <INDEX> "ID of the target index")
                        .display_order(1)
                        .required(true),
                    arg!(--"dry-run" "Executes the command in dry run mode and only displays the list of splits candidates for deletion.")
                        .required(false),
                ])
            )
        .subcommand(
            Command::new("describe")
                .display_order(5)
                .about("Displays descriptive statistics of an index.")
                .long_about("Displays descriptive statistics of an index. Displayed statistics are: number of published splits, number of documents, splits min/max timestamps, size of splits.")
                .args(&[
                    arg!(--index <INDEX> "ID of the target index")
                        .display_order(1)
                        .required(true),
                ])
            )
        .subcommand(
            Command::new("list")
                .alias("ls")
                .display_order(6)
                .about("List indexes.")
            )
        .subcommand(
            Command::new("ingest")
                .display_order(7)
                .about("Ingest NDJSON documents with the ingest API.")
                .long_about("Reads NDJSON documents from a file or streamed from stdin and sends them into ingest API.")
                .args(&[
                    arg!(--index <INDEX> "ID of the target index")
                        .display_order(1)
                        .required(true),
                    arg!(--"input-path" <INPUT_PATH> "Location of the input file.")
                        .required(false),
                    arg!(--"batch-size-limit" <BATCH_SIZE_LIMIT> "Size limit of each submitted document batch.")
                        .required(false),
                    Arg::new("wait")
                        .long("wait")
                        .short('w')
                        .help("Wait for all documents to be committed and available for search before exiting. Applies only to the last batch, see [#5417](https://github.com/quickwit-oss/quickwit/issues/5417).")
                        .action(ArgAction::SetTrue),
                    Arg::new("detailed-response")
                        .long("detailed-response")
                        .help("Print detailed errors. Enabling might impact performance negatively.")
                        .action(ArgAction::SetTrue),
                    Arg::new("force")
                        .long("force")
                        .short('f')
                        .help("Force a commit after the last document is sent, and wait for all documents to be committed and available for search before exiting. Applies only to the last batch, see [#5417](https://github.com/quickwit-oss/quickwit/issues/5417).")
                        .action(ArgAction::SetTrue)
                        .conflicts_with("wait"),
                    Arg::new("commit-timeout")
                        .long("commit-timeout")
                        .help("Timeout for ingest operations that require waiting for the final commit (`--wait` or `--force`). This is different from the `commit_timeout_secs` indexing setting, which sets the maximum time before committing splits after their creation.")
                        .required(false)
                        .global(true),
                ])
            )
        .subcommand(
            Command::new("search")
                .display_order(8)
                .about("Searches an index.")
                .args(&[
                    arg!(--index <INDEX> "ID of the target index")
                        .display_order(1)
                        .required(true),
                    arg!(--query <QUERY> "Query expressed in natural query language ((barack AND obama) OR \"president of united states\"). Learn more on https://quickwit.io/docs/reference/search-language.")
                        .display_order(2)
                        .required(true),
                    arg!(--aggregation <AGG> "JSON serialized aggregation request in tantivy/elasticsearch format.")
                        .required(false),
                    arg!(--"max-hits" <MAX_HITS> "Maximum number of hits returned.")
                        .default_value("20")
                        .required(false),
                    arg!(--"start-offset" <OFFSET> "Offset in the global result set of the first hit returned.")
                        .default_value("0")
                        .required(false),
                    arg!(--"search-fields" <FIELD_NAME> "List of fields that Quickwit will search into if the user query does not explicitly target a field in the query. It overrides the default search fields defined in the index config. Space-separated list, e.g. \"field1 field2\". ")
                        .num_args(1..)
                        .required(false),
                    arg!(--"snippet-fields" <FIELD_NAME> "List of fields that Quickwit will return snippet highlight on. Space-separated list, e.g. \"field1 field2\". ")
                        .num_args(1..)
                        .required(false),
                    arg!(--"start-timestamp" <TIMESTAMP> "Filters out documents before that timestamp (time-series indexes only).")
                        .required(false),
                    arg!(--"end-timestamp" <TIMESTAMP> "Filters out documents after that timestamp (time-series indexes only).")
                        .required(false),
                    arg!(--"sort-by-score" "Sorts documents by their BM25 score.")
                        .required(false),
                ])
            )
        .arg_required_else_help(true)
}

#[derive(Debug, Eq, PartialEq)]
pub struct ClearIndexArgs {
    pub client_args: ClientArgs,
    pub index_id: IndexId,
    pub assume_yes: bool,
}

#[derive(Debug, Eq, PartialEq)]
pub struct CreateIndexArgs {
    pub client_args: ClientArgs,
    pub index_config_uri: Uri,
    pub overwrite: bool,
    pub assume_yes: bool,
}

#[derive(Debug, Eq, PartialEq)]
pub struct UpdateIndexArgs {
    pub client_args: ClientArgs,
    pub index_id: IndexId,
    pub index_config_uri: Uri,
    pub create: bool,
    pub assume_yes: bool,
}

#[derive(Debug, Eq, PartialEq)]
pub struct DescribeIndexArgs {
    pub client_args: ClientArgs,
    pub index_id: IndexId,
}

#[derive(Debug, Eq, PartialEq)]
pub struct IngestDocsArgs {
    pub client_args: ClientArgs,
    pub index_id: IndexId,
    pub input_path_opt: Option<PathBuf>,
    pub batch_size_limit_opt: Option<ByteSize>,
    pub commit_type: CommitType,
    pub detailed_response: bool,
}

#[derive(Debug, Eq, PartialEq)]
pub struct SearchIndexArgs {
    pub client_args: ClientArgs,
    pub index_id: IndexId,
    pub query: String,
    pub aggregation: Option<String>,
    pub max_hits: usize,
    pub start_offset: usize,
    pub search_fields: Option<Vec<String>>,
    pub snippet_fields: Option<Vec<String>>,
    pub start_timestamp: Option<i64>,
    pub end_timestamp: Option<i64>,
    pub sort_by_score: bool,
}

#[derive(Debug, Eq, PartialEq)]
pub struct DeleteIndexArgs {
    pub client_args: ClientArgs,
    pub index_id: IndexId,
    pub dry_run: bool,
    pub assume_yes: bool,
}

#[derive(Debug, Eq, PartialEq)]
pub struct ListIndexesArgs {
    pub client_args: ClientArgs,
}

#[derive(Debug, Eq, PartialEq)]
pub enum IndexCliCommand {
    Clear(ClearIndexArgs),
    Create(CreateIndexArgs),
    Update(UpdateIndexArgs),
    Delete(DeleteIndexArgs),
    Describe(DescribeIndexArgs),
    Ingest(IngestDocsArgs),
    List(ListIndexesArgs),
    Search(SearchIndexArgs),
}

impl IndexCliCommand {
    pub fn default_log_level(&self) -> Level {
        match self {
            Self::Search(_) => Level::ERROR,
            _ => Level::INFO,
        }
    }

    pub fn parse_cli_args(mut matches: ArgMatches) -> anyhow::Result<Self> {
        let (subcommand, submatches) = matches
            .remove_subcommand()
            .context("failed to parse index subcommand")?;
        match subcommand.as_str() {
            "clear" => Self::parse_clear_args(submatches),
            "create" => Self::parse_create_args(submatches),
            "delete" => Self::parse_delete_args(submatches),
            "describe" => Self::parse_describe_args(submatches),
            "ingest" => Self::parse_ingest_args(submatches),
            "list" => Self::parse_list_args(submatches),
            "search" => Self::parse_search_args(submatches),
            "update" => Self::parse_update_args(submatches),
            _ => bail!("unknown index subcommand `{subcommand}`"),
        }
    }

    fn parse_clear_args(mut matches: ArgMatches) -> anyhow::Result<Self> {
        let client_args = ClientArgs::parse(&mut matches)?;
        let index_id = matches
            .remove_one::<String>("index")
            .expect("`index` should be a required arg");
        let assume_yes = matches.get_flag("yes");
        Ok(Self::Clear(ClearIndexArgs {
            client_args,
            index_id,
            assume_yes,
        }))
    }

    fn parse_create_args(mut matches: ArgMatches) -> anyhow::Result<Self> {
        let client_args = ClientArgs::parse(&mut matches)?;
        let index_config_uri = matches
            .remove_one::<String>("index-config")
            .map(|uri| Uri::from_str(&uri))
            .expect("`index-config` should be a required arg")?;
        let overwrite = matches.get_flag("overwrite");
        let assume_yes = matches.get_flag("yes");

        Ok(Self::Create(CreateIndexArgs {
            client_args,
            index_config_uri,
            overwrite,
            assume_yes,
        }))
    }

    fn parse_update_args(mut matches: ArgMatches) -> anyhow::Result<Self> {
        let client_args = ClientArgs::parse(&mut matches)?;
        let index_id = matches
            .remove_one::<String>("index")
            .expect("`index` should be a required arg");
        let index_config_uri = matches
            .remove_one::<String>("index-config")
            .map(|uri| Uri::from_str(&uri))
            .expect("`index-config` should be a required arg")?;
        let create = matches.get_flag("create");
        let assume_yes = matches.get_flag("yes");

        Ok(Self::Update(UpdateIndexArgs {
            index_id,
            client_args,
            index_config_uri,
            create,
            assume_yes,
        }))
    }

    fn parse_describe_args(mut matches: ArgMatches) -> anyhow::Result<Self> {
        let client_args = ClientArgs::parse(&mut matches)?;
        let index_id = matches
            .remove_one::<String>("index")
            .expect("`index` should be a required arg");

        Ok(Self::Describe(DescribeIndexArgs {
            client_args,
            index_id,
        }))
    }

    fn parse_list_args(mut matches: ArgMatches) -> anyhow::Result<Self> {
        let client_args = ClientArgs::parse(&mut matches)?;
        Ok(Self::List(ListIndexesArgs { client_args }))
    }

    fn parse_ingest_args(mut matches: ArgMatches) -> anyhow::Result<Self> {
        let client_args = ClientArgs::parse_for_ingest(&mut matches)?;
        let index_id = matches
            .remove_one::<String>("index")
            .expect("`index` should be a required arg");
        let input_path_opt = if let Some(input_path) = matches.remove_one::<String>("input-path") {
            Uri::from_str(&input_path)?
                .filepath()
                .map(|path| path.to_path_buf())
        } else {
            None
        };
        let detailed_response: bool = matches.get_flag("detailed-response");
        let batch_size_limit_opt = matches
            .remove_one::<String>("batch-size-limit")
            .map(|limit| limit.parse::<ByteSize>())
            .transpose()
            .map_err(|error| anyhow!(error))?;
        let commit_type = match (matches.get_flag("wait"), matches.get_flag("force")) {
            (false, false) => CommitType::Auto,
            (false, true) => CommitType::Force,
            (true, false) => CommitType::WaitFor,
            (true, true) => bail!("`--wait` and `--force` are mutually exclusive options"),
        };

        if commit_type == CommitType::Auto && client_args.commit_timeout.is_some() {
            bail!("`--commit-timeout` can only be used with --wait or --force options");
        }

        Ok(Self::Ingest(IngestDocsArgs {
            client_args,
            index_id,
            input_path_opt,
            batch_size_limit_opt,
            commit_type,
            detailed_response,
        }))
    }

    fn parse_search_args(mut matches: ArgMatches) -> anyhow::Result<Self> {
        let index_id = matches
            .remove_one::<String>("index")
            .expect("`index` should be a required arg");
        let query = matches
            .remove_one::<String>("query")
            .context("`query` should be a required arg")?;
        let aggregation = matches.remove_one::<String>("aggregation");

        let max_hits = matches
            .remove_one::<String>("max-hits")
            .expect("`max-hits` should have a default value.")
            .parse()?;
        let start_offset = matches
            .remove_one::<String>("start-offset")
            .expect("`start-offset` should have a default value.")
            .parse()?;
        let search_fields = matches
            .remove_many::<String>("search-fields")
            .map(|values| values.collect());
        let snippet_fields = matches
            .remove_many::<String>("snippet-fields")
            .map(|values| values.collect());
        let sort_by_score = matches.get_flag("sort-by-score");
        let start_timestamp = matches
            .remove_one::<String>("start-timestamp")
            .map(|ts| ts.parse())
            .transpose()?;
        let end_timestamp = matches
            .remove_one::<String>("end-timestamp")
            .map(|ts| ts.parse())
            .transpose()?;
        let client_args = ClientArgs::parse(&mut matches)?;
        Ok(Self::Search(SearchIndexArgs {
            index_id,
            query,
            aggregation,
            max_hits,
            start_offset,
            search_fields,
            snippet_fields,
            start_timestamp,
            end_timestamp,
            client_args,
            sort_by_score,
        }))
    }

    fn parse_delete_args(mut matches: ArgMatches) -> anyhow::Result<Self> {
        let client_args = ClientArgs::parse(&mut matches)?;
        let index_id = matches
            .remove_one::<String>("index")
            .expect("`index` should be a required arg");
        let dry_run = matches.get_flag("dry-run");
        let assume_yes = matches.get_flag("yes");
        Ok(Self::Delete(DeleteIndexArgs {
            index_id,
            dry_run,
            client_args,
            assume_yes,
        }))
    }

    pub async fn execute(self) -> anyhow::Result<()> {
        match self {
            Self::Clear(args) => clear_index_cli(args).await,
            Self::Create(args) => create_index_cli(args).await,
            Self::Delete(args) => delete_index_cli(args).await,
            Self::Describe(args) => describe_index_cli(args).await,
            Self::Ingest(args) => ingest_docs_cli(args).await,
            Self::List(args) => list_index_cli(args).await,
            Self::Search(args) => search_index_cli(args).await,
            Self::Update(args) => update_index_cli(args).await,
        }
    }
}

pub async fn clear_index_cli(args: ClearIndexArgs) -> anyhow::Result<()> {
    debug!(args=?args, "clear-index");
    if !args.assume_yes {
        let prompt = format!(
            "This operation will delete all the splits of the index `{}` and reset its \
             checkpoint. Do you want to proceed?",
            args.index_id
        );
        if !prompt_confirmation(&prompt, false) {
            return Ok(());
        }
    }
    let qw_client = args.client_args.client();
    qw_client.indexes().clear(&args.index_id).await?;
    println!("{} Index successfully cleared.", "✔".color(GREEN_COLOR),);
    Ok(())
}

pub async fn create_index_cli(args: CreateIndexArgs) -> anyhow::Result<()> {
    debug!(args=?args, "create-index");
    println!("❯ Creating index...");
    let storage_resolver = StorageResolver::unconfigured();
    let file_content = load_file(&storage_resolver, &args.index_config_uri).await?;
    let index_config_str: String = std::str::from_utf8(&file_content)
        .with_context(|| format!("Invalid utf8: `{}`", args.index_config_uri))?
        .to_string();
    let config_format = ConfigFormat::sniff_from_uri(&args.index_config_uri)?;
    let qw_client = args.client_args.client();
    // TODO: nice to have: check first if the index exists by send a GET request, if we get a 404,
    // the index does not exist. If it exists, we can display the prompt.
    if args.overwrite && !args.assume_yes {
        // Stop if user answers no.
        let prompt = "This operation will overwrite the index and delete all its data. Do you \
                      want to proceed?"
            .to_string();
        if !prompt_confirmation(&prompt, false) {
            return Ok(());
        }
    }
    qw_client
        .indexes()
        .create(&index_config_str, config_format, args.overwrite)
        .await?;
    println!("{} Index successfully created.", "✔".color(GREEN_COLOR));
    Ok(())
}

pub async fn update_index_cli(args: UpdateIndexArgs) -> anyhow::Result<()> {
    debug!(args=?args, "update-index");
    println!("❯ Updating index...");
    let storage_resolver = StorageResolver::unconfigured();
    let file_content = load_file(&storage_resolver, &args.index_config_uri).await?;
    let index_config_str = std::str::from_utf8(&file_content)
        .with_context(|| {
            format!(
                "index config file `{}` contains some invalid UTF-8 characters",
                args.index_config_uri
            )
        })?
        .to_string();
    let config_format = ConfigFormat::sniff_from_uri(&args.index_config_uri)?;
    let qw_client = args.client_args.client();
    if !args.assume_yes {
        let prompt = "This operation will update the index configuration. Do you want to proceed?";
        if !prompt_confirmation(prompt, false) {
            return Ok(());
        }
    }
    qw_client
        .indexes()
        .update(
            &args.index_id,
            &index_config_str,
            config_format,
            args.create,
        )
        .await?;
    println!("{} Index successfully updated.", "✔".color(GREEN_COLOR));
    Ok(())
}

pub async fn list_index_cli(args: ListIndexesArgs) -> anyhow::Result<()> {
    debug!(args=?args, "list-index");
    let qw_client = args.client_args.client();
    let indexes_metadatas = qw_client.indexes().list().await?;
    let index_table = make_list_indexes_table(
        indexes_metadatas
            .into_iter()
            .map(IndexMetadata::into_index_config),
    );
    println!("\n{index_table}\n");
    Ok(())
}

fn make_list_indexes_table<I>(indexes: I) -> Table
where I: IntoIterator<Item = IndexConfig> {
    let rows = indexes
        .into_iter()
        .map(|index| IndexRow {
            index_id: index.index_id,
            index_uri: index.index_uri,
        })
        .sorted_by(|left, right| left.index_id.cmp(&right.index_id));
    make_table("Indexes", rows, false)
}

#[derive(Tabled)]
struct IndexRow {
    #[tabled(rename = "Index ID")]
    index_id: IndexId,
    #[tabled(rename = "Index URI")]
    index_uri: Uri,
}

pub async fn describe_index_cli(args: DescribeIndexArgs) -> anyhow::Result<()> {
    debug!(args=?args, "describe-index");
    let qw_client = args.client_args.client();
    let index_metadata = qw_client.indexes().get(&args.index_id).await?;
    let list_splits_query_params = ListSplitsQueryParams::default();
    let splits = qw_client
        .splits(&args.index_id)
        .list(list_splits_query_params)
        .await?;
    let index_stats = IndexStats::from_metadata(index_metadata, splits)?;
    println!("{}", index_stats.display_as_table());
    Ok(())
}

pub struct IndexStats {
    pub index_id: IndexId,
    pub index_uri: Uri,
    pub num_published_splits: usize,
    pub size_published_splits: ByteSize,
    pub num_published_docs: u64,
    pub size_published_docs_uncompressed: ByteSize,
    pub timestamp_field_name: Option<String>,
    pub timestamp_range: Option<(i64, i64)>,
    pub num_docs_descriptive: Option<DescriptiveStats>,
    pub num_bytes_descriptive: Option<DescriptiveStats>,
}

impl Tabled for IndexStats {
    const LENGTH: usize = 9;

    fn fields(&self) -> Vec<Cow<'_, str>> {
        let num_published_docs = format!(
            "{} ({})",
            format_to_si_scale(self.num_published_docs),
            separate_thousands(self.num_published_docs)
        );

        [
            self.index_id.to_string(),
            self.index_uri.to_string(),
            num_published_docs,
            self.size_published_docs_uncompressed.to_string(),
            separate_thousands(self.num_published_splits),
            self.size_published_splits.to_string(),
            display_option_in_table(&self.timestamp_field_name),
            display_timestamp(&self.timestamp_range.map(|(start, _end)| start)),
            display_timestamp(&self.timestamp_range.map(|(_start, end)| end)),
        ]
        .into_iter()
        .map(|field| field.into())
        .collect()
    }

    fn headers() -> Vec<Cow<'static, str>> {
        [
            "Index ID",
            "Index URI",
            "Number of published documents",
            "Size of published documents (uncompressed)",
            "Number of published splits",
            "Size of published splits",
            "Timestamp field",
            "Timestamp range start",
            "Timestamp range end",
        ]
        .into_iter()
        .map(|header| header.into())
        .collect()
    }
}

fn format_to_si_scale(num: impl numfmt::Numeric) -> String {
    let mut si_scale_formatter = Formatter::new().scales(Scales::metric());
    si_scale_formatter.fmt2(num).to_string()
}

fn separate_thousands(num: impl numfmt::Numeric) -> String {
    let mut thousands_separator_formatter = Formatter::new()
        .separator(',')
        // NOTE: .separator(sep) only panics if sep.len_utf8() != 1
        .expect("`,` separator should be valid")
        .precision(numfmt::Precision::Significance(3));

    thousands_separator_formatter.fmt2(num).to_string()
}

fn display_option_in_table(opt: &Option<impl Display>) -> String {
    match opt {
        Some(opt_val) => format!("\"{opt_val}\""),
        None => "Field does not exist for the index.".to_string(),
    }
}

fn display_timestamp(timestamp: &Option<i64>) -> String {
    match timestamp {
        Some(timestamp) => {
            let datetime = chrono::DateTime::from_timestamp_millis(*timestamp * 1000)
                .map(|datetime| datetime.format("%Y-%m-%d %H:%M:%S").to_string())
                .unwrap_or_else(|| "Invalid timestamp!".to_string());
            format!("{datetime} (Timestamp: {timestamp})")
        }
        _ => "Timestamp does not exist for the index.".to_string(),
    }
}

impl IndexStats {
    pub fn from_metadata(
        index_metadata: IndexMetadata,
        splits: Vec<Split>,
    ) -> anyhow::Result<Self> {
        let published_splits: Vec<Split> = splits
            .into_iter()
            .filter(|split| split.split_state == SplitState::Published)
            .collect();
        let splits_num_docs = published_splits
            .iter()
            .map(|split| split.split_metadata.num_docs as u64)
            .sorted()
            .collect_vec();

        let total_num_docs = splits_num_docs.iter().sum::<u64>();

        let splits_bytes = published_splits
            .iter()
            .map(|split| split.split_metadata.footer_offsets.end)
            .sorted()
            .collect_vec();
        let total_num_bytes = splits_bytes.iter().sum::<u64>();
        let total_uncompressed_num_bytes = published_splits
            .iter()
            .map(|split| split.split_metadata.uncompressed_docs_size_in_bytes)
            .sum::<u64>();

        let timestamp_range = if index_metadata
            .index_config()
            .doc_mapping
            .timestamp_field
            .is_some()
        {
            let time_min = published_splits
                .iter()
                .flat_map(|split| split.split_metadata.time_range.clone())
                .map(|time_range| *time_range.start())
                .min();
            let time_max = published_splits
                .iter()
                .flat_map(|split| split.split_metadata.time_range.clone())
                .map(|time_range| *time_range.end())
                .max();
            if let (Some(time_min), Some(time_max)) = (time_min, time_max) {
                Some((time_min, time_max))
            } else {
                None
            }
        } else {
            None
        };

        let (num_docs_descriptive, num_bytes_descriptive) = if !published_splits.is_empty() {
            (
                DescriptiveStats::maybe_new(&splits_num_docs),
                DescriptiveStats::maybe_new(&splits_bytes),
            )
        } else {
            (None, None)
        };
        let index_config = index_metadata.into_index_config();

        Ok(Self {
            index_id: index_config.index_id.clone(),
            index_uri: index_config.index_uri.clone(),
            num_published_splits: published_splits.len(),
            size_published_splits: ByteSize(total_num_bytes),
            num_published_docs: total_num_docs,
            size_published_docs_uncompressed: ByteSize(total_uncompressed_num_bytes),
            timestamp_field_name: index_config.doc_mapping.timestamp_field,
            timestamp_range,
            num_docs_descriptive,
            num_bytes_descriptive,
        })
    }

    pub fn display_as_table(&self) -> String {
        let mut tables = Vec::new();
        let index_stats_table = create_table(self, "General Information", true);
        tables.push(index_stats_table);

        if let Some(docs_stats) = &self.num_docs_descriptive {
            let doc_stats_table = docs_stats.into_table("Published documents count stats");
            tables.push(doc_stats_table);
        }

        if let Some(size_stats) = &self.num_bytes_descriptive {
            let size_stats_in_mb = size_stats / 1_000_000.0;
            let size_stats_table = size_stats_in_mb.into_table("Published splits size stats (MB)");
            tables.push(size_stats_table);
        }

        Table::builder(tables.into_iter().map(|table| table.to_string()))
            .build()
            .with(Modify::new(Segment::all()).with(Alignment::center_vertical()))
            .with(Remove::row(FirstRow))
            .with(Style::empty())
            .to_string()
    }
}

fn create_table(table: impl Tabled, header: &str, is_vertical: bool) -> Table {
    let mut table = Table::new(vec![table]);

    // Make the field names GREEN :D
    table.with(Modify::new(Rows::first()).with(Format::content(|column| {
        column.color(GREEN_COLOR).to_string()
    })));

    if is_vertical {
        table.with(Rotate::Left).with(Rotate::Bottom);
    }

    table
        .with(Panel::header(header))
        // Makes the table header bright green and bold.
        .with(Modify::new(Rows::first()).with(Format::content(|header| {
            header.bright_green().bold().to_string()
        })))
        .with(
            Modify::new(Segment::all())
                .with(Alignment::left())
                .with(Alignment::top()),
        )
        .with(Footer::new("\n"))
        .with(Style::psql());

    table
}

#[derive(Debug, Clone, Copy)]
pub struct DescriptiveStats {
    summary_stats: SummaryStats,
    quantiles: Quantiles,
}

impl DescriptiveStats {
    pub fn into_table(self, header: &str) -> Table {
        let summary_stats_table = create_table(self.summary_stats, header, true);
        let quantiles_table = create_table(self.quantiles, "Quantiles", false);
        let mut table =
            Table::builder([summary_stats_table.to_string(), quantiles_table.to_string()]).build();

        table
            .with(Style::empty())
            .with(Remove::row(FirstRow))
            // We separate tables with a newline already, this is to separate quantile part of the
            // table further away from the next table.
            .with(Footer::new("\n"));

        table
    }
}

impl Div<f32> for &DescriptiveStats {
    type Output = DescriptiveStats;

    fn div(self, rhs: f32) -> Self::Output {
        DescriptiveStats {
            summary_stats: self.summary_stats / rhs,
            quantiles: self.quantiles / rhs,
        }
    }
}

#[derive(Debug, Clone, Copy)]
pub struct SummaryStats {
    mean_val: f32,
    std_val: f32,
    min_val: u64,
    max_val: u64,
}

impl Div<f32> for SummaryStats {
    type Output = Self;

    fn div(self, rhs: f32) -> Self::Output {
        Self {
            mean_val: self.mean_val / rhs,
            std_val: self.std_val / rhs,
            min_val: self.min_val / rhs as u64,
            max_val: self.max_val / rhs as u64,
        }
    }
}

#[derive(Debug, Clone, Copy)]
pub struct Quantiles {
    q1: f32,
    q25: f32,
    q50: f32,
    q75: f32,
    q99: f32,
}

impl Div<f32> for Quantiles {
    type Output = Self;

    fn div(self, rhs: f32) -> Self::Output {
        Self {
            q1: self.q1 / rhs,
            q25: self.q25 / rhs,
            q50: self.q50 / rhs,
            q75: self.q75 / rhs,
            q99: self.q99 / rhs,
        }
    }
}

impl DescriptiveStats {
    pub fn maybe_new(values: &[u64]) -> Option<DescriptiveStats> {
        if values.is_empty() {
            return None;
        }

        Some(DescriptiveStats {
            summary_stats: SummaryStats {
                mean_val: mean(values),
                std_val: std_deviation(values),
                min_val: *values.iter().min().expect("Values should not be empty."),
                max_val: *values.iter().max().expect("Values should not be empty."),
            },
            quantiles: Quantiles {
                q1: percentile(values, 1),
                q25: percentile(values, 25),
                q50: percentile(values, 50),
                q75: percentile(values, 75),
                q99: percentile(values, 99),
            },
        })
    }
}

impl Tabled for SummaryStats {
    const LENGTH: usize = 4;

    fn fields(&self) -> Vec<Cow<'_, str>> {
        [
            separate_thousands(self.mean_val),
            separate_thousands(self.min_val),
            separate_thousands(self.max_val),
            separate_thousands(self.std_val),
        ]
        .into_iter()
        .map(|field| field.into())
        .collect()
    }

    fn headers() -> Vec<Cow<'static, str>> {
        [
            "Mean".to_string(),
            "Min".to_string(),
            "Max".to_string(),
            "Standard deviation".to_string(),
        ]
        .into_iter()
        .map(|header| header.into())
        .collect()
    }
}

impl Tabled for Quantiles {
    const LENGTH: usize = 5;

    fn fields(&self) -> Vec<Cow<'_, str>> {
        [
            separate_thousands(self.q1),
            separate_thousands(self.q25),
            separate_thousands(self.q50),
            separate_thousands(self.q75),
            separate_thousands(self.q99),
        ]
        .into_iter()
        .map(|field| field.into())
        .collect()
    }

    fn headers() -> Vec<Cow<'static, str>> {
        [
            "1%".to_string(),
            "25%".to_string(),
            "50%".to_string(),
            "75%".to_string(),
            "99%".to_string(),
        ]
        .into_iter()
        .map(|header| header.into())
        .collect()
    }
}

pub async fn ingest_docs_cli(args: IngestDocsArgs) -> anyhow::Result<()> {
    debug!(args=?args, "ingest-docs");
    let mut rate_estimator = SmaRateEstimator::new(
        NonZeroUsize::new(8).unwrap(),
        Duration::from_millis(250),
        Duration::from_secs(1),
    );
    if let Some(input_path) = &args.input_path_opt {
        println!("❯ Ingesting documents from {}.", input_path.display());
    } else {
        println!("❯ Ingesting documents from stdin.");
    }
    let progress_bar = match &args.input_path_opt {
        Some(filepath) => {
            let file_len = std::fs::metadata(filepath).context("file not found")?.len();
            ProgressBar::new(file_len)
        }
        None => ProgressBar::new_spinner(),
    };
    progress_bar.enable_steady_tick(Duration::from_millis(100));
    progress_bar.set_style(progress_bar_style());
    progress_bar.set_message("0MiB/s");
    // It is not used by the rate estimator anyway.
    let useless_start_time = Instant::now();
    let mut update_progress_bar = |ingest_event: IngestEvent| {
        match ingest_event {
            IngestEvent::IngestedDocBatch(num_bytes) => {
                rate_estimator.update(useless_start_time, Instant::now(), num_bytes as u64);
                progress_bar.inc(num_bytes as u64)
            }
            IngestEvent::Sleep => {} // To
        };
        let throughput = rate_estimator.work() as f64 / (1024 * 1024) as f64;
        progress_bar.set_message(format!("{throughput:.1} MiB/s"));
    };

    let mut qw_client_builder = args.client_args.client_builder();
    if args.detailed_response {
        qw_client_builder = qw_client_builder.detailed_response(args.detailed_response);
    }
    let qw_client = qw_client_builder.build();
    let ingest_source = match args.input_path_opt {
        Some(filepath) => IngestSource::File(filepath),
        None => IngestSource::Stdin,
    };
    let batch_size_limit_opt = args
        .batch_size_limit_opt
        .map(|batch_size_limit| batch_size_limit.as_u64() as usize);
    let response = qw_client
        .ingest(
            &args.index_id,
            ingest_source,
            batch_size_limit_opt,
            Some(&mut update_progress_bar),
            args.commit_type,
        )
        .await?;
    progress_bar.finish();
    println!(
        "{} Ingested {} document(s) successfully.",
        "✔".color(GREEN_COLOR),
        response
            .num_ingested_docs
            // TODO(#5604) remove unwrap
            .unwrap_or(response.num_docs_for_processing),
    );
    if let Some(rejected) = response.num_rejected_docs
        && rejected > 0
    {
        println!(
            "{} Rejected {} document(s).",
            "✖".color(RED_COLOR),
            rejected
        );
    }
    if let Some(parse_failures) = response.parse_failures {
        if !parse_failures.is_empty() {
            println!("Detailed parse failures:");
        }
        for (idx, failure) in parse_failures.iter().enumerate() {
            let reason_value = serde_json::to_value(failure.reason).unwrap();
            println!();
            println!("┌ error {}", idx + 1);
            println!("├ reason: {}", reason_value.as_str().unwrap());
            println!("├ message: {}", failure.message);
            println!("└ document: {}", failure.document);
        }
    }
    Ok(())
}

fn progress_bar_style() -> ProgressStyle {
    ProgressStyle::with_template(
        "{spinner:.blue} [{elapsed_precise}] {bytes}/{total_bytes} ({msg})",
    )
    .expect("Progress style should always be valid.")
    .tick_strings(&["⠋", "⠙", "⠹", "⠸", "⠼", "⠴", "⠦", "⠧", "⠇", "⠏"])
}

pub async fn search_index(args: SearchIndexArgs) -> anyhow::Result<SearchResponseRestClient> {
    let aggs: Option<serde_json::Value> = args
        .aggregation
        .map(|aggs_string| {
            serde_json::from_str(&aggs_string).context("failed to deserialize aggregations")
        })
        .transpose()?;
    let sort_fields = if args.sort_by_score {
        vec![SortField {
            field_name: "_score".to_string(),
            sort_order: SortOrder::Desc as i32,
            sort_datetime_format: None,
        }]
    } else {
        Vec::new()
    };
    let sort_by = SortBy { sort_fields };
    let search_request = SearchRequestQueryString {
        query: args.query,
        aggs,
        search_fields: args.search_fields.clone(),
        snippet_fields: args.snippet_fields.clone(),
        start_timestamp: args.start_timestamp,
        end_timestamp: args.end_timestamp,
        max_hits: args.max_hits as u64,
        start_offset: args.start_offset as u64,
        sort_by,
        count_all: CountHits::CountAll,
        ..Default::default()
    };
    let qw_client = args.client_args.client();
    let search_response = qw_client.search(&args.index_id, search_request).await?;
    Ok(search_response)
}

pub async fn search_index_cli(args: SearchIndexArgs) -> anyhow::Result<()> {
    debug!(args=?args, "search-index");
    let search_response_rest = search_index(args).await?;
    let search_response_json = serde_json::to_string_pretty(&search_response_rest)?;
    println!("{search_response_json}");
    Ok(())
}

pub async fn delete_index_cli(args: DeleteIndexArgs) -> anyhow::Result<()> {
    debug!(args=?args, "delete-index");
    if !args.dry_run && !args.assume_yes {
        let prompt = "This operation will delete the index. Do you want to proceed?".to_string();
        if !prompt_confirmation(&prompt, false) {
            return Ok(());
        }
    }

    println!("❯ Deleting index...");
    let qw_client = args.client_args.client();
    let affected_files = qw_client
        .indexes()
        .delete(&args.index_id, args.dry_run)
        .await?;

    if args.dry_run {
        if affected_files.is_empty() {
            println!("Only the index will be deleted since it does not contains any data file.");
            return Ok(());
        }
        println!(
            "The following files will be removed from the index `{}`",
            args.index_id
        );
        for split_info in affected_files {
            println!(" - {}", split_info.file_name.display());
        }
        return Ok(());
    }
    println!("{} Index successfully deleted.", "✔".color(GREEN_COLOR));
    Ok(())
}

#[cfg(test)]
mod test {

    use std::ops::RangeInclusive;

    use quickwit_metastore::SplitMetadata;

    use super::*;

    pub fn split_metadata_for_test(
        split_id: &str,
        num_docs: usize,
        time_range: RangeInclusive<i64>,
        size: u64,
    ) -> SplitMetadata {
        let mut split_metadata = SplitMetadata::for_test(split_id.to_string());
        split_metadata.num_docs = num_docs;
        split_metadata.time_range = Some(time_range);
        split_metadata.footer_offsets = (size - 10)..size;
        split_metadata
    }

    #[test]
    fn test_index_stats() -> anyhow::Result<()> {
        let index_id = "index-stats-env".to_string();
        let split_id_1 = "test_split_id_1".to_string();
        let split_id_2 = "test_split_id_2".to_string();
        let index_uri = "s3://some-test-bucket";

        let index_metadata = IndexMetadata::for_test(&index_id, index_uri);
        let mut split_metadata_1 =
            split_metadata_for_test(&split_id_1, 100_000, 1111..=2222, 15_000_000);
        split_metadata_1.uncompressed_docs_size_in_bytes = 19_000_000;
        let mut split_metadata_2 =
            split_metadata_for_test(&split_id_2, 100_000, 1000..=3000, 30_000_000);
        split_metadata_2.uncompressed_docs_size_in_bytes = 36_000_000;

        let split_data_1 = Split {
            split_metadata: split_metadata_1,
            split_state: SplitState::Published,
            update_timestamp: 0,
            publish_timestamp: Some(10),
        };
        let split_data_2 = Split {
            split_metadata: split_metadata_2,
            split_state: SplitState::MarkedForDeletion,
            update_timestamp: 0,
            publish_timestamp: Some(10),
        };

        let index_stats =
            IndexStats::from_metadata(index_metadata, vec![split_data_1, split_data_2])?;

        assert_eq!(index_stats.index_id, index_id);
        assert_eq!(index_stats.index_uri.as_str(), index_uri);
        assert_eq!(index_stats.num_published_splits, 1);
        assert_eq!(index_stats.size_published_splits, ByteSize::mb(15));
        assert_eq!(index_stats.num_published_docs, 100_000);
        assert_eq!(
            index_stats.size_published_docs_uncompressed,
            ByteSize::mb(19)
        );
        assert_eq!(
            index_stats.timestamp_field_name,
            Some("timestamp".to_string())
        );
        assert_eq!(index_stats.timestamp_range, Some((1111, 2222)));

        Ok(())
    }

    #[test]
    fn test_descriptive_stats() -> anyhow::Result<()> {
        let split_id = "stat-test-split".to_string();
        let template_split = Split {
            split_state: SplitState::Published,
            update_timestamp: 10,
            publish_timestamp: Some(10),
            split_metadata: SplitMetadata::default(),
        };

        let split_metadata_1 = split_metadata_for_test(&split_id, 70_000, 10..=12, 60_000_000);
        let split_metadata_2 = split_metadata_for_test(&split_id, 120_000, 11..=15, 145_000_000);
        let split_metadata_3 = split_metadata_for_test(&split_id, 90_000, 15..=22, 115_000_000);
        let split_metadata_4 = split_metadata_for_test(&split_id, 40_000, 22..=22, 55_000_000);

        let mut split_1 = template_split.clone();
        split_1.split_metadata = split_metadata_1;
        let mut split_2 = template_split.clone();
        split_2.split_metadata = split_metadata_2;
        let mut split_3 = template_split.clone();
        split_3.split_metadata = split_metadata_3;
        let mut split_4 = template_split;
        split_4.split_metadata = split_metadata_4;

        let splits = [split_1, split_2, split_3, split_4];

        let splits_num_docs = splits
            .iter()
            .map(|split| split.split_metadata.num_docs as u64)
            .sorted()
            .collect_vec();

        let splits_bytes = splits
            .iter()
            .map(|split| split.split_metadata.footer_offsets.end)
            .sorted()
            .collect_vec();

        let num_docs_descriptive = DescriptiveStats::maybe_new(&splits_num_docs);
        let num_bytes_descriptive = DescriptiveStats::maybe_new(&splits_bytes);

        assert!(num_docs_descriptive.is_some());
        assert!(num_bytes_descriptive.is_some());

        let num_docs_descriptive = num_docs_descriptive.unwrap();
        let num_bytes_descriptive = num_bytes_descriptive.unwrap();

        assert_eq!(num_docs_descriptive.quantiles.q1, 40900.0);
        assert_eq!(num_docs_descriptive.quantiles.q25, 62500.0);
        assert_eq!(num_docs_descriptive.quantiles.q50, 80000.0);
        assert_eq!(num_docs_descriptive.quantiles.q75, 97500.0);
        assert_eq!(num_docs_descriptive.quantiles.q99, 119100.0);

        assert_eq!(num_bytes_descriptive.quantiles.q1, 55150000.0);
        assert_eq!(num_bytes_descriptive.quantiles.q25, 58750000.0);
        assert_eq!(num_bytes_descriptive.quantiles.q50, 87500000.0);
        assert_eq!(num_bytes_descriptive.quantiles.q75, 122500000.0);
        assert_eq!(num_bytes_descriptive.quantiles.q99, 144100000.0);

        let descriptive_stats_none = DescriptiveStats::maybe_new(&[]);
        assert!(descriptive_stats_none.is_none());

        Ok(())
    }
}


================================================
FILE: quickwit/quickwit-cli/src/jemalloc.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::time::Duration;

use quickwit_common::metrics::MEMORY_METRICS;
use tikv_jemallocator::Jemalloc;
use tracing::error;

#[cfg(feature = "jemalloc-profiled")]
#[global_allocator]
pub static GLOBAL: quickwit_common::jemalloc_profiled::JemallocProfiled =
    quickwit_common::jemalloc_profiled::JemallocProfiled(Jemalloc);

#[cfg(not(feature = "jemalloc-profiled"))]
#[global_allocator]
pub static GLOBAL: Jemalloc = Jemalloc;

const JEMALLOC_METRICS_POLLING_INTERVAL: Duration = Duration::from_secs(1);

pub async fn jemalloc_metrics_loop() -> tikv_jemalloc_ctl::Result<()> {
    let memory_metrics = MEMORY_METRICS.clone();

    // Obtain a MIB for the `epoch`, `stats.active`, `stats.allocated`, and `stats.resident` keys:
    let epoch_mib = tikv_jemalloc_ctl::epoch::mib()?;
    let active_mib = tikv_jemalloc_ctl::stats::active::mib()?;
    let allocated_mib = tikv_jemalloc_ctl::stats::allocated::mib()?;
    let resident_mib = tikv_jemalloc_ctl::stats::resident::mib()?;

    let mut poll_interval = tokio::time::interval(JEMALLOC_METRICS_POLLING_INTERVAL);

    loop {
        poll_interval.tick().await;

        // Many statistics are cached and only updated when the epoch is advanced:
        epoch_mib.advance()?;

        // Read statistics using MIB keys:
        let active = active_mib.read()?;
        memory_metrics.active_bytes.set(active as i64);

        let allocated = allocated_mib.read()?;
        memory_metrics.allocated_bytes.set(allocated as i64);

        let resident = resident_mib.read()?;
        memory_metrics.resident_bytes.set(resident as i64);
    }
}

pub fn start_jemalloc_metrics_loop() {
    tokio::task::spawn(async {
        if let Err(error) = jemalloc_metrics_loop().await {
            error!(%error, "failed to collect metrics from jemalloc");
        }
    });
}


================================================
FILE: quickwit/quickwit-cli/src/lib.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#![deny(clippy::disallowed_methods)]

use std::collections::HashSet;
use std::str::FromStr;
use std::sync::OnceLock;

use anyhow::Context;
use clap::{Arg, ArgMatches, arg};
use dialoguer::Confirm;
use dialoguer::theme::ColorfulTheme;
use quickwit_common::runtimes::RuntimesConfig;
use quickwit_common::uri::Uri;
use quickwit_config::service::QuickwitService;
use quickwit_config::{
    ConfigFormat, DEFAULT_QW_CONFIG_PATH, MetastoreConfigs, NodeConfig, SourceConfig,
    StorageConfigs,
};
use quickwit_indexing::check_source_connectivity;
use quickwit_metastore::{IndexMetadataResponseExt, MetastoreResolver};
use quickwit_proto::metastore::{IndexMetadataRequest, MetastoreService, MetastoreServiceClient};
use quickwit_rest_client::models::Timeout;
use quickwit_rest_client::rest_client::{DEFAULT_BASE_URL, QuickwitClient, QuickwitClientBuilder};
use quickwit_storage::{StorageResolver, load_file};
use reqwest::Url;
use tabled::settings::object::Rows;
use tabled::settings::panel::Header;
use tabled::settings::{Alignment, Modify, Style};
use tabled::{Table, Tabled};
use tracing::info;

use crate::checklist::run_checklist;

pub mod checklist;
pub mod cli;
pub mod index;
#[cfg(feature = "jemalloc")]
pub mod jemalloc;
pub mod logger;
pub mod metrics;
pub mod service;
pub mod source;
pub mod split;
pub mod stats;
pub mod tool;

/// Throughput calculation window size.
const THROUGHPUT_WINDOW_SIZE: usize = 5;

pub const QW_ENABLE_TOKIO_CONSOLE_ENV_KEY: &str = "QW_ENABLE_TOKIO_CONSOLE";

pub const QW_ENABLE_OPENTELEMETRY_OTLP_EXPORTER_ENV_KEY: &str =
    "QW_ENABLE_OPENTELEMETRY_OTLP_EXPORTER";

fn config_cli_arg() -> Arg {
    Arg::new("config")
        .long("config")
        .help("Config file location")
        .env("QW_CONFIG")
        .default_value(DEFAULT_QW_CONFIG_PATH)
        .global(true)
        .display_order(1)
}

fn client_args() -> Vec<Arg> {
    vec![
        arg!(--"endpoint" <QW_CLUSTER_ENDPOINT> "Quickwit cluster endpoint.")
            .default_value("http://127.0.0.1:7280")
            .env("QW_CLUSTER_ENDPOINT")
            .required(false)
            .display_order(1)
            .global(true),
        Arg::new("timeout")
            .long("timeout")
            .help("Duration of the timeout.")
            .required(false)
            .global(true)
            .display_order(2),
        Arg::new("connect-timeout")
            .long("connect-timeout")
            .help("Duration of the connect timeout.")
            .required(false)
            .global(true)
            .display_order(3),
        Arg::new("retries")
            .long("retries")
            .help(
                "Maximum number of retries for transient errors. Default value is 0. The total \
                 number of attempts will be `1 + RETRIES`.",
            )
            .required(false)
            .global(true)
            .default_value("0")
            .display_order(4),
    ]
}

pub fn install_default_crypto_ring_provider() {
    static CALL_ONLY_ONCE: OnceLock<Result<(), ()>> = OnceLock::new();
    CALL_ONLY_ONCE
        .get_or_init(|| {
            rustls::crypto::ring::default_provider()
                .install_default()
                .map_err(|_| ())
        })
        .expect("rustls crypto ring default provider installation should not fail");
}

#[derive(Debug, Eq, PartialEq)]
pub struct ClientArgs {
    pub cluster_endpoint: Url,
    pub connect_timeout: Option<Timeout>,
    pub timeout: Option<Timeout>,
    pub commit_timeout: Option<Timeout>,
    pub num_retries: u32,
}

impl Default for ClientArgs {
    fn default() -> Self {
        Self {
            cluster_endpoint: Url::parse(DEFAULT_BASE_URL).unwrap(),
            connect_timeout: None,
            timeout: None,
            commit_timeout: None,
            num_retries: 0,
        }
    }
}

impl ClientArgs {
    pub fn client_builder(self) -> QuickwitClientBuilder {
        let mut builder = QuickwitClientBuilder::new(self.cluster_endpoint);
        if let Some(connect_timeout) = self.connect_timeout {
            builder = builder.connect_timeout(connect_timeout);
        }
        if let Some(timeout) = self.timeout {
            builder = builder.timeout(timeout);
            builder = builder.search_timeout(timeout);
            builder = builder.ingest_timeout(timeout);
        }
        if let Some(commit_timeout) = self.commit_timeout {
            builder = builder.commit_timeout(commit_timeout);
        }
        builder.num_retries(self.num_retries)
    }

    pub fn client(self) -> QuickwitClient {
        self.client_builder().build()
    }

    pub fn parse_for_ingest(matches: &mut ArgMatches) -> anyhow::Result<Self> {
        Self::parse_inner(matches, true)
    }

    pub fn parse(matches: &mut ArgMatches) -> anyhow::Result<Self> {
        Self::parse_inner(matches, false)
    }

    fn parse_inner(matches: &mut ArgMatches, process_ingest: bool) -> anyhow::Result<Self> {
        let cluster_endpoint = matches
            .remove_one::<String>("endpoint")
            .map(|endpoint_str| Url::from_str(&endpoint_str))
            .expect("`endpoint` should be a required arg")?;
        let connect_timeout =
            if let Some(duration) = matches.remove_one::<String>("connect-timeout") {
                Some(parse_duration_or_none(&duration)?)
            } else {
                None
            };
        let timeout = if let Some(duration) = matches.remove_one::<String>("timeout") {
            Some(parse_duration_or_none(&duration)?)
        } else {
            None
        };
        let commit_timeout = if process_ingest {
            if let Some(duration) = matches.remove_one::<String>("commit-timeout") {
                Some(parse_duration_or_none(&duration)?)
            } else {
                None
            }
        } else {
            None
        };
        let num_retries = matches
            .remove_one::<String>("retries")
            .map(|retries| retries.parse::<u32>())
            .expect("`retries` should have a default value")?;
        Ok(Self {
            cluster_endpoint,
            connect_timeout,
            timeout,
            commit_timeout,
            num_retries,
        })
    }
}

pub fn parse_duration_or_none(duration_with_unit_str: &str) -> anyhow::Result<Timeout> {
    if duration_with_unit_str == "none" {
        Ok(Timeout::none())
    } else {
        humantime::parse_duration(duration_with_unit_str)
            .map(Timeout::new)
            .context("failed to parse timeout")
    }
}

pub fn start_actor_runtimes(
    runtimes_config: RuntimesConfig,
    services: &HashSet<QuickwitService>,
) -> anyhow::Result<()> {
    if services.contains(&QuickwitService::Indexer)
        || services.contains(&QuickwitService::Janitor)
        || services.contains(&QuickwitService::ControlPlane)
    {
        quickwit_common::runtimes::initialize_runtimes(runtimes_config)
            .context("failed to start actor runtimes")?;
    }
    Ok(())
}

/// Loads a node config located at `config_uri` with the default storage configuration.
async fn load_node_config(config_uri: &Uri) -> anyhow::Result<NodeConfig> {
    let config_content = load_file(&StorageResolver::unconfigured(), config_uri)
        .await
        .context("failed to load node config")?;
    let config_format = ConfigFormat::sniff_from_uri(config_uri)?;
    let config = NodeConfig::load(config_format, config_content.as_slice())
        .await
        .with_context(|| format!("failed to parse node config `{config_uri}`"))?;
    info!(config_uri=%config_uri, config=?config, "loaded node config");
    Ok(config)
}

fn get_resolvers(
    storage_configs: &StorageConfigs,
    metastore_configs: &MetastoreConfigs,
) -> (StorageResolver, MetastoreResolver) {
    // The CLI tests rely on the unconfigured singleton resolvers, so it's better to return them if
    // the storage and metastore configs are not set.
    if storage_configs.is_empty() && metastore_configs.is_empty() {
        return (
            StorageResolver::unconfigured(),
            MetastoreResolver::unconfigured(),
        );
    }
    let storage_resolver = StorageResolver::configured(storage_configs);
    let metastore_resolver =
        MetastoreResolver::configured(storage_resolver.clone(), metastore_configs);
    (storage_resolver, metastore_resolver)
}

/// Runs connectivity checks for a given `metastore_uri` and `index_id`.
/// Optionally, it takes a `SourceConfig` that will be checked instead
/// of the index's sources.
pub async fn run_index_checklist(
    metastore: &mut MetastoreServiceClient,
    storage_resolver: &StorageResolver,
    index_id: &str,
    source_config_opt: Option<&SourceConfig>,
) -> anyhow::Result<()> {
    let mut checks: Vec<(&str, anyhow::Result<()>)> = Vec::new();
    for metastore_endpoint in metastore.endpoints() {
        // If it's not a database, the metastore is file-backed. To display a nicer message to the
        // user, we check the metastore storage connectivity before the mestastore check
        // connectivity which will check the storage anyway.
        if !metastore_endpoint.protocol().is_database() {
            let metastore_storage = storage_resolver.resolve(&metastore_endpoint).await?;
            checks.push((
                "metastore storage",
                metastore_storage.check_connectivity().await,
            ));
        }
    }
    checks.push(("metastore", metastore.check_connectivity().await));
    let index_metadata = metastore
        .index_metadata(IndexMetadataRequest::for_index_id(index_id.to_string()))
        .await?
        .deserialize_index_metadata()?;
    let index_storage = storage_resolver.resolve(index_metadata.index_uri()).await?;
    checks.push(("index storage", index_storage.check_connectivity().await));

    if let Some(source_config) = source_config_opt {
        checks.push((
            source_config.source_id.as_str(),
            check_source_connectivity(storage_resolver, source_config).await,
        ));
    } else {
        for source_config in index_metadata.sources.values() {
            checks.push((
                source_config.source_id.as_str(),
                check_source_connectivity(storage_resolver, source_config).await,
            ));
        }
    }
    run_checklist(checks)?;
    Ok(())
}

/// Constructs a table for display.
pub fn make_table<T: Tabled>(
    header: &str,
    rows: impl IntoIterator<Item = T>,
    transpose: bool,
) -> Table {
    let mut table = if transpose {
        let index_builder = Table::builder(rows).index();
        index_builder.column(0).transpose().build()
    } else {
        Table::builder(rows).build()
    };

    table
        .with(Modify::new(Rows::new(1..)).with(Alignment::left()))
        .with(Style::ascii())
        .with(Header::new(header))
        .with(Modify::new(Rows::new(0..1)).with(Alignment::center()));

    table
}

/// Prompts user for confirmation.
fn prompt_confirmation(prompt: &str, default: bool) -> bool {
    if Confirm::with_theme(&ColorfulTheme::default())
        .with_prompt(prompt)
        .default(default)
        .interact()
        .unwrap()
    {
        true
    } else {
        println!("Aborting.");
        false
    }
}

pub mod busy_detector {
    use std::sync::atomic::{AtomicBool, AtomicU64, Ordering};
    use std::time::Instant;

    use once_cell::sync::Lazy;
    use tracing::debug;

    use crate::metrics::CLI_METRICS;

    // we need that time reference to use an atomic and not a mutex for LAST_UNPARK
    static TIME_REF: Lazy<Instant> = Lazy::new(Instant::now);
    static ENABLED: AtomicBool = AtomicBool::new(false);

    const ALLOWED_DELAY_MICROS: u64 = 5000;
    const DEBUG_SUPPRESSION_MICROS: u64 = 30_000_000;

    // LAST_UNPARK_TIMESTAMP and NEXT_DEBUG_TIMESTAMP are semantically micro-second
    // precision timestamps, but we use atomics to allow accessing them without locks.
    thread_local!(static LAST_UNPARK_TIMESTAMP: AtomicU64 = const { AtomicU64::new(0) });
    static NEXT_DEBUG_TIMESTAMP: AtomicU64 = AtomicU64::new(0);
    static SUPPRESSED_DEBUG_COUNT: AtomicU64 = AtomicU64::new(0);

    pub fn set_enabled(enabled: bool) {
        ENABLED.store(enabled, Ordering::Relaxed);
    }

    pub fn thread_unpark() {
        LAST_UNPARK_TIMESTAMP.with(|time| {
            let now = Instant::now()
                .checked_duration_since(*TIME_REF)
                .unwrap_or_default();
            time.store(now.as_micros() as u64, Ordering::Relaxed);
        })
    }

    pub fn thread_park() {
        if !ENABLED.load(Ordering::Relaxed) {
            return;
        }

        LAST_UNPARK_TIMESTAMP.with(|time| {
            let now = Instant::now()
                .checked_duration_since(*TIME_REF)
                .unwrap_or_default();
            let now = now.as_micros() as u64;
            let delta = now - time.load(Ordering::Relaxed);
            CLI_METRICS
                .thread_unpark_duration_microseconds
                .with_label_values([])
                .observe(delta as f64);
            if delta > ALLOWED_DELAY_MICROS {
                emit_debug(delta, now);
            }
        })
    }

    fn emit_debug(delta: u64, now: u64) {
        if NEXT_DEBUG_TIMESTAMP
            .fetch_update(Ordering::Relaxed, Ordering::Relaxed, |next_debug| {
                if next_debug < now {
                    Some(now + DEBUG_SUPPRESSION_MICROS)
                } else {
                    None
                }
            })
            .is_err()
        {
            // a debug was emitted recently, don't emit log for this one
            SUPPRESSED_DEBUG_COUNT.fetch_add(1, Ordering::Relaxed);
            return;
        }

        let suppressed = SUPPRESSED_DEBUG_COUNT.swap(0, Ordering::Relaxed);
        if suppressed == 0 {
            debug!("thread wasn't parked for {delta}µs, is the runtime too busy?");
        } else {
            debug!(
                "thread wasn't parked for {delta}µs, is the runtime too busy? ({suppressed} \
                 similar messages suppressed)"
            );
        }
    }
}

#[cfg(test)]
mod tests {
    use quickwit_config::{S3StorageConfig, StorageConfigs};
    use quickwit_rest_client::models::Timeout;

    use super::*;
    use crate::parse_duration_or_none;

    #[test]
    fn test_parse_duration_or_none() -> anyhow::Result<()> {
        assert_eq!(parse_duration_or_none("1s")?, Timeout::from_secs(1));
        assert_eq!(parse_duration_or_none("2m")?, Timeout::from_mins(2));
        assert_eq!(parse_duration_or_none("3h")?, Timeout::from_hours(3));
        assert_eq!(parse_duration_or_none("4d")?, Timeout::from_days(4));
        assert_eq!(parse_duration_or_none("none")?, Timeout::none());
        assert!(parse_duration_or_none("something").is_err());
        Ok(())
    }

    #[test]
    fn test_get_resolvers() {
        let s3_storage_config = S3StorageConfig {
            force_path_style_access: true,
            ..Default::default()
        };
        let storage_configs = StorageConfigs::new(vec![s3_storage_config.into()]);
        let metastore_configs = MetastoreConfigs::default();
        let (_storage_resolver, _metastore_resolver) =
            get_resolvers(&storage_configs, &metastore_configs);
    }
}


================================================
FILE: quickwit/quickwit-cli/src/logger.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::sync::Arc;
use std::{env, fmt};

use anyhow::Context;
use opentelemetry::trace::TracerProvider;
use opentelemetry::{KeyValue, global};
use opentelemetry_appender_tracing::layer::OpenTelemetryTracingBridge;
use opentelemetry_sdk::logs::SdkLoggerProvider;
use opentelemetry_sdk::propagation::TraceContextPropagator;
use opentelemetry_sdk::trace::{BatchConfigBuilder, SdkTracerProvider};
use opentelemetry_sdk::{Resource, trace};
use quickwit_common::{get_bool_from_env, get_from_env_opt};
use quickwit_serve::{BuildInfo, EnvFilterReloadFn};
use time::format_description::BorrowedFormatItem;
use tracing::{Event, Level, Subscriber};
use tracing_subscriber::EnvFilter;
use tracing_subscriber::field::RecordFields;
use tracing_subscriber::fmt::FmtContext;
use tracing_subscriber::fmt::format::{
    DefaultFields, Format, FormatEvent, FormatFields, Full, Json, JsonFields, Writer,
};
use tracing_subscriber::fmt::time::UtcTime;
use tracing_subscriber::layer::SubscriberExt;
use tracing_subscriber::prelude::*;
use tracing_subscriber::registry::LookupSpan;

use crate::QW_ENABLE_OPENTELEMETRY_OTLP_EXPORTER_ENV_KEY;
#[cfg(feature = "tokio-console")]
use crate::QW_ENABLE_TOKIO_CONSOLE_ENV_KEY;

/// Load the default logging filter from the environment. The filter can later
/// be updated using the result callback of [setup_logging_and_tracing].
fn startup_env_filter(level: Level) -> anyhow::Result<EnvFilter> {
    let env_filter = env::var("RUST_LOG")
        .map(|_| EnvFilter::from_default_env())
        .or_else(|_| EnvFilter::try_new(format!("quickwit={level},tantivy=WARN")))
        .context("failed to set up tracing env filter")?;
    Ok(env_filter)
}

type ReloadLayer = tracing_subscriber::reload::Layer<EnvFilter, tracing_subscriber::Registry>;

pub fn setup_logging_and_tracing(
    level: Level,
    ansi_colors: bool,
    build_info: &BuildInfo,
) -> anyhow::Result<(
    EnvFilterReloadFn,
    Option<(SdkTracerProvider, SdkLoggerProvider)>,
)> {
    #[cfg(feature = "tokio-console")]
    {
        if get_bool_from_env(QW_ENABLE_TOKIO_CONSOLE_ENV_KEY, false) {
            console_subscriber::init();
            return Ok((quickwit_serve::do_nothing_env_filter_reload_fn(), None));
        }
    }
    global::set_text_map_propagator(TraceContextPropagator::new());

    let event_format = EventFormat::get_from_env();
    let fmt_fields = event_format.format_fields();
    let registry = tracing_subscriber::registry();

    let (reloadable_env_filter, reload_handle) = ReloadLayer::new(startup_env_filter(level)?);

    #[cfg(not(feature = "jemalloc-profiled"))]
    let registry = registry.with(reloadable_env_filter).with(
        tracing_subscriber::fmt::layer()
            .event_format(event_format)
            .fmt_fields(fmt_fields)
            .with_ansi(ansi_colors),
    );

    #[cfg(feature = "jemalloc-profiled")]
    let registry = jemalloc_profiled::configure_registry(
        registry,
        event_format,
        fmt_fields,
        ansi_colors,
        level,
        reloadable_env_filter,
    )?;

    // Note on disabling ANSI characters: setting the ansi boolean on event format is insufficient.
    // It is thus set on layers, see https://github.com/tokio-rs/tracing/issues/1817
    let provider_opt = if get_bool_from_env(QW_ENABLE_OPENTELEMETRY_OTLP_EXPORTER_ENV_KEY, false) {
        let span_exporter = opentelemetry_otlp::SpanExporter::builder()
            .with_tonic()
            .build()
            .context("failed to initialize OpenTelemetry OTLP exporter")?;
        let span_processor = trace::BatchSpanProcessor::builder(span_exporter)
            .with_batch_config(
                BatchConfigBuilder::default()
                    // Quickwit can generate a lot of spans, especially in debug mode, and the
                    // default queue size of 2048 is too small.
                    .with_max_queue_size(32_768)
                    .build(),
            )
            .build();

        let resource = Resource::builder()
            .with_service_name("quickwit")
            .with_attribute(KeyValue::new("service.version", build_info.version.clone()))
            .build();

        let logs_exporter = opentelemetry_otlp::LogExporter::builder()
            .with_tonic()
            .build()
            .context("failed to initialize OpenTelemetry OTLP logs")?;

        let logger_provider = SdkLoggerProvider::builder()
            .with_resource(resource.clone())
            .with_batch_exporter(logs_exporter)
            .build();

        let tracing_provider = opentelemetry_sdk::trace::SdkTracerProvider::builder()
            .with_span_processor(span_processor)
            .with_resource(resource)
            .build();

        let tracer = tracing_provider.tracer("quickwit");
        let telemetry_layer = tracing_opentelemetry::layer().with_tracer(tracer);

        // Bridge between tracing logs and otel tracing events
        let logs_otel_layer = OpenTelemetryTracingBridge::new(&logger_provider);

        registry
            .with(telemetry_layer)
            .with(logs_otel_layer)
            .try_init()
            .context("failed to register tracing subscriber")?;
        Some((tracing_provider, logger_provider))
    } else {
        registry
            .try_init()
            .context("failed to register tracing subscriber")?;
        None
    };

    Ok((
        Arc::new(move |env_filter_def: &str| {
            let new_env_filter = EnvFilter::try_new(env_filter_def)?;
            reload_handle.reload(new_env_filter)?;
            Ok(())
        }),
        provider_opt,
    ))
}

/// We do not rely on the RFC3339 implementation, because it has a nanosecond precision.
/// See discussion here: https://github.com/time-rs/time/discussions/418
fn time_formatter() -> UtcTime<Vec<BorrowedFormatItem<'static>>> {
    let time_format = time::format_description::parse(
        "[year]-[month]-[day]T[hour]:[minute]:[second].[subsecond digits:3]Z",
    )
    .expect("time format description should be valid");
    UtcTime::new(time_format)
}

enum EventFormat<'a> {
    Full(Format<Full, UtcTime<Vec<BorrowedFormatItem<'a>>>>),
    Json(Format<Json>),
}

impl EventFormat<'_> {
    /// Gets the log format from the environment variable `QW_LOG_FORMAT`. Returns a JSON
    /// formatter if the variable is set to `json`, otherwise returns a full formatter.
    fn get_from_env() -> Self {
        if get_from_env_opt::<String>("QW_LOG_FORMAT", false)
            .map(|log_format| log_format.eq_ignore_ascii_case("json"))
            .unwrap_or(false)
        {
            let json_format = tracing_subscriber::fmt::format().json();
            EventFormat::Json(json_format)
        } else {
            let full_format = tracing_subscriber::fmt::format()
                .with_target(true)
                .with_timer(time_formatter());

            EventFormat::Full(full_format)
        }
    }

    fn format_fields(&self) -> FieldFormat {
        match self {
            EventFormat::Full(_) => FieldFormat::Default(DefaultFields::new()),
            EventFormat::Json(_) => FieldFormat::Json(JsonFields::new()),
        }
    }
}

impl<S, N> FormatEvent<S, N> for EventFormat<'_>
where
    S: Subscriber + for<'a> LookupSpan<'a>,
    N: for<'a> FormatFields<'a> + 'static,
{
    fn format_event(
        &self,
        ctx: &FmtContext<'_, S, N>,
        writer: Writer<'_>,
        event: &Event<'_>,
    ) -> fmt::Result {
        match self {
            EventFormat::Full(format) => format.format_event(ctx, writer, event),
            EventFormat::Json(format) => format.format_event(ctx, writer, event),
        }
    }
}

enum FieldFormat {
    Default(DefaultFields),
    Json(JsonFields),
}

impl FormatFields<'_> for FieldFormat {
    fn format_fields<R: RecordFields>(&self, writer: Writer<'_>, fields: R) -> fmt::Result {
        match self {
            FieldFormat::Default(default_fields) => default_fields.format_fields(writer, fields),
            FieldFormat::Json(json_fields) => json_fields.format_fields(writer, fields),
        }
    }
}

/// Logger configurations specific to the jemalloc profiler.
///
/// A custom event formatter is used to print the backtrace of the
/// profiling events.
#[cfg(feature = "jemalloc-profiled")]
pub(super) mod jemalloc_profiled {
    use std::fmt;

    use quickwit_common::jemalloc_profiled::JEMALLOC_PROFILER_TARGET;
    use time::format_description::BorrowedFormatItem;
    use tracing::{Event, Level, Metadata, Subscriber};
    use tracing_subscriber::Layer;
    use tracing_subscriber::filter::filter_fn;
    use tracing_subscriber::fmt::format::{DefaultFields, Writer};
    use tracing_subscriber::fmt::time::{FormatTime, UtcTime};
    use tracing_subscriber::fmt::{FmtContext, FormatEvent, FormatFields, FormattedFields};
    use tracing_subscriber::layer::SubscriberExt;
    use tracing_subscriber::registry::LookupSpan;

    use super::{EventFormat, FieldFormat, startup_env_filter, time_formatter};
    use crate::logger::ReloadLayer;

    /// An event formatter specific to the memory profiler output.
    ///
    /// Also displays a backtrace after the spans and fields of the tracing
    /// event (into separate lines).
    struct ProfilingFormat {
        time_formatter: UtcTime<Vec<BorrowedFormatItem<'static>>>,
    }

    impl Default for ProfilingFormat {
        fn default() -> Self {
            Self {
                time_formatter: time_formatter(),
            }
        }
    }

    impl<S, N> FormatEvent<S, N> for ProfilingFormat
    where
        S: Subscriber + for<'a> LookupSpan<'a>,
        N: for<'a> FormatFields<'a> + 'static,
    {
        fn format_event(
            &self,
            ctx: &FmtContext<'_, S, N>,
            mut writer: Writer<'_>,
            event: &Event<'_>,
        ) -> fmt::Result {
            self.time_formatter.format_time(&mut writer)?;
            write!(writer, " {JEMALLOC_PROFILER_TARGET} ")?;
            if let Some(scope) = ctx.event_scope() {
                let mut seen = false;

                for span in scope.from_root() {
                    write!(writer, "{}", span.metadata().name())?;
                    seen = true;

                    let ext = span.extensions();
                    if let Some(fields) = &ext.get::<FormattedFields<N>>()
                        && !fields.is_empty()
                    {
                        write!(writer, "{{{fields}}}:")?;
                    }
                }

                if seen {
                    writer.write_char(' ')?;
                }
            };

            ctx.format_fields(writer.by_ref(), event)?;
            writeln!(writer)?;

            // Print a backtrace to help identify the callsite
            backtrace::trace(|frame| {
                backtrace::resolve_frame(frame, |symbol| {
                    if let Some(symbole_name) = symbol.name() {
                        let _ = writeln!(writer, "{symbole_name}");
                    } else {
                        let _ = writeln!(writer, "symb failed");
                    }
                });
                true
            });
            Ok(())
        }
    }

    fn profiler_tracing_filter(metadata: &Metadata) -> bool {
        metadata.is_span() || (metadata.is_event() && metadata.target() == JEMALLOC_PROFILER_TARGET)
    }

    /// Configures the regular logging layer and a specific layer that gathers
    /// extra debug information for the jemalloc profiler.
    ///
    /// The the jemalloc profiler formatter disables the env filter reloading
    /// because the [tracing_subscriber::reload::Layer] seems to overwrite the
    /// filter configured by [profiler_tracing_filter()] even though it is
    /// applied to a separate layer.
    pub(super) fn configure_registry<S>(
        registry: S,
        event_format: EventFormat<'static>,
        fmt_fields: FieldFormat,
        ansi_colors: bool,
        level: Level,
        _reloadable_env_filter: ReloadLayer,
    ) -> anyhow::Result<impl Subscriber + for<'span> LookupSpan<'span>>
    where
        S: Subscriber + for<'span> LookupSpan<'span>,
    {
        Ok(registry
            .with(
                tracing_subscriber::fmt::layer()
                    .event_format(ProfilingFormat::default())
                    .fmt_fields(DefaultFields::new())
                    .with_ansi(ansi_colors)
                    .with_filter(filter_fn(profiler_tracing_filter)),
            )
            .with(
                tracing_subscriber::fmt::layer()
                    .event_format(event_format)
                    .fmt_fields(fmt_fields)
                    .with_ansi(ansi_colors)
                    .with_filter(startup_env_filter(level)?),
            ))
    }
}


================================================
FILE: quickwit/quickwit-cli/src/main.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#![recursion_limit = "256"]

use std::collections::BTreeMap;

use anyhow::Context;
use colored::Colorize;
use quickwit_cli::checklist::RED_COLOR;
use quickwit_cli::cli::{CliCommand, build_cli};
#[cfg(feature = "jemalloc")]
use quickwit_cli::jemalloc::start_jemalloc_metrics_loop;
use quickwit_cli::logger::setup_logging_and_tracing;
use quickwit_cli::{busy_detector, install_default_crypto_ring_provider};
use quickwit_common::runtimes::scrape_tokio_runtime_metrics;
use quickwit_serve::BuildInfo;
use tracing::error;

/// The main tokio runtime takes num_cores / 3 threads by default, and can be overridden by the
/// QW_RUNTIME_NUM_THREADS environment variable.
fn get_main_runtime_num_threads() -> usize {
    let default_num_runtime_threads: usize = quickwit_common::num_cpus().div_ceil(3);
    quickwit_common::get_from_env(
        "QW_TOKIO_RUNTIME_NUM_THREADS",
        default_num_runtime_threads,
        false,
    )
}

fn main() -> anyhow::Result<()> {
    let main_runtime_num_threads: usize = get_main_runtime_num_threads();
    let rt = tokio::runtime::Builder::new_multi_thread()
        .enable_all()
        .on_thread_unpark(busy_detector::thread_unpark)
        .on_thread_park(busy_detector::thread_park)
        .thread_name("main_runtime_thread")
        .worker_threads(main_runtime_num_threads)
        .build()
        .context("failed to start main Tokio runtime")?;

    scrape_tokio_runtime_metrics(rt.handle(), "main");

    rt.block_on(main_impl())
}

fn register_build_info_metric() {
    use itertools::Itertools;
    let build_info = BuildInfo::get();
    let mut build_kvs = BTreeMap::default();
    build_kvs.insert("build_date", build_info.build_date.to_string());
    build_kvs.insert("commit_hash", build_info.commit_short_hash.to_string());
    build_kvs.insert("version", build_info.version.to_string());
    if !build_info.commit_tags.is_empty() {
        let tags_str = build_info.commit_tags.iter().join(",");
        build_kvs.insert("commit_tags", tags_str);
    }
    build_kvs.insert("target", build_info.build_target.to_string());
    quickwit_common::metrics::register_info("build_info", "Quickwit's build info", build_kvs);
}

async fn main_impl() -> anyhow::Result<()> {
    #[cfg(feature = "openssl-support")]
    unsafe {
        openssl_probe::init_openssl_env_vars()
    };
    register_build_info_metric();

    let about_text = about_text();
    let version_text = BuildInfo::get_version_text();

    let app = build_cli().about(about_text).version(version_text);
    let matches = app.get_matches();
    let ansi_colors = !matches.get_flag("no-color");

    let command = match CliCommand::parse_cli_args(matches) {
        Ok(command) => command,
        Err(error) => {
            eprintln!("failed to parse command line arguments: {error:?}");
            std::process::exit(1);
        }
    };

    install_default_crypto_ring_provider();

    #[cfg(feature = "jemalloc")]
    start_jemalloc_metrics_loop();

    let build_info = BuildInfo::get();
    let (env_filter_reload_fn, tracer_provider_opt) =
        setup_logging_and_tracing(command.default_log_level(), ansi_colors, build_info)?;

    let return_code: i32 = if let Err(command_error) = command.execute(env_filter_reload_fn).await {
        error!(error=%command_error, "command failed");
        eprintln!(
            "{} command failed: {:?}\n",
            "✘".color(RED_COLOR),
            command_error
        );
        1
    } else {
        0
    };

    if let Some((trace_provider, logs_provider)) = tracer_provider_opt {
        trace_provider
            .shutdown()
            .context("failed to shutdown OpenTelemetry tracer provider")?;
        logs_provider
            .shutdown()
            .context("failed to shutdown OpenTelemetry logs provider")?;
    }

    std::process::exit(return_code)
}

/// Return the about text with telemetry info.
fn about_text() -> String {
    let mut about_text = String::from(
        "Sub-second search & analytics engine on cloud storage.\n  Find more information at https://quickwit.io/docs\n\n",
    );
    if !quickwit_telemetry::is_telemetry_disabled() {
        about_text += "Telemetry: enabled";
    }
    about_text
}

#[cfg(test)]
mod tests {
    use std::str::FromStr;
    use std::time::Duration;

    use bytesize::ByteSize;
    use quickwit_cli::ClientArgs;
    use quickwit_cli::cli::{CliCommand, build_cli};
    use quickwit_cli::index::{
        ClearIndexArgs, CreateIndexArgs, DeleteIndexArgs, DescribeIndexArgs, IndexCliCommand,
        IngestDocsArgs, SearchIndexArgs,
    };
    use quickwit_cli::split::{DescribeSplitArgs, SplitCliCommand};
    use quickwit_cli::tool::{
        ExtractSplitArgs, GarbageCollectIndexArgs, LocalIngestDocsArgs, LocalSearchArgs, MergeArgs,
        ToolCliCommand,
    };
    use quickwit_common::uri::Uri;
    use quickwit_config::SourceInputFormat;
    use quickwit_rest_client::models::Timeout;
    use quickwit_rest_client::rest_client::CommitType;
    use reqwest::Url;

    #[test]
    fn test_parse_clear_args() {
        let app = build_cli().no_binary_name(true);
        let matches = app
            .try_get_matches_from(["index", "clear", "--index", "wikipedia"])
            .unwrap();
        let command = CliCommand::parse_cli_args(matches).unwrap();
        let expected_cmd = CliCommand::Index(IndexCliCommand::Clear(ClearIndexArgs {
            client_args: ClientArgs::default(),
            index_id: "wikipedia".to_string(),
            assume_yes: false,
        }));
        assert_eq!(command, expected_cmd);

        let app = build_cli().no_binary_name(true);
        let matches = app
            .try_get_matches_from(["index", "clear", "--index", "wikipedia", "--yes"])
            .unwrap();
        let command = CliCommand::parse_cli_args(matches).unwrap();
        let expected_cmd = CliCommand::Index(IndexCliCommand::Clear(ClearIndexArgs {
            client_args: ClientArgs::default(),
            index_id: "wikipedia".to_string(),
            assume_yes: true,
        }));
        assert_eq!(command, expected_cmd);
    }

    #[test]
    fn test_parse_create_args() -> anyhow::Result<()> {
        let app = build_cli().no_binary_name(true);
        let _ = app
            .try_get_matches_from(["new", "--index-uri", "file:///indexes/wikipedia"])
            .unwrap_err();

        let app = build_cli().no_binary_name(true);
        let matches =
            app.try_get_matches_from(["index", "create", "--index-config", "index-conf.yaml"])?;
        let command = CliCommand::parse_cli_args(matches)?;
        let expected_index_config_uri = Uri::from_str(&format!(
            "file://{}/index-conf.yaml",
            std::env::current_dir().unwrap().display()
        ))
        .unwrap();
        let expected_cmd = CliCommand::Index(IndexCliCommand::Create(CreateIndexArgs {
            client_args: ClientArgs::default(),
            index_config_uri: expected_index_config_uri.clone(),
            overwrite: false,
            assume_yes: false,
        }));
        assert_eq!(command, expected_cmd);

        let app = build_cli().no_binary_name(true);
        let matches = app.try_get_matches_from([
            "index",
            "create",
            "--index-config",
            "index-conf.yaml",
            "--overwrite",
        ])?;
        let command = CliCommand::parse_cli_args(matches)?;
        let expected_cmd = CliCommand::Index(IndexCliCommand::Create(CreateIndexArgs {
            client_args: ClientArgs::default(),
            index_config_uri: expected_index_config_uri,
            overwrite: true,
            assume_yes: false,
        }));
        assert_eq!(command, expected_cmd);

        Ok(())
    }

    #[test]
    fn test_parse_ingest_args() -> anyhow::Result<()> {
        let app = build_cli().no_binary_name(true);
        let matches = app.try_get_matches_from([
            "index",
            "ingest",
            "--index",
            "wikipedia",
            "--endpoint",
            "http://127.0.0.1:8000",
            "--retries",
            "2",
        ])?;
        let command = CliCommand::parse_cli_args(matches)?;
        assert!(matches!(
            command,
            CliCommand::Index(IndexCliCommand::Ingest(
                IngestDocsArgs {
                    client_args,
                    index_id,
                    input_path_opt: None,
                    batch_size_limit_opt: None,
                    commit_type: CommitType::Auto,
                    detailed_response: false,
                })) if &index_id == "wikipedia"
                && client_args.timeout.is_none()
                && client_args.connect_timeout.is_none()
                && client_args.commit_timeout.is_none()
                && client_args.cluster_endpoint == Url::from_str("http://127.0.0.1:8000").unwrap()
                && client_args.num_retries == 2
        ));

        let app = build_cli().no_binary_name(true);
        let matches = app.try_get_matches_from([
            "index",
            "ingest",
            "--index",
            "wikipedia",
            "--detailed-response",
            "--batch-size-limit",
            "8MB",
            "--force",
        ])?;
        let command = CliCommand::parse_cli_args(matches)?;
        assert!(matches!(
            command,
            CliCommand::Index(IndexCliCommand::Ingest(
                IngestDocsArgs {
                    client_args,
                    index_id,
                    input_path_opt: None,
                    batch_size_limit_opt: Some(batch_size_limit),
                    commit_type: CommitType::Force,
                    detailed_response: true,
                })) if &index_id == "wikipedia"
                        && client_args.cluster_endpoint == Url::from_str("http://127.0.0.1:7280").unwrap()
                        && client_args.timeout.is_none()
                        && client_args.connect_timeout.is_none()
                        && client_args.commit_timeout.is_none()
                        && client_args.num_retries == 0
                        && batch_size_limit == ByteSize::mb(8)
        ));

        let app = build_cli().no_binary_name(true);
        let matches = app.try_get_matches_from([
            "index",
            "ingest",
            "--index",
            "wikipedia",
            "--batch-size-limit",
            "4KB",
            "--wait",
        ])?;
        let command = CliCommand::parse_cli_args(matches)?;
        assert!(matches!(
            command,
            CliCommand::Index(IndexCliCommand::Ingest(
                IngestDocsArgs {
                    client_args,
                    index_id,
                    input_path_opt: None,
                    batch_size_limit_opt: Some(batch_size_limit),
                    commit_type: CommitType::WaitFor,
                    detailed_response: false,
                })) if &index_id == "wikipedia"
                    && client_args.cluster_endpoint == Url::from_str("http://127.0.0.1:7280").unwrap()
                    && client_args.timeout.is_none()
                    && client_args.connect_timeout.is_none()
                    && client_args.commit_timeout.is_none()
                    && client_args.num_retries == 0
                    && batch_size_limit == ByteSize::kb(4)
        ));

        let app = build_cli().no_binary_name(true);
        let matches = app.try_get_matches_from([
            "index",
            "ingest",
            "--index",
            "wikipedia",
            "--timeout",
            "10s",
            "--connect-timeout",
            "2s",
        ])?;
        let command = CliCommand::parse_cli_args(matches)?;
        assert!(matches!(
            command,
            CliCommand::Index(IndexCliCommand::Ingest(
                IngestDocsArgs {
                    client_args,
                    index_id,
                    input_path_opt: None,
                    batch_size_limit_opt: None,
                    commit_type: CommitType::Auto,
                    detailed_response: false,
                })) if &index_id == "wikipedia"
                        && client_args.cluster_endpoint == Url::from_str("http://127.0.0.1:7280").unwrap()
                        && client_args.timeout == Some(Timeout::from_secs(10))
                        && client_args.connect_timeout == Some(Timeout::from_secs(2))
                        && client_args.commit_timeout.is_none()
                        && client_args.num_retries == 0
        ));

        let app = build_cli().no_binary_name(true);
        let matches = app.try_get_matches_from([
            "index",
            "ingest",
            "--index",
            "wikipedia",
            "--timeout",
            "none",
            "--wait",
            "--connect-timeout",
            "15s",
            "--commit-timeout",
            "4h",
        ])?;
        let command = CliCommand::parse_cli_args(matches)?;
        assert!(matches!(
            command,
            CliCommand::Index(IndexCliCommand::Ingest(
                IngestDocsArgs {
                    client_args,
                    index_id,
                    input_path_opt: None,
                    batch_size_limit_opt: None,
                    commit_type: CommitType::WaitFor,
                    detailed_response: false,
                })) if &index_id == "wikipedia"
                        && client_args.cluster_endpoint == Url::from_str("http://127.0.0.1:7280").unwrap()
                        && client_args.timeout == Some(Timeout::none())
                        && client_args.connect_timeout == Some(Timeout::from_secs(15))
                        && client_args.commit_timeout == Some(Timeout::from_hours(4))
        ));

        let app = build_cli().no_binary_name(true);
        assert_eq!(
            app.try_get_matches_from([
                "index",
                "ingest",
                "--index",
                "wikipedia",
                "--wait",
                "--force",
            ])
            .unwrap_err()
            .kind(),
            clap::error::ErrorKind::ArgumentConflict
        );
        Ok(())
    }

    #[test]
    fn test_parse_local_ingest_args() {
        let app = build_cli().no_binary_name(true);
        let matches = app
            .try_get_matches_from([
                "tool",
                "local-ingest",
                "--index",
                "wikipedia",
                "--config",
                "/config.yaml",
                "--overwrite",
                "--keep-cache",
                "--input-format",
                "plain",
                "--transform-script",
                ".message = downcase(string!(.message))",
            ])
            .unwrap();
        let command = CliCommand::parse_cli_args(matches).unwrap();
        assert!(matches!(
            command,
            CliCommand::Tool(ToolCliCommand::LocalIngest(
                LocalIngestDocsArgs {
                    config_uri,
                    index_id,
                    input_path_opt: None,
                    input_format,
                    overwrite,
                    vrl_script: Some(vrl_script),
                    clear_cache,
                })) if &index_id == "wikipedia"
                       && config_uri == Uri::from_str("file:///config.yaml").unwrap()
                       && vrl_script == ".message = downcase(string!(.message))"
                       && overwrite
                       && !clear_cache
                       && input_format == SourceInputFormat::PlainText,
        ));
    }

    #[test]
    fn test_parse_search_args() -> anyhow::Result<()> {
        let app = build_cli().no_binary_name(true);
        let matches = app.try_get_matches_from([
            "index",
            "search",
            "--index",
            "wikipedia",
            "--query",
            "Barack Obama",
        ])?;
        let command = CliCommand::parse_cli_args(matches)?;
        assert!(matches!(
            command,
            CliCommand::Index(IndexCliCommand::Search(SearchIndexArgs {
                index_id,
                query,
                max_hits: 20,
                start_offset: 0,
                search_fields: None,
                snippet_fields: None,
                start_timestamp: None,
                end_timestamp: None,
                aggregation: None,
                ..
            })) if &index_id == "wikipedia" && &query == "Barack Obama"
        ));

        let app = build_cli().no_binary_name(true);
        let matches = app.try_get_matches_from([
            "index",
            "search",
            "--index",
            "wikipedia",
            "--query",
            "Barack Obama",
            "--max-hits",
            "50",
            "--start-offset",
            "100",
            "--start-timestamp",
            "0",
            "--end-timestamp",
            "1",
            "--search-fields",
            "title",
            "url",
            "--snippet-fields",
            "body",
        ])?;
        let command = CliCommand::parse_cli_args(matches)?;
        assert!(matches!(
            command,
            CliCommand::Index(IndexCliCommand::Search(SearchIndexArgs {
                client_args: _,
                index_id,
                query,
                aggregation: None,
                max_hits: 50,
                start_offset: 100,
                search_fields: Some(search_field_names),
                snippet_fields: Some(snippet_field_names),
                start_timestamp: Some(0),
                end_timestamp: Some(1),
                sort_by_score: false,
            })) if &index_id == "wikipedia"
                  && query == "Barack Obama"
                  && search_field_names == vec!["title".to_string(), "url".to_string()]
                  && snippet_field_names == vec!["body".to_string()]
        ));
        Ok(())
    }

    #[test]
    fn test_parse_local_search_args() {
        let app = build_cli().no_binary_name(true);
        let matches = app
            .try_get_matches_from([
                "tool",
                "local-search",
                "--index",
                "wikipedia",
                "--query",
                "Barack Obama",
            ])
            .unwrap();
        let command = CliCommand::parse_cli_args(matches).unwrap();
        assert!(matches!(
            command,
            CliCommand::Tool(ToolCliCommand::LocalSearch(LocalSearchArgs {
                index_id,
                query,
                max_hits: 20,
                start_offset: 0,
                search_fields: None,
                snippet_fields: None,
                start_timestamp: None,
                end_timestamp: None,
                aggregation: None,
                ..
            })) if &index_id == "wikipedia" && &query == "Barack Obama"
        ));

        let app = build_cli().no_binary_name(true);
        let matches = app
            .try_get_matches_from([
                "tool",
                "local-search",
                "--index",
                "wikipedia",
                "--query",
                "Barack Obama",
                "--max-hits",
                "50",
                "--start-offset",
                "100",
                "--start-timestamp",
                "0",
                "--end-timestamp",
                "1",
                "--search-fields",
                "title",
                "url",
                "--snippet-fields",
                "body",
                "--sort-by-field=-score",
            ])
            .unwrap();
        let command = CliCommand::parse_cli_args(matches).unwrap();
        assert!(matches!(
            command,
            CliCommand::Tool(ToolCliCommand::LocalSearch(LocalSearchArgs {
                config_uri: _,
                index_id,
                query,
                aggregation: None,
                max_hits: 50,
                start_offset: 100,
                search_fields: Some(search_field_names),
                snippet_fields: Some(snippet_field_names),
                start_timestamp: Some(0),
                end_timestamp: Some(1),
                sort_by_field: Some(sort_by_field),
            })) if &index_id == "wikipedia"
                  && query == "Barack Obama"
                  && search_field_names == vec!["title".to_string(), "url".to_string()]
                  && snippet_field_names == vec!["body".to_string()]
                  && sort_by_field == "-score"
        ));
    }

    #[test]
    fn test_parse_delete_args() {
        let app = build_cli().no_binary_name(true);
        let matches = app
            .try_get_matches_from(["index", "delete", "--index", "wikipedia"])
            .unwrap();
        let command = CliCommand::parse_cli_args(matches).unwrap();
        assert!(matches!(
            command,
            CliCommand::Index(IndexCliCommand::Delete(DeleteIndexArgs {
                index_id,
                dry_run: false,
                ..
            })) if &index_id == "wikipedia"
        ));

        let app = build_cli().no_binary_name(true);
        let matches = app
            .try_get_matches_from(["index", "delete", "--index", "wikipedia", "--dry-run"])
            .unwrap();
        let command = CliCommand::parse_cli_args(matches).unwrap();
        assert!(matches!(
            command,
            CliCommand::Index(IndexCliCommand::Delete(DeleteIndexArgs {
                index_id,
                dry_run: true,
                ..
            })) if &index_id == "wikipedia"
        ));
    }

    #[test]
    fn test_parse_describe_index_args() {
        let app = build_cli().no_binary_name(true);
        let matches = app
            .try_get_matches_from(["index", "describe", "--index", "wikipedia"])
            .unwrap();
        let command = CliCommand::parse_cli_args(matches).unwrap();
        assert!(matches!(
            command,
            CliCommand::Index(IndexCliCommand::Describe(DescribeIndexArgs {
                index_id,
                ..
            })) if &index_id == "wikipedia"
        ));
    }

    #[test]
    fn test_parse_split_describe_args() -> anyhow::Result<()> {
        let app = build_cli().no_binary_name(true);
        let matches = app.try_get_matches_from([
            "split",
            "describe",
            "--index",
            "wikipedia",
            "--split",
            "ABC",
        ])?;
        let command = CliCommand::parse_cli_args(matches)?;
        assert!(matches!(
            command,
            CliCommand::Split(SplitCliCommand::Describe(DescribeSplitArgs {
                index_id,
                split_id,
                verbose: false,
                ..
            })) if &index_id == "wikipedia" && &split_id == "ABC"
        ));
        Ok(())
    }

    #[test]
    fn test_parse_split_extract_args() -> anyhow::Result<()> {
        let app = build_cli().no_binary_name(true);
        let matches = app.try_get_matches_from([
            "tool",
            "extract-split",
            "--index",
            "wikipedia",
            "--split",
            "ABC",
            "--target-dir",
            "datadir",
            "--config",
            "/config.yaml",
        ])?;
        let command = CliCommand::parse_cli_args(matches)?;
        assert!(matches!(
            command,
            CliCommand::Tool(ToolCliCommand::ExtractSplit(ExtractSplitArgs {
                index_id,
                split_id,
                target_dir,
                ..
            })) if &index_id == "wikipedia" && &split_id == "ABC" && target_dir == *"datadir"
        ));
        Ok(())
    }

    #[test]
    fn test_parse_garbage_collect_args() -> anyhow::Result<()> {
        let app = build_cli().no_binary_name(true);
        let matches = app.try_get_matches_from([
            "tool",
            "gc",
            "--index",
            "wikipedia",
            "--config",
            "/config.yaml",
        ])?;
        let command = CliCommand::parse_cli_args(matches)?;
        assert!(matches!(
            command,
            CliCommand::Tool(ToolCliCommand::GarbageCollect(GarbageCollectIndexArgs {
                index_id,
                grace_period,
                dry_run: false,
                ..
            })) if &index_id == "wikipedia" && grace_period == Duration::from_secs(60 * 60)
        ));

        let app = build_cli().no_binary_name(true);
        let matches = app.try_get_matches_from([
            "tool",
            "gc",
            "--index",
            "wikipedia",
            "--grace-period",
            "5m",
            "--config",
            "/config.yaml",
            "--dry-run",
        ])?;
        let command = CliCommand::parse_cli_args(matches)?;
        let expected_config_uri = Uri::from_str("file:///config.yaml").unwrap();
        assert!(matches!(
            command,
            CliCommand::Tool(ToolCliCommand::GarbageCollect(GarbageCollectIndexArgs {
                index_id,
                grace_period,
                config_uri,
                dry_run: true,
            })) if &index_id == "wikipedia" && grace_period == Duration::from_secs(5 * 60) && config_uri == expected_config_uri
        ));
        Ok(())
    }

    #[test]
    fn test_parse_merge_args() -> anyhow::Result<()> {
        let app = build_cli().no_binary_name(true);
        let matches = app.try_get_matches_from([
            "tool",
            "merge",
            "--index",
            "wikipedia",
            "--source",
            "ingest-source",
            "--config",
            "/config.yaml",
        ])?;
        let command = CliCommand::parse_cli_args(matches)?;
        assert!(matches!(
            command,
            CliCommand::Tool(ToolCliCommand::Merge(MergeArgs {
                index_id,
                source_id,
                ..
            })) if &index_id == "wikipedia" && source_id == "ingest-source"
        ));
        Ok(())
    }

    #[test]
    fn test_parse_no_color() {
        // SAFETY: this test may not be entirely sound if not run with nextest or --test-threads=1
        // as this is only a test, and it would be extremly inconvenient to run it in a different
        // way, we are keeping it that way

        let previous_no_color_res = std::env::var("NO_COLOR");
        {
            unsafe { std::env::set_var("NO_COLOR", "whatever_interpreted_as_true") };
            let app = build_cli().no_binary_name(true);
            let matches = app.try_get_matches_from(["run"]).unwrap();
            let no_color = matches.get_flag("no-color");
            assert!(no_color);
        }
        {
            // empty string is false.
            unsafe { std::env::set_var("NO_COLOR", "") };
            let app = build_cli().no_binary_name(true);
            let matches = app.try_get_matches_from(["run"]).unwrap();
            let no_color = matches.get_flag("no-color");
            assert!(!no_color);
        }
        {
            // empty string is false.
            let app = build_cli().no_binary_name(true);
            let matches = app.try_get_matches_from(["run", "--no-color"]).unwrap();
            let no_color = matches.get_flag("no-color");
            assert!(no_color);
        }
        if let Ok(previous_no_color) = previous_no_color_res {
            unsafe { std::env::set_var("NO_COLOR", previous_no_color) };
        }
    }
}


================================================
FILE: quickwit/quickwit-cli/src/metrics.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use once_cell::sync::Lazy;
use quickwit_common::metrics::{HistogramVec, new_histogram_vec};

pub struct CliMetrics {
    pub thread_unpark_duration_microseconds: HistogramVec<0>,
}

impl Default for CliMetrics {
    fn default() -> Self {
        CliMetrics {
            thread_unpark_duration_microseconds: new_histogram_vec(
                "thread_unpark_duration_microseconds",
                "Duration for which a thread of the main tokio runtime is unparked.",
                "cli",
                &[],
                [],
                quickwit_common::metrics::exponential_buckets(5.0, 5.0, 5).unwrap(),
            ),
        }
    }
}

/// Serve counters exposes a bunch a set of metrics about the request received to quickwit.
pub static CLI_METRICS: Lazy<CliMetrics> = Lazy::new(CliMetrics::default);


================================================
FILE: quickwit/quickwit-cli/src/service.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::HashSet;
use std::pin::pin;
use std::str::FromStr;

use clap::{ArgAction, ArgMatches, Command, arg};
use colored::Colorize;
use futures::future::select;
use itertools::Itertools;
use quickwit_common::runtimes::RuntimesConfig;
use quickwit_common::uri::{Protocol, Uri};
use quickwit_config::NodeConfig;
use quickwit_config::service::QuickwitService;
use quickwit_serve::tcp_listener::DefaultTcpListenerResolver;
use quickwit_serve::{BuildInfo, EnvFilterReloadFn, serve_quickwit};
use quickwit_telemetry::payload::{QuickwitFeature, QuickwitTelemetryInfo, TelemetryEvent};
use tokio::signal;
use tracing::{debug, info};

use crate::checklist::{BLUE_COLOR, RED_COLOR};
use crate::{config_cli_arg, get_resolvers, load_node_config, start_actor_runtimes};

pub fn build_run_command() -> Command {
    Command::new("run")
        .about("Starts a Quickwit node.")
        .long_about("Starts a Quickwit node with all services enabled by default: `indexer`, `searcher`, `metastore`, `control-plane`, and `janitor`.")
        .arg(config_cli_arg())
        .args(&[
            arg!(--"service" <SERVICE> "Services (`indexer`, `searcher`, `metastore`, `control-plane`, or `janitor`) to run. If unspecified, all the supported services are started.")
                .action(ArgAction::Append)
                .required(false),
        ])
}

#[derive(Debug, Eq, PartialEq)]
pub struct RunCliCommand {
    pub config_uri: Uri,
    pub services: Option<HashSet<QuickwitService>>,
}

async fn listen_interrupt() {
    async fn ctrl_c() {
        signal::ctrl_c()
            .await
            .expect("registering a signal handler for SIGINT should not fail");
        // carriage return to hide the ^C echo from the terminal
        print!("\r");
    }
    ctrl_c().await;
    println!(
        "{} Graceful shutdown initiated. Waiting for ingested data to be indexed. This may take a \
         few minutes. Press Ctrl+C again to force shutdown.",
        "❢".color(BLUE_COLOR)
    );
    tokio::spawn(async {
        ctrl_c().await;
        println!(
            "{} Quickwit was forcefully shut down. Some data might not have been indexed.",
            "✘".color(RED_COLOR)
        );
        std::process::exit(1);
    });
}

async fn listen_sigterm() {
    signal::unix::signal(signal::unix::SignalKind::terminate())
        .expect("registering a signal handler for SIGTERM should not fail")
        .recv()
        .await;
    info!("SIGTERM received");
}

impl RunCliCommand {
    pub fn parse_cli_args(mut matches: ArgMatches) -> anyhow::Result<Self> {
        let config_uri = matches
            .remove_one::<String>("config")
            .map(|uri_str| Uri::from_str(&uri_str))
            .expect("`config` should be a required arg.")?;
        let services = matches
            .remove_many::<String>("service")
            .map(|values| {
                let services: Result<HashSet<_>, _> = values
                    .into_iter()
                    .map(|service_str| QuickwitService::from_str(&service_str))
                    .collect();
                services
            })
            .transpose()?;
        Ok(RunCliCommand {
            config_uri,
            services,
        })
    }

    pub async fn execute(&self, env_filter_reload_fn: EnvFilterReloadFn) -> anyhow::Result<()> {
        debug!(args = ?self, "run-service");
        let version_text = BuildInfo::get_version_text();
        info!("quickwit version: {version_text}");
        let mut node_config = load_node_config(&self.config_uri).await?;
        let (storage_resolver, metastore_resolver) =
            get_resolvers(&node_config.storage_configs, &node_config.metastore_configs);
        crate::busy_detector::set_enabled(true);

        if let Some(services) = &self.services {
            info!(services = %services.iter().join(", "), "setting services from override");
            node_config.enabled_services.clone_from(services);
        }
        let telemetry_handle_opt =
            quickwit_telemetry::start_telemetry_loop(quickwit_telemetry_info(&node_config));
        quickwit_telemetry::send_telemetry_event(TelemetryEvent::RunCommand).await;
        // TODO move in serve quickwit?
        let runtimes_config = RuntimesConfig::default();
        start_actor_runtimes(runtimes_config, &node_config.enabled_services)?;
        let shutdown_signal = Box::pin(async {
            select(pin!(listen_interrupt()), pin!(listen_sigterm())).await;
        });
        let serve_result = serve_quickwit(
            node_config,
            runtimes_config,
            metastore_resolver,
            storage_resolver,
            DefaultTcpListenerResolver,
            shutdown_signal,
            env_filter_reload_fn,
        )
        .await;
        let return_code = match serve_result {
            Ok(_) => 0,
            Err(_) => 1,
        };
        quickwit_telemetry::send_telemetry_event(TelemetryEvent::EndCommand { return_code }).await;
        if let Some(telemetry_handle) = telemetry_handle_opt {
            telemetry_handle.terminate_telemetry().await;
        }
        serve_result?;
        info!("quickwit successfully terminated");
        Ok(())
    }
}

fn quickwit_telemetry_info(config: &NodeConfig) -> QuickwitTelemetryInfo {
    let mut features = HashSet::new();
    if config.indexer_config.enable_otlp_endpoint {
        features.insert(QuickwitFeature::Otlp);
    }
    if config.jaeger_config.enable_endpoint {
        features.insert(QuickwitFeature::Jaeger);
    }
    // The metastore URI is only relevant if the metastore is enabled.
    if config.is_service_enabled(QuickwitService::Metastore) {
        let feature = if config.metastore_uri.protocol() == Protocol::PostgreSQL {
            QuickwitFeature::PostgresqMetastore
        } else {
            QuickwitFeature::FileBackedMetastore
        };
        features.insert(feature);
    }
    let services = config
        .enabled_services
        .iter()
        .map(|service| service.to_string())
        .collect();
    QuickwitTelemetryInfo::new(services, features)
}

#[cfg(test)]
mod tests {

    use super::*;
    use crate::cli::{CliCommand, build_cli};

    #[test]
    fn test_parse_service_run_args_all_services() -> anyhow::Result<()> {
        let command = build_cli().no_binary_name(true);
        let matches = command.try_get_matches_from(vec!["run", "--config", "/config.yaml"])?;
        let command = CliCommand::parse_cli_args(matches)?;
        let expected_config_uri = Uri::from_str("file:///config.yaml").unwrap();
        assert!(matches!(
            command,
            CliCommand::Run(RunCliCommand {
                config_uri,
                services,
                ..
            })
            if config_uri == expected_config_uri && services.is_none()
        ));
        Ok(())
    }

    #[test]
    fn test_parse_service_run_args_indexer_only() -> anyhow::Result<()> {
        let command = build_cli().no_binary_name(true);
        let matches = command.try_get_matches_from(vec![
            "run",
            "--config",
            "/config.yaml",
            "--service",
            "indexer",
        ])?;
        let command = CliCommand::parse_cli_args(matches)?;
        let expected_config_uri = Uri::from_str("file:///config.yaml").unwrap();
        assert!(matches!(
            command,
            CliCommand::Run(RunCliCommand {
                config_uri,
                services,
                ..
            })
            if config_uri == expected_config_uri && services.as_ref().unwrap().len() == 1 && services.as_ref().unwrap().iter().cloned().next().unwrap() == QuickwitService::Indexer
        ));
        Ok(())
    }

    #[test]
    fn test_parse_service_run_args_searcher_and_metastore() -> anyhow::Result<()> {
        let command = build_cli().no_binary_name(true);
        let matches = command.try_get_matches_from(vec![
            "run",
            "--config",
            "/config.yaml",
            "--service",
            "searcher",
            "--service",
            "metastore",
        ])?;
        let command = CliCommand::parse_cli_args(matches).unwrap();
        let expected_config_uri = Uri::from_str("file:///config.yaml").unwrap();
        let expected_services =
            HashSet::from_iter([QuickwitService::Metastore, QuickwitService::Searcher]);
        assert!(matches!(
            command,
            CliCommand::Run(RunCliCommand {
                config_uri,
                services,
                ..
            })
            if config_uri == expected_config_uri && services.as_ref().unwrap().len() == 2 && services.as_ref().unwrap() == &expected_services
        ));
        Ok(())
    }

    #[test]
    fn test_parse_service_run_indexer_only_args() -> anyhow::Result<()> {
        let command = build_cli().no_binary_name(true);
        let matches = command.try_get_matches_from(vec![
            "run",
            "--config",
            "/config.yaml",
            "--service",
            "indexer",
        ])?;
        let command = CliCommand::parse_cli_args(matches)?;
        let expected_config_uri = Uri::from_str("file:///config.yaml").unwrap();
        assert!(matches!(
            command,
            CliCommand::Run(RunCliCommand {
                config_uri,
                services,
                ..
            })
            if config_uri == expected_config_uri && services.as_ref().unwrap().len() == 1 && services.as_ref().unwrap().contains(&QuickwitService::Indexer)
        ));
        Ok(())
    }
}


================================================
FILE: quickwit/quickwit-cli/src/source.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::str::FromStr;

use anyhow::{Context, bail};
use clap::{ArgMatches, Command, arg};
use colored::Colorize;
use itertools::Itertools;
use quickwit_common::uri::Uri;
use quickwit_config::{ConfigFormat, SourceConfig, validate_identifier};
use quickwit_metastore::checkpoint::SourceCheckpoint;
use quickwit_proto::types::{IndexId, SourceId};
use quickwit_storage::{StorageResolver, load_file};
use serde_json::Value as JsonValue;
use tabled::{Table, Tabled};
use tracing::debug;

use crate::checklist::GREEN_COLOR;
use crate::{ClientArgs, client_args, make_table, prompt_confirmation};

pub fn build_source_command() -> Command {
    Command::new("source")
        .about("Manages sources: creates, updates, deletes sources...")
        .args(client_args())
        .subcommand(
            Command::new("create")
                .about("Adds a new source to an index.")
                .args(&[
                    arg!(--index <INDEX_ID> "ID of the target index")
                        .display_order(1)
                        .required(true),
                    arg!(--"source-config" <SOURCE_CONFIG> "Path to source config file. Please, refer to the documentation for more details.")
                        .required(true),
                ])
            )
        .subcommand(
            Command::new("update")
                .about("Updates an existing source.")
                .args(&[
                    arg!(--index <INDEX_ID> "ID of the target index")
                        .display_order(1)
                        .required(true),
                    arg!(--source <SOURCE_ID> "ID of the source")
                        .display_order(2)
                        .required(true),
                    arg!(--"source-config" <SOURCE_CONFIG> "Path to source config file. Please, refer to the documentation for more details.")
                        .required(true),
                    arg!(--"create" "Create the index if it does not already exists.")
                        .required(false),
                ])
            )
        .subcommand(
            Command::new("enable")
                .about("Enables a source for an index.")
                .args(&[
                    arg!(--index <INDEX_ID> "ID of the target index")
                        .display_order(1)
                        .required(true),
                    arg!(--source <SOURCE_ID> "ID of the source.")
                        .display_order(2)
                        .required(true),
                ])
            )
        .subcommand(
            Command::new("disable")
                .about("Disables a source for an index.")
                .args(&[
                    arg!(--index <INDEX_ID> "ID of the target index")
                        .display_order(1)
                        .required(true),
                    arg!(--source <SOURCE_ID> "ID of the source.")
                        .display_order(2)
                        .required(true),
                ])
            )
        .subcommand(
            Command::new("ingest-api")
                .about("Enables/disables the ingest API of an index.")
                .args(&[
                    arg!(--index <INDEX> "ID of the target index")
                        .display_order(1)
                        .required(true),
                    arg!(--enable "Enables the ingest API.")
                        .display_order(2),
                    arg!(--disable "Disables the ingest API.")
                        .display_order(3)
                        .conflicts_with("enable"),
                ])
            )
        .subcommand(
            Command::new("delete")
                .about("Deletes a source from an index.")
                .alias("del")
                .args(&[
                    arg!(--index <INDEX_ID> "ID of the target index")
                        .display_order(1)
                        .required(true),
                    arg!(--source <SOURCE_ID> "ID of the source.")
                        .display_order(2)
                        .required(true),
                ])
            )
        .subcommand(
            Command::new("describe")
                .about("Describes a source.")
                .alias("desc")
                .args(&[
                    arg!(--index <INDEX_ID> "ID of the target index")
                        .display_order(1)
                        .required(true),
                    arg!(--source <SOURCE_ID> "ID of the source.")
                        .display_order(2)
                        .required(true),
                ])
            )
        .subcommand(
            Command::new("list")
                .about("Lists the sources of an index.")
                .alias("ls")
                .args(&[
                    arg!(--index <INDEX_ID> "ID of the target index")
                        .display_order(1)
                        .required(true),
                ])
            )
        .subcommand(
            Command::new("reset-checkpoint")
                .about("Resets a source checkpoint.")
                .alias("reset")
                .args(&[
                    arg!(--index <INDEX_ID> "Index ID")
                        .display_order(1)
                        .required(true),
                    arg!(--source <SOURCE_ID> "Source ID")
                        .display_order(2)
                        .required(true),
                ])
            )
        .arg_required_else_help(true)
}

#[derive(Debug, Eq, PartialEq)]
pub struct CreateSourceArgs {
    pub client_args: ClientArgs,
    pub index_id: IndexId,
    pub source_config_uri: Uri,
}

#[derive(Debug, Eq, PartialEq)]
pub struct UpdateSourceArgs {
    pub client_args: ClientArgs,
    pub index_id: IndexId,
    pub source_id: SourceId,
    pub source_config_uri: Uri,
    pub create: bool,
}

#[derive(Debug, Eq, PartialEq)]
pub struct ToggleSourceArgs {
    pub client_args: ClientArgs,
    pub index_id: IndexId,
    pub source_id: SourceId,
    pub enable: bool,
}

#[derive(Debug, Eq, PartialEq)]
pub struct DeleteSourceArgs {
    pub client_args: ClientArgs,
    pub index_id: IndexId,
    pub source_id: SourceId,
    pub assume_yes: bool,
}

#[derive(Debug, Eq, PartialEq)]
pub struct DescribeSourceArgs {
    pub client_args: ClientArgs,
    pub index_id: IndexId,
    pub source_id: SourceId,
}

#[derive(Debug, Eq, PartialEq)]
pub struct ListSourcesArgs {
    pub client_args: ClientArgs,
    pub index_id: IndexId,
}

#[derive(Debug, Eq, PartialEq)]
pub struct ResetCheckpointArgs {
    pub client_args: ClientArgs,
    pub index_id: IndexId,
    pub source_id: SourceId,
    pub assume_yes: bool,
}

#[derive(Debug, Eq, PartialEq)]
pub enum SourceCliCommand {
    CreateSource(CreateSourceArgs),
    UpdateSource(UpdateSourceArgs),
    ToggleSource(ToggleSourceArgs),
    DeleteSource(DeleteSourceArgs),
    DescribeSource(DescribeSourceArgs),
    ListSources(ListSourcesArgs),
    ResetCheckpoint(ResetCheckpointArgs),
}

impl SourceCliCommand {
    pub async fn execute(self) -> anyhow::Result<()> {
        match self {
            Self::CreateSource(args) => create_source_cli(args).await,
            Self::UpdateSource(args) => update_source_cli(args).await,
            Self::ToggleSource(args) => toggle_source_cli(args).await,
            Self::DeleteSource(args) => delete_source_cli(args).await,
            Self::DescribeSource(args) => describe_source_cli(args).await,
            Self::ListSources(args) => list_sources_cli(args).await,
            Self::ResetCheckpoint(args) => reset_checkpoint_cli(args).await,
        }
    }

    pub fn parse_cli_args(mut matches: ArgMatches) -> anyhow::Result<Self> {
        let (subcommand, submatches) = matches
            .remove_subcommand()
            .context("failed to parse source subcommand")?;
        match subcommand.as_str() {
            "create" => Self::parse_create_args(submatches).map(Self::CreateSource),
            "update" => Self::parse_update_args(submatches).map(Self::UpdateSource),
            "enable" => {
                Self::parse_toggle_source_args(&subcommand, submatches).map(Self::ToggleSource)
            }
            "disable" => {
                Self::parse_toggle_source_args(&subcommand, submatches).map(Self::ToggleSource)
            }
            "delete" => Self::parse_delete_args(submatches).map(Self::DeleteSource),
            "describe" => Self::parse_describe_args(submatches).map(Self::DescribeSource),
            "list" => Self::parse_list_args(submatches).map(Self::ListSources),
            "reset-checkpoint" => {
                Self::parse_reset_checkpoint_args(submatches).map(Self::ResetCheckpoint)
            }
            _ => bail!("unknown source subcommand `{subcommand}`"),
        }
    }

    fn parse_create_args(mut matches: ArgMatches) -> anyhow::Result<CreateSourceArgs> {
        let client_args = ClientArgs::parse(&mut matches)?;
        let index_id = matches
            .remove_one::<String>("index")
            .expect("`index` should be a required arg.");
        let source_config_uri = matches
            .remove_one::<String>("source-config")
            .map(|uri_str| Uri::from_str(&uri_str))
            .expect("`source-config` should be a required arg.")?;
        Ok(CreateSourceArgs {
            client_args,
            index_id,
            source_config_uri,
        })
    }

    fn parse_update_args(mut matches: ArgMatches) -> anyhow::Result<UpdateSourceArgs> {
        let client_args = ClientArgs::parse(&mut matches)?;
        let index_id = matches
            .remove_one::<String>("index")
            .expect("`index` should be a required arg.");
        let source_id = matches
            .remove_one::<String>("source")
            .expect("`source` should be a required arg.");
        let source_config_uri = matches
            .remove_one::<String>("source-config")
            .map(|uri_str| Uri::from_str(&uri_str))
            .expect("`source-config` should be a required arg.")?;
        let create = matches.get_flag("create");

        Ok(UpdateSourceArgs {
            client_args,
            index_id,
            source_id,
            source_config_uri,
            create,
        })
    }

    fn parse_toggle_source_args(
        subcommand: &str,
        mut matches: ArgMatches,
    ) -> anyhow::Result<ToggleSourceArgs> {
        let client_args = ClientArgs::parse(&mut matches)?;
        let index_id = matches
            .remove_one::<String>("index")
            .expect("`index` should be a required arg.");
        let source_id = matches
            .remove_one::<String>("source")
            .expect("`source` should be a required arg.");
        let enable = matches!(subcommand, "enable");
        Ok(ToggleSourceArgs {
            client_args,
            index_id,
            source_id,
            enable,
        })
    }

    fn parse_delete_args(mut matches: ArgMatches) -> anyhow::Result<DeleteSourceArgs> {
        let client_args = ClientArgs::parse(&mut matches)?;
        let index_id = matches
            .remove_one::<String>("index")
            .expect("`index` should be a required arg.");
        let source_id = matches
            .remove_one::<String>("source")
            .expect("`source` should be a required arg.");
        let assume_yes = matches.get_flag("yes");
        Ok(DeleteSourceArgs {
            client_args,
            index_id,
            source_id,
            assume_yes,
        })
    }

    fn parse_describe_args(mut matches: ArgMatches) -> anyhow::Result<DescribeSourceArgs> {
        let client_args = ClientArgs::parse(&mut matches)?;
        let index_id = matches
            .remove_one::<String>("index")
            .expect("`index` should be a required arg.");
        let source_id = matches
            .remove_one::<String>("source")
            .expect("`source` should be a required arg.");
        Ok(DescribeSourceArgs {
            client_args,
            index_id,
            source_id,
        })
    }

    fn parse_list_args(mut matches: ArgMatches) -> anyhow::Result<ListSourcesArgs> {
        let client_args = ClientArgs::parse(&mut matches)?;
        let index_id = matches
            .remove_one::<String>("index")
            .expect("`index` should be a required arg.");
        Ok(ListSourcesArgs {
            client_args,
            index_id,
        })
    }

    fn parse_reset_checkpoint_args(mut matches: ArgMatches) -> anyhow::Result<ResetCheckpointArgs> {
        let client_args = ClientArgs::parse(&mut matches)?;
        let index_id = matches
            .remove_one::<String>("index")
            .expect("`index` should be a required arg.");
        let source_id = matches
            .remove_one::<String>("source")
            .expect("`source` should be a required arg.");
        let assume_yes = matches.get_flag("yes");
        Ok(ResetCheckpointArgs {
            client_args,
            index_id,
            source_id,
            assume_yes,
        })
    }
}

async fn create_source_cli(args: CreateSourceArgs) -> anyhow::Result<()> {
    debug!(args=?args, "create-source");
    println!("❯ Creating source...");
    let storage_resolver = StorageResolver::unconfigured();
    let source_config_content = load_file(&storage_resolver, &args.source_config_uri).await?;
    let source_config_str: &str = std::str::from_utf8(&source_config_content)
        .with_context(|| format!("source config is not utf-8: {}", args.source_config_uri))?;
    let config_format = ConfigFormat::sniff_from_uri(&args.source_config_uri)?;
    let qw_client = args.client_args.client();
    qw_client
        .sources(&args.index_id)
        .create(source_config_str, config_format)
        .await?;
    println!("{} Source successfully created.", "✔".color(GREEN_COLOR));
    Ok(())
}

async fn update_source_cli(args: UpdateSourceArgs) -> anyhow::Result<()> {
    debug!(args=?args, "update-source");
    println!("❯ Updating source...");
    let storage_resolver = StorageResolver::unconfigured();
    let source_config_content = load_file(&storage_resolver, &args.source_config_uri).await?;
    let source_config_str: &str = std::str::from_utf8(&source_config_content)
        .with_context(|| format!("source config is not utf-8: {}", args.source_config_uri))?;
    let config_format = ConfigFormat::sniff_from_uri(&args.source_config_uri)?;
    let qw_client = args.client_args.client();
    qw_client
        .sources(&args.index_id)
        .update(
            &args.source_id,
            source_config_str,
            config_format,
            args.create,
        )
        .await?;
    println!("{} Source successfully updated.", "✔".color(GREEN_COLOR));
    Ok(())
}

async fn toggle_source_cli(args: ToggleSourceArgs) -> anyhow::Result<()> {
    debug!(args=?args, "toggle-source");
    println!("❯ Toggling source...");
    let qw_client = args.client_args.client();
    qw_client
        .sources(&args.index_id)
        .toggle(&args.source_id, args.enable)
        .await
        .context("failed to update source")?;

    let toggled_state_name = if args.enable { "enabled" } else { "disabled" };
    println!(
        "{} Source successfully {}.",
        toggled_state_name,
        "✔".color(GREEN_COLOR)
    );
    Ok(())
}

async fn delete_source_cli(args: DeleteSourceArgs) -> anyhow::Result<()> {
    debug!(args=?args, "delete-source");
    println!("❯ Deleting source...");
    validate_identifier("Source ID", &args.source_id)?;

    if !args.assume_yes {
        let prompt = "This operation will delete the source. Do you want to proceed?".to_string();
        if !prompt_confirmation(&prompt, false) {
            return Ok(());
        }
    }

    let qw_client = args.client_args.client();
    qw_client
        .sources(&args.index_id)
        .delete(&args.source_id)
        .await
        .context("failed to delete source")?;
    println!("{} Source successfully deleted.", "✔".color(GREEN_COLOR));
    Ok(())
}

async fn describe_source_cli(args: DescribeSourceArgs) -> anyhow::Result<()> {
    debug!(args=?args, "describe-source");
    let qw_client = args.client_args.client();
    let index_metadata = qw_client
        .indexes()
        .get(&args.index_id)
        .await
        .context("failed to fetch index metadata")?;
    let source_checkpoint = index_metadata
        .checkpoint
        .source_checkpoint(&args.source_id)
        .cloned()
        .unwrap_or_default();
    let (source_table, params_table, checkpoint_table) = make_describe_source_tables(
        source_checkpoint,
        index_metadata.sources.into_values(),
        &args.source_id,
    )?;
    display_tables(&[source_table, params_table, checkpoint_table]);
    Ok(())
}

fn make_describe_source_tables<I>(
    checkpoint: SourceCheckpoint,
    sources: I,
    source_id: &str,
) -> anyhow::Result<(Table, Table, Table)>
where
    I: IntoIterator<Item = SourceConfig>,
{
    let source = sources
        .into_iter()
        .find(|source| source.source_id == source_id)
        .with_context(|| format!("source `{source_id}` does not exist"))?;

    let source_rows = vec![SourceRow {
        source_id: source.source_id.clone(),
        source_type: source.source_type().as_str().to_string(),
        enabled: source.enabled.to_string(),
    }];
    let source_table = make_table("Source", source_rows, true);

    let params_rows = flatten_json(source.params())
        .into_iter()
        .map(|(key, value)| ParamsRow { key, value })
        .sorted_by(|left, right| left.key.cmp(&right.key));
    let params_table = make_table("Parameters", params_rows, false);

    let checkpoint_rows = checkpoint
        .iter()
        .map(|(partition_id, position)| CheckpointRow {
            partition_id: partition_id.0.to_string(),
            offset: position.to_string(),
        })
        .sorted_by(|left, right| left.partition_id.cmp(&right.partition_id));
    let checkpoint_table = make_table("Checkpoint", checkpoint_rows, false);
    Ok((source_table, params_table, checkpoint_table))
}

async fn list_sources_cli(args: ListSourcesArgs) -> anyhow::Result<()> {
    let qw_client = args.client_args.client();
    let index_metadata = qw_client
        .indexes()
        .get(&args.index_id)
        .await
        .context("failed to fetch indexes metadatas")?;
    let table = make_list_sources_table(index_metadata.sources.into_values());
    display_tables(&[table]);
    Ok(())
}

fn make_list_sources_table<I>(sources: I) -> Table
where I: IntoIterator<Item = SourceConfig> {
    let rows = sources
        .into_iter()
        .map(|source| SourceRow {
            source_type: source.source_type().as_str().to_string(),
            source_id: source.source_id,
            enabled: source.enabled.to_string(),
        })
        .sorted_by(|left, right| left.source_id.cmp(&right.source_id));
    make_table("Sources", rows, false)
}

#[derive(Tabled)]
struct SourceRow {
    #[tabled(rename = "ID")]
    source_id: SourceId,
    #[tabled(rename = "Type")]
    source_type: String,
    #[tabled(rename = "Enabled")]
    enabled: String,
}

#[derive(Tabled)]
struct ParamsRow {
    #[tabled(rename = "Key")]
    key: String,
    #[tabled(rename = "Value")]
    value: JsonValue,
}

#[derive(Tabled)]
struct CheckpointRow {
    #[tabled(rename = "Partition ID")]
    partition_id: String,
    #[tabled(rename = "Offset")]
    offset: String,
}

fn display_tables(tables: &[Table]) {
    println!(
        "{}",
        tables.iter().map(|table| table.to_string()).join("\n\n")
    );
}

async fn reset_checkpoint_cli(args: ResetCheckpointArgs) -> anyhow::Result<()> {
    debug!(args=?args, "reset-checkpoint-source");
    println!("❯ Resetting source checkpoint...");
    if !args.assume_yes {
        let prompt =
            "This operation will reset the source checkpoints. Do you want to proceed?".to_string();
        if !prompt_confirmation(&prompt, false) {
            return Ok(());
        }
    }
    let qw_client = args.client_args.client();
    qw_client
        .sources(&args.index_id)
        .reset_checkpoint(&args.source_id)
        .await?;
    println!(
        "{} Checkpoint successfully deleted.",
        "✔".color(GREEN_COLOR)
    );
    Ok(())
}

/// Recursively flattens a JSON object into a vector of `(path, value)` tuples where `path`
/// represents the full path of each property in the original object. For instance, `{"root": true,
/// "parent": {"child": 0}}` yields `[("root", true), ("parent.child", 0)]`. Arrays are not
/// flattened.
fn flatten_json(value: JsonValue) -> Vec<(String, JsonValue)> {
    let mut acc = Vec::new();
    let mut values = vec![(String::new(), value)];

    while let Some((root, value)) = values.pop() {
        if let JsonValue::Object(obj) = value {
            for (key, val) in obj {
                values.push((
                    if root.is_empty() {
                        key
                    } else {
                        format!("{root}.{key}")
                    },
                    val,
                ));
            }
            continue;
        }
        acc.push((root, value))
    }
    acc
}

#[cfg(test)]
mod tests {
    use std::num::NonZeroUsize;
    use std::str::FromStr;

    use quickwit_config::{SourceInputFormat, SourceParams};
    use quickwit_metastore::checkpoint::PartitionId;
    use quickwit_proto::types::Position;
    use serde_json::json;

    use super::*;
    use crate::cli::{CliCommand, build_cli};

    #[test]
    fn test_flatten_json() {
        assert!(flatten_json(json!({})).is_empty());

        assert_eq!(
            flatten_json(json!(JsonValue::Null)),
            vec![("".to_string(), JsonValue::Null)]
        );
        assert_eq!(
            flatten_json(
                json!({"foo": {"bar": JsonValue::Bool(true)}, "baz": JsonValue::Bool(false)})
            ),
            vec![
                ("baz".to_string(), JsonValue::Bool(false)),
                ("foo.bar".to_string(), JsonValue::Bool(true)),
            ]
        );
    }

    #[test]
    fn test_parse_create_source_args() {
        let app = build_cli().no_binary_name(true);
        let matches = app
            .try_get_matches_from(vec![
                "source",
                "create",
                "--index",
                "hdfs-logs",
                "--source-config",
                "/source-conf.yaml",
            ])
            .unwrap();
        let command = CliCommand::parse_cli_args(matches).unwrap();
        let expected_command =
            CliCommand::Source(SourceCliCommand::CreateSource(CreateSourceArgs {
                client_args: ClientArgs::default(),
                index_id: "hdfs-logs".to_string(),
                source_config_uri: Uri::from_str("file:///source-conf.yaml").unwrap(),
            }));
        assert_eq!(command, expected_command);
    }

    #[test]
    fn test_parse_update_source_args() {
        let app = build_cli().no_binary_name(true);
        let matches = app
            .try_get_matches_from(vec![
                "source",
                "update",
                "--index",
                "hdfs-logs",
                "--source",
                "kafka-foo",
                "--source-config",
                "/source-conf.yaml",
            ])
            .unwrap();
        let command = CliCommand::parse_cli_args(matches).unwrap();
        let expected_command =
            CliCommand::Source(SourceCliCommand::UpdateSource(UpdateSourceArgs {
                client_args: ClientArgs::default(),
                index_id: "hdfs-logs".to_string(),
                source_id: "kafka-foo".to_string(),
                source_config_uri: Uri::from_str("file:///source-conf.yaml").unwrap(),
                create: false,
            }));
        assert_eq!(command, expected_command);
    }

    #[test]
    fn test_parse_toggle_source_args() {
        {
            let app = build_cli().no_binary_name(true);
            let matches = app
                .try_get_matches_from(vec![
                    "source",
                    "enable",
                    "--index",
                    "hdfs-logs",
                    "--source",
                    "kafka-foo",
                ])
                .unwrap();
            let command = CliCommand::parse_cli_args(matches).unwrap();
            let expected_command =
                CliCommand::Source(SourceCliCommand::ToggleSource(ToggleSourceArgs {
                    client_args: ClientArgs::default(),
                    index_id: "hdfs-logs".to_string(),
                    source_id: "kafka-foo".to_string(),
                    enable: true,
                }));
            assert_eq!(command, expected_command);
        }
        {
            let app = build_cli().no_binary_name(true);
            let matches = app
                .try_get_matches_from(vec![
                    "source",
                    "disable",
                    "--index",
                    "hdfs-logs",
                    "--source",
                    "kafka-foo",
                ])
                .unwrap();
            let command = CliCommand::parse_cli_args(matches).unwrap();
            let expected_command =
                CliCommand::Source(SourceCliCommand::ToggleSource(ToggleSourceArgs {
                    client_args: ClientArgs::default(),
                    index_id: "hdfs-logs".to_string(),
                    source_id: "kafka-foo".to_string(),
                    enable: false,
                }));
            assert_eq!(command, expected_command);
        }
    }

    #[test]
    fn test_parse_delete_source_args() {
        let app = build_cli().no_binary_name(true);
        let matches = app
            .try_get_matches_from(vec![
                "source",
                "delete",
                "--index",
                "hdfs-logs",
                "--source",
                "hdfs-logs-source",
                "--yes",
            ])
            .unwrap();
        let command = CliCommand::parse_cli_args(matches).unwrap();
        let expected_command =
            CliCommand::Source(SourceCliCommand::DeleteSource(DeleteSourceArgs {
                client_args: ClientArgs::default(),
                index_id: "hdfs-logs".to_string(),
                source_id: "hdfs-logs-source".to_string(),
                assume_yes: true,
            }));
        assert_eq!(command, expected_command);
    }

    #[test]
    fn test_parse_describe_source_args() {
        let app = build_cli().no_binary_name(true);
        let matches = app
            .try_get_matches_from(vec![
                "source",
                "describe",
                "--index",
                "hdfs-logs",
                "--source",
                "hdfs-logs-source",
            ])
            .unwrap();
        let command = CliCommand::parse_cli_args(matches).unwrap();
        let expected_command =
            CliCommand::Source(SourceCliCommand::DescribeSource(DescribeSourceArgs {
                client_args: ClientArgs::default(),
                index_id: "hdfs-logs".to_string(),
                source_id: "hdfs-logs-source".to_string(),
            }));
        assert_eq!(command, expected_command);
    }

    #[test]
    fn test_parse_reset_checkpoint_args() {
        let app = build_cli().no_binary_name(true);
        let matches = app
            .try_get_matches_from(vec![
                "source",
                "reset-checkpoint",
                "--index",
                "hdfs-logs",
                "--source",
                "hdfs-logs-source",
                "--yes",
            ])
            .unwrap();
        let command = CliCommand::parse_cli_args(matches).unwrap();
        let expected_command =
            CliCommand::Source(SourceCliCommand::ResetCheckpoint(ResetCheckpointArgs {
                client_args: ClientArgs::default(),
                index_id: "hdfs-logs".to_string(),
                source_id: "hdfs-logs-source".to_string(),
                assume_yes: true,
            }));
        assert_eq!(command, expected_command);
    }

    #[test]
    fn test_make_describe_source_tables() {
        assert!(
            make_describe_source_tables(SourceCheckpoint::default(), [], "source-does-not-exist")
                .is_err()
        );

        let checkpoint: SourceCheckpoint = vec![("shard-000", ""), ("shard-001", "1234567890")]
            .into_iter()
            .map(|(partition_id, offset)| {
                (PartitionId::from(partition_id), Position::offset(offset))
            })
            .collect();
        let sources = vec![SourceConfig {
            source_id: "foo-source".to_string(),
            num_pipelines: NonZeroUsize::MIN,
            enabled: true,
            source_params: SourceParams::file_from_str("path/to/file").unwrap(),
            transform_config: None,
            input_format: SourceInputFormat::Json,
        }];
        let expected_source = vec![SourceRow {
            source_id: "foo-source".to_string(),
            source_type: "file".to_string(),
            enabled: "true".to_string(),
        }];
        let expected_uri = Uri::from_str("path/to/file").unwrap();
        let expected_params = vec![ParamsRow {
            key: "filepath".to_string(),
            value: JsonValue::String(expected_uri.to_string()),
        }];
        let expected_checkpoint = vec![
            CheckpointRow {
                partition_id: "shard-000".to_string(),
                offset: "".to_string(),
            },
            CheckpointRow {
                partition_id: "shard-001".to_string(),
                offset: "1234567890".to_string(),
            },
        ];
        let (source_table, params_table, checkpoint_table) =
            make_describe_source_tables(checkpoint, sources, "foo-source").unwrap();
        assert_eq!(
            source_table.to_string(),
            make_table("Source", expected_source, true).to_string()
        );
        assert_eq!(
            params_table.to_string(),
            make_table("Parameters", expected_params, false).to_string()
        );
        assert_eq!(
            checkpoint_table.to_string(),
            make_table("Checkpoint", expected_checkpoint, false).to_string()
        );
    }

    #[test]
    fn test_parse_list_sources_args() {
        let app = build_cli().no_binary_name(true);
        let matches = app
            .try_get_matches_from(vec!["source", "list", "--index", "hdfs-logs"])
            .unwrap();
        let command = CliCommand::parse_cli_args(matches).unwrap();
        let expected_command = CliCommand::Source(SourceCliCommand::ListSources(ListSourcesArgs {
            client_args: ClientArgs::default(),
            index_id: "hdfs-logs".to_string(),
        }));
        assert_eq!(command, expected_command);
    }

    #[test]
    fn test_make_list_sources_table() {
        let sources = [
            SourceConfig {
                source_id: "foo-source".to_string(),
                num_pipelines: NonZeroUsize::MIN,
                enabled: true,
                source_params: SourceParams::stdin(),
                transform_config: None,
                input_format: SourceInputFormat::Json,
            },
            SourceConfig {
                source_id: "bar-source".to_string(),
                num_pipelines: NonZeroUsize::MIN,
                enabled: true,
                source_params: SourceParams::stdin(),
                transform_config: None,
                input_format: SourceInputFormat::Json,
            },
        ];
        let expected_sources = [
            SourceRow {
                source_id: "bar-source".to_string(),
                source_type: "stdin".to_string(),
                enabled: "true".to_string(),
            },
            SourceRow {
                source_id: "foo-source".to_string(),
                source_type: "stdin".to_string(),
                enabled: "true".to_string(),
            },
        ];
        assert_eq!(
            make_list_sources_table(sources).to_string(),
            make_table("Sources", expected_sources, false).to_string()
        );
    }
}


================================================
FILE: quickwit/quickwit-cli/src/split.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::str::FromStr;

use anyhow::{Context, bail};
use clap::{ArgMatches, Command, arg};
use colored::Colorize;
use itertools::Itertools;
use quickwit_metastore::{Split, SplitState};
use quickwit_proto::types::{IndexId, SplitId};
use quickwit_serve::ListSplitsQueryParams;
use tabled::{Table, Tabled};
use time::{Date, OffsetDateTime, PrimitiveDateTime, format_description};
use tracing::debug;

use crate::checklist::GREEN_COLOR;
use crate::{ClientArgs, client_args, make_table, prompt_confirmation};

pub fn build_split_command() -> Command {
    Command::new("split")
        .about("Manages splits: lists, describes, marks for deletion...")
        .args(client_args())
        .subcommand(
            Command::new("list")
                .about("Lists the splits of an index.")
                .alias("ls")
                .args(&[
                    arg!(--index <INDEX> "Target index ID")
                        .display_order(1)
                        .required(true),
                    arg!(--"offset" <OFFSET> "Number of splits to skip.")
                        .display_order(2)
                        .required(false),
                    arg!(--"limit" <LIMIT> "Maximum number of splits to retrieve.")
                        .display_order(3)
                        .required(false),
                    arg!(--states <SPLIT_STATES> "Selects the splits whose states are included in this comma-separated list of states. Possible values are `staged`, `published`, and `marked`.")
                        .display_order(4)
                        .required(false)
                        .value_delimiter(','),
                    arg!(--"create-date" <CREATE_DATE> "Selects the splits whose creation dates are before this date.")
                        .display_order(5)
                        .required(false),
                    arg!(--"start-date" <START_DATE> "Selects the splits that contain documents after this date (time-series indexes only).")
                        .display_order(6)
                        .required(false),
                    arg!(--"end-date" <END_DATE> "Selects the splits that contain documents before this date (time-series indexes only).")
                        .display_order(7)
                        .required(false),
                    // See #2762:
                    // arg!(--tags <TAGS> "Selects the splits whose tags are all included in this comma-separated list of tags.")
                    //     .display_order(6)
                    //     .required(false)
                    //     .use_value_delimiter(true),
                    arg!(--"output-format" <OUTPUT_FORMAT> "Output format. Possible values are `table`, `json`, and `pretty-json`.")
                        .alias("format")
                        .display_order(8)
                        .required(false)
                ])
            )
        .subcommand(
            Command::new("describe")
                .about("Displays metadata about a split.")
                .alias("desc")
                .args(&[
                    arg!(--index <INDEX> "ID of the target index")
                        .display_order(1)
                        .required(true),
                    arg!(--split <SPLIT> "ID of the target split")
                        .display_order(2)
                        .required(true),
                    arg!(--verbose "Displays additional metadata about the hotcache."),
                ])
            )
        .subcommand(
            Command::new("mark-for-deletion")
                .about("Marks one or multiple splits of an index for deletion.")
                .alias("mark")
                .args(&[
                    arg!(--index <INDEX_ID> "Target index ID")
                        .display_order(1)
                        .required(true),
                    arg!(--splits <SPLIT_IDS> "Comma-separated list of split IDs")
                        .display_order(2)
                        .required(true)
                        .value_delimiter(','),
                    arg!(-y --"yes" "Assume \"yes\" as an answer to all prompts and run non-interactively.")
                        .required(false),
                ])
            )
        .arg_required_else_help(true)
}

#[derive(Debug, Eq, PartialEq)]
enum OutputFormat {
    Table, // Default
    Json,
    PrettyJson,
}

impl FromStr for OutputFormat {
    type Err = anyhow::Error;

    fn from_str(output_format_str: &str) -> anyhow::Result<Self> {
        match output_format_str {
            "json" => Ok(OutputFormat::Json),
            "pretty-json" | "pretty_json" => Ok(OutputFormat::PrettyJson),
            "table" => Ok(OutputFormat::Table),
            _ => bail!(
                "unknown output format `{output_format_str}`. supported formats are: `table`, \
                 `json`, and `pretty-json`"
            ),
        }
    }
}

#[derive(Debug, PartialEq)]
pub struct ListSplitArgs {
    pub client_args: ClientArgs,
    pub index_id: IndexId,
    pub offset: Option<usize>,
    pub limit: Option<usize>,
    pub split_states: Option<Vec<SplitState>>,
    pub create_date: Option<OffsetDateTime>,
    pub start_date: Option<OffsetDateTime>,
    pub end_date: Option<OffsetDateTime>,
    // pub tags: Option<TagFilterAst>,
    output_format: OutputFormat,
}

#[derive(Debug, Eq, PartialEq)]
pub struct MarkForDeletionArgs {
    pub client_args: ClientArgs,
    pub index_id: IndexId,
    pub split_ids: Vec<String>,
    pub assume_yes: bool,
}

#[derive(Debug, Eq, PartialEq)]
pub struct DescribeSplitArgs {
    pub client_args: ClientArgs,
    pub index_id: IndexId,
    pub split_id: SplitId,
    pub verbose: bool,
}

#[derive(Debug, PartialEq)]
pub enum SplitCliCommand {
    List(ListSplitArgs),
    MarkForDeletion(MarkForDeletionArgs),
    Describe(DescribeSplitArgs),
}

impl SplitCliCommand {
    pub fn parse_cli_args(mut matches: ArgMatches) -> anyhow::Result<Self> {
        let (subcommand, submatches) = matches
            .remove_subcommand()
            .context("failed to split subcommand")?;
        match subcommand.as_str() {
            "describe" => Self::parse_describe_args(submatches),
            "list" => Self::parse_list_args(submatches),
            "mark-for-deletion" => Self::parse_mark_for_deletion_args(submatches),
            _ => bail!("unknown split subcommand `{subcommand}`"),
        }
    }

    fn parse_list_args(mut matches: ArgMatches) -> anyhow::Result<Self> {
        let client_args = ClientArgs::parse(&mut matches)?;
        let index_id = matches
            .remove_one::<String>("index")
            .expect("`index` should be a required arg.");
        let offset = matches
            .remove_one::<String>("offset")
            .and_then(|s| s.parse::<usize>().ok());
        let limit = matches
            .remove_one::<String>("limit")
            .and_then(|s| s.parse::<usize>().ok());
        let split_states = matches
            .remove_many::<String>("states")
            .map(|values| {
                values
                    .into_iter()
                    .dedup()
                    .map(|split_state_str| parse_split_state(&split_state_str))
                    .collect::<Result<Vec<_>, _>>()
            })
            .transpose()?;
        let create_date = matches
            .remove_one::<String>("create-date")
            .map(|date_str| parse_date(&date_str, "create"))
            .transpose()?;
        let start_date = matches
            .remove_one::<String>("start-date")
            .map(|date_str| parse_date(&date_str, "start"))
            .transpose()?;
        let end_date = matches
            .remove_one::<String>("end-date")
            .map(|date_str| parse_date(&date_str, "end"))
            .transpose()?;
        // let tags = matches.values_of("tags").map(|values| {
        //     TagFilterAst::And(
        //         values
        //             .into_iter()
        //             .map(|value| TagFilterAst::Tag {
        //                 get_flag: true,
        //                 tag: value.to_string(),
        //             })
        //             .collect(),
        //     )
        // });
        let output_format = matches
            .remove_one::<String>("output-format")
            .map(|s| OutputFormat::from_str(s.as_str()))
            .transpose()?
            .unwrap_or(OutputFormat::Table);
        Ok(Self::List(ListSplitArgs {
            client_args,
            index_id,
            offset,
            limit,
            split_states,
            start_date,
            end_date,
            create_date,
            // tags,
            output_format,
        }))
    }

    fn parse_mark_for_deletion_args(mut matches: ArgMatches) -> anyhow::Result<Self> {
        let client_args = ClientArgs::parse(&mut matches)?;
        let index_id = matches
            .remove_one::<String>("index")
            .expect("`index` should be a required arg.");
        let split_ids = matches
            .remove_many::<String>("splits")
            .expect("`splits` should be a required arg.")
            .collect();
        let assume_yes = matches.get_flag("yes");
        Ok(Self::MarkForDeletion(MarkForDeletionArgs {
            client_args,
            index_id,
            split_ids,
            assume_yes,
        }))
    }

    fn parse_describe_args(mut matches: ArgMatches) -> anyhow::Result<Self> {
        let index_id = matches
            .remove_one::<String>("index")
            .expect("`index` should be a required arg.");
        let split_id = matches
            .remove_one::<String>("split")
            .expect("`split` should be a required arg.");
        let client_args = ClientArgs::parse(&mut matches)?;
        let verbose = matches.get_flag("verbose");

        Ok(Self::Describe(DescribeSplitArgs {
            client_args,
            index_id,
            split_id,
            verbose,
        }))
    }

    pub async fn execute(self) -> anyhow::Result<()> {
        match self {
            Self::List(args) => list_split_cli(args).await,
            Self::MarkForDeletion(args) => mark_splits_for_deletion_cli(args).await,
            Self::Describe(args) => describe_split_cli(args).await,
        }
    }
}

async fn list_split_cli(args: ListSplitArgs) -> anyhow::Result<()> {
    debug!(args=?args, "list-split");
    let qw_client = args.client_args.client();
    let list_splits_query_params = ListSplitsQueryParams {
        offset: args.offset,
        limit: args.limit,
        split_states: args.split_states,
        start_timestamp: args.start_date.map(OffsetDateTime::unix_timestamp),
        end_timestamp: args.end_date.map(OffsetDateTime::unix_timestamp),
        end_create_timestamp: args.create_date.map(OffsetDateTime::unix_timestamp),
    };
    // TODO: plug tags.
    // if let Some(tags) = args.tags {
    //     query = query.with_tags_filter(tags);
    // }
    let splits = qw_client
        .splits(&args.index_id)
        .list(list_splits_query_params)
        .await
        .context("failed to list splits")?;
    let output = match args.output_format {
        OutputFormat::Json => serde_json::to_string(&splits)?,
        OutputFormat::PrettyJson => serde_json::to_string_pretty(&splits)?,
        OutputFormat::Table => make_split_table(&splits, "Splits").to_string(),
    };
    println!("{output}");
    Ok(())
}

async fn mark_splits_for_deletion_cli(args: MarkForDeletionArgs) -> anyhow::Result<()> {
    debug!(args=?args, "mark-splits-for-deletion");
    println!("❯ Marking splits for deletion...");
    if !args.assume_yes {
        let prompt = "This operation will mark splits for deletion, those splits will be deleted \
                      after the next garbage collection. Do you want to proceed?";
        if !prompt_confirmation(prompt, false) {
            return Ok(());
        }
    }
    let qw_client = args.client_args.client();
    qw_client
        .splits(&args.index_id)
        .mark_for_deletion(args.split_ids)
        .await?;
    println!(
        "{} Splits successfully marked for deletion.",
        "✔".color(GREEN_COLOR)
    );
    Ok(())
}

async fn describe_split_cli(args: DescribeSplitArgs) -> anyhow::Result<()> {
    debug!(args=?args, "describe-split");
    let qw_client = args.client_args.client();
    let list_splits_query_params = ListSplitsQueryParams::default();
    let split = qw_client
        .splits(&args.index_id)
        .list(list_splits_query_params)
        .await
        .expect("Failed to fetch splits.")
        .into_iter()
        .find(|split| split.split_id() == args.split_id)
        .with_context(|| {
            format!(
                "could not find split metadata in metastore {}",
                args.split_id
            )
        })?;

    println!("{}", make_split_table(&[split], "Split"));

    // TODO: if we have access to the storage, we could fetch that.
    // let split_file = PathBuf::from(format!("{}.split", args.split_id));
    // let (split_footer, _) = read_split_footer(index_storage, &split_file).await?;
    // let stats = BundleDirectory::get_stats_split(split_footer.clone())?;
    // let hotcache_bytes = get_hotcache_from_split(split_footer)?;

    // let mut file_rows = Vec::new();

    // for (path, size) in stats {
    //     file_rows.push(FileRow {
    //         file_name: path.to_str().unwrap().to_string(),
    //         size: format_size(size, DECIMAL),
    //     });
    // }
    // println!(
    //     "{}",
    //     make_table("Files in Split", file_rows.into_iter(), false)
    // );
    // if args.verbose {
    //     let mut hotcache_files = Vec::new();
    //     let hotcache_stats = HotDirectory::get_stats_per_file(hotcache_bytes)?;
    //     for (path, size) in hotcache_stats {
    //         hotcache_files.push(FileRow {
    //             file_name: path.to_str().unwrap().to_string(),
    //             size: format_size(size, DECIMAL),
    //         });
    //     }
    //     let hotcache_table = make_table("Files in Hotcache", hotcache_files.into_iter(), false);
    //     println!("{hotcache_table}");
    // }
    Ok(())
}

fn make_split_table(splits: &[Split], title: &str) -> Table {
    let rows = splits
        .iter()
        .map(|split| {
            let time_range = if let Some(time_range) = &split.split_metadata.time_range {
                format!("[{time_range:?}]")
            } else {
                "[*]".to_string()
            };
            let created_at =
                OffsetDateTime::from_unix_timestamp(split.split_metadata.create_timestamp)
                    .expect("Failed to create `OffsetDateTime` from split create timestamp.");
            let updated_at = OffsetDateTime::from_unix_timestamp(split.update_timestamp)
                .expect("Failed to create `OffsetDateTime` from split update timestamp.");

            SplitRow {
                split_id: split.split_metadata.split_id.clone(),
                split_state: split.split_state,
                num_docs: split.split_metadata.num_docs,
                size_mega_bytes: split.split_metadata.uncompressed_docs_size_in_bytes / 1_000_000,
                created_at,
                updated_at,
                time_range,
            }
        })
        .sorted_by(|left, right| left.created_at.cmp(&right.created_at));
    make_table(title, rows, false)
}

fn parse_date(date_arg: &str, option_name: &str) -> anyhow::Result<OffsetDateTime> {
    let description = format_description::parse("[year]-[month]-[day]")?;
    if let Ok(date) = Date::parse(date_arg, &description) {
        return Ok(date.with_hms(0, 0, 0)?.assume_utc());
    }

    for datetime_format in [
        "[year]-[month]-[day] [hour]:[minute]",
        "[year]-[month]-[day] [hour]:[minute]:[second]",
        "[year]-[month]-[day]T[hour]:[minute]",
        "[year]-[month]-[day]T[hour]:[minute]:[second]",
    ] {
        let description = format_description::parse(datetime_format)?;
        if let Ok(datetime) = PrimitiveDateTime::parse(date_arg, &description) {
            return Ok(datetime.assume_utc());
        }
    }
    bail!(
        "failed to parse --{}-date option parameter `{}`. supported format is `YYYY-MM-DD[ \
         HH:DD[:SS]]`",
        option_name,
        date_arg
    );
}

fn parse_split_state(split_state_arg: &str) -> anyhow::Result<SplitState> {
    let split_state = match split_state_arg.to_lowercase().as_str() {
        "staged" => SplitState::Staged,
        "published" => SplitState::Published,
        "marked" => SplitState::MarkedForDeletion,
        _ => bail!(format!(
            "unknown split state `{split_state_arg}`. possible values are `staged`, `published`, \
             and `marked`"
        )),
    };
    Ok(split_state)
}

#[derive(Tabled)]
struct SplitRow {
    #[tabled(rename = "ID")]
    split_id: SplitId,
    #[tabled(rename = "State")]
    split_state: SplitState,
    #[tabled(rename = "Num docs")]
    num_docs: usize,
    #[tabled(rename = "Size (MB)")]
    size_mega_bytes: u64,
    #[tabled(rename = "Created at")]
    created_at: OffsetDateTime,
    #[tabled(rename = "Updated at")]
    updated_at: OffsetDateTime,
    #[tabled(rename = "Time range")]
    time_range: String,
}

#[cfg(test)]
mod tests {
    use reqwest::Url;
    use time::macros::datetime;

    use super::*;
    use crate::cli::{CliCommand, build_cli};

    #[test]
    fn test_parse_list_split_args() -> anyhow::Result<()> {
        let app = build_cli().no_binary_name(true);
        let matches = app.try_get_matches_from(vec![
            "split",
            "list",
            "--index",
            "hdfs",
            "--states",
            "staged,published",
            "--create-date",
            "2020-12-24",
            "--start-date",
            "2020-12-24",
            "--end-date",
            "2020-12-25T12:42",
            // "--tags",
            // "tenant:a,service:zk",
            "--format",
            "json",
        ])?;
        let command = CliCommand::parse_cli_args(matches)?;

        let expected_split_states = Some(vec![SplitState::Staged, SplitState::Published]);
        let expected_create_date = Some(datetime!(2020-12-24 00:00 UTC));
        let expected_start_date = Some(datetime!(2020-12-24 00:00 UTC));
        let expected_end_date = Some(datetime!(2020-12-25 12:42 UTC));
        // let expected_tags = Some(TagFilterAst::And(vec![
        //     TagFilterAst::Tag {
        //         get_flag: true,
        //         tag: "tenant:a".to_string(),
        //     },
        //     TagFilterAst::Tag {
        //         get_flag: true,
        //         tag: "service:zk".to_string(),
        //     },
        // ]));
        let expected_output_format = OutputFormat::Json;
        assert!(matches!(
            command,
            CliCommand::Split(SplitCliCommand::List(ListSplitArgs {
                index_id,
                split_states,
                create_date,
                start_date,
                end_date,
                // tags,
                output_format,
                ..
            })) if index_id == "hdfs"
                   && split_states == expected_split_states
                   && create_date == expected_create_date
                   && start_date == expected_start_date
                   && end_date == expected_end_date
                   // && tags == expected_tags
                   && output_format == expected_output_format
        ));
        Ok(())
    }

    #[test]
    fn test_parse_split_mark_for_deletion_args() -> anyhow::Result<()> {
        let app = build_cli().no_binary_name(true);
        let matches = app.try_get_matches_from(vec![
            "split",
            "mark",
            "--endpoint",
            "https://quickwit-cluster.io",
            "--index",
            "wikipedia",
            "--splits",
            "split1,split2",
            "--yes",
        ])?;
        let command = CliCommand::parse_cli_args(matches)?;
        assert!(matches!(
            command,
            CliCommand::Split(SplitCliCommand::MarkForDeletion(MarkForDeletionArgs {
                client_args,
                index_id,
                split_ids,
                assume_yes,
            })) if client_args.cluster_endpoint == Url::from_str("https://quickwit-cluster.io").unwrap()
                && index_id == "wikipedia"
                && split_ids == vec!["split1".to_string(), "split2".to_string()]
                && assume_yes
        ));
        Ok(())
    }

    #[test]
    fn test_parse_split_describe_args() -> anyhow::Result<()> {
        let app = build_cli().no_binary_name(true);
        let matches = app.try_get_matches_from(vec![
            "split",
            "describe",
            "--index",
            "wikipedia",
            "--split",
            "ABC",
        ])?;
        let command = CliCommand::parse_cli_args(matches)?;
        assert!(matches!(
            command,
            CliCommand::Split(SplitCliCommand::Describe(DescribeSplitArgs {
                index_id,
                split_id,
                verbose: false,
                ..
            })) if &index_id == "wikipedia" && &split_id == "ABC"
        ));
        Ok(())
    }

    #[test]
    fn test_parse_date() {
        assert_eq!(
            parse_date("2020-12-24", "create").unwrap(),
            datetime!(2020-12-24 00:00 UTC)
        );
        assert_eq!(
            parse_date("2020-12-24 10:20", "create").unwrap(),
            datetime!(2020-12-24 10:20 UTC)
        );
        assert_eq!(
            parse_date("2020-12-24T10:20", "create").unwrap(),
            datetime!(2020-12-24 10:20 UTC)
        );
        assert_eq!(
            parse_date("2020-12-24 10:20:30", "create").unwrap(),
            datetime!(2020-12-24 10:20:30 UTC)
        );
        assert_eq!(
            parse_date("2020-12-24T10:20:30", "create").unwrap(),
            datetime!(2020-12-24 10:20:30 UTC)
        );
    }

    #[test]
    fn test_parse_split_state() {
        assert_eq!(parse_split_state("Staged").unwrap(), SplitState::Staged);
        assert_eq!(
            parse_split_state("Published").unwrap(),
            SplitState::Published
        );
        assert_eq!(
            parse_split_state("Marked").unwrap(),
            SplitState::MarkedForDeletion
        );
    }
}


================================================
FILE: quickwit/quickwit-cli/src/stats.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

pub(crate) fn mean(values: &[u64]) -> f32 {
    assert!(!values.is_empty());
    let sum: u64 = values.iter().sum();
    sum as f32 / values.len() as f32
}

pub(crate) fn std_deviation(values: &[u64]) -> f32 {
    assert!(!values.is_empty());
    let mean = mean(values);
    let variance = values
        .iter()
        .map(|value| {
            let diff = mean - (*value as f32);
            diff * diff
        })
        .sum::<f32>()
        / values.len() as f32;
    variance.sqrt()
}

/// Return percentile of sorted values using linear interpolation.
pub(crate) fn percentile(sorted_values: &[u64], percent: usize) -> f32 {
    assert!(!sorted_values.is_empty());
    assert!(percent <= 100);
    if sorted_values.len() == 1 {
        return sorted_values[0] as f32;
    }
    if percent == 100 {
        return sorted_values[sorted_values.len() - 1] as f32;
    }
    let length = (sorted_values.len() - 1) as f32;
    let rank = (percent as f32 / 100f32) * length;
    let lrank = rank.floor();
    let d = rank - lrank;
    let n = lrank as usize;
    let lo = sorted_values[n] as f32;
    let hi = sorted_values[n + 1] as f32;
    lo + (hi - lo) * d
}


================================================
FILE: quickwit/quickwit-cli/src/tool.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::{HashSet, VecDeque};
use std::io::{IsTerminal, Stdout, Write, stdout};
use std::num::NonZeroUsize;
use std::path::PathBuf;
use std::str::FromStr;
use std::time::{Duration, Instant};
use std::{env, fmt, io};

use anyhow::{Context, bail};
use clap::{ArgMatches, Command, arg};
use colored::{ColoredString, Colorize};
use humantime::format_duration;
use quickwit_actors::{ActorExitStatus, ActorHandle, Mailbox, Universe};
use quickwit_cluster::{
    ChannelTransport, Cluster, ClusterMember, FailureDetectorConfig, make_client_grpc_config,
};
use quickwit_common::pubsub::EventBroker;
use quickwit_common::runtimes::RuntimesConfig;
use quickwit_common::uri::Uri;
use quickwit_config::service::QuickwitService;
use quickwit_config::{
    CLI_SOURCE_ID, IndexerConfig, NodeConfig, SourceConfig, SourceInputFormat, SourceParams,
    TransformConfig, VecSourceParams,
};
use quickwit_index_management::{IndexService, clear_cache_directory};
use quickwit_indexing::IndexingPipeline;
use quickwit_indexing::actors::{IndexingService, MergePipeline, MergeSchedulerService};
use quickwit_indexing::models::{
    DetachIndexingPipeline, DetachMergePipeline, IndexingStatistics, SpawnPipeline,
};
use quickwit_ingest::IngesterPool;
use quickwit_metastore::IndexMetadataResponseExt;
use quickwit_proto::indexing::CpuCapacity;
use quickwit_proto::ingest::ingester::IngesterStatus;
use quickwit_proto::metastore::{IndexMetadataRequest, MetastoreService, MetastoreServiceClient};
use quickwit_proto::search::{CountHits, SearchResponse};
use quickwit_proto::types::{IndexId, PipelineUid, SourceId, SplitId};
use quickwit_search::{SearchResponseRest, single_node_search};
use quickwit_serve::{
    BodyFormat, SearchRequestQueryString, SortBy, search_request_from_api_request,
};
use quickwit_storage::{BundleStorage, Storage};
use thousands::Separable;
use tracing::{debug, info};

use crate::checklist::{GREEN_COLOR, RED_COLOR};
use crate::{
    THROUGHPUT_WINDOW_SIZE, config_cli_arg, get_resolvers, load_node_config, run_index_checklist,
    start_actor_runtimes,
};

pub fn build_tool_command() -> Command {
    Command::new("tool")
        .about("Performs utility operations. Requires a node config.")
        .arg(config_cli_arg())
        .subcommand(
            Command::new("local-ingest")
                .display_order(10)
                .about("Indexes NDJSON documents locally.")
                .long_about("Local ingest indexes locally NDJSON documents from a file or from stdin and uploads splits on the configured storage.")
                .args(&[
                    arg!(--index <INDEX> "ID of the target index")
                        .display_order(1)
                        .required(true),
                    arg!(--"input-path" <INPUT_PATH> "Location of the input file.")
                        .required(false),
                    arg!(--"input-format" <INPUT_FORMAT> "Format of the input data.")
                        .default_value("json")
                        .required(false),
                    arg!(--overwrite "Overwrites pre-existing index.")
                        .required(false),
                    arg!(--"transform-script" <SCRIPT> "VRL program to transform docs before ingesting.")
                        .required(false),
                    arg!(--"keep-cache" "Does not clear local cache directory upon completion.")
                        .required(false),
                ])
            )
        .subcommand(
            Command::new("local-search")
                .display_order(10)
                .about("Searches an index locally.")
                .long_about("Searchers an index directly on the configured storage without using a server.")
                .args(&[
                    arg!(--index <INDEX> "ID of the target index")
                        .display_order(1)
                        .required(true),
                    arg!(--query <QUERY> "Query expressed in natural query language ((barack AND obama) OR \"president of united states\"). Learn more on https://quickwit.io/docs/reference/search-language.")
                        .display_order(2)
                        .required(true),
                    arg!(--aggregation <AGG> "JSON serialized aggregation request in tantivy/elasticsearch format.")
                        .required(false),
                    arg!(--"max-hits" <MAX_HITS> "Maximum number of hits returned.")
                        .default_value("20")
                        .required(false),
                    arg!(--"start-offset" <OFFSET> "Offset in the global result set of the first hit returned.")
                        .default_value("0")
                        .required(false),
                    arg!(--"search-fields" <FIELD_NAME> "List of fields that Quickwit will search into if the user query does not explicitly target a field in the query. It overrides the default search fields defined in the index config. Space-separated list, e.g. \"field1 field2\". ")
                        .num_args(1..)
                        .required(false),
                    arg!(--"snippet-fields" <FIELD_NAME> "List of fields that Quickwit will return snippet highlight on. Space-separated list, e.g. \"field1 field2\". ")
                        .num_args(1..)
                        .required(false),
                    arg!(--"start-timestamp" <TIMESTAMP> "Filters out documents before that timestamp (time-series indexes only).")
                        .required(false),
                    arg!(--"end-timestamp" <TIMESTAMP> "Filters out documents after that timestamp (time-series indexes only).")
                        .required(false),
                    arg!(--"sort-by-field" <SORT_BY_FIELD> "Sort by field.")
                        .required(false),
                ])
            )
        .subcommand(
            Command::new("extract-split")
                .about("Downloads and extracts a split to a directory.")
                .args(&[
                    arg!(--index <INDEX> "ID of the target index")
                        .display_order(1)
                        .required(true),
                    arg!(--split <SPLIT> "ID of the target split")
                        .display_order(2)
                        .required(true),
                    arg!(--"target-dir" <TARGET_DIR> "Directory to extract the split to."),
                ])
            )
        .subcommand(
            Command::new("gc")
                .display_order(10)
                .about("Garbage collects stale staged splits and splits marked for deletion.")
                .args(&[
                    arg!(--index <INDEX> "ID of the target index")
                        .display_order(1)
                        .required(true),
                    arg!(--"grace-period" <GRACE_PERIOD> "Threshold period after which stale staged splits are garbage collected.")
                        .default_value("1h")
                        .required(false),
                    arg!(--"dry-run" "Executes the command in dry run mode and only displays the list of splits candidates for garbage collection.")
                        .required(false),
                ])
            )
        .subcommand(
            Command::new("merge")
                .display_order(10)
                .about("Merges all the splits for a given Node ID, index ID, source ID.")
                .args(&[
                    arg!(--index <INDEX> "ID of the target index.")
                        .display_order(1)
                        .required(true),
                    arg!(--source <SOURCE_ID> "ID of the target source.")
                        .display_order(2)
                        .required(true),
                ])
            )
        .arg_required_else_help(true)
}

#[derive(Debug, Eq, PartialEq)]
pub struct LocalIngestDocsArgs {
    pub config_uri: Uri,
    pub index_id: IndexId,
    pub input_path_opt: Option<Uri>,
    pub input_format: SourceInputFormat,
    pub overwrite: bool,
    pub vrl_script: Option<String>,
    pub clear_cache: bool,
}

#[derive(Debug, Eq, PartialEq)]
pub struct LocalSearchArgs {
    pub config_uri: Uri,
    pub index_id: IndexId,
    pub query: String,
    pub aggregation: Option<String>,
    pub max_hits: usize,
    pub start_offset: usize,
    pub search_fields: Option<Vec<String>>,
    pub snippet_fields: Option<Vec<String>>,
    pub start_timestamp: Option<i64>,
    pub end_timestamp: Option<i64>,
    pub sort_by_field: Option<String>,
}

#[derive(Debug, Eq, PartialEq)]
pub struct GarbageCollectIndexArgs {
    pub config_uri: Uri,
    pub index_id: IndexId,
    pub grace_period: Duration,
    pub dry_run: bool,
}

#[derive(Debug, Eq, PartialEq)]
pub struct MergeArgs {
    pub config_uri: Uri,
    pub index_id: IndexId,
    pub source_id: SourceId,
}

#[derive(Debug, Eq, PartialEq)]
pub struct ExtractSplitArgs {
    pub config_uri: Uri,
    pub index_id: IndexId,
    pub split_id: SplitId,
    pub target_dir: PathBuf,
}

#[derive(Debug, Eq, PartialEq)]
pub enum ToolCliCommand {
    GarbageCollect(GarbageCollectIndexArgs),
    LocalIngest(LocalIngestDocsArgs),
    LocalSearch(LocalSearchArgs),
    Merge(MergeArgs),
    ExtractSplit(ExtractSplitArgs),
}

impl ToolCliCommand {
    pub fn parse_cli_args(mut matches: ArgMatches) -> anyhow::Result<Self> {
        let (subcommand, submatches) = matches
            .remove_subcommand()
            .context("failed to parse tool subcommand")?;
        match subcommand.as_str() {
            "gc" => Self::parse_garbage_collect_args(submatches),
            "local-ingest" => Self::parse_local_ingest_args(submatches),
            "local-search" => Self::parse_local_search_args(submatches),
            "merge" => Self::parse_merge_args(submatches),
            "extract-split" => Self::parse_extract_split_args(submatches),
            _ => bail!("unknown tool subcommand `{subcommand}`"),
        }
    }

    fn parse_local_ingest_args(mut matches: ArgMatches) -> anyhow::Result<Self> {
        let config_uri = matches
            .remove_one::<String>("config")
            .map(|uri_str| Uri::from_str(&uri_str))
            .expect("`config` should be a required arg.")?;
        let index_id = matches
            .remove_one::<String>("index")
            .expect("`index` should be a required arg.");
        let input_path_opt = if let Some(input_path) = matches.remove_one::<String>("input-path") {
            Some(Uri::from_str(&input_path)?)
        } else {
            None
        };

        let input_format = matches
            .remove_one::<String>("input-format")
            .map(|input_format| SourceInputFormat::from_str(&input_format))
            .expect("`input-format` should have a default value.")
            .map_err(|err| anyhow::anyhow!(err))?;
        let overwrite = matches.get_flag("overwrite");
        let vrl_script = matches.remove_one::<String>("transform-script");
        let clear_cache = !matches.get_flag("keep-cache");

        Ok(Self::LocalIngest(LocalIngestDocsArgs {
            config_uri,
            index_id,
            input_path_opt,
            input_format,
            overwrite,
            vrl_script,
            clear_cache,
        }))
    }

    fn parse_local_search_args(mut matches: ArgMatches) -> anyhow::Result<Self> {
        let config_uri = matches
            .remove_one::<String>("config")
            .map(|uri_str| Uri::from_str(&uri_str))
            .expect("`config` should be a required arg.")?;
        let index_id = matches
            .remove_one::<String>("index")
            .expect("`index` should be a required arg.");
        let query = matches
            .remove_one::<String>("query")
            .context("`query` should be a required arg")?;
        let aggregation = matches.remove_one::<String>("aggregation");
        let max_hits = matches
            .remove_one::<String>("max-hits")
            .expect("`max-hits` should have a default value.")
            .parse()?;
        let start_offset = matches
            .remove_one::<String>("start-offset")
            .expect("`start-offset` should have a default value.")
            .parse()?;
        let search_fields = matches
            .remove_many::<String>("search-fields")
            .map(|values| values.collect());
        let snippet_fields = matches
            .remove_many::<String>("snippet-fields")
            .map(|values| values.collect());
        let sort_by_field = matches.remove_one::<String>("sort-by-field");
        let start_timestamp = matches
            .remove_one::<String>("start-timestamp")
            .map(|ts| ts.parse())
            .transpose()?;
        let end_timestamp = matches
            .remove_one::<String>("end-timestamp")
            .map(|ts| ts.parse())
            .transpose()?;
        Ok(Self::LocalSearch(LocalSearchArgs {
            config_uri,
            index_id,
            query,
            aggregation,
            max_hits,
            start_offset,
            search_fields,
            snippet_fields,
            start_timestamp,
            end_timestamp,
            sort_by_field,
        }))
    }

    fn parse_merge_args(mut matches: ArgMatches) -> anyhow::Result<Self> {
        let config_uri = matches
            .remove_one::<String>("config")
            .map(|uri_str| Uri::from_str(&uri_str))
            .expect("`config` should be a required arg.")?;
        let index_id = matches
            .remove_one::<String>("index")
            .expect("'index-id' should be a required arg.");
        let source_id = matches
            .remove_one::<String>("source")
            .expect("'source-id' should be a required arg.");
        Ok(Self::Merge(MergeArgs {
            index_id,
            source_id,
            config_uri,
        }))
    }

    fn parse_garbage_collect_args(mut matches: ArgMatches) -> anyhow::Result<Self> {
        let config_uri = matches
            .get_one("config")
            .map(|uri_str: &String| Uri::from_str(uri_str))
            .expect("`config` should be a required arg.")?;
        let index_id = matches
            .remove_one::<String>("index")
            .expect("`index` should be a required arg.");
        let grace_period = matches
            .get_one("grace-period")
            .map(|duration_str: &String| humantime::parse_duration(duration_str))
            .expect("`grace-period` should have a default value.")?;
        let dry_run = matches.get_flag("dry-run");
        Ok(Self::GarbageCollect(GarbageCollectIndexArgs {
            index_id,
            grace_period,
            dry_run,
            config_uri,
        }))
    }

    fn parse_extract_split_args(mut matches: ArgMatches) -> anyhow::Result<Self> {
        let index_id = matches
            .remove_one::<String>("index")
            .expect("`index` should be a required arg.");
        let split_id = matches
            .remove_one::<String>("split")
            .expect("`split` should be a required arg.");
        let config_uri = matches
            .remove_one::<String>("config")
            .map(|uri_str| Uri::from_str(&uri_str))
            .expect("`config` should be a required arg.")?;
        let target_dir = matches
            .remove_one::<String>("target-dir")
            .map(PathBuf::from)
            .expect("`target-dir` should be a required arg.");
        Ok(Self::ExtractSplit(ExtractSplitArgs {
            config_uri,
            index_id,
            split_id,
            target_dir,
        }))
    }

    pub async fn execute(self) -> anyhow::Result<()> {
        match self {
            Self::GarbageCollect(args) => garbage_collect_index_cli(args).await,
            Self::LocalIngest(args) => local_ingest_docs_cli(args).await,
            Self::LocalSearch(args) => local_search_cli(args).await,
            Self::Merge(args) => merge_cli(args).await,
            Self::ExtractSplit(args) => extract_split_cli(args).await,
        }
    }
}

pub async fn local_ingest_docs_cli(args: LocalIngestDocsArgs) -> anyhow::Result<()> {
    debug!(args=?args, "local-ingest-docs");
    println!("❯ Ingesting documents locally...");

    let config = load_node_config(&args.config_uri).await?;
    let (storage_resolver, metastore_resolver) =
        get_resolvers(&config.storage_configs, &config.metastore_configs);
    let mut metastore = metastore_resolver.resolve(&config.metastore_uri).await?;

    let source_params = if let Some(uri) = args.input_path_opt.as_ref() {
        SourceParams::file_from_uri(uri.clone())
    } else {
        SourceParams::stdin()
    };
    let transform_config = args
        .vrl_script
        .map(|vrl_script| TransformConfig::new(vrl_script, None));
    let source_config = SourceConfig {
        source_id: CLI_SOURCE_ID.to_string(),
        num_pipelines: NonZeroUsize::MIN,
        enabled: true,
        source_params,
        transform_config,
        input_format: args.input_format,
    };
    run_index_checklist(
        &mut metastore,
        &storage_resolver,
        &args.index_id,
        Some(&source_config),
    )
    .await?;

    if args.overwrite {
        let mut index_service = IndexService::new(metastore.clone(), storage_resolver.clone());
        index_service.clear_index(&args.index_id).await?;
    }
    // The indexing service needs to update its cluster chitchat state so that the control plane is
    // aware of the running tasks. We thus create a fake cluster to instantiate the indexing service
    // and avoid impacting potential control plane running on the cluster.
    let cluster = create_empty_cluster(&config).await?;
    let indexer_config = IndexerConfig {
        ..Default::default()
    };
    let runtimes_config = RuntimesConfig::default();
    start_actor_runtimes(
        runtimes_config,
        &HashSet::from_iter([QuickwitService::Indexer]),
    )?;
    let universe = Universe::new();
    let merge_scheduler_service_mailbox = universe.get_or_spawn_one();
    let indexing_server = IndexingService::new(
        config.node_id.clone(),
        config.data_dir_path.clone(),
        indexer_config,
        runtimes_config.num_threads_blocking,
        cluster,
        metastore,
        None,
        merge_scheduler_service_mailbox,
        IngesterPool::default(),
        storage_resolver,
        EventBroker::default(),
    )
    .await?;
    let (indexing_server_mailbox, indexing_server_handle) =
        universe.spawn_builder().spawn(indexing_server);
    let pipeline_id = indexing_server_mailbox
        .ask_for_res(SpawnPipeline {
            index_id: args.index_id.clone(),
            source_config,
            pipeline_uid: PipelineUid::random(),
        })
        .await?;
    let merge_pipeline_handle = indexing_server_mailbox
        .ask_for_res(DetachMergePipeline {
            pipeline_id: pipeline_id.merge_pipeline_id(),
        })
        .await?;
    let indexing_pipeline_handle = indexing_server_mailbox
        .ask_for_res(DetachIndexingPipeline { pipeline_id })
        .await?;

    if args.input_path_opt.is_none() && io::stdin().is_terminal() {
        let eof_shortcut = match env::consts::OS {
            "windows" => "CTRL+Z",
            _ => "CTRL+D",
        };
        println!(
            "Please, enter JSON documents one line at a time.\nEnd your input using \
             {eof_shortcut}."
        );
    }
    let statistics =
        start_statistics_reporting_loop(indexing_pipeline_handle, args.input_path_opt.is_none())
            .await?;
    merge_pipeline_handle
        .mailbox()
        .ask(quickwit_indexing::FinishPendingMergesAndShutdownPipeline)
        .await?;
    merge_pipeline_handle.join().await;
    // Shutdown the indexing server.
    universe
        .send_exit_with_success(&indexing_server_mailbox)
        .await?;
    indexing_server_handle.join().await;
    universe.quit().await;
    if statistics.num_published_splits > 0 {
        println!(
            "Now, you can query the index with the following command:\nquickwit index search \
             --index {} --config ./config/quickwit.yaml --query \"my query\"",
            args.index_id
        );
    }

    if args.clear_cache {
        println!("Clearing local cache directory...");
        clear_cache_directory(&config.data_dir_path).await?;
        println!("{} Local cache directory cleared.", "✔".color(GREEN_COLOR));
    }

    match statistics.num_invalid_docs {
        0 => {
            println!("{} Documents successfully indexed.", "✔".color(GREEN_COLOR));
            Ok(())
        }
        _ => bail!("failed to ingest all the documents"),
    }
}

pub async fn local_search_cli(args: LocalSearchArgs) -> anyhow::Result<()> {
    debug!(args=?args, "local-search");
    println!("❯ Searching directly on the index storage (without calling REST API)...");
    let config = load_node_config(&args.config_uri).await?;
    let (storage_resolver, metastore_resolver) =
        get_resolvers(&config.storage_configs, &config.metastore_configs);
    let metastore: MetastoreServiceClient =
        metastore_resolver.resolve(&config.metastore_uri).await?;
    let aggs = args
        .aggregation
        .map(|agg_string| serde_json::from_str(&agg_string))
        .transpose()?;
    let sort_by: SortBy = args.sort_by_field.map(SortBy::from).unwrap_or_default();
    let search_request_query_string = SearchRequestQueryString {
        query: args.query,
        start_offset: args.start_offset as u64,
        max_hits: args.max_hits as u64,
        search_fields: args.search_fields,
        snippet_fields: args.snippet_fields,
        start_timestamp: args.start_timestamp,
        end_timestamp: args.end_timestamp,
        aggs,
        format: BodyFormat::Json,
        sort_by,
        count_all: CountHits::CountAll,
        allow_failed_splits: false,
    };
    let search_request =
        search_request_from_api_request(vec![args.index_id], search_request_query_string)?;
    debug!(search_request=?search_request, "search-request");
    let search_response: SearchResponse =
        single_node_search(search_request, metastore, storage_resolver).await?;
    let search_response_rest = SearchResponseRest::try_from(search_response)?;
    let search_response_json = serde_json::to_string_pretty(&search_response_rest)?;
    println!("{search_response_json}");
    Ok(())
}

pub async fn merge_cli(args: MergeArgs) -> anyhow::Result<()> {
    debug!(args=?args, "run-merge-operations");
    println!("❯ Merging splits locally...");
    let config = load_node_config(&args.config_uri).await?;
    let (storage_resolver, metastore_resolver) =
        get_resolvers(&config.storage_configs, &config.metastore_configs);
    let mut metastore = metastore_resolver.resolve(&config.metastore_uri).await?;
    run_index_checklist(&mut metastore, &storage_resolver, &args.index_id, None).await?;
    // The indexing service needs to update its cluster chitchat state so that the control plane is
    // aware of the running tasks. We thus create a fake cluster to instantiate the indexing service
    // and avoid impacting potential control plane running on the cluster.
    let cluster = create_empty_cluster(&config).await?;
    let runtimes_config = RuntimesConfig::default();
    start_actor_runtimes(
        runtimes_config,
        &HashSet::from_iter([QuickwitService::Indexer]),
    )?;
    let indexer_config = IndexerConfig::default();
    let universe = Universe::new();
    let merge_scheduler_service: Mailbox<MergeSchedulerService> = universe.get_or_spawn_one();
    let indexing_server = IndexingService::new(
        config.node_id,
        config.data_dir_path,
        indexer_config,
        runtimes_config.num_threads_blocking,
        cluster,
        metastore,
        None,
        merge_scheduler_service,
        IngesterPool::default(),
        storage_resolver,
        EventBroker::default(),
    )
    .await?;
    let (indexing_service_mailbox, indexing_service_handle) =
        universe.spawn_builder().spawn(indexing_server);
    let pipeline_id = indexing_service_mailbox
        .ask_for_res(SpawnPipeline {
            index_id: args.index_id,
            source_config: SourceConfig {
                source_id: args.source_id,
                num_pipelines: NonZeroUsize::MIN,
                enabled: true,
                source_params: SourceParams::Vec(VecSourceParams::default()),
                transform_config: None,
                input_format: SourceInputFormat::Json,
            },
            pipeline_uid: PipelineUid::random(),
        })
        .await?;
    let pipeline_handle: ActorHandle<MergePipeline> = indexing_service_mailbox
        .ask_for_res(DetachMergePipeline {
            pipeline_id: pipeline_id.merge_pipeline_id(),
        })
        .await?;

    let mut check_interval = tokio::time::interval(Duration::from_secs(1));
    loop {
        check_interval.tick().await;

        pipeline_handle.refresh_observe();
        let observation = pipeline_handle.last_observation();

        if observation.num_ongoing_merges == 0 {
            info!("merge pipeline has no more ongoing merges, exiting");
            break;
        }

        if pipeline_handle.state().is_exit() {
            info!("merge pipeline has exited, exiting");
            break;
        }
    }

    let (pipeline_exit_status, _pipeline_statistics) = pipeline_handle.quit().await;
    indexing_service_handle.quit().await;
    if !matches!(
        pipeline_exit_status,
        ActorExitStatus::Success | ActorExitStatus::Quit
    ) {
        bail!(pipeline_exit_status);
    }
    println!("{} Merge successful.", "✔".color(GREEN_COLOR));
    Ok(())
}

pub async fn garbage_collect_index_cli(args: GarbageCollectIndexArgs) -> anyhow::Result<()> {
    debug!(args=?args, "garbage-collect-index");
    println!("❯ Garbage collecting index...");

    let config = load_node_config(&args.config_uri).await?;
    let (storage_resolver, metastore_resolver) =
        get_resolvers(&config.storage_configs, &config.metastore_configs);
    let metastore = metastore_resolver.resolve(&config.metastore_uri).await?;
    let mut index_service = IndexService::new(metastore, storage_resolver);
    let removal_info = index_service
        .garbage_collect_index(&args.index_id, args.grace_period, args.dry_run)
        .await?;
    if removal_info.removed_split_entries.is_empty() && removal_info.failed_splits.is_empty() {
        println!("No dangling files to garbage collect.");
        return Ok(());
    }

    if args.dry_run {
        println!("The following files will be garbage collected.");
        for split_info in removal_info.removed_split_entries {
            println!(" - {}", split_info.file_name.display());
        }
        return Ok(());
    }

    if !removal_info.failed_splits.is_empty() {
        println!("The following splits were attempted to be removed, but failed.");
        for split_info in &removal_info.failed_splits {
            println!(" - {}", split_info.split_id);
        }
        println!(
            "{} Splits were unable to be removed.",
            removal_info.failed_splits.len()
        );
    }

    let deleted_bytes: u64 = removal_info
        .removed_split_entries
        .iter()
        .map(|split_info| split_info.file_size_bytes.as_u64())
        .sum();
    println!(
        "{}MB of storage garbage collected.",
        deleted_bytes / 1_000_000
    );

    if removal_info.failed_splits.is_empty() {
        println!(
            "{} Index successfully garbage collected.",
            "✔".color(GREEN_COLOR)
        );
    } else if removal_info.removed_split_entries.is_empty()
        && !removal_info.failed_splits.is_empty()
    {
        println!("{} Failed to garbage collect index.", "✘".color(RED_COLOR));
    } else {
        println!(
            "{} Index partially garbage collected.",
            "✘".color(RED_COLOR)
        );
    }

    Ok(())
}

async fn extract_split_cli(args: ExtractSplitArgs) -> anyhow::Result<()> {
    debug!(args=?args, "extract-split");
    println!("❯ Extracting split...");

    let config = load_node_config(&args.config_uri).await?;
    let (storage_resolver, metastore_resolver) =
        get_resolvers(&config.storage_configs, &config.metastore_configs);
    let metastore = metastore_resolver.resolve(&config.metastore_uri).await?;
    let index_metadata = metastore
        .index_metadata(IndexMetadataRequest::for_index_id(args.index_id))
        .await?
        .deserialize_index_metadata()?;
    let index_storage = storage_resolver.resolve(index_metadata.index_uri()).await?;
    let split_file = PathBuf::from(format!("{}.split", args.split_id));
    let split_data = index_storage.get_all(split_file.as_path()).await?;
    let (_hotcache_bytes, bundle_storage) = BundleStorage::open_from_split_data_with_owned_bytes(
        index_storage,
        split_file,
        split_data,
    )?;
    std::fs::create_dir_all(&args.target_dir)?;
    for path in bundle_storage.iter_files() {
        let mut out_path = args.target_dir.to_owned();
        out_path.push(path);
        println!("Copying {out_path:?}");
        bundle_storage.copy_to_file(path, &out_path).await?;
    }

    println!("{} Split successfully extracted.", "✔".color(GREEN_COLOR));
    Ok(())
}

/// Starts a tokio task that displays the indexing statistics
/// every once in awhile.
pub async fn start_statistics_reporting_loop(
    pipeline_handle: ActorHandle<IndexingPipeline>,
    is_stdin: bool,
) -> anyhow::Result<IndexingStatistics> {
    let mut stdout_handle = stdout();
    let start_time = Instant::now();
    let mut throughput_calculator = ThroughputCalculator::new(start_time);
    let mut report_interval = tokio::time::interval(Duration::from_secs(1));

    loop {
        // TODO fixme. The way we wait today is a bit lame: if the indexing pipeline exits, we will
        // still wait up to an entire heartbeat...  Ideally we should  select between two
        // futures.
        report_interval.tick().await;
        // Try to receive with a timeout of 1 second.
        // 1 second is also the frequency at which we update statistic in the console
        pipeline_handle.refresh_observe();

        let observation = pipeline_handle.last_observation();

        // Let's not display live statistics to allow screen to scroll.
        if observation.num_docs > 0 {
            display_statistics(&mut stdout_handle, &mut throughput_calculator, &observation)?;
        }

        if pipeline_handle.state().is_exit() {
            break;
        }
    }
    let (pipeline_exit_status, pipeline_statistics) = pipeline_handle.join().await;
    if !pipeline_exit_status.is_success() {
        bail!(pipeline_exit_status);
    }
    // If we have received zero docs at this point,
    // there is no point in displaying report.
    if pipeline_statistics.num_docs == 0 {
        return Ok(pipeline_statistics);
    }

    if is_stdin {
        display_statistics(
            &mut stdout_handle,
            &mut throughput_calculator,
            &pipeline_statistics,
        )?;
    }
    // display end of task report
    println!();
    let secs = Duration::from_secs(start_time.elapsed().as_secs());
    if pipeline_statistics.num_invalid_docs == 0 {
        println!(
            "Indexed {} documents in {}.",
            pipeline_statistics.num_docs.separate_with_commas(),
            format_duration(secs)
        );
    } else {
        let num_indexed_docs = (pipeline_statistics.num_docs
            - pipeline_statistics.num_invalid_docs)
            .separate_with_commas();

        let error_rate = (pipeline_statistics.num_invalid_docs as f64
            / pipeline_statistics.num_docs as f64)
            * 100.0;

        println!(
            "Indexed {} out of {} documents in {}. Failed to index {} document(s). {}\n",
            num_indexed_docs,
            pipeline_statistics.num_docs.separate_with_commas(),
            format_duration(secs),
            pipeline_statistics.num_invalid_docs.separate_with_commas(),
            colorize_error_rate(error_rate),
        );
    }

    Ok(pipeline_statistics)
}

fn colorize_error_rate(error_rate: f64) -> ColoredString {
    let error_rate_message = format!("({error_rate:.1}% error rate)");
    if error_rate < 1.0 {
        error_rate_message.yellow()
    } else if error_rate < 5.0 {
        error_rate_message.truecolor(255, 181, 46) //< Orange
    } else {
        error_rate_message.red()
    }
}

/// A struct to print data on the standard output.
struct Printer<'a> {
    pub stdout: &'a mut Stdout,
}

impl Printer<'_> {
    pub fn print_header(&mut self, header: &str) -> io::Result<()> {
        write!(&mut self.stdout, " {}", header.bright_blue())?;
        Ok(())
    }

    pub fn print_value(&mut self, fmt_args: fmt::Arguments) -> io::Result<()> {
        write!(&mut self.stdout, " {fmt_args}")
    }

    pub fn flush(&mut self) -> io::Result<()> {
        self.stdout.flush()
    }
}

fn display_statistics(
    stdout: &mut Stdout,
    throughput_calculator: &mut ThroughputCalculator,
    statistics: &IndexingStatistics,
) -> anyhow::Result<()> {
    let elapsed_duration = time::Duration::try_from(throughput_calculator.elapsed_time())?;
    let elapsed_time = format!(
        "{:02}:{:02}:{:02}",
        elapsed_duration.whole_hours(),
        elapsed_duration.whole_minutes() % 60,
        elapsed_duration.whole_seconds() % 60
    );
    let throughput_mb_s = throughput_calculator.calculate(statistics.total_bytes_processed);
    let mut printer = Printer { stdout };
    printer.print_header("Num docs")?;
    printer.print_value(format_args!("{:>7}", statistics.num_docs))?;
    printer.print_header("Parse errs")?;
    printer.print_value(format_args!("{:>5}", statistics.num_invalid_docs))?;
    printer.print_header("PublSplits")?;
    printer.print_value(format_args!("{:>3}", statistics.num_published_splits))?;
    printer.print_header("Input size")?;
    printer.print_value(format_args!(
        "{:>5}MB",
        statistics.total_bytes_processed / 1_000_000
    ))?;
    printer.print_header("Thrghput")?;
    printer.print_value(format_args!("{throughput_mb_s:>5.2}MB/s"))?;
    printer.print_header("Time")?;
    printer.print_value(format_args!("{elapsed_time}\n"))?;
    printer.flush()?;
    Ok(())
}

/// ThroughputCalculator is used to calculate throughput.
struct ThroughputCalculator {
    /// Stores the time series of processed bytes value.
    processed_bytes_values: VecDeque<(Instant, u64)>,
    /// Store the time this calculator started
    start_time: Instant,
}

impl ThroughputCalculator {
    /// Creates new instance.
    pub fn new(start_time: Instant) -> Self {
        let processed_bytes_values: VecDeque<(Instant, u64)> = (0..THROUGHPUT_WINDOW_SIZE)
            .map(|_| (start_time, 0u64))
            .collect();
        Self {
            processed_bytes_values,
            start_time,
        }
    }

    /// Calculates the throughput.
    pub fn calculate(&mut self, current_processed_bytes: u64) -> f64 {
        self.processed_bytes_values.pop_front();
        let current_instant = Instant::now();
        let (first_instant, first_processed_bytes) = *self.processed_bytes_values.front().unwrap();
        let elapsed_time = (current_instant - first_instant).as_millis() as f64 / 1_000f64;
        self.processed_bytes_values
            .push_back((current_instant, current_processed_bytes));
        (current_processed_bytes - first_processed_bytes) as f64
            / 1_000_000f64
            / elapsed_time.max(1f64)
    }

    pub fn elapsed_time(&self) -> Duration {
        self.start_time.elapsed()
    }
}

async fn create_empty_cluster(config: &NodeConfig) -> anyhow::Result<Cluster> {
    let self_node = ClusterMember {
        node_id: config.node_id.clone(),
        generation_id: quickwit_cluster::GenerationId::now(),
        is_ready: false,
        enabled_services: HashSet::new(),
        gossip_advertise_addr: config.gossip_advertise_addr,
        grpc_advertise_addr: config.grpc_advertise_addr,
        indexing_tasks: Vec::new(),
        indexing_cpu_capacity: CpuCapacity::zero(),
        ingester_status: IngesterStatus::default(),
        availability_zone: None,
    };
    let client_grpc_config = make_client_grpc_config(&config.grpc_config)?;
    let cluster = Cluster::join(
        config.cluster_id.clone(),
        self_node,
        config.gossip_advertise_addr,
        Vec::new(),
        config.gossip_interval,
        FailureDetectorConfig::default(),
        &ChannelTransport::default(),
        client_grpc_config,
    )
    .await?;

    Ok(cluster)
}


================================================
FILE: quickwit/quickwit-cli/tests/Pipfile
================================================
[[source]]
url = "https://pypi.org/simple"
verify_ssl = true
name = "pypi"

[packages]
awscli-local = "*"

[dev-packages]

[requires]
python_version = "3.11"


================================================
FILE: quickwit/quickwit-cli/tests/cli.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#![recursion_limit = "256"]
#![allow(clippy::bool_assert_comparison)]

mod helpers;

use std::path::Path;

use anyhow::Result;
use clap::error::ErrorKind;
use helpers::{TestEnv, TestStorageType, uri_from_path};
use quickwit_cli::checklist::ChecklistError;
use quickwit_cli::cli::build_cli;
use quickwit_cli::index::{
    CreateIndexArgs, DeleteIndexArgs, SearchIndexArgs, UpdateIndexArgs, create_index_cli,
    delete_index_cli, search_index, update_index_cli,
};
use quickwit_cli::tool::{
    GarbageCollectIndexArgs, LocalIngestDocsArgs, garbage_collect_index_cli, local_ingest_docs_cli,
};
use quickwit_common::fs::get_cache_directory_path;
use quickwit_common::rand::append_random_suffix;
use quickwit_common::uri::Uri;
use quickwit_config::{CLI_SOURCE_ID, RetentionPolicy, SourceInputFormat};
use quickwit_metastore::{
    ListSplitsRequestExt, MetastoreResolver, MetastoreServiceExt, MetastoreServiceStreamSplitsExt,
    SplitMetadata, SplitState, StageSplitsRequestExt,
};
use quickwit_proto::metastore::{
    DeleteSplitsRequest, EntityKind, IndexMetadataRequest, ListSplitsRequest,
    MarkSplitsForDeletionRequest, MetastoreError, MetastoreService, StageSplitsRequest,
};
use serde_json::{Number, Value, json};
use tokio::time::{Duration, sleep};

use crate::helpers::{PACKAGE_BIN_NAME, create_test_env, upload_test_file};

async fn create_logs_index(test_env: &TestEnv) -> anyhow::Result<()> {
    let args = CreateIndexArgs {
        client_args: test_env.default_client_args(),
        index_config_uri: test_env.resource_files.index_config.clone(),
        overwrite: false,
        assume_yes: true,
    };
    create_index_cli(args).await
}

async fn local_ingest_docs(uri: Uri, test_env: &TestEnv) -> anyhow::Result<()> {
    let args = LocalIngestDocsArgs {
        config_uri: test_env.resource_files.config.clone(),
        index_id: test_env.index_id.clone(),
        input_path_opt: Some(uri),
        input_format: SourceInputFormat::Json,
        overwrite: false,
        clear_cache: true,
        vrl_script: None,
    };
    local_ingest_docs_cli(args).await
}

async fn local_ingest_log_docs(test_env: &TestEnv) -> anyhow::Result<()> {
    local_ingest_docs(test_env.resource_files.log_docs.clone(), test_env).await
}

#[test]
fn test_cmd_help() {
    let cmd = build_cli();
    let error = cmd
        .try_get_matches_from(vec![PACKAGE_BIN_NAME, "--help"])
        .unwrap_err();
    // on `--help` clap returns an error.
    assert_eq!(error.kind(), ErrorKind::DisplayHelp);
}

#[tokio::test]
async fn test_cmd_create() {
    quickwit_common::setup_logging_for_tests();
    let index_id = append_random_suffix("test-create-cmd");
    let test_env = create_test_env(index_id, TestStorageType::LocalFileSystem)
        .await
        .unwrap();
    test_env.start_server().await.unwrap();
    create_logs_index(&test_env).await.unwrap();

    let index_metadata = test_env.index_metadata().await.unwrap();
    assert_eq!(index_metadata.index_id(), test_env.index_id);

    // Creating an existing index should fail.
    let error = create_logs_index(&test_env).await.unwrap_err();
    assert!(error.to_string().contains("already exist(s)"),);
}

#[tokio::test]
async fn test_cmd_create_no_index_uri() {
    quickwit_common::setup_logging_for_tests();
    let index_id = append_random_suffix("test-create-cmd-no-index-uri");
    let test_env = create_test_env(index_id, TestStorageType::LocalFileSystem)
        .await
        .unwrap();
    test_env.start_server().await.unwrap();

    let index_config_without_uri = test_env.resource_files.index_config_without_uri.clone();
    let args = CreateIndexArgs {
        client_args: test_env.default_client_args(),
        index_config_uri: index_config_without_uri,
        overwrite: false,
        assume_yes: true,
    };

    let response = create_index_cli(args).await;
    response.unwrap();

    let index_metadata = test_env.index_metadata().await.unwrap();
    assert_eq!(index_metadata.index_id(), test_env.index_id);
    assert_eq!(index_metadata.index_uri(), &test_env.index_uri);
}

#[tokio::test]
async fn test_cmd_create_overwrite() {
    // Create non existing index with --overwrite.
    let index_id = append_random_suffix("test-create-non-existing-index-with-overwrite");
    let test_env = create_test_env(index_id, TestStorageType::LocalFileSystem)
        .await
        .unwrap();
    test_env.start_server().await.unwrap();

    let index_config_without_uri = test_env.resource_files.index_config_without_uri.clone();
    let args = CreateIndexArgs {
        client_args: test_env.default_client_args(),
        index_config_uri: index_config_without_uri,
        overwrite: true,
        assume_yes: true,
    };

    create_index_cli(args).await.unwrap();

    let index_metadata = test_env.index_metadata().await.unwrap();
    assert_eq!(index_metadata.index_id(), &test_env.index_id);
    assert_eq!(index_metadata.index_uri(), &test_env.index_uri);
}

#[test]
fn test_cmd_create_with_ill_formed_command() {
    // Attempt to create with ill-formed new command.
    let app = build_cli();
    let error = app
        .try_get_matches_from(vec![PACKAGE_BIN_NAME, "index", "create"])
        .unwrap_err();
    assert_eq!(error.kind(), ErrorKind::MissingRequiredArgument);
}

#[tokio::test]
async fn test_cmd_ingest_on_non_existing_index() {
    let index_id = append_random_suffix("index-does-not-exist");
    let test_env = create_test_env(index_id, TestStorageType::LocalFileSystem)
        .await
        .unwrap();

    let args = LocalIngestDocsArgs {
        config_uri: test_env.resource_files.config,
        index_id: "index-does-not-exist".to_string(),
        input_path_opt: Some(test_env.resource_files.log_docs.clone()),
        input_format: SourceInputFormat::Json,
        overwrite: false,
        clear_cache: true,
        vrl_script: None,
    };

    let error = local_ingest_docs_cli(args).await.unwrap_err();

    assert_eq!(
        error.root_cause().downcast_ref::<MetastoreError>().unwrap(),
        &MetastoreError::NotFound(EntityKind::Index {
            index_id: "index-does-not-exist".to_string()
        })
    );
}

#[tokio::test]
async fn test_ingest_docs_cli_keep_cache() {
    quickwit_common::setup_logging_for_tests();
    let index_id = append_random_suffix("test-index-keep-cache");
    let test_env = create_test_env(index_id.clone(), TestStorageType::LocalFileSystem)
        .await
        .unwrap();
    test_env.start_server().await.unwrap();
    create_logs_index(&test_env).await.unwrap();

    let args = LocalIngestDocsArgs {
        config_uri: test_env.resource_files.config,
        index_id,
        input_path_opt: Some(test_env.resource_files.log_docs.clone()),
        input_format: SourceInputFormat::Json,
        overwrite: false,
        clear_cache: false,
        vrl_script: None,
    };

    local_ingest_docs_cli(args).await.unwrap();
    // Ensure cache directory is not empty.
    let cache_directory_path = get_cache_directory_path(&test_env.data_dir_path);
    assert!(cache_directory_path.read_dir().unwrap().next().is_some());
}

#[tokio::test]
async fn test_ingest_docs_cli() {
    quickwit_common::setup_logging_for_tests();
    let index_id = append_random_suffix("test-index-simple");
    let test_env = create_test_env(index_id.clone(), TestStorageType::LocalFileSystem)
        .await
        .unwrap();
    test_env.start_server().await.unwrap();
    create_logs_index(&test_env).await.unwrap();
    let index_uid = test_env.index_metadata().await.unwrap().index_uid;

    let args = LocalIngestDocsArgs {
        config_uri: test_env.resource_files.config.clone(),
        index_id: index_id.clone(),
        input_path_opt: Some(test_env.resource_files.log_docs.clone()),
        input_format: SourceInputFormat::Json,
        overwrite: false,
        clear_cache: true,
        vrl_script: None,
    };

    local_ingest_docs_cli(args).await.unwrap();

    let splits_metadata: Vec<SplitMetadata> = test_env
        .metastore()
        .await
        .list_splits(ListSplitsRequest::try_from_index_uid(index_uid).unwrap())
        .await
        .unwrap()
        .collect_splits_metadata()
        .await
        .unwrap();

    assert_eq!(splits_metadata.len(), 1);
    assert_eq!(splits_metadata[0].num_docs, 5);

    // Ensure cache directory is empty.
    let cache_directory_path = get_cache_directory_path(&test_env.data_dir_path);
    assert!(cache_directory_path.read_dir().unwrap().next().is_none());

    let does_not_exist_uri = uri_from_path(&test_env.data_dir_path)
        .join("file-does-not-exist.json")
        .unwrap();

    // Ingest a non-existing file should fail.
    let args = LocalIngestDocsArgs {
        config_uri: test_env.resource_files.config,
        index_id: test_env.index_id,
        input_path_opt: Some(does_not_exist_uri),
        input_format: SourceInputFormat::Json,
        overwrite: false,
        clear_cache: true,
        vrl_script: None,
    };

    let error = local_ingest_docs_cli(args).await.unwrap_err();

    assert!(matches!(
        error.root_cause().downcast_ref::<ChecklistError>().unwrap(),
        ChecklistError {
            errors
        } if errors.len() == 1 && errors[0].0 == CLI_SOURCE_ID
    ));
}

#[tokio::test]
async fn test_reingest_same_file_cli() {
    quickwit_common::setup_logging_for_tests();
    let index_id = append_random_suffix("test-index-simple");
    let test_env = create_test_env(index_id.clone(), TestStorageType::LocalFileSystem)
        .await
        .unwrap();
    test_env.start_server().await.unwrap();
    create_logs_index(&test_env).await.unwrap();
    let index_uid = test_env.index_metadata().await.unwrap().index_uid;

    for _ in 0..2 {
        let args = LocalIngestDocsArgs {
            config_uri: test_env.resource_files.config.clone(),
            index_id: index_id.clone(),
            input_path_opt: Some(test_env.resource_files.log_docs.clone()),
            input_format: SourceInputFormat::Json,
            overwrite: false,
            clear_cache: true,
            vrl_script: None,
        };

        local_ingest_docs_cli(args).await.unwrap();
    }

    let splits_metadata: Vec<SplitMetadata> = test_env
        .metastore()
        .await
        .list_splits(ListSplitsRequest::try_from_index_uid(index_uid).unwrap())
        .await
        .unwrap()
        .collect_splits_metadata()
        .await
        .unwrap();

    assert_eq!(splits_metadata.len(), 1);
    assert_eq!(splits_metadata[0].num_docs, 5);
}

/// Helper function to compare a json payload.
///
/// It will serialize and deserialize the value in order
/// to make sure floating points are the exact value obtained via
/// JSON deserialization.
#[track_caller]
fn assert_flexible_json_eq(value_json: &serde_json::Value, expected_json: &serde_json::Value) {
    match (value_json, expected_json) {
        (Value::Array(left_arr), Value::Array(right_arr)) => {
            assert_eq!(
                left_arr.len(),
                right_arr.len(),
                "left: {left_arr:?} right: {right_arr:?}"
            );
            for i in 0..left_arr.len() {
                assert_flexible_json_eq(&left_arr[i], &right_arr[i]);
            }
        }
        (Value::Object(left_obj), Value::Object(right_obj)) => {
            assert_eq!(
                left_obj.len(),
                right_obj.len(),
                "left: {left_obj:?} right: {right_obj:?}"
            );
            for (k, v) in left_obj {
                if let Some(right_value) = right_obj.get(k) {
                    assert_flexible_json_eq(v, right_value);
                } else {
                    panic!("Missing key `{k}`");
                }
            }
        }
        (Value::Number(left_num), Value::Number(right_num)) => {
            let left = left_num.as_f64().unwrap();
            let right = right_num.as_f64().unwrap();
            assert!(
                (left - right).abs() / (1e-32 + left + right).abs() < 1e-4,
                "left: {left:?} right: {right:?}"
            );
        }
        (left, right) => {
            assert_eq!(left, right);
        }
    }
}

#[tokio::test]
async fn test_cmd_search_aggregation() {
    quickwit_common::setup_logging_for_tests();
    let index_id = append_random_suffix("test-search-cmd");
    let test_env = create_test_env(index_id, TestStorageType::LocalFileSystem)
        .await
        .unwrap();
    test_env.start_server().await.unwrap();
    create_logs_index(&test_env).await.unwrap();

    local_ingest_log_docs(&test_env).await.unwrap();

    let aggregation: Value = json!(
    {
      "range_buckets": {
        "range": {
          "field": "ts",
          "ranges": [
            { "to": 72057597000000000f64 },
            { "from": 72057597000000000f64, "to": 72057600000000000f64 },
            { "from": 72057600000000000f64, "to": 72057604000000000f64 },
            { "from": 72057604000000000f64 },
          ]
        },
        "aggs": {
          "average_ts": {
            "avg": { "field": "ts" }
          }
        }
      }
    });

    // search with aggregation
    let args = SearchIndexArgs {
        index_id: test_env.index_id.clone(),
        query: "paris OR tokio OR london".to_string(),
        aggregation: Some(serde_json::to_string(&aggregation).unwrap()),
        max_hits: 10,
        start_offset: 0,
        search_fields: Some(vec!["city".to_string()]),
        snippet_fields: None,
        start_timestamp: None,
        end_timestamp: None,
        client_args: test_env.default_client_args(),
        sort_by_score: false,
    };
    let search_response = search_index(args).await.unwrap();

    let aggregation_res = search_response.aggregations.unwrap();
    let expected_json = serde_json::json!({
        "range_buckets": {
            "buckets": [
                {
                    "average_ts": {
                        "value": null
                    },
                    "doc_count": 0,
                    "key": "*-1972-04-13T23:59:57Z",
                    "to": 72057597000000000f64,
                    "to_as_string": "1972-04-13T23:59:57Z"
                },
                {
                    "average_ts": {
                        "value": 72057597500000000f64
                    },
                    "doc_count": 2,
                    "from": 72057597000000000f64,
                    "from_as_string": "1972-04-13T23:59:57Z",
                    "key": "1972-04-13T23:59:57Z-1972-04-14T00:00:00Z",
                    "to": 72057600000000000f64,
                    "to_as_string": "1972-04-14T00:00:00Z"
                },
                {
                    "average_ts": {
                        "value": null
                    },
                    "doc_count": 0,
                    "from": 72057600000000000f64,
                    "from_as_string": "1972-04-14T00:00:00Z",
                    "key": "1972-04-14T00:00:00Z-1972-04-14T00:00:04Z",
                    "to": 72057604000000000f64,
                    "to_as_string": "1972-04-14T00:00:04Z"
                },
                {
                    "average_ts": {
                        "value": 72057606333333330f64
                    },
                    "doc_count": 3,
                    "from": 72057604000000000f64,
                    "from_as_string": "1972-04-14T00:00:04Z",
                    "key": "1972-04-14T00:00:04Z-*"
                }
            ]
        }
    });
    assert_flexible_json_eq(&aggregation_res, &expected_json);
}

#[tokio::test]
async fn test_cmd_search_with_snippets() -> Result<()> {
    quickwit_common::setup_logging_for_tests();
    let index_id = append_random_suffix("test-search-cmd");
    let test_env = create_test_env(index_id, TestStorageType::LocalFileSystem)
        .await
        .unwrap();
    test_env.start_server().await.unwrap();
    create_logs_index(&test_env).await.unwrap();

    local_ingest_log_docs(&test_env).await.unwrap();

    // search with snippets
    let args = SearchIndexArgs {
        index_id: test_env.index_id.clone(),
        query: "event:baz".to_string(),
        aggregation: None,
        max_hits: 10,
        start_offset: 0,
        search_fields: None,
        snippet_fields: Some(vec!["event".to_string()]),
        start_timestamp: None,
        end_timestamp: None,
        client_args: test_env.default_client_args(),
        sort_by_score: false,
    };
    let search_response = search_index(args).await.unwrap();
    assert_eq!(search_response.hits.len(), 1);
    let hit = &search_response.hits[0];
    assert_eq!(hit, &json!({"event": "baz", "ts": 72057604}));
    assert_eq!(
        search_response.snippets.unwrap()[0],
        json!({
            "event": [ "<b>baz</b>"]
        })
    );
    Ok(())
}

#[tokio::test]
async fn test_search_index_cli() {
    quickwit_common::setup_logging_for_tests();
    let index_id = append_random_suffix("test-search-cmd");
    let test_env = create_test_env(index_id.clone(), TestStorageType::LocalFileSystem)
        .await
        .unwrap();
    test_env.start_server().await.unwrap();
    create_logs_index(&test_env).await.unwrap();

    let create_search_args = |query: &str| SearchIndexArgs {
        client_args: test_env.default_client_args(),
        index_id: index_id.clone(),
        query: query.to_string(),
        aggregation: None,
        max_hits: 20,
        start_offset: 0,
        search_fields: None,
        snippet_fields: None,
        start_timestamp: None,
        end_timestamp: None,
        sort_by_score: false,
    };

    local_ingest_log_docs(&test_env).await.unwrap();

    let args = create_search_args("level:info");

    // search_index_cli calls search_index and prints the SearchResponse
    let search_res = search_index(args).await.unwrap();
    assert_eq!(search_res.num_hits, 2);

    // search with tag pruning
    let args = create_search_args("+level:info +city:paris");

    // search_index_cli calls search_index and prints the SearchResponse
    let search_res = search_index(args).await.unwrap();
    assert_eq!(search_res.num_hits, 1);

    // search with tag pruning
    let args = create_search_args("level:info AND city:conakry");

    // search_index_cli calls search_index and prints the SearchResponse
    let search_res = search_index(args).await.unwrap();
    assert_eq!(search_res.num_hits, 0);
}

#[tokio::test]
async fn test_cmd_update_index() {
    quickwit_common::setup_logging_for_tests();
    let index_id = append_random_suffix("test-update-cmd");
    let test_env = create_test_env(index_id.clone(), TestStorageType::LocalFileSystem)
        .await
        .unwrap();
    test_env.start_server().await.unwrap();
    create_logs_index(&test_env).await.unwrap();

    // add retention policy
    let args = UpdateIndexArgs {
        client_args: test_env.default_client_args(),
        index_id: index_id.clone(),
        index_config_uri: test_env.resource_files.index_config_with_retention.clone(),
        create: false,
        assume_yes: true,
    };
    update_index_cli(args).await.unwrap();
    let index_metadata = test_env.index_metadata().await.unwrap();
    assert_eq!(index_metadata.index_id(), test_env.index_id);
    assert_eq!(
        index_metadata.index_config.retention_policy_opt,
        Some(RetentionPolicy {
            retention_period: String::from("1 week"),
            evaluation_schedule: String::from("daily")
        })
    );

    // remove retention policy
    let args = UpdateIndexArgs {
        client_args: test_env.default_client_args(),
        index_id,
        index_config_uri: test_env.resource_files.index_config.clone(),
        create: false,
        assume_yes: true,
    };
    update_index_cli(args).await.unwrap();
    let index_metadata = test_env.index_metadata().await.unwrap();
    assert_eq!(index_metadata.index_id(), test_env.index_id);
    assert_eq!(index_metadata.index_config.retention_policy_opt, None);
}

#[tokio::test]
async fn test_delete_index_cli_dry_run() {
    quickwit_common::setup_logging_for_tests();
    let index_id = append_random_suffix("test-delete-cmd--dry-run");
    let test_env = create_test_env(index_id.clone(), TestStorageType::LocalFileSystem)
        .await
        .unwrap();
    test_env.start_server().await.unwrap();
    create_logs_index(&test_env).await.unwrap();

    let refresh_metastore = |metastore| async {
        // In this test we rely on the file backed metastore
        // and the file backed metastore caches results.
        // Therefore we need to force reading the disk to fetch updates.
        //
        // We do that by dropping and recreating our metastore.
        drop(metastore);
        MetastoreResolver::unconfigured()
            .resolve(&test_env.metastore_uri)
            .await
    };

    let create_delete_args = |dry_run| DeleteIndexArgs {
        client_args: test_env.default_client_args(),
        index_id: index_id.clone(),
        dry_run,
        assume_yes: true,
    };

    let mut metastore = MetastoreResolver::unconfigured()
        .resolve(&test_env.metastore_uri)
        .await
        .unwrap();

    assert!(metastore.index_exists(&index_id).await.unwrap());
    // On empty index.
    let args = create_delete_args(true);

    delete_index_cli(args).await.unwrap();
    // On dry run index should still exist
    let mut metastore = refresh_metastore(metastore).await.unwrap();
    metastore
        .index_metadata(IndexMetadataRequest::for_index_id(index_id.to_string()))
        .await
        .unwrap();
    assert!(metastore.index_exists(&index_id).await.unwrap());

    local_ingest_log_docs(&test_env).await.unwrap();

    // On non-empty index
    let args = create_delete_args(true);

    delete_index_cli(args).await.unwrap();
    // On dry run index should still exist
    let mut metastore = refresh_metastore(metastore).await.unwrap();
    metastore
        .index_metadata(IndexMetadataRequest::for_index_id(index_id.to_string()))
        .await
        .unwrap();
    assert!(metastore.index_exists(&index_id).await.unwrap());
}

#[tokio::test]
async fn test_delete_index_cli() {
    let index_id = append_random_suffix("test-delete-cmd");
    let test_env = create_test_env(index_id.clone(), TestStorageType::LocalFileSystem)
        .await
        .unwrap();
    test_env.start_server().await.unwrap();
    create_logs_index(&test_env).await.unwrap();

    local_ingest_log_docs(&test_env).await.unwrap();

    let args = DeleteIndexArgs {
        client_args: test_env.default_client_args(),
        index_id: index_id.clone(),
        assume_yes: true,
        dry_run: false,
    };

    delete_index_cli(args).await.unwrap();

    assert!(test_env.index_metadata().await.is_err());
}

#[tokio::test]
async fn test_garbage_collect_cli_no_grace() {
    quickwit_common::setup_logging_for_tests();
    let index_id = append_random_suffix("test-gc-cmd--no-grace-period");
    let test_env = create_test_env(index_id.clone(), TestStorageType::LocalFileSystem)
        .await
        .unwrap();
    test_env.start_server().await.unwrap();
    create_logs_index(&test_env).await.unwrap();
    let index_uid = test_env.index_metadata().await.unwrap().index_uid;
    local_ingest_log_docs(&test_env).await.unwrap();

    let metastore = MetastoreResolver::unconfigured()
        .resolve(&test_env.metastore_uri)
        .await
        .unwrap();

    let refresh_metastore = |metastore| async {
        // In this test we rely on the file backed metastore and write on
        // a different process. The file backed metastore caches results.
        // Therefore we need to force reading the disk.
        //
        // We do that by dropping and recreating our metastore.
        drop(metastore);
        MetastoreResolver::unconfigured()
            .resolve(&test_env.metastore_uri)
            .await
    };

    let create_gc_args = |dry_run| GarbageCollectIndexArgs {
        config_uri: test_env.resource_files.config.clone(),
        index_id: index_id.clone(),
        grace_period: Duration::from_secs(3600),
        dry_run,
    };

    let splits_metadata = metastore
        .list_splits(ListSplitsRequest::try_from_index_uid(index_uid.clone()).unwrap())
        .await
        .unwrap()
        .collect_splits_metadata()
        .await
        .unwrap();
    assert_eq!(splits_metadata.len(), 1);

    let args = create_gc_args(false);

    garbage_collect_index_cli(args).await.unwrap();

    // On gc splits within grace period should still exist.
    let index_path = test_env.indexes_dir_path.join(&test_env.index_id);
    assert_eq!(index_path.try_exists().unwrap(), true);

    let split_ids = vec![splits_metadata[0].split_id().to_string()];
    let metastore = refresh_metastore(metastore).await.unwrap();
    let mark_for_deletion_request =
        MarkSplitsForDeletionRequest::new(index_uid.clone(), split_ids.clone());
    metastore
        .mark_splits_for_deletion(mark_for_deletion_request)
        .await
        .unwrap();

    let args = create_gc_args(true);

    garbage_collect_index_cli(args).await.unwrap();

    // On `dry_run = true` splits `MarkedForDeletion` should still exist.
    for split_id in split_ids.iter() {
        let split_file = quickwit_common::split_file(split_id);
        let split_filepath = index_path.join(split_file);
        assert_eq!(split_filepath.try_exists().unwrap(), true);
    }

    let args = create_gc_args(false);

    garbage_collect_index_cli(args).await.unwrap();

    // If split is `MarkedForDeletion` it should be deleted after gc run
    for split_id in split_ids.iter() {
        let split_file = quickwit_common::split_file(split_id);
        let split_filepath = index_path.join(split_file);
        assert_eq!(split_filepath.try_exists().unwrap(), false);
    }

    let metastore = refresh_metastore(metastore).await.unwrap();
    assert_eq!(
        metastore
            .list_splits(ListSplitsRequest::try_from_index_uid(index_uid).unwrap())
            .await
            .unwrap()
            .collect_splits_metadata()
            .await
            .unwrap()
            .len(),
        0
    );

    let args = DeleteIndexArgs {
        client_args: test_env.default_client_args(),
        index_id,
        dry_run: false,
        assume_yes: true,
    };

    delete_index_cli(args).await.unwrap();

    assert_eq!(index_path.try_exists().unwrap(), false);
}

#[tokio::test]
async fn test_garbage_collect_index_cli() {
    let index_id = append_random_suffix("test-gc-cmd");
    let test_env = create_test_env(index_id.clone(), TestStorageType::LocalFileSystem)
        .await
        .unwrap();
    test_env.start_server().await.unwrap();
    create_logs_index(&test_env).await.unwrap();
    let index_uid = test_env.index_metadata().await.unwrap().index_uid;
    local_ingest_log_docs(&test_env).await.unwrap();

    let refresh_metastore = |metastore| async {
        // In this test we rely on the file backed metastore and
        // modify it but the file backed metastore caches results.
        // Therefore we need to force reading the disk to update split info.
        //
        // We do that by dropping and recreating our metastore.
        drop(metastore);
        MetastoreResolver::unconfigured()
            .resolve(&test_env.metastore_uri)
            .await
    };

    let create_gc_args = |grace_period_secs| GarbageCollectIndexArgs {
        config_uri: test_env.resource_files.config.clone(),
        index_id: index_id.clone(),
        grace_period: Duration::from_secs(grace_period_secs),
        dry_run: false,
    };

    let metastore = MetastoreResolver::unconfigured()
        .resolve(&test_env.metastore_uri)
        .await
        .unwrap();

    let splits_metadata = metastore
        .list_splits(ListSplitsRequest::try_from_index_uid(index_uid.clone()).unwrap())
        .await
        .unwrap()
        .collect_splits_metadata()
        .await
        .unwrap();
    assert_eq!(splits_metadata.len(), 1);

    let index_path = test_env.indexes_dir_path.join(&test_env.index_id);
    let split_filename = quickwit_common::split_file(splits_metadata[0].split_id.as_str());
    let split_path = index_path.join(&split_filename);
    assert_eq!(split_path.try_exists().unwrap(), true);

    let args = create_gc_args(3600);

    garbage_collect_index_cli(args).await.unwrap();

    // Split should still exists within grace period.
    let metastore = refresh_metastore(metastore).await.unwrap();
    let splits_metadata = metastore
        .list_splits(ListSplitsRequest::try_from_index_uid(index_uid.clone()).unwrap())
        .await
        .unwrap()
        .collect_splits_metadata()
        .await
        .unwrap();
    assert_eq!(splits_metadata.len(), 1);

    // The following steps help turn an existing published split into a staged one
    // without deleting the files.
    let split_metadata = splits_metadata[0].clone();
    metastore
        .mark_splits_for_deletion(MarkSplitsForDeletionRequest::new(
            index_uid.clone(),
            vec![split_metadata.split_id.to_string()],
        ))
        .await
        .unwrap();
    metastore
        .delete_splits(DeleteSplitsRequest {
            index_uid: Some(index_uid.clone()),
            split_ids: splits_metadata
                .into_iter()
                .map(|split_metadata| split_metadata.split_id)
                .collect(),
        })
        .await
        .unwrap();
    metastore
        .stage_splits(
            StageSplitsRequest::try_from_split_metadata(index_uid.clone(), &split_metadata)
                .unwrap(),
        )
        .await
        .unwrap();
    assert_eq!(split_path.try_exists().unwrap(), true);

    let metastore = refresh_metastore(metastore).await.unwrap();
    let splits = metastore
        .list_splits(ListSplitsRequest::try_from_index_uid(index_uid.clone()).unwrap())
        .await
        .unwrap()
        .collect_splits()
        .await
        .unwrap();
    assert_eq!(splits[0].split_state, SplitState::Staged);

    let args = create_gc_args(3600);

    garbage_collect_index_cli(args).await.unwrap();

    assert_eq!(split_path.try_exists().unwrap(), true);
    // Staged splits should still exist within grace period.
    let metastore = refresh_metastore(metastore).await.unwrap();
    let splits = metastore
        .list_splits(ListSplitsRequest::try_from_index_uid(index_uid.clone()).unwrap())
        .await
        .unwrap()
        .collect_splits()
        .await
        .unwrap();
    assert_eq!(splits.len(), 1);
    assert_eq!(splits[0].split_state, SplitState::Staged);

    // Wait for grace period.
    // TODO: edit split update timestamps and remove this sleep.
    sleep(Duration::from_secs(2)).await;

    let args = create_gc_args(1);

    garbage_collect_index_cli(args).await.unwrap();

    let metastore = refresh_metastore(metastore).await.unwrap();
    let splits = metastore
        .list_splits(ListSplitsRequest::try_from_index_uid(index_uid).unwrap())
        .await
        .unwrap()
        .collect_splits()
        .await
        .unwrap();
    // Splits should be deleted from both metastore and file system.
    assert_eq!(splits.len(), 0);
    assert_eq!(split_path.try_exists().unwrap(), false);
}

/// testing the api via cli commands
#[tokio::test]
async fn test_all_local_index() {
    quickwit_common::setup_logging_for_tests();
    let index_id = append_random_suffix("test-all");
    let test_env = create_test_env(index_id.clone(), TestStorageType::LocalFileSystem)
        .await
        .unwrap();
    test_env.start_server().await.unwrap();
    create_logs_index(&test_env).await.unwrap();

    let metadata_file_exists = test_env
        .storage
        .exists(&Path::new(&test_env.index_id).join("metastore.json"))
        .await
        .unwrap();
    assert!(metadata_file_exists);

    local_ingest_log_docs(&test_env).await.unwrap();

    let query_response = reqwest::get(format!(
        "http://127.0.0.1:{}/api/v1/{}/search?query=level:info",
        test_env.rest_listen_port, test_env.index_id
    ))
    .await
    .unwrap()
    .text()
    .await
    .unwrap();

    let result: Value = serde_json::from_str(&query_response).unwrap();
    assert_eq!(result["num_hits"], Value::Number(Number::from(2i64)));

    let args = DeleteIndexArgs {
        client_args: test_env.default_client_args(),
        index_id,
        dry_run: false,
        assume_yes: true,
    };
    delete_index_cli(args).await.unwrap();

    let metadata_file_exists = test_env
        .storage
        .exists(&Path::new(&test_env.index_id).join("metastore.json"))
        .await
        .unwrap();
    assert_eq!(metadata_file_exists, false);
}

/// testing the api via cli commands
#[tokio::test]
#[cfg_attr(not(feature = "ci-test"), ignore)]
async fn test_all_with_s3_localstack_cli() {
    let index_id = append_random_suffix("test-all--cli-s3-localstack");
    let test_env = create_test_env(index_id.clone(), TestStorageType::S3)
        .await
        .unwrap();
    test_env.start_server().await.unwrap();
    create_logs_index(&test_env).await.unwrap();

    let s3_uri = upload_test_file(
        test_env.storage_resolver.clone(),
        test_env
            .resource_files
            .log_docs
            .filepath()
            .unwrap()
            .to_path_buf(),
        "quickwit-integration-tests",
        "sources/",
        &append_random_suffix("test-all--cli-s3-localstack"),
    )
    .await;

    local_ingest_docs(s3_uri, &test_env).await.unwrap();

    // Cli search
    let args = SearchIndexArgs {
        client_args: test_env.default_client_args(),
        index_id: index_id.clone(),
        query: "level:info".to_string(),
        aggregation: None,
        max_hits: 20,
        start_offset: 0,
        search_fields: None,
        snippet_fields: None,
        start_timestamp: None,
        end_timestamp: None,
        sort_by_score: false,
    };

    let search_res = search_index(args).await.unwrap();
    assert_eq!(search_res.num_hits, 2);

    let query_response = reqwest::get(format!(
        "http://127.0.0.1:{}/api/v1/{}/search?query=level:info",
        test_env.rest_listen_port, test_env.index_id,
    ))
    .await
    .unwrap()
    .text()
    .await
    .unwrap();

    let result: Value = serde_json::from_str(&query_response).unwrap();
    assert_eq!(result["num_hits"], Value::Number(Number::from(2i64)));

    let args = DeleteIndexArgs {
        client_args: test_env.default_client_args(),
        index_id: index_id.clone(),
        dry_run: false,
        assume_yes: true,
    };

    delete_index_cli(args).await.unwrap();

    assert_eq!(
        test_env
            .storage
            .exists(Path::new(&test_env.index_id))
            .await
            .unwrap(),
        false
    );
}


================================================
FILE: quickwit/quickwit-cli/tests/helpers.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::fs;
use std::path::{Path, PathBuf};
use std::str::FromStr;
use std::sync::Arc;

use anyhow::Context;
use predicates::str;
use quickwit_cli::ClientArgs;
use quickwit_cli::service::RunCliCommand;
use quickwit_common::net::find_available_tcp_port;
use quickwit_common::test_utils::wait_for_server_ready;
use quickwit_common::uri::Uri;
use quickwit_config::service::QuickwitService;
use quickwit_metastore::{IndexMetadata, IndexMetadataResponseExt, MetastoreResolver};
use quickwit_proto::metastore::{IndexMetadataRequest, MetastoreService, MetastoreServiceClient};
use quickwit_proto::types::IndexId;
use quickwit_storage::{Storage, StorageResolver};
use reqwest::Url;
use tempfile::{TempDir, tempdir};
use tracing::error;

pub const PACKAGE_BIN_NAME: &str = "quickwit";

const DEFAULT_INDEX_CONFIG: &str = r#"
    version: 0.8

    index_id: #index_id
    index_uri: #index_uri

    doc_mapping:
      field_mappings:
        - name: ts
          type: datetime
          input_formats:
            - unix_timestamp
          output_format: unix_timestamp_secs
          fast_precision: seconds
          fast: true
        - name: level
          type: text
          stored: false
        - name: event
          type: text
        - name: device
          type: text
          stored: false
          tokenizer: raw
        - name: city
          type: text
          stored: false
          tokenizer: raw

      timestamp_field: ts
      tag_fields: [city, device]

    indexing_settings:
      resources:
        heap_size: 50MB

    search_settings:
      default_search_fields: [event]
"#;

const RETENTION_CONFIG: &str = r#"
    retention:
      period: 1 week
      schedule: daily
"#;

const DEFAULT_QUICKWIT_CONFIG: &str = r#"
    version: 0.8
    metastore_uri: #metastore_uri
    data_dir: #data_dir
    rest:
        listen_port: #rest_listen_port
    grpc_listen_port: #grpc_listen_port
"#;

const LOGS_JSON_DOCS: &str = r#"{"event": "foo", "level": "info", "ts": 72057597, "device": "rpi", "city": "tokio"}
{"event": "bar", "level": "error", "ts": 72057598, "device": "rpi", "city": "paris"}
{"event": "baz", "level": "warning", "ts": 72057604, "device": "fbit", "city": "london"}
{"event": "buz", "level": "debug", "ts": 72057607, "device": "rpi", "city": "paris"}
{"event": "biz", "level": "info", "ts": 72057608, "device": "fbit", "city": "paris"}"#;

const WIKI_JSON_DOCS: &str = r#"{"body": "foo", "title": "shimroy", "url": "https://wiki.com?id=10"}
{"body": "bar", "title": "shimray", "url": "https://wiki.com?id=12"}
{"body": "baz", "title": "preshow", "url": "https://wiki.com?id=11"}
{"body": "buz", "title": "frederick", "url": "https://wiki.com?id=48"}
{"body": "biz", "title": "modern", "url": "https://wiki.com?id=13"}
"#;

pub struct TestResourceFiles {
    pub config: Uri,
    pub index_config: Uri,
    pub index_config_without_uri: Uri,
    pub index_config_with_retention: Uri,
    pub log_docs: Uri,
}

/// A struct to hold few info about the test environment.
pub struct TestEnv {
    /// The temporary directory of the test.
    _temp_dir: TempDir,
    /// Path of the directory where indexing directory are created.
    pub data_dir_path: PathBuf,
    /// Path of the directory where indexes are stored.
    pub indexes_dir_path: PathBuf,
    /// Resource files needed for the test.
    pub resource_files: TestResourceFiles,
    /// The metastore URI.
    pub metastore_uri: Uri,
    pub metastore_resolver: MetastoreResolver,

    pub cluster_endpoint: Url,

    /// The index ID.
    pub index_id: IndexId,
    pub index_uri: Uri,
    pub rest_listen_port: u16,
    pub storage_resolver: StorageResolver,
    pub storage: Arc<dyn Storage>,
}

impl TestEnv {
    // For cache reason, it's safer to always create an instance and then make your assertions.
    pub async fn metastore(&self) -> MetastoreServiceClient {
        self.metastore_resolver
            .resolve(&self.metastore_uri)
            .await
            .unwrap()
    }

    pub async fn index_metadata(&self) -> anyhow::Result<IndexMetadata> {
        let index_metadata = self
            .metastore()
            .await
            .index_metadata(IndexMetadataRequest::for_index_id(self.index_id.clone()))
            .await?
            .deserialize_index_metadata()?;
        Ok(index_metadata)
    }

    pub async fn start_server(&self) -> anyhow::Result<()> {
        let run_command = RunCliCommand {
            config_uri: self.resource_files.config.clone(),
            services: Some(QuickwitService::supported_services()),
        };
        tokio::spawn(async move {
            if let Err(error) = run_command
                .execute(quickwit_serve::do_nothing_env_filter_reload_fn())
                .await
            {
                error!(err=?error, "failed to start a quickwit server");
            }
        });
        wait_for_server_ready(([127, 0, 0, 1], self.rest_listen_port).into()).await?;
        Ok(())
    }

    pub fn default_client_args(&self) -> ClientArgs {
        ClientArgs {
            cluster_endpoint: self.cluster_endpoint.clone(),
            ..Default::default()
        }
    }
}

pub enum TestStorageType {
    S3,
    LocalFileSystem,
}

pub fn uri_from_path(path: &Path) -> Uri {
    Uri::from_str(path.to_str().unwrap()).unwrap()
}

/// Creates all necessary artifacts in a test environment.
pub async fn create_test_env(
    index_id: IndexId,
    storage_type: TestStorageType,
) -> anyhow::Result<TestEnv> {
    let temp_dir = tempdir()?;
    let data_dir_path = temp_dir.path().join("data");
    let indexes_dir_path = data_dir_path.join("indexes");
    let resources_dir_path = temp_dir.path().join("resources");

    for dir_path in [&data_dir_path, &indexes_dir_path, &resources_dir_path] {
        fs::create_dir(dir_path)?;
    }

    // TODO: refactor when we have a singleton storage resolver.
    let metastore_uri = match storage_type {
        TestStorageType::LocalFileSystem => {
            Uri::from_str(&format!("file://{}", indexes_dir_path.display())).unwrap()
        }
        TestStorageType::S3 => Uri::for_test("s3://quickwit-integration-tests/indexes"),
    };
    let storage_resolver = StorageResolver::unconfigured();
    let storage = storage_resolver.resolve(&metastore_uri).await?;
    let metastore_resolver = MetastoreResolver::unconfigured();
    let index_uri = metastore_uri.join(&index_id).unwrap();
    let index_config_path = resources_dir_path.join("index_config.yaml");
    fs::write(
        &index_config_path,
        DEFAULT_INDEX_CONFIG
            .replace("#index_id", &index_id)
            .replace("#index_uri", index_uri.as_str()),
    )?;
    let index_config_without_uri_path = resources_dir_path.join("index_config_without_uri.yaml");
    fs::write(
        &index_config_without_uri_path,
        DEFAULT_INDEX_CONFIG
            .replace("#index_id", &index_id)
            .replace("index_uri: #index_uri\n", ""),
    )?;
    let index_config_with_retention_path =
        resources_dir_path.join("index_config_with_retention.yaml");
    fs::write(
        &index_config_with_retention_path,
        format!("{DEFAULT_INDEX_CONFIG}{RETENTION_CONFIG}")
            .replace("#index_id", &index_id)
            .replace("#index_uri", index_uri.as_str()),
    )?;
    let node_config_path = resources_dir_path.join("config.yaml");
    let rest_listen_port = find_available_tcp_port()?;
    let grpc_listen_port = find_available_tcp_port()?;
    fs::write(
        &node_config_path,
        // A poor's man templating engine reloaded...
        DEFAULT_QUICKWIT_CONFIG
            .replace("#metastore_uri", metastore_uri.as_str())
            .replace("#data_dir", data_dir_path.to_str().unwrap())
            .replace("#rest_listen_port", &rest_listen_port.to_string())
            .replace("#grpc_listen_port", &grpc_listen_port.to_string()),
    )?;
    let log_docs_path = resources_dir_path.join("logs.json");
    fs::write(&log_docs_path, LOGS_JSON_DOCS)?;
    let wikipedia_docs_path = resources_dir_path.join("wikis.json");
    fs::write(wikipedia_docs_path, WIKI_JSON_DOCS)?;

    let cluster_endpoint = Url::parse(&format!("http://localhost:{rest_listen_port}"))
        .context("failed to parse cluster endpoint")?;

    let resource_files = TestResourceFiles {
        config: uri_from_path(&node_config_path),
        index_config: uri_from_path(&index_config_path),
        index_config_without_uri: uri_from_path(&index_config_without_uri_path),
        index_config_with_retention: uri_from_path(&index_config_with_retention_path),
        log_docs: uri_from_path(&log_docs_path),
    };

    Ok(TestEnv {
        _temp_dir: temp_dir,
        data_dir_path,
        indexes_dir_path,
        resource_files,
        metastore_uri,
        metastore_resolver,
        cluster_endpoint,
        index_id,
        index_uri,
        rest_listen_port,
        storage_resolver,
        storage,
    })
}

/// TODO: this should be part of the test env setup
pub async fn upload_test_file(
    storage_resolver: StorageResolver,
    local_src_path: PathBuf,
    bucket: &str,
    prefix: &str,
    filename: &str,
) -> Uri {
    let test_data = tokio::fs::read(local_src_path).await.unwrap();
    let src_location = format!("s3://{bucket}/{prefix}");
    let storage_uri = Uri::from_str(&src_location).unwrap();
    let storage = storage_resolver.resolve(&storage_uri).await.unwrap();
    storage
        .put(&PathBuf::from(filename), Box::new(test_data))
        .await
        .unwrap();
    storage_uri.join(filename).unwrap()
}


================================================
FILE: quickwit/quickwit-cli/tests/prepare_tests.sh
================================================
#!/bin/bash
awslocal s3 mb s3://quickwit-integration-tests && awslocal s3 rm --recursive s3://quickwit-integration-tests


================================================
FILE: quickwit/quickwit-cluster/Cargo.toml
================================================
[package]
name = "quickwit-cluster"
description = "Cluster membership based on Chitchat"

version.workspace = true
edition.workspace = true
homepage.workspace = true
documentation.workspace = true
repository.workspace = true
authors.workspace = true
license.workspace = true

[dependencies]
anyhow = { workspace = true }
async-trait = { workspace = true }
bytesize = { workspace = true }
chitchat = { workspace = true }
futures = { workspace = true }
itertools = { workspace = true }
once_cell = { workspace = true }
pin-project = { workspace = true }
rand = { workspace = true }
serde = { workspace = true }
serde_json = { workspace = true }
time = { workspace = true }
tokio = { workspace = true }
tokio-stream = { workspace = true }
tonic = { workspace = true }
tracing = { workspace = true }
utoipa = { workspace = true }

quickwit-common = { workspace = true }
quickwit-config = { workspace = true }
quickwit-proto = { workspace = true }

[features]
testsuite = []

[dev-dependencies]
rand = { workspace = true }

chitchat = { workspace = true, features = ["testsuite"] }
quickwit-common = { workspace = true, features = ["testsuite"] }
quickwit-proto = { workspace = true, features = ["testsuite"] }

[package.metadata.cargo-machete]
# used inside code generated by utoipa
ignored = ["serde_json"]


================================================
FILE: quickwit/quickwit-cluster/src/change.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::BTreeMap;
use std::collections::btree_map::Entry;
use std::pin::Pin;
use std::task::{Context, Poll};

use chitchat::{ChitchatId, NodeState};
use futures::Stream;
use pin_project::pin_project;
use quickwit_common::sorted_iter::{KeyDiff, SortedByKeyIterator};
use quickwit_common::tower::{ClientGrpcConfig, make_channel, warmup_channel};
use quickwit_proto::types::NodeId;
use tokio::sync::mpsc;
use tokio_stream::wrappers::UnboundedReceiverStream;
use tonic::transport::Channel;
use tracing::{info, warn};

use crate::ClusterNode;
use crate::member::NodeStateExt;

/// Describes a change in the cluster.
#[derive(Debug, Clone)]
pub enum ClusterChange {
    Add(ClusterNode),
    Update {
        previous: ClusterNode,
        updated: ClusterNode,
    },
    Remove(ClusterNode),
}

/// A stream of cluster change events.
#[pin_project]
pub struct ClusterChangeStream(#[pin] UnboundedReceiverStream<ClusterChange>);

impl ClusterChangeStream {
    pub fn new_unbounded() -> (Self, mpsc::UnboundedSender<ClusterChange>) {
        let (change_stream_tx, change_stream_rx) = mpsc::unbounded_channel();
        (
            Self(UnboundedReceiverStream::new(change_stream_rx)),
            change_stream_tx,
        )
    }
}

impl Stream for ClusterChangeStream {
    type Item = ClusterChange;

    fn poll_next(self: Pin<&mut Self>, cx: &mut Context<'_>) -> Poll<Option<Self::Item>> {
        self.project().0.poll_next(cx)
    }
}

/// A factory for creating cluster change streams.
pub trait ClusterChangeStreamFactory: Clone + Send + 'static {
    fn create(&self) -> ClusterChangeStream;
}

/// Compares the digests of the previous and new set of lives nodes, identifies the changes that
/// occurred in the cluster, and emits the corresponding events, focusing on ready nodes only.
pub(crate) async fn compute_cluster_change_events(
    cluster_id: &str,
    self_chitchat_id: &ChitchatId,
    previous_nodes: &mut BTreeMap<NodeId, ClusterNode>,
    previous_node_states: &BTreeMap<ChitchatId, NodeState>,
    new_node_states: &BTreeMap<ChitchatId, NodeState>,
    client_grpc_config: &ClientGrpcConfig,
) -> Vec<ClusterChange> {
    let mut cluster_events = Vec::new();

    for key_diff in previous_node_states
        .iter()
        .diff_by_key(new_node_states.iter())
    {
        match key_diff {
            // The node has joined the cluster.
            KeyDiff::Added(chitchat_id, node_state) => {
                let node_events = compute_cluster_change_events_on_added(
                    cluster_id,
                    self_chitchat_id,
                    chitchat_id,
                    node_state,
                    previous_nodes,
                    client_grpc_config.clone(),
                )
                .await;

                cluster_events.extend(node_events);
            }
            // The node's state has changed.
            KeyDiff::Unchanged(chitchat_id, previous_node_state, new_node_state)
                if previous_node_state.max_version() != new_node_state.max_version() =>
            {
                let node_event_opt = compute_cluster_change_events_on_updated(
                    cluster_id,
                    self_chitchat_id,
                    chitchat_id,
                    new_node_state,
                    previous_nodes,
                )
                .await;

                if let Some(node_event) = node_event_opt {
                    cluster_events.push(node_event);
                }
            }
            // The node's state has not changed.
            KeyDiff::Unchanged(_chitchat_id, _previous_max_version, _new_max_version) => {}
            // The node has left the cluster, i.e. it is considered dead by the failure detector.
            KeyDiff::Removed(chitchat_id, _node_state) => {
                let node_event_opt =
                    compute_cluster_change_events_on_removed(chitchat_id, previous_nodes);

                if let Some(node_event) = node_event_opt {
                    cluster_events.push(node_event);
                }
            }
        };
    }
    cluster_events
}

async fn compute_cluster_change_events_on_added(
    cluster_id: &str,
    self_chitchat_id: &ChitchatId,
    new_chitchat_id: &ChitchatId,
    new_node_state: &NodeState,
    previous_nodes: &mut BTreeMap<NodeId, ClusterNode>,
    client_grpc_config: ClientGrpcConfig,
) -> Vec<ClusterChange> {
    let is_self_node = self_chitchat_id == new_chitchat_id;
    let new_node_id: NodeId = new_chitchat_id.node_id.clone().into();
    let maybe_previous_node_entry = previous_nodes.entry(new_node_id);

    let mut events = Vec::new();
    let mut verb = "joined";

    if let Entry::Occupied(previous_node_entry) = maybe_previous_node_entry {
        let previous_node_ref = previous_node_entry.get();

        if previous_node_ref.chitchat_id().generation_id > new_chitchat_id.generation_id {
            warn!(
                node_id=%new_chitchat_id.node_id,
                generation_id=%new_chitchat_id.generation_id,
                "ignoring node `{}` rejoining the cluster with a lower generation ID",
                new_chitchat_id.node_id
            );
            return events;
        }
        let previous_node = previous_node_entry.remove();
        verb = "rejoined";

        if previous_node.is_ready() {
            events.push(ClusterChange::Remove(previous_node));
        }
    }
    let Some(new_node) = try_new_node(
        cluster_id,
        new_chitchat_id,
        new_node_state,
        is_self_node,
        &client_grpc_config,
    )
    .await
    else {
        return events;
    };
    info!(
        node_id=%new_chitchat_id.node_id,
        generation_id=%new_chitchat_id.generation_id,
        "node `{}` has {verb} the cluster",
        new_chitchat_id.node_id,
    );
    let new_node_id: NodeId = new_node.node_id().into();
    previous_nodes.insert(new_node_id, new_node.clone());

    if new_node.is_ready() {
        info!(
            node_id=%new_chitchat_id.node_id,
            generation_id=%new_chitchat_id.generation_id,
            "node `{}` has transitioned to ready state",
            new_chitchat_id.node_id
        );
        warmup_channel(new_node.channel()).await;
        events.push(ClusterChange::Add(new_node));
    }
    events
}

async fn compute_cluster_change_events_on_updated(
    cluster_id: &str,
    self_chitchat_id: &ChitchatId,
    updated_chitchat_id: &ChitchatId,
    updated_node_state: &NodeState,
    previous_nodes: &mut BTreeMap<NodeId, ClusterNode>,
) -> Option<ClusterChange> {
    let previous_node = previous_nodes.get(&updated_chitchat_id.node_id)?.clone();

    if previous_node.chitchat_id().generation_id > updated_chitchat_id.generation_id {
        warn!(
            node_id=%updated_chitchat_id.node_id,
            generation_id=%updated_chitchat_id.generation_id,
            "ignoring node `{}` update with a lower generation ID",
            updated_chitchat_id.node_id
        );
        return None;
    }
    let previous_channel = previous_node.channel();
    let is_self_node = self_chitchat_id == updated_chitchat_id;
    let updated_node = try_new_node_with_channel(
        cluster_id,
        updated_chitchat_id,
        updated_node_state,
        previous_channel,
        is_self_node,
    )?;
    let updated_node_id: NodeId = updated_node.chitchat_id().node_id.clone().into();
    previous_nodes.insert(updated_node_id, updated_node.clone());

    if !previous_node.is_ready() && updated_node.is_ready() {
        warmup_channel(updated_node.channel()).await;

        info!(
            node_id=%updated_chitchat_id.node_id,
            generation_id=%updated_chitchat_id.generation_id,
            "node `{}` has transitioned to ready state",
            updated_chitchat_id.node_id
        );
        Some(ClusterChange::Add(updated_node))
    } else if previous_node.is_ready() && !updated_node.is_ready() {
        info!(
            node_id=%updated_chitchat_id.node_id,
            generation_id=%updated_chitchat_id.generation_id,
            "node `{}` has transitioned out of ready state",
            updated_chitchat_id.node_id
        );
        Some(ClusterChange::Remove(updated_node))
    } else if previous_node.is_ready() && updated_node.is_ready() {
        Some(ClusterChange::Update {
            previous: previous_node,
            updated: updated_node,
        })
    } else {
        None
    }
}

fn compute_cluster_change_events_on_removed(
    removed_chitchat_id: &ChitchatId,
    previous_nodes: &mut BTreeMap<NodeId, ClusterNode>,
) -> Option<ClusterChange> {
    let removed_node_id: NodeId = removed_chitchat_id.node_id.clone().into();

    if let Entry::Occupied(previous_node_entry) = previous_nodes.entry(removed_node_id) {
        let previous_node_ref = previous_node_entry.get();

        if previous_node_ref.chitchat_id().generation_id == removed_chitchat_id.generation_id {
            info!(
                node_id=%removed_chitchat_id.node_id,
                generation_id=%removed_chitchat_id.generation_id,
                "node `{}` has left the cluster",
                removed_chitchat_id.node_id
            );
            let previous_node = previous_node_entry.remove();

            if previous_node.is_ready() {
                return Some(ClusterChange::Remove(previous_node));
            }
        }
    };
    None
}

fn try_new_node_with_channel(
    cluster_id: &str,
    chitchat_id: &ChitchatId,
    node_state: &NodeState,
    channel: Channel,
    is_self_node: bool,
) -> Option<ClusterNode> {
    match ClusterNode::try_new(chitchat_id.clone(), node_state, channel, is_self_node) {
        Ok(node) => Some(node),
        Err(error) => {
            warn!(
                cluster_id=%cluster_id,
                node_id=%chitchat_id.node_id,
                error=%error,
                "failed to create cluster node from Chitchat node state"
            );
            None
        }
    }
}

async fn try_new_node(
    cluster_id: &str,
    chitchat_id: &ChitchatId,
    node_state: &NodeState,
    is_self_node: bool,
    grpc_config: &ClientGrpcConfig,
) -> Option<ClusterNode> {
    match node_state.grpc_advertise_addr() {
        Ok(socket_addr) => {
            let channel = make_channel(socket_addr, grpc_config.clone()).await;
            try_new_node_with_channel(cluster_id, chitchat_id, node_state, channel, is_self_node)
        }
        Err(error) => {
            warn!(
                cluster_id=%cluster_id,
                node_id=%chitchat_id.node_id,
                error=%error,
                "failed to read or parse gRPC advertise address"
            );
            None
        }
    }
}

#[cfg(any(test, feature = "testsuite"))]
pub mod for_test {
    use std::sync::{Arc, Mutex};

    use tokio::sync::mpsc;

    use super::*;

    #[derive(Clone, Default)]
    pub struct ClusterChangeStreamFactoryForTest {
        inner: Arc<Mutex<Option<mpsc::UnboundedSender<ClusterChange>>>>,
    }

    impl ClusterChangeStreamFactoryForTest {
        pub fn change_stream_tx(&self) -> mpsc::UnboundedSender<ClusterChange> {
            self.inner.lock().unwrap().take().unwrap()
        }
    }

    impl ClusterChangeStreamFactory for ClusterChangeStreamFactoryForTest {
        fn create(&self) -> ClusterChangeStream {
            let (change_stream, change_stream_tx) = ClusterChangeStream::new_unbounded();
            *self.inner.lock().unwrap() = Some(change_stream_tx);
            change_stream
        }
    }
}

#[cfg(test)]
pub(crate) mod tests {
    use std::collections::HashSet;
    use std::net::SocketAddr;

    use itertools::Itertools;
    use quickwit_config::service::QuickwitService;
    use tonic::transport::Channel;

    use super::*;
    use crate::member::{
        ENABLED_SERVICES_KEY, GRPC_ADVERTISE_ADDR_KEY, READINESS_KEY, READINESS_VALUE_NOT_READY,
        READINESS_VALUE_READY,
    };

    pub(crate) struct NodeStateBuilder {
        enabled_services: HashSet<QuickwitService>,
        grpc_advertise_addr: SocketAddr,
        readiness: bool,
        key_values: Vec<(String, String)>,
    }

    impl Default for NodeStateBuilder {
        fn default() -> Self {
            Self {
                enabled_services: QuickwitService::supported_services(),
                grpc_advertise_addr: "127.0.0.1:7281".parse().unwrap(),
                readiness: false,
                key_values: Vec::new(),
            }
        }
    }

    impl NodeStateBuilder {
        pub(crate) fn with_grpc_advertise_addr(mut self, grpc_advertise_addr: SocketAddr) -> Self {
            self.grpc_advertise_addr = grpc_advertise_addr;
            self
        }

        pub(crate) fn with_readiness(mut self, readiness: bool) -> Self {
            self.readiness = readiness;
            self
        }

        pub(crate) fn with_key_value(mut self, key: &str, value: &str) -> Self {
            self.key_values.push((key.to_string(), value.to_string()));
            self
        }

        pub(crate) fn build(self) -> NodeState {
            let mut node_state = NodeState::for_test();

            node_state.set(
                ENABLED_SERVICES_KEY,
                self.enabled_services
                    .iter()
                    .map(|service| service.as_str())
                    .join(","),
            );
            node_state.set(
                GRPC_ADVERTISE_ADDR_KEY,
                self.grpc_advertise_addr.to_string(),
            );
            node_state.set(
                READINESS_KEY,
                if self.readiness {
                    READINESS_VALUE_READY
                } else {
                    READINESS_VALUE_NOT_READY
                },
            );
            for (key, value) in self.key_values {
                node_state.set(key, value);
            }
            node_state
        }
    }

    #[tokio::test]
    async fn test_compute_cluster_change_events_on_added() {
        let cluster_id = "test-cluster".to_string();
        let self_port = 1234;
        let self_chitchat_id = ChitchatId::for_local_test(self_port);
        {
            // New node joins the cluster with an invalid gRPC advertise address.
            let port = 1235;
            let new_chitchat_id = ChitchatId::for_local_test(port);
            let mut new_node_state = NodeStateBuilder::default().build();
            new_node_state.set(GRPC_ADVERTISE_ADDR_KEY, "bogus-grpc-advertise-addr");
            let mut previous_nodes = BTreeMap::new();

            let events = compute_cluster_change_events_on_added(
                &cluster_id,
                &self_chitchat_id,
                &new_chitchat_id,
                &new_node_state,
                &mut previous_nodes,
                Default::default(),
            )
            .await;
            assert!(events.is_empty());
            assert!(previous_nodes.is_empty());
        }
        {
            // New node joins the cluster but is not ready.
            let port = 1235;
            let grpc_advertise_addr: SocketAddr = ([127, 0, 0, 1], port + 1).into();
            let new_chitchat_id = ChitchatId::for_local_test(port);
            let new_node_state = NodeStateBuilder::default()
                .with_grpc_advertise_addr(grpc_advertise_addr)
                .with_readiness(false)
                .build();
            let mut previous_nodes = BTreeMap::new();

            let events = compute_cluster_change_events_on_added(
                &cluster_id,
                &self_chitchat_id,
                &new_chitchat_id,
                &new_node_state,
                &mut previous_nodes,
                Default::default(),
            )
            .await;
            assert!(events.is_empty());

            let node = previous_nodes.get(&new_chitchat_id.node_id).unwrap();

            assert_eq!(node.chitchat_id(), &new_chitchat_id);
            assert_eq!(node.grpc_advertise_addr(), grpc_advertise_addr);
            assert!(!node.is_self_node());
            assert!(!node.is_ready());
        }
        {
            // New node joins the cluster and is ready.
            let port = 1235;
            let grpc_advertise_addr: SocketAddr = ([127, 0, 0, 1], port + 1).into();
            let new_chitchat_id = ChitchatId::for_local_test(port);
            let new_node_state = NodeStateBuilder::default()
                .with_grpc_advertise_addr(grpc_advertise_addr)
                .with_readiness(true)
                .build();
            let mut previous_nodes = BTreeMap::new();

            let events = compute_cluster_change_events_on_added(
                &cluster_id,
                &self_chitchat_id,
                &new_chitchat_id,
                &new_node_state,
                &mut previous_nodes,
                Default::default(),
            )
            .await;

            let ClusterChange::Add(node) = &events[0] else {
                panic!("expected `ClusterChange::Add` event, got `{:?}`", events[0]);
            };
            assert_eq!(node.chitchat_id(), &new_chitchat_id);
            assert_eq!(node.grpc_advertise_addr(), grpc_advertise_addr);
            assert!(!node.is_self_node());
            assert!(node.is_ready());
            assert_eq!(previous_nodes.get(&new_chitchat_id.node_id).unwrap(), node);

            // Node rejoins with same node ID but newer generation ID.
            let mut rejoined_chitchat_id = ChitchatId::for_local_test(port);
            rejoined_chitchat_id.generation_id += 1;

            let events = compute_cluster_change_events_on_added(
                &cluster_id,
                &self_chitchat_id,
                &rejoined_chitchat_id,
                &new_node_state,
                &mut previous_nodes,
                Default::default(),
            )
            .await;
            assert_eq!(events.len(), 2);

            let ClusterChange::Remove(removed_node) = &events[0] else {
                panic!(
                    "expected `ClusterChange::Remove` event, got `{:?}`",
                    events[0]
                );
            };
            assert_eq!(removed_node.chitchat_id(), &new_chitchat_id);

            let ClusterChange::Add(rejoined_node) = &events[1] else {
                panic!("expected `ClusterChange::Add` event, got `{:?}`", events[1]);
            };
            assert_eq!(rejoined_node.chitchat_id(), &rejoined_chitchat_id);
            assert_eq!(
                previous_nodes.get(&rejoined_chitchat_id.node_id).unwrap(),
                rejoined_node
            );

            // Node comes back from the dead with an older generation ID.
            let events = compute_cluster_change_events_on_added(
                &cluster_id,
                &self_chitchat_id,
                &new_chitchat_id,
                &new_node_state,
                &mut previous_nodes,
                Default::default(),
            )
            .await;
            assert!(events.is_empty());
            assert_eq!(
                previous_nodes.get(&rejoined_chitchat_id.node_id).unwrap(),
                rejoined_node
            );
        }
        {
            // Self node joins the cluster and is ready.
            let grpc_advertise_addr: SocketAddr = ([127, 0, 0, 1], self_port + 1).into();
            let new_chitchat_id = self_chitchat_id.clone();
            let new_node_state = NodeStateBuilder::default()
                .with_grpc_advertise_addr(grpc_advertise_addr)
                .with_readiness(true)
                .build();
            let mut previous_nodes = BTreeMap::new();

            let events = compute_cluster_change_events_on_added(
                &cluster_id,
                &self_chitchat_id,
                &new_chitchat_id,
                &new_node_state,
                &mut previous_nodes,
                Default::default(),
            )
            .await;
            assert_eq!(events.len(), 1);

            let ClusterChange::Add(node) = &events[0] else {
                panic!("expected `ClusterChange::Add` event, got `{:?}`", events[0]);
            };
            assert_eq!(node.chitchat_id(), &new_chitchat_id);
            assert_eq!(node.grpc_advertise_addr(), grpc_advertise_addr);
            assert!(node.is_self_node());
            assert!(node.is_ready());
            assert_eq!(previous_nodes.get(&new_chitchat_id.node_id).unwrap(), node);
        }
    }

    #[tokio::test]
    async fn test_compute_cluster_change_events_on_updated() {
        let cluster_id = "test-cluster".to_string();
        let self_port = 1234;
        let self_chitchat_id = ChitchatId::for_local_test(self_port);
        {
            // Node becomes ready.
            let port = 1235;
            let grpc_advertise_addr: SocketAddr = ([127, 0, 0, 1], port + 1).into();
            let updated_chitchat_id = ChitchatId::for_local_test(port);
            let updated_node_id: NodeId = updated_chitchat_id.node_id.clone().into();
            let previous_node_state = NodeStateBuilder::default()
                .with_grpc_advertise_addr(grpc_advertise_addr)
                .with_readiness(false)
                .build();
            let previous_channel = Channel::from_static("http://127.0.0.1:12345/").connect_lazy();
            let is_self_node = true;
            let previous_node = ClusterNode::try_new(
                updated_chitchat_id.clone(),
                &previous_node_state,
                previous_channel,
                is_self_node,
            )
            .unwrap();
            let mut previous_nodes = BTreeMap::from_iter([(updated_node_id, previous_node)]);

            let updated_node_state = NodeStateBuilder::default()
                .with_grpc_advertise_addr(grpc_advertise_addr)
                .with_readiness(true)
                .with_key_value("my-key", "my-value")
                .build();
            let event = compute_cluster_change_events_on_updated(
                &cluster_id,
                &self_chitchat_id,
                &updated_chitchat_id,
                &updated_node_state,
                &mut previous_nodes,
            )
            .await
            .unwrap();
            let ClusterChange::Add(node) = event else {
                panic!("expected `ClusterChange::Add` event, got `{event:?}`");
            };
            assert_eq!(node.chitchat_id(), &updated_chitchat_id);
            assert_eq!(node.grpc_advertise_addr(), grpc_advertise_addr);
            assert!(node.is_ready());
            assert!(!node.is_self_node());
            assert_eq!(
                previous_nodes.get(&updated_chitchat_id.node_id).unwrap(),
                &node
            );
        }
        {
            // Node changes.
            let port = 1235;
            let grpc_advertise_addr: SocketAddr = ([127, 0, 0, 1], port + 1).into();
            let updated_chitchat_id = ChitchatId::for_local_test(port);
            let updated_node_id: NodeId = updated_chitchat_id.node_id.clone().into();
            let previous_node_state = NodeStateBuilder::default()
                .with_grpc_advertise_addr(grpc_advertise_addr)
                .with_readiness(true)
                .build();
            let previous_channel = Channel::from_static("http://127.0.0.1:12345/").connect_lazy();
            let is_self_node = true;
            let previous_node = ClusterNode::try_new(
                updated_chitchat_id.clone(),
                &previous_node_state,
                previous_channel,
                is_self_node,
            )
            .unwrap();
            let mut previous_nodes = BTreeMap::from_iter([(updated_node_id, previous_node)]);

            let updated_node_state = NodeStateBuilder::default()
                .with_grpc_advertise_addr(grpc_advertise_addr)
                .with_readiness(true)
                .with_key_value("my-key", "my-value")
                .build();
            let event = compute_cluster_change_events_on_updated(
                &cluster_id,
                &self_chitchat_id,
                &updated_chitchat_id,
                &updated_node_state,
                &mut previous_nodes,
            )
            .await
            .unwrap();

            let ClusterChange::Update { updated, .. } = event else {
                panic!("expected `ClusterChange::Remove` event, got `{event:?}`");
            };
            assert_eq!(updated.chitchat_id(), &updated_chitchat_id);
            assert_eq!(updated.grpc_advertise_addr(), grpc_advertise_addr);
            assert!(!updated.is_self_node());
            assert!(updated.is_ready());
            assert_eq!(
                previous_nodes.get(&updated_chitchat_id.node_id).unwrap(),
                &updated
            );
        }
        {
            // Node is no longer ready.
            let port = 1235;
            let grpc_advertise_addr: SocketAddr = ([127, 0, 0, 1], port + 1).into();
            let updated_chitchat_id = ChitchatId::for_local_test(port);
            let updated_node_id: NodeId = updated_chitchat_id.node_id.clone().into();
            let previous_node_state = NodeStateBuilder::default()
                .with_grpc_advertise_addr(grpc_advertise_addr)
                .with_readiness(true)
                .build();
            let previous_channel = Channel::from_static("http://127.0.0.1:12345/").connect_lazy();
            let is_self_node = true;
            let previous_node = ClusterNode::try_new(
                updated_chitchat_id.clone(),
                &previous_node_state,
                previous_channel,
                is_self_node,
            )
            .unwrap();
            let mut previous_nodes = BTreeMap::from_iter([(updated_node_id, previous_node)]);

            let updated_node_state = NodeStateBuilder::default()
                .with_grpc_advertise_addr(grpc_advertise_addr)
                .with_readiness(false)
                .with_key_value("my-key", "my-value")
                .build();
            let event = compute_cluster_change_events_on_updated(
                &cluster_id,
                &self_chitchat_id,
                &updated_chitchat_id,
                &updated_node_state,
                &mut previous_nodes,
            )
            .await
            .unwrap();
            let ClusterChange::Remove(node) = event else {
                panic!("expected `ClusterChange::Remove` event, got `{event:?}`");
            };
            assert_eq!(node.chitchat_id(), &updated_chitchat_id);
            assert_eq!(node.grpc_advertise_addr(), grpc_advertise_addr);
            assert!(!node.is_self_node());
            assert!(!node.is_ready());
            assert_eq!(
                previous_nodes.get(&updated_chitchat_id.node_id).unwrap(),
                &node
            );
        }
        {
            // Ignore node update with a lower generation ID.
            let port = 1235;
            let grpc_advertise_addr: SocketAddr = ([127, 0, 0, 1], port + 1).into();
            let updated_chitchat_id = ChitchatId::for_local_test(port);
            let updated_node_id: NodeId = updated_chitchat_id.node_id.clone().into();
            let mut previous_chitchat_id = updated_chitchat_id.clone();
            previous_chitchat_id.generation_id += 1;
            let previous_node_state = NodeStateBuilder::default()
                .with_grpc_advertise_addr(grpc_advertise_addr)
                .with_readiness(true)
                .build();
            let previous_channel = Channel::from_static("http://127.0.0.1:12345/").connect_lazy();
            let is_self_node = true;
            let previous_node = ClusterNode::try_new(
                previous_chitchat_id.clone(),
                &previous_node_state,
                previous_channel,
                is_self_node,
            )
            .unwrap();
            let mut previous_nodes =
                BTreeMap::from_iter([(updated_node_id, previous_node.clone())]);

            let updated_node_state = NodeStateBuilder::default()
                .with_grpc_advertise_addr(grpc_advertise_addr)
                .with_readiness(false)
                .with_key_value("my-key", "my-value")
                .build();
            let event_opt = compute_cluster_change_events_on_updated(
                &cluster_id,
                &self_chitchat_id,
                &updated_chitchat_id,
                &updated_node_state,
                &mut previous_nodes,
            )
            .await;
            assert!(event_opt.is_none());

            assert_eq!(
                previous_nodes.get(&updated_chitchat_id.node_id).unwrap(),
                &previous_node
            );
        }
    }

    #[tokio::test]
    async fn test_compute_cluster_change_events_on_removed() {
        {
            // Node leaves the cluster but it's missing from the previous live nodes.
            let port = 1235;
            let removed_chitchat_id = ChitchatId::for_local_test(port);
            let mut previous_nodes = BTreeMap::default();

            let event_opt =
                compute_cluster_change_events_on_removed(&removed_chitchat_id, &mut previous_nodes);
            assert!(event_opt.is_none());
        }
        {
            // Node leaves the cluster in not ready state.
            let port = 1235;
            let grpc_advertise_addr: SocketAddr = ([127, 0, 0, 1], port + 1).into();
            let removed_chitchat_id = ChitchatId::for_local_test(port);
            let removed_node_id: NodeId = removed_chitchat_id.node_id.clone().into();
            let previous_node_state = NodeStateBuilder::default()
                .with_grpc_advertise_addr(grpc_advertise_addr)
                .with_readiness(false)
                .build();
            let previous_channel = Channel::from_static("http://127.0.0.1:12345/").connect_lazy();
            let is_self_node = true;
            let previous_node = ClusterNode::try_new(
                removed_chitchat_id.clone(),
                &previous_node_state,
                previous_channel,
                is_self_node,
            )
            .unwrap();
            let mut previous_nodes = BTreeMap::from_iter([(removed_node_id, previous_node)]);

            let event_opt =
                compute_cluster_change_events_on_removed(&removed_chitchat_id, &mut previous_nodes);
            assert!(event_opt.is_none());
            assert!(!previous_nodes.contains_key(&removed_chitchat_id.node_id));
        }
        {
            // Node leaves the cluster in ready state.
            let port = 1235;
            let grpc_advertise_addr: SocketAddr = ([127, 0, 0, 1], port + 1).into();
            let removed_chitchat_id = ChitchatId::for_local_test(port);
            let removed_node_id: NodeId = removed_chitchat_id.node_id.clone().into();
            let removed_node_state = NodeStateBuilder::default()
                .with_grpc_advertise_addr(grpc_advertise_addr)
                .with_readiness(true)
                .build();
            let channel = Channel::from_static("http://127.0.0.1:12345/").connect_lazy();
            let removed_node = ClusterNode::try_new(
                removed_chitchat_id.clone(),
                &removed_node_state,
                channel,
                false,
            )
            .unwrap();
            let mut previous_nodes = BTreeMap::from_iter([(removed_node_id.clone(), removed_node)]);

            let event =
                compute_cluster_change_events_on_removed(&removed_chitchat_id, &mut previous_nodes)
                    .unwrap();

            let ClusterChange::Remove(node) = event else {
                panic!("expected `ClusterChange::Remove` event, got `{event:?}`");
            };
            assert_eq!(node.chitchat_id(), &removed_chitchat_id);
            assert_eq!(node.grpc_advertise_addr(), grpc_advertise_addr);
            assert!(!node.is_self_node());
            assert!(node.is_ready());
            assert!(!previous_nodes.contains_key(&removed_chitchat_id.node_id));
        }
        {
            // Node leaves the cluster in ready state but in the meantime it has rejoined the
            // cluster with a newer generation ID.
            let port = 1235;
            let grpc_advertise_addr: SocketAddr = ([127, 0, 0, 1], port + 1).into();
            let removed_chitchat_id = ChitchatId::for_local_test(port);

            let mut rejoined_chitchat_id = removed_chitchat_id.clone();
            rejoined_chitchat_id.generation_id += 1;
            let rejoined_node_id: NodeId = rejoined_chitchat_id.node_id.clone().into();
            let rejoined_node_state = NodeStateBuilder::default()
                .with_grpc_advertise_addr(grpc_advertise_addr)
                .with_readiness(true)
                .build();
            let channel = Channel::from_static("http://127.0.0.1:12345/").connect_lazy();
            let rejoined_node = ClusterNode::try_new(
                rejoined_chitchat_id.clone(),
                &rejoined_node_state,
                channel,
                false,
            )
            .unwrap();
            let mut previous_nodes =
                BTreeMap::from_iter([(rejoined_node_id.clone(), rejoined_node.clone())]);

            let event_opt =
                compute_cluster_change_events_on_removed(&removed_chitchat_id, &mut previous_nodes);
            assert!(event_opt.is_none());
            assert_eq!(
                previous_nodes.get(&rejoined_node_id).unwrap(),
                &rejoined_node
            );
        }
    }

    #[tokio::test]
    async fn test_compute_cluster_change_events() {
        let cluster_id = "test-cluster".to_string();
        let self_port = 1234;
        let self_chitchat_id = ChitchatId::for_local_test(self_port);
        let self_node_id: NodeId = self_chitchat_id.node_id.clone().into();
        {
            let mut previous_nodes = BTreeMap::default();
            let previous_node_states = BTreeMap::default();
            let new_node_states = BTreeMap::default();
            let events = compute_cluster_change_events(
                &cluster_id,
                &self_chitchat_id,
                &mut previous_nodes,
                &previous_node_states,
                &new_node_states,
                &Default::default(),
            )
            .await;
            assert!(events.is_empty());
        }
        {
            // Node remained unchanged.
            let previous_node_state = NodeStateBuilder::default().with_readiness(true).build();
            let previous_channel = Channel::from_static("http://127.0.0.1:12345/").connect_lazy();
            let is_self_node = true;
            let previous_node = ClusterNode::try_new(
                self_chitchat_id.clone(),
                &previous_node_state,
                previous_channel,
                is_self_node,
            )
            .unwrap();
            let mut previous_nodes = BTreeMap::from_iter([(self_node_id.clone(), previous_node)]);
            let previous_node_states =
                BTreeMap::from_iter([(self_chitchat_id.clone(), previous_node_state)]);

            let new_node_state = NodeStateBuilder::default().with_readiness(true).build();
            let new_node_states = BTreeMap::from_iter([(self_chitchat_id.clone(), new_node_state)]);

            let events = compute_cluster_change_events(
                &cluster_id,
                &self_chitchat_id,
                &mut previous_nodes,
                &previous_node_states,
                &new_node_states,
                &Default::default(),
            )
            .await;
            assert!(events.is_empty());
        }
        {
            // Node joins the cluster.
            let mut previous_nodes = BTreeMap::default();
            let previous_node_states = BTreeMap::default();
            let new_chitchat_id = ChitchatId::for_local_test(self_port + 1);
            let new_node_state = NodeStateBuilder::default().with_readiness(true).build();
            let new_node_states = BTreeMap::from_iter([(new_chitchat_id, new_node_state)]);
            let events = compute_cluster_change_events(
                &cluster_id,
                &self_chitchat_id,
                &mut previous_nodes,
                &previous_node_states,
                &new_node_states,
                &Default::default(),
            )
            .await;
            assert_eq!(events.len(), 1);

            let ClusterChange::Add(_node) = events[0].clone() else {
                panic!("expected `ClusterChange::Add` event, got `{:?}`", events[0]);
            };

            let events = compute_cluster_change_events(
                &cluster_id,
                &self_chitchat_id,
                &mut previous_nodes,
                &new_node_states,
                &new_node_states,
                &Default::default(),
            )
            .await;
            assert_eq!(events.len(), 0);
        }
        {
            // Node changes.
            let previous_node_state = NodeStateBuilder::default().with_readiness(true).build();
            let previous_channel = Channel::from_static("http://127.0.0.1:12345/").connect_lazy();
            let is_self_node = true;
            let previous_node = ClusterNode::try_new(
                self_chitchat_id.clone(),
                &previous_node_state,
                previous_channel,
                is_self_node,
            )
            .unwrap();
            let mut previous_nodes = BTreeMap::from_iter([(self_node_id, previous_node)]);
            let previous_node_states =
                BTreeMap::from_iter([(self_chitchat_id.clone(), previous_node_state)]);

            let new_node_state = NodeStateBuilder::default()
                .with_readiness(true)
                .with_key_value("my-key", "my-value")
                .build();
            let new_node_states = BTreeMap::from_iter([(self_chitchat_id.clone(), new_node_state)]);

            let events = compute_cluster_change_events(
                &cluster_id,
                &self_chitchat_id,
                &mut previous_nodes,
                &previous_node_states,
                &new_node_states,
                &Default::default(),
            )
            .await;
            assert_eq!(events.len(), 1);

            let ClusterChange::Update { .. } = events[0].clone() else {
                panic!(
                    "Expected `ClusterChange::Update` event, got `{:?}`",
                    events[0]
                );
            };

            // Node leaves the cluster.
            let new_node_states = BTreeMap::default();
            let events = compute_cluster_change_events(
                &cluster_id,
                &self_chitchat_id,
                &mut previous_nodes,
                &previous_node_states,
                &new_node_states,
                &Default::default(),
            )
            .await;
            assert_eq!(events.len(), 1);

            let ClusterChange::Remove(_node) = events[0].clone() else {
                panic!(
                    "Expected `ClusterChange::Remove` event, got `{:?}`",
                    events[0]
                );
            };
        }
    }
}


================================================
FILE: quickwit/quickwit-cluster/src/cluster.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::{BTreeMap, HashMap, HashSet};
use std::fmt::{Debug, Display};
use std::net::SocketAddr;
use std::str::FromStr;
use std::sync::Arc;
use std::time::Duration;

use anyhow::Context;
use chitchat::transport::Transport;
use chitchat::{
    Chitchat, ChitchatConfig, ChitchatHandle, ChitchatId, ClusterStateSnapshot,
    FailureDetectorConfig, KeyChangeEvent, ListenerHandle, NodeState, spawn_chitchat,
};
use itertools::Itertools;
use quickwit_common::tower::ClientGrpcConfig;
use quickwit_proto::indexing::{IndexingPipelineId, IndexingTask, PipelineMetrics};
use quickwit_proto::types::{NodeId, NodeIdRef, PipelineUid, ShardId};
use serde::{Deserialize, Serialize};
use tokio::sync::{Mutex, RwLock, mpsc, watch};
use tokio::time::timeout;
use tokio_stream::StreamExt;
use tokio_stream::wrappers::WatchStream;
use tracing::{info, warn};

use crate::change::{ClusterChange, ClusterChangeStreamFactory, compute_cluster_change_events};
use crate::grpc_gossip::spawn_catchup_callback_task;
use crate::member::{
    AVAILABILITY_ZONE_KEY, ClusterMember, ENABLED_SERVICES_KEY, GRPC_ADVERTISE_ADDR_KEY,
    NodeStateExt, PIPELINE_METRICS_PREFIX, READINESS_KEY, READINESS_VALUE_NOT_READY,
    READINESS_VALUE_READY, build_cluster_member,
};
use crate::metrics::spawn_metrics_task;
use crate::{ClusterChangeStream, ClusterNode};

const MARKED_FOR_DELETION_GRACE_PERIOD: Duration = if cfg!(any(test, feature = "testsuite")) {
    Duration::from_millis(2_500) // 2.5 secs
} else {
    Duration::from_secs(3_600 * 2) // 2 hours.
};

// An indexing task key is formatted as
// `{INDEXING_TASK_PREFIX}{PIPELINE_ULID}`.
const INDEXING_TASK_PREFIX: &str = "indexer.task:";

#[derive(Clone)]
pub struct Cluster {
    cluster_id: String,
    self_chitchat_id: ChitchatId,
    /// Socket address (UDP) the node listens on for receiving gossip messages.
    pub gossip_listen_addr: SocketAddr,
    // TODO this object contains a tls config. We might want to change it to a
    // ArcSwap<ClientGrpcConfig> or something so that some task can watch for new certificates
    // and update this (hot reloading)
    client_grpc_config: ClientGrpcConfig,
    gossip_interval: Duration,
    inner: Arc<RwLock<InnerCluster>>,
}

impl Debug for Cluster {
    fn fmt(&self, formatter: &mut std::fmt::Formatter) -> std::fmt::Result {
        formatter
            .debug_struct("Cluster")
            .field("cluster_id", &self.cluster_id)
            .field("self_node_id", &self.self_chitchat_id.node_id)
            .field("gossip_listen_addr", &self.gossip_listen_addr)
            .field(
                "gossip_advertise_addr",
                &self.self_chitchat_id.gossip_advertise_addr,
            )
            .field("gossip_interval", &self.gossip_interval)
            .finish()
    }
}

impl Cluster {
    pub fn cluster_id(&self) -> &str {
        &self.cluster_id
    }

    pub fn self_chitchat_id(&self) -> &ChitchatId {
        &self.self_chitchat_id
    }

    pub fn self_node_id(&self) -> &NodeIdRef {
        NodeIdRef::from_str(&self.self_chitchat_id.node_id)
    }

    pub fn gossip_listen_addr(&self) -> SocketAddr {
        self.gossip_listen_addr
    }

    pub fn gossip_advertise_addr(&self) -> SocketAddr {
        self.self_chitchat_id.gossip_advertise_addr
    }

    #[allow(clippy::too_many_arguments)]
    pub async fn join(
        cluster_id: String,
        self_node: ClusterMember,
        gossip_listen_addr: SocketAddr,
        peer_seed_addrs: Vec<String>,
        gossip_interval: Duration,
        failure_detector_config: FailureDetectorConfig,
        transport: &dyn Transport,
        client_grpc_config: ClientGrpcConfig,
    ) -> anyhow::Result<Self> {
        info!(
            cluster_id=%cluster_id,
            node_id=%self_node.node_id,
            generation_id=self_node.generation_id.as_u64(),
            enabled_services=?self_node.enabled_services,
            gossip_listen_addr=%gossip_listen_addr,
            gossip_advertise_addr=%self_node.gossip_advertise_addr,
            grpc_advertise_addr=%self_node.grpc_advertise_addr,
            peer_seed_addrs=%peer_seed_addrs.join(", "),
            "joining cluster"
        );
        // Set up catchup callback and extra liveness predicate functions.
        let (catchup_callback_tx, catchup_callback_rx) = watch::channel(());
        let catchup_callback = move || {
            let _ = catchup_callback_tx.send(());
        };
        let extra_liveness_predicate = |node_state: &NodeState| {
            [ENABLED_SERVICES_KEY, GRPC_ADVERTISE_ADDR_KEY]
                .iter()
                .all(|key| node_state.contains_key(key))
        };
        let chitchat_config = ChitchatConfig {
            cluster_id: cluster_id.clone(),
            chitchat_id: self_node.chitchat_id(),
            listen_addr: gossip_listen_addr,
            seed_nodes: peer_seed_addrs,
            failure_detector_config,
            gossip_interval,
            marked_for_deletion_grace_period: MARKED_FOR_DELETION_GRACE_PERIOD,
            catchup_callback: Some(Box::new(catchup_callback)),
            extra_liveness_predicate: Some(Box::new(extra_liveness_predicate)),
        };
        let mut initial_key_values = vec![
            (
                ENABLED_SERVICES_KEY.to_string(),
                self_node.enabled_services.iter().join(","),
            ),
            (
                GRPC_ADVERTISE_ADDR_KEY.to_string(),
                self_node.grpc_advertise_addr.to_string(),
            ),
            (
                READINESS_KEY.to_string(),
                READINESS_VALUE_NOT_READY.to_string(),
            ),
        ];

        if let Some(az) = &self_node.availability_zone {
            initial_key_values.push((AVAILABILITY_ZONE_KEY.to_string(), az.clone()));
        }
        let chitchat_handle =
            spawn_chitchat(chitchat_config, initial_key_values, transport).await?;

        let chitchat = chitchat_handle.chitchat();
        let chitchat_guard = chitchat.lock().await;
        let live_nodes_rx = chitchat_guard.live_nodes_watcher();
        let live_nodes_stream = chitchat_guard.live_nodes_watch_stream();
        let (ready_members_tx, ready_members_rx) = watch::channel(Vec::new());
        spawn_ready_members_task(cluster_id.clone(), live_nodes_stream, ready_members_tx);
        drop(chitchat_guard);

        let weak_chitchat = Arc::downgrade(&chitchat);
        spawn_metrics_task(weak_chitchat.clone(), self_node.chitchat_id());

        spawn_catchup_callback_task(
            cluster_id.clone(),
            self_node.chitchat_id(),
            weak_chitchat,
            live_nodes_rx,
            catchup_callback_rx.clone(),
            client_grpc_config.clone(),
        )
        .await;

        let inner = InnerCluster {
            cluster_id: cluster_id.clone(),
            self_chitchat_id: self_node.chitchat_id(),
            chitchat_handle,
            live_nodes: BTreeMap::new(),
            change_stream_subscribers: Vec::new(),
            ready_members_rx,
        };
        let cluster = Cluster {
            cluster_id,
            self_chitchat_id: self_node.chitchat_id(),
            gossip_listen_addr,
            gossip_interval,
            inner: Arc::new(RwLock::new(inner)),
            client_grpc_config,
        };
        spawn_change_stream_task(cluster.clone()).await;
        Ok(cluster)
    }

    /// Deprecated: this is going away soon.
    pub async fn ready_members(&self) -> Vec<ClusterMember> {
        self.inner.read().await.ready_members_rx.borrow().clone()
    }

    /// Deprecated: this is going away soon.
    async fn ready_members_watcher(&self) -> WatchStream<Vec<ClusterMember>> {
        WatchStream::new(self.inner.read().await.ready_members_rx.clone())
    }

    pub async fn ready_nodes(&self) -> Vec<ClusterNode> {
        self.inner
            .write()
            .await
            .live_nodes
            .values()
            .filter(|node| node.is_ready())
            .cloned()
            .collect()
    }

    /// Returns a stream of changes affecting the set of ready nodes in the cluster.
    pub fn change_stream(&self) -> ClusterChangeStream {
        let (change_stream, change_stream_tx) = ClusterChangeStream::new_unbounded();
        let inner = self.inner.clone();
        // We spawn a task so the signature of this function is sync.
        let future = async move {
            let mut inner = inner.write().await;
            for node in inner.live_nodes.values() {
                if node.is_ready() {
                    change_stream_tx
                        .send(ClusterChange::Add(node.clone()))
                        .expect("receiver end of the channel should be open");
                }
            }
            inner.change_stream_subscribers.push(change_stream_tx);
        };
        tokio::spawn(future);
        change_stream
    }

    /// Returns whether the self node is ready.
    pub async fn is_self_node_ready(&self) -> bool {
        self.chitchat()
            .await
            .lock()
            .await
            .node_state(&self.self_chitchat_id)
            .expect("The self node should always be present in the set of live nodes.")
            .is_ready()
    }

    /// Sets the self node's readiness.
    pub async fn set_self_node_readiness(&self, readiness: bool) {
        let readiness_value = if readiness {
            READINESS_VALUE_READY
        } else {
            READINESS_VALUE_NOT_READY
        };
        self.set_self_key_value(READINESS_KEY, readiness_value)
            .await
    }

    /// Sets a key-value pair on the cluster node's state.
    pub async fn set_self_key_value(&self, key: impl Display, value: impl Display) {
        self.chitchat()
            .await
            .lock()
            .await
            .self_node_state()
            .set(key, value);
    }

    /// Sets a key-value pair on the cluster node's state.
    pub async fn set_self_key_value_delete_after_ttl(
        &self,
        key: impl ToString,
        value: impl ToString,
    ) {
        let chitchat = self.chitchat().await;
        let mut chitchat_lock = chitchat.lock().await;
        let chitchat_self_node = chitchat_lock.self_node_state();
        let key = key.to_string();
        chitchat_self_node.set_with_ttl(key.clone(), value);
    }

    pub async fn get_self_key_value(&self, key: &str) -> Option<String> {
        self.chitchat()
            .await
            .lock()
            .await
            .self_node_state()
            .get(key)
            .map(|value| value.to_string())
    }

    pub async fn remove_self_key(&self, key: &str) {
        self.chitchat()
            .await
            .lock()
            .await
            .self_node_state()
            .delete(key)
    }

    pub async fn subscribe(
        &self,
        key_prefix: &str,
        callback: impl Fn(KeyChangeEvent) + Send + Sync + 'static,
    ) -> ListenerHandle {
        self.chitchat()
            .await
            .lock()
            .await
            .subscribe_event(key_prefix, callback)
    }

    /// Waits until the predicate holds true for the set of ready members.
    pub async fn wait_for_ready_members<F>(
        &self,
        mut predicate: F,
        timeout_after: Duration,
    ) -> anyhow::Result<()>
    where
        F: FnMut(&[ClusterMember]) -> bool,
    {
        timeout(
            timeout_after,
            self.ready_members_watcher()
                .await
                .skip_while(|members| !predicate(members))
                .next(),
        )
        .await
        .context("deadline has passed before predicate held true")?;
        Ok(())
    }

    /// Returns a snapshot of the cluster state, including the underlying Chitchat state.
    pub async fn snapshot(&self) -> ClusterSnapshot {
        let chitchat = self.chitchat().await;
        let chitchat_guard = chitchat.lock().await;
        let chitchat_state_snapshot = chitchat_guard.state_snapshot();
        let mut ready_nodes = HashSet::new();
        let mut live_nodes = HashSet::new();

        for chitchat_id in chitchat_guard.live_nodes().cloned() {
            let node_state = chitchat_guard.node_state(&chitchat_id).expect(
                "The node should always be present in the cluster state because we hold the \
                 Chitchat mutex.",
            );
            if node_state.is_ready() {
                ready_nodes.insert(chitchat_id);
            } else {
                live_nodes.insert(chitchat_id);
            }
        }
        let dead_nodes = chitchat_guard.dead_nodes().cloned().collect::<HashSet<_>>();

        ClusterSnapshot {
            cluster_id: self.cluster_id.clone(),
            self_node_id: self.self_chitchat_id.node_id.clone(),
            ready_nodes,
            live_nodes,
            dead_nodes,
            chitchat_state_snapshot,
        }
    }

    #[cfg(any(test, feature = "testsuite"))]
    pub async fn leave(&self) {
        info!(
            cluster_id=%self.cluster_id,
            node_id=%self.self_chitchat_id.node_id,
            "leaving the cluster"
        );
        self.set_self_node_readiness(false).await;
        tokio::time::sleep(self.gossip_interval * 2).await;
    }

    pub async fn initiate_shutdown(&self) -> anyhow::Result<()> {
        self.inner.read().await.chitchat_handle.initiate_shutdown()
    }

    /// This exposes in chitchat some metrics about the CPU usage of cooperative pipelines.
    /// The metrics are exposed as follows:
    /// Key:        pipeline_metrics:<index_uid>:<source_id>
    /// Value:      179m,76MB/s
    pub async fn update_self_node_pipeline_metrics(
        &self,
        pipeline_metrics: &HashMap<&IndexingPipelineId, PipelineMetrics>,
    ) {
        let chitchat = self.chitchat().await;
        let mut chitchat_guard = chitchat.lock().await;
        let node_state = chitchat_guard.self_node_state();
        let mut current_metrics_keys: HashSet<String> = node_state
            .iter_prefix(PIPELINE_METRICS_PREFIX)
            .map(|(key, _)| key.to_string())
            .collect();
        for (pipeline_id, metrics) in pipeline_metrics {
            let key = format!("{PIPELINE_METRICS_PREFIX}{pipeline_id}");
            current_metrics_keys.remove(&key);
            node_state.set(key, metrics.to_string());
        }
        for obsolete_task_key in current_metrics_keys {
            node_state.delete(&obsolete_task_key);
        }
    }

    /// Updates indexing tasks in chitchat state.
    /// Tasks are grouped by (index_id, source_id), each group is stored in a key as follows:
    /// - key: `{INDEXING_TASK_PREFIX}{index_id}{INDEXING_TASK_SEPARATOR}{source_id}`
    /// - value: Number of indexing tasks in the group.
    ///
    /// Keys present in chitchat state but not in the given `indexing_tasks` are marked for
    /// deletion.
    pub async fn update_self_node_indexing_tasks(&self, indexing_tasks: &[IndexingTask]) {
        let chitchat = self.chitchat().await;
        let mut chitchat_guard = chitchat.lock().await;
        let node_state = chitchat_guard.self_node_state();
        set_indexing_tasks_in_node_state(indexing_tasks, node_state);
    }

    pub async fn chitchat(&self) -> Arc<Mutex<Chitchat>> {
        self.inner.read().await.chitchat_handle.chitchat()
    }

    pub async fn chitchat_server_termination_watcher(
        &self,
    ) -> impl Future<Output = anyhow::Result<()>> + use<> {
        self.inner
            .read()
            .await
            .chitchat_handle
            .termination_watcher()
    }
}

impl ClusterChangeStreamFactory for Cluster {
    fn create(&self) -> ClusterChangeStream {
        self.change_stream()
    }
}

/// Deprecated: this is going away soon.
fn spawn_ready_members_task(
    cluster_id: String,
    mut live_nodes_stream: WatchStream<BTreeMap<ChitchatId, NodeState>>,
    ready_members_tx: watch::Sender<Vec<ClusterMember>>,
) {
    let fut = async move {
        while let Some(new_live_nodes) = live_nodes_stream.next().await {
            let mut new_ready_members = Vec::with_capacity(new_live_nodes.len());

            for (chitchat_id, node_state) in new_live_nodes {
                let member = match build_cluster_member(chitchat_id, &node_state) {
                    Ok(member) => member,
                    Err(error) => {
                        warn!(
                            cluster_id=%cluster_id,
                            error=?error,
                            "Failed to build cluster member from Chitchat node state."
                        );
                        continue;
                    }
                };
                if member.is_ready {
                    new_ready_members.push(member);
                }
            }
            if *ready_members_tx.borrow() != new_ready_members
                && ready_members_tx.send(new_ready_members).is_err()
            {
                break;
            }
        }
    };
    tokio::spawn(fut);
}

/// Parses indexing tasks from the chitchat node state.
pub fn parse_indexing_tasks(node_state: &NodeState) -> Vec<IndexingTask> {
    node_state
        .iter_prefix(INDEXING_TASK_PREFIX)
        .map(|(key, versioned_value)| (key, versioned_value.value.as_str()))
        .flat_map(|(key, value)| {
            let indexing_task_opt = chitchat_kv_to_indexing_task(key, value);
            if indexing_task_opt.is_none() {
                warn!(key=%key, value=%value, "failed to parse indexing task from chitchat kv");
            }
            indexing_task_opt
        })
        .collect()
}

/// Writes the given indexing tasks in the given node state.
///
/// If previous indexing tasks were present in the node state but were not in the given tasks, they
/// are marked for deletion.
pub(crate) fn set_indexing_tasks_in_node_state(
    indexing_tasks: &[IndexingTask],
    node_state: &mut NodeState,
) {
    let mut current_indexing_tasks_keys: HashSet<String> = node_state
        .iter_prefix(INDEXING_TASK_PREFIX)
        .map(|(key, _)| key.to_string())
        .collect();
    for indexing_task in indexing_tasks {
        let (key, value) = indexing_task_to_chitchat_kv(indexing_task);
        current_indexing_tasks_keys.remove(&key);
        node_state.set(key, value);
    }
    for obsolete_task_key in current_indexing_tasks_keys {
        node_state.delete(&obsolete_task_key);
    }
}

fn indexing_task_to_chitchat_kv(indexing_task: &IndexingTask) -> (String, String) {
    let IndexingTask {
        index_uid: _,
        source_id,
        shard_ids,
        pipeline_uid: _,
        params_fingerprint: _,
    } = indexing_task;
    let index_uid = indexing_task.index_uid();
    let key = format!("{INDEXING_TASK_PREFIX}{}", indexing_task.pipeline_uid());
    let shard_ids_str = shard_ids.iter().sorted().join(",");
    let fingerprint = indexing_task.params_fingerprint;
    let value = format!("{index_uid}:{source_id}:{fingerprint}:{shard_ids_str}");
    (key, value)
}

fn parse_shard_ids_str(shard_ids_str: &str) -> Vec<ShardId> {
    shard_ids_str
        .split(',')
        .filter(|shard_id_str| !shard_id_str.is_empty())
        .map(ShardId::from)
        .collect()
}

fn chitchat_kv_to_indexing_task(key: &str, value: &str) -> Option<IndexingTask> {
    let pipeline_uid_str = key.strip_prefix(INDEXING_TASK_PREFIX)?;
    let pipeline_uid = PipelineUid::from_str(pipeline_uid_str).ok()?;
    let mut field_iterator = value.rsplitn(4, ':');
    let shards_str = field_iterator.next()?;
    let fingerprint_str = field_iterator.next()?;
    let source_id = field_iterator.next()?;
    let index_uid = field_iterator.next()?;
    let params_fingerprint: u64 = fingerprint_str.parse().ok()?;
    let index_uid = index_uid.parse().ok()?;
    let shard_ids = parse_shard_ids_str(shards_str);
    Some(IndexingTask {
        index_uid: Some(index_uid),
        source_id: source_id.to_string(),
        pipeline_uid: Some(pipeline_uid),
        shard_ids,
        params_fingerprint,
    })
}

async fn spawn_change_stream_task(cluster: Cluster) {
    let cluster_guard = cluster.inner.read().await;
    let cluster_id = cluster_guard.cluster_id.clone();
    let client_grpc_config = cluster.client_grpc_config.clone();
    let self_chitchat_id = cluster_guard.self_chitchat_id.clone();
    let chitchat = cluster_guard.chitchat_handle.chitchat();
    let weak_cluster = Arc::downgrade(&cluster.inner);
    drop(cluster_guard);
    drop(cluster);

    let mut previous_live_node_states = BTreeMap::new();
    let mut live_nodes_watch_stream = chitchat.lock().await.live_nodes_watch_stream();

    let future = async move {
        while let Some(new_live_node_states) = live_nodes_watch_stream.next().await {
            let Some(cluster) = weak_cluster.upgrade() else {
                break;
            };
            let mut cluster_guard = cluster.write().await;
            let previous_live_nodes = &mut cluster_guard.live_nodes;

            let events = compute_cluster_change_events(
                &cluster_id,
                &self_chitchat_id,
                previous_live_nodes,
                &previous_live_node_states,
                &new_live_node_states,
                &client_grpc_config,
            )
            .await;
            if !events.is_empty() {
                cluster_guard
                    .change_stream_subscribers
                    .retain(|change_stream_tx| {
                        events
                            .iter()
                            .all(|event| change_stream_tx.send(event.clone()).is_ok())
                    });
            }
            previous_live_node_states = new_live_node_states;
        }
    };
    tokio::spawn(future);
}

struct InnerCluster {
    cluster_id: String,
    self_chitchat_id: ChitchatId,
    chitchat_handle: ChitchatHandle,
    live_nodes: BTreeMap<NodeId, ClusterNode>,
    change_stream_subscribers: Vec<mpsc::UnboundedSender<ClusterChange>>,
    ready_members_rx: watch::Receiver<Vec<ClusterMember>>,
}

// Not used within the code, used for documentation.
#[derive(Debug, utoipa::ToSchema)]
pub struct NodeIdSchema {
    #[schema(example = "node-1")]
    /// The unique identifier of the node in the cluster.
    pub node_id: String,

    #[schema(example = "1683736537", value_type = u64)]
    /// A numeric identifier incremented every time the node leaves and rejoins the cluster.
    pub generation_id: u64,

    #[schema(example = "127.0.0.1:8000", value_type = String)]
    /// The socket address peers should use to gossip with the node.
    pub gossip_advertise_addr: SocketAddr,
}

#[derive(Debug, Serialize, Deserialize, utoipa::ToSchema)]
pub struct ClusterSnapshot {
    #[schema(example = "qw-cluster-1")]
    /// The ID of the cluster that the node is a part of.
    pub cluster_id: String,

    #[schema(value_type = NodeIdSchema)]
    /// The unique ID of the current node.
    pub self_node_id: String,

    #[schema(value_type  = Vec<NodeIdSchema>)]
    /// The set of cluster node IDs that are ready to handle requests.
    pub ready_nodes: HashSet<ChitchatId>,

    #[schema(value_type  = Vec<NodeIdSchema>)]
    /// The set of cluster node IDs that are alive but not ready.
    pub live_nodes: HashSet<ChitchatId>,

    #[schema(value_type  = Vec<NodeIdSchema>)]
    /// The set of cluster node IDs flagged as dead or faulty.
    pub dead_nodes: HashSet<ChitchatId>,

    #[schema(
        value_type = Object,
        example = json!({
            "key_values": {
                "grpc_advertise_addr": "127.0.0.1:8080",
                "enabled_services": "searcher",
            },
            "max_version": 5,
        })
    )]
    /// A complete snapshot of the Chitchat cluster state.
    pub chitchat_state_snapshot: ClusterStateSnapshot,
}

/// Computes the gRPC port from the listen address for tests.
#[cfg(any(test, feature = "testsuite"))]
pub fn grpc_addr_from_listen_addr_for_test(listen_addr: SocketAddr) -> SocketAddr {
    let grpc_port = listen_addr.port() + 1u16;
    (listen_addr.ip(), grpc_port).into()
}

#[cfg(any(test, feature = "testsuite"))]
pub async fn create_cluster_for_test_with_id(
    node_id: NodeId,
    gossip_advertise_port: u16,
    cluster_id: String,
    peer_seed_addrs: Vec<String>,
    enabled_services: &HashSet<quickwit_config::service::QuickwitService>,
    transport: &dyn Transport,
    self_node_readiness: bool,
) -> anyhow::Result<Cluster> {
    use quickwit_proto::indexing::PIPELINE_FULL_CAPACITY;
    use quickwit_proto::ingest::ingester::IngesterStatus;
    let gossip_advertise_addr: SocketAddr = ([127, 0, 0, 1], gossip_advertise_port).into();
    let self_node = ClusterMember {
        node_id,
        generation_id: crate::GenerationId(1),
        is_ready: self_node_readiness,
        enabled_services: enabled_services.clone(),
        gossip_advertise_addr,
        grpc_advertise_addr: grpc_addr_from_listen_addr_for_test(gossip_advertise_addr),
        indexing_tasks: Vec::new(),
        indexing_cpu_capacity: PIPELINE_FULL_CAPACITY,
        ingester_status: IngesterStatus::default(),
        availability_zone: None,
    };
    let failure_detector_config = create_failure_detector_config_for_test();
    let cluster = Cluster::join(
        cluster_id,
        self_node,
        gossip_advertise_addr,
        peer_seed_addrs,
        Duration::from_millis(25),
        failure_detector_config,
        transport,
        Default::default(),
    )
    .await?;
    cluster.set_self_node_readiness(self_node_readiness).await;
    Ok(cluster)
}

/// Creates a failure detector config for tests.
#[cfg(any(test, feature = "testsuite"))]
fn create_failure_detector_config_for_test() -> FailureDetectorConfig {
    FailureDetectorConfig {
        phi_threshold: 5.0,
        initial_interval: Duration::from_millis(25),
        ..Default::default()
    }
}

/// Creates a local cluster listening on a random port.
#[cfg(any(test, feature = "testsuite"))]
pub async fn create_cluster_for_test(
    seeds: Vec<String>,
    enabled_services: &[&str],
    transport: &dyn Transport,
    self_node_readiness: bool,
) -> anyhow::Result<Cluster> {
    use std::sync::atomic::{AtomicU16, Ordering};

    use quickwit_config::service::QuickwitService;

    static GOSSIP_ADVERTISE_PORT_SEQUENCE: AtomicU16 = AtomicU16::new(1u16);
    let gossip_advertise_port = GOSSIP_ADVERTISE_PORT_SEQUENCE.fetch_add(1, Ordering::Relaxed);
    let node_id: NodeId = format!("node-{gossip_advertise_port}").into();

    let enabled_services = enabled_services
        .iter()
        .map(|service_str| QuickwitService::from_str(service_str))
        .collect::<Result<HashSet<_>, _>>()?;
    let cluster = create_cluster_for_test_with_id(
        node_id,
        gossip_advertise_port,
        "test-cluster".to_string(),
        seeds,
        &enabled_services,
        transport,
        self_node_readiness,
    )
    .await?;
    Ok(cluster)
}

#[cfg(test)]
mod tests {
    use std::collections::HashMap;
    use std::net::SocketAddr;
    use std::time::Duration;

    use chitchat::transport::ChannelTransport;
    use itertools::Itertools;
    use quickwit_common::test_utils::wait_until_predicate;
    use quickwit_config::service::QuickwitService;
    use quickwit_proto::indexing::IndexingTask;
    use quickwit_proto::types::IndexUid;
    use rand::Rng;

    use super::*;

    #[tokio::test]
    async fn test_single_node_cluster_readiness() {
        let transport = ChannelTransport::default();
        let node = create_cluster_for_test(Vec::new(), &[], &transport, false)
            .await
            .unwrap();

        let mut ready_members_watcher = node.ready_members_watcher().await;
        let ready_members = ready_members_watcher.next().await.unwrap();

        assert!(ready_members.is_empty());
        assert!(!node.is_self_node_ready().await);

        let cluster_snapshot = node.snapshot().await;
        assert!(cluster_snapshot.ready_nodes.is_empty());

        let self_node_state = cluster_snapshot
            .chitchat_state_snapshot
            .node_states
            .into_iter()
            .find(|node_state| node_state.chitchat_id() == &node.self_chitchat_id)
            .unwrap();
        assert_eq!(
            self_node_state.get(READINESS_KEY).unwrap(),
            READINESS_VALUE_NOT_READY
        );

        node.set_self_node_readiness(true).await;

        let ready_members = ready_members_watcher.next().await.unwrap();
        assert_eq!(ready_members.len(), 1);
        assert!(node.is_self_node_ready().await);

        let cluster_snapshot = node.snapshot().await;
        assert_eq!(cluster_snapshot.ready_nodes.len(), 1);

        let self_node_state = cluster_snapshot
            .chitchat_state_snapshot
            .node_states
            .into_iter()
            .find(|node_state| node_state.chitchat_id() == &node.self_chitchat_id)
            .unwrap();
        assert_eq!(
            self_node_state.get(READINESS_KEY).unwrap(),
            READINESS_VALUE_READY
        );

        node.set_self_node_readiness(false).await;

        let ready_members = ready_members_watcher.next().await.unwrap();
        assert!(ready_members.is_empty());
        assert!(!node.is_self_node_ready().await);

        let cluster_snapshot = node.snapshot().await;
        assert!(cluster_snapshot.ready_nodes.is_empty());

        let self_node_state = cluster_snapshot
            .chitchat_state_snapshot
            .node_states
            .into_iter()
            .find(|node_state| node_state.chitchat_id() == &node.self_chitchat_id)
            .unwrap();
        assert_eq!(
            self_node_state.get(READINESS_KEY).unwrap(),
            READINESS_VALUE_NOT_READY
        );
        node.leave().await;
    }

    #[tokio::test]
    async fn test_cluster_multiple_nodes() -> anyhow::Result<()> {
        let transport = ChannelTransport::default();
        let node_1 = create_cluster_for_test(Vec::new(), &[], &transport, true).await?;
        let node_1_change_stream = node_1.change_stream();

        let peer_seeds = vec![node_1.gossip_listen_addr.to_string()];
        let node_2 = create_cluster_for_test(peer_seeds, &[], &transport, true).await?;

        let peer_seeds = vec![node_2.gossip_listen_addr.to_string()];
        let node_3 = create_cluster_for_test(peer_seeds, &[], &transport, true).await?;

        let wait_secs = Duration::from_secs(30);

        for node in [&node_1, &node_2, &node_3] {
            node.wait_for_ready_members(|members| members.len() == 3, wait_secs)
                .await
                .unwrap();
        }
        let members: Vec<SocketAddr> = node_1
            .ready_members()
            .await
            .into_iter()
            .map(|member| member.gossip_advertise_addr)
            .sorted()
            .collect();
        let mut expected_members = vec![
            node_1.gossip_listen_addr,
            node_2.gossip_listen_addr,
            node_3.gossip_listen_addr,
        ];
        expected_members.sort();
        assert_eq!(members, expected_members);

        node_2.leave().await;
        node_1
            .wait_for_ready_members(|members| members.len() == 2, wait_secs)
            .await
            .unwrap();

        node_3.leave().await;
        node_1
            .wait_for_ready_members(|members| members.len() == 1, wait_secs)
            .await
            .unwrap();

        node_1.leave().await;
        drop(node_1);

        let cluster_changes: Vec<ClusterChange> = node_1_change_stream.collect().await;
        assert_eq!(cluster_changes.len(), 6);
        assert!(matches!(&cluster_changes[0], ClusterChange::Add(_)));
        assert!(matches!(&cluster_changes[1], ClusterChange::Add(_)));
        assert!(matches!(&cluster_changes[2], ClusterChange::Add(_)));
        assert!(matches!(&cluster_changes[3], ClusterChange::Remove(_)));
        assert!(matches!(&cluster_changes[4], ClusterChange::Remove(_)));
        assert!(matches!(&cluster_changes[5], ClusterChange::Remove(_)));
        Ok(())
    }

    #[tokio::test]
    async fn test_multi_node_cluster_readiness() {
        let transport = ChannelTransport::default();
        let node_1 =
            create_cluster_for_test(Vec::new(), &["searcher", "indexer"], &transport, true)
                .await
                .unwrap();

        let peer_seeds = vec![node_1.gossip_listen_addr.to_string()];
        let node_2 = create_cluster_for_test(peer_seeds, &["indexer"], &transport, false)
            .await
            .unwrap();

        let wait_secs = Duration::from_secs(5);

        // Bother cluster 1 and cluster 2 see only one ready member.
        node_1
            .wait_for_ready_members(|members| members.len() == 1, wait_secs)
            .await
            .unwrap();

        node_2
            .wait_for_ready_members(|members| members.len() == 1, wait_secs)
            .await
            .unwrap();

        // Now, node 2 becomes ready.
        node_2.set_self_node_readiness(true).await;

        // Bother cluster 1 and cluster 2 see only two ready members.
        node_1
            .wait_for_ready_members(|members| members.len() == 2, wait_secs)
            .await
            .unwrap();

        node_2
            .wait_for_ready_members(|members| members.len() == 2, wait_secs)
            .await
            .unwrap();
    }

    #[tokio::test]
    async fn test_cluster_members_built_from_chitchat_state() {
        let transport = ChannelTransport::default();
        let cluster1 = create_cluster_for_test(Vec::new(), &["indexer"], &transport, true)
            .await
            .unwrap();
        let cluster2 = create_cluster_for_test(
            vec![cluster1.gossip_listen_addr.to_string()],
            &["indexer", "metastore"],
            &transport,
            true,
        )
        .await
        .unwrap();
        let index_uid: IndexUid = IndexUid::for_test("index-1", 1);
        let indexing_task1 = IndexingTask {
            pipeline_uid: Some(PipelineUid::for_test(1u128)),
            index_uid: Some(index_uid.clone()),
            source_id: "source-1".to_string(),
            shard_ids: Vec::new(),
            params_fingerprint: 0,
        };
        let indexing_task2 = IndexingTask {
            pipeline_uid: Some(PipelineUid::for_test(2u128)),
            index_uid: Some(index_uid.clone()),
            source_id: "source-1".to_string(),
            shard_ids: Vec::new(),
            params_fingerprint: 0,
        };
        cluster2
            .set_self_key_value(GRPC_ADVERTISE_ADDR_KEY, "127.0.0.1:1001")
            .await;
        cluster2
            .update_self_node_indexing_tasks(&[indexing_task1.clone(), indexing_task2.clone()])
            .await;
        cluster1
            .wait_for_ready_members(|members| members.len() == 2, Duration::from_secs(30))
            .await
            .unwrap();
        let members = cluster1.ready_members().await;
        let member_node_1 = members
            .iter()
            .find(|member| member.chitchat_id() == cluster1.self_chitchat_id)
            .unwrap();
        let member_node_2 = members
            .iter()
            .find(|member| member.chitchat_id() == cluster2.self_chitchat_id)
            .unwrap();
        assert_eq!(
            member_node_1.enabled_services,
            HashSet::from_iter([QuickwitService::Indexer])
        );
        assert!(member_node_1.indexing_tasks.is_empty());
        assert_eq!(
            member_node_2.grpc_advertise_addr,
            ([127, 0, 0, 1], 1001).into()
        );
        assert_eq!(
            member_node_2.enabled_services,
            HashSet::from_iter([QuickwitService::Indexer, QuickwitService::Metastore].into_iter())
        );

        assert_eq!(
            &member_node_2.indexing_tasks,
            &[indexing_task1, indexing_task2]
        );
    }

    #[tokio::test]
    async fn test_chitchat_state_set_high_number_of_tasks() {
        let transport = ChannelTransport::default();
        let cluster1 = create_cluster_for_test(Vec::new(), &["indexer"], &transport, true)
            .await
            .unwrap();
        let cluster2 = Arc::new(
            create_cluster_for_test(
                vec![cluster1.gossip_listen_addr.to_string()],
                &["indexer", "metastore"],
                &transport,
                true,
            )
            .await
            .unwrap(),
        );
        let cluster3 = Arc::new(
            create_cluster_for_test(
                vec![cluster1.gossip_listen_addr.to_string()],
                &["indexer", "metastore"],
                &transport,
                true,
            )
            .await
            .unwrap(),
        );
        let mut random_generator = rand::rng();
        // TODO: increase it back to 1000 when https://github.com/quickwit-oss/chitchat/issues/81 is fixed
        let indexing_tasks = (0..500)
            .map(|pipeline_id| {
                let index_id = random_generator.random_range(0..=10_000);
                let source_id = random_generator.random_range(0..=100);
                IndexingTask {
                    pipeline_uid: Some(PipelineUid::for_test(pipeline_id as u128)),
                    index_uid: Some(
                        format!("index-{index_id}:11111111111111111111111111")
                            .parse()
                            .unwrap(),
                    ),
                    source_id: format!("source-{source_id}"),
                    shard_ids: Vec::new(),
                    params_fingerprint: 0,
                }
            })
            .collect_vec();
        cluster1
            .update_self_node_indexing_tasks(&indexing_tasks)
            .await;
        for cluster in [&cluster2, &cluster3] {
            let cluster_clone = cluster.clone();
            let indexing_tasks_clone = indexing_tasks.clone();
            wait_until_predicate(
                move || {
                    test_indexing_tasks_in_given_node(
                        cluster_clone.clone(),
                        cluster1.self_chitchat_id.gossip_advertise_addr,
                        indexing_tasks_clone.clone(),
                    )
                },
                Duration::from_secs(5),
                Duration::from_millis(100),
            )
            .await
            .unwrap();
        }

        // Mark tasks for deletion.
        cluster1.update_self_node_indexing_tasks(&[]).await;
        for cluster in [&cluster2, &cluster3] {
            let cluster_clone = cluster.clone();
            wait_until_predicate(
                move || {
                    test_indexing_tasks_in_given_node(
                        cluster_clone.clone(),
                        cluster1.self_chitchat_id.gossip_advertise_addr,
                        Vec::new(),
                    )
                },
                Duration::from_secs(4),
                Duration::from_millis(500),
            )
            .await
            .unwrap();
        }

        // Re-add tasks.
        cluster1
            .update_self_node_indexing_tasks(&indexing_tasks)
            .await;
        for cluster in [&cluster2, &cluster3] {
            let cluster_clone = cluster.clone();
            let indexing_tasks_clone = indexing_tasks.clone();
            wait_until_predicate(
                move || {
                    test_indexing_tasks_in_given_node(
                        cluster_clone.clone(),
                        cluster1.self_chitchat_id.gossip_advertise_addr,
                        indexing_tasks_clone.clone(),
                    )
                },
                Duration::from_secs(4),
                Duration::from_millis(500),
            )
            .await
            .unwrap();
        }
    }

    async fn test_indexing_tasks_in_given_node(
        cluster: Arc<Cluster>,
        gossip_advertise_addr: SocketAddr,
        indexing_tasks: Vec<IndexingTask>,
    ) -> bool {
        let members = cluster.ready_members().await;
        let node_opt = members
            .iter()
            .find(|member| member.gossip_advertise_addr == gossip_advertise_addr);
        let Some(node) = node_opt else {
            return false;
        };
        let node_grouped_tasks: HashMap<IndexingTask, usize> = node
            .indexing_tasks
            .iter()
            .chunk_by(|task| (*task).clone())
            .into_iter()
            .map(|(key, group)| (key, group.count()))
            .collect();
        let grouped_tasks: HashMap<IndexingTask, usize> = indexing_tasks
            .iter()
            .chunk_by(|task| (*task).clone())
            .into_iter()
            .map(|(key, group)| (key, group.count()))
            .collect();
        node_grouped_tasks == grouped_tasks
    }

    #[tokio::test]
    async fn test_chitchat_state_with_malformatted_indexing_task_key() {
        let transport = ChannelTransport::default();
        let node = create_cluster_for_test(Vec::new(), &["indexer"], &transport, true)
            .await
            .unwrap();
        {
            let chitchat_handle = node.inner.read().await.chitchat_handle.chitchat();
            let mut chitchat_guard = chitchat_handle.lock().await;
            chitchat_guard.self_node_state().set(
                format!("{INDEXING_TASK_PREFIX}01BX5ZZKBKACTAV9WEVGEMMVS0"),
                "my_index:00000000000000000000000000:my_source:41:1,3".to_string(),
            );
            chitchat_guard.self_node_state().set(
                format!("{INDEXING_TASK_PREFIX}01BX5ZZKBKACTAV9WEVGEMMVS1"),
                "my_index-00000000000000000000000000-my_source:53:3,5".to_string(),
            );
        }
        node.wait_for_ready_members(|members| members.len() == 1, Duration::from_secs(5))
            .await
            .unwrap();
        let ready_members = node.ready_members().await;
        assert_eq!(ready_members[0].indexing_tasks.len(), 1);
    }

    #[tokio::test]
    async fn test_cluster_id_isolation() -> anyhow::Result<()> {
        quickwit_common::setup_logging_for_tests();
        let transport = ChannelTransport::default();

        let cluster1a = create_cluster_for_test_with_id(
            "node-11".into(),
            11,
            "cluster1".to_string(),
            Vec::new(),
            &HashSet::default(),
            &transport,
            true,
        )
        .await?;
        let cluster2a = create_cluster_for_test_with_id(
            "node-21".into(),
            21,
            "cluster2".to_string(),
            vec![cluster1a.gossip_listen_addr.to_string()],
            &HashSet::default(),
            &transport,
            true,
        )
        .await?;
        let cluster1b = create_cluster_for_test_with_id(
            "node-12".into(),
            12,
            "cluster1".to_string(),
            vec![
                cluster1a.gossip_listen_addr.to_string(),
                cluster2a.gossip_listen_addr.to_string(),
            ],
            &HashSet::default(),
            &transport,
            true,
        )
        .await?;
        let cluster2b = create_cluster_for_test_with_id(
            "node-22".into(),
            22,
            "cluster2".to_string(),
            vec![
                cluster1a.gossip_listen_addr.to_string(),
                cluster2a.gossip_listen_addr.to_string(),
            ],
            &HashSet::default(),
            &transport,
            true,
        )
        .await?;

        let wait_secs = Duration::from_secs(10);

        for cluster in [&cluster1a, &cluster2a, &cluster1b, &cluster2b] {
            cluster
                .wait_for_ready_members(|members| members.len() == 2, wait_secs)
                .await
                .unwrap();
        }

        let members_a: Vec<SocketAddr> = cluster1a
            .ready_members()
            .await
            .iter()
            .map(|member| member.gossip_advertise_addr)
            .sorted()
            .collect();
        let mut expected_members_a =
            vec![cluster1a.gossip_listen_addr, cluster1b.gossip_listen_addr];
        expected_members_a.sort();
        assert_eq!(members_a, expected_members_a);

        let members_b: Vec<SocketAddr> = cluster2a
            .ready_members()
            .await
            .iter()
            .map(|member| member.gossip_advertise_addr)
            .sorted()
            .collect();
        let mut expected_members_b =
            vec![cluster2a.gossip_listen_addr, cluster2b.gossip_listen_addr];
        expected_members_b.sort();
        assert_eq!(members_b, expected_members_b);

        Ok(())
    }

    fn test_serialize_indexing_tasks_aux(
        indexing_tasks: &[IndexingTask],
        node_state: &mut NodeState,
    ) {
        set_indexing_tasks_in_node_state(indexing_tasks, node_state);
        let ser_deser_indexing_tasks = parse_indexing_tasks(node_state);
        assert_eq!(indexing_tasks, ser_deser_indexing_tasks);
    }

    #[test]
    fn test_serialize_indexing_tasks() {
        let mut node_state = NodeState::for_test();
        let index_uid: IndexUid = IndexUid::for_test("test-index", 0);
        test_serialize_indexing_tasks_aux(&[], &mut node_state);
        test_serialize_indexing_tasks_aux(
            &[IndexingTask {
                pipeline_uid: Some(PipelineUid::for_test(1u128)),
                index_uid: Some(index_uid.clone()),
                source_id: "my-source1".to_string(),
                shard_ids: vec![ShardId::from(1), ShardId::from(2)],
                params_fingerprint: 0,
            }],
            &mut node_state,
        );
        // change in the set of shards
        test_serialize_indexing_tasks_aux(
            &[IndexingTask {
                pipeline_uid: Some(PipelineUid::for_test(2u128)),
                index_uid: Some(index_uid.clone()),
                source_id: "my-source1".to_string(),
                shard_ids: vec![ShardId::from(1), ShardId::from(2), ShardId::from(3)],
                params_fingerprint: 0,
            }],
            &mut node_state,
        );
        test_serialize_indexing_tasks_aux(
            &[
                IndexingTask {
                    pipeline_uid: Some(PipelineUid::for_test(1u128)),
                    index_uid: Some(index_uid.clone()),
                    source_id: "my-source1".to_string(),
                    shard_ids: vec![ShardId::from(1), ShardId::from(2)],
                    params_fingerprint: 0,
                },
                IndexingTask {
                    pipeline_uid: Some(PipelineUid::for_test(2u128)),
                    index_uid: Some(index_uid.clone()),
                    source_id: "my-source1".to_string(),
                    shard_ids: vec![ShardId::from(3), ShardId::from(4)],
                    params_fingerprint: 0,
                },
            ],
            &mut node_state,
        );
        // different index.
        test_serialize_indexing_tasks_aux(
            &[
                IndexingTask {
                    pipeline_uid: Some(PipelineUid::for_test(1u128)),
                    index_uid: Some(index_uid.clone()),
                    source_id: "my-source1".to_string(),
                    shard_ids: vec![ShardId::from(1), ShardId::from(2)],
                    params_fingerprint: 0,
                },
                IndexingTask {
                    pipeline_uid: Some(PipelineUid::for_test(2u128)),
                    index_uid: Some(IndexUid::for_test("test-index2", 0)),
                    source_id: "my-source1".to_string(),
                    shard_ids: vec![ShardId::from(3), ShardId::from(4)],
                    params_fingerprint: 0,
                },
            ],
            &mut node_state,
        );
        // same index, different source.
        test_serialize_indexing_tasks_aux(
            &[
                IndexingTask {
                    pipeline_uid: Some(PipelineUid::for_test(1u128)),
                    index_uid: Some(index_uid.clone()),
                    source_id: "my-source1".to_string(),
                    shard_ids: vec![ShardId::from(1), ShardId::from(2)],
                    params_fingerprint: 0,
                },
                IndexingTask {
                    pipeline_uid: Some(PipelineUid::for_test(2u128)),
                    index_uid: Some(index_uid.clone()),
                    source_id: "my-source2".to_string(),
                    shard_ids: vec![ShardId::from(3), ShardId::from(4)],
                    params_fingerprint: 0,
                },
            ],
            &mut node_state,
        );
    }

    #[test]
    fn test_parse_shard_ids_str() {
        assert!(parse_shard_ids_str("").is_empty());
        assert!(parse_shard_ids_str(",").is_empty());
        assert_eq!(
            parse_shard_ids_str("00000000000000000012,"),
            [ShardId::from(12)]
        );
        assert_eq!(
            parse_shard_ids_str("00000000000000000012,00000000000000000023,"),
            [ShardId::from(12), ShardId::from(23)]
        );
    }

    #[test]
    fn test_parse_chitchat_kv() {
        assert!(
            chitchat_kv_to_indexing_task("invalidulid", "my_index:uid:my_source:42:1,3").is_none()
        );
        let task = super::chitchat_kv_to_indexing_task(
            "indexer.task:01BX5ZZKBKACTAV9WEVGEMMVS0",
            "my_index:00000000000000000000000000:my_source:42:00000000000000000001,\
             00000000000000000003",
        )
        .unwrap();
        assert_eq!(task.params_fingerprint, 42);
        assert_eq!(
            task.pipeline_uid(),
            PipelineUid::from_str("01BX5ZZKBKACTAV9WEVGEMMVS0").unwrap()
        );
        assert_eq!(
            &task.index_uid().to_string(),
            "my_index:00000000000000000000000000"
        );
        assert_eq!(&task.source_id, "my_source");
        assert_eq!(&task.shard_ids, &[ShardId::from(1), ShardId::from(3)]);
    }
}


================================================
FILE: quickwit/quickwit-cluster/src/grpc_gossip.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::BTreeMap;
use std::iter::zip;
use std::net::SocketAddr;
use std::sync::{Arc, Weak};
use std::time::{Duration, Instant};

use chitchat::{Chitchat, ChitchatId, NodeState, VersionedValue};
use futures::Future;
use quickwit_common::pretty::PrettyDisplay;
use quickwit_common::tower::ClientGrpcConfig;
use quickwit_proto::cluster::{ClusterService, ClusterServiceClient, FetchClusterStateRequest};
use rand::seq::IteratorRandom;
use tokio::sync::{Mutex, watch};
use tokio_stream::StreamExt;
use tokio_stream::wrappers::WatchStream;
use tracing::{info, warn};

use crate::grpc_service::cluster_grpc_client;
use crate::member::NodeStateExt;
use crate::metrics::CLUSTER_METRICS;

const MAX_GOSSIP_PEERS: usize = 3;

/// select a few and then fetches the state from them via gRPC.
pub(crate) async fn spawn_catchup_callback_task(
    cluster_id: String,
    self_chitchat_id: ChitchatId,
    weak_chitchat: Weak<Mutex<Chitchat>>,
    live_nodes_rx: watch::Receiver<BTreeMap<ChitchatId, NodeState>>,
    mut catchup_callback_rx: watch::Receiver<()>,
    client_grpc_config: ClientGrpcConfig,
) {
    let catchup_callback_future = async move {
        let mut interval = tokio::time::interval(Duration::from_secs(60));
        interval.tick().await;

        loop {
            let Some(chitchat) = weak_chitchat.upgrade() else {
                return;
            };
            perform_grpc_gossip_rounds(
                cluster_id.clone(),
                &self_chitchat_id,
                chitchat,
                live_nodes_rx.clone(),
                |socket_addr| cluster_grpc_client(socket_addr, client_grpc_config.clone()),
            )
            .await;

            interval.tick().await;

            if catchup_callback_rx.changed().await.is_err() {
                return;
            }
        }
    };
    tokio::spawn(catchup_callback_future);
}

async fn perform_grpc_gossip_rounds<ClusterServiceClientFactory, Fut>(
    cluster_id: String,
    self_chitchat_id: &ChitchatId,
    chitchat: Arc<Mutex<Chitchat>>,
    live_nodes_rx: watch::Receiver<BTreeMap<ChitchatId, NodeState>>,
    grpc_client_factory: ClusterServiceClientFactory,
) where
    ClusterServiceClientFactory: Fn(SocketAddr) -> Fut,
    Fut: Future<Output = ClusterServiceClient>,
{
    wait_for_gossip_candidates(
        self_chitchat_id,
        live_nodes_rx.clone(),
        Duration::from_secs(10),
    )
    .await;

    let now = Instant::now();
    let (node_ids, grpc_advertise_addrs) =
        select_gossip_candidates(self_chitchat_id, live_nodes_rx);

    if node_ids.is_empty() {
        info!("no peer nodes to pull the cluster state from");
        return;
    }
    info!("pulling cluster state from node(s): {node_ids:?}");

    for (node_id, grpc_advertise_addr) in zip(node_ids, grpc_advertise_addrs) {
        let cluster_client = grpc_client_factory(grpc_advertise_addr).await;

        let request = FetchClusterStateRequest {
            cluster_id: cluster_id.clone(),
        };
        let Ok(response) = cluster_client.fetch_cluster_state(request).await else {
            warn!("failed to fetch cluster state from node `{node_id}`");
            continue;
        };
        CLUSTER_METRICS.grpc_gossip_rounds_total.inc();

        let mut chitchat_guard = chitchat.lock().await;

        for proto_node_state in response.node_states {
            let proto_chitchat_id = proto_node_state
                .chitchat_id
                .expect("`chitchat_id` should be a required field");
            let chitchat_id = ChitchatId {
                node_id: proto_chitchat_id.node_id.clone(),
                generation_id: proto_chitchat_id.generation_id,
                gossip_advertise_addr: proto_chitchat_id
                    .gossip_advertise_addr
                    .parse()
                    .expect("`gossip_advertise_addr` should be a valid socket address"),
            };
            if chitchat_id == *self_chitchat_id {
                continue;
            }
            let now = tokio::time::Instant::now();
            let key_values = proto_node_state.key_values.into_iter().map(|key_value| {
                let status: chitchat::DeletionStatus = match key_value.status() {
                    quickwit_proto::cluster::DeletionStatus::Set => chitchat::DeletionStatus::Set,
                    quickwit_proto::cluster::DeletionStatus::Deleted => {
                        chitchat::DeletionStatus::Deleted(now)
                    }
                    quickwit_proto::cluster::DeletionStatus::DeleteAfterTtl => {
                        chitchat::DeletionStatus::DeleteAfterTtl(now)
                    }
                };
                (
                    key_value.key,
                    VersionedValue {
                        value: key_value.value,
                        version: key_value.version,
                        status,
                    },
                )
            });
            chitchat_guard.reset_node_state_if_update(
                &chitchat_id,
                key_values,
                proto_node_state.max_version,
                proto_node_state.last_gc_version,
            );
        }
    }
    info!("pulled cluster state in {}", now.elapsed().pretty_display());
}

async fn wait_for_gossip_candidates(
    self_chitchat_id: &ChitchatId,
    live_nodes_rx: watch::Receiver<BTreeMap<ChitchatId, NodeState>>,
    timeout_after: Duration,
) {
    let live_nodes_stream = WatchStream::new(live_nodes_rx);
    let _ = tokio::time::timeout(
        timeout_after,
        live_nodes_stream
            .skip_while(|node_states| {
                node_states.len() < MAX_GOSSIP_PEERS
                    && node_states
                        .values()
                        .filter(|node_state| {
                            find_gossip_candidate_grpc_addr(self_chitchat_id, node_state).is_some()
                        })
                        .count()
                        < MAX_GOSSIP_PEERS
            })
            .next(),
    )
    .await;
}

fn select_gossip_candidates(
    self_chitchat_id: &ChitchatId,
    live_nodes_rx: watch::Receiver<BTreeMap<ChitchatId, NodeState>>,
) -> (Vec<String>, Vec<SocketAddr>) {
    live_nodes_rx
        .borrow()
        .values()
        .filter_map(|node_state| {
            find_gossip_candidate_grpc_addr(self_chitchat_id, node_state)
                .map(|grpc_addr| (&node_state.chitchat_id().node_id, grpc_addr))
        })
        .choose_multiple(&mut rand::rng(), MAX_GOSSIP_PEERS)
        .into_iter()
        .map(|(node_id, grpc_addr)| (node_id.clone(), grpc_addr))
        .unzip()
}

/// Returns the gRPC advertise address of the node if it is a gossip candidate.
fn find_gossip_candidate_grpc_addr(
    self_chitchat_id: &ChitchatId,
    node_state: &NodeState,
) -> Option<SocketAddr> {
    // Ignore self node, including previous generations, and nodes that are not ready.
    if self_chitchat_id.node_id == node_state.chitchat_id().node_id || !node_state.is_ready() {
        return None;
    }
    node_state.grpc_advertise_addr().ok()
}

#[cfg(test)]
mod tests {
    use chitchat::transport::ChannelTransport;
    use quickwit_proto::cluster::{
        ChitchatId as ProtoChitchatId, DeletionStatus, FetchClusterStateResponse,
        MockClusterService, NodeState as ProtoNodeState, VersionedKeyValue,
    };

    use super::*;
    use crate::change::tests::NodeStateBuilder;
    use crate::create_cluster_for_test;
    use crate::member::{GRPC_ADVERTISE_ADDR_KEY, READINESS_KEY, READINESS_VALUE_READY};

    #[tokio::test]
    async fn test_find_gossip_candidate_grpc_addr() {
        let gossip_advertise_addr: SocketAddr = "127.0.0.1:10000".parse().unwrap();
        let grpc_advertise_addr: SocketAddr = "127.0.0.1:10001".parse().unwrap();
        let self_chitchat_id =
            ChitchatId::new("test-node-foo".to_string(), 1, gossip_advertise_addr);

        let node_state = NodeStateBuilder::default()
            .with_readiness(true)
            .with_grpc_advertise_addr(grpc_advertise_addr)
            .build();
        let grpc_addr = find_gossip_candidate_grpc_addr(&self_chitchat_id, &node_state).unwrap();
        assert_eq!(grpc_addr, grpc_advertise_addr);

        let node_state = NodeStateBuilder::default()
            .with_readiness(false)
            .with_grpc_advertise_addr(grpc_advertise_addr)
            .build();
        let grpc_addr_opt = find_gossip_candidate_grpc_addr(&self_chitchat_id, &node_state);
        assert!(grpc_addr_opt.is_none());

        let node_state = NodeStateBuilder::default().with_readiness(false).build();
        let grpc_addr_opt = find_gossip_candidate_grpc_addr(&self_chitchat_id, &node_state);
        assert!(grpc_addr_opt.is_none());

        let self_chitchat_id = ChitchatId::new("test-node".to_string(), 1, gossip_advertise_addr);
        let node_state = NodeStateBuilder::default()
            .with_readiness(true)
            .with_grpc_advertise_addr(grpc_advertise_addr)
            .build();
        let grpc_addr_opt = find_gossip_candidate_grpc_addr(&self_chitchat_id, &node_state);
        assert!(grpc_addr_opt.is_none());
    }

    #[tokio::test]
    async fn test_perform_grpc_gossip_rounds() {
        let peer_seeds = Vec::new();
        let transport = ChannelTransport::default();
        let cluster = create_cluster_for_test(peer_seeds, &["indexer"], &transport, true)
            .await
            .unwrap();
        let cluster_id = cluster.cluster_id().to_string();
        let self_chitchat_id = cluster.self_chitchat_id();
        let chitchat = cluster.chitchat().await;

        let grpc_client_factory = |_: SocketAddr| {
            Box::pin(async {
                let mut mock_cluster_service = MockClusterService::new();
                mock_cluster_service
                    .expect_fetch_cluster_state()
                    .returning(|_request| {
                        let response = FetchClusterStateResponse {
                            node_states: vec![ProtoNodeState {
                                chitchat_id: Some(ProtoChitchatId {
                                    node_id: "node-4".to_string(),
                                    generation_id: 0,
                                    gossip_advertise_addr: "127.0.0.1:14000".to_string(),
                                }),
                                key_values: vec![VersionedKeyValue {
                                    key: "foo".to_string(),
                                    value: "bar".to_string(),
                                    version: 2,

                                    status: DeletionStatus::Set as i32,
                                }],
                                max_version: 2,
                                last_gc_version: 1,
                            }],
                            ..Default::default()
                        };
                        Ok(response)
                    });
                ClusterServiceClient::from_mock(mock_cluster_service)
            })
        };
        let live_nodes = BTreeMap::from_iter([
            {
                let chitchat_id = ChitchatId::for_local_test(11_000);
                let mut node_state = NodeState::for_test();

                node_state.set(GRPC_ADVERTISE_ADDR_KEY, "127.0.0.1:11001");
                node_state.set(READINESS_KEY, READINESS_VALUE_READY);
                (chitchat_id, node_state)
            },
            {
                let chitchat_id = ChitchatId::for_local_test(12_000);
                let mut node_state = NodeState::for_test();

                node_state.set(GRPC_ADVERTISE_ADDR_KEY, "127.0.0.1:12001");
                node_state.set(READINESS_KEY, READINESS_VALUE_READY);
                (chitchat_id, node_state)
            },
            {
                let chitchat_id = ChitchatId::for_local_test(13_000);
                let mut node_state = NodeState::for_test();

                node_state.set(GRPC_ADVERTISE_ADDR_KEY, "127.0.0.1:13001");
                node_state.set(READINESS_KEY, READINESS_VALUE_READY);
                (chitchat_id, node_state)
            },
        ]);
        let (_live_nodes_tx, live_nodes_rx) = watch::channel(live_nodes);

        perform_grpc_gossip_rounds(
            cluster_id,
            self_chitchat_id,
            chitchat.clone(),
            live_nodes_rx,
            grpc_client_factory,
        )
        .await;

        let chitchat_mutex_guard = chitchat.lock().await;
        let chitchat_id = ChitchatId {
            node_id: "node-4".to_string(),
            generation_id: 0,
            gossip_advertise_addr: "127.0.0.1:14000".parse().unwrap(),
        };
        let node_state = chitchat_mutex_guard.node_state(&chitchat_id).unwrap();
        assert_eq!(node_state.num_key_values(), 1);
        assert_eq!(node_state.get("foo").unwrap(), "bar");
        assert_eq!(node_state.max_version(), 2);
        assert_eq!(node_state.last_gc_version(), 1);
    }
}


================================================
FILE: quickwit/quickwit-cluster/src/grpc_service.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::net::SocketAddr;

use bytesize::ByteSize;
use itertools::Itertools;
use once_cell::sync::Lazy;
use quickwit_common::tower::{ClientGrpcConfig, GrpcMetricsLayer, make_channel};
use quickwit_proto::cluster::cluster_service_grpc_server::ClusterServiceGrpcServer;
use quickwit_proto::cluster::{
    ChitchatId as ProtoChitchatId, ClusterError, ClusterResult, ClusterService,
    ClusterServiceClient, ClusterServiceGrpcServerAdapter, FetchClusterStateRequest,
    FetchClusterStateResponse, NodeState as ProtoNodeState, VersionedKeyValue,
};
use tonic::async_trait;

use crate::Cluster;

const MAX_MESSAGE_SIZE: ByteSize = ByteSize::mib(64);

static CLUSTER_GRPC_CLIENT_METRICS_LAYER: Lazy<GrpcMetricsLayer> =
    Lazy::new(|| GrpcMetricsLayer::new("cluster", "client"));
static CLUSTER_GRPC_SERVER_METRICS_LAYER: Lazy<GrpcMetricsLayer> =
    Lazy::new(|| GrpcMetricsLayer::new("cluster", "server"));

pub(crate) async fn cluster_grpc_client(
    socket_addr: SocketAddr,
    client_grpc_config: ClientGrpcConfig,
) -> ClusterServiceClient {
    let channel = make_channel(socket_addr, client_grpc_config).await;

    ClusterServiceClient::tower()
        .stack_layer(CLUSTER_GRPC_CLIENT_METRICS_LAYER.clone())
        .build_from_channel(socket_addr, channel, MAX_MESSAGE_SIZE, None)
}

pub fn cluster_grpc_server(
    cluster: Cluster,
) -> ClusterServiceGrpcServer<ClusterServiceGrpcServerAdapter> {
    ClusterServiceClient::tower()
        .stack_layer(CLUSTER_GRPC_SERVER_METRICS_LAYER.clone())
        .build(cluster)
        .as_grpc_service(MAX_MESSAGE_SIZE)
}

#[async_trait]
impl ClusterService for Cluster {
    async fn fetch_cluster_state(
        &self,
        request: FetchClusterStateRequest,
    ) -> ClusterResult<FetchClusterStateResponse> {
        if request.cluster_id != self.cluster_id() {
            return Err(ClusterError::Internal("wrong cluster".to_string()));
        }
        let chitchat = self.chitchat().await;
        let chitchat_guard = chitchat.lock().await;

        let num_nodes = chitchat_guard.node_states().len();
        let mut proto_node_states = Vec::with_capacity(num_nodes);

        for (chitchat_id, node_state) in chitchat_guard.node_states() {
            let proto_chitchat_id = ProtoChitchatId {
                node_id: chitchat_id.node_id.clone(),
                generation_id: chitchat_id.generation_id,
                gossip_advertise_addr: chitchat_id.gossip_advertise_addr.to_string(),
            };

            let key_values: Vec<VersionedKeyValue> = node_state
                .key_values_including_deleted()
                .map(|(key, versioned_value)| {
                    let key_value_status_proto = match versioned_value.status {
                        chitchat::DeletionStatus::Set => {
                            quickwit_proto::cluster::DeletionStatus::Set
                        }
                        chitchat::DeletionStatus::Deleted(_) => {
                            quickwit_proto::cluster::DeletionStatus::Deleted
                        }
                        chitchat::DeletionStatus::DeleteAfterTtl(_) => {
                            quickwit_proto::cluster::DeletionStatus::DeleteAfterTtl
                        }
                    };
                    VersionedKeyValue {
                        key: key.to_string(),
                        value: versioned_value.value.clone(),
                        version: versioned_value.version,
                        status: key_value_status_proto as i32,
                    }
                })
                .sorted_unstable_by_key(|key_value| key_value.version)
                .collect();
            if key_values.is_empty() {
                continue;
            }
            let proto_node_state = ProtoNodeState {
                chitchat_id: Some(proto_chitchat_id),
                key_values,
                max_version: node_state.max_version(),
                last_gc_version: node_state.last_gc_version(),
            };
            proto_node_states.push(proto_node_state);
        }
        let response = FetchClusterStateResponse {
            cluster_id: request.cluster_id,
            node_states: proto_node_states,
        };
        Ok(response)
    }
}

#[cfg(test)]
mod tests {
    use chitchat::transport::ChannelTransport;

    use super::*;
    use crate::create_cluster_for_test;
    use crate::member::{ENABLED_SERVICES_KEY, GRPC_ADVERTISE_ADDR_KEY, READINESS_KEY};

    #[tokio::test]
    async fn test_fetch_cluster_state() {
        let transport = ChannelTransport::default();
        let cluster = create_cluster_for_test(Vec::new(), &["indexer"], &transport, true)
            .await
            .unwrap();

        let cluster_id = cluster.cluster_id().to_string();
        let node_id = cluster.self_node_id().to_owned();

        cluster.set_self_key_value("foo", "bar").await;

        let fetch_cluster_state_request = FetchClusterStateRequest {
            cluster_id: cluster_id.clone(),
        };
        let mut fetch_cluster_state_response = cluster
            .fetch_cluster_state(fetch_cluster_state_request)
            .await
            .unwrap();
        assert_eq!(
            fetch_cluster_state_response.cluster_id,
            cluster.cluster_id()
        );
        assert_eq!(fetch_cluster_state_response.node_states.len(), 1);

        let node_state = &mut fetch_cluster_state_response.node_states[0];

        let chitchat_id = node_state.chitchat_id.clone().unwrap();
        assert_eq!(chitchat_id.node_id, node_id);
        assert_eq!(chitchat_id.generation_id, 1);

        node_state
            .key_values
            .sort_unstable_by(|left, right| left.key.cmp(&right.key));

        assert_eq!(node_state.key_values.len(), 4);
        assert_eq!(node_state.key_values[0].key, ENABLED_SERVICES_KEY);
        assert_eq!(node_state.key_values[0].value, "indexer");

        assert_eq!(node_state.key_values[1].key, "foo");
        assert_eq!(node_state.key_values[1].value, "bar");

        assert_eq!(node_state.key_values[2].key, GRPC_ADVERTISE_ADDR_KEY);

        assert_eq!(node_state.key_values[3].key, READINESS_KEY);
        assert_eq!(node_state.key_values[3].value, "READY");
    }
}


================================================
FILE: quickwit/quickwit-cluster/src/lib.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#![deny(clippy::disallowed_methods)]

mod change;
mod cluster;
mod grpc_gossip;
mod grpc_service;
mod member;
mod metrics;
mod node;

use std::net::SocketAddr;
use std::time::Duration;

use async_trait::async_trait;
pub use chitchat::transport::ChannelTransport;
use chitchat::transport::{Socket, Transport, UdpSocket};
use chitchat::{ChitchatMessage, Serializable};
pub use chitchat::{FailureDetectorConfig, KeyChangeEvent, ListenerHandle};
pub use grpc_service::cluster_grpc_server;
use quickwit_common::metrics::IntCounter;
use quickwit_common::tower::ClientGrpcConfig;
use quickwit_config::service::QuickwitService;
use quickwit_config::{GrpcConfig, NodeConfig, TlsConfig};
use quickwit_proto::indexing::CpuCapacity;
use quickwit_proto::ingest::ingester::IngesterStatus;
use quickwit_proto::tonic::transport::{Certificate, ClientTlsConfig, Identity};
use time::OffsetDateTime;

#[cfg(any(test, feature = "testsuite"))]
pub use crate::change::for_test::*;
pub use crate::change::{ClusterChange, ClusterChangeStream, ClusterChangeStreamFactory};
pub use crate::cluster::{Cluster, ClusterSnapshot, NodeIdSchema};
#[cfg(any(test, feature = "testsuite"))]
pub use crate::cluster::{
    create_cluster_for_test, create_cluster_for_test_with_id, grpc_addr_from_listen_addr_for_test,
};
pub use crate::member::{ClusterMember, INDEXING_CPU_CAPACITY_KEY};
pub use crate::node::ClusterNode;

#[derive(Debug, Clone, Copy, Eq, PartialEq)]
pub struct GenerationId(u64);

impl GenerationId {
    pub fn as_u64(&self) -> u64 {
        self.0
    }

    pub fn now() -> Self {
        Self(OffsetDateTime::now_utc().unix_timestamp_nanos() as u64)
    }
}

impl From<u64> for GenerationId {
    fn from(generation_id: u64) -> Self {
        Self(generation_id)
    }
}

struct CountingUdpTransport;

struct CountingUdpSocket {
    socket: UdpSocket,
    gossip_recv: IntCounter,
    gossip_recv_bytes: IntCounter,
    gossip_send: IntCounter,
    gossip_send_bytes: IntCounter,
}

#[async_trait]
impl Socket for CountingUdpSocket {
    async fn send(&mut self, to: SocketAddr, msg: ChitchatMessage) -> anyhow::Result<()> {
        let msg_len = msg.serialized_len() as u64;
        self.socket.send(to, msg).await?;
        self.gossip_send.inc();
        self.gossip_send_bytes.inc_by(msg_len);
        Ok(())
    }

    async fn recv(&mut self) -> anyhow::Result<(SocketAddr, ChitchatMessage)> {
        let (socket_addr, msg) = self.socket.recv().await?;
        self.gossip_recv.inc();
        let msg_len = msg.serialized_len() as u64;
        self.gossip_recv_bytes.inc_by(msg_len);
        Ok((socket_addr, msg))
    }
}

#[async_trait]
impl Transport for CountingUdpTransport {
    async fn open(&self, listen_addr: SocketAddr) -> anyhow::Result<Box<dyn Socket>> {
        let socket = UdpSocket::open(listen_addr).await?;
        Ok(Box::new(CountingUdpSocket {
            socket,
            gossip_recv: crate::metrics::CLUSTER_METRICS
                .gossip_recv_messages_total
                .clone(),
            gossip_recv_bytes: crate::metrics::CLUSTER_METRICS
                .gossip_recv_bytes_total
                .clone(),
            gossip_send: crate::metrics::CLUSTER_METRICS
                .gossip_sent_messages_total
                .clone(),
            gossip_send_bytes: crate::metrics::CLUSTER_METRICS
                .gossip_sent_bytes_total
                .clone(),
        }))
    }
}

pub async fn start_cluster_service(node_config: &NodeConfig) -> anyhow::Result<Cluster> {
    let cluster_id = node_config.cluster_id.clone();
    let gossip_listen_addr = node_config.gossip_listen_addr;
    let peer_seed_addrs = node_config.peer_seed_addrs().await?;
    let indexing_tasks = Vec::new();

    let node_id = node_config.node_id.clone();
    let generation_id = GenerationId::now();
    let is_ready = false;
    let indexing_cpu_capacity = if node_config.is_service_enabled(QuickwitService::Indexer) {
        node_config.indexer_config.cpu_capacity
    } else {
        CpuCapacity::zero()
    };
    let self_node = ClusterMember {
        node_id,
        generation_id,
        is_ready,
        enabled_services: node_config.enabled_services.clone(),
        gossip_advertise_addr: node_config.gossip_advertise_addr,
        grpc_advertise_addr: node_config.grpc_advertise_addr,
        indexing_tasks,
        indexing_cpu_capacity,
        ingester_status: IngesterStatus::default(),
        availability_zone: node_config.availability_zone.clone(),
    };
    let failure_detector_config = FailureDetectorConfig {
        dead_node_grace_period: Duration::from_secs(2 * 60 * 60), // 2 hours
        ..Default::default()
    };
    let client_grpc_config = make_client_grpc_config(&node_config.grpc_config)?;
    let cluster = Cluster::join(
        cluster_id,
        self_node,
        gossip_listen_addr,
        peer_seed_addrs,
        node_config.gossip_interval,
        failure_detector_config,
        &CountingUdpTransport,
        client_grpc_config,
    )
    .await?;
    if node_config
        .enabled_services
        .contains(&QuickwitService::Indexer)
    {
        cluster
            .set_self_key_value(INDEXING_CPU_CAPACITY_KEY, indexing_cpu_capacity)
            .await;
    }
    Ok(cluster)
}

pub fn make_client_grpc_config(grpc_config: &GrpcConfig) -> anyhow::Result<ClientGrpcConfig> {
    let tls_config_opt = grpc_config
        .tls
        .as_ref()
        .map(make_client_tls_config)
        .transpose()?;
    Ok(ClientGrpcConfig {
        keep_alive_opt: grpc_config.keep_alive.clone().map(Into::into),
        tls_config_opt,
    })
}

fn make_client_tls_config(tls_config: &TlsConfig) -> anyhow::Result<ClientTlsConfig> {
    let pem = std::fs::read_to_string(&tls_config.ca_path)?;
    let ca = Certificate::from_pem(pem);
    let mut tls = ClientTlsConfig::new().ca_certificate(ca);

    if tls_config.validate_client {
        let cert = std::fs::read_to_string(&tls_config.cert_path)?;
        let key = std::fs::read_to_string(&tls_config.key_path)?;
        let identity = Identity::from_pem(cert, key);
        tls = tls.identity(identity);
    }
    if let Some(expected_name) = &tls_config.expected_name {
        tls = tls.domain_name(expected_name);
    }

    Ok(tls)
}


================================================
FILE: quickwit/quickwit-cluster/src/member.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::HashSet;
use std::mem::size_of;
use std::net::SocketAddr;
use std::str::FromStr;

use anyhow::Context;
use chitchat::{ChitchatId, NodeState, Version};
use quickwit_common::shared_consts::INGESTER_STATUS_KEY;
use quickwit_proto::indexing::{CpuCapacity, IndexingTask};
use quickwit_proto::ingest::ingester::IngesterStatus;
use quickwit_proto::types::NodeId;
use tracing::{error, warn};

use crate::cluster::parse_indexing_tasks;
use crate::{GenerationId, QuickwitService};

// Keys used to store member's data in chitchat state.
pub(crate) const GRPC_ADVERTISE_ADDR_KEY: &str = "grpc_advertise_addr";
pub(crate) const ENABLED_SERVICES_KEY: &str = "enabled_services";
pub(crate) const PIPELINE_METRICS_PREFIX: &str = "pipeline_metrics:";

// Readiness key and values used to store node's readiness in Chitchat state.
pub(crate) const READINESS_KEY: &str = "readiness";
pub(crate) const READINESS_VALUE_READY: &str = "READY";
pub(crate) const READINESS_VALUE_NOT_READY: &str = "NOT_READY";

pub(crate) const AVAILABILITY_ZONE_KEY: &str = "availability_zone";

pub const INDEXING_CPU_CAPACITY_KEY: &str = "indexing_cpu_capacity";

pub(crate) trait NodeStateExt {
    fn grpc_advertise_addr(&self) -> anyhow::Result<SocketAddr>;

    fn is_ready(&self) -> bool;

    fn size_bytes(&self) -> usize;

    fn ingester_status(&self) -> IngesterStatus;

    fn availability_zone(&self) -> Option<String>;
}

impl NodeStateExt for NodeState {
    fn grpc_advertise_addr(&self) -> anyhow::Result<SocketAddr> {
        self.get(GRPC_ADVERTISE_ADDR_KEY)
            .with_context(|| {
                format!("could not find key `{GRPC_ADVERTISE_ADDR_KEY}` in Chitchat node state")
            })
            .map(|grpc_advertise_addr_value| {
                grpc_advertise_addr_value.parse().with_context(|| {
                    format!("failed to parse gRPC advertise address `{grpc_advertise_addr_value}`")
                })
            })?
    }

    fn is_ready(&self) -> bool {
        self.get(READINESS_KEY)
            .map(|health_value| health_value == READINESS_VALUE_READY)
            .unwrap_or(false)
    }

    // TODO: Expose more accurate size of the state in Chitchat.
    fn size_bytes(&self) -> usize {
        const SIZE_OF_VERSION: usize = size_of::<Version>();
        const SIZE_OF_TOMBSTONE: usize = size_of::<u64>();

        self.key_values_including_deleted()
            .map(|(key, value)| key.len() + value.value.len() + SIZE_OF_VERSION + SIZE_OF_TOMBSTONE)
            .sum()
    }

    fn ingester_status(&self) -> IngesterStatus {
        self.get(INGESTER_STATUS_KEY)
            .and_then(IngesterStatus::from_json_str_name)
            .unwrap_or_default()
    }

    fn availability_zone(&self) -> Option<String> {
        self.get(AVAILABILITY_ZONE_KEY).map(|az| az.to_string())
    }
}

/// Cluster member.
#[derive(Debug, Clone, Eq, PartialEq)]
pub struct ClusterMember {
    /// A unique node ID across the cluster.
    /// The Chitchat node ID is the concatenation of the node ID and the start timestamp:
    /// `{node_id}/{start_timestamp}`.
    pub node_id: NodeId,
    /// The start timestamp (seconds) of the node.
    pub generation_id: GenerationId,
    /// Enabled services, i.e. services configured to run on the node. Depending on the node and
    /// service health, each service may or may not be available/running.
    pub enabled_services: HashSet<QuickwitService>,
    /// Gossip advertise address, i.e. the address that other nodes should use to gossip with the
    /// node.
    pub gossip_advertise_addr: SocketAddr,
    /// gRPC advertise address, i.e. the address that other nodes should use to communicate with
    /// the node via gRPC.
    pub grpc_advertise_addr: SocketAddr,
    /// Running indexing plan.
    /// None if the node is not an indexer or the indexer has not yet started some indexing
    /// pipelines.
    pub indexing_tasks: Vec<IndexingTask>,
    /// Indexing cpu capacity of the node expressed in milli cpu.
    pub indexing_cpu_capacity: CpuCapacity,
    /// Status of the ingester service running on the node. `IngesterStatus::Unspecified` if the
    /// node is not an ingester.
    pub ingester_status: IngesterStatus,
    /// Whether the node is ready to serve requests.
    pub is_ready: bool,
    /// Availability zone the node is running in, if enabled.
    pub availability_zone: Option<String>,
}

impl ClusterMember {
    pub fn chitchat_id(&self) -> ChitchatId {
        ChitchatId::new(
            self.node_id.clone().into(),
            self.generation_id.as_u64(),
            self.gossip_advertise_addr,
        )
    }
}

impl From<ClusterMember> for ChitchatId {
    fn from(member: ClusterMember) -> Self {
        member.chitchat_id()
    }
}

fn parse_indexing_cpu_capacity(node_state: &NodeState) -> CpuCapacity {
    let Some(indexing_capacity_str) = node_state.get(INDEXING_CPU_CAPACITY_KEY) else {
        return CpuCapacity::zero();
    };
    if let Ok(indexing_capacity) = CpuCapacity::from_str(indexing_capacity_str) {
        indexing_capacity
    } else {
        error!(indexing_capacity=?indexing_capacity_str, "received an unparsable indexing capacity from node");
        CpuCapacity::zero()
    }
}

// Builds a cluster member from a [`NodeState`].
pub(crate) fn build_cluster_member(
    chitchat_id: ChitchatId,
    node_state: &NodeState,
) -> anyhow::Result<ClusterMember> {
    let is_ready = node_state.is_ready();
    let enabled_services = node_state
        .get(ENABLED_SERVICES_KEY)
        .ok_or_else(|| {
            anyhow::anyhow!(
                "could not find `{}` key in node `{}` state",
                ENABLED_SERVICES_KEY,
                chitchat_id.node_id
            )
        })
        .map(|enabled_services_str| {
            parse_enabled_services_str(enabled_services_str, &chitchat_id.node_id)
        })?;
    let grpc_advertise_addr = node_state.grpc_advertise_addr()?;
    let indexing_tasks = parse_indexing_tasks(node_state);
    let indexing_cpu_capacity = parse_indexing_cpu_capacity(node_state);
    let ingester_status = node_state.ingester_status();
    let availability_zone = node_state.availability_zone();

    let member = ClusterMember {
        node_id: chitchat_id.node_id.into(),
        generation_id: chitchat_id.generation_id.into(),
        is_ready,
        enabled_services,
        gossip_advertise_addr: chitchat_id.gossip_advertise_addr,
        grpc_advertise_addr,
        indexing_tasks,
        indexing_cpu_capacity,
        ingester_status,
        availability_zone,
    };
    Ok(member)
}

fn parse_enabled_services_str(
    enabled_services_str: &str,
    node_id: &str,
) -> HashSet<QuickwitService> {
    let enabled_services: HashSet<QuickwitService> = enabled_services_str
        .split(',')
        .filter(|service_str| !service_str.is_empty())
        .filter_map(|service_str| match service_str.parse() {
            Ok(service) => Some(service),
            Err(_) => {
                warn!(
                    node_id=%node_id,
                    service=%service_str,
                    "Found unknown service enabled on node."
                );
                None
            }
        })
        .collect();
    if enabled_services.is_empty() {
        warn!(
            node_id=%node_id,
            "Node has no enabled services."
        )
    }
    enabled_services
}


================================================
FILE: quickwit/quickwit-cluster/src/metrics.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::HashSet;
use std::net::SocketAddr;
use std::sync::Weak;
use std::time::Duration;

use chitchat::{Chitchat, ChitchatId};
use once_cell::sync::Lazy;
use quickwit_common::metrics::{IntCounter, IntGauge, new_counter, new_gauge};
use tokio::sync::Mutex;

use crate::member::NodeStateExt;

pub struct ClusterMetrics {
    pub live_nodes: IntGauge,
    pub ready_nodes: IntGauge,
    pub zombie_nodes: IntGauge,
    pub dead_nodes: IntGauge,
    pub cluster_state_size_bytes: IntGauge,
    pub node_state_size_bytes: IntGauge,
    pub node_state_keys: IntGauge,
    pub gossip_recv_messages_total: IntCounter,
    pub gossip_recv_bytes_total: IntCounter,
    pub gossip_sent_messages_total: IntCounter,
    pub gossip_sent_bytes_total: IntCounter,
    pub grpc_gossip_rounds_total: IntCounter,
}

impl Default for ClusterMetrics {
    fn default() -> Self {
        ClusterMetrics {
            live_nodes: new_gauge(
                "live_nodes",
                "The number of live nodes observed locally.",
                "cluster",
                &[],
            ),
            ready_nodes: new_gauge(
                "ready_nodes",
                "The number of ready nodes observed locally.",
                "cluster",
                &[],
            ),
            zombie_nodes: new_gauge(
                "zombie_nodes",
                "The number of zombie nodes observed locally.",
                "cluster",
                &[],
            ),
            dead_nodes: new_gauge(
                "dead_nodes",
                "The number of dead nodes observed locally.",
                "cluster",
                &[],
            ),
            cluster_state_size_bytes: new_gauge(
                "cluster_state_size_bytes",
                "The size of the cluster state in bytes.",
                "cluster",
                &[],
            ),
            node_state_keys: new_gauge(
                "node_state_keys",
                "The number of keys in the node state.",
                "cluster",
                &[],
            ),
            node_state_size_bytes: new_gauge(
                "node_state_size_bytes",
                "The size of the node state in bytes.",
                "cluster",
                &[],
            ),
            gossip_recv_messages_total: new_counter(
                "gossip_recv_messages_total",
                "Total number of gossip messages received.",
                "cluster",
                &[],
            ),
            gossip_recv_bytes_total: new_counter(
                "gossip_recv_bytes_total",
                "Total amount of gossip data received in bytes.",
                "cluster",
                &[],
            ),
            gossip_sent_messages_total: new_counter(
                "gossip_sent_messages_total",
                "Total number of gossip messages sent.",
                "cluster",
                &[],
            ),
            gossip_sent_bytes_total: new_counter(
                "gossip_sent_bytes_total",
                "Total amount of gossip data sent in bytes.",
                "cluster",
                &[],
            ),
            grpc_gossip_rounds_total: new_counter(
                "grpc_gossip_rounds_total",
                "Total number of gRPC gossip rounds performed with peer nodes.",
                "cluster",
                &[],
            ),
        }
    }
}

pub static CLUSTER_METRICS: Lazy<ClusterMetrics> = Lazy::new(ClusterMetrics::default);

pub(crate) fn spawn_metrics_task(
    weak_chitchat: Weak<Mutex<Chitchat>>,
    self_chitchat_id: ChitchatId,
) {
    const METRICS_INTERVAL: Duration = Duration::from_secs(15);

    const SIZE_OF_GENERATION_ID: usize = std::mem::size_of::<u64>();
    const SIZE_OF_SOCKET_ADDR: usize = std::mem::size_of::<SocketAddr>();

    let future = async move {
        let mut interval = tokio::time::interval(METRICS_INTERVAL);

        while let Some(chitchat) = weak_chitchat.upgrade() {
            interval.tick().await;

            let mut num_ready_nodes = 0;
            let mut cluster_state_size_bytes = 0;

            let chitchat_guard = chitchat.lock().await;
            let live_nodes: HashSet<&ChitchatId> = chitchat_guard.live_nodes().collect();

            let num_live_nodes = live_nodes.len();
            let num_zombie_nodes = chitchat_guard.scheduled_for_deletion_nodes().count();
            let num_dead_nodes = chitchat_guard.dead_nodes().count();

            for (chitchat_id, node_state) in chitchat_guard.node_states() {
                if live_nodes.contains(chitchat_id) && node_state.is_ready() {
                    num_ready_nodes += 1;
                }
                let chitchat_id_size_bytes =
                    chitchat_id.node_id.len() + SIZE_OF_GENERATION_ID + SIZE_OF_SOCKET_ADDR;
                let node_state_size_bytes = node_state.size_bytes();

                cluster_state_size_bytes += chitchat_id_size_bytes + node_state_size_bytes;

                if *chitchat_id == self_chitchat_id {
                    CLUSTER_METRICS
                        .node_state_keys
                        .set(node_state.num_key_values() as i64);
                    CLUSTER_METRICS
                        .node_state_size_bytes
                        .set(node_state_size_bytes as i64);
                }
            }
            drop(chitchat_guard);

            CLUSTER_METRICS.live_nodes.set(num_live_nodes as i64);
            CLUSTER_METRICS.ready_nodes.set(num_ready_nodes as i64);
            CLUSTER_METRICS.zombie_nodes.set(num_zombie_nodes as i64);
            CLUSTER_METRICS.dead_nodes.set(num_dead_nodes as i64);

            CLUSTER_METRICS
                .cluster_state_size_bytes
                .set(cluster_state_size_bytes as i64);
        }
    };
    tokio::spawn(future);
}


================================================
FILE: quickwit/quickwit-cluster/src/node.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::HashSet;
use std::fmt::Debug;
use std::net::SocketAddr;
use std::sync::Arc;

use chitchat::{ChitchatId, NodeState};
use quickwit_config::service::QuickwitService;
use quickwit_proto::indexing::{CpuCapacity, IndexingTask};
use quickwit_proto::ingest::ingester::IngesterStatus;
use quickwit_proto::types::NodeIdRef;
use tonic::transport::Channel;

use crate::member::build_cluster_member;

#[derive(Clone)]
pub struct ClusterNode {
    inner: Arc<InnerNode>,
}

impl ClusterNode {
    /// Attempts to create a new `ClusterNode` from a Chitchat `NodeState`.
    pub(crate) fn try_new(
        chitchat_id: ChitchatId,
        node_state: &NodeState,
        channel: Channel,
        is_self_node: bool,
    ) -> anyhow::Result<Self> {
        let member = build_cluster_member(chitchat_id.clone(), node_state)?;
        let inner = InnerNode {
            chitchat_id,
            channel,
            enabled_services: member.enabled_services,
            grpc_advertise_addr: member.grpc_advertise_addr,
            indexing_tasks: member.indexing_tasks,
            indexing_capacity: member.indexing_cpu_capacity,
            ingester_status: member.ingester_status,
            is_ready: member.is_ready,
            is_self_node,
            availability_zone: member.availability_zone,
        };
        let node = ClusterNode {
            inner: Arc::new(inner),
        };
        Ok(node)
    }

    #[cfg(any(test, feature = "testsuite"))]
    pub async fn for_test(
        node_id: &str,
        port: u16,
        is_self_node: bool,
        enabled_services: &[&str],
        indexing_tasks: &[IndexingTask],
        ingester_status: IngesterStatus,
    ) -> Self {
        use quickwit_common::shared_consts::INGESTER_STATUS_KEY;
        use quickwit_common::tower::{ClientGrpcConfig, make_channel};

        use crate::cluster::set_indexing_tasks_in_node_state;
        use crate::member::{ENABLED_SERVICES_KEY, GRPC_ADVERTISE_ADDR_KEY};

        let gossip_advertise_addr = ([127, 0, 0, 1], port).into();
        let grpc_advertise_addr = ([127, 0, 0, 1], port + 1).into();
        let chitchat_id = ChitchatId::new(node_id.to_string(), 0, gossip_advertise_addr);
        let channel = make_channel(grpc_advertise_addr, ClientGrpcConfig::default()).await;
        let mut node_state = NodeState::for_test();
        node_state.set(ENABLED_SERVICES_KEY, enabled_services.join(","));
        node_state.set(GRPC_ADVERTISE_ADDR_KEY, grpc_advertise_addr.to_string());
        node_state.set(INGESTER_STATUS_KEY, ingester_status.as_json_str_name());
        set_indexing_tasks_in_node_state(indexing_tasks, &mut node_state);
        Self::try_new(chitchat_id, &node_state, channel, is_self_node).unwrap()
    }

    pub fn chitchat_id(&self) -> &ChitchatId {
        &self.inner.chitchat_id
    }

    pub fn node_id(&self) -> &NodeIdRef {
        NodeIdRef::from_str(&self.inner.chitchat_id.node_id)
    }

    pub fn channel(&self) -> Channel {
        self.inner.channel.clone()
    }

    pub fn enabled_services(&self) -> &HashSet<QuickwitService> {
        &self.inner.enabled_services
    }

    pub fn is_indexer(&self) -> bool {
        self.inner
            .enabled_services
            .contains(&QuickwitService::Indexer)
    }

    pub fn is_ingester(&self) -> bool {
        self.inner
            .enabled_services
            .contains(&QuickwitService::Indexer)
    }

    pub fn is_searcher(&self) -> bool {
        self.inner
            .enabled_services
            .contains(&QuickwitService::Searcher)
    }

    pub fn grpc_advertise_addr(&self) -> SocketAddr {
        self.inner.grpc_advertise_addr
    }

    pub fn indexing_tasks(&self) -> &[IndexingTask] {
        &self.inner.indexing_tasks
    }

    pub fn indexing_capacity(&self) -> CpuCapacity {
        self.inner.indexing_capacity
    }

    pub fn ingester_status(&self) -> IngesterStatus {
        self.inner.ingester_status
    }

    pub fn is_ready(&self) -> bool {
        self.inner.is_ready
    }

    pub fn is_self_node(&self) -> bool {
        self.inner.is_self_node
    }

    pub fn availability_zone(&self) -> Option<&str> {
        self.inner.availability_zone.as_deref()
    }
}

impl Debug for ClusterNode {
    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
        f.debug_struct("Node")
            .field("node_id", &self.inner.chitchat_id.node_id)
            .field("enabled_services", &self.inner.enabled_services)
            .field("is_ready", &self.inner.is_ready)
            .finish()
    }
}

#[cfg(test)]
impl PartialEq for ClusterNode {
    fn eq(&self, other: &Self) -> bool {
        self.inner.chitchat_id == other.inner.chitchat_id
            && self.inner.enabled_services == other.inner.enabled_services
            && self.inner.grpc_advertise_addr == other.inner.grpc_advertise_addr
            && self.inner.indexing_tasks == other.inner.indexing_tasks
            && self.inner.is_ready == other.inner.is_ready
            && self.inner.is_self_node == other.inner.is_self_node
            && self.inner.availability_zone == other.inner.availability_zone
    }
}

struct InnerNode {
    chitchat_id: ChitchatId,
    channel: Channel,
    enabled_services: HashSet<QuickwitService>,
    grpc_advertise_addr: SocketAddr,
    indexing_tasks: Vec<IndexingTask>,
    indexing_capacity: CpuCapacity,
    ingester_status: IngesterStatus,
    is_ready: bool,
    is_self_node: bool,
    availability_zone: Option<String>,
}


================================================
FILE: quickwit/quickwit-codegen/Cargo.toml
================================================
[package]
name = "quickwit-codegen"
description = "Generate traits, adapters, and gRPC clients/servers from proto files."

version.workspace = true
edition.workspace = true
homepage.workspace = true
documentation.workspace = true
repository.workspace = true
authors.workspace = true
license.workspace = true

[dependencies]
anyhow = { workspace = true }
heck = { workspace = true }
prettyplease = { workspace = true }
proc-macro2 = { workspace = true }
prost-build = { workspace = true }
quote = { workspace = true }
syn = { workspace = true }
tonic-prost-build = { workspace = true }

[dev-dependencies]
futures = { workspace = true }
serde = { workspace = true }


================================================
FILE: quickwit/quickwit-codegen/README.md
================================================
# Quickwit codegen

## Getting Started

1. Describe your service in a proto file.

2. Define an error and a result type for your service. The error type must implement `quickwit_proto::error::GrpcServiceError` and have at least the three following variants: `Internal`, `Timeout`, and `Unavailable`.

3. Add the following dependencies to your project:

```toml
[dependencies]
async-trait = { workspace = true }
bytes = { workspace = true }
bytesize = { workspace = true }
http = { workspace = true }
hyper = { workspace = true }
prost = { workspace = true }
serde = { workspace = true }
thiserror = { workspace = true }
tokio = { workspace = true }
tonic = { workspace = true }
tower = { workspace = true }
utoipa = { workspace = true }

quickwit-actors = { workspace = true }
quickwit-proto = { workspace = true }

[dev-dependencies]
mockall = { workspace = true }

[build-dependencies]
quickwit-codegen = { workspace = true }
```

4. Run the code generation logic as part of a Cargo build script:

```rust
use quickwit_codegen::Codegen;

fn main() {
    Codegen::builder()
        .with_protos(&["src/hello.proto"])
        .with_output_dir("src/")
        .with_result_type_path("crate::HelloResult")
        .with_error_type_path("crate::HelloError")
        .run()
        .unwrap();
}
```

5. If additional prost settings need to be configured they can be provided the following way:

```rust
use quickwit_codegen::Codegen;

fn main() {
    let mut config = prost_build::Config::default();
    config.bytes(["PingRequest.name", "PingResponse.name"]);
    Codegen::builder()
        .with_protos(&["src/hello.proto"])
        .with_output_dir("src/codegen/")
        .with_result_type_path("crate::HelloResult")
        .with_error_type_path("crate::HelloError")
        .with_prost_config(config)
        .run()
        .unwrap();
}
```


6. Import and implement the generated service trait and use the various generated adapters to instantiate a gRPC server, or use a local or remote gRPC implementation with the same client interface.

Checkout the complete working example in the `quickwit-codegen-example` crate.


================================================
FILE: quickwit/quickwit-codegen/example/Cargo.toml
================================================
[package]
name = "quickwit-codegen-example"
description = "Demonstrates how to set up, configure, and run code generation for a simple service"

version.workspace = true
edition.workspace = true
homepage.workspace = true
documentation.workspace = true
repository.workspace = true
authors.workspace = true
license.workspace = true

[dependencies]
anyhow = { workspace = true }
async-trait = { workspace = true }
bytesize = { workspace = true }
futures = { workspace = true }
http = { workspace = true }
mockall = { workspace = true, optional = true }
prost = { workspace = true }
serde = { workspace = true }
thiserror = { workspace = true }
tokio = { workspace = true }
tokio-stream = { workspace = true }
tonic = { workspace = true }
tonic-prost = { workspace = true }
tower = { workspace = true }
utoipa = { workspace = true }

quickwit-actors = { workspace = true }
quickwit-common = { workspace = true }
quickwit-proto = { workspace = true }

[dev-dependencies]
mockall = { workspace = true }

quickwit-actors = { workspace = true, features = ["testsuite"] }

[build-dependencies]
quickwit-codegen = { workspace = true }

[features]
testsuite = ["mockall"]


================================================
FILE: quickwit/quickwit-codegen/example/build.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use quickwit_codegen::Codegen;

fn main() {
    Codegen::builder()
        .with_protos(&["src/hello.proto"])
        .with_output_dir("src/codegen/")
        .with_result_type_path("crate::HelloResult")
        .with_error_type_path("crate::HelloError")
        .generate_extra_service_methods()
        .generate_rpc_name_impls()
        .run()
        .unwrap();
}


================================================
FILE: quickwit/quickwit-codegen/example/src/codegen/hello.rs
================================================
// This file is @generated by prost-build.
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct HelloRequest {
    #[prost(string, tag = "1")]
    pub name: ::prost::alloc::string::String,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct HelloResponse {
    #[prost(string, tag = "1")]
    pub message: ::prost::alloc::string::String,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct GoodbyeRequest {
    #[prost(string, tag = "1")]
    pub name: ::prost::alloc::string::String,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct GoodbyeResponse {
    #[prost(string, tag = "1")]
    pub message: ::prost::alloc::string::String,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct PingRequest {
    #[prost(string, tag = "1")]
    pub name: ::prost::alloc::string::String,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct PingResponse {
    #[prost(string, tag = "1")]
    pub message: ::prost::alloc::string::String,
}
/// BEGIN quickwit-codegen
#[allow(unused_imports)]
use std::str::FromStr;
use tower::{Layer, Service, ServiceExt};
use quickwit_common::tower::RpcName;
impl RpcName for HelloRequest {
    fn rpc_name() -> &'static str {
        "hello"
    }
}
impl RpcName for GoodbyeRequest {
    fn rpc_name() -> &'static str {
        "goodbye"
    }
}
impl RpcName for PingRequest {
    fn rpc_name() -> &'static str {
        "ping"
    }
}
pub type HelloStream<T> = quickwit_common::ServiceStream<crate::HelloResult<T>>;
#[cfg_attr(any(test, feature = "testsuite"), mockall::automock)]
#[async_trait::async_trait]
pub trait Hello: std::fmt::Debug + Send + Sync + 'static {
    ///Says hello.
    async fn hello(&self, request: HelloRequest) -> crate::HelloResult<HelloResponse>;
    ///Says goodbye.
    async fn goodbye(
        &self,
        request: GoodbyeRequest,
    ) -> crate::HelloResult<GoodbyeResponse>;
    ///Ping pong.
    async fn ping(
        &self,
        request: quickwit_common::ServiceStream<PingRequest>,
    ) -> crate::HelloResult<HelloStream<PingResponse>>;
    async fn check_connectivity(&self) -> anyhow::Result<()>;
    fn endpoints(&self) -> Vec<quickwit_common::uri::Uri>;
}
#[derive(Debug, Clone)]
pub struct HelloClient {
    inner: InnerHelloClient,
}
#[derive(Debug, Clone)]
struct InnerHelloClient(std::sync::Arc<dyn Hello>);
impl HelloClient {
    pub fn new<T>(instance: T) -> Self
    where
        T: Hello,
    {
        #[cfg(any(test, feature = "testsuite"))]
        assert!(
            std::any::TypeId::of:: < T > () != std::any::TypeId::of:: < MockHello > (),
            "`MockHello` must be wrapped in a `MockHelloWrapper`: use `HelloClient::from_mock(mock)` to instantiate the client"
        );
        Self {
            inner: InnerHelloClient(std::sync::Arc::new(instance)),
        }
    }
    pub fn as_grpc_service(
        &self,
        max_message_size: bytesize::ByteSize,
    ) -> hello_grpc_server::HelloGrpcServer<HelloGrpcServerAdapter> {
        let adapter = HelloGrpcServerAdapter::new(self.clone());
        hello_grpc_server::HelloGrpcServer::new(adapter)
            .accept_compressed(tonic::codec::CompressionEncoding::Gzip)
            .accept_compressed(tonic::codec::CompressionEncoding::Zstd)
            .send_compressed(tonic::codec::CompressionEncoding::Gzip)
            .send_compressed(tonic::codec::CompressionEncoding::Zstd)
            .max_decoding_message_size(max_message_size.0 as usize)
            .max_encoding_message_size(max_message_size.0 as usize)
    }
    pub fn from_channel(
        addr: std::net::SocketAddr,
        channel: tonic::transport::Channel,
        max_message_size: bytesize::ByteSize,
        compression_encoding_opt: Option<tonic::codec::CompressionEncoding>,
    ) -> Self {
        let (_, connection_keys_watcher) = tokio::sync::watch::channel(
            std::collections::HashSet::from_iter([addr]),
        );
        let mut client = hello_grpc_client::HelloGrpcClient::new(channel)
            .max_decoding_message_size(max_message_size.0 as usize)
            .max_encoding_message_size(max_message_size.0 as usize);
        if let Some(compression_encoding) = compression_encoding_opt {
            client = client
                .accept_compressed(compression_encoding)
                .send_compressed(compression_encoding);
        }
        let adapter = HelloGrpcClientAdapter::new(client, connection_keys_watcher);
        Self::new(adapter)
    }
    pub fn from_balance_channel(
        balance_channel: quickwit_common::tower::BalanceChannel<std::net::SocketAddr>,
        max_message_size: bytesize::ByteSize,
        compression_encoding_opt: Option<tonic::codec::CompressionEncoding>,
    ) -> HelloClient {
        let connection_keys_watcher = balance_channel.connection_keys_watcher();
        let mut client = hello_grpc_client::HelloGrpcClient::new(balance_channel)
            .max_decoding_message_size(max_message_size.0 as usize)
            .max_encoding_message_size(max_message_size.0 as usize);
        if let Some(compression_encoding) = compression_encoding_opt {
            client = client
                .accept_compressed(compression_encoding)
                .send_compressed(compression_encoding);
        }
        let adapter = HelloGrpcClientAdapter::new(client, connection_keys_watcher);
        Self::new(adapter)
    }
    pub fn from_mailbox<A>(mailbox: quickwit_actors::Mailbox<A>) -> Self
    where
        A: quickwit_actors::Actor + std::fmt::Debug + Send + 'static,
        HelloMailbox<A>: Hello,
    {
        HelloClient::new(HelloMailbox::new(mailbox))
    }
    pub fn tower() -> HelloTowerLayerStack {
        HelloTowerLayerStack::default()
    }
    #[cfg(any(test, feature = "testsuite"))]
    pub fn from_mock(mock: MockHello) -> Self {
        let mock_wrapper = mock_hello::MockHelloWrapper {
            inner: tokio::sync::Mutex::new(mock),
        };
        Self::new(mock_wrapper)
    }
    #[cfg(any(test, feature = "testsuite"))]
    pub fn mocked() -> Self {
        Self::from_mock(MockHello::new())
    }
}
#[async_trait::async_trait]
impl Hello for HelloClient {
    async fn hello(&self, request: HelloRequest) -> crate::HelloResult<HelloResponse> {
        self.inner.0.hello(request).await
    }
    async fn goodbye(
        &self,
        request: GoodbyeRequest,
    ) -> crate::HelloResult<GoodbyeResponse> {
        self.inner.0.goodbye(request).await
    }
    async fn ping(
        &self,
        request: quickwit_common::ServiceStream<PingRequest>,
    ) -> crate::HelloResult<HelloStream<PingResponse>> {
        self.inner.0.ping(request).await
    }
    async fn check_connectivity(&self) -> anyhow::Result<()> {
        self.inner.0.check_connectivity().await
    }
    fn endpoints(&self) -> Vec<quickwit_common::uri::Uri> {
        self.inner.0.endpoints()
    }
}
#[cfg(any(test, feature = "testsuite"))]
pub mod mock_hello {
    use super::*;
    #[derive(Debug)]
    pub struct MockHelloWrapper {
        pub(super) inner: tokio::sync::Mutex<MockHello>,
    }
    #[async_trait::async_trait]
    impl Hello for MockHelloWrapper {
        async fn hello(
            &self,
            request: super::HelloRequest,
        ) -> crate::HelloResult<super::HelloResponse> {
            self.inner.lock().await.hello(request).await
        }
        async fn goodbye(
            &self,
            request: super::GoodbyeRequest,
        ) -> crate::HelloResult<super::GoodbyeResponse> {
            self.inner.lock().await.goodbye(request).await
        }
        async fn ping(
            &self,
            request: quickwit_common::ServiceStream<super::PingRequest>,
        ) -> crate::HelloResult<HelloStream<super::PingResponse>> {
            self.inner.lock().await.ping(request).await
        }
        async fn check_connectivity(&self) -> anyhow::Result<()> {
            self.inner.lock().await.check_connectivity().await
        }
        fn endpoints(&self) -> Vec<quickwit_common::uri::Uri> {
            futures::executor::block_on(self.inner.lock()).endpoints()
        }
    }
}
pub type BoxFuture<T, E> = std::pin::Pin<
    Box<dyn std::future::Future<Output = Result<T, E>> + Send + 'static>,
>;
impl tower::Service<HelloRequest> for InnerHelloClient {
    type Response = HelloResponse;
    type Error = crate::HelloError;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, request: HelloRequest) -> Self::Future {
        let svc = self.clone();
        let fut = async move { svc.0.hello(request).await };
        Box::pin(fut)
    }
}
impl tower::Service<GoodbyeRequest> for InnerHelloClient {
    type Response = GoodbyeResponse;
    type Error = crate::HelloError;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, request: GoodbyeRequest) -> Self::Future {
        let svc = self.clone();
        let fut = async move { svc.0.goodbye(request).await };
        Box::pin(fut)
    }
}
impl tower::Service<quickwit_common::ServiceStream<PingRequest>> for InnerHelloClient {
    type Response = HelloStream<PingResponse>;
    type Error = crate::HelloError;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        std::task::Poll::Ready(Ok(()))
    }
    fn call(
        &mut self,
        request: quickwit_common::ServiceStream<PingRequest>,
    ) -> Self::Future {
        let svc = self.clone();
        let fut = async move { svc.0.ping(request).await };
        Box::pin(fut)
    }
}
/// A tower service stack is a set of tower services.
#[derive(Debug)]
struct HelloTowerServiceStack {
    #[allow(dead_code)]
    inner: InnerHelloClient,
    hello_svc: quickwit_common::tower::BoxService<
        HelloRequest,
        HelloResponse,
        crate::HelloError,
    >,
    goodbye_svc: quickwit_common::tower::BoxService<
        GoodbyeRequest,
        GoodbyeResponse,
        crate::HelloError,
    >,
    ping_svc: quickwit_common::tower::BoxService<
        quickwit_common::ServiceStream<PingRequest>,
        HelloStream<PingResponse>,
        crate::HelloError,
    >,
}
#[async_trait::async_trait]
impl Hello for HelloTowerServiceStack {
    async fn hello(&self, request: HelloRequest) -> crate::HelloResult<HelloResponse> {
        self.hello_svc.clone().ready().await?.call(request).await
    }
    async fn goodbye(
        &self,
        request: GoodbyeRequest,
    ) -> crate::HelloResult<GoodbyeResponse> {
        self.goodbye_svc.clone().ready().await?.call(request).await
    }
    async fn ping(
        &self,
        request: quickwit_common::ServiceStream<PingRequest>,
    ) -> crate::HelloResult<HelloStream<PingResponse>> {
        self.ping_svc.clone().ready().await?.call(request).await
    }
    async fn check_connectivity(&self) -> anyhow::Result<()> {
        self.inner.0.check_connectivity().await
    }
    fn endpoints(&self) -> Vec<quickwit_common::uri::Uri> {
        self.inner.0.endpoints()
    }
}
type HelloLayer = quickwit_common::tower::BoxLayer<
    quickwit_common::tower::BoxService<HelloRequest, HelloResponse, crate::HelloError>,
    HelloRequest,
    HelloResponse,
    crate::HelloError,
>;
type GoodbyeLayer = quickwit_common::tower::BoxLayer<
    quickwit_common::tower::BoxService<
        GoodbyeRequest,
        GoodbyeResponse,
        crate::HelloError,
    >,
    GoodbyeRequest,
    GoodbyeResponse,
    crate::HelloError,
>;
type PingLayer = quickwit_common::tower::BoxLayer<
    quickwit_common::tower::BoxService<
        quickwit_common::ServiceStream<PingRequest>,
        HelloStream<PingResponse>,
        crate::HelloError,
    >,
    quickwit_common::ServiceStream<PingRequest>,
    HelloStream<PingResponse>,
    crate::HelloError,
>;
#[derive(Debug, Default)]
pub struct HelloTowerLayerStack {
    hello_layers: Vec<HelloLayer>,
    goodbye_layers: Vec<GoodbyeLayer>,
    ping_layers: Vec<PingLayer>,
}
impl HelloTowerLayerStack {
    pub fn stack_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    HelloRequest,
                    HelloResponse,
                    crate::HelloError,
                >,
            > + Clone + Send + Sync + 'static,
        <L as tower::Layer<
            quickwit_common::tower::BoxService<
                HelloRequest,
                HelloResponse,
                crate::HelloError,
            >,
        >>::Service: tower::Service<
                HelloRequest,
                Response = HelloResponse,
                Error = crate::HelloError,
            > + Clone + Send + Sync + 'static,
        <<L as tower::Layer<
            quickwit_common::tower::BoxService<
                HelloRequest,
                HelloResponse,
                crate::HelloError,
            >,
        >>::Service as tower::Service<HelloRequest>>::Future: Send + 'static,
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    GoodbyeRequest,
                    GoodbyeResponse,
                    crate::HelloError,
                >,
            > + Clone + Send + Sync + 'static,
        <L as tower::Layer<
            quickwit_common::tower::BoxService<
                GoodbyeRequest,
                GoodbyeResponse,
                crate::HelloError,
            >,
        >>::Service: tower::Service<
                GoodbyeRequest,
                Response = GoodbyeResponse,
                Error = crate::HelloError,
            > + Clone + Send + Sync + 'static,
        <<L as tower::Layer<
            quickwit_common::tower::BoxService<
                GoodbyeRequest,
                GoodbyeResponse,
                crate::HelloError,
            >,
        >>::Service as tower::Service<GoodbyeRequest>>::Future: Send + 'static,
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    quickwit_common::ServiceStream<PingRequest>,
                    HelloStream<PingResponse>,
                    crate::HelloError,
                >,
            > + Clone + Send + Sync + 'static,
        <L as tower::Layer<
            quickwit_common::tower::BoxService<
                quickwit_common::ServiceStream<PingRequest>,
                HelloStream<PingResponse>,
                crate::HelloError,
            >,
        >>::Service: tower::Service<
                quickwit_common::ServiceStream<PingRequest>,
                Response = HelloStream<PingResponse>,
                Error = crate::HelloError,
            > + Clone + Send + Sync + 'static,
        <<L as tower::Layer<
            quickwit_common::tower::BoxService<
                quickwit_common::ServiceStream<PingRequest>,
                HelloStream<PingResponse>,
                crate::HelloError,
            >,
        >>::Service as tower::Service<
            quickwit_common::ServiceStream<PingRequest>,
        >>::Future: Send + 'static,
    {
        self.hello_layers.push(quickwit_common::tower::BoxLayer::new(layer.clone()));
        self.goodbye_layers.push(quickwit_common::tower::BoxLayer::new(layer.clone()));
        self.ping_layers.push(quickwit_common::tower::BoxLayer::new(layer.clone()));
        self
    }
    pub fn stack_hello_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    HelloRequest,
                    HelloResponse,
                    crate::HelloError,
                >,
            > + Send + Sync + 'static,
        L::Service: tower::Service<
                HelloRequest,
                Response = HelloResponse,
                Error = crate::HelloError,
            > + Clone + Send + Sync + 'static,
        <L::Service as tower::Service<HelloRequest>>::Future: Send + 'static,
    {
        self.hello_layers.push(quickwit_common::tower::BoxLayer::new(layer));
        self
    }
    pub fn stack_goodbye_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    GoodbyeRequest,
                    GoodbyeResponse,
                    crate::HelloError,
                >,
            > + Send + Sync + 'static,
        L::Service: tower::Service<
                GoodbyeRequest,
                Response = GoodbyeResponse,
                Error = crate::HelloError,
            > + Clone + Send + Sync + 'static,
        <L::Service as tower::Service<GoodbyeRequest>>::Future: Send + 'static,
    {
        self.goodbye_layers.push(quickwit_common::tower::BoxLayer::new(layer));
        self
    }
    pub fn stack_ping_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    quickwit_common::ServiceStream<PingRequest>,
                    HelloStream<PingResponse>,
                    crate::HelloError,
                >,
            > + Send + Sync + 'static,
        L::Service: tower::Service<
                quickwit_common::ServiceStream<PingRequest>,
                Response = HelloStream<PingResponse>,
                Error = crate::HelloError,
            > + Clone + Send + Sync + 'static,
        <L::Service as tower::Service<
            quickwit_common::ServiceStream<PingRequest>,
        >>::Future: Send + 'static,
    {
        self.ping_layers.push(quickwit_common::tower::BoxLayer::new(layer));
        self
    }
    pub fn build<T>(self, instance: T) -> HelloClient
    where
        T: Hello,
    {
        let inner_client = InnerHelloClient(std::sync::Arc::new(instance));
        self.build_from_inner_client(inner_client)
    }
    pub fn build_from_channel(
        self,
        addr: std::net::SocketAddr,
        channel: tonic::transport::Channel,
        max_message_size: bytesize::ByteSize,
        compression_encoding_opt: Option<tonic::codec::CompressionEncoding>,
    ) -> HelloClient {
        let client = HelloClient::from_channel(
            addr,
            channel,
            max_message_size,
            compression_encoding_opt,
        );
        let inner_client = client.inner;
        self.build_from_inner_client(inner_client)
    }
    pub fn build_from_balance_channel(
        self,
        balance_channel: quickwit_common::tower::BalanceChannel<std::net::SocketAddr>,
        max_message_size: bytesize::ByteSize,
        compression_encoding_opt: Option<tonic::codec::CompressionEncoding>,
    ) -> HelloClient {
        let client = HelloClient::from_balance_channel(
            balance_channel,
            max_message_size,
            compression_encoding_opt,
        );
        let inner_client = client.inner;
        self.build_from_inner_client(inner_client)
    }
    pub fn build_from_mailbox<A>(
        self,
        mailbox: quickwit_actors::Mailbox<A>,
    ) -> HelloClient
    where
        A: quickwit_actors::Actor + std::fmt::Debug + Send + 'static,
        HelloMailbox<A>: Hello,
    {
        let inner_client = InnerHelloClient(
            std::sync::Arc::new(HelloMailbox::new(mailbox)),
        );
        self.build_from_inner_client(inner_client)
    }
    #[cfg(any(test, feature = "testsuite"))]
    pub fn build_from_mock(self, mock: MockHello) -> HelloClient {
        let client = HelloClient::from_mock(mock);
        let inner_client = client.inner;
        self.build_from_inner_client(inner_client)
    }
    fn build_from_inner_client(self, inner_client: InnerHelloClient) -> HelloClient {
        let hello_svc = self
            .hello_layers
            .into_iter()
            .rev()
            .fold(
                quickwit_common::tower::BoxService::new(inner_client.clone()),
                |svc, layer| layer.layer(svc),
            );
        let goodbye_svc = self
            .goodbye_layers
            .into_iter()
            .rev()
            .fold(
                quickwit_common::tower::BoxService::new(inner_client.clone()),
                |svc, layer| layer.layer(svc),
            );
        let ping_svc = self
            .ping_layers
            .into_iter()
            .rev()
            .fold(
                quickwit_common::tower::BoxService::new(inner_client.clone()),
                |svc, layer| layer.layer(svc),
            );
        let tower_svc_stack = HelloTowerServiceStack {
            inner: inner_client,
            hello_svc,
            goodbye_svc,
            ping_svc,
        };
        HelloClient::new(tower_svc_stack)
    }
}
#[derive(Debug, Clone)]
struct MailboxAdapter<A: quickwit_actors::Actor, E> {
    inner: quickwit_actors::Mailbox<A>,
    phantom: std::marker::PhantomData<E>,
}
impl<A, E> std::ops::Deref for MailboxAdapter<A, E>
where
    A: quickwit_actors::Actor,
{
    type Target = quickwit_actors::Mailbox<A>;
    fn deref(&self) -> &Self::Target {
        &self.inner
    }
}
#[derive(Debug)]
pub struct HelloMailbox<A: quickwit_actors::Actor> {
    inner: MailboxAdapter<A, crate::HelloError>,
}
impl<A: quickwit_actors::Actor> HelloMailbox<A> {
    pub fn new(instance: quickwit_actors::Mailbox<A>) -> Self {
        let inner = MailboxAdapter {
            inner: instance,
            phantom: std::marker::PhantomData,
        };
        Self { inner }
    }
}
impl<A: quickwit_actors::Actor> Clone for HelloMailbox<A> {
    fn clone(&self) -> Self {
        let inner = MailboxAdapter {
            inner: self.inner.clone(),
            phantom: std::marker::PhantomData,
        };
        Self { inner }
    }
}
impl<A, M, T, E> tower::Service<M> for HelloMailbox<A>
where
    A: quickwit_actors::Actor
        + quickwit_actors::DeferableReplyHandler<M, Reply = Result<T, E>> + Send
        + 'static,
    M: std::fmt::Debug + Send + 'static,
    T: Send + 'static,
    E: std::fmt::Debug + Send + 'static,
    crate::HelloError: From<quickwit_actors::AskError<E>>,
{
    type Response = T;
    type Error = crate::HelloError;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        //! This does not work with balance middlewares such as `tower::balance::pool::Pool` because
        //! this always returns `Poll::Ready`. The fix is to acquire a permit from the
        //! mailbox in `poll_ready` and consume it in `call`.
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, message: M) -> Self::Future {
        let mailbox = self.inner.clone();
        let fut = async move {
            mailbox.ask_for_res(message).await.map_err(|error| error.into())
        };
        Box::pin(fut)
    }
}
#[async_trait::async_trait]
impl<A> Hello for HelloMailbox<A>
where
    A: quickwit_actors::Actor + std::fmt::Debug,
    HelloMailbox<
        A,
    >: tower::Service<
            HelloRequest,
            Response = HelloResponse,
            Error = crate::HelloError,
            Future = BoxFuture<HelloResponse, crate::HelloError>,
        >
        + tower::Service<
            GoodbyeRequest,
            Response = GoodbyeResponse,
            Error = crate::HelloError,
            Future = BoxFuture<GoodbyeResponse, crate::HelloError>,
        >
        + tower::Service<
            quickwit_common::ServiceStream<PingRequest>,
            Response = HelloStream<PingResponse>,
            Error = crate::HelloError,
            Future = BoxFuture<HelloStream<PingResponse>, crate::HelloError>,
        >,
{
    async fn hello(&self, request: HelloRequest) -> crate::HelloResult<HelloResponse> {
        self.clone().call(request).await
    }
    async fn goodbye(
        &self,
        request: GoodbyeRequest,
    ) -> crate::HelloResult<GoodbyeResponse> {
        self.clone().call(request).await
    }
    async fn ping(
        &self,
        request: quickwit_common::ServiceStream<PingRequest>,
    ) -> crate::HelloResult<HelloStream<PingResponse>> {
        self.clone().call(request).await
    }
    async fn check_connectivity(&self) -> anyhow::Result<()> {
        if self.inner.is_disconnected() {
            anyhow::bail!("actor `{}` is disconnected", self.inner.actor_instance_id())
        }
        Ok(())
    }
    fn endpoints(&self) -> Vec<quickwit_common::uri::Uri> {
        vec![
            quickwit_common::uri::Uri::from_str(& format!("actor://localhost/{}", self
            .inner.actor_instance_id())).expect("URI should be valid")
        ]
    }
}
#[derive(Debug, Clone)]
pub struct HelloGrpcClientAdapter<T> {
    inner: T,
    #[allow(dead_code)]
    connection_addrs_rx: tokio::sync::watch::Receiver<
        std::collections::HashSet<std::net::SocketAddr>,
    >,
}
impl<T> HelloGrpcClientAdapter<T> {
    pub fn new(
        instance: T,
        connection_addrs_rx: tokio::sync::watch::Receiver<
            std::collections::HashSet<std::net::SocketAddr>,
        >,
    ) -> Self {
        Self {
            inner: instance,
            connection_addrs_rx,
        }
    }
}
#[async_trait::async_trait]
impl<T> Hello for HelloGrpcClientAdapter<hello_grpc_client::HelloGrpcClient<T>>
where
    T: tonic::client::GrpcService<tonic::body::Body> + std::fmt::Debug + Clone + Send
        + Sync + 'static,
    T::ResponseBody: tonic::codegen::Body<Data = tonic::codegen::Bytes> + Send + 'static,
    <T::ResponseBody as tonic::codegen::Body>::Error: Into<tonic::codegen::StdError>
        + Send,
    T::Future: Send,
{
    async fn hello(&self, request: HelloRequest) -> crate::HelloResult<HelloResponse> {
        self.inner
            .clone()
            .hello(request)
            .await
            .map(|response| response.into_inner())
            .map_err(|status| crate::error::grpc_status_to_service_error(
                status,
                HelloRequest::rpc_name(),
            ))
    }
    async fn goodbye(
        &self,
        request: GoodbyeRequest,
    ) -> crate::HelloResult<GoodbyeResponse> {
        self.inner
            .clone()
            .goodbye(request)
            .await
            .map(|response| response.into_inner())
            .map_err(|status| crate::error::grpc_status_to_service_error(
                status,
                GoodbyeRequest::rpc_name(),
            ))
    }
    async fn ping(
        &self,
        request: quickwit_common::ServiceStream<PingRequest>,
    ) -> crate::HelloResult<HelloStream<PingResponse>> {
        self.inner
            .clone()
            .ping(request)
            .await
            .map(|response| {
                let streaming: tonic::Streaming<_> = response.into_inner();
                let stream = quickwit_common::ServiceStream::from(streaming);
                stream
                    .map_err(|status| crate::error::grpc_status_to_service_error(
                        status,
                        PingRequest::rpc_name(),
                    ))
            })
            .map_err(|status| crate::error::grpc_status_to_service_error(
                status,
                PingRequest::rpc_name(),
            ))
    }
    async fn check_connectivity(&self) -> anyhow::Result<()> {
        if self.connection_addrs_rx.borrow().is_empty() {
            anyhow::bail!("no server currently available")
        }
        Ok(())
    }
    fn endpoints(&self) -> Vec<quickwit_common::uri::Uri> {
        self.connection_addrs_rx
            .borrow()
            .iter()
            .flat_map(|addr| quickwit_common::uri::Uri::from_str(
                &format!("grpc://{addr}/{}.{}", "hello", "Hello"),
            ))
            .collect()
    }
}
#[derive(Debug)]
pub struct HelloGrpcServerAdapter {
    inner: InnerHelloClient,
}
impl HelloGrpcServerAdapter {
    pub fn new<T>(instance: T) -> Self
    where
        T: Hello,
    {
        Self {
            inner: InnerHelloClient(std::sync::Arc::new(instance)),
        }
    }
}
#[async_trait::async_trait]
impl hello_grpc_server::HelloGrpc for HelloGrpcServerAdapter {
    async fn hello(
        &self,
        request: tonic::Request<HelloRequest>,
    ) -> Result<tonic::Response<HelloResponse>, tonic::Status> {
        self.inner
            .0
            .hello(request.into_inner())
            .await
            .map(tonic::Response::new)
            .map_err(crate::error::grpc_error_to_grpc_status)
    }
    async fn goodbye(
        &self,
        request: tonic::Request<GoodbyeRequest>,
    ) -> Result<tonic::Response<GoodbyeResponse>, tonic::Status> {
        self.inner
            .0
            .goodbye(request.into_inner())
            .await
            .map(tonic::Response::new)
            .map_err(crate::error::grpc_error_to_grpc_status)
    }
    type PingStream = quickwit_common::ServiceStream<tonic::Result<PingResponse>>;
    async fn ping(
        &self,
        request: tonic::Request<tonic::Streaming<PingRequest>>,
    ) -> Result<tonic::Response<Self::PingStream>, tonic::Status> {
        self.inner
            .0
            .ping({
                let streaming: tonic::Streaming<_> = request.into_inner();
                quickwit_common::ServiceStream::from(streaming)
            })
            .await
            .map(|stream| tonic::Response::new(
                stream.map_err(crate::error::grpc_error_to_grpc_status),
            ))
            .map_err(crate::error::grpc_error_to_grpc_status)
    }
}
/// Generated client implementations.
pub mod hello_grpc_client {
    #![allow(
        unused_variables,
        dead_code,
        missing_docs,
        clippy::wildcard_imports,
        clippy::let_unit_value,
    )]
    use tonic::codegen::*;
    use tonic::codegen::http::Uri;
    #[derive(Debug, Clone)]
    pub struct HelloGrpcClient<T> {
        inner: tonic::client::Grpc<T>,
    }
    impl HelloGrpcClient<tonic::transport::Channel> {
        /// Attempt to create a new client by connecting to a given endpoint.
        pub async fn connect<D>(dst: D) -> Result<Self, tonic::transport::Error>
        where
            D: TryInto<tonic::transport::Endpoint>,
            D::Error: Into<StdError>,
        {
            let conn = tonic::transport::Endpoint::new(dst)?.connect().await?;
            Ok(Self::new(conn))
        }
    }
    impl<T> HelloGrpcClient<T>
    where
        T: tonic::client::GrpcService<tonic::body::Body>,
        T::Error: Into<StdError>,
        T::ResponseBody: Body<Data = Bytes> + std::marker::Send + 'static,
        <T::ResponseBody as Body>::Error: Into<StdError> + std::marker::Send,
    {
        pub fn new(inner: T) -> Self {
            let inner = tonic::client::Grpc::new(inner);
            Self { inner }
        }
        pub fn with_origin(inner: T, origin: Uri) -> Self {
            let inner = tonic::client::Grpc::with_origin(inner, origin);
            Self { inner }
        }
        pub fn with_interceptor<F>(
            inner: T,
            interceptor: F,
        ) -> HelloGrpcClient<InterceptedService<T, F>>
        where
            F: tonic::service::Interceptor,
            T::ResponseBody: Default,
            T: tonic::codegen::Service<
                http::Request<tonic::body::Body>,
                Response = http::Response<
                    <T as tonic::client::GrpcService<tonic::body::Body>>::ResponseBody,
                >,
            >,
            <T as tonic::codegen::Service<
                http::Request<tonic::body::Body>,
            >>::Error: Into<StdError> + std::marker::Send + std::marker::Sync,
        {
            HelloGrpcClient::new(InterceptedService::new(inner, interceptor))
        }
        /// Compress requests with the given encoding.
        ///
        /// This requires the server to support it otherwise it might respond with an
        /// error.
        #[must_use]
        pub fn send_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.inner = self.inner.send_compressed(encoding);
            self
        }
        /// Enable decompressing responses.
        #[must_use]
        pub fn accept_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.inner = self.inner.accept_compressed(encoding);
            self
        }
        /// Limits the maximum size of a decoded message.
        ///
        /// Default: `4MB`
        #[must_use]
        pub fn max_decoding_message_size(mut self, limit: usize) -> Self {
            self.inner = self.inner.max_decoding_message_size(limit);
            self
        }
        /// Limits the maximum size of an encoded message.
        ///
        /// Default: `usize::MAX`
        #[must_use]
        pub fn max_encoding_message_size(mut self, limit: usize) -> Self {
            self.inner = self.inner.max_encoding_message_size(limit);
            self
        }
        /// Says hello.
        pub async fn hello(
            &mut self,
            request: impl tonic::IntoRequest<super::HelloRequest>,
        ) -> std::result::Result<tonic::Response<super::HelloResponse>, tonic::Status> {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static("/hello.Hello/Hello");
            let mut req = request.into_request();
            req.extensions_mut().insert(GrpcMethod::new("hello.Hello", "Hello"));
            self.inner.unary(req, path, codec).await
        }
        /// Says goodbye.
        pub async fn goodbye(
            &mut self,
            request: impl tonic::IntoRequest<super::GoodbyeRequest>,
        ) -> std::result::Result<
            tonic::Response<super::GoodbyeResponse>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static("/hello.Hello/Goodbye");
            let mut req = request.into_request();
            req.extensions_mut().insert(GrpcMethod::new("hello.Hello", "Goodbye"));
            self.inner.unary(req, path, codec).await
        }
        /// Ping pong.
        pub async fn ping(
            &mut self,
            request: impl tonic::IntoStreamingRequest<Message = super::PingRequest>,
        ) -> std::result::Result<
            tonic::Response<tonic::codec::Streaming<super::PingResponse>>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static("/hello.Hello/Ping");
            let mut req = request.into_streaming_request();
            req.extensions_mut().insert(GrpcMethod::new("hello.Hello", "Ping"));
            self.inner.streaming(req, path, codec).await
        }
    }
}
/// Generated server implementations.
pub mod hello_grpc_server {
    #![allow(
        unused_variables,
        dead_code,
        missing_docs,
        clippy::wildcard_imports,
        clippy::let_unit_value,
    )]
    use tonic::codegen::*;
    /// Generated trait containing gRPC methods that should be implemented for use with HelloGrpcServer.
    #[async_trait]
    pub trait HelloGrpc: std::marker::Send + std::marker::Sync + 'static {
        /// Says hello.
        async fn hello(
            &self,
            request: tonic::Request<super::HelloRequest>,
        ) -> std::result::Result<tonic::Response<super::HelloResponse>, tonic::Status>;
        /// Says goodbye.
        async fn goodbye(
            &self,
            request: tonic::Request<super::GoodbyeRequest>,
        ) -> std::result::Result<tonic::Response<super::GoodbyeResponse>, tonic::Status>;
        /// Server streaming response type for the Ping method.
        type PingStream: tonic::codegen::tokio_stream::Stream<
                Item = std::result::Result<super::PingResponse, tonic::Status>,
            >
            + std::marker::Send
            + 'static;
        /// Ping pong.
        async fn ping(
            &self,
            request: tonic::Request<tonic::Streaming<super::PingRequest>>,
        ) -> std::result::Result<tonic::Response<Self::PingStream>, tonic::Status>;
    }
    #[derive(Debug)]
    pub struct HelloGrpcServer<T> {
        inner: Arc<T>,
        accept_compression_encodings: EnabledCompressionEncodings,
        send_compression_encodings: EnabledCompressionEncodings,
        max_decoding_message_size: Option<usize>,
        max_encoding_message_size: Option<usize>,
    }
    impl<T> HelloGrpcServer<T> {
        pub fn new(inner: T) -> Self {
            Self::from_arc(Arc::new(inner))
        }
        pub fn from_arc(inner: Arc<T>) -> Self {
            Self {
                inner,
                accept_compression_encodings: Default::default(),
                send_compression_encodings: Default::default(),
                max_decoding_message_size: None,
                max_encoding_message_size: None,
            }
        }
        pub fn with_interceptor<F>(
            inner: T,
            interceptor: F,
        ) -> InterceptedService<Self, F>
        where
            F: tonic::service::Interceptor,
        {
            InterceptedService::new(Self::new(inner), interceptor)
        }
        /// Enable decompressing requests with the given encoding.
        #[must_use]
        pub fn accept_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.accept_compression_encodings.enable(encoding);
            self
        }
        /// Compress responses with the given encoding, if the client supports it.
        #[must_use]
        pub fn send_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.send_compression_encodings.enable(encoding);
            self
        }
        /// Limits the maximum size of a decoded message.
        ///
        /// Default: `4MB`
        #[must_use]
        pub fn max_decoding_message_size(mut self, limit: usize) -> Self {
            self.max_decoding_message_size = Some(limit);
            self
        }
        /// Limits the maximum size of an encoded message.
        ///
        /// Default: `usize::MAX`
        #[must_use]
        pub fn max_encoding_message_size(mut self, limit: usize) -> Self {
            self.max_encoding_message_size = Some(limit);
            self
        }
    }
    impl<T, B> tonic::codegen::Service<http::Request<B>> for HelloGrpcServer<T>
    where
        T: HelloGrpc,
        B: Body + std::marker::Send + 'static,
        B::Error: Into<StdError> + std::marker::Send + 'static,
    {
        type Response = http::Response<tonic::body::Body>;
        type Error = std::convert::Infallible;
        type Future = BoxFuture<Self::Response, Self::Error>;
        fn poll_ready(
            &mut self,
            _cx: &mut Context<'_>,
        ) -> Poll<std::result::Result<(), Self::Error>> {
            Poll::Ready(Ok(()))
        }
        fn call(&mut self, req: http::Request<B>) -> Self::Future {
            match req.uri().path() {
                "/hello.Hello/Hello" => {
                    #[allow(non_camel_case_types)]
                    struct HelloSvc<T: HelloGrpc>(pub Arc<T>);
                    impl<T: HelloGrpc> tonic::server::UnaryService<super::HelloRequest>
                    for HelloSvc<T> {
                        type Response = super::HelloResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::HelloRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as HelloGrpc>::hello(&inner, request).await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = HelloSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/hello.Hello/Goodbye" => {
                    #[allow(non_camel_case_types)]
                    struct GoodbyeSvc<T: HelloGrpc>(pub Arc<T>);
                    impl<T: HelloGrpc> tonic::server::UnaryService<super::GoodbyeRequest>
                    for GoodbyeSvc<T> {
                        type Response = super::GoodbyeResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::GoodbyeRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as HelloGrpc>::goodbye(&inner, request).await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = GoodbyeSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/hello.Hello/Ping" => {
                    #[allow(non_camel_case_types)]
                    struct PingSvc<T: HelloGrpc>(pub Arc<T>);
                    impl<
                        T: HelloGrpc,
                    > tonic::server::StreamingService<super::PingRequest>
                    for PingSvc<T> {
                        type Response = super::PingResponse;
                        type ResponseStream = T::PingStream;
                        type Future = BoxFuture<
                            tonic::Response<Self::ResponseStream>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<tonic::Streaming<super::PingRequest>>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as HelloGrpc>::ping(&inner, request).await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = PingSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.streaming(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                _ => {
                    Box::pin(async move {
                        let mut response = http::Response::new(
                            tonic::body::Body::default(),
                        );
                        let headers = response.headers_mut();
                        headers
                            .insert(
                                tonic::Status::GRPC_STATUS,
                                (tonic::Code::Unimplemented as i32).into(),
                            );
                        headers
                            .insert(
                                http::header::CONTENT_TYPE,
                                tonic::metadata::GRPC_CONTENT_TYPE,
                            );
                        Ok(response)
                    })
                }
            }
        }
    }
    impl<T> Clone for HelloGrpcServer<T> {
        fn clone(&self) -> Self {
            let inner = self.inner.clone();
            Self {
                inner,
                accept_compression_encodings: self.accept_compression_encodings,
                send_compression_encodings: self.send_compression_encodings,
                max_decoding_message_size: self.max_decoding_message_size,
                max_encoding_message_size: self.max_encoding_message_size,
            }
        }
    }
    /// Generated gRPC service name
    pub const SERVICE_NAME: &str = "hello.Hello";
    impl<T> tonic::server::NamedService for HelloGrpcServer<T> {
        const NAME: &'static str = SERVICE_NAME;
    }
}


================================================
FILE: quickwit/quickwit-codegen/example/src/error.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::fmt;

use quickwit_actors::AskError;
use quickwit_common::tower::TimeoutExceeded;
use quickwit_proto::error::GrpcServiceError;
pub use quickwit_proto::error::{grpc_error_to_grpc_status, grpc_status_to_service_error};
use quickwit_proto::{ServiceError, ServiceErrorCode};
use serde::{Deserialize, Serialize};

// Service errors have to be handwritten before codegen.
#[derive(Debug, thiserror::Error, Serialize, Deserialize)]
pub enum HelloError {
    #[error("internal error: {0}")]
    Internal(String),
    #[error("invalid argument: {0}")]
    InvalidArgument(String),
    #[error("request timed out: {0}")]
    Timeout(String),
    #[error("too many requests")]
    TooManyRequests,
    #[error("service unavailable: {0}")]
    Unavailable(String),
}

impl ServiceError for HelloError {
    fn error_code(&self) -> ServiceErrorCode {
        match self {
            Self::Internal(_) => ServiceErrorCode::Internal,
            Self::InvalidArgument(_) => ServiceErrorCode::BadRequest,
            Self::Timeout(_) => ServiceErrorCode::Timeout,
            Self::TooManyRequests => ServiceErrorCode::TooManyRequests,
            Self::Unavailable(_) => ServiceErrorCode::Unavailable,
        }
    }
}

impl GrpcServiceError for HelloError {
    fn new_internal(message: String) -> Self {
        Self::Internal(message)
    }

    fn new_timeout(message: String) -> Self {
        Self::Timeout(message)
    }

    fn new_too_many_requests() -> Self {
        Self::TooManyRequests
    }

    fn new_unavailable(message: String) -> Self {
        Self::Unavailable(message)
    }
}

impl<E> From<AskError<E>> for HelloError
where E: fmt::Debug
{
    fn from(error: AskError<E>) -> Self {
        HelloError::Internal(format!("{error:?}"))
    }
}

impl From<TimeoutExceeded> for HelloError {
    fn from(_: TimeoutExceeded) -> Self {
        HelloError::Timeout("client".to_string())
    }
}


================================================
FILE: quickwit/quickwit-codegen/example/src/hello.proto
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

syntax = "proto3";

package hello;

message HelloRequest {
    string name = 1;
}

message HelloResponse {
    string message = 1;
}

message GoodbyeRequest {
    string name = 1;
}

message GoodbyeResponse {
    string message = 1;
}

message PingRequest {
    string name = 1;
}

message PingResponse {
    string message = 1;
}

service Hello {
    // Says hello.
    rpc Hello(HelloRequest) returns (HelloResponse);

    // Says goodbye.
    rpc Goodbye(GoodbyeRequest) returns (GoodbyeResponse);

    // Ping pong.
    rpc Ping(stream PingRequest) returns (stream PingResponse);
}


================================================
FILE: quickwit/quickwit-codegen/example/src/lib.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

mod error;

#[path = "codegen/hello.rs"]
mod hello;

use std::sync::Arc;
use std::sync::atomic::{AtomicUsize, Ordering};
use std::task::{Context, Poll};
use std::time::Duration;

use async_trait::async_trait;
use futures::StreamExt;
use quickwit_common::ServiceStream;
use quickwit_common::uri::Uri;
use tower::{Layer, Service};

pub use crate::error::HelloError;
pub use crate::hello::*;

pub type HelloResult<T> = Result<T, HelloError>;

#[derive(Debug, Clone)]
struct Counter<S> {
    counter: Arc<AtomicUsize>,
    inner: S,
}

impl<S, R> Service<R> for Counter<S>
where S: Service<R>
{
    type Response = S::Response;
    type Error = S::Error;
    type Future = S::Future;

    fn poll_ready(&mut self, cx: &mut Context<'_>) -> Poll<Result<(), Self::Error>> {
        self.inner.poll_ready(cx)
    }

    fn call(&mut self, req: R) -> Self::Future {
        self.counter.fetch_add(1, Ordering::Relaxed);
        self.inner.call(req)
    }
}

#[derive(Debug, Clone, Default)]
#[allow(dead_code)]
struct CounterLayer {
    counter: Arc<AtomicUsize>,
}

impl<S> Layer<S> for CounterLayer {
    type Service = Counter<S>;

    fn layer(&self, inner: S) -> Self::Service {
        Counter {
            counter: self.counter.clone(),
            inner,
        }
    }
}

#[allow(dead_code)]
fn spawn_ping_response_stream(
    mut request_stream: ServiceStream<PingRequest>,
) -> ServiceStream<HelloResult<PingResponse>> {
    let (ping_tx, service_stream) = ServiceStream::new_bounded(1);
    let future = async move {
        let mut name = "".to_string();
        let mut interval = tokio::time::interval(Duration::from_millis(100));

        loop {
            tokio::select! {
                request_opt = request_stream.next() => {
                    match request_opt {
                        Some(request) => name = request.name,
                        _ => break,
                    };
                }
                _ = interval.tick() => {
                    if name.is_empty() {
                        continue;
                    }
                    if name == "stop" {
                        break;
                    }
                    if ping_tx.send(Ok(PingResponse {
                        message: format!("Pong, {name}!")
                    })).await.is_err() {
                        break;
                    }
                }
            }
        }
    };
    tokio::spawn(future);
    service_stream
}

#[derive(Debug, Clone, Default)]
#[allow(dead_code)]
struct HelloImpl {
    delay: Duration,
}

#[async_trait]
impl Hello for HelloImpl {
    async fn hello(&self, request: HelloRequest) -> HelloResult<HelloResponse> {
        tokio::time::sleep(self.delay).await;

        if request.name.is_empty() {
            return Err(HelloError::InvalidArgument("name is empty".to_string()));
        }
        Ok(HelloResponse {
            message: format!("Hello, {}!", request.name),
        })
    }

    async fn goodbye(&self, request: GoodbyeRequest) -> HelloResult<GoodbyeResponse> {
        tokio::time::sleep(self.delay).await;

        Ok(GoodbyeResponse {
            message: format!("Goodbye, {}!", request.name),
        })
    }

    async fn ping(
        &self,
        request: ServiceStream<PingRequest>,
    ) -> HelloResult<HelloStream<PingResponse>> {
        Ok(spawn_ping_response_stream(request))
    }

    async fn check_connectivity(&self) -> anyhow::Result<()> {
        Ok(())
    }

    fn endpoints(&self) -> Vec<Uri> {
        Vec::new()
    }
}

#[cfg(test)]
mod tests {
    use std::fmt;
    use std::net::SocketAddr;
    use std::str::FromStr;
    use std::sync::atomic::Ordering;

    use bytesize::ByteSize;
    use quickwit_actors::{Actor, ActorContext, ActorExitStatus, Handler, Universe};
    use quickwit_common::tower::{BalanceChannel, Change, TimeoutLayer};
    use tokio::sync::mpsc::error::TrySendError;
    use tokio_stream::StreamExt;
    use tonic::codec::CompressionEncoding;
    use tonic::transport::{Endpoint, Server};
    use tonic::{Code, Status};

    use super::*;
    use crate::hello::MockHello;
    use crate::hello::hello_grpc_server::HelloGrpcServer;
    use crate::hello_grpc_client::HelloGrpcClient;
    use crate::{CounterLayer, GoodbyeRequest, GoodbyeResponse};

    const MAX_GRPC_MESSAGE_SIZE: ByteSize = ByteSize::mib(1);

    #[tokio::test]
    async fn test_hello_codegen() {
        let hello = HelloImpl::default();

        assert_eq!(
            hello
                .hello(HelloRequest {
                    name: "World".to_string()
                })
                .await
                .unwrap(),
            HelloResponse {
                message: "Hello, World!".to_string()
            }
        );

        let client = HelloClient::new(hello.clone()).clone();

        assert_eq!(
            client
                .hello(HelloRequest {
                    name: "World".to_string()
                })
                .await
                .unwrap(),
            HelloResponse {
                message: "Hello, World!".to_string()
            }
        );

        let (ping_stream_tx, ping_stream) = ServiceStream::new_bounded(1);
        let mut pong_stream = client.ping(ping_stream).await.unwrap();

        ping_stream_tx
            .try_send(PingRequest {
                name: "World".to_string(),
            })
            .unwrap();
        assert_eq!(
            pong_stream.next().await.unwrap().unwrap().message,
            "Pong, World!"
        );
        ping_stream_tx
            .try_send(PingRequest {
                name: "Mundo".to_string(),
            })
            .unwrap();
        assert_eq!(
            pong_stream.next().await.unwrap().unwrap().message,
            "Pong, Mundo!"
        );
        ping_stream_tx
            .try_send(PingRequest {
                name: "stop".to_string(),
            })
            .unwrap();
        assert!(pong_stream.next().await.is_none());

        let error = ping_stream_tx
            .try_send(PingRequest {
                name: "stop".to_string(),
            })
            .unwrap_err();
        assert!(matches!(error, TrySendError::Closed(_)));

        let mut mock_hello = MockHello::new();

        mock_hello.expect_hello().returning(|_| {
            Ok(HelloResponse {
                message: "Hello, Mock!".to_string(),
            })
        });

        assert_eq!(
            mock_hello
                .hello(HelloRequest {
                    name: "".to_string()
                })
                .await
                .unwrap(),
            HelloResponse {
                message: "Hello, Mock!".to_string()
            }
        );
    }

    #[tokio::test]
    async fn test_hello_codegen_grpc() {
        let grpc_server =
            HelloClient::new(HelloImpl::default()).as_grpc_service(MAX_GRPC_MESSAGE_SIZE);
        let addr: SocketAddr = "127.0.0.1:6666".parse().unwrap();

        tokio::spawn({
            async move {
                Server::builder()
                    .add_service(grpc_server)
                    .serve(addr)
                    .await
                    .unwrap();
            }
        });
        let channel = BalanceChannel::from_channel(
            "127.0.0.1:6666".parse().unwrap(),
            Endpoint::from_static("http://127.0.0.1:6666").connect_lazy(),
        );
        let grpc_client = HelloClient::from_balance_channel(channel, MAX_GRPC_MESSAGE_SIZE, None);

        assert_eq!(
            grpc_client
                .hello(HelloRequest {
                    name: "gRPC client".to_string()
                })
                .await
                .unwrap(),
            HelloResponse {
                message: "Hello, gRPC client!".to_string()
            }
        );

        assert!(matches!(
            grpc_client
                .hello(HelloRequest {
                    name: "".to_string()
                })
                .await
                .unwrap_err(),
            HelloError::InvalidArgument(_)
        ));

        let (ping_stream_tx, ping_stream) = ServiceStream::new_bounded(1);
        let mut pong_stream = grpc_client.ping(ping_stream).await.unwrap();

        ping_stream_tx
            .try_send(PingRequest {
                name: "gRPC client".to_string(),
            })
            .unwrap();
        assert_eq!(
            pong_stream.next().await.unwrap().unwrap().message,
            "Pong, gRPC client!"
        );

        ping_stream_tx
            .try_send(PingRequest {
                name: "stop".to_string(),
            })
            .unwrap();
        assert!(pong_stream.next().await.is_none());

        let error = ping_stream_tx
            .try_send(PingRequest {
                name: "stop".to_string(),
            })
            .unwrap_err();
        assert!(matches!(error, TrySendError::Closed(_)));

        grpc_client.check_connectivity().await.unwrap();
        assert_eq!(
            grpc_client.endpoints(),
            vec![Uri::from_str("grpc://127.0.0.1:6666/hello.Hello").unwrap()]
        );

        // The connectivity check fails if there is no client behind the channel.
        let (balance_channel, _): (BalanceChannel<SocketAddr>, _) = BalanceChannel::new();
        let grpc_client =
            HelloClient::from_balance_channel(balance_channel, MAX_GRPC_MESSAGE_SIZE, None);
        assert_eq!(
            grpc_client
                .check_connectivity()
                .await
                .unwrap_err()
                .to_string(),
            "no server currently available"
        );
    }

    #[tokio::test]
    async fn test_hello_codegen_grpc_with_compression() {
        #[derive(Debug, Clone)]
        struct CheckCompression<S> {
            inner: S,
        }

        impl<S, ReqBody, ResBody> Service<http::Request<ReqBody>> for CheckCompression<S>
        where
            S: Service<http::Request<ReqBody>, Response = http::Response<ResBody>>
                + Clone
                + Send
                + 'static,
            S::Future: Send + 'static,
            ReqBody: Send + 'static,
        {
            type Response = S::Response;
            type Error = S::Error;
            type Future = BoxFuture<Self::Response, Self::Error>;

            fn poll_ready(&mut self, cx: &mut Context<'_>) -> Poll<Result<(), Self::Error>> {
                self.inner.poll_ready(cx)
            }

            fn call(&mut self, request: http::Request<ReqBody>) -> Self::Future {
                let Some(grpc_encoding) = request.headers().get("grpc-encoding") else {
                    panic!("request should be compressed");
                };
                assert!(grpc_encoding.to_str().unwrap().contains("zstd"));

                let Some(grpc_accept_encoding) = request.headers().get("grpc-accept-encoding")
                else {
                    panic!("client should accept compressed responses");
                };
                assert!(grpc_accept_encoding.to_str().unwrap().contains("zstd"));
                let fut = self.inner.call(request);

                Box::pin(async move {
                    let response = fut.await?;

                    let grpc_status_code = Status::from_header_map(response.headers())
                        .map(|status| status.code())
                        .unwrap_or(Code::Ok);

                    if grpc_status_code == Code::Ok {
                        let Some(grpc_encoding) = response.headers().get("grpc-encoding") else {
                            panic!("response should be compressed");
                        };
                        assert!(grpc_encoding.to_str().unwrap().contains("zstd"));
                    }
                    Ok(response)
                })
            }
        }

        #[derive(Debug, Clone)]
        struct CheckCompressionLayer;

        impl<S> Layer<S> for CheckCompressionLayer {
            type Service = CheckCompression<S>;

            fn layer(&self, inner: S) -> Self::Service {
                Self::Service { inner }
            }
        }

        let grpc_server =
            HelloClient::new(HelloImpl::default()).as_grpc_service(MAX_GRPC_MESSAGE_SIZE);
        let addr: SocketAddr = "127.0.0.1:33333".parse().unwrap();

        tokio::spawn({
            async move {
                Server::builder()
                    .layer(CheckCompressionLayer)
                    .add_service(grpc_server)
                    .serve(addr)
                    .await
                    .unwrap();
            }
        });
        let channel = BalanceChannel::from_channel(
            "127.0.0.1:33333".parse().unwrap(),
            Endpoint::from_static("http://127.0.0.1:33333").connect_lazy(),
        );
        let grpc_client = HelloClient::from_balance_channel(
            channel,
            MAX_GRPC_MESSAGE_SIZE,
            Some(CompressionEncoding::Zstd),
        );

        assert_eq!(
            grpc_client
                .hello(HelloRequest {
                    name: "gRPC client".to_string()
                })
                .await
                .unwrap(),
            HelloResponse {
                message: "Hello, gRPC client!".to_string()
            }
        );

        assert!(matches!(
            grpc_client
                .hello(HelloRequest {
                    name: "".to_string()
                })
                .await
                .unwrap_err(),
            HelloError::InvalidArgument(_)
        ));

        let (ping_stream_tx, ping_stream) = ServiceStream::new_bounded(1);
        let mut pong_stream = grpc_client.ping(ping_stream).await.unwrap();

        ping_stream_tx
            .try_send(PingRequest {
                name: "gRPC client".to_string(),
            })
            .unwrap();
        assert_eq!(
            pong_stream.next().await.unwrap().unwrap().message,
            "Pong, gRPC client!"
        );

        ping_stream_tx
            .try_send(PingRequest {
                name: "stop".to_string(),
            })
            .unwrap();
        assert!(pong_stream.next().await.is_none());

        let error = ping_stream_tx
            .try_send(PingRequest {
                name: "stop".to_string(),
            })
            .unwrap_err();
        assert!(matches!(error, TrySendError::Closed(_)));
    }

    #[tokio::test]
    async fn test_hello_codegen_actor() {
        #[derive(Debug)]
        struct HelloActor;

        impl Actor for HelloActor {
            type ObservableState = ();

            fn observable_state(&self) -> Self::ObservableState {}
        }

        #[async_trait]
        impl Handler<HelloRequest> for HelloActor {
            type Reply = HelloResult<HelloResponse>;

            async fn handle(
                &mut self,
                message: HelloRequest,
                _ctx: &ActorContext<Self>,
            ) -> Result<Self::Reply, ActorExitStatus> {
                Ok(Ok(HelloResponse {
                    message: format!("Hello, {}!", message.name),
                }))
            }
        }

        #[async_trait]
        impl Handler<GoodbyeRequest> for HelloActor {
            type Reply = HelloResult<GoodbyeResponse>;

            async fn handle(
                &mut self,
                message: GoodbyeRequest,
                _ctx: &ActorContext<Self>,
            ) -> Result<Self::Reply, ActorExitStatus> {
                Ok(Ok(GoodbyeResponse {
                    message: format!("Goodbye, {}!", message.name),
                }))
            }
        }

        #[async_trait]
        impl Handler<ServiceStream<PingRequest>> for HelloActor {
            type Reply = HelloResult<HelloStream<PingResponse>>;

            async fn handle(
                &mut self,
                message: ServiceStream<PingRequest>,
                _ctx: &ActorContext<Self>,
            ) -> Result<Self::Reply, ActorExitStatus> {
                Ok(Ok(spawn_ping_response_stream(message)))
            }
        }

        let universe = Universe::new();
        let hello_actor = HelloActor;
        let (actor_mailbox, _actor_handle) = universe.spawn_builder().spawn(hello_actor);
        let actor_client = HelloClient::from_mailbox(actor_mailbox.clone());

        assert_eq!(
            actor_client
                .hello(HelloRequest {
                    name: "beautiful actor".to_string()
                })
                .await
                .unwrap(),
            HelloResponse {
                message: "Hello, beautiful actor!".to_string()
            }
        );

        actor_client.check_connectivity().await.unwrap();
        assert_eq!(
            actor_client.endpoints(),
            vec![
                Uri::from_str(&format!(
                    "actor://localhost/{}",
                    actor_mailbox.actor_instance_id()
                ))
                .unwrap()
            ]
        );

        let (ping_stream_tx, ping_stream) = ServiceStream::new_bounded(1);
        let mut pong_stream = actor_client.ping(ping_stream).await.unwrap();

        ping_stream_tx
            .try_send(PingRequest {
                name: "beautiful actor".to_string(),
            })
            .unwrap();
        assert_eq!(
            pong_stream.next().await.unwrap().unwrap().message,
            "Pong, beautiful actor!"
        );

        let hello_tower = HelloClient::tower().build_from_mailbox(actor_mailbox);

        assert_eq!(
            hello_tower
                .hello(HelloRequest {
                    name: "Tower actor".to_string()
                })
                .await
                .unwrap(),
            HelloResponse {
                message: "Hello, Tower actor!".to_string()
            }
        );

        assert_eq!(
            hello_tower
                .goodbye(GoodbyeRequest {
                    name: "Tower actor".to_string()
                })
                .await
                .unwrap(),
            GoodbyeResponse {
                message: "Goodbye, Tower actor!".to_string()
            }
        );

        let (ping_stream_tx, ping_stream) = ServiceStream::new_bounded(1);
        let mut pong_stream = actor_client.ping(ping_stream).await.unwrap();

        ping_stream_tx
            .try_send(PingRequest {
                name: "beautiful Tower actor".to_string(),
            })
            .unwrap();
        assert_eq!(
            pong_stream.next().await.unwrap().unwrap().message,
            "Pong, beautiful Tower actor!"
        );

        universe.assert_quit().await;

        actor_client.check_connectivity().await.unwrap_err();
    }

    #[tokio::test]
    async fn test_hello_codegen_tower_stack_layers() {
        let layer = CounterLayer::default();
        let hello_layer = CounterLayer::default();
        let goodbye_layer = CounterLayer::default();
        let ping_layer = CounterLayer::default();

        let hello_tower = HelloClient::tower()
            .stack_layer(layer.clone())
            .stack_hello_layer(hello_layer.clone())
            .stack_goodbye_layer(goodbye_layer.clone())
            .stack_ping_layer(ping_layer.clone())
            .build(HelloImpl::default());

        hello_tower
            .hello(HelloRequest {
                name: "Tower".to_string(),
            })
            .await
            .unwrap();

        hello_tower
            .goodbye(GoodbyeRequest {
                name: "Tower".to_string(),
            })
            .await
            .unwrap();

        let (ping_stream_tx, ping_stream) = ServiceStream::new_bounded(1);
        let mut pong_stream = hello_tower.ping(ping_stream).await.unwrap();

        ping_stream_tx
            .try_send(PingRequest {
                name: "Tower".to_string(),
            })
            .unwrap();
        assert_eq!(
            pong_stream.next().await.unwrap().unwrap().message,
            "Pong, Tower!"
        );

        assert_eq!(layer.counter.load(Ordering::Relaxed), 3);
        assert_eq!(hello_layer.counter.load(Ordering::Relaxed), 1);
        assert_eq!(goodbye_layer.counter.load(Ordering::Relaxed), 1);
        assert_eq!(ping_layer.counter.load(Ordering::Relaxed), 1);
    }

    #[tokio::test]
    async fn test_hello_codegen_tower_stack_layer_ordering() {
        trait AppendSuffix {
            fn append_suffix(&mut self, suffix: &'static str);
        }

        impl AppendSuffix for HelloRequest {
            fn append_suffix(&mut self, suffix: &'static str) {
                self.name.push_str(suffix);
            }
        }

        impl AppendSuffix for GoodbyeRequest {
            fn append_suffix(&mut self, suffix: &'static str) {
                self.name.push_str(suffix);
            }
        }

        impl AppendSuffix for PingRequest {
            fn append_suffix(&mut self, suffix: &'static str) {
                self.name.push_str(suffix);
            }
        }

        impl AppendSuffix for ServiceStream<PingRequest> {
            fn append_suffix(&mut self, _suffix: &'static str) {}
        }

        #[derive(Debug, Clone)]
        struct AppendSuffixService<S> {
            inner: S,
            suffix: &'static str,
        }

        impl<S, R> Service<R> for AppendSuffixService<S>
        where
            S: Service<R, Error = HelloError>,
            S::Response: fmt::Debug,
            S::Future: Send + 'static,
            R: AppendSuffix,
        {
            type Response = S::Response;
            type Error = HelloError;
            type Future = BoxFuture<S::Response, S::Error>;

            fn poll_ready(&mut self, cx: &mut Context<'_>) -> Poll<Result<(), Self::Error>> {
                self.inner.poll_ready(cx)
            }

            fn call(&mut self, mut req: R) -> Self::Future {
                req.append_suffix(self.suffix);
                let inner = self.inner.call(req);
                Box::pin(inner)
            }
        }

        #[derive(Debug, Clone)]
        struct AppendSuffixLayer {
            suffix: &'static str,
        }

        impl AppendSuffixLayer {
            fn new(suffix: &'static str) -> Self {
                Self { suffix }
            }
        }

        impl<S> Layer<S> for AppendSuffixLayer {
            type Service = AppendSuffixService<S>;

            fn layer(&self, inner: S) -> Self::Service {
                AppendSuffixService {
                    inner,
                    suffix: self.suffix,
                }
            }
        }
        let hello_tower = HelloClient::tower()
            .stack_layer(AppendSuffixLayer::new("->foo"))
            .stack_hello_layer(AppendSuffixLayer::new("->bar"))
            .stack_layer(AppendSuffixLayer::new("->qux"))
            .stack_hello_layer(AppendSuffixLayer::new("->tox"))
            .stack_goodbye_layer(AppendSuffixLayer::new("->moo"))
            .build(HelloImpl::default());

        let response = hello_tower
            .hello(HelloRequest {
                name: "".to_string(),
            })
            .await
            .unwrap();
        assert_eq!(response.message, "Hello, ->foo->bar->qux->tox!");

        let response = hello_tower
            .goodbye(GoodbyeRequest {
                name: "".to_string(),
            })
            .await
            .unwrap();
        assert_eq!(response.message, "Goodbye, ->foo->qux->moo!");
    }

    #[tokio::test]
    async fn test_from_channel() {
        let balance_channed = BalanceChannel::from_channel(
            "127.0.0.1:7777".parse().unwrap(),
            Endpoint::from_static("http://127.0.0.1:7777").connect_lazy(),
        );
        HelloClient::from_balance_channel(balance_channed, MAX_GRPC_MESSAGE_SIZE, None);
    }

    #[tokio::test]
    async fn test_balance_channel() {
        let hello = HelloImpl::default();
        let grpc_server_adapter = HelloGrpcServerAdapter::new(hello);
        let grpc_server = HelloGrpcServer::new(grpc_server_adapter);
        let addr: SocketAddr = "127.0.0.1:11111".parse().unwrap();

        tokio::spawn({
            async move {
                Server::builder()
                    .add_service(grpc_server)
                    .serve(addr)
                    .await
                    .unwrap();
            }
        });
        let (balance_channel, balance_channel_tx) = BalanceChannel::new();
        let channel = Endpoint::from_static("http://127.0.0.1:11111").connect_lazy();
        balance_channel_tx
            .send(Change::Insert("foo", channel))
            .unwrap();

        let mut grpc_client = HelloGrpcClient::new(balance_channel.clone());

        assert_eq!(
            grpc_client
                .hello(HelloRequest {
                    name: "Client".to_string()
                })
                .await
                .unwrap()
                .into_inner(),
            HelloResponse {
                message: "Hello, Client!".to_string()
            }
        );
        assert_eq!(balance_channel.num_connections(), 1);
    }

    #[tokio::test]
    async fn test_hello_codegen_mock() {
        let mut mock_hello = MockHello::new();
        mock_hello.expect_hello().returning(|_| {
            Ok(HelloResponse {
                message: "Hello, mock!".to_string(),
            })
        });
        mock_hello.expect_check_connectivity().returning(|| Ok(()));
        let hello = HelloClient::from_mock(mock_hello);

        assert_eq!(
            hello
                .hello(HelloRequest {
                    name: "World".to_string()
                })
                .await
                .unwrap(),
            HelloResponse {
                message: "Hello, mock!".to_string()
            }
        );
        assert_eq!(
            hello
                .clone()
                .hello(HelloRequest {
                    name: "World".to_string()
                })
                .await
                .unwrap(),
            HelloResponse {
                message: "Hello, mock!".to_string()
            }
        );
        hello.check_connectivity().await.unwrap();
    }

    #[tokio::test]
    async fn test_transport_errors_handling() {
        quickwit_common::setup_logging_for_tests();

        let addr: SocketAddr = "127.0.0.1:9999".parse().unwrap();
        let channel = Endpoint::from_static("http://127.0.0.1:9999")
            .timeout(Duration::from_millis(100))
            .connect_lazy();
        let max_message_size = ByteSize::mib(1);
        let grpc_client = HelloClient::from_channel(addr, channel, max_message_size, None);

        let error = grpc_client
            .hello(HelloRequest {
                name: "Client".to_string(),
            })
            .await
            .unwrap_err();
        assert!(matches!(error, HelloError::Unavailable(_)));

        let hello = HelloImpl {
            delay: Duration::from_secs(1),
        };
        let grpc_server_adapter = HelloGrpcServerAdapter::new(hello);
        let grpc_server: HelloGrpcServer<HelloGrpcServerAdapter> =
            HelloGrpcServer::new(grpc_server_adapter);
        let addr: SocketAddr = "127.0.0.1:9999".parse().unwrap();

        tokio::spawn({
            async move {
                Server::builder()
                    .add_service(grpc_server)
                    .serve(addr)
                    .await
                    .unwrap();
            }
        });
        let error = grpc_client
            .hello(HelloRequest {
                name: "Client".to_string(),
            })
            .await
            .unwrap_err();
        assert!(matches!(error, HelloError::Timeout(_)));
    }

    #[tokio::test]
    async fn test_balanced_channel_timeout_with_server_crash() {
        let addr_str = "127.0.0.1:11112";
        let addr: SocketAddr = addr_str.parse().unwrap();
        // We want to abruptly stop a server without even sending the connection
        // RST packet. Simply dropping the tonic Server is not enough, so we
        // spawn a thread and freeze it with thread::park().
        std::thread::spawn(move || {
            let server_fut = async {
                let hello = HelloImpl {
                    // delay the response so that the server freezes in the middle of the request
                    delay: Duration::from_millis(1000),
                };
                let grpc_server_adapter = HelloGrpcServerAdapter::new(hello);
                let grpc_server = HelloGrpcServer::new(grpc_server_adapter);
                tokio::select! {
                    // wait just enough to let the client perform its request
                    _ = tokio::time::sleep(Duration::from_millis(100)) => {}
                    _ = Server::builder().add_service(grpc_server).serve(addr) => {}
                };
                std::thread::park();
                println!("Thread unparked, unexpected");
            };
            tokio::runtime::Builder::new_current_thread()
                .enable_all()
                .build()
                .unwrap()
                .block_on(server_fut);
        });

        // create a client that will try to connect to the server
        let (balance_channel, balance_channel_tx) = BalanceChannel::new();
        let channel = Endpoint::from_str(&format!("http://{addr_str}"))
            .unwrap()
            .connect_lazy();
        balance_channel_tx
            .send(Change::Insert(addr, channel))
            .unwrap();

        let grpc_client = HelloClient::tower()
            // this test hangs forever if we comment out the TimeoutLayer, which
            // shows that a request without explicit timeout might hang forever
            .stack_layer(TimeoutLayer::new(Duration::from_secs(3)))
            .build_from_balance_channel(balance_channel, ByteSize::mib(1), None);

        let response_fut = async move {
            grpc_client
                .hello(HelloRequest {
                    name: "World".to_string(),
                })
                .await
        };
        response_fut
            .await
            .expect_err("should have timed out at the client level");
    }
}


================================================
FILE: quickwit/quickwit-codegen/src/codegen.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use anyhow::ensure;
use heck::{ToSnakeCase, ToUpperCamelCase};
use proc_macro2::TokenStream;
use prost_build::{Comments, Method, Service, ServiceGenerator};
use quote::{ToTokens, quote};
use syn::{Ident, parse_quote};

use crate::ProstConfig;

pub struct Codegen;

impl Codegen {
    pub fn run(mut args: CodegenBuilder) -> anyhow::Result<()> {
        let service_generator = Box::new(QuickwitServiceGenerator::new(
            args.result_type_path,
            args.error_type_path,
            args.generate_extra_service_methods,
            args.generate_prom_labels_for_requests,
        ));
        args.prost_config
            .protoc_arg("--experimental_allow_proto3_optional")
            .type_attribute(
                ".",
                "#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]",
            )
            .field_attribute(
                "DocBatch.doc_buffer",
                "#[schema(value_type = String, format = Binary)]",
            )
            .enum_attribute(".", "#[serde(rename_all=\"snake_case\")]")
            .service_generator(service_generator)
            .out_dir(args.output_dir);

        for proto in args.protos {
            println!("cargo:rerun-if-changed={proto}");
            args.prost_config.compile_protos(&[proto], &args.includes)?;
        }
        Ok(())
    }

    pub fn builder() -> CodegenBuilder {
        CodegenBuilder::default()
    }
}

#[derive(Default)]
pub struct CodegenBuilder {
    protos: Vec<String>,
    includes: Vec<String>,
    output_dir: String,
    prost_config: ProstConfig,
    result_type_path: String,
    error_type_path: String,
    generate_extra_service_methods: bool,
    generate_prom_labels_for_requests: bool,
}

impl CodegenBuilder {
    pub fn with_protos(mut self, protos: &[&str]) -> Self {
        self.protos = protos.iter().map(|proto| proto.to_string()).collect();
        self
    }

    pub fn with_includes(mut self, includes: &[&str]) -> Self {
        self.includes = includes.iter().map(|include| include.to_string()).collect();
        self
    }

    pub fn with_output_dir(mut self, path: &str) -> Self {
        self.output_dir = path.to_string();
        self
    }

    pub fn with_result_type_path(mut self, path: &str) -> Self {
        self.result_type_path = path.to_string();
        self
    }

    pub fn with_error_type_path(mut self, path: &str) -> Self {
        self.error_type_path = path.to_string();
        self
    }

    pub fn with_prost_config(mut self, prost_config: ProstConfig) -> Self {
        self.prost_config = prost_config;
        self
    }

    pub fn generate_extra_service_methods(mut self) -> Self {
        self.generate_extra_service_methods = true;
        self
    }

    /// Generates `RpcName` trait implementations for request types.
    pub fn generate_rpc_name_impls(mut self) -> Self {
        self.generate_prom_labels_for_requests = true;
        self
    }

    pub fn run(self) -> anyhow::Result<()> {
        ensure!(!self.protos.is_empty(), "proto file list is empty");
        ensure!(!self.output_dir.is_empty(), "output directory is undefined");
        ensure!(!self.result_type_path.is_empty(),);
        ensure!(!self.error_type_path.is_empty(), "error type is undefined");

        Codegen::run(self)
    }
}

struct QuickwitServiceGenerator {
    result_type_path: String,
    error_type_path: String,
    generate_extra_service_methods: bool,
    generate_prom_labels_for_requests: bool,
    inner: Box<dyn ServiceGenerator>,
}

impl QuickwitServiceGenerator {
    fn new(
        result_type_path: String,
        error_type_path: String,
        generate_extra_service_methods: bool,
        generate_prom_labels_for_requests: bool,
    ) -> Self {
        let inner = Box::new(WithSuffixServiceGenerator::new(
            "Grpc",
            tonic_prost_build::configure().service_generator(),
        ));
        Self {
            result_type_path,
            error_type_path,
            generate_extra_service_methods,
            generate_prom_labels_for_requests,
            inner,
        }
    }
}

impl ServiceGenerator for QuickwitServiceGenerator {
    fn generate(&mut self, service: Service, buf: &mut String) {
        let tokens = generate_all(
            &service,
            &self.result_type_path,
            &self.error_type_path,
            self.generate_extra_service_methods,
            self.generate_prom_labels_for_requests,
        );
        let ast: syn::File = syn::parse2(tokens).expect("Tokenstream should be a valid Syn AST.");
        let pretty_code = prettyplease::unparse(&ast);
        buf.push_str(&pretty_code);

        self.inner.generate(service, buf)
    }

    fn finalize(&mut self, buf: &mut String) {
        self.inner.finalize(buf);
    }
}

struct CodegenContext {
    package_name: String,
    service_name: Ident,
    result_type: syn::Path,
    error_type: syn::Path,
    stream_type: Ident,
    stream_type_alias: TokenStream,
    methods: Vec<SynMethod>,
    client_name: Ident,
    inner_client_name: Ident,
    tower_svc_stack_name: Ident,
    tower_layer_stack_name: Ident,
    mailbox_name: Ident,
    mock_mod_name: Ident,
    mock_name: Ident,
    grpc_client_name: Ident,
    grpc_client_adapter_name: Ident,
    grpc_client_package_name: Ident,
    grpc_server_name: Ident,
    grpc_server_adapter_name: Ident,
    grpc_server_package_name: Ident,
    grpc_service_name: Ident,
    generate_extra_service_methods: bool,
}

impl CodegenContext {
    fn from_service(
        service: &Service,
        result_type_path: &str,
        error_type_path: &str,
        generate_extra_service_methods: bool,
    ) -> Self {
        let service_name = quote::format_ident!("{}", service.name);
        let mock_mod_name = quote::format_ident!("mock_{}", service.name.to_snake_case());
        let mock_name = quote::format_ident!("Mock{}", service.name);

        let result_type = syn::parse_str::<syn::Path>(result_type_path)
            .expect("Result path should be a valid result path such as `crate::HelloResult`.");
        let error_type = syn::parse_str::<syn::Path>(error_type_path)
            .expect("Error path should be a valid result path such as `crate::error::HelloError`.");
        let stream_type = quote::format_ident!("{}Stream", service.name);
        let stream_type_alias = if service.methods.iter().any(|method| method.server_streaming) {
            quote! {
                pub type #stream_type<T> = quickwit_common::ServiceStream<#result_type<T>>;
            }
        } else {
            TokenStream::new()
        };

        let methods = SynMethod::parse_prost_methods(&service.methods);

        let client_name = quote::format_ident!("{}Client", service.name);
        let inner_client_name = quote::format_ident!("Inner{}", client_name);
        let tower_svc_stack_name = quote::format_ident!("{}TowerServiceStack", service.name);
        let tower_layer_stack_name = quote::format_ident!("{}TowerLayerStack", service.name);
        let mailbox_name = quote::format_ident!("{}Mailbox", service.name);

        let grpc_client_name = quote::format_ident!("{}GrpcClient", service.name);
        let grpc_client_adapter_name = quote::format_ident!("{}GrpcClientAdapter", service.name);
        let grpc_client_package_name =
            quote::format_ident!("{}_grpc_client", service.name.to_snake_case());
        let package_name = service.package.clone();

        let grpc_server_name = quote::format_ident!("{}GrpcServer", service.name);
        let grpc_server_adapter_name = quote::format_ident!("{}GrpcServerAdapter", service.name);
        let grpc_server_package_name =
            quote::format_ident!("{}_grpc_server", service.name.to_snake_case());

        let grpc_service_name = quote::format_ident!("{}Grpc", service.name);

        Self {
            package_name,
            service_name,
            result_type,
            error_type,
            stream_type,
            stream_type_alias,
            methods,
            client_name,
            inner_client_name,
            tower_svc_stack_name,
            tower_layer_stack_name,
            mailbox_name,
            mock_mod_name,
            mock_name,
            grpc_client_name,
            grpc_client_adapter_name,
            grpc_client_package_name,
            grpc_server_name,
            grpc_server_adapter_name,
            grpc_server_package_name,
            grpc_service_name,
            generate_extra_service_methods,
        }
    }
}

fn generate_all(
    service: &Service,
    result_type_path: &str,
    error_type_path: &str,
    generate_extra_service_methods: bool,
    generate_prom_labels_for_requests: bool,
) -> TokenStream {
    let context = CodegenContext::from_service(
        service,
        result_type_path,
        error_type_path,
        generate_extra_service_methods,
    );
    let stream_type_alias = &context.stream_type_alias;
    let service_trait = generate_service_trait(&context);
    let client = generate_client(&context);
    let tower_services = generate_tower_services(&context);
    let tower_svc_stack = generate_tower_svc_stack(&context);
    let tower_layer_stack = generate_tower_layer_stack(&context);
    let tower_mailbox = generate_tower_mailbox(&context);
    let grpc_client_adapter = generate_grpc_client_adapter(&context);
    let grpc_server_adapter = generate_grpc_server_adapter(&context);
    let prom_labels_impl = if generate_prom_labels_for_requests {
        generate_prom_labels_impl_for_requests(&context)
    } else {
        TokenStream::new()
    };

    quote! {
        // The line below is necessary to opt out of the license header check.
        /// BEGIN quickwit-codegen
        #[allow(unused_imports)]
        use std::str::FromStr;
        use tower::{Layer, Service, ServiceExt};
        #prom_labels_impl

        #stream_type_alias

        #service_trait

        #client

        pub type BoxFuture<T, E> = std::pin::Pin<Box<dyn std::future::Future<Output = Result<T, E>> + Send + 'static>>;

        #tower_services

        #tower_svc_stack

        #tower_layer_stack

        #tower_mailbox

        #grpc_client_adapter

        #grpc_server_adapter
    }
}

struct SynMethod {
    name: Ident,
    proto_name: Ident,
    comments: Vec<syn::Attribute>,
    request_type: syn::Path,
    response_type: syn::Path,
    client_streaming: bool,
    server_streaming: bool,
}

impl SynMethod {
    fn request_type(&self, mock: bool) -> TokenStream {
        let request_type = if mock {
            let request_type = &self.request_type;
            quote! { super::#request_type }
        } else {
            self.request_type.to_token_stream()
        };
        if self.client_streaming {
            quote! { quickwit_common::ServiceStream<#request_type> }
        } else {
            request_type
        }
    }

    fn rpc_name(&self, mock: bool) -> TokenStream {
        let request_type = &self.request_type;

        if mock {
            quote! { super::#request_type::rpc_name() }
        } else {
            quote! { #request_type::rpc_name() }
        }
    }

    fn response_type(&self, context: &CodegenContext, mock: bool) -> TokenStream {
        let response_type = if mock {
            let response_type = &self.response_type;
            quote! { super::#response_type }
        } else {
            self.response_type.to_token_stream()
        };
        if self.server_streaming {
            let stream_type = &context.stream_type;
            quote! { #stream_type<#response_type> }
        } else {
            response_type
        }
    }

    fn parse_prost_methods(methods: &[Method]) -> Vec<Self> {
        let mut syn_methods = Vec::with_capacity(methods.len());

        for method in methods {
            let name = quote::format_ident!("{}", method.name);
            let proto_name = quote::format_ident!("{}", method.proto_name);
            let comments = generate_comment_attributes(&method.comments);
            let request_type = syn::parse_str::<syn::Path>(&method.input_type).unwrap();
            let response_type = syn::parse_str::<syn::Path>(&method.output_type).unwrap();

            let syn_method = SynMethod {
                name,
                proto_name,
                comments,
                request_type,
                response_type,
                client_streaming: method.client_streaming,
                server_streaming: method.server_streaming,
            };
            syn_methods.push(syn_method);
        }
        syn_methods
    }
}

fn generate_prom_labels_impl_for_requests(context: &CodegenContext) -> TokenStream {
    let mut rpc_name_impls = Vec::new();

    for syn_method in &context.methods {
        let request_type = syn_method.request_type.to_token_stream();
        let rpc_name = &syn_method.name.to_string();
        let rpc_name_impl = quote! {
            impl RpcName for #request_type {
                fn rpc_name() -> &'static str {
                    #rpc_name
                }
            }
        };
        rpc_name_impls.extend(rpc_name_impl);
    }
    if rpc_name_impls.is_empty() {
        return TokenStream::new();
    }
    quote! {
        use quickwit_common::tower::RpcName;

        #(#rpc_name_impls)*
    }
}

fn generate_comment_attributes(comments: &Comments) -> Vec<syn::Attribute> {
    let mut attributes = Vec::with_capacity(comments.leading.len());

    for comment in &comments.leading {
        let comment = syn::LitStr::new(comment, proc_macro2::Span::call_site());
        let attribute: syn::Attribute = parse_quote! {
            #[doc = #comment]
        };
        attributes.push(attribute);
    }
    attributes
}

fn generate_service_trait(context: &CodegenContext) -> TokenStream {
    let service_name = &context.service_name;
    let trait_methods = generate_service_trait_methods(context);
    let extra_trait_methods = if context.generate_extra_service_methods {
        quote! {
            async fn check_connectivity(&self) -> anyhow::Result<()>;
            fn endpoints(&self) -> Vec<quickwit_common::uri::Uri>;
        }
    } else {
        TokenStream::new()
    };

    quote! {
        #[cfg_attr(any(test, feature = "testsuite"), mockall::automock)]
        #[async_trait::async_trait]
        pub trait #service_name: std::fmt::Debug + Send + Sync + 'static {
            #trait_methods
            #extra_trait_methods
        }
    }
}

fn generate_service_trait_methods(context: &CodegenContext) -> TokenStream {
    let result_type = &context.result_type;

    let mut stream = TokenStream::new();

    for syn_method in &context.methods {
        let comments = &syn_method.comments;
        let method_name = syn_method.name.to_token_stream();
        let request_type = syn_method.request_type(false);
        let response_type = syn_method.response_type(context, false);
        let method = quote! {
            #(#comments)*
            async fn #method_name(&self, request: #request_type) -> #result_type<#response_type>;
        };
        stream.extend(method);
    }
    stream
}

fn generate_extra_methods_calling_inner() -> TokenStream {
    quote! {
        async fn check_connectivity(&self) -> anyhow::Result<()> {
            self.inner.0.check_connectivity().await
        }

        fn endpoints(&self) -> Vec<quickwit_common::uri::Uri> {
            self.inner.0.endpoints()
        }
    }
}

fn generate_client(context: &CodegenContext) -> TokenStream {
    let service_name = &context.service_name;
    let client_name = &context.client_name;
    let inner_client_name = &context.inner_client_name;

    let grpc_client_name = &context.grpc_client_name;
    let grpc_client_adapter_name = &context.grpc_client_adapter_name;
    let grpc_client_package_name = &context.grpc_client_package_name;

    let grpc_server_name = &context.grpc_server_name;
    let grpc_server_adapter_name = &context.grpc_server_adapter_name;
    let grpc_server_package_name = &context.grpc_server_package_name;

    let client_methods = generate_client_methods(context, false);
    let mock_mod_name = &context.mock_mod_name;
    let mock_methods = generate_client_methods(context, true);
    let mailbox_name = &context.mailbox_name;
    let tower_layer_stack_name = &context.tower_layer_stack_name;
    let mock_name = &context.mock_name;
    let mock_wrapper_name = quote::format_ident!("{}Wrapper", mock_name);
    let error_message = format!(
        "`{mock_name}` must be wrapped in a `{mock_wrapper_name}`: use \
         `{client_name}::from_mock(mock)` to instantiate the client"
    );
    let extra_client_methods = if context.generate_extra_service_methods {
        generate_extra_methods_calling_inner()
    } else {
        TokenStream::new()
    };
    let extra_mock_methods = if context.generate_extra_service_methods {
        quote! {
            async fn check_connectivity(&self) -> anyhow::Result<()> {
                self.inner.lock().await.check_connectivity().await
            }

            fn endpoints(&self) -> Vec<quickwit_common::uri::Uri> {
                futures::executor::block_on(self.inner.lock()).endpoints()
            }
        }
    } else {
        TokenStream::new()
    };

    quote! {
        #[derive(Debug, Clone)]
        pub struct #client_name {
            inner: #inner_client_name,
        }

        #[derive(Debug, Clone)]
        struct #inner_client_name(std::sync::Arc<dyn #service_name>);

        impl #client_name {
            pub fn new<T>(instance: T) -> Self
            where
                T: #service_name,
            {
                #[cfg(any(test, feature = "testsuite"))]
                assert!(std::any::TypeId::of::<T>() != std::any::TypeId::of::<#mock_name>(), #error_message);
                Self {
                    inner: #inner_client_name(std::sync::Arc::new(instance)),
                }
            }

            pub fn as_grpc_service(&self, max_message_size: bytesize::ByteSize) -> #grpc_server_package_name::#grpc_server_name<#grpc_server_adapter_name> {
                let adapter = #grpc_server_adapter_name::new(self.clone());
                #grpc_server_package_name::#grpc_server_name::new(adapter)
                    // Servers accept both Gzip and Zstd. The order is not important because the client decides which encoding to use.
                    .accept_compressed(tonic::codec::CompressionEncoding::Gzip)
                    .accept_compressed(tonic::codec::CompressionEncoding::Zstd)
                    .send_compressed(tonic::codec::CompressionEncoding::Gzip)
                    .send_compressed(tonic::codec::CompressionEncoding::Zstd)
                    .max_decoding_message_size(max_message_size.0 as usize)
                    .max_encoding_message_size(max_message_size.0 as usize)
            }

            pub fn from_channel(
                addr: std::net::SocketAddr,
                channel: tonic::transport::Channel,
                max_message_size: bytesize::ByteSize,
                compression_encoding_opt: Option<tonic::codec::CompressionEncoding>,
            ) -> Self
            {
                let (_, connection_keys_watcher) = tokio::sync::watch::channel(std::collections::HashSet::from_iter([addr]));
                let mut client = #grpc_client_package_name::#grpc_client_name::new(channel)
                    .max_decoding_message_size(max_message_size.0 as usize)
                    .max_encoding_message_size(max_message_size.0 as usize);
                if let Some(compression_encoding) = compression_encoding_opt {
                    client = client
                        .accept_compressed(compression_encoding)
                        .send_compressed(compression_encoding);
                }
                let adapter = #grpc_client_adapter_name::new(client, connection_keys_watcher);
                Self::new(adapter)
            }

            pub fn from_balance_channel(
                balance_channel: quickwit_common::tower::BalanceChannel<std::net::SocketAddr>,
                max_message_size: bytesize::ByteSize,
                compression_encoding_opt: Option<tonic::codec::CompressionEncoding>,
            ) -> #client_name
            {
                let connection_keys_watcher = balance_channel.connection_keys_watcher();
                let mut client = #grpc_client_package_name::#grpc_client_name::new(balance_channel)
                    .max_decoding_message_size(max_message_size.0 as usize)
                    .max_encoding_message_size(max_message_size.0 as usize);
                if let Some(compression_encoding) = compression_encoding_opt {
                    client = client
                        .accept_compressed(compression_encoding)
                        .send_compressed(compression_encoding);
                }
                let adapter = #grpc_client_adapter_name::new(client, connection_keys_watcher);
                Self::new(adapter)
            }

            pub fn from_mailbox<A>(mailbox: quickwit_actors::Mailbox<A>) -> Self
            where
                A: quickwit_actors::Actor + std::fmt::Debug + Send + 'static,
                #mailbox_name<A>: #service_name,
            {
                #client_name::new(#mailbox_name::new(mailbox))
            }

            pub fn tower() -> #tower_layer_stack_name {
                #tower_layer_stack_name::default()
            }

            #[cfg(any(test, feature = "testsuite"))]
            pub fn from_mock(mock: #mock_name) -> Self {
                let mock_wrapper = #mock_mod_name::#mock_wrapper_name {
                    inner: tokio::sync::Mutex::new(mock)
                };
                Self::new(mock_wrapper)
            }

            #[cfg(any(test, feature = "testsuite"))]
            pub fn mocked() -> Self {
                Self::from_mock(#mock_name::new())
            }
        }

        #[async_trait::async_trait]
        impl #service_name for #client_name {
            #client_methods
            #extra_client_methods
        }

        #[cfg(any(test, feature = "testsuite"))]
        pub mod #mock_mod_name {
            use super::*;

            #[derive(Debug)]
            pub struct #mock_wrapper_name {
                pub(super) inner: tokio::sync::Mutex<#mock_name>
            }

            #[async_trait::async_trait]
            impl #service_name for #mock_wrapper_name {
                #mock_methods
                #extra_mock_methods
            }
        }
    }
}

fn generate_client_methods(context: &CodegenContext, mock: bool) -> TokenStream {
    let result_type = &context.result_type;

    let mut stream = TokenStream::new();

    for syn_method in &context.methods {
        let method_name = syn_method.name.to_token_stream();
        let request_type = syn_method.request_type(mock);
        let response_type = syn_method.response_type(context, mock);

        let body = if !mock {
            quote! {
                self.inner.0.#method_name(request).await
            }
        } else {
            quote! {
                self.inner.lock().await.#method_name(request).await
            }
        };
        let method = quote! {
            async fn #method_name(&self, request: #request_type) -> #result_type<#response_type> {
                #body
            }
        };
        stream.extend(method);
    }
    stream
}

fn generate_tower_services(context: &CodegenContext) -> TokenStream {
    let inner_client_name = &context.inner_client_name;
    let error_type = &context.error_type;

    let mut stream = TokenStream::new();

    for syn_method in &context.methods {
        let method_name = syn_method.name.to_token_stream();
        let request_type = syn_method.request_type(false);
        let response_type = syn_method.response_type(context, false);

        let service = quote! {
            impl tower::Service<#request_type> for #inner_client_name {
                type Response = #response_type;
                type Error = #error_type;
                type Future = BoxFuture<Self::Response, Self::Error>;

                fn poll_ready(
                    &mut self,
                    _cx: &mut std::task::Context<'_>,
                ) -> std::task::Poll<Result<(), Self::Error>> {
                    std::task::Poll::Ready(Ok(()))
                }

                fn call(&mut self, request: #request_type) -> Self::Future {
                    let svc = self.clone();
                    let fut = async move { svc.0.#method_name(request).await };
                    Box::pin(fut)
                }
            }
        };
        stream.extend(service);
    }
    stream
}

fn generate_tower_svc_stack(context: &CodegenContext) -> TokenStream {
    let tower_svc_stack_name = &context.tower_svc_stack_name;
    let inner_client_name = &context.inner_client_name;
    let tower_svc_stack_attributes = generate_tower_svc_stack_attributes(context);
    let tower_svc_stack_service_impl = generate_tower_svc_stack_service_impl(context);

    quote! {
        /// A tower service stack is a set of tower services.
        #[derive(Debug)]
        struct #tower_svc_stack_name {
            // TODO: remove this field once `check_connectivity` is used for all services.
            #[allow(dead_code)]
            inner: #inner_client_name,

            #tower_svc_stack_attributes
        }

        #tower_svc_stack_service_impl
    }
}

fn generate_tower_svc_stack_attributes(context: &CodegenContext) -> TokenStream {
    let error_type = &context.error_type;

    let mut stream = TokenStream::new();

    for syn_method in &context.methods {
        let attribute_name = quote::format_ident!("{}_svc", syn_method.name);
        let request_type = syn_method.request_type(false);
        let response_type = syn_method.response_type(context, false);

        let attribute = quote! {
            #attribute_name: quickwit_common::tower::BoxService<#request_type, #response_type, #error_type>,
        };
        stream.extend(attribute);
    }
    stream
}

fn generate_tower_svc_stack_service_impl(context: &CodegenContext) -> TokenStream {
    let service_name = &context.service_name;
    let tower_svc_stack_name = &context.tower_svc_stack_name;
    let result_type = &context.result_type;
    let extra_client_methods = if context.generate_extra_service_methods {
        generate_extra_methods_calling_inner()
    } else {
        TokenStream::new()
    };
    let mut methods = TokenStream::new();

    for syn_method in &context.methods {
        let attribute_name = quote::format_ident!("{}_svc", syn_method.name);
        let method_name = syn_method.name.to_token_stream();
        let request_type = syn_method.request_type(false);
        let response_type = syn_method.response_type(context, false);

        let attribute = quote! {
            async fn #method_name(&self, request: #request_type) -> #result_type<#response_type> {
                self.#attribute_name.clone().ready().await?.call(request).await
            }
        };
        methods.extend(attribute);
    }

    quote! {
        #[async_trait::async_trait]
        impl #service_name for #tower_svc_stack_name {
            #methods
            #extra_client_methods
        }
    }
}

fn generate_tower_layer_stack(context: &CodegenContext) -> TokenStream {
    let tower_layer_stack_name = &context.tower_layer_stack_name;
    let (tower_layer_stack_types, layer_stack_attributes) =
        generate_layer_stack_types_and_attributes(context);
    let layer_stack_impl = generate_layer_stack_impl(context);

    quote! {
        #tower_layer_stack_types

        #[derive(Debug, Default)]
        pub struct #tower_layer_stack_name {
            #layer_stack_attributes
        }

        #layer_stack_impl
    }
}

fn generate_layer_stack_types_and_attributes(
    context: &CodegenContext,
) -> (TokenStream, TokenStream) {
    let error_type = &context.error_type;

    let mut type_aliases = TokenStream::new();
    let mut attributes = TokenStream::new();

    for syn_method in &context.methods {
        let service_name_upper_camel_case = syn_method.name.to_string().to_upper_camel_case();
        let type_alias_name = quote::format_ident!("{service_name_upper_camel_case}Layer");
        let attribute_name = quote::format_ident!("{}_layers", syn_method.name);
        let request_type = syn_method.request_type(false);
        let response_type = syn_method.response_type(context, false);

        let type_alias = quote! {
            type #type_alias_name = quickwit_common::tower::BoxLayer<quickwit_common::tower::BoxService<#request_type, #response_type, #error_type>, #request_type, #response_type, #error_type>;
        };
        let attribute = quote! {
            #attribute_name: Vec<#type_alias_name>,
        };
        type_aliases.extend(type_alias);
        attributes.extend(attribute);
    }
    (type_aliases, attributes)
}

fn generate_layer_stack_impl(context: &CodegenContext) -> TokenStream {
    let service_name = &context.service_name;
    let client_name = &context.client_name;
    let inner_client_name = &context.inner_client_name;
    let mailbox_name = &context.mailbox_name;
    let mock_name = &context.mock_name;
    let tower_svc_stack_name = &context.tower_svc_stack_name;
    let tower_layer_stack_name = &context.tower_layer_stack_name;
    let error_type = &context.error_type;

    let mut shared_layer_method_bounds = TokenStream::new();
    let mut layer_method_bounds = TokenStream::new();
    let mut layer_method_statements = TokenStream::new();
    let mut layer_methods = TokenStream::new();
    let mut svc_statements = TokenStream::new();
    let mut svc_attribute_idents = Vec::with_capacity(context.methods.len());

    for syn_method in &context.methods {
        let layer_attribute_name = quote::format_ident!("{}_layers", syn_method.name);
        let layer_method_name = quote::format_ident!("stack_{}_layer", syn_method.name);
        let svc_attribute_name = quote::format_ident!("{}_svc", syn_method.name);
        let request_type = syn_method.request_type(false);
        let response_type = syn_method.response_type(context, false);

        let shared_layer_method_bound = quote! {
            L: tower::Layer<quickwit_common::tower::BoxService<#request_type, #response_type, #error_type>> + Clone + Send + Sync + 'static,
            <L as tower::Layer<quickwit_common::tower::BoxService<#request_type, #response_type, #error_type>>>::Service: tower::Service<#request_type, Response = #response_type, Error = #error_type> + Clone + Send + Sync + 'static,
            <<L as tower::Layer<quickwit_common::tower::BoxService<#request_type, #response_type, #error_type>>>::Service as tower::Service<#request_type>>::Future: Send + 'static,
        };
        let layer_method_bound = quote! {
            L: tower::Layer<quickwit_common::tower::BoxService<#request_type, #response_type, #error_type>> + Send + Sync + 'static,
            L::Service: tower::Service<#request_type, Response = #response_type, Error = #error_type> + Clone + Send + Sync + 'static,
            <L::Service as tower::Service<#request_type>>::Future: Send + 'static,
        };
        let layer_method_statement = quote! {
            self.#layer_attribute_name.push(quickwit_common::tower::BoxLayer::new(layer.clone()));
        };
        let layer_method = quote! {
            pub fn #layer_method_name<L>(
                mut self,
                layer: L
            ) -> Self
            where
                #layer_method_bound
            {
                self.#layer_attribute_name.push(quickwit_common::tower::BoxLayer::new(layer));
                self
            }
        };
        shared_layer_method_bounds.extend(shared_layer_method_bound);
        layer_method_bounds.extend(layer_method_bound);
        layer_method_statements.extend(layer_method_statement);
        layer_methods.extend(layer_method);

        let svc_statement = quote! {
            let #svc_attribute_name = self.#layer_attribute_name.into_iter().rev().fold(quickwit_common::tower::BoxService::new(inner_client.clone()), |svc, layer| layer.layer(svc));
        };
        svc_statements.extend(svc_statement);

        svc_attribute_idents.push(svc_attribute_name);
    }

    quote! {
        impl #tower_layer_stack_name {
            pub fn stack_layer<L>(mut self, layer: L) -> Self
            where
                #shared_layer_method_bounds
            {
                #layer_method_statements
                self
            }

            #layer_methods

            pub fn build<T>(self, instance: T) -> #client_name
            where
                T: #service_name
            {
                let inner_client = #inner_client_name(std::sync::Arc::new(instance));
                self.build_from_inner_client(inner_client)
            }

            pub fn build_from_channel(
                self,
                addr: std::net::SocketAddr,
                channel: tonic::transport::Channel,
                max_message_size: bytesize::ByteSize,
                compression_encoding_opt: Option<tonic::codec::CompressionEncoding>,
            ) -> #client_name
            {
                let client =  #client_name::from_channel(addr, channel, max_message_size, compression_encoding_opt);
                let inner_client = client.inner;
                self.build_from_inner_client(inner_client)
            }

            pub fn build_from_balance_channel(
                self,
                balance_channel: quickwit_common::tower::BalanceChannel<std::net::SocketAddr>,
                max_message_size: bytesize::ByteSize,
                compression_encoding_opt: Option<tonic::codec::CompressionEncoding>,
            ) -> #client_name
            {
                let client =  #client_name::from_balance_channel(balance_channel, max_message_size, compression_encoding_opt);
                let inner_client = client.inner;
                self.build_from_inner_client(inner_client)
            }

            pub fn build_from_mailbox<A>(self, mailbox: quickwit_actors::Mailbox<A>) -> #client_name
            where
                A: quickwit_actors::Actor + std::fmt::Debug + Send + 'static,
                #mailbox_name<A>: #service_name,
            {
                let inner_client = #inner_client_name(std::sync::Arc::new(#mailbox_name::new(mailbox)));
                self.build_from_inner_client(inner_client)
            }

            #[cfg(any(test, feature = "testsuite"))]
            pub fn build_from_mock(self, mock: #mock_name) -> #client_name {
                let client = #client_name::from_mock(mock);
                let inner_client = client.inner;
                self.build_from_inner_client(inner_client)
            }

            fn build_from_inner_client(self, inner_client: #inner_client_name) -> #client_name
            {
                #svc_statements

                let tower_svc_stack = #tower_svc_stack_name {
                    inner: inner_client,
                    #(#svc_attribute_idents),*
                };
                #client_name::new(tower_svc_stack)
            }
        }
    }
}

fn generate_tower_mailbox(context: &CodegenContext) -> TokenStream {
    let service_name = &context.service_name;
    let mailbox_name = &context.mailbox_name;
    let error_type = &context.error_type;
    let extra_mailbox_methods = if context.generate_extra_service_methods {
        quote! {
            async fn check_connectivity(&self) -> anyhow::Result<()> {
                if self.inner.is_disconnected() {
                    anyhow::bail!("actor `{}` is disconnected", self.inner.actor_instance_id())
                }
                Ok(())
            }

            fn endpoints(&self) -> Vec<quickwit_common::uri::Uri> {
                vec![quickwit_common::uri::Uri::from_str(&format!("actor://localhost/{}", self.inner.actor_instance_id())).expect("URI should be valid")]
            }
        }
    } else {
        TokenStream::new()
    };

    let (mailbox_bounds, mailbox_methods) = generate_mailbox_bounds_and_methods(context);

    quote! {
        #[derive(Debug, Clone)]
        struct MailboxAdapter<A: quickwit_actors::Actor, E> {
            inner: quickwit_actors::Mailbox<A>,
            phantom: std::marker::PhantomData<E>,
        }

        impl<A, E> std::ops::Deref for MailboxAdapter<A, E> where A: quickwit_actors::Actor {
            type Target = quickwit_actors::Mailbox<A>;

            fn deref(&self) -> &Self::Target {
                &self.inner
            }
        }

        #[derive(Debug)]
        pub struct #mailbox_name<A: quickwit_actors::Actor> {
            inner: MailboxAdapter<A, #error_type>
        }

        impl <A: quickwit_actors::Actor> #mailbox_name<A> {
            pub fn new(instance: quickwit_actors::Mailbox<A>) -> Self {
                let inner = MailboxAdapter {
                    inner: instance,
                    phantom: std::marker::PhantomData,
                };
                Self {
                    inner
                }
            }
        }

        impl <A: quickwit_actors::Actor> Clone for #mailbox_name<A> {
            fn clone(&self) -> Self {
                let inner = MailboxAdapter {
                    inner: self.inner.clone(),
                    phantom: std::marker::PhantomData,
                };
                Self { inner }
            }
        }

        impl<A, M, T, E> tower::Service<M> for #mailbox_name<A>
        where
            A: quickwit_actors::Actor + quickwit_actors::DeferableReplyHandler<M, Reply = Result<T, E>> + Send + 'static,
            M: std::fmt::Debug + Send + 'static,
            T: Send + 'static,
            E: std::fmt::Debug + Send + 'static,
            #error_type: From<quickwit_actors::AskError<E>>,
        {
            type Response = T;
            type Error = #error_type;
            type Future = BoxFuture<Self::Response, Self::Error>;

            fn poll_ready(&mut self, _cx: &mut std::task::Context<'_>) -> std::task::Poll<Result<(), Self::Error>> {
                //! This does not work with balance middlewares such as `tower::balance::pool::Pool` because
                //! this always returns `Poll::Ready`. The fix is to acquire a permit from the
                //! mailbox in `poll_ready` and consume it in `call`.
                std::task::Poll::Ready(Ok(()))
            }

            fn call(&mut self, message: M) -> Self::Future {
                let mailbox = self.inner.clone();
                let fut = async move {
                    mailbox
                        .ask_for_res(message)
                        .await
                        .map_err(|error| error.into())
                };
                Box::pin(fut)
            }
        }

        #[async_trait::async_trait]
        impl<A> #service_name for #mailbox_name<A>
        where
            A: quickwit_actors::Actor + std::fmt::Debug,
            #mailbox_name<A>: #(#mailbox_bounds)+*,
        {
            #mailbox_methods
            #extra_mailbox_methods
        }
    }
}

fn generate_mailbox_bounds_and_methods(
    context: &CodegenContext,
) -> (Vec<TokenStream>, TokenStream) {
    let result_type = &context.result_type;
    let error_type = &context.error_type;

    let mut bounds = Vec::with_capacity(context.methods.len());
    let mut methods = TokenStream::new();

    for syn_method in &context.methods {
        let method_name = syn_method.name.to_token_stream();
        let request_type = syn_method.request_type(false);
        let response_type = syn_method.response_type(context, false);

        let bound = quote! {
            tower::Service<#request_type, Response = #response_type, Error = #error_type, Future = BoxFuture<#response_type, #error_type>>
        };
        bounds.push(bound);

        let method = quote! {
            async fn #method_name(&self, request: #request_type) -> #result_type<#response_type> {
                self.clone().call(request).await
            }
        };
        methods.extend(method);
    }
    (bounds, methods)
}

fn generate_grpc_client_adapter(context: &CodegenContext) -> TokenStream {
    let service_name = &context.service_name;
    let service_name_string = service_name.to_string();
    let grpc_client_package_name = &context.grpc_client_package_name;
    let grpc_client_package_name_string = &context.package_name.to_string();
    let grpc_client_name = &context.grpc_client_name;
    let grpc_client_adapter_name = &context.grpc_client_adapter_name;
    let grpc_server_adapter_methods = generate_grpc_client_adapter_methods(context);
    let extra_grpc_server_adapter_methods = if context.generate_extra_service_methods {
        quote! {
            async fn check_connectivity(&self) -> anyhow::Result<()> {
                if self.connection_addrs_rx.borrow().is_empty() {
                    anyhow::bail!("no server currently available")
                }
                Ok(())
            }

            fn endpoints(&self) -> Vec<quickwit_common::uri::Uri> {
                self.connection_addrs_rx
                    .borrow()
                    .iter()
                    .flat_map(|addr| quickwit_common::uri::Uri::from_str(&format!("grpc://{addr}/{}.{}", #grpc_client_package_name_string, #service_name_string)))
                    .collect()
            }
        }
    } else {
        TokenStream::new()
    };

    quote! {
        #[derive(Debug, Clone)]
        pub struct #grpc_client_adapter_name<T> {
            inner: T,
            // TODO: remove this field once `check_connectivity` is used for all services.
            #[allow(dead_code)]
            connection_addrs_rx: tokio::sync::watch::Receiver<std::collections::HashSet<std::net::SocketAddr>>,
        }

        impl<T> #grpc_client_adapter_name<T> {
            pub fn new(instance: T, connection_addrs_rx: tokio::sync::watch::Receiver<std::collections::HashSet<std::net::SocketAddr>>) -> Self {
                Self {
                    inner: instance,
                    connection_addrs_rx
                }
            }
        }

        #[async_trait::async_trait]
        impl<T> #service_name for #grpc_client_adapter_name<#grpc_client_package_name::#grpc_client_name<T>>
        where
            T: tonic::client::GrpcService<tonic::body::Body> + std::fmt::Debug + Clone + Send + Sync + 'static,
            T::ResponseBody: tonic::codegen::Body<Data = tonic::codegen::Bytes> + Send + 'static,
            <T::ResponseBody as tonic::codegen::Body>::Error: Into<tonic::codegen::StdError> + Send,
            T::Future: Send
        {
            #grpc_server_adapter_methods
            #extra_grpc_server_adapter_methods
        }
    }
}

fn generate_grpc_client_adapter_methods(context: &CodegenContext) -> TokenStream {
    let result_type = &context.result_type;

    let mut stream = TokenStream::new();

    for syn_method in &context.methods {
        let method_name = syn_method.name.to_token_stream();
        let request_type = syn_method.request_type(false);
        let rpc_name = syn_method.rpc_name(false);
        let response_type = syn_method.response_type(context, false);

        let into_response_type = if syn_method.server_streaming {
            quote! { |response|
                {
                    let streaming: tonic::Streaming<_> = response.into_inner();
                    let stream = quickwit_common::ServiceStream::from(streaming);
                    stream.map_err(|status| crate::error::grpc_status_to_service_error(status, #rpc_name))
                }
            }
        } else {
            quote! { |response| response.into_inner() }
        };
        let method = quote! {
            async fn #method_name(&self, request: #request_type) -> #result_type<#response_type> {
                self.inner
                    .clone()
                    .#method_name(request)
                    .await
                    .map(#into_response_type)
                    .map_err(|status| crate::error::grpc_status_to_service_error(status, #rpc_name))
            }
        };
        stream.extend(method);
    }
    stream
}

fn generate_grpc_server_adapter(context: &CodegenContext) -> TokenStream {
    let service_name = &context.service_name;
    let inner_client_name = &context.inner_client_name;
    let grpc_server_package_name = &context.grpc_server_package_name;
    let grpc_service_name = &context.grpc_service_name;
    let grpc_server_adapter_name = &context.grpc_server_adapter_name;
    let grpc_server_adapter_methods = generate_grpc_server_adapter_methods(context);

    quote! {
        #[derive(Debug)]
        pub struct #grpc_server_adapter_name {
            inner: #inner_client_name,
        }

        impl #grpc_server_adapter_name {
            pub fn new<T>(instance: T) -> Self
            where T: #service_name {
                Self {
                    inner: #inner_client_name(std::sync::Arc::new(instance)),
                }
            }
        }

        #[async_trait::async_trait]
        impl #grpc_server_package_name::#grpc_service_name for #grpc_server_adapter_name {
            #grpc_server_adapter_methods
        }
    }
}

fn generate_grpc_server_adapter_methods(context: &CodegenContext) -> TokenStream {
    let mut stream = TokenStream::new();

    for syn_method in &context.methods {
        let method_name = syn_method.name.to_token_stream();
        let request_type = if syn_method.client_streaming {
            let request_type = &syn_method.request_type;
            quote! { tonic::Streaming<#request_type> }
        } else {
            syn_method.request_type.to_token_stream()
        };
        let method_arg = if syn_method.client_streaming {
            quote! {
                {
                    let streaming: tonic::Streaming<_> = request.into_inner();
                    quickwit_common::ServiceStream::from(streaming)
                }
            }
        } else {
            quote! { request.into_inner() }
        };
        let response_type = if syn_method.server_streaming {
            let associated_type_name = quote::format_ident!("{}Stream", syn_method.proto_name);
            quote! { Self::#associated_type_name }
        } else {
            syn_method.response_type.to_token_stream()
        };
        let associated_type = if syn_method.server_streaming {
            let associated_type_name = quote::format_ident!("{}Stream", syn_method.proto_name);
            let response_type = &syn_method.response_type;
            quote! { type #associated_type_name = quickwit_common::ServiceStream<tonic::Result<#response_type>>; }
        } else {
            TokenStream::new()
        };
        let into_response_type = if syn_method.server_streaming {
            quote! {
                |stream| tonic::Response::new(stream.map_err(crate::error::grpc_error_to_grpc_status))
            }
        } else {
            quote! { tonic::Response::new }
        };
        let method = quote! {
            #associated_type

            async fn #method_name(&self, request: tonic::Request<#request_type>) -> Result<tonic::Response<#response_type>, tonic::Status> {
                self.inner
                    .0
                    .#method_name(#method_arg)
                    .await
                    .map(#into_response_type)
                    .map_err(crate::error::grpc_error_to_grpc_status)
            }
        };
        stream.extend(method);
    }
    stream
}

/// A [`ServiceGenerator`] wrapper that appends a suffix to the name of the wrapped service. It is
/// used to add a `Grpc` suffix to the service, client, and server generated by tonic.
struct WithSuffixServiceGenerator {
    suffix: String,
    inner: Box<dyn ServiceGenerator>,
}

impl WithSuffixServiceGenerator {
    fn new(suffix: &str, service_generator: Box<dyn ServiceGenerator>) -> Self {
        Self {
            suffix: suffix.to_string(),
            inner: service_generator,
        }
    }
}

impl ServiceGenerator for WithSuffixServiceGenerator {
    fn generate(&mut self, mut service: Service, buf: &mut String) {
        service.name = format!("{}{}", service.name, self.suffix);
        self.inner.generate(service, buf);
    }

    fn finalize(&mut self, buf: &mut String) {
        self.inner.finalize(buf);
    }

    fn finalize_package(&mut self, package: &str, buf: &mut String) {
        self.inner.finalize_package(package, buf);
    }
}


================================================
FILE: quickwit/quickwit-codegen/src/lib.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

mod codegen;

pub use codegen::Codegen;
pub use prost_build::Config as ProstConfig;


================================================
FILE: quickwit/quickwit-common/Cargo.toml
================================================
[package]
name = "quickwit-common"
description = "Shared utilities for Quickwit"

version.workspace = true
edition.workspace = true
homepage.workspace = true
documentation.workspace = true
repository.workspace = true
authors.workspace = true
license.workspace = true

[dependencies]
anyhow = { workspace = true }
async-speed-limit = { workspace = true }
async-trait = { workspace = true }
backtrace = { workspace = true, optional = true }
bytesize = { workspace = true }
coarsetime = { workspace = true }
dyn-clone = { workspace = true }
env_logger = { workspace = true }
fnv = { workspace = true }
futures = { workspace = true }
governor = { workspace = true }
home = { workspace = true }
hostname = { workspace = true }
http = { workspace = true }
hyper = { workspace = true }
hyper-util = { workspace = true, optional = true }
itertools = { workspace = true }
once_cell = { workspace = true }
pin-project = { workspace = true }
pnet = { workspace = true }
prometheus = { workspace = true }
rand = { workspace = true }
rayon = { workspace = true }
regex = { workspace = true }
serde = { workspace = true }
siphasher = { workspace = true }
sysinfo = { workspace = true }
tempfile = { workspace = true }
thiserror = { workspace = true }
tikv-jemallocator = { workspace = true, optional = true }
tokio = { workspace = true }
tokio-metrics = { workspace = true }
tokio-stream = { workspace = true }
tonic = { workspace = true, features = [
    "tls-native-roots",
    "server",
    "channel",
] }
tower = { workspace = true }
tracing = { workspace = true }

[features]
testsuite = ["hyper-util"]
named_tasks = ["tokio/tracing"]
jemalloc-profiled = [
    "named_tasks",
    "dep:backtrace",
    "dep:tikv-jemallocator",
]

[dev-dependencies]
hyper-util = { workspace = true }
proptest = { workspace = true }
serde_json = { workspace = true }
serial_test = { workspace = true }
tempfile = { workspace = true }
tokio = { workspace = true, features = ["test-util"] }


================================================
FILE: quickwit/quickwit-common/build.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

fn main() {
    println!("cargo::rustc-check-cfg=cfg(tokio_unstable)");
}


================================================
FILE: quickwit/quickwit-common/src/alloc_tracker.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::HashMap;
use std::collections::hash_map::Entry;

use bytesize::ByteSize;

#[derive(Debug)]
struct Allocation {
    pub callsite_hash: u64,
    pub size: ByteSize,
}

#[derive(Debug, Copy, Clone)]
pub struct AllocStat {
    pub count: u64,
    pub size: ByteSize,
    pub last_report: ByteSize,
}

#[derive(Debug)]
enum TrackerStatus {
    Started { reporting_interval: ByteSize },
    Stopped,
}

/// WARN:
/// - keys and values in these maps should not allocate!
/// - we assume HashMaps don't allocate if their capacity is not exceeded
#[derive(Debug)]
pub struct Allocations {
    memory_locations: HashMap<usize, Allocation>,
    max_tracked_memory_locations: usize,
    callsite_statistics: HashMap<u64, AllocStat>,
    max_tracked_callsites: usize,
    status: TrackerStatus,
}

impl Default for Allocations {
    fn default() -> Self {
        let max_tracked_memory_locations = 128 * 1024;
        let max_tracked_callsites = 32 * 1024;
        // TODO: We use a load factor of 0.5 to avoid resizing. There is no
        // strict guarantee with std::collections::HashMap that it's enough, but
        // it seems to be the case in practice (see test_tracker_full).
        Self {
            memory_locations: HashMap::with_capacity(2 * max_tracked_memory_locations),
            max_tracked_memory_locations,
            callsite_statistics: HashMap::with_capacity(2 * max_tracked_callsites),
            max_tracked_callsites,
            status: TrackerStatus::Stopped,
        }
    }
}

pub enum AllocRecordingResponse {
    ThresholdExceeded(AllocStat),
    ThresholdNotExceeded,
    TrackerFull(&'static str),
    NotStarted,
}

pub enum ReallocRecordingResponse {
    ThresholdExceeded {
        statistics: AllocStat,
        callsite_hash: u64,
    },
    ThresholdNotExceeded,
    NotStarted,
}

impl Allocations {
    pub fn init(&mut self, reporting_interval_bytes: u64) {
        self.memory_locations.clear();
        self.callsite_statistics.clear();
        self.status = TrackerStatus::Started {
            reporting_interval: ByteSize(reporting_interval_bytes),
        }
    }

    /// Records an allocation and occasionally reports the cumulated allocation
    /// size for the provided callsite_hash.
    ///
    /// Every time the total allocated size for a given callsite_hash exceeds
    /// the previous reported value by at least reporting_interval, the new total
    /// allocated size is reported.
    ///
    /// WARN: this function should not allocate!
    pub fn record_allocation(
        &mut self,
        callsite_hash: u64,
        size_bytes: u64,
        ptr: *mut u8,
    ) -> AllocRecordingResponse {
        let TrackerStatus::Started { reporting_interval } = self.status else {
            return AllocRecordingResponse::NotStarted;
        };
        if self.max_tracked_memory_locations == self.memory_locations.len() {
            return AllocRecordingResponse::TrackerFull("memory_locations");
        }
        if self.max_tracked_callsites == self.callsite_statistics.len() {
            return AllocRecordingResponse::TrackerFull("tracked_callsites");
        }
        self.memory_locations.insert(
            ptr as usize,
            Allocation {
                callsite_hash,
                size: ByteSize(size_bytes),
            },
        );
        let entry = self
            .callsite_statistics
            .entry(callsite_hash)
            .and_modify(|stat| {
                stat.count += 1;
                stat.size += size_bytes;
            })
            .or_insert(AllocStat {
                count: 1,
                size: ByteSize(size_bytes),
                last_report: ByteSize(0),
            });
        let new_threshold_exceeded = entry.size >= (entry.last_report + reporting_interval);
        if new_threshold_exceeded {
            let reported_statistic = *entry;
            entry.last_report = entry.size;
            AllocRecordingResponse::ThresholdExceeded(reported_statistic)
        } else {
            AllocRecordingResponse::ThresholdNotExceeded
        }
    }

    /// Updates the memory location and size of an existing allocation. Only
    /// update the statistics if the original allocation was recorded.
    ///
    /// WARN: this function should not allocate!
    pub fn record_reallocation(
        &mut self,
        new_size_bytes: u64,
        old_ptr: *mut u8,
        new_ptr: *mut u8,
    ) -> ReallocRecordingResponse {
        let TrackerStatus::Started { reporting_interval } = self.status else {
            return ReallocRecordingResponse::NotStarted;
        };
        let (callsite_hash, old_size_bytes) = if old_ptr != new_ptr {
            let Some(old_alloc) = self.memory_locations.remove(&(old_ptr as usize)) else {
                return ReallocRecordingResponse::ThresholdNotExceeded;
            };
            self.memory_locations.insert(
                new_ptr as usize,
                Allocation {
                    callsite_hash: old_alloc.callsite_hash,
                    size: ByteSize(new_size_bytes),
                },
            );
            (old_alloc.callsite_hash, old_alloc.size.0)
        } else {
            let Some(alloc) = self.memory_locations.get_mut(&(old_ptr as usize)) else {
                return ReallocRecordingResponse::ThresholdNotExceeded;
            };
            let old_size_bytes = alloc.size.0;
            alloc.size = ByteSize(new_size_bytes);
            (alloc.callsite_hash, old_size_bytes)
        };

        let delta = new_size_bytes as i64 - old_size_bytes as i64;

        let Some(current_stat) = self.callsite_statistics.get_mut(&callsite_hash) else {
            // tables are inconsistent, this should not happen
            return ReallocRecordingResponse::ThresholdNotExceeded;
        };
        current_stat.size = ByteSize((current_stat.size.0 as i64 + delta) as u64);
        let new_threshold_exceeded =
            current_stat.size >= (current_stat.last_report + reporting_interval);
        if new_threshold_exceeded {
            let reported_statistic = *current_stat;
            current_stat.last_report = current_stat.size;
            ReallocRecordingResponse::ThresholdExceeded {
                statistics: reported_statistic,
                callsite_hash,
            }
        } else {
            ReallocRecordingResponse::ThresholdNotExceeded
        }
    }

    /// WARN: this function should not allocate!
    pub fn record_deallocation(&mut self, ptr: *mut u8) {
        if let TrackerStatus::Stopped = self.status {
            return;
        }
        let Some(Allocation {
            size,
            callsite_hash,
            ..
        }) = self.memory_locations.remove(&(ptr as usize))
        else {
            // this was allocated before the tracking started
            return;
        };
        if let Entry::Occupied(mut content) = self.callsite_statistics.entry(callsite_hash) {
            let new_size_bytes = content.get().size.0.saturating_sub(size.0);
            let new_count = content.get().count.saturating_sub(1);
            content.get_mut().count = new_count;
            content.get_mut().size = ByteSize(new_size_bytes);
            if content.get().count == 0 {
                content.remove();
            }
        }
    }
}

#[cfg(test)]
mod tests {
    use super::*;

    fn as_ptr(i: usize) -> *mut u8 {
        i as *mut u8
    }

    #[test]
    fn test_record_allocation_and_deallocation() {
        let mut allocations = Allocations::default();
        allocations.init(2000);
        let callsite_hash_1 = 777;

        let ptr_1 = as_ptr(1);
        let response = allocations.record_allocation(callsite_hash_1, 1500, ptr_1);
        assert!(matches!(
            response,
            AllocRecordingResponse::ThresholdNotExceeded
        ));

        let ptr_2 = as_ptr(2);
        let response = allocations.record_allocation(callsite_hash_1, 1500, ptr_2);
        let AllocRecordingResponse::ThresholdExceeded(statistic) = response else {
            panic!("Expected ThresholdExceeded response");
        };
        assert_eq!(statistic.count, 2);
        assert_eq!(statistic.size, ByteSize(3000));
        assert_eq!(statistic.last_report, ByteSize(0));

        allocations.record_deallocation(ptr_2);

        // the threshold was already crossed
        let ptr_3 = as_ptr(3);
        let response = allocations.record_allocation(callsite_hash_1, 1500, ptr_3);
        assert!(matches!(
            response,
            AllocRecordingResponse::ThresholdNotExceeded
        ));

        // this is a brand new call site with different statistics
        let callsite_hash_2 = 42;
        let ptr_4 = as_ptr(4);
        let response = allocations.record_allocation(callsite_hash_2, 1500, ptr_4);
        assert!(matches!(
            response,
            AllocRecordingResponse::ThresholdNotExceeded
        ));
    }

    #[test]
    fn test_record_allocation_and_reallocation() {
        let mut allocations = Allocations::default();
        allocations.init(2000);
        let callsite_hash_1 = 777;

        let ptr_1 = as_ptr(1);
        let response = allocations.record_allocation(callsite_hash_1, 1500, ptr_1);
        assert!(matches!(
            response,
            AllocRecordingResponse::ThresholdNotExceeded
        ));

        let ptr_2 = as_ptr(2);
        let response = allocations.record_allocation(callsite_hash_1, 1500, ptr_2);
        let AllocRecordingResponse::ThresholdExceeded(statistic) = response else {
            panic!("Expected ThresholdExceeded response");
        };
        assert_eq!(statistic.count, 2);
        assert_eq!(statistic.size, ByteSize(3000));
        assert_eq!(statistic.last_report, ByteSize(0));

        // alloc grows a little bit
        let response = allocations.record_reallocation(2000, ptr_1, ptr_1);
        assert!(matches!(
            response,
            ReallocRecordingResponse::ThresholdNotExceeded
        ));

        // alloc grows a lot
        let response = allocations.record_reallocation(4000, ptr_1, ptr_1);
        let ReallocRecordingResponse::ThresholdExceeded {
            statistics,
            callsite_hash,
        } = response
        else {
            panic!("Expected ThresholdExceeded response");
        };
        assert_eq!(statistics.count, 2);
        assert_eq!(statistics.size, ByteSize(5500));
        assert_eq!(statistics.last_report, ByteSize(3000));
        assert_eq!(callsite_hash, callsite_hash_1);

        // alloc grows a little bit and moves
        let ptr_3 = as_ptr(3);
        let response = allocations.record_reallocation(4500, ptr_1, ptr_3);
        assert!(matches!(
            response,
            ReallocRecordingResponse::ThresholdNotExceeded
        ));

        // alloc grows a lot and moves
        let ptr_4 = as_ptr(4);
        let response = allocations.record_reallocation(6000, ptr_3, ptr_4);
        let ReallocRecordingResponse::ThresholdExceeded {
            statistics,
            callsite_hash,
        } = response
        else {
            panic!("Expected ThresholdExceeded response");
        };
        assert_eq!(statistics.count, 2);
        assert_eq!(statistics.size, ByteSize(7500));
        assert_eq!(statistics.last_report, ByteSize(5500));
        assert_eq!(callsite_hash, callsite_hash_1);

        // once an existing allocation moved, it's previous location can be re-allocated
        let response = allocations.record_allocation(callsite_hash_1, 2000, ptr_1);
        let AllocRecordingResponse::ThresholdExceeded(statistics) = response else {
            panic!("Expected ThresholdExceeded response");
        };
        assert_eq!(statistics.count, 3);
        assert_eq!(statistics.size, ByteSize(9500));
        assert_eq!(statistics.last_report, ByteSize(7500));
        assert_eq!(callsite_hash, callsite_hash_1);

        // reallocation is ignored on unknown allocation
        let ptr_404 = as_ptr(404);
        let response = allocations.record_reallocation(10000, ptr_404, ptr_404);
        assert!(matches!(
            response,
            ReallocRecordingResponse::ThresholdNotExceeded
        ));
    }

    #[test]
    fn test_tracker_full() {
        let mut allocations = Allocations::default();
        allocations.init(1024 * 1024 * 1024);
        let max_tracked_locations = allocations.max_tracked_memory_locations;

        // Track a first allocation. This one is not removed thoughout this test.
        let first_location_ptr = as_ptr(1);
        let response = allocations.record_allocation(777, 10, first_location_ptr);
        assert!(matches!(
            response,
            AllocRecordingResponse::ThresholdNotExceeded
        ));
        let ref_addr = allocations
            .memory_locations
            .get(&(first_location_ptr as usize))
            .unwrap() as *const Allocation;
        // Assert that no hashmap resize occurs by tracking the address
        // stability of the first value. Using HashMap::capacity() proved not to
        // be reliable (unclear spec).
        let assert_locations_map_didnt_move = |allocations: &Allocations, loc: &str| {
            assert_eq!(
                allocations
                    .memory_locations
                    .get(&(first_location_ptr as usize))
                    .unwrap() as *const Allocation,
                ref_addr,
                "{loc}",
            );
        };

        // fill the table
        let moving_ptr_range = (first_location_ptr as usize + 1)
            ..(first_location_ptr as usize + max_tracked_locations);
        for i in moving_ptr_range.clone() {
            let ptr = as_ptr(i);
            let response = allocations.record_allocation(777, 10, ptr);
            assert!(matches!(
                response,
                AllocRecordingResponse::ThresholdNotExceeded
            ));
            assert_locations_map_didnt_move(&allocations, "fill");
        }
        assert_eq!(allocations.memory_locations.len(), max_tracked_locations);

        // the table is full, no more allocation is tracked
        let response = allocations.record_allocation(777, 10, as_ptr(moving_ptr_range.end));
        assert!(matches!(
            response,
            AllocRecordingResponse::TrackerFull("memory_locations")
        ));
        assert_locations_map_didnt_move(&allocations, "full");

        // run a heavy insert/remove workload
        let last_location = 10 * max_tracked_locations;
        for i in moving_ptr_range.end..=last_location {
            let removed_ptr = as_ptr(i - 1);
            allocations.record_deallocation(removed_ptr);
            let inserted_ptr = as_ptr(i);
            let response = allocations.record_allocation(888, 10, inserted_ptr);
            assert!(matches!(
                response,
                AllocRecordingResponse::ThresholdNotExceeded
            ));
            assert_locations_map_didnt_move(&allocations, "reinsert");
        }

        // reallocations are fine because they don't create an entry in the map
        let response =
            allocations.record_reallocation(10, as_ptr(last_location), as_ptr(last_location + 1));
        assert!(matches!(
            response,
            ReallocRecordingResponse::ThresholdNotExceeded,
        ));
        assert_locations_map_didnt_move(&allocations, "realloc");
    }
}


================================================
FILE: quickwit/quickwit-common/src/binary_heap.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::cmp::{Ordering, Reverse};
use std::collections::BinaryHeap;
use std::iter::FusedIterator;

// TODO: Remove this once `BinaryHeap::into_iter_sorted` is stabilized.

#[must_use = "iterators are lazy and do nothing unless consumed"]
#[derive(Clone, Debug)]
pub struct IntoIterSorted<T> {
    inner: BinaryHeap<T>,
}

impl<T> IntoIterSorted<T> {
    pub fn new(instance: BinaryHeap<T>) -> Self {
        Self { inner: instance }
    }
}

impl<T: Ord> Iterator for IntoIterSorted<T> {
    type Item = T;

    #[inline]
    fn next(&mut self) -> Option<T> {
        self.inner.pop()
    }

    #[inline]
    fn size_hint(&self) -> (usize, Option<usize>) {
        let exact = self.inner.len();
        (exact, Some(exact))
    }
}

impl<T: Ord> ExactSizeIterator for IntoIterSorted<T> {}

impl<T: Ord> FusedIterator for IntoIterSorted<T> {}

/// Consumes an iterator entirely and return the top-K best element according to a scoring key.
/// Behavior under the presence of ties is unspecified.
pub fn top_k<T, SortKeyFn, O>(
    mut items: impl Iterator<Item = T>,
    k: usize,
    sort_key_fn: SortKeyFn,
) -> Vec<T>
where
    SortKeyFn: Fn(&T) -> O,
    O: Ord,
{
    if k == 0 {
        return Vec::new();
    }
    let mut heap: BinaryHeap<Reverse<OrderItemPair<O, T>>> = BinaryHeap::with_capacity(k);
    for _ in 0..k {
        if let Some(item) = items.next() {
            let order: O = sort_key_fn(&item);
            heap.push(Reverse(OrderItemPair { order, item }));
        } else {
            break;
        }
    }
    if heap.len() == k {
        for item in items {
            let mut head = heap.peek_mut().unwrap();
            let order = sort_key_fn(&item);
            if head.0.order < order {
                *head = Reverse(OrderItemPair { order, item });
            }
        }
    }
    let resulting_top_k: Vec<T> = heap
        .into_sorted_vec()
        .into_iter()
        .map(|order_item| order_item.0.item)
        .collect();
    resulting_top_k
}

#[derive(Clone)]
struct OrderItemPair<O: Ord, T> {
    order: O,
    item: T,
}

impl<O: Ord, T> Ord for OrderItemPair<O, T> {
    fn cmp(&self, other: &Self) -> Ordering {
        self.order.cmp(&other.order)
    }
}

impl<O: Ord, T> PartialOrd for OrderItemPair<O, T> {
    fn partial_cmp(&self, other: &Self) -> Option<Ordering> {
        Some(self.cmp(other))
    }
}

impl<O: Ord, T> PartialEq for OrderItemPair<O, T> {
    fn eq(&self, other: &Self) -> bool {
        self.order.cmp(&other.order) == Ordering::Equal
    }
}

impl<O: Ord, T> Eq for OrderItemPair<O, T> {}

pub trait SortKeyMapper<Value> {
    type Key;
    fn get_sort_key(&self, value: &Value) -> Self::Key;
}

/// Progressively compute top-k.
#[derive(Clone)]
pub struct TopK<T, O: Ord, S> {
    heap: BinaryHeap<Reverse<OrderItemPair<O, T>>>,
    pub sort_key_mapper: S,
    k: usize,
}

impl<T, O, S> TopK<T, O, S>
where
    O: Ord,
    S: SortKeyMapper<T, Key = O>,
{
    /// Create a new top-k computer.
    pub fn new(k: usize, sort_key_mapper: S) -> Self {
        TopK {
            heap: BinaryHeap::with_capacity(k),
            sort_key_mapper,
            k,
        }
    }

    /// Whether there are k element ready already.
    pub fn at_capacity(&self) -> bool {
        self.heap.len() >= self.k
    }

    pub fn max_len(&self) -> usize {
        self.k
    }

    /// Try to add new entries, if they are better than the current worst.
    pub fn add_entries(&mut self, mut items: impl Iterator<Item = T>) {
        if self.k == 0 {
            return;
        }
        while !self.at_capacity() {
            if let Some(item) = items.next() {
                let order: O = self.sort_key_mapper.get_sort_key(&item);
                self.heap.push(Reverse(OrderItemPair { order, item }));
            } else {
                return;
            }
        }

        for item in items {
            let mut head = self.heap.peek_mut().unwrap();
            let order = self.sort_key_mapper.get_sort_key(&item);
            if head.0.order < order {
                *head = Reverse(OrderItemPair { order, item });
            }
        }
    }

    pub fn add_entry(&mut self, item: T) {
        self.add_entries(std::iter::once(item))
    }

    /// Get a reference to the worst entry.
    pub fn peek_worst(&self) -> Option<&T> {
        self.heap.peek().map(|entry| &entry.0.item)
    }

    /// Get a Vec of sorted entries.
    pub fn finalize(self) -> Vec<T> {
        self.heap
            .into_sorted_vec()
            .into_iter()
            .map(|order_item| order_item.0.item)
            .collect()
    }
}

#[cfg(test)]
mod tests {

    use super::*;

    #[test]
    fn test_top_k() {
        let top_k = super::top_k(vec![1u32, 2, 3].into_iter(), 2, |n| *n);
        assert_eq!(&top_k, &[3, 2]);
        let top_k = super::top_k(vec![1u32, 2, 3].into_iter(), 2, |n| Reverse(*n));
        assert_eq!(&top_k, &[1, 2]);
        let top_k = super::top_k(vec![1u32, 2, 2].into_iter(), 4, |n| *n);
        assert_eq!(&top_k, &[2u32, 2, 1]);
        let top_k = super::top_k(vec![1u32, 2, 2].into_iter(), 4, |n| *n);
        assert_eq!(&top_k, &[2u32, 2, 1]);
        let top_k: Vec<u32> = super::top_k(Vec::new().into_iter(), 4, |n| *n);
        assert!(top_k.is_empty());
    }

    #[test]
    fn test_incremental_top_k() {
        struct Mapper(bool);
        impl SortKeyMapper<u32> for Mapper {
            type Key = u32;
            fn get_sort_key(&self, value: &u32) -> u32 {
                if self.0 { u32::MAX - value } else { *value }
            }
        }
        let mut top_k = TopK::new(2, Mapper(false));
        top_k.add_entries([1u32, 2, 3].into_iter());
        assert!(top_k.at_capacity());
        assert_eq!(top_k.peek_worst(), Some(&2));
        assert_eq!(&top_k.finalize(), &[3, 2]);

        let mut top_k = TopK::new(2, Mapper(false));
        top_k.add_entries([1u32].into_iter());
        assert!(!top_k.at_capacity());
        assert_eq!(top_k.peek_worst(), Some(&1));
        top_k.add_entries([3].into_iter());
        assert!(top_k.at_capacity());
        assert_eq!(top_k.peek_worst(), Some(&1));
        top_k.add_entries([2].into_iter());
        assert!(top_k.at_capacity());
        assert_eq!(top_k.peek_worst(), Some(&2));
        assert_eq!(&top_k.finalize(), &[3, 2]);

        let mut top_k = TopK::new(2, Mapper(true));
        top_k.add_entries([1u32, 2, 3].into_iter());
        assert!(top_k.at_capacity());
        assert_eq!(top_k.peek_worst(), Some(&2));
        assert_eq!(&top_k.finalize(), &[1, 2]);

        let mut top_k = TopK::new(2, Mapper(true));
        top_k.add_entries([1u32].into_iter());
        assert!(!top_k.at_capacity());
        assert_eq!(top_k.peek_worst(), Some(&1));
        top_k.add_entries([3].into_iter());
        assert!(top_k.at_capacity());
        assert_eq!(top_k.peek_worst(), Some(&3));
        top_k.add_entries([2].into_iter());
        assert!(top_k.at_capacity());
        assert_eq!(top_k.peek_worst(), Some(&2));
        assert_eq!(&top_k.finalize(), &[1, 2]);

        let mut top_k = TopK::new(4, Mapper(false));
        top_k.add_entries([2u32, 1, 2].into_iter());
        assert!(!top_k.at_capacity());
        assert_eq!(top_k.peek_worst(), Some(&1));
        assert_eq!(&top_k.finalize(), &[2, 2, 1]);

        let mut top_k = TopK::new(4, Mapper(false));
        top_k.add_entries([2u32].into_iter());
        assert!(!top_k.at_capacity());
        assert_eq!(top_k.peek_worst(), Some(&2));
        top_k.add_entries([1].into_iter());
        assert!(!top_k.at_capacity());
        assert_eq!(top_k.peek_worst(), Some(&1));
        top_k.add_entries([2].into_iter());
        assert!(!top_k.at_capacity());
        assert_eq!(top_k.peek_worst(), Some(&1));
        assert_eq!(&top_k.finalize(), &[2, 2, 1]);

        let mut top_k = TopK::<u32, u32, _>::new(4, Mapper(false));
        top_k.add_entries([].into_iter());
        assert!(top_k.finalize().is_empty());

        let mut top_k = TopK::new(0, Mapper(false));
        top_k.add_entries([1u32, 2, 3].into_iter());
        assert!(top_k.at_capacity());
        assert_eq!(top_k.peek_worst(), None);
        assert!(top_k.finalize().is_empty());
    }
}


================================================
FILE: quickwit/quickwit-common/src/coolid.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use rand::distr::Alphanumeric;
use rand::prelude::*;

const ADJECTIVES: &[&str] = &[
    "aged",
    "ancient",
    "autumn",
    "billowing",
    "bitter",
    "black",
    "blue",
    "bold",
    "broken",
    "cold",
    "cool",
    "crimson",
    "damp",
    "dark",
    "dawn",
    "delicate",
    "divine",
    "dry",
    "empty",
    "falling",
    "floral",
    "fragrant",
    "frosty",
    "green",
    "hidden",
    "holy",
    "icy",
    "late",
    "lingering",
    "little",
    "lively",
    "long",
    "misty",
    "morning",
    "muddy",
    "nameless",
    "old",
    "patient",
    "polished",
    "proud",
    "purple",
    "quiet",
    "red",
    "restless",
    "rough",
    "shy",
    "silent",
    "small",
    "snowy",
    "solitary",
    "sparkling",
    "spring",
    "still",
    "summer",
    "throbbing",
    "twilight",
    "wandering",
    "weathered",
    "white",
    "wild",
    "winter",
    "wispy",
    "withered",
    "young",
];

/// Returns a randomly generated id
pub fn new_coolid(name: &str) -> String {
    let mut rng = rand::rng();
    let adjective = ADJECTIVES[rng.random_range(0..ADJECTIVES.len())];
    let slug: String = rng
        .sample_iter(&Alphanumeric)
        .take(4)
        .map(char::from)
        .collect();
    format!("{name}-{adjective}-{slug}")
}

#[cfg(test)]
mod tests {
    use std::collections::HashSet;

    use super::new_coolid;

    #[test]
    fn test_coolid() {
        let cool_ids: HashSet<String> = std::iter::repeat_with(|| new_coolid("hello"))
            .take(100)
            .collect();
        assert_eq!(cool_ids.len(), 100);
    }
}


================================================
FILE: quickwit/quickwit-common/src/cpus.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::num::NonZero;
use std::sync::OnceLock;

use tracing::{error, info, warn};

const QW_NUM_CPUS_ENV_KEY: &str = "QW_NUM_CPUS";
const KUBERNETES_LIMITS_CPU: &str = "KUBERNETES_LIMITS_CPU";

/// Return the number of vCPU/hyperthreads available.
/// The following methods are used in order:
/// - from the `QW_NUM_CPUS` environment variable
/// - from the `KUBERNETES_LIMITS_CPU` environment variable
/// - from the operating system
/// - default to 2.
pub fn num_cpus() -> usize {
    static NUM_CPUS: OnceLock<usize> = OnceLock::new();
    *NUM_CPUS.get_or_init(num_cpus_aux)
}

fn num_cpus_aux() -> usize {
    let num_cpus_from_os_opt = std::thread::available_parallelism()
        .map(NonZero::get)
        .inspect_err(|err| {
            error!(error=?err, "failed to detect the number of threads available: arbitrarily returning 2");
        })
        .ok();
    let num_cpus_from_env_opt = get_num_cpus_from_env(QW_NUM_CPUS_ENV_KEY);
    let num_cpus_from_k8s_limit = get_num_cpus_from_env(KUBERNETES_LIMITS_CPU);

    if let Some(num_cpus) = num_cpus_from_env_opt {
        return num_cpus;
    }

    if let Some(num_cpus_from_k8s_limit) = num_cpus_from_k8s_limit {
        info!(
            "num cpus from k8s limit: {},  possibly overriding os value {:?}",
            num_cpus_from_k8s_limit, num_cpus_from_env_opt
        );
        return num_cpus_from_k8s_limit;
    }

    if let Some(num_cpus_from_os_opt) = num_cpus_from_os_opt {
        info!("num cpus from os: {}", num_cpus_from_os_opt);
        return num_cpus_from_os_opt;
    }

    warn!("failed to detect number of cpus. defaulting to 2");
    2
}

fn parse_cpu_to_mcpu(cpu_string: &str) -> Result<usize, &'static str> {
    let trimmed_str = cpu_string.trim();

    if trimmed_str.is_empty() {
        return Err("input cpu_string cannot be empty");
    }

    if let Some(val_str) = trimmed_str.strip_suffix('m') {
        // The value is already in millicores.
        val_str
            .parse::<usize>()
            .map_err(|_| "invalid millicore value")
    } else {
        // The value is in CPU cores.
        let value = trimmed_str
            .parse::<f64>()
            .map_err(|_| "invalid float value")?;
        Ok((value * 1000.0f64) as usize)
    }
}

// Get the number of CPUs from an environment variable.
// The value is expected to be in k8s format (200m means 200 millicores, 2 means 2 cores)
//
// We then get the number of vCPUs by ceiling any non integer value.
fn get_num_cpus_from_env(env_key: &str) -> Option<usize> {
    let k8s_cpu_limit_str: String = crate::get_from_env_opt(env_key, false)?;
    let mcpus = parse_cpu_to_mcpu(&k8s_cpu_limit_str)
        .inspect_err(|err_msg| {
            warn!(
                "failed to parse k8s cpu limit (`{}`): {}",
                k8s_cpu_limit_str, err_msg
            );
        })
        .ok()?;
    let num_vcpus = mcpus.div_ceil(1000);
    Some(num_vcpus)
}

#[cfg(test)]
mod tests {
    use super::*;

    #[test]
    fn test_millicores() {
        assert_eq!(parse_cpu_to_mcpu("500m").unwrap(), 500);
        assert_eq!(parse_cpu_to_mcpu("100m").unwrap(), 100);
        assert_eq!(parse_cpu_to_mcpu("2500m").unwrap(), 2500);
    }

    #[test]
    fn test_cores() {
        assert_eq!(parse_cpu_to_mcpu("1").unwrap(), 1000);
        assert_eq!(parse_cpu_to_mcpu("2").unwrap(), 2000);
    }

    #[test]
    fn test_fractional_cores() {
        assert_eq!(parse_cpu_to_mcpu("0.5").unwrap(), 500);
        assert_eq!(parse_cpu_to_mcpu("1.5").unwrap(), 1500);
        assert_eq!(parse_cpu_to_mcpu("0.25").unwrap(), 250);
    }

    #[test]
    fn test_with_whitespace() {
        assert_eq!(parse_cpu_to_mcpu(" 750m ").unwrap(), 750);
        assert_eq!(parse_cpu_to_mcpu(" 0.75 ").unwrap(), 750);
    }

    #[test]
    fn test_invalid_input() {
        assert!(parse_cpu_to_mcpu("").is_err());
        assert!(parse_cpu_to_mcpu("   ").is_err());
        assert!(parse_cpu_to_mcpu("abc").is_err());
        assert!(parse_cpu_to_mcpu("1a").is_err());
        assert!(parse_cpu_to_mcpu("m500").is_err());
        assert!(parse_cpu_to_mcpu("500m1").is_err());
    }
}


================================================
FILE: quickwit/quickwit-common/src/fs.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::path::{Path, PathBuf};

use bytesize::ByteSize;
use sysinfo::{Disk, DiskRefreshKind};
use tokio;

/// Deletes the contents of a directory.
pub async fn empty_dir<P: AsRef<Path>>(path: P) -> anyhow::Result<()> {
    let mut entries = tokio::fs::read_dir(path).await?;
    while let Some(entry) = entries.next_entry().await? {
        if entry.file_type().await?.is_dir() {
            tokio::fs::remove_dir_all(entry.path()).await?
        } else {
            tokio::fs::remove_file(entry.path()).await?;
        }
    }
    Ok(())
}

/// Helper function to get the indexer split cache path.
pub fn get_cache_directory_path(data_dir_path: &Path) -> PathBuf {
    data_dir_path.join("indexer-split-cache").join("splits")
}

/// Get the total size of the disk containing the given directory, or `None` if
/// it couldn't be determined.
pub fn get_disk_size(dir_path: &Path) -> Option<ByteSize> {
    let disks = sysinfo::Disks::new_with_refreshed_list_specifics(
        DiskRefreshKind::nothing().with_storage(),
    );
    let mut best_match: Option<(&Disk, PathBuf)> = None;
    let dir_path = dir_path.canonicalize().ok()?;
    for disk in disks.list() {
        let canonical_mount_path = disk.mount_point().canonicalize().ok()?;
        if dir_path.starts_with(&canonical_mount_path) {
            match best_match {
                Some((_, best_mount_point))
                    if canonical_mount_path.starts_with(&best_mount_point) =>
                {
                    best_match = Some((disk, canonical_mount_path.clone()));
                }
                None => {
                    best_match = Some((disk, canonical_mount_path.clone()));
                }
                _ => {}
            }
        }
        if canonical_mount_path.starts_with(&dir_path) && canonical_mount_path != dir_path {
            // if a disk is mounted within the directory, we can't determine the
            // size of the directories disk
            return None;
        }
    }
    best_match.map(|(disk, _)| ByteSize::b(disk.total_space()))
}

#[cfg(test)]
mod tests {
    use tempfile;

    use super::*;

    #[tokio::test]
    async fn test_empty_dir() -> anyhow::Result<()> {
        let temp_dir = tempfile::tempdir()?;

        let file_path = temp_dir.path().join("file");
        tokio::fs::File::create(file_path).await?;

        let subdir = temp_dir.path().join("subdir");
        tokio::fs::create_dir(&subdir).await?;

        let subfile_path = subdir.join("subfile");
        tokio::fs::File::create(subfile_path).await?;

        empty_dir(temp_dir.path()).await?;
        assert!(
            tokio::fs::read_dir(temp_dir.path())
                .await?
                .next_entry()
                .await?
                .is_none()
        );
        Ok(())
    }
}


================================================
FILE: quickwit/quickwit-common/src/io.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

// This file contains code copied from the Resource trait
// in async-speed-limit from the TiKV project.
// https://github.com/tikv/async-speed-limit/blob/master/src/io.rs
//
// Copyright 2019 TiKV Project Authors. Licensed under MIT or Apache-2.0.

// We are simply porting the logic to tokio here and adding the functionality to
// plug some metrics.

use std::future::Future;
use std::io;
use std::io::IoSlice;
use std::pin::Pin;
use std::task::{Context, Poll};
use std::time::Duration;

pub use async_speed_limit::Limiter;
use async_speed_limit::clock::StandardClock;
use async_speed_limit::limiter::Consume;
use bytesize::ByteSize;
use once_cell::sync::Lazy;
use pin_project::pin_project;
use prometheus::IntCounter;
use tokio::io::AsyncWrite;

use crate::metrics::{IntCounterVec, new_counter_vec};
use crate::{KillSwitch, Progress, ProtectedZoneGuard};

// Max 1MB at a time.
const MAX_NUM_BYTES_WRITTEN_AT_ONCE: usize = 1 << 20;

fn truncate_bytes(bytes: &[u8]) -> &[u8] {
    let num_bytes = bytes.len().min(MAX_NUM_BYTES_WRITTEN_AT_ONCE);
    &bytes[..num_bytes]
}

struct IoMetrics {
    write_bytes: IntCounterVec<1>,
}

impl Default for IoMetrics {
    fn default() -> Self {
        let write_bytes = new_counter_vec(
            "write_bytes",
            "Number of bytes written by a given component in [indexer, merger, deleter, \
             split_downloader_{merge,delete}]",
            "",
            &[],
            ["component"],
        );
        Self { write_bytes }
    }
}

static IO_METRICS: Lazy<IoMetrics> = Lazy::new(IoMetrics::default);

/// Parameter used in `async_speed_limit`.
///
/// The default value is good and does not need to be tweaked.
/// We use a smaller value in unit test to get reasonably accurate throttling one very
/// short period of times.
///
/// For more details, please refer to `async_speed_limit` documentation.
const REFILL_DURATION: Duration = if cfg!(test) {
    Duration::from_millis(10)
} else {
    // Default value in async_speed_limit
    Duration::from_millis(100)
};

pub fn limiter(throughput: ByteSize) -> Limiter {
    Limiter::builder(throughput.as_u64() as f64)
        .refill(REFILL_DURATION)
        .build()
}

#[derive(Clone)]
pub struct IoControls {
    throughput_limiter_opt: Option<Limiter>,
    bytes_counter: IntCounter,
    progress: Progress,
    kill_switch: KillSwitch,
}

impl Default for IoControls {
    fn default() -> Self {
        let default_bytes_counter =
            IntCounter::new("default_write_num_bytes", "Default write counter.").unwrap();
        IoControls {
            throughput_limiter_opt: None,
            progress: Progress::default(),
            kill_switch: KillSwitch::default(),
            bytes_counter: default_bytes_counter,
        }
    }
}

impl IoControls {
    #[must_use]
    pub fn progress(&self) -> &Progress {
        &self.progress
    }

    pub fn kill(&self) {
        self.kill_switch.kill();
    }

    pub fn num_bytes(&self) -> u64 {
        self.bytes_counter.get()
    }

    pub fn check_if_alive(&self) -> io::Result<ProtectedZoneGuard> {
        if self.kill_switch.is_dead() {
            return Err(io::Error::other("directory kill switch was activated"));
        }
        let guard = self.progress.protect_zone();
        Ok(guard)
    }

    pub fn set_component(mut self, component: &str) -> Self {
        self.bytes_counter = IO_METRICS.write_bytes.with_label_values([component]);
        self
    }

    pub fn set_throughput_limit(self, throughput: ByteSize) -> Self {
        let throughput_limiter = Limiter::builder(throughput.as_u64() as f64)
            .refill(REFILL_DURATION)
            .build();
        self.set_throughput_limiter_opt(Some(throughput_limiter))
    }

    pub fn set_throughput_limiter_opt(mut self, throughput_limiter_opt: Option<Limiter>) -> Self {
        self.throughput_limiter_opt = throughput_limiter_opt;
        self
    }

    pub fn set_bytes_counter(mut self, bytes_counter: IntCounter) -> Self {
        self.bytes_counter = bytes_counter;
        self
    }

    pub fn set_progress(mut self, progress: Progress) -> Self {
        self.progress = progress;
        self
    }

    pub fn set_kill_switch(mut self, kill_switch: KillSwitch) -> Self {
        self.kill_switch = kill_switch;
        self
    }
    fn consume_blocking(&self, num_bytes: usize) -> io::Result<()> {
        let _guard = self.check_if_alive()?;
        if let Some(throughput_limiter) = &self.throughput_limiter_opt {
            throughput_limiter.blocking_consume(num_bytes);
        }
        self.bytes_counter.inc_by(num_bytes as u64);
        Ok(())
    }
}

#[pin_project]
pub struct ControlledWrite<A: IoControlsAccess, W> {
    #[pin]
    underlying_wrt: W,
    waiter: Option<Consume<StandardClock, ()>>,
    io_controls_access: A,
}

impl<A: IoControlsAccess, W: AsyncWrite> ControlledWrite<A, W> {
    // This function was copied from TiKV's `async-speed-limit`.
    // Copyright 2019 TiKV Project Authors. Licensed under MIT or Apache-2.0.
    /// Wraps a poll function with a delay after it.
    ///
    /// This method calls the given `poll` function until it is fulfilled. After
    /// that, the result is saved into this `Resource` instance (therefore
    /// different `poll_***` calls should not be interleaving), while returning
    /// `Pending` until the limiter has completely consumed the result.
    #[allow(dead_code)]
    pub(crate) fn poll_limited(
        self: Pin<&mut Self>,
        cx: &mut Context<'_>,
        poll: impl FnOnce(Pin<&mut W>, &mut Context<'_>) -> Poll<io::Result<usize>>,
    ) -> Poll<io::Result<usize>> {
        let this = self.project();

        let _protect_guard = match this
            .io_controls_access
            .apply(|io_controls| io_controls.check_if_alive())
        {
            Ok(protect_guard) => protect_guard,
            Err(io_err) => {
                return Poll::Ready(Err(io_err));
            }
        };

        if let Some(waiter) = this.waiter {
            let res = Pin::new(waiter).poll(cx);
            if res.is_pending() {
                return Poll::Pending;
            }
            *this.waiter = None;
        }

        let res: Poll<io::Result<usize>> = poll(this.underlying_wrt, cx);
        if let Poll::Ready(obj) = &res {
            let len = *obj.as_ref().unwrap_or(&0);
            if len > 0 {
                let waiter = this.io_controls_access.apply(|io_controls| {
                    io_controls.bytes_counter.inc_by(len as u64);
                    io_controls
                        .throughput_limiter_opt
                        .as_ref()
                        .map(|limiter| limiter.consume(len))
                });
                *this.waiter = waiter
            }
        }
        res
    }
}

/// Quirky spec: truncates the list of bufs, and keep as many leftmost elements
/// as possible, within the constraint of not exceeding `max_len` bytes.
///
/// Please keep this function private
fn quirky_truncate_slices<'a, 'b>(bufs: &'b [IoSlice<'a>], max_len: usize) -> &'b [IoSlice<'a>] {
    if bufs.is_empty() {
        return bufs;
    }
    let mut cumulated_len = bufs[0].len();
    for (i, buf) in bufs.iter().enumerate().skip(1) {
        cumulated_len += buf.len();
        if cumulated_len > max_len {
            return &bufs[..i];
        }
    }
    bufs
}

impl<A: IoControlsAccess, W: AsyncWrite> AsyncWrite for ControlledWrite<A, W> {
    fn poll_write(
        self: Pin<&mut Self>,
        cx: &mut Context<'_>,
        buf: &[u8],
    ) -> Poll<io::Result<usize>> {
        let buf = truncate_bytes(buf);
        // The shadowing is on purpose.
        self.poll_limited(cx, |r, cx| r.poll_write(cx, buf))
    }

    fn poll_write_vectored(
        self: Pin<&mut Self>,
        cx: &mut Context<'_>,
        bufs: &[IoSlice<'_>],
    ) -> Poll<io::Result<usize>> {
        if bufs.is_empty() {
            return Poll::Ready(Ok(0));
        }
        // The shadowing is on purpose.
        let bufs = quirky_truncate_slices(bufs, MAX_NUM_BYTES_WRITTEN_AT_ONCE);
        self.poll_limited(cx, |r, cx| r.poll_write_vectored(cx, bufs))
    }

    fn poll_flush(self: Pin<&mut Self>, cx: &mut Context<'_>) -> Poll<io::Result<()>> {
        self.project().underlying_wrt.poll_flush(cx)
    }

    fn poll_shutdown(self: Pin<&mut Self>, cx: &mut Context<'_>) -> Poll<Result<(), io::Error>> {
        self.project().underlying_wrt.poll_shutdown(cx)
    }
}

pub trait IoControlsAccess: Sized {
    fn wrap_write<W>(self, wrt: W) -> ControlledWrite<Self, W> {
        ControlledWrite {
            underlying_wrt: wrt,
            waiter: None,
            io_controls_access: self,
        }
    }

    fn apply<F, R>(&self, f: F) -> R
    where F: Fn(&IoControls) -> R;
}

impl IoControlsAccess for IoControls {
    fn apply<F, R>(&self, f: F) -> R
    where F: Fn(&IoControls) -> R {
        f(self)
    }
}

impl<A, W> ControlledWrite<A, W>
where A: IoControlsAccess
{
    pub fn underlying_wrt(&mut self) -> &mut W {
        &mut self.underlying_wrt
    }

    fn check_if_alive(&self) -> io::Result<ProtectedZoneGuard> {
        self.io_controls_access
            .apply(|io_controls| io_controls.check_if_alive())
    }
}

impl<A, W: io::Write> io::Write for ControlledWrite<A, W>
where A: IoControlsAccess
{
    fn write(&mut self, buf: &[u8]) -> io::Result<usize> {
        let buf = truncate_bytes(buf);
        let written_num_bytes = self.underlying_wrt.write(buf)?;
        self.io_controls_access
            .apply(|io_controls| io_controls.consume_blocking(written_num_bytes))?;
        Ok(written_num_bytes)
    }

    fn flush(&mut self) -> io::Result<()> {
        // We voluntarily avoid to check the kill switch on flush.
        // This is because the `RAMDirectory` currently panics if flush
        // is not called before `Drop`.
        let _guard = self.check_if_alive();
        self.underlying_wrt.flush()
    }
}

#[cfg(test)]
mod tests {
    use std::io::{IoSlice, Write};
    use std::time::Duration;

    use bytesize::ByteSize;
    use tokio::io::{AsyncWriteExt, sink};
    use tokio::time::Instant;

    use crate::io::{IoControls, IoControlsAccess};

    #[tokio::test]
    async fn test_controlled_writer_limited_async() {
        let io_controls = IoControls::default().set_throughput_limit(ByteSize::mb(2));
        let mut controlled_write = io_controls.clone().wrap_write(sink());
        let buf = vec![44u8; 1_000];
        let start = Instant::now();
        // We write 200 KB
        for _ in 0..200 {
            controlled_write.write_all(&buf).await.unwrap();
        }
        controlled_write.flush().await.unwrap();
        let elapsed = start.elapsed();
        assert!(elapsed >= Duration::from_millis(50));
        assert!(elapsed <= Duration::from_millis(150));
        assert_eq!(io_controls.num_bytes(), 200_000u64);
    }

    #[tokio::test]
    async fn test_controlled_writer_no_limit_async() {
        let io_controls = IoControls::default();
        let mut controlled_write = io_controls.clone().wrap_write(sink());
        let buf = vec![44u8; 1_000];
        let start = Instant::now();
        // We write 2MB
        for _ in 0..2_000 {
            controlled_write.write_all(&buf).await.unwrap();
        }
        controlled_write.flush().await.unwrap();
        let elapsed = start.elapsed();
        assert!(elapsed <= Duration::from_millis(10));
        assert_eq!(io_controls.num_bytes(), 2_000_000u64);
    }

    #[test]
    fn test_controlled_writer_limited_sync() {
        let io_controls = IoControls::default().set_throughput_limit(ByteSize::mb(2));
        let mut controlled_write = io_controls.clone().wrap_write(std::io::sink());
        let buf = vec![44u8; 1_000];
        let start = Instant::now();
        // We write 200 KB
        for _ in 0..200 {
            controlled_write.write_all(&buf).unwrap();
        }
        controlled_write.flush().unwrap();
        let elapsed = start.elapsed();
        assert!(elapsed >= Duration::from_millis(50));
        assert!(elapsed <= Duration::from_millis(150));
        assert_eq!(io_controls.num_bytes(), 200_000u64);
    }

    #[test]
    fn test_controlled_writer_no_limit_sync() {
        let io_controls = IoControls::default();
        let mut controlled_write = io_controls.clone().wrap_write(std::io::sink());
        let buf = vec![44u8; 1_000];
        let start = Instant::now();
        // We write 2MB
        for _ in 0..2_000 {
            controlled_write.write_all(&buf).unwrap();
        }
        controlled_write.flush().unwrap();
        let elapsed = start.elapsed();
        assert!(elapsed <= Duration::from_millis(5));
        assert_eq!(io_controls.num_bytes(), 2_000_000u64);
    }

    #[test]
    fn test_truncate_io_slices_one_slice_too_long_corner_case() {
        let one_slice = IoSlice::new(&b"abcdef"[..]);
        assert_eq!(super::quirky_truncate_slices(&[one_slice], 2).len(), 1);
    }

    #[test]
    fn test_truncate_io_empty() {
        assert_eq!(super::quirky_truncate_slices(&[], 2).len(), 0);
    }

    #[test]
    fn test_truncate_io_slices() {
        let slices = &[
            IoSlice::new(&b"abc"[..]),
            IoSlice::new(&b"defg"[..]),
            IoSlice::new(&b"hi"[..]),
        ];
        assert_eq!(super::quirky_truncate_slices(slices, 0).len(), 1);
        assert_eq!(super::quirky_truncate_slices(slices, 6).len(), 1);
        assert_eq!(super::quirky_truncate_slices(slices, 7).len(), 2);
        assert_eq!(super::quirky_truncate_slices(slices, 9).len(), 3);
        assert_eq!(super::quirky_truncate_slices(slices, 10).len(), 3);
    }
}


================================================
FILE: quickwit/quickwit-common/src/jemalloc_profiled.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::alloc::{GlobalAlloc, Layout};
use std::hash::Hasher;
use std::sync::Mutex;
use std::sync::atomic::{AtomicBool, AtomicU64, Ordering};

use bytesize::ByteSize;
use once_cell::sync::Lazy;
use tikv_jemallocator::Jemalloc;
use tracing::{error, info, trace};

use crate::alloc_tracker::{
    AllocRecordingResponse, AllocStat, Allocations, ReallocRecordingResponse,
};

const DEFAULT_MIN_ALLOC_BYTES_FOR_PROFILING: u64 = 64 * 1024;
const DEFAULT_REPORTING_INTERVAL_BYTES: u64 = 1024 * 1024 * 1024;

/// This custom target name is used to filter profiling events in the tracing
/// subscriber. It is also included in the printed log.
pub const JEMALLOC_PROFILER_TARGET: &str = "jemprof";

/// Atomics are used to communicate configurations between the start/stop
/// endpoints and the [JemallocProfiled] allocator wrapper.
///
/// The flags are padded to avoid false sharing of the CPU cache line between
/// threads. 128 bytes is the cache line size on x86_64 and arm64.
#[repr(align(128))]
struct Flags {
    /// The minimum allocation size that is recorded by the tracker.
    min_alloc_bytes_for_profiling: AtomicU64,
    /// Whether the profiling is started or not.
    enabled: AtomicBool,
    /// Padding to make sure we fill the cache line.
    _padding: [u8; 119], // 128 (align) - 8 (u64) - 1 (bool)
}

static FLAGS: Flags = Flags {
    min_alloc_bytes_for_profiling: AtomicU64::new(DEFAULT_MIN_ALLOC_BYTES_FOR_PROFILING),
    enabled: AtomicBool::new(false),
    _padding: [0; 119],
};

static ALLOCATION_TRACKER: Lazy<Mutex<Allocations>> =
    Lazy::new(|| Mutex::new(Allocations::default()));

/// Starts measuring heap allocations and logs important leaks.
///
/// This function uses a wrapper around the global Jemalloc allocator to
/// instrument it.
///
/// Each time an allocation bigger than min_alloc_bytes_for_profiling is
/// performed, it is recorded in a map and the statistics for its call site are
/// updated. Tracking allocations is costly because it requires acquiring a
/// global mutex. Setting a reasonable value for min_alloc_bytes_for_profiling
/// is crucial. For instance for a search aggregation request, tracking every
/// allocations (min_alloc_bytes_for_profiling=1) is typically 100x slower than
/// using a minimum of 64kB.
///
/// During profiling, the statistics per call site are used to log when specific
/// thresholds are exceeded. For each call site, the allocated memory is logged
/// (with a backtrace) every time it exceeds the last logged allocated memory by
/// at least alloc_bytes_triggering_backtrace. This logging interval should
/// usually be set to a value of at least 500MB to limit the logging verbosity.
pub fn start_profiling(
    min_alloc_bytes_for_profiling: Option<u64>,
    alloc_bytes_triggering_backtrace: Option<u64>,
) {
    #[cfg(miri)]
    warn!(
        "heap profiling is not supported with Miri because in that case the `backtrace` crate \
         allocates"
    );

    // Call backtrace once to warmup symbolization allocations (~30MB)
    backtrace::trace(|frame| {
        backtrace::resolve_frame(frame, |_| {});
        true
    });

    let alloc_bytes_triggering_backtrace =
        alloc_bytes_triggering_backtrace.unwrap_or(DEFAULT_REPORTING_INTERVAL_BYTES);
    ALLOCATION_TRACKER
        .lock()
        .unwrap()
        .init(alloc_bytes_triggering_backtrace);

    let min_alloc_bytes_for_profiling =
        min_alloc_bytes_for_profiling.unwrap_or(DEFAULT_MIN_ALLOC_BYTES_FOR_PROFILING);

    // stdout() might allocate a buffer on first use. If the first allocation
    // tracked comes from stdout, it will trigger a deadlock. Logging here
    // guarantees that it doesn't happen.
    info!(
        min_alloc_for_profiling = %ByteSize(min_alloc_bytes_for_profiling),
        alloc_triggering_backtrace = %ByteSize(alloc_bytes_triggering_backtrace),
        "heap profiling running"
    );

    // Use strong ordering to make sure all threads see these changes in this order
    FLAGS
        .min_alloc_bytes_for_profiling
        .store(min_alloc_bytes_for_profiling, Ordering::SeqCst);
    FLAGS.enabled.store(true, Ordering::SeqCst);
}

/// Stops measuring heap allocations.
///
/// The allocation tracking tables and the symbol cache are not cleared.
pub fn stop_profiling() {
    // Use strong ordering to make sure all threads see these changes in this order
    let previously_enabled = FLAGS.enabled.swap(false, Ordering::SeqCst);
    FLAGS
        .min_alloc_bytes_for_profiling
        .store(DEFAULT_MIN_ALLOC_BYTES_FOR_PROFILING, Ordering::SeqCst);

    info!(previously_enabled, "heap profiling stopped");
}

/// Wraps the Jemalloc global allocator calls with tracking routines.
///
/// The tracking routines are called only when FLAGS.enabled is set to true
/// (calling [start_profiling()]). We load it with [Ordering::Relaxed] because
/// it's fine to miss or record extra allocation events and prefer limiting the
/// performance impact when profiling is not enabled.
///
/// Note: It's important to ensure that no allocations are performed inside the
/// allocator! It can cause an abort, a panic or even a deadlock.
pub struct JemallocProfiled(pub Jemalloc);

unsafe impl GlobalAlloc for JemallocProfiled {
    #[inline]
    unsafe fn alloc(&self, layout: Layout) -> *mut u8 {
        let ptr = unsafe { self.0.alloc(layout) };
        if FLAGS.enabled.load(Ordering::Relaxed) {
            track_alloc_call(ptr, layout);
        }
        ptr
    }

    #[inline]
    unsafe fn alloc_zeroed(&self, layout: Layout) -> *mut u8 {
        let ptr = unsafe { self.0.alloc_zeroed(layout) };
        if FLAGS.enabled.load(Ordering::Relaxed) {
            track_alloc_call(ptr, layout);
        }
        ptr
    }

    #[inline]
    unsafe fn dealloc(&self, ptr: *mut u8, layout: Layout) {
        if FLAGS.enabled.load(Ordering::Relaxed) {
            track_dealloc_call(ptr, layout);
        }
        unsafe { self.0.dealloc(ptr, layout) }
    }

    #[inline]
    unsafe fn realloc(&self, old_ptr: *mut u8, layout: Layout, new_size: usize) -> *mut u8 {
        let new_ptr = unsafe { self.0.realloc(old_ptr, layout, new_size) };
        if FLAGS.enabled.load(Ordering::Relaxed) {
            track_realloc_call(old_ptr, new_ptr, layout, new_size);
        }
        new_ptr
    }
}

/// Prints both a backtrace and a Tokio tracing log
///
/// Warning: stdout writer might allocate a buffer on first use
fn identify_callsite(callsite_hash: u64, stat: AllocStat) {
    // To generate a complete trace:
    // - tokio/tracing feature must be enabled, otherwise un-instrumented tasks will not propagate
    //   parent spans
    // - the tracing fmt subscriber filter must keep all spans for this event (TRACE level). See the
    //   logger configuration for more details.
    trace!(target: JEMALLOC_PROFILER_TARGET, callsite=callsite_hash, allocs=stat.count, size=%stat.size);
}

fn backtrace_hash() -> u64 {
    let mut hasher = fnv::FnvHasher::default();
    backtrace::trace(|frame| {
        hasher.write_usize(frame.ip() as usize);
        true
    });
    hasher.finish()
}

/// Warning: this function should not allocate!
#[cold]
fn track_alloc_call(ptr: *mut u8, layout: Layout) {
    if layout.size() >= FLAGS.min_alloc_bytes_for_profiling.load(Ordering::Relaxed) as usize {
        let callsite_hash = backtrace_hash();
        let recording_response = ALLOCATION_TRACKER.lock().unwrap().record_allocation(
            callsite_hash,
            layout.size() as u64,
            ptr,
        );

        match recording_response {
            AllocRecordingResponse::ThresholdExceeded(stat_for_trace) => {
                identify_callsite(callsite_hash, stat_for_trace);
            }
            AllocRecordingResponse::TrackerFull(table_name) => {
                // this message might be displayed multiple times but that's fine
                // warning: stdout writer might allocate a buffer on first use
                error!("heap profiling stopped, {table_name} full");
                FLAGS.enabled.store(false, Ordering::Relaxed);
            }
            AllocRecordingResponse::ThresholdNotExceeded => {}
            AllocRecordingResponse::NotStarted => {}
        }
    }
}

/// Warning: this function should not allocate!
#[cold]
fn track_dealloc_call(ptr: *mut u8, layout: Layout) {
    if layout.size() >= FLAGS.min_alloc_bytes_for_profiling.load(Ordering::Relaxed) as usize {
        ALLOCATION_TRACKER.lock().unwrap().record_deallocation(ptr);
    }
}

/// Warning: this function should not allocate!
#[cold]
fn track_realloc_call(old_ptr: *mut u8, new_ptr: *mut u8, current_layout: Layout, new_size: usize) {
    if current_layout.size() >= FLAGS.min_alloc_bytes_for_profiling.load(Ordering::Relaxed) as usize
    {
        let recording_response = ALLOCATION_TRACKER.lock().unwrap().record_reallocation(
            new_size as u64,
            old_ptr,
            new_ptr,
        );

        match recording_response {
            ReallocRecordingResponse::ThresholdExceeded {
                statistics,
                callsite_hash,
            } => {
                identify_callsite(callsite_hash, statistics);
            }
            ReallocRecordingResponse::ThresholdNotExceeded => {}
            ReallocRecordingResponse::NotStarted => {}
        }
    }
}

#[cfg(test)]
mod tests {
    use super::*;

    #[test]
    fn test_size_of_flags() {
        assert_eq!(std::mem::size_of::<Flags>(), 128);
    }
}


================================================
FILE: quickwit/quickwit-common/src/kill_switch.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::sync::atomic::{AtomicBool, Ordering};
use std::sync::{Arc, Mutex, Weak};

use tracing::debug;

#[derive(Clone, Default)]
pub struct KillSwitch {
    inner: Arc<Inner>,
}

struct Inner {
    alive: AtomicBool,
    children: Mutex<Vec<Weak<Inner>>>,
}

impl Default for Inner {
    fn default() -> Self {
        Self {
            alive: AtomicBool::new(true),
            children: Mutex::default(),
        }
    }
}

fn garbage_collect(children: &mut Vec<Weak<Inner>>) {
    let mut i = 0;
    while i < children.len() {
        if Weak::strong_count(&children[i]) == 0 {
            children.swap_remove(i);
        } else {
            i += 1;
        }
    }
}

impl KillSwitch {
    pub fn is_alive(&self) -> bool {
        self.inner.alive.load(Ordering::Relaxed)
    }

    pub fn is_dead(&self) -> bool {
        !self.is_alive()
    }

    pub fn kill(&self) {
        self.inner.kill();
    }

    // Creates a child killswitch.
    //
    // If the parent kill switch is dead to begin with, the child will be dead too.
    pub fn child(&self) -> KillSwitch {
        let mut lock = self.inner.children.lock().unwrap();
        let child_inner = Inner {
            alive: AtomicBool::new(self.is_alive()),
            ..Default::default()
        };
        garbage_collect(&mut lock);
        let child_inner_arc = Arc::new(child_inner);
        lock.push(Arc::downgrade(&child_inner_arc));
        KillSwitch {
            inner: child_inner_arc,
        }
    }
}

impl Inner {
    pub fn kill(&self) {
        debug!("kill-switch-activated");
        self.alive.store(false, Ordering::Relaxed);
        let mut lock = self.children.lock().unwrap();
        for weak in lock.drain(..) {
            if let Some(inner) = weak.upgrade() {
                inner.kill();
            }
        }
    }
}
#[cfg(test)]
mod tests {
    use super::KillSwitch;

    #[test]
    fn test_kill_switch() {
        let kill_switch = KillSwitch::default();
        assert!(kill_switch.is_alive());
        assert!(!kill_switch.is_dead());
        kill_switch.kill();
        assert!(!kill_switch.is_alive());
        assert!(kill_switch.is_dead());
        kill_switch.kill();
        assert!(!kill_switch.is_alive());
        assert!(kill_switch.is_dead());
    }

    #[test]
    fn test_kill_switch_child() {
        let kill_switch = KillSwitch::default();
        let child_kill_switch = kill_switch.child();
        let child_kill_switch2 = kill_switch.child();
        assert!(child_kill_switch.is_alive());
        assert!(child_kill_switch2.is_alive());
        kill_switch.kill();
        assert!(child_kill_switch.is_dead());
        assert!(child_kill_switch2.is_dead());
    }

    #[test]
    fn test_kill_switch_grandchildren() {
        let kill_switch = KillSwitch::default();
        let child_kill_switch = kill_switch.child();
        let grandchild_kill_switch = child_kill_switch.child();
        assert!(kill_switch.is_alive());
        assert!(child_kill_switch.is_alive());
        assert!(grandchild_kill_switch.is_alive());
        kill_switch.kill();
        assert!(kill_switch.is_dead());
        assert!(child_kill_switch.is_dead());
        assert!(grandchild_kill_switch.is_dead());
    }

    #[test]
    fn test_kill_switch_to_quoque_me_fili() {
        let kill_switch = KillSwitch::default();
        let child_kill_switch = kill_switch.child();
        assert!(kill_switch.is_alive());
        assert!(child_kill_switch.is_alive());
        child_kill_switch.kill();
        assert!(kill_switch.is_alive());
        assert!(child_kill_switch.is_dead());
    }
}


================================================
FILE: quickwit/quickwit-common/src/lib.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#![deny(clippy::disallowed_methods)]

mod coolid;

#[cfg(feature = "jemalloc-profiled")]
pub(crate) mod alloc_tracker;
pub mod binary_heap;
mod cpus;
pub mod fs;
pub mod io;
#[cfg(feature = "jemalloc-profiled")]
pub mod jemalloc_profiled;
mod kill_switch;
pub mod metrics;
pub mod net;
mod path_hasher;
pub mod pretty;
mod progress;
pub mod pubsub;
pub mod rand;
pub mod rate_limited_tracing;
pub mod rate_limiter;
pub mod rendezvous_hasher;
pub mod retry;
pub mod ring_buffer;
pub mod runtimes;
pub mod shared_consts;
pub mod sorted_iter;
pub mod stream_utils;
pub mod temp_dir;
#[cfg(any(test, feature = "testsuite"))]
pub mod test_utils;
pub mod thread_pool;
pub mod tower;
pub mod type_map;
pub mod uri;

mod socket_addr_legacy_hash;

use std::env;
use std::fmt::{Debug, Display};
use std::future::Future;
use std::ops::{Range, RangeInclusive};
use std::str::FromStr;

pub use coolid::new_coolid;
pub use cpus::num_cpus;
pub use kill_switch::KillSwitch;
pub use path_hasher::PathHasher;
pub use progress::{Progress, ProtectedZoneGuard};
pub use socket_addr_legacy_hash::SocketAddrLegacyHash;
pub use stream_utils::{BoxStream, ServiceStream};
use tracing::{error, info};

/// Returns true at compile time. This function is mostly used with serde to initialize boolean
/// fields to true.
pub const fn true_fn() -> bool {
    true
}

/// Returns whether the given boolean value is true. This function is mostly used with serde to skip
/// serializing boolean fields with `skip_serializing_if = "is_true"` when the value is true.
pub fn is_true(value: &bool) -> bool {
    *value
}

pub fn chunk_range(range: Range<usize>, chunk_size: usize) -> impl Iterator<Item = Range<usize>> {
    range.clone().step_by(chunk_size).map(move |block_start| {
        let block_end = (block_start + chunk_size).min(range.end);
        block_start..block_end
    })
}

pub fn into_u64_range(range: Range<usize>) -> Range<u64> {
    range.start as u64..range.end as u64
}

pub fn setup_logging_for_tests() {
    let _ = env_logger::builder().format_timestamp(None).try_init();
}

pub fn split_file(split_id: impl Display) -> String {
    format!("{split_id}.split")
}

fn get_from_env_opt_aux<T: Debug>(
    key: &str,
    parse_fn: impl FnOnce(&str) -> Option<T>,
    sensitive: bool,
) -> Option<T> {
    let value_str = std::env::var(key).ok()?;
    let Some(value) = parse_fn(&value_str) else {
        error!(value=%value_str, "failed to parse environment variable `{key}` value");
        return None;
    };
    if sensitive {
        info!("using environment variable `{key}` value");
    } else {
        info!(value=?value, "using environment variable `{key}` value");
    }
    Some(value)
}

pub fn get_from_env<T: FromStr + Debug>(key: &str, default_value: T, sensitive: bool) -> T {
    if let Some(value) = get_from_env_opt(key, sensitive) {
        value
    } else {
        info!(default_value=?default_value, "using environment variable `{key}` default value");
        default_value
    }
}

pub fn get_from_env_opt<T: FromStr + Debug>(key: &str, sensitive: bool) -> Option<T> {
    get_from_env_opt_aux(key, |val_str| val_str.parse().ok(), sensitive)
}

pub fn get_bool_from_env_opt(key: &str) -> Option<bool> {
    get_from_env_opt_aux(key, parse_bool_lenient, false)
}

pub fn get_bool_from_env(key: &str, default_value: bool) -> bool {
    if let Some(flag_value) = get_bool_from_env_opt(key) {
        flag_value
    } else {
        info!(default_value=%default_value, "using environment variable `{key}` default value");
        default_value
    }
}

pub fn truncate_str(text: &str, max_len: usize) -> &str {
    if max_len > text.len() {
        return text;
    }

    let mut truncation_index = max_len;
    while !text.is_char_boundary(truncation_index) {
        truncation_index -= 1;
    }
    &text[..truncation_index]
}

/// Extracts time range from optional start and end timestamps.
pub fn extract_time_range(
    start_timestamp_opt: Option<i64>,
    end_timestamp_opt: Option<i64>,
) -> Option<Range<i64>> {
    match (start_timestamp_opt, end_timestamp_opt) {
        (Some(start_timestamp), Some(end_timestamp)) => Some(Range {
            start: start_timestamp,
            end: end_timestamp,
        }),
        (_, Some(end_timestamp)) => Some(Range {
            start: i64::MIN,
            end: end_timestamp,
        }),
        (Some(start_timestamp), _) => Some(Range {
            start: start_timestamp,
            end: i64::MAX,
        }),
        _ => None,
    }
}

/// Takes 2 intervals and returns true iff their intersection is empty
pub fn is_disjoint(left: &Range<i64>, right: &RangeInclusive<i64>) -> bool {
    left.end <= *right.start() || *right.end() < left.start
}

/// For use with the `skip_serializing_if` serde attribute.
pub fn is_false(value: &bool) -> bool {
    !*value
}

pub fn no_color() -> bool {
    matches!(env::var("NO_COLOR"), Ok(value) if !value.is_empty())
}

#[macro_export]
macro_rules! assert_eventually {
    ($cond:expr, $timeout:expr, $interval:expr) => {
        let start = std::time::Instant::now();
        loop {
            if $cond {
                break;
            }
            if start.elapsed() > $timeout {
                panic!(
                    "assertion failed: condition `{}` never became true within {} ms",
                    stringify!($cond),
                    $timeout.as_millis()
                );
            }
            tokio::time::sleep($interval).await;
        }
    };
    ($cond:expr, $timeout:expr) => {
        assert_eventually!($cond, $timeout, std::time::Duration::from_millis(50));
    };
    ($cond:expr) => {
        assert_eventually!($cond, std::time::Duration::from_secs(1));
    };
}

#[macro_export]
macro_rules! ignore_error_kind {
    ($kind:path, $expr:expr) => {
        match $expr {
            Ok(_) => Ok(()),
            Err(error) if error.kind() == $kind => Ok(()),
            Err(error) => Err(error),
        }
    };
}

#[inline]
pub const fn div_ceil_u32(lhs: u32, rhs: u32) -> u32 {
    let d = lhs / rhs;
    let r = lhs % rhs;
    if r > 0 { d + 1 } else { d }
}

#[inline]
pub const fn div_ceil(lhs: i64, rhs: i64) -> i64 {
    let d = lhs / rhs;
    let r = lhs % rhs;
    if (r > 0 && rhs > 0) || (r < 0 && rhs < 0) {
        d + 1
    } else {
        d
    }
}

// The following are helpers to build named tasks.
//
// Named tasks require the tokio feature `tracing` to be enabled. If the
// `named_tasks` feature is disabled, this is no-op.
//
// By default, these function will just ignore the name passed and just act like
// a regular call to `tokio::spawn`.
//
// If the user compiles `quickwit-cli` with the `tokio-console` feature, then
// tasks will automatically be named. This is not just "visual sugar".
//
// Without names, tasks will only show their spawn site on tokio-console. This
// is a catastrophy for actors who all share the same spawn site.
//
// The #[track_caller] annotation is used to show the right spawn site in the
// Tokio TRACE spans (only available when the tokio/tracing feature is on).
//
// # Naming
//
// Actors will get named after their type, which is fine. For other tasks,
// please use `snake_case`.

#[cfg(not(all(tokio_unstable, feature = "named_tasks")))]
#[track_caller]
pub fn spawn_named_task<F>(future: F, _name: &'static str) -> tokio::task::JoinHandle<F::Output>
where
    F: Future + Send + 'static,
    F::Output: Send + 'static,
{
    tokio::task::spawn(future)
}

#[cfg(not(all(tokio_unstable, feature = "named_tasks")))]
#[track_caller]
pub fn spawn_named_task_on<F>(
    future: F,
    _name: &'static str,
    runtime: &tokio::runtime::Handle,
) -> tokio::task::JoinHandle<F::Output>
where
    F: Future + Send + 'static,
    F::Output: Send + 'static,
{
    runtime.spawn(future)
}

#[cfg(all(tokio_unstable, feature = "named_tasks"))]
#[track_caller]
pub fn spawn_named_task<F>(future: F, name: &'static str) -> tokio::task::JoinHandle<F::Output>
where
    F: Future + Send + 'static,
    F::Output: Send + 'static,
{
    tokio::task::Builder::new()
        .name(name)
        .spawn(future)
        .unwrap()
}

#[cfg(all(tokio_unstable, feature = "named_tasks"))]
#[track_caller]
pub fn spawn_named_task_on<F>(
    future: F,
    name: &'static str,
    runtime: &tokio::runtime::Handle,
) -> tokio::task::JoinHandle<F::Output>
where
    F: Future + Send + 'static,
    F::Output: Send + 'static,
{
    tokio::task::Builder::new()
        .name(name)
        .spawn_on(future, runtime)
        .unwrap()
}

pub fn parse_bool_lenient(bool_str: &str) -> Option<bool> {
    let trimmed_bool_str = bool_str.trim();

    for truthy_value in ["true", "yes", "1"] {
        if trimmed_bool_str.eq_ignore_ascii_case(truthy_value) {
            return Some(true);
        }
    }
    for falsy_value in ["false", "no", "0"] {
        if trimmed_bool_str.eq_ignore_ascii_case(falsy_value) {
            return Some(false);
        }
    }
    None
}

#[cfg(test)]
mod tests {
    use std::io::ErrorKind;

    use super::*;

    #[test]
    fn test_get_from_env() {
        // SAFETY: this test may not be entirely sound if not run with nextest or --test-threads=1
        // as this is only a test, and it would be extremely inconvenient to run it in a different
        // way, we are keeping it that way

        const TEST_KEY: &str = "TEST_KEY";
        assert_eq!(super::get_from_env(TEST_KEY, 10, false), 10);
        unsafe { std::env::set_var(TEST_KEY, "15") };
        assert_eq!(super::get_from_env(TEST_KEY, 10, false), 15);
        unsafe { std::env::set_var(TEST_KEY, "1invalidnumber") };
        assert_eq!(super::get_from_env(TEST_KEY, 10, false), 10);
    }

    #[test]
    fn test_truncate_str() {
        assert_eq!(truncate_str("", 0), "");
        assert_eq!(truncate_str("", 3), "");
        assert_eq!(truncate_str("hello", 0), "");
        assert_eq!(truncate_str("hello", 5), "hello");
        assert_eq!(truncate_str("hello", 6), "hello");
        assert_eq!(truncate_str("hello-world", 5), "hello");
        assert_eq!(truncate_str("hello-world", 6), "hello-");
        assert_eq!(truncate_str("hello🧑‍🔬world", 6), "hello");
        assert_eq!(truncate_str("hello🧑‍🔬world", 7), "hello");
    }

    #[test]
    fn test_ignore_io_error_macro() {
        ignore_error_kind!(
            ErrorKind::NotFound,
            std::fs::remove_file("file-does-not-exist")
        )
        .unwrap();
    }

    #[test]
    fn test_div_ceil() {
        assert_eq!(div_ceil(5, 1), 5);
        assert_eq!(div_ceil(5, 2), 3);
        assert_eq!(div_ceil(6, 2), 3);

        assert_eq!(div_ceil(3, 3), 1);
        assert_eq!(div_ceil(2, 3), 1);
        assert_eq!(div_ceil(1, 3), 1);
        assert_eq!(div_ceil(0, 3), 0);
        assert_eq!(div_ceil(-1, 3), 0);
        assert_eq!(div_ceil(-2, 3), 0);

        assert_eq!(div_ceil(-5, 1), -5);
        assert_eq!(div_ceil(-5, 2), -2);
        assert_eq!(div_ceil(-6, 2), -3);

        assert_eq!(div_ceil(5, -1), -5);
        assert_eq!(div_ceil(5, -2), -2);
        assert_eq!(div_ceil(6, -2), -3);

        assert_eq!(div_ceil(-5, -1), 5);
        assert_eq!(div_ceil(-5, -2), 3);
        assert_eq!(div_ceil(-6, -2), 3);
    }

    #[test]
    fn test_div_ceil_u32() {
        assert_eq!(div_ceil_u32(5, 1), 5);
        assert_eq!(div_ceil_u32(5, 2), 3);
        assert_eq!(div_ceil_u32(6, 2), 3);
        assert_eq!(div_ceil_u32(3, 3), 1);
        assert_eq!(div_ceil_u32(2, 3), 1);
        assert_eq!(div_ceil_u32(1, 3), 1);
        assert_eq!(div_ceil_u32(0, 3), 0);
    }

    #[test]
    fn test_parse_bool_lenient() {
        assert_eq!(parse_bool_lenient("true"), Some(true));
        assert_eq!(parse_bool_lenient("TRUE"), Some(true));
        assert_eq!(parse_bool_lenient("True"), Some(true));
        assert_eq!(parse_bool_lenient("yes"), Some(true));
        assert_eq!(parse_bool_lenient(" 1"), Some(true));

        assert_eq!(parse_bool_lenient("false"), Some(false));
        assert_eq!(parse_bool_lenient("FALSE"), Some(false));
        assert_eq!(parse_bool_lenient("False"), Some(false));
        assert_eq!(parse_bool_lenient("no"), Some(false));
        assert_eq!(parse_bool_lenient("0 "), Some(false));

        assert_eq!(parse_bool_lenient("foo"), None);
    }
}


================================================
FILE: quickwit/quickwit-common/src/metrics.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::{BTreeMap, HashMap};
use std::sync::{LazyLock, OnceLock};

use prometheus::{Gauge, HistogramOpts, Opts, TextEncoder};
pub use prometheus::{
    Histogram, HistogramTimer, HistogramVec as PrometheusHistogramVec, IntCounter,
    IntCounterVec as PrometheusIntCounterVec, IntGauge, IntGaugeVec as PrometheusIntGaugeVec,
    exponential_buckets, linear_buckets,
};

#[derive(Clone)]
pub struct HistogramVec<const N: usize> {
    underlying: PrometheusHistogramVec,
}

impl<const N: usize> HistogramVec<N> {
    pub fn with_label_values(&self, label_values: [&str; N]) -> Histogram {
        self.underlying.with_label_values(&label_values)
    }
}

#[derive(Clone)]
pub struct IntCounterVec<const N: usize> {
    underlying: PrometheusIntCounterVec,
}

impl<const N: usize> IntCounterVec<N> {
    pub fn new(
        name: &str,
        help: &str,
        subsystem: &str,
        const_labels: &[(&str, &str)],
        label_names: [&str; N],
    ) -> IntCounterVec<N> {
        let owned_const_labels: HashMap<String, String> = const_labels
            .iter()
            .map(|(label_name, label_value)| (label_name.to_string(), label_value.to_string()))
            .collect();
        let counter_opts = Opts::new(name, help)
            .namespace("quickwit")
            .subsystem(subsystem)
            .const_labels(owned_const_labels);
        let underlying = PrometheusIntCounterVec::new(counter_opts, &label_names)
            .expect("failed to create counter vec");
        IntCounterVec { underlying }
    }

    pub fn with_label_values(&self, label_values: [&str; N]) -> IntCounter {
        self.underlying.with_label_values(&label_values)
    }
}

#[derive(Clone)]
pub struct IntGaugeVec<const N: usize> {
    underlying: PrometheusIntGaugeVec,
}

impl<const N: usize> IntGaugeVec<N> {
    pub fn with_label_values(&self, label_values: [&str; N]) -> IntGauge {
        self.underlying.with_label_values(&label_values)
    }
}

pub fn register_info(name: &'static str, help: &'static str, kvs: BTreeMap<&'static str, String>) {
    let mut counter_opts = Opts::new(name, help).namespace("quickwit");
    for (k, v) in kvs {
        counter_opts = counter_opts.const_label(k, v);
    }
    let counter = IntCounter::with_opts(counter_opts).expect("failed to create counter");
    counter.inc();
    prometheus::register(Box::new(counter)).expect("failed to register counter");
}

pub fn new_counter(
    name: &str,
    help: &str,
    subsystem: &str,
    const_labels: &[(&str, &str)],
) -> IntCounter {
    let owned_const_labels: HashMap<String, String> = const_labels
        .iter()
        .map(|(label_name, label_value)| (label_name.to_string(), label_value.to_string()))
        .collect();
    let counter_opts = Opts::new(name, help)
        .namespace("quickwit")
        .subsystem(subsystem)
        .const_labels(owned_const_labels);
    let counter = IntCounter::with_opts(counter_opts).expect("failed to create counter");
    prometheus::register(Box::new(counter.clone())).expect("failed to register counter");
    counter
}

pub fn new_counter_vec<const N: usize>(
    name: &str,
    help: &str,
    subsystem: &str,
    const_labels: &[(&str, &str)],
    label_names: [&str; N],
) -> IntCounterVec<N> {
    let int_counter_vec = IntCounterVec::new(name, help, subsystem, const_labels, label_names);
    let collector = Box::new(int_counter_vec.underlying.clone());
    prometheus::register(collector).expect("failed to register counter vec");
    int_counter_vec
}

pub fn new_float_gauge(
    name: &str,
    help: &str,
    subsystem: &str,
    const_labels: &[(&str, &str)],
) -> Gauge {
    let owned_const_labels: HashMap<String, String> = const_labels
        .iter()
        .map(|(label_name, label_value)| (label_name.to_string(), label_value.to_string()))
        .collect();
    let gauge_opts = Opts::new(name, help)
        .namespace("quickwit")
        .subsystem(subsystem)
        .const_labels(owned_const_labels);
    let gauge = Gauge::with_opts(gauge_opts).expect("failed to create float gauge");
    prometheus::register(Box::new(gauge.clone())).expect("failed to register float gauge");
    gauge
}

pub fn new_gauge(
    name: &str,
    help: &str,
    subsystem: &str,
    const_labels: &[(&str, &str)],
) -> IntGauge {
    let owned_const_labels: HashMap<String, String> = const_labels
        .iter()
        .map(|(label_name, label_value)| (label_name.to_string(), label_value.to_string()))
        .collect();
    let gauge_opts = Opts::new(name, help)
        .namespace("quickwit")
        .subsystem(subsystem)
        .const_labels(owned_const_labels);
    let gauge = IntGauge::with_opts(gauge_opts).expect("failed to create gauge");
    prometheus::register(Box::new(gauge.clone())).expect("failed to register gauge");
    gauge
}

pub fn new_gauge_vec<const N: usize>(
    name: &str,
    help: &str,
    subsystem: &str,
    const_labels: &[(&str, &str)],
    label_names: [&str; N],
) -> IntGaugeVec<N> {
    let owned_const_labels: HashMap<String, String> = const_labels
        .iter()
        .map(|(label_name, label_value)| (label_name.to_string(), label_value.to_string()))
        .collect();
    let gauge_opts = Opts::new(name, help)
        .namespace("quickwit")
        .subsystem(subsystem)
        .const_labels(owned_const_labels);
    let underlying =
        PrometheusIntGaugeVec::new(gauge_opts, &label_names).expect("failed to create gauge vec");

    let collector = Box::new(underlying.clone());
    prometheus::register(collector).expect("failed to register counter vec");

    IntGaugeVec { underlying }
}

pub fn new_histogram(name: &str, help: &str, subsystem: &str, buckets: Vec<f64>) -> Histogram {
    let histogram_opts = HistogramOpts::new(name, help)
        .namespace("quickwit")
        .subsystem(subsystem)
        .buckets(buckets);
    let histogram = Histogram::with_opts(histogram_opts).expect("failed to create histogram");
    prometheus::register(Box::new(histogram.clone())).expect("failed to register histogram");
    histogram
}

pub fn new_histogram_vec<const N: usize>(
    name: &str,
    help: &str,
    subsystem: &str,
    const_labels: &[(&str, &str)],
    label_names: [&str; N],
    buckets: Vec<f64>,
) -> HistogramVec<N> {
    let owned_const_labels: HashMap<String, String> = const_labels
        .iter()
        .map(|(label_name, label_value)| (label_name.to_string(), label_value.to_string()))
        .collect();
    let histogram_opts = HistogramOpts::new(name, help)
        .namespace("quickwit")
        .subsystem(subsystem)
        .const_labels(owned_const_labels)
        .buckets(buckets);
    let underlying = PrometheusHistogramVec::new(histogram_opts, &label_names)
        .expect("failed to create histogram vec");

    let collector = Box::new(underlying.clone());
    prometheus::register(collector).expect("failed to register histogram vec");

    HistogramVec { underlying }
}

pub struct GaugeGuard<'a> {
    gauge: &'a IntGauge,
    delta: i64,
}

impl std::fmt::Debug for GaugeGuard<'_> {
    fn fmt(&self, f: &mut std::fmt::Formatter) -> std::fmt::Result {
        self.delta.fmt(f)
    }
}

impl<'a> GaugeGuard<'a> {
    pub fn from_gauge(gauge: &'a IntGauge) -> Self {
        Self { gauge, delta: 0i64 }
    }

    pub fn get(&self) -> i64 {
        self.delta
    }

    pub fn add(&mut self, delta: i64) {
        self.gauge.add(delta);
        self.delta += delta;
    }

    pub fn sub(&mut self, delta: i64) {
        self.gauge.sub(delta);
        self.delta -= delta;
    }
}

impl Drop for GaugeGuard<'_> {
    fn drop(&mut self) {
        self.gauge.sub(self.delta)
    }
}

pub struct OwnedGaugeGuard {
    gauge: IntGauge,
    delta: i64,
}

impl std::fmt::Debug for OwnedGaugeGuard {
    fn fmt(&self, f: &mut std::fmt::Formatter) -> std::fmt::Result {
        self.delta.fmt(f)
    }
}

impl OwnedGaugeGuard {
    pub fn from_gauge(gauge: IntGauge) -> Self {
        Self { gauge, delta: 0i64 }
    }

    pub fn get(&self) -> i64 {
        self.delta
    }

    pub fn add(&mut self, delta: i64) {
        self.gauge.add(delta);
        self.delta += delta;
    }

    pub fn sub(&mut self, delta: i64) {
        self.gauge.sub(delta);
        self.delta -= delta;
    }
}

impl Drop for OwnedGaugeGuard {
    fn drop(&mut self) {
        self.gauge.sub(self.delta)
    }
}

pub fn metrics_text_payload() -> Result<String, String> {
    let metric_families = prometheus::gather();
    // Arbitrary non-zero size in order to skip a bunch of
    // buffer growth-reallocations when encoding metrics.
    let mut buffer = String::with_capacity(1024);
    let encoder = TextEncoder::new();
    match encoder.encode_utf8(&metric_families, &mut buffer) {
        Ok(()) => Ok(buffer),
        Err(e) => Err(e.to_string()),
    }
}

#[derive(Clone)]
pub struct MemoryMetrics {
    pub active_bytes: IntGauge,
    pub allocated_bytes: IntGauge,
    pub resident_bytes: IntGauge,
    pub in_flight: InFlightDataGauges,
}

impl Default for MemoryMetrics {
    fn default() -> Self {
        Self {
            active_bytes: new_gauge(
                "active_bytes",
                "Total number of bytes in active pages allocated by the application, as reported \
                 by jemalloc `stats.active`.",
                "memory",
                &[],
            ),
            allocated_bytes: new_gauge(
                "allocated_bytes",
                "Total number of bytes allocated by the application, as reported by jemalloc \
                 `stats.allocated`.",
                "memory",
                &[],
            ),
            resident_bytes: new_gauge(
                "resident_bytes",
                " Total number of bytes in physically resident data pages mapped by the \
                 allocator, as reported by jemalloc `stats.resident`.",
                "memory",
                &[],
            ),
            in_flight: InFlightDataGauges::default(),
        }
    }
}

#[derive(Clone)]
pub struct InFlightDataGauges {
    pub rest_server: IntGauge,
    pub ingest_router: IntGauge,
    pub ingester_persist: IntGauge,
    pub ingester_replicate: IntGauge,
    pub wal: IntGauge,
    pub fetch_stream: IntGauge,
    pub multi_fetch_stream: IntGauge,
    pub doc_processor_mailbox: IntGauge,
    pub indexer_mailbox: IntGauge,
    pub index_writer: IntGauge,
    in_flight_gauge_vec: IntGaugeVec<1>,
}

impl Default for InFlightDataGauges {
    fn default() -> Self {
        let in_flight_gauge_vec = new_gauge_vec(
            "in_flight_data_bytes",
            "Amount of data in-flight in various buffers in bytes.",
            "memory",
            &[],
            ["component"],
        );
        Self {
            rest_server: in_flight_gauge_vec.with_label_values(["rest_server"]),
            ingest_router: in_flight_gauge_vec.with_label_values(["ingest_router"]),
            ingester_persist: in_flight_gauge_vec.with_label_values(["ingester_persist"]),
            ingester_replicate: in_flight_gauge_vec.with_label_values(["ingester_replicate"]),
            wal: in_flight_gauge_vec.with_label_values(["wal"]),
            fetch_stream: in_flight_gauge_vec.with_label_values(["fetch_stream"]),
            multi_fetch_stream: in_flight_gauge_vec.with_label_values(["multi_fetch_stream"]),
            doc_processor_mailbox: in_flight_gauge_vec.with_label_values(["doc_processor_mailbox"]),
            indexer_mailbox: in_flight_gauge_vec.with_label_values(["indexer_mailbox"]),
            index_writer: in_flight_gauge_vec.with_label_values(["index_writer"]),
            in_flight_gauge_vec: in_flight_gauge_vec.clone(),
        }
    }
}

impl InFlightDataGauges {
    #[inline]
    pub fn file(&self) -> &IntGauge {
        static GAUGE: OnceLock<IntGauge> = OnceLock::new();
        GAUGE.get_or_init(|| self.in_flight_gauge_vec.with_label_values(["file_source"]))
    }

    #[inline]
    pub fn ingest(&self) -> &IntGauge {
        static GAUGE: OnceLock<IntGauge> = OnceLock::new();
        GAUGE.get_or_init(|| {
            self.in_flight_gauge_vec
                .with_label_values(["ingest_source"])
        })
    }

    #[inline]
    pub fn kafka(&self) -> &IntGauge {
        static GAUGE: OnceLock<IntGauge> = OnceLock::new();
        GAUGE.get_or_init(|| self.in_flight_gauge_vec.with_label_values(["kafka_source"]))
    }

    #[inline]
    pub fn kinesis(&self) -> &IntGauge {
        static GAUGE: OnceLock<IntGauge> = OnceLock::new();
        GAUGE.get_or_init(|| {
            self.in_flight_gauge_vec
                .with_label_values(["kinesis_source"])
        })
    }

    #[inline]
    pub fn pubsub(&self) -> &IntGauge {
        static GAUGE: OnceLock<IntGauge> = OnceLock::new();
        GAUGE.get_or_init(|| {
            self.in_flight_gauge_vec
                .with_label_values(["pubsub_source"])
        })
    }

    #[inline]
    pub fn pulsar(&self) -> &IntGauge {
        static GAUGE: OnceLock<IntGauge> = OnceLock::new();
        GAUGE.get_or_init(|| {
            self.in_flight_gauge_vec
                .with_label_values(["pulsar_source"])
        })
    }

    #[inline]
    pub fn other(&self) -> &IntGauge {
        static GAUGE: OnceLock<IntGauge> = OnceLock::new();
        GAUGE.get_or_init(|| {
            self.in_flight_gauge_vec
                .with_label_values(["pulsar_source"])
        })
    }
}

/// This function returns `index_id` as is if per-index metrics are enabled, or projects it to
/// `"__any__"` otherwise.
pub fn index_label(index_id: &str) -> &str {
    static PER_INDEX_METRICS_ENABLED: LazyLock<bool> =
        LazyLock::new(|| !crate::get_bool_from_env("QW_DISABLE_PER_INDEX_METRICS", false));

    if *PER_INDEX_METRICS_ENABLED {
        index_id
    } else {
        "__any__"
    }
}

pub static MEMORY_METRICS: LazyLock<MemoryMetrics> = LazyLock::new(MemoryMetrics::default);


================================================
FILE: quickwit/quickwit-common/src/net.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::ffi::OsString;
use std::fmt::Display;
use std::io;
use std::net::{IpAddr, Ipv4Addr, Ipv6Addr, SocketAddr, TcpListener};
use std::str::FromStr;

use anyhow::{Context, bail};
use itertools::Itertools;
use once_cell::sync::OnceCell;
use pnet::datalink::{self, NetworkInterface};
use pnet::ipnetwork::IpNetwork;
use serde::{Deserialize, Serialize, Serializer};
use tokio::net::{ToSocketAddrs, lookup_host};

/// Represents a host, i.e. an IP address (`127.0.0.1`) or a hostname (`localhost`).
#[derive(Clone, Debug, Eq, PartialEq)]
pub enum Host {
    Hostname(String),
    IpAddr(IpAddr),
}

impl Host {
    /// Returns [`true`] for the "unspecified" address (all bits set to zero).
    pub fn is_unspecified(&self) -> bool {
        match &self {
            Host::Hostname(_) => false,
            Host::IpAddr(ip_addr) => ip_addr.is_unspecified(),
        }
    }

    /// Appends `port` to `self` and returns a [`HostAddr`].
    pub fn with_port(&self, port: u16) -> HostAddr {
        HostAddr {
            host: self.clone(),
            port,
        }
    }

    /// Resolves the host if necessary and returns an [`IpAddr`].
    pub async fn resolve(&self) -> anyhow::Result<IpAddr> {
        match &self {
            Host::Hostname(hostname) => get_socket_addr(&(hostname.as_str(), 0))
                .await
                .map(|socket_addr| socket_addr.ip()),
            Host::IpAddr(ip_addr) => Ok(*ip_addr),
        }
    }
}

impl Default for Host {
    fn default() -> Self {
        Host::IpAddr(IpAddr::V4(Ipv4Addr::LOCALHOST))
    }
}

impl Display for Host {
    fn fmt(&self, formatter: &mut std::fmt::Formatter) -> std::fmt::Result {
        match self {
            Host::Hostname(hostname) => hostname.fmt(formatter),
            Host::IpAddr(ip_addr) => ip_addr.fmt(formatter),
        }
    }
}

impl Serialize for Host {
    fn serialize<S>(&self, serializer: S) -> Result<S::Ok, S::Error>
    where S: Serializer {
        match self {
            Host::Hostname(hostname) => hostname.serialize(serializer),
            Host::IpAddr(ip_addr) => ip_addr.serialize(serializer),
        }
    }
}

impl<'de> Deserialize<'de> for Host {
    fn deserialize<D>(deserializer: D) -> Result<Self, D::Error>
    where D: serde::Deserializer<'de> {
        let host_str: String = Deserialize::deserialize(deserializer)?;
        host_str.parse().map_err(serde::de::Error::custom)
    }
}

impl From<IpAddr> for Host {
    fn from(ip_addr: IpAddr) -> Self {
        Host::IpAddr(ip_addr)
    }
}

impl From<Ipv4Addr> for Host {
    fn from(ip_addr: Ipv4Addr) -> Self {
        Host::IpAddr(IpAddr::V4(ip_addr))
    }
}

impl From<Ipv6Addr> for Host {
    fn from(ip_addr: Ipv6Addr) -> Self {
        Host::IpAddr(IpAddr::V6(ip_addr))
    }
}

impl FromStr for Host {
    type Err = anyhow::Error;

    fn from_str(host: &str) -> Result<Self, Self::Err> {
        if let Ok(ip_addr) = host.parse::<IpAddr>() {
            return Ok(Self::IpAddr(ip_addr));
        }
        if is_valid_hostname(host) {
            return Ok(Self::Hostname(host.to_string()));
        }
        bail!("failed to parse host: `{host}`")
    }
}

/// Represents an address `<host>:<port>` where `host` can be an IP address or a hostname.
#[derive(Clone, Debug)]
pub struct HostAddr {
    host: Host,
    port: u16,
}

impl HostAddr {
    /// Attempts to parse a `host_addr`.
    /// If no port is defined, it just accepts the host and uses the given default port.
    ///
    /// This function supports:
    /// - IPv4
    /// - IPv4:port
    /// - IPv6
    /// - \[IPv6\]:port -- IpV6 contains colon. It is customary to require bracket for this reason.
    /// - hostname
    /// - hostname:port
    pub fn parse_with_default_port(host_addr: &str, default_port: u16) -> anyhow::Result<Self> {
        if let Ok(socket_addr) = host_addr.parse::<SocketAddr>() {
            return Ok(Self {
                host: Host::IpAddr(socket_addr.ip()),
                port: socket_addr.port(),
            });
        }
        if let Ok(ip_addr) = host_addr.parse::<IpAddr>() {
            return Ok(Self {
                host: Host::IpAddr(ip_addr),
                port: default_port,
            });
        }
        let (hostname, port) = if let Some((hostname_str, port_str)) = host_addr.split_once(':') {
            let port_u16 = port_str.parse::<u16>().with_context(|| {
                format!("failed to parse address `{host_addr}`: port is invalid")
            })?;
            (hostname_str, port_u16)
        } else {
            (host_addr, default_port)
        };
        if !is_valid_hostname(hostname) {
            bail!(
                "failed to parse address `{}`: hostname is invalid",
                host_addr
            )
        }
        Ok(Self {
            host: Host::Hostname(hostname.to_string()),
            port,
        })
    }

    /// Resolves the host if necessary and returns a `SocketAddr`.
    pub async fn resolve(&self) -> anyhow::Result<SocketAddr> {
        self.host
            .resolve()
            .await
            .map(|ip_addr| SocketAddr::new(ip_addr, self.port))
    }

    /// Skips DNS resolution if possible and returns the host address as a `SocketAddr`.
    pub fn to_socket_addr(self) -> Option<SocketAddr> {
        if let Host::IpAddr(ip_addr) = self.host {
            Some(SocketAddr::new(ip_addr, self.port))
        } else {
            None
        }
    }
}

impl Display for HostAddr {
    fn fmt(&self, formatter: &mut std::fmt::Formatter) -> std::fmt::Result {
        match self.host {
            Host::IpAddr(IpAddr::V6(_)) => write!(formatter, "[{}]:{}", self.host, self.port),
            _ => write!(formatter, "{}:{}", self.host, self.port),
        }
    }
}

/// Finds a random available TCP port.
///
/// This function induces a race condition, use it only in unit tests.
pub fn find_available_tcp_port() -> anyhow::Result<u16> {
    let socket: SocketAddr = ([127, 0, 0, 1], 0u16).into();
    let listener = TcpListener::bind(socket)?;
    let port = listener.local_addr()?.port();
    Ok(port)
}

/// Attempts to find the private IP of the host. Returns the matching interface name along with it.
pub fn find_private_ip() -> Option<(String, IpAddr)> {
    _find_private_ip(&datalink::interfaces())
}

// Inner function for testing purposes.
fn _find_private_ip(interfaces: &[NetworkInterface]) -> Option<(String, IpAddr)> {
    // The way we do this is the following:
    // 1. List the network interfaces
    // 2. Filter out the interfaces that are not up
    // 3. Filter out the networks that are not routable and private
    // 4. Sort the IP addresses by:
    //      - type (IPv4 first)
    //      - mode (default first)
    //      - size of network address space (desc)
    // 5. Pick the first one
    interfaces
        .iter()
        .filter(|interface| interface.is_up())
        .flat_map(|interface| {
            interface
                .ips
                .iter()
                .filter(|ip_net| is_forwardable_ip(&ip_net.ip()) && is_private_ip(&ip_net.ip()))
                .map(move |ip_net| (interface, ip_net))
        })
        .sorted_by_key(|(interface, ip_net)| {
            (
                ip_net.is_ipv6(),
                is_dormant(interface),
                std::cmp::Reverse(ip_net.prefix()),
            )
        })
        .next()
        .map(|(interface, ip_net)| (interface.name.clone(), ip_net.ip()))
}

#[cfg(any(target_os = "linux", target_os = "android"))]
fn is_dormant(interface: &NetworkInterface) -> bool {
    interface.is_dormant()
}

#[cfg(not(any(target_os = "linux", target_os = "android")))]
fn is_dormant(_interface: &NetworkInterface) -> bool {
    false
}

/// Converts an object into a resolved `SocketAddr`.
pub async fn get_socket_addr<T: ToSocketAddrs + std::fmt::Debug>(
    addr: &T,
) -> anyhow::Result<SocketAddr> {
    lookup_host(addr)
        .await
        .with_context(|| format!("failed to parse address or resolve hostname {addr:?}"))?
        .next()
        .ok_or_else(|| {
            anyhow::anyhow!("DNS resolution did not yield any record for hostname {addr:?}")
        })
}

fn is_forwardable_ip(ip_addr: &IpAddr) -> bool {
    static NON_FORWARDABLE_NETWORKS: OnceCell<Vec<IpNetwork>> = OnceCell::new();
    NON_FORWARDABLE_NETWORKS
        .get_or_init(|| {
            // Blacklist of non-forwardable IP blocks taken from RFC6890
            [
                "0.0.0.0/8",
                "127.0.0.0/8",
                "169.254.0.0/16",
                "192.0.0.0/24",
                "192.0.2.0/24",
                "198.51.100.0/24",
                "2001:10::/28",
                "2001:db8::/32",
                "203.0.113.0/24",
                "240.0.0.0/4",
                "255.255.255.255/32",
                "::/128",
                "::1/128",
                "::ffff:0:0/96",
                "fe80::/10",
            ]
            .iter()
            .map(|network| network.parse().expect("Failed to parse network range. This should never happen! Please, report on https://github.com/quickwit-oss/quickwit/issues."))
            .collect()
        })
        .iter()
        .all(|network| !network.contains(*ip_addr))
}

fn is_private_ip(ip_addr: &IpAddr) -> bool {
    static PRIVATE_NETWORKS: OnceCell<Vec<IpNetwork>> = OnceCell::new();
    PRIVATE_NETWORKS
        .get_or_init(|| {
            ["192.168.0.0/16", "172.16.0.0/12", "10.0.0.0/8", "fc00::/7"]
                .iter()
                .map(|network| network.parse().expect("Failed to parse network range. This should never happen! Please, report on https://github.com/quickwit-oss/quickwit/issues."))
                .collect()
        })
        .iter()
        .any(|network| network.contains(*ip_addr))
}

pub fn get_hostname() -> io::Result<String> {
    _get_hostname(hostname::get()?)
}

// Inner function for testing purposes.
fn _get_hostname(hostname: OsString) -> io::Result<String> {
    let hostname_lossy = hostname.to_string_lossy();
    if is_valid_hostname(&hostname_lossy) {
        Ok(hostname_lossy.to_string())
    } else {
        Err(io::Error::other(format!(
            "invalid hostname: `{hostname_lossy}`"
        )))
    }
}

pub fn get_short_hostname() -> io::Result<String> {
    Ok(get_hostname()?
        .split('.')
        .next()
        .expect("Split should never fail.")
        .to_string())
}

/// Returns whether a hostname is valid according to [RFC 1123](https://www.rfc-editor.org/rfc/rfc1123).
///
/// A hostname is valid if the following conditions are met:
///
/// - It does not start or end with `-` or `.`.
/// - It does not contain any characters outside of the alphanumeric range, except for `-` and `.`.
/// - It is not empty.
/// - It is 253 or fewer characters.
/// - Its labels (characters separated by `.`) are not empty.
/// - Its labels are 63 or fewer characters.
/// - Its labels do not start or end with '-' or '.'.
pub fn is_valid_hostname(hostname: &str) -> bool {
    if hostname.is_empty() || hostname.len() > 253 {
        return false;
    }
    if !hostname
        .chars()
        .all(|ch| ch.is_ascii_alphanumeric() || ch == '-' || ch == '.')
    {
        return false;
    }
    if hostname.split('.').any(|label| {
        label.is_empty() || label.len() > 63 || label.starts_with('-') || label.ends_with('-')
    }) {
        return false;
    }
    true
}

#[cfg(test)]
mod tests {
    use std::net::Ipv6Addr;

    use pnet::ipnetwork::{Ipv4Network, Ipv6Network};
    use serde_json::Value as JsonValue;

    use super::*;

    #[test]
    fn test_parse_host() {
        assert_eq!(
            "127.0.0.1".parse::<Host>().unwrap(),
            Host::from(Ipv4Addr::LOCALHOST)
        );
        assert_eq!(
            "::1".parse::<Host>().unwrap(),
            Host::from(Ipv6Addr::new(0, 0, 0, 0, 0, 0, 0, 1))
        );
        assert_eq!(
            "localhost".parse::<Host>().unwrap(),
            Host::Hostname("localhost".to_string())
        );
    }

    #[test]
    fn test_deserialize_host() {
        assert_eq!(
            serde_json::from_str::<Host>("\"127.0.0.1\"").unwrap(),
            Host::from(Ipv4Addr::LOCALHOST)
        );
        assert_eq!(
            serde_json::from_str::<Host>("\"::1\"").unwrap(),
            Host::from(Ipv6Addr::new(0, 0, 0, 0, 0, 0, 0, 1))
        );
        assert_eq!(
            serde_json::from_str::<Host>("\"localhost\"").unwrap(),
            Host::Hostname("localhost".to_string())
        );
    }

    #[test]
    fn test_serialize_host() {
        assert_eq!(
            serde_json::to_value(Host::from(Ipv4Addr::LOCALHOST)).unwrap(),
            JsonValue::String("127.0.0.1".to_string())
        );
        assert_eq!(
            serde_json::to_value(Host::from(Ipv6Addr::new(0, 0, 0, 0, 0, 0, 0, 1))).unwrap(),
            JsonValue::String("::1".to_string())
        );
        assert_eq!(
            serde_json::to_value(Host::Hostname("localhost".to_string())).unwrap(),
            JsonValue::String("localhost".to_string())
        );
    }

    fn test_parse_addr_helper(addr: &str, expected_addr_opt: Option<&str>) {
        let addr_res = HostAddr::parse_with_default_port(addr, 1337);
        if let Some(expected_addr) = expected_addr_opt {
            assert!(
                addr_res.is_ok(),
                "Parsing `{addr}` was expected to succeed."
            );
            assert_eq!(addr_res.unwrap().to_string(), expected_addr);
        } else {
            assert!(
                addr_res.is_err(),
                "Parsing `{}` was expected to fail, got `{}`",
                addr,
                addr_res.unwrap()
            );
        }
    }

    #[tokio::test]
    async fn test_parse_addr_with_ips() {
        // IPv4
        test_parse_addr_helper("127.0.0.1", Some("127.0.0.1:1337"));
        test_parse_addr_helper("127.0.0.1:100", Some("127.0.0.1:100"));
        test_parse_addr_helper("127.0..1:100", None);

        // IPv6
        test_parse_addr_helper(
            "2001:0db8:85a3:0000:0000:8a2e:0370:7334",
            Some("[2001:db8:85a3::8a2e:370:7334]:1337"),
        );
        test_parse_addr_helper("2001:0db8:85a3:0000:0000:8a2e:0370:7334:1000", None);
        test_parse_addr_helper(
            "[2001:0db8:85a3:0000:0000:8a2e:0370:7334]:1000",
            Some("[2001:db8:85a3::8a2e:370:7334]:1000"),
        );
        test_parse_addr_helper("[2001:0db8:1000", None);
        test_parse_addr_helper("2001:0db8:85a3:0000:0000:8a2e:0370:7334]:1000", None);

        // Hostname
        test_parse_addr_helper("google.com", Some("google.com:1337"));
        test_parse_addr_helper("google.com:1000", Some("google.com:1000"));
    }

    #[test]
    fn test_is_valid_hostname() {
        for hostname in &[
            "VaLiD-HoStNaMe",
            "50-name",
            "235235",
            "example.com",
            "VaLid.HoStNaMe",
            "123.456",
        ] {
            assert!(
                is_valid_hostname(hostname),
                "Hostname `{hostname}` is valid.",
            );
        }

        for hostname in &[
            "-invalid-name",
            "also-invalid-",
            "asdf@fasd",
            "@asdfl",
            "asd f@",
            ".invalid",
            "invalid.name.",
            "foo.label-is-way-to-longgggggggggggggggggggggggggggggggggggggggggggg.org",
            "invalid.-starting.char",
            "invalid.ending-.char",
            "empty..label",
        ] {
            assert!(
                !is_valid_hostname(hostname),
                "Hostname `{hostname}` is invalid."
            );
        }
    }

    #[test]
    fn test_find_private_ip() {
        assert!(_find_private_ip(&[]).is_none());

        let interfaces = [
            NetworkInterface {
                name: "lo".to_string(),
                description: "".to_string(),
                index: 1,
                mac: None,
                ips: vec![
                    IpNetwork::V4(Ipv4Network::new("127.0.0.1".parse().unwrap(), 8).unwrap()),
                    IpNetwork::V6(Ipv6Network::new("::1".parse().unwrap(), 128).unwrap()),
                ],
                flags: 65609,
            },
            NetworkInterface {
                name: "docker0".to_string(),
                description: "".to_string(),
                index: 2,
                mac: None,
                ips: vec![
                    IpNetwork::V6(
                        Ipv6Network::new("fe80::42:69ff:fe8e:e739".parse().unwrap(), 64).unwrap(),
                    ),
                    IpNetwork::V4(Ipv4Network::new("172.17.0.1".parse().unwrap(), 8).unwrap()),
                ],
                flags: 4099,
            },
            NetworkInterface {
                name: "eth0".to_string(),
                description: "".to_string(),
                index: 3,
                mac: None,
                ips: vec![
                    IpNetwork::V6(
                        Ipv6Network::new("fe80::84ed:78c:ec06:bf53".parse().unwrap(), 64).unwrap(),
                    ),
                    IpNetwork::V4(Ipv4Network::new("192.168.1.70".parse().unwrap(), 24).unwrap()),
                ],
                flags: 69699,
            },
        ];
        let (interface_name, ip_addr) = _find_private_ip(&interfaces).unwrap();
        assert_eq!(interface_name, "eth0");
        assert_eq!(ip_addr, "192.168.1.70".parse::<IpAddr>().unwrap());
    }

    #[test]
    fn test_is_forwardable_ip() {
        for ip in ["192.168.0.42", "172.16.0.42", "10.0.0.42"] {
            assert!(
                is_forwardable_ip(&ip.parse::<IpAddr>().unwrap()),
                "IP `{ip}` is forwardable!"
            );
        }
        for ip in ["127.0.0.42", "169.254.0.42", "192.0.0.42"] {
            assert!(
                !is_forwardable_ip(&ip.parse::<IpAddr>().unwrap()),
                "IP `{ip}` is not forwardable!"
            );
        }
    }

    #[test]
    fn test_is_private_ip() {
        for ip in ["192.168.0.42", "172.16.0.42", "10.0.0.42"] {
            assert!(
                is_private_ip(&ip.parse::<IpAddr>().unwrap()),
                "IP `{ip}` is private!"
            );
        }
        for ip in ["192.169.0.42", "172.32.0.42", "11.0.0.42"] {
            assert!(
                !is_private_ip(&ip.parse::<IpAddr>().unwrap()),
                "IP `{ip}` is public!"
            );
        }
    }

    #[test]
    fn test_get_hostname() {
        assert_eq!(
            get_hostname().unwrap(),
            hostname::get().unwrap().to_string_lossy().to_string()
        );
        _get_hostname(OsString::from("")).unwrap_err();
    }
}


================================================
FILE: quickwit/quickwit-common/src/path_hasher.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::hash::Hasher;

/// We use 255 as a separator as it isn't used by utf-8.
///
/// Tantivy uses 1 because it is more convenient for range queries, but we don't
/// care about the sort order here.
///
/// Note: changing this is not retro-compatible!
const SEPARATOR: &[u8] = &[255];

/// Mini wrapper over the FnvHasher to incrementally hash nodes
/// in a tree.
///
/// Its purpose is to:
/// - work around the lack of Clone in the fnv Hasher
/// - enforce a 1 byte separator between segments
#[derive(Default)]
pub struct PathHasher {
    hasher: fnv::FnvHasher,
}

impl Clone for PathHasher {
    #[inline(always)]
    fn clone(&self) -> PathHasher {
        PathHasher {
            hasher: fnv::FnvHasher::with_key(self.hasher.finish()),
        }
    }
}

impl PathHasher {
    #[cfg(any(test, feature = "testsuite"))]
    pub fn hash_path(segments: &[&[u8]]) -> u64 {
        let mut hasher = Self::default();
        for segment in segments {
            hasher.append(segment);
        }
        hasher.finish_leaf()
    }

    /// Appends a new segment to our path.
    ///
    /// In order to avoid natural collisions, (e.g. &["ab", "c"] and &["a", "bc"]),
    /// we add a null byte between each segment as a separator.
    #[inline]
    pub fn append(&mut self, payload: &[u8]) {
        self.hasher.write(payload);
        self.hasher.write(SEPARATOR);
    }

    #[inline]
    pub fn finish_leaf(&self) -> u64 {
        self.hasher.finish()
    }

    #[inline]
    pub fn finish_intermediate(&self) -> u64 {
        let mut intermediate = fnv::FnvHasher::with_key(self.hasher.finish());
        intermediate.write(SEPARATOR);
        intermediate.finish()
    }
}


================================================
FILE: quickwit/quickwit-common/src/pretty.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::fmt;
use std::time::Duration;

pub struct PrettySample<I>(I, usize);

impl<I> PrettySample<I> {
    pub fn new(slice: I, sample_size: usize) -> Self {
        Self(slice, sample_size)
    }
}

impl<I> fmt::Debug for PrettySample<I>
where
    I: IntoIterator + Clone,
    I::Item: fmt::Debug,
{
    fn fmt(&self, formatter: &mut fmt::Formatter<'_>) -> fmt::Result {
        write!(formatter, "[")?;

        // In general, we will receive a reference (&[...], &HashMap...) or a Map<_> of them.
        // So we either perform a Copy, or a cheap Clone of a simple struct
        let mut iter = self.0.clone().into_iter().enumerate();
        for (i, item) in &mut iter {
            if i > 0 {
                write!(formatter, ", ")?;
            }
            write!(formatter, "{item:?}")?;
            if i == self.1 - 1 {
                break;
            }
        }
        let left = iter.count();
        if left > 0 {
            write!(formatter, ", and {left} more")?;
        }
        write!(formatter, "]")?;
        Ok(())
    }
}

pub trait PrettyDisplay {
    fn pretty_display(&self) -> impl fmt::Display;
}

struct DurationPrettyDisplay<'a>(&'a Duration);

impl fmt::Display for DurationPrettyDisplay<'_> {
    fn fmt(&self, formatter: &mut fmt::Formatter) -> fmt::Result {
        // This is enough for my current use cases. To be extended as you see fit.
        let duration_millis = self.0.as_millis();

        if duration_millis < 1_000 {
            return write!(formatter, "{duration_millis}ms");
        }
        write!(
            formatter,
            "{}.{}s",
            duration_millis / 1_000,
            duration_millis % 1_000 / 10
        )
    }
}

impl PrettyDisplay for Duration {
    fn pretty_display(&self) -> impl fmt::Display {
        DurationPrettyDisplay(self)
    }
}

struct SequencePrettyDisplay<I>(I);

impl<I> fmt::Display for SequencePrettyDisplay<I>
where
    I: IntoIterator + Clone,
    I::Item: fmt::Display,
{
    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
        write!(f, "[")?;

        // In general, we will receive a reference (&[...], &HashMap...) or a Map<_> of them.
        // So we either perform a Copy, or a cheap Clone of a simple struct
        let mut iter = self.0.clone().into_iter().peekable();

        while let Some(item) = iter.next() {
            write!(f, "{item}")?;
            if iter.peek().is_some() {
                write!(f, ", ")?;
            }
        }
        write!(f, "]")
    }
}

impl<T: fmt::Display> PrettyDisplay for &[T] {
    fn pretty_display(&self) -> impl fmt::Display {
        SequencePrettyDisplay(*self)
    }
}

#[cfg(test)]
mod tests {
    use super::*;

    #[test]
    fn test_pretty_sample() {
        let pretty_sample = PrettySample::<&[usize]>::new(&[], 2);
        assert_eq!(format!("{pretty_sample:?}"), "[]");

        let pretty_sample = PrettySample::new(&[1], 2);
        assert_eq!(format!("{pretty_sample:?}"), "[1]");

        let pretty_sample = PrettySample::new(&[1, 2], 2);
        assert_eq!(format!("{pretty_sample:?}"), "[1, 2]");

        let pretty_sample = PrettySample::new(&[1, 2, 3], 2);
        assert_eq!(format!("{pretty_sample:?}"), "[1, 2, and 1 more]");

        let pretty_sample = PrettySample::new(&[1, 2, 3, 4], 2);
        assert_eq!(format!("{pretty_sample:?}"), "[1, 2, and 2 more]");
    }

    #[test]
    fn test_duration_pretty_display() {
        let duration = Duration::from_millis(0);
        assert_eq!(format!("{}", duration.pretty_display()), "0ms");

        let duration = Duration::from_millis(125);
        assert_eq!(format!("{}", duration.pretty_display()), "125ms");

        let duration = Duration::from_millis(1_000);
        assert_eq!(format!("{}", duration.pretty_display()), "1.0s");

        let duration = Duration::from_millis(1_125);
        assert_eq!(format!("{}", duration.pretty_display()), "1.12s");
    }

    #[test]
    fn test_sequence_pretty_display() {
        let empty_slice: &[i32] = &[];
        assert_eq!(format!("{}", empty_slice.pretty_display()), "[]");

        let slice_one: &[i32] = &[1];
        assert_eq!(format!("{}", slice_one.pretty_display()), "[1]");

        let slice_two: &[i32] = &[1, 2];
        assert_eq!(format!("{}", slice_two.pretty_display()), "[1, 2]");
    }
}


================================================
FILE: quickwit/quickwit-common/src/progress.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::sync::Arc;
use std::sync::atomic::{AtomicU32, Ordering};

use futures::Future;

/// Progress makes it possible to register some progress.
/// It is used in lieu of healthcheck.
///
/// If no progress is observed until the next heartbeat, the actor will be killed.
#[derive(Clone)]
pub struct Progress(Arc<AtomicU32>);

#[derive(Clone, Copy, Debug, Eq, PartialEq)]
enum ProgressState {
    // No update recorded since the last call to .check_for_update()
    NoUpdate,
    // An update was recorded since the last call to .check_for_update()
    Updated,
    // The actor is in the protected zone.
    //
    // The protected zone should seldom be used. It is useful
    // when calling an external library that is blocking for instance.
    //
    // Another use case is blocking when sending a message to another actor
    // with a saturated message bus.
    // The failure detection is then considered to be the problem of
    // the downstream actor.
    //
    // As long as the actor is in the protected zone, healthchecking won't apply
    // to it.
    //
    // The value inside starts at 0.
    ProtectedZone(u32),
}

#[allow(clippy::from_over_into)]
impl Into<u32> for ProgressState {
    fn into(self) -> u32 {
        match self {
            ProgressState::NoUpdate => 0,
            ProgressState::Updated => 1,
            ProgressState::ProtectedZone(level) => 2 + level,
        }
    }
}

impl From<u32> for ProgressState {
    fn from(level: u32) -> Self {
        match level {
            0 => ProgressState::NoUpdate,
            1 => ProgressState::Updated,
            level => ProgressState::ProtectedZone(level - 2),
        }
    }
}

impl Default for Progress {
    fn default() -> Progress {
        Progress(Arc::new(AtomicU32::new(ProgressState::Updated.into())))
    }
}

impl Progress {
    pub fn record_progress(&self) {
        self.0
            .fetch_max(ProgressState::Updated.into(), Ordering::Relaxed);
    }

    /// Executes a future in a protected zone.
    pub async fn protect_future<Fut, T>(&self, future: Fut) -> T
    where Fut: Future<Output = T> {
        let _guard = self.protect_zone();
        future.await
    }

    pub fn protect_zone(&self) -> ProtectedZoneGuard {
        loop {
            let previous_state: ProgressState = self.0.load(Ordering::SeqCst).into();
            let new_state = match previous_state {
                ProgressState::NoUpdate | ProgressState::Updated => ProgressState::ProtectedZone(0),
                ProgressState::ProtectedZone(level) => ProgressState::ProtectedZone(level + 1),
            };
            if self
                .0
                .compare_exchange(
                    previous_state.into(),
                    new_state.into(),
                    Ordering::SeqCst,
                    Ordering::SeqCst,
                )
                .is_ok()
            {
                return ProtectedZoneGuard(self.0.clone());
            }
        }
    }

    /// This method mutates the state as follows and returns true if
    /// the object was in the protected zone or had change registered.
    /// - Updated -> NoUpdate, returns true
    /// - NoUpdate -> NoUpdate, returns false
    /// - ProtectedZone -> ProtectedZone, returns true
    pub fn registered_activity_since_last_call(&self) -> bool {
        let previous_state: ProgressState = self
            .0
            .compare_exchange(
                ProgressState::Updated.into(),
                ProgressState::NoUpdate.into(),
                Ordering::Relaxed,
                Ordering::Relaxed,
            )
            .unwrap_or_else(|previous_value| previous_value)
            .into();
        previous_state != ProgressState::NoUpdate
    }
}

pub struct ProtectedZoneGuard(Arc<AtomicU32>);

impl Drop for ProtectedZoneGuard {
    fn drop(&mut self) {
        let previous_state: ProgressState = self.0.fetch_sub(1, Ordering::SeqCst).into();
        assert!(matches!(previous_state, ProgressState::ProtectedZone(_)));
    }
}

#[cfg(test)]
mod tests {
    use super::Progress;

    #[test]
    fn test_progress() {
        let progress = Progress::default();
        assert!(progress.registered_activity_since_last_call());
        progress.record_progress();
        assert!(progress.registered_activity_since_last_call());
        assert!(!progress.registered_activity_since_last_call());
    }

    #[test]
    fn test_progress_protect_zone() {
        let progress = Progress::default();
        assert!(progress.registered_activity_since_last_call());
        progress.record_progress();
        assert!(progress.registered_activity_since_last_call());
        {
            let _protect_guard = progress.protect_zone();
            assert!(progress.registered_activity_since_last_call());
            assert!(progress.registered_activity_since_last_call());
        }
        assert!(progress.registered_activity_since_last_call());
        assert!(!progress.registered_activity_since_last_call());
    }

    #[test]
    fn test_progress_several_protect_zone() {
        let progress = Progress::default();
        assert!(progress.registered_activity_since_last_call());
        progress.record_progress();
        assert!(progress.registered_activity_since_last_call());
        let first_protect_guard = progress.protect_zone();
        let second_protect_guard = progress.protect_zone();
        assert!(progress.registered_activity_since_last_call());
        assert!(progress.registered_activity_since_last_call());
        std::mem::drop(first_protect_guard);
        assert!(progress.registered_activity_since_last_call());
        assert!(progress.registered_activity_since_last_call());
        std::mem::drop(second_protect_guard);
        assert!(progress.registered_activity_since_last_call());
        assert!(!progress.registered_activity_since_last_call());
    }
}


================================================
FILE: quickwit/quickwit-common/src/pubsub.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::HashMap;
use std::fmt;
use std::sync::atomic::{AtomicUsize, Ordering};
use std::sync::{Arc, Mutex, Weak};
use std::time::Duration;

use async_trait::async_trait;
use tokio::sync::Mutex as TokioMutex;

use crate::rate_limited_warn;
use crate::type_map::TypeMap;

const EVENT_SUBSCRIPTION_CALLBACK_TIMEOUT: Duration = Duration::from_secs(10);

pub trait Event: fmt::Debug + Clone + Send + Sync + 'static {}

#[async_trait]
pub trait EventSubscriber<E>: Send + Sync + 'static {
    async fn handle_event(&mut self, event: E);
}

#[async_trait]
impl<E, F> EventSubscriber<E> for F
where
    E: Event,
    F: FnMut(E) + Send + Sync + 'static,
{
    async fn handle_event(&mut self, event: E) {
        (self)(event);
    }
}

type EventSubscriptions<E> = HashMap<usize, EventSubscription<E>>;

/// The event broker makes it possible to
/// - emit specific local events
/// - subscribe to these local events
///
/// The event broker is not distributed in itself. Only events emitted
/// locally will be received by the subscribers.
///
/// It is however possible to locally subscribe a handler to a kind of event,
/// that will in turn run a RPC to other nodes.
#[derive(Debug, Clone, Default)]
pub struct EventBroker {
    inner: Arc<InnerEventBroker>,
}

#[derive(Debug, Default)]
struct InnerEventBroker {
    subscription_sequence: AtomicUsize,
    subscriptions: Mutex<TypeMap>,
}

impl EventBroker {
    // The point of this private method is to allow the public subscribe method to have only one
    // generic argument and avoid the ugly `::<E, _>` syntax.
    fn subscribe_aux<E, S>(&self, subscriber: S, with_timeout: bool) -> EventSubscriptionHandle
    where
        E: Event,
        S: EventSubscriber<E> + Send + Sync + 'static,
    {
        let mut subscriptions = self
            .inner
            .subscriptions
            .lock()
            .expect("lock should not be poisoned");

        if !subscriptions.contains::<EventSubscriptions<E>>() {
            subscriptions.insert::<EventSubscriptions<E>>(HashMap::new());
        }
        let subscription_id = self
            .inner
            .subscription_sequence
            .fetch_add(1, Ordering::Relaxed);

        let subscriber_name = std::any::type_name::<S>();
        let subscription = EventSubscription {
            subscriber_name,
            subscriber: Arc::new(TokioMutex::new(Box::new(subscriber))),
            with_timeout,
        };
        let typed_subscriptions = subscriptions
            .get_mut::<EventSubscriptions<E>>()
            .expect("subscription map should exist");
        typed_subscriptions.insert(subscription_id, subscription);

        EventSubscriptionHandle {
            subscription_id,
            broker: Arc::downgrade(&self.inner),
            drop_me: |subscription_id, broker| {
                let mut subscriptions = broker
                    .subscriptions
                    .lock()
                    .expect("lock should not be poisoned");
                if let Some(typed_subscriptions) = subscriptions.get_mut::<EventSubscriptions<E>>()
                {
                    typed_subscriptions.remove(&subscription_id);
                }
            },
        }
    }

    /// Subscribes to an event type.
    ///
    /// The callback should be as light as possible.
    ///
    /// # Disclaimer
    ///
    /// If the callback takes more than `EVENT_SUBSCRIPTION_CALLBACK_TIMEOUT` to execute,
    /// the callback future will be aborted.
    #[must_use]
    pub fn subscribe<E>(&self, subscriber: impl EventSubscriber<E>) -> EventSubscriptionHandle
    where E: Event {
        self.subscribe_aux(subscriber, true)
    }

    /// Subscribes to an event type.
    ///
    /// The callback should be as light as possible.
    #[must_use]
    pub fn subscribe_without_timeout<E>(
        &self,
        subscriber: impl EventSubscriber<E>,
    ) -> EventSubscriptionHandle
    where
        E: Event,
    {
        self.subscribe_aux(subscriber, false)
    }

    /// Publishes an event.
    pub fn publish<E>(&self, event: E)
    where E: Event {
        let subscriptions = self
            .inner
            .subscriptions
            .lock()
            .expect("lock should not be poisoned");
        if let Some(typed_subscriptions) = subscriptions.get::<EventSubscriptions<E>>() {
            for subscription in typed_subscriptions.values() {
                subscription.trigger(event.clone());
            }
        }
    }
}

struct EventSubscription<E> {
    // We put that in the subscription in order to avoid having to take the lock
    // to access it.
    subscriber_name: &'static str,
    subscriber: Arc<TokioMutex<Box<dyn EventSubscriber<E>>>>,
    with_timeout: bool,
}

impl<E: Event> EventSubscription<E> {
    /// Call the callback associated with the subscription.
    fn trigger(&self, event: E) {
        if self.with_timeout {
            self.trigger_abort_on_timeout(event);
        } else {
            self.trigger_just_log_on_timeout(event)
        }
    }

    /// Spawns a task to run the given subscription.
    ///
    /// Just logs a warning if it took more than `EVENT_SUBSCRIPTION_CALLBACK_TIMEOUT`
    /// for the future to execute.
    fn trigger_just_log_on_timeout(&self, event: E) {
        let subscriber_name = self.subscriber_name;
        let subscriber = self.subscriber.clone();
        // This task is just here to log a warning if the callback takes too long to execute.
        let log_timeout_task_handle = tokio::task::spawn(async move {
            tokio::time::sleep(EVENT_SUBSCRIPTION_CALLBACK_TIMEOUT).await;
            let event_name = std::any::type_name::<E>();
            rate_limited_warn!(
                limit_per_min = 10,
                "{subscriber_name}'s handler for {event_name} did not finished within {}ms",
                EVENT_SUBSCRIPTION_CALLBACK_TIMEOUT.as_millis()
            );
        });
        tokio::task::spawn(async move {
            subscriber.lock().await.handle_event(event).await;
            // The callback has terminated, let's abort the timeout task.
            log_timeout_task_handle.abort();
        });
    }

    /// Spawns a task to run the given subscription.
    ///
    /// Aborts the future execution and logs a warning if it takes more than
    /// `EVENT_SUBSCRIPTION_CALLBACK_TIMEOUT`.
    fn trigger_abort_on_timeout(&self, event: E) {
        let subscriber_name = self.subscriber_name;
        let subscriber = self.subscriber.clone();
        let fut = async move {
            if tokio::time::timeout(EVENT_SUBSCRIPTION_CALLBACK_TIMEOUT, async {
                subscriber.lock().await.handle_event(event).await
            })
            .await
            .is_err()
            {
                let event_name = std::any::type_name::<E>();
                rate_limited_warn!(
                    limit_per_min = 10,
                    "{subscriber_name}'s handler for {event_name} timed out, abort"
                );
            }
        };
        tokio::task::spawn(fut);
    }
}

#[derive(Clone)]
pub struct EventSubscriptionHandle {
    subscription_id: usize,
    broker: Weak<InnerEventBroker>,
    drop_me: fn(usize, &InnerEventBroker),
}

impl EventSubscriptionHandle {
    pub fn cancel(self) {}

    /// By default, dropping a subscription handle cancels the subscription.
    /// `forever` consumes the handle and avoids cancelling the subscription on drop.
    pub fn forever(mut self) {
        self.broker = Weak::new();
    }
}

impl Drop for EventSubscriptionHandle {
    fn drop(&mut self) {
        if let Some(broker) = self.broker.upgrade() {
            (self.drop_me)(self.subscription_id, &broker);
        }
    }
}

#[cfg(test)]
mod tests {

    use std::sync::Arc;
    use std::sync::atomic::{AtomicUsize, Ordering};

    use super::*;

    #[derive(Debug, Clone)]
    struct MyEvent {
        value: usize,
    }

    impl Event for MyEvent {}

    #[derive(Debug, Clone)]
    struct MySubscriber {
        counter: Arc<AtomicUsize>,
    }

    #[async_trait]
    impl EventSubscriber<MyEvent> for MySubscriber {
        async fn handle_event(&mut self, event: MyEvent) {
            self.counter.store(event.value, Ordering::Relaxed);
        }
    }

    #[tokio::test]
    async fn test_event_broker() {
        let event_broker = EventBroker::default();
        let counter = Arc::new(AtomicUsize::new(0));
        let subscriber = MySubscriber {
            counter: counter.clone(),
        };
        let subscription_handle = event_broker.subscribe(subscriber);

        let event = MyEvent { value: 42 };
        event_broker.publish(event);

        tokio::time::sleep(Duration::from_millis(1)).await;
        assert_eq!(counter.load(Ordering::Relaxed), 42);

        subscription_handle.cancel();

        let event = MyEvent { value: 1337 };
        event_broker.publish(event);

        tokio::time::sleep(Duration::from_millis(1)).await;
        assert_eq!(counter.load(Ordering::Relaxed), 42);
    }

    #[tokio::test]
    async fn test_event_broker_handle_drop() {
        let event_broker = EventBroker::default();
        let (tx, mut rx) = tokio::sync::mpsc::unbounded_channel();
        drop(event_broker.subscribe(move |event: MyEvent| {
            tx.send(event.value).unwrap();
        }));
        event_broker.publish(MyEvent { value: 42 });
        assert!(rx.recv().await.is_none());
    }

    #[tokio::test]
    async fn test_event_broker_handle_cancel() {
        let event_broker = EventBroker::default();
        let (tx, mut rx) = tokio::sync::mpsc::unbounded_channel();
        event_broker
            .subscribe(move |event: MyEvent| {
                tx.send(event.value).unwrap();
            })
            .cancel();
        event_broker.publish(MyEvent { value: 42 });
        assert!(rx.recv().await.is_none());
    }

    #[tokio::test]
    async fn test_event_broker_handle_forever() {
        let event_broker = EventBroker::default();
        let (tx, mut rx) = tokio::sync::mpsc::unbounded_channel();
        event_broker
            .subscribe(move |event: MyEvent| {
                tx.send(event.value).unwrap();
            })
            .forever();
        event_broker.publish(MyEvent { value: 42 });
        assert_eq!(rx.recv().await, Some(42));
    }
}


================================================
FILE: quickwit/quickwit-common/src/rand.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use rand::Rng;
use rand::distr::Alphanumeric;

/// Appends a random suffix composed of a hyphen and five random alphanumeric characters.
pub fn append_random_suffix(string: &str) -> String {
    let rng = rand::rng();
    let mut randomized_string = String::with_capacity(string.len() + 6);
    randomized_string.push_str(string);
    randomized_string.push('-');

    for random_byte in rng.sample_iter(&Alphanumeric).take(5) {
        randomized_string.push(char::from(random_byte));
    }
    randomized_string
}

#[cfg(test)]
mod tests {
    use super::append_random_suffix;

    #[test]
    fn test_append_random_suffix() -> anyhow::Result<()> {
        let randomized = append_random_suffix("");
        let mut chars = randomized.chars();
        assert_eq!(chars.next(), Some('-'));
        assert_eq!(chars.clone().count(), 5);
        assert!(chars.all(|ch| ch.is_ascii_alphanumeric()));
        Ok(())
    }
}


================================================
FILE: quickwit/quickwit-common/src/rate_limited_tracing.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

// TODO coasetime has a recent() instead of now() which is essentially free (atomic read instead of
// vdso call), but needs us to spawn a future/thread updating that value regularly

use std::sync::atomic::{AtomicU64, Ordering};

use coarsetime::{Duration, Instant};

/// Metadata for a log site. This is stored inside a single AtomicU64 when not in use.
///
/// `call_count` is the number of calls since the last upgrade of generation, it's stored
/// in the lower 32b of the atomic, so it can just be incremented on the fast path.
/// `generation` is the number of time we reset the `call_count`. It isn't used as is, and
/// is just compared to itself to detect and handle properly concurrent resets from multiple
/// threads.
#[derive(Clone, Copy)]
struct LogSiteMetadata {
    generation: u32,
    call_count: u32,
}

impl From<u64> for LogSiteMetadata {
    fn from(val: u64) -> LogSiteMetadata {
        LogSiteMetadata {
            generation: (val >> 32) as u32,
            call_count: (val & ((1 << 32) - 1)) as u32,
        }
    }
}

impl From<LogSiteMetadata> for u64 {
    fn from(count: LogSiteMetadata) -> u64 {
        ((count.generation as u64) << 32) + count.call_count as u64
    }
}

/// Helper function used in [`rate_limited_tracing`] to determine if this line should log,
/// and update the related counters.
pub fn should_log<F: Fn() -> Instant>(
    count_atomic: &AtomicU64,
    last_reset_atomic: &AtomicU64,
    limit: u32,
    now: F,
) -> bool {
    //  count_atomic is treated as 2 u32: upper bits count "generation", lower bits count number of
    //  calls since LAST_RESET. We assume there won't be 2**32 calls to this log in ~60s.
    //  Generation is free to wrap around.

    // Because the lower 32 bits are storing the log count, we can
    // increment the entire u64 to record this log call.
    let logsite_meta_u64 = count_atomic.fetch_add(1, Ordering::Acquire);
    if logsite_meta_u64 == 0 {
        // this can only be reached the very 1st time we log
        last_reset_atomic.store(now().as_ticks(), Ordering::Release);
    }

    let LogSiteMetadata {
        generation,
        call_count,
    } = logsite_meta_u64.into();

    if call_count < limit {
        return true;
    }

    let current_time = Duration::from_ticks(now().as_ticks());
    let last_reset = Duration::from_ticks(last_reset_atomic.load(Ordering::Acquire));

    let should_reset = current_time.abs_diff(last_reset) >= Duration::from_secs(60);

    if !should_reset {
        // we are over-limit and not far enough in time to reset: don't log
        return false;
    }

    let mut update_time = false;

    let update_res =
        count_atomic.fetch_update(Ordering::Release, Ordering::Acquire, |current_count| {
            let mut current_count: LogSiteMetadata = current_count.into();
            if generation == current_count.generation {
                // we can update generation&time, so we can definitely log
                update_time = true;
                let new_count = LogSiteMetadata {
                    generation: generation.wrapping_add(1),
                    call_count: 1,
                };
                Some(new_count.into())
            } else {
                // we can't update generation&time, but maybe we can still log?
                update_time = false;
                if current_count.call_count < limit {
                    // we can log, update the count
                    current_count.call_count += 1;
                    Some(current_count.into())
                } else {
                    // we can't log, save some contention by not recording that we tried to
                    // log, and exit in error
                    None
                }
            }
        });
    let can_log = update_res.is_ok();

    // technically there is a race condition if we stay stuck *here* for > 60s, which
    // could cause us to log more than required. This is unlikely to happen, and not
    // really a big issue.

    if update_time {
        // *we* updated generation, so we must update last_reset too
        last_reset_atomic.store(current_time.as_ticks(), Ordering::Release);
    }
    can_log
}

#[macro_export]
macro_rules! rate_limited_tracing {
    ($log_fn:ident, limit_per_min=$limit:literal, $($args:tt)*) => {{
        use ::std::sync::atomic::AtomicU64;
        use $crate::rate_limited_tracing::CoarsetimeInstant;

        static COUNT: AtomicU64 = AtomicU64::new(0);
        // we can't get time from constant context, so we pre-initialize with zero
        static LAST_RESET: AtomicU64 = AtomicU64::new(0);

        if $crate::rate_limited_tracing::should_log(&COUNT, &LAST_RESET, $limit, CoarsetimeInstant::now) {
            ::tracing::$log_fn!($($args)*);
        }
    }};
}

#[macro_export]
macro_rules! rate_limited_trace {
    ($unit:ident=$limit:literal, $($args:tt)*) => {
        $crate::rate_limited_tracing::rate_limited_tracing!(trace, $unit=$limit, $($args)*)
    };
}
#[macro_export]
macro_rules! rate_limited_debug {
    ($unit:ident=$limit:literal, $($args:tt)*) => {
        $crate::rate_limited_tracing::rate_limited_tracing!(debug, $unit=$limit, $($args)*)
    };
}
#[macro_export]
macro_rules! rate_limited_info {
    ($unit:ident=$limit:literal, $($args:tt)*) => {
        $crate::rate_limited_tracing::rate_limited_tracing!(info, $unit=$limit, $($args)*)
    };
}
#[macro_export]
macro_rules! rate_limited_warn {
    ($unit:ident=$limit:literal, $($args:tt)*) => {
        $crate::rate_limited_tracing::rate_limited_tracing!(warn, $unit=$limit, $($args)*)
    };
}
#[macro_export]
macro_rules! rate_limited_error {
    ($unit:ident=$limit:literal, $($args:tt)*) => {
        $crate::rate_limited_tracing::rate_limited_tracing!(error, $unit=$limit, $($args)*)
    };
}

fn _check_macro_works() {
    rate_limited_info!(limit_per_min = 10, "test {}", "test");
}

#[doc(hidden)]
pub use coarsetime::Instant as CoarsetimeInstant;
pub use rate_limited_debug;
pub use rate_limited_error;
pub use rate_limited_info;
pub use rate_limited_trace;
#[doc(hidden)]
pub use rate_limited_tracing;
pub use rate_limited_warn;

#[cfg(test)]
mod tests {
    use std::sync::atomic::{AtomicU64, Ordering};

    use coarsetime::{Duration, Instant};

    use super::should_log;

    // TODO as this is atomic code, we should test it with multiple threads to verify it behaves
    // like we'd expect, maybe using something like `loom`?

    #[test]
    fn test_rate_limited_log_single_thread() {
        let count = AtomicU64::new(0);
        let last_reset = AtomicU64::new(0);
        let limit = 5u64;

        let mut simulated_time = Instant::now();
        let simulation_step = Duration::from_secs(1);

        assert!(should_log(&count, &last_reset, limit as _, || {
            simulated_time
        }));
        assert_eq!(count.load(Ordering::Relaxed), 1);
        let reset_timestamp = last_reset.load(Ordering::Relaxed);
        assert_ne!(reset_timestamp, 0);

        simulated_time += simulation_step;

        for i in 1..limit {
            // we log as many time as expected
            assert!(should_log(&count, &last_reset, limit as _, || {
                simulated_time
            }));
            assert_eq!(count.load(Ordering::Relaxed), i + 1);
            assert_eq!(last_reset.load(Ordering::Relaxed), reset_timestamp);
            simulated_time += simulation_step;
        }

        for i in limit..(limit * 2) {
            // we don't log, nor update
            assert!(!should_log(&count, &last_reset, limit as _, || {
                simulated_time
            }));
            assert_eq!(count.load(Ordering::Relaxed), i + 1);
            assert_eq!(last_reset.load(Ordering::Relaxed), reset_timestamp);
            simulated_time += simulation_step;
        }

        // advance enough to reset counter
        simulated_time += simulation_step * 60;

        assert!(should_log(&count, &last_reset, limit as _, || {
            simulated_time
        }));
        // counter got reset, generation increased
        assert_eq!(count.load(Ordering::Relaxed), 1 + (1 << 32));
        // last reset changed too
        assert_ne!(last_reset.load(Ordering::Relaxed), reset_timestamp);
        let reset_timestamp = last_reset.load(Ordering::Relaxed);

        for i in 1..limit {
            // we log as many time as expected
            assert!(should_log(&count, &last_reset, limit as _, || {
                simulated_time
            }));
            assert_eq!(count.load(Ordering::Relaxed), i + 1 + (1 << 32));
            assert_eq!(last_reset.load(Ordering::Relaxed), reset_timestamp);
            simulated_time += simulation_step;
        }

        for i in limit..(limit * 2) {
            // we don't log, nor update
            assert!(!should_log(&count, &last_reset, limit as _, || {
                simulated_time
            }));
            assert_eq!(count.load(Ordering::Relaxed), i + 1 + (1 << 32));
            assert_eq!(last_reset.load(Ordering::Relaxed), reset_timestamp);
            simulated_time += simulation_step;
        }
    }
}


================================================
FILE: quickwit/quickwit-common/src/rate_limiter.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::ops::Add;
use std::time::Duration;

use bytesize::ByteSize;
use governor::clock::{Clock, DefaultClock, Reference};
use governor::nanos::Nanos;

use crate::tower::{ConstantRate, Rate};

#[derive(Debug, Clone, Copy)]
pub struct RateLimiterSettings {
    // After a long period of inactivity, the rate limiter can accumulate some "credits"
    // up to what we call a `burst_limit`.
    //
    // Until these credits are expired, the rate limiter may exceed temporarily its rate limit.
    pub burst_limit: u64,
    pub rate_limit: ConstantRate,
    // The refill period has an effect on the resolution at which the
    // rate limiting is enforced.
    //
    // `Instant::now()` is guaranteed to be called at most once per refill_period.
    pub refill_period: Duration,
}

#[cfg(any(test, feature = "testsuite"))]
impl Default for RateLimiterSettings {
    fn default() -> Self {
        // 10 MB burst limit.
        let burst_limit = ByteSize::mb(10).as_u64();
        // 5 MB/s rate limit.
        let rate_limit = ConstantRate::bytes_per_sec(ByteSize::mb(5));
        // Refill every 100ms.
        let refill_period = Duration::from_millis(100);

        Self {
            burst_limit,
            rate_limit,
            refill_period,
        }
    }
}

/// A bursty token-based rate limiter.
#[derive(Debug, Clone)]
pub struct RateLimiter<C: Clock = DefaultClock> {
    // Maximum number of permits that can be accumulated.
    max_capacity: u64,
    // Number of permits available.
    available_permits: u64,
    refill_amount: u64,
    refill_period: Duration,
    refill_period_nanos: u64,
    refill_at: C::Instant,
    clock: C,
}

#[cfg(any(test, feature = "testsuite"))]
impl Default for RateLimiter<DefaultClock> {
    fn default() -> Self {
        Self::from_settings(RateLimiterSettings::default())
    }
}

impl RateLimiter<DefaultClock> {
    /// Creates a new rate limiter from the given settings using the default clock.
    pub fn from_settings(settings: RateLimiterSettings) -> Self {
        Self::from_settings_with_clock(settings, DefaultClock::default())
    }
}

impl<C: Clock> RateLimiter<C> {
    /// Creates a new rate limiter from the given settings with a custom clock.
    pub fn from_settings_with_clock(settings: RateLimiterSettings, clock: C) -> Self {
        let max_capacity = settings.burst_limit;
        let refill_period = settings.refill_period;
        let rate_limit = settings.rate_limit.rescale(refill_period);
        let now = clock.now();

        Self {
            max_capacity,
            available_permits: max_capacity,
            refill_amount: rate_limit.work(),
            refill_period,
            refill_period_nanos: refill_period.as_nanos() as u64,
            refill_at: now.add(Nanos::from(refill_period)),
            clock,
        }
    }

    /// Returns the number of permits available.
    pub fn available_permits(&mut self) -> u64 {
        self.refill(self.clock.now());
        self.available_permits
    }

    /// Acquires some permits from the rate limiter. Returns whether the permits were acquired.
    pub fn acquire(&mut self, num_permits: u64) -> bool {
        self.refill(self.clock.now());
        self.acquire_inner(num_permits)
    }

    /// Acquires some permits expressed in bytes from the rate limiter. Returns whether the permits
    /// were acquired.
    pub fn acquire_bytes(&mut self, bytes: ByteSize) -> bool {
        self.acquire(bytes.as_u64())
    }

    /// Drains all the permits from the rate limiter, effectively disabling all the operations
    /// guarded by the rate limiter for one refill period.
    pub fn drain(&mut self) {
        self.available_permits = 0;
        self.refill_at = self.clock.now().add(Nanos::from(self.refill_period));
    }

    /// Gives back some unused permits to the rate limiter.
    pub fn release(&mut self, num_permits: u64) {
        self.available_permits = self.max_capacity.min(self.available_permits + num_permits);
    }

    fn acquire_inner(&mut self, num_permits: u64) -> bool {
        if self.available_permits >= num_permits {
            self.available_permits -= num_permits;
            true
        } else {
            false
        }
    }

    fn refill(&mut self, now: C::Instant) {
        if now.lt(&self.refill_at) {
            return;
        }
        let elapsed_nanos = now.duration_since(self.refill_at).as_u64();
        // More than one refill period may have elapsed so we need to take that into account.
        let refill =
            self.refill_amount + self.refill_amount * elapsed_nanos / self.refill_period_nanos;
        self.available_permits = self.max_capacity.min(self.available_permits + refill);
        self.refill_at = now.add(Nanos::from(self.refill_period));
    }
}

#[cfg(test)]
mod tests {
    use governor::clock::FakeRelativeClock;

    use super::*;

    #[test]
    fn test_rate_limiter_acquire() {
        let settings = RateLimiterSettings {
            burst_limit: ByteSize::mb(2).as_u64(),
            rate_limit: ConstantRate::bytes_per_sec(ByteSize::mb(1)),
            refill_period: Duration::from_millis(100),
        };
        let clock = FakeRelativeClock::default();
        let mut rate_limiter = RateLimiter::from_settings_with_clock(settings, clock.clone());
        assert_eq!(rate_limiter.max_capacity, ByteSize::mb(2).as_u64());
        assert_eq!(rate_limiter.available_permits, ByteSize::mb(2).as_u64());
        assert_eq!(rate_limiter.refill_amount, ByteSize::kb(100).as_u64());
        assert_eq!(rate_limiter.refill_period, Duration::from_millis(100));

        assert!(rate_limiter.acquire_bytes(ByteSize::mb(1)));
        assert!(rate_limiter.acquire_bytes(ByteSize::mb(1)));
        assert!(!rate_limiter.acquire_bytes(ByteSize::kb(1)));

        clock.advance(Duration::from_millis(100));

        assert!(rate_limiter.acquire_bytes(ByteSize::kb(100)));
        assert!(!rate_limiter.acquire_bytes(ByteSize::kb(20)));

        clock.advance(Duration::from_millis(250));

        assert!(rate_limiter.acquire_bytes(ByteSize::kb(125)));
        assert!(rate_limiter.acquire_bytes(ByteSize::kb(125)));
        assert!(!rate_limiter.acquire_bytes(ByteSize::kb(20)));
    }

    #[test]
    fn test_rate_limiter_drain() {
        let settings = RateLimiterSettings {
            burst_limit: ByteSize::mb(2).as_u64(),
            rate_limit: ConstantRate::bytes_per_sec(ByteSize::mb(1)),
            refill_period: Duration::from_millis(100),
        };
        let clock = FakeRelativeClock::default();
        let mut rate_limiter = RateLimiter::from_settings_with_clock(settings, clock.clone());
        rate_limiter.drain();
        assert_eq!(rate_limiter.available_permits, 0);

        clock.advance(Duration::from_millis(50));
        rate_limiter.refill(clock.now());
        assert_eq!(rate_limiter.available_permits, 0);

        clock.advance(Duration::from_millis(50));
        rate_limiter.refill(clock.now());
        assert!(rate_limiter.available_permits >= ByteSize::kb(100).as_u64());
    }

    #[test]
    fn test_rate_limiter_release() {
        let settings = RateLimiterSettings {
            burst_limit: 1,
            rate_limit: ConstantRate::bytes_per_sec(ByteSize::mb(1)),
            refill_period: Duration::from_millis(100),
        };
        let mut rate_limiter = RateLimiter::from_settings(settings);
        rate_limiter.acquire(1);
        assert_eq!(rate_limiter.available_permits, 0);

        rate_limiter.release(1);
        assert_eq!(rate_limiter.available_permits, 1);

        rate_limiter.release(1);
        assert_eq!(rate_limiter.available_permits, 1);
    }

    #[test]
    fn test_rate_limiter_refill() {
        let settings = RateLimiterSettings {
            burst_limit: ByteSize::mb(2).as_u64(),
            rate_limit: ConstantRate::bytes_per_sec(ByteSize::mb(1)),
            refill_period: Duration::from_millis(100),
        };
        let clock = FakeRelativeClock::default();
        let mut rate_limiter = RateLimiter::from_settings_with_clock(settings, clock.clone());

        rate_limiter.available_permits = 0;
        assert_eq!(rate_limiter.available_permits, 0);

        rate_limiter.available_permits = 0;
        clock.advance(Duration::from_millis(100));
        rate_limiter.refill(clock.now());
        assert_eq!(rate_limiter.available_permits, ByteSize::kb(100).as_u64());

        rate_limiter.available_permits = 0;
        clock.advance(Duration::from_millis(110));
        rate_limiter.refill(clock.now());
        assert_eq!(rate_limiter.available_permits, ByteSize::kb(110).as_u64());

        rate_limiter.available_permits = 0;
        clock.advance(Duration::from_millis(210));
        rate_limiter.refill(clock.now());
        assert_eq!(rate_limiter.available_permits, ByteSize::kb(210).as_u64());
    }

    #[test]
    fn test_rate_limiter_available_permits() {
        let settings = RateLimiterSettings {
            burst_limit: ByteSize::mb(2).as_u64(),
            rate_limit: ConstantRate::bytes_per_sec(ByteSize::mb(1)),
            refill_period: Duration::from_millis(100),
        };
        let clock = FakeRelativeClock::default();
        let mut rate_limiter = RateLimiter::from_settings_with_clock(settings, clock.clone());

        rate_limiter.available_permits = 0;
        clock.advance(Duration::from_millis(100));
        assert_eq!(rate_limiter.available_permits(), ByteSize::kb(100).as_u64());
    }
}


================================================
FILE: quickwit/quickwit-common/src/rendezvous_hasher.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::cmp::Reverse;
use std::hash::{Hash, Hasher};

use siphasher::sip::SipHasher;

/// Computes the affinity of a node for a given `key`.
/// A higher value means a higher affinity.
/// This is the `rendezvous hash`.
pub fn node_affinity<T: Hash, U: Hash>(node: T, key: &U) -> u64 {
    let mut state = SipHasher::new();
    key.hash(&mut state);
    node.hash(&mut state);
    state.finish()
}

/// Sorts the list of node ordered by decreasing affinity values.
/// This is called rendezvous hashing.
pub fn sort_by_rendez_vous_hash<T: Hash, U: Hash>(nodes: &mut [T], key: U) {
    nodes.sort_by_cached_key(|node| Reverse(node_affinity(node, &key)));
}

#[cfg(test)]
mod tests {
    use std::net::SocketAddr;

    use super::*;
    use crate::SocketAddrLegacyHash;

    fn test_socket_addr(last_byte: u8) -> SocketAddr {
        ([127, 0, 0, last_byte], 10_000u16).into()
    }

    #[test]
    fn test_utils_sort_by_rendez_vous_hash() {
        let socket1 = test_socket_addr(1);
        let socket2 = test_socket_addr(2);
        let socket3 = test_socket_addr(3);
        let socket4 = test_socket_addr(4);

        let legacy_socket1 = SocketAddrLegacyHash(&socket1);
        let legacy_socket2 = SocketAddrLegacyHash(&socket2);
        let legacy_socket3 = SocketAddrLegacyHash(&socket3);
        let legacy_socket4 = SocketAddrLegacyHash(&socket4);

        let mut socket_set1 = vec![
            legacy_socket4,
            legacy_socket3,
            legacy_socket1,
            legacy_socket2,
        ];
        sort_by_rendez_vous_hash(&mut socket_set1, "key");

        let mut socket_set2 = vec![legacy_socket1, legacy_socket2, legacy_socket4];
        sort_by_rendez_vous_hash(&mut socket_set2, "key");

        let mut socket_set3 = vec![legacy_socket1, legacy_socket4];
        sort_by_rendez_vous_hash(&mut socket_set3, "key");

        assert_eq!(
            socket_set1,
            &[
                legacy_socket1,
                legacy_socket2,
                legacy_socket3,
                legacy_socket4
            ]
        );
        assert_eq!(
            socket_set2,
            &[legacy_socket1, legacy_socket2, legacy_socket4]
        );
        assert_eq!(socket_set3, &[legacy_socket1, legacy_socket4]);
    }
}


================================================
FILE: quickwit/quickwit-common/src/retry.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::fmt::Debug;
use std::time::Duration;

use async_trait::async_trait;
use futures::Future;
use rand::Rng;
use tracing::{debug, warn};

pub trait Retryable {
    fn is_retryable(&self) -> bool {
        false
    }
}

#[derive(Debug, Eq, PartialEq)]
pub enum Retry<E> {
    Permanent(E),
    Transient(E),
}

impl<E> Retry<E> {
    pub fn into_inner(self) -> E {
        match self {
            Self::Transient(error) => error,
            Self::Permanent(error) => error,
        }
    }
}

impl<E> Retryable for Retry<E> {
    fn is_retryable(&self) -> bool {
        match self {
            Retry::Permanent(_) => false,
            Retry::Transient(_) => true,
        }
    }
}

#[derive(Debug, Clone, Copy)]
pub struct RetryParams {
    pub base_delay: Duration,
    pub max_delay: Duration,
    pub max_attempts: usize,
}

impl RetryParams {
    /// Creates a new [`RetryParams`] instance using the same settings as the standard retry policy
    /// defined in the AWS SDK for Rust.
    pub fn standard() -> Self {
        Self {
            base_delay: Duration::from_secs(1),
            max_delay: Duration::from_secs(20),
            max_attempts: 3,
        }
    }

    /// Creates a new [`RetryParams`] instance using settings that are more aggressive than those of
    /// the standard policy for services that are more resilient to retries, usually managed
    /// cloud services.
    pub fn aggressive() -> Self {
        Self {
            base_delay: Duration::from_millis(250),
            max_delay: Duration::from_secs(20),
            max_attempts: 5,
        }
    }

    /// Creates a new [`RetryParams`] instance that does not perform any retries.
    pub fn no_retries() -> Self {
        Self {
            base_delay: Duration::ZERO,
            max_delay: Duration::ZERO,
            max_attempts: 1,
        }
    }

    /// Computes the delay after which a new attempt should be performed. The randomized delay
    /// increases after each attempt (exponential backoff and full jitter). Implementation and
    /// default values originate from the Java SDK. See also: <https://aws.amazon.com/blogs/architecture/exponential-backoff-and-jitter/>.
    ///
    /// The caller should pass the number of attempts that have been performed so far. Not to be
    /// confused with the number of retries, which is one less than the number of attempts.
    ///
    /// # Panics
    ///
    /// Panics if `num_attempts` is zero.
    pub fn compute_delay(&self, num_attempts: usize) -> Duration {
        assert!(num_attempts > 0, "num_attempts should be greater than zero");
        let num_attempts = num_attempts.min(32);
        let delay_ms = (self.base_delay.as_millis() as u64)
            .saturating_mul(2u64.saturating_pow(num_attempts as u32 - 1));
        let capped_delay_ms = delay_ms.min(self.max_delay.as_millis() as u64);
        let half_delay_ms = capped_delay_ms.div_ceil(2);
        let jitter_range = half_delay_ms..capped_delay_ms + 1;
        let jittered_delay_ms = rand::rng().random_range(jitter_range);
        Duration::from_millis(jittered_delay_ms)
    }

    #[cfg(any(test, feature = "testsuite"))]
    pub fn for_test() -> Self {
        Self {
            base_delay: Duration::from_millis(1),
            max_delay: Duration::from_millis(2),
            max_attempts: 3,
        }
    }
}

#[async_trait]
pub trait MockableSleep {
    async fn sleep(&self, duration: Duration);
}

pub struct TokioSleep;

#[async_trait]
impl MockableSleep for TokioSleep {
    async fn sleep(&self, duration: Duration) {
        tokio::time::sleep(duration).await;
    }
}

pub async fn retry_with_mockable_sleep<U, E, Fut>(
    retry_params: &RetryParams,
    f: impl Fn() -> Fut,
    mockable_sleep: impl MockableSleep,
) -> Result<U, E>
where
    Fut: Future<Output = Result<U, E>>,
    E: Retryable + Debug + 'static,
{
    let mut num_attempts = 0;

    loop {
        let response = f().await;

        let error = match response {
            Ok(response) => {
                return Ok(response);
            }
            Err(error) => error,
        };
        if !error.is_retryable() {
            return Err(error);
        }
        num_attempts += 1;

        if num_attempts >= retry_params.max_attempts {
            warn!(
                num_attempts=%num_attempts,
                "request failed"
            );
            return Err(error);
        }
        let delay = retry_params.compute_delay(num_attempts);
        debug!(
            num_attempts=%num_attempts,
            delay_ms=%delay.as_millis(),
            error=?error,
            "request failed, retrying"
        );
        mockable_sleep.sleep(delay).await;
    }
}

pub async fn retry<U, E, Fut>(retry_params: &RetryParams, f: impl Fn() -> Fut) -> Result<U, E>
where
    Fut: Future<Output = Result<U, E>>,
    E: Retryable + Debug + 'static,
{
    retry_with_mockable_sleep(retry_params, f, TokioSleep).await
}

#[cfg(test)]
mod tests {
    use std::sync::RwLock;
    use std::time::Duration;

    use futures::future::ready;

    use super::{MockableSleep, RetryParams, Retryable, retry_with_mockable_sleep};

    #[derive(Debug, Eq, PartialEq)]
    pub enum Retry<E> {
        Permanent(E),
        Transient(E),
    }

    impl<E> Retryable for Retry<E> {
        fn is_retryable(&self) -> bool {
            match self {
                Retry::Permanent(_) => false,
                Retry::Transient(_) => true,
            }
        }
    }

    struct NoopSleep;

    #[async_trait::async_trait]
    impl MockableSleep for NoopSleep {
        async fn sleep(&self, _duration: Duration) {
            // This is a no-op implementation, so we do nothing here.
        }
    }

    async fn simulate_retries<T>(values: Vec<Result<T, Retry<usize>>>) -> Result<T, Retry<usize>> {
        let noop_mock = NoopSleep;
        let values_it = RwLock::new(values.into_iter());
        retry_with_mockable_sleep(
            &RetryParams {
                base_delay: Duration::from_millis(1),
                max_delay: Duration::from_millis(2),
                max_attempts: 30,
            },
            || ready(values_it.write().unwrap().next().unwrap()),
            noop_mock,
        )
        .await
    }

    #[tokio::test]
    async fn test_retry_accepts_ok() {
        assert_eq!(simulate_retries(vec![Ok(())]).await, Ok(()));
    }

    #[tokio::test]
    async fn test_retry_does_retry() {
        assert_eq!(
            simulate_retries(vec![Err(Retry::Transient(1)), Ok(())]).await,
            Ok(())
        );
    }

    #[tokio::test]
    async fn test_retry_stops_retrying_on_non_retryable_error() {
        assert_eq!(
            simulate_retries(vec![Err(Retry::Permanent(1)), Ok(())]).await,
            Err(Retry::Permanent(1))
        );
    }

    #[tokio::test]
    async fn test_retry_retries_up_at_most_attempts_times() {
        let retry_sequence: Vec<_> = (0..30)
            .map(|retry_id| Err(Retry::Transient(retry_id)))
            .chain(Some(Ok(())))
            .collect();
        assert_eq!(
            simulate_retries(retry_sequence).await,
            Err(Retry::Transient(29))
        );
    }

    #[tokio::test]
    async fn test_retry_retries_up_to_max_attempts_times() {
        let retry_sequence: Vec<_> = (0..29)
            .map(|retry_id| Err(Retry::Transient(retry_id)))
            .chain(Some(Ok(())))
            .collect();
        assert_eq!(simulate_retries(retry_sequence).await, Ok(()));
    }

    fn test_retry_delay_does_not_overflow_aux(retry_params: RetryParams) {
        for i in 1..100 {
            let delay = retry_params.compute_delay(i);
            assert!(delay <= retry_params.max_delay);
            if retry_params.base_delay <= retry_params.max_delay {
                assert!(delay * 2 >= retry_params.base_delay);
            }
        }
    }

    proptest::proptest! {
        #[test]
        fn test_retry_delay_does_not_overflow(
            max_attempts in 1..1_000usize,
            base_delay in 0..1_000u64,
            max_delay in 0..60_000u64,
        ) {
            let retry_params = RetryParams {
                max_attempts,
                base_delay: Duration::from_millis(base_delay),
                max_delay: Duration::from_millis(max_delay),
            };
            test_retry_delay_does_not_overflow_aux(retry_params);
        }
    }
}


================================================
FILE: quickwit/quickwit-common/src/ring_buffer.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::fmt::{Debug, Formatter};

/// Fixed-size buffer that keeps the last N elements pushed into it.
///
/// `head` is the write cursor. It advances by one on each push and wraps
/// back to 0 when it reaches N, overwriting the oldest element.
///
/// ```text
/// RingBuffer<u32, 4> after pushing 1, 2, 3, 4, 5, 6:
///
///   buffer = [5, 6, 3, 4]    head = 2    len = 4
///                 ^
///                 next write goes here
///
///   logical view (oldest → newest): [3, 4, 5, 6]
/// ```
pub struct RingBuffer<T: Copy + Default, const N: usize> {
    buffer: [T; N],
    head: usize,
    len: usize,
}

impl<T: Copy + Default, const N: usize> Default for RingBuffer<T, N> {
    fn default() -> Self {
        Self {
            buffer: [T::default(); N],
            head: 0,
            len: 0,
        }
    }
}

impl<T: Copy + Default + Debug, const N: usize> Debug for RingBuffer<T, N> {
    fn fmt(&self, f: &mut Formatter<'_>) -> std::fmt::Result {
        f.debug_list().entries(self.iter()).finish()
    }
}

impl<T: Copy + Default, const N: usize> RingBuffer<T, N> {
    pub fn push_back(&mut self, value: T) {
        self.buffer[self.head] = value;
        self.head = (self.head + 1) % N;
        if self.len < N {
            self.len += 1;
        }
    }

    pub fn last(&self) -> Option<T> {
        if self.len == 0 {
            return None;
        }
        Some(self.buffer[(self.head + N - 1) % N])
    }

    pub fn front(&self) -> Option<T> {
        if self.len == 0 {
            return None;
        }
        Some(self.buffer[(self.head + N - self.len) % N])
    }

    pub fn len(&self) -> usize {
        self.len
    }

    pub fn is_empty(&self) -> bool {
        self.len == 0
    }

    pub fn iter(&self) -> impl Iterator<Item = &T> + '_ {
        let start = (self.head + N - self.len) % N;
        (0..self.len).map(move |i| &self.buffer[(start + i) % N])
    }
}

#[cfg(test)]
mod tests {
    use super::*;

    #[test]
    fn test_empty() {
        let rb = RingBuffer::<u32, 4>::default();
        assert!(rb.is_empty());
        assert_eq!(rb.len(), 0);
        assert_eq!(rb.last(), None);
        assert_eq!(rb.front(), None);
        assert_eq!(rb.iter().count(), 0);
    }

    #[test]
    fn test_single_push() {
        let mut rb = RingBuffer::<u32, 4>::default();
        rb.push_back(10);
        assert_eq!(rb.len(), 1);
        assert!(!rb.is_empty());
        assert_eq!(rb.last(), Some(10));
        assert_eq!(rb.front(), Some(10));
        assert_eq!(rb.iter().copied().collect::<Vec<_>>(), vec![10]);
    }

    #[test]
    fn test_partial_fill() {
        let mut rb = RingBuffer::<u32, 4>::default();
        rb.push_back(1);
        rb.push_back(2);
        rb.push_back(3);
        assert_eq!(rb.len(), 3);
        assert_eq!(rb.last(), Some(3));
        assert_eq!(rb.front(), Some(1));
        assert_eq!(rb.iter().copied().collect::<Vec<_>>(), vec![1, 2, 3]);
    }

    #[test]
    fn test_exactly_full() {
        let mut rb = RingBuffer::<u32, 4>::default();
        for i in 1..=4 {
            rb.push_back(i);
        }
        assert_eq!(rb.len(), 4);
        assert_eq!(rb.last(), Some(4));
        assert_eq!(rb.front(), Some(1));
        assert_eq!(rb.iter().copied().collect::<Vec<_>>(), vec![1, 2, 3, 4]);
    }

    #[test]
    fn test_wrap_around() {
        let mut rb = RingBuffer::<u32, 4>::default();
        for i in 1..=6 {
            rb.push_back(i);
        }
        assert_eq!(rb.len(), 4);
        assert_eq!(rb.last(), Some(6));
        assert_eq!(rb.front(), Some(3));
        assert_eq!(rb.iter().copied().collect::<Vec<_>>(), vec![3, 4, 5, 6]);
    }

    #[test]
    fn test_many_wraps() {
        let mut rb = RingBuffer::<u32, 3>::default();
        for i in 1..=100 {
            rb.push_back(i);
        }
        assert_eq!(rb.len(), 3);
        assert_eq!(rb.last(), Some(100));
        assert_eq!(rb.front(), Some(98));
        assert_eq!(rb.iter().copied().collect::<Vec<_>>(), vec![98, 99, 100]);
    }

    #[test]
    fn test_debug() {
        let mut rb = RingBuffer::<u32, 3>::default();
        rb.push_back(1);
        rb.push_back(2);
        assert_eq!(format!("{:?}", rb), "[1, 2]");
    }
}


================================================
FILE: quickwit/quickwit-common/src/runtimes.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::HashMap;
use std::sync::atomic::{AtomicUsize, Ordering};
use std::time::Duration;

use once_cell::sync::OnceCell;
use prometheus::{Gauge, IntCounter, IntGauge};
use tokio::runtime::Runtime;
use tokio_metrics::{RuntimeMetrics, RuntimeMonitor};

use crate::metrics::{new_counter, new_float_gauge, new_gauge};

static RUNTIMES: OnceCell<HashMap<RuntimeType, tokio::runtime::Runtime>> = OnceCell::new();

/// Describes which runtime an actor should run on.
#[derive(Clone, Copy, Debug, Hash, Eq, PartialEq)]
pub enum RuntimeType {
    /// The blocking runtime runs blocking actors.
    /// This runtime is only used as a nice thread pool with
    /// the interface as tokio stasks.
    ///
    /// This runtime should not be used to run tokio
    /// io operations.
    ///
    /// Tasks are allowed to block for an arbitrary amount of time.
    Blocking,

    /// The non-blocking runtime is closer to what one would expect from
    /// a regular tokio runtime.
    ///
    /// Task are expect to yield within 500 micros.
    NonBlocking,
}

#[derive(Debug, Clone, Copy)]
pub struct RuntimesConfig {
    /// Number of worker threads allocated to the non-blocking runtime.
    pub num_threads_non_blocking: usize,
    /// Number of worker threads allocated to the blocking runtime.
    pub num_threads_blocking: usize,
}

impl RuntimesConfig {
    #[cfg(any(test, feature = "testsuite"))]
    pub fn light_for_tests() -> RuntimesConfig {
        RuntimesConfig {
            num_threads_blocking: 1,
            num_threads_non_blocking: 1,
        }
    }

    pub fn with_num_cpus(num_cpus: usize) -> Self {
        // Non blocking task are supposed to be io intensive, and not require many threads.
        // On the other hand the blocking actors are cpu intensive. We allocate
        // almost all of the threads to them.
        match num_cpus {
            0..=3 => {
                // We do not have enough vCPUs to allocate a full thread to
                // non-blocking.
                RuntimesConfig {
                    num_threads_non_blocking: 1,
                    num_threads_blocking: num_cpus,
                }
            }
            4..=6 => RuntimesConfig {
                num_threads_non_blocking: 1,
                num_threads_blocking: num_cpus - 1,
            },
            7.. => RuntimesConfig {
                num_threads_non_blocking: 2,
                num_threads_blocking: num_cpus - 2,
            },
        }
    }
}

impl Default for RuntimesConfig {
    fn default() -> Self {
        let num_cpus = crate::num_cpus();
        Self::with_num_cpus(num_cpus)
    }
}

fn start_runtimes(config: RuntimesConfig) -> HashMap<RuntimeType, Runtime> {
    let mut runtimes = HashMap::with_capacity(2);

    let disable_lifo_slot = crate::get_bool_from_env("QW_DISABLE_TOKIO_LIFO_SLOT", true);

    let mut blocking_runtime_builder = tokio::runtime::Builder::new_multi_thread();
    if disable_lifo_slot {
        blocking_runtime_builder.disable_lifo_slot();
    }
    let blocking_runtime = blocking_runtime_builder
        .worker_threads(config.num_threads_blocking)
        .thread_name_fn(|| {
            static ATOMIC_ID: AtomicUsize = AtomicUsize::new(0);
            let id = ATOMIC_ID.fetch_add(1, Ordering::AcqRel);
            format!("blocking-{id}")
        })
        .enable_all()
        .build()
        .unwrap();

    scrape_tokio_runtime_metrics(blocking_runtime.handle(), "blocking");
    runtimes.insert(RuntimeType::Blocking, blocking_runtime);

    let non_blocking_runtime = tokio::runtime::Builder::new_multi_thread()
        .worker_threads(config.num_threads_non_blocking)
        .thread_name_fn(|| {
            static ATOMIC_ID: AtomicUsize = AtomicUsize::new(0);
            let id = ATOMIC_ID.fetch_add(1, Ordering::AcqRel);
            format!("non-blocking-{id}")
        })
        .enable_all()
        .build()
        .unwrap();

    scrape_tokio_runtime_metrics(non_blocking_runtime.handle(), "non_blocking");
    runtimes.insert(RuntimeType::NonBlocking, non_blocking_runtime);

    runtimes
}

pub fn initialize_runtimes(runtimes_config: RuntimesConfig) -> anyhow::Result<()> {
    RUNTIMES.get_or_init(|| start_runtimes(runtimes_config));
    Ok(())
}

impl RuntimeType {
    pub fn get_runtime_handle(self) -> tokio::runtime::Handle {
        RUNTIMES
            .get_or_init(|| {
                #[cfg(any(test, feature = "testsuite"))]
                {
                    tracing::warn!("starting Tokio actor runtimes for tests");
                    start_runtimes(RuntimesConfig::light_for_tests())
                }
                #[cfg(not(any(test, feature = "testsuite")))]
                {
                    panic!("Tokio runtimes not initialized. Please, report this issue on GitHub: https://github.com/quickwit-oss/quickwit/issues.");
                }
            })
            .get(&self)
            .unwrap()
            .handle()
            .clone()
    }
}

/// Spawns a background task
pub fn scrape_tokio_runtime_metrics(handle: &tokio::runtime::Handle, label: &'static str) {
    let runtime_monitor = RuntimeMonitor::new(handle);
    handle.spawn(async move {
        let mut interval = tokio::time::interval(Duration::from_secs(1));
        let mut prometheus_runtime_metrics = PrometheusRuntimeMetrics::new(label);

        for tokio_runtime_metrics in runtime_monitor.intervals() {
            interval.tick().await;
            prometheus_runtime_metrics.update(&tokio_runtime_metrics);
        }
    });
}

struct PrometheusRuntimeMetrics {
    scheduled_tasks: IntGauge,
    worker_busy_duration_milliseconds_total: IntCounter,
    worker_busy_ratio: Gauge,
    worker_threads: IntGauge,
}

impl PrometheusRuntimeMetrics {
    pub fn new(label: &'static str) -> Self {
        Self {
            scheduled_tasks: new_gauge(
                "tokio_scheduled_tasks",
                "The total number of tasks currently scheduled in workers' local queues.",
                "runtime",
                &[("runtime_type", label)],
            ),
            worker_busy_duration_milliseconds_total: new_counter(
                "tokio_worker_busy_duration_milliseconds_total",
                " The total amount of time worker threads were busy.",
                "runtime",
                &[("runtime_type", label)],
            ),
            worker_busy_ratio: new_float_gauge(
                "tokio_worker_busy_ratio",
                "The ratio of time worker threads were busy since the last time runtime metrics \
                 were collected.",
                "runtime",
                &[("runtime_type", label)],
            ),
            worker_threads: new_gauge(
                "tokio_worker_threads",
                "The number of worker threads used by the runtime.",
                "runtime",
                &[("runtime_type", label)],
            ),
        }
    }

    pub fn update(&mut self, runtime_metrics: &RuntimeMetrics) {
        self.scheduled_tasks
            .set(runtime_metrics.total_local_queue_depth as i64);
        self.worker_busy_duration_milliseconds_total
            .inc_by(runtime_metrics.total_busy_duration.as_millis() as u64);
        self.worker_busy_ratio.set(runtime_metrics.busy_ratio());
        self.worker_threads
            .set(runtime_metrics.workers_count as i64);
    }
}

#[cfg(test)]
mod tests {
    use super::*;

    #[test]
    fn test_runtimes_config_default() {
        let runtime_default = RuntimesConfig::default();
        assert!(runtime_default.num_threads_non_blocking <= runtime_default.num_threads_blocking);
        assert!(runtime_default.num_threads_non_blocking <= 2);
    }

    #[test]
    fn test_runtimes_with_given_num_cpus_10() {
        let runtime = RuntimesConfig::with_num_cpus(10);
        assert_eq!(runtime.num_threads_blocking, 8);
        assert_eq!(runtime.num_threads_non_blocking, 2);
    }

    #[test]
    fn test_runtimes_with_given_num_cpus_3() {
        let runtime = RuntimesConfig::with_num_cpus(3);
        assert_eq!(runtime.num_threads_blocking, 3);
        assert_eq!(runtime.num_threads_non_blocking, 1);
    }
}


================================================
FILE: quickwit/quickwit-common/src/shared_consts.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::sync::OnceLock;
use std::time::Duration;

use bytesize::ByteSize;
use tracing::warn;

/// Field name reserved for storing the dynamically indexed fields.
pub const FIELD_PRESENCE_FIELD_NAME: &str = "_field_presence";

pub const MINIMUM_DELETION_GRACE_PERIOD: Duration = Duration::from_secs(5 * 60); // 5mn
const MAXIMUM_DELETION_GRACE_PERIOD: Duration = Duration::from_secs(2 * 24 * 3600); // 2 days

/// We cannot safely delete splits right away as a:
/// - in-flight queries could actually have selected this split,
/// - scroll queries may also have a point in time on these splits.
///
/// We deal this probably by introducing a grace period. A split is first marked as delete,
/// and hence won't be selected for search. After a few minutes, once it reasonably safe to assume
/// that all queries involving this split have terminated, we effectively delete the split.
/// This duration is controlled by `DELETION_GRACE_PERIOD`.
pub fn split_deletion_grace_period() -> Duration {
    const DEFAULT_DELETION_GRACE_PERIOD: Duration = Duration::from_secs(60 * 32); // 32 min

    static SPLIT_DELETION_GRACE_PERIOD_SECS_LOCK: OnceLock<Duration> = std::sync::OnceLock::new();
    *SPLIT_DELETION_GRACE_PERIOD_SECS_LOCK.get_or_init(|| {
        let deletion_grace_period_secs: u64 = crate::get_from_env(
            "QW_SPLIT_DELETION_GRACE_PERIOD_SECS",
            DEFAULT_DELETION_GRACE_PERIOD.as_secs(),
            false,
        );
        let deletion_grace_period_secs_clamped: u64 = deletion_grace_period_secs.clamp(
            MINIMUM_DELETION_GRACE_PERIOD.as_secs(),
            MAXIMUM_DELETION_GRACE_PERIOD.as_secs(),
        );
        if deletion_grace_period_secs_clamped != deletion_grace_period_secs {
            warn!(
                "The deletion grace period is clamped to {} seconds. The provided value was {} \
                 seconds.",
                deletion_grace_period_secs_clamped, deletion_grace_period_secs
            );
        }
        Duration::from_secs(deletion_grace_period_secs_clamped)
    })
}

/// In order to amortized search with scroll, we fetch more documents than are
/// being requested.
pub const SCROLL_BATCH_LEN: usize = 1_000;

/// Key prefix used in chitchat to broadcast the list of primary shards hosted by a leader.
pub const INGESTER_PRIMARY_SHARDS_PREFIX: &str = "ingester.primary_shards:";

/// Key used in chitchat to broadcast the status of an ingester.
pub const INGESTER_STATUS_KEY: &str = "ingester.status";

/// Prefix used in chitchat to broadcast per-source ingester capacity scores and open shard counts.
pub const INGESTER_CAPACITY_SCORE_PREFIX: &str = "ingester.capacity_score:";

/// File name for the encoded list of fields in the split
pub const SPLIT_FIELDS_FILE_NAME: &str = "split_fields";

/// More or less the indexing throughput of a core
/// i.e. PIPELINE_THROUGHPUT / PIPELINE_FULL_CAPACITY
pub const DEFAULT_SHARD_THROUGHPUT_LIMIT: ByteSize = ByteSize::mib(5);
/// Large enough to absorb small bursts but should remain defensive against unbalanced shards.
pub const DEFAULT_SHARD_BURST_LIMIT: ByteSize = ByteSize::mib(50);

/// A compromise between "exponential" scale up and moderate shard count increase.
pub const DEFAULT_SHARD_SCALE_UP_FACTOR: f32 = 1.5;

// (Just a reexport).
pub use bytesize::MIB;


================================================
FILE: quickwit/quickwit-common/src/socket_addr_legacy_hash.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::hash::Hasher;
use std::net::SocketAddr;

/// Computes the hash of socket addr, the way it was done before Rust 1.81
///
/// In <https://github.com/rust-lang/rust/commit/ba620344301aaa3b2733575a0696cdfd877edbdf>
/// rustc change the implementation of Hash for IpAddr v4 and v6.
///
/// The idea was to not hash an array of bytes but instead interpret it as a register
/// and hash this.
///
/// This was done for performance reason, but this change the result of the hash function
/// used to compute affinity in quickwit. As a result, the switch would invalidate all
/// existing cache.
///
/// In order to avoid this, we introduce the following function that reproduces the old
/// behavior.
#[repr(transparent)]
#[derive(Debug, Eq, PartialEq, Copy, Clone)]
pub struct SocketAddrLegacyHash<'a>(pub &'a SocketAddr);

impl std::hash::Hash for SocketAddrLegacyHash<'_> {
    fn hash<H: Hasher>(&self, state: &mut H) {
        std::mem::discriminant(self.0).hash(state);
        match self.0 {
            SocketAddr::V4(socket_addr_v4) => {
                socket_addr_v4.ip().octets().hash(state);
                socket_addr_v4.port().hash(state);
            }
            SocketAddr::V6(socket_addr_v6) => {
                socket_addr_v6.ip().octets().hash(state);
                socket_addr_v6.port().hash(state);
                socket_addr_v6.flowinfo().hash(state);
                socket_addr_v6.scope_id().hash(state);
            }
        }
    }
}

#[cfg(test)]
mod tests {
    use std::net::SocketAddrV6;

    use super::*;

    fn sample_socket_addr_v4() -> SocketAddr {
        "17.12.15.3:1834".parse().unwrap()
    }

    fn sample_socket_addr_v6() -> SocketAddr {
        let mut socket_addr_v6: SocketAddrV6 = "[fe80::240:63ff:fede:3c19]:8080".parse().unwrap();
        socket_addr_v6.set_scope_id(4047u32);
        socket_addr_v6.set_flowinfo(303u32);
        socket_addr_v6.into()
    }

    fn compute_hash(hashable: impl std::hash::Hash) -> u64 {
        // I wish I could have used the sip hasher but we don't have the deps here and I did
        // not want to move that code to quickwit-common.
        //
        // If test break because rust changed its default hasher, we can just update the tests in
        // this file with the new values.
        let mut hasher = siphasher::sip::SipHasher::default();
        hashable.hash(&mut hasher);
        hasher.finish()
    }

    #[test]
    fn test_legacy_hash_socket_addr_v4() {
        let h = compute_hash(SocketAddrLegacyHash(&sample_socket_addr_v4()));
        // This value is coming from using rust 1.80 to hash socket addr
        assert_eq!(h, 8725442259486497862);
    }

    #[test]
    fn test_legacy_hash_socket_addr_v6() {
        let h = compute_hash(SocketAddrLegacyHash(&sample_socket_addr_v6()));
        // This value is coming from using rust 1.80 to hash socket addr
        assert_eq!(h, 14277248675058176752);
    }
}


================================================
FILE: quickwit/quickwit-common/src/sorted_iter.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::cmp::Ordering;
use std::collections::{btree_map, btree_set};
use std::iter::Peekable;

/// Marks sorted iterators, typically iterators over [`btree_set::BTreeSet`] and
/// [`btree_map::BTreeMap`].
trait Sorted {}

/// Defines helper methods on sorted iterators.
pub trait SortedIterator: Iterator + Sized {
    /// Compares two sorted iterators and returns the diff.
    fn diff<U>(self, other: U) -> DiffIterator<Self, U>
    where U: SortedIterator<Item = Self::Item> {
        DiffIterator {
            left: self.peekable(),
            right: other.peekable(),
        }
    }
}

#[derive(Debug, Eq, PartialEq)]
pub enum Diff<K> {
    Added(K),
    Unchanged(K),
    Removed(K),
}

pub struct DiffIterator<T: Iterator, U: Iterator> {
    left: Peekable<T>,
    right: Peekable<U>,
}

impl<T, U, K> Iterator for DiffIterator<T, U>
where
    T: Iterator<Item = K>,
    U: Iterator<Item = K>,
    K: Ord,
{
    type Item = Diff<K>;

    fn next(&mut self) -> Option<Self::Item> {
        match (self.left.peek(), self.right.peek()) {
            (Some(left), Some(right)) => match left.cmp(right) {
                Ordering::Less => {
                    let left = self
                        .left
                        .next()
                        .expect("The left iterator should not be empty.");
                    Some(Diff::Removed(left))
                }
                Ordering::Equal => {
                    let left = self
                        .left
                        .next()
                        .expect("The left iterator should not be empty.");
                    self.right.next();
                    Some(Diff::Unchanged(left))
                }
                Ordering::Greater => {
                    let right = self
                        .right
                        .next()
                        .expect("The right iterator should not be empty.");
                    Some(Diff::Added(right))
                }
            },
            (Some(_), None) => {
                let left = self
                    .left
                    .next()
                    .expect("The left iterator should not be empty.");
                Some(Diff::Removed(left))
            }
            (None, Some(_)) => {
                let right = self
                    .right
                    .next()
                    .expect("The right iterator should not be empty.");
                Some(Diff::Added(right))
            }
            (None, None) => None,
        }
    }
}

impl<T> SortedIterator for T where T: Iterator + Sorted {}

impl<K, V> Sorted for btree_map::IntoKeys<K, V> {}
impl<K, V> Sorted for btree_map::IntoValues<K, V> {}
impl<K, V> Sorted for btree_map::Keys<'_, K, V> {}
impl<K, V> Sorted for btree_map::Values<'_, K, V> {}
impl<K> Sorted for btree_set::IntoIter<K> {}
impl<K> Sorted for btree_set::Iter<'_, K> {}

/// Same as [`SortedIterator`] but for (key, value) pairs sorted by key.
pub trait SortedByKeyIterator<K, V>: Iterator + Sized {
    /// Compares the keys of two sorted key-value iterators and returns the diff.
    fn diff_by_key<U, W>(self, other: U) -> DiffByKeyIterator<Self, U>
    where U: SortedByKeyIterator<K, W> {
        DiffByKeyIterator {
            left: self.peekable(),
            right: other.peekable(),
        }
    }
}

#[derive(Debug, Eq, PartialEq)]
pub enum KeyDiff<K, V, W> {
    Added(K, W),
    Unchanged(K, V, W),
    Removed(K, V),
}

pub struct DiffByKeyIterator<T: Iterator, U: Iterator> {
    left: Peekable<T>,
    right: Peekable<U>,
}

impl<T, U, K, V, W> Iterator for DiffByKeyIterator<T, U>
where
    T: Iterator<Item = (K, V)>,
    U: Iterator<Item = (K, W)>,
    K: Ord,
{
    type Item = KeyDiff<K, V, W>;

    fn next(&mut self) -> Option<Self::Item> {
        match (self.left.peek(), self.right.peek()) {
            (Some((left_key, _)), Some((right_key, _))) => match left_key.cmp(right_key) {
                Ordering::Less => {
                    let (left_key, left_value) = self
                        .left
                        .next()
                        .expect("The left iterator should not be empty.");
                    Some(KeyDiff::Removed(left_key, left_value))
                }
                Ordering::Equal => {
                    let (left_key, left_value) = self
                        .left
                        .next()
                        .expect("The left iterator should not be empty.");
                    let (_, right_value) = self
                        .right
                        .next()
                        .expect("The right iterator should not be empty.");
                    Some(KeyDiff::Unchanged(left_key, left_value, right_value))
                }
                Ordering::Greater => {
                    let (right_key, right_value) = self
                        .right
                        .next()
                        .expect("The right iterator should not be empty.");
                    Some(KeyDiff::Added(right_key, right_value))
                }
            },
            (Some(_), None) => {
                let (left_key, left_value) = self
                    .left
                    .next()
                    .expect("The left iterator should not be empty.");
                Some(KeyDiff::Removed(left_key, left_value))
            }
            (None, Some(_)) => {
                let (right_key, right_value) = self
                    .right
                    .next()
                    .expect("The right iterator should not be empty.");
                Some(KeyDiff::Added(right_key, right_value))
            }
            (None, None) => None,
        }
    }
}

impl<T, K, V> SortedByKeyIterator<K, V> for T where T: Iterator<Item = (K, V)> + Sorted {}

impl<K, V> Sorted for btree_map::IntoIter<K, V> {}
impl<K, V> Sorted for btree_map::Iter<'_, K, V> {}

#[cfg(test)]
mod tests {
    use std::collections::{BTreeMap, BTreeSet};

    use super::*;

    #[test]
    fn test_diff() {
        {
            let left: BTreeSet<u64> = Vec::new().into_iter().collect();
            let right: BTreeSet<u64> = Vec::new().into_iter().collect();
            let diff: Vec<_> = left.iter().diff(right.iter()).collect();
            assert_eq!(diff, Vec::new());
        }
        {
            let left: BTreeSet<_> = vec![1].into_iter().collect();
            let right: BTreeSet<_> = Vec::new().into_iter().collect();
            let diff: Vec<_> = left.iter().diff(right.iter()).collect();
            assert_eq!(diff, vec![Diff::Removed(&1)]);
        }
        {
            let left: BTreeSet<_> = Vec::new().into_iter().collect();
            let right: BTreeSet<_> = vec![1].into_iter().collect();
            let diff: Vec<_> = left.iter().diff(right.iter()).collect();
            assert_eq!(diff, vec![Diff::Added(&1)]);
        }
        {
            let left: BTreeSet<_> = vec![1].into_iter().collect();
            let right: BTreeSet<_> = vec![1].into_iter().collect();
            let diff: Vec<_> = left.iter().diff(right.iter()).collect();
            assert_eq!(diff, vec![Diff::Unchanged(&1)]);
        }
        {
            let left: BTreeSet<_> = vec![1, 3, 5, 7].into_iter().collect();
            let right: BTreeSet<_> = vec![2, 4, 5, 6].into_iter().collect();
            let diff: Vec<_> = left.iter().diff(right.iter()).collect();
            assert_eq!(
                diff,
                vec![
                    Diff::Removed(&1),
                    Diff::Added(&2),
                    Diff::Removed(&3),
                    Diff::Added(&4),
                    Diff::Unchanged(&5),
                    Diff::Added(&6),
                    Diff::Removed(&7),
                ]
            );
        }
    }

    #[test]
    fn test_diff_by_key() {
        {
            let left: BTreeMap<u64, u64> = Vec::new().into_iter().collect();
            let right: BTreeMap<u64, u64> = Vec::new().into_iter().collect();
            let key_diff: Vec<_> = left.iter().diff_by_key(right.iter()).collect();
            assert_eq!(key_diff, Vec::new());
        }
        {
            let left: BTreeMap<_, _> = vec![(1, 1)].into_iter().collect();
            let right: BTreeMap<_, &'static str> = Vec::new().into_iter().collect();
            let key_diff: Vec<_> = left.iter().diff_by_key(right.iter()).collect();
            assert_eq!(key_diff, vec![KeyDiff::Removed(&1, &1)]);
        }
        {
            let left: BTreeMap<_, usize> = Vec::new().into_iter().collect();
            let right: BTreeMap<_, _> = vec![(1, "a")].into_iter().collect();
            let key_diff: Vec<_> = left.iter().diff_by_key(right.iter()).collect();
            assert_eq!(key_diff, vec![KeyDiff::Added(&1, &"a")]);
        }
        {
            let left: BTreeMap<_, _> = vec![(1, 11)].into_iter().collect();
            let right: BTreeMap<_, _> = vec![(1, "a")].into_iter().collect();
            let key_diff: Vec<_> = left.iter().diff_by_key(right.iter()).collect();
            assert_eq!(key_diff, vec![KeyDiff::Unchanged(&1, &11, &"a")]);
        }
        {
            let left: BTreeMap<_, _> = vec![(1, 1), (3, 3), (5, 5), (7, 7)].into_iter().collect();
            let right: BTreeMap<_, _> = vec![(2, "b"), (4, "d"), (5, "e"), (6, "f")]
                .into_iter()
                .collect();
            let key_diff: Vec<_> = left.iter().diff_by_key(right.iter()).collect();
            assert_eq!(
                key_diff,
                vec![
                    KeyDiff::Removed(&1, &1),
                    KeyDiff::Added(&2, &"b"),
                    KeyDiff::Removed(&3, &3),
                    KeyDiff::Added(&4, &"d"),
                    KeyDiff::Unchanged(&5, &5, &"e"),
                    KeyDiff::Added(&6, &"f"),
                    KeyDiff::Removed(&7, &7),
                ]
            );
        }
    }
}


================================================
FILE: quickwit/quickwit-common/src/stream_utils.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::any::TypeId;
use std::fmt;
use std::pin::Pin;

use bytesize::ByteSize;
use futures::{Stream, StreamExt, TryStreamExt, stream};
use prometheus::IntGauge;
use tokio::sync::{mpsc, watch};
use tokio_stream::wrappers::{ReceiverStream, UnboundedReceiverStream, WatchStream};
use tracing::warn;

use crate::metrics::GaugeGuard;
use crate::tower::RpcName;

pub type BoxStream<T> = Pin<Box<dyn Stream<Item = T> + Send + Unpin + 'static>>;

/// A stream impl for code-generated services with streaming endpoints.
pub struct ServiceStream<T> {
    inner: BoxStream<T>,
}

impl<T> ServiceStream<T>
where T: Send + 'static
{
    pub fn new(inner: BoxStream<T>) -> Self {
        Self { inner }
    }

    pub fn empty() -> Self {
        Self {
            inner: Box::pin(stream::empty()),
        }
    }

    pub fn map<F, U>(self, f: F) -> ServiceStream<U>
    where
        F: FnMut(T) -> U + Send + 'static,
        U: Send + 'static,
    {
        ServiceStream {
            inner: Box::pin(self.inner.map(f)),
        }
    }
}

impl<T> fmt::Debug for ServiceStream<T>
where T: 'static
{
    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
        write!(f, "ServiceStream<{:?}>", TypeId::of::<T>())
    }
}

impl<T> Unpin for ServiceStream<T> {}

impl<T> ServiceStream<T>
where T: Send + 'static
{
    pub fn new_bounded(capacity: usize) -> (mpsc::Sender<T>, Self) {
        let (sender, receiver) = mpsc::channel(capacity);
        (sender, receiver.into())
    }

    pub fn new_bounded_with_gauge(
        capacity: usize,
        gauge: &'static IntGauge,
    ) -> (TrackedSender<T>, Self) {
        let (sender, receiver) = mpsc::channel(capacity);
        let tracked_sender = TrackedSender { sender, gauge };
        let receiver_stream =
            ReceiverStream::new(receiver).map(|value: InFlightValue<T>| value.into_inner());
        let service_stream = Self {
            inner: Box::pin(receiver_stream),
        };
        (tracked_sender, service_stream)
    }

    pub fn new_unbounded() -> (mpsc::UnboundedSender<T>, Self) {
        let (sender, receiver) = mpsc::unbounded_channel();
        (sender, receiver.into())
    }

    pub fn new_unbounded_with_gauge(gauge: &'static IntGauge) -> (TrackedUnboundedSender<T>, Self) {
        let (sender, receiver) = mpsc::unbounded_channel();
        let tracked_sender = TrackedUnboundedSender { sender, gauge };
        let receiver_stream = UnboundedReceiverStream::new(receiver)
            .map(|value: InFlightValue<T>| value.into_inner());
        let service_stream = Self {
            inner: Box::pin(receiver_stream),
        };
        (tracked_sender, service_stream)
    }
}

impl<T> ServiceStream<T>
where T: Clone + Send + Sync + 'static
{
    pub fn new_watch(init: T) -> (watch::Sender<T>, Self) {
        let (sender, receiver) = watch::channel(init);
        (sender, receiver.into())
    }
}

impl<T, E> ServiceStream<Result<T, E>>
where
    T: Send + 'static,
    E: Send + 'static,
{
    pub fn map_err<F, U>(self, f: F) -> ServiceStream<Result<T, U>>
    where
        F: FnMut(E) -> U + Send + 'static,
        U: Send + 'static,
    {
        ServiceStream {
            inner: Box::pin(self.inner.map_err(f)),
        }
    }
}

impl<T> Stream for ServiceStream<T> {
    type Item = T;

    fn poll_next(
        mut self: std::pin::Pin<&mut Self>,
        cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Option<Self::Item>> {
        Pin::new(&mut self.inner).poll_next(cx)
    }
}

impl<T> From<mpsc::Receiver<T>> for ServiceStream<T>
where T: Send + 'static
{
    fn from(receiver: mpsc::Receiver<T>) -> Self {
        Self {
            inner: Box::pin(ReceiverStream::new(receiver)),
        }
    }
}

impl<T> From<mpsc::UnboundedReceiver<T>> for ServiceStream<T>
where T: Send + 'static
{
    fn from(receiver: mpsc::UnboundedReceiver<T>) -> Self {
        Self {
            inner: Box::pin(UnboundedReceiverStream::new(receiver)),
        }
    }
}

impl<T> From<watch::Receiver<T>> for ServiceStream<T>
where T: Clone + Send + Sync + 'static
{
    fn from(receiver: watch::Receiver<T>) -> Self {
        Self {
            inner: Box::pin(WatchStream::new(receiver)),
        }
    }
}

/// Adapts a server-side tonic::Streaming into a ServiceStream of `Result<T, tonic::Status>`. Once
/// an error is encountered, the stream will be closed and subsequent calls to `poll_next` will
/// return `None`.
impl<T> From<tonic::Streaming<T>> for ServiceStream<Result<T, tonic::Status>>
where T: Send + 'static
{
    fn from(streaming: tonic::Streaming<T>) -> Self {
        Self {
            inner: Box::pin(streaming),
        }
    }
}

/// Adapts a client-side tonic::Streaming into a ServiceStream of `T`. Once an error is encountered,
/// the stream will be closed and subsequent calls to `poll_next` will return `None`.
impl<T> From<tonic::Streaming<T>> for ServiceStream<T>
where T: Send + 'static
{
    fn from(streaming: tonic::Streaming<T>) -> Self {
        let message_stream = stream::unfold(streaming, |mut streaming| {
            Box::pin(async {
                match streaming.message().await {
                    Ok(Some(message)) => Some((message, streaming)),
                    Ok(None) => None,
                    Err(error) => {
                        warn!(error=?error, "gRPC transport error");
                        None
                    }
                }
            })
        });
        Self {
            inner: Box::pin(message_stream),
        }
    }
}

#[cfg(any(test, feature = "testsuite"))]
impl<T> From<Vec<T>> for ServiceStream<T>
where T: Send + 'static
{
    fn from(values: Vec<T>) -> Self {
        Self {
            inner: Box::pin(stream::iter(values)),
        }
    }
}

impl<T> RpcName for ServiceStream<T>
where T: RpcName
{
    fn rpc_name() -> &'static str {
        T::rpc_name()
    }
}

pub struct InFlightValue<T>(T, #[allow(dead_code)] GaugeGuard<'static>);

impl<T> fmt::Debug for InFlightValue<T>
where T: fmt::Debug
{
    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
        write!(f, "{:?}", self.0)
    }
}

impl<T> InFlightValue<T> {
    pub fn new(value: T, value_size: ByteSize, gauge: &'static IntGauge) -> Self {
        let mut gauge_guard = GaugeGuard::from_gauge(gauge);
        gauge_guard.add(value_size.as_u64() as i64);

        Self(value, gauge_guard)
    }

    pub fn into_inner(self) -> T {
        self.0
    }
}

pub struct TrackedSender<T> {
    sender: mpsc::Sender<InFlightValue<T>>,
    gauge: &'static IntGauge,
}

impl<T> TrackedSender<T> {
    pub async fn send(
        &self,
        value: T,
        value_size: ByteSize,
    ) -> Result<(), mpsc::error::SendError<T>> {
        self.sender
            .send(InFlightValue::new(value, value_size, self.gauge))
            .await
            .map_err(|send_error| mpsc::error::SendError(send_error.0.0))
    }
}

pub struct TrackedUnboundedSender<T> {
    sender: mpsc::UnboundedSender<InFlightValue<T>>,
    gauge: &'static IntGauge,
}

impl<T> TrackedUnboundedSender<T> {
    pub fn send(&self, value: T, value_size: ByteSize) -> Result<(), mpsc::error::SendError<T>> {
        self.sender
            .send(InFlightValue::new(value, value_size, self.gauge))
            .map_err(|send_error| mpsc::error::SendError(send_error.0.0))
    }
}

#[cfg(test)]
mod tests {
    use once_cell::sync::Lazy;

    use super::*;
    use crate::metrics::new_gauge;

    #[tokio::test]
    async fn test_service_stream_map() {
        let mapped_values = ServiceStream::from(vec![0, 1, 2, 3])
            .map(|x| x * 2)
            .collect::<Vec<_>>()
            .await;
        assert_eq!(mapped_values, vec![0, 2, 4, 6]);
    }

    #[tokio::test]
    async fn test_tracked_service_stream_bounded() {
        static TEST_GAUGE: Lazy<IntGauge> =
            Lazy::new(|| new_gauge("common", "help", "test_tracked_service_stream_bounded", &[]));

        let (service_stream_tx, mut service_stream) =
            ServiceStream::new_bounded_with_gauge(3, &TEST_GAUGE);

        service_stream_tx.send(1, ByteSize(42)).await.unwrap();
        assert_eq!(TEST_GAUGE.get(), 42);

        service_stream_tx.send(2, ByteSize(1337)).await.unwrap();
        assert_eq!(TEST_GAUGE.get(), 1379);

        let value = service_stream.next().await.unwrap();
        assert_eq!(value, 1);
        assert_eq!(TEST_GAUGE.get(), 1337);
    }

    #[tokio::test]
    async fn test_tracked_service_stream_unbounded() {
        static TEST_GAUGE: Lazy<IntGauge> = Lazy::new(|| {
            new_gauge(
                "common",
                "help",
                "test_tracked_service_stream_unbounded",
                &[],
            )
        });

        let (service_stream_tx, mut service_stream) =
            ServiceStream::new_unbounded_with_gauge(&TEST_GAUGE);

        service_stream_tx.send(1, ByteSize(42)).unwrap();
        assert_eq!(TEST_GAUGE.get(), 42);

        service_stream_tx.send(2, ByteSize(1337)).unwrap();
        assert_eq!(TEST_GAUGE.get(), 1379);

        let value = service_stream.next().await.unwrap();
        assert_eq!(value, 1);
        assert_eq!(TEST_GAUGE.get(), 1337);
    }
}


================================================
FILE: quickwit/quickwit-common/src/temp_dir.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::io;
use std::path::{Path, PathBuf};
use std::sync::Arc;

use tempfile::TempDir;
use tokio::fs;

use crate::ignore_error_kind;

const MAX_LENGTH: usize = 255;

const SEPARATOR: char = '%';

const NUM_RAND_CHARS: usize = 6;

/// Creates the specified directory. If the directory already exists, deletes its contents.
pub async fn create_or_purge_directory(path: &Path) -> io::Result<PathBuf> {
    // Delete if exists and recreate scratch directory.
    ignore_error_kind!(io::ErrorKind::NotFound, fs::remove_dir_all(path).await)?;
    fs::create_dir_all(path).await?;
    Ok(path.to_path_buf())
}

/// A temporary directory. This directory is deleted when the object is dropped.
#[derive(Debug, Clone)]
pub struct TempDirectory {
    inner: Arc<TempDir>,
    _parent: Option<Arc<TempDir>>,
}

impl TempDirectory {
    /// A path where the temporary directory is pointing to.
    pub fn path(&self) -> &Path {
        self.inner.path()
    }

    /// Creates a new temporary directory with the current temporary directory.
    /// The new directory keeps a pointer to the parent directory to perevent it
    /// from premature deletion. The directory is deleted when the object is dropped.
    pub fn named_temp_child(&self, prefix: &str) -> io::Result<TempDirectory> {
        Ok(TempDirectory {
            inner: Arc::new(
                tempfile::Builder::new()
                    .prefix(prefix)
                    .tempdir_in(self.path())?,
            ),
            _parent: Some(self.inner.clone()),
        })
    }

    #[cfg(any(test, feature = "testsuite"))]
    pub fn for_test() -> Self {
        Builder::default().tempdir().unwrap()
    }
}

/// A temporary directory builder.
#[derive(Debug)]
pub struct Builder<'a> {
    parts: Vec<&'a str>,
    max_length: usize,
    separator: char,
    num_rand_chars: usize,
}

impl Default for Builder<'_> {
    fn default() -> Self {
        Self {
            parts: Default::default(),
            max_length: MAX_LENGTH,
            separator: SEPARATOR,
            num_rand_chars: NUM_RAND_CHARS,
        }
    }
}

impl<'a> Builder<'a> {
    /// Specifies the number of random bytes to add at the end of the directory name. Default is 6.
    pub fn rand_bytes(&mut self, rand: usize) -> &mut Self {
        self.num_rand_chars = rand;
        self
    }

    /// Specifies the maximum length of the directory name in characters. Default is 255 characters.
    pub fn max_length(&mut self, max_length: usize) -> &mut Self {
        self.max_length = max_length;
        self
    }

    /// Adds a prefix to the directory name.
    pub fn join(&mut self, name: &'a str) -> &mut Self {
        if !name.is_empty() {
            self.parts.push(name.as_ref());
        }
        self
    }

    fn push_str(buffer: &mut String, addition: &'a str, size: usize) -> usize {
        let len = addition.len();
        if len <= size {
            buffer.push_str(addition);
            return len;
        } else if size < 3 {
            buffer.push_str(&addition[0..size]);
        } else {
            let half = size - size / 2;
            buffer.push_str(&addition[0..half - 1]);
            buffer.push_str("..");
            buffer.push_str(&addition[addition.len() - (size - half) + 1..]);
        }
        size
    }

    /// Constructs the prefix from the parts specified by the join function.
    /// If parts are small enough they will be simply concatenated with the
    /// separator character in between. If parts are too large they will
    /// truncated by replacing the middle of each part with "..". The resulting
    /// string will be at most max_length characters long.
    fn prefix(&self) -> io::Result<String> {
        if self.parts.is_empty() {
            return Ok(String::new());
        }
        let separator_count = if self.num_rand_chars > 0 {
            self.parts.len()
        } else {
            self.parts.len() - 1
        };
        // We want to preserve at least one letter from each part with separators.
        if self.max_length < self.parts.len() + separator_count + self.num_rand_chars {
            return Err(io::Error::new(
                io::ErrorKind::InvalidInput,
                "the filename limit is too small",
            ));
        }
        // Calculate how many characters from the parts we can use in the final string.
        let len_without_separators = self.max_length - separator_count - self.num_rand_chars;
        // Calculate how many characters per part can we use.
        let average_len = len_without_separators / self.parts.len();
        // Account for the average length may not be a whole number.
        let mut leftovers = len_without_separators % self.parts.len();
        // We will have some long parts and some short parts. The short parts (part shorter
        // than average can "donate" their space to the large parts. That will allows us to
        // use all available space. In this loop we are counting how many characters large
        // parts can use in addition to the average.
        for part in &self.parts {
            if part.len() <= average_len {
                // Adjust the available length from the parts that are shorter
                leftovers += average_len - part.len();
            }
        }
        // Build the final string by cancatenating the parts while cutting the to the desired
        // length.
        let mut buf = String::new();
        for (i, part) in self.parts.iter().enumerate() {
            if part.len() <= average_len {
                // If the part is shorter than the average - we just add it
                Self::push_str(&mut buf, part, average_len);
            } else {
                // If the part is longer than the average - we can cut it down to average_len +
                // leftovers
                let pushed = Self::push_str(&mut buf, part, average_len + leftovers) - average_len;
                // We now need to adjust leftovers by the number of additional characters the we
                // pushed above average_len
                leftovers -= pushed;
            }
            // The last separator is only added if there are random bytes at the end
            if i < self.parts.len() - 1 || self.num_rand_chars > 0 {
                buf.push(self.separator)
            }
        }
        Ok(buf)
    }

    /// Creates a temporary directory in the temp directory of operation system
    pub fn tempdir(&self) -> io::Result<TempDirectory> {
        Ok(TempDirectory {
            inner: Arc::new(
                tempfile::Builder::new()
                    .rand_bytes(self.num_rand_chars)
                    .prefix(&self.prefix()?)
                    .tempdir()?,
            ),
            _parent: None,
        })
    }

    /// Creates a temporary directory in the specified directory
    pub fn tempdir_in<P: AsRef<Path>>(&self, dir: P) -> io::Result<TempDirectory> {
        Ok(TempDirectory {
            inner: Arc::new(
                tempfile::Builder::new()
                    .rand_bytes(self.num_rand_chars)
                    .prefix(&self.prefix()?)
                    .tempdir_in(dir)?,
            ),
            _parent: None,
        })
    }
}

#[cfg(test)]
mod tests {
    use std::cmp;

    use rand::Rng;

    use super::*;

    #[test]
    fn test_push_str() {
        assert_truncate("abcdef", 100, "abcdef", 6);
        assert_truncate("abcdef", 6, "abcdef", 6);
        assert_truncate("abcdefghijklmnopqrstuvwxyz", 5, "ab..z", 5);
        assert_truncate("abcdefghijklmnopqrstuvwxyz", 4, "a..z", 4);
        assert_truncate("abcdefghijklmnopqrstuvwxyz", 3, "a..", 3);
        assert_truncate("abcdefghijklmnopqrstuvwxyz", 2, "ab", 2);
        assert_truncate("abcdefghijklmnopqrstuvwxyz", 1, "a", 1);
        assert_truncate("abcde", 10, "abcde", 5);
        assert_truncate("abcde", 5, "abcde", 5);
        assert_truncate("abcde", 4, "a..e", 4);
        assert_truncate("abcde", 3, "a..", 3);
        assert_truncate("abcde", 2, "ab", 2);
        assert_truncate("abcde", 1, "a", 1);
    }

    fn assert_truncate(addition: &str, size: usize, expected_addition: &str, expected_size: usize) {
        let mut buf = String::new();
        let size = Builder::push_str(&mut buf, addition, size);
        assert_eq!(expected_addition, buf);
        assert_eq!(expected_size, size);
    }

    #[test]
    fn test_random_failures() {
        assert_prefix(
            vec!["AAAAAAAAAA", "AA", "AAAAAAA", "AAAA", "AAAA", "AAAAAAAAA"],
            35,
            "AAAAAAAAAA%AA%AA..A%AAAA%AAAA%A..A%",
        );
        assert_prefix(
            vec![
                "AAAAAA",
                "AAAAAAAAA",
                "AAAAAA",
                "AAA",
                "A",
                "AAAAAAA",
                "AAAAAAAAAA",
                "AAAAA",
            ],
            55,
            "AAAAAA%AAAAAAAAA%AAAAAA%AAA%A%AAAAAAA%AAAAAAAAAA%AAAAA%",
        );
        assert_prefix(
            vec!["AAAAAAAAA", "", "AAAAAAA", "AAAAAAA"],
            25,
            "AAA..AAA%AAAAAAA%AAAAAAA%",
        );
    }

    #[test]
    fn test_prefix() {
        assert_prefix(vec!["0", "abcde", "uvwxyz"], 15, "0%abcde%uvwxyz%");

        assert_prefix(vec!["a", "b"], 100, "a%b%");
        assert_prefix(vec!["abcde", "uvwxyz"], 100, "abcde%uvwxyz%");
        assert_prefix(vec!["abcde", "uvwxyz"], 13, "abcde%uvwxyz%");
        assert_prefix(vec!["abcde", "uvwxyz"], 12, "abcde%uv..z%");
        assert_prefix(vec!["abcde", "uvwxyz"], 11, "abcde%u..z%");
        assert_prefix(vec!["abcde", "uvwxyz"], 10, "a..e%u..z%");
        assert_prefix(vec!["abcde", "uvwxyz"], 9, "a..e%u..%");
        assert_prefix(vec!["abcde", "uvwxyz"], 8, "a..%u..%");
        assert_prefix(vec!["abcde", "uvwxyz"], 7, "a..%uv%");
        assert_prefix(vec!["abcde", "uvwxyz"], 6, "ab%uv%");
        assert_prefix(vec!["abcde", "uvwxyz"], 5, "ab%u%");
        assert_prefix(vec!["abcde", "uvwxyz"], 4, "a%u%");
        assert_prefix_err(
            "the filename limit is too small",
            vec!["abcde", "uvwxyz"],
            3,
        );

        assert_prefix(vec!["0", "abcde", "uvwxyz"], 15, "0%abcde%uvwxyz%");
        assert_prefix(vec!["0", "abcde", "uvwxyz"], 14, "0%abcde%uv..z%");
        assert_prefix(vec!["0", "abcde", "uvwxyz"], 13, "0%abcde%u..z%");
        assert_prefix(vec!["0", "abcde", "uvwxyz"], 12, "0%abcde%u..%");
        assert_prefix(vec!["0", "abcde", "uvwxyz"], 11, "0%abcde%uv%");
        assert_prefix(vec!["0", "abcde", "uvwxyz"], 10, "0%a..e%uv%");
        assert_prefix(vec!["0", "abcde", "uvwxyz"], 9, "0%a..%uv%");
        assert_prefix(vec!["0", "abcde", "uvwxyz"], 8, "0%a..%u%");
        assert_prefix(vec!["0", "abcde", "uvwxyz"], 7, "0%ab%u%");
        assert_prefix(vec!["0", "abcde", "uvwxyz"], 6, "0%a%u%");
        assert_prefix_err(
            "the filename limit is too small",
            vec!["0", "abcde", "uvwxyz"],
            5,
        );
    }

    fn assert_prefix(parts: Vec<&str>, size: usize, expected_path: &str) {
        let mut builder = Builder::default();
        builder.rand_bytes(5);
        builder.max_length(size + 5); // Size of random suffix
        for part in parts.iter() {
            builder.join(part);
        }
        let prefix = builder.prefix().unwrap();
        assert_eq!(expected_path, prefix, "parts: {parts:?} len: {size:?}");
    }

    fn assert_prefix_err(expected_err: &str, parts: Vec<&str>, size: usize) {
        let mut builder = Builder::default();
        builder.rand_bytes(5);
        builder.max_length(size + 5); // Size of random suffix
        for part in parts.iter() {
            builder.join(part);
        }
        let error = builder.prefix().unwrap_err();
        assert_eq!(expected_err, error.to_string());
    }

    #[test]
    fn test_prefix_random() {
        let mut rng = rand::rng();
        let template = "A".repeat(100);
        for _ in 0..10000 {
            let rand_bytes = rng.random_range(0..4);
            let parts_num = rng.random_range(0..10);
            let mut builder = Builder::default();
            builder.rand_bytes(rand_bytes);
            let mut max_size = 0;
            for _ in 0..parts_num {
                let size = 1 + rng.random_range(0..10);
                builder.join(&template[0..size]);
                max_size += size + 1;
            }
            let separator_count = if rand_bytes > 0 {
                parts_num
            } else {
                // no separator at the end
                if max_size > 0 {
                    max_size -= 1;
                    parts_num - 1
                } else {
                    parts_num
                }
            };
            let limit_threshold = parts_num + separator_count + rand_bytes;
            if parts_num > 0 && rng.random() {
                builder.max_length(rng.random_range(0..limit_threshold));
                assert_eq!(
                    "the filename limit is too small",
                    builder.prefix().unwrap_err().to_string()
                );
            } else {
                let len = limit_threshold + rng.random_range(0..100);
                builder.max_length(len);
                let builder_debug = format!("{builder:?}, len {len}");
                let builder_prefix = builder.prefix().unwrap();
                assert_eq!(
                    builder_prefix.len(),
                    cmp::min(len - rand_bytes, max_size),
                    "{builder_debug} -> {builder_prefix}"
                );
            }
        }
    }

    #[test]
    fn test_directory_creation_and_removal() {
        let directory = Builder::default()
            .join("foo")
            .join("bar")
            .join("baz")
            .rand_bytes(0)
            .tempdir()
            .unwrap();
        assert_eq!(directory.path().file_name().unwrap(), "foo%bar%baz");
        let path = directory.path().to_path_buf();
        assert!(path.try_exists().unwrap());
        drop(directory);
        assert!(!path.try_exists().unwrap());
    }

    #[test]
    fn test_directory_creation_and_removal_with_random_bytes() {
        let directory = Builder::default()
            .join("foo")
            .join("bar")
            .join("baz")
            .rand_bytes(4)
            .tempdir()
            .unwrap();
        let filename = directory.path().file_name().unwrap().to_str().unwrap();
        assert_eq!(&filename[0..filename.len() - 4], "foo%bar%baz%");
        let path = directory.path().to_path_buf();
        assert!(path.try_exists().unwrap());
        drop(directory);
        assert!(!path.try_exists().unwrap());
    }

    #[test]
    fn test_directory_randomness() {
        let mut directories = Vec::new();
        let mut paths = Vec::new();
        let temp_dir = Builder::default().tempdir().unwrap();
        // Try creating the maximum number of directories for a single random byte
        // On case-insensitive filesystems we can only have 36 different directories a-z,0-9
        for _ in 0..36 {
            let dir = Builder::default()
                .join("test")
                .rand_bytes(1)
                .tempdir_in(temp_dir.path())
                .unwrap();
            assert_eq!(dir.path().parent().unwrap(), temp_dir.path());
            paths.push(dir.path().to_path_buf());
            directories.push(dir);
        }
        for path in paths.iter() {
            assert!(path.try_exists().unwrap());
        }
        drop(directories);
        for path in paths.iter() {
            assert!(!path.try_exists().unwrap());
        }
    }
}


================================================
FILE: quickwit/quickwit-common/src/test_utils.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::net::SocketAddr;
use std::time::Duration;

use futures::Future;
use hyper::Uri;
use tokio::time::error::Elapsed;
use tower::Service as _;

pub async fn wait_until_predicate<Fut>(
    predicate: impl Fn() -> Fut,
    timeout: Duration,
    retry_interval: Duration,
) -> Result<(), Elapsed>
where
    Fut: Future<Output = bool>,
{
    tokio::time::timeout(timeout, async move {
        loop {
            if predicate().await {
                break;
            }
            tokio::time::sleep(retry_interval).await
        }
    })
    .await
}

/// Tries to connect at most 3 times to `SocketAddr`.
/// If not successful, returns an error.
/// This is a convenient function to wait before sending gRPC requests
/// to this `SocketAddr`.
pub async fn wait_for_server_ready(socket_addr: SocketAddr) -> anyhow::Result<()> {
    let mut num_attempts = 0;
    let max_num_attempts = 10;
    let uri = Uri::builder()
        .scheme("http")
        .authority(socket_addr.to_string().as_str())
        .path_and_query("/")
        .build()?;

    while num_attempts < max_num_attempts {
        tokio::time::sleep(Duration::from_millis(50 * (num_attempts + 1))).await;
        let mut http = hyper_util::client::legacy::connect::HttpConnector::new();
        match http.call(uri.clone()).await {
            Ok(_) => break,
            Err(_) => {
                println!(
                    "Failed to connect to `{}` failed, retrying {}/{}",
                    socket_addr,
                    num_attempts + 1,
                    max_num_attempts
                );
                num_attempts += 1;
            }
        }
    }
    if num_attempts == max_num_attempts {
        anyhow::bail!("too many attempts to connect to `{}`", socket_addr);
    }
    Ok(())
}


================================================
FILE: quickwit/quickwit-common/src/thread_pool.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::fmt;
use std::sync::Arc;

use futures::{Future, TryFutureExt};
use once_cell::sync::Lazy;
use prometheus::IntGauge;
use tokio::sync::oneshot;
use tracing::error;

use crate::metrics::{GaugeGuard, IntGaugeVec, OwnedGaugeGuard, new_gauge_vec};

/// An executor backed by a thread pool to run CPU-intensive tasks.
///
/// tokio::spawn_blocking should only used for IO-bound tasks, as it has not limit on its
/// thread count.
#[derive(Clone)]
pub struct ThreadPool {
    thread_pool: Arc<rayon::ThreadPool>,
    ongoing_tasks: IntGauge,
    pending_tasks: IntGauge,
}

impl ThreadPool {
    pub fn new(name: &'static str, num_threads_opt: Option<usize>) -> ThreadPool {
        let mut rayon_pool_builder = rayon::ThreadPoolBuilder::new()
            .thread_name(move |thread_id| format!("quickwit-{name}-{thread_id}"))
            .panic_handler(move |_my_panic| {
                error!("task running in the quickwit {name} thread pool panicked");
            });
        if let Some(num_threads) = num_threads_opt {
            rayon_pool_builder = rayon_pool_builder.num_threads(num_threads);
        }
        let thread_pool = rayon_pool_builder
            .build()
            .expect("failed to spawn thread pool");
        let ongoing_tasks = THREAD_POOL_METRICS.ongoing_tasks.with_label_values([name]);
        let pending_tasks = THREAD_POOL_METRICS.pending_tasks.with_label_values([name]);
        ThreadPool {
            thread_pool: Arc::new(thread_pool),
            ongoing_tasks,
            pending_tasks,
        }
    }

    pub fn get_underlying_rayon_thread_pool(&self) -> Arc<rayon::ThreadPool> {
        self.thread_pool.clone()
    }

    /// Function similar to `tokio::spawn_blocking`.
    ///
    /// Here are two important differences however:
    ///
    /// 1) The task runs on a rayon thread pool managed by Quickwit. This pool is specifically used
    ///    only to run CPU-intensive work and is configured to contain `num_cpus` cores.
    ///
    /// 2) Before the task is effectively scheduled, we check that the spawner is still interested
    ///    in its result.
    ///
    /// It is therefore required to `await` the result of this
    /// function to get any work done.
    ///
    /// This is nice because it makes work that has been scheduled
    /// but is not running yet "cancellable".
    pub fn run_cpu_intensive<F, R>(
        &self,
        cpu_intensive_fn: F,
    ) -> impl Future<Output = Result<R, Panicked>>
    where
        F: FnOnce() -> R + Send + 'static,
        R: Send + 'static,
    {
        let span = tracing::Span::current();
        let ongoing_tasks = self.ongoing_tasks.clone();
        let mut pending_tasks_guard: OwnedGaugeGuard =
            OwnedGaugeGuard::from_gauge(self.pending_tasks.clone());
        pending_tasks_guard.add(1i64);
        let (tx, rx) = oneshot::channel();
        self.thread_pool.spawn(move || {
            drop(pending_tasks_guard);
            if tx.is_closed() {
                return;
            }
            let _guard = span.enter();
            let mut ongoing_task_guard = GaugeGuard::from_gauge(&ongoing_tasks);
            ongoing_task_guard.add(1i64);
            let result = cpu_intensive_fn();
            let _ = tx.send(result);
        });
        rx.map_err(|_| Panicked)
    }
}

/// Run a small (<200ms) CPU-intensive task on a dedicated thread pool with a few threads.
///
/// When running blocking io (or side-effects in general), prefer using `tokio::spawn_blocking`
/// instead. When running long tasks or a set of tasks that you expect to take more than 33% of
/// your vCPUs, use a dedicated thread/runtime or executor instead.
///
/// Disclaimer: The function will no be executed if the Future is dropped.
#[must_use = "run_cpu_intensive will not run if the future it returns is dropped"]
pub fn run_cpu_intensive<F, R>(cpu_intensive_fn: F) -> impl Future<Output = Result<R, Panicked>>
where
    F: FnOnce() -> R + Send + 'static,
    R: Send + 'static,
{
    static SMALL_TASK_EXECUTOR: std::sync::OnceLock<ThreadPool> = std::sync::OnceLock::new();
    SMALL_TASK_EXECUTOR
        .get_or_init(|| {
            let num_threads: usize = (crate::num_cpus() / 3).max(2);
            ThreadPool::new("small_tasks", Some(num_threads))
        })
        .run_cpu_intensive(cpu_intensive_fn)
}

#[derive(Clone, Copy, Debug, Eq, PartialEq)]
pub struct Panicked;

impl fmt::Display for Panicked {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        write!(f, "scheduled task panicked")
    }
}

impl std::error::Error for Panicked {}

struct ThreadPoolMetrics {
    ongoing_tasks: IntGaugeVec<1>,
    pending_tasks: IntGaugeVec<1>,
}

impl Default for ThreadPoolMetrics {
    fn default() -> Self {
        ThreadPoolMetrics {
            ongoing_tasks: new_gauge_vec(
                "ongoing_tasks",
                "number of tasks being currently processed by threads in the thread pool",
                "thread_pool",
                &[],
                ["pool"],
            ),
            pending_tasks: new_gauge_vec(
                "pending_tasks",
                "number of tasks waiting in the queue before being processed by the thread pool",
                "thread_pool",
                &[],
                ["pool"],
            ),
        }
    }
}

static THREAD_POOL_METRICS: Lazy<ThreadPoolMetrics> = Lazy::new(ThreadPoolMetrics::default);

#[cfg(test)]
mod tests {
    use std::sync::Arc;
    use std::sync::atomic::{AtomicU64, Ordering};
    use std::time::Duration;

    use super::*;

    #[tokio::test]
    async fn test_run_cpu_intensive() {
        assert_eq!(run_cpu_intensive(|| 1).await, Ok(1));
    }

    #[tokio::test]
    async fn test_run_cpu_intensive_panicks() {
        assert!(run_cpu_intensive(|| panic!("")).await.is_err());
    }

    #[tokio::test]
    async fn test_run_cpu_intensive_panicks_do_not_shrink_thread_pool() {
        for _ in 0..100 {
            assert!(run_cpu_intensive(|| panic!("")).await.is_err());
        }
    }

    #[tokio::test]
    async fn test_run_cpu_intensive_abort() {
        let counter: Arc<AtomicU64> = Default::default();
        let mut futures = Vec::new();
        for _ in 0..1_000 {
            let counter_clone = counter.clone();
            let fut = run_cpu_intensive(move || {
                std::thread::sleep(Duration::from_millis(5));
                counter_clone.fetch_add(1, Ordering::SeqCst)
            });
            // The first few num_cores tasks should run, but the other should get cancelled.
            futures.push(tokio::time::timeout(Duration::from_millis(1), fut));
        }
        futures::future::join_all(futures).await;
        assert!(counter.load(Ordering::SeqCst) < 100);
    }
}


================================================
FILE: quickwit/quickwit-common/src/tower/box_layer.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::fmt;
use std::sync::Arc;

use tower::layer::layer_fn;
use tower::{Layer, Service};

use crate::tower::BoxService;

pub struct BoxLayer<S, R, T, E> {
    inner: Arc<dyn Layer<S, Service = BoxService<R, T, E>> + Send + Sync + 'static>,
}

impl<S, R, T, E> BoxLayer<S, R, T, E> {
    pub fn new<L>(inner_layer: L) -> Self
    where
        L: Layer<S> + Send + Sync + 'static,
        L::Service: Service<R, Response = T, Error = E> + Clone + Send + Sync + 'static,
        <L::Service as Service<R>>::Future: Send + 'static,
    {
        let layer = layer_fn(move |inner_svc: S| {
            let outer_layer = inner_layer.layer(inner_svc);
            BoxService::new(outer_layer)
        });

        Self {
            inner: Arc::new(layer),
        }
    }
}

impl<S, R, T, E> Layer<S> for BoxLayer<S, R, T, E> {
    type Service = BoxService<R, T, E>;

    fn layer(&self, inner: S) -> Self::Service {
        self.inner.layer(inner)
    }
}

impl<S, R, T, E> Clone for BoxLayer<S, R, T, E> {
    fn clone(&self) -> Self {
        Self {
            inner: self.inner.clone(),
        }
    }
}

impl<S, R, T, E> fmt::Debug for BoxLayer<S, R, T, E> {
    fn fmt(&self, fmt: &mut fmt::Formatter) -> fmt::Result {
        fmt.debug_struct("BoxLayer").finish()
    }
}


================================================
FILE: quickwit/quickwit-common/src/tower/box_service.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::fmt;
use std::task::{Context, Poll};

use tower::{Service, ServiceExt};

use super::BoxFuture;

trait CloneService<R, T, E>:
    Service<R, Response = T, Error = E, Future = BoxFuture<T, E>>
    + dyn_clone::DynClone
    + Send
    + Sync
    + 'static
{
}

dyn_clone::clone_trait_object!(<R, T, E> CloneService<R, T, E>);

impl<S, R, T, E> CloneService<R, T, E> for S where S: Service<R, Response = T, Error = E, Future = BoxFuture<T, E>>
        + Clone
        + Send
        + Sync
        + 'static
{
}

pub struct BoxService<R, T, E> {
    inner: Box<dyn CloneService<R, T, E>>,
}

impl<R, T, E> Clone for BoxService<R, T, E> {
    fn clone(&self) -> Self {
        Self {
            inner: self.inner.clone(),
        }
    }
}

impl<R, T, E> BoxService<R, T, E> {
    pub fn new<S>(inner: S) -> Self
    where
        S: Service<R, Response = T, Error = E> + Clone + Send + Sync + 'static,
        S::Future: Send + 'static,
    {
        let inner = Box::new(inner.map_future(|fut| Box::pin(fut) as _));
        BoxService { inner }
    }
}

impl<R, T, E> Service<R> for BoxService<R, T, E> {
    type Response = T;
    type Error = E;
    type Future = BoxFuture<T, E>;

    fn poll_ready(&mut self, cx: &mut Context<'_>) -> Poll<Result<(), E>> {
        self.inner.poll_ready(cx)
    }

    fn call(&mut self, request: R) -> BoxFuture<T, E> {
        self.inner.call(request)
    }
}

impl<T, U, E> fmt::Debug for BoxService<T, U, E> {
    fn fmt(&self, fmt: &mut fmt::Formatter) -> fmt::Result {
        fmt.debug_struct("BoxService").finish()
    }
}


================================================
FILE: quickwit/quickwit-common/src/tower/buffer.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::error::Error;
use std::marker::PhantomData;
use std::task::{Context, Poll};
use std::{error, fmt};

use futures::TryFutureExt as _;
use tower::buffer::Buffer as TowerBuffer;
use tower::buffer::error::{Closed, ServiceError};
use tower::{Layer, Service};

use super::{BoxError, BoxFuture};

#[derive(Debug, thiserror::Error)]
pub enum BufferError {
    #[error("the buffer's worker closed unexpectedly")]
    Closed,
    #[error("the buffer service returned an unknown error")]
    Unknown,
}

/// A wrapper around [`tower::buffer::Buffer`] service that preserves the original error type.
pub struct Buffer<S, R>
where S: Service<R>
{
    bound: usize,
    inner: TowerBuffer<R, <S as Service<R>>::Future>,
}

impl<S, R> Buffer<S, R>
where
    S: Service<R>,
    S::Error: Into<BoxError>,
{
    pub fn new(service: S, bound: usize) -> Self
    where
        S: Send + 'static,
        S::Future: Send,
        S::Error: Send + Sync,
        R: Send + 'static,
    {
        Self {
            bound,
            inner: TowerBuffer::new(service, bound),
        }
    }
}

impl<S, R> Service<R> for Buffer<S, R>
where
    R: Send + 'static,
    S: Service<R>,
    S::Error: error::Error + From<BufferError> + Into<BoxError> + Clone + Send + Sync + 'static,
    S::Future: Send + 'static,
{
    type Response = S::Response;
    type Error = S::Error;
    type Future = BoxFuture<Self::Response, Self::Error>;

    fn poll_ready(&mut self, cx: &mut Context<'_>) -> Poll<Result<(), Self::Error>> {
        self.inner.poll_ready(cx).map_err(downcast_error)
    }

    fn call(&mut self, request: R) -> Self::Future {
        let fut = self.inner.call(request).map_err(downcast_error);
        Box::pin(fut)
    }
}

/// Downcasts an error boxed as [`tower::BoxError`] by the buffer service back into the original
/// error `E`.
fn downcast_error<E>(error: BoxError) -> E
where E: error::Error + From<BufferError> + Clone + 'static {
    if let Some(error) = error.downcast_ref::<E>() {
        return error.clone();
    }
    // This happens when the buffer worker is dead.
    if error.downcast_ref::<Closed>().is_some() {
        return BufferError::Closed.into();
    }
    // This happens when the inner service returns an error on `poll_ready`.
    if let Some(service_error) = error.downcast_ref::<ServiceError>()
        && let Some(source) = service_error.source()
        && let Some(inner) = source.downcast_ref::<E>()
    {
        return inner.clone();
    }
    // This will happen only if the buffer service implementation adds a new error type.
    BufferError::Unknown.into()
}

impl<S, R> fmt::Debug for Buffer<S, R>
where S: Service<R>
{
    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
        f.debug_struct("Buffer")
            .field("bound", &self.bound)
            .finish()
    }
}

impl<S, R> Clone for Buffer<S, R>
where
    S: Service<R>,
    R: Send + 'static,
    <S as Service<R>>::Future: Send + 'static,
{
    fn clone(&self) -> Self {
        Self {
            bound: self.bound,
            inner: self.inner.clone(),
        }
    }
}

pub struct BufferLayer<R> {
    bound: usize,
    _phantom: PhantomData<fn(R)>,
}

impl<R> BufferLayer<R> {
    pub fn new(bound: usize) -> Self {
        Self {
            bound,
            _phantom: PhantomData,
        }
    }
}

impl<S, R> Layer<S> for BufferLayer<R>
where
    S: Service<R> + Send + 'static,
    S::Future: Send,
    S::Error: error::Error + From<BufferError> + Into<BoxError> + Clone + Send + Sync + 'static,
    R: Send + 'static,
{
    type Service = Buffer<S, R>;

    fn layer(&self, service: S) -> Self::Service {
        Buffer::new(service, self.bound)
    }
}

impl<R> fmt::Debug for BufferLayer<R> {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        f.debug_struct("BufferLayer")
            .field("bound", &self.bound)
            .finish()
    }
}

impl<R> Clone for BufferLayer<R> {
    fn clone(&self) -> Self {
        *self
    }
}

impl<R> Copy for BufferLayer<R> {}

#[cfg(test)]
mod tests {
    use tower::ServiceExt;

    use super::*;

    #[derive(Debug, Clone, thiserror::Error, PartialEq, Eq)]
    enum MyServiceError {
        #[error("service is exhausted")]
        Exhausted,
        #[error("service is unavailable")]
        Unavailable,
        #[error("service attempted to divide by zero")]
        ZeroDivision,
    }

    impl From<BufferError> for MyServiceError {
        fn from(_: BufferError) -> Self {
            MyServiceError::Unavailable
        }
    }

    #[derive(Debug, Default)]
    struct MyService {
        num_calls: usize,
    }

    impl Service<(usize, usize)> for MyService {
        type Response = usize;
        type Error = MyServiceError;
        type Future = BoxFuture<Self::Response, Self::Error>;

        fn poll_ready(&mut self, _cx: &mut Context<'_>) -> Poll<Result<(), Self::Error>> {
            self.num_calls += 1;

            if self.num_calls > 2 {
                Poll::Ready(Err(MyServiceError::Exhausted))
            } else {
                Poll::Ready(Ok(()))
            }
        }

        fn call(&mut self, (dividend, divisor): (usize, usize)) -> Self::Future {
            let fut = async move {
                if divisor == 0 {
                    Err(MyServiceError::ZeroDivision)
                } else {
                    Ok(dividend / divisor)
                }
            };
            Box::pin(fut)
        }
    }

    #[tokio::test]
    async fn test_buffer_error() {
        let mut service = BufferLayer::new(1).layer(MyService::default());

        assert_eq!(
            service.ready().await.unwrap().call((10, 2)).await.unwrap(),
            5
        );
        assert_eq!(
            service
                .ready()
                .await
                .unwrap()
                .call((10, 0))
                .await
                .unwrap_err(),
            MyServiceError::ZeroDivision
        );
        assert_eq!(
            service
                .ready()
                .await
                .unwrap()
                .call((10, 0))
                .await
                .unwrap_err(),
            MyServiceError::Exhausted
        );
    }

    #[tokio::test]
    async fn test_buffer_closed() {
        let (inner, worker) = TowerBuffer::pair(MyService::default(), 1);
        let handle = tokio::spawn(worker);

        let mut service: Buffer<MyService, (usize, usize)> = Buffer { bound: 1, inner };
        let res: usize = service.ready().await.unwrap().call((10, 2)).await.unwrap();
        assert_eq!(res, 5);

        handle.abort();
        handle.await.unwrap_err();

        assert_eq!(
            service.ready().await.unwrap_err(),
            MyServiceError::Unavailable
        );
    }
}


================================================
FILE: quickwit/quickwit-common/src/tower/change.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

/// A change enum similar to `tower::discover::Change` but cloneable.
// TODO: Remove when the next version of tower (0.4.14?) is released.
#[derive(Debug, Clone)]
pub enum Change<K, V> {
    Insert(K, V),
    Remove(K),
}


================================================
FILE: quickwit/quickwit-common/src/tower/circuit_breaker.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::future::Future;
use std::pin::Pin;
use std::sync::{Arc, Mutex};
use std::task::{Context, Poll};
use std::time::Duration;

use pin_project::pin_project;
use prometheus::IntCounter;
use tokio::time::Instant;
use tower::{Layer, Service};

/// The circuit breaker layer implements the [circuit breaker pattern](https://martinfowler.com/bliki/CircuitBreaker.html).
///
/// It counts the errors emitted by the inner service, and if the number of errors exceeds a certain
/// threshold within a certain time window, it will "open" the circuit.
///
/// Requests will then be rejected for a given timeout.
/// After this timeout, the circuit breaker ends up in a HalfOpen state. It will allow a single
/// request to pass through. Depending on the result of this request, the circuit breaker will
/// either close the circuit again or open it again.
///
/// Implementation detail:
///
/// A circuit breaker needs to have some logic to estimate the chances for the next request
/// to fail. In this implementation, we use a simple heuristic that does not take in account
/// successes. We simply count the number or errors which happened in the last window.
///
/// The circuit breaker does not attempt to measure accurately the error rate.
/// Instead, it counts errors, and check for the time window in which these errors occurred.
/// This approach is accurate enough, robust, very easy to code and avoids calling the
/// `Instant::now()` at every error in the open state.
#[derive(Debug, Clone)]
pub struct CircuitBreakerLayer<Evaluator> {
    max_error_count_per_time_window: u32,
    time_window: Duration,
    timeout: Duration,
    evaluator: Evaluator,
    circuit_break_total: prometheus::IntCounter,
}

pub trait CircuitBreakerEvaluator: Clone {
    type Response;
    type Error;
    fn is_circuit_breaker_error(&self, output: &Result<Self::Response, Self::Error>) -> bool;
    fn make_circuit_breaker_output(&self) -> Self::Error;
    fn make_layer(
        self,
        max_num_errors_per_secs: u32,
        timeout: Duration,
        circuit_break_total: prometheus::IntCounter,
    ) -> CircuitBreakerLayer<Self> {
        CircuitBreakerLayer {
            max_error_count_per_time_window: max_num_errors_per_secs,
            time_window: Duration::from_secs(1),
            timeout,
            evaluator: self,
            circuit_break_total,
        }
    }
}

impl<S, Evaluator: CircuitBreakerEvaluator> Layer<S> for CircuitBreakerLayer<Evaluator> {
    type Service = CircuitBreaker<S, Evaluator>;

    fn layer(&self, service: S) -> CircuitBreaker<S, Evaluator> {
        let time_window = Duration::from_millis(self.time_window.as_millis() as u64);
        let timeout = Duration::from_millis(self.timeout.as_millis() as u64);
        CircuitBreaker {
            underlying: service,
            circuit_breaker_inner: Arc::new(Mutex::new(CircuitBreakerInner {
                max_error_count_per_time_window: self.max_error_count_per_time_window,
                time_window,
                timeout,
                state: CircuitBreakerState::Closed(ClosedState {
                    error_counter: 0u32,
                    error_window_end: Instant::now() + time_window,
                }),
                evaluator: self.evaluator.clone(),
                circuit_break_total: self.circuit_break_total.clone(),
            })),
        }
    }
}

struct CircuitBreakerInner<Evaluator> {
    max_error_count_per_time_window: u32,
    time_window: Duration,
    timeout: Duration,
    evaluator: Evaluator,
    state: CircuitBreakerState,
    circuit_break_total: IntCounter,
}

impl<Evaluator> CircuitBreakerInner<Evaluator> {
    fn get_state(&mut self) -> CircuitBreakerState {
        let new_state = match self.state {
            CircuitBreakerState::Open { until } => {
                let now = Instant::now();
                if now < until {
                    CircuitBreakerState::Open { until }
                } else {
                    CircuitBreakerState::HalfOpen
                }
            }
            other => other,
        };
        self.state = new_state;
        new_state
    }

    fn receive_error(&mut self) {
        match self.state {
            CircuitBreakerState::HalfOpen => {
                self.circuit_break_total.inc();
                self.state = CircuitBreakerState::Open {
                    until: Instant::now() + self.timeout,
                }
            }
            CircuitBreakerState::Open { .. } => {}
            CircuitBreakerState::Closed(ClosedState {
                error_counter,
                error_window_end,
            }) => {
                if error_counter < self.max_error_count_per_time_window {
                    self.state = CircuitBreakerState::Closed(ClosedState {
                        error_counter: error_counter + 1,
                        error_window_end,
                    });
                    return;
                }
                let now = Instant::now();
                if now < error_window_end {
                    self.circuit_break_total.inc();
                    self.state = CircuitBreakerState::Open {
                        until: now + self.timeout,
                    };
                } else {
                    self.state = CircuitBreakerState::Closed(ClosedState {
                        error_counter: 0u32,
                        error_window_end: now + self.time_window,
                    });
                }
            }
        }
    }

    fn receive_success(&mut self) {
        match self.state {
            CircuitBreakerState::HalfOpen | CircuitBreakerState::Open { .. } => {
                self.state = CircuitBreakerState::Closed(ClosedState {
                    error_counter: 0u32,
                    error_window_end: Instant::now() + self.time_window,
                });
            }
            CircuitBreakerState::Closed { .. } => {
                // We could actually take that as a signal.
            }
        }
    }
}

#[derive(Clone)]
pub struct CircuitBreaker<S, Evaluator> {
    underlying: S,
    circuit_breaker_inner: Arc<Mutex<CircuitBreakerInner<Evaluator>>>,
}

impl<S, Evaluator> std::fmt::Debug for CircuitBreaker<S, Evaluator> {
    fn fmt(&self, f: &mut std::fmt::Formatter) -> std::fmt::Result {
        f.debug_struct("CircuitBreaker").finish()
    }
}

#[derive(Debug, Clone, Copy)]
enum CircuitBreakerState {
    Open { until: Instant },
    HalfOpen,
    Closed(ClosedState),
}

#[derive(Debug, Clone, Copy)]
struct ClosedState {
    error_counter: u32,
    error_window_end: Instant,
}

impl<S, R, Evaluator> Service<R> for CircuitBreaker<S, Evaluator>
where
    S: Service<R>,
    Evaluator: CircuitBreakerEvaluator<Response = S::Response, Error = S::Error>,
{
    type Response = S::Response;
    type Error = S::Error;
    type Future = CircuitBreakerFuture<S::Future, Evaluator>;

    fn poll_ready(&mut self, cx: &mut Context<'_>) -> Poll<Result<(), Self::Error>> {
        let mut inner = self.circuit_breaker_inner.lock().unwrap();
        let state = inner.get_state();
        match state {
            CircuitBreakerState::Closed { .. } | CircuitBreakerState::HalfOpen => {
                self.underlying.poll_ready(cx)
            }
            CircuitBreakerState::Open { .. } => {
                let circuit_break_error = inner.evaluator.make_circuit_breaker_output();
                Poll::Ready(Err(circuit_break_error))
            }
        }
    }

    fn call(&mut self, request: R) -> Self::Future {
        CircuitBreakerFuture {
            underlying_fut: self.underlying.call(request),
            circuit_breaker_inner: self.circuit_breaker_inner.clone(),
        }
    }
}

#[pin_project]
pub struct CircuitBreakerFuture<F, Evaluator> {
    #[pin]
    underlying_fut: F,
    circuit_breaker_inner: Arc<Mutex<CircuitBreakerInner<Evaluator>>>,
}

impl<Response, Error, F, Evaluator> Future for CircuitBreakerFuture<F, Evaluator>
where
    F: Future<Output = Result<Response, Error>>,
    Evaluator: CircuitBreakerEvaluator<Response = Response, Error = Error>,
{
    type Output = F::Output;

    fn poll(self: Pin<&mut Self>, cx: &mut Context<'_>) -> Poll<Self::Output> {
        let circuit_breaker_inner = self.circuit_breaker_inner.clone();
        let poll_res = self.project().underlying_fut.poll(cx);
        match poll_res {
            Poll::Pending => Poll::Pending,
            Poll::Ready(result) => {
                let mut circuit_breaker_inner_lock = circuit_breaker_inner.lock().unwrap();
                let is_circuit_breaker_error = circuit_breaker_inner_lock
                    .evaluator
                    .is_circuit_breaker_error(&result);
                if is_circuit_breaker_error {
                    circuit_breaker_inner_lock.receive_error();
                } else {
                    circuit_breaker_inner_lock.receive_success();
                }
                Poll::Ready(result)
            }
        }
    }
}

#[cfg(test)]
mod tests {
    use std::sync::atomic::{AtomicBool, Ordering};

    use tower::{ServiceBuilder, ServiceExt};

    use super::*;

    #[derive(Debug)]
    enum TestError {
        CircuitBreak,
        ServiceError,
    }

    #[derive(Debug, Clone, Copy)]
    struct TestCircuitBreakerEvaluator;

    impl CircuitBreakerEvaluator for TestCircuitBreakerEvaluator {
        type Response = ();
        type Error = TestError;

        fn is_circuit_breaker_error(&self, output: &Result<Self::Response, Self::Error>) -> bool {
            output.is_err()
        }

        fn make_circuit_breaker_output(&self) -> TestError {
            TestError::CircuitBreak
        }
    }

    #[tokio::test]
    async fn test_circuit_breaker() {
        tokio::time::pause();
        let test_switch: Arc<AtomicBool> = Arc::new(AtomicBool::new(true));

        const TIMEOUT: Duration = Duration::from_millis(500);

        let int_counter: prometheus::IntCounter =
            IntCounter::new("circuit_break_total_test", "test circuit breaker counter").unwrap();
        let mut service = ServiceBuilder::new()
            .layer(TestCircuitBreakerEvaluator.make_layer(10, TIMEOUT, int_counter))
            .service_fn(|_| async {
                if test_switch.load(Ordering::Relaxed) {
                    Ok(())
                } else {
                    Err(TestError::ServiceError)
                }
            });

        service.ready().await.unwrap().call(()).await.unwrap();

        for _ in 0..1_000 {
            service.ready().await.unwrap().call(()).await.unwrap();
        }

        test_switch.store(false, Ordering::Relaxed);

        let mut service_error_count = 0;
        let mut circuit_break_count = 0;
        for _ in 0..1_000 {
            match service.ready().await {
                Ok(service) => {
                    service.call(()).await.unwrap_err();
                    service_error_count += 1;
                }
                Err(_circuit_breaker_error) => {
                    circuit_break_count += 1;
                }
            }
        }

        assert_eq!(service_error_count + circuit_break_count, 1_000);
        assert_eq!(service_error_count, 11);

        tokio::time::advance(TIMEOUT).await;

        // The test request at half open fails.
        for _ in 0..1_000 {
            match service.ready().await {
                Ok(service) => {
                    service.call(()).await.unwrap_err();
                    service_error_count += 1;
                }
                Err(_circuit_breaker_error) => {
                    circuit_break_count += 1;
                }
            }
        }

        assert_eq!(service_error_count + circuit_break_count, 2_000);
        assert_eq!(service_error_count, 12);

        test_switch.store(true, Ordering::Relaxed);
        tokio::time::advance(TIMEOUT).await;

        // The test request at half open succeeds.
        for _ in 0..1_000 {
            service.ready().await.unwrap().call(()).await.unwrap();
        }
    }
}


================================================
FILE: quickwit/quickwit-common/src/tower/delay.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::future::Future;
use std::pin::Pin;
use std::task::{Context, Poll};
use std::time::Duration;

use pin_project::pin_project;
use tokio::time::Sleep;
use tower::{Layer, Service};

/// Delays a request by `delay` seconds.
#[derive(Debug, Clone)]
pub struct Delay<S> {
    inner: S,
    delay: Duration,
}

impl<S, R> Service<R> for Delay<S>
where S: Service<R>
{
    type Response = S::Response;
    type Error = S::Error;
    type Future = DelayFuture<S::Future>;

    fn poll_ready(&mut self, cx: &mut Context<'_>) -> Poll<Result<(), Self::Error>> {
        self.inner.poll_ready(cx)
    }

    fn call(&mut self, request: R) -> Self::Future {
        DelayFuture {
            inner: self.inner.call(request),
            sleep: tokio::time::sleep(self.delay),
            slept: false,
        }
    }
}

#[pin_project]
#[derive(Debug)]
pub struct DelayFuture<F> {
    #[pin]
    inner: F,
    #[pin]
    sleep: Sleep,
    slept: bool,
}

impl<F, T, E> Future for DelayFuture<F>
where F: Future<Output = Result<T, E>>
{
    type Output = Result<T, E>;

    fn poll(self: Pin<&mut Self>, cx: &mut Context<'_>) -> Poll<Self::Output> {
        let this = self.project();

        if !*this.slept {
            match this.sleep.poll(cx) {
                Poll::Ready(_) => *this.slept = true,
                Poll::Pending => return Poll::Pending,
            }
        }
        this.inner.poll(cx)
    }
}

/// Applies a delay to requests via the supplied inner service.
#[derive(Debug, Clone)]
pub struct DelayLayer {
    delay: Duration,
}

impl DelayLayer {
    /// Creates a new `DelayLayer` with the specified delay.
    pub fn new(delay: Duration) -> Self {
        Self { delay }
    }
}

impl<S> Layer<S> for DelayLayer {
    type Service = Delay<S>;

    fn layer(&self, service: S) -> Self::Service {
        Delay {
            inner: service,
            delay: self.delay,
        }
    }
}

#[cfg(test)]
mod tests {
    use std::time::Instant;

    use tokio::time::Duration;
    use tower::{ServiceBuilder, ServiceExt};

    use super::*;

    #[tokio::test]
    async fn test_delay() {
        let delay = Duration::from_millis(100);
        let mut service = ServiceBuilder::new()
            .layer(DelayLayer::new(delay))
            .service_fn(|_| async { Ok::<_, ()>(()) });

        let start = Instant::now();
        service.ready().await.unwrap().call(()).await.unwrap();

        let elapsed = start.elapsed();
        assert!(elapsed >= delay);
    }
}


================================================
FILE: quickwit/quickwit-common/src/tower/estimate_rate.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::marker::PhantomData;
use std::task::{Context, Poll};
use std::time::Instant;

use tower::load::CompleteOnResponse;
use tower::load::completion::TrackCompletionFuture;
use tower::{Layer, Service};

use super::{Cost, RateEstimator};

pub struct Handle<T: RateEstimator> {
    started_at: Instant,
    work: u64,
    estimator: T,
}

impl<T> Drop for Handle<T>
where T: RateEstimator
{
    fn drop(&mut self) {
        let ended_at = Instant::now();
        self.estimator.update(self.started_at, ended_at, self.work);
    }
}

/// Estimates the quantity of work the underlying service can handle over a period of time.
///
/// Each request is decorated with a `Handle` that measures the time necessary to process the
/// request and, on drop, updates the rate estimator on which it holds a reference.
#[derive(Debug, Clone)]
pub struct EstimateRate<S, T> {
    service: S,
    estimator: T,
}

impl<S, T> EstimateRate<S, T>
where T: RateEstimator
{
    /// Creates a new rate estimator.
    pub fn new(service: S, estimator: T) -> Self {
        Self { service, estimator }
    }

    fn handle(&self, work: u64) -> Handle<T> {
        Handle {
            started_at: Instant::now(),
            work,
            estimator: self.estimator.clone(),
        }
    }
}

impl<S, R, T> Service<R> for EstimateRate<S, T>
where
    S: Service<R>,
    R: Cost,
    T: RateEstimator,
{
    type Response = S::Response;
    type Error = S::Error;
    type Future = TrackCompletionFuture<S::Future, CompleteOnResponse, Handle<T>>;

    fn poll_ready(&mut self, cx: &mut Context<'_>) -> Poll<Result<(), Self::Error>> {
        self.service.poll_ready(cx)
    }

    fn call(&mut self, request: R) -> Self::Future {
        let handle = self.handle(request.cost());
        TrackCompletionFuture::new(
            CompleteOnResponse::default(),
            handle,
            self.service.call(request),
        )
    }
}

/// Estimates the quantity of work the underlying
/// service can handle over a period of time.
#[derive(Debug, Clone)]
pub struct EstimateRateLayer<R, T> {
    estimator: T,
    _phantom: PhantomData<R>,
}

impl<R, T> EstimateRateLayer<R, T> {
    /// Creates new estimate rate layer.
    pub fn new(estimator: T) -> Self {
        Self {
            estimator,
            _phantom: PhantomData,
        }
    }
}

impl<S, R, T> Layer<S> for EstimateRateLayer<R, T>
where
    S: Service<R>,
    R: Cost,
    T: RateEstimator,
{
    type Service = EstimateRate<S, T>;

    fn layer(&self, service: S) -> Self::Service {
        EstimateRate::new(service, self.estimator.clone())
    }
}

#[cfg(test)]
mod tests {
    use std::sync::Arc;
    use std::sync::atomic::{AtomicU64, Ordering};
    use std::time::Duration;

    use tower::ServiceExt;

    use super::*;
    use crate::tower::Rate;

    struct Request;

    impl Cost for Request {
        fn cost(&self) -> u64 {
            42
        }
    }

    #[derive(Debug, Clone, Default)]
    struct DummyEstimator {
        work: Arc<AtomicU64>,
        duration_micros: Arc<AtomicU64>,
    }

    impl Rate for DummyEstimator {
        fn work(&self) -> u64 {
            self.work.load(Ordering::Relaxed)
        }

        fn period(&self) -> Duration {
            Duration::from_micros(self.duration_micros.load(Ordering::Relaxed))
        }
    }

    impl RateEstimator for DummyEstimator {
        fn update(&mut self, started_at: Instant, ended_at: Instant, work: u64) {
            self.work.store(work, Ordering::Relaxed);
            self.duration_micros.store(
                (ended_at - started_at).as_micros() as u64,
                Ordering::Relaxed,
            );
        }
    }

    #[tokio::test]
    async fn test_estimate_rate() {
        let estimator = DummyEstimator::default();
        let mut service = EstimateRate::new(
            tower::service_fn(|_: Request| async move { Ok::<_, ()>(()) }),
            estimator.clone(),
        );
        service.ready().await.unwrap().call(Request).await.unwrap();
        assert_eq!(service.estimator.work(), 42);
    }
}


================================================
FILE: quickwit/quickwit-common/src/tower/event_listener.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::pin::Pin;
use std::task::{Context, Poll};

use futures::{Future, ready};
use pin_project::pin_project;
use tower::{Layer, Service};

use crate::pubsub::{Event, EventBroker};

#[derive(Clone)]
pub struct EventListener<S> {
    inner: S,
    event_broker: EventBroker,
}

impl<S> EventListener<S> {
    pub fn new(inner: S, event_broker: EventBroker) -> Self {
        Self {
            inner,
            event_broker,
        }
    }
}

impl<S, R> Service<R> for EventListener<S>
where
    S: Service<R>,
    R: Event,
{
    type Response = S::Response;
    type Error = S::Error;
    type Future = ResponseFuture<S::Future, R>;

    fn poll_ready(&mut self, cx: &mut Context<'_>) -> Poll<Result<(), Self::Error>> {
        self.inner.poll_ready(cx)
    }

    fn call(&mut self, request: R) -> Self::Future {
        let inner = self.inner.call(request.clone());
        ResponseFuture {
            inner,
            event_broker: self.event_broker.clone(),
            request: Some(request),
        }
    }
}

#[derive(Debug, Clone)]
pub struct EventListenerLayer {
    event_broker: EventBroker,
}

impl EventListenerLayer {
    pub fn new(event_broker: EventBroker) -> Self {
        Self { event_broker }
    }
}

impl<S> Layer<S> for EventListenerLayer {
    type Service = EventListener<S>;

    fn layer(&self, service: S) -> Self::Service {
        EventListener::new(service, self.event_broker.clone())
    }
}

/// Response future for [`EventListener`].
#[pin_project]
pub struct ResponseFuture<F, R> {
    #[pin]
    inner: F,
    event_broker: EventBroker,
    request: Option<R>,
}

impl<R, F, T, E> Future for ResponseFuture<F, R>
where
    R: Event,
    F: Future<Output = Result<T, E>>,
{
    type Output = Result<T, E>;

    fn poll(self: Pin<&mut Self>, cx: &mut Context<'_>) -> Poll<Self::Output> {
        let this = self.project();
        let response = ready!(this.inner.poll(cx));

        if response.is_ok() {
            this.event_broker
                .publish(this.request.take().expect("request should be set"));
        }
        Poll::Ready(Ok(response?))
    }
}

#[cfg(test)]
mod tests {
    use std::sync::Arc;
    use std::sync::atomic::{AtomicUsize, Ordering};
    use std::time::Duration;

    use async_trait::async_trait;

    use super::*;
    use crate::pubsub::EventSubscriber;

    #[derive(Debug, Clone, Copy)]
    struct MyEvent {
        return_ok: bool,
    }

    impl Event for MyEvent {}

    struct MySubscriber {
        counter: Arc<AtomicUsize>,
    }

    #[async_trait]
    impl EventSubscriber<MyEvent> for MySubscriber {
        async fn handle_event(&mut self, _event: MyEvent) {
            self.counter.fetch_add(1, Ordering::Relaxed);
        }
    }

    #[tokio::test]
    async fn test_event_listener() {
        let event_broker = EventBroker::default();
        let counter = Arc::new(AtomicUsize::new(0));
        let subscriber = MySubscriber {
            counter: counter.clone(),
        };
        let _subscription_handle = event_broker.subscribe::<MyEvent>(subscriber);

        let layer = EventListenerLayer::new(event_broker);

        let mut service = layer.layer(tower::service_fn(|request: MyEvent| async move {
            if request.return_ok { Ok(()) } else { Err(()) }
        }));
        let request = MyEvent { return_ok: false };
        service.call(request).await.unwrap_err();

        tokio::time::sleep(Duration::from_millis(1)).await;
        assert_eq!(counter.load(Ordering::Relaxed), 0);

        let request = MyEvent { return_ok: true };
        service.call(request).await.unwrap();

        tokio::time::sleep(Duration::from_millis(1)).await;
        assert_eq!(counter.load(Ordering::Relaxed), 1);
    }
}


================================================
FILE: quickwit/quickwit-common/src/tower/load_shed.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::future::Future;
use std::pin::Pin;
use std::sync::Arc;
use std::task::{Context, Poll};

use pin_project::pin_project;
use tokio::sync::{OwnedSemaphorePermit, Semaphore};
use tower::{Layer, Service};

/// Tracks the number of in-flight requests being processed by a service and rejects new incoming
/// requests if the number of in-flight requests exceeds a specified limit.
#[derive(Debug)]
pub struct LoadShed<S> {
    inner: S,
    permits: Arc<Semaphore>,
    permit_opt: Option<OwnedSemaphorePermit>,
}

impl<S> Clone for LoadShed<S>
where S: Clone
{
    fn clone(&self) -> Self {
        Self {
            inner: self.inner.clone(),
            permits: self.permits.clone(),
            permit_opt: None,
        }
    }
}

pub trait MakeLoadShedError {
    fn make_load_shed_error() -> Self;
}

impl<S, R> Service<R> for LoadShed<S>
where
    S: Service<R>,
    S::Error: MakeLoadShedError,
{
    type Response = S::Response;
    type Error = S::Error;
    type Future = LoadShedFuture<S::Future>;

    fn poll_ready(&mut self, cx: &mut Context<'_>) -> Poll<Result<(), Self::Error>> {
        if self.permit_opt.is_none() {
            if let Ok(permit) = self.permits.clone().try_acquire_owned() {
                self.permit_opt = Some(permit);
            } else {
                return Poll::Ready(Err(S::Error::make_load_shed_error()));
            }
        }
        self.inner.poll_ready(cx)
    }

    fn call(&mut self, request: R) -> Self::Future {
        let permit = self
            .permit_opt
            .take()
            .expect("`poll_ready` should be called before `call`");

        LoadShedFuture {
            inner: self.inner.call(request),
            permit,
        }
    }
}

#[pin_project]
#[derive(Debug)]
pub struct LoadShedFuture<F> {
    #[pin]
    inner: F,
    permit: OwnedSemaphorePermit,
}

impl<F, T, E> Future for LoadShedFuture<F>
where F: Future<Output = Result<T, E>>
{
    type Output = Result<T, E>;

    fn poll(self: Pin<&mut Self>, cx: &mut Context<'_>) -> Poll<Self::Output> {
        self.project().inner.poll(cx)
    }
}

/// Allows at most `max_in_flight_requests` in-flight requests before rejecting new incoming
/// requests.
#[derive(Debug, Clone)]
pub struct LoadShedLayer {
    max_in_flight_requests: usize,
}

impl LoadShedLayer {
    /// Creates a new `LoadShedLayer` allowing at most `max_in_flight_requests` in-flight requests
    /// before rejecting new incoming requests.
    pub fn new(max_in_flight_requests: usize) -> Self {
        Self {
            max_in_flight_requests,
        }
    }
}

impl<S> Layer<S> for LoadShedLayer {
    type Service = LoadShed<S>;

    fn layer(&self, service: S) -> Self::Service {
        LoadShed {
            inner: service,
            permits: Arc::new(Semaphore::new(self.max_in_flight_requests)),
            permit_opt: None,
        }
    }
}

#[cfg(test)]
mod tests {
    use tower::{ServiceBuilder, ServiceExt};

    use super::*;

    #[tokio::test]
    async fn test_load_shed() {
        #[derive(Debug)]
        struct MyError;

        impl MakeLoadShedError for MyError {
            fn make_load_shed_error() -> Self {
                MyError
            }
        }
        let mut service = ServiceBuilder::new()
            .layer(LoadShedLayer::new(1))
            .service_fn(|_| async { Ok::<_, MyError>(()) });

        let in_fight_fut = service.ready().await.unwrap().call(());
        service.ready().await.unwrap_err();

        drop(in_fight_fut);
        service.ready().await.unwrap().call(()).await.unwrap();
    }
}


================================================
FILE: quickwit/quickwit-common/src/tower/metrics.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::pin::Pin;
use std::task::{Context, Poll};
use std::time::Instant;

use futures::{Future, ready};
use pin_project::{pin_project, pinned_drop};
use prometheus::exponential_buckets;
use tower::{Layer, Service};

use crate::metrics::{
    HistogramVec, IntCounterVec, IntGaugeVec, new_counter_vec, new_gauge_vec, new_histogram_vec,
};

pub trait RpcName {
    fn rpc_name() -> &'static str;
}

#[derive(Clone)]
pub struct GrpcMetrics<S> {
    inner: S,
    requests_total: IntCounterVec<2>,
    requests_in_flight: IntGaugeVec<1>,
    request_duration_seconds: HistogramVec<2>,
}

impl<S, R> Service<R> for GrpcMetrics<S>
where
    S: Service<R>,
    R: RpcName,
{
    type Response = S::Response;
    type Error = S::Error;
    type Future = ResponseFuture<S::Future>;

    fn poll_ready(&mut self, cx: &mut Context<'_>) -> Poll<Result<(), Self::Error>> {
        self.inner.poll_ready(cx)
    }

    fn call(&mut self, request: R) -> Self::Future {
        let start = Instant::now();
        let rpc_name = R::rpc_name();
        let inner = self.inner.call(request);

        self.requests_in_flight.with_label_values([rpc_name]).inc();

        ResponseFuture {
            inner,
            start,
            rpc_name,
            status: "cancelled",
            requests_total: self.requests_total.clone(),
            requests_in_flight: self.requests_in_flight.clone(),
            request_duration_seconds: self.request_duration_seconds.clone(),
        }
    }
}

#[derive(Clone)]
pub struct GrpcMetricsLayer {
    requests_total: IntCounterVec<2>,
    requests_in_flight: IntGaugeVec<1>,
    request_duration_seconds: HistogramVec<2>,
}

impl GrpcMetricsLayer {
    pub fn new(subsystem: &'static str, kind: &'static str) -> Self {
        Self {
            requests_total: new_counter_vec(
                "grpc_requests_total",
                "Total number of gRPC requests processed.",
                subsystem,
                &[("kind", kind)],
                ["rpc", "status"],
            ),
            requests_in_flight: new_gauge_vec(
                "grpc_requests_in_flight",
                "Number of gRPC requests in-flight.",
                subsystem,
                &[("kind", kind)],
                ["rpc"],
            ),
            request_duration_seconds: new_histogram_vec(
                "grpc_request_duration_seconds",
                "Duration of request in seconds.",
                subsystem,
                &[("kind", kind)],
                ["rpc", "status"],
                exponential_buckets(0.001, 2.0, 12).unwrap(),
            ),
        }
    }
}

impl<S> Layer<S> for GrpcMetricsLayer {
    type Service = GrpcMetrics<S>;

    fn layer(&self, inner: S) -> Self::Service {
        GrpcMetrics {
            inner,
            requests_total: self.requests_total.clone(),
            requests_in_flight: self.requests_in_flight.clone(),
            request_duration_seconds: self.request_duration_seconds.clone(),
        }
    }
}

/// Response future for [`PrometheusMetrics`].
#[pin_project(PinnedDrop)]
pub struct ResponseFuture<F> {
    #[pin]
    inner: F,
    start: Instant,
    rpc_name: &'static str,
    status: &'static str,
    requests_total: IntCounterVec<2>,
    requests_in_flight: IntGaugeVec<1>,
    request_duration_seconds: HistogramVec<2>,
}

#[pinned_drop]
impl<F> PinnedDrop for ResponseFuture<F> {
    fn drop(self: Pin<&mut Self>) {
        let elapsed = self.start.elapsed().as_secs_f64();
        let label_values = [self.rpc_name, self.status];

        self.requests_total.with_label_values(label_values).inc();
        self.request_duration_seconds
            .with_label_values(label_values)
            .observe(elapsed);
        self.requests_in_flight
            .with_label_values([self.rpc_name])
            .dec();
    }
}

impl<F, T, E> Future for ResponseFuture<F>
where F: Future<Output = Result<T, E>>
{
    type Output = Result<T, E>;

    fn poll(self: Pin<&mut Self>, cx: &mut Context<'_>) -> Poll<Self::Output> {
        let this = self.project();
        let response = ready!(this.inner.poll(cx));
        *this.status = if response.is_ok() { "success" } else { "error" };
        Poll::Ready(Ok(response?))
    }
}

#[cfg(test)]
mod tests {
    use super::*;

    struct HelloRequest;

    impl RpcName for HelloRequest {
        fn rpc_name() -> &'static str {
            "hello"
        }
    }

    struct GoodbyeRequest;

    impl RpcName for GoodbyeRequest {
        fn rpc_name() -> &'static str {
            "goodbye"
        }
    }

    #[tokio::test]
    async fn test_grpc_metrics() {
        let layer = GrpcMetricsLayer::new("quickwit_test", "server");

        let mut hello_service =
            layer
                .clone()
                .layer(tower::service_fn(|request: HelloRequest| async move {
                    Ok::<_, ()>(request)
                }));
        let mut goodbye_service =
            layer
                .clone()
                .layer(tower::service_fn(|request: GoodbyeRequest| async move {
                    Ok::<_, ()>(request)
                }));

        hello_service.call(HelloRequest).await.unwrap();

        assert_eq!(
            layer
                .requests_total
                .with_label_values(["hello", "success"])
                .get(),
            1
        );
        assert_eq!(
            layer
                .requests_total
                .with_label_values(["goodbye", "success"])
                .get(),
            0
        );

        goodbye_service.call(GoodbyeRequest).await.unwrap();

        assert_eq!(
            layer
                .requests_total
                .with_label_values(["goodbye", "success"])
                .get(),
            1
        );

        let hello_future = hello_service.call(HelloRequest);
        drop(hello_future);

        assert_eq!(
            layer
                .requests_total
                .with_label_values(["hello", "cancelled"])
                .get(),
            1
        );
    }
}


================================================
FILE: quickwit/quickwit-common/src/tower/mod.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

mod box_layer;
mod box_service;
mod buffer;
mod change;
mod circuit_breaker;
mod delay;
mod estimate_rate;
mod event_listener;
mod load_shed;
mod metrics;
mod one_task_per_call_layer;
mod pool;
mod rate;
mod rate_estimator;
mod rate_limit;
mod retry;
mod timeout;
mod transport;

use std::error;
use std::pin::Pin;

pub use box_layer::BoxLayer;
pub use box_service::BoxService;
pub use buffer::{Buffer, BufferError, BufferLayer};
pub use change::Change;
pub use circuit_breaker::{CircuitBreaker, CircuitBreakerEvaluator, CircuitBreakerLayer};
pub use delay::{Delay, DelayLayer};
pub use estimate_rate::{EstimateRate, EstimateRateLayer};
pub use event_listener::{EventListener, EventListenerLayer};
use futures::Future;
pub use load_shed::{LoadShed, LoadShedLayer, MakeLoadShedError};
pub use metrics::{GrpcMetrics, GrpcMetricsLayer, RpcName};
pub use one_task_per_call_layer::{OneTaskPerCallLayer, TaskCancelled};
pub use pool::Pool;
pub use rate::{ConstantRate, Rate};
pub use rate_estimator::{RateEstimator, SmaRateEstimator};
pub use rate_limit::{RateLimit, RateLimitLayer};
pub use retry::{RetryLayer, RetryPolicy};
pub use timeout::{Timeout, TimeoutExceeded, TimeoutLayer};
pub use transport::{
    BalanceChannel, ClientGrpcConfig, KeepAliveConfig, make_channel, warmup_channel,
};

pub type BoxError = Box<dyn error::Error + Send + Sync + 'static>;

pub type BoxFuture<T, E> = Pin<Box<dyn Future<Output = Result<T, E>> + Send + 'static>>;

pub type BoxFutureInfaillible<T> = Pin<Box<dyn Future<Output = T> + Send + 'static>>;

pub trait Cost {
    fn cost(&self) -> u64;
}


================================================
FILE: quickwit/quickwit-common/src/tower/one_task_per_call_layer.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::fmt;
use std::future::Future;
use std::pin::Pin;
use std::task::{Context, Poll};

use pin_project::pin_project;
use tokio::task::{JoinError, JoinHandle};
use tower::{Layer, Service};
use tracing::error;

use crate::tower::RpcName;

/// This layer spawns a new task for each call to the inner service.
///
/// This is useful for service where the handle is not cancel-safe:
/// On a connection drop for instance, tonic can cancel the Future associated
/// to a request execution.
///
/// By executing it on a dedicated task, we ensure the future is run to
/// completion.
///
/// Disclaimer: This layer should be used with caution, as it means that timeout
/// are not possible anymore.
///
/// It also can behave in an unexpected way when combined with layers like the
/// `GlobalConcurrencyLimitLayer`.
pub struct OneTaskPerCallLayer;

impl<S: Clone> Layer<S> for OneTaskPerCallLayer {
    type Service = OneTaskPerCallService<S>;

    fn layer(&self, service: S) -> Self::Service {
        OneTaskPerCallService { service }
    }
}

#[derive(Clone)]
pub struct OneTaskPerCallService<S> {
    service: S,
}

impl<S, Request> Service<Request> for OneTaskPerCallService<S>
where
    S: Service<Request>,
    S::Future: Send + 'static,
    S::Response: Send + 'static,
    S::Error: From<TaskCancelled> + Send + 'static,
    Request: fmt::Debug + Send + RpcName + 'static,
{
    type Response = S::Response;
    type Error = S::Error;
    type Future = UnwrapOrElseFuture<S::Response, S::Error>;

    fn poll_ready(&mut self, cx: &mut Context<'_>) -> Poll<Result<(), Self::Error>> {
        self.service.poll_ready(cx)
    }

    fn call(&mut self, request: Request) -> Self::Future {
        let request_name: &'static str = Request::rpc_name();
        let future = self.service.call(request);
        let join_handle = tokio::spawn(future);
        UnwrapOrElseFuture {
            request_name,
            join_handle,
        }
    }
}

#[pin_project]
pub struct UnwrapOrElseFuture<T, E> {
    request_name: &'static str,
    #[pin]
    join_handle: JoinHandle<Result<T, E>>,
}

impl<T, E> Future for UnwrapOrElseFuture<T, E>
where E: From<TaskCancelled>
{
    type Output = Result<T, E>;

    fn poll(self: Pin<&mut Self>, cx: &mut Context<'_>) -> Poll<Self::Output> {
        let request_name = self.request_name;
        let pinned_join_handle: Pin<&mut JoinHandle<Result<T, E>>> = self.project().join_handle;
        match pinned_join_handle.poll(cx) {
            Poll::Ready(Ok(Ok(t))) => Poll::Ready(Ok(t)),
            Poll::Ready(Ok(Err(e))) => Poll::Ready(Err(e)),
            Poll::Ready(Err(join_error)) => {
                error!(
                    "task running the request `{}` was cancelled or panicked. please report! \
                     JoinError: {:?}",
                    request_name, join_error
                );
                let task_cancelled = TaskCancelled {
                    request_name,
                    join_error,
                };
                Poll::Ready(Err(E::from(task_cancelled)))
            }
            Poll::Pending => Poll::Pending,
        }
    }
}

pub struct TaskCancelled {
    pub request_name: &'static str,
    pub join_error: JoinError,
}

impl std::fmt::Display for TaskCancelled {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        let TaskCancelled {
            request_name,
            join_error,
        } = self;
        write!(
            f,
            "task running `{request_name}` was cancelled or panicked. JoinError: {join_error:?})"
        )
    }
}

#[cfg(test)]
mod tests {

    use std::sync::Arc;
    use std::time::Duration;

    use tokio::sync::Mutex;
    use tower::ServiceExt;

    use super::*;
    use crate::tower::RpcName;

    #[derive(Debug)]
    struct Request;

    impl RpcName for Request {
        fn rpc_name() -> &'static str {
            "dummy_request"
        }
    }

    #[derive(Debug)]
    struct DummyError;

    impl From<TaskCancelled> for DummyError {
        fn from(_task_cancelled: TaskCancelled) -> DummyError {
            DummyError
        }
    }

    // In this toy example, we want to make sure, upon all observation
    // left == right.
    //
    // In reality, OneTaskPerCallLayer is meant to protect more complicated
    // invariants.
    #[derive(Default)]
    struct State {
        left: usize,
        right: usize,
    }

    #[tokio::test]
    async fn test_task_cancelled() {
        let state: Arc<Mutex<State>> = Default::default();
        let state_clone: Arc<Mutex<State>> = state.clone();
        let service = tower::service_fn(move |_request: Request| {
            let state_clone = state.clone();
            async move {
                let mut lock = state_clone.lock().await;
                assert_eq!(lock.left, lock.right);
                lock.left += 1;
                // If the task was cancelled at this point, it would leave us with
                // a broken invariant.
                tokio::time::sleep(Duration::from_millis(100)).await;
                lock.right += 1;
                Result::Ok::<(), DummyError>(())
            }
        });
        let mut one_task_per_call_service = OneTaskPerCallService { service };
        tokio::select!(
            _ = async { one_task_per_call_service.ready().await.unwrap().call(Request).await } => {
                panic!("this should have timed out");
            },
            _ = tokio::time::sleep(Duration::from_millis(10)) => (),
        );
        let state_guard = state_clone.lock().await;
        assert_eq!(state_guard.left, state_guard.right);
        assert_eq!(state_guard.left, 1);
    }
}


================================================
FILE: quickwit/quickwit-common/src/tower/pool.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::any::TypeId;
use std::borrow::Borrow;
use std::cmp::{Eq, PartialEq};
use std::collections::HashMap;
use std::fmt;
use std::hash::Hash;
use std::sync::{Arc, RwLock};

use futures::{Stream, StreamExt};

use super::Change;

/// A pool of `V` values identified by `K` keys. The pool can be updated manually by calling the
/// `add/remove` methods or by listening to a stream of changes.
pub struct Pool<K, V> {
    pool: Arc<RwLock<HashMap<K, V>>>,
}

impl<K, V> fmt::Debug for Pool<K, V>
where
    K: 'static,
    V: 'static,
{
    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
        write!(f, "Pool<{:?}, {:?}>", TypeId::of::<K>(), TypeId::of::<V>())
    }
}

impl<K, V> Clone for Pool<K, V> {
    fn clone(&self) -> Self {
        Self {
            pool: self.pool.clone(),
        }
    }
}

impl<K, V> Default for Pool<K, V>
where K: Eq + PartialEq + Hash
{
    fn default() -> Self {
        Self {
            pool: Arc::new(RwLock::new(HashMap::default())),
        }
    }
}

impl<K, V> Pool<K, V>
where
    K: Eq + PartialEq + Hash + Clone + Send + Sync + 'static,
    V: Clone + Send + Sync + 'static,
{
    /// Listens for the changes emitted by the stream and updates the pool accordingly.
    pub fn listen_for_changes(
        &self,
        change_stream: impl Stream<Item = Change<K, V>> + Send + 'static,
    ) {
        let pool = self.clone();
        let future = async move {
            change_stream
                .for_each(|change| async {
                    match change {
                        Change::Insert(key, service) => {
                            pool.insert(key, service);
                        }
                        Change::Remove(key) => {
                            pool.remove(&key);
                        }
                    }
                })
                .await;
        };
        tokio::spawn(future);
    }

    /// Returns whether the pool is empty.
    pub fn is_empty(&self) -> bool {
        self.pool
            .read()
            .expect("lock should not be poisoned")
            .is_empty()
    }

    /// Returns the number of values in the pool.
    pub fn len(&self) -> usize {
        self.pool.read().expect("lock should not be poisoned").len()
    }

    /// Returns all the keys in the pool.
    pub fn keys(&self) -> Vec<K> {
        self.pool
            .read()
            .expect("lock should not be poisoned")
            .keys()
            .cloned()
            .collect()
    }

    /// Returns all the key-value pairs in the pool.
    pub fn keys_values(&self) -> Vec<(K, V)> {
        self.pool
            .read()
            .expect("lock should not be poisoned")
            .iter()
            .map(|(key, value)| (key.clone(), value.clone()))
            .collect()
    }

    /// Returns all the values in the pool.
    pub fn values(&self) -> Vec<V> {
        self.pool
            .read()
            .expect("lock should not be poisoned")
            .values()
            .cloned()
            .collect()
    }

    /// Returns all the key-value pairs in the pool.
    pub fn pairs(&self) -> Vec<(K, V)> {
        self.pool
            .read()
            .expect("lock should not be poisoned")
            .iter()
            .map(|(key, value)| (key.clone(), value.clone()))
            .collect()
    }

    /// Returns the value associated with the given key.
    pub fn contains_key<Q>(&self, key: &Q) -> bool
    where
        Q: Hash + Eq + ?Sized,
        K: Borrow<Q>,
    {
        self.pool
            .read()
            .expect("lock should not be poisoned")
            .contains_key(key)
    }

    /// Returns the value associated with the given key.
    pub fn get<Q>(&self, key: &Q) -> Option<V>
    where
        Q: Hash + Eq + ?Sized,
        K: Borrow<Q>,
    {
        self.pool
            .read()
            .expect("lock should not be poisoned")
            .get(key)
            .cloned()
    }

    /// Finds a key in the pool that satisfies the given predicate.
    pub fn find(&self, func: impl Fn(&K, &V) -> bool) -> Option<(K, V)> {
        self.pool
            .read()
            .expect("lock should not be poisoned")
            .iter()
            .find(|(key, value)| func(key, value))
            .map(|(key, value)| (key.clone(), value.clone()))
    }

    /// Adds a value to the pool.
    pub fn insert(&self, key: K, service: V) {
        self.pool
            .write()
            .expect("lock should not be poisoned")
            .insert(key, service);
    }

    /// Removes a value from the pool.
    fn remove(&self, key: &K) {
        self.pool
            .write()
            .expect("lock should not be poisoned")
            .remove(key);
    }
}

impl<K, V> FromIterator<(K, V)> for Pool<K, V>
where K: Eq + PartialEq + Hash
{
    fn from_iter<I>(iter: I) -> Self
    where I: IntoIterator<Item = (K, V)> {
        Self {
            pool: Arc::new(RwLock::new(HashMap::from_iter(iter))),
        }
    }
}

#[cfg(test)]
mod tests {
    use std::time::Duration;

    use tokio_stream::wrappers::ReceiverStream;

    use super::*;

    #[tokio::test]
    async fn test_pool() {
        let (change_stream_tx, change_stream_rx) = tokio::sync::mpsc::channel(10);
        let change_stream = ReceiverStream::new(change_stream_rx);

        let pool = Pool::default();
        pool.listen_for_changes(change_stream);

        assert!(pool.is_empty());
        assert_eq!(pool.len(), 0);

        change_stream_tx.send(Change::Insert(1, 11)).await.unwrap();
        tokio::time::sleep(Duration::from_millis(1)).await;

        assert!(!pool.is_empty());
        assert_eq!(pool.len(), 1);

        assert!(pool.contains_key(&1));
        assert_eq!(pool.get(&1), Some(11));

        change_stream_tx.send(Change::Insert(2, 21)).await.unwrap();
        tokio::time::sleep(Duration::from_millis(1)).await;

        assert_eq!(pool.len(), 2);
        assert_eq!(pool.get(&2), Some(21));

        assert_eq!(pool.find(|k, _| *k == 1), Some((1, 11)));

        let mut pairs = pool.pairs();
        pairs.sort();

        assert_eq!(pairs, vec![(1, 11), (2, 21)]);

        change_stream_tx.send(Change::Insert(1, 12)).await.unwrap();
        tokio::time::sleep(Duration::from_millis(1)).await;

        assert_eq!(pool.get(&1), Some(12));

        change_stream_tx.send(Change::Remove(1)).await.unwrap();
        tokio::time::sleep(Duration::from_millis(1)).await;

        assert_eq!(pool.len(), 1);

        change_stream_tx.send(Change::Remove(2)).await.unwrap();
        tokio::time::sleep(Duration::from_millis(1)).await;

        assert!(pool.is_empty());
    }
}


================================================
FILE: quickwit/quickwit-common/src/tower/rate.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::time::Duration;

use bytesize::ByteSize;

pub trait Rate: Clone {
    /// Returns the amount of work per time period.
    fn work(&self) -> u64;

    /// Returns the amount of work in bytes per time period.
    fn work_bytes(&self) -> ByteSize {
        ByteSize(self.work())
    }

    /// Returns the duration of a time period.
    fn period(&self) -> Duration;
}

/// A rate of unit of work per time period.
#[derive(Debug, Copy, Clone)]
pub struct ConstantRate {
    work: u64,
    period: Duration,
}

impl ConstantRate {
    /// Creates a new constant rate.
    ///
    /// # Panics
    ///
    /// This function panics if `period` is 0 while work is != 0.
    pub const fn new(work: u64, period: Duration) -> Self {
        assert!(!period.is_zero() || work == 0u64);
        Self { work, period }
    }

    pub const fn bytes_per_period(bytes: ByteSize, period: Duration) -> Self {
        let work = bytes.as_u64();
        Self::new(work, period)
    }

    pub const fn bytes_per_sec(bytes: ByteSize) -> Self {
        Self::bytes_per_period(bytes, Duration::from_secs(1))
    }

    /// Changes the scale of the rate, i.e. the duration of the time period, while keeping the rate
    /// constant.
    ///
    /// # Panics
    ///
    /// This function panics if `new_period` is 0.
    pub fn rescale(&self, new_period: Duration) -> Self {
        if self.work == 0u64 {
            return Self::new(0u64, new_period);
        }
        assert!(!new_period.is_zero());
        let new_work = self.work() as u128 * new_period.as_nanos() / self.period().as_nanos();
        Self::new(new_work as u64, new_period)
    }
}

impl Rate for ConstantRate {
    fn work(&self) -> u64 {
        self.work
    }

    fn period(&self) -> Duration {
        self.period
    }
}

#[cfg(test)]
mod tests {
    use super::*;

    #[test]
    #[should_panic]
    fn test_rescale_zero_duration_panics() {
        ConstantRate::bytes_per_period(ByteSize::b(1), Duration::default());
    }

    #[test]
    fn test_rescale_zero_duration_accepted_if_no_work() {
        let rate = ConstantRate::bytes_per_period(ByteSize::b(0), Duration::default());
        let rescaled_rate = rate.rescale(Duration::from_secs(1));
        assert_eq!(rescaled_rate.work_bytes(), ByteSize::b(0));
        assert_eq!(rescaled_rate.period(), Duration::from_secs(1));
    }

    #[test]
    fn test_rescale() {
        let rate = ConstantRate::bytes_per_period(ByteSize::mib(5), Duration::from_secs(5));
        let rescaled_rate = rate.rescale(Duration::from_secs(1));
        assert_eq!(rescaled_rate.work_bytes(), ByteSize::mib(1));
        assert_eq!(rescaled_rate.period(), Duration::from_secs(1));
    }
}


================================================
FILE: quickwit/quickwit-common/src/tower/rate_estimator.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::num::NonZeroUsize;
use std::sync::Arc;
use std::sync::atomic::{AtomicU64, Ordering};
use std::time::{Duration, Instant};

use super::Rate;

pub trait RateEstimator: Rate {
    fn update(&mut self, started_at: Instant, ended_at: Instant, work: u64);
}

/// Simple moving average rate estimator. Tracks the average rate of work over a sliding time
/// window.
#[derive(Debug, Clone)]
pub struct SmaRateEstimator {
    inner: Arc<InnerSmaRateEstimator>,
}

#[derive(Debug)]
struct InnerSmaRateEstimator {
    anchor: Instant,
    buckets: Box<[Bucket]>,
    bucket_period_millis: u64,
    period_millis: u64,
    num_buckets: u64,
}

impl SmaRateEstimator {
    /// Creates a new simple moving average rate estimator.
    ///
    /// The rate returned is the rate measured over the last `n - 1` buckets. The
    /// ongoing bucket is not taken in account.
    /// In other words, we are returning a rolling average that spans over a period
    /// of `num_buckets * bucket_period`.
    ///
    /// The `period` argument is just a `scaling unit`. A period of 1s means that the
    /// the number returned by `work` is expressed in `bytes / second`.
    ///
    /// This rate estimator is bucket-based and outputs the average rate of work over the previous
    /// closed `n-1` buckets.
    ///
    /// # Panics
    ///
    /// This function panics if `bucket_period` is < 1s  or `period` is < 1ms.
    pub fn new(num_buckets: NonZeroUsize, bucket_period: Duration, period: Duration) -> Self {
        assert!(bucket_period.as_millis() >= 100);
        assert!(period.as_millis() > 0);

        let mut buckets = Vec::with_capacity(num_buckets.get());
        for _ in 0..num_buckets.get() {
            buckets.push(Bucket::default());
        }
        let inner = InnerSmaRateEstimator {
            anchor: Instant::now(),
            buckets: buckets.into_boxed_slice(),
            bucket_period_millis: bucket_period.as_millis() as u64,
            num_buckets: num_buckets.get() as u64,
            period_millis: period.as_millis() as u64,
        };
        Self {
            inner: Arc::new(inner),
        }
    }

    fn work_in_bucket(&self, bucket_ord: u64) -> u64 {
        self.inner.buckets[bucket_ord as usize % self.inner.buckets.len()]
            .work_for_bucket(bucket_ord)
    }

    fn work_at(&self, now: Instant) -> u64 {
        let elapsed_ms: u64 = now.duration_since(self.inner.anchor).as_millis() as u64;
        let current_bucket_ord = elapsed_ms / self.inner.bucket_period_millis;
        let num_buckets = self.inner.num_buckets - 1u64;
        let bucket_range = current_bucket_ord.saturating_sub(num_buckets)..current_bucket_ord;
        let cumulative_work: u64 = bucket_range
            .map(|bucket_ord| self.work_in_bucket(bucket_ord))
            .sum();
        (cumulative_work * self.inner.period_millis)
            / (self.inner.bucket_period_millis * num_buckets)
    }
}

impl Rate for SmaRateEstimator {
    /// Returns the estimated amount of work performed during a `period`.
    ///
    /// This estimation is computed by summing the amount of work performed tracked in the previous
    /// `n-1` buckets and dividing it by the duration of the `n-1` periods.
    fn work(&self) -> u64 {
        self.work_at(Instant::now())
    }

    fn period(&self) -> Duration {
        Duration::from_millis(self.inner.period_millis)
    }
}

#[inline]
fn compute_bucket_ord_hash(bucket_ord: u64) -> u8 {
    // We pick 241 because it is the highest prime number below 256
    // that can be computed easily.
    //
    // The fact that it is prime makes it so that it is complemented by the
    // bucket id for any value of num_buckets (well except multiples of 241)
    // thanks to the chinese theorem.
    (bucket_ord % 241) as u8
}

impl RateEstimator for SmaRateEstimator {
    fn update(&mut self, _started_at: Instant, ended_at: Instant, work: u64) {
        let elapsed = ended_at.duration_since(self.inner.anchor).as_millis() as u64;
        let num_buckets = self.inner.num_buckets;
        let bucket_ord = elapsed / self.inner.bucket_period_millis;
        let bucket = &self.inner.buckets[(bucket_ord % num_buckets) as usize];
        bucket.increment_work(work, bucket_ord);
    }
}

/// Rate estimator bucket. The 56 least significant bits of the atomic integer store the amount of
/// work, while the most significant 8 bits are encoding a well-thought hash of the bucket ord.
///
/// The hash is used to ensure that we know exactly when to reset the bucket's work.
#[derive(Debug, Default)]
struct Bucket {
    // This atomic is actually encoding two things:
    // - low bits [0..56): the amount of work recorded in the bucket.
    // - high bits [56..64): the bucket ord, or rather its last 8 bits.
    bits: AtomicU64,
}

const WORK_MASK: u64 = (1u64 << 56) - 1;

struct BucketVal {
    work: u64,
    bucket_ord_hash: u8,
}

impl From<u64> for BucketVal {
    #[inline]
    fn from(bucket_bits: u64) -> BucketVal {
        BucketVal {
            work: bucket_bits & WORK_MASK,
            bucket_ord_hash: (bucket_bits >> 56) as u8,
        }
    }
}

impl From<BucketVal> for u64 {
    #[inline]
    fn from(value: BucketVal) -> Self {
        (value.bucket_ord_hash as u64) << 56 | value.work
    }
}

impl Bucket {
    fn work_for_bucket(&self, bucket_ord: u64) -> u64 {
        let bucket_val = BucketVal::from(self.bits.load(Ordering::Relaxed));
        if bucket_val.bucket_ord_hash == compute_bucket_ord_hash(bucket_ord) {
            bucket_val.work
        } else {
            0
        }
    }

    fn increment_work(&self, work: u64, bucket_ord: u64) {
        let expected_bucket_ord_hash: u8 = compute_bucket_ord_hash(bucket_ord);
        let current_bits = self.bits.fetch_add(work, Ordering::Relaxed) + work;
        let bucket_val = BucketVal::from(current_bits);

        // This is not the bucket we targeted, we need to retry and update the bucket with the new
        // bucket_ord and a reset value.
        if bucket_val.bucket_ord_hash != expected_bucket_ord_hash {
            let mut expected_bits = current_bits;
            let new_bits: u64 = BucketVal {
                work,
                bucket_ord_hash: expected_bucket_ord_hash,
            }
            .into();

            while let Err(current_bits) = self.bits.compare_exchange(
                expected_bits,
                new_bits,
                Ordering::AcqRel,
                Ordering::Acquire,
            ) {
                if BucketVal::from(current_bits).bucket_ord_hash == expected_bucket_ord_hash {
                    // Some thread managed to successfully flip the color. We're good.
                    self.bits.fetch_add(work, Ordering::Relaxed);
                    break;
                } else {
                    // We keep trying.
                    expected_bits = current_bits;
                }
            }
        }
    }
}

#[cfg(test)]
mod tests {
    use std::sync::Barrier;
    use std::thread;

    use super::*;

    #[test]
    fn test_bucket() {
        let bucket = Bucket::default();
        assert_eq!(bucket.work_for_bucket(0u64), 0);

        // First pass, the bucket is red.
        bucket.increment_work(1, 0u64);
        assert_eq!(bucket.work_for_bucket(0u64), 1);
        assert_eq!(bucket.work_for_bucket(1u64), 0);

        bucket.increment_work(2, 0u64);
        assert_eq!(bucket.work_for_bucket(0u64), 3);

        // Second pass, the bucket is now black.
        bucket.increment_work(5, 1u64);
        assert_eq!(bucket.work_for_bucket(1u64), 5);
        assert_eq!(bucket.work_for_bucket(0u64), 0);

        bucket.increment_work(7, 1u64);
        assert_eq!(bucket.work_for_bucket(1u64), 12);

        // Third pass, the bucket is red again.
        bucket.increment_work(9, 2u64);
        assert_eq!(bucket.work_for_bucket(2u64), 9);

        bucket.increment_work(11, 2u64);
        assert_eq!(bucket.work_for_bucket(2u64), 20);

        for num_threads in [1, 2, 3, 5, 10, 20] {
            let barrier = Arc::new(Barrier::new(num_threads));
            let bucket = Arc::new(Bucket::default());
            let mut cumulative_work = 0;
            let mut handles = Vec::with_capacity(num_threads);

            for i in 0..num_threads {
                let barrier = barrier.clone();
                let bucket = bucket.clone();
                cumulative_work += i as u64;

                handles.push(thread::spawn(move || {
                    barrier.wait();
                    // First time we increment the work in this second pass. All the threads will
                    // attempt to flip the bucket's color. Only one should succeed.
                    bucket.increment_work(i as u64, 3u64);
                }));
            }
            for handle in handles {
                handle.join().unwrap();
            }
            assert_eq!(bucket.work_for_bucket(3u64), cumulative_work);
        }
    }

    #[test]
    fn test_sma_rate_estimator() {
        let num_buckets = NonZeroUsize::new(3).unwrap();
        let bucket_period = Duration::from_secs(1);
        let period = Duration::from_millis(100);

        let mut estimator = SmaRateEstimator::new(num_buckets, bucket_period, period);
        assert_eq!(estimator.work(), 0);
        assert_eq!(estimator.period(), Duration::from_millis(100));

        let anchor = estimator.inner.anchor;

        let started_at = anchor;
        let ended_at = started_at + Duration::from_millis(0);
        estimator.update(started_at, ended_at, 100);
        assert_eq!(estimator.inner.buckets[0].work_for_bucket(0), 100);

        let ended_at = started_at + Duration::from_millis(999);
        estimator.update(started_at, ended_at, 200);
        assert_eq!(estimator.inner.buckets[0].work_for_bucket(0), 300);

        assert_eq!(estimator.work_at(anchor), 0);

        let ended_at = started_at + Duration::from_millis(1_000);
        estimator.update(started_at, ended_at, 300);
        assert_eq!(estimator.inner.buckets[1].work_for_bucket(1), 300);

        let ended_at = started_at + Duration::from_millis(1_999);
        estimator.update(started_at, ended_at, 600);
        assert_eq!(estimator.inner.buckets[1].work_for_bucket(1), 900);

        assert_eq!(
            estimator.work_at(anchor + Duration::from_secs(2)),
            (300 + 900) / 20
        );

        let ended_at = started_at + Duration::from_millis(2_000);
        estimator.update(started_at, ended_at, 800);
        assert_eq!(estimator.inner.buckets[2].work_for_bucket(2), 800);

        let ended_at = started_at + Duration::from_millis(2_999);
        estimator.update(started_at, ended_at, 1_000);
        assert_eq!(estimator.inner.buckets[2].work_for_bucket(2), 1_800);

        assert_eq!(estimator.work_at(anchor + Duration::from_secs(3)), 135);

        let ended_at = started_at + Duration::from_millis(3_000);
        estimator.update(started_at, ended_at, 500);
        assert_eq!(estimator.inner.buckets[0].work_for_bucket(0), 0);
        assert_eq!(estimator.inner.buckets[0].work_for_bucket(3), 500);
    }

    #[test]
    fn test_sma_rate_skipped_bucket() {
        let num_buckets = NonZeroUsize::new(10).unwrap();
        let bucket_period = Duration::from_secs(1);
        let period = Duration::from_secs(1);

        let mut estimator = SmaRateEstimator::new(num_buckets, bucket_period, period);

        assert_eq!(estimator.work(), 0);

        let anchor = estimator.inner.anchor;

        // We fill all of the bucket with 100 work.
        for i in 0..10 {
            let ended_at = anchor + Duration::from_secs(1) * i;
            estimator.update(ended_at, ended_at, 100);
        }

        assert_eq!(estimator.work_at(anchor + Duration::from_secs(10)), 100);

        // Now let's assume there isn't any work ongoing for 4s.
        // Over the last 9 seconds, we have received 500 works
        //
        // After the reset, we should have the following buckets:
        // We expect a mean of 44 work/s.
        // |0, 0, 0, 0, 0, 100*, 100, 100, 100, 100|
        //
        // Since the current bucket (idx = 5) is not taken into account, this leads
        // to an average of 400 / 9 = 44 work units.
        assert_eq!(estimator.work_at(anchor + Duration::from_secs(15)), 44);
    }
}


================================================
FILE: quickwit/quickwit-common/src/tower/rate_limit.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::future::Future;
use std::pin::Pin;
use std::task::{Context, Poll};

use futures::ready;
use tokio::time::{Instant, Sleep};
use tower::{Layer, Service};

use super::Cost;
use super::rate::Rate;

/// Enforces a rate limit on the quantity of work the underlying
/// service can handle over a period of time. This implementation is a generalization of
/// `tower::limit::RateLimit`, which is limited to a constant rate of requests over a period of
/// time.
#[derive(Debug)]
pub struct RateLimit<S, T> {
    inner: S,
    rate: T,
    state: State,
    sleep: Pin<Box<Sleep>>,
}

#[derive(Debug)]
enum State {
    // The service has hit its limit.
    Limited { debit: u64 },
    Ready { deadline: Instant, credit: u64 },
}

impl<S, T> RateLimit<S, T>
where T: Rate
{
    /// Creates a new rate limiter.
    pub fn new(inner: S, rate: T) -> Self {
        let deadline = Instant::now();
        let state = State::Ready {
            deadline,
            credit: rate.work(),
        };

        Self {
            inner,
            rate,
            state,
            // The sleep won't actually be used with this duration, but
            // we create it eagerly so that we can reset it in place rather than
            // `Box::pin`ning a new `Sleep` every time we need one.
            sleep: Box::pin(tokio::time::sleep_until(deadline)),
        }
    }

    /// Gets a reference to the inner service.
    pub fn get_ref(&self) -> &S {
        &self.inner
    }

    /// Gets a mutable reference to the inner service.
    pub fn get_mut(&mut self) -> &mut S {
        &mut self.inner
    }

    /// Consumes `self`, returning the inner service
    pub fn into_inner(self) -> S {
        self.inner
    }
}

impl<S, R, T> Service<R> for RateLimit<S, T>
where
    S: Service<R>,
    R: Cost,
    T: Rate,
{
    type Response = S::Response;
    type Error = S::Error;
    type Future = S::Future;

    fn poll_ready(&mut self, cx: &mut Context<'_>) -> Poll<Result<(), Self::Error>> {
        let debit = match self.state {
            State::Ready { .. } => return Poll::Ready(ready!(self.inner.poll_ready(cx))),
            State::Limited { debit } => {
                if Pin::new(&mut self.sleep).poll(cx).is_pending() {
                    return Poll::Pending;
                }
                debit
            }
        };
        let deposit = self.rate.work();

        if deposit >= debit {
            self.state = State::Ready {
                deadline: Instant::now() + self.rate.period(),
                credit: deposit - debit,
            };
            Poll::Ready(ready!(self.inner.poll_ready(cx)))
        } else {
            self.state = State::Limited {
                debit: debit - deposit,
            };
            self.sleep
                .as_mut()
                .reset(Instant::now() + self.rate.period());
            Poll::Pending
        }
    }

    fn call(&mut self, request: R) -> Self::Future {
        match self.state {
            State::Ready {
                mut deadline,
                mut credit,
            } => {
                let now = Instant::now();

                // If the period has elapsed, reset it.
                if now >= deadline {
                    deadline = now + self.rate.period();
                    credit = self.rate.work();
                }
                let withdrawal = request.cost();

                if credit >= withdrawal {
                    credit -= withdrawal;
                    self.state = State::Ready { deadline, credit };
                } else {
                    // The service is disabled until further notice
                    // Reset the sleep future in place, so that we don't have to
                    // deallocate the existing box and allocate a new one.
                    let debit = withdrawal - credit;
                    self.state = State::Limited { debit };
                    self.sleep.as_mut().reset(deadline);
                }

                // Call the inner future
                self.inner.call(request)
            }
            State::Limited { .. } => {
                panic!("Service not ready; `poll_ready` must be called first!")
            }
        }
    }
}

/// Enforces a rate limit on the quantity of work the underlying
/// service can handle over a period of time.
#[derive(Debug, Clone)]
pub struct RateLimitLayer<T> {
    rate: T,
}

impl<T> RateLimitLayer<T> {
    /// Creates new rate limit layer.
    pub fn new(rate: T) -> Self {
        Self { rate }
    }
}

impl<S, T> Layer<S> for RateLimitLayer<T>
where T: Rate
{
    type Service = RateLimit<S, T>;

    fn layer(&self, service: S) -> Self::Service {
        RateLimit::new(service, self.rate.clone())
    }
}

#[cfg(test)]
mod tests {

    use std::sync::Arc;
    use std::sync::atomic::{AtomicU64, Ordering};
    use std::time::Duration;

    use futures::future::join_all;
    use tower::{ServiceBuilder, ServiceExt};

    use super::*;
    use crate::tower::buffer::BufferError;
    use crate::tower::{BufferLayer, ConstantRate};

    struct Request {
        cost: u64,
    }

    impl Request {
        fn random() -> Self {
            Self {
                cost: rand::random::<u64>() % 100,
            }
        }
    }

    impl Cost for Request {
        fn cost(&self) -> u64 {
            self.cost
        }
    }

    #[derive(Debug, Clone, thiserror::Error)]
    #[error("rate meter error")]
    struct RateMeterError;

    impl From<BufferError> for RateMeterError {
        fn from(_: BufferError) -> Self {
            Self
        }
    }

    #[derive(Debug, Clone)]
    struct RateMeter {
        cumulated_work: Arc<AtomicU64>,
    }

    impl RateMeter {
        fn new() -> Self {
            Self {
                cumulated_work: Arc::new(AtomicU64::new(0)),
            }
        }
    }

    impl Service<Request> for RateMeter {
        type Response = ();
        type Error = RateMeterError;
        type Future = futures::future::Ready<Result<Self::Response, Self::Error>>;

        fn poll_ready(&mut self, _: &mut Context<'_>) -> Poll<Result<(), Self::Error>> {
            Poll::Ready(Ok(()))
        }

        fn call(&mut self, request: Request) -> Self::Future {
            self.cumulated_work
                .fetch_add(request.cost, Ordering::Relaxed);
            futures::future::ready(Ok(()))
        }
    }

    #[tokio::test]
    async fn test_rate_limit_over_multiple_periods() {
        let work = 1000;
        let period = 100;

        let rate = ConstantRate::new(work, Duration::from_millis(period));
        let meter = RateMeter::new();
        let mut service = ServiceBuilder::new()
            .layer(BufferLayer::new(10))
            .layer(RateLimitLayer::new(rate))
            .service(meter.clone());

        let now = Instant::now();
        service
            .ready()
            .await
            .unwrap()
            .call(Request { cost: 1 })
            .await
            .unwrap();
        // The request should go through immediately but in some rare instance the test is slow to
        // run and the call to `call` takes more than 1 ms.
        assert!(now.elapsed() < Duration::from_millis(5));

        let now = Instant::now();
        // The first request goes through, but the second one is rate limited.
        service
            .ready()
            .await
            .unwrap()
            .call(Request { cost: 2 * work - 1 })
            .await
            .unwrap();
        service
            .ready()
            .await
            .unwrap()
            .call(Request { cost: 1 })
            .await
            .unwrap();
        assert!(now.elapsed() >= Duration::from_millis(period));
        assert!(now.elapsed() < Duration::from_millis(2 * period));
    }

    #[tokio::test]
    async fn test_rate_limit() {
        let work = 1000;
        let period = 100;
        let deadline = 500;
        let expected_cumulated_work = work * (deadline / period);

        let rate = ConstantRate::new(work, Duration::from_millis(period));
        let meter = RateMeter::new();
        let service = ServiceBuilder::new()
            .layer(BufferLayer::new(10))
            .layer(RateLimitLayer::new(rate))
            .service(meter.clone());

        let futures = (0..5).map(|_| {
            let mut service = service.clone();
            tokio::time::timeout(Duration::from_millis(deadline), async move {
                loop {
                    service
                        .ready()
                        .await
                        .unwrap()
                        .call(Request::random())
                        .await
                        .unwrap();
                }
            })
        });
        join_all(futures).await;
        let cumulated_work = meter.cumulated_work.load(Ordering::Relaxed);
        assert!(cumulated_work > expected_cumulated_work * 95 / 100);
        assert!(cumulated_work < expected_cumulated_work * 105 / 100)
    }
}


================================================
FILE: quickwit/quickwit-common/src/tower/retry.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::any::type_name;
use std::fmt;

use tokio::time::Sleep;
use tower::Layer;
use tower::retry::{Policy, Retry};
use tracing::debug;

use crate::retry::{RetryParams, Retryable};

/// Retry layer copy/pasted from `tower::retry::RetryLayer`
/// but which implements `Clone`.
impl<P, S> Layer<S> for RetryLayer<P>
where P: Clone
{
    type Service = Retry<P, S>;

    fn layer(&self, service: S) -> Self::Service {
        let policy = self.policy.clone();
        Retry::new(policy, service)
    }
}

#[derive(Clone, Debug)]
pub struct RetryLayer<P> {
    policy: P,
}

impl<P> RetryLayer<P> {
    /// Create a new [`RetryLayer`] from a retry policy
    pub fn new(policy: P) -> Self {
        RetryLayer { policy }
    }
}

#[derive(Clone, Copy, Debug)]
pub struct RetryPolicy {
    num_attempts: usize,
    retry_params: RetryParams,
}

impl From<RetryParams> for RetryPolicy {
    fn from(retry_params: RetryParams) -> Self {
        Self {
            num_attempts: 0,
            retry_params,
        }
    }
}

impl<R, T, E> Policy<R, T, E> for RetryPolicy
where
    R: Clone,
    E: fmt::Debug + Retryable,
{
    type Future = Sleep;

    fn retry(&mut self, _request: &mut R, result: &mut Result<T, E>) -> Option<Self::Future> {
        match result {
            Ok(_) => None,
            Err(error) => {
                self.num_attempts += 1;

                if !error.is_retryable() || self.num_attempts >= self.retry_params.max_attempts {
                    None
                } else {
                    let delay = self.retry_params.compute_delay(self.num_attempts);
                    debug!(
                        num_attempts=%self.num_attempts,
                        delay_millis=%delay.as_millis(),
                        error=?error,
                        "{} request failed, retrying.", type_name::<R>()
                    );
                    let sleep_fut = tokio::time::sleep(delay);
                    Some(sleep_fut)
                }
            }
        }
    }

    fn clone_request(&mut self, request: &R) -> Option<R> {
        Some(request.clone())
    }
}

#[cfg(test)]
mod tests {
    use std::sync::atomic::{AtomicUsize, Ordering};
    use std::sync::{Arc, Mutex};
    use std::task::{Context, Poll};

    use futures::future::{Ready, ready};
    use tower::{Layer, Service, ServiceExt};

    use super::*;

    #[derive(Debug, Eq, PartialEq)]
    pub enum Retry<E> {
        Permanent(E),
        Transient(E),
    }

    impl<E> Retryable for Retry<E> {
        fn is_retryable(&self) -> bool {
            match self {
                Retry::Permanent(_) => false,
                Retry::Transient(_) => true,
            }
        }
    }

    #[derive(Debug, Clone, Default)]
    struct HelloService;

    type HelloResults = Arc<Mutex<Vec<Result<(), Retry<()>>>>>;

    #[derive(Debug, Clone, Default)]
    struct HelloRequest {
        num_attempts: Arc<AtomicUsize>,
        results: HelloResults,
    }

    impl Service<HelloRequest> for HelloService {
        type Response = ();
        type Error = Retry<()>;
        type Future = Ready<Result<(), Retry<()>>>;

        fn poll_ready(&mut self, _cx: &mut Context<'_>) -> Poll<Result<(), Self::Error>> {
            Poll::Ready(Ok(()))
        }

        fn call(&mut self, request: HelloRequest) -> Self::Future {
            request.num_attempts.fetch_add(1, Ordering::Relaxed);
            let result = request
                .results
                .lock()
                .expect("lock should not be poisoned")
                .pop()
                .unwrap_or(Err(Retry::Permanent(())));
            ready(result)
        }
    }

    #[tokio::test]
    async fn test_retry_policy() {
        let retry_policy = RetryPolicy::from(RetryParams::for_test());
        let retry_layer = RetryLayer::new(retry_policy);
        let mut retry_hello_service = retry_layer.layer(HelloService);

        let hello_request = HelloRequest {
            results: Arc::new(Mutex::new(vec![Ok(())])),
            ..Default::default()
        };
        retry_hello_service
            .ready()
            .await
            .unwrap()
            .call(hello_request.clone())
            .await
            .unwrap();
        assert_eq!(hello_request.num_attempts.load(Ordering::Relaxed), 1);

        let hello_request = HelloRequest {
            results: Arc::new(Mutex::new(vec![Ok(()), Err(Retry::Transient(()))])),
            ..Default::default()
        };
        retry_hello_service
            .ready()
            .await
            .unwrap()
            .call(hello_request.clone())
            .await
            .unwrap();
        assert_eq!(hello_request.num_attempts.load(Ordering::Relaxed), 2);

        let hello_request = HelloRequest {
            results: Arc::new(Mutex::new(vec![
                Err(Retry::Transient(())),
                Err(Retry::Transient(())),
                Err(Retry::Transient(())),
            ])),
            ..Default::default()
        };
        retry_hello_service
            .ready()
            .await
            .unwrap()
            .call(hello_request.clone())
            .await
            .unwrap_err();
        assert_eq!(hello_request.num_attempts.load(Ordering::Relaxed), 3);

        let hello_request = HelloRequest::default();
        retry_hello_service
            .ready()
            .await
            .unwrap()
            .call(hello_request.clone())
            .await
            .unwrap_err();
        assert_eq!(hello_request.num_attempts.load(Ordering::Relaxed), 1);
    }
}


================================================
FILE: quickwit/quickwit-common/src/tower/timeout.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::future::Future;
use std::pin::Pin;
use std::task::{Context, Poll};
use std::time::Duration;

use pin_project::pin_project;
use tokio::time::Sleep;
use tower::{Layer, Service};

#[derive(Debug, Clone)]
pub struct Timeout<S> {
    service: S,
    timeout: Duration,
}
impl<S> Timeout<S> {
    /// Creates a new [`Timeout`]
    pub fn new(service: S, timeout: Duration) -> Self {
        Timeout { service, timeout }
    }
}

impl<S, R> Service<R> for Timeout<S>
where
    S: Service<R>,
    S::Error: From<TimeoutExceeded>,
{
    type Response = S::Response;
    type Error = S::Error;
    type Future = TimeoutFuture<S::Future>;

    fn poll_ready(&mut self, cx: &mut Context<'_>) -> Poll<Result<(), Self::Error>> {
        self.service.poll_ready(cx)
    }

    fn call(&mut self, request: R) -> Self::Future {
        TimeoutFuture {
            inner: self.service.call(request),
            sleep: tokio::time::sleep(self.timeout),
        }
    }
}

/// The error type for the `Timeout` service.
#[derive(Debug, PartialEq, Eq)]
pub struct TimeoutExceeded;

#[pin_project]
#[derive(Debug)]
pub struct TimeoutFuture<F> {
    #[pin]
    inner: F,
    #[pin]
    sleep: Sleep,
}

impl<F, T, E> Future for TimeoutFuture<F>
where
    F: Future<Output = Result<T, E>>,
    E: From<TimeoutExceeded>,
{
    type Output = Result<T, E>;

    fn poll(self: Pin<&mut Self>, cx: &mut Context<'_>) -> Poll<Self::Output> {
        let this = self.project();

        match this.inner.poll(cx) {
            Poll::Ready(v) => return Poll::Ready(v),
            Poll::Pending => {}
        }

        // Now check the timeout
        match this.sleep.poll(cx) {
            Poll::Pending => Poll::Pending,
            Poll::Ready(_) => Poll::Ready(Err(TimeoutExceeded.into())),
        }
    }
}

/// This is similar to tower's Timeout Layer except it requires
/// the error of the service to implement `From<TimeoutExceeded>`.
///
/// If the inner service does not complete within the specified duration,
/// the response will be aborted with the error `TimeoutExceeded`.
///
/// Note that when used in combination with a retry layer, this should be
/// stacked on top of it for the timeout to be retried.
#[derive(Debug, Clone)]
pub struct TimeoutLayer {
    timeout: Duration,
}

impl TimeoutLayer {
    /// Creates a new `TimeoutLayer` with the specified delay.
    pub fn new(timeout: Duration) -> Self {
        Self { timeout }
    }
}

impl<S> Layer<S> for TimeoutLayer {
    type Service = Timeout<S>;

    fn layer(&self, service: S) -> Self::Service {
        Timeout::new(service, self.timeout)
    }
}

#[cfg(test)]
mod tests {
    use tokio::time::Duration;
    use tower::{ServiceBuilder, ServiceExt};

    use super::*;

    #[tokio::test]
    async fn test_timeout() {
        let delay = Duration::from_millis(100);
        let mut service = ServiceBuilder::new()
            .layer(TimeoutLayer::new(delay))
            .service_fn(|_| async {
                // sleep for 1 sec
                tokio::time::sleep(Duration::from_secs(1)).await;
                Ok::<_, TimeoutExceeded>(())
            });

        let res = service.ready().await.unwrap().call(()).await;
        assert_eq!(res, Err(TimeoutExceeded));
    }
}


================================================
FILE: quickwit/quickwit-common/src/tower/transport.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::HashSet;
use std::convert::Infallible;
use std::fmt;
use std::hash::Hash;
use std::net::SocketAddr;
use std::pin::Pin;
use std::task::{Context, Poll};
use std::time::Duration;

use futures::stream::once;
use futures::{Stream, StreamExt};
use tokio::sync::{mpsc, watch};
use tokio_stream::wrappers::UnboundedReceiverStream;
use tonic::transport::channel::ClientTlsConfig;
use tonic::transport::{Channel, Endpoint, Uri};
use tower::balance::p2c::Balance;
use tower::buffer::Buffer;
use tower::discover::Change as TowerChange;
use tower::load::{CompleteOnResponse, PendingRequestsDiscover};
use tower::{BoxError, Service, ServiceExt};

use super::{BoxFuture, Change};
use crate::BoxStream;

// Transforms a boxed stream of `Change<K, Channel>` into a stream of `Result<TowerChange<K,
// Channel>, Infallible>>` while keeping track of the number of connections.
struct ChangeStreamAdapter<K> {
    changes: BoxStream<Change<K, Channel>>,
    connection_keys_tx: watch::Sender<HashSet<K>>,
    keys: HashSet<K>,
}

// A blanket `Discover` implementation exists for any `Stream<Item = Result<Change<K, V>, E>>`
impl<K> Stream for ChangeStreamAdapter<K>
where K: Hash + Eq + Clone
{
    type Item = Result<TowerChange<K, Channel>, Infallible>;

    fn poll_next(mut self: Pin<&mut Self>, cx: &mut Context<'_>) -> Poll<Option<Self::Item>> {
        match Pin::new(&mut *self.changes).poll_next(cx) {
            Poll::Pending | Poll::Ready(None) => Poll::Pending,
            Poll::Ready(Some(change)) => match change {
                Change::Insert(key, channel) => {
                    if self.keys.insert(key.clone()) {
                        self.connection_keys_tx.send_modify(|connection_keys| {
                            connection_keys.insert(key.clone());
                        });
                    }
                    Poll::Ready(Some(Ok(TowerChange::Insert(key, channel))))
                }
                Change::Remove(key) => {
                    if self.keys.remove(&key) {
                        self.connection_keys_tx.send_modify(|connection_keys| {
                            connection_keys.remove(&key);
                        });
                    }
                    Poll::Ready(Some(Ok(TowerChange::Remove(key))))
                }
            },
        }
    }
}

impl<K> Unpin for ChangeStreamAdapter<K> where K: Hash + Eq + Clone {}

type HttpRequest = http::Request<tonic::body::Body>;
type HttpResponse = http::Response<tonic::body::Body>;
type ChangeStream<K> = UnboundedReceiverStream<Result<TowerChange<K, Channel>, Infallible>>;
type Discover<K> = PendingRequestsDiscover<ChangeStream<K>, CompleteOnResponse>;
type ChannelImpl<K> =
    Buffer<HttpRequest, <Balance<Discover<K>, HttpRequest> as Service<HttpRequest>>::Future>;

#[derive(Clone)]
pub struct BalanceChannel<K: Hash + Eq + Clone + Send> {
    inner: ChannelImpl<K>,
    connection_keys_rx: watch::Receiver<HashSet<K>>,
}

impl<K> BalanceChannel<K>
where K: Hash + Eq + Send + Sync + Clone + 'static
{
    pub fn new() -> (Self, mpsc::UnboundedSender<Change<K, Channel>>) {
        let (change_tx, change_rx) = mpsc::unbounded_channel();
        let changes = UnboundedReceiverStream::new(change_rx);
        let channel = Self::from_stream(changes);
        (channel, change_tx)
    }

    pub fn from_channel(key: K, channel: Channel) -> Self {
        Self::from_stream(once(Box::pin(async { Change::Insert(key, channel) })))
    }

    pub fn from_stream<S>(changes: S) -> Self
    where S: Stream<Item = Change<K, Channel>> + Send + Unpin + 'static {
        let (connection_keys_tx, connection_keys_rx) = watch::channel(HashSet::new());
        let change_stream = unlazy_stream(ChangeStreamAdapter::<K> {
            changes: Box::pin(changes),
            connection_keys_tx,
            keys: HashSet::new(),
        });
        let completion = CompleteOnResponse::default();
        let pending_requests_discover = PendingRequestsDiscover::new(change_stream, completion);
        let balance_svc = Balance::new(pending_requests_discover);
        let buffer_svc = Buffer::new(balance_svc, 512);

        BalanceChannel {
            inner: buffer_svc,
            connection_keys_rx,
        }
    }

    pub fn num_connections(&self) -> usize {
        self.connection_keys_rx.borrow().len()
    }

    pub fn connection_keys_watcher(&self) -> watch::Receiver<HashSet<K>> {
        self.connection_keys_rx.clone()
    }

    pub async fn wait_for(
        &self,
        timeout_after: Duration,
        predicate: impl Fn(&HashSet<K>) -> bool,
    ) -> bool {
        tokio::time::timeout(
            timeout_after,
            self.connection_keys_watcher().wait_for(predicate),
        )
        .await
        .is_ok()
    }
}

/// `tower::buffer::Buffer` and `tower::balance::Balance` lazily polls their inner services. As a
/// result, the underlying discover stream is only polled when requests are made to the
/// `BalanceChannel`. When the channel is idle, the pool of connections is not updated and
/// `num_connections` can be inaccurate. Since this number is used to determine whether a service is
/// ready or not, we must poll the stream eagerly to always supply an up-to-date value.
fn unlazy_stream<S, T>(mut inner_stream: S) -> UnboundedReceiverStream<T>
where
    T: Send + 'static,
    S: Stream<Item = T> + Send + Unpin + 'static,
{
    let (outer_stream_tx, outer_stream_rx) = mpsc::unbounded_channel();
    let future = async move {
        while let Some(item) = inner_stream.next().await {
            if outer_stream_tx.send(item).is_err() {
                break;
            }
        }
    };
    tokio::spawn(future);
    UnboundedReceiverStream::new(outer_stream_rx)
}

impl<K> Service<HttpRequest> for BalanceChannel<K>
where K: Hash + Eq + Clone + Send
{
    type Response = HttpResponse;
    type Error = BoxError;
    type Future = BoxFuture<HttpResponse, BoxError>;

    fn poll_ready(&mut self, cx: &mut Context<'_>) -> Poll<Result<(), Self::Error>> {
        self.inner.poll_ready(cx)
    }

    fn call(&mut self, request: HttpRequest) -> Self::Future {
        Box::pin(self.inner.call(request))
    }
}

impl<K> fmt::Debug for BalanceChannel<K>
where K: Hash + Eq + Clone + Send + Sync + 'static
{
    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
        f.debug_struct("BalanceChannel")
            .field("num_connections", &self.num_connections())
            .finish()
    }
}

#[derive(Clone, Debug, Eq, PartialEq)]
pub struct KeepAliveConfig {
    pub interval: Duration,
    pub timeout: Duration,
}

#[derive(Clone, Default)]
pub struct ClientGrpcConfig {
    pub keep_alive_opt: Option<KeepAliveConfig>,
    pub tls_config_opt: Option<ClientTlsConfig>,
}

/// Creates a channel from a socket address.
///
/// The function is marked as `async` because it requires an executor (`connect_lazy`).
pub async fn make_channel(
    socket_addr: SocketAddr,
    client_grpc_config: ClientGrpcConfig,
) -> Channel {
    let ClientGrpcConfig {
        keep_alive_opt,
        tls_config_opt,
    } = client_grpc_config;
    let scheme = if tls_config_opt.is_some() {
        "https"
    } else {
        "http"
    };
    let uri = Uri::builder()
        .scheme(scheme)
        .authority(socket_addr.to_string())
        .path_and_query("/")
        .build()
        .expect("provided arguments should be valid");
    let mut endpoint = Endpoint::from(uri).connect_timeout(Duration::from_secs(5));
    if let Some(tls_config) = tls_config_opt {
        endpoint = endpoint.tls_config(tls_config).expect("sadness TODO");
    }
    if let Some(keep_alive) = keep_alive_opt {
        endpoint = endpoint
            .keep_alive_while_idle(true)
            .http2_keep_alive_interval(keep_alive.interval)
            .keep_alive_timeout(keep_alive.timeout);
    }
    endpoint.connect_lazy()
}

/// Forces a channel to initiate the underlying HTTP connection. Calling this function only makes
/// sense for channels connected lazily.
///
/// The function is marked as `async` because it requires a tokio runtime.
pub async fn warmup_channel(channel: Channel) {
    tokio::spawn(channel.ready_oneshot());
}

#[cfg(test)]
mod tests {
    use futures::StreamExt;
    use tonic::transport::Endpoint;
    use tower::ServiceExt;

    use super::*;

    #[tokio::test]
    async fn test_channel_discover() {
        let (change_tx, change_rx) = mpsc::unbounded_channel();
        let (connection_keys_tx, connection_keys_rx) = watch::channel(HashSet::new());

        let mut channel_discover = ChangeStreamAdapter::<&str> {
            changes: Box::pin(UnboundedReceiverStream::new(change_rx)),
            connection_keys_tx,
            keys: HashSet::new(),
        };
        assert!(connection_keys_rx.borrow().is_empty());

        let channel = Endpoint::from_static("http://[::1]:1212").connect_lazy();
        change_tx.send(Change::Insert("foo", channel)).unwrap();

        let change = channel_discover.next().await.unwrap().unwrap();
        assert!(matches!(change, TowerChange::Insert("foo", _)));
        assert_eq!(*connection_keys_rx.borrow(), HashSet::from_iter(["foo"]));

        let channel = Endpoint::from_static("http://[::1]:1337").connect_lazy();
        change_tx.send(Change::Insert("foo", channel)).unwrap();

        let change = channel_discover.next().await.unwrap().unwrap();
        assert!(matches!(change, TowerChange::Insert("foo", _)));
        assert_eq!(*connection_keys_rx.borrow(), HashSet::from_iter(["foo"]));

        change_tx.send(Change::Remove("bar")).unwrap();
        let change = channel_discover.next().await.unwrap().unwrap();

        assert!(matches!(change, TowerChange::Remove("bar")));
        assert_eq!(*connection_keys_rx.borrow(), HashSet::from_iter(["foo"]));

        change_tx.send(Change::Remove("foo")).unwrap();
        let change = channel_discover.next().await.unwrap().unwrap();

        assert!(matches!(change, TowerChange::Remove("foo")));
        assert!(connection_keys_rx.borrow().is_empty());
    }

    #[tokio::test]
    async fn test_balance_channel() {
        let (mut balance_channel, change_tx) = BalanceChannel::<&str>::new();
        let mut num_connections_watcher = balance_channel.connection_keys_watcher();
        assert_eq!(balance_channel.num_connections(), 0);

        let channel = Endpoint::from_static("http://[::1]:1212").connect_lazy();
        change_tx.send(Change::Insert("foo", channel)).unwrap();
        num_connections_watcher.changed().await.unwrap();
        assert_eq!(balance_channel.num_connections(), 1);

        change_tx.send(Change::Remove("foo")).unwrap();
        num_connections_watcher.changed().await.unwrap();
        assert_eq!(balance_channel.num_connections(), 0);

        // `ready()` is lying... See `unlazy_stream()` comment.
        balance_channel.ready().await.unwrap();

        // The rest of the test lives in the `quickwit-codegen-example` crate.
        // TODO: Move the test here.
    }
}


================================================
FILE: quickwit/quickwit-common/src/type_map.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::any::{Any, TypeId};
use std::collections::HashMap;

#[derive(Debug, Default)]
pub struct TypeMap(HashMap<TypeId, Box<dyn Any + Send + Sync>>);

impl TypeMap {
    pub fn contains<T: Any + Send + Sync>(&self) -> bool {
        self.0.contains_key(&TypeId::of::<T>())
    }

    pub fn insert<T: Any + Send + Sync>(&mut self, instance: T) {
        self.0.insert(TypeId::of::<T>(), Box::new(instance));
    }

    pub fn get<T: Any + Send + Sync>(&self) -> Option<&T> {
        self.0.get(&TypeId::of::<T>()).map(|instance| {
            instance
                .downcast_ref::<T>()
                .expect("Instance should be of type T.")
        })
    }

    pub fn get_mut<T: Any + Send + Sync>(&mut self) -> Option<&mut T> {
        self.0.get_mut(&TypeId::of::<T>()).map(|instance| {
            instance
                .downcast_mut::<T>()
                .expect("Instance should be of type T.")
        })
    }
}


================================================
FILE: quickwit/quickwit-common/src/uri.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::borrow::Cow;
use std::env;
use std::fmt::{Debug, Display};
use std::hash::Hash;
use std::path::{Component, Path, PathBuf};
use std::str::FromStr;

use anyhow::{Context, bail};
use once_cell::sync::OnceCell;
use regex::Regex;
use serde::de::Error;
use serde::{Deserialize, Serialize, Serializer};

#[derive(Debug, Clone, Copy, Eq, PartialEq, Hash, Serialize, Deserialize)]
#[serde(rename_all = "snake_case")]
#[repr(u8)]
pub enum Protocol {
    Actor = 1,
    Azure = 2,
    File = 3,
    Grpc = 4,
    PostgreSQL = 5,
    Ram = 6,
    S3 = 7,
    Google = 8,
}

impl Protocol {
    pub fn as_str(&self) -> &str {
        match &self {
            Protocol::Actor => "actor",
            Protocol::Azure => "azure",
            Protocol::File => "file",
            Protocol::Grpc => "grpc",
            Protocol::PostgreSQL => "postgresql",
            Protocol::Ram => "ram",
            Protocol::S3 => "s3",
            Protocol::Google => "gs",
        }
    }

    pub fn is_file(&self) -> bool {
        matches!(&self, Protocol::File)
    }

    pub fn is_file_storage(&self) -> bool {
        matches!(&self, Protocol::File | Protocol::Ram)
    }

    pub fn is_object_storage(&self) -> bool {
        matches!(&self, Protocol::Azure | Protocol::S3 | Protocol::Google)
    }

    pub fn is_database(&self) -> bool {
        matches!(&self, Protocol::PostgreSQL)
    }
}

impl Display for Protocol {
    fn fmt(&self, formatter: &mut std::fmt::Formatter) -> std::fmt::Result {
        write!(formatter, "{}", self.as_str())
    }
}

impl FromStr for Protocol {
    type Err = anyhow::Error;

    fn from_str(protocol: &str) -> anyhow::Result<Self> {
        match protocol {
            "azure" => Ok(Protocol::Azure),
            "file" => Ok(Protocol::File),
            "grpc" => Ok(Protocol::Grpc),
            "actor" => Ok(Protocol::Actor),
            "pg" | "postgres" | "postgresql" => Ok(Protocol::PostgreSQL),
            "ram" => Ok(Protocol::Ram),
            "s3" => Ok(Protocol::S3),
            "gs" => Ok(Protocol::Google),
            _ => bail!("unknown URI protocol `{protocol}`"),
        }
    }
}

const PROTOCOL_SEPARATOR: &str = "://";

/// Encapsulates the URI type.
///
/// URI's string representation are guaranteed to start
/// by the protocol `str()` representation.
///
/// # Disclaimer
///
/// Uri has to be built using `Uri::from_str`.
/// This function has some normalization behavior.
/// Some protocol have several acceptable string representation (`pg`, `postgres`, `postgresql`).
///
/// If the representation in the input string is not canonical, it will get normalized.
/// In other words, a parsed URI may not have the exact string representation as the original
/// string.
#[derive(Clone, Eq, PartialEq, Hash)]
pub struct Uri {
    uri: String,
    protocol: Protocol,
}

impl Uri {
    /// This is only used for test. We artificially restrict the lifetime to 'static
    /// to avoid misuses.
    pub fn for_test(uri: &'static str) -> Self {
        Uri::from_str(uri).unwrap()
    }

    /// Returns the extension of the URI.
    pub fn extension(&self) -> Option<&str> {
        Path::new(&self.uri).extension()?.to_str()
    }

    /// Returns the URI as a string slice.
    pub fn as_str(&self) -> &str {
        &self.uri
    }

    /// Returns the protocol of the URI.
    pub fn protocol(&self) -> Protocol {
        self.protocol
    }

    /// Strips sensitive information such as credentials from URI.
    fn as_redacted_str(&self) -> Cow<'_, str> {
        if self.protocol().is_database() {
            static DATABASE_URI_PATTERN: OnceCell<Regex> = OnceCell::new();
            DATABASE_URI_PATTERN
                .get_or_init(|| {
                    Regex::new("(?P<before>^.*://.*)(?P<password>:.*@)(?P<after>.*)")
                        .expect("regular expression should compile")
                })
                .replace(&self.uri, "$before:***redacted***@$after")
        } else {
            Cow::Borrowed(&self.uri)
        }
    }

    pub fn redact(&mut self) {
        self.uri = self.as_redacted_str().into_owned();
    }

    /// Returns the file path of the URI.
    /// Applies only to `file://` and `ram://` URIs.
    pub fn filepath(&self) -> Option<&Path> {
        if self.protocol().is_file_storage() {
            Some(self.path())
        } else {
            None
        }
    }

    /// Returns the parent URI.
    /// Does not apply to PostgreSQL URIs.
    pub fn parent(&self) -> Option<Uri> {
        if self.protocol().is_database() {
            return None;
        }
        let path = self.path();
        let protocol = self.protocol();

        if protocol == Protocol::S3 && path.components().count() < 2 {
            return None;
        }
        if protocol == Protocol::Azure && path.components().count() < 3 {
            return None;
        }
        if protocol == Protocol::Google && path.components().count() < 2 {
            return None;
        }
        let parent_path = path.parent()?;

        Some(Self {
            uri: format!("{protocol}{PROTOCOL_SEPARATOR}{}", parent_path.display()),
            protocol,
        })
    }

    fn path(&self) -> &Path {
        Path::new(&self.uri[self.protocol.as_str().len() + PROTOCOL_SEPARATOR.len()..])
    }

    /// Returns the last component of the URI.
    pub fn file_name(&self) -> Option<&Path> {
        if self.protocol() == Protocol::PostgreSQL {
            return None;
        }
        let path = self.path();

        if self.protocol() == Protocol::S3 && path.components().count() < 2 {
            return None;
        }
        if self.protocol() == Protocol::Azure && path.components().count() < 3 {
            return None;
        }
        if self.protocol() == Protocol::Google && path.components().count() < 2 {
            return None;
        }
        path.file_name().map(Path::new)
    }

    /// Consumes the [`Uri`] struct and returns the normalized URI as a string.
    pub fn into_string(self) -> String {
        self.uri
    }

    /// Creates a new [`Uri`] with `path` adjoined to `self`.
    /// Fails if `path` is absolute.
    pub fn join<P: AsRef<Path> + std::fmt::Debug>(&self, path: P) -> anyhow::Result<Self> {
        if path.as_ref().is_absolute() {
            bail!(
                "cannot join URI `{}` with absolute path `{:?}`",
                self.uri,
                path
            );
        }
        let joined = match self.protocol() {
            Protocol::File => Path::new(&self.uri)
                .join(path)
                .to_string_lossy()
                .to_string(),
            Protocol::PostgreSQL => bail!(
                "cannot join PostgreSQL URI `{}` with path `{:?}`",
                self.uri,
                path
            ),
            _ => format!(
                "{}{}{}",
                self.uri,
                if self.uri.ends_with('/') { "" } else { "/" },
                path.as_ref().display(),
            ),
        };
        Ok(Self {
            uri: joined,
            protocol: self.protocol,
        })
    }

    /// Attempts to construct a [`Uri`] from a string.
    /// A `file://` protocol is assumed if not specified.
    /// File URIs are resolved (normalized) relative to the current working directory
    /// unless an absolute path is specified.
    /// Handles special characters such as `~`, `.`, `..`.
    fn parse_str(uri_str: &str) -> anyhow::Result<Self> {
        // CAUTION: Do not display the URI in error messages to avoid leaking credentials.
        if uri_str.is_empty() {
            bail!("failed to parse empty URI");
        }
        let (protocol, mut path) = match uri_str.split_once(PROTOCOL_SEPARATOR) {
            None => (Protocol::File, uri_str.to_string()),
            Some((protocol, path)) => (Protocol::from_str(protocol)?, path.to_string()),
        };
        if protocol == Protocol::File {
            if path.starts_with('~') {
                // We only accept `~` (alias to the home directory) and `~/path/to/something`.
                // If there is something following the `~` that is not `/`, we bail.
                if path.len() > 1 && !path.starts_with("~/") {
                    bail!("failed to normalize URI: tilde expansion is only partially supported");
                }

                let home_dir_path = home::home_dir()
                    .context("failed to normalize URI: could not resolve home directory")?
                    .to_string_lossy()
                    .to_string();

                path.replace_range(0..1, &home_dir_path);
            }
            if Path::new(&path).is_relative() {
                let current_dir = env::current_dir().context(
                    "failed to normalize URI: could not resolve current working directory. the \
                     directory does not exist or user has insufficient permissions",
                )?;
                path = current_dir.join(path).to_string_lossy().to_string();
            }
            path = normalize_path(Path::new(&path))
                .to_string_lossy()
                .to_string();
        }
        Ok(Self {
            uri: format!("{protocol}{PROTOCOL_SEPARATOR}{path}"),
            protocol,
        })
    }
}

impl AsRef<str> for Uri {
    fn as_ref(&self) -> &str {
        &self.uri
    }
}

impl Debug for Uri {
    fn fmt(&self, formatter: &mut std::fmt::Formatter) -> std::fmt::Result {
        formatter
            .debug_struct("Uri")
            .field("uri", &self.as_redacted_str())
            .finish()
    }
}

impl Display for Uri {
    fn fmt(&self, formatter: &mut std::fmt::Formatter) -> std::fmt::Result {
        write!(formatter, "{}", self.as_redacted_str())
    }
}

impl FromStr for Uri {
    type Err = anyhow::Error;

    fn from_str(uri_str: &str) -> anyhow::Result<Self> {
        Uri::parse_str(uri_str)
    }
}

impl PartialEq<&str> for Uri {
    fn eq(&self, other: &&str) -> bool {
        &self.uri == other
    }
}

impl PartialEq<String> for Uri {
    fn eq(&self, other: &String) -> bool {
        &self.uri == other
    }
}

impl<'de> Deserialize<'de> for Uri {
    fn deserialize<D>(deserializer: D) -> Result<Self, D::Error>
    where D: serde::Deserializer<'de> {
        let uri_str: Cow<'de, str> = Deserialize::deserialize(deserializer)?;
        let uri = Uri::from_str(&uri_str).map_err(D::Error::custom)?;
        Ok(uri)
    }
}

impl Serialize for Uri {
    fn serialize<S>(&self, serializer: S) -> Result<S::Ok, S::Error>
    where S: Serializer {
        serializer.serialize_str(&self.uri)
    }
}

/// Normalizes a path by resolving the components like (., ..).
/// This helper does the same thing as `Path::canonicalize`.
/// It only differs from `Path::canonicalize` by not checking file existence
/// during resolution.
/// <https://github.com/rust-lang/cargo/blob/fede83ccf973457de319ba6fa0e36ead454d2e20/src/cargo/util/paths.rs#L61>
fn normalize_path(path: &Path) -> PathBuf {
    let mut components = path.components().peekable();
    let mut resulting_path_buf =
        if let Some(component @ Component::Prefix(..)) = components.peek().cloned() {
            components.next();
            PathBuf::from(component.as_os_str())
        } else {
            PathBuf::new()
        };

    for component in components {
        match component {
            Component::Prefix(..) => unreachable!(),
            Component::RootDir => {
                resulting_path_buf.push(component.as_os_str());
            }
            Component::CurDir => {}
            Component::ParentDir => {
                resulting_path_buf.pop();
            }
            Component::Normal(inner_component) => {
                resulting_path_buf.push(inner_component);
            }
        }
    }
    resulting_path_buf
}

#[cfg(test)]
mod tests {
    use super::*;

    #[test]
    fn test_try_new_uri() {
        Uri::from_str("").unwrap_err();

        let home_dir = home::home_dir().unwrap();
        let current_dir = env::current_dir().unwrap();

        let uri = Uri::from_str("file:///home/foo/bar").unwrap();
        assert_eq!(uri.protocol(), Protocol::File);
        assert_eq!(uri.filepath(), Some(Path::new("/home/foo/bar")));
        assert_eq!(uri, "file:///home/foo/bar");
        assert_eq!(uri, "file:///home/foo/bar".to_string());
        assert_eq!(
            Uri::from_str("file:///foo./bar..").unwrap(),
            "file:///foo./bar.."
        );
        assert_eq!(
            Uri::from_str("home/homer/docs/dognuts").unwrap(),
            format!("file://{}/home/homer/docs/dognuts", current_dir.display())
        );
        assert_eq!(
            Uri::from_str("home/homer/docs/../dognuts").unwrap(),
            format!("file://{}/home/homer/dognuts", current_dir.display())
        );
        assert_eq!(
            Uri::from_str("home/homer/docs/../../dognuts").unwrap(),
            format!("file://{}/home/dognuts", current_dir.display())
        );
        assert_eq!(
            Uri::from_str("/home/homer/docs/dognuts").unwrap(),
            "file:///home/homer/docs/dognuts"
        );
        assert_eq!(
            Uri::from_str("~").unwrap(),
            format!("file://{}", home_dir.display())
        );
        assert_eq!(
            Uri::from_str("~/").unwrap(),
            format!("file://{}", home_dir.display())
        );
        assert_eq!(
            Uri::from_str("~anything/bar").unwrap_err().to_string(),
            "failed to normalize URI: tilde expansion is only partially supported"
        );
        assert_eq!(
            Uri::from_str("~/.").unwrap(),
            format!("file://{}", home_dir.display())
        );
        assert_eq!(
            Uri::from_str("~/..").unwrap(),
            format!("file://{}", home_dir.parent().unwrap().display())
        );
        assert_eq!(
            Uri::from_str("file://").unwrap(),
            format!("file://{}", current_dir.display())
        );
        assert_eq!(Uri::from_str("file:///").unwrap(), "file:///");
        assert_eq!(
            Uri::from_str("file://.").unwrap(),
            format!("file://{}", current_dir.display())
        );
        assert_eq!(
            Uri::from_str("file://..").unwrap(),
            format!("file://{}", current_dir.parent().unwrap().display())
        );
        assert_eq!(
            Uri::from_str("s3://home/homer/docs/dognuts").unwrap(),
            "s3://home/homer/docs/dognuts"
        );
        assert_eq!(
            Uri::from_str("s3://home/homer/docs/../dognuts").unwrap(),
            "s3://home/homer/docs/../dognuts"
        );
        assert_eq!(
            Uri::from_str("azure://account/container/docs/dognuts").unwrap(),
            "azure://account/container/docs/dognuts"
        );
        assert_eq!(
            Uri::from_str("azure://account/container/homer/docs/../dognuts").unwrap(),
            "azure://account/container/homer/docs/../dognuts"
        );
        assert_eq!(
            Uri::from_str("gs://bucket/docs/dognuts").unwrap(),
            "gs://bucket/docs/dognuts"
        );
        assert_eq!(
            Uri::from_str("gs://bucket/homer/docs/../dognuts").unwrap(),
            "gs://bucket/homer/docs/../dognuts"
        );
        assert_eq!(
            Uri::from_str("actor://localhost:7281/an-actor-id").unwrap(),
            "actor://localhost:7281/an-actor-id"
        );

        assert_eq!(
            Uri::from_str("http://localhost:9000/quickwit")
                .unwrap_err()
                .to_string(),
            "unknown URI protocol `http`"
        );
    }

    #[test]
    fn test_uri_protocol() {
        assert_eq!(Uri::for_test("file:///home").protocol(), Protocol::File);
        assert_eq!(Uri::for_test("ram:///in-memory").protocol(), Protocol::Ram);
        assert_eq!(Uri::for_test("s3://bucket/key").protocol(), Protocol::S3);
        assert_eq!(
            Uri::for_test("azure://account/bucket/key").protocol(),
            Protocol::Azure
        );
        assert_eq!(
            Uri::for_test("gs://bucket/key").protocol(),
            Protocol::Google
        );
        assert_eq!(
            Uri::for_test("postgres://localhost:5432/metastore").protocol(),
            Protocol::PostgreSQL
        );
        assert_eq!(
            Uri::for_test("postgresql://localhost:5432/metastore").protocol(),
            Protocol::PostgreSQL
        );
    }

    #[test]
    fn test_uri_extension() {
        assert!(Uri::for_test("s3://").extension().is_none());

        assert_eq!(
            Uri::for_test("s3://config.json").extension().unwrap(),
            "json"
        );
        assert_eq!(
            Uri::for_test("azure://config.foo").extension().unwrap(),
            "foo"
        );
    }

    #[test]
    fn test_uri_join() {
        assert_eq!(
            Uri::for_test("file:///").join("foo").unwrap(),
            "file:///foo"
        );
        assert_eq!(
            Uri::for_test("file:///foo").join("bar").unwrap(),
            "file:///foo/bar"
        );
        assert_eq!(
            Uri::for_test("file:///foo/").join("bar").unwrap(),
            "file:///foo/bar"
        );
        assert_eq!(
            Uri::for_test("ram://foo").join("bar").unwrap(),
            "ram://foo/bar"
        );
        assert_eq!(
            Uri::for_test("s3://bucket/").join("key").unwrap(),
            "s3://bucket/key"
        );
        assert_eq!(
            Uri::for_test("azure://account/container")
                .join("key")
                .unwrap(),
            "azure://account/container/key"
        );
        assert_eq!(
            Uri::for_test("gs://bucket").join("key").unwrap(),
            "gs://bucket/key"
        );
        Uri::for_test("s3://bucket/").join("/key").unwrap_err();
        Uri::for_test("azure://account/container/")
            .join("/key")
            .unwrap_err();
        Uri::for_test("postgres://username:password@localhost:5432/metastore")
            .join("table")
            .unwrap_err();
    }

    #[test]
    fn test_uri_parent() {
        assert!(Uri::for_test("file:///").parent().is_none());
        assert_eq!(Uri::for_test("file:///foo").parent().unwrap(), "file:///");
        assert_eq!(Uri::for_test("file:///foo/").parent().unwrap(), "file:///");
        assert_eq!(
            Uri::for_test("file:///foo/bar").parent().unwrap(),
            "file:///foo"
        );
        assert!(
            Uri::for_test("postgres://localhost:5432/db")
                .parent()
                .is_none()
        );

        assert!(Uri::for_test("ram:///").parent().is_none());
        assert_eq!(Uri::for_test("ram:///foo").parent().unwrap(), "ram:///");
        assert_eq!(Uri::for_test("ram:///foo/").parent().unwrap(), "ram:///");
        assert_eq!(
            Uri::for_test("ram:///foo/bar").parent().unwrap(),
            "ram:///foo"
        );
        assert!(Uri::for_test("s3://bucket").parent().is_none());
        assert!(Uri::for_test("s3://bucket/").parent().is_none());
        assert_eq!(
            Uri::for_test("s3://bucket/foo").parent().unwrap(),
            "s3://bucket"
        );
        assert_eq!(
            Uri::for_test("s3://bucket/foo/").parent().unwrap(),
            "s3://bucket"
        );
        assert_eq!(
            Uri::for_test("s3://bucket/foo/bar").parent().unwrap(),
            "s3://bucket/foo"
        );
        assert_eq!(
            Uri::for_test("s3://bucket/foo/bar/").parent().unwrap(),
            "s3://bucket/foo"
        );
        assert!(Uri::for_test("azure://account/").parent().is_none());
        assert!(Uri::for_test("azure://account").parent().is_none());
        assert!(
            Uri::for_test("azure://account/container/")
                .parent()
                .is_none()
        );
        assert!(
            Uri::for_test("azure://account/container")
                .parent()
                .is_none()
        );
        assert_eq!(
            Uri::for_test("azure://account/container/foo")
                .parent()
                .unwrap(),
            "azure://account/container"
        );
        assert_eq!(
            Uri::for_test("azure://account/container/foo/")
                .parent()
                .unwrap(),
            "azure://account/container"
        );
        assert_eq!(
            Uri::for_test("azure://account/container/foo/bar")
                .parent()
                .unwrap(),
            "azure://account/container/foo"
        );
        assert!(Uri::for_test("gs://bucket").parent().is_none());
        assert!(Uri::for_test("gs://bucket/").parent().is_none());
        assert_eq!(
            Uri::for_test("gs://bucket/foo").parent().unwrap(),
            "gs://bucket"
        );
        assert_eq!(
            Uri::for_test("gs://bucket/foo/").parent().unwrap(),
            "gs://bucket"
        );
        assert_eq!(
            Uri::for_test("gs://bucket/foo/bar").parent().unwrap(),
            "gs://bucket/foo"
        );
        assert_eq!(
            Uri::for_test("gs://bucket/foo/bar/").parent().unwrap(),
            "gs://bucket/foo"
        );
    }

    #[test]
    fn test_uri_file_name() {
        assert!(Uri::for_test("file:///").file_name().is_none());
        assert_eq!(
            Uri::for_test("file:///foo").file_name().unwrap(),
            Path::new("foo")
        );
        assert_eq!(
            Uri::for_test("file:///foo/").file_name().unwrap(),
            Path::new("foo")
        );
        assert!(
            Uri::for_test("postgres://localhost:5432/db")
                .file_name()
                .is_none()
        );

        assert!(Uri::for_test("ram:///").file_name().is_none());
        assert_eq!(
            Uri::for_test("ram:///foo").file_name().unwrap(),
            Path::new("foo")
        );
        assert_eq!(
            Uri::for_test("ram:///foo/").file_name().unwrap(),
            Path::new("foo")
        );
        assert!(Uri::for_test("s3://bucket").file_name().is_none());
        assert!(Uri::for_test("s3://bucket/").file_name().is_none());
        assert_eq!(
            Uri::for_test("s3://bucket/foo").file_name().unwrap(),
            Path::new("foo"),
        );
        assert_eq!(
            Uri::for_test("s3://bucket/foo/").file_name().unwrap(),
            Path::new("foo"),
        );
        assert!(Uri::for_test("azure://account").file_name().is_none());
        assert!(Uri::for_test("azure://account/").file_name().is_none());
        assert!(
            Uri::for_test("azure://account/container")
                .file_name()
                .is_none()
        );
        assert!(
            Uri::for_test("azure://account/container/")
                .file_name()
                .is_none()
        );
        assert_eq!(
            Uri::for_test("azure://account/container/foo")
                .file_name()
                .unwrap(),
            Path::new("foo"),
        );
        assert_eq!(
            Uri::for_test("azure://account/container/foo/")
                .file_name()
                .unwrap(),
            Path::new("foo"),
        );
        assert!(Uri::for_test("gs://bucket").file_name().is_none());
        assert!(Uri::for_test("gs://bucket/").file_name().is_none());
        assert_eq!(
            Uri::for_test("gs://bucket/foo").file_name().unwrap(),
            Path::new("foo"),
        );
        assert_eq!(
            Uri::for_test("gs://bucket/foo/").file_name().unwrap(),
            Path::new("foo"),
        );
    }

    #[test]
    fn test_uri_filepath() {
        assert_eq!(
            Uri::for_test("file:///").filepath().unwrap(),
            Path::new("/")
        );
        assert_eq!(
            Uri::for_test("file:///foo").filepath().unwrap(),
            Path::new("/foo")
        );
        assert_eq!(Uri::for_test("ram:///").filepath().unwrap(), Path::new("/"));
        assert_eq!(
            Uri::for_test("ram:///foo").filepath().unwrap(),
            Path::new("/foo")
        );
        assert!(Uri::for_test("s3://bucket/").filepath().is_none());
        assert!(
            Uri::for_test("azure://account/container/")
                .filepath()
                .is_none()
        );
        assert!(
            Uri::for_test("azure://account/container/foo.json")
                .filepath()
                .is_none()
        );
        assert!(Uri::for_test("gs://bucket/").filepath().is_none());
    }

    #[test]
    fn test_uri_as_redacted_str() {
        assert_eq!(
            Uri::for_test("s3://bucket/key").as_redacted_str(),
            "s3://bucket/key"
        );
        assert_eq!(
            Uri::for_test("azure://account/container/key").as_redacted_str(),
            "azure://account/container/key"
        );
        assert_eq!(
            Uri::for_test("gs://bucket/key").as_redacted_str(),
            "gs://bucket/key"
        );
        assert_eq!(
            Uri::for_test("postgres://localhost:5432/metastore").as_redacted_str(),
            "postgresql://localhost:5432/metastore"
        );
        assert_eq!(
            Uri::for_test("pg://username@localhost:5432/metastore").as_redacted_str(),
            "postgresql://username@localhost:5432/metastore"
        );
        {
            for protocol in ["postgres", "postgresql"] {
                let uri = Uri::from_str(&format!(
                    "{protocol}://username:password@localhost:5432/metastore"
                ))
                .unwrap();
                let expected_uri =
                    "postgresql://username:***redacted***@localhost:5432/metastore".to_string();
                assert_eq!(uri.as_redacted_str(), expected_uri);
                assert_eq!(format!("{uri}"), expected_uri);
                assert_eq!(
                    format!("{uri:?}"),
                    format!("Uri {{ uri: \"{expected_uri}\" }}")
                );
            }
        }
    }

    #[test]
    fn test_uri_serialize() {
        let uri = Uri::for_test("s3://bucket/key");
        assert_eq!(
            serde_json::to_value(uri).unwrap(),
            serde_json::Value::String("s3://bucket/key".to_string())
        );
    }
}


================================================
FILE: quickwit/quickwit-config/Cargo.toml
================================================
[package]
name = "quickwit-config"
description = "Define and manage Quickwit configuration objects"

version.workspace = true
edition.workspace = true
homepage.workspace = true
documentation.workspace = true
repository.workspace = true
authors.workspace = true
license.workspace = true

[dependencies]
anyhow = { workspace = true }
bytes = { workspace = true }
bytesize = { workspace = true }
chrono = { workspace = true }
cron = { workspace = true }
enum-iterator = { workspace = true }
http = { workspace = true }
http-serde = { workspace = true }
humantime = { workspace = true }
itertools = { workspace = true }
json_comments = { workspace = true }
new_string_template = { workspace = true }
once_cell = { workspace = true }
regex = { workspace = true }
serde = { workspace = true }
serde_json = { workspace = true }
serde_with = { workspace = true }
serde_yaml = { workspace = true }
siphasher = { workspace = true }
toml = { workspace = true }
tracing = { workspace = true }
utoipa = { workspace = true }
vrl = { workspace = true, optional = true }

quickwit-common = { workspace = true }
quickwit-doc-mapper = { workspace = true }
quickwit-proto = { workspace = true }

[dev-dependencies]
tokio = { workspace = true }

quickwit-proto = { workspace = true, features = ["testsuite"] }
quickwit-common = { workspace = true, features = ["testsuite"] }

[features]
testsuite = []
vrl = ["dep:vrl"]


================================================
FILE: quickwit/quickwit-config/resources/tests/index_config/hdfs-logs-create-config.yaml
================================================
version: 0.8

doc_mapping:
  field_mappings:
    - name: body
      type: text
      tokenizer: default
      record: position
    - name: timestamp
      type: i64
      fast: true


================================================
FILE: quickwit/quickwit-config/resources/tests/index_config/hdfs-logs.json
================================================
# Comments are supported.
{
    "version": "0.7",
    "index_id": "hdfs-logs",
    "index_uri": "s3://quickwit-indexes/hdfs-logs",
    "doc_mapping": {
        "tokenizers": [
            {
                "name": "service_regex",
                "type": "regex",
                "pattern": "\\w*"
            }
        ],
        "field_mappings": [
            {
                "name": "tenant_id",
                "type": "u64",
                "fast": true
            },
            {
                "name": "timestamp",
                "type": "datetime",
                "fast": true
            },
            {
                "name": "severity_text",
                "type": "text",
                "tokenizer": "raw"
            },
            {
                "name": "body",
                "type": "text",
                "tokenizer": "default",
                "record": "position"
            },
            {
                "name": "resource",
                "type": "object",
                "field_mappings": [
                    {
                        "name": "service",
                        "type": "text",
                        "tokenizer": "service_regex"
                    }
                ]
            }
        ],
        "tag_fields": ["tenant_id"],
        "timestamp_field": "timestamp",
        "store_source": true
    },
    "retention": {
        "period": "90 days",
        "schedule": "daily"
    },
    "indexing_settings": {
        "commit_timeout_secs": 61,
        "split_num_docs_target": 10000001,
        "merge_policy": {
            "type": "stable_log",
            "merge_factor": 9,
            "max_merge_factor": 11,
            "maturation_period": "48 hours"
        },
        "resources": {
            "heap_size": "3G"
        }
    },
    "ingest_settings": {
        "min_shards": 12
    },
    "search_settings": {
        "default_search_fields": ["severity_text", "body"]
    }
}


================================================
FILE: quickwit/quickwit-config/resources/tests/index_config/hdfs-logs.toml
================================================
version = "0.7"
index_id = "hdfs-logs"
index_uri = "s3://quickwit-indexes/hdfs-logs"

[doc_mapping]
tokenizers = [
  { name = "service_regex", type = "regex", pattern = "\\w*" },
]
field_mappings = [
  { name = "tenant_id", type = "u64", fast = true },
  { name = "timestamp", type = "datetime", fast = true },
  { name = "severity_text", type = "text", tokenizer = "raw" },
  { name = "body", type = "text", tokenizer = "default", record = "position" },
  { name = "resource", type = "object", field_mappings = [ { name = "service", type = "text", tokenizer = "service_regex" } ] },
]
tag_fields = [ "tenant_id" ]
store_source = true
timestamp_field = "timestamp"

[retention]
period = "90 days"
schedule = "daily"

[indexing_settings]
commit_timeout_secs = 61
split_num_docs_target = 10_000_001

[indexing_settings.merge_policy]
type = "stable_log"
merge_factor = 9
max_merge_factor = 11
maturation_period = "48 hours"

[indexing_settings.resources]
heap_size = "3G"

[ingest_settings]
min_shards = 12

[search_settings]
default_search_fields = [ "severity_text", "body" ]


================================================
FILE: quickwit/quickwit-config/resources/tests/index_config/hdfs-logs.yaml
================================================
version: 0.8
index_id: hdfs-logs
index_uri: s3://quickwit-indexes/hdfs-logs

doc_mapping:
  tokenizers:
    - name: service_regex
      type: regex
      pattern: "\\w*"
  field_mappings:
    - name: tenant_id
      type: u64
      fast: true
    - name: timestamp
      type: datetime
      fast: true
    - name: severity_text
      type: text
      tokenizer: raw
    - name: body
      type: text
      tokenizer: default
      record: position
    - name: resource
      type: object
      field_mappings:
        - name: service
          type: text
          tokenizer: service_regex
  tag_fields: [tenant_id]
  timestamp_field: timestamp
  store_source: true

retention:
  period: 90 days
  schedule: daily

indexing_settings:
  commit_timeout_secs: 61
  split_num_docs_target: 10000001
  merge_policy:
    type: "stable_log"
    merge_factor: 9
    max_merge_factor: 11
    maturation_period: 48 hours
  resources:
    heap_size: 3G

ingest_settings:
  min_shards: 12

search_settings:
  default_search_fields: [severity_text, body]


================================================
FILE: quickwit/quickwit-config/resources/tests/index_config/minimal-hdfs-logs.yaml
================================================
version: 0.8

index_id: hdfs-logs
index_uri: s3://quickwit-indexes/hdfs-logs

doc_mapping:
  field_mappings:
    - name: body
      type: text
      tokenizer: default
      record: position

search_settings:
  default_search_fields: [body]


================================================
FILE: quickwit/quickwit-config/resources/tests/index_config/partial-hdfs-logs.yaml
================================================
version: 0.8

index_id: hdfs-logs
index_uri: s3://quickwit-indexes/hdfs-logs

doc_mapping:
  field_mappings:
    - name: body
      type: text
      tokenizer: default
      record: position
    - name: timestamp
      type: i64
      fast: true

indexing_settings:
  commit_timeout_secs: 42
  merge_policy:
    type: "stable_log"

search_settings:
  default_search_fields: [body]


================================================
FILE: quickwit/quickwit-config/resources/tests/node_config/quickwit.json
================================================
# Comments are supported.
{
    "version": "0.7",
    "cluster_id": "quickwit-cluster",
    "node_id": "my-unique-node-id",
    "availability_zone": "az-1",
    "enabled_services": [
        "janitor",
        "metastore"
    ],
    "listen_address": "0.0.0.0",
    "advertise_address": "172.0.0.12",
    "gossip_listen_port": 2222,
    "grpc_listen_port": 3333,
    "peer_seeds": [
        "quickwit-searcher-0.local",
        "quickwit-searcher-1.local"
    ],
    "data_dir": "/opt/quickwit/data",
    "metastore_uri": "postgres://username:password@host:port/db",
    "default_index_root_uri": "s3://quickwit-indexes",
    "rest": {
        "listen_port": 1111,
        "extra_headers": {
            "x-header-1": "header-value-1",
            "x-header-2": "header-value-2"
        }
    },
    "grpc": {
        "max_message_size": "10 MB"
    },
    "storage": {
        "azure": {
            "account": "quickwit-dev"
        },
        "s3": {
            "flavor": "gcs",
            "endpoint": "http://localhost:4566",
            "force_path_style_access": true
        }
    },
    "metastore": {
        "postgres": {
            "min_connections": 1,
            "max_num_connections": 12,
            "acquire_connection_timeout": "30s",
            "idle_connection_timeout": "30min",
            "max_connection_lifetime": "1h"
        }
    },
    "indexer": {
        "enable_otlp_endpoint": true,
        "split_store_max_num_bytes": "1T",
        "split_store_max_num_splits": 10000,
        "max_concurrent_split_uploads": 8,
        "max_merge_write_throughput": "100mb",
        "merge_concurrency": 2
    },
    "ingest_api": {
        "replication_factor": 2
    },
    "searcher": {
        "aggregation_memory_limit": "1G",
        "aggregation_bucket_limit": 500000,
        "fast_field_cache_capacity": "10G",
        "split_footer_cache_capacity": "1G",
        "max_num_concurrent_split_streams": 120,
        "max_num_concurrent_split_searches": 150,
        "storage_timeout_policy": {
            "min_throughtput_bytes_per_secs": 100000,
            "timeout_millis": 2000,
            "max_num_retries": 2
        },
        "lambda": {
            "function_name": "quickwit-lambda-leaf-search",
            "max_splits_per_invocation": 10,
            "offload_threshold": 30,
            "auto_deploy": {
                "execution_role_arn": "arn:aws:iam::123456789012:role/quickwit-lambda-role",
                "memory_size": "5 GiB",
                "invocation_timeout_secs": 15
            }
        }
    },
    "jaeger": {
        "enable_endpoint": true,
        "lookback_period_hours": 24,
        "max_trace_duration_secs": 600,
        "max_fetch_spans": 1000
    }
}


================================================
FILE: quickwit/quickwit-config/resources/tests/node_config/quickwit.toml
================================================
version = "0.7"

cluster_id = "quickwit-cluster"
node_id = "my-unique-node-id"
availability_zone = "az-1"
enabled_services = [ "janitor", "metastore" ]
listen_address = "0.0.0.0"
advertise_address = "172.0.0.12"
gossip_listen_port = 2222
grpc_listen_port = 3333
peer_seeds = [ "quickwit-searcher-0.local", "quickwit-searcher-1.local" ]
data_dir = "/opt/quickwit/data"
metastore_uri = "postgres://username:password@host:port/db"
default_index_root_uri = "s3://quickwit-indexes"

[rest]
listen_port = 1111

[rest.extra_headers]
x-header-1 = "header-value-1"
x-header-2 = "header-value-2"

[grpc]
max_message_size = "10 MB"

[storage.azure]
account = "quickwit-dev"

[storage.s3]
flavor = "gcs"
endpoint = "http://localhost:4566"
force_path_style_access = true

[metastore.postgres]
min_connections = 1
max_num_connections = 12
acquire_connection_timeout = "30s"
idle_connection_timeout = "30min"
max_connection_lifetime = "1h"

[indexer]
enable_otlp_endpoint = true
split_store_max_num_bytes = "1T"
split_store_max_num_splits = 10_000
max_concurrent_split_uploads = 8
max_merge_write_throughput = "100mb"
merge_concurrency = 2

[ingest_api]
replication_factor = 2

[searcher]
aggregation_memory_limit = "1G"
aggregation_bucket_limit = 500_000
fast_field_cache_capacity = "10G"
split_footer_cache_capacity = "1G"
max_num_concurrent_split_streams = 120
max_num_concurrent_split_searches = 150

[searcher.storage_timeout_policy]
min_throughtput_bytes_per_secs = 100000
timeout_millis = 2000
max_num_retries = 2

[searcher.lambda]
function_name = "quickwit-lambda-leaf-search"
max_splits_per_invocation = 10
offload_threshold = 30

[searcher.lambda.auto_deploy]
execution_role_arn = "arn:aws:iam::123456789012:role/quickwit-lambda-role"
memory_size = "5 GiB"
invocation_timeout_secs = 15

[jaeger]
enable_endpoint = true
lookback_period_hours = 24
max_trace_duration_secs = 600
max_fetch_spans = 1_000


================================================
FILE: quickwit/quickwit-config/resources/tests/node_config/quickwit.wrongkey.yaml
================================================
version: 0.8
searcher:
  fast_field_cache_capacity: 10G
  # Typo here. It is supposed to be searches.
  max_num_concurrent_split_searches_with_typo: 150


================================================
FILE: quickwit/quickwit-config/resources/tests/node_config/quickwit.yaml
================================================
version: 0.8

cluster_id: quickwit-cluster
node_id: my-unique-node-id
availability_zone: az-1
enabled_services:
  - janitor
  - metastore
listen_address: 0.0.0.0
advertise_address: 172.0.0.12
gossip_listen_port: 2222
grpc_listen_port: 3333
peer_seeds:
  - quickwit-searcher-0.local
  - quickwit-searcher-1.local
data_dir: /opt/quickwit/data
metastore_uri: postgres://username:password@host:port/db
default_index_root_uri: s3://quickwit-indexes

rest:
  listen_port: 1111
  extra_headers:
    x-header-1: header-value-1
    x-header-2: header-value-2

grpc:
  max_message_size: 10 MB

storage:
  azure:
    account: quickwit-dev
  s3:
    flavor: gcs
    endpoint: http://localhost:4566
    force_path_style_access: true

metastore:
  postgres:
    min_connections: 1
    max_num_connections: 12
    acquire_connection_timeout: 30s
    idle_connection_timeout: 30min
    max_connection_lifetime: 1h

indexer:
  enable_otlp_endpoint: true
  split_store_max_num_bytes: 1T
  split_store_max_num_splits: 10000
  max_concurrent_split_uploads: 8
  max_merge_write_throughput: 100mb
  merge_concurrency: 2

ingest_api:
  replication_factor: 2

searcher:
  aggregation_memory_limit: 1G
  aggregation_bucket_limit: 500000
  fast_field_cache_capacity: 10G
  split_footer_cache_capacity: 1G
  max_num_concurrent_split_streams: 120
  max_num_concurrent_split_searches: 150
  storage_timeout_policy:
    min_throughtput_bytes_per_secs: 100000
    timeout_millis: 2000
    max_num_retries: 2
  lambda:
    function_name: quickwit-lambda-leaf-search
    max_splits_per_invocation: 10
    offload_threshold: 30
    auto_deploy:
      execution_role_arn: arn:aws:iam::123456789012:role/quickwit-lambda-role
      memory_size: 5 GiB
      invocation_timeout_secs: 15

jaeger:
  enable_endpoint: true
  lookback_period_hours: 24
  max_trace_duration_secs: 600
  max_fetch_spans: 1000


================================================
FILE: quickwit/quickwit-config/resources/tests/source_config/ingest-api-source.json
================================================
{
  "version": "0.7",
  "source_id": "_ingest-api-source",
  "enabled": true,
  "source_type": "ingest-api",
  "transform": {
    "script": ".message = downcase(string!(.message))"
  }
}


================================================
FILE: quickwit/quickwit-config/resources/tests/source_config/kafka-source.json
================================================
{
    "version": "0.7",
    "source_id": "hdfs-logs-kafka-source",
    "desired_num_pipelines": 2,
    "source_type": "kafka",
    "params": {
        "topic": "cloudera-cluster-logs",
        "client_params": {
            "bootstrap.servers": "localhost:9092"
        }
    },
    "transform": {
        "script": ".message = downcase(string!(.message))",
        "timezone": "local"
    }
}


================================================
FILE: quickwit/quickwit-config/resources/tests/source_config/kinesis-source.yaml
================================================
version: 0.8
source_id: hdfs-logs-kinesis-source
source_type: kinesis
params:
  stream_name: emr-cluster-logs
transform:
  script: .message = downcase(string!(.message))
  timezone: local


================================================
FILE: quickwit/quickwit-config/src/cluster_config/mod.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use bytesize::ByteSize;
use quickwit_common::uri::Uri;

/// An embryo of a cluster config.
// TODO: Move to `quickwit-config` and version object.
#[derive(Debug, Clone)]
pub struct ClusterConfig {
    pub cluster_id: String,
    pub auto_create_indexes: bool,
    pub default_index_root_uri: Uri,
    pub replication_factor: usize,
    pub shard_throughput_limit: ByteSize,
    pub shard_scale_up_factor: f32,
}

impl ClusterConfig {
    #[cfg(any(test, feature = "testsuite"))]
    pub fn for_test() -> Self {
        ClusterConfig {
            cluster_id: "test-cluster".to_string(),
            auto_create_indexes: false,
            default_index_root_uri: Uri::for_test("ram:///indexes"),
            replication_factor: 1,
            shard_throughput_limit: quickwit_common::shared_consts::DEFAULT_SHARD_THROUGHPUT_LIMIT,
            shard_scale_up_factor: 1.01,
        }
    }
}


================================================
FILE: quickwit/quickwit-config/src/config_value.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::HashMap;
use std::str::FromStr;
use std::{any, fmt};

use anyhow::{self, Context};
use serde::{Deserialize, Deserializer};
use tracing::warn;

use crate::qw_env_vars::{QW_ENV_VARS, QW_NONE};

#[derive(Debug, Clone, Eq, PartialEq)]
pub(crate) struct ConfigValue<T, const E: usize> {
    /// Value provided by the user in a config file.
    provided: Option<T>,
    /// Value provided by Quickwit as default.
    default: Option<T>,
}

impl<T, const E: usize> ConfigValue<T, E>
where
    T: FromStr,
    <T as FromStr>::Err: fmt::Debug,
{
    pub(crate) fn with_default(value: T) -> Self {
        Self {
            provided: None,
            default: Some(value),
        }
    }

    pub(crate) fn none() -> Self {
        Self {
            provided: None,
            default: None,
        }
    }

    #[cfg(test)]
    pub(crate) fn for_test(value: T) -> Self {
        Self {
            provided: Some(value),
            default: None,
        }
    }

    #[cfg(any(test, feature = "testsuite"))]
    pub(crate) fn unwrap(self) -> T {
        self.provided.or(self.default).unwrap()
    }

    pub(crate) fn resolve_optional(
        self,
        env_vars: &HashMap<String, String>,
    ) -> anyhow::Result<Option<T>> {
        // QW env vars take precedence over the config file values.
        if E > QW_NONE
            && let Some(env_var_key) = QW_ENV_VARS.get(&E)
            && let Some(env_var_value) = env_vars.get(*env_var_key).filter(|val| {
                if val.is_empty() {
                    warn!(
                        "environment variable `{}` is set but value is empty",
                        *env_var_key
                    );
                    false
                } else {
                    true
                }
            })
        {
            let value = env_var_value.parse::<T>().map_err(|error| {
                anyhow::anyhow!(
                    "failed to convert value `{env_var_value}` read from environment variable \
                     `{env_var_key}` to type `{}`: {error:?}",
                    any::type_name::<T>(),
                )
            })?;
            return Ok(Some(value));
        }
        Ok(self.provided.or(self.default))
    }

    pub(crate) fn resolve(self, env_vars: &HashMap<String, String>) -> anyhow::Result<T> {
        self.resolve_optional(env_vars)?.context(
            "failed to resolve field value: no value was provided via environment variable or \
             config file, and the field has no default",
        )
    }
}

impl<T, const E: usize> Default for ConfigValue<T, E>
where T: Default
{
    fn default() -> Self {
        Self {
            provided: None,
            default: Some(T::default()),
        }
    }
}

impl<'de, T, const E: usize> Deserialize<'de> for ConfigValue<T, E>
where T: Deserialize<'de>
{
    fn deserialize<D>(deserializer: D) -> Result<ConfigValue<T, E>, D::Error>
    where D: Deserializer<'de> {
        let value: Option<T> = Deserialize::deserialize(deserializer)?;
        Ok(ConfigValue {
            provided: value,
            default: None,
        })
    }
}

#[cfg(test)]
mod tests {
    use super::*;
    use crate::qw_env_vars::{
        QW_AVAILABILITY_ZONE, QW_CLUSTER_ID, QW_GOSSIP_LISTEN_PORT, QW_NODE_ID, QW_REST_LISTEN_PORT,
    };

    #[test]
    fn test_config_value_resolve_optional() {
        {
            let env_vars = HashMap::new();
            let rest_listen_port = ConfigValue::<usize, QW_REST_LISTEN_PORT>::none();
            assert!(
                rest_listen_port
                    .resolve_optional(&env_vars)
                    .unwrap()
                    .is_none()
            );
        }
        {
            let env_vars = HashMap::new();
            let rest_listen_port = ConfigValue::<usize, QW_REST_LISTEN_PORT>::with_default(7280);
            assert_eq!(
                rest_listen_port
                    .resolve_optional(&env_vars)
                    .unwrap()
                    .unwrap(),
                7280
            );
        }
        {
            let env_vars = HashMap::new();
            let rest_listen_port = ConfigValue::<usize, QW_REST_LISTEN_PORT> {
                provided: Some(5678),
                default: Some(7820),
            };
            assert_eq!(
                rest_listen_port
                    .resolve_optional(&env_vars)
                    .unwrap()
                    .unwrap(),
                5678
            );
        }
        {
            let mut env_vars = HashMap::new();
            env_vars.insert("QW_REST_LISTEN_PORT".to_string(), "foobar".to_string());
            let rest_listen_port = ConfigValue::<usize, QW_REST_LISTEN_PORT> {
                provided: Some(5678),
                default: Some(7820),
            };
            rest_listen_port.resolve_optional(&env_vars).unwrap_err();
        }
        {
            let mut env_vars = HashMap::new();
            env_vars.insert("QW_REST_LISTEN_PORT".to_string(), "1234".to_string());
            let rest_listen_port = ConfigValue::<usize, QW_REST_LISTEN_PORT> {
                provided: Some(5678),
                default: Some(7820),
            };
            assert_eq!(
                rest_listen_port
                    .resolve_optional(&env_vars)
                    .unwrap()
                    .unwrap(),
                1234
            );
        }
    }

    #[test]
    fn test_config_value_resolve() {
        let env_vars = HashMap::new();
        let rest_listen_port = ConfigValue::<usize, QW_REST_LISTEN_PORT>::none();
        rest_listen_port.resolve(&env_vars).unwrap_err();
    }

    #[test]
    fn test_config_value_resolve_optional_empty_string() {
        let mut env_vars = HashMap::new();
        env_vars.insert("QW_AVAILABILITY_ZONE".to_string(), "".to_string());
        let az = ConfigValue::<usize, QW_AVAILABILITY_ZONE>::none();
        assert!(az.resolve_optional(&env_vars).unwrap().is_none());
    }

    #[test]
    fn test_config_value_deserialize() {
        fn default_cluster_id() -> ConfigValue<String, QW_CLUSTER_ID> {
            ConfigValue::with_default("default-cluster".to_string())
        }

        fn default_node_id() -> ConfigValue<String, QW_NODE_ID> {
            ConfigValue::with_default("default-node".to_string())
        }

        fn default_rest_listen_port() -> ConfigValue<usize, QW_REST_LISTEN_PORT> {
            ConfigValue::with_default(7280)
        }

        #[derive(Deserialize)]
        struct Config {
            #[serde(default)]
            version: ConfigValue<usize, QW_NONE>,
            #[serde(default = "default_cluster_id")]
            cluster_id: ConfigValue<String, QW_CLUSTER_ID>,
            #[serde(default = "default_node_id")]
            node_id: ConfigValue<String, QW_NODE_ID>,
            #[serde(default = "default_rest_listen_port")]
            rest_listen_port: ConfigValue<usize, QW_REST_LISTEN_PORT>,
            gossip_listen_port: ConfigValue<String, QW_GOSSIP_LISTEN_PORT>,
        }
        let config = serde_yaml::from_str::<Config>(
            r#"
            cluster_id: qw-cluster
            "#,
        )
        .unwrap();

        let mut env_vars = HashMap::new();
        env_vars.insert("QW_REST_LISTEN_PORT".to_string(), "1234".to_string());

        assert_eq!(config.version.resolve(&env_vars).unwrap(), 0);
        assert_eq!(config.cluster_id.resolve(&env_vars).unwrap(), "qw-cluster");
        assert_eq!(config.node_id.resolve(&env_vars).unwrap(), "default-node");
        assert_eq!(config.rest_listen_port.resolve(&env_vars).unwrap(), 1234);
        assert!(
            config
                .gossip_listen_port
                .resolve_optional(&env_vars)
                .unwrap()
                .is_none()
        );
    }
}


================================================
FILE: quickwit/quickwit-config/src/index_config/mod.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

pub(crate) mod serialize;

use std::collections::HashSet;
use std::hash::{Hash, Hasher};
use std::num::NonZeroUsize;
use std::str::FromStr;
use std::sync::Arc;
use std::time::Duration;

use anyhow::{Context, ensure};
use bytesize::ByteSize;
use chrono::Utc;
use cron::Schedule;
use humantime::parse_duration;
use quickwit_common::uri::Uri;
use quickwit_common::{is_true, true_fn};
use quickwit_doc_mapper::{DocMapper, DocMapperBuilder, DocMapping};
use quickwit_proto::types::IndexId;
use serde::{Deserialize, Serialize};
pub use serialize::{load_index_config_from_user_config, load_index_config_update};
use siphasher::sip::SipHasher;
use tracing::warn;

use crate::index_config::serialize::VersionedIndexConfig;
use crate::merge_policy_config::MergePolicyConfig;

#[derive(Clone, Debug, Serialize, Deserialize, utoipa::ToSchema)]
#[serde(deny_unknown_fields)]
pub struct IndexingResources {
    #[schema(value_type = String, default = "2 GB")]
    #[serde(default = "IndexingResources::default_heap_size")]
    #[serde(with = "crate::serde_utils::bytesize_serde")]
    pub heap_size: ByteSize,
    // DEPRECATED: See #4439
    #[schema(value_type = String)]
    #[serde(default)]
    #[serde(skip_serializing)]
    max_merge_write_throughput: Option<ByteSize>,
}

impl PartialEq for IndexingResources {
    fn eq(&self, other: &Self) -> bool {
        self.heap_size == other.heap_size
    }
}

impl Hash for IndexingResources {
    fn hash<H: Hasher>(&self, state: &mut H) {
        self.heap_size.hash(state);
    }
}

impl IndexingResources {
    fn default_heap_size() -> ByteSize {
        ByteSize::gb(2)
    }

    #[cfg(any(test, feature = "testsuite"))]
    pub fn for_test() -> Self {
        Self {
            heap_size: ByteSize::mb(20),
            ..Default::default()
        }
    }

    pub fn validate(&self) -> anyhow::Result<()> {
        if self.max_merge_write_throughput.is_some() {
            warn!(
                "`max_merge_write_throughput` is deprecated and will be removed in a future \
                 version. See #4439. A global limit now exists in indexer configuration."
            );
        }
        Ok(())
    }
}

impl Default for IndexingResources {
    fn default() -> Self {
        Self {
            heap_size: Self::default_heap_size(),
            max_merge_write_throughput: None,
        }
    }
}

#[derive(Clone, Debug, Serialize, Deserialize, PartialEq, Hash, utoipa::ToSchema)]
#[serde(deny_unknown_fields)]
pub struct IndexingSettings {
    #[schema(default = 60)]
    #[serde(default = "IndexingSettings::default_commit_timeout_secs")]
    pub commit_timeout_secs: usize,
    #[schema(default = 8)]
    #[serde(default = "IndexingSettings::default_docstore_compression_level")]
    pub docstore_compression_level: i32,
    #[schema(default = 1_000_000)]
    #[serde(default = "IndexingSettings::default_docstore_blocksize")]
    pub docstore_blocksize: usize,
    /// The merge policy aims to eventually produce mature splits that have a larger size but
    /// are within close range of `split_num_docs_target`.
    ///
    /// In other words, splits that contain a number of documents greater than or equal to
    /// `split_num_docs_target` are considered mature and never merged.
    #[serde(default = "IndexingSettings::default_split_num_docs_target")]
    pub split_num_docs_target: usize,
    #[serde(default)]
    pub merge_policy: MergePolicyConfig,
    #[serde(default)]
    pub resources: IndexingResources,
}

impl IndexingSettings {
    pub fn commit_timeout(&self) -> Duration {
        Duration::from_secs(self.commit_timeout_secs as u64)
    }

    fn default_commit_timeout_secs() -> usize {
        60
    }

    pub fn default_docstore_blocksize() -> usize {
        1_000_000
    }

    pub fn default_docstore_compression_level() -> i32 {
        8
    }

    pub fn default_split_num_docs_target() -> usize {
        10_000_000
    }

    #[cfg(any(test, feature = "testsuite"))]
    pub fn for_test() -> Self {
        Self {
            resources: IndexingResources::for_test(),
            ..Default::default()
        }
    }
}

impl Default for IndexingSettings {
    fn default() -> Self {
        Self {
            commit_timeout_secs: Self::default_commit_timeout_secs(),
            docstore_blocksize: Self::default_docstore_blocksize(),
            docstore_compression_level: Self::default_docstore_compression_level(),
            split_num_docs_target: Self::default_split_num_docs_target(),
            merge_policy: MergePolicyConfig::default(),
            resources: IndexingResources::default(),
        }
    }
}

/// Settings for ingestion.
#[derive(Clone, Debug, PartialEq, Serialize, Deserialize, utoipa::ToSchema)]
#[serde(deny_unknown_fields)]
pub struct IngestSettings {
    /// Configures the minimum number of shards to use for ingestion.
    #[schema(default = 1, value_type = usize)]
    #[serde(default = "IngestSettings::default_min_shards")]
    pub min_shards: NonZeroUsize,
    /// Whether to validate documents against the current doc mapping during ingestion.
    /// Defaults to true. When false, documents will be written directly to the WAL without
    /// validation, but might still be rejected during indexing when applying the doc mapping
    /// in the doc processor, in that case the documents are dropped and a warning is logged.
    ///
    /// Note that when a source has a VRL transform configured, documents are not validated against
    /// the doc mapping during ingestion either.
    #[schema(default = true, value_type = bool)]
    #[serde(default = "true_fn", skip_serializing_if = "is_true")]
    pub validate_docs: bool,
}

impl IngestSettings {
    pub fn default_min_shards() -> NonZeroUsize {
        NonZeroUsize::MIN
    }
}

impl Default for IngestSettings {
    fn default() -> Self {
        Self {
            min_shards: Self::default_min_shards(),
            validate_docs: true,
        }
    }
}

#[derive(Clone, Debug, Default, Eq, PartialEq, Serialize, Deserialize, utoipa::ToSchema)]
#[serde(deny_unknown_fields)]
pub struct SearchSettings {
    #[serde(default)]
    pub default_search_fields: Vec<String>,
}

#[derive(Clone, Debug, Hash, Eq, PartialEq, Serialize, Deserialize, utoipa::ToSchema)]
#[serde(deny_unknown_fields)]
pub struct RetentionPolicy {
    /// Duration of time for which the splits should be retained, expressed in a human-friendly way
    /// (`1 hour`, `3 days`, `1 week`, ...).
    #[serde(rename = "period")]
    pub retention_period: String,

    /// Defines the frequency at which the retention policy is evaluated and applied, expressed in
    /// a human-friendly way (`hourly`, `daily`, ...) or as a cron expression (`0 0 * * * *`,
    /// `0 0 0 * * *`).
    #[serde(default = "RetentionPolicy::default_schedule")]
    #[serde(rename = "schedule")]
    pub evaluation_schedule: String,
}

impl RetentionPolicy {
    pub fn default_schedule() -> String {
        "hourly".to_string()
    }

    pub fn retention_period(&self) -> anyhow::Result<Duration> {
        parse_duration(&self.retention_period).with_context(|| {
            format!(
                "failed to parse retention period `{}`",
                self.retention_period
            )
        })
    }

    pub fn evaluation_schedule(&self) -> anyhow::Result<Schedule> {
        let evaluation_schedule = prepend_at_char(&self.evaluation_schedule);

        Schedule::from_str(&evaluation_schedule).with_context(|| {
            format!(
                "failed to parse retention evaluation schedule `{}`",
                self.evaluation_schedule
            )
        })
    }

    pub fn duration_until_next_evaluation(&self) -> anyhow::Result<Duration> {
        let schedule = self.evaluation_schedule()?;
        let future_date = schedule
            .upcoming(Utc)
            .next()
            .expect("Failed to obtain next evaluation date.");
        let duration = (future_date - Utc::now())
            .to_std()
            .map_err(|err| anyhow::anyhow!(err.to_string()))?;
        Ok(duration)
    }

    pub(super) fn validate(&self) -> anyhow::Result<()> {
        self.retention_period()?;
        self.evaluation_schedule()?;
        Ok(())
    }
}

/// Prepends an `@` char at the start of the cron expression if necessary:
/// `hourly` -> `@hourly`
fn prepend_at_char(schedule: &str) -> String {
    let trimmed_schedule = schedule.trim();

    if !trimmed_schedule.is_empty()
        && !trimmed_schedule.starts_with('@')
        && trimmed_schedule.chars().all(|ch| ch.is_ascii_alphabetic())
    {
        return format!("@{trimmed_schedule}");
    }
    trimmed_schedule.to_string()
}

#[derive(Clone, Debug, Serialize, Deserialize, PartialEq)]
#[serde(deny_unknown_fields)]
#[serde(into = "VersionedIndexConfig")]
#[serde(try_from = "VersionedIndexConfig")]
pub struct IndexConfig {
    pub index_id: IndexId,
    pub index_uri: Uri,
    pub doc_mapping: DocMapping,
    pub indexing_settings: IndexingSettings,
    pub ingest_settings: IngestSettings,
    pub search_settings: SearchSettings,
    pub retention_policy_opt: Option<RetentionPolicy>,
}

impl IndexConfig {
    /// Return a fingerprint of parameters relevant for indexers
    ///
    /// This should remain private to this crate to avoid confusion with the
    /// full indexing pipeline fingerprint that also includes the source's
    /// fingerprint.
    pub(crate) fn indexing_params_fingerprint(&self) -> u64 {
        let mut hasher = SipHasher::new();
        self.doc_mapping.doc_mapping_uid.hash(&mut hasher);
        self.indexing_settings.hash(&mut hasher);
        hasher.finish()
    }

    /// Compares IndexConfig level fingerprints
    ///
    /// This method is meant to enable IndexConfig level fingerprint comparison
    /// without taking the risk of mixing them up with pipeline level
    /// fingerprints (computed by
    /// [`crate::indexing_pipeline_params_fingerprint()`]).
    pub fn equals_fingerprint(&self, other: &Self) -> bool {
        self.indexing_params_fingerprint() == other.indexing_params_fingerprint()
    }

    #[cfg(any(test, feature = "testsuite"))]
    pub fn for_test(index_id: &str, index_uri: &str) -> Self {
        let index_uri = Uri::from_str(index_uri).unwrap();
        let doc_mapping_json = r#"{
            "doc_mapping_uid": "00000000000000000000000000",
            "mode": "lenient",
            "field_mappings": [
                {
                    "name": "timestamp",
                    "type": "datetime",
                    "fast": true
                },
                {
                    "name": "body",
                    "type": "text",
                    "stored": true
                },
                {
                    "name": "response_date",
                    "type": "datetime",
                    "fast": true
                },
                {
                    "name": "response_time",
                    "type": "f64",
                    "fast": true
                },
                {
                    "name": "response_payload",
                    "type": "bytes",
                    "fast": true
                },
                {
                    "name": "owner",
                    "type": "text",
                    "tokenizer": "raw"
                },
                {
                    "name": "attributes",
                    "type": "object",
                    "field_mappings": [
                        {
                            "name": "tags",
                            "type": "array<i64>"
                        },
                        {
                            "name": "server",
                            "type": "text"
                        },
                        {
                            "name": "server.status",
                            "type": "array<text>"
                        },
                        {
                            "name": "server.payload",
                            "type": "array<bytes>"
                        }
                    ]
                }
            ],
            "timestamp_field": "timestamp",
            "tag_fields": ["owner"],
            "store_source": true
        }"#;
        let doc_mapping = serde_json::from_str(doc_mapping_json).unwrap();
        let indexing_settings = IndexingSettings {
            resources: IndexingResources::for_test(),
            ..Default::default()
        };
        let search_settings = SearchSettings {
            default_search_fields: vec![
                "body".to_string(),
                r#"attributes.server"#.to_string(),
                r"attributes.server\.status".to_string(),
            ],
        };
        IndexConfig {
            index_id: index_id.to_string(),
            index_uri,
            doc_mapping,
            indexing_settings,
            ingest_settings: IngestSettings::default(),
            search_settings,
            retention_policy_opt: None,
        }
    }
}

#[cfg(any(test, feature = "testsuite"))]
impl crate::TestableForRegression for IndexConfig {
    fn sample_for_regression() -> Self {
        use std::collections::BTreeSet;
        use std::num::NonZeroU32;

        use quickwit_doc_mapper::Mode;
        use quickwit_proto::types::DocMappingUid;

        use crate::merge_policy_config::StableLogMergePolicyConfig;

        let tenant_id_mapping = serde_json::from_str(
            r#"{
                "name": "tenant_id",
                "type": "u64",
                "fast": true
        }"#,
        )
        .unwrap();
        let timestamp_mapping = serde_json::from_str(
            r#"{
                "name": "timestamp",
                "type": "datetime",
                "fast": true
        }"#,
        )
        .unwrap();
        let log_level_mapping = serde_json::from_str(
            r#"{
                "name": "log_level",
                "type": "text",
                "tokenizer": "raw"
        }"#,
        )
        .unwrap();
        let message_mapping = serde_json::from_str(
            r#"{
                "name": "message",
                "type": "text",
                "record": "position",
                "tokenizer": "default"
        }"#,
        )
        .unwrap();
        let tokenizer = serde_json::from_str(
            r#"{
                "name": "custom_tokenizer",
                "type": "regex",
                "pattern": "[^\\p{L}\\p{N}]+"
            }"#,
        )
        .unwrap();
        let doc_mapping = DocMapping {
            doc_mapping_uid: DocMappingUid::for_test(1),
            mode: Mode::default(),
            field_mappings: vec![
                tenant_id_mapping,
                timestamp_mapping,
                log_level_mapping,
                message_mapping,
            ],
            timestamp_field: Some("timestamp".to_string()),
            tag_fields: BTreeSet::from_iter(["tenant_id".to_string(), "log_level".to_string()]),
            partition_key: Some("tenant_id".to_string()),
            max_num_partitions: NonZeroU32::new(100).unwrap(),
            index_field_presence: true,
            store_document_size: false,
            store_source: true,
            tokenizers: vec![tokenizer],
        };
        let stable_log_config = StableLogMergePolicyConfig {
            merge_factor: 9,
            max_merge_factor: 11,
            ..Default::default()
        };
        let merge_policy = MergePolicyConfig::StableLog(stable_log_config);
        let indexing_resources = IndexingResources {
            heap_size: ByteSize::mb(50),
            ..Default::default()
        };
        let indexing_settings = IndexingSettings {
            commit_timeout_secs: 301,
            split_num_docs_target: 10_000_001,
            merge_policy,
            resources: indexing_resources,
            ..Default::default()
        };
        let ingest_settings = IngestSettings {
            min_shards: NonZeroUsize::new(12).unwrap(),
            validate_docs: true,
        };
        let search_settings = SearchSettings {
            default_search_fields: vec!["message".to_string()],
        };
        let retention_policy_opt = Some(RetentionPolicy {
            retention_period: "90 days".to_string(),
            evaluation_schedule: "daily".to_string(),
        });
        IndexConfig {
            index_id: "my-index".to_string(),
            index_uri: Uri::for_test("s3://quickwit-indexes/my-index"),
            doc_mapping,
            indexing_settings,
            ingest_settings,
            search_settings,
            retention_policy_opt,
        }
    }

    fn assert_equality(&self, other: &Self) {
        assert_eq!(self.index_id, other.index_id);
        assert_eq!(self.index_uri, other.index_uri);
        assert_eq!(self.doc_mapping, other.doc_mapping);
        assert_eq!(self.indexing_settings, other.indexing_settings);
        assert_eq!(self.ingest_settings, other.ingest_settings);
        assert_eq!(self.search_settings, other.search_settings);
        assert_eq!(self.retention_policy_opt, other.retention_policy_opt);
    }
}

/// Builds and returns the doc mapper associated with an index.
pub fn build_doc_mapper(
    doc_mapping: &DocMapping,
    search_settings: &SearchSettings,
) -> anyhow::Result<Arc<DocMapper>> {
    let builder = DocMapperBuilder {
        doc_mapping: doc_mapping.clone(),
        default_search_fields: search_settings.default_search_fields.clone(),
        legacy_type_tag: None,
    };
    let doc_mapper = builder.try_build()?;
    Ok(Arc::new(doc_mapper))
}

/// Validates the objects that make up an index configuration. This is a "free" function as opposed
/// to a method on `IndexConfig` so we can reuse it for validating index templates.
pub(super) fn validate_index_config(
    doc_mapping: &DocMapping,
    indexing_settings: &IndexingSettings,
    search_settings: &SearchSettings,
    retention_policy_opt: &Option<RetentionPolicy>,
) -> anyhow::Result<()> {
    // Note: this needs a deep refactoring to separate the doc mapping configuration,
    // and doc mapper implementations.
    // TODO see if we should store the byproducton the IndexConfig.
    build_doc_mapper(doc_mapping, search_settings)?;

    indexing_settings.merge_policy.validate()?;
    indexing_settings.resources.validate()?;

    if let Some(retention_policy) = retention_policy_opt {
        retention_policy.validate()?;

        ensure!(
            doc_mapping.timestamp_field.is_some(),
            "retention policy requires a timestamp field, but doc mapping does not declare one"
        );
    }
    Ok(())
}

/// Returns the updated doc mapping and a boolean indicating whether a mutation occurred.
///
/// The logic goes as follows:
/// 1. If the new doc mapping is the same as the current doc mapping, ignoring their UIDs, returns
///    the current doc mapping and `false`, indicating that no mutation occurred.
/// 2. If the new doc mapping is different from the current doc mapping, verifies the following
///    constraints before returning the new doc mapping and `true`, indicating that a mutation
///    occurred:
///    - The doc mapping UID should differ from the current one
///    - The timestamp field should remain the same
///    - The tokenizers should be a superset of the current tokenizers
///    - A doc mapper can be built from the new doc mapping
pub fn prepare_doc_mapping_update(
    mut new_doc_mapping: DocMapping,
    current_doc_mapping: &DocMapping,
    search_settings: &SearchSettings,
) -> anyhow::Result<(DocMapping, bool)> {
    // Save the new doc mapping UID in a temporary variable and override it with the current doc
    // mapping UID to compare the two doc mappings, ignoring their UIDs.
    let new_doc_mapping_uid = new_doc_mapping.doc_mapping_uid;
    new_doc_mapping.doc_mapping_uid = current_doc_mapping.doc_mapping_uid;

    if new_doc_mapping == *current_doc_mapping {
        return Ok((new_doc_mapping, false));
    }
    // Restore the new doc mapping UID.
    new_doc_mapping.doc_mapping_uid = new_doc_mapping_uid;

    ensure!(
        new_doc_mapping.doc_mapping_uid != current_doc_mapping.doc_mapping_uid,
        "new doc mapping UID should differ from the current one, current UID `{}`, new UID `{}`",
        current_doc_mapping.doc_mapping_uid,
        new_doc_mapping.doc_mapping_uid,
    );
    let new_timestamp_field = new_doc_mapping.timestamp_field.as_deref();
    let current_timestamp_field = current_doc_mapping.timestamp_field.as_deref();
    ensure!(
        new_timestamp_field == current_timestamp_field,
        "updating timestamp field is not allowed, current timestamp field `{}`, new timestamp \
         field `{}`",
        current_timestamp_field.unwrap_or("none"),
        new_timestamp_field.unwrap_or("none"),
    );
    // TODO: Unsure this constraint is required, should we relax it?
    let new_tokenizers: HashSet<_> = new_doc_mapping.tokenizers.iter().collect();
    let current_tokenizers: HashSet<_> = current_doc_mapping.tokenizers.iter().collect();
    ensure!(
        new_tokenizers.is_superset(&current_tokenizers),
        "updating tokenizers is allowed only if adding new tokenizers, current tokenizers \
         `{current_tokenizers:?}`, new tokenizers `{new_tokenizers:?}`",
    );
    build_doc_mapper(&new_doc_mapping, search_settings).context("invalid doc mapping")?;
    Ok((new_doc_mapping, true))
}

#[cfg(test)]
mod tests {

    use cron::TimeUnitSpec;
    use quickwit_doc_mapper::{Mode, ModeType, TokenizerEntry};
    use quickwit_proto::types::DocMappingUid;

    use super::*;
    use crate::ConfigFormat;
    use crate::merge_policy_config::MergePolicyConfig;

    fn get_index_config_filepath(index_config_filename: &str) -> String {
        format!(
            "{}/resources/tests/index_config/{}",
            env!("CARGO_MANIFEST_DIR"),
            index_config_filename
        )
    }

    #[track_caller]
    fn test_index_config_parse_aux(config_format: ConfigFormat) {
        let index_config_filepath =
            get_index_config_filepath(&format!("hdfs-logs.{config_format:?}").to_lowercase());
        let file = std::fs::read_to_string(index_config_filepath).unwrap();
        let index_config = load_index_config_from_user_config(
            config_format,
            file.as_bytes(),
            &Uri::for_test("s3://defaultbucket/"),
        )
        .unwrap();
        assert_eq!(index_config.doc_mapping.tokenizers.len(), 1);
        assert_eq!(index_config.doc_mapping.tokenizers[0].name, "service_regex");
        assert_eq!(index_config.doc_mapping.field_mappings.len(), 5);
        assert_eq!(index_config.doc_mapping.field_mappings[0].name, "tenant_id");
        assert_eq!(index_config.doc_mapping.field_mappings[1].name, "timestamp");
        assert_eq!(
            index_config.doc_mapping.field_mappings[2].name,
            "severity_text"
        );
        assert_eq!(index_config.doc_mapping.field_mappings[3].name, "body");
        assert_eq!(index_config.doc_mapping.field_mappings[4].name, "resource");

        assert_eq!(
            index_config
                .doc_mapping
                .tag_fields
                .into_iter()
                .collect::<Vec<String>>(),
            vec!["tenant_id".to_string()]
        );
        let expected_retention_policy = RetentionPolicy {
            retention_period: "90 days".to_string(),
            evaluation_schedule: "daily".to_string(),
        };
        assert_eq!(
            index_config.retention_policy_opt.unwrap(),
            expected_retention_policy
        );
        assert!(index_config.doc_mapping.store_source);

        assert_eq!(
            index_config.doc_mapping.timestamp_field.unwrap(),
            "timestamp"
        );
        assert_eq!(index_config.indexing_settings.commit_timeout_secs, 61);
        assert_eq!(
            index_config.indexing_settings.merge_policy,
            MergePolicyConfig::StableLog(crate::StableLogMergePolicyConfig {
                merge_factor: 9,
                max_merge_factor: 11,
                maturation_period: Duration::from_secs(48 * 3600),
                ..Default::default()
            })
        );
        assert_eq!(
            index_config.indexing_settings.resources,
            IndexingResources {
                heap_size: ByteSize::gb(3),
                ..Default::default()
            }
        );
        assert_eq!(index_config.ingest_settings.min_shards.get(), 12);
        assert_eq!(
            index_config.search_settings,
            SearchSettings {
                default_search_fields: vec!["severity_text".to_string(), "body".to_string()],
            }
        );
    }

    #[test]
    fn test_index_config_from_json() {
        test_index_config_parse_aux(ConfigFormat::Json);
    }

    #[test]
    fn test_index_config_from_toml() {
        test_index_config_parse_aux(ConfigFormat::Toml);
    }

    #[test]
    fn test_index_config_from_yaml() {
        test_index_config_parse_aux(ConfigFormat::Yaml);
    }

    #[test]
    fn test_indexer_config_default_values() {
        let default_index_root_uri = Uri::for_test("s3://defaultbucket/");
        {
            let index_config_filepath = get_index_config_filepath("minimal-hdfs-logs.yaml");
            let file_content = std::fs::read_to_string(index_config_filepath).unwrap();
            let index_config = load_index_config_from_user_config(
                ConfigFormat::Yaml,
                file_content.as_bytes(),
                &default_index_root_uri,
            )
            .unwrap();

            assert_eq!(index_config.index_id, "hdfs-logs");
            assert_eq!(index_config.index_uri, "s3://quickwit-indexes/hdfs-logs");
            assert_eq!(index_config.doc_mapping.field_mappings.len(), 1);
            assert_eq!(index_config.doc_mapping.field_mappings[0].name, "body");
            assert!(!index_config.doc_mapping.store_source);
            assert_eq!(index_config.indexing_settings, IndexingSettings::default());
            assert_eq!(index_config.ingest_settings, IngestSettings::default());

            let expected_search_settings = SearchSettings {
                default_search_fields: vec!["body".to_string()],
            };
            assert_eq!(index_config.search_settings, expected_search_settings);
            assert!(index_config.retention_policy_opt.is_none());
        }
        {
            let index_config_filepath = get_index_config_filepath("partial-hdfs-logs.yaml");
            let file_content = std::fs::read_to_string(index_config_filepath).unwrap();
            let index_config = load_index_config_from_user_config(
                ConfigFormat::Yaml,
                file_content.as_bytes(),
                &default_index_root_uri,
            )
            .unwrap();

            assert_eq!(index_config.index_id, "hdfs-logs");
            assert_eq!(index_config.index_uri, "s3://quickwit-indexes/hdfs-logs");
            assert_eq!(index_config.doc_mapping.field_mappings.len(), 2);
            assert_eq!(index_config.doc_mapping.field_mappings[0].name, "body");
            assert_eq!(index_config.doc_mapping.field_mappings[1].name, "timestamp");
            assert!(!index_config.doc_mapping.store_source);
            assert_eq!(
                index_config.indexing_settings,
                IndexingSettings {
                    commit_timeout_secs: 42,
                    merge_policy: MergePolicyConfig::default(),
                    resources: IndexingResources {
                        ..Default::default()
                    },
                    ..Default::default()
                }
            );
            assert_eq!(
                index_config.search_settings,
                SearchSettings {
                    default_search_fields: vec!["body".to_string()],
                }
            );
        }
    }

    #[test]
    #[should_panic(expected = "empty URI")]
    fn test_config_validates_uris() {
        let config_yaml = r#"
            version: 0.8
            index_id: hdfs-logs
            index_uri: ''
            doc_mapping: {}
        "#;
        serde_yaml::from_str::<IndexConfig>(config_yaml).unwrap();
    }

    #[test]
    fn test_minimal_index_config_default_dynamic() {
        let config_yaml = r#"
            version: 0.8
            index_id: hdfs-logs
            index_uri: "s3://my-index"
            doc_mapping: {}
        "#;
        let minimal_config: IndexConfig = load_index_config_from_user_config(
            ConfigFormat::Yaml,
            config_yaml.as_bytes(),
            &Uri::for_test("s3://my-index"),
        )
        .unwrap();
        assert_eq!(
            minimal_config.doc_mapping.mode.mode_type(),
            ModeType::Dynamic
        );
    }

    #[test]
    fn test_index_config_with_malformed_maturation_duration() {
        let config_yaml = r#"
            version: 0.8
            index_id: hdfs-logs
            index_uri: "s3://my-index"
            doc_mapping: {}
            indexing_settings:
              merge_policy:
                type: limit_merge
                maturation_period: x
        "#;
        let parsing_config_error = load_index_config_from_user_config(
            ConfigFormat::Yaml,
            config_yaml.as_bytes(),
            &Uri::for_test("s3://my-index"),
        )
        .unwrap_err();
        println!("{parsing_config_error:?}");
        assert!(
            parsing_config_error
                .root_cause()
                .to_string()
                .contains("failed to parse human-readable duration `x`")
        );
    }

    #[test]
    fn test_retention_policy_serialization() {
        let retention_policy = RetentionPolicy {
            retention_period: "90 days".to_string(),
            evaluation_schedule: "hourly".to_string(),
        };
        let retention_policy_yaml = serde_yaml::to_string(&retention_policy).unwrap();
        assert_eq!(
            serde_yaml::from_str::<RetentionPolicy>(&retention_policy_yaml).unwrap(),
            retention_policy,
        );
    }

    #[test]
    fn test_retention_policy_deserialization() {
        {
            let retention_policy_yaml = r#"
            period: 90 days
        "#;
            let retention_policy =
                serde_yaml::from_str::<RetentionPolicy>(retention_policy_yaml).unwrap();

            let expected_retention_policy = RetentionPolicy {
                retention_period: "90 days".to_string(),
                evaluation_schedule: "hourly".to_string(),
            };
            assert_eq!(retention_policy, expected_retention_policy);
        }
        {
            let retention_policy_yaml = r#"
            period: 90 days
            schedule: daily
        "#;
            let retention_policy =
                serde_yaml::from_str::<RetentionPolicy>(retention_policy_yaml).unwrap();

            let expected_retention_policy = RetentionPolicy {
                retention_period: "90 days".to_string(),
                evaluation_schedule: "daily".to_string(),
            };
            assert_eq!(retention_policy, expected_retention_policy);
        }
    }

    #[test]
    fn test_parse_retention_policy_period() {
        {
            let retention_policy = RetentionPolicy {
                retention_period: "1 hour".to_string(),
                evaluation_schedule: "hourly".to_string(),
            };
            assert_eq!(
                retention_policy.retention_period().unwrap(),
                Duration::from_secs(3600)
            );
            {
                let retention_policy = RetentionPolicy {
                    retention_period: "foo".to_string(),
                    evaluation_schedule: "hourly".to_string(),
                };
                assert_eq!(
                    retention_policy.retention_period().unwrap_err().to_string(),
                    "failed to parse retention period `foo`"
                );
            }
        }
    }

    #[test]
    fn test_prepend_at_char() {
        assert_eq!(prepend_at_char(""), "");
        assert_eq!(prepend_at_char("* * 0 0 0"), "* * 0 0 0");
        assert_eq!(prepend_at_char("hourly"), "@hourly");
        assert_eq!(prepend_at_char("@hourly"), "@hourly");
    }

    #[test]
    fn test_parse_retention_policy_schedule() {
        let hourly_schedule = Schedule::from_str("@hourly").unwrap();
        {
            let retention_policy = RetentionPolicy {
                retention_period: "1 hour".to_string(),
                evaluation_schedule: "@hourly".to_string(),
            };
            assert_eq!(
                retention_policy.evaluation_schedule().unwrap(),
                hourly_schedule
            );
        }
        {
            let retention_policy = RetentionPolicy {
                retention_period: "1 hour".to_string(),
                evaluation_schedule: "hourly".to_string(),
            };
            assert_eq!(
                retention_policy.evaluation_schedule().unwrap(),
                hourly_schedule
            );
        }
        {
            let retention_policy = RetentionPolicy {
                retention_period: "1 hour".to_string(),
                evaluation_schedule: "0 * * * * *".to_string(),
            };
            let evaluation_schedule = retention_policy.evaluation_schedule().unwrap();
            assert_eq!(evaluation_schedule.seconds().count(), 1);
            assert_eq!(evaluation_schedule.minutes().count(), 60);
        }
    }

    #[test]
    fn test_retention_policy_validate() {
        {
            let retention_policy = RetentionPolicy {
                retention_period: "1 hour".to_string(),
                evaluation_schedule: "hourly".to_string(),
            };
            retention_policy.validate().unwrap();
        }
        {
            let retention_policy = RetentionPolicy {
                retention_period: "foo".to_string(),
                evaluation_schedule: "hourly".to_string(),
            };
            retention_policy.validate().unwrap_err();
        }
        {
            let retention_policy = RetentionPolicy {
                retention_period: "1 hour".to_string(),
                evaluation_schedule: "foo".to_string(),
            };
            retention_policy.validate().unwrap_err();
        }
    }

    #[test]
    fn test_retention_schedule_duration() {
        let schedule_test_helper_fn = |schedule_str: &str| {
            let hourly_schedule = Schedule::from_str(&prepend_at_char(schedule_str)).unwrap();
            let retention_policy = RetentionPolicy {
                retention_period: "1 hour".to_string(),
                evaluation_schedule: schedule_str.to_string(),
            };

            let next_evaluation_duration = chrono::Duration::nanoseconds(
                retention_policy
                    .duration_until_next_evaluation()
                    .unwrap()
                    .as_nanos() as i64,
            );
            let next_evaluation_date = Utc::now() + next_evaluation_duration;
            let expected_date = hourly_schedule.upcoming(Utc).next().unwrap();
            assert_eq!(next_evaluation_date.timestamp(), expected_date.timestamp());
        };

        schedule_test_helper_fn("hourly");
        schedule_test_helper_fn("daily");
        schedule_test_helper_fn("weekly");
        schedule_test_helper_fn("monthly");
        schedule_test_helper_fn("* * * ? * ?");
    }

    #[test]
    fn test_ingest_settings_serde() {
        let settings = IngestSettings {
            min_shards: NonZeroUsize::MIN,
            validate_docs: false,
        };
        let settings_yaml = serde_yaml::to_string(&settings).unwrap();
        assert!(settings_yaml.contains("validate_docs"));

        let expected_settings: IngestSettings = serde_yaml::from_str(&settings_yaml).unwrap();
        assert_eq!(settings, expected_settings);

        let settings = IngestSettings {
            min_shards: NonZeroUsize::MIN,
            validate_docs: true,
        };
        let settings_yaml = serde_yaml::to_string(&settings).unwrap();
        assert!(!settings_yaml.contains("validate_docs"));

        let expected_settings: IngestSettings = serde_yaml::from_str(&settings_yaml).unwrap();
        assert_eq!(settings, expected_settings);

        let settings_yaml = r#"
            min_shards: 0
        "#;
        let error = serde_yaml::from_str::<IngestSettings>(settings_yaml).unwrap_err();
        assert!(error.to_string().contains("expected a nonzero"));
    }

    #[test]
    fn test_prepare_doc_mapping_update() {
        let current_index_config = IndexConfig::for_test("test-index", "s3://test-index");
        let mut current_doc_mapping = current_index_config.doc_mapping;
        let search_settings = current_index_config.search_settings;

        let tokenizer_json = r#"
            {
                "name": "breton-tokenizer",
                "type": "regex",
                "pattern": "crêpes*"
            }
            "#;
        let tokenizer: TokenizerEntry = serde_json::from_str(tokenizer_json).unwrap();

        current_doc_mapping.tokenizers.push(tokenizer.clone());

        // The new doc mapping should have a different doc mapping UID.
        let mut new_doc_mapping = current_doc_mapping.clone();
        new_doc_mapping.store_source = false; // This is set to `true` for the current doc mapping.
        let error =
            prepare_doc_mapping_update(new_doc_mapping, &current_doc_mapping, &search_settings)
                .unwrap_err()
                .to_string();
        assert!(error.contains("doc mapping UID should differ"));

        // The new doc mapping should not change the timestamp field.
        let mut new_doc_mapping = current_doc_mapping.clone();
        new_doc_mapping.doc_mapping_uid = DocMappingUid::random();
        new_doc_mapping.timestamp_field = Some("ts".to_string()); // This is set to `timestamp` for the current doc mapping.
        let error =
            prepare_doc_mapping_update(new_doc_mapping, &current_doc_mapping, &search_settings)
                .unwrap_err()
                .to_string();
        assert!(error.contains("timestamp field"));

        // The new doc mapping should not remove the timestamp field.
        let mut new_doc_mapping = current_doc_mapping.clone();
        new_doc_mapping.doc_mapping_uid = DocMappingUid::random();
        new_doc_mapping.timestamp_field = None;
        let error =
            prepare_doc_mapping_update(new_doc_mapping, &current_doc_mapping, &search_settings)
                .unwrap_err()
                .to_string();
        assert!(error.contains("timestamp field"));

        // The new doc mapping should not remove tokenizers.
        let mut new_doc_mapping = current_doc_mapping.clone();
        new_doc_mapping.doc_mapping_uid = DocMappingUid::random();
        new_doc_mapping.tokenizers.clear();
        let error =
            prepare_doc_mapping_update(new_doc_mapping, &current_doc_mapping, &search_settings)
                .unwrap_err()
                .to_string();
        assert!(error.contains("tokenizers"));

        // The new doc mapping should be "buildable" into a doc mapper.
        let mut new_doc_mapping = current_doc_mapping.clone();
        new_doc_mapping.doc_mapping_uid = DocMappingUid::random();
        new_doc_mapping.tokenizers.push(tokenizer);
        let error =
            prepare_doc_mapping_update(new_doc_mapping, &current_doc_mapping, &search_settings)
                .unwrap_err()
                .source()
                .unwrap()
                .to_string();
        assert!(error.contains("duplicated custom tokenizer"));

        let mut new_doc_mapping = current_doc_mapping.clone();
        new_doc_mapping.doc_mapping_uid = DocMappingUid::random();
        let (updated_doc_mapping, mutation_occurred) =
            prepare_doc_mapping_update(new_doc_mapping, &current_doc_mapping, &search_settings)
                .unwrap();
        assert!(!mutation_occurred);
        assert_eq!(
            updated_doc_mapping.doc_mapping_uid,
            current_doc_mapping.doc_mapping_uid
        );
        assert_eq!(updated_doc_mapping, current_doc_mapping);

        let mut new_doc_mapping = current_doc_mapping.clone();
        let new_doc_mapping_uid = DocMappingUid::random();
        new_doc_mapping.doc_mapping_uid = new_doc_mapping_uid;
        new_doc_mapping.mode = Mode::Strict;
        let (updated_doc_mapping, mutation_occurred) =
            prepare_doc_mapping_update(new_doc_mapping, &current_doc_mapping, &search_settings)
                .unwrap();
        assert!(mutation_occurred);
        assert_eq!(updated_doc_mapping.doc_mapping_uid, new_doc_mapping_uid);
        assert_eq!(updated_doc_mapping.mode, Mode::Strict);
    }
}


================================================
FILE: quickwit/quickwit-config/src/index_config/serialize.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use anyhow::{Context, ensure};
use quickwit_common::uri::Uri;
use quickwit_proto::types::{DocMappingUid, IndexId};
use serde::{Deserialize, Serialize};
use tracing::info;

use super::{IngestSettings, validate_index_config};
use crate::{
    ConfigFormat, DocMapping, IndexConfig, IndexingSettings, RetentionPolicy, SearchSettings,
    prepare_doc_mapping_update, validate_identifier,
};

/// Alias for the latest serialization format.
type IndexConfigForSerialization = IndexConfigV0_8;

#[derive(Clone, Debug, Serialize, Deserialize, utoipa::ToSchema)]
#[serde(tag = "version")]
pub(crate) enum VersionedIndexConfig {
    // The two versions use the same format but for v0.8 and below, we need to set the
    // `doc_mapping_uid` to the nil value upon deserialization.
    #[serde(rename = "0.9")]
    V0_9(IndexConfigV0_8),
    // Retro compatibility
    #[serde(rename = "0.8")]
    #[serde(alias = "0.7")]
    V0_8(IndexConfigV0_8),
}

impl From<VersionedIndexConfig> for IndexConfigForSerialization {
    fn from(versioned_config: VersionedIndexConfig) -> IndexConfigForSerialization {
        match versioned_config {
            VersionedIndexConfig::V0_8(v0_8) => v0_8,
            VersionedIndexConfig::V0_9(v0_8) => v0_8,
        }
    }
}

/// Parses and validates an [`IndexConfig`] as supplied by a user with a given [`ConfigFormat`],
/// config content and a `default_index_root_uri`.
pub fn load_index_config_from_user_config(
    config_format: ConfigFormat,
    config_content: &[u8],
    default_index_root_uri: &Uri,
) -> anyhow::Result<IndexConfig> {
    let versioned_index_config: VersionedIndexConfig = config_format.parse(config_content)?;
    let index_config_for_serialization: IndexConfigForSerialization = versioned_index_config.into();
    index_config_for_serialization.build_and_validate(Some(default_index_root_uri))
}

/// Parses and validates an [`IndexConfig`] update.
///
/// Ensures that the new configuration is valid in itself and compared to the
/// current index config. If the new configuration omits some fields, the
/// default values will be used, not those of the current index config.
pub fn load_index_config_update(
    config_format: ConfigFormat,
    index_config_bytes: &[u8],
    default_index_root_uri: &Uri,
    current_index_config: &IndexConfig,
) -> anyhow::Result<IndexConfig> {
    let mut new_index_config = load_index_config_from_user_config(
        config_format,
        index_config_bytes,
        default_index_root_uri,
    )?;
    ensure!(
        current_index_config.index_id == new_index_config.index_id,
        "`index_id` in config file {} does not match updated `index_id` {}",
        current_index_config.index_id,
        new_index_config.index_id
    );
    ensure!(
        current_index_config.index_uri == new_index_config.index_uri,
        "`index_uri` cannot be updated, current value {}, new expected value {}",
        current_index_config.index_uri,
        new_index_config.index_uri
    );
    let (updated_doc_mapping, _mutation_occurred) = prepare_doc_mapping_update(
        new_index_config.doc_mapping,
        &current_index_config.doc_mapping,
        &new_index_config.search_settings,
    )?;
    new_index_config.doc_mapping = updated_doc_mapping;

    Ok(new_index_config)
}

impl IndexConfigForSerialization {
    fn index_uri_or_fallback_to_default(
        &self,
        default_index_root_uri_opt: Option<&Uri>,
    ) -> anyhow::Result<Uri> {
        if let Some(index_uri) = &self.index_uri {
            return Ok(index_uri.clone());
        }
        let default_index_root_uri = default_index_root_uri_opt.context("missing `index_uri`")?;
        let index_uri: Uri = default_index_root_uri.join(&self.index_id)
            .context("failed to create default index URI. this should never happen! please, report on https://github.com/quickwit-oss/quickwit/issues")?;
        info!(
            index_id=%self.index_id,
            index_uri=%index_uri,
            "index config does not specify `index_uri`, falling back to default value",
        );
        Ok(index_uri)
    }

    pub fn build_and_validate(
        self,
        default_index_root_uri: Option<&Uri>,
    ) -> anyhow::Result<IndexConfig> {
        validate_identifier("index", &self.index_id)?;

        let index_uri = self.index_uri_or_fallback_to_default(default_index_root_uri)?;

        let index_config = IndexConfig {
            index_id: self.index_id,
            index_uri,
            doc_mapping: self.doc_mapping,
            indexing_settings: self.indexing_settings,
            ingest_settings: self.ingest_settings,
            search_settings: self.search_settings,
            retention_policy_opt: self.retention_policy_opt,
        };
        validate_index_config(
            &index_config.doc_mapping,
            &index_config.indexing_settings,
            &index_config.search_settings,
            &index_config.retention_policy_opt,
        )?;
        Ok(index_config)
    }
}

impl From<IndexConfig> for VersionedIndexConfig {
    fn from(index_config: IndexConfig) -> Self {
        VersionedIndexConfig::V0_9(index_config.into())
    }
}

impl TryFrom<VersionedIndexConfig> for IndexConfig {
    type Error = anyhow::Error;

    fn try_from(versioned_index_config: VersionedIndexConfig) -> anyhow::Result<Self> {
        match versioned_index_config {
            VersionedIndexConfig::V0_8(mut v0_8) => {
                // Override the randomly generated doc mapping UID with the nil value.
                v0_8.doc_mapping.doc_mapping_uid = DocMappingUid::default();
                v0_8.build_and_validate(None)
            }
            VersionedIndexConfig::V0_9(v0_8) => v0_8.build_and_validate(None),
        }
    }
}

#[derive(Clone, Debug, Serialize, Deserialize, utoipa::ToSchema)]
#[serde(deny_unknown_fields)]
pub struct IndexConfigV0_8 {
    #[schema(value_type = String)]
    pub index_id: IndexId,
    #[schema(value_type = String)]
    #[serde(default)]
    pub index_uri: Option<Uri>,
    pub doc_mapping: DocMapping,
    #[serde(default)]
    pub indexing_settings: IndexingSettings,
    #[serde(default)]
    pub ingest_settings: IngestSettings,
    #[serde(default)]
    pub search_settings: SearchSettings,
    #[serde(rename = "retention")]
    #[serde(default)]
    pub retention_policy_opt: Option<RetentionPolicy>,
}

impl From<IndexConfig> for IndexConfigV0_8 {
    fn from(index_config: IndexConfig) -> Self {
        IndexConfigV0_8 {
            index_id: index_config.index_id,
            index_uri: Some(index_config.index_uri),
            doc_mapping: index_config.doc_mapping,
            indexing_settings: index_config.indexing_settings,
            ingest_settings: index_config.ingest_settings,
            search_settings: index_config.search_settings,
            retention_policy_opt: index_config.retention_policy_opt,
        }
    }
}

#[cfg(test)]
mod test {
    use super::*;
    use crate::merge_policy_config::{MergePolicyConfig, StableLogMergePolicyConfig};

    fn minimal_index_config_for_serialization() -> IndexConfigForSerialization {
        serde_yaml::from_str(
            r#"
            index_id: hdfs-logs
            index_uri: s3://quickwit-indexes/hdfs-logs

            doc_mapping:
                field_mappings:
                    - name: body
                      type: text
                      tokenizer: default
                      record: position

            search_settings:
                default_search_fields: [body]
        "#,
        )
        .unwrap()
    }

    #[test]
    fn test_validate_invalid_merge_policy() {
        // Not yet invalid, but we modify it right after this.
        let mut invalid_index_config: IndexConfigForSerialization =
            minimal_index_config_for_serialization();
        // Set a max merge factor to an inconsistent value.
        let mut stable_log_merge_policy_config = StableLogMergePolicyConfig::default();
        stable_log_merge_policy_config.max_merge_factor =
            stable_log_merge_policy_config.merge_factor - 1;
        invalid_index_config.indexing_settings.merge_policy =
            MergePolicyConfig::StableLog(stable_log_merge_policy_config);
        let validation_err = invalid_index_config
            .build_and_validate(None)
            .unwrap_err()
            .to_string();
        assert_eq!(
            validation_err,
            "index config merge policy `max_merge_factor` must be superior or equal to \
             `merge_factor`"
        );
    }

    #[test]
    fn test_validate_retention_policy() {
        // Not yet invalid, but we modify it right after this.
        let mut invalid_index_config: IndexConfigForSerialization =
            minimal_index_config_for_serialization();
        invalid_index_config.retention_policy_opt = Some(RetentionPolicy {
            retention_period: "90 days".to_string(),
            evaluation_schedule: "hourly".to_string(),
        });
        let validation_err = invalid_index_config
            .build_and_validate(None)
            .unwrap_err()
            .to_string();
        assert!(validation_err.contains("retention policy requires a timestamp field"));
    }

    #[test]
    fn test_minimal_index_config_missing_root_uri_no_default_uri() {
        let config_yaml = r#"
            version: 0.8
            index_id: hdfs-logs
            doc_mapping: {}
        "#;
        let config_parse_result: anyhow::Result<IndexConfig> =
            ConfigFormat::Yaml.parse(config_yaml.as_bytes());
        assert!(format!("{:?}", config_parse_result.unwrap_err()).contains("missing `index_uri`"));
    }

    #[test]
    fn test_minimal_index_config_missing_root_uri_with_default_index_root_uri() {
        let config_yaml = r#"
            version: 0.8
            index_id: hdfs-logs
            doc_mapping: {}
        "#;
        {
            let index_config: IndexConfig = load_index_config_from_user_config(
                ConfigFormat::Yaml,
                config_yaml.as_bytes(),
                // same but without the trailing slash.
                &Uri::for_test("s3://mybucket"),
            )
            .unwrap();
            assert_eq!(index_config.index_uri.as_str(), "s3://mybucket/hdfs-logs");
        }
    }

    #[test]
    fn test_update_index_root_uri() {
        let original_config_yaml = r#"
            version: 0.8
            index_id: hdfs-logs
            doc_mapping: {}
        "#;
        let default_root = Uri::for_test("s3://mybucket");
        let original_config: IndexConfig = load_index_config_from_user_config(
            ConfigFormat::Yaml,
            original_config_yaml.as_bytes(),
            &default_root,
        )
        .unwrap();
        {
            // use default in update
            let updated_config_yaml = r#"
                version: 0.8
                index_id: hdfs-logs
                doc_mapping: {}
            "#;
            let updated_config = load_index_config_update(
                ConfigFormat::Yaml,
                updated_config_yaml.as_bytes(),
                &default_root,
                &original_config,
            )
            .unwrap();
            assert_eq!(updated_config.index_uri.as_str(), "s3://mybucket/hdfs-logs");
        }
        {
            // use the current index_uri explicitly
            let updated_config_yaml = r#"
                version: 0.8
                index_id: hdfs-logs
                index_uri: s3://mybucket/hdfs-logs
                doc_mapping: {}
            "#;
            let updated_config = load_index_config_update(
                ConfigFormat::Yaml,
                updated_config_yaml.as_bytes(),
                &default_root,
                &original_config,
            )
            .unwrap();
            assert_eq!(updated_config.index_uri.as_str(), "s3://mybucket/hdfs-logs");
        }
        {
            // try using a different index_uri
            let updated_config_yaml = r#"
                version: 0.8
                index_id: hdfs-logs
                index_uri: s3://mybucket/new-directory/
                doc_mapping: {}
            "#;
            let load_error = load_index_config_update(
                ConfigFormat::Yaml,
                updated_config_yaml.as_bytes(),
                &default_root,
                &original_config,
            )
            .unwrap_err();
            assert!(format!("{load_error:?}").contains("`index_uri` cannot be updated"));
        }
    }

    #[test]
    fn test_update_reset_defaults() {
        let original_config_yaml = r#"
            version: 0.8
            index_id: hdfs-logs
            doc_mapping:
                field_mappings:
                    - name: timestamp
                      type: datetime
                      fast: true
                timestamp_field: timestamp

            search_settings:
                default_search_fields: [body]

            indexing_settings:
                commit_timeout_secs: 10

            retention:
                period: 90 days
                schedule: daily
        "#;
        let default_root = Uri::for_test("s3://mybucket");
        let original_config: IndexConfig = load_index_config_from_user_config(
            ConfigFormat::Yaml,
            original_config_yaml.as_bytes(),
            &default_root,
        )
        .unwrap();

        let updated_config_yaml = r#"
            version: 0.8
            index_id: hdfs-logs
            doc_mapping:
                field_mappings:
                    - name: timestamp
                      type: datetime
                      fast: true
                timestamp_field: timestamp
        "#;
        let updated_config = load_index_config_update(
            ConfigFormat::Yaml,
            updated_config_yaml.as_bytes(),
            &default_root,
            &original_config,
        )
        .unwrap();
        assert_eq!(
            updated_config.search_settings.default_search_fields,
            Vec::<String>::default(),
        );
        assert_eq!(
            updated_config.indexing_settings.commit_timeout_secs,
            IndexingSettings::default_commit_timeout_secs()
        );
        assert_eq!(updated_config.retention_policy_opt, None);
    }

    #[test]
    fn test_update_doc_mappings() {
        let original_config_yaml = r#"
            version: 0.8
            index_id: hdfs-logs
            doc_mapping: {}
        "#;
        let default_root = Uri::for_test("s3://mybucket");
        let original_config: IndexConfig = load_index_config_from_user_config(
            ConfigFormat::Yaml,
            original_config_yaml.as_bytes(),
            &default_root,
        )
        .unwrap();

        let updated_config_yaml = r#"
            version: 0.8
            index_id: hdfs-logs
            doc_mapping:
                field_mappings:
                    - name: body
                      type: text
                      tokenizer: default
                      record: position
        "#;
        let updated_config = load_index_config_update(
            ConfigFormat::Yaml,
            updated_config_yaml.as_bytes(),
            &default_root,
            &original_config,
        )
        .unwrap();
        assert_eq!(updated_config.doc_mapping.field_mappings.len(), 1);
    }

    #[test]
    fn test_update_doc_mappings_failing_cases() {
        let original_config_yaml = r#"
            version: 0.8
            index_id: hdfs-logs
            doc_mapping:
                mode: lenient
                doc_mapping_uid: 00000000000000000000000000
                timestamp_field: timestamp
                field_mappings:
                    - name: timestamp
                      type: datetime
                      fast: true
        "#;
        let default_root = Uri::for_test("s3://mybucket");
        let original_config: IndexConfig = load_index_config_from_user_config(
            ConfigFormat::Yaml,
            original_config_yaml.as_bytes(),
            &default_root,
        )
        .unwrap();

        let updated_config_yaml = r#"
            version: 0.8
            index_id: hdfs-logs
            doc_mapping:
                mode: lenient
                doc_mapping_uid: 00000000000000000000000000
                timestamp_field: timestamp
                field_mappings:
                    - name: timestamp
                      type: datetime
                      fast: true
                    - name: body
                      type: text
                      tokenizer: default
                      record: position
        "#;
        load_index_config_update(
            ConfigFormat::Yaml,
            updated_config_yaml.as_bytes(),
            &default_root,
            &original_config,
        )
        .expect_err("mapping changed but uid fixed should error");

        let updated_config_yaml = r#"
            version: 0.8
            index_id: hdfs-logs
            doc_mapping:
                mode: lenient
                field_mappings:
                    - name: timestamp
                      type: datetime
                      fast: true
        "#;
        load_index_config_update(
            ConfigFormat::Yaml,
            updated_config_yaml.as_bytes(),
            &default_root,
            &original_config,
        )
        .expect_err("timestamp field removed should error");

        let updated_config_yaml = r#"
            version: 0.8
            index_id: hdfs-logs
            doc_mapping:
                mode: lenient
                timestamp_field: timestamp
                field_mappings:
                    - name: body
                      type: text
                      tokenizer: default
                      record: position
        "#;
        load_index_config_update(
            ConfigFormat::Yaml,
            updated_config_yaml.as_bytes(),
            &default_root,
            &original_config,
        )
        .expect_err("field required for timestamp is absent");

        let updated_config_yaml = r#"
            version: 0.8
            index_id: hdfs-logs
            doc_mapping:
                mode: lenient
                timestamp_field: timestamp
                field_mappings:
                    - name: timestamp
                      type: datetime
                      fast: true
            search_settings:
              default_search_fields: ["i_dont_exist"]
        "#;
        load_index_config_update(
            ConfigFormat::Yaml,
            updated_config_yaml.as_bytes(),
            &default_root,
            &original_config,
        )
        .expect_err("field required for default search is absent");
    }
}


================================================
FILE: quickwit/quickwit-config/src/index_template/mod.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

mod serialize;

use anyhow::ensure;
use quickwit_common::uri::Uri;
use quickwit_proto::types::{DocMappingUid, IndexId};
use serde::{Deserialize, Serialize};
pub use serialize::{IndexTemplateV0_8, VersionedIndexTemplate};

use crate::index_config::{IngestSettings, validate_index_config};
use crate::{
    DocMapping, IndexConfig, IndexingSettings, RetentionPolicy, SearchSettings,
    validate_identifier, validate_index_id_pattern,
};

pub type IndexTemplateId = String;
pub type IndexIdPattern = String;

#[derive(Debug, Clone, PartialEq, Serialize, Deserialize)]
#[serde(into = "VersionedIndexTemplate")]
#[serde(from = "VersionedIndexTemplate")]
pub struct IndexTemplate {
    pub template_id: IndexTemplateId,
    pub index_id_patterns: Vec<IndexIdPattern>,
    #[serde(default)]
    pub index_root_uri: Option<Uri>,
    #[serde(default)]
    pub priority: usize,
    #[serde(default)]
    pub description: Option<String>,
    pub doc_mapping: DocMapping,
    #[serde(default)]
    pub indexing_settings: IndexingSettings,
    #[serde(default)]
    pub ingest_settings: IngestSettings,
    #[serde(default)]
    pub search_settings: SearchSettings,
    #[serde(rename = "retention")]
    #[serde(default)]
    pub retention_policy_opt: Option<RetentionPolicy>,
}

impl IndexTemplate {
    pub fn apply_template(
        &self,
        index_id: IndexId,
        default_index_root_uri: &Uri,
    ) -> anyhow::Result<IndexConfig> {
        let index_uri = self
            .index_root_uri
            .as_ref()
            .unwrap_or(default_index_root_uri)
            .join(&index_id)?;

        // Ensure that the doc mapping UID is truly unique per index.
        let mut doc_mapping = self.doc_mapping.clone();
        doc_mapping.doc_mapping_uid = DocMappingUid::random();

        let index_config = IndexConfig {
            index_id,
            index_uri,
            doc_mapping,
            indexing_settings: self.indexing_settings.clone(),
            ingest_settings: self.ingest_settings.clone(),
            search_settings: self.search_settings.clone(),
            retention_policy_opt: self.retention_policy_opt.clone(),
        };
        Ok(index_config)
    }

    pub fn validate(&self) -> anyhow::Result<()> {
        validate_identifier("template", &self.template_id)?;

        ensure!(
            !self.index_id_patterns.is_empty(),
            "`index_id_patterns` must not be empty"
        );
        for index_id_pattern in &self.index_id_patterns {
            validate_index_id_pattern(index_id_pattern, true)?;
        }
        validate_index_config(
            &self.doc_mapping,
            &self.indexing_settings,
            &self.search_settings,
            &self.retention_policy_opt,
        )?;
        Ok(())
    }

    #[cfg(any(test, feature = "testsuite"))]
    pub fn for_test(template_id: &str, index_id_patterns: &[&str], priority: usize) -> Self {
        let index_id_patterns: Vec<IndexIdPattern> = index_id_patterns
            .iter()
            .map(|pattern| pattern.to_string())
            .collect();

        let doc_mapping_json = r#"{
            "field_mappings": [
                {
                    "name": "ts",
                    "type": "datetime",
                    "fast": true
                },
                {
                    "name": "message",
                    "type": "json"
                }
            ],
            "timestamp_field": "ts"
        }"#;
        let doc_mapping: DocMapping = serde_json::from_str(doc_mapping_json).unwrap();

        IndexTemplate {
            template_id: template_id.to_string(),
            index_root_uri: Some(Uri::for_test("ram:///indexes")),
            index_id_patterns,
            priority,
            description: Some("Test description.".to_string()),
            doc_mapping,
            indexing_settings: IndexingSettings::default(),
            ingest_settings: IngestSettings::default(),
            search_settings: SearchSettings::default(),
            retention_policy_opt: None,
        }
    }
}

#[cfg(any(test, feature = "testsuite"))]
impl crate::TestableForRegression for IndexTemplate {
    fn sample_for_regression() -> Self {
        let template_id = "test-template".to_string();
        let index_id_patterns = vec![
            "test-index-foo*".to_string(),
            "-test-index-foobar".to_string(),
        ];

        let doc_mapping_json = r#"{
            "doc_mapping_uid": "00000000000000000000000001",
            "field_mappings": [
                {
                    "name": "ts",
                    "type": "datetime",
                    "fast": true
                },
                {
                    "name": "message",
                    "type": "json"
                }
            ],
            "timestamp_field": "ts"
        }"#;
        let doc_mapping: DocMapping = serde_json::from_str(doc_mapping_json).unwrap();

        IndexTemplate {
            template_id: template_id.to_string(),
            index_root_uri: Some(Uri::for_test("ram:///indexes")),
            index_id_patterns,
            priority: 100,
            description: Some("Test description.".to_string()),
            doc_mapping,
            indexing_settings: IndexingSettings::default(),
            ingest_settings: IngestSettings::default(),
            search_settings: SearchSettings::default(),
            retention_policy_opt: Some(RetentionPolicy {
                retention_period: "42 days".to_string(),
                evaluation_schedule: "daily".to_string(),
            }),
        }
    }

    fn assert_equality(&self, other: &Self) {
        assert_eq!(self, other);
    }
}

#[cfg(test)]
mod tests {
    use super::*;

    #[test]
    fn test_index_template_serde() {
        let index_template_yaml = r#"
            version: 0.8

            template_id: test-template
            index_id_patterns:
              - test-index-*
              - -test-index-foo
            description: Test description.
            priority: 100
            doc_mapping:
              field_mappings:
                - name: ts
                  type: datetime
                  fast: true
                - name: message
                  type: json
              timestamp_field: ts
        "#;
        let index_template: IndexTemplate = serde_yaml::from_str(index_template_yaml).unwrap();
        assert_eq!(index_template.template_id, "test-template");
        assert_eq!(index_template.index_id_patterns.len(), 2);
        assert_eq!(
            index_template.index_id_patterns,
            ["test-index-*", "-test-index-foo"]
        );
        assert_eq!(index_template.priority, 100);
        assert_eq!(index_template.description.unwrap(), "Test description.");
        assert_eq!(index_template.doc_mapping.timestamp_field.unwrap(), "ts");
    }

    #[test]
    fn test_index_template_apply() {
        let mut index_template = IndexTemplate::for_test("test-template", &["test-index-*"], 0);

        index_template.indexing_settings = IndexingSettings {
            commit_timeout_secs: 42,
            ..Default::default()
        };
        index_template.search_settings = SearchSettings {
            default_search_fields: vec!["message".to_string()],
        };
        index_template.retention_policy_opt = Some(RetentionPolicy {
            retention_period: "42 days".to_string(),
            evaluation_schedule: "hourly".to_string(),
        });
        let default_index_root_uri = Uri::for_test("s3://test-bucket/indexes");

        let index_config_foo = index_template
            .apply_template("test-index-foo".to_string(), &default_index_root_uri)
            .unwrap();

        assert_eq!(index_config_foo.index_id, "test-index-foo");
        assert_eq!(index_config_foo.index_uri, "ram:///indexes/test-index-foo");

        assert_eq!(index_config_foo.doc_mapping.timestamp_field.unwrap(), "ts");
        assert_eq!(index_config_foo.indexing_settings.commit_timeout_secs, 42);
        assert_eq!(
            index_config_foo.search_settings.default_search_fields,
            ["message"]
        );
        let retention_policy = index_config_foo.retention_policy_opt.unwrap();
        assert_eq!(retention_policy.retention_period, "42 days");
        assert_eq!(retention_policy.evaluation_schedule, "hourly");

        index_template.index_root_uri = None;

        let index_config_bar = index_template
            .apply_template("test-index-bar".to_string(), &default_index_root_uri)
            .unwrap();

        assert_eq!(index_config_bar.index_id, "test-index-bar");
        assert_eq!(
            index_config_bar.index_uri,
            "s3://test-bucket/indexes/test-index-bar"
        );
        assert_ne!(
            index_config_foo.doc_mapping.doc_mapping_uid,
            index_config_bar.doc_mapping.doc_mapping_uid
        );
    }

    #[test]
    fn test_index_template_validate() {
        let index_template = IndexTemplate::for_test("", &[], 0);
        let error = index_template.validate().unwrap_err();
        assert!(error.to_string().contains("template ID `` is invalid"));

        let index_template = IndexTemplate::for_test("test-template", &[], 0);
        let error = index_template.validate().unwrap_err();
        assert!(error.to_string().contains("empty"));

        let index_template = IndexTemplate::for_test("test-template", &[""], 0);
        let error = index_template.validate().unwrap_err();
        assert!(error.to_string().contains("index ID pattern `` is invalid"));

        let mut index_template = IndexTemplate::for_test("test-template", &["test-index-*"], 0);
        index_template.retention_policy_opt = Some(RetentionPolicy {
            retention_period: "".to_string(),
            evaluation_schedule: "".to_string(),
        });
        let error = index_template.validate().unwrap_err();
        assert!(
            error
                .to_string()
                .contains("failed to parse retention period")
        );
    }
}


================================================
FILE: quickwit/quickwit-config/src/index_template/serialize.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use quickwit_common::uri::Uri;
use serde::{Deserialize, Serialize};

use super::{IndexIdPattern, IndexTemplate, IndexTemplateId};
use crate::index_config::IngestSettings;
use crate::{DocMapping, IndexingSettings, RetentionPolicy, SearchSettings};

#[derive(Clone, Debug, Serialize, Deserialize, utoipa::ToSchema)]
#[serde(tag = "version")]
pub enum VersionedIndexTemplate {
    #[serde(rename = "0.9")]
    #[serde(alias = "0.8")]
    #[serde(alias = "0.7")]
    V0_8(IndexTemplateV0_8),
}

#[derive(Clone, Debug, Serialize, Deserialize, utoipa::ToSchema)]
#[serde(deny_unknown_fields)]
pub struct IndexTemplateV0_8 {
    #[schema(value_type = String)]
    pub template_id: IndexTemplateId,
    /// Glob patterns (e.g., `logs-foo*`) with negation by prepending `-` (e.g `-logs-fool`).
    #[schema(value_type = Vec<String>)]
    pub index_id_patterns: Vec<IndexIdPattern>,
    /// The actual index URI is the concatenation of this with the index id.
    #[schema(value_type = String)]
    #[serde(default)]
    pub index_root_uri: Option<Uri>,
    /// When multiple templates match an index, the one with the highest priority is selected.
    #[serde(default)]
    pub priority: usize,
    #[serde(default)]
    pub description: Option<String>,

    pub doc_mapping: DocMapping,
    #[serde(default)]
    pub indexing_settings: IndexingSettings,
    #[serde(default)]
    pub ingest_settings: IngestSettings,
    #[serde(default)]
    pub search_settings: SearchSettings,
    #[serde(default)]
    pub retention: Option<RetentionPolicy>,
}

impl From<VersionedIndexTemplate> for IndexTemplate {
    fn from(versioned_index_template: VersionedIndexTemplate) -> Self {
        match versioned_index_template {
            VersionedIndexTemplate::V0_8(v0_8) => v0_8.into(),
        }
    }
}

impl From<IndexTemplate> for VersionedIndexTemplate {
    fn from(index_template: IndexTemplate) -> Self {
        VersionedIndexTemplate::V0_8(index_template.into())
    }
}

impl From<IndexTemplateV0_8> for IndexTemplate {
    fn from(index_template_v0_8: IndexTemplateV0_8) -> Self {
        IndexTemplate {
            template_id: index_template_v0_8.template_id,
            index_id_patterns: index_template_v0_8.index_id_patterns,
            index_root_uri: index_template_v0_8.index_root_uri,
            priority: index_template_v0_8.priority,
            description: index_template_v0_8.description,
            doc_mapping: index_template_v0_8.doc_mapping,
            indexing_settings: index_template_v0_8.indexing_settings,
            ingest_settings: index_template_v0_8.ingest_settings,
            search_settings: index_template_v0_8.search_settings,
            retention_policy_opt: index_template_v0_8.retention,
        }
    }
}

impl From<IndexTemplate> for IndexTemplateV0_8 {
    fn from(index_template: IndexTemplate) -> Self {
        IndexTemplateV0_8 {
            template_id: index_template.template_id,
            index_id_patterns: index_template.index_id_patterns,
            index_root_uri: index_template.index_root_uri,
            priority: index_template.priority,
            description: index_template.description,
            doc_mapping: index_template.doc_mapping,
            indexing_settings: index_template.indexing_settings,
            ingest_settings: index_template.ingest_settings,
            search_settings: index_template.search_settings,
            retention: index_template.retention_policy_opt,
        }
    }
}


================================================
FILE: quickwit/quickwit-config/src/lib.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#![deny(clippy::disallowed_methods)]

use std::hash::Hasher;
use std::str::FromStr;

use anyhow::{Context, bail, ensure};
use json_comments::StripComments;
use once_cell::sync::Lazy;
use quickwit_common::get_bool_from_env;
use quickwit_common::net::is_valid_hostname;
use quickwit_common::uri::Uri;
use quickwit_proto::types::NodeIdRef;
use regex::Regex;

mod cluster_config;
mod config_value;
mod index_config;
mod index_template;
pub mod merge_policy_config;
mod metastore_config;
mod node_config;
mod qw_env_vars;
pub(crate) mod serde_utils;
pub mod service;
mod source_config;
mod storage_config;
mod templating;

pub use cluster_config::ClusterConfig;
// We export that one for backward compatibility.
// See #2048
use index_config::serialize::{IndexConfigV0_8, VersionedIndexConfig};
pub use index_config::{
    IndexConfig, IndexingResources, IndexingSettings, IngestSettings, RetentionPolicy,
    SearchSettings, build_doc_mapper, load_index_config_from_user_config, load_index_config_update,
    prepare_doc_mapping_update,
};
pub use quickwit_doc_mapper::DocMapping;
use serde::Serialize;
use serde::de::DeserializeOwned;
use serde_json::Value as JsonValue;
use siphasher::sip::SipHasher;
use source_config::FileSourceParamsForSerde;
pub use source_config::{
    CLI_SOURCE_ID, FileSourceMessageType, FileSourceNotification, FileSourceParams, FileSourceSqs,
    INGEST_API_SOURCE_ID, INGEST_V2_SOURCE_ID, KafkaSourceParams, KinesisSourceParams,
    PubSubSourceParams, PulsarSourceAuth, PulsarSourceParams, RegionOrEndpoint, SourceConfig,
    SourceInputFormat, SourceParams, TransformConfig, VecSourceParams, VoidSourceParams,
    load_source_config_from_user_config, load_source_config_update,
};
use tracing::warn;

use crate::index_template::IndexTemplateV0_8;
pub use crate::index_template::{IndexTemplate, IndexTemplateId, VersionedIndexTemplate};
use crate::merge_policy_config::{
    ConstWriteAmplificationMergePolicyConfig, MergePolicyConfig, StableLogMergePolicyConfig,
};
pub use crate::metastore_config::{
    MetastoreBackend, MetastoreConfig, MetastoreConfigs, PostgresMetastoreConfig,
};
pub use crate::node_config::{
    CacheConfig, CachePolicy, DEFAULT_QW_CONFIG_PATH, GrpcConfig, IndexerConfig, IngestApiConfig,
    JaegerConfig, KeepAliveConfig, LambdaConfig, LambdaDeployConfig, NodeConfig, RestConfig,
    SearcherConfig, SplitCacheLimits, StorageTimeoutPolicy, TlsConfig,
};
use crate::source_config::serialize::{SourceConfigV0_7, SourceConfigV0_8, VersionedSourceConfig};
pub use crate::storage_config::{
    AzureStorageConfig, FileStorageConfig, GoogleCloudStorageConfig, RamStorageConfig,
    S3StorageConfig, StorageBackend, StorageBackendFlavor, StorageConfig, StorageConfigs,
};

/// Returns true if the ingest API v2 is enabled.
pub fn enable_ingest_v2() -> bool {
    static ENABLE_INGEST_V2: Lazy<bool> =
        Lazy::new(|| get_bool_from_env("QW_ENABLE_INGEST_V2", true));
    *ENABLE_INGEST_V2
}

/// Returns true if the ingest API v1 is disabled.
pub fn disable_ingest_v1() -> bool {
    static DISABLE_INGEST_V1: Lazy<bool> =
        Lazy::new(|| get_bool_from_env("QW_DISABLE_INGEST_V1", false));
    *DISABLE_INGEST_V1
}

#[derive(utoipa::OpenApi)]
#[openapi(components(schemas(
    ConstWriteAmplificationMergePolicyConfig,
    DocMapping,
    FileSourceMessageType,
    FileSourceNotification,
    FileSourceParamsForSerde,
    FileSourceSqs,
    IndexConfigV0_8,
    IndexingResources,
    IndexingSettings,
    IndexTemplateV0_8,
    IngestSettings,
    KafkaSourceParams,
    KinesisSourceParams,
    MergePolicyConfig,
    PubSubSourceParams,
    PulsarSourceAuth,
    PulsarSourceParams,
    RegionOrEndpoint,
    RetentionPolicy,
    SearchSettings,
    SourceConfigV0_7,
    SourceConfigV0_8,
    SourceInputFormat,
    SourceParams,
    StableLogMergePolicyConfig,
    TransformConfig,
    VecSourceParams,
    VersionedIndexConfig,
    VersionedIndexTemplate,
    VersionedSourceConfig,
    VoidSourceParams,
)))]
/// Schema used for the OpenAPI generation which are apart of this crate.
pub struct ConfigApiSchemas;

/// Checks whether an identifier conforms to Quickwit naming conventions.
pub fn validate_identifier(label: &str, value: &str) -> anyhow::Result<()> {
    static IDENTIFIER_REGEX: Lazy<Regex> = Lazy::new(|| {
        Regex::new(r"^[a-zA-Z][a-zA-Z0-9-_\.]{2,254}$").expect("regular expression should compile")
    });
    ensure!(
        IDENTIFIER_REGEX.is_match(value),
        "{label} ID `{value}` is invalid: identifiers must match the following regular \
         expression: `^[a-zA-Z][a-zA-Z0-9-_\\.]{{2,254}}$`"
    );
    Ok(())
}

/// Checks whether an index ID pattern conforms to Quickwit conventions.
/// Index ID patterns accept the same characters as identifiers AND accept `*`
/// chars to allow for glob-like patterns.
pub fn validate_index_id_pattern(pattern: &str, allow_negative: bool) -> anyhow::Result<()> {
    static IDENTIFIER_REGEX_WITH_GLOB_PATTERN: Lazy<Regex> = Lazy::new(|| {
        Regex::new(r"^[a-zA-Z\*][a-zA-Z0-9-_\.\*]{0,254}$")
            .expect("regular expression should compile")
    });
    static IDENTIFIER_REGEX_WITH_GLOB_PATTERN_NEGATIVE: Lazy<Regex> = Lazy::new(|| {
        Regex::new(r"^-?[a-zA-Z\*][a-zA-Z0-9-_\.\*]{0,254}$")
            .expect("regular expression should compile")
    });

    let regex = if allow_negative {
        &IDENTIFIER_REGEX_WITH_GLOB_PATTERN_NEGATIVE
    } else {
        &IDENTIFIER_REGEX_WITH_GLOB_PATTERN
    };

    if !regex.is_match(pattern) {
        bail!(
            "index ID pattern `{pattern}` is invalid: patterns must match the following regular \
             expression: `^[a-zA-Z\\*][a-zA-Z0-9-_\\.\\*]{{0,254}}$`"
        );
    }
    // Forbid multiple stars in the pattern to force the user making simpler patterns
    // as multiple stars does not bring any value.
    if pattern.contains("**") {
        bail!(
            "index ID pattern `{pattern}` is invalid: patterns must not contain multiple \
             consecutive `*`"
        );
    }
    // If there is no star in the pattern, we need at least 3 characters.
    if !pattern.contains('*') && pattern.len() < 3 {
        bail!(
            "index ID pattern `{pattern}` is invalid: an index ID must have at least 3 characters"
        );
    }
    Ok(())
}

pub fn validate_node_id(node_id: &NodeIdRef) -> anyhow::Result<()> {
    if !is_valid_hostname(node_id.as_str()) {
        bail!(
            "node identifier `{node_id}` is invalid. node identifiers must be valid short \
             hostnames (see RFC 1123)"
        );
    }
    Ok(())
}

#[derive(Copy, Clone, Debug, Eq, PartialEq)]
pub enum ConfigFormat {
    Json,
    Toml,
    Yaml,
}

impl ConfigFormat {
    pub fn as_str(&self) -> &'static str {
        match self {
            ConfigFormat::Json => "json",
            ConfigFormat::Toml => "toml",
            ConfigFormat::Yaml => "yaml",
        }
    }

    pub fn sniff_from_uri(uri: &Uri) -> anyhow::Result<ConfigFormat> {
        let extension_str: &str = uri.extension().with_context(|| {
            format!(
                "failed to parse config file `{uri}`: file extension is missing. supported file \
                 formats and extensions are JSON (.json), TOML (.toml), and YAML (.yaml or .yml)"
            )
        })?;
        ConfigFormat::from_str(extension_str)
            .with_context(|| format!("failed to identify configuration file format {uri}"))
    }

    pub fn parse<T>(&self, payload: &[u8]) -> anyhow::Result<T>
    where T: DeserializeOwned {
        match self {
            ConfigFormat::Json => {
                let mut json_value: JsonValue =
                    serde_json::from_reader(StripComments::new(payload))?;
                let version_value = json_value.get_mut("version").context("missing version")?;
                if let Some(version_number) = version_value.as_u64() {
                    warn!(version_value=?version_value, "`version` should be a string");
                    *version_value = JsonValue::String(version_number.to_string());
                }
                serde_json::from_value(json_value).context("failed to parse JSON file")
            }
            ConfigFormat::Toml => {
                let payload_str = std::str::from_utf8(payload)
                    .context("configuration file contains invalid UTF-8 characters")?;
                let mut toml_value: toml::Value =
                    toml::from_str(payload_str).context("failed to parse TOML file")?;
                let version_value = toml_value.get_mut("version").context("missing version")?;
                if let Some(version_number) = version_value.as_integer() {
                    warn!(version_value=?version_value, "`version` should be a string");
                    *version_value = toml::Value::String(version_number.to_string());
                    let reserialized = toml::to_string(version_value)
                        .context("failed to reserialize toml config")?;
                    toml::from_str(&reserialized).context("failed to parse TOML file")
                } else {
                    toml::from_str(payload_str).context("failed to parse TOML file")
                }
            }
            ConfigFormat::Yaml => {
                serde_yaml::from_slice(payload).context("failed to parse YAML file")
            }
        }
    }
}

impl FromStr for ConfigFormat {
    type Err = anyhow::Error;

    fn from_str(ext: &str) -> anyhow::Result<Self> {
        match ext {
            "json" => Ok(Self::Json),
            "toml" => Ok(Self::Toml),
            "yaml" | "yml" => Ok(Self::Yaml),
            _ => bail!(
                "file extension `.{ext}` is not supported. supported file formats and extensions \
                 are JSON (.json), TOML (.toml), and YAML (.yaml or .yml)",
            ),
        }
    }
}

pub trait TestableForRegression: Serialize + DeserializeOwned {
    /// Produces an instance of `Self` whose serialization output will be tested against future
    /// versions of the format for backward compatibility.
    fn sample_for_regression() -> Self;

    /// Asserts that `self` and `other` are equal. It must panic if they are not.
    fn assert_equality(&self, other: &Self);
}

/// Returns a fingerprint (a hash) of all the parameters that should force an
/// indexing pipeline to restart upon index or source config updates.
pub fn indexing_pipeline_params_fingerprint(
    index_config: &IndexConfig,
    source_config: &SourceConfig,
) -> u64 {
    let mut hasher = SipHasher::new();
    hasher.write_u64(index_config.indexing_params_fingerprint());
    hasher.write_u64(source_config.indexing_params_fingerprint());
    hasher.finish()
}

#[cfg(test)]
mod tests {
    use super::validate_identifier;
    use crate::validate_index_id_pattern;

    #[test]
    fn test_validate_identifier() {
        validate_identifier("cluster", "").unwrap_err();
        validate_identifier("cluster", "-").unwrap_err();
        validate_identifier("cluster", "_").unwrap_err();
        validate_identifier("cluster", "f").unwrap_err();
        validate_identifier("cluster", "fo").unwrap_err();
        validate_identifier("cluster", "_fo").unwrap_err();
        validate_identifier("cluster", "_foo").unwrap_err();
        validate_identifier("cluster", ".foo.bar").unwrap_err();
        validate_identifier("cluster", "foo").unwrap();
        validate_identifier("cluster", "f-_").unwrap();
        validate_identifier("index", "foo.bar").unwrap();

        assert!(
            validate_identifier("cluster", "foo!")
                .unwrap_err()
                .to_string()
                .contains("cluster ID `foo!` is invalid")
        );
    }

    #[test]
    fn test_validate_index_id_pattern() {
        validate_index_id_pattern("*", false).unwrap();
        validate_index_id_pattern("abc.*", false).unwrap();
        validate_index_id_pattern("ab", false).unwrap_err();
        validate_index_id_pattern("", false).unwrap_err();
        validate_index_id_pattern("**", false).unwrap_err();
        assert!(
            validate_index_id_pattern("foo!", false)
                .unwrap_err()
                .to_string()
                .contains("index ID pattern `foo!` is invalid:")
        );
        validate_index_id_pattern("-abc", true).unwrap();
        validate_index_id_pattern("-abc", false).unwrap_err();
    }
}


================================================
FILE: quickwit/quickwit-config/src/merge_policy_config.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::time::Duration;

use serde::{Deserialize, Deserializer, Serialize, Serializer, de};

fn is_zero(value: &usize) -> bool {
    *value == 0
}

#[derive(Debug, Clone, Serialize, Deserialize, Eq, PartialEq, Hash, utoipa::ToSchema)]
#[serde(deny_unknown_fields)]
pub struct ConstWriteAmplificationMergePolicyConfig {
    /// Number of splits to merge together in a single merge operation.
    #[serde(default = "default_merge_factor")]
    pub merge_factor: usize,
    /// Maximum number of splits that can be merged together in a single merge operation.
    #[serde(default = "default_max_merge_factor")]
    pub max_merge_factor: usize,
    /// Maximum number of merges that a given split should undergo.
    #[serde(default = "default_max_merge_ops")]
    pub max_merge_ops: usize,
    /// Duration relative to `split.created_timestamp` after which a split
    /// becomes mature.
    /// If `now() >= split.created_timestamp + maturation_period` then
    /// the split is considered mature.
    #[schema(value_type = String)]
    #[serde(default = "default_maturation_period")]
    #[serde(deserialize_with = "parse_human_duration")]
    #[serde(serialize_with = "serialize_duration")]
    pub maturation_period: Duration,
    #[serde(default)]
    #[serde(skip_serializing_if = "is_zero")]
    pub max_finalize_merge_operations: usize,
    /// Splits with a number of docs higher than
    /// `max_finalize_split_num_docs` will not be considered
    /// for finalize split merge operations.
    #[serde(default)]
    #[serde(skip_serializing_if = "Option::is_none")]
    pub max_finalize_split_num_docs: Option<usize>,
}

impl Default for ConstWriteAmplificationMergePolicyConfig {
    fn default() -> ConstWriteAmplificationMergePolicyConfig {
        ConstWriteAmplificationMergePolicyConfig {
            max_merge_ops: default_max_merge_ops(),
            merge_factor: default_merge_factor(),
            max_merge_factor: default_max_merge_factor(),
            maturation_period: default_maturation_period(),
            max_finalize_merge_operations: 0,
            max_finalize_split_num_docs: None,
        }
    }
}

#[derive(Clone, Debug, Serialize, Deserialize, Eq, PartialEq, Hash, utoipa::ToSchema)]
#[serde(deny_unknown_fields)]
pub struct StableLogMergePolicyConfig {
    /// Number of docs below which all splits are considered as belonging to the same level.
    #[serde(default = "default_min_level_num_docs")]
    pub min_level_num_docs: usize,
    /// Number of splits to merge together in a single merge operation.
    #[serde(default = "default_merge_factor")]
    pub merge_factor: usize,
    /// Maximum number of splits that can be merged together in a single merge operation.
    #[serde(default = "default_max_merge_factor")]
    pub max_merge_factor: usize,
    /// Duration relative to `split.created_timestamp` after which a split
    /// becomes mature.
    /// If `now() >= split.created_timestamp + maturation_period` then
    /// the split is mature.
    #[schema(value_type = String)]
    #[serde(default = "default_maturation_period")]
    #[serde(deserialize_with = "parse_human_duration")]
    #[serde(serialize_with = "serialize_duration")]
    pub maturation_period: Duration,
}

fn default_merge_factor() -> usize {
    10
}

fn default_max_merge_factor() -> usize {
    12
}

fn default_max_merge_ops() -> usize {
    4
}

fn default_min_level_num_docs() -> usize {
    100_000
}

fn default_maturation_period() -> Duration {
    Duration::from_secs(48 * 3600)
}

impl Default for StableLogMergePolicyConfig {
    fn default() -> Self {
        StableLogMergePolicyConfig {
            min_level_num_docs: default_min_level_num_docs(),
            merge_factor: default_merge_factor(),
            max_merge_factor: default_max_merge_factor(),
            maturation_period: default_maturation_period(),
        }
    }
}

fn parse_human_duration<'de, D>(deserializer: D) -> Result<Duration, D::Error>
where D: Deserializer<'de> {
    let value: String = Deserialize::deserialize(deserializer)?;
    let duration = humantime::parse_duration(&value).map_err(|error| {
        de::Error::custom(format!(
            "failed to parse human-readable duration `{value}`: {error:?}",
        ))
    })?;
    Ok(duration)
}

fn serialize_duration<S>(value: &Duration, s: S) -> Result<S::Ok, S::Error>
where S: Serializer {
    let value_str = humantime::format_duration(*value).to_string();
    s.serialize_str(&value_str)
}

#[derive(Debug, Serialize, Deserialize, Clone, Eq, PartialEq, Hash, utoipa::ToSchema)]
#[serde(tag = "type")]
#[serde(deny_unknown_fields)]
pub enum MergePolicyConfig {
    #[serde(rename = "no_merge")]
    Nop,
    #[serde(rename = "limit_merge")]
    ConstWriteAmplification(ConstWriteAmplificationMergePolicyConfig),
    #[serde(rename = "stable_log")]
    #[serde(alias = "default")]
    StableLog(StableLogMergePolicyConfig),
}

impl Default for MergePolicyConfig {
    fn default() -> Self {
        MergePolicyConfig::StableLog(StableLogMergePolicyConfig::default())
    }
}

impl MergePolicyConfig {
    pub fn noop() -> Self {
        MergePolicyConfig::Nop
    }

    pub fn validate(&self) -> anyhow::Result<()> {
        let (merge_factor, max_merge_factor) = match self {
            MergePolicyConfig::Nop => {
                return Ok(());
            }
            MergePolicyConfig::ConstWriteAmplification(config) => {
                (config.merge_factor, config.max_merge_factor)
            }
            MergePolicyConfig::StableLog(config) => (config.merge_factor, config.max_merge_factor),
        };
        if max_merge_factor < merge_factor {
            anyhow::bail!(
                "index config merge policy `max_merge_factor` must be superior or equal to \
                 `merge_factor`"
            );
        }
        Ok(())
    }
}


================================================
FILE: quickwit/quickwit-config/src/metastore_config.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::num::NonZeroUsize;
use std::ops::Deref;
use std::time::Duration;

use anyhow::{Context, ensure};
use humantime::parse_duration;
use itertools::Itertools;
use serde::{Deserialize, Serialize};
use serde_with::{EnumMap, serde_as};

#[derive(Debug, Clone, Copy, Eq, PartialEq, Ord, PartialOrd, Hash, Serialize, Deserialize)]
#[serde(rename_all = "snake_case")]
pub enum MetastoreBackend {
    File,
    #[serde(alias = "pg", alias = "postgres")]
    PostgreSQL,
}

/// Holds the metastore configurations defined in the `metastore` section of node config files.
///
/// ```yaml
/// metastore:
///   file:
///     polling_interval: 30s
///
///   postgres:
///     max_connections: 12
/// ```
#[serde_as]
#[derive(Debug, Clone, Default, Eq, PartialEq, Serialize, Deserialize)]
pub struct MetastoreConfigs(#[serde_as(as = "EnumMap")] Vec<MetastoreConfig>);

impl MetastoreConfigs {
    pub fn redact(&mut self) {
        for metastore_config in &mut self.0 {
            metastore_config.redact();
        }
    }

    pub fn validate(&self) -> anyhow::Result<()> {
        for metastore_config in &self.0 {
            metastore_config.validate()?;
        }
        let backends: Vec<MetastoreBackend> = self
            .0
            .iter()
            .map(|metastore_config| metastore_config.backend())
            .sorted()
            .collect();

        for (left, right) in backends.iter().zip(backends.iter().skip(1)) {
            ensure!(
                left != right,
                "{left:?} metastore config is defined multiple times"
            );
        }
        Ok(())
    }

    pub fn find_file(&self) -> Option<&FileMetastoreConfig> {
        self.0
            .iter()
            .find_map(|metastore_config| match metastore_config {
                MetastoreConfig::File(file_metastore_config) => Some(file_metastore_config),
                _ => None,
            })
    }

    pub fn find_postgres(&self) -> Option<&PostgresMetastoreConfig> {
        self.0
            .iter()
            .find_map(|metastore_config| match metastore_config {
                MetastoreConfig::PostgreSQL(postgres_metastore_config) => {
                    Some(postgres_metastore_config)
                }
                _ => None,
            })
    }
}

impl Deref for MetastoreConfigs {
    type Target = Vec<MetastoreConfig>;

    fn deref(&self) -> &Self::Target {
        &self.0
    }
}

#[derive(Debug, Clone, Eq, PartialEq, Serialize, Deserialize)]
#[serde(rename_all = "snake_case")]
pub enum MetastoreConfig {
    File(FileMetastoreConfig),
    #[serde(alias = "pg", alias = "postgres")]
    PostgreSQL(PostgresMetastoreConfig),
}

impl MetastoreConfig {
    pub fn backend(&self) -> MetastoreBackend {
        match self {
            Self::File(_) => MetastoreBackend::File,
            Self::PostgreSQL(_) => MetastoreBackend::PostgreSQL,
        }
    }

    pub fn as_file(&self) -> Option<&FileMetastoreConfig> {
        match self {
            Self::File(file_metastore_config) => Some(file_metastore_config),
            _ => None,
        }
    }

    pub fn as_postgres(&self) -> Option<&PostgresMetastoreConfig> {
        match self {
            Self::PostgreSQL(postgres_metastore_config) => Some(postgres_metastore_config),
            _ => None,
        }
    }

    pub fn redact(&mut self) {
        // TODO: Implement this method when we end up storing secrets in the
        // metastore config.
    }

    pub fn validate(&self) -> anyhow::Result<()> {
        match self {
            Self::File(file_metastore_config) => file_metastore_config.validate()?,
            Self::PostgreSQL(postgres_metastore_config) => postgres_metastore_config.validate()?,
        }
        Ok(())
    }
}

impl From<FileMetastoreConfig> for MetastoreConfig {
    fn from(file_metastore_config: FileMetastoreConfig) -> Self {
        Self::File(file_metastore_config)
    }
}

impl From<PostgresMetastoreConfig> for MetastoreConfig {
    fn from(postgres_metastore_config: PostgresMetastoreConfig) -> Self {
        Self::PostgreSQL(postgres_metastore_config)
    }
}

#[derive(Debug, Clone, Eq, PartialEq, Serialize, Deserialize)]
#[serde(deny_unknown_fields)]
pub struct PostgresMetastoreConfig {
    #[serde(default = "PostgresMetastoreConfig::default_min_connections")]
    pub min_connections: usize,
    #[serde(
        alias = "max_num_connections",
        default = "PostgresMetastoreConfig::default_max_connections"
    )]
    pub max_connections: NonZeroUsize,
    #[serde(default = "PostgresMetastoreConfig::default_acquire_connection_timeout")]
    pub acquire_connection_timeout: String,
    #[serde(default = "PostgresMetastoreConfig::default_idle_connection_timeout")]
    pub idle_connection_timeout: String,
    #[serde(default = "PostgresMetastoreConfig::default_max_connection_lifetime")]
    pub max_connection_lifetime: String,
}

impl Default for PostgresMetastoreConfig {
    fn default() -> Self {
        Self {
            min_connections: Self::default_min_connections(),
            max_connections: Self::default_max_connections(),
            acquire_connection_timeout: Self::default_acquire_connection_timeout(),
            idle_connection_timeout: Self::default_idle_connection_timeout(),
            max_connection_lifetime: Self::default_max_connection_lifetime(),
        }
    }
}

impl PostgresMetastoreConfig {
    pub fn default_min_connections() -> usize {
        0
    }

    pub fn default_max_connections() -> NonZeroUsize {
        NonZeroUsize::new(10).unwrap()
    }

    pub fn default_acquire_connection_timeout() -> String {
        "10s".to_string()
    }

    pub fn default_idle_connection_timeout() -> String {
        "10min".to_string()
    }

    pub fn default_max_connection_lifetime() -> String {
        "30min".to_string()
    }

    pub fn acquire_connection_timeout(&self) -> anyhow::Result<Duration> {
        parse_duration(&self.acquire_connection_timeout).with_context(|| {
            format!(
                "failed to parse `acquire_connection_timeout` value `{}`",
                self.acquire_connection_timeout
            )
        })
    }

    pub fn idle_connection_timeout_opt(&self) -> anyhow::Result<Option<Duration>> {
        if self.idle_connection_timeout.is_empty() || self.idle_connection_timeout == "0" {
            return Ok(None);
        }
        let idle_connection_timeout =
            parse_duration(&self.idle_connection_timeout).with_context(|| {
                format!(
                    "failed to parse `idle_connection_timeout` value `{}`",
                    self.idle_connection_timeout
                )
            })?;
        if idle_connection_timeout.is_zero() {
            Ok(None)
        } else {
            Ok(Some(idle_connection_timeout))
        }
    }

    pub fn max_connection_lifetime_opt(&self) -> anyhow::Result<Option<Duration>> {
        if self.max_connection_lifetime.is_empty() || self.max_connection_lifetime == "0" {
            return Ok(None);
        }
        let max_connection_lifetime =
            parse_duration(&self.max_connection_lifetime).with_context(|| {
                format!(
                    "failed to parse `max_connection_lifetime` value `{}`",
                    self.max_connection_lifetime
                )
            })?;
        if max_connection_lifetime.is_zero() {
            Ok(None)
        } else {
            Ok(Some(max_connection_lifetime))
        }
    }

    pub fn validate(&self) -> anyhow::Result<()> {
        ensure!(
            self.min_connections <= self.max_connections.get(),
            "`min_connections` must be less than or equal to `max_connections`"
        );
        self.acquire_connection_timeout()?;
        self.idle_connection_timeout_opt()?;
        self.max_connection_lifetime_opt()?;
        Ok(())
    }
}

#[derive(Debug, Clone, Default, Eq, PartialEq, Serialize, Deserialize)]
#[serde(deny_unknown_fields)]
pub struct FileMetastoreConfig;

impl FileMetastoreConfig {
    pub fn validate(&self) -> anyhow::Result<()> {
        Ok(())
    }
}

#[cfg(test)]
mod tests {
    use super::*;

    #[test]
    fn test_metastore_configs_serde() {
        let metastore_configs_yaml = "";
        let metastore_configs: MetastoreConfigs =
            serde_yaml::from_str(metastore_configs_yaml).unwrap();
        assert!(metastore_configs.is_empty());

        let metastore_configs_yaml = r#"
                postgres:
                    max_connections: 12
            "#;
        let metastore_configs: MetastoreConfigs =
            serde_yaml::from_str(metastore_configs_yaml).unwrap();

        let expected_metastore_configs = MetastoreConfigs(vec![
            PostgresMetastoreConfig {
                max_connections: NonZeroUsize::new(12).unwrap(),
                ..Default::default()
            }
            .into(),
        ]);
        assert_eq!(metastore_configs, expected_metastore_configs);
    }

    #[test]
    fn test_metastore_configs_validate() {
        let metastore_configs = MetastoreConfigs(vec![
            PostgresMetastoreConfig {
                max_connections: NonZeroUsize::new(12).unwrap(),
                ..Default::default()
            }
            .into(),
            PostgresMetastoreConfig {
                max_connections: NonZeroUsize::new(12).unwrap(),
                ..Default::default()
            }
            .into(),
        ]);
        let error = metastore_configs.validate().unwrap_err();
        assert!(error.to_string().contains("defined multiple times"));

        let metastore_configs = MetastoreConfigs(vec![
            PostgresMetastoreConfig {
                acquire_connection_timeout: "15".to_string(),
                ..Default::default()
            }
            .into(),
        ]);
        let error = metastore_configs.validate().unwrap_err();
        assert!(error.to_string().contains("`acquire_connection_timeout`"));
    }

    #[test]
    fn test_pg_metastore_config_serde() {
        {
            let pg_metastore_config_yaml = "";
            let pg_metastore_config: PostgresMetastoreConfig =
                serde_yaml::from_str(pg_metastore_config_yaml).unwrap();
            assert_eq!(pg_metastore_config, PostgresMetastoreConfig::default());
        }
        {
            let pg_metastore_config_yaml = r#"
                max_connections: 12
            "#;
            let pg_metastore_config: PostgresMetastoreConfig =
                serde_yaml::from_str(pg_metastore_config_yaml).unwrap();

            let expected_pg_metastore_config = PostgresMetastoreConfig {
                max_connections: NonZeroUsize::new(12).unwrap(),
                ..Default::default()
            };
            assert_eq!(pg_metastore_config, expected_pg_metastore_config);
        }
        {
            let pg_metastore_config_yaml = r#"
                min_connections: 6
                max_connections: 12
                acquire_connection_timeout: 500ms
                idle_connection_timeout: 1h
                max_connection_lifetime: 1d
            "#;
            let pg_metastore_config: PostgresMetastoreConfig =
                serde_yaml::from_str(pg_metastore_config_yaml).unwrap();

            let expected_pg_metastore_config = PostgresMetastoreConfig {
                min_connections: 6,
                max_connections: NonZeroUsize::new(12).unwrap(),
                acquire_connection_timeout: "500ms".to_string(),
                idle_connection_timeout: "1h".to_string(),
                max_connection_lifetime: "1d".to_string(),
            };
            assert_eq!(pg_metastore_config, expected_pg_metastore_config);
            assert_eq!(
                pg_metastore_config.acquire_connection_timeout().unwrap(),
                Duration::from_millis(500)
            );
            assert_eq!(
                pg_metastore_config.idle_connection_timeout_opt().unwrap(),
                Some(Duration::from_secs(3600))
            );
            assert_eq!(
                pg_metastore_config.max_connection_lifetime_opt().unwrap(),
                Some(Duration::from_secs(24 * 3600))
            );
        }
        {
            let pg_metastore_config_yaml = r#"
                min_connections: 6
                max_connections: 12
                acquire_connection_timeout: 15s
                idle_connection_timeout: ""
                max_connection_lifetime: 0
            "#;
            let pg_metastore_config: PostgresMetastoreConfig =
                serde_yaml::from_str(pg_metastore_config_yaml).unwrap();

            let expected_pg_metastore_config = PostgresMetastoreConfig {
                min_connections: 6,
                max_connections: NonZeroUsize::new(12).unwrap(),
                acquire_connection_timeout: "15s".to_string(),
                idle_connection_timeout: "".to_string(),
                max_connection_lifetime: "0".to_string(),
            };
            assert_eq!(pg_metastore_config, expected_pg_metastore_config);
            assert_eq!(
                pg_metastore_config.acquire_connection_timeout().unwrap(),
                Duration::from_secs(15)
            );
            assert!(
                pg_metastore_config
                    .idle_connection_timeout_opt()
                    .unwrap()
                    .is_none()
            );
            assert!(
                pg_metastore_config
                    .max_connection_lifetime_opt()
                    .unwrap()
                    .is_none(),
            );
        }
    }
}


================================================
FILE: quickwit/quickwit-config/src/node_config/mod.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

mod serialize;

use std::collections::{HashMap, HashSet};
use std::env;
use std::net::SocketAddr;
use std::num::{NonZeroU32, NonZeroU64, NonZeroUsize};
use std::path::PathBuf;
use std::time::Duration;

use anyhow::{bail, ensure};
use bytesize::ByteSize;
use http::HeaderMap;
use quickwit_common::net::HostAddr;
use quickwit_common::shared_consts::{
    DEFAULT_SHARD_BURST_LIMIT, DEFAULT_SHARD_SCALE_UP_FACTOR, DEFAULT_SHARD_THROUGHPUT_LIMIT,
};
use quickwit_common::uri::Uri;
use quickwit_proto::indexing::CpuCapacity;
use quickwit_proto::tonic::codec::CompressionEncoding;
use quickwit_proto::types::NodeId;
use serde::{Deserialize, Deserializer, Serialize};
use tracing::{info, warn};

use crate::node_config::serialize::load_node_config_with_env;
use crate::serde_utils::DurationAsStr;
use crate::service::QuickwitService;
use crate::storage_config::StorageConfigs;
use crate::{ConfigFormat, MetastoreConfigs};

pub const DEFAULT_QW_CONFIG_PATH: &str = "config/quickwit.yaml";

#[derive(Clone, Debug, PartialEq, Serialize, Deserialize)]
#[serde(deny_unknown_fields)]
pub struct RestConfig {
    pub listen_addr: SocketAddr,
    pub cors_allow_origins: Vec<String>,
    #[serde(with = "http_serde::header_map")]
    pub extra_headers: HeaderMap,
    #[serde(default)]
    pub tls: Option<TlsConfig>,
}

#[derive(Clone, Debug, PartialEq, Serialize, Deserialize)]
#[serde(deny_unknown_fields)]
pub struct GrpcConfig {
    #[serde(default = "GrpcConfig::default_max_message_size")]
    pub max_message_size: ByteSize,
    #[serde(default)]
    pub tls: Option<TlsConfig>,
    // If set, keeps idle connection alive by periodically perform a
    // keep alive ping request.
    #[serde(default, skip_serializing_if = "Option::is_none")]
    pub keep_alive: Option<KeepAliveConfig>,
}

fn default_http2_keep_alive_interval() -> DurationAsStr {
    DurationAsStr::try_from("10s".to_string()).unwrap()
}

fn default_keep_alive_timeout() -> DurationAsStr {
    DurationAsStr::try_from("5s".to_string()).unwrap()
}

#[derive(Clone, Debug, PartialEq, Serialize, Deserialize)]
pub struct KeepAliveConfig {
    // Set the HTTP/2 KEEP_ALIVE_INTERVAL. This is the time the connection
    // should be idle before sending a keepalive ping.
    #[serde(default = "default_http2_keep_alive_interval")]
    pub interval: DurationAsStr,

    // Set the HTTP/2 KEEP_ALIVE_TIMEOUT. This is the time to wait for an ACK
    // after sending a keepalive ping. If the server doesn't respond within
    // this time, the connection might be considered dead.
    // Tonic uses hyper's default (20 seconds) if not set.
    #[serde(default = "default_keep_alive_timeout")]
    pub timeout: DurationAsStr,
}

impl From<KeepAliveConfig> for quickwit_common::tower::KeepAliveConfig {
    fn from(val: KeepAliveConfig) -> Self {
        quickwit_common::tower::KeepAliveConfig {
            interval: *val.interval,
            timeout: *val.timeout,
        }
    }
}

impl GrpcConfig {
    fn default_max_message_size() -> ByteSize {
        ByteSize::mib(20)
    }

    pub fn validate(&self) -> anyhow::Result<()> {
        ensure!(
            self.max_message_size >= ByteSize::mb(1),
            "max gRPC message size (`grpc.max_message_size`) must be at least 1MB, got `{}`",
            self.max_message_size
        );
        Ok(())
    }
}

impl Default for GrpcConfig {
    fn default() -> Self {
        Self {
            max_message_size: Self::default_max_message_size(),
            tls: None,
            keep_alive: None,
        }
    }
}

#[derive(Clone, Debug, PartialEq, Serialize, Deserialize)]
#[serde(deny_unknown_fields)]
pub struct TlsConfig {
    pub cert_path: String,
    pub key_path: String,
    #[serde(default)]
    pub ca_path: String,
    #[serde(default)]
    pub expected_name: Option<String>,
    #[serde(default)]
    pub validate_client: bool,
}

#[derive(Clone, Debug, Eq, PartialEq, Serialize, Deserialize)]
#[serde(deny_unknown_fields)]
pub struct IndexerConfig {
    #[serde(default = "IndexerConfig::default_split_store_max_num_bytes")]
    pub split_store_max_num_bytes: ByteSize,
    #[serde(default = "IndexerConfig::default_split_store_max_num_splits")]
    pub split_store_max_num_splits: usize,
    #[serde(default = "IndexerConfig::default_max_concurrent_split_uploads")]
    pub max_concurrent_split_uploads: usize,
    /// Limits the IO throughput of the `SplitDownloader` and the `MergeExecutor`.
    /// On hardware where IO is constrained, it makes sure that Merges (a batch operation)
    /// does not starve indexing itself (as it is a latency sensitive operation).
    #[serde(default)]
    pub max_merge_write_throughput: Option<ByteSize>,
    /// Maximum number of merge or delete operation that can be executed concurrently.
    /// (defaults to num_cpu / 2).
    #[serde(default = "IndexerConfig::default_merge_concurrency")]
    pub merge_concurrency: NonZeroUsize,
    /// Enables the OpenTelemetry exporter endpoint to ingest logs and traces via the OpenTelemetry
    /// Protocol (OTLP).
    #[serde(default = "IndexerConfig::default_enable_otlp_endpoint")]
    pub enable_otlp_endpoint: bool,
    #[serde(default = "IndexerConfig::default_enable_cooperative_indexing")]
    pub enable_cooperative_indexing: bool,
    #[serde(default = "IndexerConfig::default_cpu_capacity")]
    pub cpu_capacity: CpuCapacity,
}

impl IndexerConfig {
    fn default_enable_cooperative_indexing() -> bool {
        false
    }

    fn default_enable_otlp_endpoint() -> bool {
        #[cfg(any(test, feature = "testsuite"))]
        {
            false
        }
        #[cfg(not(any(test, feature = "testsuite")))]
        {
            quickwit_common::get_bool_from_env("QW_ENABLE_OTLP_ENDPOINT", true)
        }
    }

    fn default_max_concurrent_split_uploads() -> usize {
        12
    }

    pub fn default_split_store_max_num_bytes() -> ByteSize {
        ByteSize::gib(100)
    }

    pub fn default_split_store_max_num_splits() -> usize {
        1_000
    }

    pub fn default_merge_concurrency() -> NonZeroUsize {
        NonZeroUsize::new(quickwit_common::num_cpus() * 2 / 3).unwrap_or(NonZeroUsize::MIN)
    }

    fn default_cpu_capacity() -> CpuCapacity {
        CpuCapacity::one_cpu_thread() * (quickwit_common::num_cpus() as u32)
    }

    #[cfg(any(test, feature = "testsuite"))]
    pub fn for_test() -> anyhow::Result<Self> {
        use quickwit_proto::indexing::PIPELINE_FULL_CAPACITY;
        let indexer_config = IndexerConfig {
            enable_cooperative_indexing: false,
            enable_otlp_endpoint: true,
            split_store_max_num_bytes: ByteSize::mb(1),
            split_store_max_num_splits: 3,
            max_concurrent_split_uploads: 4,
            cpu_capacity: PIPELINE_FULL_CAPACITY * 4u32,
            max_merge_write_throughput: None,
            merge_concurrency: NonZeroUsize::new(3).unwrap(),
        };
        Ok(indexer_config)
    }
}

impl Default for IndexerConfig {
    fn default() -> Self {
        Self {
            enable_cooperative_indexing: Self::default_enable_cooperative_indexing(),
            enable_otlp_endpoint: Self::default_enable_otlp_endpoint(),
            split_store_max_num_bytes: Self::default_split_store_max_num_bytes(),
            split_store_max_num_splits: Self::default_split_store_max_num_splits(),
            max_concurrent_split_uploads: Self::default_max_concurrent_split_uploads(),
            cpu_capacity: Self::default_cpu_capacity(),
            merge_concurrency: Self::default_merge_concurrency(),
            max_merge_write_throughput: None,
        }
    }
}

#[derive(Debug, Clone, Copy, PartialEq, Serialize, Deserialize)]
#[serde(deny_unknown_fields)]
pub struct SplitCacheLimits {
    pub max_num_bytes: ByteSize,
    #[serde(default = "SplitCacheLimits::default_max_num_splits")]
    pub max_num_splits: NonZeroU32,
    #[serde(default = "SplitCacheLimits::default_num_concurrent_downloads")]
    pub num_concurrent_downloads: NonZeroU32,
    #[serde(default = "SplitCacheLimits::default_max_file_descriptors")]
    pub max_file_descriptors: NonZeroU32,
}

impl SplitCacheLimits {
    fn default_max_num_splits() -> NonZeroU32 {
        NonZeroU32::new(10_000).unwrap()
    }

    fn default_num_concurrent_downloads() -> NonZeroU32 {
        NonZeroU32::new(1).unwrap()
    }

    fn default_max_file_descriptors() -> NonZeroU32 {
        NonZeroU32::new(100).unwrap()
    }
}

#[derive(Clone, Debug, PartialEq, Serialize, Deserialize)]
#[serde(deny_unknown_fields, default)]
pub struct SearcherConfig {
    pub aggregation_memory_limit: ByteSize,
    pub aggregation_bucket_limit: u32,

    #[serde(alias = "fast_field_cache_capacity")]
    #[serde(
        deserialize_with = "CacheConfig::deserialize_with_default::<_, {ByteSize::gb(1).as_u64()}>"
    )]
    pub fast_field_cache: CacheConfig,
    #[serde(alias = "split_footer_cache_capacity")]
    #[serde(deserialize_with = "CacheConfig::deserialize_with_default::<_, \
                                {ByteSize::mb(500).as_u64()}>")]
    pub split_footer_cache: CacheConfig,
    #[serde(alias = "partial_request_cache_capacity")]
    #[serde(deserialize_with = "CacheConfig::deserialize_with_default::<_, \
                                {ByteSize::mb(64).as_u64()}>")]
    pub partial_request_cache: CacheConfig,
    #[serde(alias = "predicate_cache_capacity")]
    #[serde(deserialize_with = "CacheConfig::deserialize_with_default::<_, \
                                {ByteSize::mb(256).as_u64()}>")]
    pub predicate_cache: CacheConfig,

    pub max_num_concurrent_split_searches: usize,
    pub max_splits_per_search: Option<usize>,
    // Deprecated: stream search requests are no longer supported.
    #[serde(alias = "max_num_concurrent_split_streams", default, skip_serializing)]
    pub _max_num_concurrent_split_streams: Option<serde::de::IgnoredAny>,
    // Strangely, if None, this will also have the effect of not forwarding
    // to searcher.
    // TODO document and fix if necessary.
    #[serde(default, skip_serializing_if = "Option::is_none")]
    pub split_cache: Option<SplitCacheLimits>,
    #[serde(default = "SearcherConfig::default_request_timeout_secs")]
    request_timeout_secs: NonZeroU64,
    #[serde(default)]
    #[serde(skip_serializing_if = "Option::is_none")]
    pub storage_timeout_policy: Option<StorageTimeoutPolicy>,
    pub warmup_memory_budget: ByteSize,
    pub warmup_single_split_initial_allocation: ByteSize,
    /// Lambda configuration for serverless leaf search execution.
    /// If set, enables Lambda execution for leaf search.
    ///
    /// If set, and Quickwit cannot access the Lambda (after a deploy attempt if
    /// auto deploy is set up), Quickwit will log an error and
    /// fail on startup.
    #[serde(default)]
    pub lambda: Option<LambdaConfig>,
}

/// Configuration for AWS Lambda leaf search execution.
#[derive(Clone, Debug, PartialEq, Serialize, Deserialize)]
#[serde(deny_unknown_fields)]
pub struct LambdaConfig {
    /// AWS Lambda function name.
    #[serde(default = "LambdaConfig::default_function_name")]
    pub function_name: String,
    /// Maximum number of splits per Lambda invocation.
    #[serde(default = "LambdaConfig::default_max_splits_per_invocation")]
    pub max_splits_per_invocation: NonZeroUsize,
    /// Maximum number of splits to process locally before offloading to Lambda.
    /// When the number of pending split searches exceeds this threshold,
    /// new splits are offloaded to Lambda instead of being queued locally.
    /// A value of 0 offloads everything to Lambda.
    #[serde(default = "LambdaConfig::default_offload_threshold")]
    pub offload_threshold: usize,
    /// Auto-deploy configuration. If set, Quickwit will automatically deploy
    /// the Lambda function at startup.
    /// If deploying a lambda fails, Quickwit will log an error and fail.
    #[serde(default)]
    pub auto_deploy: Option<LambdaDeployConfig>,
}

impl LambdaConfig {
    #[cfg(feature = "testsuite")]
    pub fn for_test() -> Self {
        Self {
            function_name: Self::default_function_name(),
            max_splits_per_invocation: Self::default_max_splits_per_invocation(),
            offload_threshold: Self::default_offload_threshold(),
            auto_deploy: None,
        }
    }

    fn default_function_name() -> String {
        "quickwit-lambda-search".to_string()
    }
    fn default_max_splits_per_invocation() -> NonZeroUsize {
        NonZeroUsize::new(10).unwrap()
    }
    fn default_offload_threshold() -> usize {
        100
    }
}

/// Configuration for automatic Lambda function deployment.
#[derive(Clone, Debug, PartialEq, Serialize, Deserialize)]
#[serde(deny_unknown_fields)]
pub struct LambdaDeployConfig {
    /// IAM execution role ARN for the Lambda function.
    /// The role only requires GetObject permission to the targeted S3 bucket.
    pub execution_role_arn: String,
    /// Memory size for the Lambda function.
    /// It will be rounded up to the nearest multiple of 1MiB.
    #[serde(default = "LambdaDeployConfig::default_memory_size")]
    pub memory_size: ByteSize,
    /// Timeout for Lambda invocations in seconds.
    #[serde(default = "LambdaDeployConfig::default_invocation_timeout_secs")]
    pub invocation_timeout_secs: u64,
}

impl LambdaDeployConfig {
    fn default_memory_size() -> ByteSize {
        // Empirically this implies between 4 and 6 vCPUs.
        ByteSize::gib(5)
    }
    fn default_invocation_timeout_secs() -> u64 {
        15
    }
}

#[derive(Clone, Debug, PartialEq, Eq, Hash, Serialize, Deserialize)]
#[serde(deny_unknown_fields)]
pub struct CacheConfig {
    #[serde(default)]
    capacity: Option<ByteSize>,
    #[serde(default)]
    policy: Option<CachePolicy>,

    // Cache configs inside the virtual cache aren't allowed to contain virtual cache
    #[serde(default)]
    pub virtual_caches: Vec<CacheConfig>,
}

impl CacheConfig {
    pub fn no_cache() -> Self {
        CacheConfig {
            capacity: None,
            policy: None,
            virtual_caches: Vec::new(),
        }
    }

    pub fn default_with_capacity(capacity: ByteSize) -> Self {
        CacheConfig {
            capacity: Some(capacity),
            policy: None,
            virtual_caches: Vec::new(),
        }
    }

    pub fn capacity(&self) -> ByteSize {
        // this should always be there
        self.capacity.unwrap_or_default()
    }

    pub fn capacity_for_virtual_cache(&mut self, real_capacity: ByteSize) -> ByteSize {
        let capacity = self.capacity.unwrap_or(real_capacity);
        self.capacity = Some(capacity);
        capacity
    }

    pub fn policy(&self) -> CachePolicy {
        self.policy.unwrap_or_default()
    }

    pub fn policy_for_virtual_cache(&mut self, real_policy: CachePolicy) -> CachePolicy {
        let policy = self.policy.unwrap_or(real_policy);
        self.policy = Some(policy);
        policy
    }

    fn deserialize_with_default<'de, D, const DEFAULT_CAPACITY: u64>(
        deserializer: D,
    ) -> Result<CacheConfig, D::Error>
    where D: Deserializer<'de> {
        use serde_with::{DeserializeAs, FromInto, PickFirst, Same};

        let mut cache_config: CacheConfig =
            PickFirst::<(Same, FromInto<ByteSize>)>::deserialize_as(deserializer)?;
        if cache_config.capacity.is_none() {
            cache_config.capacity = Some(ByteSize::b(DEFAULT_CAPACITY));
        }
        Ok(cache_config)
    }
}

impl From<ByteSize> for CacheConfig {
    fn from(capacity: ByteSize) -> Self {
        CacheConfig::default_with_capacity(capacity)
    }
}

#[derive(Clone, Copy, Debug, PartialEq, Eq, Hash, Serialize, Deserialize, Default)]
#[serde(rename_all = "kebab-case")]
pub enum CachePolicy {
    #[default]
    Lru,
    S3Fifo,
    TinyLfu,
}

impl std::fmt::Display for CachePolicy {
    fn fmt(&self, f: &mut std::fmt::Formatter) -> std::fmt::Result {
        match self {
            CachePolicy::Lru => f.write_str("lru"),
            CachePolicy::S3Fifo => f.write_str("s3-fifo"),
            CachePolicy::TinyLfu => f.write_str("tiny-lfu"),
        }
    }
}

/// Configuration controlling how fast a searcher should timeout a `get_slice`
/// request to retry it.
///
/// [Amazon's best practise](https://docs.aws.amazon.com/whitepapers/latest/s3-optimizing-performance-best-practices/timeouts-and-retries-for-latency-sensitive-applications.html)
/// suggests that to ensure low latency, it is best to:
/// - retry small GET request after 2s
/// - retry large GET request when the throughput is below some percentile.
///
/// This policy is inspired by this guidance. It does not track instanteneous throughput, but
/// computes an overall timeout using the following formula:
/// `timeout_offset + num_bytes_get_request / min_throughtput`
#[derive(Clone, Debug, PartialEq, Serialize, Deserialize)]
pub struct StorageTimeoutPolicy {
    pub min_throughtput_bytes_per_secs: u64,
    pub timeout_millis: u64,
    // Disclaimer: this is a number of retry, so the overall max number of
    // attempts is `max_num_retries + 1``.
    pub max_num_retries: usize,
}

impl StorageTimeoutPolicy {
    pub fn compute_timeout(&self, num_bytes: usize) -> impl Iterator<Item = Duration> {
        let min_download_time_secs: f64 = if self.min_throughtput_bytes_per_secs == 0 {
            0.0f64
        } else {
            num_bytes as f64 / self.min_throughtput_bytes_per_secs as f64
        };
        let timeout = Duration::from_millis(self.timeout_millis)
            + Duration::from_secs_f64(min_download_time_secs);
        std::iter::repeat_n(timeout, self.max_num_retries + 1)
    }
}

impl Default for SearcherConfig {
    fn default() -> Self {
        SearcherConfig {
            fast_field_cache: CacheConfig::default_with_capacity(ByteSize::gb(1)),
            split_footer_cache: CacheConfig::default_with_capacity(ByteSize::mb(500)),
            partial_request_cache: CacheConfig::default_with_capacity(ByteSize::mb(64)),
            predicate_cache: CacheConfig::default_with_capacity(ByteSize::mb(256)),
            max_num_concurrent_split_searches: 100,
            max_splits_per_search: None,
            _max_num_concurrent_split_streams: None,
            aggregation_memory_limit: ByteSize::mb(500),
            aggregation_bucket_limit: 65000,
            split_cache: None,
            request_timeout_secs: Self::default_request_timeout_secs(),
            storage_timeout_policy: None,
            warmup_memory_budget: ByteSize::gb(100),
            warmup_single_split_initial_allocation: ByteSize::gb(1),
            lambda: None,
        }
    }
}

impl SearcherConfig {
    /// The timeout after which a search should be cancelled
    pub fn request_timeout(&self) -> Duration {
        Duration::from_secs(self.request_timeout_secs.get())
    }
    fn default_request_timeout_secs() -> NonZeroU64 {
        NonZeroU64::new(30).unwrap()
    }
    fn validate(&self) -> anyhow::Result<()> {
        if let Some(split_cache_limits) = self.split_cache {
            if self.max_num_concurrent_split_searches
                > split_cache_limits.max_file_descriptors.get() as usize
            {
                anyhow::bail!(
                    "max_num_concurrent_split_searches ({}) must be lower or equal to \
                     split_cache.max_file_descriptors ({})",
                    self.max_num_concurrent_split_searches,
                    split_cache_limits.max_file_descriptors
                );
            }
            if self.warmup_single_split_initial_allocation > self.warmup_memory_budget {
                anyhow::bail!(
                    "warmup_single_split_initial_allocation ({}) must be lower or equal to \
                     warmup_memory_budget ({})",
                    self.warmup_single_split_initial_allocation,
                    self.warmup_memory_budget
                );
            }
        }
        Ok(())
    }
}

#[derive(Clone, Debug, PartialEq, Serialize, Deserialize)]
#[serde(rename_all = "lowercase")]
pub enum CompressionAlgorithm {
    Gzip,
    Zstd,
}

#[derive(Clone, Debug, PartialEq, Serialize, Deserialize)]
#[serde(deny_unknown_fields, default)]
pub struct IngestApiConfig {
    /// Maximum memory space taken by the ingest WAL
    pub max_queue_memory_usage: ByteSize,
    /// Maximum disk space taken by the ingest WAL
    pub max_queue_disk_usage: ByteSize,
    replication_factor: usize,
    pub content_length_limit: ByteSize,
    /// (hidden) Targeted throughput for each shard
    pub shard_throughput_limit: ByteSize,
    /// (hidden) Maximum accumulated throughput capacity for underutilized
    /// shards, allowing the throughput limit to be temporarily exceeded
    pub shard_burst_limit: ByteSize,
    /// (hidden) new_shard_count = ceil(old_shard_count * shard_scale_up_factor)
    ///
    /// Setting this too high will be cancelled out by the arbiter that prevents
    /// creating too many shards at once.
    pub shard_scale_up_factor: f32,
    #[serde(default)]
    pub grpc_compression_algorithm: Option<CompressionAlgorithm>,
}

impl Default for IngestApiConfig {
    fn default() -> Self {
        Self {
            max_queue_memory_usage: ByteSize::gib(2),
            max_queue_disk_usage: ByteSize::gib(4),
            replication_factor: 1,
            content_length_limit: ByteSize::mib(10),
            shard_throughput_limit: DEFAULT_SHARD_THROUGHPUT_LIMIT,
            shard_burst_limit: DEFAULT_SHARD_BURST_LIMIT,
            shard_scale_up_factor: DEFAULT_SHARD_SCALE_UP_FACTOR,
            grpc_compression_algorithm: None,
        }
    }
}

impl IngestApiConfig {
    /// Returns the replication factor, as defined in environment variable or in the configuration
    /// in that order (the environment variable can overrides the configuration).
    pub fn replication_factor(&self) -> anyhow::Result<NonZeroUsize> {
        if let Ok(replication_factor_str) = env::var("QW_INGEST_REPLICATION_FACTOR") {
            let replication_factor = match replication_factor_str.trim() {
                "1" => 1,
                "2" => 2,
                _ => bail!(
                    "replication factor must be either 1 or 2, got `{replication_factor_str}`"
                ),
            };
            return Ok(NonZeroUsize::new(replication_factor)
                .expect("replication factor should be either 1 or 2"));
        }
        ensure!(
            self.replication_factor >= 1 && self.replication_factor <= 2,
            "replication factor must be either 1 or 2, got `{}`",
            self.replication_factor
        );
        Ok(NonZeroUsize::new(self.replication_factor)
            .expect("replication factor should be either 1 or 2"))
    }

    pub fn grpc_compression_encoding(&self) -> Option<CompressionEncoding> {
        self.grpc_compression_algorithm
            .as_ref()
            .map(|algorithm| match algorithm {
                CompressionAlgorithm::Gzip => CompressionEncoding::Gzip,
                CompressionAlgorithm::Zstd => CompressionEncoding::Zstd,
            })
    }

    fn validate(&self) -> anyhow::Result<()> {
        self.replication_factor()?;
        ensure!(
            self.max_queue_disk_usage > ByteSize::mib(256),
            "max_queue_disk_usage must be at least 256 MiB, got `{}`",
            self.max_queue_disk_usage.display().si()
        );
        ensure!(
            self.max_queue_disk_usage >= self.max_queue_memory_usage,
            "max_queue_disk_usage ({}) must be at least max_queue_memory_usage ({})",
            self.max_queue_disk_usage.display().si(),
            self.max_queue_memory_usage.display().si()
        );
        info!(
            "ingestion shard throughput limit: {}",
            self.shard_throughput_limit.display().si()
        );
        ensure!(
            self.shard_throughput_limit >= ByteSize::mib(1)
                && self.shard_throughput_limit <= ByteSize::mib(20),
            "shard_throughput_limit ({}) must be within 1mb and 20mb",
            self.shard_throughput_limit.display().si()
        );
        // The newline delimited format is persisted as something a bit larger
        // (lines prefixed with their length)
        let estimated_persist_size = ByteSize::b(3 * self.content_length_limit.as_u64() / 2);
        ensure!(
            self.shard_burst_limit >= estimated_persist_size,
            "shard_burst_limit ({}) must be at least 1.5*content_length_limit ({})",
            self.shard_burst_limit,
            estimated_persist_size,
        );
        ensure!(
            self.shard_scale_up_factor > 1.0,
            "shard_scale_up_factor ({}) must be greater than 1",
            self.shard_scale_up_factor,
        );
        Ok(())
    }
}

#[derive(Clone, Debug, PartialEq, Serialize, Deserialize)]
#[serde(deny_unknown_fields)]
pub struct JaegerConfig {
    /// Enables the gRPC endpoint that allows the Jaeger Query Service to connect and retrieve
    /// traces.
    #[serde(default = "JaegerConfig::default_enable_endpoint")]
    pub enable_endpoint: bool,
    /// How far back in time we look for spans when queries at not time-bound (`get_services`,
    /// `get_operations`, `get_trace` operations).
    #[serde(default = "JaegerConfig::default_lookback_period_hours")]
    lookback_period_hours: NonZeroU64,
    /// The assumed maximum duration of a trace in seconds.
    ///
    /// Finding a trace happens in two phases: the first phase identifies at least one span that
    /// matches the query, while the second phase retrieves the spans that belong to the trace.
    /// The `max_trace_duration_secs` parameter is used during the second phase to restrict the
    /// search time interval to [span.end_timestamp - max_trace_duration, span.start_timestamp
    /// + max_trace_duration].
    #[serde(default = "JaegerConfig::default_max_trace_duration_secs")]
    max_trace_duration_secs: NonZeroU64,
    /// The maximum number of spans that can be retrieved in a single request.
    #[serde(default = "JaegerConfig::default_max_fetch_spans")]
    pub max_fetch_spans: NonZeroU64,
}

impl JaegerConfig {
    pub fn lookback_period(&self) -> Duration {
        Duration::from_secs(self.lookback_period_hours.get() * 3600)
    }

    pub fn max_trace_duration(&self) -> Duration {
        Duration::from_secs(self.max_trace_duration_secs.get())
    }

    fn default_enable_endpoint() -> bool {
        #[cfg(any(test, feature = "testsuite"))]
        {
            false
        }
        #[cfg(not(any(test, feature = "testsuite")))]
        {
            quickwit_common::get_bool_from_env("QW_ENABLE_JAEGER_ENDPOINT", true)
        }
    }

    fn default_lookback_period_hours() -> NonZeroU64 {
        NonZeroU64::new(72).unwrap() // 3 days
    }

    fn default_max_trace_duration_secs() -> NonZeroU64 {
        NonZeroU64::new(3600).unwrap() // 1 hour
    }

    fn default_max_fetch_spans() -> NonZeroU64 {
        NonZeroU64::new(10_000).unwrap() // 10k spans
    }
}

impl Default for JaegerConfig {
    fn default() -> Self {
        Self {
            enable_endpoint: Self::default_enable_endpoint(),
            lookback_period_hours: Self::default_lookback_period_hours(),
            max_trace_duration_secs: Self::default_max_trace_duration_secs(),
            max_fetch_spans: Self::default_max_fetch_spans(),
        }
    }
}

#[derive(Clone, Debug, Serialize)]
pub struct NodeConfig {
    pub cluster_id: String,
    pub node_id: NodeId,
    pub availability_zone: Option<String>,
    pub enabled_services: HashSet<QuickwitService>,
    pub gossip_listen_addr: SocketAddr,
    pub grpc_listen_addr: SocketAddr,
    pub gossip_advertise_addr: SocketAddr,
    pub grpc_advertise_addr: SocketAddr,
    pub gossip_interval: Duration,
    pub peer_seeds: Vec<String>,
    pub data_dir_path: PathBuf,
    pub metastore_uri: Uri,
    pub default_index_root_uri: Uri,
    pub rest_config: RestConfig,
    pub grpc_config: GrpcConfig,
    pub storage_configs: StorageConfigs,
    pub metastore_configs: MetastoreConfigs,
    pub indexer_config: IndexerConfig,
    pub searcher_config: SearcherConfig,
    pub ingest_api_config: IngestApiConfig,
    pub jaeger_config: JaegerConfig,
}

impl NodeConfig {
    pub fn is_service_enabled(&self, service: QuickwitService) -> bool {
        self.enabled_services.contains(&service)
    }

    /// Parses and validates a [`NodeConfig`] from a given URI and config content.
    pub async fn load(config_format: ConfigFormat, config_content: &[u8]) -> anyhow::Result<Self> {
        let env_vars = env::vars().collect::<HashMap<_, _>>();
        let config = load_node_config_with_env(config_format, config_content, &env_vars).await?;
        if !config.data_dir_path.try_exists()? {
            bail!(
                "data dir `{}` does not exist",
                config.data_dir_path.display()
            );
        }
        Ok(config)
    }

    /// Returns the list of peer seed addresses. The addresses MUST NOT be resolved. Otherwise, the
    /// DNS-based discovery mechanism implemented in Chitchat will not work correctly.
    pub async fn peer_seed_addrs(&self) -> anyhow::Result<Vec<String>> {
        let mut peer_seed_addrs = Vec::new();
        let default_gossip_port = self.gossip_listen_addr.port();

        // We want to pass non-resolved addresses to Chitchat but still want to resolve them for
        // validation purposes. Additionally, we need to append a default port if necessary and
        // finally return the addresses as strings, which is tricky for IPv6. We let the logic baked
        // in `HostAddr` handle this complexity.
        let mut found_something = false;
        for peer_seed in &self.peer_seeds {
            let peer_seed_addr = HostAddr::parse_with_default_port(peer_seed, default_gossip_port)?;
            if let Err(error) = peer_seed_addr.resolve().await {
                warn!(peer_seed = %peer_seed_addr, error = ?error, "failed to resolve peer seed address");
            } else {
                found_something = true;
            }
            peer_seed_addrs.push(peer_seed_addr.to_string())
        }
        if !self.peer_seeds.is_empty() && !found_something {
            warn!("failed to resolve all the peer seed addresses")
        }
        Ok(peer_seed_addrs)
    }

    pub fn redact(&mut self) {
        self.metastore_configs.redact();
        self.metastore_uri.redact();
        self.storage_configs.redact();
    }

    /// Creates a config with defaults suitable for testing.
    ///
    /// Uses the default ports without ensuring that they are available.
    #[cfg(any(test, feature = "testsuite"))]
    pub fn for_test() -> Self {
        serialize::node_config_for_tests_from_ports(7280, 7281)
    }

    #[cfg(any(test, feature = "testsuite"))]
    pub fn for_test_from_ports(rest_listen_port: u16, grpc_listen_port: u16) -> Self {
        serialize::node_config_for_tests_from_ports(rest_listen_port, grpc_listen_port)
    }
}

#[cfg(test)]
mod tests {
    use quickwit_proto::indexing::CpuCapacity;

    use super::*;
    use crate::IndexerConfig;

    #[test]
    fn test_indexer_config_serialization() {
        {
            let indexer_config: IndexerConfig = serde_json::from_str(r#"{}"#).unwrap();
            assert_eq!(&indexer_config, &IndexerConfig::default());
            assert!(indexer_config.cpu_capacity.cpu_millis() > 0);
            assert_eq!(indexer_config.cpu_capacity.cpu_millis() % 1_000, 0);
        }
        {
            let indexer_config: IndexerConfig =
                serde_yaml::from_str(r#"cpu_capacity: 1.5"#).unwrap();
            assert_eq!(
                indexer_config.cpu_capacity,
                CpuCapacity::from_cpu_millis(1500)
            );
            let indexer_config_json = serde_json::to_value(&indexer_config).unwrap();
            assert_eq!(
                indexer_config_json
                    .get("cpu_capacity")
                    .unwrap()
                    .as_str()
                    .unwrap(),
                "1500m"
            );
        }
        {
            let indexer_config: IndexerConfig =
                serde_yaml::from_str(r#"merge_concurrency: 5"#).unwrap();
            assert_eq!(
                indexer_config.merge_concurrency,
                NonZeroUsize::new(5).unwrap()
            );
            let indexer_config_json = serde_json::to_value(&indexer_config).unwrap();
            assert_eq!(
                indexer_config_json
                    .get("merge_concurrency")
                    .unwrap()
                    .as_u64()
                    .unwrap(),
                5
            );
        }
        {
            let indexer_config: IndexerConfig =
                serde_yaml::from_str(r#"cpu_capacity: 1500m"#).unwrap();
            assert_eq!(
                indexer_config.cpu_capacity,
                CpuCapacity::from_cpu_millis(1500)
            );
            let indexer_config_json = serde_json::to_value(&indexer_config).unwrap();
            assert_eq!(
                indexer_config_json
                    .get("cpu_capacity")
                    .unwrap()
                    .as_str()
                    .unwrap(),
                "1500m"
            );
        }
    }

    #[test]
    fn test_validate_ingest_api_default() {
        let ingest_api_config: IngestApiConfig = serde_yaml::from_str("").unwrap();
        assert!(ingest_api_config.validate().is_ok());
        assert_eq!(ingest_api_config, IngestApiConfig::default());
    }

    #[test]
    fn test_validate_ingest_api_config() {
        {
            let ingest_api_config: IngestApiConfig = serde_yaml::from_str(
                r#"
                    max_queue_disk_usage: 100M
                    grpc_compression_algorithm: zstd
                "#,
            )
            .unwrap();
            assert_eq!(
                ingest_api_config.validate().unwrap_err().to_string(),
                "max_queue_disk_usage must be at least 256 MiB, got `100.0 MB`"
            );
            assert_eq!(
                ingest_api_config.grpc_compression_encoding().unwrap(),
                CompressionEncoding::Zstd
            );
        }
        {
            let ingest_api_config: IngestApiConfig = serde_yaml::from_str(
                r#"
                    max_queue_memory_usage: 600M
                    max_queue_disk_usage: 500M
                "#,
            )
            .unwrap();
            assert_eq!(
                ingest_api_config.validate().unwrap_err().to_string(),
                "max_queue_disk_usage (500.0 MB) must be at least max_queue_memory_usage (600.0 \
                 MB)"
            );
        }
        {
            let ingest_api_config: IngestApiConfig = serde_yaml::from_str(
                r#"
                    shard_throughput_limit: 21M
                "#,
            )
            .unwrap();
            assert_eq!(
                ingest_api_config.validate().unwrap_err().to_string(),
                "shard_throughput_limit (21.0 MB) must be within 1mb and 20mb"
            );
        }
    }

    #[track_caller]
    fn test_keepalive_config_serialization_aux(
        keep_alive_json: serde_json::Value,
        expected: quickwit_common::tower::KeepAliveConfig,
    ) {
        let keep_alive_config: KeepAliveConfig =
            serde_json::from_value(keep_alive_json.clone()).unwrap();
        let keep_alive_deser: quickwit_common::tower::KeepAliveConfig =
            keep_alive_config.clone().into();
        assert_eq!(&keep_alive_deser, &expected);
        let keep_alive_config_deser_ser = serde_json::to_value(keep_alive_config).unwrap();
        let keep_alive_config_deser_ser_deser: KeepAliveConfig =
            serde_json::from_value(keep_alive_config_deser_ser).unwrap();
        let keep_alive_config_deser_ser_deser: quickwit_common::tower::KeepAliveConfig =
            keep_alive_config_deser_ser_deser.into();
        assert_eq!(&keep_alive_config_deser_ser_deser, &expected);
    }

    #[test]
    fn test_keepalive_config_serialization() {
        test_keepalive_config_serialization_aux(
            serde_json::json!({}),
            quickwit_common::tower::KeepAliveConfig {
                interval: Duration::from_secs(10),
                timeout: Duration::from_secs(5),
            },
        );
        test_keepalive_config_serialization_aux(
            serde_json::json!({
                "interval": "3s",
                "timeout": "1s",
            }),
            quickwit_common::tower::KeepAliveConfig {
                interval: Duration::from_secs(3),
                timeout: Duration::from_secs(1),
            },
        );
    }

    #[test]
    fn test_grpc_config_serialization_default() {
        let grpc_config: GrpcConfig = serde_json::from_str(r#"{}"#).unwrap();
        assert_eq!(
            grpc_config.max_message_size,
            GrpcConfig::default().max_message_size
        );

        let grpc_config: GrpcConfig = serde_yaml::from_str(
            r#"
                max_message_size: 4MiB
            "#,
        )
        .unwrap();
        assert_eq!(grpc_config.max_message_size, ByteSize::mib(4));
    }

    #[test]
    fn test_grpc_config_validate() {
        let grpc_config = GrpcConfig {
            max_message_size: ByteSize::mb(1),
            tls: None,
            keep_alive: None,
        };
        assert!(grpc_config.validate().is_ok());

        let grpc_config = GrpcConfig {
            max_message_size: ByteSize::kb(1),
            tls: None,
            keep_alive: None,
        };
        assert!(grpc_config.validate().is_err());
    }
}


================================================
FILE: quickwit/quickwit-config/src/node_config/serialize.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::HashMap;
use std::net::{IpAddr, SocketAddr};
use std::str::FromStr;
use std::time::Duration;

use anyhow::{Context, bail};
use bytesize::ByteSize;
use http::HeaderMap;
use quickwit_common::fs::get_disk_size;
use quickwit_common::net::{Host, find_private_ip, get_short_hostname};
use quickwit_common::new_coolid;
use quickwit_common::uri::Uri;
use quickwit_proto::types::NodeId;
use serde::{Deserialize, Serialize};
use tracing::{info, warn};

use super::{GrpcConfig, RestConfig};
use crate::config_value::ConfigValue;
use crate::qw_env_vars::*;
use crate::service::QuickwitService;
use crate::storage_config::StorageConfigs;
use crate::templating::render_config;
use crate::{
    ConfigFormat, IndexerConfig, IngestApiConfig, JaegerConfig, MetastoreConfigs, NodeConfig,
    SearcherConfig, TlsConfig, validate_identifier, validate_node_id,
};

pub const DEFAULT_CLUSTER_ID: &str = "quickwit-default-cluster";

pub const DEFAULT_DATA_DIR_PATH: &str = "qwdata";

pub const DEFAULT_GOSSIP_INTERVAL: Duration = if cfg!(any(test, feature = "testsuite")) {
    Duration::from_millis(25)
} else {
    Duration::from_secs(1)
};

// Default config values in the order they appear in [`NodeConfigBuilder`].
fn default_cluster_id() -> ConfigValue<String, QW_CLUSTER_ID> {
    ConfigValue::with_default(DEFAULT_CLUSTER_ID.to_string())
}

fn default_node_id() -> ConfigValue<String, QW_NODE_ID> {
    let node_id = match get_short_hostname() {
        Ok(short_hostname) => short_hostname,
        Err(error) => {
            let node_id = new_coolid("node");
            warn!(error=?error, "failed to determine hostname or hostname was invalid, falling back to random node ID `{}`", node_id);
            node_id
        }
    };
    ConfigValue::with_default(node_id)
}

fn default_availability_zone() -> ConfigValue<String, QW_AVAILABILITY_ZONE> {
    ConfigValue::none()
}

#[derive(Clone, Debug, Default, Serialize, Deserialize, PartialEq)]
struct List(Vec<String>);

impl FromStr for List {
    type Err = anyhow::Error;

    fn from_str(list_str: &str) -> Result<Self, Self::Err> {
        let list = list_str
            .split(',')
            .map(|elem| elem.trim().to_string())
            .filter(|elem| !elem.is_empty())
            .collect();
        Ok(List(list))
    }
}

fn default_enabled_services() -> ConfigValue<List, QW_ENABLED_SERVICES> {
    ConfigValue::with_default(List(
        QuickwitService::supported_services()
            .into_iter()
            .map(|service| service.to_string())
            .collect(),
    ))
}

fn default_listen_address() -> ConfigValue<String, QW_LISTEN_ADDRESS> {
    ConfigValue::with_default(Host::default().to_string())
}

fn default_rest_listen_port() -> u16 {
    7280
}

fn default_data_dir_uri() -> ConfigValue<Uri, QW_DATA_DIR> {
    ConfigValue::with_default(Uri::from_str(DEFAULT_DATA_DIR_PATH).unwrap())
}

/// Returns the default advertise host.
fn default_advertise_host(listen_ip: &IpAddr) -> anyhow::Result<Host> {
    if listen_ip.is_unspecified() {
        if let Some((interface_name, private_ip)) = find_private_ip() {
            info!(advertise_address=%private_ip, interface_name=%interface_name, "using sniffed advertise address `{private_ip}`");
            return Ok(Host::from(private_ip));
        }
        bail!("listen address `{listen_ip}` is unspecified and advertise address is not set");
    }
    info!(advertise_address=%listen_ip, "using listen address `{listen_ip}` as advertise address");
    Ok(Host::from(*listen_ip))
}

// Surprisingly, the default metastore and the index root uri are the same (if you exclude the
// polling_interval parameter). Indeed, this is a convenient setting for testing with a file backed
// metastore and indexes splits stored locally too.
// For a given index `index-id`, it means that we have the metastore file
// in  `./qwdata/indexes/{index-id}/metastore.json` and splits in
// dir `./qwdata/indexes/{index-id}/splits`.
fn default_metastore_uri(data_dir_uri: &Uri) -> Uri {
    data_dir_uri.join("indexes#polling_interval=30s").expect("Failed to create default metastore URI. This should never happen! Please, report on https://github.com/quickwit-oss/quickwit/issues.")
}

// See comment above.
fn default_index_root_uri(data_dir_uri: &Uri) -> Uri {
    data_dir_uri.join("indexes").expect("Failed to create default index root URI. This should never happen! Please, report on https://github.com/quickwit-oss/quickwit/issues.")
}

pub async fn load_node_config_with_env(
    config_format: ConfigFormat,
    config_content: &[u8],
    env_vars: &HashMap<String, String>,
) -> anyhow::Result<NodeConfig> {
    let rendered_config_content = render_config(config_content)?;
    let versioned_node_config: VersionedNodeConfig =
        config_format.parse(rendered_config_content.as_bytes())?;
    let node_config_builder: NodeConfigBuilder = versioned_node_config.into();
    let config = node_config_builder.build_and_validate(env_vars).await?;
    Ok(config)
}

#[derive(Debug, Deserialize)]
#[serde(tag = "version")]
enum VersionedNodeConfig {
    #[serde(rename = "0.8")]
    // Retro compatibility.
    #[serde(alias = "0.7")]
    V0_8(NodeConfigBuilder),
}

impl From<VersionedNodeConfig> for NodeConfigBuilder {
    fn from(versioned_node_config: VersionedNodeConfig) -> Self {
        match versioned_node_config {
            VersionedNodeConfig::V0_8(node_config_builder) => node_config_builder,
        }
    }
}

#[serde_with::serde_as]
#[derive(Debug, Deserialize, PartialEq)]
#[serde(deny_unknown_fields)]
struct NodeConfigBuilder {
    #[serde(default = "default_cluster_id")]
    cluster_id: ConfigValue<String, QW_CLUSTER_ID>,
    #[serde(default = "default_node_id")]
    node_id: ConfigValue<String, QW_NODE_ID>,
    #[serde(default = "default_availability_zone")]
    availability_zone: ConfigValue<String, QW_AVAILABILITY_ZONE>,
    #[serde(default = "default_enabled_services")]
    enabled_services: ConfigValue<List, QW_ENABLED_SERVICES>,
    #[serde(default = "default_listen_address")]
    listen_address: ConfigValue<String, QW_LISTEN_ADDRESS>,
    advertise_address: ConfigValue<String, QW_ADVERTISE_ADDRESS>,
    // Deprecated, use `rest.listen_port` instead.
    rest_listen_port: Option<u16>,
    gossip_listen_port: ConfigValue<u16, QW_GOSSIP_LISTEN_PORT>,
    grpc_listen_port: ConfigValue<u16, QW_GRPC_LISTEN_PORT>,
    gossip_interval_ms: ConfigValue<u32, QW_GOSSIP_INTERVAL_MS>,
    #[serde(default)]
    peer_seeds: ConfigValue<List, QW_PEER_SEEDS>,
    #[serde(rename = "data_dir")]
    #[serde(default = "default_data_dir_uri")]
    data_dir_uri: ConfigValue<Uri, QW_DATA_DIR>,
    metastore_uri: ConfigValue<Uri, QW_METASTORE_URI>,
    default_index_root_uri: ConfigValue<Uri, QW_DEFAULT_INDEX_ROOT_URI>,
    #[serde(rename = "rest")]
    #[serde(default)]
    rest_config_builder: RestConfigBuilder,
    #[serde(rename = "grpc")]
    #[serde(default)]
    grpc_config: GrpcConfig,
    #[serde(rename = "storage")]
    #[serde(default)]
    storage_configs: StorageConfigs,
    #[serde(rename = "metastore")]
    #[serde(default)]
    metastore_configs: MetastoreConfigs,
    #[serde(rename = "indexer")]
    #[serde(default)]
    indexer_config: IndexerConfig,
    #[serde(rename = "searcher")]
    #[serde(default)]
    searcher_config: SearcherConfig,
    #[serde(rename = "ingest_api")]
    #[serde(default)]
    ingest_api_config: IngestApiConfig,
    #[serde(rename = "jaeger")]
    #[serde(default)]
    jaeger_config: JaegerConfig,
}

impl NodeConfigBuilder {
    pub async fn build_and_validate(
        mut self,
        env_vars: &HashMap<String, String>,
    ) -> anyhow::Result<NodeConfig> {
        let node_id = self.node_id.resolve(env_vars).map(NodeId::new)?;
        let availability_zone = self.availability_zone.resolve_optional(env_vars)?;

        let enabled_services = self
            .enabled_services
            .resolve(env_vars)?
            .0
            .into_iter()
            .map(|service| service.parse())
            .collect::<Result<_, _>>()?;

        let listen_address = self.listen_address.resolve(env_vars)?;
        let listen_host = listen_address.parse::<Host>()?;
        let listen_ip = listen_host.resolve().await?;

        if let Some(rest_listen_port) = self.rest_listen_port {
            if self.rest_config_builder.listen_port.is_some() {
                bail!(
                    "conflicting configuration values: please use only `rest.listen_port`, \
                     `rest_listen_port` is deprecated and should not be used alongside \
                     `rest.listen_port`. Update your configuration to use `rest.listen_port`."
                );
            }
            warn!("`rest_listen_port` is deprecated, use `rest.listen_port` instead");
            self.rest_config_builder.listen_port = Some(rest_listen_port);
        }

        let rest_config = self
            .rest_config_builder
            .build_and_validate(listen_ip, env_vars)?;

        self.grpc_config.validate()?;

        let gossip_listen_port = self
            .gossip_listen_port
            .resolve_optional(env_vars)?
            .unwrap_or(rest_config.listen_addr.port());
        let gossip_listen_addr = SocketAddr::new(listen_ip, gossip_listen_port);

        let grpc_listen_port = self
            .grpc_listen_port
            .resolve_optional(env_vars)?
            .unwrap_or(rest_config.listen_addr.port() + 1);
        let grpc_listen_addr = SocketAddr::new(listen_ip, grpc_listen_port);

        let advertise_address = self.advertise_address.resolve_optional(env_vars)?;
        let advertise_host = advertise_address
            .map(|addr| addr.parse::<Host>())
            .unwrap_or_else(|| default_advertise_host(&listen_ip))?;

        let advertise_ip = advertise_host.resolve().await?;
        let gossip_advertise_addr = SocketAddr::new(advertise_ip, gossip_listen_port);
        let grpc_advertise_addr = SocketAddr::new(advertise_ip, grpc_listen_port);

        let data_dir_uri = self.data_dir_uri.resolve(env_vars)?;
        let data_dir_path = data_dir_uri
            .filepath()
            .with_context(|| {
                format!(
                    "data dir must be located on the local file system. current location: \
                     `{data_dir_uri}`"
                )
            })?
            .to_path_buf();

        let metastore_uri = self
            .metastore_uri
            .resolve_optional(env_vars)?
            .unwrap_or_else(|| default_metastore_uri(&data_dir_uri));

        let default_index_root_uri = self
            .default_index_root_uri
            .resolve_optional(env_vars)?
            .unwrap_or_else(|| default_index_root_uri(&data_dir_uri));

        self.storage_configs.validate()?;
        self.storage_configs.apply_flavors();
        self.ingest_api_config.validate()?;
        self.searcher_config.validate()?;

        let gossip_interval = self
            .gossip_interval_ms
            .resolve_optional(env_vars)?
            .map(|gossip_interval_ms| Duration::from_millis(gossip_interval_ms as u64))
            .unwrap_or(DEFAULT_GOSSIP_INTERVAL);

        let node_config = NodeConfig {
            cluster_id: self.cluster_id.resolve(env_vars)?,
            node_id,
            availability_zone,
            enabled_services,
            gossip_listen_addr,
            grpc_listen_addr,
            gossip_advertise_addr,
            grpc_advertise_addr,
            gossip_interval,
            peer_seeds: self.peer_seeds.resolve(env_vars)?.0,
            data_dir_path,
            metastore_uri,
            default_index_root_uri,
            rest_config,
            grpc_config: self.grpc_config,
            metastore_configs: self.metastore_configs,
            storage_configs: self.storage_configs,
            indexer_config: self.indexer_config,
            searcher_config: self.searcher_config,
            ingest_api_config: self.ingest_api_config,
            jaeger_config: self.jaeger_config,
        };

        validate(&node_config)?;
        Ok(node_config)
    }
}

fn validate(node_config: &NodeConfig) -> anyhow::Result<()> {
    validate_identifier("cluster", &node_config.cluster_id)?;
    validate_node_id(&node_config.node_id)?;

    if node_config.cluster_id == DEFAULT_CLUSTER_ID {
        warn!("cluster ID is not set, falling back to default value `{DEFAULT_CLUSTER_ID}`",);
    }
    if node_config.peer_seeds.is_empty() {
        warn!("peer seeds are empty");
    }
    validate_disk_usage(node_config);
    Ok(())
}

/// A list of all the known disk budgets
///
/// External disk usage and unbounded disk usages, e.g the indexing workbench
/// (indexing/) and the delete task workbench (delete_task_service/) are not included.
#[derive(Default, Debug)]
struct ExpectedDiskUsage {
    // indexer / ingester
    split_store_max_num_bytes: Option<ByteSize>,
    max_queue_disk_usage: Option<ByteSize>,
    // searcher
    split_cache: Option<ByteSize>,
}

impl ExpectedDiskUsage {
    fn from_config(node_config: &NodeConfig) -> Self {
        let mut expected = Self::default();
        if node_config.is_service_enabled(QuickwitService::Indexer) {
            expected.max_queue_disk_usage =
                Some(node_config.ingest_api_config.max_queue_disk_usage);
            expected.split_store_max_num_bytes =
                Some(node_config.indexer_config.split_store_max_num_bytes);
        }
        if node_config.is_service_enabled(QuickwitService::Searcher) {
            expected.split_cache = node_config
                .searcher_config
                .split_cache
                .map(|limits| limits.max_num_bytes);
        }
        expected
    }

    fn total(&self) -> ByteSize {
        self.split_store_max_num_bytes.unwrap_or_default()
            + self.max_queue_disk_usage.unwrap_or_default()
            + self.split_cache.unwrap_or_default()
    }
}

fn validate_disk_usage(node_config: &NodeConfig) {
    if let Some(volume_size) = get_disk_size(&node_config.data_dir_path) {
        let expected_disk_usage = ExpectedDiskUsage::from_config(node_config);
        if expected_disk_usage.total() > volume_size {
            warn!(
                ?volume_size,
                ?expected_disk_usage,
                "data dir volume too small"
            );
        }
    }
}

#[cfg(test)]
impl Default for NodeConfigBuilder {
    fn default() -> Self {
        Self {
            cluster_id: default_cluster_id(),
            node_id: default_node_id(),
            availability_zone: ConfigValue::none(),
            enabled_services: default_enabled_services(),
            listen_address: default_listen_address(),
            rest_listen_port: None,
            gossip_listen_port: ConfigValue::none(),
            grpc_listen_port: ConfigValue::none(),
            gossip_interval_ms: ConfigValue::none(),
            advertise_address: ConfigValue::none(),
            peer_seeds: ConfigValue::with_default(List::default()),
            data_dir_uri: default_data_dir_uri(),
            metastore_uri: ConfigValue::none(),
            default_index_root_uri: ConfigValue::none(),
            rest_config_builder: RestConfigBuilder::default(),
            grpc_config: GrpcConfig::default(),
            storage_configs: StorageConfigs::default(),
            metastore_configs: MetastoreConfigs::default(),
            indexer_config: IndexerConfig::default(),
            searcher_config: SearcherConfig::default(),
            ingest_api_config: IngestApiConfig::default(),
            jaeger_config: JaegerConfig::default(),
        }
    }
}

#[serde_with::serde_as]
#[derive(Debug, Deserialize, PartialEq, Default)]
#[serde(deny_unknown_fields)]
struct RestConfigBuilder {
    #[serde(default)]
    listen_port: Option<u16>,
    #[serde(default)]
    #[serde_as(deserialize_as = "serde_with::OneOrMany<_>")]
    pub cors_allow_origins: Vec<String>,
    #[serde(with = "http_serde::header_map")]
    #[serde(default)]
    pub extra_headers: HeaderMap,
    #[serde(default)]
    pub tls: Option<TlsConfig>,
}

impl RestConfigBuilder {
    fn build_and_validate(
        self,
        listen_ip: IpAddr,
        env_vars: &HashMap<String, String>,
    ) -> anyhow::Result<RestConfig> {
        let listen_port_from_config_or_default =
            self.listen_port.unwrap_or(default_rest_listen_port());
        let listen_port = ConfigValue::<u16, QW_REST_LISTEN_PORT>::with_default(
            listen_port_from_config_or_default,
        )
        .resolve(env_vars)?;
        let rest_config = RestConfig {
            listen_addr: SocketAddr::new(listen_ip, listen_port),
            cors_allow_origins: self.cors_allow_origins,
            extra_headers: self.extra_headers,
            tls: self.tls,
        };
        Ok(rest_config)
    }
}

#[cfg(any(test, feature = "testsuite"))]
pub fn node_config_for_tests_from_ports(
    rest_listen_port: u16,
    grpc_listen_port: u16,
) -> NodeConfig {
    let node_id = NodeId::new(default_node_id().unwrap());
    let enabled_services = QuickwitService::supported_services();
    let availability_zone = Some(String::from("az-1"));
    let listen_address = Host::default();
    let rest_listen_addr = listen_address
        .with_port(rest_listen_port)
        .to_socket_addr()
        .expect("default host should be an IP address");
    let gossip_listen_addr = listen_address
        .with_port(rest_listen_port)
        .to_socket_addr()
        .expect("default host should be an IP address");
    let grpc_listen_addr = listen_address
        .with_port(grpc_listen_port)
        .to_socket_addr()
        .expect("default host should be an IP address");

    let data_dir_uri = default_data_dir_uri().unwrap();
    let data_dir_path = data_dir_uri
        .filepath()
        .expect("The default data dir should be valid directory path.")
        .to_path_buf();
    let metastore_uri = default_metastore_uri(&data_dir_uri);
    let default_index_root_uri = default_index_root_uri(&data_dir_uri);
    let rest_config = RestConfig {
        listen_addr: rest_listen_addr,
        cors_allow_origins: Vec::new(),
        extra_headers: HeaderMap::new(),
        tls: None,
    };
    NodeConfig {
        cluster_id: default_cluster_id().unwrap(),
        node_id,
        availability_zone,
        enabled_services,
        gossip_advertise_addr: gossip_listen_addr,
        grpc_advertise_addr: grpc_listen_addr,
        gossip_listen_addr,
        grpc_listen_addr,
        gossip_interval: Duration::from_millis(25u64),
        peer_seeds: Vec::new(),
        data_dir_path,
        metastore_uri,
        default_index_root_uri,
        rest_config,
        grpc_config: GrpcConfig::default(),
        storage_configs: StorageConfigs::default(),
        metastore_configs: MetastoreConfigs::default(),
        indexer_config: IndexerConfig::default(),
        searcher_config: SearcherConfig::default(),
        ingest_api_config: IngestApiConfig::default(),
        jaeger_config: JaegerConfig::default(),
    }
}

#[cfg(test)]
mod tests {
    use std::env;
    use std::net::Ipv4Addr;
    use std::num::{NonZeroU64, NonZeroUsize};
    use std::path::Path;

    use bytesize::ByteSize;
    use itertools::Itertools;

    use super::*;
    use crate::storage_config::StorageBackendFlavor;
    use crate::{CacheConfig, LambdaConfig, LambdaDeployConfig};

    fn get_config_filepath(config_filename: &str) -> String {
        format!(
            "{}/resources/tests/node_config/{}",
            env!("CARGO_MANIFEST_DIR"),
            config_filename
        )
    }

    async fn test_node_config_parse_aux(config_format: ConfigFormat) -> anyhow::Result<()> {
        let config_filepath =
            get_config_filepath(&format!("quickwit.{config_format:?}").to_lowercase());
        let file = std::fs::read_to_string(&config_filepath).unwrap();
        let env_vars = HashMap::default();
        let config = load_node_config_with_env(config_format, file.as_bytes(), &env_vars).await?;
        assert_eq!(config.cluster_id, "quickwit-cluster");
        assert_eq!(config.enabled_services.len(), 2);

        assert!(config.is_service_enabled(QuickwitService::Janitor));
        assert!(config.is_service_enabled(QuickwitService::Metastore));

        assert_eq!(config.availability_zone.unwrap(), "az-1");
        assert_eq!(
            config.rest_config.listen_addr,
            SocketAddr::new(IpAddr::V4(Ipv4Addr::UNSPECIFIED), 1111)
        );
        assert_eq!(
            config.rest_config.extra_headers.get("x-header-1").unwrap(),
            "header-value-1"
        );
        assert_eq!(
            config.rest_config.extra_headers.get("x-header-2").unwrap(),
            "header-value-2"
        );
        assert_eq!(config.grpc_config.max_message_size, ByteSize::mb(10));

        assert_eq!(
            config.gossip_listen_addr,
            SocketAddr::new(IpAddr::V4(Ipv4Addr::UNSPECIFIED), 2222)
        );
        assert_eq!(
            config.grpc_listen_addr,
            SocketAddr::new(IpAddr::V4(Ipv4Addr::UNSPECIFIED), 3333)
        );
        assert_eq!(
            config.gossip_advertise_addr,
            SocketAddr::new(IpAddr::V4(Ipv4Addr::new(172, 0, 0, 12)), 2222)
        );
        assert_eq!(
            config.grpc_advertise_addr,
            SocketAddr::new(IpAddr::V4(Ipv4Addr::new(172, 0, 0, 12)), 3333)
        );
        assert_eq!(
            config.peer_seeds,
            vec![
                "quickwit-searcher-0.local".to_string(),
                "quickwit-searcher-1.local".to_string()
            ]
        );
        assert_eq!(config.data_dir_path, Path::new("/opt/quickwit/data"));
        assert_eq!(
            config.metastore_uri,
            "postgresql://username:password@host:port/db"
        );
        assert_eq!(config.default_index_root_uri, "s3://quickwit-indexes");

        let azure_storage_config = config.storage_configs.find_azure().unwrap();
        assert_eq!(
            azure_storage_config.account_name.as_ref().unwrap(),
            "quickwit-dev"
        );

        let s3_storage_config = config.storage_configs.find_s3().unwrap();
        assert_eq!(s3_storage_config.flavor.unwrap(), StorageBackendFlavor::Gcs);
        assert_eq!(
            s3_storage_config.endpoint.as_ref().unwrap(),
            "http://localhost:4566"
        );
        assert!(s3_storage_config.force_path_style_access);
        assert!(s3_storage_config.disable_multi_object_delete);
        assert!(s3_storage_config.disable_multipart_upload);

        let postgres_config = config.metastore_configs.find_postgres().unwrap();
        assert_eq!(postgres_config.min_connections, 1);
        assert_eq!(postgres_config.max_connections.get(), 12);
        assert_eq!(
            postgres_config.acquire_connection_timeout().unwrap(),
            Duration::from_secs(30)
        );
        assert_eq!(
            postgres_config.acquire_connection_timeout().unwrap(),
            Duration::from_secs(30)
        );
        assert_eq!(
            postgres_config.idle_connection_timeout_opt().unwrap(),
            Some(Duration::from_secs(1800))
        );
        assert_eq!(
            postgres_config.max_connection_lifetime_opt().unwrap(),
            Some(Duration::from_secs(3600))
        );

        assert_eq!(
            config.indexer_config,
            IndexerConfig {
                enable_otlp_endpoint: true,
                split_store_max_num_bytes: ByteSize::tb(1),
                split_store_max_num_splits: 10_000,
                max_concurrent_split_uploads: 8,
                merge_concurrency: NonZeroUsize::new(2).unwrap(),
                cpu_capacity: IndexerConfig::default_cpu_capacity(),
                enable_cooperative_indexing: false,
                max_merge_write_throughput: Some(ByteSize::mb(100)),
            }
        );
        assert_eq!(
            config.ingest_api_config,
            IngestApiConfig {
                replication_factor: 2,
                ..Default::default()
            }
        );
        assert_eq!(
            config.searcher_config,
            SearcherConfig {
                aggregation_memory_limit: ByteSize::gb(1),
                aggregation_bucket_limit: 500_000,
                fast_field_cache: CacheConfig::default_with_capacity(ByteSize::gb(10)),
                split_footer_cache: CacheConfig::default_with_capacity(ByteSize::gb(1)),
                partial_request_cache: CacheConfig::default_with_capacity(ByteSize::mb(64)),
                predicate_cache: CacheConfig::default_with_capacity(ByteSize::mb(256)),
                max_num_concurrent_split_searches: 150,
                max_splits_per_search: None,
                _max_num_concurrent_split_streams: Some(serde::de::IgnoredAny),
                split_cache: None,
                request_timeout_secs: NonZeroU64::new(30).unwrap(),
                storage_timeout_policy: Some(crate::StorageTimeoutPolicy {
                    min_throughtput_bytes_per_secs: 100_000,
                    timeout_millis: 2_000,
                    max_num_retries: 2
                }),
                warmup_memory_budget: ByteSize::gb(100),
                warmup_single_split_initial_allocation: ByteSize::gb(1),
                lambda: Some(LambdaConfig {
                    function_name: "quickwit-lambda-leaf-search".to_string(),
                    max_splits_per_invocation: NonZeroUsize::new(10).unwrap(),
                    offload_threshold: 30,
                    auto_deploy: Some(LambdaDeployConfig {
                        execution_role_arn: "arn:aws:iam::123456789012:role/quickwit-lambda-role"
                            .to_string(),
                        memory_size: ByteSize::gib(5),
                        invocation_timeout_secs: 15,
                    }),
                }),
            }
        );
        assert_eq!(
            config.jaeger_config,
            JaegerConfig {
                enable_endpoint: true,
                lookback_period_hours: NonZeroU64::new(24).unwrap(),
                max_trace_duration_secs: NonZeroU64::new(600).unwrap(),
                max_fetch_spans: NonZeroU64::new(1_000).unwrap(),
            }
        );
        Ok(())
    }

    #[tokio::test]
    async fn test_node_config_parse_json() {
        test_node_config_parse_aux(ConfigFormat::Json)
            .await
            .unwrap();
    }

    #[tokio::test]
    async fn test_node_config_parse_toml() {
        test_node_config_parse_aux(ConfigFormat::Toml)
            .await
            .unwrap();
    }

    #[tokio::test]
    async fn test_node_config_parse_yaml() {
        test_node_config_parse_aux(ConfigFormat::Yaml)
            .await
            .unwrap();
    }

    #[tokio::test]
    async fn test_config_contains_wrong_values() {
        let config_filepath = get_config_filepath("quickwit.wrongkey.yaml");
        let config_str = std::fs::read_to_string(&config_filepath).unwrap();
        let parsing_error = super::load_node_config_with_env(
            ConfigFormat::Yaml,
            config_str.as_bytes(),
            &Default::default(),
        )
        .await
        .unwrap_err();
        assert!(
            format!("{parsing_error:?}")
                .contains("unknown field `max_num_concurrent_split_searches_with_typo`")
        );
    }

    #[tokio::test]
    async fn test_node_config_default_values_minimal() {
        let config_yaml = "version: 0.8";
        let config = load_node_config_with_env(
            ConfigFormat::Yaml,
            config_yaml.as_bytes(),
            &Default::default(),
        )
        .await
        .unwrap();
        assert_eq!(config.cluster_id, DEFAULT_CLUSTER_ID);
        assert_eq!(config.node_id, get_short_hostname().unwrap());
        assert_eq!(config.availability_zone, None);
        assert_eq!(
            config.enabled_services,
            QuickwitService::supported_services()
        );
        assert_eq!(
            config.rest_config.listen_addr,
            SocketAddr::new(IpAddr::V4(Ipv4Addr::LOCALHOST), 7280)
        );
        assert_eq!(
            config.gossip_listen_addr,
            SocketAddr::new(IpAddr::V4(Ipv4Addr::LOCALHOST), 7280)
        );
        assert_eq!(
            config.grpc_listen_addr,
            SocketAddr::new(IpAddr::V4(Ipv4Addr::LOCALHOST), 7281)
        );
        assert_eq!(
            config.data_dir_path.to_string_lossy(),
            format!("{}/qwdata", env::current_dir().unwrap().display())
        );
        assert_eq!(
            config.metastore_uri,
            format!(
                "file://{}/qwdata/indexes#polling_interval=30s",
                env::current_dir().unwrap().display()
            )
        );
        assert_eq!(
            config.default_index_root_uri,
            format!(
                "file://{}/qwdata/indexes",
                env::current_dir().unwrap().display()
            )
        );
        assert_eq!(config.ingest_api_config.replication_factor, 1);
    }

    #[tokio::test]
    async fn test_node_config_env_var_override() {
        let config_yaml = "version: 0.8";
        let mut env_vars = HashMap::new();
        env_vars.insert("QW_CLUSTER_ID".to_string(), "test-cluster".to_string());
        env_vars.insert("QW_NODE_ID".to_string(), "test-node".to_string());
        env_vars.insert(
            "QW_ENABLED_SERVICES".to_string(),
            "indexer,metastore".to_string(),
        );
        env_vars.insert("QW_LISTEN_ADDRESS".to_string(), "172.0.0.12".to_string());
        env_vars.insert("QW_ADVERTISE_ADDRESS".to_string(), "172.0.0.13".to_string());
        env_vars.insert("QW_REST_LISTEN_PORT".to_string(), "1234".to_string());
        env_vars.insert("QW_GOSSIP_LISTEN_PORT".to_string(), "5678".to_string());
        env_vars.insert("QW_GRPC_LISTEN_PORT".to_string(), "9012".to_string());
        env_vars.insert(
            "QW_PEER_SEEDS".to_string(),
            "test-peer-seed-0,test-peer-seed-1".to_string(),
        );
        env_vars.insert("QW_DATA_DIR".to_string(), "test-data-dir".to_string());
        env_vars.insert(
            "QW_METASTORE_URI".to_string(),
            "postgresql://test-user:test-password@test-host:4321/test-db".to_string(),
        );
        env_vars.insert(
            "QW_DEFAULT_INDEX_ROOT_URI".to_string(),
            "s3://quickwit-indexes/prod".to_string(),
        );
        let config =
            load_node_config_with_env(ConfigFormat::Yaml, config_yaml.as_bytes(), &env_vars)
                .await
                .unwrap();
        assert_eq!(config.cluster_id, "test-cluster");
        assert_eq!(config.node_id, "test-node");
        assert_eq!(config.enabled_services.len(), 2);
        assert_eq!(
            config
                .enabled_services
                .iter()
                .sorted_by_key(|service| service.as_str())
                .collect::<Vec<_>>(),
            &[&QuickwitService::Indexer, &QuickwitService::Metastore]
        );
        assert_eq!(
            config.rest_config.listen_addr,
            SocketAddr::new(IpAddr::V4(Ipv4Addr::new(172, 0, 0, 12)), 1234)
        );
        assert_eq!(
            config.gossip_listen_addr,
            SocketAddr::new(IpAddr::V4(Ipv4Addr::new(172, 0, 0, 12)), 5678)
        );
        assert_eq!(
            config.grpc_listen_addr,
            SocketAddr::new(IpAddr::V4(Ipv4Addr::new(172, 0, 0, 12)), 9012)
        );
        assert_eq!(
            config.gossip_advertise_addr,
            SocketAddr::new(IpAddr::V4(Ipv4Addr::new(172, 0, 0, 13)), 5678)
        );
        assert_eq!(
            config.grpc_advertise_addr,
            SocketAddr::new(IpAddr::V4(Ipv4Addr::new(172, 0, 0, 13)), 9012)
        );
        assert_eq!(
            config.peer_seeds,
            vec![
                "test-peer-seed-0".to_string(),
                "test-peer-seed-1".to_string()
            ]
        );
        assert_eq!(
            config.data_dir_path,
            env::current_dir().unwrap().join("test-data-dir")
        );
        assert_eq!(
            config.metastore_uri,
            "postgresql://test-user:test-password@test-host:4321/test-db"
        );
        assert_eq!(config.default_index_root_uri, "s3://quickwit-indexes/prod");
    }

    #[tokio::test]
    async fn test_quickwwit_config_default_values_storage() {
        let config_yaml = r#"
            version: 0.8
            node_id: "node-1"
            metastore_uri: postgres://username:password@host:port/db
        "#;
        let config = load_node_config_with_env(
            ConfigFormat::Yaml,
            config_yaml.as_bytes(),
            &Default::default(),
        )
        .await
        .unwrap();
        assert_eq!(config.cluster_id, DEFAULT_CLUSTER_ID);
        assert_eq!(config.node_id, "node-1");
        assert_eq!(
            config.metastore_uri,
            "postgresql://username:password@host:port/db"
        );
    }

    #[tokio::test]
    async fn test_node_config_config_default_values_default_indexer_searcher_config() {
        let config_yaml = r#"
            version: 0.8
            metastore_uri: postgres://username:password@host:port/db
            data_dir: /opt/quickwit/data
        "#;
        let config = load_node_config_with_env(
            ConfigFormat::Yaml,
            config_yaml.as_bytes(),
            &Default::default(),
        )
        .await
        .unwrap();
        assert_eq!(
            config.metastore_uri,
            "postgresql://username:password@host:port/db"
        );
        assert_eq!(config.indexer_config, IndexerConfig::default());
        assert_eq!(config.searcher_config, SearcherConfig::default());
        assert_eq!(config.ingest_api_config, IngestApiConfig::default());
        assert_eq!(config.jaeger_config, JaegerConfig::default());
    }

    #[tokio::test]
    async fn test_node_config_validate() {
        let config_filepath = get_config_filepath("quickwit.toml");
        let file_content = std::fs::read_to_string(&config_filepath).unwrap();

        let data_dir_path = env::current_dir().unwrap();
        let mut env_vars = HashMap::new();
        env_vars.insert(
            "QW_DATA_DIR".to_string(),
            data_dir_path.to_string_lossy().to_string(),
        );
        load_node_config_with_env(ConfigFormat::Toml, file_content.as_bytes(), &env_vars)
            .await
            .unwrap();
    }

    #[tokio::test]
    async fn test_peer_socket_addrs() {
        {
            let node_config = NodeConfigBuilder {
                ..Default::default()
            }
            .build_and_validate(&HashMap::new())
            .await
            .unwrap();
            assert!(node_config.peer_seed_addrs().await.unwrap().is_empty());
        }
        {
            let node_config = NodeConfigBuilder {
                rest_config_builder: RestConfigBuilder {
                    listen_port: Some(1789),
                    ..Default::default()
                },
                peer_seeds: ConfigValue::for_test(List(vec![
                    "unresolvable.example.com".to_string(),
                    "localhost".to_string(),
                    "localhost:1337".to_string(),
                    "127.0.0.1".to_string(),
                    "127.0.0.1:1337".to_string(),
                ])),
                ..Default::default()
            }
            .build_and_validate(&HashMap::new())
            .await
            .unwrap();
            assert_eq!(
                node_config.peer_seed_addrs().await.unwrap(),
                vec![
                    "unresolvable.example.com:1789".to_string(),
                    "localhost:1789".to_string(),
                    "localhost:1337".to_string(),
                    "127.0.0.1:1789".to_string(),
                    "127.0.0.1:1337".to_string()
                ]
            );
        }
    }

    #[tokio::test]
    async fn test_socket_addr_ports() {
        {
            let node_config = NodeConfigBuilder {
                listen_address: default_listen_address(),
                ..Default::default()
            }
            .build_and_validate(&HashMap::new())
            .await
            .unwrap();
            assert_eq!(
                node_config.rest_config.listen_addr.to_string(),
                "127.0.0.1:7280"
            );
            assert_eq!(node_config.gossip_listen_addr.to_string(), "127.0.0.1:7280");
            assert_eq!(node_config.grpc_listen_addr.to_string(), "127.0.0.1:7281");
        }
        {
            let node_config = NodeConfigBuilder {
                listen_address: default_listen_address(),
                rest_config_builder: RestConfigBuilder {
                    listen_port: Some(1789),
                    ..Default::default()
                },
                ..Default::default()
            }
            .build_and_validate(&HashMap::new())
            .await
            .unwrap();
            assert_eq!(
                node_config.rest_config.listen_addr.to_string(),
                "127.0.0.1:1789"
            );
            assert_eq!(node_config.gossip_listen_addr.to_string(), "127.0.0.1:1789");
            assert_eq!(node_config.grpc_listen_addr.to_string(), "127.0.0.1:1790");
        }
        {
            let node_config = NodeConfigBuilder {
                listen_address: default_listen_address(),
                gossip_listen_port: ConfigValue::for_test(1889),
                grpc_listen_port: ConfigValue::for_test(1989),
                rest_config_builder: RestConfigBuilder {
                    listen_port: Some(1789),
                    ..Default::default()
                },
                ..Default::default()
            }
            .build_and_validate(&HashMap::new())
            .await
            .unwrap();
            assert_eq!(
                node_config.rest_config.listen_addr.to_string(),
                "127.0.0.1:1789"
            );
            assert_eq!(node_config.gossip_listen_addr.to_string(), "127.0.0.1:1889");
            assert_eq!(node_config.grpc_listen_addr.to_string(), "127.0.0.1:1989");
        }
    }

    #[tokio::test]
    async fn test_rest_deprecated_listen_port_config() {
        // This test should be removed once deprecated `rest_listen_port` field is removed.
        let node_config = NodeConfigBuilder {
            rest_listen_port: Some(1789),
            listen_address: default_listen_address(),
            rest_config_builder: RestConfigBuilder {
                listen_port: None,
                ..Default::default()
            },
            ..Default::default()
        }
        .build_and_validate(&HashMap::new())
        .await
        .unwrap();
        assert_eq!(
            node_config.rest_config.listen_addr.to_string(),
            "127.0.0.1:1789"
        );
        assert_eq!(node_config.gossip_listen_addr.to_string(), "127.0.0.1:1789");
        assert_eq!(node_config.grpc_listen_addr.to_string(), "127.0.0.1:1790");
    }

    #[tokio::test]
    async fn test_load_config_with_validation_error() {
        let config_filepath = get_config_filepath("quickwit.yaml");
        let file = std::fs::read_to_string(&config_filepath).unwrap();
        let error = NodeConfig::load(ConfigFormat::Yaml, file.as_bytes())
            .await
            .unwrap_err();
        assert!(error.to_string().contains("data dir"));
    }

    #[tokio::test]
    async fn test_config_validates_uris() {
        {
            let config_yaml = r#"
            version: 0.8
            node_id: 1
            metastore_uri: ''
        "#;
            assert!(
                load_node_config_with_env(
                    ConfigFormat::Yaml,
                    config_yaml.as_bytes(),
                    &Default::default()
                )
                .await
                .is_err()
            );
        }
        {
            let config_yaml = r#"
            version: 0.8
            node_id: 1
            metastore_uri: postgres://username:password@host:port/db
            default_index_root_uri: ''
        "#;
            assert!(
                load_node_config_with_env(
                    ConfigFormat::Yaml,
                    config_yaml.as_bytes(),
                    &Default::default()
                )
                .await
                .is_err()
            );
        }
    }

    #[tokio::test]
    async fn test_node_config_data_dir_accepts_both_file_uris_and_file_paths() {
        {
            let config_yaml = r#"
                version: 0.8
                data_dir: /opt/quickwit/data
            "#;
            let config = load_node_config_with_env(
                ConfigFormat::Yaml,
                config_yaml.as_bytes(),
                &HashMap::default(),
            )
            .await
            .unwrap();
            assert_eq!(&config.data_dir_path, Path::new("/opt/quickwit/data"));
        }
        {
            let config_yaml = r#"
                version: 0.8
                data_dir: file:///opt/quickwit/data
            "#;
            let config = load_node_config_with_env(
                ConfigFormat::Yaml,
                config_yaml.as_bytes(),
                &HashMap::default(),
            )
            .await
            .unwrap();
            assert_eq!(&config.data_dir_path, Path::new("/opt/quickwit/data"));
        }
        {
            let config_yaml = r#"
                version: 0.8
                data_dir: s3://indexes/foo
            "#;
            let error = load_node_config_with_env(
                ConfigFormat::Yaml,
                config_yaml.as_bytes(),
                &HashMap::default(),
            )
            .await
            .unwrap_err();
            assert!(error.to_string().contains("data dir must be located"));
        }
    }

    #[tokio::test]
    async fn test_config_invalid_when_both_listen_ports_params_are_configured() {
        let config_yaml = r#"
                version: 0.8
                rest_listen_port: 1789
                rest:
                  listen_port: 1789
            "#;
        let config = load_node_config_with_env(
            ConfigFormat::Yaml,
            config_yaml.as_bytes(),
            &HashMap::default(),
        )
        .await
        .unwrap_err();
        assert_eq!(
            &config.to_string(),
            "conflicting configuration values: please use only `rest.listen_port`, \
             `rest_listen_port` is deprecated and should not be used alongside \
             `rest.listen_port`. Update your configuration to use `rest.listen_port`."
        );
    }

    #[test]
    fn test_jaeger_config_rejects_null_values() {
        let jaeger_config_yaml = r#"
            enable_endpoint: true
            max_trace_duration_secs: 0
        "#;
        let error = serde_yaml::from_str::<JaegerConfig>(jaeger_config_yaml).unwrap_err();
        assert!(
            error
                .to_string()
                .contains("max_trace_duration_secs: invalid value: integer `0`")
        )
    }

    #[tokio::test]
    async fn test_rest_config_accepts_wildcard() {
        let rest_config_yaml = r#"
            version: 0.8
            rest:
              cors_allow_origins: '*'
        "#;
        let config = load_node_config_with_env(
            ConfigFormat::Yaml,
            rest_config_yaml.as_bytes(),
            &Default::default(),
        )
        .await
        .expect("Deserialize rest config");
        assert_eq!(config.rest_config.cors_allow_origins, ["*"]);
    }

    #[tokio::test]
    async fn test_rest_config_accepts_single_origin() {
        let rest_config_yaml = r#"
            version: 0.8
            rest:
              cors_allow_origins:
                - https://www.my-domain.com
        "#;
        let config = load_node_config_with_env(
            ConfigFormat::Yaml,
            rest_config_yaml.as_bytes(),
            &Default::default(),
        )
        .await
        .expect("Deserialize rest config");
        assert_eq!(
            config.rest_config.cors_allow_origins,
            ["https://www.my-domain.com"]
        );

        let rest_config_yaml = r#"
            version: 0.8
            rest:
              cors_allow_origins: http://192.168.0.108:7280
        "#;
        let config = load_node_config_with_env(
            ConfigFormat::Yaml,
            rest_config_yaml.as_bytes(),
            &Default::default(),
        )
        .await
        .expect("Deserialize rest config");
        assert_eq!(
            config.rest_config.cors_allow_origins,
            ["http://192.168.0.108:7280"]
        );
    }

    #[tokio::test]
    async fn test_rest_config_accepts_multi_origin() {
        let rest_config_yaml = r#"
            version: 0.8
            rest:
              cors_allow_origins:
                - https://www.my-domain.com
        "#;
        let config = load_node_config_with_env(
            ConfigFormat::Yaml,
            rest_config_yaml.as_bytes(),
            &Default::default(),
        )
        .await
        .expect("Deserialize rest config");
        assert_eq!(
            config.rest_config.cors_allow_origins,
            ["https://www.my-domain.com"]
        );

        let rest_config_yaml = r#"
            version: 0.8
            rest:
              cors_allow_origins:
                - https://www.my-domain.com
                - https://www.my-other-domain.com
        "#;
        let config = load_node_config_with_env(
            ConfigFormat::Yaml,
            rest_config_yaml.as_bytes(),
            &Default::default(),
        )
        .await
        .expect("Deserialize rest config");
        assert_eq!(
            config.rest_config.cors_allow_origins,
            [
                "https://www.my-domain.com",
                "https://www.my-other-domain.com"
            ]
        );

        let rest_config_yaml = r#"
            version: 0.8
            rest:
              rest_cors_allow_origins:
        "#;
        load_node_config_with_env(
            ConfigFormat::Yaml,
            rest_config_yaml.as_bytes(),
            &Default::default(),
        )
        .await
        .expect_err("Config should not allow empty origins.");

        let rest_config_yaml = r#"
            version: 0.8
            rest:
              cors_allow_origins:
                -
        "#;
        load_node_config_with_env(
            ConfigFormat::Yaml,
            rest_config_yaml.as_bytes(),
            &Default::default(),
        )
        .await
        .expect_err("Config should not allow empty origins.");
    }

    #[tokio::test]
    async fn test_node_config_validates_ingest_config() {
        let ingest_config = IngestApiConfig {
            replication_factor: 0,
            ..Default::default()
        };
        let error_message = ingest_config.validate().unwrap_err().to_string();
        assert!(error_message.contains("either 1 or 2, got `0`"));

        let ingest_config = IngestApiConfig {
            replication_factor: 3,
            ..Default::default()
        };
        let error_message = ingest_config.validate().unwrap_err().to_string();
        assert!(error_message.contains("either 1 or 2, got `3`"));

        let node_config_yaml = r#"
            version: 0.8
            ingest_api:
              replication_factor: 0
        "#;
        let error_message = load_node_config_with_env(
            ConfigFormat::Yaml,
            node_config_yaml.as_bytes(),
            &Default::default(),
        )
        .await
        .unwrap_err()
        .to_string();
        assert!(error_message.contains("replication factor"));
    }
}


================================================
FILE: quickwit/quickwit-config/src/qw_env_vars.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::HashMap;

use once_cell::sync::Lazy;

/// Expands the list of QW environment variables into constants of the form `const <ENV_VAR_KEY>:
/// usize = <env var index>;` and builds the map `QW_EN_VARS` of environment variable index to
/// environment variable key.
macro_rules! qw_env_vars {
    (@step $idx:expr,) => {};

    (@step $idx:expr, $head:ident, $($tail:ident,)*) => {
        pub(crate) const $head: usize = $idx;

        qw_env_vars!(@step $idx + 1usize, $($tail,)*);
    };

    ($($ident:ident),*) => {
        qw_env_vars!(@step 0usize, $($ident,)*);

        pub(crate) static QW_ENV_VARS: Lazy<HashMap<usize, &'static str>> = Lazy::new(|| {
            let mut env_vars = HashMap::new();
            $(env_vars.insert($ident, stringify!($ident));)*
            env_vars
        });
    }
}

// These environment variable keys can be declared in any order with the exception of `QW_NONE`,
// which must be declared first.
qw_env_vars!(
    QW_NONE,
    QW_CLUSTER_ID,
    QW_NODE_ID,
    QW_AVAILABILITY_ZONE,
    QW_ENABLED_SERVICES,
    QW_LISTEN_ADDRESS,
    QW_ADVERTISE_ADDRESS,
    QW_REST_LISTEN_PORT,
    QW_GOSSIP_LISTEN_PORT,
    QW_GRPC_LISTEN_PORT,
    QW_GOSSIP_INTERVAL_MS,
    QW_PEER_SEEDS,
    QW_DATA_DIR,
    QW_METASTORE_URI,
    QW_DEFAULT_INDEX_ROOT_URI
);

#[cfg(test)]
mod tests {

    use super::*;

    #[test]
    fn test_qw_env_vars_expansion() {
        assert_eq!(QW_NONE, 0);

        assert_eq!(QW_CLUSTER_ID, 1);
        assert_eq!(QW_ENV_VARS.get(&QW_CLUSTER_ID).unwrap(), &"QW_CLUSTER_ID");

        assert_eq!(QW_ENV_VARS.get(&QW_NODE_ID).unwrap(), &"QW_NODE_ID");
        assert_eq!(QW_NODE_ID, 2);
    }
}


================================================
FILE: quickwit/quickwit-config/src/serde_utils.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::fmt;
use std::ops::Deref;
use std::time::Duration;

use serde::{Deserialize, Serialize};

/// Custom serde module for ByteSize that serializes as raw byte count (u64).
/// This ensures perfect roundtrip consistency regardless of display format changes
/// in the bytesize crate. Deserialization still accepts human-readable strings
/// like "2 GB" via bytesize's default deserializer.
pub mod bytesize_serde {
    use bytesize::ByteSize;
    use serde::{Deserialize, Deserializer, Serializer};

    pub fn serialize<S>(byte_size: &ByteSize, serializer: S) -> Result<S::Ok, S::Error>
    where S: Serializer {
        serializer.serialize_u64(byte_size.as_u64())
    }

    pub fn deserialize<'de, D>(deserializer: D) -> Result<ByteSize, D::Error>
    where D: Deserializer<'de> {
        ByteSize::deserialize(deserializer)
    }
}

#[derive(Serialize, Deserialize, Clone)]
#[serde(try_from = "String", into = "String")]
pub struct DurationAsStr {
    duration_str: String,
    duration: Duration,
}

impl TryFrom<String> for DurationAsStr {
    type Error = humantime::DurationError;

    fn try_from(duration_str: String) -> Result<Self, Self::Error> {
        let duration = humantime::parse_duration(&duration_str)?;
        Ok(DurationAsStr {
            duration_str,
            duration,
        })
    }
}

impl From<DurationAsStr> for String {
    fn from(duration_as_str: DurationAsStr) -> String {
        duration_as_str.duration_str
    }
}

impl Deref for DurationAsStr {
    type Target = Duration;

    fn deref(&self) -> &Self::Target {
        &self.duration
    }
}

impl From<DurationAsStr> for Duration {
    fn from(duration_as_str: DurationAsStr) -> Self {
        *duration_as_str
    }
}

impl fmt::Debug for DurationAsStr {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        self.duration_str.fmt(f)
    }
}

impl PartialEq for DurationAsStr {
    fn eq(&self, other: &Self) -> bool {
        // We do not check for the chosen representation here
        self.duration == other.duration
    }
}

#[cfg(test)]
mod tests {

    use super::*;

    #[test]
    fn test_duration_deserialize() {
        let duration: DurationAsStr = serde_json::from_str("\"10s\"").unwrap();
        assert_eq!(*duration, Duration::from_secs(10));
        let deser_error = serde_json::from_str::<DurationAsStr>("\"10\"").unwrap_err();
        assert_eq!(
            deser_error.to_string(),
            "time unit needed, for example 10sec or 10ms"
        );
    }
}


================================================
FILE: quickwit/quickwit-config/src/service.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::HashSet;
use std::fmt::Display;
use std::str::FromStr;

use anyhow::bail;
use enum_iterator::{Sequence, all};
use itertools::Itertools;
use serde::Serialize;

#[derive(Clone, Copy, Debug, Eq, PartialEq, Hash, Serialize, Sequence)]
#[serde(into = "&'static str")]
pub enum QuickwitService {
    ControlPlane,
    Indexer,
    Searcher,
    Janitor,
    Metastore,
}

#[allow(clippy::from_over_into)]
impl Into<&'static str> for QuickwitService {
    fn into(self) -> &'static str {
        self.as_str()
    }
}

impl QuickwitService {
    pub fn as_str(&self) -> &'static str {
        match self {
            QuickwitService::ControlPlane => "control_plane",
            QuickwitService::Indexer => "indexer",
            QuickwitService::Searcher => "searcher",
            QuickwitService::Janitor => "janitor",
            QuickwitService::Metastore => "metastore",
        }
    }

    pub fn supported_services() -> HashSet<QuickwitService> {
        all::<QuickwitService>().collect()
    }
}

impl Display for QuickwitService {
    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
        write!(f, "{}", self.as_str())
    }
}

impl FromStr for QuickwitService {
    type Err = anyhow::Error;

    fn from_str(service_str: &str) -> Result<Self, Self::Err> {
        match service_str {
            "control-plane" | "control_plane" => Ok(QuickwitService::ControlPlane),
            "indexer" => Ok(QuickwitService::Indexer),
            "searcher" => Ok(QuickwitService::Searcher),
            "janitor" => Ok(QuickwitService::Janitor),
            "metastore" => Ok(QuickwitService::Metastore),
            _ => {
                bail!(
                    "failed to parse service `{service_str}`. supported services are: `{}`",
                    QuickwitService::supported_services().iter().join("`, `")
                )
            }
        }
    }
}


================================================
FILE: quickwit/quickwit-config/src/source_config/mod.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

pub(crate) mod serialize;

use std::borrow::Cow;
use std::hash::{Hash, Hasher};
use std::num::NonZeroUsize;
use std::str::FromStr;

use anyhow::ensure;
use bytes::Bytes;
use quickwit_common::is_false;
use quickwit_common::uri::Uri;
use quickwit_proto::metastore::SourceType;
use quickwit_proto::types::SourceId;
use regex::Regex;
use serde::de::Error;
use serde::{Deserialize, Deserializer, Serialize};
use serde_json::Value as JsonValue;
// For backward compatibility.
use serialize::VersionedSourceConfig;
pub use serialize::{load_source_config_from_user_config, load_source_config_update};
use siphasher::sip::SipHasher;

use crate::{disable_ingest_v1, enable_ingest_v2};

/// Reserved source ID for the `quickwit index ingest` CLI command.
pub const CLI_SOURCE_ID: &str = "_ingest-cli-source";

/// Reserved source ID used for Quickwit ingest API.
pub const INGEST_API_SOURCE_ID: &str = "_ingest-api-source";

/// Reserved source ID used for native Quickwit ingest.
/// (this is for ingest v2)
pub const INGEST_V2_SOURCE_ID: &str = "_ingest-source";

pub const RESERVED_SOURCE_IDS: &[&str] =
    &[CLI_SOURCE_ID, INGEST_API_SOURCE_ID, INGEST_V2_SOURCE_ID];

#[derive(Clone, Debug, Eq, PartialEq, Serialize, Deserialize)]
#[serde(into = "VersionedSourceConfig")]
#[serde(try_from = "VersionedSourceConfig")]
pub struct SourceConfig {
    pub source_id: SourceId,

    /// Number of indexing pipelines to run on a cluster for the source.
    pub num_pipelines: NonZeroUsize,

    // Denotes if this source is enabled.
    pub enabled: bool,

    pub source_params: SourceParams,

    pub transform_config: Option<TransformConfig>,

    // Denotes the input data format.
    #[serde(default)]
    pub input_format: SourceInputFormat,
}

impl SourceConfig {
    pub fn source_type(&self) -> SourceType {
        self.source_params.source_type()
    }

    // TODO: Remove after source factory refactor.
    pub fn params(&self) -> JsonValue {
        match &self.source_params {
            SourceParams::File(params) => serde_json::to_value(params),
            SourceParams::PubSub(params) => serde_json::to_value(params),
            SourceParams::Ingest => serde_json::to_value(()),
            SourceParams::IngestApi => serde_json::to_value(()),
            SourceParams::IngestCli => serde_json::to_value(()),
            SourceParams::Kafka(params) => serde_json::to_value(params),
            SourceParams::Kinesis(params) => serde_json::to_value(params),
            SourceParams::Pulsar(params) => serde_json::to_value(params),
            SourceParams::Stdin => serde_json::to_value(()),
            SourceParams::Vec(params) => serde_json::to_value(params),
            SourceParams::Void(params) => serde_json::to_value(params),
        }
        .expect("`SourceParams` should be JSON serializable")
    }

    /// Creates the default CLI source config. The CLI source ingests data from stdin.
    pub fn cli() -> Self {
        Self {
            source_id: CLI_SOURCE_ID.to_string(),
            num_pipelines: NonZeroUsize::MIN,
            enabled: true,
            source_params: SourceParams::IngestCli,
            transform_config: None,
            input_format: SourceInputFormat::Json,
        }
    }

    /// Creates a native Quickwit ingest source. The ingest source ingests data from an ingester.
    pub fn ingest_v2() -> Self {
        Self {
            source_id: INGEST_V2_SOURCE_ID.to_string(),
            num_pipelines: NonZeroUsize::MIN,
            enabled: enable_ingest_v2(),
            source_params: SourceParams::Ingest,
            transform_config: None,
            input_format: SourceInputFormat::Json,
        }
    }

    /// Creates the default ingest-api source config.
    pub fn ingest_api_default() -> Self {
        Self {
            source_id: INGEST_API_SOURCE_ID.to_string(),
            num_pipelines: NonZeroUsize::MIN,
            enabled: !disable_ingest_v1(),
            source_params: SourceParams::IngestApi,
            transform_config: None,
            input_format: SourceInputFormat::Json,
        }
    }

    /// Returns a fingerprint of parameters relevant for indexers.
    ///
    /// This should remain private to this crate to avoid confusion with the
    /// full indexing pipeline fingerprint that also includes the index config's
    /// fingerprint.
    pub(crate) fn indexing_params_fingerprint(&self) -> u64 {
        let mut hasher = SipHasher::new();
        self.input_format.hash(&mut hasher);
        self.num_pipelines.hash(&mut hasher);
        self.source_params.hash(&mut hasher);
        self.transform_config.hash(&mut hasher);
        hasher.finish()
    }

    #[cfg(any(test, feature = "testsuite"))]
    pub fn for_test(source_id: &str, source_params: SourceParams) -> Self {
        Self {
            source_id: source_id.to_string(),
            num_pipelines: NonZeroUsize::MIN,
            enabled: true,
            source_params,
            transform_config: None,
            input_format: SourceInputFormat::Json,
        }
    }
}

#[cfg(any(test, feature = "testsuite"))]
impl crate::TestableForRegression for SourceConfig {
    fn sample_for_regression() -> Self {
        SourceConfig {
            source_id: "kafka-source".to_string(),
            num_pipelines: NonZeroUsize::new(2).unwrap(),
            enabled: true,
            source_params: SourceParams::Kafka(KafkaSourceParams {
                topic: "kafka-topic".to_string(),
                client_log_level: None,
                client_params: serde_json::json!({}),
                enable_backfill_mode: false,
            }),
            transform_config: Some(TransformConfig {
                vrl_script: ".message = downcase(string!(.message))".to_string(),
                timezone: default_timezone(),
            }),
            input_format: SourceInputFormat::Json,
        }
    }

    fn assert_equality(&self, other: &Self) {
        assert_eq!(self, other);
    }
}

#[derive(
    Clone, Copy, Debug, Default, Eq, PartialEq, Serialize, Deserialize, Hash, utoipa::ToSchema,
)]
#[serde(rename_all = "snake_case")]
pub enum SourceInputFormat {
    #[default]
    Json,
    OtlpLogsJson,
    #[serde(alias = "otlp_logs_proto")]
    OtlpLogsProtobuf,
    #[serde(alias = "otlp_trace_json")]
    OtlpTracesJson,
    #[serde(
        alias = "otlp_trace_proto",
        alias = "otlp_trace_protobuf",
        alias = "otlp_traces_proto"
    )]
    OtlpTracesProtobuf,
    #[serde(alias = "plain")]
    PlainText,
}

impl FromStr for SourceInputFormat {
    type Err = String;

    fn from_str(format_str: &str) -> Result<Self, String> {
        match format_str {
            "json" => Ok(Self::Json),
            "plain" => Ok(Self::PlainText),
            unknown => Err(format!("unknown source input format: `{unknown}`")),
        }
    }
}

#[derive(Clone, Debug, Eq, PartialEq, Serialize, Deserialize, Hash, utoipa::ToSchema)]
#[serde(tag = "source_type", content = "params", rename_all = "snake_case")]
pub enum SourceParams {
    #[schema(value_type = FileSourceParamsForSerde)]
    File(FileSourceParams),
    Ingest,
    #[serde(rename = "ingest-api")]
    IngestApi,
    #[serde(rename = "ingest-cli")]
    IngestCli,
    Kafka(KafkaSourceParams),
    Kinesis(KinesisSourceParams),
    #[serde(rename = "pubsub")]
    PubSub(PubSubSourceParams),
    Pulsar(PulsarSourceParams),
    Stdin,
    Vec(VecSourceParams),
    Void(VoidSourceParams),
}

impl SourceParams {
    pub fn file_from_uri(uri: Uri) -> Self {
        Self::File(FileSourceParams::Filepath(uri))
    }

    pub fn file_from_str<P: AsRef<str>>(filepath: P) -> anyhow::Result<Self> {
        Uri::from_str(filepath.as_ref()).map(Self::file_from_uri)
    }

    pub fn stdin() -> Self {
        Self::Stdin
    }

    pub fn void() -> Self {
        Self::Void(VoidSourceParams)
    }

    fn source_type(&self) -> SourceType {
        match self {
            SourceParams::File(_) => SourceType::File,
            SourceParams::Ingest => SourceType::IngestV2,
            SourceParams::IngestApi => SourceType::IngestV1,
            SourceParams::IngestCli => SourceType::Cli,
            SourceParams::Kafka(_) => SourceType::Kafka,
            SourceParams::Kinesis(_) => SourceType::Kinesis,
            SourceParams::PubSub(_) => SourceType::PubSub,
            SourceParams::Pulsar(_) => SourceType::Pulsar,
            SourceParams::Stdin => SourceType::Stdin,
            SourceParams::Vec(_) => SourceType::Vec,
            SourceParams::Void(_) => SourceType::Void,
        }
    }

    fn validate_update(&self, new_source_params: &SourceParams) -> anyhow::Result<()> {
        match (self, new_source_params) {
            (
                SourceParams::File(FileSourceParams::Notifications(current)),
                SourceParams::File(FileSourceParams::Notifications(new)),
            ) => current.validate_update(new),
            (SourceParams::Kafka(current), SourceParams::Kafka(new)) => {
                current.validate_update(new)
            }
            (SourceParams::Kinesis(current), SourceParams::Kinesis(new)) => {
                current.validate_update(new)
            }
            (SourceParams::PubSub(current), SourceParams::PubSub(new)) => {
                current.validate_update(new)
            }
            (SourceParams::Pulsar(current), SourceParams::Pulsar(new)) => {
                current.validate_update(new)
            }
            (current, new) if current.source_type() != new.source_type() => Err(anyhow::anyhow!(
                "source type cannot be changed, current type {}",
                current.source_type(),
            )),
            _ => Err(anyhow::anyhow!(
                "source type {} cannot be updated",
                self.source_type(),
            )),
        }
    }
}

#[derive(Clone, Copy, Debug, Eq, PartialEq, Hash, Serialize, Deserialize, utoipa::ToSchema)]
#[serde(rename_all = "snake_case")]
pub enum FileSourceMessageType {
    /// See <https://docs.aws.amazon.com/AmazonS3/latest/userguide/notification-content-structure.html>
    S3Notification,
    /// A string with the URI of the file (e.g `s3://bucket/key`)
    RawUri,
}

#[derive(Clone, Debug, Eq, PartialEq, Hash, Serialize, Deserialize, utoipa::ToSchema)]
pub struct FileSourceSqs {
    pub queue_url: String,
    pub message_type: FileSourceMessageType,
    #[serde(default = "default_deduplication_window_duration_secs")]
    pub deduplication_window_duration_secs: u32,
    #[serde(default = "default_deduplication_window_max_messages")]
    pub deduplication_window_max_messages: u32,
    #[serde(default = "default_deduplication_cleanup_interval_secs")]
    pub deduplication_cleanup_interval_secs: u32,
}

fn default_deduplication_window_duration_secs() -> u32 {
    3600
}

fn default_deduplication_window_max_messages() -> u32 {
    100_000
}

fn default_deduplication_cleanup_interval_secs() -> u32 {
    60
}

#[derive(Clone, Debug, Eq, PartialEq, Hash, Serialize, Deserialize, utoipa::ToSchema)]
#[serde(tag = "type", rename_all = "snake_case")]
pub enum FileSourceNotification {
    Sqs(FileSourceSqs),
}

impl FileSourceNotification {
    fn validate_update(&self, other: &Self) -> anyhow::Result<()> {
        match (self, other) {
            (Self::Sqs(_), Self::Sqs(_)) => {
                // changing the queue or the deduplication settings should be fine
                Ok(())
            }
        }
    }
}

#[derive(Clone, Debug, Eq, PartialEq, Deserialize, Serialize, utoipa::ToSchema)]
#[serde(deny_unknown_fields)]
pub(super) struct FileSourceParamsForSerde {
    #[serde(default, skip_serializing_if = "Vec::is_empty")]
    notifications: Vec<FileSourceNotification>,
    #[serde(default, skip_serializing_if = "Option::is_none")]
    filepath: Option<String>,
}

#[derive(Clone, Debug, Eq, PartialEq, Hash, Serialize, Deserialize)]
#[serde(
    try_from = "FileSourceParamsForSerde",
    into = "FileSourceParamsForSerde"
)]
pub enum FileSourceParams {
    Notifications(FileSourceNotification),
    Filepath(Uri),
}

impl TryFrom<FileSourceParamsForSerde> for FileSourceParams {
    type Error = Cow<'static, str>;

    fn try_from(mut value: FileSourceParamsForSerde) -> Result<Self, Self::Error> {
        if value.filepath.is_some() && !value.notifications.is_empty() {
            return Err(
                "File source parameters `notifications` and `filepath` are mutually exclusive"
                    .into(),
            );
        }
        if let Some(filepath) = value.filepath {
            let uri = Uri::from_str(&filepath).map_err(|err| err.to_string())?;
            Ok(FileSourceParams::Filepath(uri))
        } else if value.notifications.len() == 1 {
            Ok(FileSourceParams::Notifications(
                value.notifications.remove(0),
            ))
        } else if value.notifications.len() > 1 {
            Err("Only one notification can be specified for now".into())
        } else {
            Err(
                "Either `notifications` or `filepath` must be specified as file source parameters"
                    .into(),
            )
        }
    }
}

impl From<FileSourceParams> for FileSourceParamsForSerde {
    fn from(value: FileSourceParams) -> Self {
        match value {
            FileSourceParams::Filepath(uri) => Self {
                filepath: Some(uri.to_string()),
                notifications: vec![],
            },
            FileSourceParams::Notifications(notification) => Self {
                filepath: None,
                notifications: vec![notification],
            },
        }
    }
}

impl FileSourceParams {
    pub fn from_filepath<P: AsRef<str>>(filepath: P) -> anyhow::Result<Self> {
        Uri::from_str(filepath.as_ref()).map(Self::Filepath)
    }
}

#[derive(Clone, Debug, Eq, PartialEq, Hash, Serialize, Deserialize, utoipa::ToSchema)]
#[serde(deny_unknown_fields)]
pub struct KafkaSourceParams {
    /// Name of the topic that the source consumes.
    pub topic: String,
    /// Kafka client log level. Possible values are `debug`, `info`, `warn`, and `error`.
    #[schema(value_type = String)]
    #[serde(skip_serializing_if = "Option::is_none")]
    pub client_log_level: Option<String>,
    /// Kafka client configuration parameters.
    #[schema(value_type = Object)]
    #[serde(default = "serde_json::Value::default")]
    #[serde(skip_serializing_if = "serde_json::Value::is_null")]
    pub client_params: JsonValue,
    /// When backfill mode is enabled, the source exits after reaching the end of the topic.
    #[serde(default)]
    #[serde(skip_serializing_if = "is_false")]
    pub enable_backfill_mode: bool,
}

impl KafkaSourceParams {
    fn validate_update(&self, other: &Self) -> anyhow::Result<()> {
        // Updating the topic would likely mess up the checkpoints because the
        // Kafka partition IDs are used as metastore checkpoint PartitionId
        // and there uniqueness is not guaranteed across topics.
        ensure!(self.topic == other.topic, "Kafka topic cannot be updated");
        Ok(())
    }
}

#[derive(Clone, Debug, Eq, PartialEq, Hash, Serialize, Deserialize, utoipa::ToSchema)]
#[serde(deny_unknown_fields)]
pub struct PubSubSourceParams {
    /// Name of the subscription that the source consumes.
    pub subscription: String,
    /// When backfill mode is enabled, the source exits after reaching the end of the topic.
    #[serde(default)]
    #[serde(skip_serializing_if = "is_false")]
    pub enable_backfill_mode: bool,
    /// GCP service account credentials (`None` will use default via
    /// GOOGLE_APPLICATION_CREDENTIALS)
    /// Path to a google_cloud_auth::credentials::CredentialsFile serialized in JSON. See also
    /// `<https://cloud.google.com/docs/authentication/application-default-credentials>` and
    /// `<https://github.com/yoshidan/google-cloud-rust/tree/main/pubsub#automatically>` and
    /// `<https://docs.rs/google-cloud-auth/0.12.0/google_cloud_auth/credentials/struct.CredentialsFile.html>`.
    pub credentials_file: Option<String>,
    /// GCP project ID (Defaults to credentials file project ID).
    pub project_id: Option<String>,
    /// Maximum number of messages returned by a pull request (default 1,000)
    pub max_messages_per_pull: Option<i32>,
}

impl PubSubSourceParams {
    fn validate_update(&self, _other: &Self) -> anyhow::Result<()> {
        // experimental source, no validation is performed
        Ok(())
    }
}

#[derive(Clone, Debug, Eq, PartialEq, Hash, Serialize, Deserialize, utoipa::ToSchema)]
#[serde(rename_all = "lowercase")]
pub enum RegionOrEndpoint {
    Region(String),
    Endpoint(String),
}

#[derive(Clone, Debug, Eq, PartialEq, Hash, Serialize, Deserialize, utoipa::ToSchema)]
#[serde(try_from = "KinesisSourceParamsInner")]
pub struct KinesisSourceParams {
    pub stream_name: String,
    #[serde(flatten)]
    pub region_or_endpoint: Option<RegionOrEndpoint>,
    /// When backfill mode is enabled, the source exits after reaching the end of the stream.
    #[serde(skip_serializing_if = "is_false")]
    pub enable_backfill_mode: bool,
}

impl KinesisSourceParams {
    fn validate_update(&self, other: &Self) -> anyhow::Result<()> {
        // Changing the stream would likely mess up the checkpoints because the
        // Kinesis shard IDs are used as metastore checkpoint PartitionId, and
        // there uniqueness is only guaranteed within a stream.
        ensure!(
            self.stream_name == other.stream_name,
            "Kinesis stream_name cannot be updated"
        );
        ensure!(
            self.region_or_endpoint == other.region_or_endpoint,
            "Kinesis region or endpoint cannot be updated"
        );
        Ok(())
    }
}

#[derive(Clone, Debug, Eq, PartialEq, Deserialize)]
#[serde(deny_unknown_fields)]
struct KinesisSourceParamsInner {
    pub stream_name: String,
    pub region: Option<String>,
    pub endpoint: Option<String>,
    #[serde(default)]
    pub enable_backfill_mode: bool,
}

impl TryFrom<KinesisSourceParamsInner> for KinesisSourceParams {
    type Error = &'static str;

    fn try_from(value: KinesisSourceParamsInner) -> Result<Self, Self::Error> {
        if value.region.is_some() && value.endpoint.is_some() {
            return Err("Kinesis source parameters `region` and `endpoint` are mutually exclusive");
        }
        let region = value.region.map(RegionOrEndpoint::Region);
        let endpoint = value.endpoint.map(RegionOrEndpoint::Endpoint);
        let region_or_endpoint = region.or(endpoint);

        Ok(KinesisSourceParams {
            stream_name: value.stream_name,
            region_or_endpoint,
            enable_backfill_mode: value.enable_backfill_mode,
        })
    }
}

#[derive(Clone, Debug, Default, Eq, PartialEq, Hash, Serialize, Deserialize, utoipa::ToSchema)]
#[serde(deny_unknown_fields)]
pub struct VecSourceParams {
    #[schema(value_type = Vec<String>)]
    pub docs: Vec<Bytes>,
    pub batch_num_docs: usize,
    #[serde(default)]
    pub partition: String,
}

#[derive(Clone, Debug, Eq, PartialEq, Hash, Serialize, Deserialize, utoipa::ToSchema)]
#[serde(deny_unknown_fields)]
pub struct VoidSourceParams;

#[derive(
    Clone, Debug, Eq, PartialEq, Hash, serde::Serialize, serde::Deserialize, utoipa::ToSchema,
)]
#[serde(deny_unknown_fields)]
pub struct PulsarSourceParams {
    /// List of the topics that the source consumes.
    pub topics: Vec<String>,
    #[serde(deserialize_with = "pulsar_uri")]
    /// The connection URI for pulsar.
    pub address: String,
    #[schema(default = "quickwit")]
    #[serde(default = "default_consumer_name")]
    /// The name to register with the pulsar source.
    pub consumer_name: String,
    // Serde yaml has some specific behaviour when deserializing
    // enums (see https://github.com/dtolnay/serde-yaml/issues/342)
    // and requires explicitly stating `default` in order to make the parameter
    // optional on the yaml config.
    #[serde(default, with = "serde_yaml::with::singleton_map")]
    /// Authentication for pulsar.
    pub authentication: Option<PulsarSourceAuth>,
}

impl PulsarSourceParams {
    fn validate_update(&self, _other: &Self) -> anyhow::Result<()> {
        // In the Pulsar source, we use use combinations of the topic+partition
        // (generated by the Pulsar client library) as metastore checkpoint
        // PartitionId, and those are "guaranteed" to be unique across topics.
        Ok(())
    }
}

#[derive(
    Clone, Debug, Eq, PartialEq, Hash, serde::Serialize, serde::Deserialize, utoipa::ToSchema,
)]
#[serde(rename_all = "lowercase")]
pub enum PulsarSourceAuth {
    Token(String),
    Oauth2 {
        issuer_url: String,
        credentials_url: String,
        audience: Option<String>,
        scope: Option<String>,
    },
}

// Deserializing a string into an pulsar uri.
fn pulsar_uri<'de, D>(deserializer: D) -> Result<String, D::Error>
where D: Deserializer<'de> {
    let uri: String = Deserialize::deserialize(deserializer)?;
    let re: Regex = Regex::new(r"pulsar(\+ssl)?://.*").expect("regular expression should compile");

    if !re.is_match(uri.as_str()) {
        return Err(Error::custom(format!(
            "invalid Pulsar uri provided, must be in the format of `pulsar://host:port/path`. \
             got: `{uri}`"
        )));
    }

    Ok(uri)
}

fn default_consumer_name() -> String {
    "quickwit".to_string()
}

#[derive(Clone, Debug, Serialize, Deserialize, PartialEq, Eq, Hash, utoipa::ToSchema)]
#[serde(deny_unknown_fields)]
pub struct TransformConfig {
    /// [VRL] source code of the transform compiled to a VRL [`Program`](vrl::compiler::Program).
    ///
    /// [VRL]: https://vector.dev/docs/reference/vrl/
    #[serde(rename = "script")]
    vrl_script: String,

    /// Timezone used in the VRL [`Program`](vrl::compiler::Program) for date and time
    /// manipulations. Defaults to `UTC` if not timezone is specified.
    #[serde(default = "default_timezone")]
    timezone: String,
}

fn default_timezone() -> String {
    "UTC".to_string()
}

impl TransformConfig {
    /// Creates a new [`TransformConfig`] instance from the provided VRL script and optional
    /// timezone.
    pub fn new(vrl_script: String, timezone_opt: Option<String>) -> Self {
        Self {
            vrl_script,
            timezone: timezone_opt.unwrap_or_else(default_timezone),
        }
    }

    #[cfg(feature = "vrl")]
    pub(crate) fn validate_vrl_script(&self) -> anyhow::Result<()> {
        self.compile_vrl_script()?;
        Ok(())
    }

    #[cfg(not(feature = "vrl"))]
    pub(crate) fn validate_vrl_script(&self) -> anyhow::Result<()> {
        // If we are missing the VRL feature we do not return an error here,
        // to avoid breaking unit tests.
        //
        // We do return an explicit error on instantiation of the program however.
        Ok(())
    }

    #[cfg(feature = "vrl")]
    /// Compiles the VRL script to a VRL [`Program`](vrl::compiler::Program) and returns it along
    /// with the timezone.
    pub fn compile_vrl_script(
        &self,
    ) -> anyhow::Result<(vrl::compiler::Program, vrl::compiler::TimeZone)> {
        use anyhow::Context;
        let timezone = vrl::compiler::TimeZone::parse(&self.timezone).with_context(|| {
            format!(
                "failed to parse timezone: `{}`. timezone must be a valid name \
            in the TZ database: https://en.wikipedia.org/wiki/List_of_tz_database_time_zones",
                self.timezone,
            )
        })?;
        // Append "\n." to the script to return the entire document and not only the modified
        // fields.
        let vrl_script = self.vrl_script.clone() + "\n.";
        let functions = vrl::stdlib::all();

        let compilation_res = match vrl::compiler::compile(&vrl_script, &functions) {
            Ok(compilation_res) => compilation_res,
            Err(diagnostics) => {
                let mut formatter = vrl::diagnostic::Formatter::new(&vrl_script, diagnostics);
                formatter.enable_colors(!quickwit_common::no_color());
                anyhow::bail!("failed to compile VRL script:\n {formatter}")
            }
        };

        let vrl::compiler::CompilationResult {
            program, warnings, ..
        } = compilation_res;

        if !warnings.is_empty() {
            let mut formatter = vrl::diagnostic::Formatter::new(&vrl_script, warnings);
            formatter.enable_colors(!quickwit_common::no_color());
            tracing::warn!("VRL program compiled with some warnings: {formatter}");
        }
        Ok((program, timezone))
    }

    #[cfg(any(test, feature = "testsuite"))]
    pub fn for_test(vrl_script: &str) -> Self {
        Self {
            vrl_script: vrl_script.to_string(),
            timezone: default_timezone(),
        }
    }
}

#[cfg(test)]
mod tests {
    use std::num::NonZero;
    use std::str::FromStr;

    use quickwit_common::uri::Uri;
    use serde_json::json;

    use super::*;
    use crate::source_config::RegionOrEndpoint;
    use crate::{ConfigFormat, FileSourceParams, KinesisSourceParams};

    fn get_source_config_filepath(source_config_filename: &str) -> String {
        format!(
            "{}/resources/tests/source_config/{}",
            env!("CARGO_MANIFEST_DIR"),
            source_config_filename
        )
    }

    #[tokio::test]
    async fn test_load_kafka_source_config() {
        let source_config_filepath = get_source_config_filepath("kafka-source.json");
        let file_content = std::fs::read_to_string(&source_config_filepath).unwrap();
        let source_config_uri = Uri::from_str(&source_config_filepath).unwrap();
        let config_format = ConfigFormat::sniff_from_uri(&source_config_uri).unwrap();
        let source_config =
            load_source_config_from_user_config(config_format, file_content.as_bytes()).unwrap();
        let expected_source_config = SourceConfig {
            source_id: "hdfs-logs-kafka-source".to_string(),
            num_pipelines: NonZeroUsize::new(2).unwrap(),
            enabled: true,
            source_params: SourceParams::Kafka(KafkaSourceParams {
                topic: "cloudera-cluster-logs".to_string(),
                client_log_level: None,
                client_params: json! {{"bootstrap.servers": "localhost:9092"}},
                enable_backfill_mode: false,
            }),
            transform_config: Some(TransformConfig {
                vrl_script: ".message = downcase(string!(.message))".to_string(),
                timezone: "local".to_string(),
            }),
            input_format: SourceInputFormat::Json,
        };
        assert_eq!(source_config, expected_source_config);
        assert_eq!(source_config.num_pipelines.get(), 2);
    }

    #[test]
    fn test_kafka_source_params_serialization() {
        {
            let params = KafkaSourceParams {
                topic: "my-topic".to_string(),
                client_log_level: None,
                client_params: json!(null),
                enable_backfill_mode: false,
            };
            let params_yaml = serde_yaml::to_string(&params).unwrap();

            assert_eq!(
                serde_yaml::from_str::<KafkaSourceParams>(&params_yaml).unwrap(),
                params,
            )
        }
        {
            let params = KafkaSourceParams {
                topic: "my-topic".to_string(),
                client_log_level: Some("info".to_string()),
                client_params: json! {{"bootstrap.servers": "localhost:9092"}},
                enable_backfill_mode: false,
            };
            let params_yaml = serde_yaml::to_string(&params).unwrap();

            assert_eq!(
                serde_yaml::from_str::<KafkaSourceParams>(&params_yaml).unwrap(),
                params,
            )
        }
    }

    #[test]
    fn test_kafka_source_params_deserialization() {
        {
            let yaml = r#"
                    topic: my-topic
                "#;
            assert_eq!(
                serde_yaml::from_str::<KafkaSourceParams>(yaml).unwrap(),
                KafkaSourceParams {
                    topic: "my-topic".to_string(),
                    client_log_level: None,
                    client_params: json!(null),
                    enable_backfill_mode: false,
                }
            );
        }
        {
            let yaml = r#"
                    topic: my-topic
                    client_log_level: info
                    client_params:
                        bootstrap.servers: localhost:9092
                    enable_backfill_mode: true
                "#;
            assert_eq!(
                serde_yaml::from_str::<KafkaSourceParams>(yaml).unwrap(),
                KafkaSourceParams {
                    topic: "my-topic".to_string(),
                    client_log_level: Some("info".to_string()),
                    client_params: json! {{"bootstrap.servers": "localhost:9092"}},
                    enable_backfill_mode: true,
                }
            );
        }
    }

    #[tokio::test]
    async fn test_load_kinesis_source_config() {
        let source_config_filepath = get_source_config_filepath("kinesis-source.yaml");
        let file_content = std::fs::read_to_string(&source_config_filepath).unwrap();
        let source_config_uri = Uri::from_str(&source_config_filepath).unwrap();
        let config_format = ConfigFormat::sniff_from_uri(&source_config_uri).unwrap();
        let source_config =
            load_source_config_from_user_config(config_format, file_content.as_bytes()).unwrap();
        let expected_source_config = SourceConfig {
            source_id: "hdfs-logs-kinesis-source".to_string(),
            num_pipelines: NonZeroUsize::MIN,
            enabled: true,
            source_params: SourceParams::Kinesis(KinesisSourceParams {
                stream_name: "emr-cluster-logs".to_string(),
                region_or_endpoint: None,
                enable_backfill_mode: false,
            }),
            transform_config: Some(TransformConfig {
                vrl_script: ".message = downcase(string!(.message))".to_string(),
                timezone: "local".to_string(),
            }),
            input_format: SourceInputFormat::Json,
        };
        assert_eq!(source_config, expected_source_config);
        assert_eq!(source_config.num_pipelines.get(), 1);
    }

    #[tokio::test]
    async fn test_load_invalid_source_config() {
        {
            let content = r#"
            {
                "version": "0.7",
                "source_id": "hdfs-logs-void-source",
                "desired_num_pipelines": 0,
                "max_num_pipelines_per_indexer": 1,
                "source_type": "void",
                "params": {}
            }
            "#;
            let error = load_source_config_from_user_config(ConfigFormat::Json, content.as_bytes())
                .unwrap_err();
            assert!(
                error
                    .to_string()
                    .contains("`desired_num_pipelines` must be")
            );
        }
        // {
        //     let content = r#"
        //     {
        //         "version": "0.7",
        //         "source_id": "hdfs-logs-void-source",
        //         "desired_num_pipelines": 1,
        //         "max_num_pipelines_per_indexer": 0,
        //         "source_type": "void",
        //         "params": {}
        //     }
        //     "#;
        //     let error = load_source_config_from_user_config(ConfigFormat::Json,
        // content.as_bytes())         .unwrap_err();
        //     assert!(error
        //         .to_string()
        //         .contains("`max_num_pipelines_per_indexer` must be"));
        // }
        {
            let content = r#"
            {
                "version": "0.8",
                "source_id": "hdfs-logs-void-source",
                "num_pipelines": 2,
                "source_type": "void",
                "params": {}
            }
            "#;
            let error = load_source_config_from_user_config(ConfigFormat::Json, content.as_bytes())
                .unwrap_err();
            assert!(error.to_string().contains("supports multiple pipelines"));
        }
        {
            let content = r#"
            {
                "version": "0.7",
                "source_id": "hdfs-logs-void-source",
                "desired_num_pipelines": 2,
                "max_num_pipelines_per_indexer": 1,
                "source_type": "void",
                "params": {}
            }
            "#;
            let error = load_source_config_from_user_config(ConfigFormat::Json, content.as_bytes())
                .unwrap_err();
            assert!(error.to_string().contains("supports multiple pipelines"));
        }
    }

    #[tokio::test]
    async fn test_load_valid_distributed_source_config_0_7() {
        {
            let content = r#"
            {
                "version": "0.7",
                "source_id": "hdfs-logs-kafka-source",
                "desired_num_pipelines": 3,
                "max_num_pipelines_per_indexer": 3,
                "source_type": "kafka",
                "params": {
                    "topic": "my-topic"
                }
            }
            "#;
            let source_config =
                load_source_config_from_user_config(ConfigFormat::Json, content.as_bytes())
                    .unwrap();
            assert_eq!(source_config.num_pipelines.get(), 3);
        }
        {
            let content = r#"
            {
                "version": "0.7",
                "source_id": "hdfs-logs-pulsar-source",
                "desired_num_pipelines": 3,
                "max_num_pipelines_per_indexer": 3,
                "source_type": "pulsar",
                "params": {
                    "topics": ["my-topic"],
                    "address": "http://localhost:6650"
                }
            }
            "#;
            load_source_config_from_user_config(ConfigFormat::Json, content.as_bytes())
                .unwrap_err();
            // TODO: uncomment asserts once distributed indexing is activated for pulsar.
            // assert_eq!(source_config.num_pipelines(), 3);
            // assert_eq!(source_config.max_num_pipelines_per_indexer(), 3);
        }
    }

    #[tokio::test]
    async fn test_load_valid_distributed_source_config() {
        {
            let content = r#"
            {
                "version": "0.8",
                "source_id": "hdfs-logs-kafka-source",
                "num_pipelines": 3,
                "source_type": "kafka",
                "params": {
                    "topic": "my-topic"
                }
            }
            "#;
            let source_config =
                load_source_config_from_user_config(ConfigFormat::Json, content.as_bytes())
                    .unwrap();
            assert_eq!(source_config.num_pipelines.get(), 3);
        }
    }

    #[test]
    fn test_file_source_params_serde() {
        {
            let yaml = r#"
                filepath: source-path.json
            "#;
            let file_params_deserialized = serde_yaml::from_str::<FileSourceParams>(yaml).unwrap();
            let uri = Uri::from_str("source-path.json").unwrap();
            assert_eq!(file_params_deserialized, FileSourceParams::Filepath(uri));
            let file_params_reserialized = serde_json::to_value(file_params_deserialized).unwrap();
            file_params_reserialized
                .get("filepath")
                .unwrap()
                .as_str()
                .unwrap()
                .contains("source-path.json");
        }
        {
            let yaml = r#"
                notifications:
                  - type: sqs
                    queue_url: https://sqs.us-east-1.amazonaws.com/123456789012/queue-name
                    message_type: s3_notification
            "#;
            let file_params_deserialized = serde_yaml::from_str::<FileSourceParams>(yaml).unwrap();
            assert_eq!(
                file_params_deserialized,
                FileSourceParams::Notifications(FileSourceNotification::Sqs(FileSourceSqs {
                    queue_url: "https://sqs.us-east-1.amazonaws.com/123456789012/queue-name"
                        .to_string(),
                    message_type: FileSourceMessageType::S3Notification,
                    deduplication_window_duration_secs: default_deduplication_window_duration_secs(
                    ),
                    deduplication_window_max_messages: default_deduplication_window_max_messages(),
                    deduplication_cleanup_interval_secs:
                        default_deduplication_cleanup_interval_secs()
                })),
            );
            let file_params_reserialized = serde_json::to_value(&file_params_deserialized).unwrap();
            assert_eq!(
                file_params_reserialized,
                json!({"notifications": [{
                    "type": "sqs",
                    "queue_url": "https://sqs.us-east-1.amazonaws.com/123456789012/queue-name",
                    "message_type": "s3_notification",
                    "deduplication_window_duration_secs": default_deduplication_window_duration_secs(),
                    "deduplication_window_max_messages": default_deduplication_window_max_messages(),
                    "deduplication_cleanup_interval_secs": default_deduplication_cleanup_interval_secs(),
                }]})
            );
        }
        {
            let yaml = r#"
                filepath: source-path.json
                notifications:
                  - type: sqs
                    queue_url: https://sqs.us-east-1.amazonaws.com/123456789012/queue-name
                    message_type: s3_notification
            "#;
            let error = serde_yaml::from_str::<FileSourceParams>(yaml).unwrap_err();
            assert_eq!(
                error.to_string(),
                "File source parameters `notifications` and `filepath` are mutually exclusive"
            );
        }
        {
            let yaml = r#"
                notifications:
                  - type: sqs
                    queue_url: https://sqs.us-east-1.amazonaws.com/123456789012/queue1
                    message_type: s3_notification
                  - type: sqs
                    queue_url: https://sqs.us-east-1.amazonaws.com/123456789012/queue2
                    message_type: s3_notification
            "#;
            let error = serde_yaml::from_str::<FileSourceParams>(yaml).unwrap_err();
            assert_eq!(
                error.to_string(),
                "Only one notification can be specified for now"
            );
        }
        {
            let json = r#"
            {
                "notifications": [
                    {
                        "queue_url": "https://sqs.us-east-1.amazonaws.com/123456789012/queue",
                        "message_type": "s3_notification"
                    }
                ]
            }
            "#;
            let error = serde_json::from_str::<FileSourceParams>(json).unwrap_err();
            assert!(error.to_string().contains("missing field `type`"));
        }
    }

    #[test]
    fn test_kinesis_source_params_serialization() {
        {
            let params = KinesisSourceParams {
                stream_name: "my-stream".to_string(),
                region_or_endpoint: None,
                enable_backfill_mode: false,
            };
            let params_yaml = serde_yaml::to_string(&params).unwrap();

            assert_eq!(
                serde_yaml::from_str::<KinesisSourceParams>(&params_yaml).unwrap(),
                params,
            )
        }
        {
            let params = KinesisSourceParams {
                stream_name: "my-stream".to_string(),
                region_or_endpoint: Some(RegionOrEndpoint::Region("us-west-1".to_string())),
                enable_backfill_mode: false,
            };
            let params_yaml = serde_yaml::to_string(&params).unwrap();

            assert_eq!(
                serde_yaml::from_str::<KinesisSourceParams>(&params_yaml).unwrap(),
                params,
            )
        }
        {
            let params = KinesisSourceParams {
                stream_name: "my-stream".to_string(),
                region_or_endpoint: Some(RegionOrEndpoint::Endpoint(
                    "https://localhost:4566".to_string(),
                )),
                enable_backfill_mode: false,
            };
            let params_yaml = serde_yaml::to_string(&params).unwrap();

            assert_eq!(
                ConfigFormat::Yaml
                    .parse::<KinesisSourceParams>(params_yaml.as_bytes())
                    .unwrap(),
                params,
            )
        }
    }

    #[test]
    fn test_kinesis_source_params_deserialization() {
        {
            let yaml = r#"
                    stream_name: my-stream
                "#;
            assert_eq!(
                serde_yaml::from_str::<KinesisSourceParams>(yaml).unwrap(),
                KinesisSourceParams {
                    stream_name: "my-stream".to_string(),
                    region_or_endpoint: None,
                    enable_backfill_mode: false,
                }
            );
        }
        {
            let yaml = r#"
                    stream_name: my-stream
                    region: us-west-1
                    enable_backfill_mode: true
                "#;
            assert_eq!(
                serde_yaml::from_str::<KinesisSourceParams>(yaml).unwrap(),
                KinesisSourceParams {
                    stream_name: "my-stream".to_string(),
                    region_or_endpoint: Some(RegionOrEndpoint::Region("us-west-1".to_string())),
                    enable_backfill_mode: true,
                }
            );
        }
        {
            let yaml = r#"
                    stream_name: my-stream
                    region: us-west-1
                    endpoint: https://localhost:4566
                "#;
            let error = serde_yaml::from_str::<KinesisSourceParams>(yaml).unwrap_err();
            assert!(error.to_string().starts_with("Kinesis source parameters "));
        }
    }

    #[test]
    fn test_pulsar_source_params_deserialization() {
        {
            let yaml = r#"
                    topics:
                        - my-topic
                    address: pulsar://localhost:6560
                    consumer_name: my-pulsar-consumer
                "#;
            assert_eq!(
                serde_yaml::from_str::<PulsarSourceParams>(yaml).unwrap(),
                PulsarSourceParams {
                    topics: vec!["my-topic".to_string()],
                    address: "pulsar://localhost:6560".to_string(),
                    consumer_name: "my-pulsar-consumer".to_string(),
                    authentication: None,
                }
            );
        }

        {
            let yaml = r#"
                    topics:
                        - my-topic
                    address: pulsar://localhost:6560
                    consumer_name: my-pulsar-consumer
                    authentication:
                        token: my-token
                "#;
            assert_eq!(
                serde_yaml::from_str::<PulsarSourceParams>(yaml).unwrap(),
                PulsarSourceParams {
                    topics: vec!["my-topic".to_string()],
                    address: "pulsar://localhost:6560".to_string(),
                    consumer_name: "my-pulsar-consumer".to_string(),
                    authentication: Some(PulsarSourceAuth::Token("my-token".to_string())),
                }
            );
        }

        {
            let yaml = r#"
                    topics:
                        - my-topic
                    address: pulsar://localhost:6560
                    consumer_name: my-pulsar-consumer
                    authentication:
                        oauth2:
                            issuer_url: https://my-issuer:9000/path
                            credentials_url: https://my-credentials.com/path
                "#;
            assert_eq!(
                serde_yaml::from_str::<PulsarSourceParams>(yaml).unwrap(),
                PulsarSourceParams {
                    topics: vec!["my-topic".to_string()],
                    address: "pulsar://localhost:6560".to_string(),
                    consumer_name: "my-pulsar-consumer".to_string(),
                    authentication: Some(PulsarSourceAuth::Oauth2 {
                        issuer_url: "https://my-issuer:9000/path".to_string(),
                        credentials_url: "https://my-credentials.com/path".to_string(),
                        audience: None,
                        scope: None,
                    }),
                }
            );
        }

        {
            let yaml = r#"
                    topics:
                        - my-topic
                    address: pulsar://localhost:6560
                    consumer_name: my-pulsar-consumer
                    authentication:
                        oauth2:
                            issuer_url: https://my-issuer:9000/path
                            credentials_url: https://my-credentials.com/path
                            audience: my-audience
                            scope: "read+write"
                "#;
            assert_eq!(
                serde_yaml::from_str::<PulsarSourceParams>(yaml).unwrap(),
                PulsarSourceParams {
                    topics: vec!["my-topic".to_string()],
                    address: "pulsar://localhost:6560".to_string(),
                    consumer_name: "my-pulsar-consumer".to_string(),
                    authentication: Some(PulsarSourceAuth::Oauth2 {
                        issuer_url: "https://my-issuer:9000/path".to_string(),
                        credentials_url: "https://my-credentials.com/path".to_string(),
                        audience: Some("my-audience".to_string()),
                        scope: Some("read+write".to_string()),
                    }),
                }
            );
        }

        {
            let yaml = r#"
                    topics:
                        - my-topic
                "#;
            serde_yaml::from_str::<PulsarSourceParams>(yaml)
                .expect_err("Parameters should error on missing address");
        }

        {
            let yaml = r#"
                    topics:
                        - my-topic
                    address: pulsar://localhost:6560
                "#;
            assert_eq!(
                serde_yaml::from_str::<PulsarSourceParams>(yaml).unwrap(),
                PulsarSourceParams {
                    topics: vec!["my-topic".to_string()],
                    address: "pulsar://localhost:6560".to_string(),
                    consumer_name: default_consumer_name(),
                    authentication: None,
                }
            );
        }

        {
            let yaml = r#"
                    topics:
                        - my-topic
                    address: invalid-address
                "#;
            serde_yaml::from_str::<PulsarSourceParams>(yaml)
                .expect_err("Pulsar config should reject invalid address");
        }

        {
            let yaml = r#"
                    topics:
                        - my-topic
                    address: pulsar://some-host:80/valid-path
                "#;
            assert_eq!(
                serde_yaml::from_str::<PulsarSourceParams>(yaml).unwrap(),
                PulsarSourceParams {
                    topics: vec!["my-topic".to_string()],
                    address: "pulsar://some-host:80/valid-path".to_string(),
                    consumer_name: default_consumer_name(),
                    authentication: None,
                }
            );
        }

        {
            let yaml = r#"
                    topics:
                        - my-topic
                    address: pulsar://2345:0425:2CA1:0000:0000:0567:5673:23b5:80/valid-path
                "#;
            assert_eq!(
                serde_yaml::from_str::<PulsarSourceParams>(yaml).unwrap(),
                PulsarSourceParams {
                    topics: vec!["my-topic".to_string()],
                    address: "pulsar://2345:0425:2CA1:0000:0000:0567:5673:23b5:80/valid-path"
                        .to_string(),
                    consumer_name: default_consumer_name(),
                    authentication: None,
                }
            );
        }
    }

    #[cfg(feature = "vrl")]
    #[tokio::test]
    async fn test_load_ingest_api_source_config() {
        let source_config_filepath = get_source_config_filepath("ingest-api-source.json");
        let file_content = std::fs::read(source_config_filepath).unwrap();
        let source_config: SourceConfig = ConfigFormat::Json.parse(&file_content).unwrap();
        let expected_source_config = SourceConfig {
            source_id: INGEST_API_SOURCE_ID.to_string(),
            num_pipelines: NonZeroUsize::MIN,
            enabled: true,
            source_params: SourceParams::IngestApi,
            transform_config: Some(TransformConfig {
                vrl_script: ".message = downcase(string!(.message))".to_string(),
                timezone: default_timezone(),
            }),
            input_format: SourceInputFormat::Json,
        };
        assert_eq!(source_config, expected_source_config);
        assert_eq!(source_config.num_pipelines.get(), 1);
    }

    #[test]
    fn test_transform_config_serialization() {
        {
            let transform_config = TransformConfig {
                vrl_script: ".message = downcase(string!(.message))".to_string(),
                timezone: "local".to_string(),
            };
            let transform_config_yaml = serde_yaml::to_string(&transform_config).unwrap();
            assert_eq!(
                serde_yaml::from_str::<TransformConfig>(&transform_config_yaml).unwrap(),
                transform_config,
            );
        }
        {
            let transform_config = TransformConfig {
                vrl_script: ".message = downcase(string!(.message))".to_string(),
                timezone: default_timezone(),
            };
            let transform_config_yaml = serde_yaml::to_string(&transform_config).unwrap();
            assert_eq!(
                serde_yaml::from_str::<TransformConfig>(&transform_config_yaml).unwrap(),
                transform_config,
            );
        }
    }

    #[test]
    fn test_transform_config_deserialization() {
        {
            let transform_config_yaml = r#"
                script: .message = downcase(string!(.message))
            "#;
            let transform_config =
                serde_yaml::from_str::<TransformConfig>(transform_config_yaml).unwrap();

            let expected_transform_config = TransformConfig {
                vrl_script: ".message = downcase(string!(.message))".to_string(),
                timezone: default_timezone(),
            };
            assert_eq!(transform_config, expected_transform_config);
        }
        {
            let transform_config_yaml = r#"
                script: .message = downcase(string!(.message))
                timezone: Turkey
            "#;
            let transform_config =
                serde_yaml::from_str::<TransformConfig>(transform_config_yaml).unwrap();

            let expected_transform_config = TransformConfig {
                vrl_script: ".message = downcase(string!(.message))".to_string(),
                timezone: "Turkey".to_string(),
            };
            assert_eq!(transform_config, expected_transform_config);
        }
    }

    #[cfg(feature = "vrl")]
    #[test]
    fn test_transform_config_compile_vrl_script() {
        {
            let transform_config = TransformConfig {
                vrl_script: ".message = downcase(string!(.message))".to_string(),
                timezone: "Turkey".to_string(),
            };
            transform_config.compile_vrl_script().unwrap();
        }
        {
            let transform_config = TransformConfig {
                vrl_script: r#"
                . = parse_json!(string!(.message))
                .timestamp = to_unix_timestamp(timestamp!(.timestamp))
                del(.username)
                .message = downcase(string!(.message))
                "#
                .to_string(),
                timezone: default_timezone(),
            };
            transform_config.compile_vrl_script().unwrap();
        }
        {
            let transform_config = TransformConfig {
                vrl_script: ".message = downcase(string!(.message))".to_string(),
                timezone: "foo".to_string(),
            };
            let error = transform_config.compile_vrl_script().unwrap_err();
            assert!(error.to_string().starts_with("failed to parse timezone"));
        }
        {
            let transform_config = TransformConfig {
                vrl_script: "foo".to_string(),
                timezone: "Turkey".to_string(),
            };
            let error = transform_config.compile_vrl_script().unwrap_err();
            assert!(error.to_string().starts_with("failed to compile"));
        }
    }

    #[tokio::test]
    async fn test_source_config_plain_text_input_format() {
        let file_content = r#"{
            "version": "0.7",
            "source_id": "logs-file-source",
            "desired_num_pipelines": 1,
            "max_num_pipelines_per_indexer": 1,
            "source_type": "file",
            "params": {
              "filepath": "s3://mybucket/test_non_json_corpus.txt"
            },
            "input_format": "plain_text"
        }"#;
        let source_config =
            load_source_config_from_user_config(ConfigFormat::Json, file_content.as_bytes())
                .unwrap();
        assert_eq!(source_config.input_format, SourceInputFormat::PlainText);
    }

    #[tokio::test]
    async fn test_update_kafka_source_config() {
        let source_config_filepath = get_source_config_filepath("kafka-source.json");
        let file_content = std::fs::read(&source_config_filepath).unwrap();
        let source_config_uri = Uri::from_str(&source_config_filepath).unwrap();
        let config_format = ConfigFormat::sniff_from_uri(&source_config_uri).unwrap();
        {
            let mut existing_source_config =
                load_source_config_from_user_config(config_format, &file_content).unwrap();
            existing_source_config.num_pipelines = NonZero::new(4).unwrap();
            let new_source_config =
                load_source_config_update(config_format, &file_content, &existing_source_config)
                    .unwrap();

            let expected_source_config = SourceConfig {
                source_id: "hdfs-logs-kafka-source".to_string(),
                num_pipelines: NonZeroUsize::new(2).unwrap(),
                enabled: true,
                source_params: SourceParams::Kafka(KafkaSourceParams {
                    topic: "cloudera-cluster-logs".to_string(),
                    client_log_level: None,
                    client_params: json! {{"bootstrap.servers": "localhost:9092"}},
                    enable_backfill_mode: false,
                }),
                transform_config: Some(TransformConfig {
                    vrl_script: ".message = downcase(string!(.message))".to_string(),
                    timezone: "local".to_string(),
                }),
                input_format: SourceInputFormat::Json,
            };
            assert_eq!(new_source_config, expected_source_config);
            assert_eq!(new_source_config.num_pipelines.get(), 2);
        }
        {
            // the source type cannot be updated
            let mut existing_source_config =
                load_source_config_from_user_config(config_format, &file_content).unwrap();
            existing_source_config.source_params = SourceParams::Kinesis(KinesisSourceParams {
                stream_name: "my-stream".to_string(),
                region_or_endpoint: None,
                enable_backfill_mode: false,
            });
            load_source_config_update(config_format, &file_content, &existing_source_config)
                .unwrap_err();
        }
        {
            // the topic cannot be updated
            let mut existing_source_config =
                load_source_config_from_user_config(config_format, &file_content).unwrap();
            let SourceParams::Kafka(kafka_params) = &mut existing_source_config.source_params
            else {
                panic!("expected Kafka source params");
            };
            kafka_params.topic = "other_topic_name".to_string();
            load_source_config_update(config_format, &file_content, &existing_source_config)
                .unwrap_err();
        }
    }
}


================================================
FILE: quickwit/quickwit-config/src/source_config/serialize.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::num::NonZeroUsize;

use anyhow::{bail, ensure};
use quickwit_proto::types::SourceId;
use serde::{Deserialize, Serialize};

use super::{RESERVED_SOURCE_IDS, TransformConfig};
use crate::{
    ConfigFormat, FileSourceParams, SourceConfig, SourceInputFormat, SourceParams,
    validate_identifier,
};

type SourceConfigForSerialization = SourceConfigV0_8;

#[derive(Serialize, Deserialize, utoipa::ToSchema)]
#[serde(deny_unknown_fields)]
#[serde(tag = "version")]
pub enum VersionedSourceConfig {
    #[serde(rename = "0.9")]
    #[serde(alias = "0.8")]
    V0_8(SourceConfigV0_8),
    // Retro compatibility.
    #[serde(rename = "0.7")]
    V0_7(SourceConfigV0_7),
}

impl From<VersionedSourceConfig> for SourceConfigForSerialization {
    fn from(versioned_source_config: VersionedSourceConfig) -> Self {
        match versioned_source_config {
            VersionedSourceConfig::V0_7(v0_7) => v0_7.into(),
            VersionedSourceConfig::V0_8(v0_8) => v0_8,
        }
    }
}

/// Parses and validates an [`SourceConfig`] as supplied by a user with a given [`ConfigFormat`],
/// and config content.
pub fn load_source_config_from_user_config(
    config_format: ConfigFormat,
    config_content: &[u8],
) -> anyhow::Result<SourceConfig> {
    let versioned_source_config: VersionedSourceConfig = config_format.parse(config_content)?;
    let source_config_for_serialization: SourceConfigForSerialization =
        versioned_source_config.into();
    source_config_for_serialization.validate_and_build()
}

/// Parses and validates a [`SourceConfig`] update.
///
/// Ensures that the new configuration is valid in itself and compared to the
/// current source config. If the new configuration omits some fields, the
/// default values will be used, not those of the current source config.
pub fn load_source_config_update(
    config_format: ConfigFormat,
    config_content: &[u8],
    current_source_config: &SourceConfig,
) -> anyhow::Result<SourceConfig> {
    let versioned_source_config: VersionedSourceConfig = config_format.parse(config_content)?;
    let source_config_for_serialization: SourceConfigForSerialization =
        versioned_source_config.into();
    let new_source_config = source_config_for_serialization.validate_and_build()?;

    ensure!(
        current_source_config.source_id == new_source_config.source_id,
        "existing `source_id` {} does not match updated `source_id` {}",
        current_source_config.source_id,
        new_source_config.source_id
    );

    current_source_config
        .source_params
        .validate_update(&new_source_config.source_params)?;

    Ok(new_source_config)
}

impl SourceConfigForSerialization {
    /// Checks the validity of the `SourceConfig` as a "deserializable source".
    ///
    /// Two remarks:
    /// - This does not check connectivity, it just validate configuration, without performing any
    ///   IO. See `check_connectivity(..)`.
    /// - This is used each time the `SourceConfig` is deserialized (at creation but also during
    ///   communications with the metastore). When ingesting from stdin, we programmatically create
    ///   an invalid `SourceConfig` and only use it locally.
    fn validate_and_build(self) -> anyhow::Result<SourceConfig> {
        if !RESERVED_SOURCE_IDS.contains(&self.source_id.as_str()) {
            validate_identifier("source", &self.source_id)?;
        }
        let num_pipelines = NonZeroUsize::new(self.num_pipelines)
            .ok_or_else(|| anyhow::anyhow!("`desired_num_pipelines` must be strictly positive"))?;
        match &self.source_params {
            SourceParams::Stdin => {
                bail!(
                    "stdin can only be used as source through the CLI command `quickwit tool \
                     local-ingest`"
                );
            }
            SourceParams::File(_)
            | SourceParams::Kafka(_)
            | SourceParams::Kinesis(_)
            | SourceParams::Pulsar(_) => {
                // TODO consider any validation opportunity
            }
            SourceParams::PubSub(_)
            | SourceParams::Ingest
            | SourceParams::IngestApi
            | SourceParams::IngestCli
            | SourceParams::Vec(_)
            | SourceParams::Void(_) => {}
        }
        match &self.source_params {
            SourceParams::PubSub(_)
            | SourceParams::Kafka(_)
            | SourceParams::File(FileSourceParams::Notifications(_)) => {}
            _ => {
                if self.num_pipelines > 1 {
                    bail!("Quickwit currently supports multiple pipelines only for GCP PubSub or Kafka sources. open an issue https://github.com/quickwit-oss/quickwit/issues if you need the feature for other source types");
                }
            }
        }

        if let Some(transform_config) = &self.transform {
            if matches!(
                self.input_format,
                SourceInputFormat::OtlpLogsJson
                    | SourceInputFormat::OtlpLogsProtobuf
                    | SourceInputFormat::OtlpTracesJson
                    | SourceInputFormat::OtlpTracesProtobuf
            ) {
                bail!("VRL transforms are not supported for OTLP input formats");
            }
            transform_config.validate_vrl_script()?;
        }

        Ok(SourceConfig {
            source_id: self.source_id,
            num_pipelines,
            enabled: self.enabled,
            source_params: self.source_params,
            transform_config: self.transform,
            input_format: self.input_format,
        })
    }
}

impl From<SourceConfig> for SourceConfigV0_8 {
    fn from(source_config: SourceConfig) -> Self {
        SourceConfigV0_8 {
            source_id: source_config.source_id,
            num_pipelines: source_config.num_pipelines.get(),
            enabled: source_config.enabled,
            source_params: source_config.source_params,
            transform: source_config.transform_config,
            input_format: source_config.input_format,
        }
    }
}

impl From<SourceConfig> for VersionedSourceConfig {
    fn from(source_config: SourceConfig) -> Self {
        VersionedSourceConfig::V0_8(source_config.into())
    }
}

impl TryFrom<VersionedSourceConfig> for SourceConfig {
    type Error = anyhow::Error;

    fn try_from(versioned_source_config: VersionedSourceConfig) -> anyhow::Result<Self> {
        let v1: SourceConfigV0_8 = versioned_source_config.into();
        v1.validate_and_build()
    }
}

fn default_max_num_pipelines_per_indexer() -> usize {
    1
}

fn default_num_pipelines() -> usize {
    1
}

fn default_source_enabled() -> bool {
    true
}

#[derive(Clone, Debug, Eq, PartialEq, Serialize, Deserialize, utoipa::ToSchema)]
#[serde(deny_unknown_fields)]
pub struct SourceConfigV0_7 {
    #[schema(value_type = String)]
    pub source_id: SourceId,

    #[serde(
        default = "default_max_num_pipelines_per_indexer",
        alias = "num_pipelines"
    )]
    pub max_num_pipelines_per_indexer: usize,

    #[serde(default = "default_num_pipelines")]
    pub desired_num_pipelines: usize,

    // Denotes if this source is enabled.
    #[serde(default = "default_source_enabled")]
    pub enabled: bool,

    #[serde(flatten)]
    pub source_params: SourceParams,

    #[serde(skip_serializing_if = "Option::is_none")]
    pub transform: Option<TransformConfig>,

    // Denotes the input data format.
    #[serde(default)]
    pub input_format: SourceInputFormat,
}

#[derive(Clone, Debug, Eq, PartialEq, Serialize, Deserialize, utoipa::ToSchema)]
#[serde(deny_unknown_fields)]
pub struct SourceConfigV0_8 {
    #[schema(value_type = String)]
    pub source_id: SourceId,

    #[serde(default = "default_num_pipelines")]
    pub num_pipelines: usize,

    // Denotes if this source is enabled.
    #[serde(default = "default_source_enabled")]
    pub enabled: bool,

    #[serde(flatten)]
    pub source_params: SourceParams,

    #[serde(skip_serializing_if = "Option::is_none")]
    pub transform: Option<TransformConfig>,

    // Denotes the input data format.
    #[serde(default)]
    pub input_format: SourceInputFormat,
}

impl From<SourceConfigV0_7> for SourceConfigV0_8 {
    fn from(source_config_v0_7: SourceConfigV0_7) -> Self {
        let SourceConfigV0_7 {
            source_id,
            max_num_pipelines_per_indexer: _,
            desired_num_pipelines,
            enabled,
            source_params,
            transform,
            input_format,
        } = source_config_v0_7;
        SourceConfigV0_8 {
            source_id,
            num_pipelines: desired_num_pipelines,
            enabled,
            source_params,
            transform,
            input_format,
        }
    }
}


================================================
FILE: quickwit/quickwit-config/src/storage_config.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::ops::Deref;
use std::sync::OnceLock;
use std::{env, fmt};

use anyhow::ensure;
use itertools::Itertools;
use quickwit_common::get_bool_from_env;
use serde::{Deserialize, Serialize};
use serde_with::{EnumMap, serde_as};

/// Lists the storage backends supported by Quickwit.
#[derive(Debug, Clone, Copy, Eq, PartialEq, Ord, PartialOrd, Hash, Serialize, Deserialize)]
#[serde(rename_all = "snake_case")]
pub enum StorageBackend {
    /// Azure Blob Storage
    Azure,
    /// Local file system
    File,
    /// Google Cloud Storage
    Google,
    /// In-memory storage, for testing purposes
    Ram,
    /// Amazon S3 or S3-compatible storage
    S3,
}

#[derive(Debug, Clone, Copy, Eq, PartialEq, Ord, PartialOrd, Hash, Serialize, Deserialize)]
#[serde(rename_all = "snake_case")]
pub enum StorageBackendFlavor {
    /// Digital Ocean Spaces
    #[serde(alias = "do")]
    DigitalOcean,
    /// Garage
    Garage,
    /// Google Cloud Storage
    #[serde(alias = "gcp", alias = "google")]
    Gcs,
    /// MinIO
    #[serde(rename = "minio")]
    MinIO,
}

/// Holds the storage configurations defined in the `storage` section of node config files.
///
/// ```yaml
/// storage:
///   azure:
///     account: test-account
///
///   s3:
///     endpoint: http://localhost:4566
/// ```
#[serde_as]
#[derive(Debug, Clone, Default, Eq, PartialEq, Serialize, Deserialize)]
pub struct StorageConfigs(#[serde_as(as = "EnumMap")] Vec<StorageConfig>);

impl StorageConfigs {
    pub fn new(storage_configs: Vec<StorageConfig>) -> Self {
        Self(storage_configs)
    }

    pub fn redact(&mut self) {
        for storage_config in self.0.iter_mut() {
            storage_config.redact();
        }
    }

    pub fn apply_flavors(&mut self) {
        for storage_config in self.0.iter_mut() {
            if let StorageConfig::S3(s3_storage_config) = storage_config {
                s3_storage_config.apply_flavor();
            }
        }
    }

    pub fn validate(&self) -> anyhow::Result<()> {
        let backends: Vec<StorageBackend> = self
            .0
            .iter()
            .map(|storage_config| storage_config.backend())
            .sorted()
            .collect();

        for (left, right) in backends.iter().zip(backends.iter().skip(1)) {
            ensure!(
                left != right,
                "{left:?} storage config is defined multiple times",
            );
        }
        Ok(())
    }

    pub fn find_azure(&self) -> Option<&AzureStorageConfig> {
        self.0
            .iter()
            .find_map(|storage_config| match storage_config {
                StorageConfig::Azure(azure_storage_config) => Some(azure_storage_config),
                _ => None,
            })
    }

    pub fn find_google(&self) -> Option<&GoogleCloudStorageConfig> {
        self.0
            .iter()
            .find_map(|storage_config| match storage_config {
                StorageConfig::Google(google_storage_config) => Some(google_storage_config),
                _ => None,
            })
    }

    pub fn find_file(&self) -> Option<&FileStorageConfig> {
        self.0
            .iter()
            .find_map(|storage_config| match storage_config {
                StorageConfig::File(file_storage_config) => Some(file_storage_config),
                _ => None,
            })
    }

    pub fn find_ram(&self) -> Option<&RamStorageConfig> {
        self.0
            .iter()
            .find_map(|storage_config| match storage_config {
                StorageConfig::Ram(ram_storage_config) => Some(ram_storage_config),
                _ => None,
            })
    }

    pub fn find_s3(&self) -> Option<&S3StorageConfig> {
        self.0
            .iter()
            .find_map(|storage_config| match storage_config {
                StorageConfig::S3(s3_storage_config) => Some(s3_storage_config),
                _ => None,
            })
    }
}

impl Deref for StorageConfigs {
    type Target = Vec<StorageConfig>;

    fn deref(&self) -> &Self::Target {
        &self.0
    }
}

#[derive(Debug, Clone, Eq, PartialEq, Serialize, Deserialize)]
#[serde(rename_all = "snake_case")]
pub enum StorageConfig {
    Azure(AzureStorageConfig),
    File(FileStorageConfig),
    Ram(RamStorageConfig),
    S3(S3StorageConfig),
    Google(GoogleCloudStorageConfig),
}

impl StorageConfig {
    pub fn redact(&mut self) {
        match self {
            Self::Azure(azure_storage_config) => azure_storage_config.redact(),
            Self::File(_) | Self::Ram(_) | Self::Google(_) => {}
            Self::S3(s3_storage_config) => s3_storage_config.redact(),
        }
    }

    pub fn as_azure(&self) -> Option<&AzureStorageConfig> {
        match self {
            Self::Azure(azure_storage_config) => Some(azure_storage_config),
            _ => None,
        }
    }

    pub fn as_file(&self) -> Option<&FileStorageConfig> {
        match self {
            Self::File(file_storage_config) => Some(file_storage_config),
            _ => None,
        }
    }

    pub fn as_ram(&self) -> Option<&RamStorageConfig> {
        match self {
            Self::Ram(ram_storage_config) => Some(ram_storage_config),
            _ => None,
        }
    }

    pub fn as_s3(&self) -> Option<&S3StorageConfig> {
        match self {
            Self::S3(s3_storage_config) => Some(s3_storage_config),
            _ => None,
        }
    }

    pub fn as_google(&self) -> Option<&GoogleCloudStorageConfig> {
        match self {
            Self::Google(google_cloud_storage_config) => Some(google_cloud_storage_config),
            _ => None,
        }
    }
}

impl From<AzureStorageConfig> for StorageConfig {
    fn from(azure_storage_config: AzureStorageConfig) -> Self {
        Self::Azure(azure_storage_config)
    }
}

impl From<FileStorageConfig> for StorageConfig {
    fn from(file_storage_config: FileStorageConfig) -> Self {
        Self::File(file_storage_config)
    }
}

impl From<RamStorageConfig> for StorageConfig {
    fn from(ram_storage_config: RamStorageConfig) -> Self {
        Self::Ram(ram_storage_config)
    }
}

impl From<S3StorageConfig> for StorageConfig {
    fn from(s3_storage_config: S3StorageConfig) -> Self {
        Self::S3(s3_storage_config)
    }
}

impl From<GoogleCloudStorageConfig> for StorageConfig {
    fn from(google_cloud_storage_config: GoogleCloudStorageConfig) -> Self {
        Self::Google(google_cloud_storage_config)
    }
}

impl StorageConfig {
    pub fn backend(&self) -> StorageBackend {
        match self {
            Self::Azure(_) => StorageBackend::Azure,
            Self::File(_) => StorageBackend::File,
            Self::Ram(_) => StorageBackend::Ram,
            Self::S3(_) => StorageBackend::S3,
            Self::Google(_) => StorageBackend::Google,
        }
    }
}

#[derive(Clone, Default, Eq, PartialEq, Serialize, Deserialize)]
#[serde(deny_unknown_fields)]
pub struct AzureStorageConfig {
    #[serde(default)]
    #[serde(rename = "account")]
    #[serde(skip_serializing_if = "Option::is_none")]
    pub account_name: Option<String>,
    #[serde(default)]
    #[serde(skip_serializing_if = "Option::is_none")]
    pub access_key: Option<String>,
}

impl AzureStorageConfig {
    pub const AZURE_STORAGE_ACCOUNT_ENV_VAR: &'static str = "QW_AZURE_STORAGE_ACCOUNT";

    pub const AZURE_STORAGE_ACCESS_KEY_ENV_VAR: &'static str = "QW_AZURE_STORAGE_ACCESS_KEY";

    /// Redacts the access key.
    pub fn redact(&mut self) {
        if let Some(access_key) = self.access_key.as_mut() {
            *access_key = "***redacted***".to_string();
        }
    }

    /// Attempts to find the storage account name in the environment variable
    /// `QW_AZURE_STORAGE_ACCOUNT` or node config.
    pub fn resolve_account_name(&self) -> Option<String> {
        env::var(Self::AZURE_STORAGE_ACCOUNT_ENV_VAR)
            .ok()
            .or_else(|| self.account_name.clone())
    }

    /// Attempts to find the storage account access key in the environment variable
    /// `QW_AZURE_STORAGE_ACCESS_KEY` or node config.
    pub fn resolve_access_key(&self) -> Option<String> {
        env::var(Self::AZURE_STORAGE_ACCESS_KEY_ENV_VAR)
            .ok()
            .or_else(|| self.access_key.clone())
    }
}

impl fmt::Debug for AzureStorageConfig {
    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
        f.debug_struct("AzureStorageConfig")
            .field("account_name", &self.account_name)
            .field(
                "access_key",
                &self.access_key.as_ref().map(|_| "***redacted***"),
            )
            .finish()
    }
}

#[derive(Clone, Default, Eq, PartialEq, Serialize, Deserialize)]
#[serde(deny_unknown_fields)]
pub struct S3StorageConfig {
    #[serde(default)]
    #[serde(skip_serializing_if = "Option::is_none")]
    pub flavor: Option<StorageBackendFlavor>,
    #[serde(default)]
    pub access_key_id: Option<String>,
    #[serde(default)]
    pub secret_access_key: Option<String>,
    #[serde(default)]
    pub region: Option<String>,
    #[serde(default)]
    pub endpoint: Option<String>,
    #[serde(default)]
    pub force_path_style_access: bool,
    #[serde(alias = "disable_multi_object_delete_requests")]
    #[serde(default)]
    pub disable_multi_object_delete: bool,
    #[serde(default)]
    pub disable_multipart_upload: bool,
}

impl S3StorageConfig {
    fn apply_flavor(&mut self) {
        match self.flavor {
            Some(StorageBackendFlavor::DigitalOcean) => {
                self.force_path_style_access = true;
                self.disable_multi_object_delete = true;
            }
            Some(StorageBackendFlavor::Garage) => {
                self.region = Some("garage".to_string());
                self.force_path_style_access = true;
            }
            Some(StorageBackendFlavor::Gcs) => {
                self.disable_multi_object_delete = true;
                self.disable_multipart_upload = true;
            }
            Some(StorageBackendFlavor::MinIO) => {
                self.region = Some("minio".to_string());
                self.force_path_style_access = true;
            }
            _ => {}
        }
    }

    pub fn redact(&mut self) {
        if let Some(secret_access_key) = self.secret_access_key.as_mut() {
            *secret_access_key = "***redacted***".to_string();
        }
    }

    pub fn endpoint(&self) -> Option<String> {
        env::var("QW_S3_ENDPOINT")
            .ok()
            .or_else(|| self.endpoint.clone())
    }

    pub fn force_path_style_access(&self) -> Option<bool> {
        static FORCE_PATH_STYLE: OnceLock<Option<bool>> = OnceLock::new();
        *FORCE_PATH_STYLE.get_or_init(|| {
            let force_path_style_access = get_bool_from_env(
                "QW_S3_FORCE_PATH_STYLE_ACCESS",
                self.force_path_style_access,
            );
            Some(force_path_style_access)
        })
    }
}

impl fmt::Debug for S3StorageConfig {
    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
        f.debug_struct("S3StorageConfig")
            .field("access_key_id", &self.access_key_id)
            .field(
                "secret_access_key",
                &self.secret_access_key.as_ref().map(|_| "***redacted***"),
            )
            .field("region", &self.region)
            .field("endpoint", &self.endpoint)
            .field("force_path_style_access", &self.force_path_style_access)
            .field(
                "disable_multi_object_delete",
                &self.disable_multi_object_delete,
            )
            .finish()
    }
}

#[derive(Debug, Clone, Default, Eq, PartialEq, Serialize, Deserialize)]
#[serde(deny_unknown_fields)]
pub struct FileStorageConfig;

#[derive(Debug, Clone, Default, Eq, PartialEq, Serialize, Deserialize)]
#[serde(deny_unknown_fields)]
pub struct RamStorageConfig;

#[derive(Debug, Clone, Default, Eq, PartialEq, Serialize, Deserialize)]
#[serde(deny_unknown_fields)]
pub struct GoogleCloudStorageConfig {
    #[serde(default)]
    #[serde(skip_serializing_if = "Option::is_none")]
    pub credential_path: Option<String>,
}

impl GoogleCloudStorageConfig {
    pub const GOOGLE_CLOUD_STORAGE_CREDENTIAL_PATH_ENV_VAR: &'static str =
        "QW_GOOGLE_CLOUD_STORAGE_CREDENTIAL_PATH";

    /// Attempts to find the credential path in the environment variable
    /// `QW_GOOGLE_CLOUD_STORAGE_CREDENTIAL_PATH` or the config.
    pub fn resolve_credential_path(&self) -> Option<String> {
        env::var(Self::GOOGLE_CLOUD_STORAGE_CREDENTIAL_PATH_ENV_VAR)
            .ok()
            .or_else(|| self.credential_path.clone())
    }
}

#[cfg(test)]
mod tests {
    use super::*;

    #[test]
    fn test_storage_configs_serde() {
        let storage_configs_yaml = "";
        let storage_configs: StorageConfigs = serde_yaml::from_str(storage_configs_yaml).unwrap();
        assert!(storage_configs.is_empty());

        let storage_configs_yaml = r#"
                azure:
                    account: test-account
                s3:
                    endpoint: http://localhost:4566
            "#;
        let storage_configs: StorageConfigs = serde_yaml::from_str(storage_configs_yaml).unwrap();

        let expected_storage_configs = StorageConfigs(vec![
            AzureStorageConfig {
                account_name: Some("test-account".to_string()),
                ..Default::default()
            }
            .into(),
            S3StorageConfig {
                endpoint: Some("http://localhost:4566".to_string()),
                ..Default::default()
            }
            .into(),
        ]);
        assert_eq!(storage_configs, expected_storage_configs);
    }

    #[test]
    fn test_storage_configs_apply_flavors() {
        let mut storage_configs = StorageConfigs(vec![
            S3StorageConfig {
                flavor: Some(StorageBackendFlavor::DigitalOcean),
                ..Default::default()
            }
            .into(),
            S3StorageConfig {
                flavor: Some(StorageBackendFlavor::Garage),
                ..Default::default()
            }
            .into(),
            S3StorageConfig {
                flavor: Some(StorageBackendFlavor::Gcs),
                ..Default::default()
            }
            .into(),
            S3StorageConfig {
                flavor: Some(StorageBackendFlavor::MinIO),
                ..Default::default()
            }
            .into(),
        ]);
        storage_configs.apply_flavors();

        let do_storage_config = storage_configs[0].as_s3().unwrap();
        assert!(do_storage_config.force_path_style_access);
        assert!(do_storage_config.disable_multi_object_delete);

        let garage_storage_config = storage_configs[1].as_s3().unwrap();
        assert_eq!(garage_storage_config.region, Some("garage".to_string()));
        assert!(garage_storage_config.force_path_style_access);

        let gcs_storage_config = storage_configs[2].as_s3().unwrap();
        assert!(gcs_storage_config.disable_multi_object_delete);
        assert!(gcs_storage_config.disable_multipart_upload);

        let minio_storage_config = storage_configs[3].as_s3().unwrap();
        assert_eq!(minio_storage_config.region, Some("minio".to_string()));
        assert!(minio_storage_config.force_path_style_access);
    }

    #[test]
    fn test_storage_configs_validate() {
        let storage_configs = StorageConfigs(vec![
            AzureStorageConfig {
                account_name: Some("test-account".to_string()),
                ..Default::default()
            }
            .into(),
            AzureStorageConfig {
                account_name: Some("prod-account".to_string()),
                ..Default::default()
            }
            .into(),
        ]);
        storage_configs.validate().unwrap_err();
    }

    #[test]
    fn test_storage_configs_redact() {
        let mut storage_configs = StorageConfigs(vec![
            AzureStorageConfig {
                access_key: Some("test-azure-access-key".to_string()),
                ..Default::default()
            }
            .into(),
            S3StorageConfig {
                secret_access_key: Some("test-s3-secret-access-key".to_string()),
                ..Default::default()
            }
            .into(),
        ]);
        storage_configs.redact();

        assert_eq!(
            storage_configs
                .find_azure()
                .unwrap()
                .access_key
                .as_ref()
                .unwrap(),
            "***redacted***"
        );
        assert_eq!(
            storage_configs
                .find_s3()
                .unwrap()
                .secret_access_key
                .as_ref()
                .unwrap(),
            "***redacted***"
        );
    }

    #[test]
    fn test_storage_azure_config_serde() {
        {
            let azure_storage_config_yaml = r#"
                account: test-account
            "#;
            let azure_storage_config: AzureStorageConfig =
                serde_yaml::from_str(azure_storage_config_yaml).unwrap();

            let expected_azure_config = AzureStorageConfig {
                account_name: Some("test-account".to_string()),
                ..Default::default()
            };
            assert_eq!(azure_storage_config, expected_azure_config);
        }
        {
            let azure_storage_config_yaml = r#"
                account: test-account
                access_key: test-access-key
            "#;
            let azure_storage_config: AzureStorageConfig =
                serde_yaml::from_str(azure_storage_config_yaml).unwrap();

            let expected_azure_config = AzureStorageConfig {
                account_name: Some("test-account".to_string()),
                access_key: Some("test-access-key".to_string()),
            };
            assert_eq!(azure_storage_config, expected_azure_config);
        }
    }

    #[test]
    fn test_storage_google_config_serde() {
        {
            let google_cloud_storage_config_yaml = r#"
                credential_path: /path/to/credential.json
            "#;
            let google_cloud_storage_config: GoogleCloudStorageConfig =
                serde_yaml::from_str(google_cloud_storage_config_yaml).unwrap();

            let expected_google_cloud_storage_config = GoogleCloudStorageConfig {
                credential_path: Some("/path/to/credential.json".to_string()),
            };
            assert_eq!(
                google_cloud_storage_config,
                expected_google_cloud_storage_config
            );
        }
    }

    #[test]
    fn test_storage_s3_config_serde() {
        {
            let s3_storage_config_yaml = r#"
                endpoint: http://localhost:4566
            "#;
            let s3_storage_config: S3StorageConfig =
                serde_yaml::from_str(s3_storage_config_yaml).unwrap();

            let expected_s3_config = S3StorageConfig {
                endpoint: Some("http://localhost:4566".to_string()),
                ..Default::default()
            };
            assert_eq!(s3_storage_config, expected_s3_config);
        }
        {
            let s3_storage_config_yaml = r#"
                region: us-east-1
                endpoint: http://localhost:4566
                force_path_style_access: true
                disable_multi_object_delete_requests: true
                disable_multipart_upload: true
            "#;
            let s3_storage_config: S3StorageConfig =
                serde_yaml::from_str(s3_storage_config_yaml).unwrap();

            let expected_s3_config = S3StorageConfig {
                region: Some("us-east-1".to_string()),
                endpoint: Some("http://localhost:4566".to_string()),
                force_path_style_access: true,
                disable_multi_object_delete: true,
                disable_multipart_upload: true,
                ..Default::default()
            };
            assert_eq!(s3_storage_config, expected_s3_config);
        }
    }

    #[test]
    fn test_storage_s3_config_flavor_serde() {
        {
            let s3_storage_config_yaml = r#"
                flavor: digital_ocean
            "#;
            let s3_storage_config: S3StorageConfig =
                serde_yaml::from_str(s3_storage_config_yaml).unwrap();

            assert_eq!(
                s3_storage_config.flavor,
                Some(StorageBackendFlavor::DigitalOcean)
            );
        }
        {
            let s3_storage_config_yaml = r#"
                flavor: garage
            "#;
            let s3_storage_config: S3StorageConfig =
                serde_yaml::from_str(s3_storage_config_yaml).unwrap();

            assert_eq!(s3_storage_config.flavor, Some(StorageBackendFlavor::Garage));
        }
        {
            let s3_storage_config_yaml = r#"
                flavor: gcs
            "#;
            let s3_storage_config: S3StorageConfig =
                serde_yaml::from_str(s3_storage_config_yaml).unwrap();

            assert_eq!(s3_storage_config.flavor, Some(StorageBackendFlavor::Gcs));
        }
        {
            let s3_storage_config_yaml = r#"
                flavor: minio
            "#;
            let s3_storage_config: S3StorageConfig =
                serde_yaml::from_str(s3_storage_config_yaml).unwrap();

            assert_eq!(s3_storage_config.flavor, Some(StorageBackendFlavor::MinIO));
        }
    }
}


================================================
FILE: quickwit/quickwit-config/src/templating.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::HashMap;
use std::io::BufRead;

use anyhow::{Context, Result, bail};
use new_string_template::template::Template;
use once_cell::sync::Lazy;
use regex::Regex;
use tracing::debug;

// Matches `${value}` if value is formatted as:
// `ENV_VAR` or `ENV_VAR:DEFAULT`
// Ignores whitespaces in curly braces
static TEMPLATE_ENV_VAR_CAPTURE: Lazy<Regex> = Lazy::new(|| {
    Regex::new(r"\$\{\s*([A-Za-z0-9_]+)\s*(?::\-\s*([^\s\}]+)\s*)?}")
        .expect("regular expression should compile")
});

pub fn render_config(config_content: &[u8]) -> Result<String> {
    let template_str = std::str::from_utf8(config_content)
        .context("config file contains invalid UTF-8 characters")?;

    let mut values = HashMap::new();

    for (line_no, line_result) in config_content.lines().enumerate() {
        let line = line_result?;

        for captures in TEMPLATE_ENV_VAR_CAPTURE.captures_iter(&line) {
            let env_var_key = captures
                .get(1)
                .expect("captures should always have at least one match")
                .as_str();
            let substitution_value = {
                if line.trim_start().starts_with('#') {
                    debug!(
                        env_var_name=%env_var_key,
                        "config file line #{line_no} is commented out, skipping"
                    );
                    // This line is commented out, return the line as is.
                    captures
                        .get(0)
                        .expect("0th capture should always be set")
                        .as_str()
                        .to_string()
                } else if let Ok(env_var_value) = std::env::var(env_var_key) {
                    debug!(
                        env_var_name=%env_var_key,
                        env_var_value=%env_var_value,
                        "environment variable is set, substituting with environment variable value"
                    );
                    env_var_value
                } else if let Some(default_match) = captures.get(2) {
                    let default_value = default_match.as_str().to_string();
                    debug!(
                        env_var_name=%env_var_key,
                        default_value=%default_value,
                        "environment variable is not set, substituting with default value"
                    );
                    default_value
                } else {
                    bail!(
                        "failed to render config file template: environment variable \
                         `{env_var_key}` is not set and no default value is provided"
                    );
                }
            };
            values.insert(env_var_key.to_string(), substitution_value);
        }
    }
    let template = Template::new(template_str).with_regex(&TEMPLATE_ENV_VAR_CAPTURE);
    let rendered = template
        .render_string(&values)
        .context("failed to render config file template")?;
    Ok(rendered)
}

#[cfg(test)]
mod test {
    use std::env;

    use super::render_config;

    #[test]
    fn test_template_render() {
        // SAFETY: this test may not be entirely sound if not run with nextest or --test-threads=1
        // as this is only a test, and it would be extremly inconvenient to run it in a different
        // way, we are keeping it that way

        let config_content = b"metastore_uri: ${TEST_TEMPLATE_RENDER_ENV_VAR_PLEASE_DONT_NOTICE}";
        unsafe {
            env::set_var(
                "TEST_TEMPLATE_RENDER_ENV_VAR_PLEASE_DONT_NOTICE",
                "s3://test-bucket/metastore",
            )
        };
        let rendered = render_config(config_content).unwrap();
        unsafe { std::env::remove_var("TEST_TEMPLATE_RENDER_ENV_VAR_PLEASE_DONT_NOTICE") };
        assert_eq!(rendered, "metastore_uri: s3://test-bucket/metastore");
    }

    #[test]
    fn test_template_render_supports_whitespaces() {
        // SAFETY: this test may not be entirely sound if not run with nextest or --test-threads=1
        // as this is only a test, and it would be extremly inconvenient to run it in a different
        // way, we are keeping it that way

        unsafe {
            env::set_var(
                "TEST_TEMPLATE_RENDER_WHITESPACE_QW_TEST",
                "s3://test-bucket/metastore",
            )
        };
        {
            let config_content = b"metastore_uri: ${  TEST_TEMPLATE_RENDER_WHITESPACE_QW_TEST  }";
            let rendered = render_config(config_content).unwrap();
            assert_eq!(rendered, "metastore_uri: s3://test-bucket/metastore");
        }
    }

    #[test]
    fn test_template_render_with_default_value() {
        {
            let config_content =
                b"metastore_uri: ${QW_ENV_VAR_DOES_NOT_EXIST:-s3://test-bucket/metastore}";
            let rendered = render_config(config_content).unwrap();
            assert_eq!(rendered, "metastore_uri: s3://test-bucket/metastore");
        }
        {
            let config_content =
                b"metastore_uri: ${  QW_ENV_VAR_DOES_NOT_EXIST  :-  s3://test-bucket/metastore  }";
            let rendered = render_config(config_content).unwrap();
            assert_eq!(rendered, "metastore_uri: s3://test-bucket/metastore");
        }
    }

    #[test]
    fn test_template_render_should_panic() {
        let config_content = b"metastore_uri: ${QW_ENV_VAR_DOES_NOT_EXIST}";
        render_config(config_content).unwrap_err();
    }

    #[test]
    fn test_template_render_with_default_use_env() {
        // SAFETY: this test may not be entirely sound if not run with nextest or --test-threads=1
        // as this is only a test, and it would be extremly inconvenient to run it in a different
        // way, we are keeping it that way

        let config_content =
            b"metastore_uri: ${TEST_TEMPLATE_RENDER_ENV_VAR_DEFAULT_USE_ENV:-s3://test-bucket/wrongbucket}";
        unsafe {
            env::set_var(
                "TEST_TEMPLATE_RENDER_ENV_VAR_DEFAULT_USE_ENV",
                "s3://test-bucket/metastore",
            )
        };
        let rendered = render_config(config_content).unwrap();
        unsafe { std::env::remove_var("TEST_TEMPLATE_RENDER_ENV_VAR_DEFAULT_USE_ENV") };
        assert_eq!(rendered, "metastore_uri: s3://test-bucket/metastore");
    }

    #[test]
    fn test_template_render_with_multiple_vars_per_line() {
        // SAFETY: this test may not be entirely sound if not run with nextest or --test-threads=1
        // as this is only a test, and it would be extremly inconvenient to run it in a different
        // way, we are keeping it that way

        let config_content =
            b"metastore_uri: s3://${RENDER_MULTIPLE_BUCKET}/${RENDER_MULTIPLE_PREFIX:-index}#polling_interval=${RENDER_MULTIPLE_INTERVAL}s";
        unsafe {
            env::set_var("RENDER_MULTIPLE_BUCKET", "test-bucket");
            env::set_var("RENDER_MULTIPLE_PREFIX", "metastore");
            env::set_var("RENDER_MULTIPLE_INTERVAL", "30");
        }
        let rendered = render_config(config_content).unwrap();
        unsafe {
            std::env::remove_var("RENDER_MULTIPLE_BUCKET");
            std::env::remove_var("RENDER_MULTIPLE_PREFIX");
            std::env::remove_var("RENDER_MULTIPLE_INTERVAL");
        }
        assert_eq!(
            rendered,
            "metastore_uri: s3://test-bucket/metastore#polling_interval=30s"
        );
    }

    #[test]
    fn test_template_render_ignores_commented_lines() {
        {
            let config_content = b"# metastore_uri: ${QW_ENV_VAR_DOES_NOT_EXIST}";
            let rendered = render_config(config_content).unwrap();
            assert_eq!(rendered, "# metastore_uri: ${QW_ENV_VAR_DOES_NOT_EXIST}");
        }
        {
            let config_content =
                b" # metastore_uri: ${ QW_ENV_VAR_DOES_NOT_EXIST :- default-value }";
            let rendered = render_config(config_content).unwrap();
            assert_eq!(
                rendered,
                " # metastore_uri: ${ QW_ENV_VAR_DOES_NOT_EXIST :- default-value }"
            );
        }
    }
}


================================================
FILE: quickwit/quickwit-control-plane/Cargo.toml
================================================
[package]
name = "quickwit-control-plane"
description = "Control plane service implementation"

version.workspace = true
edition.workspace = true
homepage.workspace = true
documentation.workspace = true
repository.workspace = true
authors.workspace = true
license.workspace = true

[dependencies]
anyhow = { workspace = true }
async-trait = { workspace = true }
bytesize = { workspace = true }
fnv = { workspace = true }
futures = { workspace = true }
itertools = { workspace = true }
lru = { workspace = true }
mockall = { workspace = true, optional = true }
once_cell = { workspace = true }
rand = { workspace = true }
serde = { workspace = true }
serde_json = { workspace = true }
smallvec = { workspace = true }
tokio = { workspace = true }
tracing = { workspace = true }
ulid = { workspace = true }

quickwit-actors = { workspace = true }
quickwit-cluster = { workspace = true }
quickwit-common = { workspace = true }
quickwit-config = { workspace = true }
quickwit-ingest = { workspace = true }
quickwit-metastore = { workspace = true }
quickwit-proto = { workspace = true }

[dev-dependencies]
futures = { workspace = true }
mockall = { workspace = true }
proptest = { workspace = true }
rand = { workspace = true }

quickwit-actors = { workspace = true, features = ["testsuite"] }
quickwit-cluster = { workspace = true, features = ["testsuite"] }
quickwit-common = { workspace = true, features = ["testsuite"] }
quickwit-config = { workspace = true, features = ["testsuite"] }
quickwit-indexing = { workspace = true }
quickwit-ingest = { workspace = true, features = ["testsuite"] }
quickwit-metastore = { workspace = true, features = ["testsuite"] }
quickwit-proto = { workspace = true, features = ["testsuite"] }

[features]
testsuite = ["mockall"]


================================================
FILE: quickwit/quickwit-control-plane/README.md
================================================
# Quickwit Control Plane

The Control Plane is responsible for scheduling indexing tasks to indexers. Its role is to ensure that the cluster is correctly running all indexing tasks on each indexer.

An indexing task is simply identified by a couple `(IndexId, SourceId, Option<Vec<ShardId>>)`.

## Scheduling algorithm

The control plane keeps an up to date partial view of the metastore.
This is enforced by routing all of the index/shards/sources alternating
command be routed through the control plane.

On startup, or when a metastore event is received, the scheduler computes the list of indexing tasks.
It then applies a placement algorithm to decide which indexer should be running each indexing task. The result of this placement is called the physical indexing plan, and associated each indexer to a list of indexing tasks.

The control plane then emits gRPC to the indexers that are not already following their assigned part of the indexing plan.

```mermaid
flowchart TB
    StartScheduling(Start scheduling)--"(Sources, Nodes)"-->BuildPhysical
    style StartScheduling fill:#ff0026,fill-opacity:0.5,stroke:#ff0026,stroke-width:4px
    BuildPhysical[Build Physical Plan]--PhysicalPlan-->Apply
    Apply[Apply plan to each indexer] --IndexerPlan--> Indexer1
    Apply --IndexerPlan--> Indexer2
    Apply --IndexerPlan--> Indexer...
```

## Control loop

Each indexer reports its currently running plan via chitchat.
A control loop makes sure that this cluster state matches the latest applied plan.
If a divergence is observed (for instance, if a node leaves the cluster), or if a node reports not being running a given pipeline, the control plane will take the necessary actions (respectively recompute the physical plan or reapply the plan).

## Read more in the Rust docs

[Scheduler Rust docs](./src/scheduler.rs#L66)


================================================
FILE: quickwit/quickwit-control-plane/src/control_plane.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::btree_map::Entry;
use std::collections::{BTreeMap, BTreeSet};
use std::fmt;
use std::fmt::Formatter;
use std::num::NonZeroUsize;
use std::time::Duration;

use anyhow::Context;
use async_trait::async_trait;
use futures::stream::FuturesUnordered;
use futures::{Future, StreamExt};
use itertools::Itertools;
use quickwit_actors::{
    Actor, ActorContext, ActorExitStatus, ActorHandle, DeferableReplyHandler, Handler, Mailbox,
    Supervisor, Universe, WeakMailbox,
};
use quickwit_cluster::{ClusterChange, ClusterChangeStream, ClusterChangeStreamFactory};
use quickwit_common::pretty::PrettyDisplay;
use quickwit_common::pubsub::EventSubscriber;
use quickwit_common::uri::Uri;
use quickwit_common::{Progress, shared_consts};
use quickwit_config::{ClusterConfig, IndexConfig, IndexTemplate, SourceConfig};
use quickwit_ingest::{IngesterPool, LocalShardsUpdate};
use quickwit_metastore::{CreateIndexRequestExt, CreateIndexResponseExt, IndexMetadataResponseExt};
use quickwit_proto::control_plane::{
    AdviseResetShardsRequest, AdviseResetShardsResponse, ControlPlaneError, ControlPlaneResult,
    GetOrCreateOpenShardsRequest, GetOrCreateOpenShardsResponse, GetOrCreateOpenShardsSubrequest,
};
use quickwit_proto::indexing::ShardPositionsUpdate;
use quickwit_proto::ingest::ingester::IngesterStatus;
use quickwit_proto::metastore::{
    AddSourceRequest, CreateIndexRequest, CreateIndexResponse, DeleteIndexRequest,
    DeleteShardsRequest, DeleteSourceRequest, EmptyResponse, FindIndexTemplateMatchesRequest,
    IndexMetadataResponse, IndexTemplateMatch, MetastoreError, MetastoreResult, MetastoreService,
    MetastoreServiceClient, PruneShardsRequest, ToggleSourceRequest, UpdateIndexRequest,
    UpdateSourceRequest, serde_utils,
};
use quickwit_proto::types::{IndexId, IndexUid, NodeId, ShardId, SourceId, SourceUid};
use serde::Serialize;
use serde_json::{Value as JsonValue, json};
use tokio::sync::watch;
use tracing::{Level, debug, enabled, error, info};

use crate::IndexerPool;
use crate::cooldown_map::{CooldownMap, CooldownStatus};
use crate::debouncer::Debouncer;
use crate::indexing_scheduler::{IndexingScheduler, IndexingSchedulerState};
use crate::ingest::IngestController;
use crate::ingest::ingest_controller::{IngestControllerStats, RebalanceShardsCallback};
use crate::model::ControlPlaneModel;

/// Interval between two controls (or checks) of the desired plan VS running plan.
pub(crate) const CONTROL_PLAN_LOOP_INTERVAL: Duration = if cfg!(any(test, feature = "testsuite")) {
    Duration::from_millis(100)
} else {
    Duration::from_secs(5)
};

/// Minimum period between two identical shard pruning operations.
const PRUNE_SHARDS_DEFAULT_COOLDOWN_PERIOD: Duration = Duration::from_secs(120);

/// Minimum period between two rebuild plan operations.
const REBUILD_PLAN_COOLDOWN_PERIOD: Duration = Duration::from_secs(2);

#[derive(Debug)]
struct ControlPlanLoop;

#[derive(Debug, Default, Clone, Copy)]
struct RebuildPlan;

pub struct ControlPlane {
    cluster_config: ClusterConfig,
    cluster_change_stream_opt: Option<ClusterChangeStream>,
    // The control plane state is split into to independent functions, that we naturally isolated
    // code wise and state wise.
    //
    // - The indexing scheduler is in charge of managing indexers: it decides which indexer should
    // index which source/shards.
    // - the ingest controller is in charge of managing ingesters: it opens and closes shards on
    // the different ingesters.
    indexing_scheduler: IndexingScheduler,
    ingest_controller: IngestController,
    metastore: MetastoreServiceClient,
    model: ControlPlaneModel,
    prune_shard_cooldown: CooldownMap<(IndexId, SourceId)>,
    rebuild_plan_debouncer: Debouncer,
    readiness_tx: watch::Sender<bool>,
    // Disables the control loop. This is useful for unit testing.
    disable_control_loop: bool,
}

impl fmt::Debug for ControlPlane {
    fn fmt(&self, f: &mut Formatter) -> fmt::Result {
        f.debug_struct("ControlPlane").finish()
    }
}

impl ControlPlane {
    pub fn spawn(
        universe: &Universe,
        cluster_config: ClusterConfig,
        self_node_id: NodeId,
        cluster_change_stream_factory: impl ClusterChangeStreamFactory,
        indexer_pool: IndexerPool,
        ingester_pool: IngesterPool,
        metastore: MetastoreServiceClient,
    ) -> (
        Mailbox<Self>,
        ActorHandle<Supervisor<Self>>,
        watch::Receiver<bool>,
    ) {
        let disable_control_loop = false;
        Self::spawn_inner(
            universe,
            cluster_config,
            self_node_id,
            cluster_change_stream_factory,
            indexer_pool,
            ingester_pool,
            metastore,
            disable_control_loop,
        )
    }

    #[allow(clippy::too_many_arguments)]
    fn spawn_inner(
        universe: &Universe,
        cluster_config: ClusterConfig,
        self_node_id: NodeId,
        cluster_change_stream_factory: impl ClusterChangeStreamFactory,
        indexer_pool: IndexerPool,
        ingester_pool: IngesterPool,
        metastore: MetastoreServiceClient,
        disable_control_loop: bool,
    ) -> (
        Mailbox<Self>,
        ActorHandle<Supervisor<Self>>,
        watch::Receiver<bool>,
    ) {
        info!("starting control plane");

        let (readiness_tx, readiness_rx) = watch::channel(false);
        let (control_plane_mailbox, control_plane_handle) =
            universe.spawn_builder().supervise_fn(move || {
                let cluster_id = cluster_config.cluster_id.clone();
                let replication_factor = cluster_config.replication_factor;
                let shard_throughput_limit_mib: f32 = cluster_config.shard_throughput_limit.as_u64()
                    as f32
                    / shared_consts::MIB as f32;
                let indexing_scheduler =
                    IndexingScheduler::new(cluster_id, self_node_id.clone(), indexer_pool.clone());
                let ingest_controller = IngestController::new(
                    metastore.clone(),
                    ingester_pool.clone(),
                    replication_factor,
                    shard_throughput_limit_mib,
                    cluster_config.shard_scale_up_factor,
                );

                let readiness_tx = readiness_tx.clone();
                let _ = readiness_tx.send(false);

                ControlPlane {
                    cluster_config: cluster_config.clone(),
                    cluster_change_stream_opt: Some(cluster_change_stream_factory.create()),
                    indexing_scheduler,
                    ingest_controller,
                    metastore: metastore.clone(),
                    model: Default::default(),
                    prune_shard_cooldown: CooldownMap::new(NonZeroUsize::new(1024).unwrap()),
                    rebuild_plan_debouncer: Debouncer::new(REBUILD_PLAN_COOLDOWN_PERIOD),
                    readiness_tx,
                    disable_control_loop,
                }
            });
        (control_plane_mailbox, control_plane_handle, readiness_rx)
    }
}

#[derive(Debug, Clone, Serialize, Default)]
pub struct ControlPlaneObservableState {
    pub indexing_scheduler: IndexingSchedulerState,
    pub ingest_controller: IngestControllerStats,
    pub num_indexes: usize,
    pub num_sources: usize,
    pub readiness: bool,
}

#[async_trait]
impl Actor for ControlPlane {
    type ObservableState = ControlPlaneObservableState;

    fn name(&self) -> String {
        "ControlPlane".to_string()
    }

    fn observable_state(&self) -> Self::ObservableState {
        ControlPlaneObservableState {
            indexing_scheduler: self.indexing_scheduler.observable_state(),
            ingest_controller: self.ingest_controller.stats,
            num_indexes: self.model.num_indexes(),
            num_sources: self.model.num_sources(),
            readiness: *self.readiness_tx.borrow(),
        }
    }

    async fn initialize(&mut self, ctx: &ActorContext<Self>) -> Result<(), ActorExitStatus> {
        crate::metrics::CONTROL_PLANE_METRICS.restart_total.inc();

        self.model
            .load_from_metastore(&mut self.metastore, ctx.progress())
            .await
            .context("failed to initialize control plane model")?;

        let _rebuild_plan_waiter = self.rebuild_plan_debounced(ctx);

        self.ingest_controller.sync_with_all_ingesters(&self.model);

        ctx.schedule_self_msg(CONTROL_PLAN_LOOP_INTERVAL, ControlPlanLoop);

        let weak_mailbox = ctx.mailbox().downgrade();
        let cluster_change_stream = self
            .cluster_change_stream_opt
            .take()
            .expect("`initialize` should be called only once");
        spawn_watch_indexers_task(weak_mailbox, cluster_change_stream);
        let _ = self.readiness_tx.send(true);
        Ok(())
    }
}

impl ControlPlane {
    async fn auto_create_indexes(
        &mut self,
        subrequests: &[GetOrCreateOpenShardsSubrequest],
        progress: &Progress,
    ) -> MetastoreResult<()> {
        if !self.cluster_config.auto_create_indexes {
            return Ok(());
        }
        let mut index_ids = Vec::new();

        for subrequest in subrequests {
            if self.model.index_uid(&subrequest.index_id).is_none() {
                index_ids.push(subrequest.index_id.clone());
            }
        }
        if index_ids.is_empty() {
            return Ok(());
        }
        let find_index_template_matches_request = FindIndexTemplateMatchesRequest { index_ids };
        let find_index_template_matches_response = progress
            .protect_future(
                self.metastore
                    .find_index_template_matches(find_index_template_matches_request),
            )
            .await?;

        let mut create_index_futures = FuturesUnordered::new();

        for index_template_match in find_index_template_matches_response.matches {
            // TODO: It's a bit brutal to fail the entire operation if applying a single index
            // template fails. We should return a partial failure instead for the subrequest. I
            // want to do so in an upcoming refactor where the `GetOrCreateOpenShardsRequest` will
            // be processed in multiple steps in a dedicated workbench.
            let index_config = apply_index_template_match(
                index_template_match,
                &self.cluster_config.default_index_root_uri,
            )?;
            // We disable ingest V1 for index templates.
            let source_configs = [SourceConfig::ingest_v2(), SourceConfig::cli()];

            let create_index_request = CreateIndexRequest::try_from_index_and_source_configs(
                &index_config,
                &source_configs,
            )?;
            let create_index_future = {
                let metastore = self.metastore.clone();
                async move { metastore.create_index(create_index_request).await }
            };
            create_index_futures.push(create_index_future);
        }
        while let Some(create_index_response_result) =
            progress.protect_future(create_index_futures.next()).await
        {
            // Same here.
            let create_index_response = create_index_response_result?;
            let index_metadata = create_index_response.deserialize_index_metadata()?;
            self.model.add_index(index_metadata);
        }
        Ok(())
    }

    /// Deletes a set of shards from the metastore and the control plane model.
    ///
    /// If the shards were already absent this operation is considered successful.
    async fn delete_shards(
        &mut self,
        source_uid: &SourceUid,
        shard_ids: &[ShardId],
        progress: &Progress,
    ) -> anyhow::Result<()> {
        debug!(
            index_uid=%source_uid.index_uid,
            source_id=%source_uid.source_id,
            shard_ids=%shard_ids.pretty_display(),
            "deleting shards"
        );
        let delete_shards_request = DeleteShardsRequest {
            index_uid: Some(source_uid.index_uid.clone()),
            source_id: source_uid.source_id.clone(),
            shard_ids: shard_ids.to_vec(),
            force: false,
        };
        // We use a tiny bit different strategy here than for other handlers
        // All metastore errors end up fail/respawn the control plane.
        //
        // This is because deleting shards is done in reaction to an event
        // and we do not really have the freedom to return an error to a caller like for other
        // calls: there is no caller.
        progress
            .protect_future(self.metastore.delete_shards(delete_shards_request))
            .await
            .context("failed to delete shards from metastore")?;

        self.model.delete_shards(source_uid, shard_ids);

        info!(
            index_uid=%source_uid.index_uid,
            source_id=%source_uid.source_id,
            shard_ids=%shard_ids.pretty_display(),
            "deleted shards"
        );
        Ok(())
    }

    fn debug_info(&self) -> JsonValue {
        // Build the union of ingesters tracked by ingester pool and the model.
        let mut ingesters: BTreeMap<NodeId, JsonValue> = BTreeMap::new();

        for (ingester_id, ingester) in self.ingest_controller.ingester_pool.keys_values() {
            let ingester_json = json!({
                "available": true,
                "status": ingester.status.as_json_str_name(),
            });
            ingesters.insert(ingester_id.clone(), ingester_json);
        }
        for shard in self.model.all_shards() {
            let ingester_id = NodeId::from(shard.leader_id.clone());

            if let Entry::Vacant(entry) = ingesters.entry(ingester_id.clone()) {
                let ingester_json = json!({
                    "available": false,
                    "status": IngesterStatus::default(),
                });
                entry.insert(ingester_json);
            }
        }

        let physical_indexing_plan: Vec<JsonValue> = self
            .indexing_scheduler
            .observable_state()
            .last_applied_physical_plan
            .map(|plan| {
                plan.indexing_tasks_per_indexer()
                    .iter()
                    .map(|(node_id, tasks)| {
                        json!({
                            "node_id": node_id.clone(),
                            "tasks": tasks.clone(),
                        })
                    })
                    .collect()
            })
            .unwrap_or_default();

        let mut per_index_and_leader_shards_json: BTreeMap<
            IndexUid,
            BTreeMap<String, Vec<JsonValue>>,
        > = BTreeMap::new();

        for (source_uid, shard_entries) in self.model.all_shards_with_source() {
            for shard_entry in shard_entries {
                let shard_json = json!({
                    "index_uid": source_uid.index_uid,
                    "source_id": source_uid.source_id,
                    "shard_id": shard_entry.shard_id,
                    "shard_state": shard_entry.shard_state().as_json_str_name(),
                    "leader_id": shard_entry.leader_id,
                    "follower_id": shard_entry.follower_id,
                    "publish_position_inclusive": shard_entry.publish_position_inclusive(),
                });
                per_index_and_leader_shards_json
                    .entry(source_uid.index_uid.clone())
                    .or_default()
                    .entry(shard_entry.leader_id.clone())
                    .or_default()
                    .push(shard_json);
            }
        }
        json!({
            "ingesters": ingesters,
            "physical_indexing_plan": physical_indexing_plan,
            "shard_table": per_index_and_leader_shards_json,
        })
    }

    /// Rebuilds the indexing plan.
    ///
    /// This method includes some debouncing logic. Every call will be followed by a cooldown
    /// period.
    ///
    /// This method returns a future that can be awaited to ensure that the relevant rebuild plan
    /// operation has been executed.
    fn rebuild_plan_debounced(
        &mut self,
        ctx: &ActorContext<Self>,
    ) -> impl Future<Output = ()> + use<> {
        let next_rebuild_waiter = self
            .indexing_scheduler
            .next_rebuild_tracker
            .next_rebuild_waiter();
        self.rebuild_plan_debouncer
            .self_send_with_cooldown::<RebuildPlan>(ctx);
        next_rebuild_waiter
    }
}

#[async_trait]
impl Handler<RebuildPlan> for ControlPlane {
    type Reply = ();

    async fn handle(
        &mut self,
        _message: RebuildPlan,
        _ctx: &ActorContext<Self>,
    ) -> Result<(), ActorExitStatus> {
        self.indexing_scheduler.rebuild_plan(&self.model);
        Ok(())
    }
}

#[async_trait]
impl Handler<ShardPositionsUpdate> for ControlPlane {
    type Reply = ();

    async fn handle(
        &mut self,
        shard_positions_update: ShardPositionsUpdate,
        ctx: &ActorContext<Self>,
    ) -> Result<(), ActorExitStatus> {
        if enabled!(Level::DEBUG) {
            let pretty_positions: Vec<String> = shard_positions_update
                .updated_shard_positions
                .iter()
                .map(|(shard_id, position)| format!("{shard_id}:{}", position.pretty_display()))
                .sorted()
                .collect();

            debug!(
                index_uid=%shard_positions_update.source_uid.index_uid,
                source_id=%shard_positions_update.source_uid.source_id,
                positions=%pretty_positions.as_slice().pretty_display(),
                "received shard positions update"
            );
        }
        let Some(shard_entries) = self
            .model
            .get_shards_for_source_mut(&shard_positions_update.source_uid)
        else {
            // The source no longer exists.
            return Ok(());
        };

        let mut shard_ids_to_close = Vec::new();
        for (shard_id, position) in shard_positions_update.updated_shard_positions {
            if let Some(shard) = shard_entries.get_mut(&shard_id) {
                shard.publish_position_inclusive =
                    Some(shard.publish_position_inclusive().max(position.clone()));
                if position.is_eof() {
                    // identify shards that have reached EOF but have not yet been removed.
                    info!(
                        index_uid=%shard_positions_update.source_uid.index_uid,
                        source_id=%shard_positions_update.source_uid.source_id,
                        %shard_id,
                        position=%position.pretty_display(),
                        "received shard eof via gossip"
                    );
                    shard_ids_to_close.push(shard_id);
                }
            }
        }
        if shard_ids_to_close.is_empty() {
            return Ok(());
        }
        self.delete_shards(
            &shard_positions_update.source_uid,
            &shard_ids_to_close,
            ctx.progress(),
        )
        .await?;
        let _rebuild_plan_waiter = self.rebuild_plan_debounced(ctx);
        Ok(())
    }
}

#[async_trait]
impl Handler<ControlPlanLoop> for ControlPlane {
    type Reply = ();

    async fn handle(
        &mut self,
        _message: ControlPlanLoop,
        ctx: &ActorContext<Self>,
    ) -> Result<(), ActorExitStatus> {
        if self.disable_control_loop {
            return Ok(());
        }
        if let Err(metastore_error) = self
            .ingest_controller
            .rebalance_shards(&mut self.model, ctx.mailbox(), ctx.progress())
            .await
        {
            return convert_metastore_error::<()>(metastore_error).map(|_| ());
        }
        self.indexing_scheduler.control_running_plan(&self.model);
        ctx.schedule_self_msg(CONTROL_PLAN_LOOP_INTERVAL, ControlPlanLoop);
        Ok(())
    }
}

/// This function converts a metastore error into an actor error.
///
/// If the metastore error is implying the transaction has not been
/// successful, then we do not need to restart the metastore.
/// If the metastore error does not let us know whether the transaction was
/// successful or not, we need to restart the actor and have it load its state from
/// the metastore.
///
/// This function also logs errors.
fn convert_metastore_error<T>(
    metastore_error: MetastoreError,
) -> Result<ControlPlaneResult<T>, ActorExitStatus> {
    // If true, we know that the transactions has not been recorded in the Metastore.
    // If false, we simply are not sure whether the transaction has been recorded or not.
    let is_transaction_certainly_aborted = metastore_error.is_transaction_certainly_aborted();
    if is_transaction_certainly_aborted {
        // If the metastore transaction is certain to have been aborted,
        // this is actually a good thing.
        // We do not need to restart the control plane.
        if !matches!(metastore_error, MetastoreError::AlreadyExists(_)) {
            // This is not always an error to attempt to create an object that already exists.
            // In particular, we create two otel indexes on startup.
            // It will be up to the client to decide what to do there.
            error!(err=?metastore_error, transaction_outcome="aborted", "metastore error");
        }
        crate::metrics::CONTROL_PLANE_METRICS
            .metastore_error_aborted
            .inc();
        Ok(Err(ControlPlaneError::Metastore(metastore_error)))
    } else {
        // If the metastore transaction may have been executed, we need to restart the control plane
        // so that it gets resynced with the metastore state.
        error!(error=?metastore_error, transaction_outcome="maybe-executed", "metastore error");
        crate::metrics::CONTROL_PLANE_METRICS
            .metastore_error_maybe_executed
            .inc();
        Err(ActorExitStatus::from(anyhow::anyhow!(metastore_error)))
    }
}

// This handler is a metastore call proxied through the control plane: we must first forward the
// request to the metastore, and then act on the event.
#[async_trait]
impl DeferableReplyHandler<CreateIndexRequest> for ControlPlane {
    type Reply = ControlPlaneResult<CreateIndexResponse>;

    async fn handle_message(
        &mut self,
        request: CreateIndexRequest,
        reply: impl FnOnce(Self::Reply) + Send + Sync + 'static,
        ctx: &ActorContext<Self>,
    ) -> Result<(), ActorExitStatus> {
        debug!("creating index");

        let response = match ctx
            .protect_future(self.metastore.create_index(request))
            .await
        {
            Ok(response) => response,
            Err(metastore_error) => {
                reply(convert_metastore_error(metastore_error)?);
                return Ok(());
            }
        };
        let index_metadata = match response.deserialize_index_metadata() {
            Ok(index_metadata) => index_metadata,
            Err(serde_error) => {
                error!(error=?serde_error, "failed to deserialize index metadata");
                return Err(ActorExitStatus::from(anyhow::anyhow!(serde_error)));
            }
        };
        let index_uid = index_metadata.index_uid.clone();

        // Now, create index can also add sources to support creating indexes automatically from
        // index and source config templates.
        let should_rebuild_plan = !index_metadata.sources.is_empty();
        self.model.add_index(index_metadata);

        if should_rebuild_plan {
            let rebuild_plan_notifier = self.rebuild_plan_debounced(ctx);
            tokio::task::spawn(async move {
                rebuild_plan_notifier.await;
                reply(Ok(response));
            });
        } else {
            reply(Ok(response));
        }
        info!(%index_uid, "created index");
        Ok(())
    }
}

// This handler is a metastore call proxied through the control plane: we must first forward the
// request to the metastore, and then act on the event.
#[async_trait]
impl Handler<UpdateIndexRequest> for ControlPlane {
    type Reply = ControlPlaneResult<IndexMetadataResponse>;

    async fn handle(
        &mut self,
        request: UpdateIndexRequest,
        ctx: &ActorContext<Self>,
    ) -> Result<Self::Reply, ActorExitStatus> {
        let index_uid: IndexUid = request.index_uid().clone();
        debug!(%index_uid, "updating index");

        let response = match ctx
            .protect_future(self.metastore.update_index(request))
            .await
        {
            Ok(response) => response,
            Err(metastore_error) => {
                return convert_metastore_error(metastore_error);
            }
        };
        let index_metadata = match response.deserialize_index_metadata() {
            Ok(index_metadata) => index_metadata,
            Err(serde_error) => {
                error!(error=?serde_error, "failed to deserialize index metadata");
                return Err(ActorExitStatus::from(anyhow::anyhow!(serde_error)));
            }
        };
        if self
            .model
            .update_index_config(&index_uid, index_metadata.index_config)?
        {
            let _rebuild_plan_notifier = self.rebuild_plan_debounced(ctx);
        }
        info!(%index_uid, "updated index");
        Ok(Ok(response))
    }
}

// This handler is a metastore call proxied through the control plane: we must first forward the
// request to the metastore, and then act on the event.
#[async_trait]
impl Handler<DeleteIndexRequest> for ControlPlane {
    type Reply = ControlPlaneResult<EmptyResponse>;

    async fn handle(
        &mut self,
        request: DeleteIndexRequest,
        ctx: &ActorContext<Self>,
    ) -> Result<Self::Reply, ActorExitStatus> {
        let index_uid: IndexUid = request.index_uid().clone();
        debug!(%index_uid, "deleting index");

        if let Err(metastore_error) = ctx
            .protect_future(self.metastore.delete_index(request))
            .await
        {
            return convert_metastore_error(metastore_error);
        };
        let ingester_needing_resync: BTreeSet<NodeId> = self
            .model
            .list_shards_for_index(&index_uid)
            .flat_map(|shard_entry| shard_entry.ingesters())
            .map(|node_id_ref| node_id_ref.to_owned())
            .collect();

        self.model.delete_index(&index_uid);

        self.ingest_controller
            .sync_with_ingesters(&ingester_needing_resync, &self.model);

        // TODO: Refine the event. Notify index will have the effect to reload the entire state from
        // the metastore. We should update the state of the control plane.
        let _rebuild_plan_waiter = self.rebuild_plan_debounced(ctx);

        info!(%index_uid, "deleted index");
        let response = EmptyResponse {};
        Ok(Ok(response))
    }
}

// This handler is a metastore call proxied through the control plane: we must first forward the
// request to the metastore, and then act on the event.
#[async_trait]
impl Handler<AddSourceRequest> for ControlPlane {
    type Reply = ControlPlaneResult<EmptyResponse>;

    async fn handle(
        &mut self,
        request: AddSourceRequest,
        ctx: &ActorContext<Self>,
    ) -> Result<Self::Reply, ActorExitStatus> {
        let index_uid: IndexUid = request.index_uid().clone();
        let source_config: SourceConfig =
            match serde_utils::from_json_str(&request.source_config_json) {
                Ok(source_config) => source_config,
                Err(error) => {
                    error!(%error, "failed to deserialize source config");
                    return Ok(Err(ControlPlaneError::from(error)));
                }
            };
        let source_id = source_config.source_id.clone();
        debug!(%index_uid, source_id, "adding source");

        if let Err(error) = ctx.protect_future(self.metastore.add_source(request)).await {
            return Ok(Err(ControlPlaneError::from(error)));
        };
        self.model
            .add_source(&index_uid, source_config)
            .context("failed to add source")?;

        info!(%index_uid, source_id, "added source");

        // TODO: Refine the event. Notify index will have the effect to reload the entire state from
        // the metastore. We should update the state of the control plane.
        let _rebuild_plan_waiter = self.rebuild_plan_debounced(ctx);

        let response = EmptyResponse {};
        Ok(Ok(response))
    }
}

#[async_trait]
impl Handler<UpdateSourceRequest> for ControlPlane {
    type Reply = ControlPlaneResult<EmptyResponse>;

    async fn handle(
        &mut self,
        request: UpdateSourceRequest,
        ctx: &ActorContext<Self>,
    ) -> Result<Self::Reply, ActorExitStatus> {
        let index_uid: IndexUid = request.index_uid().clone();
        let source_config: SourceConfig =
            match serde_utils::from_json_str(&request.source_config_json) {
                Ok(source_config) => source_config,
                Err(error) => {
                    error!(%error, "failed to deserialize source config");
                    return Ok(Err(ControlPlaneError::from(error)));
                }
            };
        let source_id = source_config.source_id.clone();
        debug!(%index_uid, source_id, "updating source");

        if let Err(error) = ctx
            .protect_future(self.metastore.update_source(request))
            .await
        {
            return Ok(Err(ControlPlaneError::from(error)));
        };
        self.model
            .update_source(&index_uid, source_config)
            .context("failed to add source")?;

        // TODO: Refine the event. Notify index will have the effect to reload the entire state from
        // the metastore. We should update the state of the control plane.
        let _rebuild_plan_waiter = self.rebuild_plan_debounced(ctx);

        info!(%index_uid, source_id, "updated source");
        let response = EmptyResponse {};
        Ok(Ok(response))
    }
}

// This handler is a metastore call proxied through the control plane: we must first forward the
// request to the metastore, and then act on the event.
#[async_trait]
impl Handler<ToggleSourceRequest> for ControlPlane {
    type Reply = ControlPlaneResult<EmptyResponse>;

    async fn handle(
        &mut self,
        request: ToggleSourceRequest,
        ctx: &ActorContext<Self>,
    ) -> Result<Self::Reply, ActorExitStatus> {
        let index_uid: IndexUid = request.index_uid().clone();
        let source_id = request.source_id.clone();
        let enable = request.enable;
        debug!(%index_uid, source_id, enable, "toggling source");

        if let Err(error) = ctx
            .protect_future(self.metastore.toggle_source(request))
            .await
        {
            return Ok(Err(ControlPlaneError::from(error)));
        };

        let mutation_occurred = self
            .model
            .toggle_source(&index_uid, &source_id, enable)
            .context("failed to toggle source")?;

        if mutation_occurred {
            let _rebuild_plan_waiter = self.rebuild_plan_debounced(ctx);
        }
        info!(%index_uid, source_id, enabled=enable, "toggled source");
        let response = EmptyResponse {};
        Ok(Ok(response))
    }
}

// This handler is a metastore call proxied through the control plane: we must first forward the
// request to the metastore, and then act on the event.
#[async_trait]
impl Handler<DeleteSourceRequest> for ControlPlane {
    type Reply = ControlPlaneResult<EmptyResponse>;

    async fn handle(
        &mut self,
        request: DeleteSourceRequest,
        ctx: &ActorContext<Self>,
    ) -> Result<ControlPlaneResult<EmptyResponse>, ActorExitStatus> {
        let index_uid: IndexUid = request.index_uid().clone();
        let source_id = request.source_id.clone();
        debug!(%index_uid, source_id, "deleting source");

        let source_uid = SourceUid {
            index_uid: index_uid.clone(),
            source_id: source_id.clone(),
        };

        if let Err(metastore_error) = ctx
            .protect_future(self.metastore.delete_source(request))
            .await
        {
            // TODO If the metastore fails returns an error but somehow succeed deleting the source,
            // the control plane will restart and the shards will be remaining on the ingesters.
            //
            // This is tracked in #4274
            return convert_metastore_error(metastore_error);
        };

        let ingesters_needing_resync: BTreeSet<NodeId> =
            if let Some(shard_entries) = self.model.get_shards_for_source(&source_uid) {
                shard_entries
                    .values()
                    .flat_map(|shard_entry| shard_entry.ingesters())
                    .map(|node_id_ref| node_id_ref.to_owned())
                    .collect()
            } else {
                BTreeSet::new()
            };

        self.ingest_controller
            .sync_with_ingesters(&ingesters_needing_resync, &self.model);

        self.model.delete_source(&source_uid);
        let _rebuild_plan_waiter = self.rebuild_plan_debounced(ctx);

        info!(
            index_uid=%source_uid.index_uid,
            source_id=%source_uid.source_id,
            "deleted source"
        );
        let response = EmptyResponse {};
        Ok(Ok(response))
    }
}

#[async_trait]
impl Handler<PruneShardsRequest> for ControlPlane {
    type Reply = ControlPlaneResult<EmptyResponse>;

    async fn handle(
        &mut self,
        request: PruneShardsRequest,
        _ctx: &ActorContext<Self>,
    ) -> Result<ControlPlaneResult<EmptyResponse>, ActorExitStatus> {
        let interval = request
            .interval_secs
            .map(|interval_secs| Duration::from_secs(interval_secs as u64))
            .unwrap_or_else(|| PRUNE_SHARDS_DEFAULT_COOLDOWN_PERIOD);

        // A very basic debounce is enough here, missing one call to the pruning API is fine
        let status = self.prune_shard_cooldown.update(
            (
                request.index_uid().index_id.clone(),
                request.source_id.clone(),
            ),
            interval,
        );
        if let CooldownStatus::Ready = status
            && let Err(metastore_error) = self.metastore.prune_shards(request).await
        {
            return convert_metastore_error(metastore_error);
        };
        // Return ok regardless of whether the call was successful or debounced
        let response = EmptyResponse {};
        Ok(Ok(response))
    }
}

// This is neither a proxied call nor a metastore callback.
#[async_trait]
impl Handler<GetOrCreateOpenShardsRequest> for ControlPlane {
    type Reply = ControlPlaneResult<GetOrCreateOpenShardsResponse>;

    async fn handle(
        &mut self,
        request: GetOrCreateOpenShardsRequest,
        ctx: &ActorContext<Self>,
    ) -> Result<Self::Reply, ActorExitStatus> {
        if let Err(metastore_error) = self
            .auto_create_indexes(&request.subrequests, ctx.progress())
            .await
        {
            return convert_metastore_error(metastore_error);
        }
        match self
            .ingest_controller
            .get_or_create_open_shards(request, &mut self.model, ctx.progress())
            .await
        {
            Ok(response) => {
                let _rebuild_plan_waiter = self.rebuild_plan_debounced(ctx);
                Ok(Ok(response))
            }
            Err(metastore_error) => convert_metastore_error(metastore_error),
        }
    }
}

// This is neither a proxied call nor a metastore callback.
#[async_trait]
impl Handler<AdviseResetShardsRequest> for ControlPlane {
    type Reply = ControlPlaneResult<AdviseResetShardsResponse>;

    async fn handle(
        &mut self,
        request: AdviseResetShardsRequest,
        _ctx: &ActorContext<Self>,
    ) -> Result<Self::Reply, ActorExitStatus> {
        let response = self
            .ingest_controller
            .advise_reset_shards(request, &self.model);
        Ok(Ok(response))
    }
}

#[async_trait]
impl Handler<LocalShardsUpdate> for ControlPlane {
    type Reply = ControlPlaneResult<()>;

    async fn handle(
        &mut self,
        local_shards_update: LocalShardsUpdate,
        ctx: &ActorContext<Self>,
    ) -> Result<Self::Reply, ActorExitStatus> {
        if let Err(metastore_error) = self
            .ingest_controller
            .handle_local_shards_update(local_shards_update, &mut self.model, ctx.progress())
            .await
        {
            return convert_metastore_error(metastore_error);
        }
        let _rebuild_plan_waiter = self.rebuild_plan_debounced(ctx);
        Ok(Ok(()))
    }
}

#[derive(Debug)]
pub struct GetDebugInfo;

#[async_trait]
impl Handler<GetDebugInfo> for ControlPlane {
    type Reply = JsonValue;

    async fn handle(
        &mut self,
        _: GetDebugInfo,
        _ctx: &ActorContext<Self>,
    ) -> Result<Self::Reply, ActorExitStatus> {
        Ok(self.debug_info())
    }
}

#[derive(Clone)]
pub struct ControlPlaneEventSubscriber(WeakMailbox<ControlPlane>);

impl ControlPlaneEventSubscriber {
    pub fn new(weak_control_plane_mailbox: WeakMailbox<ControlPlane>) -> Self {
        Self(weak_control_plane_mailbox)
    }
}

#[async_trait]
impl EventSubscriber<LocalShardsUpdate> for ControlPlaneEventSubscriber {
    async fn handle_event(&mut self, local_shards_update: LocalShardsUpdate) {
        if let Some(control_plane_mailbox) = self.0.upgrade()
            && let Err(error) = control_plane_mailbox
                .send_message(local_shards_update)
                .await
        {
            error!(%error, "failed to forward local shards update to control plane");
        }
    }
}

#[async_trait]
impl EventSubscriber<ShardPositionsUpdate> for ControlPlaneEventSubscriber {
    async fn handle_event(&mut self, shard_positions_update: ShardPositionsUpdate) {
        if let Some(control_plane_mailbox) = self.0.upgrade()
            && let Err(error) = control_plane_mailbox
                .send_message(shard_positions_update)
                .await
        {
            error!(%error, "failed to forward shard positions update to control plane");
        }
    }
}

fn apply_index_template_match(
    index_template_match: IndexTemplateMatch,
    default_index_root_uri: &Uri,
) -> MetastoreResult<IndexConfig> {
    let index_template: IndexTemplate =
        serde_utils::from_json_str(&index_template_match.index_template_json)?;
    let index_config = index_template
        .apply_template(index_template_match.index_id, default_index_root_uri)
        .map_err(|error| MetastoreError::Internal {
            message: "failed to apply index template".to_string(),
            cause: error.to_string(),
        })?;
    Ok(index_config)
}

#[derive(Debug)]
struct RebalanceShards;

#[async_trait]
impl Handler<RebalanceShards> for ControlPlane {
    type Reply = ();

    async fn handle(
        &mut self,
        _message: RebalanceShards,
        ctx: &ActorContext<Self>,
    ) -> Result<Self::Reply, ActorExitStatus> {
        if let Err(error) = self
            .ingest_controller
            .rebalance_shards(&mut self.model, ctx.mailbox(), ctx.progress())
            .await
        {
            return convert_metastore_error::<()>(error).map(|_| ());
        };
        self.indexing_scheduler.rebuild_plan(&self.model);
        Ok(())
    }
}

#[async_trait]
impl Handler<RebalanceShardsCallback> for ControlPlane {
    type Reply = ();

    async fn handle(
        &mut self,
        message: RebalanceShardsCallback,
        _ctx: &ActorContext<Self>,
    ) -> Result<Self::Reply, ActorExitStatus> {
        let num_closed_shards = message.closed_shards.len();
        debug!("closing {num_closed_shards} shards after rebalance");

        for closed_shard in message.closed_shards {
            let shard_id = closed_shard.shard_id().clone();
            let source_uid = SourceUid {
                index_uid: closed_shard.index_uid().clone(),
                source_id: closed_shard.source_id,
            };
            self.model.close_shards(&source_uid, &[shard_id]);
        }
        // We drop the rebalance guard explicitly here to put some emphasis on where the rebalance
        // lock is released.
        drop(message.rebalance_guard);
        Ok(())
    }
}

fn spawn_watch_indexers_task(
    weak_mailbox: WeakMailbox<ControlPlane>,
    cluster_change_stream: ClusterChangeStream,
) {
    tokio::spawn(watcher_indexers(weak_mailbox, cluster_change_stream));
}

async fn watcher_indexers(
    weak_mailbox: WeakMailbox<ControlPlane>,
    mut cluster_change_stream: ClusterChangeStream,
) {
    while let Some(cluster_change) = cluster_change_stream.next().await {
        let Some(mailbox) = weak_mailbox.upgrade() else {
            return;
        };

        // Ingesters have two readiness levels:
        // 1. Cluster connectivity: node is up and can reach the metastore (similar to other nodes)
        // 2. Shard readiness: IngesterStatus::Ready indicates the ingester can accept new shards
        // We rebalance shards when either readiness level changes.
        let mut trigger_rebalance = false;
        match cluster_change {
            ClusterChange::Add(node) if node.is_indexer() => {
                if node.ingester_status().is_ready() {
                    info!(
                        "indexer `{}` with status `{}` joined the cluster: rebalancing shards and \
                         rebuilding indexing plan",
                        node.node_id(),
                        node.ingester_status().as_json_str_name()
                    );
                    trigger_rebalance = true;
                }
            }
            ClusterChange::Remove(node) if node.is_indexer() => {
                info!(
                    "indexer `{}` left the cluster: rebalancing shards and rebuilding indexing \
                     plan",
                    node.node_id()
                );
                trigger_rebalance = true
            }
            ClusterChange::Update { previous, updated } if updated.is_indexer() => {
                let was_ready = previous.ingester_status().is_ready();
                let is_ready = updated.ingester_status().is_ready();

                if was_ready ^ is_ready {
                    info!(
                        "indexer `{}` status changed to `{}`: rebalancing shards and rebuilding \
                         indexing plan",
                        updated.node_id(),
                        updated.ingester_status().as_json_str_name()
                    );
                    trigger_rebalance = true;
                }
            }
            _ => {}
        }
        if trigger_rebalance && mailbox.send_message(RebalanceShards).await.is_err() {
            return;
        }
    }
}

#[cfg(test)]
mod tests {
    use std::num::NonZero;
    use std::sync::Arc;

    use mockall::Sequence;
    use quickwit_actors::{AskError, Observe, SupervisorMetrics};
    use quickwit_cluster::{ClusterChangeStreamFactoryForTest, ClusterNode};
    use quickwit_config::{
        CLI_SOURCE_ID, INGEST_V2_SOURCE_ID, IndexConfig, KafkaSourceParams, SourceParams,
    };
    use quickwit_indexing::IndexingService;
    use quickwit_ingest::IngesterPoolEntry;
    use quickwit_metastore::{
        CreateIndexRequestExt, IndexMetadata, ListIndexesMetadataResponseExt,
    };
    use quickwit_proto::control_plane::{
        GetOrCreateOpenShardsFailureReason, GetOrCreateOpenShardsSubrequest,
    };
    use quickwit_proto::indexing::{
        ApplyIndexingPlanRequest, ApplyIndexingPlanResponse, CpuCapacity, IndexingServiceClient,
        MockIndexingService,
    };
    use quickwit_proto::ingest::ingester::{
        IngesterServiceClient, IngesterStatus, InitShardSuccess, InitShardsResponse,
        MockIngesterService, RetainShardsResponse,
    };
    use quickwit_proto::ingest::{Shard, ShardPKey, ShardState};
    use quickwit_proto::metastore::{
        DeleteShardsResponse, EntityKind, FindIndexTemplateMatchesResponse,
        ListIndexesMetadataRequest, ListIndexesMetadataResponse, ListShardsRequest,
        ListShardsResponse, ListShardsSubresponse, MetastoreError, MockMetastoreService,
        OpenShardSubresponse, OpenShardsResponse, SourceType,
    };
    use quickwit_proto::types::{DocMappingUid, Position};
    use tokio::sync::Mutex;

    use super::*;
    use crate::IndexerNodeInfo;

    #[tokio::test]
    async fn test_control_plane_create_index() {
        let universe = Universe::with_accelerated_time();
        let self_node_id: NodeId = "test-node".into();
        let indexer_pool = IndexerPool::default();
        let ingester_pool = IngesterPool::default();

        let mut mock_metastore = MockMetastoreService::new();
        let index_uid: IndexUid = IndexUid::for_test("test-index", 0);
        let index_uid_clone = index_uid.clone();
        mock_metastore
            .expect_create_index()
            .withf(|create_index_request| {
                let index_config: IndexConfig =
                    create_index_request.deserialize_index_config().unwrap();
                assert_eq!(index_config.index_id, "test-index");
                assert_eq!(index_config.index_uri, "ram:///test-index");
                true
            })
            .returning(move |_| {
                let index_metadata = IndexMetadata::for_test("test-index", "ram:///test-index");
                let index_metadata_json = serde_json::to_string(&index_metadata).unwrap();
                let response = CreateIndexResponse {
                    index_uid: Some(index_uid_clone.clone()),
                    index_metadata_json,
                };
                Ok(response)
            });
        mock_metastore
            .expect_list_indexes_metadata()
            .returning(|_| Ok(ListIndexesMetadataResponse::for_test(Vec::new())));
        let cluster_config = ClusterConfig::for_test();
        let cluster_change_stream_factory = ClusterChangeStreamFactoryForTest::default();
        let (control_plane_mailbox, _control_plane_handle, _readiness_rx) = ControlPlane::spawn(
            &universe,
            cluster_config,
            self_node_id,
            cluster_change_stream_factory,
            indexer_pool,
            ingester_pool,
            MetastoreServiceClient::from_mock(mock_metastore),
        );
        let index_config = IndexConfig::for_test("test-index", "ram:///test-index");
        let create_index_request =
            CreateIndexRequest::try_from_index_config(&index_config).unwrap();
        let create_index_response = control_plane_mailbox
            .ask_for_res(create_index_request)
            .await
            .unwrap();
        assert_eq!(create_index_response.index_uid(), &index_uid);

        // TODO: Test that create index event is properly sent to ingest controller.

        universe.assert_quit().await;
    }

    #[tokio::test]
    async fn test_control_plane_delete_index() {
        let universe = Universe::with_accelerated_time();
        let self_node_id: NodeId = "test-node".into();
        let indexer_pool = IndexerPool::default();
        let ingester_pool = IngesterPool::default();

        let index_uid: IndexUid = IndexUid::for_test("test-index", 0);
        let mut mock_metastore = MockMetastoreService::new();
        let index_uid_clone = index_uid.clone();
        mock_metastore
            .expect_delete_index()
            .withf(move |delete_index_request| delete_index_request.index_uid() == &index_uid_clone)
            .returning(|_| Ok(EmptyResponse {}));
        mock_metastore
            .expect_list_indexes_metadata()
            .returning(|_| Ok(ListIndexesMetadataResponse::for_test(Vec::new())));

        let cluster_config = ClusterConfig::for_test();
        let cluster_change_stream_factory = ClusterChangeStreamFactoryForTest::default();
        let (control_plane_mailbox, _control_plane_handle, _readiness_rx) = ControlPlane::spawn(
            &universe,
            cluster_config,
            self_node_id,
            cluster_change_stream_factory,
            indexer_pool,
            ingester_pool,
            MetastoreServiceClient::from_mock(mock_metastore),
        );
        let delete_index_request = DeleteIndexRequest {
            index_uid: Some(index_uid),
        };
        control_plane_mailbox
            .ask_for_res(delete_index_request)
            .await
            .unwrap();

        // TODO: Test that delete index event is properly sent to ingest controller.

        universe.assert_quit().await;
    }

    #[tokio::test]
    async fn test_control_plane_add_source() {
        let universe = Universe::with_accelerated_time();
        let self_node_id: NodeId = "test-node".into();
        let indexer_pool = IndexerPool::default();
        let ingester_pool = IngesterPool::default();

        let mut index_metadata = IndexMetadata::for_test("test-index", "ram://test");
        index_metadata
            .add_source(SourceConfig::ingest_v2())
            .unwrap();

        let mut mock_metastore = MockMetastoreService::new();
        mock_metastore
            .expect_add_source()
            .withf(|add_source_request| {
                let source_config: SourceConfig =
                    serde_json::from_str(&add_source_request.source_config_json).unwrap();
                assert_eq!(source_config.source_id, "test-source");
                assert_eq!(source_config.source_type(), SourceType::Void);
                true
            })
            .return_once(|_| Ok(EmptyResponse {}));
        // the list_indexes_metadata and list_shards calls are made when the control plane starts
        mock_metastore
            .expect_list_indexes_metadata()
            .return_once(move |_| {
                Ok(ListIndexesMetadataResponse::for_test(vec![
                    index_metadata.clone(),
                ]))
            });
        mock_metastore
            .expect_list_shards()
            .return_once(move |_| Ok(ListShardsResponse::default()));

        let cluster_config = ClusterConfig::for_test();
        let cluster_change_stream_factory = ClusterChangeStreamFactoryForTest::default();
        let (control_plane_mailbox, _control_plane_handle, _readiness_rx) = ControlPlane::spawn(
            &universe,
            cluster_config,
            self_node_id,
            cluster_change_stream_factory,
            indexer_pool,
            ingester_pool,
            MetastoreServiceClient::from_mock(mock_metastore),
        );
        let index_uid: IndexUid = IndexUid::for_test("test-index", 0);
        let source_config = SourceConfig::for_test("test-source", SourceParams::void());
        let add_source_request = AddSourceRequest {
            index_uid: Some(index_uid),
            source_config_json: serde_json::to_string(&source_config).unwrap(),
        };
        control_plane_mailbox
            .ask_for_res(add_source_request)
            .await
            .unwrap();

        // TODO: Test that delete index event is properly sent to ingest controller.

        universe.assert_quit().await;
    }

    #[tokio::test]
    async fn test_control_plane_update_source() {
        let universe = Universe::with_accelerated_time();
        let pipelines_after_update = 3;
        let self_node_id: NodeId = "test-node".into();
        let indexer_pool = IndexerPool::default();
        let mut mock_indexer = MockIndexingService::new();
        // call when starting the cp
        mock_indexer
            .expect_apply_indexing_plan()
            .withf(|request| request.indexing_tasks.len() == 1)
            .return_once(|_| Ok(ApplyIndexingPlanResponse {}));
        // call after the update (3 tasks because 3 pipelines)
        mock_indexer
            .expect_apply_indexing_plan()
            .withf(move |request| request.indexing_tasks.len() == pipelines_after_update)
            .return_once(|_| Ok(ApplyIndexingPlanResponse {}));
        let indexer = IndexingServiceClient::from_mock(mock_indexer);
        let indexer_info = IndexerNodeInfo {
            node_id: self_node_id.clone(),
            generation_id: 0,
            client: indexer,
            indexing_tasks: Vec::new(),
            indexing_capacity: CpuCapacity::from_cpu_millis(1_000),
        };
        indexer_pool.insert(self_node_id.clone(), indexer_info);

        let ingester_pool = IngesterPool::default();

        let mut index_metadata = IndexMetadata::for_test("test-index", "ram://tata");
        index_metadata
            .add_source(SourceConfig::ingest_v2())
            .unwrap();

        let mut test_source_config = SourceConfig::for_test(
            "test-source",
            SourceParams::Kafka(KafkaSourceParams {
                topic: "test-topic".to_string(),
                client_log_level: None,
                enable_backfill_mode: false,
                client_params: json!({}),
            }),
        );
        index_metadata
            .add_source(test_source_config.clone())
            .unwrap();

        let mut mock_metastore = MockMetastoreService::new();
        mock_metastore
            .expect_update_source()
            .withf(move |update_source_request| {
                let source_config: SourceConfig =
                    serde_json::from_str(&update_source_request.source_config_json).unwrap();
                assert_eq!(source_config.source_id, "test-source");
                assert_eq!(source_config.source_type(), SourceType::Kafka);
                assert_eq!(
                    source_config.num_pipelines,
                    NonZero::new(pipelines_after_update).unwrap()
                );
                true
            })
            .return_once(|_| Ok(EmptyResponse {}));
        // the list_indexes_metadata and list_shards calls are made when the control plane starts
        mock_metastore
            .expect_list_indexes_metadata()
            .return_once(move |_| {
                Ok(ListIndexesMetadataResponse::for_test(vec![
                    index_metadata.clone(),
                ]))
            });
        mock_metastore
            .expect_list_shards()
            .return_once(move |_| Ok(ListShardsResponse::default()));

        let cluster_config = ClusterConfig::for_test();
        let cluster_change_stream_factory = ClusterChangeStreamFactoryForTest::default();
        let (control_plane_mailbox, _control_plane_handle, _readiness_rx) = ControlPlane::spawn(
            &universe,
            cluster_config,
            self_node_id,
            cluster_change_stream_factory,
            indexer_pool,
            ingester_pool,
            MetastoreServiceClient::from_mock(mock_metastore),
        );
        let index_uid: IndexUid = IndexUid::for_test("test-index", 0);
        test_source_config.num_pipelines = NonZero::new(pipelines_after_update).unwrap();
        let update_source_request = UpdateSourceRequest {
            index_uid: Some(index_uid),
            source_config_json: serde_json::to_string(&test_source_config).unwrap(),
        };
        control_plane_mailbox
            .ask_for_res(update_source_request)
            .await
            .unwrap();

        universe.assert_quit().await;
    }

    #[tokio::test]
    async fn test_control_plane_toggle_source() {
        let universe = Universe::with_accelerated_time();
        let self_node_id: NodeId = "test-node".into();
        let indexer_pool = IndexerPool::default();
        let ingester_pool = IngesterPool::default();

        let mut index_metadata = IndexMetadata::for_test("test-index", "ram://toto");
        index_metadata
            .add_source(SourceConfig::ingest_v2())
            .unwrap();

        let test_source_config = SourceConfig::for_test("test-source", SourceParams::void());
        index_metadata.add_source(test_source_config).unwrap();

        let mut mock_metastore = MockMetastoreService::new();
        mock_metastore
            .expect_list_indexes_metadata()
            .return_once(|_| Ok(ListIndexesMetadataResponse::for_test(vec![index_metadata])));
        mock_metastore
            .expect_list_shards()
            .return_once(move |_| Ok(ListShardsResponse::default()));

        let index_uid = IndexUid::for_test("test-index", 0);
        let index_uid_clone = index_uid.clone();
        mock_metastore
            .expect_toggle_source()
            .times(1)
            .return_once(move |toggle_source_request| {
                assert_eq!(toggle_source_request.index_uid(), &index_uid_clone);
                assert_eq!(toggle_source_request.source_id, "test-source");
                Ok(EmptyResponse {})
            });
        let index_uid_clone = index_uid.clone();
        mock_metastore
            .expect_toggle_source()
            .times(1)
            .return_once(move |toggle_source_request| {
                assert_eq!(toggle_source_request.index_uid(), &index_uid_clone);
                assert_eq!(toggle_source_request.source_id, "test-source");
                assert!(!toggle_source_request.enable);
                Ok(EmptyResponse {})
            });

        let cluster_config = ClusterConfig::for_test();
        let cluster_change_stream_factory = ClusterChangeStreamFactoryForTest::default();
        let (control_plane_mailbox, _control_plane_handle, _readiness_rx) = ControlPlane::spawn(
            &universe,
            cluster_config,
            self_node_id,
            cluster_change_stream_factory,
            indexer_pool,
            ingester_pool,
            MetastoreServiceClient::from_mock(mock_metastore),
        );
        let enable_source_request = ToggleSourceRequest {
            index_uid: Some(index_uid.clone()),
            source_id: "test-source".to_string(),
            enable: true,
        };
        control_plane_mailbox
            .ask_for_res(enable_source_request)
            .await
            .unwrap();

        let disable_source_request = ToggleSourceRequest {
            index_uid: Some(index_uid),
            source_id: "test-source".to_string(),
            enable: false,
        };
        control_plane_mailbox
            .ask_for_res(disable_source_request)
            .await
            .unwrap();

        universe.assert_quit().await;
    }

    #[tokio::test]
    async fn test_control_plane_delete_source() {
        let universe = Universe::with_accelerated_time();
        let self_node_id: NodeId = "test-node".into();
        let indexer_pool = IndexerPool::default();
        let ingester_pool = IngesterPool::default();

        let mut mock_metastore = MockMetastoreService::new();
        let index_uid: IndexUid = IndexUid::for_test("test-index", 0);
        let index_uid_clone = index_uid.clone();
        mock_metastore
            .expect_delete_source()
            .withf(move |delete_source_request| {
                assert_eq!(delete_source_request.index_uid(), &index_uid_clone);
                assert_eq!(delete_source_request.source_id, "test-source");
                true
            })
            .returning(|_| Ok(EmptyResponse {}));
        mock_metastore
            .expect_list_indexes_metadata()
            .returning(|_| Ok(ListIndexesMetadataResponse::for_test(Vec::new())));

        let cluster_config = ClusterConfig::for_test();
        let cluster_change_stream_factory = ClusterChangeStreamFactoryForTest::default();
        let (control_plane_mailbox, _control_plane_handle, _readiness_rx) = ControlPlane::spawn(
            &universe,
            cluster_config,
            self_node_id,
            cluster_change_stream_factory,
            indexer_pool,
            ingester_pool,
            MetastoreServiceClient::from_mock(mock_metastore),
        );
        let delete_source_request = DeleteSourceRequest {
            index_uid: Some(index_uid),
            source_id: "test-source".to_string(),
        };
        control_plane_mailbox
            .ask_for_res(delete_source_request)
            .await
            .unwrap();

        // TODO: Test that delete index event is properly sent to ingest controller.

        universe.assert_quit().await;
    }

    #[tokio::test]
    async fn test_control_plane_get_or_create_open_shards() {
        let universe = Universe::with_accelerated_time();
        let self_node_id: NodeId = "test-node".into();
        let indexer_pool = IndexerPool::default();

        let ingester_pool = IngesterPool::default();

        let mut mock_metastore = MockMetastoreService::new();
        let index_uid: IndexUid = IndexUid::for_test("test-index", 0);
        mock_metastore
            .expect_list_indexes_metadata()
            .returning(|_| {
                let mut index_metadata = IndexMetadata::for_test("test-index", "ram:///test-index");
                let mut source_config = SourceConfig::ingest_v2();
                source_config.enabled = true;
                index_metadata.add_source(source_config).unwrap();
                Ok(ListIndexesMetadataResponse::for_test(vec![index_metadata]))
            });
        let index_uid_clone = index_uid.clone();
        mock_metastore
            .expect_list_shards()
            .returning(move |request| {
                assert_eq!(request.subrequests.len(), 1);

                let subrequest = &request.subrequests[0];
                assert_eq!(subrequest.index_uid(), &index_uid_clone);
                assert_eq!(subrequest.source_id, INGEST_V2_SOURCE_ID);

                let subresponses = vec![ListShardsSubresponse {
                    index_uid: Some(index_uid_clone.clone()),
                    source_id: INGEST_V2_SOURCE_ID.to_string(),
                    shards: vec![Shard {
                        index_uid: Some(index_uid_clone.clone()),
                        source_id: INGEST_V2_SOURCE_ID.to_string(),
                        shard_id: Some(ShardId::from(1)),
                        shard_state: ShardState::Open as i32,
                        ..Default::default()
                    }],
                }];
                let response = ListShardsResponse { subresponses };
                Ok(response)
            });

        let cluster_config = ClusterConfig::for_test();
        let cluster_change_stream_factory = ClusterChangeStreamFactoryForTest::default();
        let (control_plane_mailbox, _control_plane_handle, _readiness_rx) = ControlPlane::spawn(
            &universe,
            cluster_config,
            self_node_id,
            cluster_change_stream_factory,
            indexer_pool,
            ingester_pool,
            MetastoreServiceClient::from_mock(mock_metastore),
        );
        let get_open_shards_request = GetOrCreateOpenShardsRequest {
            subrequests: vec![GetOrCreateOpenShardsSubrequest {
                subrequest_id: 0,
                index_id: "test-index".to_string(),
                source_id: INGEST_V2_SOURCE_ID.to_string(),
            }],
            closed_shards: Vec::new(),
            unavailable_leaders: Vec::new(),
        };
        let get_open_shards_response = control_plane_mailbox
            .ask_for_res(get_open_shards_request)
            .await
            .unwrap();
        assert_eq!(get_open_shards_response.successes.len(), 1);
        assert_eq!(get_open_shards_response.failures.len(), 0);

        let subresponse = &get_open_shards_response.successes[0];
        assert_eq!(subresponse.index_uid(), &index_uid);
        assert_eq!(subresponse.source_id, INGEST_V2_SOURCE_ID);
        assert_eq!(subresponse.open_shards.len(), 1);
        assert_eq!(subresponse.open_shards[0].shard_id(), ShardId::from(1));

        universe.assert_quit().await;
    }

    #[tokio::test]
    async fn test_control_plane_supervision_reload_from_metastore() {
        let universe = Universe::default();
        let node_id = NodeId::new("test_node".to_string());
        let indexer_pool = IndexerPool::default();
        let ingester_pool = IngesterPool::default();
        let mut mock_metastore = MockMetastoreService::new();

        let mut index_0 = IndexMetadata::for_test("test-index-0", "ram:///test-index-0");
        let source = SourceConfig::ingest_v2();
        index_0.add_source(source.clone()).unwrap();

        mock_metastore
            .expect_list_indexes_metadata()
            .times(2) // 1 for the first initialization, 1 after the respawn of the control plane.
            .returning(|list_indexes_request: ListIndexesMetadataRequest| {
                assert_eq!(list_indexes_request, ListIndexesMetadataRequest::all());
                Ok(ListIndexesMetadataResponse::for_test(Vec::new()))
            });
        mock_metastore.expect_list_shards().return_once(
            |_list_shards_request: ListShardsRequest| {
                let list_shards_resp = ListShardsResponse {
                    subresponses: Vec::new(),
                };
                Ok(list_shards_resp)
            },
        );
        let index_metadata = IndexMetadata::for_test("test-index", "ram:///test-index");
        let index_metadata_json = serde_json::to_string(&index_metadata).unwrap();

        mock_metastore.expect_create_index().times(1).return_once(
            |_create_index_request: CreateIndexRequest| {
                Ok(CreateIndexResponse {
                    index_uid: index_metadata.index_uid.into(),
                    index_metadata_json,
                })
            },
        );
        mock_metastore.expect_create_index().times(1).return_once(
            |create_index_request: CreateIndexRequest| {
                Err(MetastoreError::AlreadyExists(EntityKind::Index {
                    index_id: create_index_request
                        .deserialize_index_config()
                        .unwrap()
                        .index_id,
                }))
            },
        );
        mock_metastore.expect_create_index().times(1).return_once(
            |_create_index_request: CreateIndexRequest| {
                Err(MetastoreError::Connection {
                    message: "Fake connection error.".to_string(),
                })
            },
        );

        let cluster_config = ClusterConfig::for_test();
        let cluster_change_stream_factory = ClusterChangeStreamFactoryForTest::default();
        let (control_plane_mailbox, control_plane_handle, mut readiness_rx) = ControlPlane::spawn(
            &universe,
            cluster_config,
            node_id,
            cluster_change_stream_factory,
            indexer_pool,
            ingester_pool,
            MetastoreServiceClient::from_mock(mock_metastore),
        );
        tokio::time::timeout(
            Duration::from_secs(5),
            readiness_rx.wait_for(|readiness| *readiness),
        )
        .await
        .unwrap()
        .unwrap();

        let index_config = IndexConfig::for_test("test-index", "ram:///test-index");
        let create_index_request =
            CreateIndexRequest::try_from_index_config(&index_config).unwrap();

        // A happy path: we simply create the index.
        control_plane_mailbox
            .ask_for_res(create_index_request.clone())
            .await
            .unwrap();

        // Now let's see what happens if we attempt to create the same index a second time.
        let control_plane_error: ControlPlaneError = control_plane_mailbox
            .ask(create_index_request.clone())
            .await
            .unwrap()
            .unwrap_err();

        // That kind of error clearly indicates that the transaction has failed.
        // The control plane does not need to be restarted.
        assert!(
            matches!(control_plane_error, ControlPlaneError::Metastore(MetastoreError::AlreadyExists(entity)) if entity == EntityKind::Index { index_id: "test-index".to_string() })
        );

        control_plane_mailbox.ask(Observe).await.unwrap();

        assert_eq!(
            control_plane_handle
                .process_pending_and_observe()
                .await
                .metrics,
            SupervisorMetrics {
                num_panics: 0,
                num_errors: 0,
                num_kills: 0
            }
        );

        // Now let's see what happens with a grayer type of error.
        let control_plane_error: AskError<ControlPlaneError> = control_plane_mailbox
            .ask_for_res(create_index_request)
            .await
            .unwrap_err();
        assert!(matches!(control_plane_error, AskError::ProcessMessageError));

        // This time, the control plane is restarted.
        control_plane_mailbox.ask(Observe).await.unwrap();
        assert_eq!(
            control_plane_handle
                .process_pending_and_observe()
                .await
                .metrics,
            SupervisorMetrics {
                num_panics: 0,
                num_errors: 1,
                num_kills: 0
            }
        );

        universe.assert_quit().await;
    }

    #[tokio::test]
    async fn test_delete_shard_on_eof() {
        let universe = Universe::with_accelerated_time();
        let node_id = NodeId::new("test-control-plane".to_string());
        let indexer_pool = IndexerPool::default();
        let (client_mailbox, client_inbox) = universe.create_test_mailbox();
        let client = IndexingServiceClient::from_mailbox::<IndexingService>(client_mailbox);
        let indexer_node_info = IndexerNodeInfo {
            node_id: NodeId::new("test-indexer".to_string()),
            generation_id: 0,
            client,
            indexing_tasks: Vec::new(),
            indexing_capacity: CpuCapacity::from_cpu_millis(4_000),
        };
        indexer_pool.insert(indexer_node_info.node_id.clone(), indexer_node_info);
        let ingester_pool = IngesterPool::default();
        let mut mock_metastore = MockMetastoreService::new();

        let mut index_0 = IndexMetadata::for_test("test-index-0", "ram:///test-index-0");
        let mut source = SourceConfig::ingest_v2();
        source.enabled = true;
        index_0.add_source(source.clone()).unwrap();

        let index_0_clone = index_0.clone();
        mock_metastore.expect_list_indexes_metadata().return_once(
            move |list_indexes_request: ListIndexesMetadataRequest| {
                assert_eq!(list_indexes_request, ListIndexesMetadataRequest::all());
                Ok(ListIndexesMetadataResponse::for_test(vec![
                    index_0_clone.clone(),
                ]))
            },
        );
        let index_uid_clone = index_0.index_uid.clone();
        mock_metastore.expect_delete_shards().return_once(
            move |delete_shards_request: DeleteShardsRequest| {
                assert_eq!(delete_shards_request.index_uid(), &index_uid_clone);
                assert_eq!(delete_shards_request.source_id, INGEST_V2_SOURCE_ID);
                assert_eq!(delete_shards_request.shard_ids, [ShardId::from(17)]);
                assert!(!delete_shards_request.force);

                let response = DeleteShardsResponse {
                    index_uid: delete_shards_request.index_uid,
                    source_id: delete_shards_request.source_id,
                    successes: delete_shards_request.shard_ids,
                    failures: Vec::new(),
                };
                Ok(response)
            },
        );

        let mut shard = Shard {
            index_uid: Some(index_0.index_uid.clone()),
            source_id: INGEST_V2_SOURCE_ID.to_string(),
            shard_id: Some(ShardId::from(17)),
            leader_id: "test-ingester".to_string(),
            publish_position_inclusive: Some(Position::Beginning),
            ..Default::default()
        };
        shard.set_shard_state(ShardState::Open);

        let index_uid_clone = index_0.index_uid.clone();
        mock_metastore.expect_list_shards().return_once(
            move |_list_shards_request: ListShardsRequest| {
                let list_shards_resp = ListShardsResponse {
                    subresponses: vec![ListShardsSubresponse {
                        index_uid: Some(index_uid_clone),
                        source_id: INGEST_V2_SOURCE_ID.to_string(),
                        shards: vec![shard],
                    }],
                };
                Ok(list_shards_resp)
            },
        );

        let cluster_config = ClusterConfig::for_test();
        let cluster_change_stream_factory = ClusterChangeStreamFactoryForTest::default();
        let (control_plane_mailbox, _control_plane_handle, _readiness_rx) = ControlPlane::spawn(
            &universe,
            cluster_config,
            node_id,
            cluster_change_stream_factory,
            indexer_pool,
            ingester_pool,
            MetastoreServiceClient::from_mock(mock_metastore),
        );
        let source_uid = SourceUid {
            index_uid: index_0.index_uid.clone(),
            source_id: INGEST_V2_SOURCE_ID.to_string(),
        };

        // This update should not triggeer anything in the control plane.
        control_plane_mailbox
            .ask(ShardPositionsUpdate {
                source_uid: source_uid.clone(),
                updated_shard_positions: vec![(ShardId::from(17), Position::offset(1_000u64))],
            })
            .await
            .unwrap();

        let control_plane_obs: ControlPlaneObservableState =
            control_plane_mailbox.ask(Observe).await.unwrap();
        let last_applied_physical_plan = control_plane_obs
            .indexing_scheduler
            .last_applied_physical_plan
            .unwrap();
        let indexing_tasks = last_applied_physical_plan
            .indexing_tasks_per_indexer()
            .get("test-indexer")
            .unwrap();
        assert_eq!(indexing_tasks.len(), 1);
        assert_eq!(indexing_tasks[0].shard_ids, [ShardId::from(17)]);

        let control_plane_debug_info = control_plane_mailbox.ask(GetDebugInfo).await.unwrap();
        let shard = &control_plane_debug_info["shard_table"]
            ["test-index-0:00000000000000000000000000"]["test-ingester"][0];
        assert_eq!(shard["shard_id"], "00000000000000000017");
        assert_eq!(shard["publish_position_inclusive"], "00000000000000001000");

        let _ = client_inbox.drain_for_test();

        universe.sleep(Duration::from_secs(30)).await;
        // This update should trigger the deletion of the shard and a new indexing plan.
        control_plane_mailbox
            .ask(ShardPositionsUpdate {
                source_uid,
                updated_shard_positions: vec![(ShardId::from(17), Position::eof(1_000u64))],
            })
            .await
            .unwrap();

        let control_plane_obs: ControlPlaneObservableState =
            control_plane_mailbox.ask(Observe).await.unwrap();
        let last_applied_physical_plan = control_plane_obs
            .indexing_scheduler
            .last_applied_physical_plan
            .unwrap();
        let indexing_tasks = last_applied_physical_plan
            .indexing_tasks_per_indexer()
            .get("test-indexer")
            .unwrap();
        assert!(indexing_tasks.is_empty());

        let apply_plan_requests = client_inbox.drain_for_test_typed::<ApplyIndexingPlanRequest>();
        let last_apply_plan_request = apply_plan_requests.last().unwrap();
        assert!(last_apply_plan_request.indexing_tasks.is_empty());

        universe.assert_quit().await;
    }

    #[tokio::test]
    async fn test_fill_shard_table_position_from_metastore_on_startup() {
        let universe = Universe::with_accelerated_time();
        let node_id = NodeId::new("test-control-plane".to_string());
        let indexer_pool = IndexerPool::default();
        let (client_mailbox, _client_inbox) = universe.create_test_mailbox();
        let client = IndexingServiceClient::from_mailbox::<IndexingService>(client_mailbox);
        let indexer_node_info = IndexerNodeInfo {
            node_id: NodeId::new("test-indexer".to_string()),
            generation_id: 0,
            client,
            indexing_tasks: Vec::new(),
            indexing_capacity: CpuCapacity::from_cpu_millis(4_000),
        };
        indexer_pool.insert(indexer_node_info.node_id.clone(), indexer_node_info);
        let ingester_pool = IngesterPool::default();
        let mut mock_metastore = MockMetastoreService::new();

        let mut index_metadata = IndexMetadata::for_test("test-index", "ram:///test-index");
        let mut source_config = SourceConfig::ingest_v2();
        source_config.enabled = true;
        index_metadata.add_source(source_config.clone()).unwrap();

        let index_metadata_clone = index_metadata.clone();
        mock_metastore.expect_list_indexes_metadata().return_once(
            move |list_indexes_request: ListIndexesMetadataRequest| {
                assert_eq!(list_indexes_request, ListIndexesMetadataRequest::all());
                Ok(ListIndexesMetadataResponse::for_test(vec![
                    index_metadata_clone,
                ]))
            },
        );

        let mut shard = Shard {
            index_uid: Some(index_metadata.index_uid.clone()),
            source_id: INGEST_V2_SOURCE_ID.to_string(),
            shard_id: Some(ShardId::from(17)),
            leader_id: "test-ingester".to_string(),
            publish_position_inclusive: Some(Position::Offset(1234u64.into())),
            ..Default::default()
        };
        shard.set_shard_state(ShardState::Open);

        let index_uid_clone = index_metadata.index_uid.clone();
        mock_metastore.expect_list_shards().return_once(
            move |_list_shards_request: ListShardsRequest| {
                let list_shards_resp = ListShardsResponse {
                    subresponses: vec![ListShardsSubresponse {
                        index_uid: Some(index_uid_clone),
                        source_id: INGEST_V2_SOURCE_ID.to_string(),
                        shards: vec![shard],
                    }],
                };
                Ok(list_shards_resp)
            },
        );

        let cluster_config = ClusterConfig::for_test();
        let cluster_change_stream_factory = ClusterChangeStreamFactoryForTest::default();
        let (control_plane_mailbox, _control_plane_handle, _readiness_rx) = ControlPlane::spawn(
            &universe,
            cluster_config,
            node_id,
            cluster_change_stream_factory,
            indexer_pool,
            ingester_pool,
            MetastoreServiceClient::from_mock(mock_metastore),
        );
        let control_plane_debug_info = control_plane_mailbox.ask(GetDebugInfo).await.unwrap();
        let shard = &control_plane_debug_info["shard_table"]
            ["test-index:00000000000000000000000000"]["test-ingester"][0];
        assert_eq!(shard["shard_id"], "00000000000000000017");
        assert_eq!(shard["publish_position_inclusive"], "00000000000000001234");

        universe.assert_quit().await;
    }

    #[tokio::test]
    async fn test_delete_non_existing_shard() {
        quickwit_common::setup_logging_for_tests();
        let universe = Universe::default();
        let node_id = NodeId::new("test-control-plane".to_string());
        let indexer_pool = IndexerPool::default();
        let (client_mailbox, _client_inbox) = universe.create_test_mailbox();
        let client = IndexingServiceClient::from_mailbox::<IndexingService>(client_mailbox);
        let indexer_node_info = IndexerNodeInfo {
            node_id: NodeId::new("test-indexer".to_string()),
            generation_id: 0,
            client,
            indexing_tasks: Vec::new(),
            indexing_capacity: CpuCapacity::from_cpu_millis(4_000),
        };
        indexer_pool.insert(indexer_node_info.node_id.clone(), indexer_node_info);
        let ingester_pool = IngesterPool::default();
        let mut mock_metastore = MockMetastoreService::new();

        let mut index_0 = IndexMetadata::for_test("test-index-0", "ram:///test-index-0");
        let mut source = SourceConfig::ingest_v2();
        source.enabled = true;
        index_0.add_source(source.clone()).unwrap();

        let index_0_clone = index_0.clone();
        mock_metastore.expect_list_indexes_metadata().return_once(
            move |list_indexes_request: ListIndexesMetadataRequest| {
                assert_eq!(list_indexes_request, ListIndexesMetadataRequest::all());
                Ok(ListIndexesMetadataResponse::for_test(vec![
                    index_0_clone.clone(),
                ]))
            },
        );
        let index_uid_clone = index_0.index_uid.clone();
        mock_metastore.expect_delete_shards().return_once(
            move |delete_shards_request: DeleteShardsRequest| {
                assert_eq!(delete_shards_request.index_uid(), &index_uid_clone);
                assert_eq!(delete_shards_request.source_id, INGEST_V2_SOURCE_ID);
                assert_eq!(delete_shards_request.shard_ids, [ShardId::from(17)]);
                assert!(!delete_shards_request.force);

                let response = DeleteShardsResponse {
                    index_uid: delete_shards_request.index_uid,
                    source_id: delete_shards_request.source_id,
                    successes: delete_shards_request.shard_ids,
                    failures: Vec::new(),
                };
                Ok(response)
            },
        );

        let index_uid_clone = index_0.index_uid.clone();
        mock_metastore.expect_list_shards().return_once(
            move |_list_shards_request: ListShardsRequest| {
                let list_shards_resp = ListShardsResponse {
                    subresponses: vec![ListShardsSubresponse {
                        index_uid: Some(index_uid_clone),
                        source_id: INGEST_V2_SOURCE_ID.to_string(),
                        shards: Vec::new(),
                    }],
                };
                Ok(list_shards_resp)
            },
        );

        let cluster_config = ClusterConfig::for_test();
        let cluster_change_stream_factory = ClusterChangeStreamFactoryForTest::default();
        let (control_plane_mailbox, _control_plane_handle, _readiness_rx) = ControlPlane::spawn(
            &universe,
            cluster_config,
            node_id,
            cluster_change_stream_factory,
            indexer_pool,
            ingester_pool,
            MetastoreServiceClient::from_mock(mock_metastore),
        );
        let source_uid = SourceUid {
            index_uid: index_0.index_uid.clone(),
            source_id: INGEST_V2_SOURCE_ID.to_string(),
        };

        // This update should not triggeer anything in the control plane.
        control_plane_mailbox
            .ask(ShardPositionsUpdate {
                source_uid: source_uid.clone(),
                updated_shard_positions: vec![(ShardId::from(17), Position::eof(1_000u64))],
            })
            .await
            .unwrap();

        universe.assert_quit().await;
    }

    #[tokio::test]
    async fn test_delete_index() {
        quickwit_common::setup_logging_for_tests();
        let universe = Universe::default();
        let node_id = NodeId::new("test-control-plane".to_string());
        let indexer_pool = IndexerPool::default();

        let ingester_pool = IngesterPool::default();
        let mut mock_ingester = MockIngesterService::new();
        let mut seq = Sequence::new();

        let mut index_0 = IndexMetadata::for_test("test-index-0", "ram:///test-index-0");
        let mut source = SourceConfig::ingest_v2();
        source.enabled = true;
        index_0.add_source(source.clone()).unwrap();

        let index_uid_clone = index_0.index_uid.clone();
        let index_0_clone = index_0.clone();

        let mut mock_metastore = MockMetastoreService::new();
        mock_metastore
            .expect_list_indexes_metadata()
            .times(1)
            .in_sequence(&mut seq)
            .returning(move |list_indexes_request: ListIndexesMetadataRequest| {
                assert_eq!(list_indexes_request, ListIndexesMetadataRequest::all());
                Ok(ListIndexesMetadataResponse::for_test(vec![
                    index_0_clone.clone(),
                ]))
            });
        mock_metastore
            .expect_list_shards()
            .times(1)
            .in_sequence(&mut seq)
            .returning(move |_list_shards_request: ListShardsRequest| {
                let list_shards_resp = ListShardsResponse {
                    subresponses: vec![ListShardsSubresponse {
                        index_uid: Some(index_uid_clone.clone()),
                        source_id: INGEST_V2_SOURCE_ID.to_string(),
                        shards: vec![Shard {
                            index_uid: Some(index_uid_clone.clone()),
                            source_id: source.source_id.to_string(),
                            shard_id: Some(ShardId::from(15)),
                            leader_id: "node1".to_string(),
                            follower_id: None,
                            shard_state: ShardState::Open as i32,
                            doc_mapping_uid: Some(DocMappingUid::default()),
                            publish_position_inclusive: None,
                            publish_token: None,
                            update_timestamp: 1724158996,
                        }],
                    }],
                };
                Ok(list_shards_resp)
            });

        mock_ingester
            .expect_retain_shards()
            .times(1)
            .in_sequence(&mut seq)
            .returning(|request| {
                assert_eq!(request.retain_shards_for_sources.len(), 1);
                assert_eq!(
                    request.retain_shards_for_sources[0].shard_ids,
                    [ShardId::from(15)]
                );
                Ok(RetainShardsResponse {})
            });

        let index_uid_clone = index_0.index_uid.clone();
        mock_metastore
            .expect_delete_index()
            .times(1)
            .in_sequence(&mut seq)
            .returning(move |delete_index_request: DeleteIndexRequest| {
                assert_eq!(delete_index_request.index_uid(), &index_uid_clone);
                Ok(EmptyResponse {})
            });
        mock_ingester
            .expect_retain_shards()
            .times(1)
            .in_sequence(&mut seq)
            .returning(|mut request| {
                assert_eq!(request.retain_shards_for_sources.len(), 1);
                let retain_shards_for_source = request.retain_shards_for_sources.pop().unwrap();
                assert!(&retain_shards_for_source.shard_ids.is_empty());
                Ok(RetainShardsResponse {})
            });
        let ingester =
            IngesterPoolEntry::ready_with_client(IngesterServiceClient::from_mock(mock_ingester));
        ingester_pool.insert("node1".into(), ingester);

        let cluster_config = ClusterConfig::for_test();
        let cluster_change_stream_factory = ClusterChangeStreamFactoryForTest::default();
        let (control_plane_mailbox, _control_plane_handle, _readiness_rx) = ControlPlane::spawn(
            &universe,
            cluster_config,
            node_id,
            cluster_change_stream_factory,
            indexer_pool,
            ingester_pool,
            MetastoreServiceClient::from_mock(mock_metastore),
        );
        // This update should not trigger anything in the control plane.
        control_plane_mailbox
            .ask(DeleteIndexRequest {
                index_uid: Some(index_0.index_uid),
            })
            .await
            .unwrap()
            .unwrap();

        universe.assert_quit().await;
    }

    #[tokio::test]
    async fn test_delete_source() {
        quickwit_common::setup_logging_for_tests();
        let universe = Universe::default();
        let node_id = NodeId::new("test-control-plane".to_string());
        let indexer_pool = IndexerPool::default();

        let ingester_pool = IngesterPool::default();
        let mut mock_ingester = MockIngesterService::new();
        mock_ingester
            .expect_retain_shards()
            .times(2)
            .returning(|request| {
                assert_eq!(request.retain_shards_for_sources.len(), 1);
                assert_eq!(
                    request.retain_shards_for_sources[0].shard_ids,
                    [ShardId::from(15)]
                );
                Ok(RetainShardsResponse {})
            });
        let ingester =
            IngesterPoolEntry::ready_with_client(IngesterServiceClient::from_mock(mock_ingester));
        ingester_pool.insert("node1".into(), ingester);

        let mut index_0 = IndexMetadata::for_test("test-index-0", "ram:///test-index-0");
        let index_uid_clone = index_0.index_uid.clone();

        let mut mock_metastore = MockMetastoreService::new();
        mock_metastore.expect_delete_source().return_once(
            move |delete_source_request: DeleteSourceRequest| {
                assert_eq!(delete_source_request.index_uid(), &index_uid_clone);
                assert_eq!(&delete_source_request.source_id, INGEST_V2_SOURCE_ID);
                Ok(EmptyResponse {})
            },
        );

        let mut source = SourceConfig::ingest_v2();
        source.enabled = true;
        index_0.add_source(source.clone()).unwrap();

        let index_0_clone = index_0.clone();
        mock_metastore.expect_list_indexes_metadata().return_once(
            move |list_indexes_request: ListIndexesMetadataRequest| {
                assert_eq!(list_indexes_request, ListIndexesMetadataRequest::all());
                Ok(ListIndexesMetadataResponse::for_test(vec![
                    index_0_clone.clone(),
                ]))
            },
        );

        let index_uid_clone = index_0.index_uid.clone();
        mock_metastore.expect_list_shards().return_once(
            move |_list_shards_request: ListShardsRequest| {
                let list_shards_resp = ListShardsResponse {
                    subresponses: vec![ListShardsSubresponse {
                        index_uid: Some(index_uid_clone.clone()),
                        source_id: INGEST_V2_SOURCE_ID.to_string(),
                        shards: vec![Shard {
                            index_uid: Some(index_uid_clone),
                            source_id: source.source_id.to_string(),
                            shard_id: Some(ShardId::from(15)),
                            leader_id: "node1".to_string(),
                            follower_id: None,
                            shard_state: ShardState::Open as i32,
                            doc_mapping_uid: Some(DocMappingUid::default()),
                            publish_position_inclusive: None,
                            publish_token: None,
                            update_timestamp: 1724158996,
                        }],
                    }],
                };
                Ok(list_shards_resp)
            },
        );
        let cluster_config = ClusterConfig::for_test();
        let cluster_change_stream_factory = ClusterChangeStreamFactoryForTest::default();
        let (control_plane_mailbox, _control_plane_handle, _readiness_rx) = ControlPlane::spawn(
            &universe,
            cluster_config,
            node_id,
            cluster_change_stream_factory,
            indexer_pool,
            ingester_pool,
            MetastoreServiceClient::from_mock(mock_metastore),
        );
        // This update should not trigger anything in the control plane.
        control_plane_mailbox
            .ask(DeleteSourceRequest {
                index_uid: Some(index_0.index_uid),
                source_id: INGEST_V2_SOURCE_ID.to_string(),
            })
            .await
            .unwrap()
            .unwrap();

        universe.assert_quit().await;
    }

    #[tokio::test]
    async fn test_auto_create_indexes_on_get_or_create_open_shards_request() {
        let universe = Universe::default();

        let mut cluster_config = ClusterConfig::for_test();
        cluster_config.auto_create_indexes = true;

        let node_id = NodeId::from("test-node");
        let cluster_change_stream_factory = ClusterChangeStreamFactoryForTest::default();
        let indexer_pool = IndexerPool::default();
        let ingester_pool = IngesterPool::default();

        let mut mock_metastore = MockMetastoreService::new();

        mock_metastore
            .expect_list_indexes_metadata()
            .return_once(|_| Ok(ListIndexesMetadataResponse::for_test(Vec::new())));

        mock_metastore
            .expect_find_index_template_matches()
            .return_once(|request| {
                assert_eq!(request.index_ids, ["test-index-foo"]);

                let index_template =
                    IndexTemplate::for_test("test-template-foo", &["test-index-foo*"], 100);
                let index_template_json = serde_json::to_string(&index_template).unwrap();

                Ok(FindIndexTemplateMatchesResponse {
                    matches: vec![IndexTemplateMatch {
                        template_id: "test-template-foo".to_string(),
                        index_id: "test-index-foo".to_string(),
                        index_template_json,
                    }],
                })
            });

        mock_metastore.expect_create_index().return_once(|request| {
            let index_config = request.deserialize_index_config().unwrap();
            assert_eq!(index_config.index_id, "test-index-foo");
            assert_eq!(index_config.index_uri, "ram:///indexes/test-index-foo");

            let source_configs = request.deserialize_source_configs().unwrap();
            assert_eq!(source_configs.len(), 2);
            // assert_eq!(source_configs[0].source_id, INGEST_API_SOURCE_ID);
            assert_eq!(source_configs[0].source_id, INGEST_V2_SOURCE_ID);
            assert_eq!(source_configs[1].source_id, CLI_SOURCE_ID);

            let index_uid = IndexUid::for_test("test-index-foo", 0);
            let mut index_metadata = IndexMetadata::new_with_index_uid(index_uid, index_config);

            for source_config in source_configs {
                index_metadata.add_source(source_config).unwrap();
            }
            let index_metadata_json = serde_json::to_string(&index_metadata).unwrap();

            Ok(CreateIndexResponse {
                index_uid: index_metadata.index_uid.into(),
                index_metadata_json,
            })
        });

        let (control_plane_mailbox, _control_plane_handle, _readiness_rx) = ControlPlane::spawn(
            &universe,
            cluster_config,
            node_id,
            cluster_change_stream_factory,
            indexer_pool,
            ingester_pool,
            MetastoreServiceClient::from_mock(mock_metastore),
        );

        let response = control_plane_mailbox
            .ask(GetOrCreateOpenShardsRequest {
                subrequests: vec![GetOrCreateOpenShardsSubrequest {
                    subrequest_id: 0,
                    index_id: "test-index-foo".to_string(),
                    source_id: INGEST_V2_SOURCE_ID.to_string(),
                }],
                closed_shards: Vec::new(),
                unavailable_leaders: Vec::new(),
            })
            .await
            .unwrap()
            .unwrap();
        assert!(response.successes.is_empty());
        assert_eq!(response.failures.len(), 1);
        assert!(matches!(
            response.failures[0].reason(),
            GetOrCreateOpenShardsFailureReason::NoIngestersAvailable
        ));

        let control_plane_state = control_plane_mailbox.ask(Observe).await.unwrap();
        assert_eq!(control_plane_state.num_indexes, 1);
        assert_eq!(control_plane_state.num_sources, 1);

        universe.assert_quit().await;
    }

    #[tokio::test]
    async fn test_watch_indexers() {
        let universe = Universe::with_accelerated_time();
        let (control_plane_mailbox, control_plane_inbox) = universe.create_test_mailbox();
        let weak_control_plane_mailbox = control_plane_mailbox.downgrade();

        let cluster_change_stream_factory = ClusterChangeStreamFactoryForTest::default();
        let cluster_change_stream = cluster_change_stream_factory.create();
        spawn_watch_indexers_task(weak_control_plane_mailbox, cluster_change_stream);

        let cluster_change_stream_tx = cluster_change_stream_factory.change_stream_tx();

        // a non-indexer node status change doesn't trigger a shard rebalancing.
        let metastore_node = ClusterNode::for_test(
            "test-metastore",
            1515,
            false,
            &["metastore"],
            &[],
            IngesterStatus::Unspecified,
        )
        .await;
        let cluster_change = ClusterChange::Add(metastore_node);
        cluster_change_stream_tx.send(cluster_change).unwrap();

        tokio::time::sleep(Duration::from_millis(1)).await;
        assert!(
            control_plane_inbox
                .drain_for_test_typed::<RebalanceShards>()
                .is_empty()
        );

        // an indexer initializing doesn't trigger a shard rebalancing.
        let indexer_node_initializing: ClusterNode = ClusterNode::for_test(
            "test-indexer",
            1515,
            false,
            &["indexer"],
            &[],
            IngesterStatus::Initializing,
        )
        .await;
        let cluster_change = ClusterChange::Add(indexer_node_initializing);
        cluster_change_stream_tx.send(cluster_change).unwrap();

        tokio::time::sleep(Duration::from_millis(1)).await;
        assert!(
            control_plane_inbox
                .drain_for_test_typed::<RebalanceShards>()
                .is_empty()
        );

        // an indexer ready triggers a shard rebalancing.
        let indexer_node: ClusterNode = ClusterNode::for_test(
            "test-indexer",
            1515,
            false,
            &["indexer"],
            &[],
            IngesterStatus::Ready,
        )
        .await;
        let cluster_change = ClusterChange::Add(indexer_node.clone());
        cluster_change_stream_tx.send(cluster_change).unwrap();

        tokio::time::sleep(Duration::from_millis(1)).await;
        let RebalanceShards = control_plane_inbox.recv_typed_message().await.unwrap();

        // removing an indexer node triggers a shard rebalancing.
        let cluster_change = ClusterChange::Remove(indexer_node.clone());
        cluster_change_stream_tx.send(cluster_change).unwrap();

        tokio::time::sleep(Duration::from_millis(1)).await;
        let RebalanceShards = control_plane_inbox.recv_typed_message().await.unwrap();

        // a change in IngesterStatus readiness triggers a shard rebalancing.
        let node_ready = ClusterNode::for_test(
            "test-indexer",
            1515,
            false,
            &["indexer"],
            &[],
            IngesterStatus::Ready,
        )
        .await;
        let node_retiring = ClusterNode::for_test(
            "test-indexer",
            1515,
            false,
            &["indexer"],
            &[],
            IngesterStatus::Retiring,
        )
        .await;
        let cluster_change = ClusterChange::Update {
            previous: node_ready,
            updated: node_retiring,
        };
        cluster_change_stream_tx.send(cluster_change).unwrap();

        tokio::time::sleep(Duration::from_millis(1)).await;
        let RebalanceShards = control_plane_inbox.recv_typed_message().await.unwrap();

        universe.assert_quit().await;
    }

    #[tokio::test]
    async fn test_control_plane_rebuilds_plan_on_indexer_joins_or_leaves_the_cluster() {
        let universe = Universe::with_accelerated_time();

        let cluster_config = ClusterConfig::for_test();
        let node_id = NodeId::from("test-control-plane");
        let cluster_change_stream_factory = ClusterChangeStreamFactoryForTest::default();

        let indexer_pool = IndexerPool::default();
        let ingester_pool = IngesterPool::default();
        let mut mock_metastore = MockMetastoreService::new();
        mock_metastore
            .expect_list_indexes_metadata()
            .return_once(|_| Ok(ListIndexesMetadataResponse::for_test(Vec::new())));
        let metastore = MetastoreServiceClient::from_mock(mock_metastore);
        let disable_control_loop = true;
        let (_control_plane_mailbox, control_plane_handle, _readiness_rx) =
            ControlPlane::spawn_inner(
                &universe,
                cluster_config,
                node_id,
                cluster_change_stream_factory.clone(),
                indexer_pool.clone(),
                ingester_pool,
                metastore,
                disable_control_loop,
            );
        let cluster_change_stream_tx = cluster_change_stream_factory.change_stream_tx();
        let indexer_node: ClusterNode = ClusterNode::for_test(
            "test-indexer",
            1515,
            false,
            &["indexer"],
            &[],
            IngesterStatus::Ready,
        )
        .await;
        let cluster_change = ClusterChange::Add(indexer_node.clone());
        cluster_change_stream_tx.send(cluster_change).unwrap();

        universe.sleep(Duration::from_secs(10)).await;

        let ingest_controller_stats = control_plane_handle
            .process_pending_and_observe()
            .await
            .state_opt
            .as_ref()
            .unwrap()
            .ingest_controller;
        assert_eq!(ingest_controller_stats.num_rebalance_shards_ops, 1);

        let cluster_change = ClusterChange::Remove(indexer_node);
        cluster_change_stream_tx.send(cluster_change).unwrap();

        universe.sleep(Duration::from_secs(10)).await;

        let ingest_controller_stats = control_plane_handle
            .process_pending_and_observe()
            .await
            .state_opt
            .as_ref()
            .unwrap()
            .ingest_controller;
        assert_eq!(ingest_controller_stats.num_rebalance_shards_ops, 2);

        universe.assert_quit().await;
    }

    #[tokio::test]
    async fn test_control_plane_handles_rebalance_shards_callback() {
        let universe = Universe::with_accelerated_time();

        let cluster_config = ClusterConfig::for_test();
        let node_id = NodeId::from("test-control-plane");
        let cluster_change_stream_factory = ClusterChangeStreamFactoryForTest::default();

        let indexer_pool = IndexerPool::default();
        let ingester_pool = IngesterPool::default();
        let ingester_id = NodeId::from("test-ingester");
        let mut mock_ingester = MockIngesterService::new();
        mock_ingester
            .expect_retain_shards()
            .return_once(|_| Ok(RetainShardsResponse {}));
        mock_ingester.expect_init_shards().return_once(|request| {
            let shard = request.subrequests[0].shard().clone();
            let response = InitShardsResponse {
                successes: vec![InitShardSuccess {
                    subrequest_id: 0,
                    shard: Some(shard),
                }],
                failures: Vec::new(),
            };
            Ok(response)
        });
        let ingester =
            IngesterPoolEntry::ready_with_client(IngesterServiceClient::from_mock(mock_ingester));
        ingester_pool.insert(ingester_id, ingester);

        let mut mock_metastore = MockMetastoreService::new();
        mock_metastore
            .expect_list_indexes_metadata()
            .return_once(|_| Ok(ListIndexesMetadataResponse::for_test(Vec::new())));

        mock_metastore.expect_create_index().return_once(|request| {
            let index_config = request.deserialize_index_config().unwrap();
            let source_configs = request.deserialize_source_configs().unwrap();
            let mut index_metadata = IndexMetadata::new_with_index_uid(
                IndexUid::for_test(&index_config.index_id, 0),
                index_config,
            );
            for source_config in source_configs {
                index_metadata.add_source(source_config).unwrap();
            }
            let index_metadata_json = serde_json::to_string(&index_metadata).unwrap();
            let response = CreateIndexResponse {
                index_uid: Some(IndexUid::for_test("test-index", 0u128)),
                index_metadata_json,
            };
            Ok(response)
        });
        mock_metastore.expect_open_shards().return_once(|_| {
            let response = OpenShardsResponse {
                subresponses: vec![OpenShardSubresponse {
                    subrequest_id: 0,
                    open_shard: Some(Shard {
                        index_uid: Some(IndexUid::for_test("test-index", 0u128)),
                        source_id: INGEST_V2_SOURCE_ID.to_string(),
                        shard_id: Some(ShardId::from(0u64)),
                        leader_id: "test-ingester".to_string(),
                        follower_id: None,
                        shard_state: ShardState::Open as i32,
                        doc_mapping_uid: Some(DocMappingUid::default()),
                        publish_position_inclusive: Some(Position::Beginning),
                        publish_token: None,
                        update_timestamp: 1724158996,
                    }),
                }],
            };
            Ok(response)
        });
        let metastore = MetastoreServiceClient::from_mock(mock_metastore);
        let (control_plane_mailbox, _control_plane_handle, _readiness_rx) = ControlPlane::spawn(
            &universe,
            cluster_config,
            node_id,
            cluster_change_stream_factory.clone(),
            indexer_pool.clone(),
            ingester_pool,
            metastore,
        );
        let index_config = IndexConfig::for_test("test-index", "ram:///test-index");
        let mut source_config = SourceConfig::ingest_v2();
        source_config.enabled = true;

        let create_index_request =
            CreateIndexRequest::try_from_index_and_source_configs(&index_config, &[source_config])
                .unwrap();
        control_plane_mailbox
            .ask(create_index_request)
            .await
            .unwrap()
            .unwrap();

        let get_or_create_open_shards_request = GetOrCreateOpenShardsRequest {
            subrequests: vec![GetOrCreateOpenShardsSubrequest {
                subrequest_id: 0,
                index_id: "test-index".to_string(),
                source_id: INGEST_V2_SOURCE_ID.to_string(),
            }],
            closed_shards: Vec::new(),
            unavailable_leaders: Vec::new(),
        };
        control_plane_mailbox
            .ask(get_or_create_open_shards_request)
            .await
            .unwrap()
            .unwrap();

        let closed_shards = vec![
            ShardPKey {
                index_uid: Some(IndexUid::for_test("test-index", 0u128)),
                source_id: INGEST_V2_SOURCE_ID.to_string(),
                shard_id: Some(ShardId::from(0u64)),
            },
            ShardPKey {
                index_uid: Some(IndexUid::for_test("test-index", 0u128)),
                source_id: INGEST_V2_SOURCE_ID.to_string(),
                shard_id: Some(ShardId::from(1u64)),
            },
        ];
        let rebalance_lock = Arc::new(Mutex::new(()));
        let rebalance_guard = rebalance_lock.clone().lock_owned().await;
        let callback = RebalanceShardsCallback {
            closed_shards,
            rebalance_guard,
        };
        control_plane_mailbox.ask(callback).await.unwrap();

        let control_plane_debug_info = control_plane_mailbox.ask(GetDebugInfo).await.unwrap();
        let shard = &control_plane_debug_info["shard_table"]
            ["test-index:00000000000000000000000000"]["test-ingester"][0];
        assert_eq!(shard["shard_id"], "00000000000000000000");
        assert_eq!(shard["shard_state"], "closed");

        universe.assert_quit().await;
    }

    #[tokio::test]
    async fn test_control_plane_get_debug_info() {
        let universe = Universe::with_accelerated_time();

        let cluster_config = ClusterConfig::for_test();
        let node_id = NodeId::from("test-control-plane");
        let cluster_change_stream_factory = ClusterChangeStreamFactoryForTest::default();

        let indexer_pool = IndexerPool::default();
        let ingester_id = NodeId::from("test-ingester");

        let mut mock_indexer = MockIndexingService::new();
        mock_indexer
            .expect_apply_indexing_plan()
            .return_once(|_| Ok(ApplyIndexingPlanResponse {}));
        let indexer = IndexingServiceClient::from_mock(mock_indexer);

        let indexer_info = IndexerNodeInfo {
            node_id: ingester_id.clone(),
            generation_id: 0,
            client: indexer,
            indexing_tasks: Vec::new(),
            indexing_capacity: CpuCapacity::from_cpu_millis(1_000),
        };
        indexer_pool.insert(ingester_id.clone(), indexer_info);

        let ingester_pool = IngesterPool::default();
        let mut mock_ingester = MockIngesterService::new();
        mock_ingester
            .expect_retain_shards()
            .return_once(|_| Ok(RetainShardsResponse {}));
        mock_ingester.expect_init_shards().return_once(|request| {
            let shard = request.subrequests[0].shard().clone();
            let response = InitShardsResponse {
                successes: vec![InitShardSuccess {
                    subrequest_id: 0,
                    shard: Some(shard),
                }],
                failures: Vec::new(),
            };
            Ok(response)
        });
        let ingester =
            IngesterPoolEntry::ready_with_client(IngesterServiceClient::from_mock(mock_ingester));
        ingester_pool.insert(ingester_id, ingester);

        let mut mock_metastore = MockMetastoreService::new();
        mock_metastore
            .expect_list_indexes_metadata()
            .return_once(|_| Ok(ListIndexesMetadataResponse::for_test(Vec::new())));

        mock_metastore.expect_create_index().return_once(|request| {
            let index_config = request.deserialize_index_config().unwrap();
            let source_configs = request.deserialize_source_configs().unwrap();
            let mut index_metadata = IndexMetadata::new_with_index_uid(
                IndexUid::for_test(&index_config.index_id, 0),
                index_config,
            );
            for source_config in source_configs {
                index_metadata.add_source(source_config).unwrap();
            }
            let index_metadata_json = serde_json::to_string(&index_metadata).unwrap();
            let response = CreateIndexResponse {
                index_uid: Some(IndexUid::for_test("test-index", 0u128)),
                index_metadata_json,
            };
            Ok(response)
        });
        mock_metastore.expect_open_shards().return_once(|_| {
            let response = OpenShardsResponse {
                subresponses: vec![OpenShardSubresponse {
                    subrequest_id: 0,
                    open_shard: Some(Shard {
                        index_uid: Some(IndexUid::for_test("test-index", 0u128)),
                        source_id: INGEST_V2_SOURCE_ID.to_string(),
                        shard_id: Some(ShardId::from(0u64)),
                        leader_id: "test-ingester".to_string(),
                        follower_id: None,
                        shard_state: ShardState::Open as i32,
                        doc_mapping_uid: Some(DocMappingUid::default()),
                        publish_position_inclusive: Some(Position::Beginning),
                        publish_token: None,
                        update_timestamp: 1724158996,
                    }),
                }],
            };
            Ok(response)
        });
        let metastore = MetastoreServiceClient::from_mock(mock_metastore);
        let (control_plane_mailbox, _control_plane_handle, _readiness_rx) = ControlPlane::spawn(
            &universe,
            cluster_config,
            node_id,
            cluster_change_stream_factory.clone(),
            indexer_pool.clone(),
            ingester_pool,
            metastore,
        );
        let index_config = IndexConfig::for_test("test-index", "ram:///test-index");
        let mut source_config = SourceConfig::ingest_v2();
        source_config.enabled = true;

        let create_index_request =
            CreateIndexRequest::try_from_index_and_source_configs(&index_config, &[source_config])
                .unwrap();
        control_plane_mailbox
            .ask(create_index_request)
            .await
            .unwrap()
            .unwrap();

        let get_or_create_open_shards_request = GetOrCreateOpenShardsRequest {
            subrequests: vec![GetOrCreateOpenShardsSubrequest {
                subrequest_id: 0,
                index_id: "test-index".to_string(),
                source_id: INGEST_V2_SOURCE_ID.to_string(),
            }],
            closed_shards: Vec::new(),
            unavailable_leaders: Vec::new(),
        };
        control_plane_mailbox
            .ask(get_or_create_open_shards_request)
            .await
            .unwrap()
            .unwrap();

        let control_plane_debug_info = control_plane_mailbox.ask(GetDebugInfo).await.unwrap();

        assert_eq!(
            control_plane_debug_info["physical_indexing_plan"][0]["node_id"],
            "test-ingester"
        );
        let shard = &control_plane_debug_info["shard_table"]
            ["test-index:00000000000000000000000000"]["test-ingester"][0];
        assert_eq!(shard["index_uid"], "test-index:00000000000000000000000000");
        assert_eq!(shard["source_id"], INGEST_V2_SOURCE_ID);
        assert_eq!(shard["shard_id"], "00000000000000000000");
        assert_eq!(shard["shard_state"], "open");
        assert_eq!(shard["leader_id"], "test-ingester");
        assert_eq!(shard["follower_id"], JsonValue::Null);
        assert_eq!(
            shard["publish_position_inclusive"],
            json!(Position::Beginning)
        );

        universe.assert_quit().await;
    }
}


================================================
FILE: quickwit/quickwit-control-plane/src/cooldown_map.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::fmt::Debug;
use std::hash::Hash;
use std::num::NonZeroUsize;
use std::time::{Duration, Instant};

use lru::LruCache;

/// A map that keeps track of a cooldown deadline for each of its keys.
///
/// Internally it uses an [`LruCache`] to prune the oldest entries when the
/// capacity is reached. If the capacity is reached but the oldest entry is not
/// outdated, the capacity is extended (2x).
pub struct CooldownMap<K>(LruCache<K, Instant>);

#[derive(Debug, PartialEq)]
pub enum CooldownStatus {
    Ready,
    InCooldown,
}

impl<K: Hash + Eq> CooldownMap<K> {
    pub fn new(capacity: NonZeroUsize) -> Self {
        Self(LruCache::new(capacity))
    }

    /// Updates the deadline for the given key if it isn't currently in cooldown.
    ///
    /// The status returned is the one before the update (after an update, the
    /// status is always `InCooldown`).
    pub fn update(&mut self, key: K, cooldown_interval: Duration) -> CooldownStatus {
        let deadline_opt = self.0.get_mut(&key);
        let now = Instant::now();
        if let Some(deadline) = deadline_opt {
            if *deadline > now {
                CooldownStatus::InCooldown
            } else {
                *deadline = now + cooldown_interval;
                CooldownStatus::Ready
            }
        } else {
            let capacity: usize = self.0.cap().into();
            if self.0.len() == capacity
                && let Some((_, deadline)) = self.0.peek_lru()
                && *deadline > now
            {
                // the oldest entry is not outdated, grow the LRU
                self.0.resize(NonZeroUsize::new(capacity * 2).unwrap());
            }
            self.0.push(key, now + cooldown_interval);
            CooldownStatus::Ready
        }
    }
}
#[cfg(test)]
mod tests {
    use super::*;

    #[test]
    fn test_cooldown_map_resize() {
        let mut cooldown_map = CooldownMap::new(NonZeroUsize::new(2).unwrap());
        let cooldown_interval = Duration::from_secs(1);
        assert_eq!(
            cooldown_map.update("test_key1", cooldown_interval),
            CooldownStatus::Ready
        );
        assert_eq!(
            cooldown_map.update("test_key1", cooldown_interval),
            CooldownStatus::InCooldown
        );
        assert_eq!(
            cooldown_map.update("test_key2", cooldown_interval),
            CooldownStatus::Ready
        );
        assert_eq!(
            cooldown_map.update("test_key2", cooldown_interval),
            CooldownStatus::InCooldown
        );
        // Hitting the capacity, the map should grow transparently
        assert_eq!(
            cooldown_map.update("test_key3", cooldown_interval),
            CooldownStatus::Ready
        );
        assert_eq!(
            cooldown_map.update("test_key1", cooldown_interval),
            CooldownStatus::InCooldown
        );
        assert_eq!(
            cooldown_map.update("test_key2", cooldown_interval),
            CooldownStatus::InCooldown
        );
        assert_eq!(cooldown_map.0.cap(), NonZeroUsize::new(4).unwrap());
    }

    #[test]
    fn test_cooldown_map_expired() {
        let mut cooldown_map = CooldownMap::new(NonZeroUsize::new(2).unwrap());
        let cooldown_interval_short = Duration::from_millis(100);
        let cooldown_interval_long = Duration::from_secs(5);

        assert_eq!(
            cooldown_map.update("test_key_short", cooldown_interval_short),
            CooldownStatus::Ready
        );
        assert_eq!(
            cooldown_map.update("test_key_long", cooldown_interval_long),
            CooldownStatus::Ready
        );

        std::thread::sleep(cooldown_interval_short.mul_f32(1.1));
        assert_eq!(
            cooldown_map.update("test_key_short", cooldown_interval_short),
            CooldownStatus::Ready
        );
        assert_eq!(
            cooldown_map.update("test_key_long", cooldown_interval_long),
            CooldownStatus::InCooldown
        );
    }

    #[test]
    fn test_cooldown_map_eviction() {
        let mut cooldown_map = CooldownMap::new(NonZeroUsize::new(2).unwrap());
        let cooldown_interval_short = Duration::from_millis(100);
        let cooldown_interval_long = Duration::from_secs(5);

        assert_eq!(
            cooldown_map.update("test_key_short", cooldown_interval_short),
            CooldownStatus::Ready
        );
        assert_eq!(
            cooldown_map.update("test_key_long_1", cooldown_interval_long),
            CooldownStatus::Ready
        );

        // after the cooldown period `test_key_short` should be evicted when adding a new key
        std::thread::sleep(cooldown_interval_short.mul_f32(1.1));
        assert_eq!(cooldown_map.0.len(), 2);
        assert_eq!(
            cooldown_map.update("test_key_long_2", cooldown_interval_long),
            CooldownStatus::Ready
        );
        assert_eq!(cooldown_map.0.len(), 2);
    }
}


================================================
FILE: quickwit/quickwit-control-plane/src/debouncer.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::sync::{Arc, Mutex};
use std::time::Duration;

use quickwit_actors::{Actor, ActorContext, Handler};

/// A debouncer is a helper to debounce events.
///
/// The debouncing takes a `cooldown_period` parameter and works as you may expect:
///
///
///    time                t=0                   t=COOLDOWN            t=2*COOLDOWN
///                        |                          |                     |
///  ----------------------------------------------------------------------------------------------------
///    event               *     * *    *                                   *   * *
///    debounced effect    o                          o                     o
///
/// In particular, note the event triggered at `t=COOLDOWN`.
#[derive(Clone)]
pub struct Debouncer {
    cooldown_period: Duration,
    cooldown_state: Arc<Mutex<DebouncerState>>,
}

#[derive(Clone, Copy, Debug, PartialEq)]
enum DebouncerState {
    /// More than `cooldown_period` has elapsed since we last emitted an event.
    NoCooldown,
    // Less than `cooldown_period` has elapsed since we last emitted an event,
    // and no event has been received since then.
    CooldownNotScheduled,
    // Less than `cooldown_period` has elapsed since we last emitted an event,
    // and we have already received an event during this cooldown period.
    CooldownScheduled,
}

impl DebouncerState {
    fn accept(self, transition: Transition) -> DebouncerState {
        use DebouncerState::*;
        use Transition::*;
        match (self, transition) {
            (NoCooldown, Emit) => CooldownNotScheduled,
            (NoCooldown, CooldownExpired) => unreachable!(),
            (CooldownNotScheduled, Emit) => CooldownScheduled,
            (CooldownNotScheduled, CooldownExpired) => NoCooldown,
            (CooldownScheduled, Emit) => CooldownScheduled,
            (CooldownScheduled, CooldownExpired) => NoCooldown,
        }
    }
}

enum Transition {
    CooldownExpired,
    Emit,
}

#[allow(dead_code)]
impl Debouncer {
    pub fn new(cooldown_period: Duration) -> Debouncer {
        Debouncer {
            cooldown_period,
            cooldown_state: Arc::new(Mutex::new(DebouncerState::NoCooldown)),
        }
    }

    /// Updates the state according to the transition, and returns the state before the transition.
    /// The entire transition is atomic.
    fn accept_transition(&self, transition: Transition) -> DebouncerState {
        let mut lock = self.cooldown_state.lock().unwrap();
        let previous_state = *lock;
        let new_state = previous_state.accept(transition);
        *lock = new_state;
        previous_state
    }

    fn emit_message<A, M>(&self, ctx: &ActorContext<A>)
    where
        A: Actor + Handler<M>,
        M: Default + std::fmt::Debug + Send + Sync + 'static,
    {
        let _ = ctx.mailbox().send_message_with_high_priority(M::default());
    }

    fn schedule_post_cooldown_callback<A, M>(&self, ctx: &ActorContext<A>)
    where
        A: Actor + Handler<M>,
        M: Default + std::fmt::Debug + Send + Sync + 'static,
    {
        let ctx_clone = ctx.clone();
        let self_clone = self.clone();
        let callback = move || {
            let previous_state = self_clone.accept_transition(Transition::CooldownExpired);
            if previous_state == DebouncerState::CooldownScheduled {
                self_clone.self_send_with_cooldown(&ctx_clone);
            }
        };
        ctx.spawn_ctx()
            .schedule_event(callback, self.cooldown_period);
    }

    pub fn self_send_with_cooldown<M>(&self, ctx: &ActorContext<impl Handler<M>>)
    where M: Default + std::fmt::Debug + Send + Sync + 'static {
        let cooldown_state = self.accept_transition(Transition::Emit);
        match cooldown_state {
            DebouncerState::NoCooldown => {
                self.emit_message(ctx);
                self.schedule_post_cooldown_callback(ctx);
            }
            DebouncerState::CooldownNotScheduled | DebouncerState::CooldownScheduled => {}
        }
    }
}

#[cfg(test)]
mod tests {
    use std::time::Duration;

    use async_trait::async_trait;
    use quickwit_actors::{Actor, ActorContext, ActorExitStatus, Handler, Universe};

    use crate::debouncer::Debouncer;

    struct DebouncingActor {
        count: usize,
        debouncer: Debouncer,
    }

    impl DebouncingActor {
        pub fn new(cooldown_duration: Duration) -> DebouncingActor {
            DebouncingActor {
                count: 0,
                debouncer: Debouncer::new(cooldown_duration),
            }
        }
    }

    #[derive(Debug, Default)]
    struct Increment;

    #[derive(Debug)]
    struct DebouncedIncrement;

    #[async_trait]
    impl Actor for DebouncingActor {
        type ObservableState = usize;

        fn observable_state(&self) -> Self::ObservableState {
            self.count
        }
    }

    #[async_trait]
    impl Handler<Increment> for DebouncingActor {
        type Reply = ();

        async fn handle(
            &mut self,
            _message: Increment,
            _ctx: &ActorContext<Self>,
        ) -> Result<Self::Reply, ActorExitStatus> {
            self.count += 1;
            Ok(())
        }
    }

    #[async_trait]
    impl Handler<DebouncedIncrement> for DebouncingActor {
        type Reply = ();

        async fn handle(
            &mut self,
            _message: DebouncedIncrement,
            ctx: &ActorContext<Self>,
        ) -> Result<Self::Reply, ActorExitStatus> {
            self.debouncer.self_send_with_cooldown::<Increment>(ctx);
            Ok(())
        }
    }

    #[tokio::test]
    async fn test_debouncer() {
        let universe = Universe::default();
        let cooldown_period = Duration::from_millis(1_000);
        let debouncer = DebouncingActor::new(cooldown_period);
        let (debouncer_mailbox, debouncer_handle) = universe.spawn_builder().spawn(debouncer);
        {
            let count = *debouncer_handle.process_pending_and_observe().await;
            assert_eq!(count, 0);
        }
        {
            let _ = debouncer_mailbox.ask(DebouncedIncrement).await;
            let count = *debouncer_handle.process_pending_and_observe().await;
            assert_eq!(count, 1);
        }
        for _ in 0..10 {
            let _ = debouncer_mailbox.ask(DebouncedIncrement).await;
            let count = *debouncer_handle.process_pending_and_observe().await;
            assert_eq!(count, 1);
        }
        {
            universe.sleep(cooldown_period.mul_f32(1.2f32)).await;
            let count = *debouncer_handle.process_pending_and_observe().await;
            assert_eq!(count, 2);
        }
        {
            let _ = debouncer_mailbox.ask(DebouncedIncrement).await;
            let count = *debouncer_handle.process_pending_and_observe().await;
            assert_eq!(count, 2);
        }
        {
            universe.sleep(cooldown_period * 2).await;
            let count = *debouncer_handle.process_pending_and_observe().await;
            assert_eq!(count, 3);
        }
        universe.assert_quit().await;
    }
}


================================================
FILE: quickwit/quickwit-control-plane/src/indexing_plan.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use fnv::FnvHashMap;
use quickwit_proto::indexing::IndexingTask;
use serde::Serialize;

/// A [`PhysicalIndexingPlan`] defines the list of indexing tasks
/// each indexer, identified by its node ID, should run.
/// TODO(fmassot): a metastore version number will be attached to the plan
/// to identify if the plan is up to date with the metastore.
#[derive(Debug, PartialEq, Clone, Serialize)]
pub struct PhysicalIndexingPlan {
    indexing_tasks_per_indexer_id: FnvHashMap<String, Vec<IndexingTask>>,
}

impl PhysicalIndexingPlan {
    pub fn with_indexer_ids(indexer_ids: &[String]) -> PhysicalIndexingPlan {
        PhysicalIndexingPlan {
            indexing_tasks_per_indexer_id: indexer_ids
                .iter()
                .map(|indexer_id| (indexer_id.clone(), Vec::new()))
                .collect(),
        }
    }

    pub fn add_indexing_task(&mut self, indexer_id: &str, indexing_task: IndexingTask) {
        self.indexing_tasks_per_indexer_id
            .entry(indexer_id.to_string())
            .or_default()
            .push(indexing_task);
    }

    /// Returns the hashmap of (indexer ID, indexing tasks).
    pub fn indexing_tasks_per_indexer(&self) -> &FnvHashMap<String, Vec<IndexingTask>> {
        &self.indexing_tasks_per_indexer_id
    }

    pub fn num_indexers(&self) -> usize {
        self.indexing_tasks_per_indexer_id.len()
    }

    /// Returns the hashmap of (indexer ID, indexing tasks).
    pub fn indexing_tasks_per_indexer_mut(&mut self) -> &mut FnvHashMap<String, Vec<IndexingTask>> {
        &mut self.indexing_tasks_per_indexer_id
    }

    /// Returns the hashmap of (indexer ID, indexing tasks).
    pub fn indexer(&self, indexer_id: &str) -> Option<&[IndexingTask]> {
        self.indexing_tasks_per_indexer_id
            .get(indexer_id)
            .map(Vec::as_slice)
    }

    pub fn normalize(&mut self) {
        for tasks in self.indexing_tasks_per_indexer_id.values_mut() {
            for task in tasks.iter_mut() {
                task.shard_ids.sort_unstable();
            }
            tasks.sort_unstable_by(|left, right| {
                left.index_uid
                    .cmp(&right.index_uid)
                    .then_with(|| left.source_id.cmp(&right.source_id))
                    .then_with(|| left.shard_ids.first().cmp(&right.shard_ids.first()))
                    .then_with(|| left.pipeline_uid.cmp(&right.pipeline_uid))
            });
        }
    }
}


================================================
FILE: quickwit/quickwit-control-plane/src/indexing_scheduler/change_tracker.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::sync::Arc;

use tokio::sync::watch;

/// This object makes it possible to track for the completion of the next rebuild.
pub struct RebuildNotifier {
    generation_processed_tx: watch::Sender<usize>,
    generation_processed_rx: watch::Receiver<usize>,
    generation: usize,
}

impl Default for RebuildNotifier {
    fn default() -> Self {
        let (generation_processed_tx, generation_processed_rx) = watch::channel(0);

        Self {
            generation_processed_tx,
            generation_processed_rx,
            generation: 1,
        }
    }
}

impl RebuildNotifier {
    /// Returns a future that resolves when the next rebuild is completed.
    ///
    /// If an ongoing build T exists, it will not resolve upon build T's completion.
    /// It will only be resolved upon build T+1's completion, or any subsequent build.
    pub fn next_rebuild_waiter(&mut self) -> impl std::future::Future<Output = ()> + use<> {
        let mut generation_processed_rx = self.generation_processed_rx.clone();
        let current_generation = self.generation;
        async move {
            loop {
                if *generation_processed_rx.borrow() >= current_generation {
                    return;
                }
                if generation_processed_rx.changed().await.is_err() {
                    return;
                }
            }
        }
    }

    /// Starts a new rebuild.
    pub fn start_rebuild(&mut self) -> Arc<NotifyChangeOnDrop> {
        let generation = self.generation;
        self.generation += 1;
        Arc::new(NotifyChangeOnDrop {
            generation,
            generation_processed_tx: self.generation_processed_tx.clone(),
        })
    }
}

pub struct NotifyChangeOnDrop {
    generation: usize,
    generation_processed_tx: watch::Sender<usize>,
}

impl Drop for NotifyChangeOnDrop {
    fn drop(&mut self) {
        if self.generation < *self.generation_processed_tx.borrow() {
            return;
        }
        let _ = self.generation_processed_tx.send(self.generation);
    }
}

#[cfg(test)]
mod tests {
    use std::time::Duration;

    use super::*;

    #[tokio::test]
    async fn test_change_tracker() {
        let mut change_tracker = RebuildNotifier::default();
        let waiter = change_tracker.next_rebuild_waiter();
        let change_notifier = change_tracker.start_rebuild();
        drop(change_notifier);
        waiter.await;
    }

    #[tokio::test]
    async fn test_change_tracker_ongoing_is_not_good() {
        let mut change_tracker = RebuildNotifier::default();
        let change_notifier = change_tracker.start_rebuild();
        let waiter = change_tracker.next_rebuild_waiter();
        let waiter2 = change_tracker.next_rebuild_waiter();
        drop(change_notifier);
        let change_notifier2 = change_tracker.start_rebuild();
        let timeout_res = tokio::time::timeout(Duration::from_millis(100), waiter).await;
        assert!(timeout_res.is_err());
        drop(change_notifier2);
        waiter2.await;
    }

    #[tokio::test]
    async fn test_change_tracker_all_waiters_are_notified() {
        let mut change_tracker = RebuildNotifier::default();
        let waiter = change_tracker.next_rebuild_waiter();
        let waiter2 = change_tracker.next_rebuild_waiter();
        let change_notifier = change_tracker.start_rebuild();
        drop(change_notifier);
        waiter.await;
        waiter2.await;
    }
}


================================================
FILE: quickwit/quickwit-control-plane/src/indexing_scheduler/mod.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

mod change_tracker;
mod scheduling;

use std::cmp::Ordering;
use std::fmt;
use std::num::NonZeroU32;
use std::sync::{Arc, OnceLock};
use std::time::{Duration, Instant};

use fnv::{FnvHashMap, FnvHashSet};
use itertools::Itertools;
use once_cell::sync::OnceCell;
use quickwit_common::pretty::PrettySample;
use quickwit_config::{FileSourceParams, SourceParams, indexing_pipeline_params_fingerprint};
use quickwit_proto::indexing::{
    ApplyIndexingPlanRequest, CpuCapacity, IndexingService, IndexingTask, PIPELINE_FULL_CAPACITY,
    PIPELINE_THROUGHPUT,
};
use quickwit_proto::types::NodeId;
use scheduling::{SourceToSchedule, SourceToScheduleType};
use serde::Serialize;
use tracing::{debug, info, warn};

use crate::indexing_plan::PhysicalIndexingPlan;
use crate::indexing_scheduler::change_tracker::{NotifyChangeOnDrop, RebuildNotifier};
use crate::indexing_scheduler::scheduling::build_physical_indexing_plan;
use crate::metrics::ShardLocalityMetrics;
use crate::model::{ControlPlaneModel, ShardEntry, ShardLocations};
use crate::{IndexerNodeInfo, IndexerPool};

const DEFAULT_ENABLE_VARIABLE_SHARD_LOAD: bool = false;

pub(crate) const MIN_DURATION_BETWEEN_SCHEDULING: Duration =
    if cfg!(any(test, feature = "testsuite")) {
        Duration::from_millis(50)
    } else {
        Duration::from_secs(30)
    };

#[derive(Debug, Clone, Default, Serialize)]
pub struct IndexingSchedulerState {
    pub num_applied_physical_indexing_plan: usize,
    pub num_schedule_indexing_plan: usize,
    pub last_applied_physical_plan: Option<PhysicalIndexingPlan>,
    #[serde(skip)]
    pub last_applied_plan_timestamp: Option<Instant>,
}

/// The [`IndexingScheduler`] is responsible for listing indexing tasks and assigning them to
/// indexers.
/// We call this duty `scheduling`. Contrary to what the name suggests, most indexing tasks are
/// ever running. We just borrowed the terminology to Kubernetes.
///
/// Scheduling executes the following steps:
/// 1. Builds a [`PhysicalIndexingPlan`] from the list of logical indexing tasks. See
///    [`build_physical_indexing_plan`] for the implementation details.
/// 2. Apply the [`PhysicalIndexingPlan`]: for each indexer, the scheduler send the indexing tasks
///    by gRPC. An indexer immediately returns an Ok and apply asynchronously the received plan. Any
///    errors (network) happening in this step are ignored. The scheduler runs a control loop that
///    regularly checks if indexers are effectively running their plans (more details in the next
///    section).
///
/// All events altering the list of indexes and sources are proxied through
/// through the control plane. The control plane model is therefore guaranteed to be up-to-date
/// (at the cost of making the control plane a single point of failure).
///
/// Each change to the model triggers the production of a new `PhysicalIndexingPlan`.
///
/// A `ControlPlanLoop` event is scheduled every `CONTROL_PLAN_LOOP_INTERVAL` and steers
/// the cluster toward the last applied [`PhysicalIndexingPlan`].
///
/// This physical plan is a desired state. Even after that state is reached, it can be altered due
/// to faulty server for instance.
///
/// We then need to detect deviation, possibly recompute the desired `PhysicalIndexingPlan`
/// and steer back the cluster to the right state.
///
/// First to detect deviation, the control plan gathers an eventually consistent view of what is
/// running on the different nodes of the cluster: the `running plan`. This is done via `chitchat`.
///
/// If the list of node ids has changed, the scheduler will retrigger a scheduling.
/// If the indexing tasks do not match, the scheduler will apply again the last applied plan.
/// Concretely, it will send the faulty nodes of the plan they are supposed to follow.
//
/// Finally, in order to give the time for each indexer to run their indexing tasks, the control
/// plane will wait at least [`MIN_DURATION_BETWEEN_SCHEDULING`] before comparing the desired
/// plan with the running plan.
pub struct IndexingScheduler {
    cluster_id: String,
    self_node_id: NodeId,
    indexer_pool: IndexerPool,
    state: IndexingSchedulerState,
    pub(crate) next_rebuild_tracker: RebuildNotifier,
}

impl fmt::Debug for IndexingScheduler {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        f.debug_struct("IndexingScheduler")
            .field("cluster_id", &self.cluster_id)
            .field("node_id", &self.self_node_id)
            .field(
                "last_applied_plan_ts",
                &self.state.last_applied_plan_timestamp,
            )
            .finish()
    }
}

fn enable_variable_shard_load() -> bool {
    static IS_SHARD_LOAD_CP_ENABLED: OnceCell<bool> = OnceCell::new();
    *IS_SHARD_LOAD_CP_ENABLED.get_or_init(|| {
        if let Some(enable_flag) =
            quickwit_common::get_bool_from_env_opt("QW_ENABLE_VARIABLE_SHARD_LOAD")
        {
            return enable_flag;
        }
        // For backward compatibility, if QW_DISABLE_VARIABLE_SHARD_LOAD is set, we accept this
        // value too.
        if let Some(disable_flag) =
            quickwit_common::get_bool_from_env_opt("QW_DISABLE_VARIABLE_SHARD_LOAD")
        {
            warn!(
                disable = disable_flag,
                "QW_DISABLE_VARIABLE_SHARD_LOAD is deprecated. Please use \
                 QW_ENABLE_VARIABLE_SHARD_LOAD instead. We will use your setting in this version, \
                 but will likely ignore it in future versions."
            );
            return !disable_flag;
        }
        // Defaulting to false
        info!(
            "QW_ENABLE_VARIABLE_SHARD_LOAD not set, defaulting to {}",
            DEFAULT_ENABLE_VARIABLE_SHARD_LOAD
        );
        DEFAULT_ENABLE_VARIABLE_SHARD_LOAD
    })
}

/// Computes the CPU load associated to a single shard of a given index.
///
/// The array passed contains all of data we have about the shard of the index.
/// This function averages their statistics.
///
/// For the moment, this function only takes in account the measured throughput,
/// and assumes a constant CPU usage of 4 vCPU = 20mb/s.
///
/// It does not take in account the variation that could raise from the different
/// doc mapping / nature of the data, etc.
fn compute_load_per_shard(shard_entries: &[&ShardEntry]) -> NonZeroU32 {
    if enable_variable_shard_load() {
        let num_shards = shard_entries.len().max(1) as u64;
        let average_throughput_per_shard_bytes: u64 = shard_entries
            .iter()
            .map(|shard_entry| shard_entry.long_term_ingestion_rate.0 as u64 * bytesize::MIB)
            .sum::<u64>()
            .div_ceil(num_shards)
            // A shard throughput cannot exceed PIPELINE_THROUGHPUT in the long term (this is
            // enforced by the configuration).
            .min(PIPELINE_THROUGHPUT.as_u64());
        let num_cpu_millis = (PIPELINE_FULL_CAPACITY.cpu_millis() as u64
            * average_throughput_per_shard_bytes)
            / PIPELINE_THROUGHPUT.as_u64();
        const MIN_CPU_LOAD_PER_SHARD: u32 = 50u32;
        NonZeroU32::new((num_cpu_millis as u32).max(MIN_CPU_LOAD_PER_SHARD)).unwrap()
    } else {
        get_default_load_per_shard()
    }
}

fn get_default_load_per_shard() -> NonZeroU32 {
    static DEFAULT_LOAD_PER_SHARD: OnceLock<NonZeroU32> = OnceLock::new();
    *DEFAULT_LOAD_PER_SHARD.get_or_init(|| {
        let default_load_per_shard = quickwit_common::get_from_env(
            "QW_DEFAULT_LOAD_PER_SHARD",
            PIPELINE_FULL_CAPACITY.cpu_millis() / 4,
            false,
        );
        NonZeroU32::new(default_load_per_shard).unwrap()
    })
}

fn get_sources_to_schedule(model: &ControlPlaneModel) -> Vec<SourceToSchedule> {
    let mut sources = Vec::new();

    for (source_uid, source_config) in model.source_configs() {
        if !source_config.enabled {
            continue;
        }
        let params_fingerprint = model
            .index_metadata(&source_uid.index_uid)
            .map(|index_meta| {
                indexing_pipeline_params_fingerprint(&index_meta.index_config, source_config)
            })
            .unwrap_or_default();
        match source_config.source_params {
            SourceParams::File(FileSourceParams::Filepath(_))
            | SourceParams::IngestCli
            | SourceParams::Stdin
            | SourceParams::Void(_)
            | SourceParams::Vec(_) => { // We don't need to schedule those.
            }

            SourceParams::IngestApi => {
                // TODO ingest v1 is scheduled differently
                sources.push(SourceToSchedule {
                    source_uid,
                    source_type: SourceToScheduleType::IngestV1,
                    params_fingerprint,
                });
            }
            SourceParams::Ingest => {
                // Expect: the source should exist since we just read it from `get_source_configs`.
                // Note that we keep all shards, including Closed shards:
                // A closed shards still needs to be indexed.
                let shard_entries: Vec<&ShardEntry> = model
                    .get_shards_for_source(&source_uid)
                    .expect("source should exist")
                    .values()
                    .collect();
                if shard_entries.is_empty() {
                    continue;
                }
                let shard_ids = shard_entries
                    .iter()
                    .map(|shard_entry| shard_entry.shard_id().clone())
                    .collect();
                let load_per_shard = compute_load_per_shard(&shard_entries[..]);
                sources.push(SourceToSchedule {
                    source_uid,
                    source_type: SourceToScheduleType::Sharded {
                        shard_ids,
                        load_per_shard,
                    },
                    params_fingerprint,
                });
            }
            SourceParams::Kafka(_)
            | SourceParams::Kinesis(_)
            | SourceParams::PubSub(_)
            | SourceParams::Pulsar(_)
            | SourceParams::File(FileSourceParams::Notifications(_)) => {
                sources.push(SourceToSchedule {
                    source_uid,
                    source_type: SourceToScheduleType::NonSharded {
                        num_pipelines: source_config.num_pipelines.get() as u32,
                        // FIXME
                        load_per_pipeline: NonZeroU32::new(PIPELINE_FULL_CAPACITY.cpu_millis())
                            .unwrap(),
                    },
                    params_fingerprint,
                });
            }
        }
    }
    sources
}

impl IndexingScheduler {
    pub fn new(cluster_id: String, self_node_id: NodeId, indexer_pool: IndexerPool) -> Self {
        IndexingScheduler {
            cluster_id,
            self_node_id,
            indexer_pool,
            state: IndexingSchedulerState::default(),
            next_rebuild_tracker: RebuildNotifier::default(),
        }
    }

    pub fn observable_state(&self) -> IndexingSchedulerState {
        self.state.clone()
    }

    // Should be called whenever a change in the list of index/shard
    // has happened.
    //
    // Prefer not calling this method directly, and instead call
    // `ControlPlane::rebuild_indexing_plan_debounced`.
    pub(crate) fn rebuild_plan(&mut self, model: &ControlPlaneModel) {
        crate::metrics::CONTROL_PLANE_METRICS.schedule_total.inc();

        let notify_on_drop = self.next_rebuild_tracker.start_rebuild();

        let sources = get_sources_to_schedule(model);

        let indexers: Vec<IndexerNodeInfo> = self.get_indexers_from_indexer_pool();

        let indexer_id_to_cpu_capacities: FnvHashMap<String, CpuCapacity> = indexers
            .iter()
            .filter_map(|indexer| {
                if indexer.indexing_capacity.cpu_millis() > 0 {
                    Some((indexer.node_id.to_string(), indexer.indexing_capacity))
                } else {
                    None
                }
            })
            .collect();

        if indexer_id_to_cpu_capacities.is_empty() {
            if !sources.is_empty() {
                warn!("no indexing capacity available, cannot schedule an indexing plan");
            }
            return;
        };

        let shard_locations = model.shard_locations();
        let new_physical_plan = build_physical_indexing_plan(
            &sources,
            &indexer_id_to_cpu_capacities,
            self.state.last_applied_physical_plan.as_ref(),
            &shard_locations,
        );
        let shard_locality_metrics =
            get_shard_locality_metrics(&new_physical_plan, &shard_locations);
        crate::metrics::CONTROL_PLANE_METRICS.set_shard_locality_metrics(shard_locality_metrics);
        if let Some(last_applied_plan) = &self.state.last_applied_physical_plan {
            let plans_diff = get_indexing_plans_diff(
                last_applied_plan.indexing_tasks_per_indexer(),
                new_physical_plan.indexing_tasks_per_indexer(),
            );
            // No need to apply the new plan as it is the same as the old one.
            if plans_diff.is_empty() {
                return;
            }
        }
        self.apply_physical_indexing_plan(&indexers, new_physical_plan, Some(notify_on_drop));
        self.state.num_schedule_indexing_plan += 1;
    }

    /// Checks if the last applied plan corresponds to the running indexing tasks present in the
    /// chitchat cluster state. If true, do nothing.
    /// - If node IDs differ, schedule a new indexing plan.
    /// - If indexing tasks differ, apply again the last plan.
    pub(crate) fn control_running_plan(&mut self, model: &ControlPlaneModel) {
        let last_applied_plan =
            if let Some(last_applied_plan) = &self.state.last_applied_physical_plan {
                last_applied_plan
            } else {
                // If there is no plan, the node is probably starting and the scheduler did not find
                // indexers yet. In this case, we want to schedule as soon as possible to find new
                // indexers.
                self.rebuild_plan(model);
                return;
            };
        if let Some(last_applied_plan_timestamp) = self.state.last_applied_plan_timestamp
            && Instant::now().duration_since(last_applied_plan_timestamp)
                < MIN_DURATION_BETWEEN_SCHEDULING
        {
            return;
        }
        let indexers: Vec<IndexerNodeInfo> = self.get_indexers_from_indexer_pool();
        let running_indexing_tasks_by_node_id: FnvHashMap<String, Vec<IndexingTask>> = indexers
            .iter()
            .map(|indexer| (indexer.node_id.to_string(), indexer.indexing_tasks.clone()))
            .collect();

        let indexing_plans_diff = get_indexing_plans_diff(
            &running_indexing_tasks_by_node_id,
            last_applied_plan.indexing_tasks_per_indexer(),
        );
        if !indexing_plans_diff.has_same_nodes() {
            info!(plans_diff=?indexing_plans_diff, "running plan and last applied plan node IDs differ: schedule an indexing plan");
            self.rebuild_plan(model);
        } else if !indexing_plans_diff.has_same_tasks() {
            // Some nodes may have not received their tasks, apply it again.
            info!(plans_diff=?indexing_plans_diff, "running tasks and last applied tasks differ: reapply last plan");
            self.apply_physical_indexing_plan(&indexers, last_applied_plan.clone(), None);
        }
    }

    fn get_indexers_from_indexer_pool(&self) -> Vec<IndexerNodeInfo> {
        self.indexer_pool.values()
    }

    fn apply_physical_indexing_plan(
        &mut self,
        indexers: &[IndexerNodeInfo],
        new_physical_plan: PhysicalIndexingPlan,
        notify_on_drop: Option<Arc<NotifyChangeOnDrop>>,
    ) {
        debug!(new_physical_plan=?new_physical_plan, "apply physical indexing plan");
        crate::metrics::CONTROL_PLANE_METRICS.apply_plan_total.inc();
        for (node_id, indexing_tasks) in new_physical_plan.indexing_tasks_per_indexer() {
            // We don't want to block on a slow indexer so we apply this change asynchronously
            // TODO not blocking is cool, but we need to make sure there is not accumulation
            // possible here.
            let notify_on_drop = notify_on_drop.clone();
            tokio::spawn({
                let indexer = indexers
                    .iter()
                    .find(|indexer| indexer.node_id == *node_id)
                    .expect("This should never happen as the plan was built from these indexers.")
                    .clone();
                let indexing_tasks = indexing_tasks.clone();
                async move {
                    if let Err(error) = indexer
                        .client
                        .clone()
                        .apply_indexing_plan(ApplyIndexingPlanRequest { indexing_tasks })
                        .await
                    {
                        warn!(
                            %error,
                            node_id=%indexer.node_id,
                            generation_id=indexer.generation_id,
                            "failed to apply indexing plan to indexer"
                        );
                    }
                    drop(notify_on_drop);
                }
            });
        }
        self.state.num_applied_physical_indexing_plan += 1;
        self.state.last_applied_plan_timestamp = Some(Instant::now());
        self.state.last_applied_physical_plan = Some(new_physical_plan);
    }
}

struct IndexingPlansDiff<'a> {
    pub missing_node_ids: FnvHashSet<&'a str>,
    pub unplanned_node_ids: FnvHashSet<&'a str>,
    pub missing_tasks_by_node_id: FnvHashMap<&'a str, Vec<&'a IndexingTask>>,
    pub unplanned_tasks_by_node_id: FnvHashMap<&'a str, Vec<&'a IndexingTask>>,
}

impl IndexingPlansDiff<'_> {
    pub fn has_same_nodes(&self) -> bool {
        self.missing_node_ids.is_empty() && self.unplanned_node_ids.is_empty()
    }

    pub fn has_same_tasks(&self) -> bool {
        self.missing_tasks_by_node_id
            .values()
            .map(Vec::len)
            .sum::<usize>()
            == 0
            && self
                .unplanned_tasks_by_node_id
                .values()
                .map(Vec::len)
                .sum::<usize>()
                == 0
    }

    pub fn is_empty(&self) -> bool {
        self.has_same_nodes() && self.has_same_tasks()
    }
}

fn get_shard_locality_metrics(
    physical_plan: &PhysicalIndexingPlan,
    shard_locations: &ShardLocations,
) -> ShardLocalityMetrics {
    let mut num_local_shards = 0;
    let mut num_remote_shards = 0;
    for (indexer, tasks) in physical_plan.indexing_tasks_per_indexer() {
        for task in tasks {
            for shard_id in &task.shard_ids {
                if shard_locations
                    .get_shard_locations(shard_id)
                    .iter()
                    .any(|node| node.as_str() == indexer)
                {
                    num_local_shards += 1;
                } else {
                    num_remote_shards += 1;
                }
            }
        }
    }
    ShardLocalityMetrics {
        num_remote_shards,
        num_local_shards,
    }
}

impl fmt::Debug for IndexingPlansDiff<'_> {
    fn fmt(&self, formatter: &mut std::fmt::Formatter) -> std::fmt::Result {
        if self.has_same_nodes() && self.has_same_tasks() {
            return write!(formatter, "EmptyIndexingPlansDiff");
        }
        write!(formatter, "IndexingPlansDiff(")?;
        let mut separator = "";
        if !self.missing_node_ids.is_empty() {
            write!(
                formatter,
                "missing_node_ids={:?}",
                PrettySample::new(&self.missing_node_ids, 10)
            )?;
            separator = ", "
        }
        if !self.unplanned_node_ids.is_empty() {
            write!(
                formatter,
                "{separator}unplanned_node_ids={:?}",
                PrettySample::new(&self.unplanned_node_ids, 10)
            )?;
            separator = ", "
        }
        if !self.missing_tasks_by_node_id.is_empty() {
            write!(formatter, "{separator}missing_tasks_by_node_id=",)?;
            format_indexing_task_map(formatter, &self.missing_tasks_by_node_id)?;
            separator = ", "
        }
        if !self.unplanned_tasks_by_node_id.is_empty() {
            write!(formatter, "{separator}unplanned_tasks_by_node_id=",)?;
            format_indexing_task_map(formatter, &self.unplanned_tasks_by_node_id)?;
        }
        write!(formatter, ")")
    }
}

fn format_indexing_task_map(
    formatter: &mut std::fmt::Formatter,
    indexing_tasks: &FnvHashMap<&str, Vec<&IndexingTask>>,
) -> std::fmt::Result {
    // we show at most 5 nodes, and aggregate the results for the other.
    // we show at most 10 indexes, but aggregate results after.
    // we always aggregate shard ids
    // we hide pipeline id and incarnation id, they are not very useful in most case, but take a
    // lot of place
    const MAX_NODE: usize = 5;
    const MAX_INDEXES: usize = 10;
    let mut index_displayed = 0;
    write!(formatter, "{{")?;
    let mut indexer_iter = indexing_tasks.iter().enumerate();
    for (i, (index_name, tasks)) in &mut indexer_iter {
        if i != 0 {
            write!(formatter, ", ")?;
        }
        if index_displayed != MAX_INDEXES - 1 {
            write!(formatter, "{index_name:?}: [")?;
            let mut tasks_iter = tasks.iter().enumerate();
            for (i, task) in &mut tasks_iter {
                if i != 0 {
                    write!(formatter, ", ")?;
                }
                write!(
                    formatter,
                    r#"(index_id: "{}", source_id: "{}", shard_count: {})"#,
                    task.index_uid.as_ref().unwrap().index_id,
                    task.source_id,
                    task.shard_ids.len()
                )?;
                index_displayed += 1;
                if index_displayed == MAX_INDEXES - 1 {
                    let (task_count, shard_count) = tasks_iter.fold((0, 0), |(t, s), (_, task)| {
                        (t + 1, s + task.shard_ids.len())
                    });
                    if task_count > 0 {
                        write!(
                            formatter,
                            " and {task_count} tasks and {shard_count} shards"
                        )?;
                    }
                    break;
                }
            }
            write!(formatter, "]")?;
        } else {
            write!(
                formatter,
                "{index_name:?}: [with {} tasks and {} shards]",
                tasks.len(),
                tasks.iter().map(|task| task.shard_ids.len()).sum::<usize>()
            )?;
        }
        if i == MAX_NODE - 1 {
            break;
        }
    }
    let (indexer, tasks, shards) = indexer_iter.fold((0, 0, 0), |(i, t, s), (_, (_, task))| {
        (
            i + 1,
            t + task.len(),
            s + task.iter().map(|task| task.shard_ids.len()).sum::<usize>(),
        )
    });
    if indexer > 0 {
        write!(
            formatter,
            " and {indexer} more indexers, handling {tasks} tasks and {shards} shards}}"
        )
    } else {
        write!(formatter, "}}")
    }
}

/// Returns the difference between the `running_plan` retrieved from the chitchat state and
/// the last plan applied by the scheduler.
fn get_indexing_plans_diff<'a>(
    running_plan: &'a FnvHashMap<String, Vec<IndexingTask>>,
    last_applied_plan: &'a FnvHashMap<String, Vec<IndexingTask>>,
) -> IndexingPlansDiff<'a> {
    // Nodes diff.
    let running_node_ids: FnvHashSet<&str> = running_plan
        .keys()
        .map(|node_id| node_id.as_str())
        .collect();
    let planned_node_ids: FnvHashSet<&str> = last_applied_plan
        .keys()
        .map(|node_id| node_id.as_str())
        .collect();
    let missing_node_ids: FnvHashSet<&str> = planned_node_ids
        .difference(&running_node_ids)
        .copied()
        .collect();
    let unplanned_node_ids: FnvHashSet<&str> = running_node_ids
        .difference(&planned_node_ids)
        .copied()
        .collect();
    // Tasks diff.
    let mut missing_tasks_by_node_id: FnvHashMap<&str, Vec<&IndexingTask>> = FnvHashMap::default();
    let mut unplanned_tasks_by_node_id: FnvHashMap<&str, Vec<&IndexingTask>> =
        FnvHashMap::default();
    for node_id in running_node_ids.iter().chain(planned_node_ids.iter()) {
        let running_tasks = running_plan
            .get(*node_id)
            .map(Vec::as_slice)
            .unwrap_or_else(|| &[]);
        let last_applied_tasks = last_applied_plan
            .get(*node_id)
            .map(Vec::as_slice)
            .unwrap_or_else(|| &[]);
        let (missing_tasks, unplanned_tasks) =
            get_indexing_tasks_diff(running_tasks, last_applied_tasks);
        missing_tasks_by_node_id.insert(*node_id, missing_tasks);
        unplanned_tasks_by_node_id.insert(*node_id, unplanned_tasks);
    }
    IndexingPlansDiff {
        missing_node_ids,
        unplanned_node_ids,
        missing_tasks_by_node_id,
        unplanned_tasks_by_node_id,
    }
}

/// Computes the difference between `running_tasks` and `last_applied_tasks` and returns a tuple
/// of `missing_tasks` and `unplanned_tasks`.
/// Note: we need to handle duplicate tasks in each array, so we count them and make the diff.
fn get_indexing_tasks_diff<'a>(
    running_tasks: &'a [IndexingTask],
    last_applied_tasks: &'a [IndexingTask],
) -> (Vec<&'a IndexingTask>, Vec<&'a IndexingTask>) {
    let mut missing_tasks: Vec<&IndexingTask> = Vec::new();
    let mut unplanned_tasks: Vec<&IndexingTask> = Vec::new();
    let grouped_running_tasks: FnvHashMap<&IndexingTask, usize> = running_tasks
        .iter()
        .chunk_by(|&task| task)
        .into_iter()
        .map(|(key, group)| (key, group.count()))
        .collect();
    let grouped_last_applied_tasks: FnvHashMap<&IndexingTask, usize> = last_applied_tasks
        .iter()
        .chunk_by(|&task| task)
        .into_iter()
        .map(|(key, group)| (key, group.count()))
        .collect();
    let all_tasks: FnvHashSet<&IndexingTask> =
        FnvHashSet::from_iter(running_tasks.iter().chain(last_applied_tasks.iter()));
    for task in all_tasks {
        let running_task_count = grouped_running_tasks.get(task).unwrap_or(&0);
        let desired_task_count = grouped_last_applied_tasks.get(task).unwrap_or(&0);
        match running_task_count.cmp(desired_task_count) {
            Ordering::Greater => {
                unplanned_tasks
                    .extend_from_slice(&vec![task; running_task_count - desired_task_count]);
            }
            Ordering::Less => {
                missing_tasks
                    .extend_from_slice(&vec![task; desired_task_count - running_task_count])
            }
            _ => {}
        }
    }

    (missing_tasks, unplanned_tasks)
}

#[cfg(test)]
mod tests {
    use std::num::NonZeroUsize;
    use std::str::FromStr;

    use proptest::{prop_compose, proptest};
    use quickwit_config::{IndexConfig, KafkaSourceParams, SourceConfig, SourceParams};
    use quickwit_metastore::IndexMetadata;
    use quickwit_proto::types::{IndexUid, PipelineUid, ShardId, SourceUid};

    use super::*;
    use crate::model::ShardLocations;
    #[test]
    fn test_indexing_plans_diff() {
        let index_uid = IndexUid::from_str("index-1:11111111111111111111111111").unwrap();
        let index_uid2 = IndexUid::from_str("index-2:11111111111111111111111111").unwrap();
        {
            let running_plan = FnvHashMap::default();
            let desired_plan = FnvHashMap::default();
            let indexing_plans_diff = get_indexing_plans_diff(&running_plan, &desired_plan);
            assert!(indexing_plans_diff.is_empty());
        }
        {
            let mut running_plan = FnvHashMap::default();
            let mut desired_plan = FnvHashMap::default();
            let task_1 = IndexingTask {
                pipeline_uid: Some(PipelineUid::for_test(10u128)),
                index_uid: Some(index_uid.clone()),
                source_id: "source-1".to_string(),
                shard_ids: Vec::new(),
                params_fingerprint: 0,
            };
            let task_1b = IndexingTask {
                pipeline_uid: Some(PipelineUid::for_test(11u128)),
                index_uid: Some(index_uid.clone()),
                source_id: "source-1".to_string(),
                shard_ids: Vec::new(),
                params_fingerprint: 0,
            };
            let task_2 = IndexingTask {
                pipeline_uid: Some(PipelineUid::for_test(20u128)),
                index_uid: Some(index_uid.clone()),
                source_id: "source-2".to_string(),
                shard_ids: Vec::new(),
                params_fingerprint: 0,
            };
            running_plan.insert(
                "indexer-1".to_string(),
                vec![task_1.clone(), task_1b.clone(), task_2.clone()],
            );
            desired_plan.insert(
                "indexer-1".to_string(),
                vec![task_2, task_1.clone(), task_1b.clone()],
            );
            let indexing_plans_diff = get_indexing_plans_diff(&running_plan, &desired_plan);
            assert!(indexing_plans_diff.is_empty());
        }
        {
            let mut running_plan = FnvHashMap::default();
            let mut desired_plan = FnvHashMap::default();
            let task_1 = IndexingTask {
                pipeline_uid: Some(PipelineUid::for_test(1u128)),
                index_uid: Some(index_uid.clone()),
                source_id: "source-1".to_string(),
                shard_ids: Vec::new(),
                params_fingerprint: 0,
            };
            let task_2 = IndexingTask {
                pipeline_uid: Some(PipelineUid::for_test(2u128)),
                index_uid: Some(index_uid.clone()),
                source_id: "source-2".to_string(),
                shard_ids: Vec::new(),
                params_fingerprint: 0,
            };
            running_plan.insert("indexer-1".to_string(), vec![task_1.clone()]);
            desired_plan.insert("indexer-1".to_string(), vec![task_2.clone()]);

            let indexing_plans_diff = get_indexing_plans_diff(&running_plan, &desired_plan);
            assert!(!indexing_plans_diff.is_empty());
            assert!(indexing_plans_diff.has_same_nodes());
            assert!(!indexing_plans_diff.has_same_tasks());
            assert_eq!(
                indexing_plans_diff.unplanned_tasks_by_node_id,
                FnvHashMap::from_iter([("indexer-1", vec![&task_1])])
            );
            assert_eq!(
                indexing_plans_diff.missing_tasks_by_node_id,
                FnvHashMap::from_iter([("indexer-1", vec![&task_2])])
            );
        }
        {
            // Task assigned to indexer-1 in desired plan but another one running.
            let mut running_plan = FnvHashMap::default();
            let mut desired_plan = FnvHashMap::default();
            let task_1 = IndexingTask {
                pipeline_uid: Some(PipelineUid::for_test(1u128)),
                index_uid: Some(index_uid.clone()),
                source_id: "source-1".to_string(),
                shard_ids: Vec::new(),
                params_fingerprint: 0,
            };
            let task_2 = IndexingTask {
                pipeline_uid: Some(PipelineUid::for_test(2u128)),
                index_uid: Some(index_uid2.clone()),
                source_id: "source-2".to_string(),
                shard_ids: Vec::new(),
                params_fingerprint: 0,
            };
            running_plan.insert("indexer-2".to_string(), vec![task_2.clone()]);
            desired_plan.insert("indexer-1".to_string(), vec![task_1.clone()]);

            let indexing_plans_diff = get_indexing_plans_diff(&running_plan, &desired_plan);
            assert!(!indexing_plans_diff.is_empty());
            assert!(!indexing_plans_diff.has_same_nodes());
            assert!(!indexing_plans_diff.has_same_tasks());
            assert_eq!(
                indexing_plans_diff.missing_node_ids,
                FnvHashSet::from_iter(["indexer-1"])
            );
            assert_eq!(
                indexing_plans_diff.unplanned_node_ids,
                FnvHashSet::from_iter(["indexer-2"])
            );
            assert_eq!(
                indexing_plans_diff.missing_tasks_by_node_id,
                FnvHashMap::from_iter([("indexer-1", vec![&task_1]), ("indexer-2", Vec::new())])
            );
            assert_eq!(
                indexing_plans_diff.unplanned_tasks_by_node_id,
                FnvHashMap::from_iter([("indexer-2", vec![&task_2]), ("indexer-1", Vec::new())])
            );
        }
        {
            // Diff with 3 same tasks running but only one on the desired plan.
            let mut running_plan = FnvHashMap::default();
            let mut desired_plan = FnvHashMap::default();
            let task_1a = IndexingTask {
                pipeline_uid: Some(PipelineUid::for_test(10u128)),
                index_uid: Some(index_uid.clone()),
                source_id: "source-1".to_string(),
                shard_ids: Vec::new(),
                params_fingerprint: 0,
            };
            let task_1b = IndexingTask {
                pipeline_uid: Some(PipelineUid::for_test(11u128)),
                index_uid: Some(index_uid.clone()),
                source_id: "source-1".to_string(),
                shard_ids: Vec::new(),
                params_fingerprint: 0,
            };
            let task_1c = IndexingTask {
                pipeline_uid: Some(PipelineUid::for_test(12u128)),
                index_uid: Some(index_uid.clone()),
                source_id: "source-1".to_string(),
                shard_ids: Vec::new(),
                params_fingerprint: 0,
            };
            running_plan.insert("indexer-1".to_string(), vec![task_1a.clone()]);
            desired_plan.insert(
                "indexer-1".to_string(),
                vec![task_1a.clone(), task_1b.clone(), task_1c.clone()],
            );

            let indexing_plans_diff = get_indexing_plans_diff(&running_plan, &desired_plan);
            assert!(!indexing_plans_diff.is_empty());
            assert!(indexing_plans_diff.has_same_nodes());
            assert!(!indexing_plans_diff.has_same_tasks());
            assert_eq!(
                indexing_plans_diff.missing_tasks_by_node_id,
                FnvHashMap::from_iter([("indexer-1", vec![&task_1b, &task_1c])])
            );
        }
    }

    #[test]
    fn test_get_sources_to_schedule() {
        let mut model = ControlPlaneModel::default();
        let kafka_source_params = KafkaSourceParams {
            topic: "kafka-topic".to_string(),
            client_log_level: None,
            client_params: serde_json::json!({}),
            enable_backfill_mode: false,
        };
        let index_metadata = IndexMetadata::for_test("test-index", "ram:///test-index");
        let index_uid = index_metadata.index_uid.clone();
        model.add_index(index_metadata);
        model
            .add_source(
                &index_uid,
                SourceConfig {
                    source_id: "source_disabled".to_string(),
                    num_pipelines: NonZeroUsize::new(3).unwrap(),
                    enabled: false,
                    source_params: SourceParams::Kafka(kafka_source_params.clone()),
                    transform_config: None,
                    input_format: Default::default(),
                },
            )
            .unwrap();
        model
            .add_source(
                &index_uid,
                SourceConfig {
                    source_id: "source_enabled".to_string(),
                    num_pipelines: NonZeroUsize::new(2).unwrap(),
                    enabled: true,
                    source_params: SourceParams::Kafka(kafka_source_params.clone()),
                    transform_config: None,
                    input_format: Default::default(),
                },
            )
            .unwrap();
        model
            .add_source(
                &index_uid,
                SourceConfig {
                    source_id: "ingest_v1".to_string(),
                    num_pipelines: NonZeroUsize::new(2).unwrap(),
                    enabled: true,
                    // ingest v1
                    source_params: SourceParams::IngestApi,
                    transform_config: None,
                    input_format: Default::default(),
                },
            )
            .unwrap();
        model
            .add_source(
                &index_uid,
                SourceConfig {
                    source_id: "ingest_v2".to_string(),
                    num_pipelines: NonZeroUsize::new(2).unwrap(),
                    enabled: true,
                    // ingest v2
                    source_params: SourceParams::Ingest,
                    transform_config: None,
                    input_format: Default::default(),
                },
            )
            .unwrap();
        // ingest v2 without any open shard is skipped.
        model
            .add_source(
                &index_uid,
                SourceConfig {
                    source_id: "ingest_v2_without_shard".to_string(),
                    num_pipelines: NonZeroUsize::new(2).unwrap(),
                    enabled: true,
                    // ingest v2
                    source_params: SourceParams::Ingest,
                    transform_config: None,
                    input_format: Default::default(),
                },
            )
            .unwrap();
        model
            .add_source(
                &index_uid,
                SourceConfig {
                    source_id: "ingest_cli".to_string(),
                    num_pipelines: NonZeroUsize::new(2).unwrap(),
                    enabled: true,
                    // ingest v1
                    source_params: SourceParams::IngestCli,
                    transform_config: None,
                    input_format: Default::default(),
                },
            )
            .unwrap();
        let shard = Shard {
            index_uid: Some(index_uid.clone()),
            source_id: "ingest_v2".to_string(),
            shard_id: Some(ShardId::from(17)),
            shard_state: ShardState::Open as i32,
            ..Default::default()
        };
        model.insert_shards(&index_uid, &"ingest_v2".to_string(), vec![shard]);
        let shards: Vec<SourceToSchedule> = get_sources_to_schedule(&model);
        assert_eq!(shards.len(), 3);
    }

    #[test]
    fn test_build_physical_indexing_plan_simple() {
        let source_1 = SourceUid {
            index_uid: IndexUid::for_test("index-1", 0),
            source_id: "source1".to_string(),
        };
        let source_2 = SourceUid {
            index_uid: IndexUid::for_test("index-2", 0),
            source_id: "source2".to_string(),
        };
        let sources = [
            SourceToSchedule {
                source_uid: source_1.clone(),
                source_type: SourceToScheduleType::NonSharded {
                    num_pipelines: 3,
                    load_per_pipeline: NonZeroU32::new(1_000).unwrap(),
                },
                params_fingerprint: 0,
            },
            SourceToSchedule {
                source_uid: source_2.clone(),
                source_type: SourceToScheduleType::NonSharded {
                    num_pipelines: 2,
                    load_per_pipeline: NonZeroU32::new(1_000).unwrap(),
                },
                params_fingerprint: 0,
            },
        ];
        let mut indexer_max_loads = FnvHashMap::default();
        indexer_max_loads.insert("indexer1".to_string(), mcpu(3_000));
        indexer_max_loads.insert("indexer2".to_string(), mcpu(3_000));
        let shard_locations = ShardLocations::default();
        let physical_plan =
            build_physical_indexing_plan(&sources[..], &indexer_max_loads, None, &shard_locations);
        assert_eq!(physical_plan.indexing_tasks_per_indexer().len(), 2);
        let indexing_tasks_1 = physical_plan.indexer("indexer1").unwrap();
        assert_eq!(indexing_tasks_1.len(), 2);
        let indexer_2_tasks = physical_plan.indexer("indexer2").unwrap();
        assert_eq!(indexer_2_tasks.len(), 3);
    }

    #[test]
    fn test_debug_indexing_task_map() {
        let mut map = FnvHashMap::default();
        let task1 = IndexingTask {
            index_uid: Some(IndexUid::for_test("index1", 123)),
            source_id: "my-source".to_string(),
            pipeline_uid: Some(PipelineUid::random()),
            shard_ids: vec!["shard1".into()],
            params_fingerprint: 0,
        };
        let task2 = IndexingTask {
            index_uid: Some(IndexUid::for_test("index2", 123)),
            source_id: "my-source".to_string(),
            pipeline_uid: Some(PipelineUid::random()),
            shard_ids: vec!["shard2".into(), "shard3".into()],
            params_fingerprint: 0,
        };
        let task3 = IndexingTask {
            index_uid: Some(IndexUid::for_test("index3", 123)),
            source_id: "my-source".to_string(),
            pipeline_uid: Some(PipelineUid::random()),
            shard_ids: vec!["shard6".into()],
            params_fingerprint: 0,
        };
        // order made to map with the debug for lisibility
        map.insert("indexer5", vec![&task2]);
        map.insert("indexer4", vec![&task1]);
        map.insert("indexer3", vec![&task1, &task3]);
        map.insert("indexer2", vec![&task2, &task3, &task1, &task2]);
        map.insert("indexer1", vec![&task1, &task2, &task3, &task1]);
        map.insert("indexer6", vec![&task1, &task2, &task3]);
        let plan = IndexingPlansDiff {
            missing_node_ids: FnvHashSet::default(),
            unplanned_node_ids: FnvHashSet::default(),
            missing_tasks_by_node_id: map,
            unplanned_tasks_by_node_id: FnvHashMap::default(),
        };

        let debug = format!("{plan:?}");
        assert_eq!(
            debug,
            r#"IndexingPlansDiff(missing_tasks_by_node_id={"indexer5": [(index_id: "index2", source_id: "my-source", shard_count: 2)], "indexer4": [(index_id: "index1", source_id: "my-source", shard_count: 1)], "indexer3": [(index_id: "index1", source_id: "my-source", shard_count: 1), (index_id: "index3", source_id: "my-source", shard_count: 1)], "indexer2": [(index_id: "index2", source_id: "my-source", shard_count: 2), (index_id: "index3", source_id: "my-source", shard_count: 1), (index_id: "index1", source_id: "my-source", shard_count: 1), (index_id: "index2", source_id: "my-source", shard_count: 2)], "indexer1": [(index_id: "index1", source_id: "my-source", shard_count: 1) and 3 tasks and 4 shards] and 1 more indexers, handling 3 tasks and 4 shards})"#
        );
    }

    proptest! {
        #[test]
        fn test_building_indexing_tasks_and_physical_plan(num_indexers in 1usize..50usize, index_id_sources in proptest::collection::vec(gen_kafka_source(), 1..20)) {
            let index_uids: fnv::FnvHashSet<IndexUid> =
                index_id_sources.iter()
                    .map(|(index_uid, _)| index_uid.clone())
                    .collect();
            let mut model = ControlPlaneModel::default();
            for index_uid in index_uids {
                let index_config = IndexConfig::for_test(&index_uid.index_id, &format!("ram://test/{index_uid}"));
                model.add_index(IndexMetadata::new_with_index_uid(index_uid, index_config));
            }
            for (index_uid, source_config) in &index_id_sources {
                model.add_source(index_uid, source_config.clone()).unwrap();
            }

            let sources: Vec<SourceToSchedule> = get_sources_to_schedule(&model);
            let mut indexer_max_loads = FnvHashMap::default();
            for i in 0..num_indexers {
                let indexer_id = format!("indexer-{i}");
                indexer_max_loads.insert(indexer_id, mcpu(4_000));
            }
            let shard_locations = ShardLocations::default();
            let _physical_indexing_plan = build_physical_indexing_plan(&sources, &indexer_max_loads, None, &shard_locations);
        }
    }

    use quickwit_config::SourceInputFormat;
    use quickwit_proto::indexing::mcpu;
    use quickwit_proto::ingest::{Shard, ShardState};

    fn kafka_source_params_for_test() -> SourceParams {
        SourceParams::Kafka(KafkaSourceParams {
            topic: "topic".to_string(),
            client_log_level: None,
            client_params: serde_json::json!({
                "bootstrap.servers": "localhost:9092",
            }),
            enable_backfill_mode: true,
        })
    }

    prop_compose! {
      fn gen_kafka_source()
        (index_idx in 0usize..100usize, num_pipelines in 1usize..51usize) -> (IndexUid, SourceConfig) {
          let index_uid = IndexUid::for_test(&format!("index-id-{index_idx}"), 0 /* this is the index uid */);
          let source_id = quickwit_common::rand::append_random_suffix("kafka-source");
          (index_uid, SourceConfig {
              source_id,
              num_pipelines: NonZeroUsize::new(num_pipelines).unwrap(),
              enabled: true,
              source_params: kafka_source_params_for_test(),
              transform_config: None,
              input_format: SourceInputFormat::Json,
          })
      }
    }
}


================================================
FILE: quickwit/quickwit-control-plane/src/indexing_scheduler/scheduling/README.md
================================================
# Scheduling logic

Quickwit needs to assign indexing tasks to a set of indexers nodes.
We call the result of this decision the indexing physical plan.

We also want to observe some interesting properties such as:
- (A) we want to avoid moving indexing tasks from one indexer to another one needlessly.
- (B) we want a source to be spread amongst as few nodes as possible
- (C) we want to balance the load between nodes as soon as the load is significatively (>30%) higher than the average (target) load
- (D) when we are working with the Ingest API source, we prefer to colocate indexers on
  the ingesters holding the data.

# Problem abstraction

To simplify the logic and make it easier to test it, we first abstract this in the following
optimization problem. In Quickwit, we have two types of source:

- The push api source: they have a given (changing) set of shards associated to them.
  A shard is rate-limited to ensure their throughput is lower than `5MB/s` worth of
  uncompressed data. This guarantees that a given shard can be indexed by a
  single indexing pipeline.

- Other sources, like Kafka. It is a very common use case to use quickwit to index large
  amounts of historical data. Right now, the user is therefore expected to supply a desired
  number of pipeline.

Routers send their batch to the different ingesters they know using a round-robin logic.
We assume that routers's list of known shards gets eventually updated after a shard addition, so that
we can assume that shard have roughly the same load.

Indexers inform of observed load of all of their pipelines. 
This load is assumed unidimensional. This is imperfect of course: indexing consumes network, io, etc.
Still for the sake of simplification we pick one metric, measured as the amount of CPU spent
in the indexer. 

The control plane consolidates this figure to create a load_per_shard metric expressed in millicpu.

The hypothesis above allow us to see both kafka and ingest sources through the same lens, and stop 
making a distinction between shards.

In our scheduler, a source simply has:
- an identifier (a `u32`)
- a number of shard.
- a load per shard identified by a u32, expression thousandth of CPU.

And indexer has:
- a maximum total load (that we will need to measure or configure).

The problem is now greatly simplified.
A solution is a sparse matrix of `(num_indexers, num_sources)` that holds a number of shards to be indexed.
The different constraint and wanted properties can all be re-expressed. For instance:
- We want the dot product of the load per shard vector with each row, to be close to the average load of each node (C)
- We do not want a large distance between the two solution matrixes (A)
- We want that matrix as sparse as possible (B)

Note that the constraint (C) is enforced differently depending on the load:
- shards can be placed freely on nodes up to 30% of their capacity
- above this threshold, we try to assign shards to indexers so that the total load on each indexer is close to the average load

To express the affinity constraint (D) we could similarly define a matrix of `(num_indexers, num_sources)` with affinity scores and compute a distance with the solution matrix. 

The actual cost function we would craft is however not linear, it is the combination of multiple distances like those discribed above.

# The heuristic

We use the following heuristic.

While assigning shards to node, we try to ensure that workloads are balanced (except for very small cluster loads). This is achieved by calculating a virtual capacity for each indexer. We calculate 120% of the total load on the entire cluster then divide it up proportionally between indexers according to their capacity. By respecting this virtual capacity when assigning shards to indexers, we make sure that all indexers have a load close to the average load.

## Phase 1: Remove extraneous shards

Starting from the existing solution, we first reduce it to make sure we do not have too many shards assigned. This happens when a source was scaled down or deleted.
This is done by reducing the number of shard wherever needed, picking in priority nodes with few shards.

We call the resulting solution "reduced solution". The reduced solution is usually not a valid solution as some shard
may have been added. We will add these in Phase 3.

If we compute the distance to the previous solution, we want to use the "reduced solution" and not the actual
previous solution.

## Phase 2: Enforce nodes maximum load

We then remove entire sources from nodes where the load is higher than the capcity (load <30%) or virtual capacity (load >30%).
For every given node, we remove in priority sources that have an overall small load on the node.

Matrix-wise, note that phase 1 and phase 2 creates a matrix lower or equal to the previous solution.

## Phase 3: Greedy assignment

At this point we have reached a solution that fits on the cluster, but we possibly has several missing shards.
We therefore use a greedy algorithm to allocate these shard. We assign the shards source by source, in the order of decreasing total load.

We try assigning shards to indexers while trying to respect their virtual capacity. Because of the uneven size of shards and the greedy approach, this problem might not have a solution. In that case we iteratively grow the virtual capacity by 20% until the solution fits.

Shards for each source are placed in two steps:
- in a first iteration we assign shards that have affinity scores (D)
- in a second iteration we assign the rest of the shards starting with the node having the highest capacity

## Phase 4: Optimization

This is not implemented yet. We could craft a proper optimization cost and use a BFS search to explore
better solutions.


# Code organization

All of this scheduling is done in the scheduling directory.
Clients only have to call the `build_physical_indexing_plan` function.

The code converts the list of sources into a "scheduling problem" that abstracts away kafka pipelines and ingest v2 pipelines.
The problem then goes through our optimization code.
The solution at this point only contains the number of shards of each type to be assigned to each indexers.
The function expands this solution into a complete physical plan, with shard ids and pipelines.


================================================
FILE: quickwit/quickwit-control-plane/src/indexing_scheduler/scheduling/mod.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

pub mod scheduling_logic;
pub mod scheduling_logic_model;

use std::collections::HashMap;
use std::num::NonZeroU32;

use fnv::{FnvHashMap, FnvHashSet};
use quickwit_common::rate_limited_debug;
use quickwit_proto::indexing::{CpuCapacity, IndexingTask};
use quickwit_proto::types::{PipelineUid, ShardId, SourceUid};
use scheduling_logic_model::{IndexerOrd, SourceOrd};
use tracing::{error, warn};

use crate::indexing_plan::PhysicalIndexingPlan;
use crate::indexing_scheduler::scheduling::scheduling_logic_model::{
    IndexerAssignment, SchedulingProblem, SchedulingSolution,
};
use crate::model::ShardLocations;

/// If we have several pipelines below this threshold we
/// reduce the number of pipelines.
///
/// Note that even for 2 pipelines, this creates an hysteris effect.
///
/// Starting from a single pipeline.
/// An overall load above 80% is enough to trigger the creation of a
/// second pipeline.
///
/// Coming back to a single pipeline requires having a load per pipeline
/// of 30%. Which translates into an overall load of 60%.
const CPU_PER_PIPELINE_LOAD_LOWER_THRESHOLD: CpuCapacity = CpuCapacity::from_cpu_millis(1_200);

/// That's 80% of a period
const MAX_LOAD_PER_PIPELINE: CpuCapacity = CpuCapacity::from_cpu_millis(3_200);

fn populate_problem(
    source: &SourceToSchedule,
    problem: &mut SchedulingProblem,
) -> Option<SourceOrd> {
    match &source.source_type {
        SourceToScheduleType::IngestV1 => {
            // TODO ingest v1 is scheduled differently
            None
        }
        SourceToScheduleType::Sharded {
            shard_ids,
            load_per_shard,
        } => {
            let num_shards = shard_ids.len() as u32;
            let source_ord = problem.add_source(num_shards, *load_per_shard);
            Some(source_ord)
        }
        SourceToScheduleType::NonSharded {
            num_pipelines,
            load_per_pipeline,
        } => {
            let source_ord = problem.add_source(*num_pipelines, *load_per_pipeline);
            Some(source_ord)
        }
    }
}

#[derive(Default)]
struct IdToOrdMap<'a> {
    indexer_ids: Vec<String>,
    sources: Vec<&'a SourceToSchedule>,
    indexer_id_to_indexer_ord: FnvHashMap<String, IndexerOrd>,
    source_uid_to_source_ord: FnvHashMap<SourceUid, SourceOrd>,
}

impl<'a> IdToOrdMap<'a> {
    // All source added are required to have a different source uid.
    fn add_source(&mut self, source: &'a SourceToSchedule) -> SourceOrd {
        let source_ord = self.source_uid_to_source_ord.len() as SourceOrd;
        let previous_item = self
            .source_uid_to_source_ord
            .insert(source.source_uid.clone(), source_ord);
        assert!(previous_item.is_none());
        self.sources.push(source);
        source_ord
    }

    fn source_ord(&self, source_uid: &SourceUid) -> Option<SourceOrd> {
        self.source_uid_to_source_ord.get(source_uid).copied()
    }

    fn source(&self, source_uid: &SourceUid) -> Option<(SourceOrd, &'a SourceToSchedule)> {
        let source_ord = self.source_uid_to_source_ord.get(source_uid).copied()?;
        Some((source_ord, self.sources[source_ord as usize]))
    }

    fn indexer_ord(&self, indexer_id: &str) -> Option<IndexerOrd> {
        self.indexer_id_to_indexer_ord.get(indexer_id).copied()
    }

    fn add_indexer_id(&mut self, indexer_id: String) -> IndexerOrd {
        let indexer_ord = self.indexer_ids.len() as IndexerOrd;
        self.indexer_id_to_indexer_ord
            .insert(indexer_id.clone(), indexer_ord);
        self.indexer_ids.push(indexer_id);
        indexer_ord
    }
}

fn convert_physical_plan_to_solution(
    plan: &PhysicalIndexingPlan,
    id_to_ord_map: &IdToOrdMap,
    solution: &mut SchedulingSolution,
) {
    for (indexer_id, indexing_tasks) in plan.indexing_tasks_per_indexer() {
        if let Some(indexer_ord) = id_to_ord_map.indexer_ord(indexer_id) {
            let indexer_assignment = &mut solution.indexer_assignments[indexer_ord];
            for indexing_task in indexing_tasks {
                let source_uid = SourceUid {
                    index_uid: indexing_task.index_uid().clone(),
                    source_id: indexing_task.source_id.clone(),
                };
                if let Some((source_ord, source)) = id_to_ord_map.source(&source_uid) {
                    match &source.source_type {
                        SourceToScheduleType::Sharded { .. } => {
                            indexer_assignment
                                .add_shards(source_ord, indexing_task.shard_ids.len() as u32);
                        }
                        SourceToScheduleType::NonSharded { .. } => {
                            // For non-sharded sources like Kafka, one pipeline = one shard in the
                            // solutions
                            indexer_assignment.add_shards(source_ord, 1);
                        }
                        SourceToScheduleType::IngestV1 => {
                            // Ingest V1 is not part of the logical placement algorithm.
                        }
                    }
                }
            }
        }
    }
}

#[derive(Debug)]
pub struct SourceToSchedule {
    pub source_uid: SourceUid,
    pub source_type: SourceToScheduleType,
    pub params_fingerprint: u64,
}

#[derive(Debug)]
pub enum SourceToScheduleType {
    Sharded {
        shard_ids: Vec<ShardId>,
        load_per_shard: NonZeroU32,
    },
    NonSharded {
        num_pipelines: u32,
        load_per_pipeline: NonZeroU32,
    },
    // deprecated
    IngestV1,
}

fn compute_max_num_shards_per_pipeline(source_type: &SourceToScheduleType) -> NonZeroU32 {
    match &source_type {
        SourceToScheduleType::Sharded { load_per_shard, .. } => {
            NonZeroU32::new(MAX_LOAD_PER_PIPELINE.cpu_millis() / load_per_shard.get())
                .unwrap_or_else(|| {
                    // We throttle shard at ingestion to ensure that a shard does not
                    // exceed 5MB/s.
                    //
                    // This value has been chosen to make sure that one full pipeline
                    // should always be able to handle the load of one shard.
                    //
                    // However it is possible for the system to take more than this
                    // when it is playing catch up.
                    //
                    // This is a transitory state, and not a problem per se.
                    warn!("load per shard is higher than `MAX_LOAD_PER_PIPELINE`");
                    NonZeroU32::MIN // also colloquially known as `1`
                })
        }
        SourceToScheduleType::IngestV1 | SourceToScheduleType::NonSharded { .. } => {
            NonZeroU32::new(1u32).unwrap()
        }
    }
}

// This converts a scheduling solution for a given node and a given source.
// Major quirk however:
// For sharded function, this function only partially performs this conversion.
// In the resulting function some of the shards may not be allocated.
// The remaining shards will be added in postprocessing pass.
fn convert_scheduling_solution_to_physical_plan_single_node_single_source(
    mut remaining_num_shards_to_schedule_on_node: u32,
    // Specific to the source.
    previous_tasks: &[&IndexingTask],
    source: &SourceToSchedule,
) -> Vec<IndexingTask> {
    match &source.source_type {
        SourceToScheduleType::Sharded {
            shard_ids,
            load_per_shard,
        } => {
            if remaining_num_shards_to_schedule_on_node == 0 {
                return Vec::new();
            }
            // For the moment we do something voluntarily suboptimal.
            let max_num_pipelines = quickwit_common::div_ceil_u32(
                remaining_num_shards_to_schedule_on_node * load_per_shard.get(),
                CPU_PER_PIPELINE_LOAD_LOWER_THRESHOLD.cpu_millis(),
            );
            let max_num_shards_per_pipeline: NonZeroU32 =
                compute_max_num_shards_per_pipeline(&source.source_type);
            let mut new_tasks = Vec::new();
            for previous_task in previous_tasks {
                let max_shard_in_pipeline = max_num_shards_per_pipeline
                    .get()
                    .min(remaining_num_shards_to_schedule_on_node)
                    as usize;
                let shard_ids: Vec<ShardId> = previous_task
                    .shard_ids
                    .iter()
                    .filter(|shard_id| shard_ids.contains(shard_id))
                    .take(max_shard_in_pipeline)
                    .cloned()
                    .collect();
                remaining_num_shards_to_schedule_on_node -= shard_ids.len() as u32;
                let pipeline_uid = if previous_task.params_fingerprint == source.params_fingerprint
                {
                    previous_task.pipeline_uid
                } else {
                    Some(PipelineUid::random())
                };
                let new_task = IndexingTask {
                    index_uid: previous_task.index_uid.clone(),
                    source_id: previous_task.source_id.clone(),
                    pipeline_uid,
                    shard_ids,
                    params_fingerprint: source.params_fingerprint,
                };
                new_tasks.push(new_task);
                if new_tasks.len() >= max_num_pipelines as usize {
                    break;
                }
                if remaining_num_shards_to_schedule_on_node == 0 {
                    break;
                }
            }
            new_tasks
        }
        SourceToScheduleType::NonSharded { .. } => {
            // For non-sharded pipelines, we just need `num_shards` is a number of pipelines.
            let mut indexing_tasks: Vec<IndexingTask> = previous_tasks
                .iter()
                .take(remaining_num_shards_to_schedule_on_node as usize)
                .map(|task| (*task).clone())
                .collect();
            for indexing_task in &mut indexing_tasks {
                if indexing_task.params_fingerprint != source.params_fingerprint {
                    indexing_task.params_fingerprint = source.params_fingerprint;
                    indexing_task.pipeline_uid = Some(PipelineUid::random());
                }
            }
            indexing_tasks.resize_with(remaining_num_shards_to_schedule_on_node as usize, || {
                IndexingTask {
                    index_uid: Some(source.source_uid.index_uid.clone()),
                    source_id: source.source_uid.source_id.clone(),
                    pipeline_uid: Some(PipelineUid::random()),
                    shard_ids: Vec::new(),
                    params_fingerprint: source.params_fingerprint,
                }
            });
            indexing_tasks
        }
        SourceToScheduleType::IngestV1 => {
            // Ingest V1 is simple. One pipeline per indexer node.
            if let Some(indexing_task) = previous_tasks.first() {
                // The pipeline already exists, let's reuse it.
                let mut indexing_task = (*indexing_task).clone();
                if indexing_task.params_fingerprint != source.params_fingerprint {
                    indexing_task.params_fingerprint = source.params_fingerprint;
                    indexing_task.pipeline_uid = Some(PipelineUid::random());
                }
                vec![indexing_task]
            } else {
                // The source is new, we need to create a new task.
                vec![IndexingTask {
                    index_uid: Some(source.source_uid.index_uid.clone()),
                    source_id: source.source_uid.source_id.clone(),
                    pipeline_uid: Some(PipelineUid::random()),
                    shard_ids: Vec::new(),
                    params_fingerprint: source.params_fingerprint,
                }]
            }
        }
    }
}

fn convert_scheduling_solution_to_physical_plan_single_node(
    indexer_assignment: &IndexerAssignment,
    previous_tasks: &[IndexingTask],
    sources: &[SourceToSchedule],
    id_to_ord_map: &IdToOrdMap,
) -> Vec<IndexingTask> {
    let mut tasks = Vec::new();
    for source in sources {
        let source_num_shards =
            if let Some(source_ord) = id_to_ord_map.source_ord(&source.source_uid) {
                indexer_assignment.num_shards(source_ord)
            } else {
                // This can happen for IngestV1
                1u32
            };
        let source_pipelines: Vec<&IndexingTask> = previous_tasks
            .iter()
            .filter(|task| {
                task.index_uid() == &source.source_uid.index_uid
                    && task.source_id == source.source_uid.source_id
            })
            .collect();
        let source_tasks = convert_scheduling_solution_to_physical_plan_single_node_single_source(
            source_num_shards,
            &source_pipelines[..],
            source,
        );
        tasks.extend(source_tasks);
    }
    // code goes here.
    tasks.sort_by(|left: &IndexingTask, right: &IndexingTask| {
        left.index_uid
            .cmp(&right.index_uid)
            .then_with(|| left.source_id.cmp(&right.source_id))
    });
    tasks
}

/// This function takes a scheduling solution (which abstracts the notion of pipelines,
/// and shard ids) and builds a physical plan, attempting to make as little change as possible
/// to the existing pipelines.
///
/// We do not support moving shard from one pipeline to another, so if required this function may
/// also return instruction about deleting / adding new shards.
fn convert_scheduling_solution_to_physical_plan(
    solution: &SchedulingSolution,
    id_to_ord_map: &IdToOrdMap,
    sources: &[SourceToSchedule],
    previous_plan_opt: Option<&PhysicalIndexingPlan>,
    shard_locations: &ShardLocations,
) -> PhysicalIndexingPlan {
    let mut indexer_assignments = solution.indexer_assignments.clone();
    let mut new_physical_plan = PhysicalIndexingPlan::with_indexer_ids(&id_to_ord_map.indexer_ids);
    for (indexer_id, indexer_assignment) in id_to_ord_map
        .indexer_ids
        .iter()
        .zip(&mut indexer_assignments)
    {
        let previous_tasks_for_indexer = previous_plan_opt
            .and_then(|previous_plan| previous_plan.indexer(indexer_id))
            .unwrap_or(&[]);
        // First we attempt to recycle existing pipelines.
        let new_plan_indexing_tasks_for_indexer: Vec<IndexingTask> =
            convert_scheduling_solution_to_physical_plan_single_node(
                indexer_assignment,
                previous_tasks_for_indexer,
                sources,
                id_to_ord_map,
            );
        for indexing_task in new_plan_indexing_tasks_for_indexer {
            new_physical_plan.add_indexing_task(indexer_id, indexing_task);
        }
    }

    // We still need to do some extra work for sharded sources: assign missing shards, and possibly
    // adding extra pipelines.
    for source in sources {
        let SourceToScheduleType::Sharded { shard_ids, .. } = &source.source_type else {
            continue;
        };
        let source_ord = id_to_ord_map.source_ord(&source.source_uid).unwrap();
        let mut scheduled_shards: FnvHashSet<ShardId> = FnvHashSet::default();
        let mut remaining_num_shards_per_node: HashMap<String, NonZeroU32> =
            HashMap::with_capacity(new_physical_plan.num_indexers());
        for (indexer, indexing_tasks) in new_physical_plan.indexing_tasks_per_indexer_mut() {
            let indexer_ord = id_to_ord_map.indexer_ord(indexer).unwrap();
            let mut num_shards_for_indexer_source: u32 =
                indexer_assignments[indexer_ord].num_shards(source_ord);
            for indexing_task in indexing_tasks {
                if indexing_task.index_uid() == &source.source_uid.index_uid
                    && indexing_task.source_id == source.source_uid.source_id
                {
                    indexing_task.shard_ids.retain(|shard_id| {
                        let shard_added = scheduled_shards.insert(shard_id.clone());
                        if shard_added {
                            true
                        } else {
                            error!(
                                "this should never happen. shard was allocated into two pipelines."
                            );
                            false
                        }
                    });
                    num_shards_for_indexer_source -= indexing_task.shard_ids.len() as u32;
                }
            }
            if let Some(num_shards_for_indexer_source_non_zero) =
                NonZeroU32::new(num_shards_for_indexer_source)
            {
                remaining_num_shards_per_node
                    .insert(indexer.clone(), num_shards_for_indexer_source_non_zero);
            }
        }

        // Missing shards is an iterator over the shards that are not scheduled into a pipeline yet.
        let missing_shards: Vec<ShardId> = shard_ids
            .iter()
            .filter(|shard_id| !scheduled_shards.contains(shard_id))
            .cloned()
            .collect();

        // Let's assign the missing shards.
        let max_shard_per_pipeline = compute_max_num_shards_per_pipeline(&source.source_type);

        let shard_to_indexer: HashMap<ShardId, String> = assign_shards(
            missing_shards,
            remaining_num_shards_per_node,
            shard_locations,
        );
        for (shard_id, indexer) in shard_to_indexer {
            add_shard_to_indexer(
                shard_id,
                indexer,
                &source.source_uid,
                max_shard_per_pipeline,
                &mut new_physical_plan,
                source.params_fingerprint,
            );
        }
    }

    new_physical_plan.normalize();

    new_physical_plan
}

/// This function is meant to be called after we have solved the scheduling
/// problem, so we already know the number of shards to be assigned on each indexer node.
/// We now need to precisely where each shard should be assigned.
///
/// It assigns the missing shards for a given source to the indexers, given:
/// - the total number of shards that are to be scheduled on each nodes
/// - the shard locations
///
/// This function will assign shards on a node hosting them in priority.
///
/// The current implementation is a heuristic.
/// In the first pass, we attempt to assign as many shards as possible on the
/// node hosting them.
fn assign_shards(
    missing_shards: Vec<ShardId>,
    mut remaining_num_shards_per_node: HashMap<String, NonZeroU32>,
    shard_locations: &ShardLocations,
) -> HashMap<ShardId, String> {
    let mut shard_to_indexer: HashMap<ShardId, String> =
        HashMap::with_capacity(missing_shards.len());

    // In a first pass we first assign as many shards on their hosting nodes as possible.
    let mut remaining_missing_shards: Vec<ShardId> = Vec::new();
    for shard_id in missing_shards {
        // As a heuristic, we pick the first node hosting the shard that is available.
        let indexer_hosting_shard: Option<(NonZeroU32, &str)> = shard_locations
            .get_shard_locations(&shard_id)
            .iter()
            .map(|node_id| node_id.as_str())
            .flat_map(|node_id| {
                let num_shards = remaining_num_shards_per_node.get(node_id)?;
                Some((*num_shards, node_id))
            })
            .min_by_key(|(num_shards, _node_id)| *num_shards);
        if let Some((_num_shards, indexer)) = indexer_hosting_shard {
            decrement_num_shards(indexer, &mut remaining_num_shards_per_node);
            shard_to_indexer.insert(shard_id, indexer.to_string());
        } else {
            remaining_missing_shards.push(shard_id);
        }
    }

    for shard_id in remaining_missing_shards {
        let indexer = remaining_num_shards_per_node
            .keys()
            .next()
            .expect("failed to assign all shards. please report")
            .to_string();
        decrement_num_shards(&indexer, &mut remaining_num_shards_per_node);
        shard_to_indexer.insert(shard_id, indexer.to_string());
    }
    assert!(remaining_num_shards_per_node.is_empty());

    shard_to_indexer
}

fn decrement_num_shards(
    node_id: &str,
    remaining_num_shards_to_schedule_per_indexers: &mut HashMap<String, NonZeroU32>,
) {
    {
        let previous_num_shards = remaining_num_shards_to_schedule_per_indexers
            .get_mut(node_id)
            .unwrap();
        if let Some(new_num_shards) = NonZeroU32::new(previous_num_shards.get() - 1) {
            *previous_num_shards = new_num_shards;
            return;
        }
    }
    remaining_num_shards_to_schedule_per_indexers.remove(node_id);
}

// Checks that's the physical solution indeed matches the scheduling solution.
fn assert_post_condition_physical_plan_match_solution(
    physical_plan: &PhysicalIndexingPlan,
    solution: &SchedulingSolution,
    id_to_ord_map: &IdToOrdMap,
) {
    let num_indexers = physical_plan.indexing_tasks_per_indexer().len();
    assert_eq!(num_indexers, solution.indexer_assignments.len());
    assert_eq!(num_indexers, id_to_ord_map.indexer_ids.len());
    let mut reconstructed_solution = SchedulingSolution::with_num_indexers(num_indexers);
    convert_physical_plan_to_solution(physical_plan, id_to_ord_map, &mut reconstructed_solution);
    assert_eq!(
        solution.indexer_assignments,
        reconstructed_solution.indexer_assignments
    );
}

fn add_shard_to_indexer(
    missing_shard: ShardId,
    indexer: String,
    source_uid: &SourceUid,
    max_shard_per_pipeline: NonZeroU32,
    new_physical_plan: &mut PhysicalIndexingPlan,
    params_fingerprint: u64,
) {
    let indexer_tasks = new_physical_plan
        .indexing_tasks_per_indexer_mut()
        .entry(indexer)
        .or_default();

    let indexing_task_opt = indexer_tasks
        .iter_mut()
        .filter(|indexing_task| {
            indexing_task.index_uid() == &source_uid.index_uid
                && indexing_task.source_id == source_uid.source_id
        })
        .filter(|task| task.shard_ids.len() < max_shard_per_pipeline.get() as usize)
        .min_by_key(|task| task.shard_ids.len());

    if let Some(indexing_task) = indexing_task_opt {
        indexing_task.shard_ids.push(missing_shard);
    } else {
        // We haven't found any pipeline with remaining room.
        // It is time to create a new pipeline.
        indexer_tasks.push(IndexingTask {
            index_uid: Some(source_uid.index_uid.clone()),
            source_id: source_uid.source_id.clone(),
            pipeline_uid: Some(PipelineUid::random()),
            shard_ids: vec![missing_shard],
            params_fingerprint,
        });
    }
}

// If the total node capacities is lower than 120% of the problem load, this
// function scales the load of the indexer to reach this limit.
fn inflate_node_capacities_if_necessary(problem: &mut SchedulingProblem) {
    // First we scale the problem to the point where any indexer can fit the largest shard.
    let Some(largest_shard_load) = problem.sources().map(|source| source.load_per_shard).max()
    else {
        return;
    };

    // We first artificially scale down the node capacities.
    //
    // The node capacity is an estimate of the amount of CPU available on a given indexer node.
    // It has two purpose,
    // - under a lot of load, indexer will receive work proportional to their relative capacity.
    // - under low load, the absolute magnitude will be used by the scheduler, to decide whether
    // to prefer having a balanced workload over other criteria (all pipeline from a same index on
    // the same node, indexing local shards, etc.).
    //
    // The default CPU capacity is detected from the OS. Using these values directly leads
    // a non uniform distribution of the load which is very confusing for users. We artificially
    // scale down the indexer capacities.
    problem.scale_node_capacities(0.3f32);

    let min_indexer_capacity = (0..problem.num_indexers())
        .map(|indexer_ord| problem.indexer_cpu_capacity(indexer_ord))
        .min()
        .expect("At least one indexer is required");

    assert_ne!(min_indexer_capacity.cpu_millis(), 0);
    if min_indexer_capacity.cpu_millis() < largest_shard_load.get() {
        let scaling_factor =
            (largest_shard_load.get() as f32) / (min_indexer_capacity.cpu_millis() as f32);
        problem.scale_node_capacities(scaling_factor);
    }

    let total_node_capacities: f32 = problem.total_node_capacities().cpu_millis() as f32;
    let total_load: f32 = problem.total_load() as f32;
    let inflated_total_load = total_load * 1.2f32;
    if inflated_total_load >= total_node_capacities {
        // We need to inflate our node capacities to match the problem.
        let ratio = inflated_total_load / total_node_capacities;
        problem.scale_node_capacities(ratio);
    }
}

/// Creates a physical plan given the current situation of the cluster and the list of sources
/// to schedule.
///
/// The scheduling problem abstracts all notion of shard ids, source types, and node_ids,
/// to transform scheduling into a math problem.
///
/// This function implementation therefore goes
/// 1) transform our problem into a scheduling problem. Something closer to a well-defined
///    optimization problem. In particular this step removes:
///    - the notion of shard ids, and only considers a number of shards being allocated.
///    - node_ids and shard ids. These are replaced by integers.
/// 2) convert the current situation of the cluster into something a previous scheduling solution.
/// 3) compute the new scheduling solution.
/// 4) convert the new scheduling solution back to the real world by reallocating the shard ids.
///
/// TODO cut into pipelines.
/// Panics if any sources has no shards.
pub fn build_physical_indexing_plan(
    sources: &[SourceToSchedule],
    indexer_id_to_cpu_capacities: &FnvHashMap<String, CpuCapacity>,
    previous_plan_opt: Option<&PhysicalIndexingPlan>,
    shard_locations: &ShardLocations,
) -> PhysicalIndexingPlan {
    // Asserts that the source are valid.
    check_sources(sources);

    // We convert our problem into a simplified scheduling problem.
    // In this simplified version, nodes and sources are just ids.
    // Instead of individual shard ids, we just keep count of shards.
    // Similarly, instead of accurate locality, we just keep the number of shards local
    // to an indexer.
    let (id_to_ord_map, problem) =
        convert_to_simplified_problem(indexer_id_to_cpu_capacities, sources, shard_locations);

    // Populate the previous solution, if any.
    let mut previous_solution = problem.new_solution();
    if let Some(previous_plan) = previous_plan_opt {
        convert_physical_plan_to_solution(previous_plan, &id_to_ord_map, &mut previous_solution);
    }

    // Compute the new scheduling solution using a heuristic.
    let new_solution = scheduling_logic::solve(problem, previous_solution);

    // Convert the new scheduling solution back to a physical plan.
    let new_physical_plan = convert_scheduling_solution_to_physical_plan(
        &new_solution,
        &id_to_ord_map,
        sources,
        previous_plan_opt,
        shard_locations,
    );

    assert_post_condition_physical_plan_match_solution(
        &new_physical_plan,
        &new_solution,
        &id_to_ord_map,
    );

    new_physical_plan
}

/// Makes any checks on the sources.
/// Sharded sources are not allowed to have no shards.
fn check_sources(sources: &[SourceToSchedule]) {
    for source in sources {
        if let SourceToScheduleType::Sharded { shard_ids, .. } = &source.source_type {
            assert!(!shard_ids.is_empty())
        }
    }
}

fn convert_to_simplified_problem<'a>(
    indexer_id_to_cpu_capacities: &'a FnvHashMap<String, CpuCapacity>,
    sources: &'a [SourceToSchedule],
    shard_locations: &ShardLocations,
) -> (IdToOrdMap<'a>, SchedulingProblem) {
    // Convert our problem to a scheduling problem.
    let mut id_to_ord_map: IdToOrdMap<'a> = IdToOrdMap::default();

    // We use a Vec as a `IndexOrd` -> Max load map.
    let mut indexer_cpu_capacities: Vec<CpuCapacity> =
        Vec::with_capacity(indexer_id_to_cpu_capacities.len());
    for (indexer_id, &cpu_capacity) in indexer_id_to_cpu_capacities {
        let indexer_ord = id_to_ord_map.add_indexer_id(indexer_id.clone());
        assert_eq!(indexer_ord, indexer_cpu_capacities.len() as IndexerOrd);
        indexer_cpu_capacities.push(cpu_capacity);
    }

    let mut problem = SchedulingProblem::with_indexer_cpu_capacities(indexer_cpu_capacities);

    for source in sources {
        if let Some(source_ord) = populate_problem(source, &mut problem) {
            let registered_source_ord = id_to_ord_map.add_source(source);
            if let SourceToScheduleType::Sharded { shard_ids, .. } = &source.source_type {
                for shard_id in shard_ids {
                    for &indexer in shard_locations.get_shard_locations(shard_id) {
                        let Some(indexer_ord) = id_to_ord_map.indexer_ord(indexer.as_str()) else {
                            // This happens if the ingester is unavailable.
                            rate_limited_debug!(
                                limit_per_min = 10,
                                "failed to find indexer ord for indexer {indexer}"
                            );
                            continue;
                        };
                        problem.inc_affinity(source_ord, indexer_ord);
                    }
                }
            }
            assert_eq!(source_ord, registered_source_ord);
        }
    }
    (id_to_ord_map, problem)
}

#[cfg(test)]
mod tests {

    use std::collections::{HashMap, HashSet};
    use std::num::NonZeroU32;
    use std::str::FromStr;
    use std::sync::atomic::{AtomicUsize, Ordering};

    use fnv::FnvHashMap;
    use itertools::Itertools;
    use quickwit_proto::indexing::{CpuCapacity, IndexingTask, mcpu};
    use quickwit_proto::types::{IndexUid, NodeId, PipelineUid, ShardId, SourceUid};
    use rand::prelude::IndexedRandom;

    use super::{
        SourceToSchedule, SourceToScheduleType, build_physical_indexing_plan,
        convert_scheduling_solution_to_physical_plan_single_node_single_source,
    };
    use crate::indexing_plan::PhysicalIndexingPlan;
    use crate::indexing_scheduler::get_shard_locality_metrics;
    use crate::indexing_scheduler::scheduling::assign_shards;
    use crate::model::ShardLocations;

    fn source_id() -> SourceUid {
        static COUNTER: AtomicUsize = AtomicUsize::new(0);
        let index = IndexUid::for_test("test_index", 0);
        let source_id = COUNTER.fetch_add(1, Ordering::SeqCst);
        SourceUid {
            index_uid: index,
            source_id: format!("source_{source_id}"),
        }
    }

    #[test]
    fn test_build_physical_plan() {
        let indexer1 = "indexer1".to_string();
        let indexer2 = "indexer2".to_string();
        let source_uid0 = source_id();
        let source_uid1 = source_id();
        let source_uid2 = source_id();
        let source_0 = SourceToSchedule {
            source_uid: source_uid0.clone(),
            source_type: SourceToScheduleType::Sharded {
                shard_ids: vec![
                    ShardId::from(0),
                    ShardId::from(1),
                    ShardId::from(2),
                    ShardId::from(3),
                    ShardId::from(4),
                    ShardId::from(5),
                    ShardId::from(6),
                    ShardId::from(7),
                ],
                load_per_shard: NonZeroU32::new(1_000).unwrap(),
            },
            params_fingerprint: 0,
        };
        let source_1 = SourceToSchedule {
            source_uid: source_uid1.clone(),
            source_type: SourceToScheduleType::NonSharded {
                num_pipelines: 2,
                load_per_pipeline: NonZeroU32::new(3_200).unwrap(),
            },
            params_fingerprint: 0,
        };
        let source_2 = SourceToSchedule {
            source_uid: source_uid2.clone(),
            source_type: SourceToScheduleType::IngestV1,
            params_fingerprint: 0,
        };
        let mut indexer_id_to_cpu_capacities = FnvHashMap::default();
        indexer_id_to_cpu_capacities.insert(indexer1.clone(), mcpu(16_000));
        indexer_id_to_cpu_capacities.insert(indexer2.clone(), mcpu(16_000));
        let shard_locations = ShardLocations::default();
        let indexing_plan = build_physical_indexing_plan(
            &[source_0, source_1, source_2],
            &indexer_id_to_cpu_capacities,
            None,
            &shard_locations,
        );
        assert_eq!(indexing_plan.indexing_tasks_per_indexer().len(), 2);

        let node1_plan = indexing_plan.indexer(&indexer1).unwrap();
        let node2_plan = indexing_plan.indexer(&indexer2).unwrap();

        // both non-sharded pipelines get scheduled on the same node.
        assert_eq!(node1_plan.len(), 3);
        assert_eq!(&node1_plan[0].source_id, &source_uid1.source_id);
        assert!(&node1_plan[0].shard_ids.is_empty());
        assert_eq!(&node1_plan[1].source_id, &source_uid1.source_id);
        assert!(&node1_plan[1].shard_ids.is_empty());
        assert_eq!(&node1_plan[2].source_id, &source_uid2.source_id);
        assert!(&node1_plan[2].shard_ids.is_empty());

        assert_eq!(node2_plan.len(), 4);
        assert_eq!(&node2_plan[0].source_id, &source_uid0.source_id);

        let mut shard_ids: HashSet<ShardId> = HashSet::default();
        let mut shard_lens = Vec::new();
        shard_lens.push(node2_plan[0].shard_ids.len());
        shard_ids.extend(node2_plan[0].shard_ids.iter().cloned());
        assert_eq!(&node2_plan[1].source_id, &source_uid0.source_id);
        shard_lens.push(node2_plan[1].shard_ids.len());
        shard_ids.extend(node2_plan[1].shard_ids.iter().cloned());
        assert_eq!(&node2_plan[2].source_id, &source_uid0.source_id);
        shard_lens.push(node2_plan[2].shard_ids.len());
        shard_ids.extend(node2_plan[2].shard_ids.iter().cloned());
        assert_eq!(shard_ids.len(), 8);
        assert_eq!(&node2_plan[3].source_id, &source_uid2.source_id);
        shard_lens.sort();
        assert_eq!(&shard_lens[..], &[2, 3, 3]);
    }

    #[test]
    fn test_build_physical_plan_with_locality() {
        let num_indexers = 10;
        let num_shards: usize = 1000;
        let indexers: Vec<NodeId> = (0..num_indexers)
            .map(|indexer_id| NodeId::new(format!("indexer{indexer_id}")))
            .collect();
        let source_uids: Vec<SourceUid> = std::iter::repeat_with(source_id).take(1_000).collect();
        let shard_ids: Vec<ShardId> = (0..num_shards as u64).map(ShardId::from).collect();
        let sources: Vec<SourceToSchedule> = (0..num_shards)
            .map(|i| SourceToSchedule {
                source_uid: source_uids[i].clone(),
                source_type: SourceToScheduleType::Sharded {
                    shard_ids: vec![shard_ids[i].clone()],
                    load_per_shard: NonZeroU32::new(250).unwrap(),
                },
                params_fingerprint: 0,
            })
            .collect();

        let mut indexer_id_to_cpu_capacities = FnvHashMap::default();
        for indexer in &indexers {
            indexer_id_to_cpu_capacities.insert(indexer.as_str().to_string(), mcpu(16_000));
        }
        let mut rng = rand::rng();

        let mut shard_locations = ShardLocations::default();
        for shard_id in &shard_ids {
            let indexer = indexers[..].choose(&mut rng).unwrap();
            shard_locations.add_location(shard_id, indexer);
        }

        let plan = build_physical_indexing_plan(
            &sources,
            &indexer_id_to_cpu_capacities,
            None,
            &shard_locations,
        );
        assert_eq!(plan.indexing_tasks_per_indexer().len(), num_indexers);
        let metrics = get_shard_locality_metrics(&plan, &shard_locations);
        assert_eq!(
            metrics.num_remote_shards + metrics.num_local_shards,
            num_shards
        );
        assert!(metrics.num_remote_shards < 10);
    }

    #[tokio::test]
    async fn test_build_physical_indexing_plan_with_not_enough_indexers() {
        let source_uid1 = source_id();
        let source_1 = SourceToSchedule {
            source_uid: source_uid1.clone(),
            source_type: SourceToScheduleType::NonSharded {
                num_pipelines: 2,
                load_per_pipeline: NonZeroU32::new(1000).unwrap(),
            },
            params_fingerprint: 0,
        };
        let sources = vec![source_1];

        let indexer1 = "indexer1".to_string();
        let mut indexer_max_loads = FnvHashMap::default();
        let shard_locations = ShardLocations::default();
        {
            indexer_max_loads.insert(indexer1.clone(), mcpu(1_999));
            // This test what happens when there isn't enough capacity on the cluster.
            let physical_plan =
                build_physical_indexing_plan(&sources, &indexer_max_loads, None, &shard_locations);
            assert_eq!(physical_plan.indexing_tasks_per_indexer().len(), 1);
            let expected_tasks = physical_plan.indexer(&indexer1).unwrap();
            assert_eq!(expected_tasks.len(), 2);
            assert_eq!(&expected_tasks[0].source_id, &source_uid1.source_id);
        }
        {
            indexer_max_loads.insert(indexer1.clone(), mcpu(2_000));
            // This test what happens when there isn't enough capacity on the cluster.
            let physical_plan =
                build_physical_indexing_plan(&sources, &indexer_max_loads, None, &shard_locations);
            assert_eq!(physical_plan.indexing_tasks_per_indexer().len(), 1);
            let expected_tasks = physical_plan.indexer(&indexer1).unwrap();
            assert_eq!(expected_tasks.len(), 2);
            assert_eq!(&expected_tasks[0].source_id, &source_uid1.source_id);
            assert!(expected_tasks[0].shard_ids.is_empty());
            assert_eq!(&expected_tasks[1].source_id, &source_uid1.source_id);
            assert!(expected_tasks[1].shard_ids.is_empty());
        }
    }

    fn make_indexing_tasks(
        source_uid: &SourceUid,
        shards: &[(PipelineUid, &[ShardId])],
    ) -> Vec<IndexingTask> {
        let mut plan = Vec::new();
        for (pipeline_uid, shard_ids) in shards {
            plan.push(IndexingTask {
                index_uid: Some(source_uid.index_uid.clone()),
                source_id: source_uid.source_id.clone(),
                pipeline_uid: Some(*pipeline_uid),
                shard_ids: shard_ids.to_vec(),
                params_fingerprint: 0,
            });
        }
        plan
    }

    #[test]
    fn test_group_shards_into_pipeline_simple() {
        let source_uid = source_id();
        let indexing_tasks = make_indexing_tasks(
            &source_uid,
            &[
                (
                    PipelineUid::for_test(1u128),
                    &[ShardId::from(1), ShardId::from(2)],
                ),
                (
                    PipelineUid::for_test(2u128),
                    &[ShardId::from(3), ShardId::from(4), ShardId::from(5)],
                ),
            ],
        );
        let sources = vec![SourceToSchedule {
            source_uid: source_uid.clone(),
            source_type: SourceToScheduleType::Sharded {
                shard_ids: vec![
                    ShardId::from(0),
                    ShardId::from(1),
                    ShardId::from(3),
                    ShardId::from(4),
                    ShardId::from(5),
                ],
                load_per_shard: NonZeroU32::new(1_000).unwrap(),
            },
            params_fingerprint: 0,
        }];
        let mut indexer_id_to_cpu_capacities = FnvHashMap::default();
        indexer_id_to_cpu_capacities.insert("node1".to_string(), mcpu(10_000));
        let mut indexing_plan = PhysicalIndexingPlan::with_indexer_ids(&["node1".to_string()]);
        for indexing_task in indexing_tasks {
            indexing_plan.add_indexing_task("node1", indexing_task);
        }
        let shard_locations = ShardLocations::default();
        let new_plan = build_physical_indexing_plan(
            &sources,
            &indexer_id_to_cpu_capacities,
            Some(&indexing_plan),
            &shard_locations,
        );
        let indexing_tasks = new_plan.indexer("node1").unwrap();
        assert_eq!(indexing_tasks.len(), 2);
        assert_eq!(
            &indexing_tasks[0].shard_ids,
            &[ShardId::from(0), ShardId::from(1)]
        );
        assert_eq!(
            &indexing_tasks[1].shard_ids,
            &[ShardId::from(3), ShardId::from(4), ShardId::from(5)]
        );
    }

    fn group_shards_into_pipelines_aux(
        source_uid: &SourceUid,
        shard_ids: &[u64],
        previous_pipeline_shards: &[(PipelineUid, &[ShardId])],
        load_per_shard: CpuCapacity,
    ) -> Vec<IndexingTask> {
        let indexing_tasks = make_indexing_tasks(source_uid, previous_pipeline_shards);
        let sources = vec![SourceToSchedule {
            source_uid: source_uid.clone(),
            source_type: SourceToScheduleType::Sharded {
                shard_ids: shard_ids.iter().copied().map(ShardId::from).collect(),
                load_per_shard: NonZeroU32::new(load_per_shard.cpu_millis()).unwrap(),
            },
            params_fingerprint: 0,
        }];
        const NODE: &str = "node1";
        let mut indexer_id_to_cpu_capacities = FnvHashMap::default();
        indexer_id_to_cpu_capacities.insert(NODE.to_string(), mcpu(10_000));
        let mut indexing_plan = PhysicalIndexingPlan::with_indexer_ids(&["node1".to_string()]);
        for indexing_task in indexing_tasks {
            indexing_plan.add_indexing_task(NODE, indexing_task);
        }
        let shard_locations = ShardLocations::default();
        let new_plan = build_physical_indexing_plan(
            &sources,
            &indexer_id_to_cpu_capacities,
            Some(&indexing_plan),
            &shard_locations,
        );
        let mut indexing_tasks = new_plan.indexer(NODE).unwrap().to_vec();
        for indexing_task in &mut indexing_tasks {
            indexing_task.shard_ids.sort();
        }
        // We sort indexing tasks for normalization purpose
        indexing_tasks.sort_by_key(|task| task.shard_ids[0].clone());
        indexing_tasks
    }

    #[test]
    fn test_group_shards_load_per_shard_too_high() {
        let source_uid = source_id();
        let indexing_tasks =
            group_shards_into_pipelines_aux(&source_uid, &[1, 2], &[], mcpu(4_000));
        assert_eq!(indexing_tasks.len(), 2);
    }

    #[test]
    fn test_group_shards_into_pipeline_hysteresis() {
        let source_uid = source_id();
        let indexing_tasks_1 = group_shards_into_pipelines_aux(
            &source_uid,
            &[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10],
            &[],
            mcpu(400),
        );
        assert_eq!(indexing_tasks_1.len(), 2);
        let indexing_tasks_len_1: Vec<usize> = indexing_tasks_1
            .iter()
            .map(|task| task.shard_ids.len())
            .sorted()
            .collect();
        assert_eq!(&indexing_tasks_len_1, &[3, 8]);

        let pipeline_tasks1: Vec<(PipelineUid, &[ShardId])> = indexing_tasks_1
            .iter()
            .map(|task| (task.pipeline_uid(), &task.shard_ids[..]))
            .collect();

        // With the same set of shards, an increase of load triggers the creation of a new task.
        let indexing_tasks_2 = group_shards_into_pipelines_aux(
            &source_uid,
            &[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10],
            &pipeline_tasks1[..],
            mcpu(600),
        );
        assert_eq!(indexing_tasks_2.len(), 3);
        let indexing_tasks_len_2: Vec<usize> = indexing_tasks_2
            .iter()
            .map(|task| task.shard_ids.len())
            .sorted()
            .collect();
        assert_eq!(&indexing_tasks_len_2, &[1, 5, 5]);

        // Now the load comes back to normal
        // The hysteresis takes effect. We do not switch back to 2 pipelines.
        let pipeline_tasks_2: Vec<(PipelineUid, &[ShardId])> = indexing_tasks_2
            .iter()
            .map(|task| (task.pipeline_uid(), &task.shard_ids[..]))
            .collect();
        assert_eq!(indexing_tasks_2.len(), 3);
        let indexing_tasks_3 = group_shards_into_pipelines_aux(
            &source_uid,
            &[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10],
            &pipeline_tasks_2,
            mcpu(400),
        );
        assert_eq!(&indexing_tasks_3, &indexing_tasks_2);

        let pipeline_tasks3: Vec<(PipelineUid, &[ShardId])> = indexing_tasks_3
            .iter()
            .map(|task| (task.pipeline_uid(), &task.shard_ids[..]))
            .collect();
        // Now a further lower load.
        let indexing_tasks_4 = group_shards_into_pipelines_aux(
            &source_uid,
            &[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10],
            &pipeline_tasks3,
            mcpu(200),
        );
        assert_eq!(indexing_tasks_4.len(), 2);
        let indexing_tasks_len_4: Vec<usize> = indexing_tasks_4
            .iter()
            .map(|task| task.shard_ids.len())
            .sorted()
            .collect();
        assert_eq!(&indexing_tasks_len_4, &[5, 6]);
    }

    /// We want to make sure for small pipelines, we still reschedule them with the same
    /// pipeline uid.
    #[test]
    fn test_group_shards_into_pipeline_single_small_pipeline() {
        let source_uid = source_id();
        let pipeline_uid = PipelineUid::for_test(1u128);
        let indexing_tasks = group_shards_into_pipelines_aux(
            &source_uid,
            &[12],
            &[(pipeline_uid, &[ShardId::from(12)])],
            mcpu(100),
        );
        assert_eq!(indexing_tasks.len(), 1);
        let indexing_task = &indexing_tasks[0];
        assert_eq!(&indexing_task.shard_ids, &[ShardId::from(12)]);
        assert_eq!(indexing_task.pipeline_uid.unwrap(), pipeline_uid);
    }

    #[test]
    fn test_assign_missing_shards() {
        let shard0 = ShardId::from(0);
        let shard1 = ShardId::from(1);
        let shard2 = ShardId::from(2);
        let shard3 = ShardId::from(3);

        let missing_shards = vec![
            shard0.clone(),
            shard1.clone(),
            shard2.clone(),
            shard3.clone(),
        ];
        let node1 = NodeId::new("node1".to_string());
        let node2 = NodeId::new("node2".to_string());
        // This node is missing from the capacity map.
        // It should not be assigned any task despite being present in shard locations.
        let node_missing = NodeId::new("node_missing".to_string());
        let mut remaining_num_shards_per_node = HashMap::default();
        remaining_num_shards_per_node
            .insert(node1.as_str().to_string(), NonZeroU32::new(3).unwrap());
        remaining_num_shards_per_node
            .insert(node2.as_str().to_string(), NonZeroU32::new(1).unwrap());

        let mut shard_locations: ShardLocations = ShardLocations::default();
        // shard1 on 1
        shard_locations.add_location(&shard1, &node1);
        // shard2 on 2
        shard_locations.add_location(&shard2, &node2);
        // shard3 on both 1 and 2
        shard_locations.add_location(&shard3, &node1);
        shard_locations.add_location(&shard3, &node2);
        shard_locations.add_location(&shard0, &node_missing);

        let shard_to_indexer = assign_shards(
            missing_shards,
            remaining_num_shards_per_node,
            &shard_locations,
        );
        assert_eq!(shard_to_indexer.len(), 4);
        assert_eq!(shard_to_indexer.get(&shard1).unwrap(), "node1");
        assert_eq!(shard_to_indexer.get(&shard2).unwrap(), "node2");
        assert_eq!(shard_to_indexer.get(&shard3).unwrap(), "node1");
        assert_eq!(shard_to_indexer.get(&shard0).unwrap(), "node1");
    }

    #[test]
    fn test_solution_reconstruction() {
        let sources_to_schedule = vec![
            SourceToSchedule {
                source_uid: SourceUid {
                    index_uid: IndexUid::from_str("otel-logs-v0_6:01HKYD1SE37C90KSH21CD1M11A")
                        .unwrap(),
                    source_id: "_ingest-api-source".to_string(),
                },
                source_type: SourceToScheduleType::IngestV1,
                params_fingerprint: 0,
            },
            SourceToSchedule {
                source_uid: SourceUid {
                    index_uid: IndexUid::from_str(
                        "simian_chico_12856033706389338959:01HKYD414H1WVSASC5YD972P39",
                    )
                    .unwrap(),
                    source_id: "_ingest-source".to_string(),
                },
                source_type: SourceToScheduleType::Sharded {
                    shard_ids: vec![ShardId::from(1)],
                    load_per_shard: NonZeroU32::new(250).unwrap(),
                },
                params_fingerprint: 0,
            },
        ];
        let mut capacities = FnvHashMap::default();
        capacities.insert("indexer-1".to_string(), CpuCapacity::from_cpu_millis(8000));
        let shard_locations = ShardLocations::default();
        build_physical_indexing_plan(&sources_to_schedule, &capacities, None, &shard_locations);
    }

    #[test]
    fn test_convert_scheduling_solution_to_physical_plan_single_node_single_source_sharded() {
        let source_uid = SourceUid {
            index_uid: IndexUid::new_with_random_ulid("testindex"),
            source_id: "testsource".to_string(),
        };
        let previous_task1 = IndexingTask {
            index_uid: Some(source_uid.index_uid.clone()),
            source_id: source_uid.source_id.to_string(),
            pipeline_uid: Some(PipelineUid::random()),
            shard_ids: vec![ShardId::from(1), ShardId::from(4), ShardId::from(5)],
            params_fingerprint: 0,
        };
        let previous_task2 = IndexingTask {
            index_uid: Some(source_uid.index_uid.clone()),
            source_id: source_uid.source_id.to_string(),
            pipeline_uid: Some(PipelineUid::random()),
            shard_ids: vec![
                ShardId::from(6),
                ShardId::from(7),
                ShardId::from(8),
                ShardId::from(9),
                ShardId::from(10),
            ],
            params_fingerprint: 0,
        };
        {
            let sharded_source = SourceToSchedule {
                source_uid: source_uid.clone(),
                source_type: SourceToScheduleType::Sharded {
                    shard_ids: vec![
                        ShardId::from(1),
                        ShardId::from(2),
                        ShardId::from(4),
                        ShardId::from(6),
                    ],
                    load_per_shard: NonZeroU32::new(1_000).unwrap(),
                },
                params_fingerprint: 0,
            };
            let tasks = convert_scheduling_solution_to_physical_plan_single_node_single_source(
                4,
                &[&previous_task1, &previous_task2],
                &sharded_source,
            );
            assert_eq!(tasks.len(), 2);
            assert_eq!(tasks[0].index_uid(), &source_uid.index_uid);
            assert_eq!(tasks[0].shard_ids, [ShardId::from(1), ShardId::from(4)]);
            assert_eq!(tasks[1].index_uid(), &source_uid.index_uid);
            assert_eq!(tasks[1].shard_ids, [ShardId::from(6)]);
        }
        {
            // smaller shards force a merge into a single pipeline
            let sharded_source = SourceToSchedule {
                source_uid: source_uid.clone(),
                source_type: SourceToScheduleType::Sharded {
                    shard_ids: vec![
                        ShardId::from(1),
                        ShardId::from(2),
                        ShardId::from(4),
                        ShardId::from(6),
                    ],
                    load_per_shard: NonZeroU32::new(250).unwrap(),
                },
                params_fingerprint: 0,
            };
            let tasks = convert_scheduling_solution_to_physical_plan_single_node_single_source(
                4,
                &[&previous_task1, &previous_task2],
                &sharded_source,
            );
            assert_eq!(tasks.len(), 1);
            assert_eq!(tasks[0].index_uid(), &source_uid.index_uid);
            assert_eq!(tasks[0].shard_ids, [ShardId::from(1), ShardId::from(4)]);
        }
    }

    #[test]
    fn test_convert_scheduling_solution_to_physical_plan_single_node_single_source_non_sharded() {
        let source_uid = SourceUid {
            index_uid: IndexUid::new_with_random_ulid("testindex"),
            source_id: "testsource".to_string(),
        };
        let pipeline_uid1 = PipelineUid::random();
        let previous_task1 = IndexingTask {
            index_uid: Some(source_uid.index_uid.clone()),
            source_id: source_uid.source_id.to_string(),
            pipeline_uid: Some(pipeline_uid1),
            shard_ids: Vec::new(),
            params_fingerprint: 0,
        };
        let pipeline_uid2 = PipelineUid::random();
        let previous_task2 = IndexingTask {
            index_uid: Some(source_uid.index_uid.clone()),
            source_id: source_uid.source_id.to_string(),
            pipeline_uid: Some(pipeline_uid2),
            shard_ids: Vec::new(),
            params_fingerprint: 0,
        };
        {
            let sharded_source = SourceToSchedule {
                source_uid: source_uid.clone(),
                source_type: SourceToScheduleType::NonSharded {
                    num_pipelines: 1,
                    load_per_pipeline: NonZeroU32::new(4000).unwrap(),
                },
                params_fingerprint: 0,
            };
            let tasks = convert_scheduling_solution_to_physical_plan_single_node_single_source(
                1,
                &[&previous_task1, &previous_task2],
                &sharded_source,
            );
            assert_eq!(tasks.len(), 1);
            assert_eq!(tasks[0].index_uid(), &source_uid.index_uid);
            assert!(tasks[0].shard_ids.is_empty());
            assert_eq!(tasks[0].pipeline_uid.as_ref().unwrap(), &pipeline_uid1);
        }
        {
            let sharded_source = SourceToSchedule {
                source_uid: source_uid.clone(),
                source_type: SourceToScheduleType::NonSharded {
                    num_pipelines: 0,
                    load_per_pipeline: NonZeroU32::new(1_000).unwrap(),
                },
                params_fingerprint: 0,
            };
            let tasks = convert_scheduling_solution_to_physical_plan_single_node_single_source(
                0,
                &[&previous_task1, &previous_task2],
                &sharded_source,
            );
            assert_eq!(tasks.len(), 0);
        }
        {
            let sharded_source = SourceToSchedule {
                source_uid: source_uid.clone(),
                source_type: SourceToScheduleType::NonSharded {
                    num_pipelines: 2,
                    load_per_pipeline: NonZeroU32::new(1_000).unwrap(),
                },
                params_fingerprint: 0,
            };
            let tasks = convert_scheduling_solution_to_physical_plan_single_node_single_source(
                2,
                &[&previous_task1, &previous_task2],
                &sharded_source,
            );
            assert_eq!(tasks.len(), 2);
            assert_eq!(tasks[0].index_uid(), &source_uid.index_uid);
            assert!(tasks[0].shard_ids.is_empty());
            assert_eq!(tasks[0].pipeline_uid.as_ref().unwrap(), &pipeline_uid1);
            assert_eq!(tasks[1].index_uid(), &source_uid.index_uid);
            assert!(tasks[1].shard_ids.is_empty());
            assert_eq!(tasks[1].pipeline_uid.as_ref().unwrap(), &pipeline_uid2);
        }
        {
            let sharded_source = SourceToSchedule {
                source_uid: source_uid.clone(),
                source_type: SourceToScheduleType::NonSharded {
                    num_pipelines: 2,
                    load_per_pipeline: NonZeroU32::new(1_000).unwrap(),
                },
                params_fingerprint: 0,
            };
            let tasks = convert_scheduling_solution_to_physical_plan_single_node_single_source(
                2,
                &[&previous_task1],
                &sharded_source,
            );
            assert_eq!(tasks.len(), 2);
            assert_eq!(tasks[0].index_uid(), &source_uid.index_uid);
            assert!(tasks[0].shard_ids.is_empty());
            assert_eq!(tasks[0].pipeline_uid.as_ref().unwrap(), &pipeline_uid1);
            assert_eq!(tasks[1].index_uid(), &source_uid.index_uid);
            assert!(tasks[1].shard_ids.is_empty());
            assert_ne!(tasks[1].pipeline_uid.as_ref().unwrap(), &pipeline_uid1);
        }
    }
}


================================================
FILE: quickwit/quickwit-control-plane/src/indexing_scheduler/scheduling/scheduling_logic.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::cmp::Reverse;
use std::collections::BTreeMap;
use std::collections::btree_map::Entry;

use itertools::Itertools;
use quickwit_proto::indexing::CpuCapacity;

use super::scheduling_logic_model::*;
use crate::indexing_scheduler::scheduling::inflate_node_capacities_if_necessary;

// ------------------------------------------------------------------------------------
// High level algorithm

fn check_contract_conditions(problem: &SchedulingProblem, solution: &SchedulingSolution) {
    assert_eq!(problem.num_indexers(), solution.num_indexers());
    for (node_id, indexer_assignment) in solution.indexer_assignments.iter().enumerate() {
        assert_eq!(indexer_assignment.indexer_ord, node_id);
    }
    for (source_ord, source) in problem.sources().enumerate() {
        assert_eq!(source_ord as SourceOrd, source.source_ord);
    }
}

pub fn solve(
    mut problem: SchedulingProblem,
    previous_solution: SchedulingSolution,
) -> SchedulingSolution {
    // We first inflate the indexer capacities to make sure they globally
    // have at least 120% of the total problem load. This is done proportionally
    // to their original capacity.
    inflate_node_capacities_if_necessary(&mut problem);
    // As a heuristic, to offer stability, we work iteratively
    // from the previous solution.
    let mut solution = previous_solution;
    // We first run a few asserts to ensure that the problem is correct.
    check_contract_conditions(&problem, &solution);
    // Due to scale down, or entire removal of sources some shards we might have
    // too many shards in the current solution.
    // Let's first shave off the extraneous shards.
    remove_extraneous_shards(&problem, &mut solution);
    // Because the load associated to shards can change, some indexers
    // may have too much work assigned to them.
    // Again, we shave off some shards to make sure they are
    // within their capacity.
    enforce_indexers_cpu_capacity(&problem, &mut solution);
    // The solution now meets the constraint, but it does not necessarily
    // contains all of the shards that we need to assign.
    //
    // We first assign sources to indexers that have some affinity with them
    // (provided they have the capacity.)
    place_unassigned_shards_with_affinity(&problem, &mut solution);
    // Finally we assign the remaining shards, regardess of whether they have affinity
    // or not.
    place_unassigned_shards_ignoring_affinity(problem, &solution)
}

// -------------------------------------------------------------------------
// Phase 1
// Remove shards in solution that are not needed anymore

fn remove_extraneous_shards(problem: &SchedulingProblem, solution: &mut SchedulingSolution) {
    let mut num_shards_per_source: Vec<u32> = vec![0; problem.num_sources()];
    for indexer_assignment in &solution.indexer_assignments {
        if let Some((&source_ord, _)) = indexer_assignment.num_shards_per_source.last_key_value() {
            assert!(source_ord < problem.num_sources() as SourceOrd);
        }
        for (&source, &source_num_shards) in &indexer_assignment.num_shards_per_source {
            num_shards_per_source[source as usize] += source_num_shards;
        }
    }
    let num_shards_per_source_to_remove: Vec<(SourceOrd, u32)> = num_shards_per_source
        .into_iter()
        .zip(problem.sources())
        .flat_map(|(num_shards, source)| {
            let target_num_shards = source.num_shards;
            if target_num_shards < num_shards {
                Some((source.source_ord, num_shards - target_num_shards))
            } else {
                None
            }
        })
        .collect();

    let mut nodes_with_source: BTreeMap<SourceOrd, Vec<IndexerOrd>> = BTreeMap::default();
    for (node_id, indexer_assignment) in solution.indexer_assignments.iter().enumerate() {
        for (&source, &num_shards) in &indexer_assignment.num_shards_per_source {
            if num_shards > 0 {
                nodes_with_source.entry(source).or_default().push(node_id);
            }
        }
    }

    let mut indexer_available_capacity: Vec<i32> = solution
        .indexer_assignments
        .iter()
        .map(|indexer_assignment| indexer_assignment.indexer_available_capacity(problem))
        .collect();

    for (source_ord, mut num_shards_to_remove) in num_shards_per_source_to_remove {
        let nodes_with_source = nodes_with_source
            .get_mut(&source_ord)
            // Unwrap is safe here. By construction if we need to decrease the number of shard of a
            // given source, at least one node has it.
            .unwrap();
        nodes_with_source.sort_by_key(|&node_id| indexer_available_capacity[node_id]);
        for node_id in nodes_with_source.iter().copied() {
            let indexer_assignment = &mut solution.indexer_assignments[node_id];
            let previous_num_shards = indexer_assignment.num_shards(source_ord);
            assert!(previous_num_shards > 0);
            assert!(num_shards_to_remove > 0);
            let num_shards_removed = previous_num_shards.min(num_shards_to_remove);
            indexer_assignment.remove_shards(source_ord, num_shards_removed);
            num_shards_to_remove -= num_shards_removed;
            // We update the node capacity since its load has changed.
            indexer_available_capacity[node_id] =
                indexer_assignment.indexer_available_capacity(problem);
            if num_shards_to_remove == 0 {
                // No more work to do for this source.
                break;
            }
        }
    }
    assert_remove_extraneous_shards_post_condition(problem, solution);
}

fn assert_remove_extraneous_shards_post_condition(
    problem: &SchedulingProblem,
    solution: &SchedulingSolution,
) {
    let mut num_shards_per_source: Vec<u32> = vec![0; problem.num_sources()];
    for indexer_assignment in &solution.indexer_assignments {
        for (&source, &load) in &indexer_assignment.num_shards_per_source {
            num_shards_per_source[source as usize] += load;
        }
    }
    for source in problem.sources() {
        assert!(num_shards_per_source[source.source_ord as usize] <= source.num_shards);
    }
}

// -------------------------------------------------------------------------
// Phase 2
// Relieve sources from the node that are exceeding their maximum load.

fn enforce_indexers_cpu_capacity(problem: &SchedulingProblem, solution: &mut SchedulingSolution) {
    for indexer_assignment in &mut solution.indexer_assignments {
        let indexer_cpu_capacity: CpuCapacity =
            problem.indexer_cpu_capacity(indexer_assignment.indexer_ord);
        enforce_indexer_cpu_capacity(problem, indexer_cpu_capacity, indexer_assignment);
    }
}

fn enforce_indexer_cpu_capacity(
    problem: &SchedulingProblem,
    indexer_cpu_capacity: CpuCapacity,
    indexer_assignment: &mut IndexerAssignment,
) {
    let total_load = indexer_assignment.total_cpu_load(problem);
    if total_load <= indexer_cpu_capacity.cpu_millis() {
        return;
    }
    let mut load_to_remove: CpuCapacity =
        CpuCapacity::from_cpu_millis(total_load) - indexer_cpu_capacity;
    let mut source_cpu_capacities: Vec<(CpuCapacity, SourceOrd)> = indexer_assignment
        .num_shards_per_source
        .iter()
        .map(|(&source_ord, num_shards)| {
            let load_for_source = problem.source_load_per_shard(source_ord).get() * num_shards;
            (CpuCapacity::from_cpu_millis(load_for_source), source_ord)
        })
        .collect();
    source_cpu_capacities.sort();
    for (source_cpu_capacity, source_ord) in source_cpu_capacities {
        indexer_assignment.num_shards_per_source.remove(&source_ord);
        load_to_remove = if load_to_remove <= source_cpu_capacity {
            break;
        } else {
            load_to_remove - source_cpu_capacity
        };
    }
    assert_enforce_nodes_cpu_capacity_post_condition(problem, indexer_assignment);
}

fn assert_enforce_nodes_cpu_capacity_post_condition(
    problem: &SchedulingProblem,
    indexer_assignment: &IndexerAssignment,
) {
    let total_load = indexer_assignment.total_cpu_load(problem);
    assert!(
        total_load
            <= problem
                .indexer_cpu_capacity(indexer_assignment.indexer_ord)
                .cpu_millis()
    );
}

// ----------------------------------------------------
// Phase 3
// Place unassigned sources.
//
// We use a greedy algorithm as a simple heuristic here.
//
// We go through the sources in decreasing order of their load,
// in two passes.
//
// In the first pass, we have a look at
// the nodes with which there is an affinity.
//
// If one of them has room for all of the shards, then we assign all
// of the shards to it.
//
// In the second pass, we just put as many shards as possible on the node
// with the highest available capacity.
//
// If this algorithm fails to place all remaining shards, we inflate
// the node capacities by 20% in the scheduling problem and start from the beginning.

fn attempt_place_unassigned_shards(
    unassigned_shards: &[Source],
    problem: &SchedulingProblem,
    partial_solution: &SchedulingSolution,
) -> Result<SchedulingSolution, NotEnoughCapacity> {
    let mut solution = partial_solution.clone();
    for source in unassigned_shards {
        let indexers_with_most_available_capacity =
            compute_indexer_available_capacity(problem, &solution)
                .sorted_by_key(|(indexer_ord, capacity)| Reverse((*capacity, *indexer_ord)));
        place_unassigned_shards_single_source(
            source,
            indexers_with_most_available_capacity,
            &mut solution,
        )?;
    }
    assert_place_unassigned_shards_post_condition(problem, &solution);
    Ok(solution)
}

fn place_unassigned_shards_with_affinity(
    problem: &SchedulingProblem,
    solution: &mut SchedulingSolution,
) {
    let mut unassigned_shards: Vec<Source> = compute_unassigned_sources(problem, solution);
    unassigned_shards.sort_by_key(|source| {
        let load = source.num_shards * source.load_per_shard.get();
        Reverse(load)
    });
    for source in &unassigned_shards {
        // List of indexer with a non-null affinity and some available capacity, sorted by
        // (affinity, available capacity) in that order.
        let indexers_with_affinity_and_available_capacity = source
            .affinities
            .iter()
            .filter(|&(_, &affinity)| affinity != 0u32)
            .map(|(&indexer_ord, affinity)| {
                let available_capacity =
                    solution.indexer_assignments[indexer_ord].indexer_available_capacity(problem);
                let capacity = CpuCapacity::from_cpu_millis(available_capacity as u32);
                (indexer_ord, affinity, capacity)
            })
            .sorted_by_key(|(indexer_ord, affinity, capacity)| {
                Reverse((*affinity, *capacity, *indexer_ord))
            })
            .map(|(indexer_ord, _, capacity)| (indexer_ord, capacity));
        let _ = place_unassigned_shards_single_source(
            source,
            indexers_with_affinity_and_available_capacity,
            solution,
        );
    }
}

#[must_use]
fn place_unassigned_shards_ignoring_affinity(
    mut problem: SchedulingProblem,
    partial_solution: &SchedulingSolution,
) -> SchedulingSolution {
    let mut unassigned_shards: Vec<Source> = compute_unassigned_sources(&problem, partial_solution);
    unassigned_shards.sort_by_key(|source| {
        let load = source.num_shards * source.load_per_shard.get();
        Reverse(load)
    });

    // Thanks to the call to `inflate_node_capacities_if_necessary`, we are
    // certain that even on our first attempt, the total capacity of the indexer
    // exceeds 120% of the partial solution. If a large shard needs to be placed
    // in an already well balanced solution, it may not fit on any node. In that
    // case, we iteratively grow the virtual capacity until it can be placed.
    //
    // 1.2^30 is about 240. If we reach 30 attempts we are certain to have a
    // logical bug.
    for attempt_number in 0..30 {
        match attempt_place_unassigned_shards(&unassigned_shards[..], &problem, partial_solution) {
            Ok(mut solution) => {
                // the higher the attempt number, the more unbalanced the solution
                if attempt_number > 0 {
                    tracing::warn!(
                        attempt_number = attempt_number,
                        "capacity re-scaled, scheduling solution likely unbalanced"
                    );
                }
                solution.capacity_scaling_iterations = attempt_number;
                return solution;
            }
            Err(NotEnoughCapacity) => {
                problem.scale_node_capacities(1.2f32);
            }
        }
    }
    unreachable!("Failed to assign all of the sources");
}

fn assert_place_unassigned_shards_post_condition(
    problem: &SchedulingProblem,
    solution: &SchedulingSolution,
) {
    // We make sure we all shard are as placed.
    for source in problem.sources() {
        let num_assigned_shards: u32 = solution
            .indexer_assignments
            .iter()
            .map(|indexer_assignment| indexer_assignment.num_shards(source.source_ord))
            .sum();
        assert_eq!(num_assigned_shards, source.num_shards);
    }
    // We make sure that the node capacity is respected.
    for indexer_assignment in &solution.indexer_assignments {
        // We call this function just to check that the indexer assignment does not exceed this
        // capacity. (it includes an assert that panics if it happens).
        assert_enforce_nodes_cpu_capacity_post_condition(problem, indexer_assignment);
    }
}

struct NotEnoughCapacity;

/// Return Err(NotEnoughCapacity) iff the algorithm was unable to pack all of the sources
/// amongst the node with their given node capacity.
fn place_unassigned_shards_single_source(
    source: &Source,
    mut indexer_with_capacities: impl Iterator<Item = (IndexerOrd, CpuCapacity)>,
    solution: &mut SchedulingSolution,
) -> Result<(), NotEnoughCapacity> {
    let mut num_shards = source.num_shards;
    while num_shards > 0 {
        let Some((indexer_ord, available_capacity)) = indexer_with_capacities.next() else {
            return Err(NotEnoughCapacity);
        };
        let num_placable_shards = available_capacity.cpu_millis() / source.load_per_shard;
        let num_shards_to_place = num_placable_shards.min(num_shards);
        // Update the solution, the shard load, and the number of shards to place.
        solution.indexer_assignments[indexer_ord]
            .add_shards(source.source_ord, num_shards_to_place);
        num_shards -= num_shards_to_place;
    }
    Ok(())
}

/// Compute the sources/shards that have not been assigned to any indexer yet.
/// Affinity are also updated, with the limitation described in `Source`.
fn compute_unassigned_sources(
    problem: &SchedulingProblem,
    solution: &SchedulingSolution,
) -> Vec<Source> {
    let mut unassigned_sources: BTreeMap<SourceOrd, Source> = problem
        .sources()
        .map(|source| (source.source_ord as SourceOrd, source))
        .collect();
    for (indexer_ord, indexer_assignment) in solution.indexer_assignments.iter().enumerate() {
        for (&source_ord, &num_shards) in &indexer_assignment.num_shards_per_source {
            if num_shards == 0 {
                continue;
            }
            let Entry::Occupied(mut entry) = unassigned_sources.entry(source_ord) else {
                panic!("The solution contains more shards than the actual problem.");
            };
            if !entry.get_mut().remove_shards(indexer_ord, num_shards) {
                entry.remove();
            }
        }
    }
    unassigned_sources.into_values().collect()
}

/// Builds a BinaryHeap with the different indexer capacities.
///
/// Panics if one of the indexer is over-assigned.
fn compute_indexer_available_capacity<'a>(
    problem: &'a SchedulingProblem,
    solution: &'a SchedulingSolution,
) -> impl Iterator<Item = (IndexerOrd, CpuCapacity)> + 'a {
    solution
        .indexer_assignments
        .iter()
        .map(|indexer_assignment| {
            let available_capacity: i32 = indexer_assignment.indexer_available_capacity(problem);
            assert!(available_capacity >= 0i32);
            (
                indexer_assignment.indexer_ord,
                CpuCapacity::from_cpu_millis(available_capacity as u32),
            )
        })
}

#[cfg(test)]
mod tests {
    use std::num::NonZeroU32;

    use proptest::prelude::*;
    use quickwit_proto::indexing::mcpu;

    use super::*;

    #[test]
    fn test_remove_extraneous_shards() {
        let mut problem =
            SchedulingProblem::with_indexer_cpu_capacities(vec![mcpu(4_000), mcpu(5_000)]);
        problem.add_source(1, NonZeroU32::new(1_000u32).unwrap());
        let mut solution = problem.new_solution();
        solution.indexer_assignments[0].add_shards(0, 3);
        solution.indexer_assignments[1].add_shards(0, 3);
        remove_extraneous_shards(&problem, &mut solution);
        assert_eq!(solution.indexer_assignments[0].num_shards(0), 0);
        assert_eq!(solution.indexer_assignments[1].num_shards(0), 1);
    }

    #[test]
    fn test_remove_extraneous_shards_2() {
        let mut problem =
            SchedulingProblem::with_indexer_cpu_capacities(vec![mcpu(5_000), mcpu(4_000)]);
        problem.add_source(2, NonZeroU32::new(1_000).unwrap());
        let mut solution = problem.new_solution();
        solution.indexer_assignments[0].add_shards(0, 3);
        solution.indexer_assignments[1].add_shards(0, 3);
        remove_extraneous_shards(&problem, &mut solution);
        assert_eq!(solution.indexer_assignments[0].num_shards(0), 2);
        assert_eq!(solution.indexer_assignments[1].num_shards(0), 0);
    }

    #[test]
    fn test_remove_missing_sources() {
        let mut problem =
            SchedulingProblem::with_indexer_cpu_capacities(vec![mcpu(5_000), mcpu(4_000)]);
        // Source 0
        problem.add_source(0, NonZeroU32::new(1_000).unwrap());
        // Source 1
        problem.add_source(2, NonZeroU32::new(1_000).unwrap());
        let mut solution = problem.new_solution();
        solution.indexer_assignments[0].add_shards(0, 1);
        solution.indexer_assignments[0].add_shards(1, 1);
        solution.indexer_assignments[1].add_shards(1, 2);
        remove_extraneous_shards(&problem, &mut solution);
        assert_eq!(solution.indexer_assignments[0].num_shards(0), 0);
        assert_eq!(solution.indexer_assignments[0].num_shards(1), 1);
        assert_eq!(solution.indexer_assignments[1].num_shards(0), 0);
        assert_eq!(solution.indexer_assignments[1].num_shards(1), 1);
    }

    #[test]
    fn test_enforce_nodes_cpu_capacity() {
        let mut problem = SchedulingProblem::with_indexer_cpu_capacities(vec![
            mcpu(5_000),
            mcpu(5_000),
            mcpu(5_000),
            mcpu(5_000),
            mcpu(7_000),
        ]);
        // Source 0
        problem.add_source(10, NonZeroU32::new(3_000).unwrap());
        problem.add_source(10, NonZeroU32::new(2_000).unwrap());
        problem.add_source(10, NonZeroU32::new(1_001).unwrap());
        let mut solution = problem.new_solution();

        // node 0 does not exceed its capacity
        solution.indexer_assignments[0].add_shards(0, 1);

        // node 1 exceed its capacity with a single source
        solution.indexer_assignments[1].add_shards(0, 2);

        // node 2 is precisely at capacity
        solution.indexer_assignments[2].add_shards(0, 1);
        solution.indexer_assignments[2].add_shards(1, 1);

        // node 3 is exceeding its capacity due with several sources
        // We choose to remove sources entirely (as opposed to removing only shards that do not fit)
        solution.indexer_assignments[3].add_shards(0, 1);
        solution.indexer_assignments[3].add_shards(2, 2);

        // node 3 is exceeding its capacity due with several sources
        // We choose to remove sources entirely (as opposed to removing only shards that do not fit)
        solution.indexer_assignments[4].add_shards(0, 1);
        solution.indexer_assignments[4].add_shards(1, 1);
        solution.indexer_assignments[4].add_shards(2, 2);

        enforce_indexers_cpu_capacity(&problem, &mut solution);

        assert_eq!(solution.indexer_assignments[0].num_shards(0), 1);
        assert_eq!(solution.indexer_assignments[0].num_shards(1), 0);
        assert_eq!(solution.indexer_assignments[0].num_shards(2), 0);

        // We remove sources entirely!
        assert_eq!(solution.indexer_assignments[1].num_shards(0), 0);
        assert_eq!(solution.indexer_assignments[1].num_shards(1), 0);
        assert_eq!(solution.indexer_assignments[1].num_shards(2), 0);

        assert_eq!(solution.indexer_assignments[2].num_shards(0), 1);
        assert_eq!(solution.indexer_assignments[2].num_shards(1), 1);
        assert_eq!(solution.indexer_assignments[2].num_shards(2), 0);

        assert_eq!(solution.indexer_assignments[3].num_shards(0), 1);
        assert_eq!(solution.indexer_assignments[3].num_shards(1), 0);
        assert_eq!(solution.indexer_assignments[3].num_shards(2), 0);

        assert_eq!(solution.indexer_assignments[4].num_shards(0), 1);
        assert_eq!(solution.indexer_assignments[4].num_shards(1), 0);
        assert_eq!(solution.indexer_assignments[4].num_shards(2), 2);
    }

    #[test]
    fn test_compute_unassigned_shards_simple() {
        let mut problem = SchedulingProblem::with_indexer_cpu_capacities(vec![mcpu(4_000)]);
        problem.add_source(4, NonZeroU32::new(1000).unwrap());
        problem.add_source(4, NonZeroU32::new(1_000).unwrap());
        let solution = problem.new_solution();
        let unassigned_shards = compute_unassigned_sources(&problem, &solution);
        assert_eq!(
            unassigned_shards[0],
            Source {
                source_ord: 0,
                load_per_shard: NonZeroU32::new(1_000).unwrap(),
                num_shards: 4,
                affinities: BTreeMap::default(),
            }
        );
    }

    #[test]
    fn test_compute_unassigned_shards_with_non_trivial_solution() {
        let mut problem =
            SchedulingProblem::with_indexer_cpu_capacities(vec![mcpu(50_000), mcpu(40_000)]);
        problem.add_source(5, NonZeroU32::new(1_000).unwrap());
        problem.add_source(15, NonZeroU32::new(2_000).unwrap());
        let mut solution = problem.new_solution();

        solution.indexer_assignments[0].add_shards(0, 1);
        solution.indexer_assignments[0].add_shards(1, 3);
        solution.indexer_assignments[1].add_shards(0, 2);
        solution.indexer_assignments[1].add_shards(1, 3);
        let unassigned_shards = compute_unassigned_sources(&problem, &solution);
        assert_eq!(
            unassigned_shards[0],
            Source {
                source_ord: 0,
                load_per_shard: NonZeroU32::new(1_000).unwrap(),
                num_shards: 5 - (1 + 2),
                affinities: Default::default(),
            }
        );
        assert_eq!(
            unassigned_shards[1],
            Source {
                source_ord: 1,
                load_per_shard: NonZeroU32::new(2_000).unwrap(),
                num_shards: 15 - (3 + 3),
                affinities: Default::default(),
            }
        );
    }

    #[test]
    fn test_place_unassigned_shards_simple() {
        let mut problem = SchedulingProblem::with_indexer_cpu_capacities(vec![mcpu(4_000)]);
        problem.add_source(4, NonZeroU32::new(1_000).unwrap());
        let partial_solution = problem.new_solution();
        let solution = place_unassigned_shards_ignoring_affinity(problem, &partial_solution);
        assert_eq!(solution.indexer_assignments[0].num_shards(0), 4);
    }

    #[test]
    fn test_place_unassigned_shards_with_affinity() {
        let mut problem =
            SchedulingProblem::with_indexer_cpu_capacities(vec![mcpu(4_000), mcpu(4000)]);
        problem.add_source(4, NonZeroU32::new(1_000).unwrap());
        problem.add_source(4, NonZeroU32::new(1_000).unwrap());
        problem.inc_affinity(0, 1);
        problem.inc_affinity(1, 0);
        let mut solution = problem.new_solution();
        place_unassigned_shards_with_affinity(&problem, &mut solution);
        assert_eq!(solution.indexer_assignments[0].num_shards(1), 4);
        assert_eq!(solution.indexer_assignments[1].num_shards(0), 4);
    }

    #[test]
    fn test_place_unassigned_shards_reach_capacity() {
        let mut problem =
            SchedulingProblem::with_indexer_cpu_capacities(vec![mcpu(50_000), mcpu(40_000)]);
        problem.add_source(5, NonZeroU32::new(1_000).unwrap());
        problem.add_source(15, NonZeroU32::new(2_000).unwrap());
        let mut solution = problem.new_solution();
        solution.indexer_assignments[0].add_shards(0, 1);
        solution.indexer_assignments[0].add_shards(1, 3);
        solution.indexer_assignments[1].add_shards(0, 2);
        solution.indexer_assignments[1].add_shards(1, 3);
        let unassigned_shards = compute_unassigned_sources(&problem, &solution);
        assert_eq!(solution.indexer_assignments[0].num_shards(0), 1);
        assert_eq!(solution.indexer_assignments[0].num_shards(1), 3);
        assert_eq!(solution.indexer_assignments[1].num_shards(0), 2);
        assert_eq!(solution.indexer_assignments[1].num_shards(1), 3);
        assert_eq!(
            unassigned_shards[0],
            Source {
                source_ord: 0,
                load_per_shard: NonZeroU32::new(1_000).unwrap(),
                num_shards: 5 - (1 + 2),
                affinities: Default::default(),
            }
        );
        assert_eq!(
            unassigned_shards[1],
            Source {
                source_ord: 1,
                load_per_shard: NonZeroU32::new(2_000).unwrap(),
                num_shards: 15 - (3 + 3),
                affinities: Default::default(),
            }
        );
    }

    #[test]
    fn test_solve() {
        let mut problem = SchedulingProblem::with_indexer_cpu_capacities(vec![mcpu(800)]);
        problem.add_source(43, NonZeroU32::new(1).unwrap());
        problem.add_source(379, NonZeroU32::new(1).unwrap());
        let previous_solution = problem.new_solution();
        solve(problem, previous_solution);
    }

    fn indexer_cpu_capacity_strat() -> impl Strategy<Value = CpuCapacity> {
        prop_oneof![
            1u32..10_000u32,
            Just(1u32),
            800u32..1200u32,
            1900u32..2100u32,
        ]
        .prop_map(CpuCapacity::from_cpu_millis)
    }

    fn num_shards() -> impl Strategy<Value = u32> {
        0u32..3u32
    }

    fn source_strat() -> impl Strategy<Value = (u32, NonZeroU32)> {
        let load_strat = prop_oneof![
            Just(1u32),
            Just(2u32),
            Just(10u32),
            Just(100u32),
            Just(250u32),
            1u32..1_000u32
        ];
        (
            num_shards(),
            load_strat.prop_map(|load| NonZeroU32::new(load).unwrap()),
        )
    }

    fn problem_strategy(
        num_nodes: usize,
        num_sources: usize,
    ) -> impl Strategy<Value = SchedulingProblem> {
        let indexer_cpu_capacity_strat =
            proptest::collection::vec(indexer_cpu_capacity_strat(), num_nodes);
        let sources_strat = proptest::collection::vec(source_strat(), num_sources);
        (indexer_cpu_capacity_strat, sources_strat).prop_map(|(node_cpu_capacities, sources)| {
            let mut problem = SchedulingProblem::with_indexer_cpu_capacities(node_cpu_capacities);
            for (num_shards, load_per_shard) in sources {
                problem.add_source(num_shards, load_per_shard);
            }
            problem
        })
    }

    fn num_nodes_strat() -> impl Strategy<Value = usize> {
        prop_oneof![
            3 => 1usize..3,
            1 => 4usize..10,
        ]
    }
    fn num_sources_strat() -> impl Strategy<Value = usize> {
        prop_oneof![
            3 => 0usize..3,
            1 => 4usize..10,
        ]
    }

    fn indexer_assignments_strategy(num_sources: usize) -> impl Strategy<Value = Vec<u32>> {
        proptest::collection::vec(0u32..3u32, num_sources)
    }

    fn initial_solution_strategy(
        num_nodes: usize,
        num_sources: usize,
    ) -> impl Strategy<Value = SchedulingSolution> {
        proptest::collection::vec(indexer_assignments_strategy(num_sources), num_nodes).prop_map(
            move |indexer_assignments: Vec<Vec<u32>>| {
                let mut solution = SchedulingSolution::with_num_indexers(num_nodes);
                for (node_id, indexer_assignment) in indexer_assignments.iter().enumerate() {
                    for (source_ord, num_shards) in indexer_assignment.iter().copied().enumerate() {
                        solution.indexer_assignments[node_id]
                            .add_shards(source_ord as u32, num_shards);
                    }
                }
                solution
            },
        )
    }

    fn problem_solution_strategy() -> impl Strategy<Value = (SchedulingProblem, SchedulingSolution)>
    {
        (num_nodes_strat(), num_sources_strat()).prop_flat_map(move |(num_nodes, num_sources)| {
            (
                problem_strategy(num_nodes, num_sources),
                initial_solution_strategy(num_nodes, num_sources),
            )
        })
    }

    #[test]
    fn test_problem_missing_capacities() {
        let mut problem =
            SchedulingProblem::with_indexer_cpu_capacities(vec![CpuCapacity::from_cpu_millis(100)]);
        problem.add_source(1, NonZeroU32::new(1).unwrap());
        let mut previous_solution = problem.new_solution();
        previous_solution.indexer_assignments[0].add_shards(0, 0);
        let solution = solve(problem, previous_solution);
        assert_eq!(solution.indexer_assignments[0].num_shards(0), 1);
    }

    #[test]
    fn test_problem_unbalanced_simple() {
        let mut problem = SchedulingProblem::with_indexer_cpu_capacities(vec![
            CpuCapacity::from_cpu_millis(1),
            CpuCapacity::from_cpu_millis(1),
        ]);
        problem.add_source(1, NonZeroU32::new(10).unwrap());
        for _ in 0..10 {
            problem.add_source(1, NonZeroU32::new(1).unwrap());
        }
        let previous_solution = problem.new_solution();
        let solution = solve(problem.clone(), previous_solution);
        let available_capacities: Vec<u32> = solution
            .indexer_assignments
            .iter()
            .map(|indexer_assignment: &IndexerAssignment| {
                indexer_assignment.total_cpu_load(&problem)
            })
            .collect();
        assert_eq!(available_capacities.len(), 2);
        let (min, max) = available_capacities
            .into_iter()
            .minmax()
            .into_option()
            .unwrap();
        assert_eq!(min, 10);
        assert_eq!(max, 10);
    }

    proptest! {
        #[test]
        fn test_proptest_post_conditions((problem, solution) in problem_solution_strategy()) {
            let solution_1 = solve(problem.clone(), solution);
            let solution_2 = solve(problem.clone(), solution_1.clone());
            // TODO: This assert actually fails for some scenarii. We say it is fine
            // for now as long as the solution does not change again during the
            // next resolution:
            // let has_solution_changed_once = solution_1.indexer_assignments != solution_2.indexer_assignments;
            // assert!(!has_solution_changed_once, "Solution changed for same problem\nSolution 1:{solution_1:?}\nSolution 2: {solution_2:?}");
            let solution_3 = solve(problem, solution_2.clone());
            let has_solution_changed_again = solution_2.indexer_assignments != solution_3.indexer_assignments;
            assert!(!has_solution_changed_again, "solution unstable!!!\nSolution 1: {solution_1:?}\nSolution 2: {solution_2:?}\nSolution 3: {solution_3:?}");
        }
    }

    #[test]
    fn test_capacity_scaling_iteration_required() {
        // Create a problem where affinity constraints cause suboptimal placement
        // requiring iterative scaling despite initial capacity scaling.
        let mut problem =
            SchedulingProblem::with_indexer_cpu_capacities(vec![mcpu(3000), mcpu(3000)]);
        problem.add_source(1, NonZeroU32::new(2500).unwrap()); // Source 0
        problem.add_source(1, NonZeroU32::new(2500).unwrap()); // Source 1
        problem.add_source(1, NonZeroU32::new(1500).unwrap()); // Source 2
        let previous_solution = problem.new_solution();
        let solution = solve(problem, previous_solution);

        assert_eq!(solution.capacity_scaling_iterations, 1);
    }
}


================================================
FILE: quickwit/quickwit-control-plane/src/indexing_scheduler/scheduling/scheduling_logic_model.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::BTreeMap;
use std::collections::btree_map::Entry;
use std::num::NonZeroU32;

use quickwit_proto::indexing::CpuCapacity;

pub type SourceOrd = u32;
pub type IndexerOrd = usize;

#[derive(Clone, Debug, Eq, PartialEq)]
pub struct Source {
    pub source_ord: SourceOrd,
    pub load_per_shard: NonZeroU32,
    /// Affinities of the source for each indexer.
    /// In the beginning, affinities are initialized to be the count of shards of the source
    /// that are located on the indexer.
    ///
    /// As we compute unassigned sources, we decrease the affinity by the given number of shards,
    /// saturating at 0.
    ///
    /// As a result we only have the invariant
    /// and `affinity(source, indexer) <= num shard of source on indexer`
    pub affinities: BTreeMap<IndexerOrd, u32>,
    pub num_shards: u32,
}

impl Source {
    // Remove a given number of shards, located on the given indexer.
    // Returns `false` if and only if all of the shards have been removed.
    //
    // This function also decrease the affinity of the source for the given indexer
    // by num_shards_to_remove in a saturating way.
    //
    // # Panics
    //
    // If the source does have that many total number of shards to begin with.
    pub fn remove_shards(&mut self, indexer_ord: usize, num_shards_to_remove: u32) -> bool {
        if num_shards_to_remove == 0u32 {
            return self.num_shards > 0u32;
        }
        let entry = self.affinities.entry(indexer_ord);
        self.num_shards = self
            .num_shards
            .checked_sub(num_shards_to_remove)
            .expect("removing more shards than available.");
        if self.num_shards == 0u32 {
            self.affinities.clear();
            return false;
        }
        if let Entry::Occupied(mut affinity_with_indexer_entry) = entry {
            let affinity_with_indexer: &mut u32 = affinity_with_indexer_entry.get_mut();
            let affinity_after_removal = affinity_with_indexer.saturating_sub(num_shards_to_remove);
            if affinity_after_removal == 0u32 {
                affinity_with_indexer_entry.remove();
            } else {
                *affinity_with_indexer = affinity_after_removal;
            }
        }
        true
    }
}

#[derive(Debug, Clone)]
pub struct SchedulingProblem {
    sources: Vec<Source>,
    indexer_cpu_capacities: Vec<CpuCapacity>,
}

impl SchedulingProblem {
    /// Problem constructor.
    ///
    /// Panics if the list of indexers is empty or if one of the
    /// indexer has a null capacity.
    pub fn with_indexer_cpu_capacities(
        indexer_cpu_capacities: Vec<CpuCapacity>,
    ) -> SchedulingProblem {
        assert!(!indexer_cpu_capacities.is_empty());
        assert!(
            indexer_cpu_capacities
                .iter()
                .all(|cpu_capacity| cpu_capacity.cpu_millis() > 0)
        );
        // TODO assert for affinity.
        SchedulingProblem {
            sources: Vec::new(),
            indexer_cpu_capacities,
        }
    }

    pub fn new_solution(&self) -> SchedulingSolution {
        SchedulingSolution::with_num_indexers(self.indexer_cpu_capacities.len())
    }

    pub fn indexer_cpu_capacity(&self, indexer_ord: IndexerOrd) -> CpuCapacity {
        self.indexer_cpu_capacities[indexer_ord]
    }

    /// Scales the cpu capacity by the given scaling factor.
    ///
    /// Resulting cpu capacity are ceiled to the next integer millicpus value.
    pub fn scale_node_capacities(&mut self, scale: f32) {
        for capacity in &mut self.indexer_cpu_capacities {
            let scaled_cpu_millis = (capacity.cpu_millis() as f32 * scale).ceil() as u32;
            *capacity = CpuCapacity::from_cpu_millis(scaled_cpu_millis);
        }
    }

    pub fn total_node_capacities(&self) -> CpuCapacity {
        self.indexer_cpu_capacities
            .iter()
            .copied()
            .fold(CpuCapacity::zero(), |left, right| left + right)
    }

    pub fn total_load(&self) -> u32 {
        self.sources
            .iter()
            .map(|source| source.num_shards * source.load_per_shard.get())
            .sum()
    }

    pub fn sources(&self) -> impl Iterator<Item = Source> + '_ {
        self.sources.iter().cloned()
    }

    pub fn add_source(&mut self, num_shards: u32, load_per_shard: NonZeroU32) -> SourceOrd {
        let source_ord = self.sources.len() as SourceOrd;
        self.sources.push(Source {
            source_ord,
            num_shards,
            load_per_shard,
            affinities: Default::default(),
        });
        source_ord
    }

    /// Increases the affinity source <-> indexer by 1.
    /// This is done to record that the indexer is hosting one shard of the source.
    pub fn inc_affinity(&mut self, source_ord: SourceOrd, indexer_ord: IndexerOrd) {
        let affinity: &mut u32 = self.sources[source_ord as usize]
            .affinities
            .entry(indexer_ord)
            .or_default();
        *affinity += 1;
    }

    pub fn source_load_per_shard(&self, source_ord: SourceOrd) -> NonZeroU32 {
        self.sources[source_ord as usize].load_per_shard
    }

    pub fn num_sources(&self) -> usize {
        self.sources.len()
    }

    pub fn num_indexers(&self) -> usize {
        self.indexer_cpu_capacities.len()
    }
}

#[derive(Clone, Debug, Eq, PartialEq)]
pub struct IndexerAssignment {
    pub indexer_ord: IndexerOrd,
    pub num_shards_per_source: BTreeMap<SourceOrd, u32>,
}

impl IndexerAssignment {
    pub fn new(indexer_ord: IndexerOrd) -> IndexerAssignment {
        IndexerAssignment {
            indexer_ord,
            num_shards_per_source: Default::default(),
        }
    }

    /// Returns the number of available `mcpu` in the indexer.
    /// If the indexer is over-assigned this method returns a negative value.
    pub fn indexer_available_capacity(&self, problem: &SchedulingProblem) -> i32 {
        let total_cpu_load = self.total_cpu_load(problem);
        let indexer_cpu_capacity = problem.indexer_cpu_capacities[self.indexer_ord];
        indexer_cpu_capacity.cpu_millis() as i32 - total_cpu_load as i32
    }

    pub fn total_cpu_load(&self, problem: &SchedulingProblem) -> u32 {
        self.num_shards_per_source
            .iter()
            .map(|(source_ord, num_shards)| {
                problem.source_load_per_shard(*source_ord).get() * num_shards
            })
            .sum()
    }

    pub fn num_shards(&self, source_ord: SourceOrd) -> u32 {
        self.num_shards_per_source
            .get(&source_ord)
            .copied()
            .unwrap_or(0u32)
    }

    /// Add shards to a source (noop of `num_shards` is 0).
    pub fn add_shards(&mut self, source_ord: u32, num_shards: u32) {
        // No need to fill indexer_assignments with empty assignments.
        if num_shards == 0 {
            return;
        }
        *self.num_shards_per_source.entry(source_ord).or_default() += num_shards;
    }

    pub fn remove_shards(&mut self, source_ord: u32, num_shards_removed: u32) {
        let entry = self.num_shards_per_source.entry(source_ord);
        let Entry::Occupied(mut occupied_entry) = entry else {
            assert_eq!(num_shards_removed, 0);
            return;
        };
        let previous_shard_count = *occupied_entry.get();
        assert!(previous_shard_count >= num_shards_removed);
        if previous_shard_count > num_shards_removed {
            *occupied_entry.get_mut() -= num_shards_removed
        } else {
            occupied_entry.remove();
        }
    }
}

#[derive(Clone, Debug)]
pub struct SchedulingSolution {
    pub indexer_assignments: Vec<IndexerAssignment>,
    // used for tests
    pub capacity_scaling_iterations: usize,
}

impl SchedulingSolution {
    pub fn with_num_indexers(num_indexers: usize) -> SchedulingSolution {
        SchedulingSolution {
            indexer_assignments: (0..num_indexers).map(IndexerAssignment::new).collect(),
            capacity_scaling_iterations: 0,
        }
    }
    pub fn num_indexers(&self) -> usize {
        self.indexer_assignments.len()
    }
}

#[cfg(test)]
mod tests {
    use super::*;

    fn test_source() -> Source {
        let mut affinities: BTreeMap<usize, u32> = Default::default();
        affinities.insert(7, 3u32);
        affinities.insert(11, 2u32);
        Source {
            source_ord: 0u32,
            load_per_shard: NonZeroU32::new(1000u32).unwrap(),
            affinities,
            num_shards: 2 + 3,
        }
    }

    #[test]
    fn test_source_remove_simple() {
        let mut source = test_source();
        assert!(source.remove_shards(7, 2));
        assert_eq!(source.num_shards, 5 - 2);
        assert_eq!(source.affinities.get(&7).copied(), Some(1));
        assert_eq!(source.affinities.get(&11).copied(), Some(2));
    }

    #[test]
    fn test_source_remove_all_affinity() {
        let mut source = test_source();
        assert!(source.remove_shards(7, 3));
        assert_eq!(source.num_shards, 5 - 3);
        assert!(!source.affinities.contains_key(&7));
        assert_eq!(source.affinities.get(&11).copied(), Some(2));
    }

    #[test]
    fn test_source_remove_more_than_affinity() {
        let mut source = test_source();
        assert!(source.remove_shards(7, 4));
        assert_eq!(source.num_shards, 5 - 4);
        assert!(!source.affinities.contains_key(&7));
        assert_eq!(source.affinities.get(&11).copied(), Some(2));
    }

    #[test]
    fn test_source_remove_all_shards() {
        let mut source = test_source();
        assert!(!source.remove_shards(7, 5));
        assert_eq!(source.num_shards, 0);
        assert!(source.affinities.is_empty());
    }

    #[test]
    #[should_panic]
    fn test_source_remove_more_than_all_shards() {
        let mut source = test_source();
        assert!(source.remove_shards(7, 6));
    }
}


================================================
FILE: quickwit/quickwit-control-plane/src/ingest/ingest_controller.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::btree_map::Entry;
use std::collections::{BTreeMap, BTreeSet, HashMap, HashSet};
use std::fmt;
use std::future::Future;
use std::num::NonZeroUsize;
use std::sync::Arc;
use std::time::Duration;

use fnv::FnvHashSet;
use futures::StreamExt;
use futures::stream::FuturesUnordered;
use itertools::{Itertools as _, MinMaxResult};
use quickwit_actors::Mailbox;
use quickwit_common::Progress;
use quickwit_common::pretty::PrettySample;
use quickwit_ingest::{IngesterPool, LeaderId, LocalShardsUpdate};
use quickwit_proto::control_plane::{
    AdviseResetShardsRequest, AdviseResetShardsResponse, GetOrCreateOpenShardsFailureReason,
    GetOrCreateOpenShardsRequest, GetOrCreateOpenShardsResponse, GetOrCreateOpenShardsSubrequest,
    GetOrCreateOpenShardsSuccess,
};
use quickwit_proto::ingest::ingester::{
    CloseShardsRequest, CloseShardsResponse, IngesterService, IngesterStatus, InitShardFailure,
    InitShardSubrequest, InitShardsRequest, InitShardsResponse, RetainShardsForSource,
    RetainShardsRequest,
};
use quickwit_proto::ingest::{
    Shard, ShardIdPosition, ShardIdPositions, ShardIds, ShardPKey, ShardState,
};
use quickwit_proto::metastore::{
    MetastoreResult, MetastoreService, MetastoreServiceClient, OpenShardSubrequest,
    OpenShardsRequest, OpenShardsResponse, serde_utils,
};
use quickwit_proto::types::{IndexUid, NodeId, NodeIdRef, Position, ShardId, SourceUid};
use rand::prelude::IndexedRandom;
use rand::rngs::ThreadRng;
use rand::seq::SliceRandom;
use rand::{Rng, RngCore, rng};
use serde::{Deserialize, Serialize};
use tokio::sync::{Mutex, OwnedMutexGuard};
use tracing::{Level, debug, enabled, error, info, instrument, warn};
use ulid::Ulid;

use super::scaling_arbiter::ScalingArbiter;
use crate::control_plane::ControlPlane;
use crate::ingest::wait_handle::WaitHandle;
use crate::model::{ControlPlaneModel, ScalingMode, ShardEntry, ShardStats};

const CLOSE_SHARDS_REQUEST_TIMEOUT: Duration = if cfg!(test) {
    Duration::from_millis(50)
} else {
    Duration::from_secs(3)
};

const INIT_SHARDS_REQUEST_TIMEOUT: Duration = CLOSE_SHARDS_REQUEST_TIMEOUT;

const CLOSE_SHARDS_UPON_REBALANCE_DELAY: Duration = if cfg!(test) {
    Duration::ZERO
} else {
    Duration::from_secs(10)
};

const FIRE_AND_FORGET_TIMEOUT: Duration = Duration::from_secs(3);

/// Spawns a new task to execute the given future,
/// and stops polling it/drops it after a timeout.
///
/// All errors are ignored, and not even logged.
fn fire_and_forget(
    fut: impl Future<Output = ()> + Send + 'static,
    operation: impl std::fmt::Display + Send + 'static,
) {
    tokio::spawn(async move {
        if let Err(_timeout_elapsed) = tokio::time::timeout(FIRE_AND_FORGET_TIMEOUT, fut).await {
            error!(%operation, "timeout elapsed");
        }
    });
}

// Returns a random position of the els `slice`, such that the element in this array is NOT
// `except_el`.
fn pick_position(
    els: &[&NodeIdRef],
    except_el_opt: Option<&NodeIdRef>,
    rng: &mut ThreadRng,
) -> Option<usize> {
    let except_pos_opt =
        except_el_opt.and_then(|except_el| els.iter().position(|el| *el == except_el));
    if let Some(except_pos) = except_pos_opt {
        let pos = rng.random_range(0..els.len() - 1);
        if pos >= except_pos {
            Some(pos + 1)
        } else {
            Some(pos)
        }
    } else {
        Some(rng.random_range(0..els.len()))
    }
}

/// Pick a node from the `shard_count_to_node_ids` that is different from `except_node_opt`.
/// We pick in priority nodes with the least number of shards, and we break any tie randomly.
///
/// Once a node has been found, we update the `shard_count_to_node_ids` to reflect the new state.
/// In particular, the ingester node is moved from its previous shard_count level to its new
/// shard_count level. In particular, a shard_count entry that is empty should be removed from the
/// BTreeMap.
fn pick_one<'a>(
    shard_count_to_node_ids: &mut BTreeMap<usize, Vec<&'a NodeIdRef>>,
    except_node_opt: Option<&'a NodeIdRef>,
    rng: &mut ThreadRng,
) -> Option<&'a NodeIdRef> {
    let (&shard_count, _) = shard_count_to_node_ids.iter().find(|(_, node_ids)| {
        let Some(except_node) = except_node_opt else {
            return true;
        };
        if node_ids.len() >= 2 {
            return true;
        }
        let Some(&single_node_id) = node_ids.first() else {
            return false;
        };
        single_node_id != except_node
    })?;
    let mut shard_entry = shard_count_to_node_ids.entry(shard_count);
    let Entry::Occupied(occupied_shard_entry) = &mut shard_entry else {
        panic!();
    };
    let nodes = occupied_shard_entry.get_mut();
    let position = pick_position(nodes, except_node_opt, rng)?;

    let node_id = nodes.swap_remove(position);
    let new_shard_count = shard_count + 1;
    let should_remove_entry = nodes.is_empty();

    if should_remove_entry {
        shard_count_to_node_ids.remove(&shard_count);
    }
    shard_count_to_node_ids
        .entry(new_shard_count)
        .or_default()
        .push(node_id);
    Some(node_id)
}

/// Pick two ingester nodes from `shard_count_to_node_ids` different one from each other.
/// Ingesters with the lower number of shards are preferred.
fn pick_two<'a>(
    shard_count_to_node_ids: &mut BTreeMap<usize, Vec<&'a NodeIdRef>>,
    rng: &mut ThreadRng,
) -> Option<(&'a NodeIdRef, &'a NodeIdRef)> {
    let leader = pick_one(shard_count_to_node_ids, None, rng)?;
    let follower = pick_one(shard_count_to_node_ids, Some(leader), rng)?;
    Some((leader, follower))
}

fn allocate_shards(
    node_id_shard_counts: &HashMap<NodeId, usize>,
    num_shards: usize,
    replication_enabled: bool,
) -> Option<Vec<(&NodeIdRef, Option<&NodeIdRef>)>> {
    let mut shard_count_to_node_ids: BTreeMap<usize, Vec<&NodeIdRef>> = BTreeMap::default();
    for (node_id, &num_shards) in node_id_shard_counts {
        shard_count_to_node_ids
            .entry(num_shards)
            .or_default()
            .push(node_id.as_ref());
    }
    let mut rng = rng();
    let mut shard_allocations: Vec<(&NodeIdRef, Option<&NodeIdRef>)> =
        Vec::with_capacity(num_shards);
    for _ in 0..num_shards {
        if replication_enabled {
            let (leader, follower) = pick_two(&mut shard_count_to_node_ids, &mut rng)?;
            shard_allocations.push((leader, Some(follower)));
        } else {
            let leader = pick_one(&mut shard_count_to_node_ids, None, &mut rng)?;
            shard_allocations.push((leader, None));
        }
    }
    Some(shard_allocations)
}

#[derive(Debug, Default, Clone, Copy, Serialize, Deserialize)]
pub struct IngestControllerStats {
    pub num_rebalance_shards_ops: usize,
}

pub struct IngestController {
    pub(crate) ingester_pool: IngesterPool,
    pub(crate) stats: IngestControllerStats,
    metastore: MetastoreServiceClient,
    replication_factor: usize,
    // This lock ensures that only one rebalance operation is performed at a time.
    rebalance_lock: Arc<Mutex<()>>,
    scaling_arbiter: ScalingArbiter,
}

impl fmt::Debug for IngestController {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        f.debug_struct("IngestController")
            .field("ingester_pool", &self.ingester_pool)
            .field("metastore", &self.metastore)
            .field("replication_factor", &self.replication_factor)
            .finish()
    }
}

/// Updates both the metastore and the control plane.
/// If successful, the control plane is guaranteed to be in sync with the metastore.
/// If an error is returned, the control plane might be out of sync with the metastore.
/// It is up to the client to check the error type and see if the control plane actor should be
/// restarted.
async fn open_shards_on_metastore_and_model(
    open_shard_subrequests: Vec<OpenShardSubrequest>,
    metastore: &mut MetastoreServiceClient,
    model: &mut ControlPlaneModel,
) -> MetastoreResult<OpenShardsResponse> {
    if open_shard_subrequests.is_empty() {
        return Ok(OpenShardsResponse {
            subresponses: Vec::new(),
        });
    }
    let open_shards_request = OpenShardsRequest {
        subrequests: open_shard_subrequests,
    };
    let open_shards_response = metastore.open_shards(open_shards_request).await?;
    for open_shard_subresponse in &open_shards_response.subresponses {
        if let Some(shard) = &open_shard_subresponse.open_shard {
            let shard = shard.clone();
            let index_uid = shard.index_uid().clone();
            let source_id = shard.source_id.clone();
            model.insert_shards(&index_uid, &source_id, vec![shard]);
        }
    }
    Ok(open_shards_response)
}

fn get_open_shard_from_model(
    get_open_shards_subrequest: &GetOrCreateOpenShardsSubrequest,
    model: &ControlPlaneModel,
    unavailable_leaders: &FnvHashSet<NodeId>,
) -> Result<Option<GetOrCreateOpenShardsSuccess>, GetOrCreateOpenShardsFailureReason> {
    let Some(index_uid) = model.index_uid(&get_open_shards_subrequest.index_id) else {
        return Err(GetOrCreateOpenShardsFailureReason::IndexNotFound);
    };
    let Some(open_shard_entries) = model.find_open_shards(
        index_uid,
        &get_open_shards_subrequest.source_id,
        unavailable_leaders,
    ) else {
        return Err(GetOrCreateOpenShardsFailureReason::SourceNotFound);
    };
    if open_shard_entries.is_empty() {
        return Ok(None);
    }
    // We already have open shards. Let's return them.
    let open_shards: Vec<Shard> = open_shard_entries
        .into_iter()
        .map(|shard_entry| shard_entry.shard)
        .collect();
    Ok(Some(GetOrCreateOpenShardsSuccess {
        subrequest_id: get_open_shards_subrequest.subrequest_id,
        index_uid: Some(index_uid.clone()),
        source_id: get_open_shards_subrequest.source_id.clone(),
        open_shards,
    }))
}

impl IngestController {
    pub fn new(
        metastore: MetastoreServiceClient,
        ingester_pool: IngesterPool,
        replication_factor: usize,
        max_shard_ingestion_throughput_mib_per_sec: f32,
        shard_scale_up_factor: f32,
    ) -> Self {
        IngestController {
            metastore,
            ingester_pool,
            replication_factor,
            rebalance_lock: Arc::new(Mutex::new(())),
            stats: IngestControllerStats::default(),
            scaling_arbiter: ScalingArbiter::with_max_shard_ingestion_throughput_mib_per_sec(
                max_shard_ingestion_throughput_mib_per_sec,
                shard_scale_up_factor,
            ),
        }
    }

    /// Sends a retain shard request to the given list of ingesters.
    ///
    /// If the request fails, we just log an error.
    pub(crate) fn sync_with_ingesters(
        &self,
        ingesters: &BTreeSet<NodeId>,
        model: &ControlPlaneModel,
    ) {
        for ingester in ingesters {
            self.sync_with_ingester(ingester, model);
        }
    }

    pub(crate) fn sync_with_all_ingesters(&self, model: &ControlPlaneModel) {
        let ingesters: Vec<NodeId> = self.ingester_pool.keys();
        for ingester in ingesters {
            self.sync_with_ingester(&ingester, model);
        }
    }

    /// Syncs the ingester in a fire and forget manner.
    ///
    /// The returned oneshot is just here for unit test to wait for the operation to terminate.
    fn sync_with_ingester(&self, ingester_id: &NodeId, model: &ControlPlaneModel) -> WaitHandle {
        info!(ingester = %ingester_id, "sync_with_ingester");
        let (wait_drop_guard, wait_handle) = WaitHandle::new();
        let Some(ingester) = self.ingester_pool.get(ingester_id) else {
            // TODO: (Maybe) We should mark the ingester as unavailable, and stop advertise its
            // shard to routers.
            warn!("failed to sync with ingester `{ingester_id}`: not available");
            return wait_handle;
        };
        let mut retain_shards_req = RetainShardsRequest::default();
        for (source_uid, shard_ids) in &*model.list_shards_for_node(ingester_id) {
            let shards_for_source = RetainShardsForSource {
                index_uid: Some(source_uid.index_uid.clone()),
                source_id: source_uid.source_id.clone(),
                shard_ids: shard_ids.iter().cloned().collect(),
            };
            retain_shards_req
                .retain_shards_for_sources
                .push(shards_for_source);
        }
        info!(%ingester_id, "retain shards ingester");
        let operation: String = format!("retain shards `{ingester_id}`");
        fire_and_forget(
            async move {
                if let Err(retain_shards_err) =
                    ingester.client.retain_shards(retain_shards_req).await
                {
                    error!(%retain_shards_err, "retain shards error");
                }
                // just a way to force moving the drop guard.
                drop(wait_drop_guard);
            },
            operation,
        );
        wait_handle
    }

    fn handle_closed_shards(&self, closed_shards: Vec<ShardIds>, model: &mut ControlPlaneModel) {
        for closed_shard in closed_shards {
            let index_uid: IndexUid = closed_shard.index_uid().clone();
            let source_id = closed_shard.source_id;

            let source_uid = SourceUid {
                index_uid,
                source_id,
            };
            let closed_shard_ids = model.close_shards(&source_uid, &closed_shard.shard_ids);

            if !closed_shard_ids.is_empty() {
                info!(
                    index_id=%source_uid.index_uid.index_id,
                    source_id=%source_uid.source_id,
                    shard_ids=?PrettySample::new(&closed_shard_ids, 5),
                    "closed {} shards reported by router",
                    closed_shard_ids.len()
                );
            }
        }
    }

    pub(crate) async fn handle_local_shards_update(
        &mut self,
        local_shards_update: LocalShardsUpdate,
        model: &mut ControlPlaneModel,
        progress: &Progress,
    ) -> MetastoreResult<()> {
        let shard_stats = model.update_shards(
            &local_shards_update.source_uid,
            &local_shards_update.shard_infos,
        );
        let min_shards = model
            .index_metadata(&local_shards_update.source_uid.index_uid)
            .expect("index should exist")
            .index_config
            .ingest_settings
            .min_shards;

        let Some(scaling_mode) = self.scaling_arbiter.should_scale(shard_stats, min_shards) else {
            return Ok(());
        };
        match scaling_mode {
            ScalingMode::Up(num_shards) => {
                self.try_scale_up_shards(
                    local_shards_update.source_uid,
                    shard_stats,
                    model,
                    progress,
                    num_shards,
                )
                .await?;
            }
            ScalingMode::Down => {
                self.try_scale_down_shards(
                    local_shards_update.source_uid,
                    shard_stats,
                    min_shards,
                    model,
                    progress,
                )
                .await?;
            }
        }

        Ok(())
    }

    /// Finds the open shards that satisfies the [`GetOrCreateOpenShardsRequest`] request sent by an
    /// ingest router. First, the control plane checks its internal shard table to find
    /// candidates. If it does not contain any, the control plane will ask
    /// the metastore to open new shards.
    pub(crate) async fn get_or_create_open_shards(
        &mut self,
        get_open_shards_request: GetOrCreateOpenShardsRequest,
        model: &mut ControlPlaneModel,
        progress: &Progress,
    ) -> MetastoreResult<GetOrCreateOpenShardsResponse> {
        // Closing shards is an operation performed by ingesters,
        // so the control plane is not necessarily aware that they are closed.
        //
        // Routers can report closed shards so that we can update our
        // internal state.
        self.handle_closed_shards(get_open_shards_request.closed_shards, model);

        let num_subrequests = get_open_shards_request.subrequests.len();
        let mut get_or_create_open_shards_successes = Vec::with_capacity(num_subrequests);
        let mut get_or_create_open_shards_failures = Vec::new();

        let mut per_source_num_shards_to_open = HashMap::new();

        let unavailable_leaders: FnvHashSet<NodeId> = get_open_shards_request
            .unavailable_leaders
            .into_iter()
            .map(NodeId::from)
            .collect();

        // We do a first pass to identify the shards that are missing from the model and need to be
        // created.
        for get_open_shards_subrequest in &get_open_shards_request.subrequests {
            if let Ok(None) =
                get_open_shard_from_model(get_open_shards_subrequest, model, &unavailable_leaders)
            {
                // We did not find any open shard in the model, we will have to create one.
                // Let's keep track of all of the source that require new shards, so we can batch
                // create them after this loop.
                let index_uid = model
                    .index_uid(&get_open_shards_subrequest.index_id)
                    .expect("index should exist")
                    .clone();
                let min_shards = model
                    .index_metadata(&index_uid)
                    .expect("index should exist")
                    .index_config
                    .ingest_settings
                    .min_shards
                    .get();
                let source_uid = SourceUid {
                    index_uid,
                    source_id: get_open_shards_subrequest.source_id.clone(),
                };
                per_source_num_shards_to_open.insert(source_uid, min_shards);
            }
        }

        if let Err(metastore_error) = self
            .try_open_shards(
                per_source_num_shards_to_open,
                model,
                &unavailable_leaders,
                progress,
            )
            .await
        {
            // We experienced a metastore error. If this is not certain abort, we need
            // to restart the control plane, to make sure the control plane is not out-of-sync.
            //
            if !metastore_error.is_transaction_certainly_aborted() {
                return Err(metastore_error);
            } else {
                // If not, let's just log something.
                // This is not critical. We will just end up return some failure in the response.
                error!(error=?metastore_error, "failed to open shards on the metastore");
            }
        }
        for get_open_shards_subrequest in get_open_shards_request.subrequests {
            match get_open_shard_from_model(
                &get_open_shards_subrequest,
                model,
                &unavailable_leaders,
            ) {
                Ok(Some(success)) => {
                    get_or_create_open_shards_successes.push(success);
                }
                Ok(None) => {
                    get_or_create_open_shards_failures.push(
                        GetOrCreateOpenShardsFailureReason::NoIngestersAvailable
                            .create_failure(get_open_shards_subrequest),
                    );
                }
                Err(failure_reason) => {
                    get_or_create_open_shards_failures
                        .push(failure_reason.create_failure(get_open_shards_subrequest));
                }
            }
        }
        let response = GetOrCreateOpenShardsResponse {
            successes: get_or_create_open_shards_successes,
            failures: get_or_create_open_shards_failures,
        };
        Ok(response)
    }

    /// Allocates and assigns new shards to ingesters.
    fn allocate_shards(
        &self,
        num_shards_to_allocate: usize,
        unavailable_leaders: &FnvHashSet<NodeId>,
        model: &ControlPlaneModel,
    ) -> Option<Vec<(NodeId, Option<NodeId>)>> {
        // Count of open shards per available ingester node (including the ingester with 0 open
        // shards).
        let mut per_node_num_open_shards: HashMap<NodeId, usize> = self
            .ingester_pool
            .keys_values()
            .into_iter()
            .filter(|(ingester_id, ingester)| {
                ingester.status.is_ready() && !unavailable_leaders.contains(ingester_id)
            })
            .map(|(ingester_id, _)| (ingester_id, 0))
            .collect();

        let num_ingesters = per_node_num_open_shards.len();

        if num_ingesters == 0 {
            warn!("failed to allocate {num_shards_to_allocate} shards: no ingesters available");
            return None;
        }

        if self.replication_factor > num_ingesters {
            warn!(
                "failed to allocate {num_shards_to_allocate} shards: replication factor is \
                 greater than the number of available ingesters"
            );
            return None;
        }

        for shard in model.all_shards() {
            if shard.is_open() && !unavailable_leaders.contains(&shard.leader_id) {
                for ingest_node in shard.ingesters() {
                    if let Some(shard_count) =
                        per_node_num_open_shards.get_mut(ingest_node.as_str())
                    {
                        *shard_count += 1;
                    } else {
                        // The shard is not present in the `per_node_num_open_shards` map.
                        // This is normal. It just means an ingester is temporarily unavailable,
                        // either from the control plane view (not present in the indexer pool,
                        // because as a result of information from
                        // chitchat), or because it is in the unavailable
                        // leaders map.
                    }
                }
            }
        }

        assert!(self.replication_factor == 1 || self.replication_factor == 2);
        let leader_follower_pairs: Vec<(&NodeIdRef, Option<&NodeIdRef>)> = allocate_shards(
            &per_node_num_open_shards,
            num_shards_to_allocate,
            self.replication_factor == 2,
        )?;
        Some(
            leader_follower_pairs
                .into_iter()
                .map(|(leader_id, follower_id)| {
                    (leader_id.to_owned(), follower_id.map(NodeIdRef::to_owned))
                })
                .collect(),
        )
    }

    /// Calls init shards on the leaders hosting newly opened shards.
    async fn init_shards(
        &self,
        init_shard_subrequests: Vec<InitShardSubrequest>,
        progress: &Progress,
    ) -> InitShardsResponse {
        let mut successes = Vec::with_capacity(init_shard_subrequests.len());
        let mut failures = Vec::new();

        let mut per_leader_shards_to_init: HashMap<String, Vec<InitShardSubrequest>> =
            HashMap::new();

        for init_shard_subrequest in init_shard_subrequests {
            let leader_id = init_shard_subrequest.shard().leader_id.clone();
            per_leader_shards_to_init
                .entry(leader_id)
                .or_default()
                .push(init_shard_subrequest);
        }
        let mut init_shards_futures = FuturesUnordered::new();

        for (leader_id, subrequests) in per_leader_shards_to_init {
            let init_shard_failures: Vec<InitShardFailure> = subrequests
                .iter()
                .map(|subrequest| {
                    let shard = subrequest.shard();

                    InitShardFailure {
                        subrequest_id: subrequest.subrequest_id,
                        index_uid: Some(shard.index_uid().clone()),
                        source_id: shard.source_id.clone(),
                        shard_id: Some(shard.shard_id().clone()),
                    }
                })
                .collect();
            let Some(leader) = self.ingester_pool.get(&leader_id) else {
                warn!("failed to init shards: ingester `{leader_id}` is unavailable");
                failures.extend(init_shard_failures);
                continue;
            };
            let init_shards_request = InitShardsRequest { subrequests };
            let init_shards_future = async move {
                let init_shards_result = tokio::time::timeout(
                    INIT_SHARDS_REQUEST_TIMEOUT,
                    leader.client.init_shards(init_shards_request),
                )
                .await;
                (leader_id.clone(), init_shards_result, init_shard_failures)
            };
            init_shards_futures.push(init_shards_future);
        }
        while let Some((leader_id, init_shards_result, init_shard_failures)) =
            progress.protect_future(init_shards_futures.next()).await
        {
            match init_shards_result {
                Ok(Ok(init_shards_response)) => {
                    successes.extend(init_shards_response.successes);
                    failures.extend(init_shards_response.failures);
                }
                Ok(Err(error)) => {
                    error!(%error, "failed to init shards on `{leader_id}`");
                    failures.extend(init_shard_failures);
                }
                Err(_elapsed) => {
                    error!("failed to init shards on `{leader_id}`: request timed out");
                    failures.extend(init_shard_failures);
                }
            }
        }
        InitShardsResponse {
            successes,
            failures,
        }
    }

    /// Attempts to increase the number of shards. This operation is rate limited to avoid creating
    /// to many shards in a short period of time. As a result, this method may not create any
    /// shard.
    async fn try_scale_up_shards(
        &mut self,
        source_uid: SourceUid,
        shard_stats: ShardStats,
        model: &mut ControlPlaneModel,
        progress: &Progress,
        num_shards_to_open: usize,
    ) -> MetastoreResult<()> {
        if !model
            .acquire_scaling_permits(&source_uid, ScalingMode::Up(num_shards_to_open))
            .unwrap_or(false)
        {
            return Ok(());
        }
        let new_num_open_shards = shard_stats.num_open_shards + num_shards_to_open;
        let new_shards_per_source: HashMap<SourceUid, usize> =
            HashMap::from_iter([(source_uid.clone(), num_shards_to_open)]);
        let successful_source_uids_res = self
            .try_open_shards(new_shards_per_source, model, &Default::default(), progress)
            .await;

        match successful_source_uids_res {
            Ok(successful_source_uids) => {
                assert!(successful_source_uids.len() <= 1);

                if successful_source_uids.is_empty() {
                    // We did not manage to create the shard.
                    // We can release our permit.
                    model.release_scaling_permits(&source_uid, ScalingMode::Up(num_shards_to_open));
                    warn!(
                        index_uid=%source_uid.index_uid,
                        source_id=%source_uid.source_id,
                        "scaling up number of shards to {new_num_open_shards} failed: shard initialization failure"
                    );
                } else {
                    info!(
                        index_id=%source_uid.index_uid.index_id,
                        source_id=%source_uid.source_id,
                        "successfully scaled up number of shards to {new_num_open_shards}"
                    );
                }
                Ok(())
            }
            Err(metastore_error) => {
                // We did not manage to create the shard.
                // We can release our permit, but we also need to return the error to the caller, in
                // order to restart the control plane actor if necessary.
                warn!(
                    index_id=%source_uid.index_uid.index_id,
                    source_id=%source_uid.source_id,
                    "scaling up number of shards to {new_num_open_shards} failed: {metastore_error:?}"
                );
                model.release_scaling_permits(&source_uid, ScalingMode::Up(num_shards_to_open));
                Err(metastore_error)
            }
        }
    }

    /// Attempts to open shards for different sources
    /// `source_uids` may contain the same source multiple times.
    ///
    /// This function returns the list of sources for which `try_open_shards` was successful.
    ///
    /// As long as no metastore error is returned this function leaves the control plane model
    /// in sync with the metastore.
    ///
    /// Also, this function only updates the control plane model and the metastore after
    /// having successfully initialized a shard (and possibly its replica) on the ingester.
    ///
    /// This function can be partially successful: if init_shards was unsuccessful for some shard,
    /// then the successfully initialized shard will still be record in the metastore/control
    /// plane model.
    ///
    /// The number of successfully open shards is returned.
    async fn try_open_shards(
        &mut self,
        per_source_num_shards_to_open: HashMap<SourceUid, usize>,
        model: &mut ControlPlaneModel,
        unavailable_leaders: &FnvHashSet<NodeId>,
        progress: &Progress,
    ) -> MetastoreResult<HashMap<SourceUid, usize>> {
        let total_num_shards_to_open: usize = per_source_num_shards_to_open.values().sum();

        if total_num_shards_to_open == 0 {
            return Ok(HashMap::new());
        }
        // TODO unavailable leaders
        let Some(leader_follower_pairs) =
            self.allocate_shards(total_num_shards_to_open, unavailable_leaders, model)
        else {
            return Ok(HashMap::new());
        };

        let source_uids_with_multiplicity = per_source_num_shards_to_open
            .iter()
            .flat_map(|(source_uid, count)| std::iter::repeat_n(source_uid, *count));

        let mut init_shard_subrequests: Vec<InitShardSubrequest> = Vec::new();

        for (subrequest_id, (source_uid, (leader_id, follower_id_opt))) in
            source_uids_with_multiplicity
                .zip(leader_follower_pairs)
                .enumerate()
        {
            let shard_id = ShardId::from(Ulid::new());

            let index_metadata = model
                .index_metadata(&source_uid.index_uid)
                .expect("index should exist");
            let has_transform = model
                .source_metadata(source_uid)
                .expect("source should exist")
                .transform_config
                .is_some();
            let validate_docs =
                index_metadata.index_config.ingest_settings.validate_docs && !has_transform;
            let doc_mapping = &index_metadata.index_config.doc_mapping;
            let doc_mapping_uid = doc_mapping.doc_mapping_uid;
            let doc_mapping_json = serde_utils::to_json_str(doc_mapping)?;

            let shard = Shard {
                index_uid: Some(source_uid.index_uid.clone()),
                source_id: source_uid.source_id.clone(),
                shard_id: Some(shard_id),
                leader_id: leader_id.to_string(),
                follower_id: follower_id_opt.as_ref().map(ToString::to_string),
                shard_state: ShardState::Open as i32,
                doc_mapping_uid: Some(doc_mapping_uid),
                publish_position_inclusive: Some(Position::Beginning),
                publish_token: None,
                update_timestamp: 0, // assigned later by the metastore
            };
            let init_shard_subrequest = InitShardSubrequest {
                subrequest_id: subrequest_id as u32,
                shard: Some(shard),
                doc_mapping_json,
                validate_docs,
            };
            init_shard_subrequests.push(init_shard_subrequest);
        }

        // Let's first attempt to initialize these shards.
        let init_shards_response = self.init_shards(init_shard_subrequests, progress).await;

        let open_shard_subrequests = init_shards_response
            .successes
            .into_iter()
            .enumerate()
            .map(|(subrequest_id, init_shard_success)| {
                let shard = init_shard_success.shard();

                OpenShardSubrequest {
                    subrequest_id: subrequest_id as u32,
                    index_uid: shard.index_uid.clone(),
                    source_id: shard.source_id.clone(),
                    shard_id: shard.shard_id.clone(),
                    leader_id: shard.leader_id.clone(),
                    follower_id: shard.follower_id.clone(),
                    doc_mapping_uid: shard.doc_mapping_uid,
                    // Shards are acquired by the ingest sources
                    publish_token: None,
                }
            })
            .collect();

        let open_shards_response = progress
            .protect_future(open_shards_on_metastore_and_model(
                open_shard_subrequests,
                &mut self.metastore,
                model,
            ))
            .await?;

        let mut per_source_num_opened_shards: HashMap<SourceUid, usize> = HashMap::new();

        for open_shard_subresponse in open_shards_response.subresponses {
            let source_uid = open_shard_subresponse.open_shard().source_uid();
            *per_source_num_opened_shards.entry(source_uid).or_default() += 1;
        }

        Ok(per_source_num_opened_shards)
    }

    /// Attempts to decrease the number of shards. This operation is rate limited to avoid closing
    /// shards too aggressively. As a result, this method may not close any shard.
    async fn try_scale_down_shards(
        &self,
        source_uid: SourceUid,
        shard_stats: ShardStats,
        min_shards: NonZeroUsize,
        model: &mut ControlPlaneModel,
        progress: &Progress,
    ) -> MetastoreResult<()> {
        // The scaling arbiter should not suggest scaling down if the number of shards is already
        // below the minimum, but we're just being defensive here.
        if shard_stats.num_open_shards <= min_shards.get() {
            return Ok(());
        }
        if !model
            .acquire_scaling_permits(&source_uid, ScalingMode::Down)
            .unwrap_or(false)
        {
            return Ok(());
        }
        let new_num_open_shards = shard_stats.num_open_shards - 1;

        info!(
            index_id=%source_uid.index_uid.index_id,
            source_id=%source_uid.source_id,
            "scaling down number of shards to {new_num_open_shards}"
        );
        let Some((leader_id, shard_id)) = find_scale_down_candidate(&source_uid, model) else {
            model.release_scaling_permits(&source_uid, ScalingMode::Down);
            return Ok(());
        };
        info!("scaling down shard {shard_id} from {leader_id}");
        let Some(ingester) = self.ingester_pool.get(&leader_id) else {
            model.release_scaling_permits(&source_uid, ScalingMode::Down);
            return Ok(());
        };
        let shard_pkeys = vec![ShardPKey {
            index_uid: Some(source_uid.index_uid.clone()),
            source_id: source_uid.source_id.clone(),
            shard_id: Some(shard_id.clone()),
        }];
        let close_shards_request = CloseShardsRequest { shard_pkeys };

        if let Err(error) = progress
            .protect_future(ingester.client.close_shards(close_shards_request))
            .await
        {
            warn!("failed to scale down number of shards: {error}");
            model.release_scaling_permits(&source_uid, ScalingMode::Down);
            return Ok(());
        }
        model.close_shards(&source_uid, &[shard_id]);
        Ok(())
    }

    pub(crate) fn advise_reset_shards(
        &self,
        request: AdviseResetShardsRequest,
        model: &ControlPlaneModel,
    ) -> AdviseResetShardsResponse {
        info!(
            "received advise reset shards request from `{}`",
            request.ingester_id
        );
        debug!(shard_ids=?summarize_shard_ids(&request.shard_ids), "advise reset shards");

        let mut shards_to_delete: Vec<ShardIds> = Vec::new();
        let mut shards_to_truncate: Vec<ShardIdPositions> = Vec::new();

        for shard_ids in request.shard_ids {
            let index_uid = shard_ids.index_uid().clone();
            let source_id = shard_ids.source_id.clone();

            let source_uid = SourceUid {
                index_uid,
                source_id,
            };
            let Some(shard_entries) = model.get_shards_for_source(&source_uid) else {
                // The source no longer exists: we can safely delete all the shards.
                shards_to_delete.push(shard_ids);
                continue;
            };
            let mut shard_ids_to_delete = Vec::new();
            let mut shard_positions_to_truncate = Vec::new();

            for shard_id in shard_ids.shard_ids {
                if let Some(shard_entry) = shard_entries.get(&shard_id) {
                    let publish_position_inclusive = shard_entry.publish_position_inclusive();

                    shard_positions_to_truncate.push(ShardIdPosition {
                        shard_id: Some(shard_id),
                        publish_position_inclusive: Some(publish_position_inclusive),
                    });
                } else {
                    shard_ids_to_delete.push(shard_id);
                }
            }
            if !shard_ids_to_delete.is_empty() {
                shards_to_delete.push(ShardIds {
                    index_uid: Some(source_uid.index_uid.clone()),
                    source_id: source_uid.source_id.clone(),
                    shard_ids: shard_ids_to_delete,
                });
            }
            if !shard_positions_to_truncate.is_empty() {
                shards_to_truncate.push(ShardIdPositions {
                    index_uid: Some(source_uid.index_uid),
                    source_id: source_uid.source_id,
                    shard_positions: shard_positions_to_truncate,
                });
            }
        }
        if enabled!(Level::DEBUG) {
            let shards_to_truncate: Vec<(&str, Position)> = shards_to_truncate
                .iter()
                .flat_map(|shard_positions| {
                    shard_positions
                        .shard_positions
                        .iter()
                        .map(|shard_id_position| {
                            (
                                shard_id_position.shard_id().as_str(),
                                shard_id_position.publish_position_inclusive(),
                            )
                        })
                })
                .collect();
            debug!(shard_ids_to_delete=?summarize_shard_ids(&shards_to_delete), shards_to_truncate=?shards_to_truncate, "advise reset shards response");
        }

        AdviseResetShardsResponse {
            shards_to_delete,
            shards_to_truncate,
        }
    }

    /// Rebalances shards from ingesters with too many shards to ingesters with too few shards.
    /// Moving a shard consists of closing the shard on the source ingester and opening a new
    /// one on the target ingester.
    ///
    /// This method is guarded by a lock to ensure that only one rebalance operation is performed at
    /// a time.
    #[instrument(skip_all)]
    pub(crate) async fn rebalance_shards(
        &mut self,
        model: &mut ControlPlaneModel,
        mailbox: &Mailbox<ControlPlane>,
        progress: &Progress,
    ) -> MetastoreResult<usize> {
        let Ok(rebalance_guard) = self.rebalance_lock.clone().try_lock_owned() else {
            debug!("skipping rebalance: another rebalance is already in progress");
            return Ok(0);
        };
        self.stats.num_rebalance_shards_ops += 1;

        let shards_to_rebalance: Vec<Shard> = self.compute_shards_to_rebalance(model);

        crate::metrics::CONTROL_PLANE_METRICS
            .rebalance_shards
            .set(shards_to_rebalance.len() as i64);

        if shards_to_rebalance.is_empty() {
            debug!("skipping rebalance: no shards to rebalance");
            return Ok(0);
        }
        let mut per_source_num_shards_to_open: HashMap<SourceUid, usize> = HashMap::new();

        for shard in &shards_to_rebalance {
            *per_source_num_shards_to_open
                .entry(shard.source_uid())
                .or_default() += 1;
        }
        let mut per_source_num_opened_shards: HashMap<SourceUid, usize> = self
            .try_open_shards(
                per_source_num_shards_to_open,
                model,
                &Default::default(),
                progress,
            )
            .await
            .inspect_err(|error| {
                error!(%error, "failed to open shards during rebalance");
                crate::metrics::CONTROL_PLANE_METRICS
                    .rebalance_shards
                    .set(0);
            })?;

        let num_opened_shards: usize = per_source_num_opened_shards.values().sum();

        crate::metrics::CONTROL_PLANE_METRICS
            .rebalance_shards
            .set(num_opened_shards as i64);

        for source_uid in per_source_num_opened_shards.keys() {
            // We temporarily disable the ability the scale down the number of shards for
            // the source to avoid closing the shards we just opened.
            model.drain_scaling_permits(source_uid, ScalingMode::Down);
        }

        // Close as many shards as we opened. Because `try_open_shards` might fail partially, we
        // must only close the shards that we successfully opened.
        let mut shards_to_close = Vec::with_capacity(shards_to_rebalance.len());

        for shard in shards_to_rebalance {
            let source_uid = shard.source_uid();
            let Some(num_open_shards) = per_source_num_opened_shards.get_mut(&source_uid) else {
                continue;
            };
            if *num_open_shards == 0 {
                continue;
            };
            *num_open_shards -= 1;
            shards_to_close.push(shard);
        }
        let close_shards_fut = self.close_shards(shards_to_close);
        let mailbox_clone = mailbox.clone();

        let close_shards_and_send_callback_fut = async move {
            // We wait for a few seconds before closing the shards to give the ingesters some time
            // to learn about the ones we just opened via gossip.
            tokio::time::sleep(CLOSE_SHARDS_UPON_REBALANCE_DELAY).await;

            let closed_shards = close_shards_fut.await;

            if closed_shards.is_empty() {
                return;
            }
            let callback = RebalanceShardsCallback {
                closed_shards,
                rebalance_guard,
            };
            let _ = mailbox_clone.send_message(callback).await;
        };
        tokio::spawn(close_shards_and_send_callback_fut);

        if num_opened_shards > 0 {
            info!("rebalance opened {num_opened_shards} new shards");
        }
        Ok(num_opened_shards)
    }

    /// Computes shards that need to be rebalanced.
    ///
    /// This function identifies which shards should be moved to achieve a balance across available
    /// ingesters.
    /// It does not mutate any state. It just identifies the list of shards
    /// that need to be rebalanced.
    ///
    /// Unfortunately, we cannot move shards that are on unavailable ingesters.
    /// The closing operation can only be done by the leader of that shard.
    /// For these reason, we exclude these shards from the rebalance process.
    fn compute_shards_to_rebalance(&self, model: &ControlPlaneModel) -> Vec<Shard> {
        let mut per_ready_ingester_shards: HashMap<NodeId, Vec<&Shard>> = HashMap::new();
        let mut retiring_ingesters: HashSet<NodeId> = HashSet::new();

        for (ingester_id, ingester) in self.ingester_pool.keys_values() {
            if ingester.status.is_ready() {
                per_ready_ingester_shards.insert(ingester_id, Vec::new());
            } else if ingester.status == IngesterStatus::Retiring {
                retiring_ingesters.insert(ingester_id);
            }
        }

        let mut shards_to_rebalance: Vec<Shard> = Vec::new();
        let mut num_ready_shards: usize = 0;

        for shard in model.all_shards() {
            if !shard.is_open() {
                continue;
            }
            let leader_id_ref = NodeIdRef::from_str(&shard.leader_id);

            if let Some(shards) = per_ready_ingester_shards.get_mut(leader_id_ref) {
                // Shards on ready ingesters participate in the balancing logic.
                num_ready_shards += 1;
                shards.push(&shard.shard);
            } else if retiring_ingesters.contains(leader_id_ref) {
                // All open shards on retiring ingesters must be rebalanced.
                shards_to_rebalance.push(shard.shard.clone());
            }
        }

        let num_retiring_shards = shards_to_rebalance.len();
        let num_ready_ingesters = per_ready_ingester_shards.len();

        let mut rng = rng();
        let mut per_leader_open_shards_shuffled: Vec<Vec<&Shard>> = per_ready_ingester_shards
            .into_values()
            .map(|mut shards| {
                shards.shuffle(&mut rng);
                shards
            })
            .collect();

        // This is more of a loop-loop, but since we know it should exit before
        // `num_ready_shards`, we defensively use a for-loop.
        for _ in 0..num_ready_shards {
            let MinMaxResult::MinMax(min_shards, max_shards) = per_leader_open_shards_shuffled
                .iter_mut()
                .minmax_by_key(|shards| shards.len())
            else {
                // There are less than 2 ingesters.
                // Nothing to do here.
                break;
            };

            // We leave a tolerance of 1/10 between the min and max number of shards per leader
            const TOLERANCE_INV_RATIO: usize = 10;
            if max_shards.len()
                < min_shards.len() + min_shards.len().div_ceil(TOLERANCE_INV_RATIO).max(2)
            {
                break;
            }

            let shard = max_shards.pop().expect("shards should not be empty");
            shards_to_rebalance.push(shard.clone());
            min_shards.push(shard);
        }

        if shards_to_rebalance.is_empty() {
            debug!("no shards to rebalance");
        } else {
            info!(
                num_ready_shards,
                num_ready_ingesters,
                num_retiring_shards,
                num_shards_to_rebalance = shards_to_rebalance.len(),
                "rebalancing shards"
            );
        }
        shards_to_rebalance
    }

    /// Attempts to close the list of shards passed as argument.
    ///
    /// If ingesters are not available, the shards are not closed.
    fn close_shards(
        &self,
        shards_to_close: Vec<Shard>,
    ) -> impl Future<Output = Vec<ShardPKey>> + Send + 'static {
        let mut per_leader_shards_to_close: HashMap<LeaderId, Vec<ShardPKey>> = HashMap::new();

        for shard in shards_to_close {
            let shard_pkey = ShardPKey {
                index_uid: shard.index_uid,
                source_id: shard.source_id,
                shard_id: shard.shard_id,
            };
            let leader_id = NodeId::from(shard.leader_id);
            per_leader_shards_to_close
                .entry(leader_id)
                .or_default()
                .push(shard_pkey);
        }
        let mut close_shards_futures = FuturesUnordered::new();

        for (leader_id, shard_pkeys) in per_leader_shards_to_close {
            let Some(ingester) = self.ingester_pool.get(&leader_id) else {
                warn!("failed to close shards: ingester `{leader_id}` is unavailable");
                continue;
            };
            let shards_to_close_request = CloseShardsRequest { shard_pkeys };
            let close_shards_future = async move {
                tokio::time::timeout(
                    CLOSE_SHARDS_REQUEST_TIMEOUT,
                    ingester.client.close_shards(shards_to_close_request),
                )
                .await
            };
            close_shards_futures.push(close_shards_future);
        }
        async move {
            let mut closed_shards = Vec::new();

            while let Some(close_shards_result) = close_shards_futures.next().await {
                match close_shards_result {
                    Ok(Ok(CloseShardsResponse { successes })) => {
                        closed_shards.extend(successes);
                    }
                    Ok(Err(error)) => {
                        error!(%error, "failed to close shards");
                    }
                    Err(_elapsed) => {
                        error!("close shards request timed out");
                    }
                }
            }
            closed_shards
        }
    }
}

fn summarize_shard_ids(shard_ids: &[ShardIds]) -> Vec<&str> {
    shard_ids
        .iter()
        .flat_map(|source_shard_ids| {
            source_shard_ids
                .shard_ids
                .iter()
                .map(|shard_id| shard_id.as_str())
        })
        .collect()
}

/// When rebalancing shards, shards to move are closed some time after new shards are opened.
/// Because we don't want to stall the control plane event loop while waiting for the close shards
/// requests to complete, we use a callback to handle the results of those close shards requests.
#[derive(Debug)]
pub(crate) struct RebalanceShardsCallback {
    pub closed_shards: Vec<ShardPKey>,
    pub rebalance_guard: OwnedMutexGuard<()>,
}

/// Finds a shard on the ingester with the highest number of open
/// shards for this source.
///
/// If multiple shards are hosted on that ingester, the shard with the lowest (oldest)
/// shard ID is chosen.
fn find_scale_down_candidate(
    source_uid: &SourceUid,
    model: &ControlPlaneModel,
) -> Option<(NodeId, ShardId)> {
    let mut per_leader_shard_entries: HashMap<&String, Vec<&ShardEntry>> = HashMap::new();
    let mut rng = rng();

    for shard in model.get_shards_for_source(source_uid)?.values() {
        if shard.is_open() {
            per_leader_shard_entries
                .entry(&shard.leader_id)
                .or_default()
                .push(shard);
        }
    }
    per_leader_shard_entries
        .into_iter()
        // We use a random number to break ties... The HashMap is randomly seeded so this is
        // should not make much difference, but we might want to be as explicit as possible.
        .max_by_key(|(_leader_id, shard_entries)| (shard_entries.len(), rng.next_u32()))
        .map(|(leader_id, shard_entries)| {
            (
                leader_id.clone().into(),
                shard_entries.choose(&mut rng).unwrap().shard_id().clone(),
            )
        })
}

#[cfg(test)]
mod tests {
    use std::collections::BTreeSet;
    use std::str::FromStr;
    use std::sync::Arc;
    use std::sync::atomic::{AtomicUsize, Ordering};

    use itertools::Itertools;
    use quickwit_actors::Universe;
    use quickwit_common::setup_logging_for_tests;
    use quickwit_common::shared_consts::DEFAULT_SHARD_THROUGHPUT_LIMIT;
    use quickwit_common::tower::DelayLayer;
    use quickwit_config::{DocMapping, INGEST_V2_SOURCE_ID, SourceConfig};
    use quickwit_ingest::{IngesterPoolEntry, RateMibPerSec, ShardInfo};
    use quickwit_metastore::IndexMetadata;
    use quickwit_proto::control_plane::GetOrCreateOpenShardsSubrequest;
    use quickwit_proto::ingest::ingester::{
        CloseShardsResponse, IngesterServiceClient, IngesterStatus, InitShardSuccess,
        InitShardsResponse, MockIngesterService, RetainShardsResponse,
    };
    use quickwit_proto::ingest::{IngestV2Error, Shard, ShardState};
    use quickwit_proto::metastore::{
        self, MetastoreError, MockMetastoreService, OpenShardSubresponse,
    };
    use quickwit_proto::types::{DocMappingUid, Position, SourceId};

    use super::*;

    const TEST_SHARD_THROUGHPUT_LIMIT_MIB: f32 =
        DEFAULT_SHARD_THROUGHPUT_LIMIT.as_u64() as f32 / quickwit_common::shared_consts::MIB as f32;

    #[tokio::test]
    async fn test_ingest_controller_get_or_create_open_shards() {
        let source_id: &'static str = "test-source";

        let index_id_0 = "test-index-0";
        let mut index_metadata_0 =
            IndexMetadata::for_test(index_id_0, "ram://indexes/test-index-0");
        let index_uid_0 = index_metadata_0.index_uid.clone();

        let doc_mapping_uid_0 = DocMappingUid::random();
        index_metadata_0.index_config.doc_mapping.doc_mapping_uid = doc_mapping_uid_0;

        let index_id_1 = "test-index-1";
        let mut index_metadata_1 =
            IndexMetadata::for_test(index_id_1, "ram://indexes/test-index-1");
        let index_uid_1 = index_metadata_1.index_uid.clone();

        let doc_mapping_uid_1 = DocMappingUid::random();
        index_metadata_1.index_config.doc_mapping.doc_mapping_uid = doc_mapping_uid_1;

        let progress = Progress::default();

        let mut mock_metastore = MockMetastoreService::new();
        mock_metastore.expect_open_shards().once().returning({
            let index_uid_1 = index_uid_1.clone();

            move |request| {
                assert_eq!(request.subrequests.len(), 1);
                assert_eq!(request.subrequests[0].index_uid(), &index_uid_1);
                assert_eq!(request.subrequests[0].source_id, source_id);
                assert_eq!(request.subrequests[0].doc_mapping_uid(), doc_mapping_uid_1);

                let subresponses = vec![metastore::OpenShardSubresponse {
                    subrequest_id: 1,
                    open_shard: Some(Shard {
                        index_uid: index_uid_1.clone().into(),
                        source_id: source_id.to_string(),
                        shard_id: Some(ShardId::from(1)),
                        shard_state: ShardState::Open as i32,
                        leader_id: "test-ingester-2".to_string(),
                        doc_mapping_uid: Some(doc_mapping_uid_1),
                        ..Default::default()
                    }),
                }];
                let response = metastore::OpenShardsResponse { subresponses };
                Ok(response)
            }
        });
        let metastore = MetastoreServiceClient::from_mock(mock_metastore);

        let mock_ingester = MockIngesterService::new();
        let client = IngesterServiceClient::from_mock(mock_ingester);

        let ingester_pool = IngesterPool::default();
        ingester_pool.insert(
            NodeId::from("test-ingester-1"),
            IngesterPoolEntry::ready_with_client(client.clone()),
        );

        let mut mock_ingester = MockIngesterService::new();
        let index_uid_1_clone = index_uid_1.clone();
        mock_ingester
            .expect_init_shards()
            .once()
            .returning(move |request| {
                assert_eq!(request.subrequests.len(), 1);

                let subrequest = &request.subrequests[0];

                let shard = subrequest.shard();
                assert_eq!(shard.index_uid(), &index_uid_1_clone);
                assert_eq!(shard.source_id, source_id);
                assert_eq!(shard.leader_id, "test-ingester-2");

                let successes = vec![InitShardSuccess {
                    subrequest_id: request.subrequests[0].subrequest_id,
                    shard: Some(shard.clone()),
                }];
                let response = InitShardsResponse {
                    successes,
                    failures: Vec::new(),
                };
                Ok(response)
            });
        let ingester = IngesterServiceClient::from_mock(mock_ingester);
        ingester_pool.insert(
            NodeId::from("test-ingester-2"),
            IngesterPoolEntry::ready_with_client(ingester.clone()),
        );

        let replication_factor = 2;
        let mut controller = IngestController::new(
            metastore,
            ingester_pool.clone(),
            replication_factor,
            TEST_SHARD_THROUGHPUT_LIMIT_MIB,
            1.001,
        );

        let mut model = ControlPlaneModel::default();
        model.add_index(index_metadata_0.clone());
        model.add_index(index_metadata_1.clone());

        let mut source_config = SourceConfig::ingest_v2();
        source_config.source_id = source_id.to_string();

        model
            .add_source(&index_uid_0, source_config.clone())
            .unwrap();
        model.add_source(&index_uid_1, source_config).unwrap();

        let shards = vec![
            Shard {
                index_uid: index_uid_0.clone().into(),
                source_id: source_id.to_string(),
                shard_id: Some(ShardId::from(1)),
                leader_id: "test-ingester-0".to_string(),
                shard_state: ShardState::Open as i32,
                doc_mapping_uid: Some(doc_mapping_uid_0),
                ..Default::default()
            },
            Shard {
                index_uid: index_uid_0.clone().into(),
                source_id: source_id.to_string(),
                shard_id: Some(ShardId::from(2)),
                leader_id: "test-ingester-1".to_string(),
                shard_state: ShardState::Open as i32,
                doc_mapping_uid: Some(doc_mapping_uid_0),
                ..Default::default()
            },
        ];

        model.insert_shards(&index_uid_0, &source_id.into(), shards);

        let request = GetOrCreateOpenShardsRequest {
            subrequests: Vec::new(),
            closed_shards: Vec::new(),
            unavailable_leaders: Vec::new(),
        };
        let response = controller
            .get_or_create_open_shards(request, &mut model, &progress)
            .await
            .unwrap();

        assert_eq!(response.successes.len(), 0);
        assert_eq!(response.failures.len(), 0);

        let subrequests = vec![
            GetOrCreateOpenShardsSubrequest {
                subrequest_id: 0,
                index_id: "test-index-0".to_string(),
                source_id: source_id.to_string(),
            },
            GetOrCreateOpenShardsSubrequest {
                subrequest_id: 1,
                index_id: "test-index-1".to_string(),
                source_id: source_id.to_string(),
            },
            GetOrCreateOpenShardsSubrequest {
                subrequest_id: 2,
                index_id: "index-not-found".to_string(),
                source_id: "source-not-found".to_string(),
            },
            GetOrCreateOpenShardsSubrequest {
                subrequest_id: 3,
                index_id: "test-index-0".to_string(),
                source_id: "source-not-found".to_string(),
            },
        ];
        let closed_shards = Vec::new();
        let unavailable_leaders = vec!["test-ingester-0".to_string()];
        let request = GetOrCreateOpenShardsRequest {
            subrequests,
            closed_shards,
            unavailable_leaders,
        };
        let response = controller
            .get_or_create_open_shards(request, &mut model, &progress)
            .await
            .unwrap();

        assert_eq!(response.successes.len(), 2);
        assert_eq!(response.failures.len(), 2);

        let success = &response.successes[0];
        assert_eq!(success.subrequest_id, 0);
        assert_eq!(success.index_uid(), &index_uid_0);
        assert_eq!(success.source_id, source_id);
        assert_eq!(success.open_shards.len(), 1);
        assert_eq!(success.open_shards[0].shard_id(), ShardId::from(2));
        assert_eq!(success.open_shards[0].leader_id, "test-ingester-1");
        assert_eq!(success.open_shards[0].doc_mapping_uid(), doc_mapping_uid_0);

        let success = &response.successes[1];
        assert_eq!(success.subrequest_id, 1);
        assert_eq!(success.index_uid(), &index_uid_1);
        assert_eq!(success.source_id, source_id);
        assert_eq!(success.open_shards.len(), 1);
        assert_eq!(success.open_shards[0].shard_id(), ShardId::from(1));
        assert_eq!(success.open_shards[0].leader_id, "test-ingester-2");
        assert_eq!(success.open_shards[0].doc_mapping_uid(), doc_mapping_uid_1);

        let failure = &response.failures[0];
        assert_eq!(failure.subrequest_id, 2);
        assert_eq!(failure.index_id, "index-not-found");
        assert_eq!(failure.source_id, "source-not-found");
        assert_eq!(
            failure.reason(),
            GetOrCreateOpenShardsFailureReason::IndexNotFound
        );

        let failure = &response.failures[1];
        assert_eq!(failure.subrequest_id, 3);
        assert_eq!(failure.index_id, index_id_0);
        assert_eq!(failure.source_id, "source-not-found");
        assert_eq!(
            failure.reason(),
            GetOrCreateOpenShardsFailureReason::SourceNotFound
        );

        assert_eq!(model.num_shards(), 3);
    }

    #[tokio::test]
    async fn test_ingest_controller_get_or_create_open_shards_metastore_failure() {
        let source_id: &'static str = "test-source";

        let index_id_0 = "test-index-0";
        let index_metadata_0 = IndexMetadata::for_test(index_id_0, "ram://indexes/test-index-0");
        let index_uid_0 = index_metadata_0.index_uid.clone();
        let index_uid_0_clone = index_uid_0.clone();

        let progress = Progress::default();

        let mut mock_metastore = MockMetastoreService::new();
        mock_metastore
            .expect_open_shards()
            .once()
            .returning(move |_| {
                Err(MetastoreError::Internal {
                    message: "this error could be mean anything. transaction success or failure!"
                        .to_string(),
                    cause: "".to_string(),
                })
            });
        let metastore = MetastoreServiceClient::from_mock(mock_metastore);

        let mut mock_ingester = MockIngesterService::new();
        mock_ingester
            .expect_init_shards()
            .once()
            .returning(move |request| {
                assert_eq!(request.subrequests.len(), 1);

                let subrequest = &request.subrequests[0];

                let shard = subrequest.shard();
                assert_eq!(shard.index_uid(), &index_uid_0);
                assert_eq!(shard.source_id, source_id);
                assert_eq!(shard.leader_id, "test-ingester-1");

                let successes = vec![InitShardSuccess {
                    subrequest_id: request.subrequests[0].subrequest_id,
                    shard: Some(shard.clone()),
                }];
                let response = InitShardsResponse {
                    successes,
                    failures: Vec::new(),
                };
                Ok(response)
            });
        let client = IngesterServiceClient::from_mock(mock_ingester);

        let ingester_pool = IngesterPool::default();
        ingester_pool.insert(
            NodeId::from("test-ingester-1"),
            IngesterPoolEntry::ready_with_client(client.clone()),
        );

        let replication_factor = 1;
        let mut controller = IngestController::new(
            metastore,
            ingester_pool,
            replication_factor,
            TEST_SHARD_THROUGHPUT_LIMIT_MIB,
            1.001,
        );

        let mut model = ControlPlaneModel::default();
        model.add_index(index_metadata_0.clone());

        let mut source_config = SourceConfig::ingest_v2();
        source_config.source_id = source_id.to_string();

        model
            .add_source(&index_uid_0_clone, source_config.clone())
            .unwrap();

        let subrequests = vec![GetOrCreateOpenShardsSubrequest {
            subrequest_id: 0,
            index_id: "test-index-0".to_string(),
            source_id: source_id.to_string(),
        }];
        let request = GetOrCreateOpenShardsRequest {
            subrequests,
            closed_shards: Vec::new(),
            unavailable_leaders: Vec::new(),
        };

        let metastore_error = controller
            .get_or_create_open_shards(request, &mut model, &progress)
            .await
            .unwrap_err();

        assert!(!metastore_error.is_transaction_certainly_aborted());
    }

    #[tokio::test]
    async fn test_ingest_controller_get_open_shards_handles_closed_shards() {
        let metastore = MetastoreServiceClient::mocked();
        let ingester_pool = IngesterPool::default();
        let replication_factor = 2;

        let mut controller = IngestController::new(
            metastore,
            ingester_pool,
            replication_factor,
            TEST_SHARD_THROUGHPUT_LIMIT_MIB,
            1.001,
        );
        let mut model = ControlPlaneModel::default();

        let index_uid = IndexUid::for_test("test-index-0", 0);
        let source_id: SourceId = "test-source".to_string();

        let shards = vec![Shard {
            shard_id: Some(ShardId::from(1)),
            index_uid: Some(index_uid.clone()),
            source_id: source_id.clone(),
            leader_id: "test-ingester-0".to_string(),
            shard_state: ShardState::Open as i32,
            ..Default::default()
        }];
        model.insert_shards(&index_uid, &source_id, shards);

        let request = GetOrCreateOpenShardsRequest {
            subrequests: Vec::new(),
            closed_shards: vec![ShardIds {
                index_uid: index_uid.clone().into(),
                source_id: source_id.clone(),
                shard_ids: vec![ShardId::from(1), ShardId::from(2)],
            }],
            unavailable_leaders: Vec::new(),
        };
        let progress = Progress::default();

        controller
            .get_or_create_open_shards(request, &mut model, &progress)
            .await
            .unwrap();

        let shard_1 = model
            .all_shards()
            .find(|shard| shard.shard_id() == ShardId::from(1))
            .unwrap();
        assert!(shard_1.is_closed());
    }

    #[test]
    fn test_ingest_controller_allocate_shards() {
        let metastore = MetastoreServiceClient::mocked();
        let ingester_pool = IngesterPool::default();
        let replication_factor = 2;

        let controller = IngestController::new(
            metastore,
            ingester_pool.clone(),
            replication_factor,
            TEST_SHARD_THROUGHPUT_LIMIT_MIB,
            1.001,
        );

        let mut model = ControlPlaneModel::default();

        let leader_follower_pairs_opt =
            controller.allocate_shards(0, &FnvHashSet::default(), &model);
        assert!(leader_follower_pairs_opt.is_none());

        ingester_pool.insert(
            NodeId::from("test-ingester-1"),
            IngesterPoolEntry::ready_with_client(IngesterServiceClient::mocked()),
        );

        let leader_follower_pairs_opt =
            controller.allocate_shards(0, &FnvHashSet::default(), &model);

        // We have only one node so with a replication factor of 2, we can't
        // find any solution.
        assert!(leader_follower_pairs_opt.is_none());

        ingester_pool.insert(
            "test-ingester-2".into(),
            IngesterPoolEntry::ready_with_client(IngesterServiceClient::mocked()),
        );

        let leader_follower_pairs = controller
            .allocate_shards(0, &FnvHashSet::default(), &model)
            .unwrap();

        // We tried to allocate 0 shards, so an empty vec makes sense.
        assert!(leader_follower_pairs.is_empty());

        let leader_follower_pairs = controller
            .allocate_shards(1, &FnvHashSet::default(), &model)
            .unwrap();

        assert_eq!(leader_follower_pairs.len(), 1);

        // The leader follower is picked at random: both ingester have the same number of shards.
        if leader_follower_pairs[0].0 == "test-ingester-1" {
            assert_eq!(
                leader_follower_pairs[0].1,
                Some(NodeId::from("test-ingester-2"))
            );
        } else {
            assert_eq!(leader_follower_pairs[0].0, "test-ingester-2");
            assert_eq!(
                leader_follower_pairs[0].1,
                Some(NodeId::from("test-ingester-1"))
            );
        }

        let leader_follower_pairs = controller
            .allocate_shards(2, &FnvHashSet::default(), &model)
            .unwrap();
        assert_eq!(leader_follower_pairs.len(), 2);

        for leader_follower_pair in leader_follower_pairs {
            if leader_follower_pair.0 == "test-ingester-1" {
                assert_eq!(
                    leader_follower_pair.1,
                    Some(NodeId::from("test-ingester-2"))
                );
            } else {
                assert_eq!(leader_follower_pair.0, "test-ingester-2");
                assert_eq!(
                    leader_follower_pair.1,
                    Some(NodeId::from("test-ingester-1"))
                );
            }
        }

        let leader_follower_pairs = controller
            .allocate_shards(3, &FnvHashSet::default(), &model)
            .unwrap();
        assert_eq!(leader_follower_pairs.len(), 3);
        let index_uid = IndexUid::for_test("test-index", 0);

        let source_id: SourceId = "test-source".to_string();
        let open_shards = vec![Shard {
            index_uid: Some(index_uid.clone()),
            source_id: source_id.clone(),
            shard_id: Some(ShardId::from(1)),
            shard_state: ShardState::Open as i32,
            leader_id: "test-ingester-1".to_string(),
            ..Default::default()
        }];
        model.insert_shards(&index_uid, &source_id, open_shards);

        let leader_follower_pairs = controller
            .allocate_shards(3, &FnvHashSet::default(), &model)
            .unwrap();
        assert_eq!(leader_follower_pairs.len(), 3);
        assert_eq!(leader_follower_pairs[0].0, "test-ingester-2");
        assert_eq!(
            leader_follower_pairs[0].1,
            Some(NodeId::from("test-ingester-1"))
        );

        assert_eq!(leader_follower_pairs[1].0, "test-ingester-2");
        assert_eq!(
            leader_follower_pairs[1].1,
            Some(NodeId::from("test-ingester-1"))
        );

        assert_eq!(leader_follower_pairs[2].0, "test-ingester-2");
        assert_eq!(
            leader_follower_pairs[2].1,
            Some(NodeId::from("test-ingester-1"))
        );

        let open_shards = vec![
            Shard {
                index_uid: Some(index_uid.clone()),
                source_id: source_id.clone(),
                shard_id: Some(ShardId::from(2)),
                shard_state: ShardState::Open as i32,
                leader_id: "test-ingester-1".to_string(),
                ..Default::default()
            },
            Shard {
                index_uid: Some(index_uid.clone()),
                source_id: source_id.clone(),
                shard_id: Some(ShardId::from(3)),
                shard_state: ShardState::Open as i32,
                leader_id: "test-ingester-1".to_string(),
                ..Default::default()
            },
        ];
        model.insert_shards(&index_uid, &source_id, open_shards);

        let leader_follower_pairs = controller
            .allocate_shards(1, &FnvHashSet::default(), &model)
            .unwrap();
        assert_eq!(leader_follower_pairs.len(), 1);
        // Ingester 1 already has two shards, so ingester 2 is picked as leader
        assert_eq!(leader_follower_pairs[0].0, "test-ingester-2");
        assert_eq!(
            leader_follower_pairs[0].1,
            Some(NodeId::from("test-ingester-1"))
        );

        ingester_pool.insert(
            "test-ingester-3".into(),
            IngesterPoolEntry::ready_with_client(IngesterServiceClient::mocked()),
        );
        let unavailable_leaders = FnvHashSet::from_iter([NodeId::from("test-ingester-2")]);
        let leader_follower_pairs = controller
            .allocate_shards(4, &unavailable_leaders, &model)
            .unwrap();
        // Ingester 2 is unavailable. Ingester 1 has open shards. Ingester 3 ends up leader.
        assert_eq!(leader_follower_pairs.len(), 4);
        assert_eq!(leader_follower_pairs[0].0, "test-ingester-3");
        assert_eq!(
            leader_follower_pairs[0].1,
            Some(NodeId::from("test-ingester-1"))
        );

        assert_eq!(leader_follower_pairs[1].0, "test-ingester-3");
        assert_eq!(
            leader_follower_pairs[1].1,
            Some(NodeId::from("test-ingester-1"))
        );

        assert_eq!(leader_follower_pairs[2].0, "test-ingester-3");
        assert_eq!(
            leader_follower_pairs[2].1,
            Some(NodeId::from("test-ingester-1"))
        );

        assert_eq!(leader_follower_pairs[3].0, "test-ingester-3");
        assert_eq!(
            leader_follower_pairs[3].1,
            Some(NodeId::from("test-ingester-1"))
        );
    }

    #[tokio::test]
    async fn test_ingest_controller_init_shards() {
        let metastore = MetastoreServiceClient::mocked();
        let ingester_pool = IngesterPool::default();
        let replication_factor = 1;

        let controller = IngestController::new(
            metastore,
            ingester_pool.clone(),
            replication_factor,
            TEST_SHARD_THROUGHPUT_LIMIT_MIB,
            1.001,
        );

        let ingester_id_0 = NodeId::from("test-ingester-0");
        let mut mock_ingester_0 = MockIngesterService::new();
        mock_ingester_0
            .expect_init_shards()
            .once()
            .returning(|mut request| {
                assert_eq!(request.subrequests.len(), 2);

                request
                    .subrequests
                    .sort_by_key(|subrequest| subrequest.subrequest_id);

                let subrequest_0 = &request.subrequests[0];
                assert_eq!(subrequest_0.subrequest_id, 0);

                let shard_0 = request.subrequests[0].shard();
                assert_eq!(shard_0.index_uid(), &("test-index", 0));
                assert_eq!(shard_0.source_id, "test-source");
                assert_eq!(shard_0.shard_id(), ShardId::from(0));
                assert_eq!(shard_0.leader_id, "test-ingester-0");

                let subrequest_1 = &request.subrequests[1];
                assert_eq!(subrequest_1.subrequest_id, 1);

                let shard_1 = request.subrequests[1].shard();
                assert_eq!(shard_1.index_uid(), &("test-index", 0));
                assert_eq!(shard_1.source_id, "test-source");
                assert_eq!(shard_1.shard_id(), ShardId::from(1));
                assert_eq!(shard_1.leader_id, "test-ingester-0");

                let successes = vec![InitShardSuccess {
                    subrequest_id: 0,
                    shard: Some(shard_0.clone()),
                }];
                let failures = vec![InitShardFailure {
                    subrequest_id: 1,
                    index_uid: shard_1.index_uid.clone(),
                    source_id: shard_1.source_id.clone(),
                    shard_id: shard_1.shard_id.clone(),
                }];
                let response = InitShardsResponse {
                    successes,
                    failures,
                };
                Ok(response)
            });
        let ingester_0 = IngesterServiceClient::from_mock(mock_ingester_0);
        ingester_pool.insert(
            ingester_id_0,
            IngesterPoolEntry::ready_with_client(ingester_0),
        );

        let ingester_id_1 = NodeId::from("test-ingester-1");
        let mut mock_ingester_1 = MockIngesterService::new();
        mock_ingester_1
            .expect_init_shards()
            .once()
            .returning(|request| {
                assert_eq!(request.subrequests.len(), 1);

                let subrequest = &request.subrequests[0];
                assert_eq!(subrequest.subrequest_id, 2);

                let shard = request.subrequests[0].shard();
                assert_eq!(shard.index_uid(), &("test-index", 0));
                assert_eq!(shard.source_id, "test-source");
                assert_eq!(shard.shard_id(), ShardId::from(2));
                assert_eq!(shard.leader_id, "test-ingester-1");

                Err(IngestV2Error::Internal("internal error".to_string()))
            });
        let ingester_1 =
            IngesterPoolEntry::ready_with_client(IngesterServiceClient::from_mock(mock_ingester_1));
        ingester_pool.insert(ingester_id_1, ingester_1);

        let ingester_id_2 = NodeId::from("test-ingester-2");
        let mut mock_ingester_2 = MockIngesterService::new();
        mock_ingester_2.expect_init_shards().never();

        let client_2 = IngesterServiceClient::tower()
            .stack_init_shards_layer(DelayLayer::new(INIT_SHARDS_REQUEST_TIMEOUT * 2))
            .build_from_mock(mock_ingester_2);
        ingester_pool.insert(
            ingester_id_2,
            IngesterPoolEntry::ready_with_client(client_2),
        );

        let init_shards_response = controller
            .init_shards(Vec::new(), &Progress::default())
            .await;
        assert_eq!(init_shards_response.successes.len(), 0);
        assert_eq!(init_shards_response.failures.len(), 0);

        // In this test:
        // - ingester 0 will initialize shard 0 successfully and fail to initialize shard 1;
        // - ingester 1 will return an error;
        // - ingester 2 will time out;
        // - ingester 3 will be unavailable.

        let init_shard_subrequests: Vec<InitShardSubrequest> = vec![
            InitShardSubrequest {
                subrequest_id: 0,
                shard: Some(Shard {
                    index_uid: IndexUid::for_test("test-index", 0).into(),
                    source_id: "test-source".to_string(),
                    shard_id: Some(ShardId::from(0)),
                    leader_id: "test-ingester-0".to_string(),
                    shard_state: ShardState::Open as i32,
                    ..Default::default()
                }),
                doc_mapping_json: "{}".to_string(),
                validate_docs: false,
            },
            InitShardSubrequest {
                subrequest_id: 1,
                shard: Some(Shard {
                    index_uid: IndexUid::for_test("test-index", 0).into(),
                    source_id: "test-source".to_string(),
                    shard_id: Some(ShardId::from(1)),
                    leader_id: "test-ingester-0".to_string(),
                    shard_state: ShardState::Open as i32,
                    ..Default::default()
                }),
                doc_mapping_json: "{}".to_string(),
                validate_docs: false,
            },
            InitShardSubrequest {
                subrequest_id: 2,
                shard: Some(Shard {
                    index_uid: IndexUid::for_test("test-index", 0).into(),
                    source_id: "test-source".to_string(),
                    shard_id: Some(ShardId::from(2)),
                    leader_id: "test-ingester-1".to_string(),
                    shard_state: ShardState::Open as i32,
                    ..Default::default()
                }),
                doc_mapping_json: "{}".to_string(),
                validate_docs: false,
            },
            InitShardSubrequest {
                subrequest_id: 3,
                shard: Some(Shard {
                    index_uid: IndexUid::for_test("test-index", 0).into(),
                    source_id: "test-source".to_string(),
                    shard_id: Some(ShardId::from(3)),
                    leader_id: "test-ingester-2".to_string(),
                    shard_state: ShardState::Open as i32,
                    ..Default::default()
                }),
                doc_mapping_json: "{}".to_string(),
                validate_docs: false,
            },
            InitShardSubrequest {
                subrequest_id: 4,
                shard: Some(Shard {
                    index_uid: IndexUid::for_test("test-index", 0).into(),
                    source_id: "test-source".to_string(),
                    shard_id: Some(ShardId::from(4)),
                    leader_id: "test-ingester-3".to_string(),
                    shard_state: ShardState::Open as i32,
                    ..Default::default()
                }),
                doc_mapping_json: "{}".to_string(),
                validate_docs: false,
            },
        ];
        let init_shards_response = controller
            .init_shards(init_shard_subrequests, &Progress::default())
            .await;
        assert_eq!(init_shards_response.successes.len(), 1);
        assert_eq!(init_shards_response.failures.len(), 4);

        let success = &init_shards_response.successes[0];
        assert_eq!(success.subrequest_id, 0);

        let mut failures = init_shards_response.failures;
        failures.sort_by_key(|failure| failure.subrequest_id);

        assert_eq!(failures[0].subrequest_id, 1);
        assert_eq!(failures[1].subrequest_id, 2);
        assert_eq!(failures[2].subrequest_id, 3);
        assert_eq!(failures[3].subrequest_id, 4);
    }

    #[tokio::test]
    async fn test_ingest_controller_try_open_shards() {
        let doc_mapping_uid = DocMappingUid::random();
        let expected_doc_mapping = doc_mapping_uid;

        let mut mock_metastore = MockMetastoreService::new();
        mock_metastore
            .expect_open_shards()
            .once()
            .returning(move |request| {
                assert_eq!(request.subrequests.len(), 1);

                let subrequest = &request.subrequests[0];
                assert_eq!(subrequest.subrequest_id, 0);

                assert_eq!(subrequest.index_uid(), &("test-index", 0));
                assert_eq!(subrequest.source_id, "test-source");
                assert_eq!(subrequest.leader_id, "test-ingester-1");
                assert_eq!(subrequest.doc_mapping_uid(), expected_doc_mapping);

                let subresponses = vec![metastore::OpenShardSubresponse {
                    subrequest_id: 0,
                    open_shard: Some(Shard {
                        index_uid: Some(IndexUid::for_test("test-index", 0)),
                        source_id: "test-source".to_string(),
                        shard_id: Some(ShardId::from(0)),
                        leader_id: "test-ingester-1".to_string(),
                        shard_state: ShardState::Open as i32,
                        doc_mapping_uid: Some(expected_doc_mapping),
                        ..Default::default()
                    }),
                }];
                let response = metastore::OpenShardsResponse { subresponses };
                Ok(response)
            });
        let metastore = MetastoreServiceClient::from_mock(mock_metastore);
        let ingester_pool = IngesterPool::default();
        let replication_factor = 1;

        let mut controller = IngestController::new(
            metastore,
            ingester_pool.clone(),
            replication_factor,
            TEST_SHARD_THROUGHPUT_LIMIT_MIB,
            1.001,
        );

        let index_uid = IndexUid::for_test("test-index", 0);
        let source_id = "test-source".to_string();

        let source_uid = SourceUid {
            index_uid: index_uid.clone(),
            source_id: source_id.clone(),
        };
        let mut index_metadata = IndexMetadata::for_test("test-index", "ram://indexes/test-index");
        index_metadata.sources.insert(
            source_id.clone(),
            SourceConfig::for_test(&source_id, quickwit_config::SourceParams::void()),
        );

        let doc_mapping_json = format!(
            r#"{{
                "doc_mapping_uid": "{doc_mapping_uid}",
                "field_mappings": [{{
                        "name": "message",
                        "type": "text"
                }}]
            }}"#
        );
        let doc_mapping: DocMapping = serde_json::from_str(&doc_mapping_json).unwrap();
        let expected_doc_mapping = doc_mapping.clone();
        index_metadata.index_config.doc_mapping = doc_mapping;

        let mut model = ControlPlaneModel::default();
        model.add_index(index_metadata);

        let mut mock_ingester = MockIngesterService::new();
        mock_ingester
            .expect_init_shards()
            .once()
            .returning(move |request| {
                assert_eq!(request.subrequests.len(), 1);

                let subrequest = &request.subrequests[0];
                assert_eq!(subrequest.subrequest_id, 0);

                let doc_mapping: DocMapping =
                    serde_json::from_str(&subrequest.doc_mapping_json).unwrap();
                assert_eq!(doc_mapping, expected_doc_mapping);

                let shard = request.subrequests[0].shard();
                assert_eq!(shard.index_uid(), &("test-index", 0));
                assert_eq!(shard.source_id, "test-source");
                assert_eq!(shard.leader_id, "test-ingester-1");
                assert_eq!(shard.doc_mapping_uid(), doc_mapping_uid);

                let successes = vec![InitShardSuccess {
                    subrequest_id: 0,
                    shard: Some(shard.clone()),
                }];
                let response = InitShardsResponse {
                    successes,
                    failures: Vec::new(),
                };
                Ok(response)
            });

        ingester_pool.insert(
            NodeId::from("test-ingester-1"),
            IngesterPoolEntry::ready_with_client(IngesterServiceClient::from_mock(mock_ingester)),
        );
        let source_uids: HashMap<SourceUid, usize> = HashMap::from_iter([(source_uid.clone(), 1)]);
        let unavailable_leaders = FnvHashSet::default();
        let progress = Progress::default();

        let per_source_num_opened_shards = controller
            .try_open_shards(source_uids, &mut model, &unavailable_leaders, &progress)
            .await
            .unwrap();

        assert_eq!(per_source_num_opened_shards.len(), 1);
        assert_eq!(*per_source_num_opened_shards.get(&source_uid).unwrap(), 1);
    }

    #[tokio::test]
    async fn test_ingest_controller_handle_local_shards_update() {
        let mut mock_metastore = MockMetastoreService::new();
        mock_metastore
            .expect_open_shards()
            .once()
            .returning(|request| {
                assert_eq!(request.subrequests.len(), 1);
                let subrequest = &request.subrequests[0];

                assert_eq!(subrequest.index_uid(), &IndexUid::for_test("test-index", 0));
                assert_eq!(subrequest.source_id, "test-source");
                assert_eq!(subrequest.leader_id, "test-ingester");

                Err(MetastoreError::InvalidArgument {
                    message: "failed to open shards".to_string(),
                })
            });
        mock_metastore
            .expect_open_shards()
            .once()
            .returning(|request| {
                assert_eq!(request.subrequests.len(), 1);
                let subrequest: &OpenShardSubrequest = &request.subrequests[0];

                assert_eq!(subrequest.index_uid(), &IndexUid::for_test("test-index", 0));
                assert_eq!(subrequest.source_id, "test-source");
                assert_eq!(subrequest.leader_id, "test-ingester");

                let shard = Shard {
                    index_uid: subrequest.index_uid.clone(),
                    source_id: subrequest.source_id.clone(),
                    shard_id: subrequest.shard_id.clone(),
                    shard_state: ShardState::Open as i32,
                    leader_id: subrequest.leader_id.clone(),
                    follower_id: subrequest.follower_id.clone(),
                    doc_mapping_uid: subrequest.doc_mapping_uid,
                    publish_position_inclusive: Some(Position::Beginning),
                    publish_token: None,
                    update_timestamp: 1724158996,
                };
                let response = OpenShardsResponse {
                    subresponses: vec![OpenShardSubresponse {
                        subrequest_id: subrequest.subrequest_id,
                        open_shard: Some(shard),
                    }],
                };
                Ok(response)
            });
        let metastore = MetastoreServiceClient::from_mock(mock_metastore);
        let ingester_pool = IngesterPool::default();
        let replication_factor = 1;

        let mut controller = IngestController::new(
            metastore,
            ingester_pool.clone(),
            replication_factor,
            TEST_SHARD_THROUGHPUT_LIMIT_MIB,
            1.001,
        );

        let index_uid = IndexUid::for_test("test-index", 0);
        let mut index_metadata = IndexMetadata::for_test("test-index", "ram://indexes/test-index");
        let source_id: SourceId = "test-source".to_string();
        index_metadata.sources.insert(
            source_id.clone(),
            SourceConfig::for_test(&source_id, quickwit_config::SourceParams::void()),
        );

        let source_uid = SourceUid {
            index_uid: index_uid.clone(),
            source_id: source_id.clone(),
        };
        let mut model = ControlPlaneModel::default();
        model.add_index(index_metadata);
        let progress = Progress::default();

        let shards = vec![Shard {
            index_uid: Some(index_uid.clone()),
            source_id: source_id.clone(),
            shard_id: Some(ShardId::from(1)),
            leader_id: "test-ingester".to_string(),
            shard_state: ShardState::Open as i32,
            ..Default::default()
        }];
        model.insert_shards(&index_uid, &source_id, shards);
        let shard_entries: Vec<ShardEntry> = model.all_shards().cloned().collect();

        assert_eq!(shard_entries.len(), 1);
        assert_eq!(shard_entries[0].short_term_ingestion_rate, 0);

        // Test update shard ingestion rate but no scale down because num open shards is 1.
        let shard_infos = BTreeSet::from_iter([ShardInfo {
            shard_id: ShardId::from(1),
            shard_state: ShardState::Open,
            short_term_ingestion_rate: RateMibPerSec(1),
            long_term_ingestion_rate: RateMibPerSec(1),
        }]);
        let local_shards_update = LocalShardsUpdate {
            leader_id: "test-ingester".into(),
            source_uid: source_uid.clone(),
            shard_infos,
        };

        controller
            .handle_local_shards_update(local_shards_update, &mut model, &progress)
            .await
            .unwrap();

        let shard_entries: Vec<ShardEntry> = model.all_shards().cloned().collect();
        assert_eq!(shard_entries.len(), 1);
        assert_eq!(shard_entries[0].short_term_ingestion_rate, 1);

        // Test update shard ingestion rate with failing scale down.
        let shards = vec![Shard {
            index_uid: Some(index_uid.clone()),
            source_id: source_id.clone(),
            shard_id: Some(ShardId::from(2)),
            shard_state: ShardState::Open as i32,
            leader_id: "test-ingester".to_string(),
            ..Default::default()
        }];
        model.insert_shards(&index_uid, &source_id, shards);

        let shard_entries: Vec<ShardEntry> = model.all_shards().cloned().collect();
        assert_eq!(shard_entries.len(), 2);

        let mut mock_ingester = MockIngesterService::new();

        let index_uid_clone = index_uid.clone();
        mock_ingester.expect_init_shards().returning(
            move |init_shard_request: InitShardsRequest| {
                assert_eq!(init_shard_request.subrequests.len(), 1);
                let init_shard_subrequest: &InitShardSubrequest =
                    &init_shard_request.subrequests[0];
                assert!(init_shard_subrequest.validate_docs);
                Ok(InitShardsResponse {
                    successes: vec![InitShardSuccess {
                        subrequest_id: init_shard_subrequest.subrequest_id,
                        shard: init_shard_subrequest.shard.clone(),
                    }],
                    failures: Vec::new(),
                })
            },
        );
        mock_ingester
            .expect_close_shards()
            .returning(move |request| {
                assert_eq!(request.shard_pkeys.len(), 1);
                assert_eq!(request.shard_pkeys[0].index_uid(), &index_uid_clone);
                assert_eq!(request.shard_pkeys[0].source_id, "test-source");
                Err(IngestV2Error::Internal(
                    "failed to close shards".to_string(),
                ))
            });
        let ingester =
            IngesterPoolEntry::ready_with_client(IngesterServiceClient::from_mock(mock_ingester));
        ingester_pool.insert("test-ingester".into(), ingester);

        let shard_infos = BTreeSet::from_iter([
            ShardInfo {
                shard_id: ShardId::from(1),
                shard_state: ShardState::Open,
                short_term_ingestion_rate: RateMibPerSec(1),
                long_term_ingestion_rate: RateMibPerSec(1),
            },
            ShardInfo {
                shard_id: ShardId::from(2),
                shard_state: ShardState::Open,
                short_term_ingestion_rate: RateMibPerSec(1),
                long_term_ingestion_rate: RateMibPerSec(1),
            },
        ]);
        let local_shards_update = LocalShardsUpdate {
            leader_id: "test-ingester".into(),
            source_uid: source_uid.clone(),
            shard_infos,
        };
        controller
            .handle_local_shards_update(local_shards_update, &mut model, &progress)
            .await
            .unwrap();

        // Test update shard ingestion rate with failing scale up.
        let shard_infos = BTreeSet::from_iter([
            ShardInfo {
                shard_id: ShardId::from(1),
                shard_state: ShardState::Open,
                short_term_ingestion_rate: RateMibPerSec(4),
                long_term_ingestion_rate: RateMibPerSec(4),
            },
            ShardInfo {
                shard_id: ShardId::from(2),
                shard_state: ShardState::Open,
                short_term_ingestion_rate: RateMibPerSec(4),
                long_term_ingestion_rate: RateMibPerSec(4),
            },
        ]);
        let local_shards_update = LocalShardsUpdate {
            leader_id: "test-ingester".into(),
            source_uid: source_uid.clone(),
            shard_infos,
        };

        // The first request fails due to an error on the metastore.
        let MetastoreError::InvalidArgument { .. } = controller
            .handle_local_shards_update(local_shards_update.clone(), &mut model, &progress)
            .await
            .unwrap_err()
        else {
            panic!();
        };

        // The second request works!
        controller
            .handle_local_shards_update(local_shards_update, &mut model, &progress)
            .await
            .unwrap();
    }

    #[tokio::test]
    async fn test_ingest_controller_disable_validation_when_vrl() {
        let mut mock_metastore = MockMetastoreService::new();
        mock_metastore
            .expect_open_shards()
            .once()
            .returning(|request| {
                let subrequest: &OpenShardSubrequest = &request.subrequests[0];
                let shard = Shard {
                    index_uid: subrequest.index_uid.clone(),
                    source_id: subrequest.source_id.clone(),
                    shard_id: subrequest.shard_id.clone(),
                    shard_state: ShardState::Open as i32,
                    leader_id: subrequest.leader_id.clone(),
                    follower_id: subrequest.follower_id.clone(),
                    doc_mapping_uid: subrequest.doc_mapping_uid,
                    publish_position_inclusive: Some(Position::Beginning),
                    publish_token: None,
                    update_timestamp: 1724158996,
                };
                let response = OpenShardsResponse {
                    subresponses: vec![OpenShardSubresponse {
                        subrequest_id: subrequest.subrequest_id,
                        open_shard: Some(shard),
                    }],
                };
                Ok(response)
            });
        let metastore = MetastoreServiceClient::from_mock(mock_metastore);
        let ingester_pool = IngesterPool::default();
        let replication_factor = 1;

        let mut controller = IngestController::new(
            metastore,
            ingester_pool.clone(),
            replication_factor,
            TEST_SHARD_THROUGHPUT_LIMIT_MIB,
            1.001,
        );

        let index_uid = IndexUid::for_test("test-index", 0);
        let mut index_metadata = IndexMetadata::for_test("test-index", "ram://indexes/test-index");
        let source_id: SourceId = "test-source".to_string();
        let mut source_config =
            SourceConfig::for_test(&source_id, quickwit_config::SourceParams::void());
        // set a vrl script
        source_config.transform_config =
            Some(quickwit_config::TransformConfig::new("".to_string(), None));
        index_metadata
            .sources
            .insert(source_id.clone(), source_config);

        let source_uid = SourceUid {
            index_uid: index_uid.clone(),
            source_id: source_id.clone(),
        };
        let mut model = ControlPlaneModel::default();
        model.add_index(index_metadata);
        let progress = Progress::default();

        let shards = vec![Shard {
            index_uid: Some(index_uid.clone()),
            source_id: source_id.clone(),
            shard_id: Some(ShardId::from(1)),
            leader_id: "test-ingester".to_string(),
            shard_state: ShardState::Open as i32,
            ..Default::default()
        }];
        model.insert_shards(&index_uid, &source_id, shards);

        let mut mock_ingester = MockIngesterService::new();

        mock_ingester.expect_init_shards().returning(
            move |init_shard_request: InitShardsRequest| {
                assert_eq!(init_shard_request.subrequests.len(), 1);
                let init_shard_subrequest: &InitShardSubrequest =
                    &init_shard_request.subrequests[0];
                // we have vrl, so no validation
                assert!(!init_shard_subrequest.validate_docs);
                Ok(InitShardsResponse {
                    successes: vec![InitShardSuccess {
                        subrequest_id: init_shard_subrequest.subrequest_id,
                        shard: init_shard_subrequest.shard.clone(),
                    }],
                    failures: Vec::new(),
                })
            },
        );

        let ingester =
            IngesterPoolEntry::ready_with_client(IngesterServiceClient::from_mock(mock_ingester));
        ingester_pool.insert("test-ingester".into(), ingester);

        let shard_infos = BTreeSet::from_iter([ShardInfo {
            shard_id: ShardId::from(1),
            shard_state: ShardState::Open,
            short_term_ingestion_rate: RateMibPerSec(4),
            long_term_ingestion_rate: RateMibPerSec(4),
        }]);
        let local_shards_update = LocalShardsUpdate {
            leader_id: "test-ingester".into(),
            source_uid: source_uid.clone(),
            shard_infos,
        };

        controller
            .handle_local_shards_update(local_shards_update, &mut model, &progress)
            .await
            .unwrap();
    }

    #[tokio::test]
    async fn test_ingest_controller_try_scale_up_shards() {
        let mut mock_metastore = MockMetastoreService::new();

        let index_uid = IndexUid::from_str("test-index:00000000000000000000000000").unwrap();
        let index_uid_clone = index_uid.clone();
        mock_metastore
            .expect_open_shards()
            .once()
            .returning(move |request| {
                assert_eq!(request.subrequests.len(), 1);
                assert_eq!(request.subrequests[0].index_uid(), &index_uid_clone);
                assert_eq!(request.subrequests[0].source_id, INGEST_V2_SOURCE_ID);
                assert_eq!(request.subrequests[0].leader_id, "test-ingester");

                Err(MetastoreError::InvalidArgument {
                    message: "failed to open shards".to_string(),
                })
            });
        let index_uid_clone = index_uid.clone();
        mock_metastore
            .expect_open_shards()
            .returning(move |request| {
                assert_eq!(request.subrequests.len(), 1);
                assert_eq!(request.subrequests[0].index_uid(), &index_uid_clone);
                assert_eq!(request.subrequests[0].source_id, INGEST_V2_SOURCE_ID);
                assert_eq!(request.subrequests[0].leader_id, "test-ingester");

                let subresponses = vec![metastore::OpenShardSubresponse {
                    subrequest_id: 0,
                    open_shard: Some(Shard {
                        index_uid: Some(index_uid.clone()),
                        source_id: INGEST_V2_SOURCE_ID.to_string(),
                        shard_id: Some(ShardId::from(1)),
                        leader_id: "test-ingester".to_string(),
                        shard_state: ShardState::Open as i32,
                        ..Default::default()
                    }),
                }];
                let response = metastore::OpenShardsResponse { subresponses };
                Ok(response)
            });
        let metastore = MetastoreServiceClient::from_mock(mock_metastore);

        let ingester_pool = IngesterPool::default();
        let replication_factor = 1;

        let mut controller = IngestController::new(
            metastore,
            ingester_pool.clone(),
            replication_factor,
            TEST_SHARD_THROUGHPUT_LIMIT_MIB,
            1.001,
        );

        let index_uid = IndexUid::for_test("test-index", 0);
        let source_id: SourceId = INGEST_V2_SOURCE_ID.to_string();

        let source_uid = SourceUid {
            index_uid: index_uid.clone(),
            source_id: source_id.clone(),
        };
        let shard_stats = ShardStats {
            num_open_shards: 2,
            ..Default::default()
        };
        let mut model = ControlPlaneModel::default();
        let index_metadata =
            IndexMetadata::for_test(&index_uid.index_id, "ram://indexes/test-index:0");
        model.add_index(index_metadata);

        let source_config = SourceConfig::ingest_v2();
        model.add_source(&index_uid, source_config).unwrap();

        let progress = Progress::default();

        // Test could not find leader because no ingester in pool
        controller
            .try_scale_up_shards(source_uid.clone(), shard_stats, &mut model, &progress, 1)
            .await
            .unwrap();

        let mut mock_ingester = MockIngesterService::new();

        let index_uid_clone = index_uid.clone();
        mock_ingester
            .expect_init_shards()
            .once()
            .returning(move |request| {
                assert_eq!(request.subrequests.len(), 1);

                let subrequest = &request.subrequests[0];
                assert_eq!(subrequest.subrequest_id, 0);

                let shard = request.subrequests[0].shard();
                assert_eq!(shard.index_uid(), &index_uid_clone);
                assert_eq!(shard.source_id, INGEST_V2_SOURCE_ID);
                assert_eq!(shard.leader_id, "test-ingester");

                Err(IngestV2Error::Internal("failed to init shards".to_string()))
            });
        let index_uid_clone = index_uid.clone();
        mock_ingester
            .expect_init_shards()
            .returning(move |request| {
                assert_eq!(request.subrequests.len(), 1);

                let subrequest = &request.subrequests[0];
                assert_eq!(subrequest.subrequest_id, 0);

                let shard = subrequest.shard();
                assert_eq!(shard.index_uid(), &index_uid_clone);
                assert_eq!(shard.source_id, INGEST_V2_SOURCE_ID);
                assert_eq!(shard.leader_id, "test-ingester");

                let successes = vec![InitShardSuccess {
                    subrequest_id: request.subrequests[0].subrequest_id,
                    shard: Some(shard.clone()),
                }];
                let response = InitShardsResponse {
                    successes,
                    failures: Vec::new(),
                };
                Ok(response)
            });
        let ingester =
            IngesterPoolEntry::ready_with_client(IngesterServiceClient::from_mock(mock_ingester));
        ingester_pool.insert("test-ingester".into(), ingester);

        // Test failed to open shards.
        controller
            .try_scale_up_shards(source_uid.clone(), shard_stats, &mut model, &progress, 1)
            .await
            .unwrap();
        assert_eq!(model.all_shards().count(), 0);

        // Test failed to init shards.
        controller
            .try_scale_up_shards(source_uid.clone(), shard_stats, &mut model, &progress, 1)
            .await
            .unwrap_err();
        assert_eq!(model.all_shards().count(), 0);

        // Test successfully opened shard.
        controller
            .try_scale_up_shards(source_uid.clone(), shard_stats, &mut model, &progress, 1)
            .await
            .unwrap();
        assert_eq!(
            model.all_shards().filter(|shard| shard.is_open()).count(),
            1
        );
    }

    #[tokio::test]
    async fn test_ingest_controller_try_scale_down_shards() {
        let metastore = MetastoreServiceClient::mocked();
        let ingester_pool = IngesterPool::default();
        let replication_factor = 1;

        let controller = IngestController::new(
            metastore,
            ingester_pool.clone(),
            replication_factor,
            TEST_SHARD_THROUGHPUT_LIMIT_MIB,
            1.001,
        );

        let index_uid = IndexUid::for_test("test-index", 0);
        let source_id: SourceId = "test-source".to_string();

        let source_uid = SourceUid {
            index_uid: index_uid.clone(),
            source_id: source_id.clone(),
        };
        let shard_stats = ShardStats {
            num_open_shards: 2,
            ..Default::default()
        };
        let min_shards = NonZeroUsize::MIN;
        let mut model = ControlPlaneModel::default();
        let progress = Progress::default();

        // Test could not find a scale down candidate.
        controller
            .try_scale_down_shards(
                source_uid.clone(),
                shard_stats,
                min_shards,
                &mut model,
                &progress,
            )
            .await
            .unwrap();

        let shards = vec![Shard {
            shard_id: Some(ShardId::from(1)),
            index_uid: Some(index_uid.clone()),
            source_id: source_id.clone(),
            leader_id: "test-ingester".to_string(),
            shard_state: ShardState::Open as i32,
            ..Default::default()
        }];
        model.insert_shards(&index_uid, &source_id, shards);

        // Test ingester is unavailable.
        controller
            .try_scale_down_shards(
                source_uid.clone(),
                shard_stats,
                min_shards,
                &mut model,
                &progress,
            )
            .await
            .unwrap();

        let mut mock_ingester = MockIngesterService::new();

        let index_uid_clone = index_uid.clone();
        mock_ingester
            .expect_close_shards()
            .once()
            .returning(move |request| {
                assert_eq!(request.shard_pkeys.len(), 1);
                assert_eq!(request.shard_pkeys[0].index_uid(), &index_uid_clone);
                assert_eq!(request.shard_pkeys[0].source_id, "test-source");
                assert_eq!(request.shard_pkeys[0].shard_id(), ShardId::from(1));

                Err(IngestV2Error::Internal(
                    "failed to close shards".to_string(),
                ))
            });
        let index_uid_clone = index_uid.clone();
        mock_ingester
            .expect_close_shards()
            .once()
            .returning(move |request| {
                assert_eq!(request.shard_pkeys.len(), 1);
                assert_eq!(request.shard_pkeys[0].index_uid(), &index_uid_clone);
                assert_eq!(request.shard_pkeys[0].source_id, "test-source");
                assert_eq!(request.shard_pkeys[0].shard_id(), ShardId::from(1));

                let response = CloseShardsResponse {
                    successes: request.shard_pkeys,
                };
                Ok(response)
            });
        let ingester =
            IngesterPoolEntry::ready_with_client(IngesterServiceClient::from_mock(mock_ingester));
        ingester_pool.insert("test-ingester".into(), ingester);

        // Test failed to close shard.
        controller
            .try_scale_down_shards(
                source_uid.clone(),
                shard_stats,
                min_shards,
                &mut model,
                &progress,
            )
            .await
            .unwrap();
        assert!(model.all_shards().all(|shard| shard.is_open()));

        // Test successfully closed shard.
        controller
            .try_scale_down_shards(
                source_uid.clone(),
                shard_stats,
                min_shards,
                &mut model,
                &progress,
            )
            .await
            .unwrap();
        assert!(model.all_shards().all(|shard| shard.is_closed()));

        let shards = vec![Shard {
            shard_id: Some(ShardId::from(2)),
            index_uid: Some(index_uid.clone()),
            source_id: source_id.clone(),
            leader_id: "test-ingester".to_string(),
            shard_state: ShardState::Open as i32,
            ..Default::default()
        }];
        model.insert_shards(&index_uid, &source_id, shards);

        // Test rate limited.
        controller
            .try_scale_down_shards(
                source_uid.clone(),
                shard_stats,
                min_shards,
                &mut model,
                &progress,
            )
            .await
            .unwrap();
        assert!(model.all_shards().any(|shard| shard.is_open()));
    }

    #[test]
    fn test_find_scale_down_candidate() {
        let index_uid = IndexUid::for_test("test-index", 0);
        let source_id: SourceId = "test-source".to_string();

        let source_uid = SourceUid {
            index_uid: index_uid.clone(),
            source_id: source_id.clone(),
        };
        let mut model = ControlPlaneModel::default();

        assert!(find_scale_down_candidate(&source_uid, &model).is_none());

        let shards = vec![
            Shard {
                index_uid: index_uid.clone().into(),
                source_id: source_id.clone(),
                shard_id: Some(ShardId::from(1)),
                shard_state: ShardState::Open as i32,
                leader_id: "test-ingester-0".to_string(),
                ..Default::default()
            },
            Shard {
                index_uid: index_uid.clone().into(),
                source_id: source_id.clone(),
                shard_id: Some(ShardId::from(2)),
                shard_state: ShardState::Open as i32,
                leader_id: "test-ingester-0".to_string(),
                ..Default::default()
            },
            Shard {
                index_uid: index_uid.clone().into(),
                source_id: source_id.clone(),
                shard_id: Some(ShardId::from(3)),
                shard_state: ShardState::Closed as i32, //< this one is closed
                leader_id: "test-ingester-0".to_string(),
                ..Default::default()
            },
            Shard {
                index_uid: index_uid.clone().into(),
                source_id: source_id.clone(),
                shard_id: Some(ShardId::from(4)),
                shard_state: ShardState::Open as i32,
                leader_id: "test-ingester-1".to_string(),
                ..Default::default()
            },
            Shard {
                index_uid: index_uid.clone().into(),
                source_id: source_id.clone(),
                shard_id: Some(ShardId::from(5)),
                shard_state: ShardState::Open as i32,
                leader_id: "test-ingester-1".to_string(),
                ..Default::default()
            },
            Shard {
                index_uid: index_uid.clone().into(),
                source_id: source_id.clone(),
                shard_id: Some(ShardId::from(6)),
                shard_state: ShardState::Open as i32,
                leader_id: "test-ingester-1".to_string(),
                ..Default::default()
            },
        ];
        // That's 3 open shards on indexer-1, 2 open shard and one closed shard on indexer-0..
        model.insert_shards(&index_uid, &source_id, shards);

        let shard_infos = BTreeSet::from_iter([
            ShardInfo {
                shard_id: ShardId::from(1),
                shard_state: ShardState::Open,
                short_term_ingestion_rate: quickwit_ingest::RateMibPerSec(1),
                long_term_ingestion_rate: quickwit_ingest::RateMibPerSec(1),
            },
            ShardInfo {
                shard_id: ShardId::from(2),
                shard_state: ShardState::Open,
                short_term_ingestion_rate: quickwit_ingest::RateMibPerSec(2),
                long_term_ingestion_rate: quickwit_ingest::RateMibPerSec(2),
            },
            ShardInfo {
                shard_id: ShardId::from(3),
                shard_state: ShardState::Open,
                short_term_ingestion_rate: quickwit_ingest::RateMibPerSec(3),
                long_term_ingestion_rate: quickwit_ingest::RateMibPerSec(3),
            },
            ShardInfo {
                shard_id: ShardId::from(4),
                shard_state: ShardState::Open,
                short_term_ingestion_rate: quickwit_ingest::RateMibPerSec(4),
                long_term_ingestion_rate: quickwit_ingest::RateMibPerSec(4),
            },
            ShardInfo {
                shard_id: ShardId::from(5),
                shard_state: ShardState::Open,
                short_term_ingestion_rate: quickwit_ingest::RateMibPerSec(5),
                long_term_ingestion_rate: quickwit_ingest::RateMibPerSec(5),
            },
            ShardInfo {
                shard_id: ShardId::from(6),
                shard_state: ShardState::Open,
                short_term_ingestion_rate: quickwit_ingest::RateMibPerSec(6),
                long_term_ingestion_rate: quickwit_ingest::RateMibPerSec(6),
            },
        ]);
        model.update_shards(&source_uid, &shard_infos);

        let (leader_id, _shard_id) = find_scale_down_candidate(&source_uid, &model).unwrap();
        // We pick ingester 1 has it has more open shard
        assert_eq!(leader_id, "test-ingester-1");
    }

    #[tokio::test]
    async fn test_sync_with_ingesters() {
        let metastore = MetastoreServiceClient::mocked();
        let ingester_pool = IngesterPool::default();
        let replication_factor = 2;

        let controller = IngestController::new(
            metastore,
            ingester_pool.clone(),
            replication_factor,
            TEST_SHARD_THROUGHPUT_LIMIT_MIB,
            1.001,
        );

        let index_uid = IndexUid::for_test("test-index", 0);
        let source_id: SourceId = "test-source".to_string();
        let mut model = ControlPlaneModel::default();
        let shards = vec![
            Shard {
                index_uid: Some(index_uid.clone()),
                source_id: source_id.clone(),
                shard_id: Some(ShardId::from(1)),
                shard_state: ShardState::Open as i32,
                leader_id: "node-1".to_string(),
                follower_id: Some("node-2".to_string()),
                ..Default::default()
            },
            Shard {
                index_uid: Some(index_uid.clone()),
                source_id: source_id.clone(),
                shard_id: Some(ShardId::from(2)),
                shard_state: ShardState::Open as i32,
                leader_id: "node-2".to_string(),
                follower_id: Some("node-3".to_string()),
                ..Default::default()
            },
            Shard {
                index_uid: Some(index_uid.clone()),
                source_id: source_id.clone(),
                shard_id: Some(ShardId::from(3)),
                shard_state: ShardState::Open as i32,
                leader_id: "node-2".to_string(),
                follower_id: Some("node-1".to_string()),
                ..Default::default()
            },
        ];
        model.insert_shards(&index_uid, &source_id, shards);

        let mut mock_ingester_1 = MockIngesterService::new();
        let mock_ingester_2 = MockIngesterService::new();
        let mock_ingester_3 = MockIngesterService::new();

        let count_calls = Arc::new(AtomicUsize::new(0));
        let count_calls_clone = count_calls.clone();
        mock_ingester_1
            .expect_retain_shards()
            .once()
            .returning(move |request| {
                assert_eq!(request.retain_shards_for_sources.len(), 1);
                assert_eq!(
                    request.retain_shards_for_sources[0].shard_ids,
                    [ShardId::from(1), ShardId::from(3)]
                );
                count_calls_clone.fetch_add(1, Ordering::Release);
                Ok(RetainShardsResponse {})
            });
        ingester_pool.insert(
            "node-1".into(),
            IngesterPoolEntry::ready_with_client(IngesterServiceClient::from_mock(mock_ingester_1)),
        );
        ingester_pool.insert(
            "node-2".into(),
            IngesterPoolEntry::ready_with_client(IngesterServiceClient::from_mock(mock_ingester_2)),
        );
        ingester_pool.insert(
            "node-3".into(),
            IngesterPoolEntry::ready_with_client(IngesterServiceClient::from_mock(mock_ingester_3)),
        );
        let node_id = "node-1".into();
        let wait_handle = controller.sync_with_ingester(&node_id, &model);
        wait_handle.wait().await;
        assert_eq!(count_calls.load(Ordering::Acquire), 1);
    }

    #[tokio::test]
    async fn test_ingest_controller_advise_reset_shards() {
        let metastore = MetastoreServiceClient::mocked();
        let ingester_pool = IngesterPool::default();
        let replication_factor = 2;

        let controller = IngestController::new(
            metastore,
            ingester_pool,
            replication_factor,
            TEST_SHARD_THROUGHPUT_LIMIT_MIB,
            1.001,
        );

        let mut model = ControlPlaneModel::default();

        let index_uid = IndexUid::for_test("test-index", 0);
        let source_id_00: SourceId = "test-source-0".into();
        let source_id_01: SourceId = "test-source-1".into();

        let shards = vec![Shard {
            index_uid: Some(index_uid.clone()),
            source_id: source_id_00.clone(),
            shard_id: Some(ShardId::from(1)),
            shard_state: ShardState::Open as i32,
            publish_position_inclusive: Some(Position::offset(1337u64)),
            ..Default::default()
        }];
        model.insert_shards(&index_uid, &source_id_00, shards);

        let advise_reset_shards_request = AdviseResetShardsRequest {
            ingester_id: "test-ingester".to_string(),
            shard_ids: vec![
                ShardIds {
                    index_uid: Some(index_uid.clone()),
                    source_id: source_id_00.clone(),
                    shard_ids: vec![ShardId::from(1), ShardId::from(2)],
                },
                ShardIds {
                    index_uid: Some(index_uid.clone()),
                    source_id: source_id_01.clone(),
                    shard_ids: vec![ShardId::from(3)],
                },
            ],
        };
        let advise_reset_shards_response =
            controller.advise_reset_shards(advise_reset_shards_request, &model);

        assert_eq!(advise_reset_shards_response.shards_to_delete.len(), 2);

        let shard_to_delete_00 = &advise_reset_shards_response.shards_to_delete[0];
        assert_eq!(shard_to_delete_00.index_uid(), &index_uid);
        assert_eq!(shard_to_delete_00.source_id, source_id_00);
        assert_eq!(shard_to_delete_00.shard_ids.len(), 1);
        assert_eq!(shard_to_delete_00.shard_ids[0], ShardId::from(2));

        let shard_to_delete_01 = &advise_reset_shards_response.shards_to_delete[1];
        assert_eq!(shard_to_delete_01.index_uid(), &index_uid);
        assert_eq!(shard_to_delete_01.source_id, source_id_01);
        assert_eq!(shard_to_delete_01.shard_ids.len(), 1);
        assert_eq!(shard_to_delete_01.shard_ids[0], ShardId::from(3));

        assert_eq!(advise_reset_shards_response.shards_to_truncate.len(), 1);

        let shard_to_truncate = &advise_reset_shards_response.shards_to_truncate[0];
        assert_eq!(shard_to_truncate.index_uid(), &index_uid);
        assert_eq!(shard_to_truncate.source_id, source_id_00);
        assert_eq!(shard_to_truncate.shard_positions.len(), 1);
        assert_eq!(
            shard_to_truncate.shard_positions[0].shard_id(),
            ShardId::from(1)
        );
        assert_eq!(
            shard_to_truncate.shard_positions[0].publish_position_inclusive(),
            Position::offset(1337u64)
        );
    }

    #[tokio::test]
    async fn test_ingest_controller_close_shards() {
        let metastore = MetastoreServiceClient::mocked();
        let ingester_pool = IngesterPool::default();
        let replication_factor = 1;
        let controller = IngestController::new(
            metastore,
            ingester_pool.clone(),
            replication_factor,
            TEST_SHARD_THROUGHPUT_LIMIT_MIB,
            1.001,
        );

        let closed_shards = controller.close_shards(Vec::new()).await;
        assert_eq!(closed_shards.len(), 0);

        let ingester_id_0 = NodeId::from("test-ingester-0");
        let mut mock_ingester_0 = MockIngesterService::new();
        mock_ingester_0
            .expect_close_shards()
            .once()
            .returning(|mut request| {
                assert_eq!(request.shard_pkeys.len(), 2);

                request
                    .shard_pkeys
                    .sort_by(|left, right| left.shard_id().cmp(right.shard_id()));

                let shard_0 = &request.shard_pkeys[0];
                assert_eq!(shard_0.index_uid(), &IndexUid::for_test("test-index", 0));
                assert_eq!(shard_0.source_id, "test-source");
                assert_eq!(shard_0.shard_id(), ShardId::from(0));

                let shard_1 = &request.shard_pkeys[1];
                assert_eq!(shard_1.index_uid(), &IndexUid::for_test("test-index", 0));
                assert_eq!(shard_1.source_id, "test-source");
                assert_eq!(shard_1.shard_id(), ShardId::from(1));

                let response = CloseShardsResponse {
                    successes: vec![shard_0.clone()],
                };
                Ok(response)
            });
        let ingester_0 = IngesterServiceClient::from_mock(mock_ingester_0);
        ingester_pool.insert(
            ingester_id_0.clone(),
            IngesterPoolEntry::ready_with_client(ingester_0),
        );

        let ingester_id_1 = NodeId::from("test-ingester-1");
        let mut mock_ingester_1 = MockIngesterService::new();
        mock_ingester_1
            .expect_close_shards()
            .once()
            .returning(|request| {
                assert_eq!(request.shard_pkeys.len(), 1);

                let shard = &request.shard_pkeys[0];
                assert_eq!(shard.index_uid(), &IndexUid::for_test("test-index", 0));
                assert_eq!(shard.source_id, "test-source");
                assert_eq!(shard.shard_id(), ShardId::from(2));

                Err(IngestV2Error::Internal("internal error".to_string()))
            });
        let ingester_1 = IngesterServiceClient::from_mock(mock_ingester_1);
        ingester_pool.insert(
            ingester_id_1.clone(),
            IngesterPoolEntry::ready_with_client(ingester_1),
        );

        let ingester_id_2 = NodeId::from("test-ingester-2");
        let mut mock_ingester_2 = MockIngesterService::new();
        mock_ingester_2.expect_close_shards().never();

        let client_2 = IngesterServiceClient::tower()
            .stack_close_shards_layer(DelayLayer::new(CLOSE_SHARDS_REQUEST_TIMEOUT * 2))
            .build_from_mock(mock_ingester_2);
        ingester_pool.insert(
            ingester_id_2.clone(),
            IngesterPoolEntry::ready_with_client(client_2),
        );

        // In this test:
        // - ingester 0 will close shard 0 successfully and fail to close shard 1;
        // - ingester 1 will return an error;
        // - ingester 2 will time out;
        // - ingester 3 will be unavailable.

        let shards_to_close = vec![
            Shard {
                index_uid: Some(IndexUid::for_test("test-index", 0)),
                source_id: "test-source".to_string(),
                shard_id: Some(ShardId::from(0)),
                leader_id: ingester_id_0.to_string(),
                ..Default::default()
            },
            Shard {
                index_uid: Some(IndexUid::for_test("test-index", 0)),
                source_id: "test-source".to_string(),
                shard_id: Some(ShardId::from(1)),
                leader_id: ingester_id_0.to_string(),
                ..Default::default()
            },
            Shard {
                index_uid: Some(IndexUid::for_test("test-index", 0)),
                source_id: "test-source".to_string(),
                shard_id: Some(ShardId::from(2)),
                leader_id: ingester_id_1.to_string(),
                ..Default::default()
            },
            Shard {
                index_uid: Some(IndexUid::for_test("test-index", 0)),
                source_id: "test-source".to_string(),
                shard_id: Some(ShardId::from(3)),
                leader_id: ingester_id_2.to_string(),
                ..Default::default()
            },
            Shard {
                index_uid: Some(IndexUid::for_test("test-index", 0)),
                source_id: "test-source".to_string(),
                shard_id: Some(ShardId::from(4)),
                leader_id: "test-ingester-3".to_string(),
                ..Default::default()
            },
        ];
        let closed_shards = controller.close_shards(shards_to_close).await;
        assert_eq!(closed_shards.len(), 1);

        let closed_shard = &closed_shards[0];
        assert_eq!(closed_shard.index_uid(), &("test-index", 0));
        assert_eq!(closed_shard.source_id, "test-source");
        assert_eq!(closed_shard.shard_id(), ShardId::from(0));
    }

    #[tokio::test]
    async fn test_ingest_controller_rebalance_shards() {
        setup_logging_for_tests();

        let mut mock_metastore = MockMetastoreService::new();
        mock_metastore.expect_open_shards().return_once(|request| {
            assert_eq!(request.subrequests.len(), 1);

            let subrequest_0 = &request.subrequests[0];
            assert_eq!(subrequest_0.subrequest_id, 0);
            assert_eq!(subrequest_0.index_uid(), &("test-index", 0));
            assert_eq!(subrequest_0.source_id, INGEST_V2_SOURCE_ID.to_string());
            assert_eq!(subrequest_0.leader_id, "test-ingester-1");
            assert!(subrequest_0.follower_id.is_none());

            let subresponses = vec![metastore::OpenShardSubresponse {
                subrequest_id: 0,
                open_shard: Some(Shard {
                    index_uid: Some(IndexUid::for_test("test-index", 0)),
                    source_id: INGEST_V2_SOURCE_ID.to_string(),
                    shard_id: subrequest_0.shard_id.clone(),
                    leader_id: "test-ingester-1".to_string(),
                    shard_state: ShardState::Open as i32,
                    ..Default::default()
                }),
            }];
            let response = metastore::OpenShardsResponse { subresponses };
            Ok(response)
        });
        let metastore = MetastoreServiceClient::from_mock(mock_metastore);
        let ingester_pool = IngesterPool::default();
        let replication_factor = 1;
        let mut controller = IngestController::new(
            metastore,
            ingester_pool.clone(),
            replication_factor,
            TEST_SHARD_THROUGHPUT_LIMIT_MIB,
            1.001,
        );

        let mut model = ControlPlaneModel::default();

        let universe = Universe::with_accelerated_time();
        let (control_plane_mailbox, control_plane_inbox) = universe.create_test_mailbox();
        let progress = Progress::default();

        let num_opened_shards = controller
            .rebalance_shards(&mut model, &control_plane_mailbox, &progress)
            .await
            .unwrap();
        assert_eq!(num_opened_shards, 0);

        let index_metadata = IndexMetadata::for_test("test-index", "ram://indexes/test-index");
        let index_uid = index_metadata.index_uid.clone();
        model.add_index(index_metadata);

        let source_config = SourceConfig::ingest_v2();
        model.add_source(&index_uid, source_config).unwrap();

        // In this test, ingester 0 hosts 5 shards but there are two ingesters in the cluster.
        // `rebalance_shards` will attempt to move 2 shards to ingester 1. However, it will fail to
        // init one shard, so only one shard will be actually moved.

        let open_shards = vec![
            Shard {
                index_uid: Some(index_uid.clone()),
                source_id: INGEST_V2_SOURCE_ID.to_string(),
                shard_id: Some(ShardId::from(0)),
                leader_id: "test-ingester-0".to_string(),
                shard_state: ShardState::Open as i32,
                ..Default::default()
            },
            Shard {
                index_uid: Some(index_uid.clone()),
                source_id: INGEST_V2_SOURCE_ID.to_string(),
                shard_id: Some(ShardId::from(1)),
                leader_id: "test-ingester-0".to_string(),
                shard_state: ShardState::Open as i32,
                ..Default::default()
            },
            Shard {
                index_uid: Some(index_uid.clone()),
                source_id: INGEST_V2_SOURCE_ID.to_string(),
                shard_id: Some(ShardId::from(2)),
                leader_id: "test-ingester-0".to_string(),
                shard_state: ShardState::Open as i32,
                ..Default::default()
            },
            Shard {
                index_uid: Some(index_uid.clone()),
                source_id: INGEST_V2_SOURCE_ID.to_string(),
                shard_id: Some(ShardId::from(3)),
                leader_id: "test-ingester-0".to_string(),
                shard_state: ShardState::Open as i32,
                ..Default::default()
            },
            Shard {
                index_uid: Some(index_uid.clone()),
                source_id: INGEST_V2_SOURCE_ID.to_string(),
                shard_id: Some(ShardId::from(4)),
                leader_id: "test-ingester-0".to_string(),
                shard_state: ShardState::Open as i32,
                ..Default::default()
            },
        ];
        model.insert_shards(&index_uid, &INGEST_V2_SOURCE_ID.to_string(), open_shards);

        let ingester_id_0 = NodeId::from("test-ingester-0");
        let mut mock_ingester_0 = MockIngesterService::new();
        mock_ingester_0
            .expect_close_shards()
            .once()
            .returning(|request| {
                assert_eq!(request.shard_pkeys.len(), 1);

                let shard = &request.shard_pkeys[0];
                assert_eq!(shard.index_uid(), &("test-index", 0));
                assert_eq!(shard.source_id, INGEST_V2_SOURCE_ID);
                // assert_eq!(shard.shard_id(), ShardId::from(2));

                let response = CloseShardsResponse {
                    successes: vec![shard.clone()],
                };
                Ok(response)
            });
        let ingester_0 = IngesterServiceClient::from_mock(mock_ingester_0);
        ingester_pool.insert(
            ingester_id_0.clone(),
            IngesterPoolEntry::ready_with_client(ingester_0),
        );

        let ingester_id_1 = NodeId::from("test-ingester-1");
        let mut mock_ingester_1 = MockIngesterService::new();
        mock_ingester_1.expect_init_shards().return_once(|request| {
            assert_eq!(request.subrequests.len(), 2);

            let subrequest_0 = &request.subrequests[0];
            assert_eq!(subrequest_0.subrequest_id, 0);

            let shard_0 = request.subrequests[0].shard();
            assert_eq!(shard_0.index_uid(), &("test-index", 0));
            assert_eq!(shard_0.source_id, INGEST_V2_SOURCE_ID.to_string());
            assert_eq!(shard_0.leader_id, "test-ingester-1");
            assert!(shard_0.follower_id.is_none());

            let subrequest_1 = &request.subrequests[1];
            assert_eq!(subrequest_1.subrequest_id, 1);

            let shard_1 = request.subrequests[0].shard();
            assert_eq!(shard_1.index_uid(), &("test-index", 0));
            assert_eq!(shard_1.source_id, INGEST_V2_SOURCE_ID.to_string());
            assert_eq!(shard_1.leader_id, "test-ingester-1");
            assert!(shard_1.follower_id.is_none());

            let successes = vec![InitShardSuccess {
                subrequest_id: request.subrequests[0].subrequest_id,
                shard: Some(shard_0.clone()),
            }];
            let failures = vec![InitShardFailure {
                subrequest_id: request.subrequests[1].subrequest_id,
                index_uid: Some(IndexUid::for_test("test-index", 0)),
                source_id: INGEST_V2_SOURCE_ID.to_string(),
                shard_id: Some(shard_1.shard_id().clone()),
            }];
            let response = InitShardsResponse {
                successes,
                failures,
            };
            Ok(response)
        });
        let ingester_1 =
            IngesterPoolEntry::ready_with_client(IngesterServiceClient::from_mock(mock_ingester_1));
        ingester_pool.insert(ingester_id_1.clone(), ingester_1);

        let num_opened_shards = controller
            .rebalance_shards(&mut model, &control_plane_mailbox, &progress)
            .await
            .unwrap();
        assert_eq!(num_opened_shards, 1);

        let callback: RebalanceShardsCallback = tokio::time::timeout(
            CLOSE_SHARDS_REQUEST_TIMEOUT * 2,
            control_plane_inbox.recv_typed_message(),
        )
        .await
        .unwrap()
        .unwrap();
        assert_eq!(callback.closed_shards.len(), 1);
    }

    // #[track_caller]
    fn test_allocate_shards_aux_aux(
        shard_counts_map: &HashMap<NodeId, usize>,
        num_shards: usize,
        replication_enabled: bool,
    ) {
        let shard_allocations_opt =
            super::allocate_shards(shard_counts_map, num_shards, replication_enabled);
        if num_shards == 0 {
            assert_eq!(shard_allocations_opt, Some(Vec::new()));
            return;
        }
        let num_nodes_required = if replication_enabled { 2 } else { 1 };
        if shard_counts_map.len() < num_nodes_required {
            assert!(shard_allocations_opt.is_none());
            return;
        }
        let shard_allocations = shard_allocations_opt.unwrap();
        let mut total_counts: HashMap<&NodeIdRef, usize> = HashMap::default();
        assert_eq!(shard_allocations.len(), num_shards);
        if num_shards == 0 {
            return;
        }
        for (leader, follower_opt) in shard_allocations {
            assert_eq!(follower_opt.is_some(), replication_enabled);
            *total_counts.entry(leader).or_default() += 1;
            if let Some(follower) = follower_opt {
                *total_counts.entry(follower).or_default() += 1;
                assert_ne!(follower, leader);
            }
        }
        for (shard, count) in shard_counts_map {
            if let Some(shard_count) = total_counts.get_mut(shard.as_ref()) {
                *shard_count += *count;
            }
        }
        let (min, max) = total_counts
            .values()
            .copied()
            .minmax()
            .into_option()
            .unwrap();
        if !replication_enabled {
            // If replication is enabled, we can end up being forced to not spread shards as evenly
            // as we would wish. For instance, if there are only two nodes initially
            // unbalanced.
            assert!(min + 1 >= max);
        } else {
            let (previous_min, previous_max) = shard_counts_map
                .values()
                .copied()
                .minmax()
                .into_option()
                .unwrap();
            // The algorithm is supposed to reduce the variance.
            // Of course sometimes it is not possible. For instance for 3 nodes that are
            // perfectly balanced to begin with, if we as for a single shard.
            assert!((previous_max - previous_min).max(1) >= (max - min));
        }
    }

    fn test_allocate_shards_aux(shard_counts: &[usize]) {
        let mut shard_counts_map: HashMap<NodeId, usize> = HashMap::new();
        let shards: Vec<String> = (0..shard_counts.len())
            .map(|i| format!("shard-{i}"))
            .collect();
        for (shard, &shard_count) in shards.into_iter().zip(shard_counts.iter()) {
            shard_counts_map.insert(NodeId::from(shard), shard_count);
        }
        for i in 0..10 {
            test_allocate_shards_aux_aux(&shard_counts_map, i, false);
            test_allocate_shards_aux_aux(&shard_counts_map, i, true);
        }
    }

    use proptest::prelude::*;

    proptest! {
        #[test]
        fn test_proptest_allocate_shards(shard_counts in proptest::collection::vec(0..10usize, 0..10usize)) {
            test_allocate_shards_aux(&shard_counts);
        }
    }

    #[test]
    fn test_allocate_shards_prop_test() {
        test_allocate_shards_aux(&[]);
        test_allocate_shards_aux(&[1]);
        test_allocate_shards_aux(&[1, 1]);
        test_allocate_shards_aux(&[1, 2]);
        test_allocate_shards_aux(&[1, 4]);
        test_allocate_shards_aux(&[2, 3, 2]);
        test_allocate_shards_aux(&[2, 4, 6]);
        test_allocate_shards_aux(&[2, 3, 10]);
    }

    #[test]
    fn test_allocate_shards_prop_test_bug() {
        test_allocate_shards_aux(&[7, 7, 7]);
    }

    #[test]
    fn test_pick_one() {
        let mut shard_counts = BTreeMap::default();
        shard_counts.insert(
            1,
            vec![NodeIdRef::from_str("node1"), NodeIdRef::from_str("node2")],
        );
        let mut rng = rand::rng();
        let node = pick_one(
            &mut shard_counts,
            Some(NodeIdRef::from_str("node2")),
            &mut rng,
        )
        .unwrap();
        assert_eq!(node.as_str(), "node1");
        assert_eq!(shard_counts.len(), 2);
        assert_eq!(
            &shard_counts.get(&1).unwrap()[..],
            &[NodeIdRef::from_str("node2")]
        );
        assert_eq!(
            &shard_counts.get(&2).unwrap()[..],
            &[NodeIdRef::from_str("node1")]
        );
        let node = pick_one(&mut shard_counts, None, &mut rng).unwrap();
        assert_eq!(node.as_str(), "node2");
        assert_eq!(shard_counts.len(), 1);
        assert_eq!(
            &shard_counts.get(&2).unwrap()[..],
            &[NodeIdRef::from_str("node1"), NodeIdRef::from_str("node2")]
        );
    }

    /// Test helper for compute_shards_to_rebalance.
    /// The reason for testing both available and unavailable ingesters with open shards is to
    /// ensure the algorithm holds up when there are open shards
    ///
    /// - `available_ingester_shards`: open shards per available ingester
    /// - `unavailable_ingester_shards`: open shards on unavailable ingesters
    fn test_compute_shards_to_rebalance_aux(
        ready_ingester_shards: &[usize],
        unavailable_ingester_shards: &[usize],
        retiring_ingester_shards: &[usize],
    ) {
        let index_id = "test-index";
        let index_metadata = IndexMetadata::for_test(index_id, "ram://indexes/test-index");
        let index_uid = index_metadata.index_uid.clone();
        let source_id: SourceId = "test-source".to_string();

        let mut model = ControlPlaneModel::default();
        model.add_index(index_metadata.clone());

        let mut source_config = SourceConfig::ingest_v2();
        source_config.source_id = source_id.to_string();
        model.add_source(&index_uid, source_config).unwrap();

        let ingester_pool = IngesterPool::default();
        let mock_ingester = MockIngesterService::new();
        let ingester_client = IngesterServiceClient::from_mock(mock_ingester);

        let ready_ids: Vec<String> = (0..ready_ingester_shards.len())
            .map(|i| format!("ready-ingester-{}", i))
            .collect();

        for ingester_id in &ready_ids {
            let ingester = IngesterPoolEntry {
                client: ingester_client.clone(),
                status: IngesterStatus::Ready,
                availability_zone: None,
            };
            ingester_pool.insert(NodeId::from(ingester_id.clone()), ingester);
        }

        let unavailable_ids: Vec<String> = (0..unavailable_ingester_shards.len())
            .map(|i| format!("unavailable-ingester-{}", i))
            .collect();

        let retiring_ids: Vec<String> = (0..retiring_ingester_shards.len())
            .map(|i| format!("retiring-ingester-{}", i))
            .collect();

        for ingester_id in &retiring_ids {
            let ingester = IngesterPoolEntry {
                client: ingester_client.clone(),
                status: IngesterStatus::Retiring,
                availability_zone: None,
            };
            ingester_pool.insert(NodeId::from(ingester_id.clone()), ingester);
        }

        let mut shards: Vec<Shard> = Vec::new();
        let mut shard_id: u64 = 0;

        for (idx, &num_shards) in ready_ingester_shards.iter().enumerate() {
            for _ in 0..num_shards {
                shards.push(Shard {
                    index_uid: Some(index_uid.clone()),
                    source_id: source_id.clone(),
                    shard_id: Some(ShardId::from(shard_id)),
                    leader_id: ready_ids[idx].clone(),
                    shard_state: ShardState::Open as i32,
                    ..Default::default()
                });
                shard_id += 1;
            }
        }

        // Shards on unavailable ingesters - these shouldn't affect rebalancing calculations
        for (idx, &num_shards) in unavailable_ingester_shards.iter().enumerate() {
            for _ in 0..num_shards {
                shards.push(Shard {
                    index_uid: Some(index_uid.clone()),
                    source_id: source_id.clone(),
                    shard_id: Some(ShardId::from(shard_id)),
                    leader_id: unavailable_ids[idx].clone(),
                    shard_state: ShardState::Open as i32,
                    ..Default::default()
                });
                shard_id += 1;
            }
        }

        let num_retiring_shards: usize = retiring_ingester_shards.iter().sum();

        // Shards on retiring ingesters - all of these should be rebalanced
        for (idx, &num_shards) in retiring_ingester_shards.iter().enumerate() {
            for _ in 0..num_shards {
                shards.push(Shard {
                    index_uid: Some(index_uid.clone()),
                    source_id: source_id.clone(),
                    shard_id: Some(ShardId::from(shard_id)),
                    leader_id: retiring_ids[idx].clone(),
                    shard_state: ShardState::Open as i32,
                    ..Default::default()
                });
                shard_id += 1;
            }
        }

        model.insert_shards(&index_uid, &source_id, shards.clone());

        let controller = IngestController::new(
            MetastoreServiceClient::mocked(),
            ingester_pool.clone(),
            2, // replication_factor
            TEST_SHARD_THROUGHPUT_LIMIT_MIB,
            1.001,
        );
        let shards_to_rebalance = controller.compute_shards_to_rebalance(&model);

        // All shards on retiring ingesters must be rebalanced.
        let num_retiring_shards_to_rebalance = shards_to_rebalance
            .iter()
            .filter(|shard| shard.leader_id.starts_with("retiring-"))
            .count();
        assert_eq!(num_retiring_shards_to_rebalance, num_retiring_shards);

        let source_uid = SourceUid {
            index_uid: index_uid.clone(),
            source_id: source_id.clone(),
        };
        let shard_ids_to_rebalance: Vec<ShardId> = shards_to_rebalance
            .iter()
            .flat_map(|shard| shard.shard_id.clone())
            .collect();

        let closed_shard_ids = model.close_shards(&source_uid, &shard_ids_to_rebalance);
        assert_eq!(closed_shard_ids.len(), shards_to_rebalance.len());

        let mut per_ready_ingester_num_shards: HashMap<&str, usize> = ready_ids
            .iter()
            .map(|ready_id| (ready_id.as_str(), 0))
            .collect();

        for shard in model.all_shards() {
            if !shard.is_open() {
                continue;
            }
            if let Some(count_shard) =
                per_ready_ingester_num_shards.get_mut(shard.leader_id.as_str())
            {
                *count_shard += 1;
            }
        }

        // Now we move the different shards to ready ingesters (not retiring ones).
        // We can only simulate this if there are ready ingesters to receive shards.
        if !ready_ids.is_empty() {
            let mut per_ingester_num_shards_sorted: BTreeSet<(usize, &str)> =
                per_ready_ingester_num_shards
                    .into_iter()
                    .map(|(ingester_id, num_shards)| (num_shards, ingester_id))
                    .collect();
            let mut opened_shards: Vec<Shard> = Vec::new();
            for _ in 0..shards_to_rebalance.len() {
                let (num_shards, ingester_id) = per_ingester_num_shards_sorted.pop_first().unwrap();
                let opened_shard = Shard {
                    index_uid: Some(index_uid.clone()),
                    source_id: source_id.to_string(),
                    shard_id: Some(ShardId::from(shard_id)),
                    leader_id: ingester_id.to_string(),
                    shard_state: ShardState::Open as i32,
                    ..Default::default()
                };
                per_ingester_num_shards_sorted.insert((num_shards + 1, ingester_id));
                opened_shards.push(opened_shard);
                shard_id += 1;
            }

            if let Some((min_shards, max_shards)) = per_ingester_num_shards_sorted
                .iter()
                .map(|(num_shards, _)| num_shards)
                .copied()
                .minmax()
                .into_option()
            {
                assert!(min_shards + min_shards.div_ceil(10).max(2) >= max_shards);
            }

            // Test stability of the algorithm: mark the retiring ingesters as
            // decommissioned, insert the new shards, and verify no further rebalance is
            // needed among the ready ingesters.
            for ingester_id in &retiring_ids {
                let ingester = IngesterPoolEntry {
                    client: ingester_client.clone(),
                    status: IngesterStatus::Decommissioned,
                    availability_zone: None,
                };
                ingester_pool.insert(NodeId::from(ingester_id.clone()), ingester);
            }
            model.insert_shards(&index_uid, &source_id, opened_shards);

            let shards_to_rebalance = controller.compute_shards_to_rebalance(&model);
            assert!(shards_to_rebalance.is_empty());
        }
    }

    proptest! {
        #[test]
        fn test_compute_shards_to_rebalance_proptest(
            ready_shards in proptest::collection::vec(0..13usize, 0..13usize),
            unavailable_shards in proptest::collection::vec(0..13usize, 0..5usize),
            retiring_shards in proptest::collection::vec(0..5usize, 0..5usize),
        ) {
            test_compute_shards_to_rebalance_aux(&ready_shards, &unavailable_shards, &retiring_shards);
        }
    }

    #[test]
    fn test_compute_shards_to_rebalance() {
        test_compute_shards_to_rebalance_aux(&[], &[], &[]);
        test_compute_shards_to_rebalance_aux(&[0], &[], &[]);
        test_compute_shards_to_rebalance_aux(&[1], &[], &[]);
        test_compute_shards_to_rebalance_aux(&[0, 1], &[], &[]);
        test_compute_shards_to_rebalance_aux(&[0, 1], &[1], &[]);
        test_compute_shards_to_rebalance_aux(&[0, 1, 2], &[3, 4], &[]);
        // Retiring ingesters: all their shards must be rebalanced
        test_compute_shards_to_rebalance_aux(&[1, 1], &[], &[3]);
        test_compute_shards_to_rebalance_aux(&[0, 0, 0], &[], &[5]);
        test_compute_shards_to_rebalance_aux(&[2], &[], &[1, 2]);
    }
}


================================================
FILE: quickwit/quickwit-control-plane/src/ingest/mod.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

pub(crate) mod ingest_controller;
mod scaling_arbiter;
mod wait_handle;

pub use ingest_controller::IngestController;
pub use wait_handle::WaitHandle;


================================================
FILE: quickwit/quickwit-control-plane/src/ingest/scaling_arbiter.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::num::NonZeroUsize;

use crate::model::{ScalingMode, ShardStats};

pub(crate) struct ScalingArbiter {
    // Threshold in MiB/s below which we decrease the number of shards.
    scale_down_shards_threshold_mib_per_sec: f32,

    // Per shard threshold in MiB/s above which we increase the number of shards.
    //
    // We want scaling up to be reactive, so we first inspect the short
    // term threshold.
    //
    // However, this threshold is based on a very short window of time: 5s.
    //
    // In order to avoid having back and forth scaling up and down in response to temporary
    // punctual spikes of a few MB, we also compute what would be the long term ingestion rate
    // after scaling up, and double check that it is above the long term threshold.
    scale_up_shards_short_term_threshold_mib_per_sec: f32,
    scale_up_shards_long_term_threshold_mib_per_sec: f32,
    // The max increase factor of the number of shards in one scale up operation
    shard_scale_up_factor: f32,
}

impl ScalingArbiter {
    pub fn with_max_shard_ingestion_throughput_mib_per_sec(
        max_shard_throughput_mib_per_sec: f32,
        shard_scale_up_factor: f32,
    ) -> ScalingArbiter {
        ScalingArbiter {
            scale_up_shards_short_term_threshold_mib_per_sec: max_shard_throughput_mib_per_sec
                * 0.8f32,
            scale_up_shards_long_term_threshold_mib_per_sec: max_shard_throughput_mib_per_sec
                * 0.3f32,
            scale_down_shards_threshold_mib_per_sec: max_shard_throughput_mib_per_sec * 0.2f32,
            shard_scale_up_factor,
        }
    }

    /// Computes the maximum number of shards we can have without going below
    /// the long term scale up threshold
    fn long_term_scale_up_threshold_max_shards(&self, shard_stats: ShardStats) -> usize {
        (shard_stats.avg_long_term_ingestion_rate * shard_stats.num_open_shards as f32
            / self.scale_up_shards_long_term_threshold_mib_per_sec)
            .floor() as usize
    }

    /// Computes the next number of shards we should have according the scaling factor
    fn scale_up_factor_target_shards(&self, shard_stats: ShardStats) -> usize {
        (shard_stats.num_open_shards as f32 * self.shard_scale_up_factor).ceil() as usize
    }

    /// Scale based on the "per shard average" metric
    ///
    /// Returns `None` when there are no open shards because in that case routers are expected to
    /// make the [`quickwit_proto::control_plane::GetOrCreateOpenShardsRequest`]
    pub(crate) fn should_scale(
        &self,
        shard_stats: ShardStats,
        min_shards: NonZeroUsize,
    ) -> Option<ScalingMode> {
        // If ingest is idle, there is nothing to do. Idle shards are automatically closed by
        // ingesters (see `quickwit_ingest::ingest_v2::idle::CloseIdleShardsTask`).
        if shard_stats.num_open_shards == 0 || shard_stats.avg_long_term_ingestion_rate == 0.0 {
            return None;
        }
        if shard_stats.num_open_shards < min_shards.get() {
            let num_shards_to_open = min_shards.get() - shard_stats.num_open_shards;
            let scaling_mode = ScalingMode::Up(num_shards_to_open);
            return Some(scaling_mode);
        }
        // Scale up based on the short term metric value while making sure that
        // the long term value doesn't get near the scale down threshold.
        if shard_stats.avg_short_term_ingestion_rate
            >= self.scale_up_shards_short_term_threshold_mib_per_sec
        {
            let new_calculated_num_shards = usize::min(
                self.long_term_scale_up_threshold_max_shards(shard_stats),
                self.scale_up_factor_target_shards(shard_stats),
            );

            let target_num_shards = usize::max(min_shards.get(), new_calculated_num_shards);

            if target_num_shards > shard_stats.num_open_shards {
                let num_shards_to_open = target_num_shards - shard_stats.num_open_shards;
                let scaling_mode = ScalingMode::Up(num_shards_to_open);
                return Some(scaling_mode);
            }
        }
        // On the other hand, scale down only based on the long term metric value to avoid
        // being sensitive to very short drops in ingestion
        if shard_stats.avg_long_term_ingestion_rate <= self.scale_down_shards_threshold_mib_per_sec
            && shard_stats.num_open_shards > min_shards.get()
        {
            return Some(ScalingMode::Down);
        }
        None
    }
}

#[cfg(test)]
mod tests {
    use std::num::NonZeroUsize;

    use super::ScalingArbiter;
    use crate::model::{ScalingMode, ShardStats};

    #[test]
    fn test_scaling_arbiter_one_by_one() {
        // use shard throughput 10MiB to simplify calculations
        // with a factor close to 1 shards are effectively added 1 by 1
        let scaling_arbiter =
            ScalingArbiter::with_max_shard_ingestion_throughput_mib_per_sec(10.0, 1.01);
        assert_eq!(
            scaling_arbiter.should_scale(
                ShardStats {
                    num_open_shards: 0,
                    num_closed_shards: 0,
                    avg_short_term_ingestion_rate: 0.0,
                    avg_long_term_ingestion_rate: 0.0,
                },
                NonZeroUsize::MIN
            ),
            None,
        );
        assert_eq!(
            scaling_arbiter.should_scale(
                ShardStats {
                    num_open_shards: 1,
                    num_closed_shards: 0,
                    avg_short_term_ingestion_rate: 5.0,
                    avg_long_term_ingestion_rate: 6.0,
                },
                NonZeroUsize::MIN
            ),
            None
        );
        assert_eq!(
            scaling_arbiter.should_scale(
                ShardStats {
                    num_open_shards: 1,
                    num_closed_shards: 0,
                    avg_short_term_ingestion_rate: 8.1,
                    avg_long_term_ingestion_rate: 8.1,
                },
                NonZeroUsize::MIN
            ),
            Some(ScalingMode::Up(1))
        );
        assert_eq!(
            scaling_arbiter.should_scale(
                ShardStats {
                    num_open_shards: 2,
                    num_closed_shards: 0,
                    avg_short_term_ingestion_rate: 8.1,
                    avg_long_term_ingestion_rate: 8.1,
                },
                NonZeroUsize::MIN
            ),
            Some(ScalingMode::Up(1))
        );
        assert_eq!(
            scaling_arbiter.should_scale(
                ShardStats {
                    num_open_shards: 2,
                    num_closed_shards: 0,
                    avg_short_term_ingestion_rate: 3.0,
                    avg_long_term_ingestion_rate: 1.5,
                },
                NonZeroUsize::MIN
            ),
            Some(ScalingMode::Down)
        );
        assert_eq!(
            scaling_arbiter.should_scale(
                ShardStats {
                    num_open_shards: 1,
                    num_closed_shards: 0,
                    avg_short_term_ingestion_rate: 3.0,
                    avg_long_term_ingestion_rate: 1.5,
                },
                NonZeroUsize::MIN
            ),
            None,
        );
        assert_eq!(
            scaling_arbiter.should_scale(
                ShardStats {
                    num_open_shards: 1,
                    num_closed_shards: 0,
                    avg_short_term_ingestion_rate: 8.0,
                    avg_long_term_ingestion_rate: 3.0,
                },
                NonZeroUsize::MIN
            ),
            None,
        );
    }

    #[test]
    fn test_scaling_arbiter_2x() {
        // use shard throughput 10MiB to simplify calculations
        let scaling_arbiter =
            ScalingArbiter::with_max_shard_ingestion_throughput_mib_per_sec(10.0, 2.);
        assert_eq!(
            scaling_arbiter.should_scale(
                ShardStats {
                    num_open_shards: 0,
                    num_closed_shards: 0,
                    avg_short_term_ingestion_rate: 0.0,
                    avg_long_term_ingestion_rate: 0.0,
                },
                NonZeroUsize::MIN
            ),
            None,
        );
        assert_eq!(
            scaling_arbiter.should_scale(
                ShardStats {
                    num_open_shards: 2,
                    num_closed_shards: 0,
                    avg_short_term_ingestion_rate: 5.0,
                    avg_long_term_ingestion_rate: 6.0,
                },
                NonZeroUsize::MIN
            ),
            None
        );
        assert_eq!(
            scaling_arbiter.should_scale(
                ShardStats {
                    num_open_shards: 1,
                    num_closed_shards: 0,
                    avg_short_term_ingestion_rate: 8.1,
                    avg_long_term_ingestion_rate: 8.1,
                },
                NonZeroUsize::MIN
            ),
            Some(ScalingMode::Up(1))
        );
        assert_eq!(
            scaling_arbiter.should_scale(
                ShardStats {
                    num_open_shards: 2,
                    num_closed_shards: 0,
                    avg_short_term_ingestion_rate: 8.1,
                    avg_long_term_ingestion_rate: 8.1,
                },
                NonZeroUsize::MIN
            ),
            Some(ScalingMode::Up(2))
        );
        assert_eq!(
            scaling_arbiter.should_scale(
                ShardStats {
                    num_open_shards: 2,
                    num_closed_shards: 0,
                    avg_short_term_ingestion_rate: 3.0,
                    avg_long_term_ingestion_rate: 1.5,
                },
                NonZeroUsize::MIN
            ),
            Some(ScalingMode::Down)
        );
        assert_eq!(
            scaling_arbiter.should_scale(
                ShardStats {
                    num_open_shards: 1,
                    num_closed_shards: 0,
                    avg_short_term_ingestion_rate: 3.0,
                    avg_long_term_ingestion_rate: 1.5,
                },
                NonZeroUsize::MIN
            ),
            None,
        );
        assert_eq!(
            scaling_arbiter.should_scale(
                ShardStats {
                    num_open_shards: 1,
                    num_closed_shards: 0,
                    avg_short_term_ingestion_rate: 8.0,
                    avg_long_term_ingestion_rate: 3.1,
                },
                NonZeroUsize::MIN
            ),
            None,
        );
        // Scale by just 1 if 2 would bring us too close to the scale down threshold
        assert_eq!(
            scaling_arbiter.should_scale(
                ShardStats {
                    num_open_shards: 2,
                    num_closed_shards: 0,
                    avg_short_term_ingestion_rate: 8.1,
                    avg_long_term_ingestion_rate: 5.,
                },
                NonZeroUsize::MIN
            ),
            Some(ScalingMode::Up(1)),
        );
    }

    #[test]
    fn test_scale_up_computations() {
        // use shard throughput 10MiB to simplify calculations
        let scaling_arbiter =
            ScalingArbiter::with_max_shard_ingestion_throughput_mib_per_sec(10.0, 1.5);

        let shard_stats = ShardStats {
            num_open_shards: 0,
            num_closed_shards: 0,
            avg_short_term_ingestion_rate: 0.,
            avg_long_term_ingestion_rate: 0.,
        };
        assert_eq!(
            scaling_arbiter.long_term_scale_up_threshold_max_shards(shard_stats),
            0
        );
        assert_eq!(
            scaling_arbiter.scale_up_factor_target_shards(shard_stats),
            0
        );

        let shard_stats = ShardStats {
            num_open_shards: 1,
            num_closed_shards: 0,
            avg_short_term_ingestion_rate: 5.0,
            avg_long_term_ingestion_rate: 6.1,
        };
        assert_eq!(
            scaling_arbiter.long_term_scale_up_threshold_max_shards(shard_stats),
            2
        );
        assert_eq!(
            scaling_arbiter.scale_up_factor_target_shards(shard_stats),
            2
        );

        let shard_stats = ShardStats {
            num_open_shards: 2,
            num_closed_shards: 0,
            avg_short_term_ingestion_rate: 5.0,
            avg_long_term_ingestion_rate: 1.1,
        };
        assert_eq!(
            scaling_arbiter.long_term_scale_up_threshold_max_shards(shard_stats),
            0
        );
        assert_eq!(
            scaling_arbiter.scale_up_factor_target_shards(shard_stats),
            3
        );

        let shard_stats = ShardStats {
            num_open_shards: 2,
            num_closed_shards: 0,
            avg_short_term_ingestion_rate: 5.0,
            avg_long_term_ingestion_rate: 6.1,
        };
        assert_eq!(
            scaling_arbiter.long_term_scale_up_threshold_max_shards(shard_stats),
            4
        );
        assert_eq!(
            scaling_arbiter.scale_up_factor_target_shards(shard_stats),
            3
        );

        let shard_stats = ShardStats {
            num_open_shards: 5,
            num_closed_shards: 0,
            avg_short_term_ingestion_rate: 5.0,
            avg_long_term_ingestion_rate: 1.1,
        };
        assert_eq!(
            scaling_arbiter.long_term_scale_up_threshold_max_shards(shard_stats),
            1
        );
        assert_eq!(
            scaling_arbiter.scale_up_factor_target_shards(shard_stats),
            8
        );
    }

    #[test]
    fn test_scaling_arbiter_idle() {
        let scaling_arbiter =
            ScalingArbiter::with_max_shard_ingestion_throughput_mib_per_sec(10.0, 1.5);

        let shard_stats = ShardStats {
            num_open_shards: 0,
            num_closed_shards: 0,
            avg_short_term_ingestion_rate: 0.0,
            avg_long_term_ingestion_rate: 0.0,
        };
        let min_shards = NonZeroUsize::MIN;
        let scaling_mode = scaling_arbiter.should_scale(shard_stats, min_shards);
        assert!(scaling_mode.is_none());

        let shard_stats = ShardStats {
            num_open_shards: 1,
            num_closed_shards: 0,
            avg_short_term_ingestion_rate: 0.0,
            avg_long_term_ingestion_rate: 0.0,
        };
        let min_shards = NonZeroUsize::new(2).unwrap();
        let scaling_mode = scaling_arbiter.should_scale(shard_stats, min_shards);
        assert!(scaling_mode.is_none());
    }

    #[test]
    fn test_scaling_arbiter_min_shards() {
        let scaling_arbiter =
            ScalingArbiter::with_max_shard_ingestion_throughput_mib_per_sec(10.0, 1.5);

        let shard_stats = ShardStats {
            num_open_shards: 1,
            num_closed_shards: 0,
            avg_short_term_ingestion_rate: 5.0,
            avg_long_term_ingestion_rate: 1.0,
        };
        let min_shards = NonZeroUsize::new(5).unwrap();
        let scaling_mode = scaling_arbiter
            .should_scale(shard_stats, min_shards)
            .unwrap();
        assert_eq!(scaling_mode, ScalingMode::Up(4));
    }
}


================================================
FILE: quickwit/quickwit-control-plane/src/ingest/wait_handle.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use tokio::sync::oneshot;

pub struct WaitHandle {
    rx: oneshot::Receiver<()>,
}

impl WaitHandle {
    pub fn new() -> (WaitDropGuard, WaitHandle) {
        let (tx, rx) = oneshot::channel();
        let wait_drop_guard = WaitDropGuard(tx);
        let wait_handle = WaitHandle { rx };
        (wait_drop_guard, wait_handle)
    }

    pub async fn wait(self) {
        let _ = self.rx.await;
    }
}

pub struct WaitDropGuard(#[allow(dead_code)] oneshot::Sender<()>);

#[cfg(test)]
mod tests {
    use tokio::sync::oneshot::error::TryRecvError;

    #[tokio::test]
    async fn test_wait_handle_simple() {
        let (wait_drop_handle, mut wait_handle) = super::WaitHandle::new();
        assert!(matches!(
            wait_handle.rx.try_recv().unwrap_err(),
            TryRecvError::Empty
        ));
        drop(wait_drop_handle);
        wait_handle.wait().await;
    }
}


================================================
FILE: quickwit/quickwit-control-plane/src/lib.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

pub mod control_plane;
pub mod indexing_plan;
pub mod indexing_scheduler;
pub mod ingest;
pub(crate) mod metrics;
pub(crate) mod model;

use quickwit_common::tower::Pool;
use quickwit_proto::indexing::{CpuCapacity, IndexingServiceClient, IndexingTask};
use quickwit_proto::types::NodeId;

/// Indexer-node specific information stored in the pool of available indexer nodes
#[derive(Debug, Clone)]
pub struct IndexerNodeInfo {
    pub node_id: NodeId,
    pub generation_id: u64,
    pub client: IndexingServiceClient,
    pub indexing_tasks: Vec<IndexingTask>,
    pub indexing_capacity: CpuCapacity,
}

pub type IndexerPool = Pool<NodeId, IndexerNodeInfo>;

mod cooldown_map;
mod debouncer;
#[cfg(test)]
mod tests;


================================================
FILE: quickwit/quickwit-control-plane/src/metrics.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use once_cell::sync::Lazy;
use quickwit_common::metrics::{
    IntCounter, IntGauge, IntGaugeVec, new_counter, new_gauge, new_gauge_vec,
};

#[derive(Debug, Clone, Copy)]
pub struct ShardLocalityMetrics {
    pub num_remote_shards: usize,
    pub num_local_shards: usize,
}

pub struct ControlPlaneMetrics {
    // Indexes and shards tracked by the control plane.
    pub indexes_total: IntGauge,
    pub open_shards: IntGaugeVec<1>,
    pub closed_shards: IntGaugeVec<1>,

    // Operations performed by the control plane.
    pub apply_plan_total: IntCounter,
    pub rebalance_shards: IntGauge,
    pub restart_total: IntCounter,
    pub schedule_total: IntCounter,

    // Metastore errors.
    pub metastore_error_aborted: IntCounter,
    pub metastore_error_maybe_executed: IntCounter,

    // Indexing plan metrics.
    pub local_shards: IntGauge,
    pub remote_shards: IntGauge,
}

impl ControlPlaneMetrics {
    pub fn set_shard_locality_metrics(&self, shard_locality_metrics: ShardLocalityMetrics) {
        self.local_shards
            .set(shard_locality_metrics.num_local_shards as i64);
        self.remote_shards
            .set(shard_locality_metrics.num_remote_shards as i64);
    }
}

impl Default for ControlPlaneMetrics {
    fn default() -> Self {
        let open_shards = new_gauge_vec(
            "shards",
            "Number of open and closed shards tracked by the ingest controller",
            "control_plane",
            &[("state", "open")],
            ["index_id"],
        );
        let closed_shards = new_gauge_vec(
            "shards",
            "Number of open and closed shards tracked by the ingest controller",
            "control_plane",
            &[("state", "closed")],
            ["index_id"],
        );
        let indexed_shards = new_gauge_vec(
            "indexed_shards",
            "Number of (remote/local) shards in the indexing plan",
            "control_plane",
            &[],
            ["locality"],
        );
        let local_shards = indexed_shards.with_label_values(["local"]);
        let remote_shards = indexed_shards.with_label_values(["remote"]);

        ControlPlaneMetrics {
            indexes_total: new_gauge(
                "indexes_total",
                "Number of indexes tracked by the control plane.",
                "control_plane",
                &[],
            ),
            open_shards,
            closed_shards,
            apply_plan_total: new_counter(
                "apply_plan_total",
                "Number of control plane `apply plan` operations.",
                "control_plane",
                &[],
            ),
            rebalance_shards: new_gauge(
                "rebalance_shards",
                "Number of shards rebalanced by the control plane.",
                "control_plane",
                &[],
            ),
            restart_total: new_counter(
                "restart_total",
                "Number of control plane restarts.",
                "control_plane",
                &[],
            ),
            schedule_total: new_counter(
                "schedule_total",
                "Number of control plane `schedule` operations.",
                "control_plane",
                &[],
            ),
            metastore_error_aborted: new_counter(
                "metastore_error_aborted",
                "Number of aborted metastore transaction (= do not trigger a control plane \
                 restart)",
                "control_plane",
                &[],
            ),
            metastore_error_maybe_executed: new_counter(
                "metastore_error_maybe_executed",
                "Number of metastore transaction with an uncertain outcome (= do trigger a \
                 control plane restart)",
                "control_plane",
                &[],
            ),
            local_shards,
            remote_shards,
        }
    }
}

pub static CONTROL_PLANE_METRICS: Lazy<ControlPlaneMetrics> =
    Lazy::new(ControlPlaneMetrics::default);


================================================
FILE: quickwit/quickwit-control-plane/src/model/mod.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

mod shard_table;

use std::borrow::Cow;
use std::collections::BTreeSet;
use std::mem;
use std::ops::Deref;
use std::time::Instant;

use anyhow::bail;
use fnv::{FnvHashMap, FnvHashSet};
use futures::StreamExt;
use quickwit_common::Progress;
use quickwit_common::pretty::PrettyDisplay;
use quickwit_config::{INGEST_V2_SOURCE_ID, IndexConfig, SourceConfig, enable_ingest_v2};
use quickwit_ingest::ShardInfos;
use quickwit_metastore::{AddSourceRequestExt, IndexMetadata, ListIndexesMetadataResponseExt};
use quickwit_proto::control_plane::ControlPlaneResult;
use quickwit_proto::ingest::Shard;
use quickwit_proto::metastore::{
    self, AddSourceRequest, EntityKind, ListIndexesMetadataRequest, ListShardsSubrequest,
    ListShardsSubresponse, MetastoreError, MetastoreResult, MetastoreService,
    MetastoreServiceClient, SourceType, ToggleSourceRequest,
};
use quickwit_proto::types::{IndexId, IndexUid, NodeId, ShardId, SourceId, SourceUid};
pub(super) use shard_table::{ScalingMode, ShardEntry, ShardLocations, ShardStats, ShardTable};
use tracing::{debug, error, info, instrument, warn};

/// The control plane maintains a model in sync with the metastore.
///
/// The model stays consistent with the metastore, because all
/// the mutations (create/delete index, add/delete source, etc.) go through the control plane.
///
/// If a mutation yields an error, the control plane is killed
/// and restarted.
///
/// Upon starts, it loads its entire state from the metastore.
#[derive(Default, Debug)]
pub(crate) struct ControlPlaneModel {
    index_uid_table: FnvHashMap<IndexId, IndexUid>,
    index_table: FnvHashMap<IndexUid, IndexMetadata>,
    shard_table: ShardTable,
}

impl ControlPlaneModel {
    /// Clears the entire state of the model.
    pub fn clear(&mut self) {
        *self = Default::default();
    }

    pub fn num_indexes(&self) -> usize {
        self.index_table.len()
    }

    pub fn num_sources(&self) -> usize {
        self.shard_table.num_sources()
    }

    pub fn shard_locations(&self) -> ShardLocations<'_> {
        self.shard_table.shard_locations()
    }

    #[cfg(test)]
    pub fn num_shards(&self) -> usize {
        self.shard_table.num_shards()
    }

    #[instrument(skip_all)]
    pub async fn load_from_metastore(
        &mut self,
        metastore: &mut MetastoreServiceClient,
        progress: &Progress,
    ) -> ControlPlaneResult<()> {
        const BATCH_SIZE: usize = 500;

        let now = Instant::now();
        self.clear();

        let indexes_metadata = progress
            .protect_future(metastore.list_indexes_metadata(ListIndexesMetadataRequest::all()))
            .await?
            .deserialize_indexes_metadata()
            .await?;

        let num_indexes = indexes_metadata.len();
        self.index_table.reserve(num_indexes);

        for index_metadata in indexes_metadata {
            self.add_index(index_metadata);
        }
        self.create_or_enable_ingest_v2_sources_if_necessary(metastore, progress)
            .await?;

        let mut num_sources = 0;
        let mut num_shards = 0;

        let mut next_list_shards_request = metastore::ListShardsRequest::default();

        for (idx, index_metadata) in self.index_table.values().enumerate() {
            for source_config in index_metadata.sources.values() {
                num_sources += 1;

                if source_config.source_type() == SourceType::IngestV2 {
                    let request = ListShardsSubrequest {
                        index_uid: index_metadata.index_uid.clone().into(),
                        source_id: source_config.source_id.clone(),
                        shard_state: None,
                    };
                    next_list_shards_request.subrequests.push(request);
                }
            }
            let num_subrequests = next_list_shards_request.subrequests.len();

            if num_subrequests > 0 && (num_subrequests >= BATCH_SIZE || idx == num_indexes - 1) {
                let list_shards_request = mem::take(&mut next_list_shards_request);
                let list_shards_response = progress
                    .protect_future(metastore.list_shards(list_shards_request))
                    .await?;

                for list_shards_subresponse in list_shards_response.subresponses {
                    num_shards += list_shards_subresponse.shards.len();

                    let ListShardsSubresponse {
                        index_uid,
                        source_id,
                        shards,
                    } = list_shards_subresponse;
                    let index_uid = index_uid.expect("`index_uid` should be a required field");
                    self.shard_table
                        .insert_shards(&index_uid, &source_id, shards);
                }
            }
        }
        info!(
            "synced control plane model with metastore in {} ({num_indexes} indexes, \
             {num_sources} sources, {num_shards} shards)",
            now.elapsed().pretty_display()
        );
        Ok(())
    }

    pub fn index_uid(&self, index_id: &str) -> Option<&IndexUid> {
        self.index_uid_table.get(index_id)
    }

    pub fn index_metadata(&self, index_uid: &IndexUid) -> Option<&IndexMetadata> {
        self.index_table.get(index_uid)
    }

    pub(crate) fn source_metadata(&self, source_uid: &SourceUid) -> Option<&SourceConfig> {
        self.index_metadata(&source_uid.index_uid)?
            .sources
            .get(&source_uid.source_id)
    }

    fn update_metrics(&self) {
        crate::metrics::CONTROL_PLANE_METRICS
            .indexes_total
            .set(self.index_table.len() as i64);
    }

    pub(crate) fn source_configs(&self) -> impl Iterator<Item = (SourceUid, &SourceConfig)> + '_ {
        self.index_table.values().flat_map(|index_metadata| {
            index_metadata
                .sources
                .iter()
                .map(move |(source_id, source_config)| {
                    (
                        SourceUid {
                            index_uid: index_metadata.index_uid.clone(),
                            source_id: source_id.clone(),
                        },
                        source_config,
                    )
                })
        })
    }

    pub(crate) fn add_index(&mut self, index_metadata: IndexMetadata) {
        let index_uid = index_metadata.index_uid.clone();
        let index_id = index_uid.index_id.clone();

        self.index_uid_table.insert(index_id, index_uid.clone());

        for (source_id, source_config) in &index_metadata.sources {
            if source_config.source_type() == SourceType::IngestV2 {
                self.shard_table.add_source(&index_uid, source_id);
            }
        }
        self.index_table.insert(index_uid, index_metadata);
        self.update_metrics();
    }

    /// Updates the configuration of the specified index, returning an error if
    /// the index didn't exist.
    pub(crate) fn update_index_config(
        &mut self,
        index_uid: &IndexUid,
        index_config: IndexConfig,
    ) -> anyhow::Result<bool> {
        let Some(index_model) = self.index_table.get_mut(index_uid) else {
            bail!("index `{}` not found", index_uid.index_id);
        };
        let fp_changed = !index_model.index_config.equals_fingerprint(&index_config);
        index_model.index_config = index_config;
        Ok(fp_changed)
    }

    pub(crate) fn delete_index(&mut self, index_uid: &IndexUid) {
        self.index_table.remove(index_uid);
        self.index_uid_table.remove(&index_uid.index_id);
        self.shard_table.delete_index(&index_uid.index_id);
        self.update_metrics();
    }

    /// Adds a source to a given index. Returns an error if the source already
    /// exists.
    pub(crate) fn add_source(
        &mut self,
        index_uid: &IndexUid,
        source_config: SourceConfig,
    ) -> ControlPlaneResult<()> {
        let index_metadata = self.index_table.get_mut(index_uid).ok_or_else(|| {
            MetastoreError::NotFound(EntityKind::Index {
                index_id: index_uid.to_string(),
            })
        })?;
        index_metadata.add_source(source_config.clone())?;

        if source_config.source_type() == SourceType::IngestV2 {
            self.shard_table
                .add_source(index_uid, &source_config.source_id);
        }
        Ok(())
    }

    pub(crate) fn update_source(
        &mut self,
        index_uid: &IndexUid,
        source_config: SourceConfig,
    ) -> ControlPlaneResult<()> {
        let index_metadata = self.index_table.get_mut(index_uid).ok_or_else(|| {
            MetastoreError::NotFound(EntityKind::Index {
                index_id: index_uid.to_string(),
            })
        })?;
        index_metadata.update_source(source_config)?;
        Ok(())
    }

    pub(crate) fn delete_source(&mut self, source_uid: &SourceUid) {
        // Removing shards from shard table.
        self.shard_table
            .delete_source(&source_uid.index_uid, &source_uid.source_id);
        // Remove source from index metadata.
        let Some(index_metadata) = self.index_table.get_mut(&source_uid.index_uid) else {
            warn!(index_uid=%source_uid.index_uid, source_id=%source_uid.source_id, "delete source: index not found");
            return;
        };
        if index_metadata
            .sources
            .remove(&source_uid.source_id)
            .is_none()
        {
            warn!(index_uid=%source_uid.index_uid, source_id=%source_uid.source_id, "delete source: source not found");
        };
    }

    /// Returns `true` if the source status has changed, `false` otherwise.
    /// Returns an error if the source could not be found.
    pub(crate) fn toggle_source(
        &mut self,
        index_uid: &IndexUid,
        source_id: &SourceId,
        enable: bool,
    ) -> ControlPlaneResult<bool> {
        let index_model = self.index_table.get_mut(index_uid).ok_or_else(|| {
            MetastoreError::NotFound(EntityKind::Index {
                index_id: index_uid.to_string(),
            })
        })?;
        let source_config = index_model.sources.get_mut(source_id).ok_or_else(|| {
            MetastoreError::NotFound(EntityKind::Source {
                index_id: index_uid.to_string(),
                source_id: source_id.clone(),
            })
        })?;
        let has_changed = source_config.enabled != enable;
        source_config.enabled = enable;
        Ok(has_changed)
    }

    pub(crate) fn all_shards(&self) -> impl Iterator<Item = &ShardEntry> + '_ {
        self.shard_table.all_shards()
    }

    pub(crate) fn all_shards_with_source(
        &self,
    ) -> impl Iterator<Item = (&SourceUid, impl Iterator<Item = &ShardEntry>)> + '_ {
        self.shard_table.all_shards_with_source()
    }

    pub fn list_shards_for_node(
        &self,
        ingester: &NodeId,
    ) -> impl Deref<Target = FnvHashMap<SourceUid, BTreeSet<ShardId>>> + '_ {
        if let Some(shards_for_node) = self.shard_table.list_shards_for_node(ingester) {
            Cow::Borrowed(shards_for_node)
        } else {
            Cow::Owned(FnvHashMap::default())
        }
    }

    pub fn list_shards_for_index<'a>(
        &'a self,
        index_uid: &'a IndexUid,
    ) -> impl Iterator<Item = &'a ShardEntry> + 'a {
        self.shard_table.list_shards_for_index(index_uid)
    }

    /// Lists the shards of a given source. Returns `None` if the source does not exist.
    pub fn get_shards_for_source(
        &self,
        source_uid: &SourceUid,
    ) -> Option<&FnvHashMap<ShardId, ShardEntry>> {
        self.shard_table.get_shards(source_uid)
    }

    /// Lists the shards of a given source. Returns `None` if the source does not exist.
    pub fn get_shards_for_source_mut(
        &mut self,
        source_uid: &SourceUid,
    ) -> Option<&mut FnvHashMap<ShardId, ShardEntry>> {
        self.shard_table.get_shards_mut(source_uid)
    }

    /// Inserts the shards that have just been opened by calling `open_shards` on the metastore.
    pub fn insert_shards(
        &mut self,
        index_uid: &IndexUid,
        source_id: &SourceId,
        opened_shards: Vec<Shard>,
    ) {
        self.shard_table
            .insert_shards(index_uid, source_id, opened_shards);
    }

    /// Finds open shards for a given index and source and whose leaders are not in the set of
    /// unavailable ingesters.
    pub fn find_open_shards(
        &self,
        index_uid: &IndexUid,
        source_id: &SourceId,
        unavailable_leaders: &FnvHashSet<NodeId>,
    ) -> Option<Vec<ShardEntry>> {
        self.shard_table
            .find_open_shards(index_uid, source_id, unavailable_leaders)
    }

    /// Updates the state and ingestion rate of the shards according to the given shard infos.
    pub fn update_shards(
        &mut self,
        source_uid: &SourceUid,
        shard_infos: &ShardInfos,
    ) -> ShardStats {
        debug!(
            index_uid=%source_uid.index_uid,
            source_id=%source_uid.source_id,
            "updating shards"
        );
        self.shard_table.update_shards(source_uid, shard_infos)
    }

    /// Sets the state of the shards identified by their index UID, source ID, and shard IDs to
    /// `Closed`.
    pub fn close_shards(&mut self, source_uid: &SourceUid, shard_ids: &[ShardId]) -> Vec<ShardId> {
        debug!(
            index_uid=%source_uid.index_uid,
            source_id=%source_uid.source_id,
            shard_ids=%shard_ids.pretty_display(),
            "closing shards"
        );
        self.shard_table.close_shards(source_uid, shard_ids)
    }

    /// Removes the shards identified by their index UID, source ID, and shard IDs.
    pub fn delete_shards(&mut self, source_uid: &SourceUid, shard_ids: &[ShardId]) {
        debug!(
            index_uid=%source_uid.index_uid,
            source_id=%source_uid.source_id,
            shard_ids=%shard_ids.pretty_display(),
            "deleting shards"
        );
        self.shard_table.delete_shards(source_uid, shard_ids);
    }

    pub fn acquire_scaling_permits(
        &mut self,
        source_uid: &SourceUid,
        scaling_mode: ScalingMode,
    ) -> Option<bool> {
        self.shard_table
            .acquire_scaling_permits(source_uid, scaling_mode)
    }

    pub fn drain_scaling_permits(&mut self, source_uid: &SourceUid, scaling_mode: ScalingMode) {
        self.shard_table
            .drain_scaling_permits(source_uid, scaling_mode)
    }

    pub fn release_scaling_permits(&mut self, source_uid: &SourceUid, scaling_mode: ScalingMode) {
        self.shard_table
            .release_scaling_permits(source_uid, scaling_mode)
    }

    // Quickwit 0.9 uses the ingest v2 source by default. For indexes created prior to 0.9, we need
    // to ensure that the ingest v2 source is created and enabled if necessary.
    //
    // TODO(#5604)
    async fn create_or_enable_ingest_v2_sources_if_necessary(
        &mut self,
        metastore: &mut MetastoreServiceClient,
        progress: &Progress,
    ) -> ControlPlaneResult<()> {
        // User has voluntarily disabled ingest v2, nothing to do.
        if !enable_ingest_v2() {
            return Ok(());
        }
        // Indexes for which the ingest v2 source needs to be created.
        let mut sources_to_create = Vec::new();
        // Indexes for which the ingest v2 source needs to be enabled.
        let mut sources_to_enable = Vec::new();

        for (index_uid, index_metadata) in &self.index_table {
            let ingest_v2_source_opt = index_metadata.sources.get(INGEST_V2_SOURCE_ID);

            if let Some(ingest_v2_source) = ingest_v2_source_opt {
                if !ingest_v2_source.enabled {
                    sources_to_enable.push(index_uid.clone());
                }
            } else {
                sources_to_create.push(index_uid.clone());
            }
        }
        self.create_ingest_v2_sources(sources_to_create, metastore, progress)
            .await?;
        self.enable_ingest_v2_sources(sources_to_enable, metastore, progress)
            .await?;
        Ok(())
    }

    async fn create_ingest_v2_sources(
        &mut self,
        sources_to_create: Vec<IndexUid>,
        metastore: &mut MetastoreServiceClient,
        progress: &Progress,
    ) -> MetastoreResult<()> {
        let num_sources_to_create = sources_to_create.len();
        let now = Instant::now();
        info!("adding ingest v2 source to {num_sources_to_create} indexes");

        let mut add_source_futures = Vec::with_capacity(num_sources_to_create);

        for index_uid in sources_to_create {
            let metastore = metastore.clone();
            let source_config = SourceConfig::ingest_v2();
            let add_source_request =
                AddSourceRequest::try_from_source_config(index_uid.clone(), &source_config)?;
            let add_source_future = async move {
                let add_source_result = metastore.add_source(add_source_request).await;
                match add_source_result {
                    Ok(_) => Ok((index_uid, source_config)),
                    Err(error) => Err((index_uid, error)),
                }
            };
            add_source_futures.push(add_source_future);
        }
        let mut add_source_result_stream =
            futures::stream::iter(add_source_futures).buffer_unordered(100);
        let mut num_errors = 0;

        while let Some(add_source_result) = progress
            .protect_future(add_source_result_stream.next())
            .await
        {
            match add_source_result {
                Ok((index_uid, source_config)) => {
                    self.add_source(&index_uid, source_config)?;
                }
                Err((index_uid, error)) => {
                    num_errors += 1;
                    debug!(%error, %index_uid, "failed to add ingest v2 source to index");
                }
            }
        }
        if num_errors > 0 {
            error!("failed to add ingest v2 sources to {num_errors} indexes");
        }
        info!(
            "added ingest v2 source to {num_sources_to_create} indexes in {}",
            now.elapsed().pretty_display()
        );
        Ok(())
    }

    async fn enable_ingest_v2_sources(
        &mut self,
        sources_to_enable: Vec<IndexUid>,
        metastore: &mut MetastoreServiceClient,
        progress: &Progress,
    ) -> MetastoreResult<()> {
        let num_sources_to_enable = sources_to_enable.len();
        let now = Instant::now();
        info!("enabling {num_sources_to_enable} ingest v2 sources");

        let mut toggle_source_futures = Vec::with_capacity(num_sources_to_enable);

        for index_uid in sources_to_enable {
            let metastore = metastore.clone();
            let toggle_source_request = ToggleSourceRequest {
                index_uid: index_uid.clone().into(),
                source_id: INGEST_V2_SOURCE_ID.to_string(),
                enable: true,
            };
            let toggle_source_future = async move {
                let toggle_source_result = metastore.toggle_source(toggle_source_request).await;
                match toggle_source_result {
                    Ok(_) => Ok(index_uid),
                    Err(error) => Err((index_uid, error)),
                }
            };
            toggle_source_futures.push(toggle_source_future);
        }
        let mut toggle_source_result_stream =
            futures::stream::iter(toggle_source_futures).buffer_unordered(100);
        let mut num_errors = 0;

        let ingest_v2_source_id = INGEST_V2_SOURCE_ID.to_string();

        while let Some(toggle_source_result) = progress
            .protect_future(toggle_source_result_stream.next())
            .await
        {
            match toggle_source_result {
                Ok(index_uid) => {
                    self.toggle_source(&index_uid, &ingest_v2_source_id, true)?;
                }
                Err((index_uid, error)) => {
                    num_errors += 1;
                    debug!(%error, %index_uid, "failed to enable ingest v2 source");
                }
            }
        }
        if num_errors > 0 {
            error!("failed to enable {num_errors} ingest v2 sources");
        }
        info!(
            "enabled {num_sources_to_enable} ingest v2 sources in {}",
            now.elapsed().pretty_display()
        );
        Ok(())
    }
}

#[cfg(test)]
mod tests {
    use metastore::EmptyResponse;
    use quickwit_config::{INGEST_V2_SOURCE_ID, SourceConfig, SourceParams, TransformConfig};
    use quickwit_metastore::IndexMetadata;
    use quickwit_proto::ingest::{Shard, ShardState};
    use quickwit_proto::metastore::{ListIndexesMetadataResponse, MockMetastoreService};

    use super::*;

    #[tokio::test]
    async fn test_control_plane_model_load_shard_table() {
        let index_uid0 = IndexUid::for_test("test-index-0", 0);
        let index_uid1 = IndexUid::for_test("test-index-1", 0);
        let index_uid2 = IndexUid::for_test("test-index-2", 0);

        let mut mock_metastore = MockMetastoreService::new();
        mock_metastore
            .expect_list_indexes_metadata()
            .returning(|request| {
                assert_eq!(request, ListIndexesMetadataRequest::all());

                let mut index_0 = IndexMetadata::for_test("test-index-0", "ram:///test-index-0");
                let mut source_config = SourceConfig::ingest_v2();
                source_config.enabled = true;
                index_0.add_source(source_config.clone()).unwrap();

                let mut index_1 = IndexMetadata::for_test("test-index-1", "ram:///test-index-1");
                source_config.enabled = false;
                index_1.add_source(source_config).unwrap();

                let mut index_2 = IndexMetadata::for_test("test-index-2", "ram:///test-index-2");
                index_2.add_source(SourceConfig::cli()).unwrap();

                let indexes = vec![index_0, index_1, index_2];
                Ok(ListIndexesMetadataResponse::for_test(indexes))
            });
        let index_uid2_clone = index_uid2.clone();
        mock_metastore
            .expect_add_source()
            .return_once(move |request| {
                assert_eq!(*request.index_uid(), index_uid2_clone);

                let source_config = request.deserialize_source_config().unwrap();
                assert_eq!(source_config.source_id, INGEST_V2_SOURCE_ID);
                assert_eq!(source_config.source_type(), SourceType::IngestV2);

                Ok(EmptyResponse {})
            });
        let index_uid1_clone = index_uid1.clone();
        mock_metastore
            .expect_toggle_source()
            .return_once(move |request| {
                assert_eq!(*request.index_uid(), index_uid1_clone);
                assert_eq!(request.source_id, INGEST_V2_SOURCE_ID);
                assert!(request.enable);

                Ok(EmptyResponse {})
            });
        let index_uid0_clone = index_uid0.clone();
        let index_uid1_clone = index_uid1.clone();
        let index_uid2_clone = index_uid2.clone();
        mock_metastore
            .expect_list_shards()
            .return_once(move |mut request| {
                assert_eq!(request.subrequests.len(), 3);

                request
                    .subrequests
                    .sort_by(|left, right| left.index_uid().cmp(right.index_uid()));

                assert_eq!(request.subrequests[0].index_uid(), &index_uid0_clone);
                assert_eq!(request.subrequests[0].source_id, INGEST_V2_SOURCE_ID);
                assert!(request.subrequests[0].shard_state.is_none());

                assert_eq!(request.subrequests[1].index_uid(), &index_uid1_clone);
                assert_eq!(request.subrequests[1].source_id, INGEST_V2_SOURCE_ID);
                assert!(request.subrequests[1].shard_state.is_none());

                assert_eq!(request.subrequests[2].index_uid(), &index_uid2_clone);
                assert_eq!(request.subrequests[2].source_id, INGEST_V2_SOURCE_ID);
                assert!(request.subrequests[2].shard_state.is_none());

                let subresponses = vec![
                    metastore::ListShardsSubresponse {
                        index_uid: Some(index_uid0_clone.clone()),
                        source_id: INGEST_V2_SOURCE_ID.to_string(),
                        shards: vec![Shard {
                            shard_id: Some(ShardId::from(42)),
                            index_uid: Some(index_uid0_clone.clone()),
                            source_id: INGEST_V2_SOURCE_ID.to_string(),
                            shard_state: ShardState::Open as i32,
                            leader_id: "node1".to_string(),
                            ..Default::default()
                        }],
                    },
                    metastore::ListShardsSubresponse {
                        index_uid: Some(index_uid1_clone.clone()),
                        source_id: INGEST_V2_SOURCE_ID.to_string(),
                        shards: Vec::new(),
                    },
                ];
                let response = metastore::ListShardsResponse { subresponses };
                Ok(response)
            });
        let mut model = ControlPlaneModel::default();
        let mut metastore = MetastoreServiceClient::from_mock(mock_metastore);
        let progress = Progress::default();
        model
            .load_from_metastore(&mut metastore, &progress)
            .await
            .unwrap();

        assert_eq!(model.index_table.len(), 3);
        assert_eq!(*model.index_uid("test-index-0").unwrap(), index_uid0);
        assert_eq!(*model.index_uid("test-index-1").unwrap(), index_uid1);
        assert_eq!(*model.index_uid("test-index-2").unwrap(), index_uid2);

        assert_eq!(model.shard_table.num_shards(), 1);

        let source_uid_0 = SourceUid {
            index_uid: index_uid0.clone(),
            source_id: INGEST_V2_SOURCE_ID.to_string(),
        };
        let shards: Vec<&ShardEntry> = model
            .shard_table
            .get_shards(&source_uid_0)
            .unwrap()
            .values()
            .collect();
        assert_eq!(shards.len(), 1);
        assert_eq!(shards[0].shard_id(), ShardId::from(42));

        let source_uid_1 = SourceUid {
            index_uid: index_uid1.clone(),
            source_id: INGEST_V2_SOURCE_ID.to_string(),
        };
        let shards: Vec<&ShardEntry> = model
            .shard_table
            .get_shards(&source_uid_1)
            .unwrap()
            .values()
            .collect();
        assert_eq!(shards.len(), 0);
    }

    #[test]
    fn test_control_plane_model_add_index() {
        let mut model = ControlPlaneModel::default();
        let index_metadata = IndexMetadata::for_test("test-index", "ram:///indexes");
        let index_uid = index_metadata.index_uid.clone();
        model.add_index(index_metadata.clone());

        assert_eq!(model.index_table.len(), 1);
        assert_eq!(model.index_table.get(&index_uid).unwrap(), &index_metadata);

        assert_eq!(model.index_uid_table.len(), 1);
        assert_eq!(*model.index_uid("test-index").unwrap(), index_uid);
    }

    #[test]
    fn test_control_plane_model_add_index_with_sources() {
        let mut model = ControlPlaneModel::default();
        let mut index_metadata = IndexMetadata::for_test("test-index", "ram:///indexes");
        index_metadata.add_source(SourceConfig::cli()).unwrap();
        index_metadata
            .add_source(SourceConfig::ingest_v2())
            .unwrap();
        let index_uid = index_metadata.index_uid.clone();
        model.add_index(index_metadata.clone());

        assert_eq!(model.index_table.len(), 1);
        assert_eq!(model.index_table.get(&index_uid).unwrap(), &index_metadata);

        assert_eq!(model.index_uid_table.len(), 1);
        assert_eq!(*model.index_uid("test-index").unwrap(), index_uid);

        assert_eq!(model.shard_table.num_sources(), 1);

        let source_uid = SourceUid {
            index_uid: index_uid.clone(),
            source_id: INGEST_V2_SOURCE_ID.to_string(),
        };
        assert_eq!(model.shard_table.get_shards(&source_uid).unwrap().len(), 0);
    }

    #[test]
    fn test_control_plane_model_update_index_config() {
        let mut model = ControlPlaneModel::default();
        let index_metadata = IndexMetadata::for_test("test-index", "ram:///indexes");
        let index_uid = index_metadata.index_uid.clone();
        model.add_index(index_metadata.clone());

        // Update the index config
        let mut index_config = index_metadata.index_config.clone();
        index_config.search_settings.default_search_fields = vec!["myfield".to_string()];
        model
            .update_index_config(&index_uid, index_config.clone())
            .unwrap();

        assert_eq!(model.index_table.len(), 1);
        assert_eq!(
            model.index_table.get(&index_uid).unwrap().index_config,
            index_config
        );
    }

    #[test]
    fn test_control_plane_model_update_sources() {
        let mut model = ControlPlaneModel::default();
        let mut index_metadata = IndexMetadata::for_test("test-index", "ram:///indexes");
        let mut my_source = SourceConfig::for_test("my-source", SourceParams::void());
        index_metadata.add_source(my_source.clone()).unwrap();
        index_metadata
            .add_source(SourceConfig::ingest_v2())
            .unwrap();
        let index_uid = index_metadata.index_uid.clone();
        model.add_index(index_metadata.clone());

        // Update a source
        my_source.transform_config = Some(TransformConfig::new("del(.username)".to_string(), None));
        model.update_source(&index_uid, my_source.clone()).unwrap();

        assert_eq!(model.index_table.len(), 1);
        assert_eq!(
            model
                .index_table
                .get(&index_uid)
                .unwrap()
                .sources
                .get("my-source")
                .unwrap(),
            &my_source
        );
    }

    #[test]
    fn test_control_plane_model_delete_index() {
        let mut model = ControlPlaneModel::default();

        let mut index_metadata = IndexMetadata::for_test("test-index", "ram:///indexes");
        let index_uid = index_metadata.index_uid.clone();
        model.delete_index(&index_uid);

        index_metadata
            .add_source(SourceConfig::ingest_v2())
            .unwrap();
        model.add_index(index_metadata);

        model.delete_index(&index_uid);

        assert!(model.index_table.is_empty());
        assert!(model.index_uid_table.is_empty());
        assert_eq!(model.shard_table.num_sources(), 0);
    }

    #[test]
    fn test_control_plane_model_toggle_source() {
        let mut model = ControlPlaneModel::default();
        let index_metadata = IndexMetadata::for_test("test-index", "ram:///indexes");
        let index_uid = index_metadata.index_uid.clone();
        model.add_index(index_metadata);
        let source_config = SourceConfig::for_test("test-source", SourceParams::void());
        model.add_source(&index_uid, source_config).unwrap();
        {
            let has_changed = model
                .toggle_source(&index_uid, &"test-source".to_string(), true)
                .unwrap();
            assert!(!has_changed);
        }
        {
            let has_changed = model
                .toggle_source(&index_uid, &"test-source".to_string(), true)
                .unwrap();
            assert!(!has_changed);
        }
        {
            let has_changed = model
                .toggle_source(&index_uid, &"test-source".to_string(), false)
                .unwrap();
            assert!(has_changed);
        }
        {
            let has_changed = model
                .toggle_source(&index_uid, &"test-source".to_string(), false)
                .unwrap();
            assert!(!has_changed);
        }
        {
            let has_changed = model
                .toggle_source(&index_uid, &"test-source".to_string(), true)
                .unwrap();
            assert!(has_changed);
        }
        {
            let has_changed = model
                .toggle_source(&index_uid, &"test-source".to_string(), true)
                .unwrap();
            assert!(!has_changed);
        }
    }
}


================================================
FILE: quickwit/quickwit-control-plane/src/model/shard_table.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::hash_map::Entry;
use std::collections::{BTreeSet, HashMap};
use std::ops::{Deref, DerefMut};
use std::time::Duration;

use fnv::{FnvHashMap, FnvHashSet};
use quickwit_common::metrics::index_label;
use quickwit_common::rate_limiter::{RateLimiter, RateLimiterSettings};
use quickwit_common::tower::ConstantRate;
use quickwit_ingest::{RateMibPerSec, ShardInfo, ShardInfos};
use quickwit_proto::ingest::{Shard, ShardState};
use quickwit_proto::types::{IndexUid, NodeId, ShardId, SourceId, SourceUid};
use tracing::{error, info, warn};

/// Limits the number of scale up operations that can happen to a source to 5 per minute.
const SCALING_UP_RATE_LIMITER_SETTINGS: RateLimiterSettings = RateLimiterSettings {
    burst_limit: 5,
    rate_limit: ConstantRate::new(5, Duration::from_secs(60)),
    refill_period: Duration::from_secs(12),
};

/// Limits the number of shards that can be closed for scaling down a source to 1 per minute.
const SCALING_DOWN_RATE_LIMITER_SETTINGS: RateLimiterSettings = RateLimiterSettings {
    burst_limit: 1,
    rate_limit: ConstantRate::new(1, Duration::from_secs(60)),
    refill_period: Duration::from_secs(60),
};

#[derive(Debug, Clone, Copy, Eq, PartialEq)]
pub(crate) enum ScalingMode {
    /// Scale up by adding this number of shards
    Up(usize),
    /// Scale down by removing one shard
    Down,
}

#[derive(Debug, Clone)]
pub(crate) struct ShardEntry {
    pub shard: Shard,
    pub short_term_ingestion_rate: RateMibPerSec,
    pub long_term_ingestion_rate: RateMibPerSec,
}

impl Deref for ShardEntry {
    type Target = Shard;

    fn deref(&self) -> &Self::Target {
        &self.shard
    }
}

impl DerefMut for ShardEntry {
    fn deref_mut(&mut self) -> &mut Self::Target {
        &mut self.shard
    }
}

impl From<Shard> for ShardEntry {
    fn from(shard: Shard) -> Self {
        Self {
            shard,
            short_term_ingestion_rate: RateMibPerSec::default(),
            long_term_ingestion_rate: RateMibPerSec::default(),
        }
    }
}

#[derive(Debug)]
pub(crate) struct ShardTableEntry {
    shard_entries: FnvHashMap<ShardId, ShardEntry>,
    scaling_up_rate_limiter: RateLimiter,
    scaling_down_rate_limiter: RateLimiter,
}

impl Default for ShardTableEntry {
    fn default() -> Self {
        Self {
            shard_entries: Default::default(),
            scaling_up_rate_limiter: RateLimiter::from_settings(SCALING_UP_RATE_LIMITER_SETTINGS),
            scaling_down_rate_limiter: RateLimiter::from_settings(
                SCALING_DOWN_RATE_LIMITER_SETTINGS,
            ),
        }
    }
}

impl ShardTableEntry {
    fn is_empty(&self) -> bool {
        self.shard_entries.is_empty()
    }

    fn shards_stats(&self) -> ShardStats {
        let mut num_open_shards = 0;
        let mut num_closed_shards = 0;
        let mut short_term_ingestion_rate_sum = 0;
        let mut long_term_ingestion_rate_sum = 0;

        for shard_entry in self.shard_entries.values() {
            if shard_entry.is_open() {
                num_open_shards += 1;
                short_term_ingestion_rate_sum += shard_entry.short_term_ingestion_rate.0 as usize;
                long_term_ingestion_rate_sum += shard_entry.long_term_ingestion_rate.0 as usize;
            } else if shard_entry.is_closed() {
                num_closed_shards += 1;
            }
        }
        let avg_short_term_ingestion_rate = if num_open_shards > 0 {
            short_term_ingestion_rate_sum as f32 / num_open_shards as f32
        } else {
            0.0
        };
        let avg_long_term_ingestion_rate = if num_open_shards > 0 {
            long_term_ingestion_rate_sum as f32 / num_open_shards as f32
        } else {
            0.0
        };
        ShardStats {
            num_open_shards,
            num_closed_shards,
            avg_short_term_ingestion_rate,
            avg_long_term_ingestion_rate,
        }
    }
}

#[derive(Default)]
pub struct ShardLocations<'a> {
    shard_locations: HashMap<&'a ShardId, smallvec::SmallVec<[&'a NodeId; 2]>>,
}

impl<'a> ShardLocations<'a> {
    pub(crate) fn add_location(&mut self, shard_id: &'a ShardId, ingester_id: &'a NodeId) {
        let locations = self.shard_locations.entry(shard_id).or_default();
        if locations.contains(&ingester_id) {
            warn!("shard {shard_id:?} was registered twice the same ingester {ingester_id:?}");
        } else {
            locations.push(ingester_id);
        }
    }

    /// Returns the list of indexer holding the given shard.
    /// No guarantee is made on the order of the returned list.
    pub fn get_shard_locations(&self, shard_id: &ShardId) -> &[&'a NodeId] {
        let Some(node_ids) = self.shard_locations.get(shard_id) else {
            return &[];
        };
        node_ids.as_slice()
    }
}

// A table that keeps track of the existing shards for each index and source,
// and for each ingester, the list of shards it is supposed to host.
//
// (All mutable methods must maintain these two invariants.)
#[derive(Debug, Default)]
pub(crate) struct ShardTable {
    table_entries: FnvHashMap<SourceUid, ShardTableEntry>,
    ingester_shards: FnvHashMap<NodeId, FnvHashMap<SourceUid, BTreeSet<ShardId>>>,
}

// Removes the shards from the ingester_shards map.
//
// This function is used to maintain the shard table invariant.
// Logs an error if the shard was not found in the ingester_shards map.
fn remove_shard_from_ingesters_internal(
    source_uid: &SourceUid,
    shard: &Shard,
    ingester_shards: &mut FnvHashMap<NodeId, FnvHashMap<SourceUid, BTreeSet<ShardId>>>,
) {
    for node in shard.ingesters() {
        let ingester_shards = ingester_shards
            .get_mut(node)
            .expect("shard table reached inconsistent state");
        let shard_ids = ingester_shards.get_mut(source_uid).unwrap();
        let shard_was_removed = shard_ids.remove(shard.shard_id());
        if !shard_was_removed {
            error!(
                "shard table has reached an inconsistent state. shard {shard:?} was removed from \
                 the shard table but was apparently not in the ingester_shards map."
            );
        }
    }
}

impl ShardTable {
    /// Returns a ShardLocations object that maps each shard to the list of ingesters hosting it.
    /// All shards are considered regardless of their state (including unavailable).
    pub fn shard_locations(&self) -> ShardLocations<'_> {
        let mut shard_locations = ShardLocations::default();
        for (ingester_id, source_shards) in &self.ingester_shards {
            for shard_ids in source_shards.values() {
                for shard_id in shard_ids {
                    shard_locations.add_location(shard_id, ingester_id);
                }
            }
        }
        shard_locations
    }

    /// Removes all the entries that match the target index ID.
    pub fn delete_index(&mut self, index_id: &str) {
        let shards_removed = self
            .table_entries
            .iter()
            .filter(|(source_uid, _)| source_uid.index_uid.index_id == index_id)
            .flat_map(|(source_uid, shard_table_entry)| {
                shard_table_entry
                    .shard_entries
                    .values()
                    .map(move |shard_entry: &ShardEntry| (source_uid, &shard_entry.shard))
            });
        for (source_uid, shard) in shards_removed {
            remove_shard_from_ingesters_internal(source_uid, shard, &mut self.ingester_shards);
        }
        self.table_entries
            .retain(|source_uid, _| source_uid.index_uid.index_id != index_id);
        self.check_invariant();
    }

    /// Checks whether the shard table is consistent.
    ///
    /// Panics if it is not.
    #[allow(clippy::mutable_key_type)]
    fn check_invariant(&self) {
        // This function is expensive! Let's not call it in release mode.
        if !cfg!(debug_assertions) {
            return;
        };
        let mut shard_sets_in_shard_table = FnvHashSet::default();
        for (source_uid, shard_table_entry) in &self.table_entries {
            for (shard_id, shard_entry) in &shard_table_entry.shard_entries {
                debug_assert_eq!(shard_id, shard_entry.shard.shard_id());
                debug_assert_eq!(&source_uid.index_uid, shard_entry.shard.index_uid());
                for node in shard_entry.shard.ingesters() {
                    shard_sets_in_shard_table.insert((node, source_uid, shard_id));
                }
            }
        }
        for (node, ingester_shards) in &self.ingester_shards {
            for (source_uid, shard_ids) in ingester_shards {
                for shard_id in shard_ids {
                    let shard_table_entry = self.table_entries.get(source_uid).unwrap();
                    debug_assert!(shard_table_entry.shard_entries.contains_key(shard_id));
                    debug_assert!(shard_sets_in_shard_table.remove(&(node, source_uid, shard_id)));
                }
            }
        }
    }

    /// Lists all the shards hosted on a given node, regardless of whether it is a
    /// leader or a follower.
    pub fn list_shards_for_node(
        &self,
        ingester: &NodeId,
    ) -> Option<&FnvHashMap<SourceUid, BTreeSet<ShardId>>> {
        self.ingester_shards.get(ingester)
    }

    pub fn list_shards_for_index<'a>(
        &'a self,
        index_uid: &'a IndexUid,
    ) -> impl Iterator<Item = &'a ShardEntry> + 'a {
        self.table_entries
            .iter()
            .filter(move |(source_uid, _)| source_uid.index_uid == *index_uid)
            .flat_map(|(_, shard_table_entry)| shard_table_entry.shard_entries.values())
    }

    pub fn num_sources(&self) -> usize {
        self.table_entries.len()
    }

    #[cfg(test)]
    pub fn num_shards(&self) -> usize {
        self.table_entries
            .values()
            .map(|shard_table_entry| shard_table_entry.shard_entries.len())
            .sum()
    }

    /// Adds a new empty entry for the given index and source.
    ///
    /// TODO check and document the behavior on error (if the source was already here).
    pub fn add_source(&mut self, index_uid: &IndexUid, source_id: &SourceId) {
        let source_uid = SourceUid {
            index_uid: index_uid.clone(),
            source_id: source_id.clone(),
        };
        let table_entry = ShardTableEntry::default();
        let previous_table_entry_opt = self.table_entries.insert(source_uid, table_entry);
        if let Some(previous_table_entry) = previous_table_entry_opt
            && !previous_table_entry.is_empty()
        {
            error!(
                "shard table entry for index `{}` and source `{}` already exists",
                index_uid.index_id, source_id
            );
        }
        self.check_invariant();
    }

    pub fn delete_source(&mut self, index_uid: &IndexUid, source_id: &SourceId) {
        let source_uid = SourceUid {
            index_uid: index_uid.clone(),
            source_id: source_id.clone(),
        };
        let Some(shard_table_entry) = self.table_entries.remove(&source_uid) else {
            return;
        };
        for shard_entry in shard_table_entry.shard_entries.values() {
            remove_shard_from_ingesters_internal(
                &source_uid,
                &shard_entry.shard,
                &mut self.ingester_shards,
            );
        }
        self.check_invariant();
    }

    pub(crate) fn all_shards(&self) -> impl Iterator<Item = &ShardEntry> + '_ {
        self.table_entries
            .values()
            .flat_map(|table_entry| table_entry.shard_entries.values())
    }

    pub(crate) fn all_shards_with_source(
        &self,
    ) -> impl Iterator<Item = (&SourceUid, impl Iterator<Item = &ShardEntry>)> + '_ {
        self.table_entries
            .iter()
            .map(|(source, shard_table)| (source, shard_table.shard_entries.values()))
    }

    /// Lists the shards of a given source. Returns `None` if the source does not exist.
    pub fn get_shards(&self, source_uid: &SourceUid) -> Option<&FnvHashMap<ShardId, ShardEntry>> {
        self.table_entries
            .get(source_uid)
            .map(|table_entry| &table_entry.shard_entries)
    }

    /// Lists the shards of a given source. Returns `None` if the source does not exist.
    pub fn get_shards_mut(
        &mut self,
        source_uid: &SourceUid,
    ) -> Option<&mut FnvHashMap<ShardId, ShardEntry>> {
        self.table_entries
            .get_mut(source_uid)
            .map(|table_entry| &mut table_entry.shard_entries)
    }

    /// Inserts the shards into the shard table.
    pub fn insert_shards(
        &mut self,
        index_uid: &IndexUid,
        source_id: &SourceId,
        opened_shards: Vec<Shard>,
    ) {
        let source_uid = SourceUid {
            index_uid: index_uid.clone(),
            source_id: source_id.clone(),
        };
        for shard in &opened_shards {
            if shard.index_uid() != &source_uid.index_uid || shard.source_id != source_uid.source_id
            {
                panic!(
                    "shard source UID `{}/{}` does not match source UID `{source_uid}`",
                    shard.index_uid(),
                    shard.source_id,
                );
            }
        }
        for shard in &opened_shards {
            for node in shard.ingesters() {
                let ingester_shards = self.ingester_shards.entry(node.to_owned()).or_default();
                let shard_ids = ingester_shards.entry(source_uid.clone()).or_default();
                shard_ids.insert(shard.shard_id().clone());
            }
        }
        match self.table_entries.entry(source_uid.clone()) {
            Entry::Occupied(mut entry) => {
                let table_entry = entry.get_mut();
                for opened_shard in opened_shards {
                    // We only insert shards that we don't know about because the control plane
                    // knows more about the state of the shards than the metastore.
                    table_entry
                        .shard_entries
                        .entry(opened_shard.shard_id().clone())
                        .or_insert_with(|| ShardEntry::from(opened_shard));
                }
            }
            // This should never happen if the control plane view is consistent with the state of
            // the metastore, so should we panic here? Warnings are most likely going to go
            // unnoticed.
            Entry::Vacant(entry) => {
                warn!(
                    "control plane inconsistent with metastore: inserting shards for a \
                     non-existing source (please report)"
                );
                let shard_entries: FnvHashMap<ShardId, ShardEntry> = opened_shards
                    .into_iter()
                    .map(|shard| (shard.shard_id().clone(), shard.into()))
                    .collect();
                let table_entry = ShardTableEntry {
                    shard_entries,
                    ..Default::default()
                };
                entry.insert(table_entry);
            }
        }
        // Let's now update the open shard metrics for this specific index.
        self.update_shard_metrics_for_source_uid(&source_uid);
        self.check_invariant();
    }

    /// Finds open shards for a given index and source and whose leaders are not in the set of
    /// unavailable ingesters.
    pub fn find_open_shards(
        &self,
        index_uid: &IndexUid,
        source_id: &SourceId,
        unavailable_leaders: &FnvHashSet<NodeId>,
    ) -> Option<Vec<ShardEntry>> {
        let source_uid = SourceUid {
            index_uid: index_uid.clone(),
            source_id: source_id.clone(),
        };
        let table_entry = self.table_entries.get(&source_uid)?;
        let open_shards: Vec<ShardEntry> = table_entry
            .shard_entries
            .values()
            .filter(|shard_entry| {
                shard_entry.shard.is_open() && !unavailable_leaders.contains(&shard_entry.leader_id)
            })
            .cloned()
            .collect();
        Some(open_shards)
    }

    pub fn update_shard_metrics_for_source_uid(&self, source_uid: &SourceUid) {
        let Some(table_entry) = self.table_entries.get(source_uid) else {
            return;
        };
        let index_id = source_uid.index_uid.index_id.as_str();
        let index_label = index_label(index_id);

        // If `index_label(index_id)` returns `index_id`, then per-index metrics are enabled and we
        // can update the metrics for this specific index.
        if index_label == index_id {
            let shard_stats = table_entry.shards_stats();
            crate::metrics::CONTROL_PLANE_METRICS
                .open_shards
                .with_label_values([index_label])
                .set(shard_stats.num_open_shards as i64);
            crate::metrics::CONTROL_PLANE_METRICS
                .closed_shards
                .with_label_values([index_label])
                .set(shard_stats.num_closed_shards as i64);
            return;
        }
        // Per-index metrics are disabled, so we update the metrics for all sources.
        let mut num_open_shards = 0;
        let mut num_closed_shards = 0;

        for shard_entry in self.all_shards() {
            if shard_entry.is_open() {
                num_open_shards += 1;
            } else if shard_entry.is_closed() {
                num_closed_shards += 1;
            }
        }
        crate::metrics::CONTROL_PLANE_METRICS
            .open_shards
            .with_label_values([index_label])
            .set(num_open_shards as i64);
        crate::metrics::CONTROL_PLANE_METRICS
            .closed_shards
            .with_label_values([index_label])
            .set(num_closed_shards as i64);
    }

    pub fn update_shards(
        &mut self,
        source_uid: &SourceUid,
        shard_infos: &ShardInfos,
    ) -> ShardStats {
        let Some(table_entry) = self.table_entries.get_mut(source_uid) else {
            return ShardStats::default();
        };
        for shard_info in shard_infos {
            let ShardInfo {
                shard_id,
                shard_state,
                short_term_ingestion_rate,
                long_term_ingestion_rate,
            } = shard_info;

            if let Some(shard_entry) = table_entry.shard_entries.get_mut(shard_id) {
                shard_entry.short_term_ingestion_rate = *short_term_ingestion_rate;
                shard_entry.long_term_ingestion_rate = *long_term_ingestion_rate;
                // `ShardInfos` are broadcasted via Chitchat and eventually consistent. As a
                // result, we can only trust the `Closed` state, which is final.
                if shard_state.is_closed() {
                    shard_entry.set_shard_state(ShardState::Closed);
                }
            }
        }
        table_entry.shards_stats()
    }

    /// Sets the state of the shards identified by their index UID, source ID, and shard IDs to
    /// `Closed`.
    pub fn close_shards(&mut self, source_uid: &SourceUid, shard_ids: &[ShardId]) -> Vec<ShardId> {
        let Some(table_entry) = self.table_entries.get_mut(source_uid) else {
            return Vec::new();
        };
        let mut closed_shard_ids = Vec::new();

        for shard_id in shard_ids {
            if let Some(shard_entry) = table_entry.shard_entries.get_mut(shard_id) {
                if !shard_entry.is_closed() {
                    shard_entry.set_shard_state(ShardState::Closed);
                    closed_shard_ids.push(shard_id.clone());
                }
            } else {
                info!(
                    index_id=%source_uid.index_uid.index_id,
                    source_id=%source_uid.source_id,
                    %shard_id,
                    "ignoring attempt to close shard: it is unknown (probably because it has been deleted)"
                );
            }
        }
        self.update_shard_metrics_for_source_uid(source_uid);
        closed_shard_ids
    }

    /// Removes the shards identified by their index UID, source ID, and shard IDs.
    pub fn delete_shards(&mut self, source_uid: &SourceUid, shard_ids: &[ShardId]) {
        let Some(table_entry) = self.table_entries.get_mut(source_uid) else {
            return;
        };
        let mut shard_entries_to_remove: Vec<ShardEntry> = Vec::new();
        for shard_id in shard_ids {
            if let Some(shard_entry) = table_entry.shard_entries.remove(shard_id) {
                shard_entries_to_remove.push(shard_entry);
            } else {
                warn!(shard=%shard_id, "deleting a non-existing shard");
            }
        }
        for shard_entry in shard_entries_to_remove {
            remove_shard_from_ingesters_internal(
                source_uid,
                &shard_entry.shard,
                &mut self.ingester_shards,
            );
        }
        self.check_invariant();
        self.update_shard_metrics_for_source_uid(source_uid);
    }

    pub fn acquire_scaling_permits(
        &mut self,
        source_uid: &SourceUid,
        scaling_mode: ScalingMode,
    ) -> Option<bool> {
        let table_entry = self.table_entries.get_mut(source_uid)?;
        let scaling_rate_limiter = match scaling_mode {
            ScalingMode::Up(_) => &mut table_entry.scaling_up_rate_limiter,
            ScalingMode::Down => &mut table_entry.scaling_down_rate_limiter,
        };
        Some(scaling_rate_limiter.acquire(1))
    }

    pub fn drain_scaling_permits(&mut self, source_uid: &SourceUid, scaling_mode: ScalingMode) {
        if let Some(table_entry) = self.table_entries.get_mut(source_uid) {
            let scaling_rate_limiter = match scaling_mode {
                ScalingMode::Up(_) => &mut table_entry.scaling_up_rate_limiter,
                ScalingMode::Down => &mut table_entry.scaling_down_rate_limiter,
            };
            scaling_rate_limiter.drain();
        }
    }

    pub fn release_scaling_permits(&mut self, source_uid: &SourceUid, scaling_mode: ScalingMode) {
        if let Some(table_entry) = self.table_entries.get_mut(source_uid) {
            let scaling_rate_limiter = match scaling_mode {
                ScalingMode::Up(_) => &mut table_entry.scaling_up_rate_limiter,
                ScalingMode::Down => &mut table_entry.scaling_down_rate_limiter,
            };
            scaling_rate_limiter.release(1);
        }
    }
}

#[derive(Clone, Copy, Default)]
pub(crate) struct ShardStats {
    pub num_open_shards: usize,
    pub num_closed_shards: usize,
    /// Average short-term ingestion rate (MiB/s) over all open shards.
    pub avg_short_term_ingestion_rate: f32,
    /// Average long-term ingestion rate (MiB/s) over all open shards.
    pub avg_long_term_ingestion_rate: f32,
}

#[cfg(test)]
mod tests {
    use std::collections::BTreeSet;

    use itertools::Itertools;
    use quickwit_proto::ingest::Shard;

    use super::*;

    impl ShardTableEntry {
        pub fn shards(&self) -> Vec<Shard> {
            self.shard_entries
                .values()
                .map(|shard_entry| shard_entry.shard.clone())
                .sorted_unstable_by(|left, right| left.shard_id.cmp(&right.shard_id))
                .collect()
        }
    }

    impl ShardTable {
        pub fn find_open_shards_sorted(
            &self,
            index_uid: &IndexUid,
            source_id: &SourceId,
            unavailable_leaders: &FnvHashSet<NodeId>,
        ) -> Option<Vec<ShardEntry>> {
            self.find_open_shards(index_uid, source_id, unavailable_leaders)
                .map(|mut shards| {
                    shards.sort_unstable_by(|left, right| {
                        left.shard.shard_id.cmp(&right.shard.shard_id)
                    });
                    shards
                })
        }
    }

    #[test]
    fn test_shard_table_delete_index() {
        let mut shard_table = ShardTable::default();
        shard_table.delete_index("test-index");

        let index_uid_0: IndexUid = IndexUid::for_test("test-index-foo", 0);
        let source_id_0 = "test-source-0".to_string();
        shard_table.add_source(&index_uid_0, &source_id_0);

        let source_id_1 = "test-source-1".to_string();
        shard_table.add_source(&index_uid_0, &source_id_1);

        let index_uid_1: IndexUid = IndexUid::for_test("test-index-bar", 1);
        shard_table.add_source(&index_uid_1, &source_id_0);

        shard_table.delete_index("test-index-foo");
        assert_eq!(shard_table.table_entries.len(), 1);

        assert!(shard_table.table_entries.contains_key(&SourceUid {
            index_uid: index_uid_1,
            source_id: source_id_0
        }));
    }

    #[test]
    fn test_shard_table_add_source() {
        let index_uid: IndexUid = IndexUid::for_test("test-index", 0);
        let source_id = "test-source".to_string();

        let mut shard_table = ShardTable::default();
        shard_table.add_source(&index_uid, &source_id);
        assert_eq!(shard_table.table_entries.len(), 1);

        let source_uid = SourceUid {
            index_uid,
            source_id,
        };
        let table_entry = shard_table.table_entries.get(&source_uid).unwrap();
        assert!(table_entry.shard_entries.is_empty());
    }

    #[test]
    fn test_shard_table_list_shards() {
        let index_uid: IndexUid = IndexUid::for_test("test-index", 0);
        let source_id = "test-source".to_string();
        let source_uid = SourceUid {
            index_uid: index_uid.clone(),
            source_id: source_id.clone(),
        };
        let mut shard_table = ShardTable::default();

        assert!(shard_table.get_shards(&source_uid).is_none());

        shard_table.add_source(&index_uid, &source_id);
        let shards = shard_table.get_shards(&source_uid).unwrap();
        assert_eq!(shards.len(), 0);

        let shard_01 = Shard {
            index_uid: index_uid.clone().into(),
            source_id: source_id.clone(),
            shard_id: Some(ShardId::from(1)),
            leader_id: "test-leader-0".to_string(),
            shard_state: ShardState::Closed as i32,
            ..Default::default()
        };
        shard_table.insert_shards(&index_uid, &source_id, vec![shard_01]);

        let shards = shard_table.get_shards(&source_uid).unwrap();
        assert_eq!(shards.len(), 1);
    }

    #[test]
    fn test_shard_table_insert_newly_opened_shards() {
        let index_uid_0: IndexUid = IndexUid::for_test("test-index", 0);
        let source_id = "test-source".to_string();

        let mut shard_table = ShardTable::default();

        let shard_01 = Shard {
            index_uid: index_uid_0.clone().into(),
            source_id: source_id.clone(),
            shard_id: Some(ShardId::from(1)),
            leader_id: "test-leader-0".to_string(),
            shard_state: ShardState::Open as i32,
            ..Default::default()
        };
        shard_table.insert_shards(&index_uid_0, &source_id, vec![shard_01.clone()]);

        assert_eq!(shard_table.table_entries.len(), 1);

        let source_uid = SourceUid {
            index_uid: index_uid_0.clone(),
            source_id: source_id.clone(),
        };
        let table_entry = shard_table.table_entries.get(&source_uid).unwrap();
        let shards = table_entry.shards();
        assert_eq!(shards.len(), 1);
        assert_eq!(shards[0], shard_01);

        shard_table
            .table_entries
            .get_mut(&source_uid)
            .unwrap()
            .shard_entries
            .get_mut(&ShardId::from(1))
            .unwrap()
            .set_shard_state(ShardState::Unavailable);

        let shard_02 = Shard {
            index_uid: index_uid_0.clone().into(),
            source_id: source_id.clone(),
            shard_id: Some(ShardId::from(2)),
            leader_id: "test-leader-0".to_string(),
            shard_state: ShardState::Open as i32,
            ..Default::default()
        };

        shard_table.insert_shards(
            &index_uid_0,
            &source_id,
            vec![shard_01.clone(), shard_02.clone()],
        );

        assert_eq!(shard_table.table_entries.len(), 1);

        let source_uid = SourceUid {
            index_uid: index_uid_0.clone(),
            source_id: source_id.clone(),
        };
        let table_entry = shard_table.table_entries.get(&source_uid).unwrap();
        let shards = table_entry.shards();
        assert_eq!(shards.len(), 2);
        assert_eq!(shards[0].shard_state(), ShardState::Unavailable);
        assert_eq!(shards[1], shard_02);
    }

    #[test]
    fn test_shard_table_find_open_shards() {
        let index_uid: IndexUid = IndexUid::for_test("test-index", 0);
        let source_id = "test-source".to_string();

        let mut shard_table = ShardTable::default();
        shard_table.add_source(&index_uid, &source_id);

        let mut unavailable_ingesters = FnvHashSet::default();

        let open_shards = shard_table
            .find_open_shards_sorted(&index_uid, &source_id, &unavailable_ingesters)
            .unwrap();
        assert_eq!(open_shards.len(), 0);

        let shard_01 = Shard {
            index_uid: index_uid.clone().into(),
            source_id: source_id.clone(),
            shard_id: Some(ShardId::from(1)),
            leader_id: "test-leader-0".to_string(),
            shard_state: ShardState::Closed as i32,
            ..Default::default()
        };
        let shard_02 = Shard {
            index_uid: index_uid.clone().into(),
            source_id: source_id.clone(),
            shard_id: Some(ShardId::from(2)),
            leader_id: "test-leader-0".to_string(),
            shard_state: ShardState::Unavailable as i32,
            ..Default::default()
        };
        let shard_03 = Shard {
            index_uid: index_uid.clone().into(),
            source_id: source_id.clone(),
            shard_id: Some(ShardId::from(3)),
            leader_id: "test-leader-0".to_string(),
            shard_state: ShardState::Open as i32,
            ..Default::default()
        };
        let shard_04 = Shard {
            index_uid: index_uid.clone().into(),
            source_id: source_id.clone(),
            shard_id: Some(ShardId::from(4)),
            leader_id: "test-leader-1".to_string(),
            shard_state: ShardState::Open as i32,
            ..Default::default()
        };
        shard_table.insert_shards(
            &index_uid,
            &source_id,
            vec![shard_01, shard_02, shard_03.clone(), shard_04.clone()],
        );
        let open_shards = shard_table
            .find_open_shards_sorted(&index_uid, &source_id, &unavailable_ingesters)
            .unwrap();
        assert_eq!(open_shards.len(), 2);
        assert_eq!(open_shards[0].shard, shard_03);
        assert_eq!(open_shards[1].shard, shard_04);

        unavailable_ingesters.insert("test-leader-0".into());

        let open_shards = shard_table
            .find_open_shards_sorted(&index_uid, &source_id, &unavailable_ingesters)
            .unwrap();
        assert_eq!(open_shards.len(), 1);
        assert_eq!(open_shards[0].shard, shard_04);
    }

    #[test]
    fn test_shard_table_update_shards() {
        let index_uid: IndexUid = IndexUid::for_test("test-index", 0);
        let source_id = "test-source".to_string();

        let mut shard_table = ShardTable::default();

        let shard_01 = Shard {
            index_uid: Some(index_uid.clone()),
            source_id: source_id.clone(),
            shard_id: Some(ShardId::from(1)),
            shard_state: ShardState::Open as i32,
            ..Default::default()
        };
        let shard_02 = Shard {
            index_uid: Some(index_uid.clone()),
            source_id: source_id.clone(),
            shard_id: Some(ShardId::from(2)),
            shard_state: ShardState::Open as i32,
            ..Default::default()
        };
        let shard_03 = Shard {
            index_uid: Some(index_uid.clone()),
            source_id: source_id.clone(),
            shard_id: Some(ShardId::from(3)),
            shard_state: ShardState::Unavailable as i32,
            ..Default::default()
        };
        let shard_04 = Shard {
            index_uid: Some(index_uid.clone()),
            source_id: source_id.clone(),
            shard_id: Some(ShardId::from(4)),
            shard_state: ShardState::Open as i32,
            ..Default::default()
        };
        shard_table.insert_shards(
            &index_uid,
            &source_id,
            vec![shard_01, shard_02, shard_03, shard_04],
        );
        let source_uid = SourceUid {
            index_uid,
            source_id,
        };
        let shard_infos = BTreeSet::from_iter([
            ShardInfo {
                shard_id: ShardId::from(1),
                shard_state: ShardState::Open,
                short_term_ingestion_rate: RateMibPerSec(1),
                long_term_ingestion_rate: RateMibPerSec(1),
            },
            ShardInfo {
                shard_id: ShardId::from(2),
                shard_state: ShardState::Open,
                short_term_ingestion_rate: RateMibPerSec(2),
                long_term_ingestion_rate: RateMibPerSec(2),
            },
            ShardInfo {
                shard_id: ShardId::from(3),
                shard_state: ShardState::Open,
                short_term_ingestion_rate: RateMibPerSec(3),
                long_term_ingestion_rate: RateMibPerSec(3),
            },
            ShardInfo {
                shard_id: ShardId::from(4),
                shard_state: ShardState::Closed,
                short_term_ingestion_rate: RateMibPerSec(4),
                long_term_ingestion_rate: RateMibPerSec(4),
            },
            ShardInfo {
                shard_id: ShardId::from(5),
                shard_state: ShardState::Open,
                short_term_ingestion_rate: RateMibPerSec(5),
                long_term_ingestion_rate: RateMibPerSec(5),
            },
        ]);
        let shard_stats = shard_table.update_shards(&source_uid, &shard_infos);
        assert_eq!(shard_stats.num_open_shards, 2);
        assert_eq!(shard_stats.avg_short_term_ingestion_rate, 1.5);

        assert_eq!(shard_stats.avg_short_term_ingestion_rate, 1.5);

        let shard_entries: Vec<ShardEntry> = shard_table
            .get_shards(&source_uid)
            .unwrap()
            .values()
            .cloned()
            .sorted_unstable_by(|left, right| left.shard.shard_id.cmp(&right.shard.shard_id))
            .collect();
        assert_eq!(shard_entries.len(), 4);

        assert_eq!(shard_entries[0].shard.shard_id(), ShardId::from(1));
        assert_eq!(shard_entries[0].shard.shard_state(), ShardState::Open);
        assert_eq!(shard_entries[0].short_term_ingestion_rate, RateMibPerSec(1));

        assert_eq!(shard_entries[1].shard.shard_id(), ShardId::from(2));
        assert_eq!(shard_entries[1].shard.shard_state(), ShardState::Open);
        assert_eq!(shard_entries[1].short_term_ingestion_rate, RateMibPerSec(2));

        assert_eq!(shard_entries[2].shard.shard_id(), ShardId::from(3));
        assert_eq!(
            shard_entries[2].shard.shard_state(),
            ShardState::Unavailable
        );
        assert_eq!(shard_entries[2].short_term_ingestion_rate, RateMibPerSec(3));

        assert_eq!(shard_entries[3].shard.shard_id(), ShardId::from(4));
        assert_eq!(shard_entries[3].shard.shard_state(), ShardState::Closed);
        assert_eq!(shard_entries[3].short_term_ingestion_rate, RateMibPerSec(4));
    }

    #[test]
    fn test_shard_table_close_shards() {
        let index_uid_0: IndexUid = IndexUid::for_test("test-index", 0);
        let index_uid_1: IndexUid = IndexUid::for_test("test-index", 1);
        let source_id = "test-source".to_string();

        let mut shard_table = ShardTable::default();

        let shard_01 = Shard {
            index_uid: index_uid_0.clone().into(),
            source_id: source_id.clone(),
            shard_id: Some(ShardId::from(1)),
            leader_id: "test-leader-0".to_string(),
            shard_state: ShardState::Open as i32,
            ..Default::default()
        };
        let shard_02 = Shard {
            index_uid: index_uid_0.clone().into(),
            source_id: source_id.clone(),
            shard_id: Some(ShardId::from(2)),
            leader_id: "test-leader-0".to_string(),
            shard_state: ShardState::Closed as i32,
            ..Default::default()
        };
        let shard_11 = Shard {
            index_uid: index_uid_1.clone().into(),
            source_id: source_id.clone(),
            shard_id: Some(ShardId::from(1)),
            leader_id: "test-leader-0".to_string(),
            shard_state: ShardState::Open as i32,
            ..Default::default()
        };
        shard_table.insert_shards(&index_uid_0, &source_id, vec![shard_01, shard_02]);
        shard_table.insert_shards(&index_uid_1, &source_id, vec![shard_11]);

        let source_uid_0 = SourceUid {
            index_uid: index_uid_0,
            source_id,
        };
        let closed_shard_ids = shard_table.close_shards(
            &source_uid_0,
            &[ShardId::from(1), ShardId::from(2), ShardId::from(3)],
        );
        assert_eq!(closed_shard_ids, &[ShardId::from(1)]);

        let table_entry = shard_table.table_entries.get(&source_uid_0).unwrap();
        let shards = table_entry.shards();
        assert_eq!(shards[0].shard_state(), ShardState::Closed);
    }

    #[test]
    fn test_shard_table_delete_shards() {
        let mut shard_table = ShardTable::default();

        let index_uid_0: IndexUid = IndexUid::for_test("test-index", 0);
        let index_uid_1: IndexUid = IndexUid::for_test("test-index", 1);
        let source_id = "test-source".to_string();

        let shard_01 = Shard {
            index_uid: index_uid_0.clone().into(),
            source_id: source_id.clone(),
            shard_id: Some(ShardId::from(1)),
            leader_id: "test-leader-0".to_string(),
            shard_state: ShardState::Open as i32,
            ..Default::default()
        };
        let shard_02 = Shard {
            index_uid: index_uid_0.clone().into(),
            source_id: source_id.clone(),
            shard_id: Some(ShardId::from(2)),
            leader_id: "test-leader-0".to_string(),
            shard_state: ShardState::Open as i32,
            ..Default::default()
        };
        let shard_11 = Shard {
            index_uid: index_uid_1.clone().into(),
            source_id: source_id.clone(),
            shard_id: Some(ShardId::from(1)),
            leader_id: "test-leader-0".to_string(),
            shard_state: ShardState::Open as i32,
            ..Default::default()
        };
        shard_table.insert_shards(&index_uid_0, &source_id, vec![shard_01.clone(), shard_02]);
        shard_table.insert_shards(&index_uid_1, &source_id, vec![shard_11]);

        let source_uid_0 = SourceUid {
            index_uid: index_uid_0.clone(),
            source_id: source_id.clone(),
        };
        shard_table.delete_shards(&source_uid_0, &[ShardId::from(2)]);

        let source_uid_1 = SourceUid {
            index_uid: index_uid_1.clone(),
            source_id: source_id.clone(),
        };
        shard_table.delete_shards(&source_uid_1, &[ShardId::from(1)]);

        assert_eq!(shard_table.table_entries.len(), 2);

        let table_entry = shard_table.table_entries.get(&source_uid_0).unwrap();
        let shards = table_entry.shards();
        assert_eq!(shards.len(), 1);
        assert_eq!(shards[0], shard_01);

        let table_entry = shard_table.table_entries.get(&source_uid_1).unwrap();
        assert!(table_entry.is_empty());
    }

    #[test]
    fn test_shard_table_acquire_scaling_up_permits() {
        let mut shard_table = ShardTable::default();

        let index_uid: IndexUid = IndexUid::for_test("test-index", 0);
        let source_id = "test-source".to_string();

        let source_uid = SourceUid {
            index_uid: index_uid.clone(),
            source_id: source_id.clone(),
        };
        assert!(
            shard_table
                .acquire_scaling_permits(&source_uid, ScalingMode::Up(1))
                .is_none()
        );

        shard_table.add_source(&index_uid, &source_id);

        let previous_available_permits = shard_table
            .table_entries
            .get_mut(&source_uid)
            .unwrap()
            .scaling_up_rate_limiter
            .available_permits();

        assert!(
            shard_table
                .acquire_scaling_permits(&source_uid, ScalingMode::Up(1))
                .unwrap()
        );

        let new_available_permits = shard_table
            .table_entries
            .get_mut(&source_uid)
            .unwrap()
            .scaling_up_rate_limiter
            .available_permits();

        assert_eq!(new_available_permits, previous_available_permits - 1);
    }

    #[test]
    fn test_shard_table_acquire_scaling_down_permits() {
        let index_uid: IndexUid = IndexUid::for_test("test-index", 0);
        let source_id = "test-source".to_string();

        let mut shard_table = ShardTable::default();

        let source_uid = SourceUid {
            index_uid: index_uid.clone(),
            source_id: source_id.clone(),
        };
        assert!(
            shard_table
                .acquire_scaling_permits(&source_uid, ScalingMode::Down)
                .is_none()
        );

        shard_table.add_source(&index_uid, &source_id);

        let previous_available_permits = shard_table
            .table_entries
            .get_mut(&source_uid)
            .unwrap()
            .scaling_down_rate_limiter
            .available_permits();

        assert!(
            shard_table
                .acquire_scaling_permits(&source_uid, ScalingMode::Down)
                .unwrap()
        );

        let new_available_permits = shard_table
            .table_entries
            .get_mut(&source_uid)
            .unwrap()
            .scaling_down_rate_limiter
            .available_permits();

        assert_eq!(new_available_permits, previous_available_permits - 1);
    }

    #[test]
    fn test_shard_table_release_scaling_up_permits() {
        let mut shard_table = ShardTable::default();

        let index_uid: IndexUid = IndexUid::for_test("test-index", 0);
        let source_id = "test-source".to_string();

        shard_table.add_source(&index_uid, &source_id);

        let source_uid = SourceUid {
            index_uid: index_uid.clone(),
            source_id: source_id.clone(),
        };
        let previous_available_permits = shard_table
            .table_entries
            .get_mut(&source_uid)
            .unwrap()
            .scaling_up_rate_limiter
            .available_permits();

        assert!(
            shard_table
                .acquire_scaling_permits(&source_uid, ScalingMode::Up(1))
                .unwrap()
        );

        shard_table.release_scaling_permits(&source_uid, ScalingMode::Up(1));

        let new_available_permits = shard_table
            .table_entries
            .get_mut(&source_uid)
            .unwrap()
            .scaling_up_rate_limiter
            .available_permits();

        assert_eq!(new_available_permits, previous_available_permits);
    }

    #[test]
    fn test_shard_table_release_scaling_down_permits() {
        let mut shard_table = ShardTable::default();

        let index_uid: IndexUid = IndexUid::for_test("test-index", 0);
        let source_id = "test-source".to_string();

        shard_table.add_source(&index_uid, &source_id);

        let source_uid = SourceUid {
            index_uid: index_uid.clone(),
            source_id: source_id.clone(),
        };
        let previous_available_permits = shard_table
            .table_entries
            .get_mut(&source_uid)
            .unwrap()
            .scaling_up_rate_limiter
            .available_permits();

        assert!(
            shard_table
                .acquire_scaling_permits(&source_uid, ScalingMode::Down)
                .unwrap()
        );

        shard_table.release_scaling_permits(&source_uid, ScalingMode::Down);

        let new_available_permits = shard_table
            .table_entries
            .get_mut(&source_uid)
            .unwrap()
            .scaling_up_rate_limiter
            .available_permits();

        assert_eq!(new_available_permits, previous_available_permits);
    }

    #[test]
    fn test_shard_locations() {
        let shard1 = ShardId::from("shard1");
        let shard2 = ShardId::from("shard1");
        let unlisted_shard = ShardId::from("unlisted");
        let node1 = NodeId::new("node1".to_string());
        let node2 = NodeId::new("node2".to_string());
        let mut shard_locations = ShardLocations::default();
        shard_locations.add_location(&shard1, &node1);
        shard_locations.add_location(&shard1, &node2);
        // add location called several times should counted once.
        shard_locations.add_location(&shard2, &node2);
        assert_eq!(
            shard_locations.get_shard_locations(&shard1),
            &[&node1, &node2]
        );
        assert_eq!(
            shard_locations.get_shard_locations(&shard2),
            &[&node1, &node2]
        );
        // If the shard is not listed, we do not panic but just return an empty list.
        assert!(
            shard_locations
                .get_shard_locations(&unlisted_shard)
                .is_empty()
        );
    }

    #[test]
    fn test_shard_table_shard_locations() {
        let mut shard_table = ShardTable::default();

        let index_uid0: IndexUid = IndexUid::for_test("test-index0", 0);
        let source_id = "test-source0".to_string();
        shard_table.add_source(&index_uid0, &source_id);

        let index_uid1: IndexUid = IndexUid::for_test("test-index1", 0);
        let source_id = "test-source1".to_string();
        shard_table.add_source(&index_uid1, &source_id);

        let source_uid0 = SourceUid {
            index_uid: index_uid0.clone(),
            source_id: source_id.clone(),
        };

        let source_uid1 = SourceUid {
            index_uid: index_uid1.clone(),
            source_id: source_id.clone(),
        };

        let make_shard = |source_uid: &SourceUid,
                          leader_id: &str,
                          shard_id: u64,
                          follower_id: Option<&str>,
                          shard_state: ShardState| {
            Shard {
                index_uid: source_uid.index_uid.clone().into(),
                source_id: source_uid.source_id.clone(),
                shard_id: Some(ShardId::from(shard_id)),
                leader_id: leader_id.to_string(),
                follower_id: follower_id.map(|s| s.to_string()),
                shard_state: shard_state as i32,
                ..Default::default()
            }
        };

        shard_table.insert_shards(
            &source_uid0.index_uid,
            &source_uid0.source_id,
            vec![
                make_shard(
                    &source_uid0,
                    "indexer1",
                    0,
                    Some("indexer2"),
                    ShardState::Open,
                ),
                make_shard(&source_uid0, "indexer1", 1, None, ShardState::Closed),
                make_shard(&source_uid0, "indexer2", 2, None, ShardState::Open),
            ],
        );

        shard_table.insert_shards(
            &source_uid1.index_uid,
            &source_uid1.source_id,
            vec![
                make_shard(
                    &source_uid1,
                    "indexer2",
                    3,
                    Some("indexer1"),
                    ShardState::Unavailable,
                ),
                make_shard(
                    &source_uid1,
                    "indexer2",
                    3,
                    Some("indexer1"),
                    ShardState::Open,
                ),
            ],
        );

        let shard_locations = shard_table.shard_locations();
        let get_sorted_locations_for_shard = |shard_id: u64| {
            let mut locations = shard_locations
                .get_shard_locations(&ShardId::from(shard_id))
                .to_vec();
            locations.sort();
            locations
        };
        assert_eq!(
            &get_sorted_locations_for_shard(0u64),
            &[&NodeId::from("indexer1"), &NodeId::from("indexer2")]
        );
        assert_eq!(
            &get_sorted_locations_for_shard(1u64),
            &[&NodeId::from("indexer1")]
        );
        assert_eq!(
            &get_sorted_locations_for_shard(2u64),
            &[&NodeId::from("indexer2")]
        );
        assert_eq!(
            &get_sorted_locations_for_shard(3u64),
            &[&NodeId::from("indexer1"), &NodeId::from("indexer2")]
        );
    }
}


================================================
FILE: quickwit/quickwit-control-plane/src/tests.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::num::NonZeroUsize;
use std::time::Duration;

use fnv::FnvHashMap;
use futures::{Stream, StreamExt};
use quickwit_actors::{Inbox, Mailbox, Observe, Universe};
use quickwit_cluster::{ChannelTransport, Cluster, ClusterChange, create_cluster_for_test};
use quickwit_common::test_utils::wait_until_predicate;
use quickwit_common::tower::{Change, Pool};
use quickwit_config::service::QuickwitService;
use quickwit_config::{
    ClusterConfig, KafkaSourceParams, SourceConfig, SourceInputFormat, SourceParams,
};
use quickwit_indexing::IndexingService;
use quickwit_metastore::{IndexMetadata, ListIndexesMetadataResponseExt};
use quickwit_proto::indexing::{ApplyIndexingPlanRequest, CpuCapacity, IndexingServiceClient};
use quickwit_proto::metastore::{
    ListIndexesMetadataResponse, ListShardsResponse, MetastoreServiceClient, MockMetastoreService,
};
use quickwit_proto::types::NodeId;
use serde_json::json;

use crate::IndexerNodeInfo;
use crate::control_plane::{CONTROL_PLAN_LOOP_INTERVAL, ControlPlane};
use crate::indexing_scheduler::MIN_DURATION_BETWEEN_SCHEDULING;

fn index_metadata_for_test(index_id: &str, source_id: &str, num_pipelines: usize) -> IndexMetadata {
    let mut index_metadata = IndexMetadata::for_test(index_id, "ram://indexes/test-index");
    let ingest_source_config = SourceConfig::ingest_v2();
    index_metadata.add_source(ingest_source_config).unwrap();

    let kafka_source_config = SourceConfig {
        enabled: true,
        source_id: source_id.to_string(),
        num_pipelines: NonZeroUsize::new(num_pipelines).unwrap(),
        source_params: SourceParams::Kafka(KafkaSourceParams {
            topic: "topic".to_string(),
            client_log_level: None,
            client_params: json!({
            "bootstrap.servers": "localhost:9092",
            }),
            enable_backfill_mode: true,
        }),
        transform_config: None,
        input_format: SourceInputFormat::Json,
    };
    index_metadata.add_source(kafka_source_config).unwrap();
    index_metadata
}

pub fn test_indexer_change_stream(
    cluster_change_stream: impl Stream<Item = ClusterChange> + Send + 'static,
    indexing_clients: FnvHashMap<NodeId, Mailbox<IndexingService>>,
) -> impl Stream<Item = Change<NodeId, IndexerNodeInfo>> + Send + 'static {
    cluster_change_stream.filter_map(move |cluster_change| {
        let indexing_clients = indexing_clients.clone();
        Box::pin(async move {
            match cluster_change {
                ClusterChange::Add(node)
                    if node.enabled_services().contains(&QuickwitService::Indexer) =>
                {
                    let node_id = node.node_id().to_owned();
                    let generation_id = node.chitchat_id().generation_id;
                    let indexing_tasks = node.indexing_tasks().to_vec();
                    let client_mailbox = indexing_clients.get(&node_id).unwrap().clone();
                    let client = IndexingServiceClient::from_mailbox(client_mailbox);
                    let change = Change::Insert(
                        node_id.clone(),
                        IndexerNodeInfo {
                            node_id,
                            generation_id,
                            client,
                            indexing_tasks,
                            indexing_capacity: CpuCapacity::from_cpu_millis(4_000),
                        },
                    );
                    Some(change)
                }
                ClusterChange::Remove(node) => Some(Change::Remove(node.node_id().to_owned())),
                _ => None,
            }
        })
    })
}

async fn start_control_plane(
    cluster: Cluster,
    indexers: &[&Cluster],
    universe: &Universe,
) -> (Vec<Inbox<IndexingService>>, Mailbox<ControlPlane>) {
    let index_1 = "test-indexing-plan-1";
    let source_1 = "source-1";
    let index_2 = "test-indexing-plan-2";
    let source_2 = "source-2";
    let index_metadata_1 = index_metadata_for_test(index_1, source_1, 2);
    let mut index_metadata_2 = index_metadata_for_test(index_2, source_2, 1);
    index_metadata_2.create_timestamp = index_metadata_1.create_timestamp + 1;
    let mut mock_metastore = MockMetastoreService::new();
    mock_metastore.expect_list_indexes_metadata().returning(
        move |_list_indexes_request: quickwit_proto::metastore::ListIndexesMetadataRequest| {
            let indexes_metadata = vec![index_metadata_2.clone(), index_metadata_1.clone()];
            Ok(ListIndexesMetadataResponse::for_test(indexes_metadata))
        },
    );
    mock_metastore.expect_list_shards().returning(|_| {
        Ok(ListShardsResponse {
            subresponses: Vec::new(),
        })
    });
    let mut indexer_inboxes = Vec::new();

    let indexer_pool = Pool::default();
    let ingester_pool = Pool::default();
    let mut indexing_clients = FnvHashMap::default();

    for indexer in indexers {
        let (indexing_service_mailbox, indexing_service_inbox) = universe.create_test_mailbox();
        indexing_clients.insert(indexer.self_node_id().to_owned(), indexing_service_mailbox);
        indexer_inboxes.push(indexing_service_inbox);
    }
    let indexer_change_stream =
        test_indexer_change_stream(cluster.change_stream(), indexing_clients);
    indexer_pool.listen_for_changes(indexer_change_stream);

    let mut cluster_config = ClusterConfig::for_test();
    cluster_config.cluster_id = cluster.cluster_id().to_string();

    let self_node_id = cluster.self_node_id().to_owned();
    let (control_plane_mailbox, _control_plane_handle, _is_ready_rx) = ControlPlane::spawn(
        universe,
        cluster_config,
        self_node_id,
        cluster,
        indexer_pool,
        ingester_pool,
        MetastoreServiceClient::from_mock(mock_metastore),
    );

    (indexer_inboxes, control_plane_mailbox)
}

#[tokio::test]
async fn test_scheduler_scheduling_and_control_loop_apply_plan_again() {
    quickwit_common::setup_logging_for_tests();
    let transport = ChannelTransport::default();
    let cluster =
        create_cluster_for_test(Vec::new(), &["indexer", "control_plane"], &transport, true)
            .await
            .unwrap();
    cluster
        .wait_for_ready_members(|members| members.len() == 1, Duration::from_secs(5))
        .await
        .unwrap();
    let universe = Universe::with_accelerated_time();
    let (indexing_service_inboxes, control_plane_mailbox) =
        start_control_plane(cluster.clone(), &[&cluster.clone()], &universe).await;
    let indexing_service_inbox = indexing_service_inboxes[0].clone();
    let scheduler_state = control_plane_mailbox
        .ask(Observe)
        .await
        .unwrap()
        .indexing_scheduler;
    let indexing_service_inbox_messages =
        indexing_service_inbox.drain_for_test_typed::<ApplyIndexingPlanRequest>();
    assert_eq!(scheduler_state.num_applied_physical_indexing_plan, 1);
    assert_eq!(scheduler_state.num_schedule_indexing_plan, 1);
    assert!(scheduler_state.last_applied_physical_plan.is_some());
    assert_eq!(indexing_service_inbox_messages.len(), 1);

    // After a CONTROL_PLAN_LOOP_INTERVAL, the control loop will check if the desired plan is
    // running on the indexer. As chitchat state of the indexer is not updated (we did
    // not instantiate a indexing service for that), the control loop will apply again
    // the same plan.
    // Check first the plan is not updated before `MIN_DURATION_BETWEEN_SCHEDULING`.
    tokio::time::sleep(MIN_DURATION_BETWEEN_SCHEDULING.mul_f32(0.5)).await;
    let scheduler_state = control_plane_mailbox
        .ask(Observe)
        .await
        .unwrap()
        .indexing_scheduler;
    assert_eq!(scheduler_state.num_schedule_indexing_plan, 1);
    assert_eq!(scheduler_state.num_applied_physical_indexing_plan, 1);

    // After `MIN_DURATION_BETWEEN_SCHEDULING`, we should see a plan update.
    tokio::time::sleep(MIN_DURATION_BETWEEN_SCHEDULING.mul_f32(0.7)).await;
    let scheduler_state = control_plane_mailbox
        .ask(Observe)
        .await
        .unwrap()
        .indexing_scheduler;
    let indexing_service_inbox_messages =
        indexing_service_inbox.drain_for_test_typed::<ApplyIndexingPlanRequest>();
    assert_eq!(scheduler_state.num_schedule_indexing_plan, 1);
    assert_eq!(scheduler_state.num_applied_physical_indexing_plan, 2);
    assert_eq!(indexing_service_inbox_messages.len(), 1);
    let indexing_tasks = indexing_service_inbox_messages
        .first()
        .unwrap()
        .indexing_tasks
        .clone();

    // Update the indexer state and check that the indexer does not receive any new
    // `ApplyIndexingPlanRequest`.
    cluster
        .update_self_node_indexing_tasks(&indexing_tasks)
        .await;
    let scheduler_state = control_plane_mailbox
        .ask(Observe)
        .await
        .unwrap()
        .indexing_scheduler;
    assert_eq!(scheduler_state.num_applied_physical_indexing_plan, 2);
    let indexing_service_inbox_messages =
        indexing_service_inbox.drain_for_test_typed::<ApplyIndexingPlanRequest>();
    assert_eq!(indexing_service_inbox_messages.len(), 0);

    // Update the indexer state with a different plan and check that the indexer does now
    // receive a new `ApplyIndexingPlanRequest`.
    cluster
        .update_self_node_indexing_tasks(&[indexing_tasks[0].clone()])
        .await;
    tokio::time::sleep(MIN_DURATION_BETWEEN_SCHEDULING.mul_f32(1.2)).await;
    let scheduler_state = control_plane_mailbox
        .ask(Observe)
        .await
        .unwrap()
        .indexing_scheduler;
    assert_eq!(scheduler_state.num_applied_physical_indexing_plan, 3);
    let indexing_service_inbox_messages =
        indexing_service_inbox.drain_for_test_typed::<ApplyIndexingPlanRequest>();
    assert_eq!(indexing_service_inbox_messages.len(), 1);
    universe.assert_quit().await;
}

#[tokio::test]
async fn test_scheduler_scheduling_no_indexer() {
    let transport = ChannelTransport::default();
    let cluster = create_cluster_for_test(Vec::new(), &["control_plane"], &transport, true)
        .await
        .unwrap();
    let universe = Universe::with_accelerated_time();
    let (indexing_service_inboxes, control_plane_mailbox) =
        start_control_plane(cluster.clone(), &[], &universe).await;
    assert_eq!(indexing_service_inboxes.len(), 0);

    // No indexer.
    universe.sleep(CONTROL_PLAN_LOOP_INTERVAL).await;
    let scheduler_state = control_plane_mailbox
        .ask(Observe)
        .await
        .unwrap()
        .indexing_scheduler;
    assert_eq!(scheduler_state.num_applied_physical_indexing_plan, 0);
    assert_eq!(scheduler_state.num_schedule_indexing_plan, 0);
    assert!(scheduler_state.last_applied_physical_plan.is_none());

    // There is no indexer, we should observe no
    // scheduling.
    universe.sleep(Duration::from_secs(60)).await;
    let scheduler_state = control_plane_mailbox
        .ask(Observe)
        .await
        .unwrap()
        .indexing_scheduler;
    assert_eq!(scheduler_state.num_applied_physical_indexing_plan, 0);
    assert_eq!(scheduler_state.num_schedule_indexing_plan, 0);
    assert!(scheduler_state.last_applied_physical_plan.is_none());
    universe.assert_quit().await;
}

#[tokio::test]
async fn test_scheduler_scheduling_multiple_indexers() {
    let transport = ChannelTransport::default();
    let cluster = create_cluster_for_test(Vec::new(), &["control_plane"], &transport, true)
        .await
        .unwrap();
    let cluster_indexer_1 = create_cluster_for_test(
        vec![cluster.gossip_advertise_addr().to_string()],
        &["indexer"],
        &transport,
        true,
    )
    .await
    .unwrap();
    let cluster_indexer_2 = create_cluster_for_test(
        vec![cluster.gossip_advertise_addr().to_string()],
        &["indexer"],
        &transport,
        true,
    )
    .await
    .unwrap();
    let universe = Universe::new();
    let (indexing_service_inboxes, control_plane_mailbox) = start_control_plane(
        cluster.clone(),
        &[&cluster_indexer_1, &cluster_indexer_2],
        &universe,
    )
    .await;
    let indexing_service_inbox_1 = indexing_service_inboxes[0].clone();
    let indexing_service_inbox_2 = indexing_service_inboxes[1].clone();

    // No indexer.
    let scheduler_state = control_plane_mailbox
        .ask(Observe)
        .await
        .unwrap()
        .indexing_scheduler;
    let indexing_service_inbox_messages =
        indexing_service_inbox_1.drain_for_test_typed::<ApplyIndexingPlanRequest>();
    assert_eq!(scheduler_state.num_applied_physical_indexing_plan, 0);
    assert_eq!(scheduler_state.num_schedule_indexing_plan, 0);
    assert!(scheduler_state.last_applied_physical_plan.is_none());
    assert_eq!(indexing_service_inbox_messages.len(), 0);

    cluster
        .wait_for_ready_members(
            |members| {
                members
                    .iter()
                    .any(|member| member.enabled_services.contains(&QuickwitService::Indexer))
            },
            Duration::from_secs(5),
        )
        .await
        .unwrap();

    // Wait for chitchat update, sheduler will detect new indexers and schedule a plan.
    wait_until_predicate(
        || {
            let control_plane_mailbox_clone = control_plane_mailbox.clone();
            async move {
                let scheduler_state = control_plane_mailbox_clone
                    .ask(Observe)
                    .await
                    .unwrap()
                    .indexing_scheduler;
                scheduler_state.num_schedule_indexing_plan == 1
            }
        },
        CONTROL_PLAN_LOOP_INTERVAL * 4,
        Duration::from_millis(100),
    )
    .await
    .unwrap();
    let scheduler_state = control_plane_mailbox
        .ask(Observe)
        .await
        .unwrap()
        .indexing_scheduler;
    assert_eq!(scheduler_state.num_applied_physical_indexing_plan, 1);
    let indexing_service_inbox_messages_1 =
        indexing_service_inbox_1.drain_for_test_typed::<ApplyIndexingPlanRequest>();
    let indexing_service_inbox_messages_2 =
        indexing_service_inbox_2.drain_for_test_typed::<ApplyIndexingPlanRequest>();
    assert_eq!(indexing_service_inbox_messages_1.len(), 1);
    assert_eq!(indexing_service_inbox_messages_2.len(), 1);
    cluster_indexer_1
        .update_self_node_indexing_tasks(&indexing_service_inbox_messages_1[0].indexing_tasks)
        .await;
    cluster_indexer_2
        .update_self_node_indexing_tasks(&indexing_service_inbox_messages_2[0].indexing_tasks)
        .await;

    // Wait 2 CONTROL_PLAN_LOOP_INTERVAL again and check the scheduler will not apply the plan
    // several times.
    universe.sleep(CONTROL_PLAN_LOOP_INTERVAL * 2).await;
    let scheduler_state = control_plane_mailbox
        .ask(Observe)
        .await
        .unwrap()
        .indexing_scheduler;
    assert_eq!(scheduler_state.num_schedule_indexing_plan, 1);

    // Shutdown cluster and wait until the new scheduling.
    cluster_indexer_2.leave().await;

    cluster
        .wait_for_ready_members(
            |members| {
                members
                    .iter()
                    .filter(|member| member.enabled_services.contains(&QuickwitService::Indexer))
                    .count()
                    == 1
            },
            Duration::from_secs(5),
        )
        .await
        .unwrap();

    wait_until_predicate(
        || {
            let scheduler_handler_mailbox_clone = control_plane_mailbox.clone();
            async move {
                let scheduler_state = scheduler_handler_mailbox_clone
                    .ask(Observe)
                    .await
                    .unwrap()
                    .indexing_scheduler;
                scheduler_state.num_schedule_indexing_plan == 2
            }
        },
        CONTROL_PLAN_LOOP_INTERVAL * 10,
        Duration::from_millis(100),
    )
    .await
    .unwrap();

    universe.assert_quit().await;
}


================================================
FILE: quickwit/quickwit-datetime/Cargo.toml
================================================
[package]
name = "quickwit-datetime"
description = "Date and datetime utilities for Quickwit"

version.workspace = true
edition.workspace = true
homepage.workspace = true
documentation.workspace = true
repository.workspace = true
authors.workspace = true
license.workspace = true

[dependencies]
itertools = { workspace = true }
serde = { workspace = true }
serde_json = { workspace = true }
tantivy = { workspace = true }
time = { workspace = true }
time-fmt = "0.3.8"


================================================
FILE: quickwit/quickwit-datetime/README.md
================================================
Why a datetime crate? Why is it no in quickwit-common or where it is consumed?

- We don't want to add a dependency to tantivy in quickwit-common
- We need this date logic both in quickwit-query and in quickwit-docmapper


================================================
FILE: quickwit/quickwit-datetime/src/date_time_format.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::fmt::Display;
use std::str::FromStr;

use serde::de::Error;
use serde::{Deserialize, Deserializer, Serialize};
use serde_json::Value as JsonValue;
use time::Month;
use time::format_description::well_known::{Iso8601, Rfc2822, Rfc3339};

use crate::java_date_time_format::is_strftime_formatting;
use crate::{StrptimeParser, TantivyDateTime};

/// Specifies the datetime and unix timestamp formats to use when parsing date strings.
#[derive(Clone, Debug, Eq, PartialEq, Hash, Default)]
pub enum DateTimeInputFormat {
    Iso8601,
    Rfc2822,
    #[default]
    Rfc3339,
    Strptime(StrptimeParser),
    Timestamp,
}

impl DateTimeInputFormat {
    pub fn as_str(&self) -> &str {
        match self {
            DateTimeInputFormat::Iso8601 => "iso8601",
            DateTimeInputFormat::Rfc2822 => "rfc2822",
            DateTimeInputFormat::Rfc3339 => "rfc3339",
            DateTimeInputFormat::Strptime(parser) => parser.strptime_format.as_str(),
            DateTimeInputFormat::Timestamp => "unix_timestamp",
        }
    }
}

impl Display for DateTimeInputFormat {
    fn fmt(&self, formatter: &mut std::fmt::Formatter) -> std::fmt::Result {
        formatter.write_str(self.as_str())
    }
}

impl FromStr for DateTimeInputFormat {
    type Err = String;

    fn from_str(date_time_format_str: &str) -> Result<Self, Self::Err> {
        let date_time_format = match date_time_format_str.to_lowercase().as_str() {
            "iso8601" => DateTimeInputFormat::Iso8601,
            "rfc2822" => DateTimeInputFormat::Rfc2822,
            "rfc3339" => DateTimeInputFormat::Rfc3339,
            "unix_timestamp" => DateTimeInputFormat::Timestamp,
            _ => {
                if !is_strftime_formatting(date_time_format_str) {
                    return Err(format!(
                        "unknown input format: `{date_time_format_str}`. a custom date time \
                         format must contain at least one `strftime` special characters"
                    ));
                }
                DateTimeInputFormat::Strptime(StrptimeParser::from_strptime(date_time_format_str)?)
            }
        };
        Ok(date_time_format)
    }
}

impl Serialize for DateTimeInputFormat {
    fn serialize<S>(&self, serializer: S) -> Result<S::Ok, S::Error>
    where S: serde::Serializer {
        serializer.serialize_str(self.as_str())
    }
}

impl<'de> Deserialize<'de> for DateTimeInputFormat {
    fn deserialize<D>(deserializer: D) -> Result<Self, D::Error>
    where D: Deserializer<'de> {
        let date_time_format_str: String = Deserialize::deserialize(deserializer)?;
        let date_time_format = date_time_format_str.parse().map_err(D::Error::custom)?;
        Ok(date_time_format)
    }
}

/// Specifies the datetime format to use when displaying datetime values.
#[derive(Clone, Debug, Eq, PartialEq, Hash, Default)]
pub enum DateTimeOutputFormat {
    Iso8601,
    Rfc2822,
    #[default]
    Rfc3339,
    Strptime(StrptimeParser),
    TimestampSecs,
    TimestampMillis,
    TimestampMicros,
    TimestampNanos,
}

impl DateTimeOutputFormat {
    pub fn as_str(&self) -> &str {
        match self {
            DateTimeOutputFormat::Iso8601 => "iso8601",
            DateTimeOutputFormat::Rfc2822 => "rfc2822",
            DateTimeOutputFormat::Rfc3339 => "rfc3339",
            DateTimeOutputFormat::Strptime(parser) => parser.strptime_format.as_str(),
            DateTimeOutputFormat::TimestampSecs => "unix_timestamp_secs",
            DateTimeOutputFormat::TimestampMillis => "unix_timestamp_millis",
            DateTimeOutputFormat::TimestampMicros => "unix_timestamp_micros",
            DateTimeOutputFormat::TimestampNanos => "unix_timestamp_nanos",
        }
    }

    pub fn format_to_json(&self, date_time: TantivyDateTime) -> Result<JsonValue, String> {
        let date = date_time.into_utc();
        let format_result = match &self {
            DateTimeOutputFormat::Rfc3339 => date.format(&Rfc3339).map(JsonValue::String),
            DateTimeOutputFormat::Iso8601 => date.format(&Iso8601::DEFAULT).map(JsonValue::String),
            DateTimeOutputFormat::Rfc2822 => date.format(&Rfc2822).map(JsonValue::String),
            DateTimeOutputFormat::Strptime(strftime_parser) => strftime_parser
                .format_date_time(&date)
                .map(JsonValue::String),
            DateTimeOutputFormat::TimestampSecs => {
                Ok(JsonValue::Number(date_time.into_timestamp_secs().into()))
            }
            DateTimeOutputFormat::TimestampMillis => {
                Ok(JsonValue::Number(date_time.into_timestamp_millis().into()))
            }
            DateTimeOutputFormat::TimestampMicros => {
                Ok(JsonValue::Number(date_time.into_timestamp_micros().into()))
            }
            DateTimeOutputFormat::TimestampNanos => {
                Ok(JsonValue::Number(date_time.into_timestamp_nanos().into()))
            }
        };
        format_result.map_err(|error| error.to_string())
    }
}

impl Display for DateTimeOutputFormat {
    fn fmt(&self, formatter: &mut std::fmt::Formatter) -> std::fmt::Result {
        formatter.write_str(self.as_str())
    }
}

impl FromStr for DateTimeOutputFormat {
    type Err = String;

    fn from_str(date_time_format_str: &str) -> Result<Self, Self::Err> {
        let date_time_format = match date_time_format_str.to_lowercase().as_str() {
            "iso8601" => DateTimeOutputFormat::Iso8601,
            "rfc2822" => DateTimeOutputFormat::Rfc2822,
            "rfc3339" => DateTimeOutputFormat::Rfc3339,
            "unix_timestamp_secs" => DateTimeOutputFormat::TimestampSecs,
            "unix_timestamp_millis" => DateTimeOutputFormat::TimestampMillis,
            "unix_timestamp_micros" => DateTimeOutputFormat::TimestampMicros,
            "unix_timestamp_nanos" => DateTimeOutputFormat::TimestampNanos,
            _ => {
                if !is_strftime_formatting(date_time_format_str) {
                    return Err(format!(
                        "unknown output format: `{date_time_format_str}`. a custom date time \
                         format must contain at least one `strftime` special characters"
                    ));
                }
                DateTimeOutputFormat::Strptime(StrptimeParser::from_strptime(date_time_format_str)?)
            }
        };
        Ok(date_time_format)
    }
}

impl Serialize for DateTimeOutputFormat {
    fn serialize<S>(&self, serializer: S) -> Result<S::Ok, S::Error>
    where S: serde::Serializer {
        serializer.serialize_str(self.as_str())
    }
}

impl<'de> Deserialize<'de> for DateTimeOutputFormat {
    fn deserialize<D>(deserializer: D) -> Result<Self, D::Error>
    where D: Deserializer<'de> {
        let date_time_format_str: String = Deserialize::deserialize(deserializer)?;
        let date_time_format = date_time_format_str.parse().map_err(D::Error::custom)?;
        Ok(date_time_format)
    }
}

/// Infers the year of a parsed date time. It assumes that events appear more often delayed than in
/// the future and, as a result, skews towards the past year.
pub(super) fn infer_year(
    parsed_month_opt: Option<Month>,
    this_month: Month,
    this_year: i32,
) -> i32 {
    let Some(parsed_month) = parsed_month_opt else {
        return this_year;
    };
    if parsed_month as u8 > this_month as u8 + 3 {
        return this_year - 1;
    }
    this_year
}

#[cfg(test)]
mod tests {
    use time::Month;

    use super::*;

    #[test]
    fn test_date_time_input_format_ser() {
        let date_time_formats_json = serde_json::to_value(&[
            DateTimeInputFormat::Iso8601,
            DateTimeInputFormat::Rfc2822,
            DateTimeInputFormat::Rfc3339,
            DateTimeInputFormat::Timestamp,
        ])
        .unwrap();

        let expected_date_time_formats =
            serde_json::json!(["iso8601", "rfc2822", "rfc3339", "unix_timestamp",]);
        assert_eq!(date_time_formats_json, expected_date_time_formats);
    }

    #[test]
    fn test_date_time_input_format_deser() {
        let date_time_formats_json = r#"
            [
                "iso8601",
                "rfc2822",
                "rfc3339",
                "unix_timestamp"
            ]
            "#;
        let date_time_formats: Vec<DateTimeInputFormat> =
            serde_json::from_str(date_time_formats_json).unwrap();
        let expected_date_time_formats = [
            DateTimeInputFormat::Iso8601,
            DateTimeInputFormat::Rfc2822,
            DateTimeInputFormat::Rfc3339,
            DateTimeInputFormat::Timestamp,
        ];
        assert_eq!(date_time_formats, &expected_date_time_formats);
    }

    #[test]
    fn test_date_time_output_format_ser() {
        let date_time_formats_json = serde_json::to_value(&[
            DateTimeOutputFormat::Iso8601,
            DateTimeOutputFormat::Rfc2822,
            DateTimeOutputFormat::Rfc3339,
            DateTimeOutputFormat::TimestampSecs,
            DateTimeOutputFormat::TimestampMillis,
            DateTimeOutputFormat::TimestampMicros,
            DateTimeOutputFormat::TimestampNanos,
        ])
        .unwrap();

        let expected_date_time_formats = serde_json::json!([
            "iso8601",
            "rfc2822",
            "rfc3339",
            "unix_timestamp_secs",
            "unix_timestamp_millis",
            "unix_timestamp_micros",
            "unix_timestamp_nanos",
        ]);
        assert_eq!(date_time_formats_json, expected_date_time_formats);
    }

    #[test]
    fn test_date_time_output_format_deser() {
        let date_time_formats_json = r#"
            [
                "iso8601",
                "rfc2822",
                "rfc3339",
                "unix_timestamp_secs",
                "unix_timestamp_millis",
                "unix_timestamp_micros",
                "unix_timestamp_nanos"
            ]
            "#;
        let date_time_formats: Vec<DateTimeOutputFormat> =
            serde_json::from_str(date_time_formats_json).unwrap();
        let expected_date_time_formats = [
            DateTimeOutputFormat::Iso8601,
            DateTimeOutputFormat::Rfc2822,
            DateTimeOutputFormat::Rfc3339,
            DateTimeOutputFormat::TimestampSecs,
            DateTimeOutputFormat::TimestampMillis,
            DateTimeOutputFormat::TimestampMicros,
            DateTimeOutputFormat::TimestampNanos,
        ];
        assert_eq!(date_time_formats, &expected_date_time_formats);
    }

    #[test]
    fn test_fail_date_time_input_format_from_str_with_unknown_format() {
        let formats = vec![
            "test%",
            "test-%v",
            "test-%q",
            "unix_timestamp_secs",
            "unix_timestamp_seconds",
        ];
        for format in formats {
            let error_str = DateTimeInputFormat::from_str(format)
                .unwrap_err()
                .to_string();
            assert!(error_str.contains(&format!("unknown input format: `{format}`")));
        }
    }

    #[test]
    fn test_fail_date_time_output_format_from_str_with_unknown_format() {
        let formats = vec!["test%", "test-%v", "test-%q", "unix_timestamp_seconds"];
        for format in formats {
            let error_str = DateTimeOutputFormat::from_str(format)
                .unwrap_err()
                .to_string();
            assert!(error_str.contains(&format!("unknown output format: `{format}`")));
        }
    }

    #[test]
    fn test_infer_year() {
        let inferred_year = infer_year(None, Month::January, 2024);
        assert_eq!(inferred_year, 2024);

        let inferred_year = infer_year(Some(Month::December), Month::January, 2024);
        assert_eq!(inferred_year, 2023);

        let inferred_year = infer_year(Some(Month::January), Month::January, 2024);
        assert_eq!(inferred_year, 2024);

        let inferred_year = infer_year(Some(Month::February), Month::January, 2024);
        assert_eq!(inferred_year, 2024);

        let inferred_year = infer_year(Some(Month::March), Month::January, 2024);
        assert_eq!(inferred_year, 2024);

        let inferred_year = infer_year(Some(Month::April), Month::January, 2024);
        assert_eq!(inferred_year, 2024);

        let inferred_year = infer_year(Some(Month::May), Month::January, 2024);
        assert_eq!(inferred_year, 2023);
    }
}


================================================
FILE: quickwit/quickwit-datetime/src/date_time_parsing.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::time::Duration;

use itertools::Itertools;
use time::OffsetDateTime;
use time::format_description::well_known::{Iso8601, Rfc2822, Rfc3339};

use super::date_time_format::DateTimeInputFormat;
use crate::TantivyDateTime;

// Minimum supported timestamp value in seconds (13 Apr 1972 23:59:55 GMT).
const MIN_TIMESTAMP_SECONDS: i64 = 72_057_595;

// Maximum supported timestamp value in seconds (16 Mar 2242 12:56:31 GMT).
const MAX_TIMESTAMP_SECONDS: i64 = 8_589_934_591;

pub fn parse_date_time_str(
    date_time_str: &str,
    date_time_formats: &[DateTimeInputFormat],
) -> Result<TantivyDateTime, String> {
    let trimmed_date_time_str = date_time_str.trim_ascii();

    for date_time_format in date_time_formats {
        let date_time_opt = match date_time_format {
            DateTimeInputFormat::Iso8601 => parse_iso8601(trimmed_date_time_str)
                .map(TantivyDateTime::from_utc)
                .ok(),
            DateTimeInputFormat::Rfc2822 => parse_rfc2822(trimmed_date_time_str)
                .map(TantivyDateTime::from_utc)
                .ok(),
            DateTimeInputFormat::Rfc3339 => parse_rfc3339(trimmed_date_time_str)
                .map(TantivyDateTime::from_utc)
                .ok(),
            DateTimeInputFormat::Strptime(parser) => parser
                .parse_date_time(trimmed_date_time_str)
                .map(TantivyDateTime::from_utc)
                .ok(),
            DateTimeInputFormat::Timestamp => parse_timestamp_str(trimmed_date_time_str),
        };
        if let Some(date_time) = date_time_opt {
            return Ok(date_time);
        }
    }
    Err(format!(
        "failed to parse datetime `{date_time_str}` using the following formats: `{}`",
        date_time_formats
            .iter()
            .map(|date_time_format| date_time_format.as_str())
            .join("`, `")
    ))
}

pub fn parse_timestamp_float(
    timestamp: f64,
    date_time_formats: &[DateTimeInputFormat],
) -> Result<TantivyDateTime, String> {
    if !date_time_formats.contains(&DateTimeInputFormat::Timestamp) {
        return Err(format!(
            "failed to parse datetime `{timestamp}` using the following formats: `{}`",
            date_time_formats
                .iter()
                .map(|date_time_format| date_time_format.as_str())
                .join("`, `")
        ));
    }
    let duration_since_epoch = Duration::try_from_secs_f64(timestamp)
        .map_err(|error| format!("failed to parse datetime `{timestamp}`: {error}"))?;
    let timestamp_nanos = duration_since_epoch.as_nanos() as i64;
    Ok(TantivyDateTime::from_timestamp_nanos(timestamp_nanos))
}

pub fn parse_timestamp_int(
    timestamp: i64,
    date_time_formats: &[DateTimeInputFormat],
) -> Result<TantivyDateTime, String> {
    if !date_time_formats.contains(&DateTimeInputFormat::Timestamp) {
        return Err(format!(
            "failed to parse datetime `{timestamp}` using the following formats: `{}`",
            date_time_formats
                .iter()
                .map(|date_time_format| date_time_format.as_str())
                .join("`, `")
        ));
    }
    parse_timestamp(timestamp)
}

pub fn parse_timestamp_str(timestamp_str: &str) -> Option<TantivyDateTime> {
    if let Ok(timestamp) = timestamp_str.parse::<i64>() {
        return parse_timestamp(timestamp).ok();
    }
    if let Some((timestamp_secs_str, subsecond_digits_str)) = timestamp_str.split_once('.') {
        if subsecond_digits_str.is_empty() {
            return parse_timestamp_str(timestamp_secs_str);
        }
        if let Ok(timestamp_secs @ MIN_TIMESTAMP_SECONDS..=MAX_TIMESTAMP_SECONDS) =
            timestamp_secs_str.parse::<i64>()
        {
            let num_subsecond_digits = subsecond_digits_str.len().min(9);

            if let Ok(subsecond_digits) =
                subsecond_digits_str[..num_subsecond_digits].parse::<i64>()
            {
                let nanos = subsecond_digits * 10i64.pow(9 - num_subsecond_digits as u32);
                let timestamp_nanos = timestamp_secs * 1_000_000_000 + nanos;
                return Some(TantivyDateTime::from_timestamp_nanos(timestamp_nanos));
            }
        }
    }
    None
}

/// Parses a ISO8601 date.
fn parse_iso8601(value: &str) -> Result<OffsetDateTime, String> {
    OffsetDateTime::parse(value, &Iso8601::DEFAULT).map_err(|error| error.to_string())
}

/// Parses a RFC2822 date.
fn parse_rfc2822(value: &str) -> Result<OffsetDateTime, String> {
    OffsetDateTime::parse(value, &Rfc2822).map_err(|error| error.to_string())
}

/// Parses a RFC3339 date.
fn parse_rfc3339(value: &str) -> Result<OffsetDateTime, String> {
    OffsetDateTime::parse(value, &Rfc3339).map_err(|error| error.to_string())
}

/// Returns the appropriate [`TantivyDateTime`] for the specified Unix timestamp.
///
/// This function will choose the timestamp precision based on the value range.
/// The tradeoff is that we can only support dates ranging:
/// - from `13 Apr 1972 23:59:55`: smallest value that can be converted to all precisions.
/// - to: `16 Mar 2242 12:56:31`: greatest value that can be converted to all precisions.
pub fn parse_timestamp(timestamp: i64) -> Result<TantivyDateTime, String> {
    const MIN_TIMESTAMP_MILLIS: i64 = MIN_TIMESTAMP_SECONDS * 1000;
    const MAX_TIMESTAMP_MILLIS: i64 = MAX_TIMESTAMP_SECONDS * 1000;

    const MIN_TIMESTAMP_MICROS: i64 = MIN_TIMESTAMP_SECONDS * 1_000_000;
    const MAX_TIMESTAMP_MICROS: i64 = MAX_TIMESTAMP_SECONDS * 1_000_000;

    const MIN_TIMESTAMP_NANOS: i64 = MIN_TIMESTAMP_SECONDS * 1_000_000_000;
    const MAX_TIMESTAMP_NANOS: i64 = MAX_TIMESTAMP_SECONDS * 1_000_000_000;

    match timestamp {
        MIN_TIMESTAMP_SECONDS..=MAX_TIMESTAMP_SECONDS => {
            Ok(TantivyDateTime::from_timestamp_secs(timestamp))
        }
        MIN_TIMESTAMP_MILLIS..=MAX_TIMESTAMP_MILLIS => {
            Ok(TantivyDateTime::from_timestamp_millis(timestamp))
        }
        MIN_TIMESTAMP_MICROS..=MAX_TIMESTAMP_MICROS => {
            Ok(TantivyDateTime::from_timestamp_micros(timestamp))
        }
        MIN_TIMESTAMP_NANOS..=MAX_TIMESTAMP_NANOS => {
            Ok(TantivyDateTime::from_timestamp_nanos(timestamp))
        }
        _ => Err(format!(
            "failed to parse unix timestamp `{timestamp}`. Quickwit only support timestamp values \
             ranging from `13 Apr 1972 23:59:55` to `16 Mar 2242 12:56:31`"
        )),
    }
}

#[cfg(test)]
mod tests {
    use time::Month;
    use time::macros::datetime;

    use super::*;
    use crate::StrptimeParser;
    use crate::date_time_format::infer_year;

    #[test]
    fn test_parse_iso8601() {
        let date_time = parse_iso8601("20120521T120914Z").unwrap();
        assert_eq!(date_time, datetime!(2012-05-21 12:09:14 UTC));
    }

    #[test]
    fn test_parse_rfc2822() {
        let date_time = parse_rfc2822("Mon, 21 May 2012 12:09:14 GMT").unwrap();
        assert_eq!(date_time, datetime!(2012-05-21 12:09:14 UTC));
    }

    #[test]
    fn test_parse_rfc3339() {
        let date_time = parse_rfc3339("2012-05-21T12:09:14-00:00").unwrap();
        assert_eq!(date_time, datetime!(2012-05-21 12:09:14 UTC));
    }

    #[test]
    fn test_parse_strptime() {
        let test_data = vec![
            (
                " %Y-%m-%d %H:%M:%S ",
                "2012-05-21 12:09:14",
                datetime!(2012-05-21 12:09:14 UTC),
            ),
            (
                "%Y-%m-%d %H:%M:%S %z",
                " 2012-05-21 12:09:14 +0000 ",
                datetime!(2012-05-21 12:09:14 UTC),
            ),
            (
                "%Y-%m-%d %H:%M:%S %z",
                "2012-05-21 12:09:14 +0200",
                datetime!(2012-05-21 10:09:14 UTC),
            ),
            (
                "%Y-%m-%d %H:%M:%S %z",
                "2012-05-21 12:09:14 -0300",
                datetime!(2012-05-21 15:09:14 UTC),
            ),
            (
                "%Y-%m-%d %H:%M:%S %z",
                "2012-05-21 12:09:14 -03:00",
                datetime!(2012-05-21 15:09:14 UTC),
            ),
            (
                "%Y-%m-%d %H:%M:%S.%f",
                "2024-01-31 18:40:19.950",
                datetime!(2024-01-31 18:40:19.950000000 UTC),
            ),
            (
                "%Y-%m-%d %H:%M:%S.%f",
                "2024-01-31 18:40:19.950188",
                datetime!(2024-01-31 18:40:19.950188000 UTC),
            ),
            (
                "%Y-%m-%d %H:%M:%S.%f",
                "2024-01-31 18:40:19.950188123",
                datetime!(2024-01-31 18:40:19.950188123 UTC),
            ),
            ("%b %d %H:%M:%S", "Mar  6 17:40:02", {
                let dt = datetime!(1900-03-06 17:40:02 UTC);
                let now = OffsetDateTime::now_utc();
                let year = infer_year(Some(Month::March), now.month(), now.year());
                dt.replace_year(year).unwrap()
            }),
            (
                "%Y-%m-%dT%H:%M:%S.%f%z",
                "2024-03-21T03:45:02.561820768-0400",
                datetime!(2024-03-21 03:45:02.561820768 -04:00),
            ),
        ];
        for (fmt, date_time_str, expected) in test_data {
            let parser = DateTimeInputFormat::Strptime(StrptimeParser::from_strptime(fmt).unwrap());
            let result = parse_date_time_str(date_time_str, &[parser]);
            if let Err(error) = &result {
                panic!(
                    "failed to parse `{date_time_str}` using the following strptime format \
                     `{fmt}`: {error}"
                )
            }
            assert_eq!(result.unwrap(), TantivyDateTime::from_utc(expected));
        }
    }

    #[test]
    fn test_parse_date_without_time() {
        let strptime_parser = StrptimeParser::from_strptime("%Y-%m-%d").unwrap();
        let date = strptime_parser.parse_date_time("2012-05-21").unwrap();
        assert_eq!(date, datetime!(2012-05-21 00:00:00 UTC));
    }

    #[test]
    fn test_parse_date_am_pm_hour_not_zeroed() {
        let strptime_parser = StrptimeParser::from_strptime("%Y-%m-%d %I:%M:%S %p").unwrap();
        let date = strptime_parser
            .parse_date_time("2012-05-21 10:05:12 pm")
            .unwrap();
        assert_eq!(date, datetime!(2012-05-21 22:05:12 UTC));
    }

    #[test]
    fn test_parse_date_time_str() {
        for date_time_str in [
            "20120521T120914Z ",
            " Mon, 21 May 2012 12:09:14 GMT",
            " 2012-05-21T12:09:14-00:00 ",
            "2012-05-21 12:09:14",
            " 2012/05/21 12:09:14",
            "2012/05/21 12:09:14 +00:00",
            "1337602154 ",
            " 1337602154.0 ",
        ] {
            let date_time = parse_date_time_str(
                date_time_str,
                &[
                    DateTimeInputFormat::Iso8601,
                    DateTimeInputFormat::Rfc2822,
                    DateTimeInputFormat::Rfc3339,
                    DateTimeInputFormat::Strptime(
                        StrptimeParser::from_strptime("%Y-%m-%d %H:%M:%S").unwrap(),
                    ),
                    DateTimeInputFormat::Strptime(
                        StrptimeParser::from_strptime("%Y/%m/%d %H:%M:%S").unwrap(),
                    ),
                    DateTimeInputFormat::Strptime(
                        StrptimeParser::from_strptime("%Y/%m/%d %H:%M:%S %z").unwrap(),
                    ),
                    DateTimeInputFormat::Timestamp,
                ],
            )
            .unwrap();
            assert_eq!(
                date_time.into_timestamp_secs(),
                datetime!(2012-05-21 12:09:14 UTC).unix_timestamp()
            );
        }
        let error = parse_date_time_str(
            "foo",
            &[DateTimeInputFormat::Iso8601, DateTimeInputFormat::Rfc2822],
        )
        .unwrap_err();
        assert_eq!(
            error,
            "failed to parse datetime `foo` using the following formats: `iso8601`, `rfc2822`"
        );
    }

    #[test]
    fn test_parse_timestamp_float() {
        let unix_ts_secs = OffsetDateTime::now_utc().unix_timestamp();
        {
            let date_time = parse_timestamp_float(
                unix_ts_secs as f64,
                &[DateTimeInputFormat::Iso8601, DateTimeInputFormat::Timestamp],
            )
            .unwrap();
            assert_eq!(date_time.into_timestamp_millis(), unix_ts_secs * 1_000);
        }
        {
            let date_time = parse_timestamp_float(
                unix_ts_secs as f64 + 0.1230,
                &[DateTimeInputFormat::Iso8601, DateTimeInputFormat::Timestamp],
            )
            .unwrap();
            assert!((date_time.into_timestamp_millis() - (unix_ts_secs * 1_000 + 123)).abs() <= 1);
        }
        {
            let date_time = parse_timestamp_float(
                unix_ts_secs as f64 + 0.1234560,
                &[DateTimeInputFormat::Iso8601, DateTimeInputFormat::Timestamp],
            )
            .unwrap();
            assert!(
                (date_time.into_timestamp_micros() - (unix_ts_secs * 1_000_000 + 123_456)).abs()
                    <= 1
            );
        }
        {
            let date_time = parse_timestamp_float(
                unix_ts_secs as f64 + 0.123456789,
                &[DateTimeInputFormat::Iso8601, DateTimeInputFormat::Timestamp],
            )
            .unwrap();
            assert!(
                (date_time.into_timestamp_nanos() - (unix_ts_secs * 1_000_000_000 + 123_456_789))
                    .abs()
                    <= 100
            );
        }
        {
            let error = parse_timestamp_float(
                1668730394917.01,
                &[DateTimeInputFormat::Iso8601, DateTimeInputFormat::Rfc2822],
            )
            .unwrap_err();
            assert_eq!(
                error,
                "failed to parse datetime `1668730394917.01` using the following formats: \
                 `iso8601`, `rfc2822`"
            );
        }
    }

    #[test]
    fn test_parse_timestamp_int() {
        {
            let unix_ts_secs = OffsetDateTime::now_utc().unix_timestamp();
            let date_time = parse_timestamp_int(
                unix_ts_secs,
                &[DateTimeInputFormat::Iso8601, DateTimeInputFormat::Timestamp],
            )
            .unwrap();
            assert_eq!(date_time.into_timestamp_secs(), unix_ts_secs);
        }
        {
            let error = parse_timestamp_int(
                1668730394917,
                &[DateTimeInputFormat::Iso8601, DateTimeInputFormat::Rfc2822],
            )
            .unwrap_err();
            assert_eq!(
                error,
                "failed to parse datetime `1668730394917` using the following formats: `iso8601`, \
                 `rfc2822`"
            );
        }
    }

    #[test]
    fn test_parse_timestamp_str() {
        let date_time = parse_timestamp_str("123456789").unwrap();
        assert_eq!(date_time.into_timestamp_secs(), 123456789);

        let date_time = parse_timestamp_str("123456789.").unwrap();
        assert_eq!(date_time.into_timestamp_secs(), 123456789);

        let date_time = parse_timestamp_str("123456789.0").unwrap();
        assert_eq!(date_time.into_timestamp_secs(), 123456789);

        let date_time = parse_timestamp_str("123456789.1").unwrap();
        assert_eq!(date_time.into_timestamp_millis(), 123456789100);

        let date_time = parse_timestamp_str("123456789.100000001").unwrap();
        assert_eq!(date_time.into_timestamp_nanos(), 123456789100000001);

        let date_time = parse_timestamp_str("123456789.1000000011").unwrap();
        assert_eq!(date_time.into_timestamp_nanos(), 123456789100000001);
    }

    #[test]
    fn test_parse_date_time_millis() {
        for date_time_str in [
            "20120521T120914.12Z",
            "2012-05-21T12:09:14.12-00:00",
            "2012-05-21 12:09:14.120",
        ] {
            let date_time = parse_date_time_str(
                date_time_str,
                &[
                    DateTimeInputFormat::Iso8601,
                    DateTimeInputFormat::Rfc3339,
                    DateTimeInputFormat::Strptime(
                        StrptimeParser::from_strptime("%Y-%m-%d %H:%M:%S.%f").unwrap(),
                    ),
                ],
            )
            .unwrap();
            assert_eq!(
                date_time.into_timestamp_micros() as i128,
                datetime!(2012-05-21 12:09:14.12 UTC).unix_timestamp_nanos() / 1_000
            );
        }
    }

    #[test]
    fn test_parse_timestamp() {
        let now = OffsetDateTime::now_utc();
        {
            let unix_ts_secs = now.unix_timestamp();
            let date_time = parse_timestamp(unix_ts_secs).unwrap();
            assert_eq!(date_time.into_timestamp_secs(), unix_ts_secs);
        }
        {
            let unix_ts_millis = (now.unix_timestamp_nanos() / 1_000_000) as i64;
            let date_time = parse_timestamp(unix_ts_millis).unwrap();
            assert_eq!(date_time.into_timestamp_millis(), unix_ts_millis);
        }
        {
            let unix_ts_micros = (now.unix_timestamp_nanos() / 1_000) as i64;
            let date_time = parse_timestamp(unix_ts_micros).unwrap();
            assert_eq!(date_time.into_timestamp_micros(), unix_ts_micros);
        }
        {
            let unix_ts_nanos = now.unix_timestamp_nanos() as i64;
            let date_time = parse_timestamp(unix_ts_nanos).unwrap();
            assert_eq!(date_time.into_timestamp_nanos(), unix_ts_nanos);
        }
        {
            let min_supported_date =
                OffsetDateTime::parse("1972-04-13T23:59:55.00Z", &Rfc3339).unwrap();
            let parsed_date_time = parse_timestamp(min_supported_date.unix_timestamp()).unwrap();
            assert_eq!(
                parsed_date_time.into_timestamp_secs(),
                min_supported_date.unix_timestamp()
            );
            assert_eq!(
                parsed_date_time.into_timestamp_micros(),
                min_supported_date.unix_timestamp_nanos() as i64 / 1_000
            );
        }
        {
            let max_supported_date =
                OffsetDateTime::parse("2242-03-16T12:56:31.00Z", &Rfc3339).unwrap();
            let parsed_date_time = parse_timestamp(max_supported_date.unix_timestamp()).unwrap();
            assert_eq!(
                parsed_date_time.into_timestamp_secs(),
                max_supported_date.unix_timestamp()
            );
            assert_eq!(
                parsed_date_time.into_timestamp_micros(),
                max_supported_date.unix_timestamp_nanos() as i64 / 1_000
            );
        }
        {
            let less_than_supported_date = MIN_TIMESTAMP_SECONDS - 1;
            let parse_err = parse_timestamp(less_than_supported_date).unwrap_err();
            assert!(parse_err.contains("failed to parse unix timestamp"));
        }
        {
            let greater_than_supported_date = MAX_TIMESTAMP_SECONDS + 1;
            let parse_err = parse_timestamp(greater_than_supported_date).unwrap_err();
            assert!(parse_err.contains("failed to parse unix timestamp"));
        }
        {
            let unix_epoch = 0;
            let parse_err = parse_timestamp(unix_epoch).unwrap_err();
            assert!(parse_err.contains("failed to parse unix timestamp"));

            let parse_err = parse_timestamp(MIN_TIMESTAMP_SECONDS << 7).unwrap_err();
            assert!(parse_err.contains("failed to parse unix timestamp"));

            let parse_err = parse_timestamp(MIN_TIMESTAMP_SECONDS << 17).unwrap_err();
            assert!(parse_err.contains("failed to parse unix timestamp"));

            let parse_err = parse_timestamp(MIN_TIMESTAMP_SECONDS << 27).unwrap_err();
            assert!(parse_err.contains("failed to parse unix timestamp"));
        }
    }

    #[test]
    fn test_parse_timestamp_min_max_values() {
        {
            let min_ts_millis = MIN_TIMESTAMP_SECONDS * 1_000;
            let date_time = parse_timestamp(min_ts_millis).unwrap();
            assert_eq!(date_time.into_timestamp_millis(), min_ts_millis);

            let min_ts_micros = MIN_TIMESTAMP_SECONDS * 1_000_000;
            let date_time = parse_timestamp(min_ts_micros).unwrap();
            assert_eq!(date_time.into_timestamp_micros(), min_ts_micros);

            let min_ts_nanos = MIN_TIMESTAMP_SECONDS * 1_000_000_000;
            let date_time = parse_timestamp(min_ts_nanos).unwrap();
            assert_eq!(date_time.into_timestamp_micros() * 1000, min_ts_nanos);
        }
        {
            let max_ts_seconds = MAX_TIMESTAMP_SECONDS;
            let date_time = parse_timestamp(max_ts_seconds).unwrap();
            assert_eq!(date_time.into_timestamp_secs(), max_ts_seconds);

            let max_ts_millis = MAX_TIMESTAMP_SECONDS * 1_000;
            let date_time = parse_timestamp(max_ts_millis).unwrap();
            assert_eq!(date_time.into_timestamp_millis(), max_ts_millis);

            let max_ts_micros = MAX_TIMESTAMP_SECONDS * 1_000_000;
            let date_time = parse_timestamp(max_ts_micros).unwrap();
            assert_eq!(date_time.into_timestamp_micros(), max_ts_micros);
        }
    }
}


================================================
FILE: quickwit/quickwit-datetime/src/java_date_time_format.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::HashMap;
use std::num::NonZeroU8;
use std::sync::OnceLock;

use time::error::{Format, TryFromParsed};
use time::format_description::modifier::{
    Day, Hour, Minute, Month as MonthModifier, Padding, Second, Subsecond, SubsecondDigits,
    WeekNumber, WeekNumberRepr, Weekday, WeekdayRepr, Year, YearRepr,
};
use time::format_description::{Component, OwnedFormatItem};
use time::parsing::Parsed;
use time::{Month, OffsetDateTime, PrimitiveDateTime, UtcOffset};
use time_fmt::parse::time_format_item::parse_to_format_item;

use crate::date_time_format;

const JAVA_DATE_FORMAT_TOKENS: &[&str] = &[
    "yyyy",
    "xxxx",
    "SSSSSSSSS", // For nanoseconds
    "SSSSSSS",   // For microseconds
    "SSSSSS",    // For fractional seconds up to six digits
    "SSSSS",
    "SSSS",
    "SSS",
    "SS",
    "ZZ",
    "ww",
    "w[w]",
    "MM",
    "dd",
    "HH",
    "hh",
    "kk",
    "mm",
    "ss",
    "aa",
    "a",
    "w",
    "M",
    "d",
    "H",
    "h",
    "k",
    "m",
    "s",
    "S",
    "Z",
    "e",
];

fn literal(s: &[u8]) -> OwnedFormatItem {
    // builds a boxed slice from a slice
    let boxed_slice: Box<[u8]> = s.to_vec().into_boxed_slice();
    OwnedFormatItem::Literal(boxed_slice)
}

#[inline]
fn get_padding(ptn: &str) -> Padding {
    if ptn.len() == 2 {
        Padding::Zero
    } else {
        Padding::None
    }
}

fn build_zone_offset(_: &str) -> Option<OwnedFormatItem> {
    // 'Z' literal to represent UTC offset
    let z_literal = OwnedFormatItem::Literal(Box::from(b"Z".as_ref()));

    // Offset in '+/-HH:MM' format
    let offset_with_delimiter_items: Box<[OwnedFormatItem]> = vec![
        OwnedFormatItem::Component(Component::OffsetHour(Default::default())),
        OwnedFormatItem::Literal(Box::from(b":".as_ref())),
        OwnedFormatItem::Component(Component::OffsetMinute(Default::default())),
    ]
    .into_boxed_slice();
    let offset_with_delimiter_compound = OwnedFormatItem::Compound(offset_with_delimiter_items);

    // Offset in '+/-HHMM' format
    let offset_items: Box<[OwnedFormatItem]> = vec![
        OwnedFormatItem::Component(Component::OffsetHour(Default::default())),
        OwnedFormatItem::Component(Component::OffsetMinute(Default::default())),
    ]
    .into_boxed_slice();
    let offset_compound = OwnedFormatItem::Compound(offset_items);

    Some(OwnedFormatItem::First(
        vec![z_literal, offset_with_delimiter_compound, offset_compound].into_boxed_slice(),
    ))
}

// There is a `YearRepr::LastTwo` representation in the time crate, but the parser is unreliable, so
// we only support `YearRepr::Full` for now. See also https://github.com/time-rs/time/issues/649.
const fn year_item() -> Option<OwnedFormatItem> {
    let mut year_component = Year::default();
    year_component.repr = YearRepr::Full;
    Some(OwnedFormatItem::Component(Component::Year(year_component)))
}

fn build_month_item(ptn: &str) -> Option<OwnedFormatItem> {
    let mut month: MonthModifier = Default::default();
    month.padding = get_padding(ptn);
    Some(OwnedFormatItem::Component(Component::Month(month)))
}

fn build_day_item(ptn: &str) -> Option<OwnedFormatItem> {
    let mut day = Day::default();
    day.padding = get_padding(ptn);
    Some(OwnedFormatItem::Component(Component::Day(day)))
}

fn build_day_of_week_item(_: &str) -> Option<OwnedFormatItem> {
    let mut weekday = Weekday::default();
    weekday.repr = WeekdayRepr::Monday;
    weekday.one_indexed = false;
    Some(OwnedFormatItem::Component(Component::Weekday(weekday)))
}

fn build_week_of_year_item(ptn: &str) -> Option<OwnedFormatItem> {
    let mut week_number = WeekNumber::default();
    week_number.repr = WeekNumberRepr::Monday;
    week_number.padding = get_padding(ptn);
    Some(OwnedFormatItem::Component(Component::WeekNumber(
        week_number,
    )))
}

fn build_hour_item(ptn: &str) -> Option<OwnedFormatItem> {
    let mut hour = Hour::default();
    hour.padding = get_padding(ptn);
    hour.is_12_hour_clock = false;
    Some(OwnedFormatItem::Component(Component::Hour(hour)))
}

fn build_minute_item(ptn: &str) -> Option<OwnedFormatItem> {
    let mut minute: Minute = Default::default();
    minute.padding = get_padding(ptn);
    Some(OwnedFormatItem::Component(Component::Minute(minute)))
}

fn build_second_item(ptn: &str) -> Option<OwnedFormatItem> {
    let mut second: Second = Default::default();
    second.padding = get_padding(ptn);
    Some(OwnedFormatItem::Component(Component::Second(second)))
}

fn build_fraction_of_second_item(_ptn: &str) -> Option<OwnedFormatItem> {
    let mut subsecond: Subsecond = Default::default();
    subsecond.digits = SubsecondDigits::OneOrMore;
    Some(OwnedFormatItem::Component(Component::Subsecond(subsecond)))
}

fn parse_java_datetime_format_items_recursive(
    chars: &mut std::iter::Peekable<std::str::Chars>,
) -> Result<Vec<OwnedFormatItem>, String> {
    let mut items = Vec::new();

    while let Some(&c) = chars.peek() {
        match c {
            '[' => {
                chars.next();
                let optional_items = parse_java_datetime_format_items_recursive(chars)?;
                items.push(OwnedFormatItem::Optional(Box::new(
                    OwnedFormatItem::Compound(optional_items.into_boxed_slice()),
                )));
            }
            ']' => {
                chars.next();
                break;
            }
            '\'' => {
                chars.next();
                let mut literal_str = String::new();
                while let Some(&next_c) = chars.peek() {
                    if next_c == '\'' {
                        chars.next();
                        break;
                    } else {
                        literal_str.push(next_c);
                        chars.next();
                    }
                }
                items.push(literal(literal_str.as_bytes()));
            }
            _ => {
                if let Some(format_item) = match_java_date_format_token(chars)? {
                    items.push(format_item);
                } else {
                    // Treat as a literal character
                    items.push(literal(c.to_string().as_bytes()));
                    chars.next();
                }
            }
        }
    }

    Ok(items)
}

// Elasticsearch/OpenSearch uses a set of preconfigured formats, more information could be found
// here https://www.elastic.co/guide/en/elasticsearch/reference/current/mapping-date-format.html
fn match_java_date_format_token(
    chars: &mut std::iter::Peekable<std::str::Chars>,
) -> Result<Option<OwnedFormatItem>, String> {
    if chars.peek().is_none() {
        return Ok(None);
    }

    let remaining: String = chars.clone().collect();

    // Try to match the longest possible token
    for token in JAVA_DATE_FORMAT_TOKENS {
        if remaining.starts_with(token) {
            for _ in 0..token.len() {
                chars.next();
            }

            let format_item = match *token {
                "yyyy" | "xxxx" => year_item(),
                "MM" | "M" => build_month_item(token),
                "dd" | "d" => build_day_item(token),
                "HH" | "H" => build_hour_item(token),
                "mm" | "m" => build_minute_item(token),
                "ss" | "s" => build_second_item(token),
                "SSSSSSSSS" | "SSSSSSS" | "SSSSSS" | "SSSSS" | "SSSS" | "SSS" | "SS" | "S" => {
                    build_fraction_of_second_item(token)
                }
                "Z" => build_zone_offset(token),
                "ww" | "w[w]" | "w" => build_week_of_year_item(token),
                "e" => build_day_of_week_item(token),
                _ => return Err(format!("unrecognized token '{token}'")),
            };
            return Ok(format_item);
        }
    }

    Ok(None)
}

// Check if the given date time format is a common alias and replace it with the
// Java date format it is mapped to, if any.
// If the java_datetime_format is not an alias, it is expected to be a
// java date time format and should be returned as is.
fn resolve_java_datetime_format_alias(java_datetime_format: &str) -> &str {
    static JAVA_DATE_FORMAT_ALIASES: OnceLock<HashMap<&'static str, &'static str>> =
        OnceLock::new();
    let java_datetime_format_map = JAVA_DATE_FORMAT_ALIASES.get_or_init(|| {
        let mut m = HashMap::new();
        m.insert("date_optional_time", "yyyy-MM-dd['T'HH:mm:ss.SSSZ]");
        m.insert(
            "strict_date_optional_time",
            "yyyy[-MM[-dd['T'HH[:mm[:ss[.SSS[Z]]]]]]]",
        );
        m.insert(
            "strict_date_optional_time_nanos",
            "yyyy[-MM[-dd['T'HH:mm:ss.SSSSSSZ]]]",
        );
        m.insert("basic_date", "yyyyMMdd");

        m.insert("strict_basic_week_date", "xxxx'W'wwe");
        m.insert("basic_week_date", "xxxx'W'wwe");

        m.insert("strict_basic_week_date_time", "xxxx'W'wwe'T'HHmmss.SSSZ");
        m.insert("basic_week_date_time", "xxxx'W'wwe'T'HHmmss.SSSZ");

        m.insert(
            "strict_basic_week_date_time_no_millis",
            "xxxx'W'wwe'T'HHmmssZ",
        );
        m.insert("basic_week_date_time_no_millis", "xxxx'W'wwe'T'HHmmssZ");

        m.insert("strict_week_date", "xxxx-'W'ww-e");
        m.insert("week_date", "xxxx-'W'w[w]-e");
        m
    });
    java_datetime_format_map
        .get(java_datetime_format)
        .copied()
        .unwrap_or(java_datetime_format)
}

/// A date time parser that holds the format specification `Vec<FormatItem>`.
#[derive(Clone)]
pub struct StrptimeParser {
    pub(crate) strptime_format: String,
    items: Box<[OwnedFormatItem]>,
}

pub fn parse_java_datetime_format_items(
    java_datetime_format: &str,
) -> Result<Box<[OwnedFormatItem]>, String> {
    let mut chars = java_datetime_format.chars().peekable();
    let items = parse_java_datetime_format_items_recursive(&mut chars)?;
    Ok(items.into_boxed_slice())
}

impl StrptimeParser {
    /// Parse a date assume UTC if unspecified.
    /// See `parse_date_time_with_default_timezone` for more details.
    pub fn parse_date_time(&self, date_time_str: &str) -> Result<OffsetDateTime, String> {
        self.parse_date_time_with_default_timezone(date_time_str, UtcOffset::UTC)
    }

    /// Parse a date. If no timezone is specified we will assume the timezone passed as
    /// `default_offset`. If the date is missing, it will be automatically set to 00:00:00.
    pub fn parse_date_time_with_default_timezone(
        &self,
        date_time_str: &str,
        default_offset: UtcOffset,
    ) -> Result<OffsetDateTime, String> {
        let mut parsed = Parsed::new();
        if !parsed
            .parse_items(date_time_str.as_bytes(), &self.items)
            .map_err(|err| err.to_string())?
            .is_empty()
        {
            return Err(format!(
                "datetime string `{date_time_str}` does not match strptime format `{}`",
                self.strptime_format
            ));
        }

        // The parsed datetime contains a date but seems to be missing "time".
        // We complete it artificially with 00:00:00.
        if parsed.hour_24().is_none()
            && !(parsed.hour_12().is_some() && parsed.hour_12_is_pm().is_some())
        {
            parsed.set_hour_24(0u8);
            parsed.set_minute(0u8);
            parsed.set_second(0u8);
        }

        if parsed.year().is_none() {
            let now = OffsetDateTime::now_utc();
            let year = date_time_format::infer_year(parsed.month(), now.month(), now.year());
            parsed.set_year(year);
        }

        if parsed.day().is_none() && parsed.monday_week_number().is_none() {
            parsed.set_day(NonZeroU8::try_from(1u8).unwrap());
        }

        if parsed.month().is_none() && parsed.monday_week_number().is_none() {
            parsed.set_month(Month::January);
        }

        if parsed.offset_hour().is_some() {
            let offset_datetime: OffsetDateTime = parsed
                .try_into()
                .map_err(|err: TryFromParsed| err.to_string())?;
            return Ok(offset_datetime);
        }
        let primitive_date_time: PrimitiveDateTime = parsed
            .try_into()
            .map_err(|err: TryFromParsed| err.to_string())?;
        Ok(primitive_date_time.assume_offset(default_offset))
    }

    pub fn format_date_time(&self, date_time: &OffsetDateTime) -> Result<String, Format> {
        date_time.format(&self.items)
    }

    pub fn from_strptime(strptime_format: &str) -> Result<StrptimeParser, String> {
        let items: Box<[OwnedFormatItem]> = parse_to_format_item(strptime_format)
            .map_err(|err| format!("invalid strptime format `{strptime_format}`: {err}"))?
            .into_iter()
            .map(|item| item.into())
            .collect::<Vec<_>>()
            .into_boxed_slice();
        Ok(StrptimeParser::new(strptime_format.to_string(), items))
    }

    pub fn from_java_datetime_format(java_datetime_format: &str) -> Result<StrptimeParser, String> {
        let java_datetime_format_resolved =
            resolve_java_datetime_format_alias(java_datetime_format);
        let items: Box<[OwnedFormatItem]> =
            parse_java_datetime_format_items(java_datetime_format_resolved)?;
        Ok(StrptimeParser::new(java_datetime_format.to_string(), items))
    }

    fn new(strptime_format: String, items: Box<[OwnedFormatItem]>) -> Self {
        StrptimeParser {
            strptime_format,
            items,
        }
    }
}

impl PartialEq for StrptimeParser {
    fn eq(&self, other: &Self) -> bool {
        self.strptime_format == other.strptime_format
    }
}

impl Eq for StrptimeParser {}

impl std::fmt::Debug for StrptimeParser {
    fn fmt(&self, formatter: &mut std::fmt::Formatter) -> std::fmt::Result {
        formatter
            .debug_struct("StrptimeParser")
            .field("format", &self.strptime_format)
            .finish()
    }
}

impl std::hash::Hash for StrptimeParser {
    fn hash<H: std::hash::Hasher>(&self, state: &mut H) {
        self.strptime_format.hash(state);
    }
}

// `Strftime` format special characters.
// These characters are taken from the parsing crate we use for compatibility.
const STRFTIME_FORMAT_MARKERS: [&str; 36] = [
    "%a", "%A", "%b", "%B", "%c", "%C", "%d", "%D", "%e", "%f", "%F", "%h", "%H", "%I", "%j", "%k",
    "%l", "%m", "%M", "%n", "%p", "%P", "%r", "%R", "%S", "%t", "%T", "%U", "%w", "%W", "%x", "%X",
    "%y", "%Y", "%z", "%Z",
];

// Checks if a format contains `strftime` special characters.
pub fn is_strftime_formatting(format_str: &str) -> bool {
    STRFTIME_FORMAT_MARKERS
        .iter()
        .any(|marker| format_str.contains(marker))
}

#[cfg(test)]
mod tests {
    use time::macros::datetime;

    use super::*;
    use crate::java_date_time_format::parse_java_datetime_format_items;

    #[test]
    fn test_parse_datetime_format_missing_time() {
        let parser = StrptimeParser::from_strptime("%Y-%m-%d").unwrap();
        assert_eq!(
            parser.parse_date_time("2021-01-01").unwrap(),
            datetime!(2021-01-01 00:00:00 UTC)
        );
    }

    #[test]
    fn test_parse_datetime_format_strict_on_trailing_data() {
        let parser = StrptimeParser::from_strptime("%Y-%m-%d").unwrap();
        let error = parser.parse_date_time("2021-01-01TABC").unwrap_err();
        assert_eq!(
            error,
            "datetime string `2021-01-01TABC` does not match strptime format `%Y-%m-%d`"
        );
    }

    #[test]
    fn test_parse_strptime_with_timezone() {
        let parser = StrptimeParser::from_strptime("%Y-%m-%dT%H:%M:%S %z").unwrap();
        let offset_datetime = parser
            .parse_date_time("2021-01-01T11:00:03 +07:00")
            .unwrap();
        assert_eq!(offset_datetime, datetime!(2021-01-01 11:00:03 +7));
    }

    #[track_caller]
    fn test_parse_java_datetime_aux(
        java_date_time_format: &str,
        date_str: &str,
        expected_datetime: OffsetDateTime,
    ) {
        let parser = StrptimeParser::from_java_datetime_format(java_date_time_format).unwrap();
        let datetime = parser.parse_date_time(date_str).unwrap();
        assert_eq!(datetime, expected_datetime);
    }

    #[test]
    fn test_parse_java_datetime_format() {
        test_parse_java_datetime_aux("yyyyMMdd", "20210101", datetime!(2021-01-01 00:00:00 UTC));
        test_parse_java_datetime_aux(
            "yyyy MM dd",
            "2021 01 01",
            datetime!(2021-01-01 00:00:00 UTC),
        );
        test_parse_java_datetime_aux(
            "yyyy!MM?dd",
            "2021!01?01",
            datetime!(2021-01-01 00:00:00 UTC),
        );
        test_parse_java_datetime_aux(
            "yyyy!MM?dd'T'HH:",
            "2021!01?01T13:",
            datetime!(2021-01-01 13:00:00 UTC),
        );
        test_parse_java_datetime_aux(
            "yyyy!MM?dd['T'[HH:]]",
            "2021!01?01",
            datetime!(2021-01-01 00:00:00 UTC),
        );
        test_parse_java_datetime_aux(
            "yyyy!MM?dd['T'[HH:]",
            "2021!01?01T",
            datetime!(2021-01-01 00:00:00 UTC),
        );
        test_parse_java_datetime_aux(
            "yyyy!MM?dd['T'[HH:]]",
            "2021!01?01T13:",
            datetime!(2021-01-01 13:00:00 UTC),
        );
    }

    #[test]
    fn test_parse_java_missing_time() {
        test_parse_java_datetime_aux(
            "yyyy-MM-dd",
            "2021-01-01",
            datetime!(2021-01-01 00:00:00 UTC),
        );
    }

    #[test]
    fn test_parse_java_optional_missing_time() {
        test_parse_java_datetime_aux(
            "yyyy-MM-dd[ HH:mm:ss]",
            "2021-01-01",
            datetime!(2021-01-01 00:00:00 UTC),
        );
        test_parse_java_datetime_aux(
            "yyyy-MM-dd[ HH:mm:ss]",
            "2021-01-01 12:34:56",
            datetime!(2021-01-01 12:34:56 UTC),
        );
    }

    #[test]
    fn test_parse_java_datetime_format_aliases() {
        test_parse_java_datetime_aux(
            "date_optional_time",
            "2021-01-01",
            datetime!(2021-01-01 00:00:00 UTC),
        );
        test_parse_java_datetime_aux(
            "date_optional_time",
            "2021-01-21T03:01:22.312+01:00",
            datetime!(2021-01-21 03:01:22.312 +1),
        );
    }

    #[test]
    fn test_parse_java_week_formats() {
        test_parse_java_datetime_aux(
            "basic_week_date",
            "2024W313",
            datetime!(2024-08-01 0:00:00.0 +00:00:00),
        );
        let parser = StrptimeParser::from_java_datetime_format("basic_week_date").unwrap();
        parser.parse_date_time("24W313").unwrap_err();

        let parser = StrptimeParser::from_java_datetime_format("basic_week_date").unwrap();
        parser.parse_date_time("1W313").unwrap_err();

        test_parse_java_datetime_aux(
            "basic_week_date_time",
            "2018W313T121212.1Z",
            datetime!(2018-08-02 12:12:12.1 +00:00:00),
        );
        test_parse_java_datetime_aux(
            "basic_week_date_time",
            "2018W313T121212.123Z",
            datetime!(2018-08-02 12:12:12.123 +00:00:00),
        );
        test_parse_java_datetime_aux(
            "basic_week_date_time",
            "2018W313T121212.123456789Z",
            datetime!(2018-08-02 12:12:12.123456789 +00:00:00),
        );
        test_parse_java_datetime_aux(
            "basic_week_date_time",
            "2018W313T121212.123+0100",
            datetime!(2018-08-02 12:12:12.123 +01:00:00),
        );
        test_parse_java_datetime_aux(
            "basic_week_date_time_no_millis",
            "2018W313T121212Z",
            datetime!(2018-08-02 12:12:12.0 +00:00:00),
        );
        test_parse_java_datetime_aux(
            "basic_week_date_time_no_millis",
            "2018W313T121212+0100",
            datetime!(2018-08-02 12:12:12.0 +01:00:00),
        );
        test_parse_java_datetime_aux(
            "basic_week_date_time_no_millis",
            "2018W313T121212+01:00",
            datetime!(2018-08-02 12:12:12.0 +01:00:00),
        );

        test_parse_java_datetime_aux(
            "week_date",
            "2012-W48-6",
            datetime!(2012-12-02 0:00:00.0 +00:00:00),
        );

        test_parse_java_datetime_aux(
            "week_date",
            "2012-W01-6",
            datetime!(2012-01-08 0:00:00.0 +00:00:00),
        );

        test_parse_java_datetime_aux(
            "week_date",
            "2012-W1-6",
            datetime!(2012-01-08 0:00:00.0 +00:00:00),
        );
    }

    #[test]
    fn test_parse_java_strict_week_formats() {
        test_parse_java_datetime_aux(
            "strict_basic_week_date",
            "2024W313",
            datetime!(2024-08-01 0:00:00.0 +00:00:00),
        );

        test_parse_java_datetime_aux(
            "strict_week_date",
            "2012-W48-6",
            datetime!(2012-12-02 0:00:00.0 +00:00:00),
        );

        test_parse_java_datetime_aux(
            "strict_week_date",
            "2012-W01-6",
            datetime!(2012-01-08 0:00:00.0 +00:00:00),
        );
    }

    #[test]
    fn test_parse_strict_date_optional_time() {
        let parser =
            StrptimeParser::from_java_datetime_format("strict_date_optional_time").unwrap();
        let dates = [
            "2019",
            "2019-03",
            "2019-03-23",
            "2019-03-23T21:34",
            "2019-03-23T21:34:46",
            "2019-03-23T21:34:46.123Z",
            "2019-03-23T21:35:46.123+00:00",
            "2019-03-23T21:36:46.123+03:00",
            "2019-03-23T21:37:46.123+0300",
        ];
        let expected = [
            datetime!(2019-01-01 00:00:00 UTC),
            datetime!(2019-03-01 00:00:00 UTC),
            datetime!(2019-03-23 00:00:00 UTC),
            datetime!(2019-03-23 21:34 UTC),
            datetime!(2019-03-23 21:34:46 UTC),
            datetime!(2019-03-23 21:34:46.123 UTC),
            datetime!(2019-03-23 21:35:46.123 UTC),
            datetime!(2019-03-23 21:36:46.123 +03:00:00),
            datetime!(2019-03-23 21:37:46.123 +03:00:00),
        ];
        for (date_str, &expected_dt) in dates.iter().zip(expected.iter()) {
            let parsed_dt = parser
                .parse_date_time(date_str)
                .unwrap_or_else(|error| panic!("failed to parse {date_str}: {error}"));
            assert_eq!(parsed_dt, expected_dt);
        }
    }

    #[test]
    fn test_parse_strict_date_optional_time_nanos() {
        let parser =
            StrptimeParser::from_java_datetime_format("strict_date_optional_time_nanos").unwrap();
        let dates = [
            "2019",
            "2019-03",
            "2019-03-23",
            "2019-03-23T21:34:46.123456789Z",
            "2019-03-23T21:35:46.123456789+00:00",
            "2019-03-23T21:36:46.123456789+03:00",
            "2019-03-23T21:37:46.123456789+0300",
        ];
        let expected = [
            datetime!(2019-01-01 00:00:00 UTC),
            datetime!(2019-03-01 00:00:00 UTC),
            datetime!(2019-03-23 00:00:00 UTC),
            datetime!(2019-03-23 21:34:46.123456789 UTC),
            datetime!(2019-03-23 21:35:46.123456789 UTC),
            datetime!(2019-03-23 21:36:46.123456789 +03:00:00),
            datetime!(2019-03-23 21:37:46.123456789 +03:00:00),
        ];
        for (date_str, &expected_dt) in dates.iter().zip(expected.iter()) {
            let parsed_dt = parser
                .parse_date_time(date_str)
                .unwrap_or_else(|error| panic!("failed to parse {date_str}: {error}"));
            assert_eq!(parsed_dt, expected_dt);
        }
    }

    #[test]
    fn test_parse_java_datetime_format_items() {
        let format_str = "xxxx'W'wwe";
        let result = parse_java_datetime_format_items(format_str).unwrap();

        // We expect the tokens to be parsed as:
        // - 'xxxx' (week-based year)
        // - 'W' (literal)
        // - 'ww' (week of year)
        // - 'e' (day of week)

        assert_eq!(result.len(), 4);

        // Verify each token
        match &result[0] {
            OwnedFormatItem::Component(Component::Year(year)) => {
                assert_eq!(year.repr, YearRepr::Full);
            }
            unexpected => panic!("expected Year, but found: {unexpected:?}",),
        }
        match &result[1] {
            OwnedFormatItem::Literal(lit) => assert_eq!(lit.as_ref(), b"W"),
            unexpected => panic!("expected literal 'W', but found: {unexpected:?}"),
        }
        match &result[2] {
            OwnedFormatItem::Component(Component::WeekNumber(_)) => {}
            unexpected => panic!("expected WeekNumber component, but found: {unexpected:?}"),
        }
        match &result[3] {
            OwnedFormatItem::Component(Component::Weekday(_)) => {}
            unexpected => panic!("expected Weekday component, but found: {unexpected:?}"),
        }
    }

    #[test]
    fn test_parse_java_datetime_format_with_literals() {
        let format = "yyyy'T'Z-HHuu";
        let parser = StrptimeParser::from_java_datetime_format(format).unwrap();

        let test_cases = [
            ("2023TZ-14uu", datetime!(2023-01-01 14:00:00 UTC)),
            ("2024TZ-05uu", datetime!(2024-01-01 05:00:00 UTC)),
            ("2025TZ-23uu", datetime!(2025-01-01 23:00:00 UTC)),
        ];

        for (input, expected) in test_cases.iter() {
            let result = parser.parse_date_time(input).unwrap();
            assert_eq!(result, *expected, "failed to parse {input}");
        }

        // Test error case
        let error_case = "2023-1430";
        assert!(
            parser.parse_date_time(error_case).is_err(),
            "expected error for input: {error_case}",
        );
    }
}


================================================
FILE: quickwit/quickwit-datetime/src/lib.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

mod date_time_format;
mod date_time_parsing;
pub mod java_date_time_format;

pub use date_time_format::{DateTimeInputFormat, DateTimeOutputFormat};
pub use date_time_parsing::{
    parse_date_time_str, parse_timestamp, parse_timestamp_float, parse_timestamp_int,
};
pub use java_date_time_format::StrptimeParser;
pub use tantivy::DateTime as TantivyDateTime;


================================================
FILE: quickwit/quickwit-directories/Cargo.toml
================================================
[package]
name = "quickwit-directories"
description = "Custom `tantivy::Directory` implementations for Quickwit"

version.workspace = true
edition.workspace = true
homepage.workspace = true
documentation.workspace = true
repository.workspace = true
authors.workspace = true
license.workspace = true

[dependencies]
anyhow = { workspace = true }
async-trait = { workspace = true }
postcard = { workspace = true }
serde = { workspace = true }
tantivy = { workspace = true }
time = { workspace = true }
tokio = { workspace = true }
tracing = { workspace = true }

quickwit-common = { workspace = true }
quickwit-storage = { workspace = true }

[dev-dependencies]
tempfile = { workspace = true }


================================================
FILE: quickwit/quickwit-directories/src/bundle_directory.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::convert::TryInto;
use std::fmt::Debug;
use std::path::{Path, PathBuf};
use std::sync::Arc;
use std::{fmt, io};

use quickwit_storage::{BundleStorageFileOffsets, OwnedBytes, Storage, StorageResult};
use tantivy::directory::error::OpenReadError;
use tantivy::directory::{FileHandle, FileSlice};
use tantivy::{Directory, HasLen};

/// BundleDirectory is a read-only directory that makes it possible to
/// open a split and serve the file it contains via tantivy's `Directory`.
///
/// It is the `Directory` equivalent of `BundleStorage`.
///
/// Split Format:
/// `[Files][FilesMetadata][FilesMetadata length 8 byte Little endian][Hotcache][Hotcache length 8
/// byte Little endian]`
#[derive(Clone)]
pub struct BundleDirectory {
    file: FileSlice,
    file_offsets: BundleStorageFileOffsets,
}

impl Debug for BundleDirectory {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        write!(f, "BundleDirectory")
    }
}

/// Loads the split footer from a storage and path.
///
/// Returns (SplitFooter, BundleFooter)
/// SplitFooter [BundleMetadata, BundleMetadata Len, Hotcache, Hotcache len]
/// BundleFooter [BundleMetadata, BundleMetadata Len]
pub async fn read_split_footer(
    storage: Arc<dyn Storage>,
    path: &Path,
) -> StorageResult<(OwnedBytes, OwnedBytes)> {
    let file_len = storage.file_num_bytes(path).await? as usize;

    let hotcache_len_bytes = storage.get_slice(path, file_len - 8..file_len).await?;
    let hotcache_len = u64::from_le_bytes(hotcache_len_bytes.as_ref().try_into().unwrap()) as usize;

    let second_footer_start = file_len - 8 - hotcache_len - 8;
    let second_footer_bytes = storage
        .get_slice(path, second_footer_start..second_footer_start + 8)
        .await?;
    let second_footer_len =
        u64::from_le_bytes(second_footer_bytes.as_ref().try_into().unwrap()) as usize;

    let split_footer = storage
        .get_slice(path, second_footer_start - second_footer_len..file_len)
        .await?;
    let only_bundle_footer = split_footer.slice(0..second_footer_len + 8);

    Ok((split_footer, only_bundle_footer))
}

/// Return two slices for given split: `[body and bundle meta data] [hotcache]`
fn split_footer(file_slice: FileSlice) -> io::Result<(FileSlice, FileSlice)> {
    let (body_and_footer_slice, footer_len_slice) = file_slice.split_from_end(4);
    let footer_len_bytes = footer_len_slice.read_bytes()?;
    let footer_len = u32::from_le_bytes(footer_len_bytes.as_slice().try_into().unwrap());
    Ok(body_and_footer_slice.split_from_end(footer_len as usize))
}

/// Return two slices for given split: `[body and bundle meta data] [hotcache]`
pub fn get_hotcache_from_split(data: OwnedBytes) -> io::Result<OwnedBytes> {
    let split_file = FileSlice::new(Arc::new(data));
    let (_, hotcache) = split_footer(split_file)?;
    hotcache.read_bytes()
}

impl BundleDirectory {
    /// Get files and their sizes in a split.
    pub fn get_stats_split(data: OwnedBytes) -> anyhow::Result<Vec<(PathBuf, u64)>> {
        let split_file = FileSlice::new(Arc::new(data));
        let (body_and_bundle_metadata, hot_cache) = split_footer(split_file)?;
        let file_offsets = BundleStorageFileOffsets::open(body_and_bundle_metadata)?;

        let mut files_and_size: Vec<(_, _)> = file_offsets
            .files
            .into_iter()
            .map(|(file, range)| (file, range.end - range.start))
            .collect();

        files_and_size.push((
            PathBuf::from("hotcache".to_string()),
            hot_cache.len() as u64,
        ));

        files_and_size.sort();
        Ok(files_and_size)
    }

    /// Opens a split file.
    pub fn open_split(split_file: FileSlice) -> io::Result<BundleDirectory> {
        // First we remove the hotcache from our file slice.
        let (body_and_bundle_metadata, _hot_cache) = split_footer(split_file)?;
        BundleDirectory::open_bundle(body_and_bundle_metadata).map_err(io::Error::other)
    }

    /// Opens a BundleDirectory, given a file containing the bundle data.
    pub fn open_bundle(file: FileSlice) -> anyhow::Result<BundleDirectory> {
        let file_offsets = BundleStorageFileOffsets::open(file.clone())?;
        Ok(BundleDirectory { file, file_offsets })
    }
}

impl Directory for BundleDirectory {
    fn get_file_handle(&self, path: &Path) -> Result<Arc<dyn FileHandle>, OpenReadError> {
        let file_slice = self.open_read(path)?;
        Ok(Arc::new(file_slice))
    }

    fn open_read(&self, path: &Path) -> Result<FileSlice, OpenReadError> {
        let byte_range = self
            .file_offsets
            .get(path)
            .ok_or_else(|| OpenReadError::FileDoesNotExist(path.to_path_buf()))?;
        Ok(self
            .file
            .slice(byte_range.start as usize..byte_range.end as usize))
    }

    fn atomic_read(&self, path: &Path) -> Result<Vec<u8>, OpenReadError> {
        let file_slice = self.open_read(path)?;
        let payload = file_slice
            .read_bytes()
            .map_err(|io_error| OpenReadError::wrap_io_error(io_error, path.to_path_buf()))?;
        Ok(payload.to_vec())
    }

    fn exists(&self, path: &Path) -> Result<bool, OpenReadError> {
        Ok(self.file_offsets.exists(path))
    }

    crate::read_only_directory!();
}

#[cfg(test)]
mod tests {
    use std::fs::File;
    use std::io::Write;

    use quickwit_common::shared_consts::SPLIT_FIELDS_FILE_NAME;
    use quickwit_storage::{PutPayload, SplitPayloadBuilder};

    use super::*;

    #[tokio::test]
    async fn test_bundle_directory_stats() -> anyhow::Result<()> {
        let temp_dir = tempfile::tempdir()?;
        let test_filepath1 = temp_dir.path().join("f1");
        let test_filepath2 = temp_dir.path().join("f2");

        let mut file1 = File::create(&test_filepath1)?;
        file1.write_all(&[123, 76])?;

        let mut file2 = File::create(&test_filepath2)?;
        file2.write_all(&[99, 55, 44])?;

        let split_streamer = SplitPayloadBuilder::get_split_payload(
            &[test_filepath1.clone(), test_filepath2.clone()],
            &[],
            &[
                1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18,
            ],
        )?;

        let buffer = split_streamer.read_all().await?;

        // check stats
        let stats = BundleDirectory::get_stats_split(buffer)?;

        assert_eq!(stats[0], (PathBuf::from("f1".to_string()), 2_u64));
        assert_eq!(stats[1], (PathBuf::from("f2".to_string()), 3_u64));
        assert_eq!(stats[2], (PathBuf::from("hotcache".to_string()), 18_u64));

        Ok(())
    }

    #[tokio::test]
    async fn test_bundle_directory() -> anyhow::Result<()> {
        let temp_dir = tempfile::tempdir()?;
        let test_filepath1 = temp_dir.path().join("f1");
        let test_filepath2 = temp_dir.path().join("f2");

        let mut file1 = File::create(&test_filepath1)?;
        file1.write_all(&[123, 76])?;

        let mut file2 = File::create(&test_filepath2)?;
        file2.write_all(&[99, 55, 44])?;

        let split_streamer = SplitPayloadBuilder::get_split_payload(
            &[test_filepath1.clone(), test_filepath2.clone()],
            &[],
            &[
                1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18,
            ],
        )?;

        let buffer = split_streamer.read_all().await?;

        let bundle_file_slice = FileSlice::from(buffer.to_vec());

        let bundle_dir = BundleDirectory::open_split(bundle_file_slice)?;

        assert!(bundle_dir.exists(Path::new("f1")).unwrap());
        assert!(bundle_dir.exists(Path::new("f2")).unwrap());
        assert!(!bundle_dir.exists(Path::new("f3")).unwrap());

        let f1_data = bundle_dir.atomic_read(Path::new("f1"))?;
        assert_eq!(&*f1_data, &[123u8, 76u8]);

        let f2_data = bundle_dir.atomic_read(Path::new("f2"))?;
        assert_eq!(&f2_data[..], &[99, 55, 44]);

        Ok(())
    }

    #[tokio::test]
    async fn test_stream_split_to_bundle_and_open() -> anyhow::Result<()> {
        let temp_dir = tempfile::tempdir()?;
        let test_filepath1 = temp_dir.path().join("f1");
        let test_filepath2 = temp_dir.path().join("f2");

        let mut file1 = File::create(&test_filepath1)?;
        file1.write_all(&[123, 76])?;

        let mut file2 = File::create(&test_filepath2)?;
        file2.write_all(&[99, 55, 44])?;

        let split_streamer = SplitPayloadBuilder::get_split_payload(
            &[test_filepath1.clone(), test_filepath2.clone()],
            &[5, 5, 5],
            &[1, 2, 3],
        )?;

        let data = split_streamer.read_all().await?;

        let bundle_dir = BundleDirectory::open_split(FileSlice::from(data.to_vec()))?;

        let field_data = bundle_dir.atomic_read(Path::new(SPLIT_FIELDS_FILE_NAME))?;
        assert_eq!(&*field_data, &[5, 5, 5]);

        let f1_data = bundle_dir.atomic_read(Path::new("f1"))?;
        assert_eq!(&*f1_data, &[123u8, 76u8]);

        let f2_data = bundle_dir.atomic_read(Path::new("f2"))?;
        assert_eq!(&f2_data[..], &[99, 55, 44]);

        Ok(())
    }
}


================================================
FILE: quickwit/quickwit-directories/src/caching_directory.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::ops::Range;
use std::path::{Path, PathBuf};
use std::sync::Arc;
use std::{fmt, io};

use async_trait::async_trait;
use quickwit_storage::ByteRangeCache;
use tantivy::directory::error::OpenReadError;
use tantivy::directory::{FileHandle, OwnedBytes};
use tantivy::{Directory, HasLen};

/// The caching directory is a simple cache that wraps another directory.
#[derive(Clone)]
pub struct CachingDirectory {
    underlying: Arc<dyn Directory>,
    // TODO fixme: that's a pretty ugly cache we have here.
    cache: ByteRangeCache,
}

impl CachingDirectory {
    /// Creates a new CachingDirectory.
    ///
    /// Warning: The resulting CacheDirectory will cache all information without ever
    /// removing any item from the cache.
    pub fn new_unbounded(underlying: Arc<dyn Directory>) -> CachingDirectory {
        let byte_range_cache = ByteRangeCache::with_infinite_capacity(
            &quickwit_storage::STORAGE_METRICS.shortlived_cache,
        );
        CachingDirectory::new(underlying, byte_range_cache)
    }

    /// Creates a new CachingDirectory.
    ///
    /// Warning: The resulting CacheDirectory will cache all information without ever
    /// removing any item from the cache.
    pub fn new(underlying: Arc<dyn Directory>, cache: ByteRangeCache) -> CachingDirectory {
        CachingDirectory { underlying, cache }
    }
}

impl fmt::Debug for CachingDirectory {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        write!(f, "CachingDirectory({:?})", self.underlying)
    }
}

struct CachingFileHandle {
    path: PathBuf,
    cache: ByteRangeCache,
    underlying_filehandle: Arc<dyn FileHandle>,
}

impl fmt::Debug for CachingFileHandle {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        write!(
            f,
            "CachingFileHandle(path={:?}, underlying={:?})",
            &self.path,
            self.underlying_filehandle.as_ref()
        )
    }
}

#[async_trait]
impl FileHandle for CachingFileHandle {
    fn read_bytes(&self, byte_range: Range<usize>) -> io::Result<OwnedBytes> {
        if let Some(bytes) = self.cache.get_slice(&self.path, byte_range.clone()) {
            return Ok(bytes);
        }
        let owned_bytes = self.underlying_filehandle.read_bytes(byte_range.clone())?;
        self.cache
            .put_slice(self.path.clone(), byte_range, owned_bytes.clone());
        Ok(owned_bytes)
    }

    async fn read_bytes_async(&self, byte_range: Range<usize>) -> io::Result<OwnedBytes> {
        if let Some(owned_bytes) = self.cache.get_slice(&self.path, byte_range.clone()) {
            return Ok(owned_bytes);
        }
        let read_bytes = self
            .underlying_filehandle
            .read_bytes_async(byte_range.clone())
            .await?;
        self.cache
            .put_slice(self.path.clone(), byte_range, read_bytes.clone());
        Ok(read_bytes)
    }
}

impl HasLen for CachingFileHandle {
    fn len(&self) -> usize {
        self.underlying_filehandle.len()
    }
}

impl Directory for CachingDirectory {
    fn exists(&self, path: &Path) -> std::result::Result<bool, OpenReadError> {
        self.underlying.exists(path)
    }

    fn get_file_handle(
        &self,
        path: &Path,
    ) -> std::result::Result<Arc<dyn FileHandle>, OpenReadError> {
        let underlying_filehandle = self.underlying.get_file_handle(path)?;
        let caching_file_handle = CachingFileHandle {
            path: path.to_path_buf(),
            cache: self.cache.clone(),
            underlying_filehandle,
        };
        Ok(Arc::new(caching_file_handle))
    }

    fn atomic_read(&self, path: &Path) -> std::result::Result<Vec<u8>, OpenReadError> {
        let file_handle = self.get_file_handle(path)?;
        let len = file_handle.len();
        let owned_bytes = file_handle
            .read_bytes(0..len)
            .map_err(|io_error| OpenReadError::wrap_io_error(io_error, path.to_path_buf()))?;
        Ok(owned_bytes.as_slice().to_vec())
    }

    crate::read_only_directory!();
}

#[cfg(test)]
mod tests {

    use std::path::Path;
    use std::sync::Arc;

    use tantivy::Directory;
    use tantivy::directory::RamDirectory;

    use super::CachingDirectory;
    use crate::DebugProxyDirectory;

    #[test]
    fn test_caching_directory() -> tantivy::Result<()> {
        let ram_directory = RamDirectory::default();
        let test_path = Path::new("test");
        ram_directory.atomic_write(test_path, &b"test"[..])?;
        let debug_proxy_directory = Arc::new(DebugProxyDirectory::wrap(ram_directory));
        let caching_directory = CachingDirectory::new_unbounded(debug_proxy_directory.clone());
        caching_directory.atomic_read(test_path)?;
        caching_directory.atomic_read(test_path)?;
        assert_eq!(debug_proxy_directory.drain_read_operations().count(), 1);
        Ok(())
    }
}


================================================
FILE: quickwit/quickwit-directories/src/debug_proxy_directory.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::ops::Range;
use std::path::{Path, PathBuf};
use std::sync::{Arc, Mutex};
use std::time::{Duration, Instant};
use std::{fmt, io, mem};

use async_trait::async_trait;
use tantivy::directory::error::OpenReadError;
use tantivy::directory::{FileHandle, OwnedBytes};
use tantivy::{Directory, HasLen};
use time::OffsetDateTime;

#[derive(Clone, Default)]
struct OperationBuffer(Arc<Mutex<Vec<ReadOperation>>>);

impl fmt::Debug for OperationBuffer {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        write!(f, "OperationBuffer")
    }
}

impl OperationBuffer {
    fn drain(&self) -> impl Iterator<Item = ReadOperation> + 'static {
        let mut guard = self.0.lock().expect("Mutex poisoned");
        let ops: Vec<ReadOperation> = mem::take(guard.as_mut());
        ops.into_iter()
    }

    fn push(&self, read_operation: ReadOperation) {
        let mut guard = self.0.lock().expect("Mutex poisoned");
        guard.push(read_operation);
    }
}

/// A ReadOperation records meta data about a read operation.
/// It is recorded by the `DebugProxyDirectory`.
#[derive(Clone, Debug, Eq, PartialEq)]
pub struct ReadOperation {
    /// Path that was read
    pub path: PathBuf,
    /// If fetching a range of data, the start offset, else 0.
    pub offset: usize,
    /// The number of bytes fetched
    pub num_bytes: usize,
    /// The date at which the operation was performed (UTC timezone).
    pub start_date: OffsetDateTime,
    /// The elapsed time to run the read operatioon.
    pub duration: Duration,
}

struct ReadOperationBuilder {
    start_date: OffsetDateTime,
    start_instant: Instant,
    path: PathBuf,
    offset: usize,
}

impl ReadOperationBuilder {
    pub fn new(path: &Path) -> Self {
        let start_instant = Instant::now();
        let start_date = OffsetDateTime::now_utc();
        ReadOperationBuilder {
            start_date,
            start_instant,
            path: path.to_path_buf(),
            offset: 0,
        }
    }

    pub fn with_offset(self, offset: usize) -> Self {
        ReadOperationBuilder {
            start_date: self.start_date,
            start_instant: self.start_instant,
            path: self.path,
            offset,
        }
    }

    fn terminate(self, num_bytes: usize) -> ReadOperation {
        let duration = self.start_instant.elapsed();
        ReadOperation {
            path: self.path.clone(),
            offset: self.offset,
            num_bytes,
            start_date: self.start_date,
            duration,
        }
    }
}

/// The debug proxy wraps another directory and simply acts as a proxy
/// recording all of its read operations.
///
/// It has two purpose
/// - It is used when building our hotcache, to identify the file sections that should be in the
///   hotcache.
/// - It is used in the search-api to provide debugging/performance information.
#[derive(Debug)]
pub struct DebugProxyDirectory<D: Directory> {
    underlying: Arc<D>,
    operations: OperationBuffer,
}

impl<D: Directory> Clone for DebugProxyDirectory<D> {
    fn clone(&self) -> Self {
        DebugProxyDirectory {
            underlying: self.underlying.clone(),
            operations: self.operations.clone(),
        }
    }
}

impl<D: Directory> DebugProxyDirectory<D> {
    /// Wraps another directory to log all of its read operations.
    pub fn wrap(directory: D) -> Self {
        DebugProxyDirectory {
            underlying: Arc::new(directory),
            operations: OperationBuffer::default(),
        }
    }

    /// Returns all of the existing read operations.
    ///
    /// Calling this "drains" the existing queue of operations.
    pub fn drain_read_operations(&self) -> impl Iterator<Item = ReadOperation> + '_ {
        self.operations.drain()
    }

    /// Adds a new operation
    fn register(&self, read_op: ReadOperation) {
        self.operations.push(read_op);
    }

    /// Adds a new operation in an async fashion.
    async fn register_async(&self, read_op: ReadOperation) {
        self.operations.push(read_op);
    }
}

struct DebugProxyFileHandle<D: Directory> {
    directory: DebugProxyDirectory<D>,
    underlying: Arc<dyn FileHandle>,
    path: PathBuf,
}

#[async_trait]
impl<D: Directory> FileHandle for DebugProxyFileHandle<D> {
    fn read_bytes(&self, byte_range: Range<usize>) -> io::Result<OwnedBytes> {
        let read_operation_builder =
            ReadOperationBuilder::new(&self.path).with_offset(byte_range.start);
        let payload = self.underlying.read_bytes(byte_range)?;
        let read_operation = read_operation_builder.terminate(payload.len());
        self.directory.register(read_operation);
        Ok(payload)
    }

    async fn read_bytes_async(&self, byte_range: Range<usize>) -> io::Result<OwnedBytes> {
        let read_operation_builder =
            ReadOperationBuilder::new(&self.path).with_offset(byte_range.start);
        let payload = self.underlying.read_bytes_async(byte_range).await?;
        let read_operation = read_operation_builder.terminate(payload.len());
        self.directory.register_async(read_operation).await;
        Ok(payload)
    }
}

impl<D: Directory> fmt::Debug for DebugProxyFileHandle<D> {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        write!(f, "DebugProxyFileHandle({:?})", &self.underlying)
    }
}

impl<D: Directory> HasLen for DebugProxyFileHandle<D> {
    fn len(&self) -> usize {
        self.underlying.len()
    }
}

impl<D: Directory> Directory for DebugProxyDirectory<D> {
    fn get_file_handle(&self, path: &Path) -> Result<Arc<dyn FileHandle>, OpenReadError> {
        let underlying = self.underlying.get_file_handle(path)?;
        Ok(Arc::new(DebugProxyFileHandle {
            underlying,
            directory: self.clone(),
            path: path.to_owned(),
        }))
    }

    fn exists(&self, path: &Path) -> Result<bool, OpenReadError> {
        self.underlying.exists(path)
    }

    fn atomic_read(&self, path: &Path) -> Result<Vec<u8>, OpenReadError> {
        let read_operation_builder = ReadOperationBuilder::new(path);
        let payload = self.underlying.atomic_read(path)?;
        let read_operation = read_operation_builder.terminate(payload.len());
        self.register(read_operation);
        Ok(payload.to_vec())
    }

    crate::read_only_directory!();
}

#[cfg(test)]
mod tests {
    use std::io::Write;
    use std::path::Path;

    use tantivy::Directory;
    use tantivy::directory::{RamDirectory, TerminatingWrite};

    use super::DebugProxyDirectory;

    const TEST_PATH: &str = "test.file";
    const TEST_PAYLOAD: &[u8] = b"hello happy tax payer";

    fn make_test_directory() -> tantivy::Result<RamDirectory> {
        let ram_directory = RamDirectory::create();
        let mut wrt = ram_directory.open_write(Path::new(TEST_PATH))?;
        wrt.write_all(TEST_PAYLOAD)?;
        wrt.flush()?;
        wrt.terminate()?;
        Ok(ram_directory)
    }

    #[test]
    fn test_debug_proxy_atomic_read() -> tantivy::Result<()> {
        let debug_proxy = DebugProxyDirectory::wrap(make_test_directory()?);
        let test_path = Path::new(TEST_PATH);
        let read_data = debug_proxy.atomic_read(test_path)?;
        assert_eq!(&read_data[..], TEST_PAYLOAD);
        let operations: Vec<crate::ReadOperation> = debug_proxy.drain_read_operations().collect();
        println!("operations {operations:?}");
        assert_eq!(operations.len(), 1);
        let op0 = &operations[0];
        assert_eq!(op0.offset, 0);
        assert_eq!(op0.num_bytes, 21);
        assert_eq!(op0.path, test_path);
        Ok(())
    }

    #[test]
    fn test_debug_proxy_open_read_read_sync() -> tantivy::Result<()> {
        let test_path = Path::new(TEST_PATH);
        let debug_proxy = DebugProxyDirectory::wrap(make_test_directory()?);
        let read_data = debug_proxy.open_read(test_path)?;
        assert_eq!(read_data.read_bytes_slice(1..3)?.as_slice(), b"el");
        let operations: Vec<crate::ReadOperation> = debug_proxy.drain_read_operations().collect();
        assert_eq!(operations.len(), 1);
        let op = &operations[0];
        assert_eq!(op.path, test_path);
        assert_eq!(op.offset, 1);
        assert_eq!(op.num_bytes, 2);
        Ok(())
    }

    #[tokio::test]
    async fn test_debug_proxy_open_read_read_async() {
        let test_path = Path::new(TEST_PATH);
        let debug_proxy = DebugProxyDirectory::wrap(make_test_directory().unwrap());
        let read_data = debug_proxy.open_read(test_path).unwrap();
        assert_eq!(
            read_data
                .read_bytes_slice_async(1..3)
                .await
                .unwrap()
                .as_slice(),
            b"el"
        );
        let operations: Vec<crate::ReadOperation> = debug_proxy.drain_read_operations().collect();
        assert_eq!(operations.len(), 1);
        let op = &operations[0];
        assert_eq!(op.path, test_path);
        assert_eq!(op.offset, 1);
        assert_eq!(op.num_bytes, 2);
    }
}


================================================
FILE: quickwit/quickwit-directories/src/hot_directory.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::{HashMap, HashSet};
use std::ops::Range;
use std::path::{Path, PathBuf};
use std::sync::Arc;
use std::{fmt, io};

use anyhow::{Context, bail};
use async_trait::async_trait;
use quickwit_storage::VersionedComponent;
use serde::{Deserialize, Serialize};
use tantivy::directory::error::OpenReadError;
use tantivy::directory::{FileHandle, FileSlice, OwnedBytes};
use tantivy::error::DataCorruption;
use tantivy::{Directory, HasLen, Index, IndexReader, ReloadPolicy, TantivyError};

use crate::{CachingDirectory, DebugProxyDirectory};

#[derive(Clone, Copy, Default)]
#[repr(u32)]
pub enum HotDirectoryVersions {
    #[default]
    V1 = 1,
}

impl VersionedComponent for HotDirectoryVersions {
    const MAGIC_NUMBER: u32 = 2_557_869_106u32;
    type Component = HotDirectoryMeta;

    fn to_version_code(self) -> u32 {
        self as u32
    }

    fn try_from_version_code_impl(code: u32) -> Option<Self> {
        match code {
            1u32 => Some(Self::V1),
            _ => None,
        }
    }

    fn deserialize_impl(&self, bytes: &mut OwnedBytes) -> anyhow::Result<HotDirectoryMeta> {
        match self {
            Self::V1 => {
                if bytes.len() < 4 {
                    bail!("data too short (len={})", bytes.len());
                }
                let len = bytes.read_u32() as usize;
                let hot_directory_meta = postcard::from_bytes(&bytes.as_slice()[..len])
                    .context("failed to deserialize hot directory meta")?;
                bytes.advance(len);
                Ok(hot_directory_meta)
            }
        }
    }

    fn serialize_impl(component: &Self::Component, output: &mut Vec<u8>) {
        let buf = postcard::to_stdvec(component).unwrap();
        output.extend_from_slice(&(buf.len() as u32).to_le_bytes());
        output.extend_from_slice(&buf[..]);
    }
}

#[derive(Serialize, Deserialize)]
pub struct HotDirectoryMeta {
    file_lengths: HashMap<PathBuf, u64>,
    slice_offsets: Vec<(PathBuf, u64)>,
}

#[derive(Clone, Debug, Serialize, Deserialize)]
struct SliceCacheIndexEntry {
    start: usize, //< legacy. We keep this instead of range due to existing indices.
    stop: usize,
    addr: usize,
}

impl SliceCacheIndexEntry {
    pub fn len(&self) -> usize {
        self.range().len()
    }

    pub fn range(&self) -> Range<usize> {
        self.start..self.stop
    }
}

#[derive(Serialize, Deserialize, Default)]
pub struct SliceCacheIndex {
    total_len: u64,
    slices: Vec<SliceCacheIndexEntry>,
}
impl SliceCacheIndex {
    pub fn is_complete(&self) -> bool {
        if self.slices.len() != 1 {
            return false;
        }
        self.slices[0].len() as u64 == self.total_len
    }

    pub fn get(&self, byte_range: Range<usize>) -> Option<usize> {
        let entry_idx = match self
            .slices
            .binary_search_by_key(&byte_range.start, |entry| entry.range().start)
        {
            Ok(idx) => idx,
            Err(0) => {
                return None;
            }
            Err(idx_after) => idx_after - 1,
        };
        let entry = &self.slices[entry_idx];
        if entry.range().start > byte_range.start || entry.range().end < byte_range.end {
            return None;
        }
        Some(entry.addr + byte_range.start - entry.range().start)
    }
}

#[derive(Default)]
struct StaticDirectoryCacheBuilder {
    file_cache_builder: HashMap<PathBuf, StaticSliceCacheBuilder>,
    file_lengths: HashMap<PathBuf, u64>, // a mapping from file path to file size in bytes
}

impl StaticDirectoryCacheBuilder {
    pub fn add_file(&mut self, path: &Path, file_len: u64) -> &mut StaticSliceCacheBuilder {
        self.file_lengths.insert(path.to_owned(), file_len);
        self.file_cache_builder
            .entry(path.to_owned())
            .or_insert_with(|| StaticSliceCacheBuilder::new(file_len))
    }

    /// Flush needs to be called afterwards.
    pub fn write(self, wrt: &mut dyn io::Write) -> tantivy::Result<()> {
        let mut data_buffer = Vec::new();
        let mut data_idx: Vec<(PathBuf, u64)> = Vec::new();
        let mut offset = 0u64;
        for (path, cache) in self.file_cache_builder {
            let buf = cache.flush()?;
            data_idx.push((path, offset));
            offset += buf.len() as u64;
            data_buffer.extend_from_slice(&buf);
        }
        let hot_directory_metas = HotDirectoryMeta {
            file_lengths: self.file_lengths,
            slice_offsets: data_idx,
        };
        let buffer = HotDirectoryVersions::serialize(&hot_directory_metas);
        wrt.write_all(&buffer)?;
        wrt.write_all(&data_buffer)?;
        Ok(())
    }
}

#[derive(Debug)]
struct StaticDirectoryCache {
    file_lengths: HashMap<PathBuf, u64>,
    slices: HashMap<PathBuf, Arc<StaticSliceCache>>,
}

impl StaticDirectoryCache {
    pub fn open(mut bytes: OwnedBytes) -> anyhow::Result<StaticDirectoryCache> {
        let HotDirectoryMeta {
            mut slice_offsets,
            file_lengths,
        } = HotDirectoryVersions::try_read_component(&mut bytes)?;
        slice_offsets.push((PathBuf::default(), bytes.len() as u64));
        let slices = slice_offsets
            .windows(2)
            .map(|slice_offsets_window| {
                let path = slice_offsets_window[0].0.clone();
                let start = slice_offsets_window[0].1 as usize;
                let end = slice_offsets_window[1].1 as usize;
                StaticSliceCache::open(bytes.slice(start..end)).map(|s| (path, Arc::new(s)))
            })
            .collect::<tantivy::Result<_>>()?;
        Ok(StaticDirectoryCache {
            file_lengths,
            slices,
        })
    }

    pub fn get_slice(&self, path: &Path) -> Arc<StaticSliceCache> {
        self.slices.get(path).cloned().unwrap_or_default()
    }

    pub fn get_file_length(&self, path: &Path) -> Option<u64> {
        self.file_lengths.get(path).copied()
    }

    pub fn get_file_lengths(&self) -> Vec<(PathBuf, u64)> {
        let mut entries = self
            .file_lengths
            .iter()
            .map(|(path, len)| (path.clone(), *len))
            .collect::<Vec<_>>();
        entries.sort_by_key(|el| el.0.to_owned());
        entries
    }
}

/// A SliceCache is a static toring
pub struct StaticSliceCache {
    bytes: OwnedBytes,
    index: SliceCacheIndex,
}

impl Default for StaticSliceCache {
    fn default() -> StaticSliceCache {
        StaticSliceCache {
            bytes: OwnedBytes::empty(),
            index: SliceCacheIndex::default(),
        }
    }
}

impl StaticSliceCache {
    pub fn open(owned_bytes: OwnedBytes) -> tantivy::Result<Self> {
        let owned_bytes_len = owned_bytes.len();
        assert!(owned_bytes_len >= 8);
        let (body, len_bytes) = owned_bytes.split(owned_bytes_len - 8);
        let mut body_len_bytes = [0u8; 8];
        body_len_bytes.copy_from_slice(len_bytes.as_slice());
        let body_len = u64::from_le_bytes(body_len_bytes);
        let (body, idx) = body.split(body_len as usize);
        let idx_bytes = idx.as_slice();
        let index: SliceCacheIndex = postcard::from_bytes(idx_bytes).map_err(|err| {
            DataCorruption::comment_only(format!("failed to deserialize the slice index: {err:?}"))
        })?;
        Ok(StaticSliceCache { bytes: body, index })
    }

    pub fn try_read_all(&self) -> Option<OwnedBytes> {
        if !self.index.is_complete() {
            return None;
        }
        Some(self.bytes.clone())
    }

    pub fn try_read_bytes(&self, byte_range: Range<usize>) -> Option<OwnedBytes> {
        if byte_range.is_empty() {
            return Some(OwnedBytes::empty());
        }
        if let Some(start) = self.index.get(byte_range.clone()) {
            return Some(self.bytes.slice(start..start + byte_range.len()));
        }
        None
    }
}

struct StaticSliceCacheBuilder {
    wrt: Vec<u8>,
    slices: Vec<SliceCacheIndexEntry>,
    offset: u64,
    total_len: u64,
}

impl StaticSliceCacheBuilder {
    pub fn new(total_len: u64) -> StaticSliceCacheBuilder {
        StaticSliceCacheBuilder {
            wrt: Vec::new(),
            slices: Vec::new(),
            offset: 0u64,
            total_len,
        }
    }

    pub fn add_bytes(&mut self, bytes: &[u8], start: usize) {
        self.wrt.extend_from_slice(bytes);
        let end = start + bytes.len();
        self.slices.push(SliceCacheIndexEntry {
            start,
            stop: end,
            addr: self.offset as usize,
        });
        self.offset += bytes.len() as u64;
    }

    fn merged_slices(&mut self) -> tantivy::Result<Vec<SliceCacheIndexEntry>> {
        if self.slices.is_empty() {
            return Ok(Vec::new());
        }
        self.slices.sort_unstable_by_key(|e| e.range().start);
        let mut slices = Vec::with_capacity(self.slices.len());
        let mut last = self.slices[0].clone();
        for segment in &self.slices[1..] {
            if segment.range().start < last.range().end {
                return Err(tantivy::TantivyError::InvalidArgument(format!(
                    "two segments are overlapping on byte {}",
                    segment.range().start
                )));
            }
            if last.stop == segment.range().start
                && (last.addr + last.range().len() == segment.addr)
            {
                // We merge the current segment with the previous one
                last.stop += segment.range().len();
            } else {
                slices.push(last);
                last = segment.clone();
            }
        }
        slices.push(last);
        Ok(slices)
    }

    pub fn flush(mut self) -> tantivy::Result<Vec<u8>> {
        let merged_slices = self.merged_slices()?;
        let slices_idx = SliceCacheIndex {
            total_len: self.total_len,
            slices: merged_slices,
        };
        self.wrt.extend_from_slice(
            &postcard::to_allocvec(&slices_idx).map_err(|err| {
                TantivyError::InternalError(format!("could not serialize {err:?}"))
            })?,
        );
        self.wrt.extend_from_slice(&self.offset.to_le_bytes()[..]);
        Ok(self.wrt)
    }
}

impl fmt::Debug for StaticSliceCache {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        write!(f, "SliceCache()")
    }
}

/// The hot directory accelerates a given directory,
/// by placing a static cache in front of a directory.
///
/// The `HotDirectory` does not implement write operations. It has been
/// designed for quickwit in order to regroup all of the small random
/// read operations required to open an index.
/// All of these operations are gather into a single file called the
/// hotcache.
#[derive(Clone)]
pub struct HotDirectory {
    inner: Arc<InnerHotDirectory>,
}

impl HotDirectory {
    /// Wraps an index, with a static cache serialized into `hot_cache_bytes`.
    pub fn open<D: Directory>(
        underlying: D,
        hot_cache_bytes: OwnedBytes,
    ) -> anyhow::Result<HotDirectory> {
        let static_cache = StaticDirectoryCache::open(hot_cache_bytes)?;
        Ok(HotDirectory {
            inner: Arc::new(InnerHotDirectory {
                underlying: Box::new(underlying),
                cache: Arc::new(static_cache),
            }),
        })
    }

    /// Get all the files in the directory and their sizes.
    ///
    /// The actual cached data is a very small fraction of this length.
    pub fn get_file_lengths(&self) -> Vec<(PathBuf, u64)> {
        self.inner.cache.get_file_lengths()
    }
}

struct FileSliceWithCache {
    underlying: FileSlice,
    static_cache: Arc<StaticSliceCache>,
    file_length: u64,
}

#[async_trait]
impl FileHandle for FileSliceWithCache {
    fn read_bytes(&self, byte_range: Range<usize>) -> io::Result<OwnedBytes> {
        if let Some(found_bytes) = self.static_cache.try_read_bytes(byte_range.clone()) {
            return Ok(found_bytes);
        }
        self.underlying.read_bytes_slice(byte_range)
    }

    async fn read_bytes_async(&self, byte_range: Range<usize>) -> io::Result<OwnedBytes> {
        if let Some(found_bytes) = self.static_cache.try_read_bytes(byte_range.clone()) {
            return Ok(found_bytes);
        }
        self.underlying.read_bytes_slice_async(byte_range).await
    }
}

impl fmt::Debug for FileSliceWithCache {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        write!(f, "FileSliceWithCache({:?})", &self.underlying)
    }
}

impl HasLen for FileSliceWithCache {
    fn len(&self) -> usize {
        self.file_length as usize
    }
}

struct InnerHotDirectory {
    underlying: Box<dyn Directory>,
    cache: Arc<StaticDirectoryCache>,
}

impl fmt::Debug for HotDirectory {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        write!(
            f,
            "HotDirectory(dir={:?}, cache={:?})",
            self.inner.underlying.as_ref(),
            self.inner.cache.as_ref()
        )
    }
}

impl Directory for HotDirectory {
    fn get_file_handle(&self, path: &Path) -> Result<Arc<dyn FileHandle>, OpenReadError> {
        let file_length = self
            .inner
            .cache
            .get_file_length(path)
            .ok_or_else(|| OpenReadError::FileDoesNotExist(path.to_owned()))?;
        let underlying_filehandle = self.inner.underlying.get_file_handle(path)?;
        let underlying = FileSlice::new_with_num_bytes(underlying_filehandle, file_length as usize);
        let file_slice_with_cache = FileSliceWithCache {
            underlying,
            static_cache: self.inner.cache.get_slice(path),
            file_length,
        };
        Ok(Arc::new(file_slice_with_cache))
    }

    fn exists(&self, path: &std::path::Path) -> Result<bool, OpenReadError> {
        Ok(self.inner.cache.get_file_length(path).is_some())
    }

    fn atomic_read(&self, path: &std::path::Path) -> Result<Vec<u8>, OpenReadError> {
        let slice_cache = self.inner.cache.get_slice(path);
        if let Some(all_bytes) = slice_cache.try_read_all() {
            return Ok(all_bytes.as_slice().to_owned());
        }
        self.inner.underlying.atomic_read(path)
    }

    crate::read_only_directory!();
}

fn list_index_files(index: &Index) -> tantivy::Result<HashSet<PathBuf>> {
    let index_meta = index.load_metas()?;
    let mut files: HashSet<PathBuf> = index_meta
        .segments
        .into_iter()
        .flat_map(|segment_meta| segment_meta.list_files())
        .collect();
    files.insert(Path::new("meta.json").to_path_buf());
    files.insert(Path::new(".managed.json").to_path_buf());
    Ok(files)
}

/// Given a tantivy directory, automatically identify the parts that should be loaded on startup
/// and writes a static cache file called hotcache in the `output`.
///
/// See [`HotDirectory`] for more information.
pub fn write_hotcache<D: Directory>(
    directory: D,
    output: &mut dyn io::Write,
) -> tantivy::Result<()> {
    // We use the caching directory here in order to defensively ensure that
    // the content of the directory that will be written in the hotcache is precisely
    // the same that was read on the first pass.
    let caching_directory = CachingDirectory::new_unbounded(Arc::new(directory));
    let debug_proxy_directory = DebugProxyDirectory::wrap(caching_directory);
    let index = Index::open(debug_proxy_directory.clone())?;
    let schema = index.schema();
    let reader: IndexReader = index
        .reader_builder()
        .reload_policy(ReloadPolicy::Manual)
        .try_into()?;
    let searcher = reader.searcher();
    for (field, field_entry) in schema.fields() {
        if !field_entry.is_indexed() {
            continue;
        }
        for reader in searcher.segment_readers() {
            let _inv_idx = reader.inverted_index(field)?;
        }
    }
    let mut cache_builder = StaticDirectoryCacheBuilder::default();
    let read_operations = debug_proxy_directory.drain_read_operations();
    let mut per_file_slices: HashMap<PathBuf, HashSet<Range<usize>>> = HashMap::default();
    for read_operation in read_operations {
        per_file_slices
            .entry(read_operation.path)
            .or_default()
            .insert(read_operation.offset..read_operation.offset + read_operation.num_bytes);
    }
    let index_files = list_index_files(&index)?;
    for file_path in index_files {
        let file_slice_res = debug_proxy_directory.open_read(&file_path);
        if let Err(tantivy::directory::error::OpenReadError::FileDoesNotExist(_)) = file_slice_res {
            continue;
        }
        let file_slice = file_slice_res?;
        let file_cache_builder = cache_builder.add_file(&file_path, file_slice.len() as u64);
        if let Some(intervals) = per_file_slices.get(&file_path) {
            for byte_range in intervals {
                let len = byte_range.len();
                // We do not want to store slices that are too large in the hotcache,
                // but on the other hand, the term dictionray index and the docstore
                // index are required for quickwit to work.
                //
                // Warning: we need to work on string here because `Path::ends_with`
                // has very different semantics.
                let file_path_str = file_path.to_string_lossy();
                if file_path_str.ends_with("store")
                    || file_path_str.ends_with("term")
                    || len < 10_000_000
                {
                    let bytes = file_slice.read_bytes_slice(byte_range.clone())?;
                    file_cache_builder.add_bytes(bytes.as_slice(), byte_range.start);
                }
            }
        }
    }
    cache_builder.write(output)?;
    output.flush()?;
    Ok(())
}

#[cfg(test)]
mod tests {
    use super::*;

    #[test]
    fn test_empty_slice_cache_index() -> tantivy::Result<()> {
        let slice_cache_builder = StaticSliceCacheBuilder::new(10u64);
        let cache_data = slice_cache_builder.flush()?;
        let owned_bytes = OwnedBytes::new(cache_data);
        let slice_cache = StaticSliceCache::open(owned_bytes)?;
        assert!(slice_cache.try_read_bytes(5..6).is_none());
        Ok(())
    }

    #[test]
    fn test_simple_slice_cache_index() -> tantivy::Result<()> {
        let mut slice_cache_builder = StaticSliceCacheBuilder::new(10u64);
        slice_cache_builder.add_bytes(b"abc", 2);
        let cache_data = slice_cache_builder.flush()?;
        let owned_bytes = OwnedBytes::new(cache_data);
        let slice_cache = StaticSliceCache::open(owned_bytes)?;
        assert_eq!(
            slice_cache.try_read_bytes(2..5).unwrap().as_slice(),
            &b"abc"[..]
        );
        assert_eq!(
            slice_cache.try_read_bytes(2..3).unwrap().as_slice(),
            &b"a"[..]
        );
        assert_eq!(
            slice_cache.try_read_bytes(3..5).unwrap().as_slice(),
            &b"bc"[..]
        );
        assert_eq!(
            slice_cache.try_read_bytes(4..5).unwrap().as_slice(),
            &b"c"[..]
        );
        assert!(slice_cache.try_read_bytes(5..6).is_none());
        assert!(slice_cache.try_read_bytes(4..6).is_none());
        assert!(slice_cache.try_read_bytes(6..7).is_none());
        assert_eq!(
            slice_cache.try_read_bytes(6..6).unwrap().as_slice(),
            &b""[..]
        );
        Ok(())
    }

    #[test]
    fn test_several_segments() -> tantivy::Result<()> {
        let mut slice_cache_builder = StaticSliceCacheBuilder::new(100u64);
        slice_cache_builder.add_bytes(b"def", 6);
        slice_cache_builder.add_bytes(b"ghi", 12);
        slice_cache_builder.add_bytes(b"abc", 2);
        let cache_data = slice_cache_builder.flush()?;
        let owned_bytes = OwnedBytes::new(cache_data);
        let slice_cache = StaticSliceCache::open(owned_bytes)?;
        assert_eq!(
            slice_cache.try_read_bytes(2..5).unwrap().as_slice(),
            &b"abc"[..]
        );
        assert_eq!(
            slice_cache.try_read_bytes(2..3).unwrap().as_slice(),
            &b"a"[..]
        );
        assert_eq!(
            slice_cache.try_read_bytes(3..5).unwrap().as_slice(),
            &b"bc"[..]
        );
        assert_eq!(
            slice_cache.try_read_bytes(4..5).unwrap().as_slice(),
            &b"c"[..]
        );
        assert!(slice_cache.try_read_bytes(5..6).is_none());
        assert!(slice_cache.try_read_bytes(4..6).is_none());
        assert_eq!(
            slice_cache.try_read_bytes(6..7).unwrap().as_slice(),
            &b"d"[..]
        );
        assert!(slice_cache.try_read_bytes(2..7).is_none());
        Ok(())
    }

    #[test]
    fn test_slice_cache_merged_entries() -> tantivy::Result<()> {
        let mut slice_cache_builder = StaticSliceCacheBuilder::new(100u64);
        slice_cache_builder.add_bytes(b"abc", 2);
        slice_cache_builder.add_bytes(b"def", 5);
        let cache_data = slice_cache_builder.flush()?;
        let owned_bytes = OwnedBytes::new(cache_data);
        let slice_cache = StaticSliceCache::open(owned_bytes)?;
        assert_eq!(
            slice_cache.try_read_bytes(3..7).unwrap().as_slice(),
            &b"bcde"[..]
        );
        Ok(())
    }

    #[test]
    fn test_slice_cache_unmergeable_entries() -> tantivy::Result<()> {
        let mut slice_cache_builder = StaticSliceCacheBuilder::new(100u64);
        slice_cache_builder.add_bytes(b"def", 5);
        slice_cache_builder.add_bytes(b"abc", 2);
        let cache_data = slice_cache_builder.flush()?;
        let owned_bytes = OwnedBytes::new(cache_data);
        let slice_cache = StaticSliceCache::open(owned_bytes)?;
        assert!(slice_cache.try_read_bytes(3..7).is_none());
        Ok(())
    }

    #[test]
    fn test_slice_cache_overlapping_entries() {
        let mut slice_cache_builder = StaticSliceCacheBuilder::new(100u64);
        slice_cache_builder.add_bytes(b"abcd", 2);
        slice_cache_builder.add_bytes(b"def", 5);
        assert!(slice_cache_builder.flush().is_err());
    }

    #[test]
    fn test_slice_entry_serialization() -> anyhow::Result<()> {
        let slice_entry = super::SliceCacheIndexEntry {
            start: 1,
            stop: 5,
            addr: 4,
        };
        let bytes = postcard::to_allocvec(&slice_entry)?;
        assert_eq!(&bytes[..], &[1, 5, 4]);
        Ok(())
    }

    #[test]
    fn test_slice_directory_cache() {
        let one_path = Path::new("one.txt");
        let two_path = Path::new("two.txt");
        let three_path = Path::new("three.txt");
        let four_path = Path::new("four.txt");

        let mut directory_cache_builder = StaticDirectoryCacheBuilder::default();
        directory_cache_builder
            .add_file(one_path, 100)
            .add_bytes(b" happy t", 5);
        directory_cache_builder
            .add_file(two_path, 200)
            .add_bytes(b"my name", 0);
        directory_cache_builder.add_file(three_path, 300);

        let mut buffer = Vec::new();
        directory_cache_builder.write(&mut buffer).unwrap();
        let directory_cache = StaticDirectoryCache::open(OwnedBytes::new(buffer)).unwrap();

        assert_eq!(directory_cache.get_file_length(one_path), Some(100));
        assert_eq!(directory_cache.get_file_length(two_path), Some(200));
        assert_eq!(directory_cache.get_file_length(three_path), Some(300));
        assert_eq!(directory_cache.get_file_length(four_path), None);

        let file_lengths = directory_cache.get_file_lengths();
        assert_eq!(file_lengths[0], (one_path.to_owned(), 100));
        assert_eq!(file_lengths[1], (three_path.to_owned(), 300));
        assert_eq!(file_lengths[2], (two_path.to_owned(), 200));

        assert_eq!(
            directory_cache
                .get_slice(one_path)
                .try_read_bytes(6..11)
                .unwrap()
                .as_ref(),
            b"happy"
        );
        assert_eq!(
            directory_cache
                .get_slice(two_path)
                .try_read_bytes(3..7)
                .unwrap()
                .as_ref(),
            b"name"
        );
    }
}


================================================
FILE: quickwit/quickwit-directories/src/lib.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

//! This crate contains all of the building pieces that make quickwit's IO possible.
//!
//! - The `StorageDirectory` just wraps a `Storage` trait to make it compatible with tantivy's
//!   Directory API.
//! - The `BundleDirectory` bundles multiple files into a single file.
//! - The `HotDirectory` wraps another directory with a static cache.
//! - The `CachingDirectory` wraps a Directory with a dynamic cache.
//! - The `DebugDirectory` acts as a proxy to another directory to instrument it and record all of
//!   its IO.
#![warn(missing_docs)]
#![deny(clippy::disallowed_methods)]

mod bundle_directory;
mod caching_directory;
mod debug_proxy_directory;
mod hot_directory;
mod storage_directory;
mod union_directory;

pub use self::bundle_directory::{BundleDirectory, get_hotcache_from_split, read_split_footer};
pub use self::caching_directory::CachingDirectory;
pub use self::debug_proxy_directory::{DebugProxyDirectory, ReadOperation};
pub use self::hot_directory::{HotDirectory, write_hotcache};
pub use self::storage_directory::StorageDirectory;
pub use self::union_directory::UnionDirectory;

macro_rules! read_only_directory {
    () => {
        fn atomic_write(&self, _path: &Path, _data: &[u8]) -> io::Result<()> {
            unimplemented!("read-only")
        }

        fn delete(&self, _path: &Path) -> Result<(), tantivy::directory::error::DeleteError> {
            unimplemented!("read-only")
        }

        fn open_write(
            &self,
            _path: &Path,
        ) -> Result<tantivy::directory::WritePtr, tantivy::directory::error::OpenWriteError> {
            unimplemented!("read-only")
        }

        fn sync_directory(&self) -> io::Result<()> {
            unimplemented!("read-only")
        }

        fn watch(
            &self,
            _watch_callback: tantivy::directory::WatchCallback,
        ) -> tantivy::Result<tantivy::directory::WatchHandle> {
            Ok(tantivy::directory::WatchHandle::empty())
        }

        fn acquire_lock(
            &self,
            _lock: &tantivy::directory::Lock,
        ) -> Result<tantivy::directory::DirectoryLock, tantivy::directory::error::LockError> {
            Ok(tantivy::directory::DirectoryLock::from(Box::new(|| {})))
        }
    };
}
pub(crate) use read_only_directory;


================================================
FILE: quickwit/quickwit-directories/src/storage_directory.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::fmt::Debug;
use std::ops::Range;
use std::path::{Path, PathBuf};
use std::sync::Arc;
use std::{fmt, io};

use async_trait::async_trait;
use quickwit_common::uri::Uri;
use quickwit_storage::{OwnedBytes, Storage};
use tantivy::directory::FileHandle;
use tantivy::directory::error::OpenReadError;
use tantivy::{Directory, HasLen};
use tracing::{error, instrument};

struct StorageDirectoryFileHandle {
    storage_directory: StorageDirectory,
    path: PathBuf,
}

impl HasLen for StorageDirectoryFileHandle {
    fn len(&self) -> usize {
        unimplemented!()
    }
}

impl fmt::Debug for StorageDirectoryFileHandle {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        write!(
            f,
            "StorageDirectoryFileHandle({:?}, dir={:?})",
            &self.path, self.storage_directory
        )
    }
}

#[async_trait]
impl FileHandle for StorageDirectoryFileHandle {
    fn read_bytes(&self, _byte_range: Range<usize>) -> io::Result<OwnedBytes> {
        Err(unsupported_operation(&self.path))
    }

    #[instrument(level = "debug", fields(path = %self.path.to_string_lossy(), byte_range_size = byte_range.end - byte_range.start), skip(self))]
    async fn read_bytes_async(&self, byte_range: Range<usize>) -> io::Result<OwnedBytes> {
        if byte_range.is_empty() {
            return Ok(OwnedBytes::empty());
        }
        let object_bytes = self
            .storage_directory
            .get_slice(&self.path, byte_range)
            .await?;
        Ok(object_bytes)
    }
}

/// Directory backed a quickwit `Storage` abstraction.
///
/// It should not be used in a context outside quickwit, as it contains
/// several pitfalls:
/// Fetching data synchronously panics.
/// Writing data panics.
///
/// This directory is fetch slices of data to a possibly distant storage
/// everytime `read_bytes` is called.
#[derive(Clone)]
pub struct StorageDirectory {
    storage: Arc<dyn Storage>,
}

impl Debug for StorageDirectory {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        write!(f, "StorageDirectory({:?})", self.uri())
    }
}

impl StorageDirectory {
    /// Creates a new StorageDirectory, backed by the given `storage`.
    pub fn new(storage: Arc<dyn Storage>) -> StorageDirectory {
        StorageDirectory { storage }
    }

    /// Fetches a slice of byte from a file asynchronously.
    pub async fn get_slice(&self, path: &Path, range: Range<usize>) -> io::Result<OwnedBytes> {
        let payload: OwnedBytes = self.storage.get_slice(path, range).await?;
        Ok(payload)
    }

    /// Fetches an entire file asynchronously.
    pub async fn get_all(&self, path: &Path) -> io::Result<OwnedBytes> {
        let payload: OwnedBytes = self.storage.get_all(path).await?;
        Ok(payload)
    }

    /// Returns the uri associated to the underlying storage.
    pub fn uri(&self) -> &Uri {
        self.storage.uri()
    }
}

fn unsupported_operation(path: &Path) -> io::Error {
    let error = "unsupported operation: `StorageDirectory` only supports async reads";
    error!(error, ?path);
    io::Error::other(format!("{error}: {}", path.display()))
}

impl Directory for StorageDirectory {
    fn get_file_handle(&self, path: &Path) -> Result<Arc<dyn FileHandle>, OpenReadError> {
        Ok(Arc::new(StorageDirectoryFileHandle {
            storage_directory: self.clone(),
            path: path.to_path_buf(),
        }))
    }

    fn atomic_read(&self, path: &Path) -> Result<Vec<u8>, OpenReadError> {
        Err(OpenReadError::wrap_io_error(
            unsupported_operation(path),
            path.to_path_buf(),
        ))
    }

    fn exists(&self, path: &std::path::Path) -> Result<bool, OpenReadError> {
        Err(OpenReadError::wrap_io_error(
            unsupported_operation(path),
            path.to_path_buf(),
        ))
    }

    crate::read_only_directory!();
}


================================================
FILE: quickwit/quickwit-directories/src/union_directory.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::io;
use std::path::{Path, PathBuf};
use std::sync::Arc;

use tantivy::Directory;
use tantivy::directory::error::{DeleteError, OpenReadError, OpenWriteError};
use tantivy::directory::{FileHandle, WatchHandle};

/// A union directory takes a bunch of directories and stacks them, similarly to UnionFS.
/// The resulting directory is a virtual view of the union of the different directories.
///
/// If a path exists in all directories, the first of the list containing the path
/// will shadow the other directories.
///
/// The first directory of the list will receive all write operations.
/// Deletes on the other hand will be applied on all directories containing the file.
#[derive(Clone, Debug)]
pub struct UnionDirectory {
    directories: Arc<Vec<Box<dyn Directory>>>,
}

impl UnionDirectory {
    /// Creates a new union directory.
    pub fn union_of(directories: Vec<Box<dyn Directory>>) -> UnionDirectory {
        UnionDirectory {
            directories: Arc::new(directories),
        }
    }

    /// Helper function to find the first directory containing the given path.
    fn find_directory_for_path(&self, path: &Path) -> Result<&dyn Directory, OpenReadError> {
        for directory in self.directories.iter() {
            if directory.exists(path)? {
                return Ok(directory.as_ref());
            }
        }
        Err(OpenReadError::FileDoesNotExist(path.to_path_buf()))
    }
}

fn convert_open_to_delete_error(open_err: OpenReadError) -> DeleteError {
    match open_err {
        OpenReadError::FileDoesNotExist(path) => DeleteError::FileDoesNotExist(path),
        OpenReadError::IoError { io_error, filepath } => {
            DeleteError::IoError { io_error, filepath }
        }
        err @ OpenReadError::IncompatibleIndex(_) => DeleteError::IoError {
            io_error: Arc::new(io::Error::new(io::ErrorKind::Unsupported, err)),
            filepath: PathBuf::from("/"),
        },
    }
}

impl Directory for UnionDirectory {
    fn get_file_handle(&self, path: &Path) -> Result<Arc<dyn FileHandle>, OpenReadError> {
        let directory = self.find_directory_for_path(path)?;
        directory.get_file_handle(path)
    }

    fn exists(&self, path: &Path) -> Result<bool, OpenReadError> {
        match self.find_directory_for_path(path) {
            Ok(_) => Ok(true),
            Err(OpenReadError::FileDoesNotExist(_)) => Ok(false),
            Err(err) => Err(err),
        }
    }

    fn atomic_read(&self, path: &Path) -> Result<Vec<u8>, OpenReadError> {
        let directory = self.find_directory_for_path(path)?;
        directory.atomic_read(path)
    }

    fn open_write(&self, path: &Path) -> Result<tantivy::directory::WritePtr, OpenWriteError> {
        self.directories[0].open_write(path)
    }

    fn delete(&self, path: &Path) -> Result<(), DeleteError> {
        let mut found_file = false;
        for directory in self.directories.iter() {
            // We first check exist, in order to support read-only directories.
            match directory.exists(path) {
                Ok(true) => {
                    directory.delete(path)?;
                    found_file = true;
                }
                Ok(false) => {}
                Err(exist_err) => {
                    return Err(convert_open_to_delete_error(exist_err));
                }
            }
        }
        if !found_file {
            return Err(DeleteError::FileDoesNotExist(path.to_path_buf()));
        }
        Ok(())
    }

    fn atomic_write(&self, path: &Path, data: &[u8]) -> io::Result<()> {
        self.directories[0].atomic_write(path, data)
    }

    fn watch(&self, callback: tantivy::directory::WatchCallback) -> tantivy::Result<WatchHandle> {
        self.directories[0].watch(callback)
    }

    fn sync_directory(&self) -> io::Result<()> {
        self.directories[0].sync_directory()
    }
}

#[cfg(test)]
mod tests {
    use std::path::Path;

    use tantivy::directory::{Directory, RamDirectory};

    use crate::UnionDirectory;

    #[test]
    fn test_union_directory_atomic_simple() -> anyhow::Result<()> {
        let dir1 = RamDirectory::create();
        let dir2 = RamDirectory::create();
        dir1.atomic_write(Path::new("path1"), &b"data1"[..])?;
        dir2.atomic_write(Path::new("path2"), &b"data2"[..])?;
        let union_directory = UnionDirectory::union_of(vec![Box::new(dir1), Box::new(dir2)]);
        {
            let payload_1 = union_directory.atomic_read(Path::new("path1"))?;
            assert_eq!(payload_1, b"data1");
        }
        {
            let payload_1 = union_directory
                .open_read(Path::new("path1"))?
                .read_bytes()?;
            assert_eq!(payload_1.as_slice(), b"data1");
        }
        {
            let payload_2 = union_directory.atomic_read(Path::new("path2"))?;
            assert_eq!(payload_2, b"data2");
        }
        {
            let payload_2 = union_directory
                .open_read(Path::new("path2"))?
                .read_bytes()?;
            assert_eq!(payload_2.as_slice(), b"data2");
        }
        Ok(())
    }

    #[test]
    fn test_union_directory_shadowing() -> anyhow::Result<()> {
        let dir1 = RamDirectory::create();
        let dir2 = RamDirectory::create();
        dir1.atomic_write(Path::new("shadowed_path"), &b"shadower"[..])?;
        dir2.atomic_write(Path::new("shadowed_path"), &b"shadowee"[..])?;
        let union_directory = UnionDirectory::union_of(vec![Box::new(dir1), Box::new(dir2)]);
        let payload = union_directory.atomic_read(Path::new("shadowed_path"))?;
        assert_eq!(payload, b"shadower");
        Ok(())
    }

    #[test]
    fn test_union_directory_exists() -> anyhow::Result<()> {
        let dir1 = RamDirectory::create();
        dir1.atomic_write(Path::new("path1"), &b"data1"[..])?;
        dir1.atomic_write(Path::new("shadowed_path"), &b"shadower"[..])?;

        let dir2 = RamDirectory::create();
        dir2.atomic_write(Path::new("path2"), &b"data2"[..])?;
        dir2.atomic_write(Path::new("shadowed_path"), &b"shadowee"[..])?;

        let union_directory = UnionDirectory::union_of(vec![Box::new(dir1), Box::new(dir2)]);
        assert!(union_directory.exists(Path::new("path1"))?);
        assert!(union_directory.exists(Path::new("path2"))?);
        assert!(union_directory.exists(Path::new("shadowed_path"))?);

        assert!(!union_directory.exists(Path::new("path3"))?);
        Ok(())
    }

    #[test]
    fn test_union_directory_delete() -> anyhow::Result<()> {
        let dir1 = RamDirectory::create();
        dir1.atomic_write(Path::new("path1"), &b"data1"[..])?;
        dir1.atomic_write(Path::new("shadowed_path"), &b"shadower"[..])?;

        let dir2 = RamDirectory::create();
        dir2.atomic_write(Path::new("path2"), &b"data2"[..])?;
        dir2.atomic_write(Path::new("shadowed_path"), &b"shadowee"[..])?;

        let union_directory = UnionDirectory::union_of(vec![Box::new(dir1), Box::new(dir2)]);

        union_directory.delete(Path::new("path1"))?;
        assert!(!union_directory.exists(Path::new("path1"))?);

        union_directory.delete(Path::new("path2"))?;
        assert!(!union_directory.exists(Path::new("path2"))?);

        union_directory.delete(Path::new("shadowed_path"))?;
        assert!(!union_directory.exists(Path::new("shadowed_path"))?);

        union_directory.delete(Path::new("path3")).unwrap_err();
        Ok(())
    }
    #[test]
    fn test_union_directory_write() -> anyhow::Result<()> {
        let dir1 = RamDirectory::create();
        dir1.atomic_write(Path::new("path1"), &b"data1"[..])?;

        let dir2 = RamDirectory::create();
        dir2.atomic_write(Path::new("path2"), &b"data2"[..])?;

        let union_directory = UnionDirectory::union_of(vec![Box::new(dir1), Box::new(dir2)]);
        union_directory.atomic_write(Path::new("path1"), &b"data1 data1"[..])?;
        union_directory.atomic_write(Path::new("path3"), &b"data3"[..])?;
        {
            let payload = union_directory.atomic_read(Path::new("path1"))?;
            assert_eq!(payload, b"data1 data1");
        }
        {
            let payload = union_directory.atomic_read(Path::new("path3"))?;
            assert_eq!(payload, b"data3");
        }
        Ok(())
    }
}


================================================
FILE: quickwit/quickwit-doc-mapper/Cargo.toml
================================================
[package]
name = "quickwit-doc-mapper"
description = "Index schema and document mapping"

version.workspace = true
edition.workspace = true
homepage.workspace = true
documentation.workspace = true
repository.workspace = true
authors.workspace = true
license.workspace = true

[dependencies]
anyhow = { workspace = true }
base64 = { workspace = true }
fnv = { workspace = true }
hex = { workspace = true }
indexmap = { workspace = true }
itertools = { workspace = true }
nom = { workspace = true }
once_cell = { workspace = true }
regex = { workspace = true }
serde = { workspace = true }
serde_json = { workspace = true }
serde_json_borrow = { workspace = true }
siphasher = { workspace = true }
tantivy = { workspace = true }
thiserror = { workspace = true }
tracing = { workspace = true }
utoipa = { workspace = true }

quickwit-common = { workspace = true }
quickwit-datetime = { workspace = true }
quickwit-macros = { workspace = true }
quickwit-proto = { workspace = true }
quickwit-query = { workspace = true }

[dev-dependencies]
binggan = { workspace = true }
matches = { workspace = true }
serde_yaml = { workspace = true }
time = { workspace = true }

quickwit-common = { workspace = true, features = ["testsuite"] }
quickwit-query = { workspace = true }

[features]
testsuite = []

[[bench]]
name = "doc_to_json_bench"
harness = false

[[bench]]
name = "routing_expression_bench"
harness = false


================================================
FILE: quickwit/quickwit-doc-mapper/benches/data/simple-parse-bench.json
================================================
{"id":1,"first_name":"Giulia","last_name":"Chaplain","email":"gchaplain0@ameblo.jp"}
{"id":2,"first_name":"Vivyan","last_name":"Shitliffe","email":"vshitliffe1@skype.com"}
{"id":3,"first_name":"Phip","last_name":"Ribey","email":"pribey2@sitemeter.com"}
{"id":4,"first_name":"Theressa","last_name":"Gamlin","email":"tgamlin3@alibaba.com"}
{"id":5,"first_name":"Monica","last_name":"Buney","email":"mbuney4@abc.net.au"}
{"id":6,"first_name":"Adore","last_name":"Brickhill","email":"abrickhill5@liveinternet.ru"}
{"id":7,"first_name":"Germana","last_name":"Culligan","email":"gculligan6@forbes.com"}
{"id":8,"first_name":"Jorgan","last_name":"Provost","email":"jprovost7@naver.com"}
{"id":9,"first_name":"Dianemarie","last_name":"Dorney","email":"ddorney8@alexa.com"}
{"id":10,"first_name":"Philipa","last_name":"Cocozza","email":"pcocozza9@eventbrite.com"}
{"id":11,"first_name":"Adena","last_name":"Frickey","email":"africkeya@php.net"}
{"id":12,"first_name":"Noelyn","last_name":"Jocelyn","email":"njocelynb@addtoany.com"}
{"id":13,"first_name":"Cammy","last_name":"Norwell","email":"cnorwellc@yale.edu"}
{"id":14,"first_name":"Eadie","last_name":"Pipworth","email":"epipworthd@barnesandnoble.com"}
{"id":15,"first_name":"Tandy","last_name":"Lenahan","email":"tlenahane@tripod.com"}
{"id":16,"first_name":"Honoria","last_name":"Van Weedenburg","email":"hvanweedenburgf@discovery.com"}
{"id":17,"first_name":"Felita","last_name":"O' Mullane","email":"fomullaneg@msu.edu"}
{"id":18,"first_name":"Austin","last_name":"Brownstein","email":"abrownsteinh@prlog.org"}
{"id":19,"first_name":"Leigh","last_name":"Berzins","email":"lberzinsi@walmart.com"}
{"id":20,"first_name":"Rachele","last_name":"Adamsson","email":"radamssonj@csmonitor.com"}
{"id":21,"first_name":"Barbabra","last_name":"Wilacot","email":"bwilacotk@kickstarter.com"}
{"id":22,"first_name":"Griffin","last_name":"Jone","email":"gjonel@google.pl"}
{"id":23,"first_name":"Michel","last_name":"Bothie","email":"mbothiem@shareasale.com"}
{"id":24,"first_name":"Callie","last_name":"Selley","email":"cselleyn@gmpg.org"}
{"id":25,"first_name":"Gleda","last_name":"O'Lahy","email":"golahyo@nih.gov"}
{"id":26,"first_name":"Alia","last_name":"Ladel","email":"aladelp@phpbb.com"}
{"id":27,"first_name":"Gusti","last_name":"McVitty","email":"gmcvittyq@redcross.org"}
{"id":28,"first_name":"Carolann","last_name":"Pachmann","email":"cpachmannr@goodreads.com"}
{"id":29,"first_name":"Agata","last_name":"Nyssen","email":"anyssens@utexas.edu"}
{"id":30,"first_name":"Jerrie","last_name":"Craddy","email":"jcraddyt@cbc.ca"}
{"id":31,"first_name":"Nariko","last_name":"Von Brook","email":"nvonbrooku@comcast.net"}
{"id":32,"first_name":"Zacharias","last_name":"Gobel","email":"zgobelv@wordpress.org"}
{"id":33,"first_name":"Sidnee","last_name":"Whettleton","email":"swhettletonw@lycos.com"}
{"id":34,"first_name":"Orlan","last_name":"Adamovitch","email":"oadamovitchx@hibu.com"}
{"id":35,"first_name":"Lotty","last_name":"Eddolls","email":"leddollsy@oracle.com"}
{"id":36,"first_name":"Sarge","last_name":"Tongue","email":"stonguez@shutterfly.com"}
{"id":37,"first_name":"Dalia","last_name":"Fisbey","email":"dfisbey10@ca.gov"}
{"id":38,"first_name":"Christin","last_name":"Yokel","email":"cyokel11@weebly.com"}
{"id":39,"first_name":"Maryjo","last_name":"Thridgould","email":"mthridgould12@apple.com"}
{"id":40,"first_name":"Maxie","last_name":"Nock","email":"mnock13@symantec.com"}
{"id":41,"first_name":"Shani","last_name":"Breeds","email":"sbreeds14@who.int"}
{"id":42,"first_name":"Loraine","last_name":"Sainthill","email":"lsainthill15@icq.com"}
{"id":43,"first_name":"Lorain","last_name":"Davidou","email":"ldavidou16@hexun.com"}
{"id":44,"first_name":"Ameline","last_name":"Dymoke","email":"adymoke17@usgs.gov"}
{"id":45,"first_name":"Tod","last_name":"Mendenhall","email":"tmendenhall18@skype.com"}
{"id":46,"first_name":"Cloris","last_name":"Pengilley","email":"cpengilley19@upenn.edu"}
{"id":47,"first_name":"Kathi","last_name":"Ortells","email":"kortells1a@state.tx.us"}
{"id":48,"first_name":"Sal","last_name":"Praill","email":"spraill1b@deviantart.com"}
{"id":49,"first_name":"Gideon","last_name":"McCauley","email":"gmccauley1c@wordpress.com"}
{"id":50,"first_name":"Rickie","last_name":"Zanitti","email":"rzanitti1d@jigsy.com"}
{"id":51,"first_name":"Leodora","last_name":"Chaloner","email":"lchaloner1e@163.com"}
{"id":52,"first_name":"Freida","last_name":"Strethill","email":"fstrethill1f@photobucket.com"}
{"id":53,"first_name":"Noach","last_name":"Coot","email":"ncoot1g@omniture.com"}
{"id":54,"first_name":"Shawn","last_name":"Booij","email":"sbooij1h@eepurl.com"}
{"id":55,"first_name":"Currey","last_name":"Boyford","email":"cboyford1i@netvibes.com"}
{"id":56,"first_name":"Kaitlin","last_name":"Ripon","email":"kripon1j@prnewswire.com"}
{"id":57,"first_name":"Quintina","last_name":"Hallows","email":"qhallows1k@wikimedia.org"}
{"id":58,"first_name":"Gallagher","last_name":"Degoey","email":"gdegoey1l@ox.ac.uk"}
{"id":59,"first_name":"Bride","last_name":"Lodin","email":"blodin1m@storify.com"}
{"id":60,"first_name":"Wilhelmine","last_name":"Longworth","email":"wlongworth1n@drupal.org"}
{"id":61,"first_name":"Giacinta","last_name":"Gulliman","email":"ggulliman1o@ow.ly"}
{"id":62,"first_name":"Whitney","last_name":"Swallwell","email":"wswallwell1p@businesswire.com"}
{"id":63,"first_name":"Boris","last_name":"Larraway","email":"blarraway1q@disqus.com"}
{"id":64,"first_name":"Guenevere","last_name":"Pierse","email":"gpierse1r@sourceforge.net"}
{"id":65,"first_name":"Leela","last_name":"O'Carran","email":"locarran1s@telegraph.co.uk"}
{"id":66,"first_name":"Anna-diana","last_name":"Marple","email":"amarple1t@unesco.org"}
{"id":67,"first_name":"Irita","last_name":"Hayto","email":"ihayto1u@samsung.com"}
{"id":68,"first_name":"Rance","last_name":"Urwen","email":"rurwen1v@t.co"}
{"id":69,"first_name":"Mollie","last_name":"Frowing","email":"mfrowing1w@comcast.net"}
{"id":70,"first_name":"Ellsworth","last_name":"Sandell","email":"esandell1x@google.com"}
{"id":71,"first_name":"Jude","last_name":"Rooksby","email":"jrooksby1y@issuu.com"}
{"id":72,"first_name":"Zahara","last_name":"Edworthie","email":"zedworthie1z@mysql.com"}
{"id":73,"first_name":"Prentiss","last_name":"Meddings","email":"pmeddings20@deviantart.com"}
{"id":74,"first_name":"Chrissie","last_name":"Lechmere","email":"clechmere21@abc.net.au"}
{"id":75,"first_name":"Rosie","last_name":"Danels","email":"rdanels22@flavors.me"}
{"id":76,"first_name":"Cchaddie","last_name":"Hatfield","email":"chatfield23@ehow.com"}
{"id":77,"first_name":"Deana","last_name":"Goter","email":"dgoter24@yellowpages.com"}
{"id":78,"first_name":"Agatha","last_name":"Witchard","email":"awitchard25@google.cn"}
{"id":79,"first_name":"Rhiamon","last_name":"Bleckly","email":"rbleckly26@nymag.com"}
{"id":80,"first_name":"Kellie","last_name":"Karpushkin","email":"kkarpushkin27@seattletimes.com"}
{"id":81,"first_name":"Konstanze","last_name":"Ramsbottom","email":"kramsbottom28@gov.uk"}
{"id":82,"first_name":"Doy","last_name":"Servant","email":"dservant29@amazon.de"}
{"id":83,"first_name":"Marj","last_name":"Kenford","email":"mkenford2a@studiopress.com"}
{"id":84,"first_name":"Amalia","last_name":"Hubbock","email":"ahubbock2b@upenn.edu"}
{"id":85,"first_name":"Jeannie","last_name":"Vannah","email":"jvannah2c@sourceforge.net"}
{"id":86,"first_name":"Janina","last_name":"Wigelsworth","email":"jwigelsworth2d@instagram.com"}
{"id":87,"first_name":"Ermina","last_name":"Patshull","email":"epatshull2e@arstechnica.com"}
{"id":88,"first_name":"Abbi","last_name":"Joseland","email":"ajoseland2f@discuz.net"}
{"id":89,"first_name":"Lavinie","last_name":"Cosson","email":"lcosson2g@ucoz.com"}
{"id":90,"first_name":"Noble","last_name":"Wyborn","email":"nwyborn2h@sun.com"}
{"id":91,"first_name":"Lulita","last_name":"Tunnicliff","email":"ltunnicliff2i@dagondesign.com"}
{"id":92,"first_name":"Debera","last_name":"Juris","email":"djuris2j@samsung.com"}
{"id":93,"first_name":"Dania","last_name":"Heersema","email":"dheersema2k@ox.ac.uk"}
{"id":94,"first_name":"Jacki","last_name":"Leveridge","email":"jleveridge2l@dropbox.com"}
{"id":95,"first_name":"Zara","last_name":"Sainsbury-Brown","email":"zsainsburybrown2m@thetimes.co.uk"}
{"id":96,"first_name":"Rhianna","last_name":"Pittson","email":"rpittson2n@ameblo.jp"}
{"id":97,"first_name":"Bevon","last_name":"Rugge","email":"brugge2o@163.com"}
{"id":98,"first_name":"Balduin","last_name":"Crosen","email":"bcrosen2p@nationalgeographic.com"}
{"id":99,"first_name":"Jens","last_name":"Muspratt","email":"jmuspratt2q@wordpress.org"}
{"id":100,"first_name":"Butch","last_name":"Rijkeseis","email":"brijkeseis2r@wordpress.com"}
{"id":101,"first_name":"Garold","last_name":"Tincey","email":"gtincey2s@unesco.org"}
{"id":102,"first_name":"Krishna","last_name":"Starkie","email":"kstarkie2t@gizmodo.com"}
{"id":103,"first_name":"Thomasine","last_name":"Tickner","email":"ttickner2u@slashdot.org"}
{"id":104,"first_name":"Tuesday","last_name":"Osmon","email":"tosmon2v@vkontakte.ru"}
{"id":105,"first_name":"Elberta","last_name":"Ellsbury","email":"eellsbury2w@cmu.edu"}
{"id":106,"first_name":"Rudyard","last_name":"Barrie","email":"rbarrie2x@wisc.edu"}
{"id":107,"first_name":"Cash","last_name":"Cloutt","email":"ccloutt2y@twitter.com"}
{"id":108,"first_name":"Jammal","last_name":"Bateman","email":"jbateman2z@va.gov"}
{"id":109,"first_name":"Binnie","last_name":"Siddall","email":"bsiddall30@narod.ru"}
{"id":110,"first_name":"Cirillo","last_name":"Stockbridge","email":"cstockbridge31@reddit.com"}
{"id":111,"first_name":"Cherie","last_name":"Sommerlie","email":"csommerlie32@scientificamerican.com"}
{"id":112,"first_name":"Jaquenette","last_name":"Autrie","email":"jautrie33@umich.edu"}
{"id":113,"first_name":"Ellswerth","last_name":"Bethell","email":"ebethell34@adobe.com"}
{"id":114,"first_name":"Earvin","last_name":"Millmore","email":"emillmore35@kickstarter.com"}
{"id":115,"first_name":"Hall","last_name":"Ruddle","email":"hruddle36@tripod.com"}
{"id":116,"first_name":"Eveleen","last_name":"O'Kennavain","email":"eokennavain37@squarespace.com"}
{"id":117,"first_name":"Dillie","last_name":"Petrescu","email":"dpetrescu38@ibm.com"}
{"id":118,"first_name":"Celestia","last_name":"Burwood","email":"cburwood39@oaic.gov.au"}
{"id":119,"first_name":"Lynna","last_name":"Barnsdall","email":"lbarnsdall3a@marketwatch.com"}
{"id":120,"first_name":"Jandy","last_name":"Noods","email":"jnoods3b@behance.net"}
{"id":121,"first_name":"Guillemette","last_name":"Chinn","email":"gchinn3c@comcast.net"}
{"id":122,"first_name":"Abagael","last_name":"Keenleyside","email":"akeenleyside3d@usatoday.com"}
{"id":123,"first_name":"Arlan","last_name":"Kubczak","email":"akubczak3e@apache.org"}
{"id":124,"first_name":"Tybi","last_name":"Flobert","email":"tflobert3f@cbsnews.com"}
{"id":125,"first_name":"Hodge","last_name":"Champley","email":"hchampley3g@etsy.com"}
{"id":126,"first_name":"Betta","last_name":"Navarijo","email":"bnavarijo3h@xrea.com"}
{"id":127,"first_name":"Stacee","last_name":"Brunetti","email":"sbrunetti3i@artisteer.com"}
{"id":128,"first_name":"Hurlee","last_name":"Bowstead","email":"hbowstead3j@mit.edu"}
{"id":129,"first_name":"Linet","last_name":"Binnall","email":"lbinnall3k@blogger.com"}
{"id":130,"first_name":"Daile","last_name":"Borrett","email":"dborrett3l@npr.org"}
{"id":131,"first_name":"Kay","last_name":"Coneybeare","email":"kconeybeare3m@amazon.co.uk"}
{"id":132,"first_name":"Menard","last_name":"Chatan","email":"mchatan3n@nih.gov"}
{"id":133,"first_name":"Anthiathia","last_name":"Innman","email":"ainnman3o@wiley.com"}
{"id":134,"first_name":"Lenka","last_name":"Polland","email":"lpolland3p@xing.com"}
{"id":135,"first_name":"Allina","last_name":"Custed","email":"acusted3q@usa.gov"}
{"id":136,"first_name":"Janessa","last_name":"Gerckens","email":"jgerckens3r@nyu.edu"}
{"id":137,"first_name":"Magdalen","last_name":"Doerr","email":"mdoerr3s@lycos.com"}
{"id":138,"first_name":"Pail","last_name":"Sellstrom","email":"psellstrom3t@sohu.com"}
{"id":139,"first_name":"Lissy","last_name":"Pindell","email":"lpindell3u@dailymail.co.uk"}
{"id":140,"first_name":"Beatriz","last_name":"Elintune","email":"belintune3v@cdc.gov"}
{"id":141,"first_name":"Arlana","last_name":"Carik","email":"acarik3w@bigcartel.com"}
{"id":142,"first_name":"Conny","last_name":"Anster","email":"canster3x@domainmarket.com"}
{"id":143,"first_name":"Alvera","last_name":"Carn","email":"acarn3y@biblegateway.com"}
{"id":144,"first_name":"Adriaens","last_name":"Farfoot","email":"afarfoot3z@dion.ne.jp"}
{"id":145,"first_name":"Rosabelle","last_name":"Mardoll","email":"rmardoll40@i2i.jp"}
{"id":146,"first_name":"Riki","last_name":"Orrett","email":"rorrett41@fda.gov"}
{"id":147,"first_name":"Zorah","last_name":"Jaime","email":"zjaime42@xing.com"}
{"id":148,"first_name":"Godwin","last_name":"Birkinshaw","email":"gbirkinshaw43@mail.ru"}
{"id":149,"first_name":"Karoly","last_name":"Cowl","email":"kcowl44@rambler.ru"}
{"id":150,"first_name":"Myrtle","last_name":"Gostling","email":"mgostling45@psu.edu"}
{"id":151,"first_name":"Matthew","last_name":"Shird","email":"mshird46@linkedin.com"}
{"id":152,"first_name":"Tanner","last_name":"Kubelka","email":"tkubelka47@state.tx.us"}
{"id":153,"first_name":"Cosimo","last_name":"Broune","email":"cbroune48@sogou.com"}
{"id":154,"first_name":"Rafa","last_name":"Vear","email":"rvear49@theglobeandmail.com"}
{"id":155,"first_name":"Emmalynn","last_name":"Elcomb","email":"eelcomb4a@cam.ac.uk"}
{"id":156,"first_name":"Karolina","last_name":"Mayler","email":"kmayler4b@furl.net"}
{"id":157,"first_name":"Serene","last_name":"Piers","email":"spiers4c@etsy.com"}
{"id":158,"first_name":"Garnet","last_name":"Reynault","email":"greynault4d@trellian.com"}
{"id":159,"first_name":"Decca","last_name":"Kauscher","email":"dkauscher4e@eepurl.com"}
{"id":160,"first_name":"Olga","last_name":"Willas","email":"owillas4f@npr.org"}
{"id":161,"first_name":"Neil","last_name":"Chatel","email":"nchatel4g@nifty.com"}
{"id":162,"first_name":"Jim","last_name":"Terrelly","email":"jterrelly4h@360.cn"}
{"id":163,"first_name":"Ximenez","last_name":"Saffen","email":"xsaffen4i@deliciousdays.com"}
{"id":164,"first_name":"Kandace","last_name":"Skitt","email":"kskitt4j@webs.com"}
{"id":165,"first_name":"Dinny","last_name":"Borman","email":"dborman4k@issuu.com"}
{"id":166,"first_name":"Wolfy","last_name":"McVanamy","email":"wmcvanamy4l@msn.com"}
{"id":167,"first_name":"Tito","last_name":"Orlton","email":"torlton4m@discuz.net"}
{"id":168,"first_name":"Leia","last_name":"Evelyn","email":"levelyn4n@dagondesign.com"}
{"id":169,"first_name":"Kamila","last_name":"Jeste","email":"kjeste4o@imgur.com"}
{"id":170,"first_name":"Annissa","last_name":"Aitchinson","email":"aaitchinson4p@msn.com"}
{"id":171,"first_name":"Zulema","last_name":"Pimme","email":"zpimme4q@lulu.com"}
{"id":172,"first_name":"Nichole","last_name":"Nealand","email":"nnealand4r@arstechnica.com"}
{"id":173,"first_name":"Barth","last_name":"Carver","email":"bcarver4s@bloomberg.com"}
{"id":174,"first_name":"Theodosia","last_name":"Helkin","email":"thelkin4t@shinystat.com"}
{"id":175,"first_name":"Sander","last_name":"Monkton","email":"smonkton4u@globo.com"}
{"id":176,"first_name":"Claus","last_name":"Mattsson","email":"cmattsson4v@joomla.org"}
{"id":177,"first_name":"Julianne","last_name":"Bettenay","email":"jbettenay4w@com.com"}
{"id":178,"first_name":"Conant","last_name":"Da Costa","email":"cdacosta4x@cam.ac.uk"}
{"id":179,"first_name":"Patten","last_name":"Goldby","email":"pgoldby4y@nasa.gov"}
{"id":180,"first_name":"Courtenay","last_name":"Taft","email":"ctaft4z@indiegogo.com"}
{"id":181,"first_name":"Kirsten","last_name":"Gore","email":"kgore50@angelfire.com"}
{"id":182,"first_name":"Quincy","last_name":"Cosslett","email":"qcosslett51@netscape.com"}
{"id":183,"first_name":"Sherri","last_name":"Marchenko","email":"smarchenko52@simplemachines.org"}
{"id":184,"first_name":"Marianna","last_name":"Van Schafflaer","email":"mvanschafflaer53@ftc.gov"}
{"id":185,"first_name":"Idalina","last_name":"Mullinger","email":"imullinger54@dot.gov"}
{"id":186,"first_name":"Pauline","last_name":"Volk","email":"pvolk55@addtoany.com"}
{"id":187,"first_name":"Joel","last_name":"Kaasman","email":"jkaasman56@youtube.com"}
{"id":188,"first_name":"Tremaine","last_name":"Follin","email":"tfollin57@answers.com"}
{"id":189,"first_name":"Dyane","last_name":"Shasnan","email":"dshasnan58@whitehouse.gov"}
{"id":190,"first_name":"Deny","last_name":"Packe","email":"dpacke59@wordpress.com"}
{"id":191,"first_name":"Danella","last_name":"Clifford","email":"dclifford5a@toplist.cz"}
{"id":192,"first_name":"Melesa","last_name":"Ballach","email":"mballach5b@netscape.com"}
{"id":193,"first_name":"Annabel","last_name":"Bragginton","email":"abragginton5c@de.vu"}
{"id":194,"first_name":"Reagen","last_name":"Boullin","email":"rboullin5d@e-recht24.de"}
{"id":195,"first_name":"Cassi","last_name":"Chieco","email":"cchieco5e@go.com"}
{"id":196,"first_name":"Rollins","last_name":"Hurdiss","email":"rhurdiss5f@indiatimes.com"}
{"id":197,"first_name":"Ole","last_name":"Martusov","email":"omartusov5g@washingtonpost.com"}
{"id":198,"first_name":"Hillyer","last_name":"Godson","email":"hgodson5h@51.la"}
{"id":199,"first_name":"Wat","last_name":"Trusdale","email":"wtrusdale5i@alexa.com"}
{"id":200,"first_name":"Dotti","last_name":"MacClancey","email":"dmacclancey5j@51.la"}
{"id":201,"first_name":"Cassius","last_name":"Vaughan-Hughes","email":"cvaughanhughes5k@pcworld.com"}
{"id":202,"first_name":"Aleksandr","last_name":"Rossey","email":"arossey5l@imageshack.us"}
{"id":203,"first_name":"Wakefield","last_name":"Goodhay","email":"wgoodhay5m@gov.uk"}
{"id":204,"first_name":"Patrizio","last_name":"Loutheane","email":"ploutheane5n@goo.gl"}
{"id":205,"first_name":"Dayna","last_name":"Blaylock","email":"dblaylock5o@fda.gov"}
{"id":206,"first_name":"Ad","last_name":"Henken","email":"ahenken5p@wikimedia.org"}
{"id":207,"first_name":"Selene","last_name":"Saunderson","email":"ssaunderson5q@over-blog.com"}
{"id":208,"first_name":"Almeda","last_name":"Hlavecek","email":"ahlavecek5r@ted.com"}
{"id":209,"first_name":"Jessamine","last_name":"Coaster","email":"jcoaster5s@ning.com"}
{"id":210,"first_name":"Valry","last_name":"McCollum","email":"vmccollum5t@upenn.edu"}
{"id":211,"first_name":"Cami","last_name":"Treherne","email":"ctreherne5u@istockphoto.com"}
{"id":212,"first_name":"Bartholemy","last_name":"Tharme","email":"btharme5v@businessinsider.com"}
{"id":213,"first_name":"Sallyann","last_name":"Selcraig","email":"sselcraig5w@pcworld.com"}
{"id":214,"first_name":"Felipa","last_name":"Faichnie","email":"ffaichnie5x@jimdo.com"}
{"id":215,"first_name":"Charis","last_name":"Lakenton","email":"clakenton5y@goo.gl"}
{"id":216,"first_name":"Hildagard","last_name":"Klesse","email":"hklesse5z@washington.edu"}
{"id":217,"first_name":"Zoe","last_name":"Doul","email":"zdoul60@imdb.com"}
{"id":218,"first_name":"Mab","last_name":"Thorrold","email":"mthorrold61@freewebs.com"}
{"id":219,"first_name":"Shay","last_name":"Pringer","email":"springer62@arizona.edu"}
{"id":220,"first_name":"Sandi","last_name":"Petford","email":"spetford63@symantec.com"}
{"id":221,"first_name":"Yuma","last_name":"Pilmer","email":"ypilmer64@sciencedaily.com"}
{"id":222,"first_name":"Jaymee","last_name":"Bennen","email":"jbennen65@a8.net"}
{"id":223,"first_name":"Chris","last_name":"Carwithim","email":"ccarwithim66@tripadvisor.com"}
{"id":224,"first_name":"Denney","last_name":"Shillum","email":"dshillum67@hugedomains.com"}
{"id":225,"first_name":"Odille","last_name":"Marshall","email":"omarshall68@aboutads.info"}
{"id":226,"first_name":"Forrest","last_name":"MacMoyer","email":"fmacmoyer69@bbc.co.uk"}
{"id":227,"first_name":"Matteo","last_name":"Millhill","email":"mmillhill6a@ibm.com"}
{"id":228,"first_name":"Loni","last_name":"Kedie","email":"lkedie6b@reverbnation.com"}
{"id":229,"first_name":"Roland","last_name":"Lipyeat","email":"rlipyeat6c@aol.com"}
{"id":230,"first_name":"Merrick","last_name":"Catterell","email":"mcatterell6d@barnesandnoble.com"}
{"id":231,"first_name":"Lucias","last_name":"Kadar","email":"lkadar6e@slideshare.net"}
{"id":232,"first_name":"Koral","last_name":"Sendall","email":"ksendall6f@ted.com"}
{"id":233,"first_name":"Pollyanna","last_name":"Asbrey","email":"pasbrey6g@salon.com"}
{"id":234,"first_name":"Gorden","last_name":"Guinn","email":"gguinn6h@usa.gov"}
{"id":235,"first_name":"Cal","last_name":"Nower","email":"cnower6i@cloudflare.com"}
{"id":236,"first_name":"Waldon","last_name":"McGruar","email":"wmcgruar6j@sbwire.com"}
{"id":237,"first_name":"Ginger","last_name":"Cheers","email":"gcheers6k@gnu.org"}
{"id":238,"first_name":"Jeremiah","last_name":"Ivanitsa","email":"jivanitsa6l@mlb.com"}
{"id":239,"first_name":"Lind","last_name":"Marcu","email":"lmarcu6m@twitpic.com"}
{"id":240,"first_name":"Sigismond","last_name":"Emmer","email":"semmer6n@hatena.ne.jp"}
{"id":241,"first_name":"Zedekiah","last_name":"Davidsen","email":"zdavidsen6o@google.ru"}
{"id":242,"first_name":"Alex","last_name":"Formie","email":"aformie6p@loc.gov"}
{"id":243,"first_name":"Reid","last_name":"Goodhall","email":"rgoodhall6q@loc.gov"}
{"id":244,"first_name":"Gray","last_name":"Forge","email":"gforge6r@virginia.edu"}
{"id":245,"first_name":"Dalston","last_name":"Batteson","email":"dbatteson6s@dailymail.co.uk"}
{"id":246,"first_name":"Base","last_name":"Devey","email":"bdevey6t@cocolog-nifty.com"}
{"id":247,"first_name":"Beret","last_name":"Bann","email":"bbann6u@pcworld.com"}
{"id":248,"first_name":"Lois","last_name":"Dudney","email":"ldudney6v@blog.com"}
{"id":249,"first_name":"Garth","last_name":"Renner","email":"grenner6w@wsj.com"}
{"id":250,"first_name":"Dorette","last_name":"Baglan","email":"dbaglan6x@cisco.com"}
{"id":251,"first_name":"Joe","last_name":"Painter","email":"jpainter6y@unblog.fr"}
{"id":252,"first_name":"Emilie","last_name":"Radborn","email":"eradborn6z@geocities.jp"}
{"id":253,"first_name":"Dehlia","last_name":"Betchley","email":"dbetchley70@slideshare.net"}
{"id":254,"first_name":"Ertha","last_name":"Makepeace","email":"emakepeace71@samsung.com"}
{"id":255,"first_name":"Brita","last_name":"Currie","email":"bcurrie72@jigsy.com"}
{"id":256,"first_name":"Blisse","last_name":"Collimore","email":"bcollimore73@hhs.gov"}
{"id":257,"first_name":"Stearn","last_name":"Tattersall","email":"stattersall74@youtu.be"}
{"id":258,"first_name":"Randi","last_name":"Lambertini","email":"rlambertini75@dot.gov"}
{"id":259,"first_name":"Beryle","last_name":"Aspray","email":"baspray76@biglobe.ne.jp"}
{"id":260,"first_name":"Pansy","last_name":"Ricketts","email":"pricketts77@google.co.uk"}
{"id":261,"first_name":"Jeniece","last_name":"Eveque","email":"jeveque78@ucoz.ru"}
{"id":262,"first_name":"Kelsey","last_name":"Desorts","email":"kdesorts79@blog.com"}
{"id":263,"first_name":"Cecilla","last_name":"Hunting","email":"chunting7a@rediff.com"}
{"id":264,"first_name":"Robbie","last_name":"Rudeyeard","email":"rrudeyeard7b@twitpic.com"}
{"id":265,"first_name":"Ronny","last_name":"Cloy","email":"rcloy7c@wufoo.com"}
{"id":266,"first_name":"Fallon","last_name":"McGarrie","email":"fmcgarrie7d@domainmarket.com"}
{"id":267,"first_name":"Andree","last_name":"Salazar","email":"asalazar7e@aol.com"}
{"id":268,"first_name":"Terri","last_name":"Pentlow","email":"tpentlow7f@narod.ru"}
{"id":269,"first_name":"Teodoro","last_name":"Guerrazzi","email":"tguerrazzi7g@trellian.com"}
{"id":270,"first_name":"Ashton","last_name":"Kirimaa","email":"akirimaa7h@cdc.gov"}
{"id":271,"first_name":"Nikolas","last_name":"Vidineev","email":"nvidineev7i@tuttocitta.it"}
{"id":272,"first_name":"Myrtia","last_name":"Karsh","email":"mkarsh7j@wired.com"}
{"id":273,"first_name":"Modesty","last_name":"Boissier","email":"mboissier7k@aol.com"}
{"id":274,"first_name":"Cyndia","last_name":"Leemans","email":"cleemans7l@cornell.edu"}
{"id":275,"first_name":"Shantee","last_name":"Maykin","email":"smaykin7m@wix.com"}
{"id":276,"first_name":"Emmerich","last_name":"Gergus","email":"egergus7n@paypal.com"}
{"id":277,"first_name":"Lindsey","last_name":"Chaulk","email":"lchaulk7o@sfgate.com"}
{"id":278,"first_name":"Romona","last_name":"Murie","email":"rmurie7p@sun.com"}
{"id":279,"first_name":"Bel","last_name":"Hitzschke","email":"bhitzschke7q@jugem.jp"}
{"id":280,"first_name":"Hilton","last_name":"Haythorn","email":"hhaythorn7r@sciencedaily.com"}
{"id":281,"first_name":"Lydie","last_name":"Heinrici","email":"lheinrici7s@cnbc.com"}
{"id":282,"first_name":"Gwynne","last_name":"Harriman","email":"gharriman7t@linkedin.com"}
{"id":283,"first_name":"Boy","last_name":"Abrahmson","email":"babrahmson7u@mit.edu"}
{"id":284,"first_name":"Rayner","last_name":"Murrill","email":"rmurrill7v@freewebs.com"}
{"id":285,"first_name":"Steward","last_name":"Lodovichi","email":"slodovichi7w@ucoz.com"}
{"id":286,"first_name":"Zelig","last_name":"Guillet","email":"zguillet7x@vistaprint.com"}
{"id":287,"first_name":"Merrily","last_name":"Millen","email":"mmillen7y@cam.ac.uk"}
{"id":288,"first_name":"Raff","last_name":"Goold","email":"rgoold7z@canalblog.com"}
{"id":289,"first_name":"Aland","last_name":"Richards","email":"arichards80@people.com.cn"}
{"id":290,"first_name":"Ambrose","last_name":"Fanning","email":"afanning81@telegraph.co.uk"}
{"id":291,"first_name":"Dolly","last_name":"McConnulty","email":"dmcconnulty82@pen.io"}
{"id":292,"first_name":"Eleen","last_name":"Muffen","email":"emuffen83@reddit.com"}
{"id":293,"first_name":"Rachele","last_name":"Cleminshaw","email":"rcleminshaw84@apache.org"}
{"id":294,"first_name":"Royall","last_name":"Grierson","email":"rgrierson85@chron.com"}
{"id":295,"first_name":"Goldie","last_name":"Bouskill","email":"gbouskill86@vkontakte.ru"}
{"id":296,"first_name":"Padraic","last_name":"Manolov","email":"pmanolov87@163.com"}
{"id":297,"first_name":"Olivie","last_name":"Corcut","email":"ocorcut88@nyu.edu"}
{"id":298,"first_name":"Cly","last_name":"Peete","email":"cpeete89@feedburner.com"}
{"id":299,"first_name":"Stanly","last_name":"Grieswood","email":"sgrieswood8a@google.it"}
{"id":300,"first_name":"Cullin","last_name":"Hammatt","email":"chammatt8b@hostgator.com"}
{"id":301,"first_name":"Talbert","last_name":"Lilliman","email":"tlilliman8c@wufoo.com"}
{"id":302,"first_name":"Britteny","last_name":"Kubica","email":"bkubica8d@jiathis.com"}
{"id":303,"first_name":"Leona","last_name":"Matthaus","email":"lmatthaus8e@chicagotribune.com"}
{"id":304,"first_name":"Minda","last_name":"Emmerson","email":"memmerson8f@cnn.com"}
{"id":305,"first_name":"Reinhard","last_name":"Dudderidge","email":"rdudderidge8g@twitter.com"}
{"id":306,"first_name":"Ode","last_name":"Isaac","email":"oisaac8h@mashable.com"}
{"id":307,"first_name":"Tannie","last_name":"Duffan","email":"tduffan8i@netlog.com"}
{"id":308,"first_name":"Riccardo","last_name":"Heaney","email":"rheaney8j@g.co"}
{"id":309,"first_name":"Leann","last_name":"Klimpt","email":"lklimpt8k@wsj.com"}
{"id":310,"first_name":"Jacquelyn","last_name":"Reddle","email":"jreddle8l@prlog.org"}
{"id":311,"first_name":"Pebrook","last_name":"Gladdor","email":"pgladdor8m@hp.com"}
{"id":312,"first_name":"Devy","last_name":"Keers","email":"dkeers8n@theglobeandmail.com"}
{"id":313,"first_name":"Em","last_name":"Bullock","email":"ebullock8o@theglobeandmail.com"}
{"id":314,"first_name":"Catharine","last_name":"Rabbitt","email":"crabbitt8p@usnews.com"}
{"id":315,"first_name":"Roderick","last_name":"Barette","email":"rbarette8q@icq.com"}
{"id":316,"first_name":"Joshia","last_name":"MacIver","email":"jmaciver8r@biblegateway.com"}
{"id":317,"first_name":"Jarrad","last_name":"Donnan","email":"jdonnan8s@is.gd"}
{"id":318,"first_name":"Sophey","last_name":"Corriea","email":"scorriea8t@liveinternet.ru"}
{"id":319,"first_name":"Aura","last_name":"Pancast","email":"apancast8u@google.com.hk"}
{"id":320,"first_name":"Benedikta","last_name":"Billin","email":"bbillin8v@cmu.edu"}
{"id":321,"first_name":"Hermine","last_name":"Bidgood","email":"hbidgood8w@businessweek.com"}
{"id":322,"first_name":"Woody","last_name":"Sellack","email":"wsellack8x@hibu.com"}
{"id":323,"first_name":"Wrennie","last_name":"Ivermee","email":"wivermee8y@tuttocitta.it"}
{"id":324,"first_name":"Miranda","last_name":"Pyle","email":"mpyle8z@bbb.org"}
{"id":325,"first_name":"Cathee","last_name":"Dowdeswell","email":"cdowdeswell90@unblog.fr"}
{"id":326,"first_name":"Georgine","last_name":"Beesley","email":"gbeesley91@amazon.com"}
{"id":327,"first_name":"Marmaduke","last_name":"Musprat","email":"mmusprat92@fda.gov"}
{"id":328,"first_name":"Jermayne","last_name":"Lindro","email":"jlindro93@spotify.com"}
{"id":329,"first_name":"Kris","last_name":"Tripe","email":"ktripe94@phoca.cz"}
{"id":330,"first_name":"Ofella","last_name":"Antushev","email":"oantushev95@desdev.cn"}
{"id":331,"first_name":"Tod","last_name":"Macia","email":"tmacia96@engadget.com"}
{"id":332,"first_name":"Jelene","last_name":"Cecere","email":"jcecere97@51.la"}
{"id":333,"first_name":"Britney","last_name":"Sanches","email":"bsanches98@princeton.edu"}
{"id":334,"first_name":"Quinn","last_name":"Pirolini","email":"qpirolini99@oracle.com"}
{"id":335,"first_name":"Costanza","last_name":"Wharby","email":"cwharby9a@shareasale.com"}
{"id":336,"first_name":"Steven","last_name":"Edel","email":"sedel9b@google.com.au"}
{"id":337,"first_name":"Quinton","last_name":"Simonnet","email":"qsimonnet9c@mail.ru"}
{"id":338,"first_name":"Conroy","last_name":"Sorey","email":"csorey9d@mapy.cz"}
{"id":339,"first_name":"Kacey","last_name":"Tweedy","email":"ktweedy9e@telegraph.co.uk"}
{"id":340,"first_name":"Aubrie","last_name":"Oatley","email":"aoatley9f@amazon.com"}
{"id":341,"first_name":"Gerhard","last_name":"Rizzolo","email":"grizzolo9g@ftc.gov"}
{"id":342,"first_name":"Keenan","last_name":"Godier","email":"kgodier9h@harvard.edu"}
{"id":343,"first_name":"Alard","last_name":"Tubridy","email":"atubridy9i@ask.com"}
{"id":344,"first_name":"Nadine","last_name":"Naden","email":"nnaden9j@ca.gov"}
{"id":345,"first_name":"Alessandro","last_name":"Timson","email":"atimson9k@gov.uk"}
{"id":346,"first_name":"Mirella","last_name":"Shurville","email":"mshurville9l@google.co.uk"}
{"id":347,"first_name":"Libbie","last_name":"Waterman","email":"lwaterman9m@abc.net.au"}
{"id":348,"first_name":"Cordy","last_name":"Selesnick","email":"cselesnick9n@freewebs.com"}
{"id":349,"first_name":"Gerrard","last_name":"Roney","email":"groney9o@xrea.com"}
{"id":350,"first_name":"Paulita","last_name":"Giacomi","email":"pgiacomi9p@utexas.edu"}
{"id":351,"first_name":"Martguerita","last_name":"Ceaser","email":"mceaser9q@toplist.cz"}
{"id":352,"first_name":"Alexei","last_name":"Kellitt","email":"akellitt9r@joomla.org"}
{"id":353,"first_name":"Domenico","last_name":"Byard","email":"dbyard9s@histats.com"}
{"id":354,"first_name":"Herby","last_name":"Piele","email":"hpiele9t@edublogs.org"}
{"id":355,"first_name":"Shaughn","last_name":"Ramsby","email":"sramsby9u@ning.com"}
{"id":356,"first_name":"Britni","last_name":"Maginot","email":"bmaginot9v@walmart.com"}
{"id":357,"first_name":"May","last_name":"Manshaw","email":"mmanshaw9w@slideshare.net"}
{"id":358,"first_name":"Onofredo","last_name":"Corcut","email":"ocorcut9x@vistaprint.com"}
{"id":359,"first_name":"Lincoln","last_name":"Mantrup","email":"lmantrup9y@yolasite.com"}
{"id":360,"first_name":"Ora","last_name":"Kearton","email":"okearton9z@bravesites.com"}
{"id":361,"first_name":"Gaylord","last_name":"Kulicke","email":"gkulickea0@pen.io"}
{"id":362,"first_name":"Thibaut","last_name":"Easbie","email":"teasbiea1@amazonaws.com"}
{"id":363,"first_name":"Doro","last_name":"Metts","email":"dmettsa2@tiny.cc"}
{"id":364,"first_name":"Lon","last_name":"Breslane","email":"lbreslanea3@sciencedaily.com"}
{"id":365,"first_name":"Coreen","last_name":"Coultass","email":"ccoultassa4@skyrock.com"}
{"id":366,"first_name":"Donall","last_name":"Cusack","email":"dcusacka5@cyberchimps.com"}
{"id":367,"first_name":"Derrek","last_name":"O'Sharry","email":"dosharrya6@cbslocal.com"}
{"id":368,"first_name":"Barth","last_name":"Thieme","email":"bthiemea7@odnoklassniki.ru"}
{"id":369,"first_name":"Wyatt","last_name":"Alderton","email":"waldertona8@whitehouse.gov"}
{"id":370,"first_name":"Correna","last_name":"Colmore","email":"ccolmorea9@icio.us"}
{"id":371,"first_name":"Kacy","last_name":"Weippert","email":"kweippertaa@devhub.com"}
{"id":372,"first_name":"Trista","last_name":"Androsik","email":"tandrosikab@boston.com"}
{"id":373,"first_name":"Joyan","last_name":"Abramski","email":"jabramskiac@gnu.org"}
{"id":374,"first_name":"Rafi","last_name":"Garfield","email":"rgarfieldad@yellowpages.com"}
{"id":375,"first_name":"Wilton","last_name":"Tankard","email":"wtankardae@networksolutions.com"}
{"id":376,"first_name":"Noak","last_name":"Crielly","email":"ncriellyaf@guardian.co.uk"}
{"id":377,"first_name":"Louisette","last_name":"Redrup","email":"lredrupag@phoca.cz"}
{"id":378,"first_name":"Anneliese","last_name":"Pegram","email":"apegramah@vinaora.com"}
{"id":379,"first_name":"Jenny","last_name":"Guirau","email":"jguirauai@sciencedirect.com"}
{"id":380,"first_name":"Phaedra","last_name":"Plaistowe","email":"pplaistoweaj@usatoday.com"}
{"id":381,"first_name":"Terri","last_name":"Mathew","email":"tmathewak@jigsy.com"}
{"id":382,"first_name":"Allegra","last_name":"Wenn","email":"awennal@squidoo.com"}
{"id":383,"first_name":"Davita","last_name":"Fergyson","email":"dfergysonam@wix.com"}
{"id":384,"first_name":"Genovera","last_name":"Billinge","email":"gbillingean@edublogs.org"}
{"id":385,"first_name":"Lyndsay","last_name":"Zuker","email":"lzukerao@npr.org"}
{"id":386,"first_name":"Bess","last_name":"Ryrie","email":"bryrieap@cnbc.com"}
{"id":387,"first_name":"Rena","last_name":"Orniz","email":"rornizaq@cargocollective.com"}
{"id":388,"first_name":"Baudoin","last_name":"Walklate","email":"bwalklatear@uiuc.edu"}
{"id":389,"first_name":"Cherri","last_name":"Pollicote","email":"cpollicoteas@state.tx.us"}
{"id":390,"first_name":"Yanaton","last_name":"Knappitt","email":"yknappittat@ucoz.com"}
{"id":391,"first_name":"Audi","last_name":"Izkovicz","email":"aizkoviczau@google.es"}
{"id":392,"first_name":"Lewes","last_name":"Chilcott","email":"lchilcottav@amazonaws.com"}
{"id":393,"first_name":"Mariquilla","last_name":"Pinck","email":"mpinckaw@example.com"}
{"id":394,"first_name":"Lodovico","last_name":"Tadman","email":"ltadmanax@vk.com"}
{"id":395,"first_name":"Yancey","last_name":"Beardsall","email":"ybeardsallay@printfriendly.com"}
{"id":396,"first_name":"Matilda","last_name":"Fedorski","email":"mfedorskiaz@biglobe.ne.jp"}
{"id":397,"first_name":"Kellen","last_name":"Cleveley","email":"kcleveleyb0@state.gov"}
{"id":398,"first_name":"Dave","last_name":"Aglione","email":"daglioneb1@barnesandnoble.com"}
{"id":399,"first_name":"Sanders","last_name":"Noades","email":"snoadesb2@wufoo.com"}
{"id":400,"first_name":"Ingar","last_name":"Asser","email":"iasserb3@youku.com"}
{"id":401,"first_name":"Sandie","last_name":"Gregore","email":"sgregoreb4@msu.edu"}
{"id":402,"first_name":"Georgiana","last_name":"Statefield","email":"gstatefieldb5@kickstarter.com"}
{"id":403,"first_name":"Jackquelin","last_name":"Frugier","email":"jfrugierb6@unicef.org"}
{"id":404,"first_name":"Hillary","last_name":"Dallyn","email":"hdallynb7@loc.gov"}
{"id":405,"first_name":"Townsend","last_name":"Syde","email":"tsydeb8@answers.com"}
{"id":406,"first_name":"Rina","last_name":"Scurrah","email":"rscurrahb9@wunderground.com"}
{"id":407,"first_name":"Frank","last_name":"Sheer","email":"fsheerba@howstuffworks.com"}
{"id":408,"first_name":"Marice","last_name":"Bertie","email":"mbertiebb@senate.gov"}
{"id":409,"first_name":"Cookie","last_name":"McMillan","email":"cmcmillanbc@webeden.co.uk"}
{"id":410,"first_name":"Emmy","last_name":"Lauthian","email":"elauthianbd@dedecms.com"}
{"id":411,"first_name":"Kory","last_name":"Francklin","email":"kfrancklinbe@furl.net"}
{"id":412,"first_name":"Gardiner","last_name":"Senyard","email":"gsenyardbf@wikispaces.com"}
{"id":413,"first_name":"Mercedes","last_name":"Kolczynski","email":"mkolczynskibg@posterous.com"}
{"id":414,"first_name":"Myriam","last_name":"Saben","email":"msabenbh@wix.com"}
{"id":415,"first_name":"Chevy","last_name":"Quinell","email":"cquinellbi@dyndns.org"}
{"id":416,"first_name":"Ed","last_name":"Heddon","email":"eheddonbj@usda.gov"}
{"id":417,"first_name":"Gerek","last_name":"Baddiley","email":"gbaddileybk@diigo.com"}
{"id":418,"first_name":"Edgardo","last_name":"Careswell","email":"ecareswellbl@amazonaws.com"}
{"id":419,"first_name":"Hunfredo","last_name":"Gibbard","email":"hgibbardbm@istockphoto.com"}
{"id":420,"first_name":"Audie","last_name":"Siddle","email":"asiddlebn@squidoo.com"}
{"id":421,"first_name":"Adey","last_name":"Kingsford","email":"akingsfordbo@telegraph.co.uk"}
{"id":422,"first_name":"Ethelyn","last_name":"Vanyushkin","email":"evanyushkinbp@amazonaws.com"}
{"id":423,"first_name":"Bron","last_name":"Edger","email":"bedgerbq@bandcamp.com"}
{"id":424,"first_name":"Cathrine","last_name":"Arnaldo","email":"carnaldobr@imgur.com"}
{"id":425,"first_name":"Rickie","last_name":"Yeskov","email":"ryeskovbs@slate.com"}
{"id":426,"first_name":"Gale","last_name":"Choat","email":"gchoatbt@google.de"}
{"id":427,"first_name":"Garik","last_name":"Leak","email":"gleakbu@privacy.gov.au"}
{"id":428,"first_name":"Timofei","last_name":"Whiteoak","email":"twhiteoakbv@tinyurl.com"}
{"id":429,"first_name":"Wally","last_name":"Caughan","email":"wcaughanbw@msu.edu"}
{"id":430,"first_name":"Yancy","last_name":"Stealfox","email":"ystealfoxbx@berkeley.edu"}
{"id":431,"first_name":"Dela","last_name":"Strong","email":"dstrongby@free.fr"}
{"id":432,"first_name":"Dougie","last_name":"Tewnion","email":"dtewnionbz@discovery.com"}
{"id":433,"first_name":"Kelly","last_name":"Frean","email":"kfreanc0@imageshack.us"}
{"id":434,"first_name":"Connie","last_name":"Blaschek","email":"cblaschekc1@wikipedia.org"}
{"id":435,"first_name":"Michell","last_name":"D'Ambrogio","email":"mdambrogioc2@sfgate.com"}
{"id":436,"first_name":"Larine","last_name":"Comber","email":"lcomberc3@com.com"}
{"id":437,"first_name":"Giacopo","last_name":"Linde","email":"glindec4@tripadvisor.com"}
{"id":438,"first_name":"Debbi","last_name":"Whaley","email":"dwhaleyc5@studiopress.com"}
{"id":439,"first_name":"Alva","last_name":"Matyasik","email":"amatyasikc6@gmpg.org"}
{"id":440,"first_name":"Mead","last_name":"Andrini","email":"mandrinic7@arstechnica.com"}
{"id":441,"first_name":"Esme","last_name":"Casetti","email":"ecasettic8@furl.net"}
{"id":442,"first_name":"Barbara","last_name":"Piel","email":"bpielc9@addtoany.com"}
{"id":443,"first_name":"Slade","last_name":"Coaker","email":"scoakerca@spiegel.de"}
{"id":444,"first_name":"Read","last_name":"Wackley","email":"rwackleycb@va.gov"}
{"id":445,"first_name":"Min","last_name":"Dunnet","email":"mdunnetcc@friendfeed.com"}
{"id":446,"first_name":"Barbabra","last_name":"Taffarello","email":"btaffarellocd@samsung.com"}
{"id":447,"first_name":"Sadie","last_name":"Stanlick","email":"sstanlickce@vistaprint.com"}
{"id":448,"first_name":"Keefe","last_name":"Inglese","email":"kinglesecf@nationalgeographic.com"}
{"id":449,"first_name":"Domenic","last_name":"Tomasek","email":"dtomasekcg@privacy.gov.au"}
{"id":450,"first_name":"Felic","last_name":"Rydzynski","email":"frydzynskich@flickr.com"}
{"id":451,"first_name":"Alfy","last_name":"Hamman","email":"ahammanci@slate.com"}
{"id":452,"first_name":"Townie","last_name":"Tomini","email":"ttominicj@printfriendly.com"}
{"id":453,"first_name":"Evangelia","last_name":"Badrick","email":"ebadrickck@facebook.com"}
{"id":454,"first_name":"Caron","last_name":"Cornil","email":"ccornilcl@newsvine.com"}
{"id":455,"first_name":"Ernie","last_name":"Reddin","email":"ereddincm@tmall.com"}
{"id":456,"first_name":"Arley","last_name":"Wardall","email":"awardallcn@tripod.com"}
{"id":457,"first_name":"Robinet","last_name":"Sam","email":"rsamco@upenn.edu"}
{"id":458,"first_name":"Melisenda","last_name":"Timeby","email":"mtimebycp@shinystat.com"}
{"id":459,"first_name":"Shantee","last_name":"Annes","email":"sannescq@va.gov"}
{"id":460,"first_name":"Molli","last_name":"Mish","email":"mmishcr@dot.gov"}
{"id":461,"first_name":"Merralee","last_name":"Vickerman","email":"mvickermancs@baidu.com"}
{"id":462,"first_name":"Wilhelmina","last_name":"Heminsley","email":"wheminsleyct@is.gd"}
{"id":463,"first_name":"Granville","last_name":"MacKeague","email":"gmackeaguecu@pbs.org"}
{"id":464,"first_name":"Sean","last_name":"Loftus","email":"sloftuscv@psu.edu"}
{"id":465,"first_name":"Nevins","last_name":"Gawke","email":"ngawkecw@stumbleupon.com"}
{"id":466,"first_name":"Gunilla","last_name":"Lucock","email":"glucockcx@deviantart.com"}
{"id":467,"first_name":"Haydon","last_name":"Fiddy","email":"hfiddycy@imgur.com"}
{"id":468,"first_name":"Ema","last_name":"Salatino","email":"esalatinocz@sitemeter.com"}
{"id":469,"first_name":"Valentin","last_name":"Yakovliv","email":"vyakovlivd0@furl.net"}
{"id":470,"first_name":"Carri","last_name":"Saltern","email":"csalternd1@biblegateway.com"}
{"id":471,"first_name":"Kristos","last_name":"Stanmore","email":"kstanmored2@4shared.com"}
{"id":472,"first_name":"Adriena","last_name":"Bes","email":"abesd3@constantcontact.com"}
{"id":473,"first_name":"Cristabel","last_name":"Bortolutti","email":"cbortoluttid4@pinterest.com"}
{"id":474,"first_name":"Hersh","last_name":"Lock","email":"hlockd5@forbes.com"}
{"id":475,"first_name":"Yoshi","last_name":"Marler","email":"ymarlerd6@free.fr"}
{"id":476,"first_name":"Tremaine","last_name":"Librey","email":"tlibreyd7@trellian.com"}
{"id":477,"first_name":"Inge","last_name":"Strawbridge","email":"istrawbridged8@barnesandnoble.com"}
{"id":478,"first_name":"Pascal","last_name":"Carvill","email":"pcarvilld9@washington.edu"}
{"id":479,"first_name":"Zabrina","last_name":"Ianitti","email":"zianittida@yellowpages.com"}
{"id":480,"first_name":"Almeta","last_name":"Wessell","email":"awesselldb@bbb.org"}
{"id":481,"first_name":"Crissie","last_name":"Troy","email":"ctroydc@rambler.ru"}
{"id":482,"first_name":"Xena","last_name":"Frammingham","email":"xframminghamdd@t-online.de"}
{"id":483,"first_name":"Zilvia","last_name":"Grinvalds","email":"zgrinvaldsde@example.com"}
{"id":484,"first_name":"Brit","last_name":"Twelftree","email":"btwelftreedf@shop-pro.jp"}
{"id":485,"first_name":"Brianne","last_name":"Johannes","email":"bjohannesdg@nymag.com"}
{"id":486,"first_name":"Felicle","last_name":"MacRury","email":"fmacrurydh@jiathis.com"}
{"id":487,"first_name":"Salli","last_name":"Chillingworth","email":"schillingworthdi@gravatar.com"}
{"id":488,"first_name":"Merline","last_name":"Bodd","email":"mbodddj@yandex.ru"}
{"id":489,"first_name":"Christian","last_name":"Pengelley","email":"cpengelleydk@flavors.me"}
{"id":490,"first_name":"Dallas","last_name":"Sollowaye","email":"dsollowayedl@zdnet.com"}
{"id":491,"first_name":"Matias","last_name":"Austen","email":"maustendm@ow.ly"}
{"id":492,"first_name":"Carney","last_name":"Bergin","email":"cbergindn@tiny.cc"}
{"id":493,"first_name":"Carol","last_name":"Vannikov","email":"cvannikovdo@oakley.com"}
{"id":494,"first_name":"Gail","last_name":"Garwood","email":"ggarwooddp@cbc.ca"}
{"id":495,"first_name":"Adela","last_name":"Baddam","email":"abaddamdq@blinklist.com"}
{"id":496,"first_name":"Bogey","last_name":"Tomala","email":"btomaladr@samsung.com"}
{"id":497,"first_name":"Annabel","last_name":"Pinsent","email":"apinsentds@yelp.com"}
{"id":498,"first_name":"Marijn","last_name":"Trevarthen","email":"mtrevarthendt@google.ca"}
{"id":499,"first_name":"Arabelle","last_name":"Corneliussen","email":"acorneliussendu@census.gov"}
{"id":500,"first_name":"Ritchie","last_name":"Rosenblum","email":"rrosenblumdv@i2i.jp"}
{"id":501,"first_name":"Marji","last_name":"Clarage","email":"mclaragedw@gravatar.com"}
{"id":502,"first_name":"Yolanthe","last_name":"Doddemeade","email":"ydoddemeadedx@cpanel.net"}
{"id":503,"first_name":"Larine","last_name":"Rodd","email":"lrodddy@ft.com"}
{"id":504,"first_name":"Adolpho","last_name":"Bleasdale","email":"ableasdaledz@unicef.org"}
{"id":505,"first_name":"Rriocard","last_name":"Roggeman","email":"rroggemane0@salon.com"}
{"id":506,"first_name":"Sissie","last_name":"Ephgrave","email":"sephgravee1@wikipedia.org"}
{"id":507,"first_name":"Shepherd","last_name":"Davidde","email":"sdaviddee2@wikimedia.org"}
{"id":508,"first_name":"Cecilla","last_name":"Girt","email":"cgirte3@soundcloud.com"}
{"id":509,"first_name":"Alanah","last_name":"Newtown","email":"anewtowne4@cocolog-nifty.com"}
{"id":510,"first_name":"Marvin","last_name":"Duckhouse","email":"mduckhousee5@icq.com"}
{"id":511,"first_name":"Esme","last_name":"Crouch","email":"ecrouche6@foxnews.com"}
{"id":512,"first_name":"Cthrine","last_name":"Yelding","email":"cyeldinge7@stumbleupon.com"}
{"id":513,"first_name":"Nolly","last_name":"Gude","email":"ngudee8@bing.com"}
{"id":514,"first_name":"Kimball","last_name":"O' Mulderrig","email":"komulderrige9@newyorker.com"}
{"id":515,"first_name":"Felicdad","last_name":"Mutlow","email":"fmutlowea@wunderground.com"}
{"id":516,"first_name":"Sybila","last_name":"Kirke","email":"skirkeeb@w3.org"}
{"id":517,"first_name":"Aubrey","last_name":"Horney","email":"ahorneyec@1688.com"}
{"id":518,"first_name":"Prudy","last_name":"Hartles","email":"phartlesed@scribd.com"}
{"id":519,"first_name":"Saw","last_name":"Olyunin","email":"solyuninee@google.it"}
{"id":520,"first_name":"Pearline","last_name":"Fasham","email":"pfashamef@chron.com"}
{"id":521,"first_name":"Gretta","last_name":"Vasilmanov","email":"gvasilmanoveg@godaddy.com"}
{"id":522,"first_name":"Pearle","last_name":"Scougal","email":"pscougaleh@si.edu"}
{"id":523,"first_name":"Marney","last_name":"Mariotte","email":"mmariotteei@newsvine.com"}
{"id":524,"first_name":"Bamby","last_name":"Lockhart","email":"blockhartej@mayoclinic.com"}
{"id":525,"first_name":"Miguela","last_name":"Baumadier","email":"mbaumadierek@go.com"}
{"id":526,"first_name":"Lusa","last_name":"Bartalin","email":"lbartalinel@fc2.com"}
{"id":527,"first_name":"Helene","last_name":"Parlott","email":"hparlottem@wikimedia.org"}
{"id":528,"first_name":"Manuel","last_name":"Scallon","email":"mscallonen@apple.com"}
{"id":529,"first_name":"Wendie","last_name":"O' Scallan","email":"woscallaneo@aboutads.info"}
{"id":530,"first_name":"Benito","last_name":"Kerry","email":"bkerryep@cmu.edu"}
{"id":531,"first_name":"Dorthy","last_name":"Skinner","email":"dskinnereq@ustream.tv"}
{"id":532,"first_name":"Demetris","last_name":"Picton","email":"dpictoner@typepad.com"}
{"id":533,"first_name":"Barrie","last_name":"Hurkett","email":"bhurkettes@mlb.com"}
{"id":534,"first_name":"Lucretia","last_name":"Wherry","email":"lwherryet@amazon.com"}
{"id":535,"first_name":"Molly","last_name":"Castagna","email":"mcastagnaeu@google.cn"}
{"id":536,"first_name":"Waylin","last_name":"Chieco","email":"wchiecoev@youtube.com"}
{"id":537,"first_name":"Bobinette","last_name":"Headingham","email":"bheadinghamew@intel.com"}
{"id":538,"first_name":"Malinda","last_name":"Gerardi","email":"mgerardiex@samsung.com"}
{"id":539,"first_name":"Rhodia","last_name":"Kenderdine","email":"rkenderdineey@arstechnica.com"}
{"id":540,"first_name":"Saundra","last_name":"Brader","email":"sbraderez@msu.edu"}
{"id":541,"first_name":"Mariana","last_name":"Buye","email":"mbuyef0@wikimedia.org"}
{"id":542,"first_name":"Hagan","last_name":"Stoop","email":"hstoopf1@tripadvisor.com"}
{"id":543,"first_name":"Marlene","last_name":"Keane","email":"mkeanef2@google.cn"}
{"id":544,"first_name":"Sayer","last_name":"Eggar","email":"seggarf3@unicef.org"}
{"id":545,"first_name":"Eve","last_name":"Allanson","email":"eallansonf4@china.com.cn"}
{"id":546,"first_name":"Arielle","last_name":"Kytter","email":"akytterf5@spotify.com"}
{"id":547,"first_name":"Deerdre","last_name":"Cabbell","email":"dcabbellf6@youtube.com"}
{"id":548,"first_name":"Nathan","last_name":"Cromleholme","email":"ncromleholmef7@fema.gov"}
{"id":549,"first_name":"Brion","last_name":"Recher","email":"brecherf8@usgs.gov"}
{"id":550,"first_name":"Tiena","last_name":"Grealish","email":"tgrealishf9@mail.ru"}
{"id":551,"first_name":"Dane","last_name":"Durtnal","email":"ddurtnalfa@latimes.com"}
{"id":552,"first_name":"Bealle","last_name":"Lesurf","email":"blesurffb@vinaora.com"}
{"id":553,"first_name":"Evangelina","last_name":"Lawrie","email":"elawriefc@ameblo.jp"}
{"id":554,"first_name":"Svend","last_name":"Leel","email":"sleelfd@ucoz.ru"}
{"id":555,"first_name":"Cristen","last_name":"Klimkov","email":"cklimkovfe@about.me"}
{"id":556,"first_name":"Devon","last_name":"Lanchbury","email":"dlanchburyff@umn.edu"}
{"id":557,"first_name":"Rem","last_name":"Cordes","email":"rcordesfg@yolasite.com"}
{"id":558,"first_name":"Romy","last_name":"Mattiazzi","email":"rmattiazzifh@craigslist.org"}
{"id":559,"first_name":"Wit","last_name":"Attenborrow","email":"wattenborrowfi@auda.org.au"}
{"id":560,"first_name":"Nanni","last_name":"Studders","email":"nstuddersfj@yandex.ru"}
{"id":561,"first_name":"Mandie","last_name":"Trembley","email":"mtrembleyfk@gizmodo.com"}
{"id":562,"first_name":"Babette","last_name":"Clemmens","email":"bclemmensfl@acquirethisname.com"}
{"id":563,"first_name":"Ban","last_name":"Bennion","email":"bbennionfm@github.com"}
{"id":564,"first_name":"Gail","last_name":"Trevon","email":"gtrevonfn@upenn.edu"}
{"id":565,"first_name":"Karine","last_name":"Alexandrescu","email":"kalexandrescufo@globo.com"}
{"id":566,"first_name":"Sabrina","last_name":"Klaes","email":"sklaesfp@example.com"}
{"id":567,"first_name":"Adriane","last_name":"Figgins","email":"afigginsfq@cafepress.com"}
{"id":568,"first_name":"Terese","last_name":"Goldney","email":"tgoldneyfr@purevolume.com"}
{"id":569,"first_name":"Ashlie","last_name":"Bowling","email":"abowlingfs@dion.ne.jp"}
{"id":570,"first_name":"Rivi","last_name":"Laurenz","email":"rlaurenzft@php.net"}
{"id":571,"first_name":"Phillip","last_name":"Longstaffe","email":"plongstaffefu@goo.gl"}
{"id":572,"first_name":"Adrian","last_name":"Jewes","email":"ajewesfv@elpais.com"}
{"id":573,"first_name":"Muriel","last_name":"Ladlow","email":"mladlowfw@vkontakte.ru"}
{"id":574,"first_name":"Ange","last_name":"Habishaw","email":"ahabishawfx@walmart.com"}
{"id":575,"first_name":"Kennith","last_name":"Olive","email":"kolivefy@tamu.edu"}
{"id":576,"first_name":"Vonnie","last_name":"Eastbrook","email":"veastbrookfz@merriam-webster.com"}
{"id":577,"first_name":"Doralyn","last_name":"Scarbarrow","email":"dscarbarrowg0@gnu.org"}
{"id":578,"first_name":"Adams","last_name":"Sharpley","email":"asharpleyg1@blogger.com"}
{"id":579,"first_name":"Gilberte","last_name":"Camamile","email":"gcamamileg2@dailymail.co.uk"}
{"id":580,"first_name":"Emylee","last_name":"Siley","email":"esileyg3@friendfeed.com"}
{"id":581,"first_name":"Hanan","last_name":"Falvey","email":"hfalveyg4@springer.com"}
{"id":582,"first_name":"Nerty","last_name":"Marqyes","email":"nmarqyesg5@thetimes.co.uk"}
{"id":583,"first_name":"Neysa","last_name":"Mossdale","email":"nmossdaleg6@de.vu"}
{"id":584,"first_name":"Allayne","last_name":"Crookall","email":"acrookallg7@amazon.de"}
{"id":585,"first_name":"Ally","last_name":"Lesly","email":"aleslyg8@howstuffworks.com"}
{"id":586,"first_name":"Saraann","last_name":"Rosson","email":"srossong9@e-recht24.de"}
{"id":587,"first_name":"Marissa","last_name":"Garn","email":"mgarnga@360.cn"}
{"id":588,"first_name":"Rusty","last_name":"Jenteau","email":"rjenteaugb@spiegel.de"}
{"id":589,"first_name":"Daria","last_name":"Danilchenko","email":"ddanilchenkogc@networkadvertising.org"}
{"id":590,"first_name":"Emmi","last_name":"Duny","email":"edunygd@dedecms.com"}
{"id":591,"first_name":"Felice","last_name":"Manser","email":"fmanserge@bizjournals.com"}
{"id":592,"first_name":"Domeniga","last_name":"Garrand","email":"dgarrandgf@goo.ne.jp"}
{"id":593,"first_name":"Tani","last_name":"Bampton","email":"tbamptongg@huffingtonpost.com"}
{"id":594,"first_name":"Paige","last_name":"Holdren","email":"pholdrengh@hugedomains.com"}
{"id":595,"first_name":"Junia","last_name":"Stoppe","email":"jstoppegi@slideshare.net"}
{"id":596,"first_name":"Krista","last_name":"Hardwidge","email":"khardwidgegj@people.com.cn"}
{"id":597,"first_name":"Theodosia","last_name":"Bleddon","email":"tbleddongk@geocities.jp"}
{"id":598,"first_name":"Esmaria","last_name":"Gomez","email":"egomezgl@slate.com"}
{"id":599,"first_name":"Karisa","last_name":"Dearnley","email":"kdearnleygm@nyu.edu"}
{"id":600,"first_name":"Dud","last_name":"Cuddon","email":"dcuddongn@youku.com"}
{"id":601,"first_name":"Daile","last_name":"Mylechreest","email":"dmylechreestgo@ox.ac.uk"}
{"id":602,"first_name":"Josselyn","last_name":"Chaplyn","email":"jchaplyngp@shop-pro.jp"}
{"id":603,"first_name":"Klarrisa","last_name":"Balnave","email":"kbalnavegq@microsoft.com"}
{"id":604,"first_name":"Nolie","last_name":"Petters","email":"npettersgr@opera.com"}
{"id":605,"first_name":"Bruno","last_name":"Vautin","email":"bvautings@earthlink.net"}
{"id":606,"first_name":"Ki","last_name":"Stucke","email":"kstuckegt@newyorker.com"}
{"id":607,"first_name":"Jerad","last_name":"MacGettigen","email":"jmacgettigengu@nyu.edu"}
{"id":608,"first_name":"Waverly","last_name":"Gwyer","email":"wgwyergv@sogou.com"}
{"id":609,"first_name":"Norene","last_name":"Detloff","email":"ndetloffgw@istockphoto.com"}
{"id":610,"first_name":"Alfonse","last_name":"Mont","email":"amontgx@mozilla.org"}
{"id":611,"first_name":"Shepperd","last_name":"Duffy","email":"sduffygy@jigsy.com"}
{"id":612,"first_name":"Petronille","last_name":"Doughty","email":"pdoughtygz@prweb.com"}
{"id":613,"first_name":"Northrop","last_name":"Stent","email":"nstenth0@nytimes.com"}
{"id":614,"first_name":"Marline","last_name":"Ferrar","email":"mferrarh1@utexas.edu"}
{"id":615,"first_name":"Brenda","last_name":"Sancho","email":"bsanchoh2@com.com"}
{"id":616,"first_name":"Leeanne","last_name":"Candlish","email":"lcandlishh3@merriam-webster.com"}
{"id":617,"first_name":"Brianna","last_name":"Starford","email":"bstarfordh4@theguardian.com"}
{"id":618,"first_name":"Leroi","last_name":"Smissen","email":"lsmissenh5@loc.gov"}
{"id":619,"first_name":"Nev","last_name":"Belvin","email":"nbelvinh6@dedecms.com"}
{"id":620,"first_name":"Kellen","last_name":"Strowlger","email":"kstrowlgerh7@about.com"}
{"id":621,"first_name":"Ninette","last_name":"Kerton","email":"nkertonh8@google.com.au"}
{"id":622,"first_name":"Ruby","last_name":"Klewer","email":"rklewerh9@engadget.com"}
{"id":623,"first_name":"Berte","last_name":"Joynes","email":"bjoynesha@icq.com"}
{"id":624,"first_name":"Jacob","last_name":"Houseago","email":"jhouseagohb@ocn.ne.jp"}
{"id":625,"first_name":"Wandis","last_name":"Souster","email":"wsousterhc@ask.com"}
{"id":626,"first_name":"Kelila","last_name":"Guillon","email":"kguillonhd@vistaprint.com"}
{"id":627,"first_name":"Gretchen","last_name":"Mellsop","email":"gmellsophe@nationalgeographic.com"}
{"id":628,"first_name":"Agnese","last_name":"Rider","email":"ariderhf@bloglovin.com"}
{"id":629,"first_name":"Sabina","last_name":"Spilsburie","email":"sspilsburiehg@who.int"}
{"id":630,"first_name":"Aubrie","last_name":"Patey","email":"apateyhh@linkedin.com"}
{"id":631,"first_name":"Wolfie","last_name":"Sommerville","email":"wsommervillehi@domainmarket.com"}
{"id":632,"first_name":"Anderea","last_name":"Haversum","email":"ahaversumhj@pbs.org"}
{"id":633,"first_name":"Alessandro","last_name":"Giovani","email":"agiovanihk@cbslocal.com"}
{"id":634,"first_name":"Arlette","last_name":"Dulwich","email":"adulwichhl@google.nl"}
{"id":635,"first_name":"Reamonn","last_name":"Flintiff","email":"rflintiffhm@wikia.com"}
{"id":636,"first_name":"Lowe","last_name":"Redding","email":"lreddinghn@naver.com"}
{"id":637,"first_name":"Dannel","last_name":"Lloyds","email":"dlloydsho@odnoklassniki.ru"}
{"id":638,"first_name":"Gasparo","last_name":"Curtoys","email":"gcurtoyshp@tuttocitta.it"}
{"id":639,"first_name":"Larry","last_name":"Shatliff","email":"lshatliffhq@mayoclinic.com"}
{"id":640,"first_name":"Faina","last_name":"Dauby","email":"fdaubyhr@washingtonpost.com"}
{"id":641,"first_name":"Kara-lynn","last_name":"Prise","email":"kprisehs@live.com"}
{"id":642,"first_name":"Garry","last_name":"Patinkin","email":"gpatinkinht@goo.gl"}
{"id":643,"first_name":"Bryan","last_name":"Eyrl","email":"beyrlhu@indiegogo.com"}
{"id":644,"first_name":"Dominick","last_name":"Goracci","email":"dgoraccihv@cdbaby.com"}
{"id":645,"first_name":"Sabine","last_name":"Dami","email":"sdamihw@php.net"}
{"id":646,"first_name":"Simeon","last_name":"Czajka","email":"sczajkahx@auda.org.au"}
{"id":647,"first_name":"Bertrando","last_name":"Ostler","email":"bostlerhy@networksolutions.com"}
{"id":648,"first_name":"Guillaume","last_name":"Halahan","email":"ghalahanhz@weibo.com"}
{"id":649,"first_name":"Artus","last_name":"Shotton","email":"ashottoni0@goodreads.com"}
{"id":650,"first_name":"Thurston","last_name":"Privett","email":"tprivetti1@goo.ne.jp"}
{"id":651,"first_name":"Dagny","last_name":"Handford","email":"dhandfordi2@homestead.com"}
{"id":652,"first_name":"Bathsheba","last_name":"Pordall","email":"bpordalli3@howstuffworks.com"}
{"id":653,"first_name":"Gwynne","last_name":"Vallens","email":"gvallensi4@feedburner.com"}
{"id":654,"first_name":"Faun","last_name":"McMurrugh","email":"fmcmurrughi5@merriam-webster.com"}
{"id":655,"first_name":"Kerry","last_name":"Gooding","email":"kgoodingi6@macromedia.com"}
{"id":656,"first_name":"Sol","last_name":"Baskerfield","email":"sbaskerfieldi7@amazon.co.uk"}
{"id":657,"first_name":"Belvia","last_name":"Risebrow","email":"brisebrowi8@netlog.com"}
{"id":658,"first_name":"Kelila","last_name":"Stocken","email":"kstockeni9@xinhuanet.com"}
{"id":659,"first_name":"Raff","last_name":"Kelland","email":"rkellandia@technorati.com"}
{"id":660,"first_name":"Sophi","last_name":"Bengough","email":"sbengoughib@booking.com"}
{"id":661,"first_name":"Annmarie","last_name":"Ivins","email":"aivinsic@wikispaces.com"}
{"id":662,"first_name":"Nettie","last_name":"Camings","email":"ncamingsid@amazon.co.jp"}
{"id":663,"first_name":"Ted","last_name":"Alcoran","email":"talcoranie@hhs.gov"}
{"id":664,"first_name":"Tim","last_name":"Murden","email":"tmurdenif@jugem.jp"}
{"id":665,"first_name":"Latrina","last_name":"Baines","email":"lbainesig@sphinn.com"}
{"id":666,"first_name":"Sanders","last_name":"Crampsey","email":"scrampseyih@cocolog-nifty.com"}
{"id":667,"first_name":"Laurena","last_name":"Bristowe","email":"lbristoweii@sciencedaily.com"}
{"id":668,"first_name":"Brose","last_name":"Blanchet","email":"bblanchetij@archive.org"}
{"id":669,"first_name":"Jacintha","last_name":"Kimmel","email":"jkimmelik@psu.edu"}
{"id":670,"first_name":"Nat","last_name":"Hast","email":"nhastil@ifeng.com"}
{"id":671,"first_name":"Ealasaid","last_name":"MacHoste","email":"emachosteim@nps.gov"}
{"id":672,"first_name":"Merralee","last_name":"Phippen","email":"mphippenin@usgs.gov"}
{"id":673,"first_name":"Donella","last_name":"Sanzio","email":"dsanzioio@theatlantic.com"}
{"id":674,"first_name":"Giorgi","last_name":"Chaff","email":"gchaffip@taobao.com"}
{"id":675,"first_name":"Bennie","last_name":"Smallsman","email":"bsmallsmaniq@webmd.com"}
{"id":676,"first_name":"Georgie","last_name":"Crole","email":"gcroleir@dot.gov"}
{"id":677,"first_name":"Petra","last_name":"Chappelow","email":"pchappelowis@tmall.com"}
{"id":678,"first_name":"Dalton","last_name":"Wewell","email":"dwewellit@tiny.cc"}
{"id":679,"first_name":"Kinnie","last_name":"Guilaem","email":"kguilaemiu@ezinearticles.com"}
{"id":680,"first_name":"Merci","last_name":"Doyle","email":"mdoyleiv@boston.com"}
{"id":681,"first_name":"Constance","last_name":"Tilson","email":"ctilsoniw@usda.gov"}
{"id":682,"first_name":"Paige","last_name":"Sygroves","email":"psygrovesix@sfgate.com"}
{"id":683,"first_name":"Rutherford","last_name":"Ughi","email":"rughiiy@webeden.co.uk"}
{"id":684,"first_name":"Jamil","last_name":"Crighton","email":"jcrightoniz@china.com.cn"}
{"id":685,"first_name":"Gaspard","last_name":"Lockner","email":"glocknerj0@hao123.com"}
{"id":686,"first_name":"Sindee","last_name":"Beade","email":"sbeadej1@sbwire.com"}
{"id":687,"first_name":"Irina","last_name":"Perren","email":"iperrenj2@oracle.com"}
{"id":688,"first_name":"Annis","last_name":"Asker","email":"aaskerj3@whitehouse.gov"}
{"id":689,"first_name":"Ingram","last_name":"MacGiany","email":"imacgianyj4@blogspot.com"}
{"id":690,"first_name":"Germaine","last_name":"Maltby","email":"gmaltbyj5@usda.gov"}
{"id":691,"first_name":"Berkly","last_name":"Prazor","email":"bprazorj6@flickr.com"}
{"id":692,"first_name":"Ferguson","last_name":"Kyffin","email":"fkyffinj7@goodreads.com"}
{"id":693,"first_name":"Winonah","last_name":"Furze","email":"wfurzej8@alexa.com"}
{"id":694,"first_name":"Merwin","last_name":"Ionnidis","email":"mionnidisj9@slashdot.org"}
{"id":695,"first_name":"Jerrilee","last_name":"Speerman","email":"jspeermanja@tumblr.com"}
{"id":696,"first_name":"Leslie","last_name":"Mulvy","email":"lmulvyjb@bravesites.com"}
{"id":697,"first_name":"Eryn","last_name":"Stoffel","email":"estoffeljc@infoseek.co.jp"}
{"id":698,"first_name":"Ladonna","last_name":"Bosward","email":"lboswardjd@php.net"}
{"id":699,"first_name":"Giustino","last_name":"Killelea","email":"gkilleleaje@statcounter.com"}
{"id":700,"first_name":"Dillie","last_name":"Angell","email":"dangelljf@weather.com"}
{"id":701,"first_name":"Henri","last_name":"Arnison","email":"harnisonjg@bluehost.com"}
{"id":702,"first_name":"Fina","last_name":"Joules","email":"fjoulesjh@webmd.com"}
{"id":703,"first_name":"Elden","last_name":"Shortan","email":"eshortanji@github.com"}
{"id":704,"first_name":"Vevay","last_name":"Imison","email":"vimisonjj@slideshare.net"}
{"id":705,"first_name":"Marcellina","last_name":"Jagg","email":"mjaggjk@dmoz.org"}
{"id":706,"first_name":"Evin","last_name":"Lamacraft","email":"elamacraftjl@dagondesign.com"}
{"id":707,"first_name":"Marcel","last_name":"Edy","email":"medyjm@aboutads.info"}
{"id":708,"first_name":"Orlan","last_name":"Drei","email":"odreijn@oaic.gov.au"}
{"id":709,"first_name":"Egbert","last_name":"Shillington","email":"eshillingtonjo@simplemachines.org"}
{"id":710,"first_name":"Opal","last_name":"Oldnall","email":"ooldnalljp@indiatimes.com"}
{"id":711,"first_name":"Brianne","last_name":"Penticost","email":"bpenticostjq@webmd.com"}
{"id":712,"first_name":"Pip","last_name":"Blaney","email":"pblaneyjr@weather.com"}
{"id":713,"first_name":"Michaella","last_name":"Goldsberry","email":"mgoldsberryjs@dell.com"}
{"id":714,"first_name":"Jerrilee","last_name":"Paridge","email":"jparidgejt@wikipedia.org"}
{"id":715,"first_name":"Joelly","last_name":"Knightley","email":"jknightleyju@joomla.org"}
{"id":716,"first_name":"Eloisa","last_name":"Lee","email":"eleejv@abc.net.au"}
{"id":717,"first_name":"Andee","last_name":"Boscott","email":"aboscottjw@angelfire.com"}
{"id":718,"first_name":"Menard","last_name":"Bazley","email":"mbazleyjx@si.edu"}
{"id":719,"first_name":"Hadria","last_name":"MacDonough","email":"hmacdonoughjy@blogspot.com"}
{"id":720,"first_name":"Demetrius","last_name":"Ghelardi","email":"dghelardijz@4shared.com"}
{"id":721,"first_name":"Ingra","last_name":"Boshard","email":"iboshardk0@forbes.com"}
{"id":722,"first_name":"Shelley","last_name":"Cradoc","email":"scradock1@google.nl"}
{"id":723,"first_name":"Bertrando","last_name":"Wurst","email":"bwurstk2@hhs.gov"}
{"id":724,"first_name":"Duky","last_name":"Moresby","email":"dmoresbyk3@w3.org"}
{"id":725,"first_name":"Lynda","last_name":"Matzeitis","email":"lmatzeitisk4@bing.com"}
{"id":726,"first_name":"Galvan","last_name":"Challen","email":"gchallenk5@nasa.gov"}
{"id":727,"first_name":"Bette-ann","last_name":"Lytlle","email":"blytllek6@linkedin.com"}
{"id":728,"first_name":"Henderson","last_name":"Tonsley","email":"htonsleyk7@wikipedia.org"}
{"id":729,"first_name":"Daffi","last_name":"Welch","email":"dwelchk8@geocities.com"}
{"id":730,"first_name":"Enrique","last_name":"Emig","email":"eemigk9@digg.com"}
{"id":731,"first_name":"Darnall","last_name":"Tupman","email":"dtupmanka@indiegogo.com"}
{"id":732,"first_name":"Vicki","last_name":"Trayes","email":"vtrayeskb@phpbb.com"}
{"id":733,"first_name":"Quintus","last_name":"Sancroft","email":"qsancroftkc@ycombinator.com"}
{"id":734,"first_name":"Karola","last_name":"Mille","email":"kmillekd@ustream.tv"}
{"id":735,"first_name":"Aretha","last_name":"Callum","email":"acallumke@washingtonpost.com"}
{"id":736,"first_name":"Karisa","last_name":"Stainer","email":"kstainerkf@nsw.gov.au"}
{"id":737,"first_name":"Carine","last_name":"Goom","email":"cgoomkg@whitehouse.gov"}
{"id":738,"first_name":"Town","last_name":"Hannan","email":"thannankh@harvard.edu"}
{"id":739,"first_name":"Micheal","last_name":"Arnaudin","email":"marnaudinki@theatlantic.com"}
{"id":740,"first_name":"Shaun","last_name":"Prendergrass","email":"sprendergrasskj@mapquest.com"}
{"id":741,"first_name":"Chastity","last_name":"Waszczyk","email":"cwaszczykkk@gravatar.com"}
{"id":742,"first_name":"Christy","last_name":"Northey","email":"cnortheykl@nymag.com"}
{"id":743,"first_name":"Melamie","last_name":"Triggel","email":"mtriggelkm@myspace.com"}
{"id":744,"first_name":"Duffy","last_name":"Albrook","email":"dalbrookkn@oakley.com"}
{"id":745,"first_name":"Viv","last_name":"Millwall","email":"vmillwallko@technorati.com"}
{"id":746,"first_name":"Abie","last_name":"Cacacie","email":"acacaciekp@reference.com"}
{"id":747,"first_name":"Micah","last_name":"Howden","email":"mhowdenkq@youtube.com"}
{"id":748,"first_name":"Gerladina","last_name":"Sheeran","email":"gsheerankr@soundcloud.com"}
{"id":749,"first_name":"Reidar","last_name":"Withur","email":"rwithurks@1688.com"}
{"id":750,"first_name":"Killy","last_name":"Stroulger","email":"kstroulgerkt@webs.com"}
{"id":751,"first_name":"Penelope","last_name":"Foli","email":"pfoliku@ucoz.ru"}
{"id":752,"first_name":"Pascal","last_name":"Blethyn","email":"pblethynkv@people.com.cn"}
{"id":753,"first_name":"Jacobo","last_name":"Renols","email":"jrenolskw@nhs.uk"}
{"id":754,"first_name":"Donelle","last_name":"Jarrell","email":"djarrellkx@about.com"}
{"id":755,"first_name":"Hakim","last_name":"Pietrzyk","email":"hpietrzykky@123-reg.co.uk"}
{"id":756,"first_name":"Fania","last_name":"Hallick","email":"fhallickkz@state.gov"}
{"id":757,"first_name":"Boote","last_name":"Gomersal","email":"bgomersall0@virginia.edu"}
{"id":758,"first_name":"Luis","last_name":"Valler","email":"lvallerl1@zimbio.com"}
{"id":759,"first_name":"Shana","last_name":"Vittel","email":"svittell2@virginia.edu"}
{"id":760,"first_name":"Onofredo","last_name":"Philliphs","email":"ophilliphsl3@vistaprint.com"}
{"id":761,"first_name":"Osmond","last_name":"Moulson","email":"omoulsonl4@fema.gov"}
{"id":762,"first_name":"Ly","last_name":"Greenan","email":"lgreenanl5@ucla.edu"}
{"id":763,"first_name":"Mervin","last_name":"Koop","email":"mkoopl6@mediafire.com"}
{"id":764,"first_name":"Ferrel","last_name":"Redfearn","email":"fredfearnl7@nyu.edu"}
{"id":765,"first_name":"Robby","last_name":"Huglin","email":"rhuglinl8@nature.com"}
{"id":766,"first_name":"Kendre","last_name":"Youle","email":"kyoulel9@domainmarket.com"}
{"id":767,"first_name":"Windy","last_name":"Rubel","email":"wrubella@telegraph.co.uk"}
{"id":768,"first_name":"Crystal","last_name":"Carmichael","email":"ccarmichaellb@admin.ch"}
{"id":769,"first_name":"Agata","last_name":"Penner","email":"apennerlc@tinyurl.com"}
{"id":770,"first_name":"Odey","last_name":"Morse","email":"omorseld@wired.com"}
{"id":771,"first_name":"Siegfried","last_name":"Glackin","email":"sglackinle@hao123.com"}
{"id":772,"first_name":"Norbie","last_name":"Reiners","email":"nreinerslf@cmu.edu"}
{"id":773,"first_name":"Kipp","last_name":"Lowdes","email":"klowdeslg@privacy.gov.au"}
{"id":774,"first_name":"Dyann","last_name":"Francklyn","email":"dfrancklynlh@google.com.br"}
{"id":775,"first_name":"Gwennie","last_name":"McGlynn","email":"gmcglynnli@live.com"}
{"id":776,"first_name":"Viviyan","last_name":"Erdis","email":"verdislj@clickbank.net"}
{"id":777,"first_name":"Hallie","last_name":"Sherewood","email":"hsherewoodlk@trellian.com"}
{"id":778,"first_name":"Redd","last_name":"Stenton","email":"rstentonll@infoseek.co.jp"}
{"id":779,"first_name":"Wendall","last_name":"Bath","email":"wbathlm@upenn.edu"}
{"id":780,"first_name":"Corilla","last_name":"Zanetello","email":"czanetelloln@sfgate.com"}
{"id":781,"first_name":"Christye","last_name":"Dracey","email":"cdraceylo@qq.com"}
{"id":782,"first_name":"Nester","last_name":"Farleigh","email":"nfarleighlp@usgs.gov"}
{"id":783,"first_name":"Langsdon","last_name":"Haggard","email":"lhaggardlq@reddit.com"}
{"id":784,"first_name":"Chev","last_name":"Hay","email":"chaylr@timesonline.co.uk"}
{"id":785,"first_name":"Burlie","last_name":"Cutchee","email":"bcutcheels@dagondesign.com"}
{"id":786,"first_name":"Darya","last_name":"Mitchinson","email":"dmitchinsonlt@bizjournals.com"}
{"id":787,"first_name":"Bibi","last_name":"Skitral","email":"bskitrallu@homestead.com"}
{"id":788,"first_name":"Kaylee","last_name":"Olivo","email":"kolivolv@census.gov"}
{"id":789,"first_name":"Lenore","last_name":"Roseblade","email":"lrosebladelw@ning.com"}
{"id":790,"first_name":"Tulley","last_name":"Gonthard","email":"tgonthardlx@bloomberg.com"}
{"id":791,"first_name":"Olav","last_name":"Galfour","email":"ogalfourly@icq.com"}
{"id":792,"first_name":"Nicolas","last_name":"Margarson","email":"nmargarsonlz@free.fr"}
{"id":793,"first_name":"Reine","last_name":"Klugman","email":"rklugmanm0@fc2.com"}
{"id":794,"first_name":"Gnni","last_name":"Grewcock","email":"ggrewcockm1@clickbank.net"}
{"id":795,"first_name":"Lorain","last_name":"Crossby","email":"lcrossbym2@cdc.gov"}
{"id":796,"first_name":"Angil","last_name":"Toll","email":"atollm3@deliciousdays.com"}
{"id":797,"first_name":"Georgianne","last_name":"Piotrowski","email":"gpiotrowskim4@goo.gl"}
{"id":798,"first_name":"Sheelagh","last_name":"Orwin","email":"sorwinm5@xing.com"}
{"id":799,"first_name":"Ingrid","last_name":"Dallon","email":"idallonm6@noaa.gov"}
{"id":800,"first_name":"Tab","last_name":"Thomasson","email":"tthomassonm7@columbia.edu"}
{"id":801,"first_name":"Merridie","last_name":"Scandroot","email":"mscandrootm8@wsj.com"}
{"id":802,"first_name":"Morty","last_name":"MacDunleavy","email":"mmacdunleavym9@canalblog.com"}
{"id":803,"first_name":"Lind","last_name":"Jordanson","email":"ljordansonma@tinypic.com"}
{"id":804,"first_name":"Field","last_name":"Iiannoni","email":"fiiannonimb@over-blog.com"}
{"id":805,"first_name":"Sammie","last_name":"Whimper","email":"swhimpermc@imageshack.us"}
{"id":806,"first_name":"Davy","last_name":"Darthe","email":"ddarthemd@netvibes.com"}
{"id":807,"first_name":"Salli","last_name":"Binstead","email":"sbinsteadme@hubpages.com"}
{"id":808,"first_name":"Betty","last_name":"Chown","email":"bchownmf@flavors.me"}
{"id":809,"first_name":"Dinnie","last_name":"Ilyushkin","email":"dilyushkinmg@archive.org"}
{"id":810,"first_name":"Renee","last_name":"Daymond","email":"rdaymondmh@accuweather.com"}
{"id":811,"first_name":"Eddie","last_name":"Duley","email":"eduleymi@lulu.com"}
{"id":812,"first_name":"Izak","last_name":"Latour","email":"ilatourmj@narod.ru"}
{"id":813,"first_name":"Maura","last_name":"Stuckford","email":"mstuckfordmk@nymag.com"}
{"id":814,"first_name":"Sven","last_name":"Clampin","email":"sclampinml@163.com"}
{"id":815,"first_name":"Marlon","last_name":"Bischoff","email":"mbischoffmm@wsj.com"}
{"id":816,"first_name":"Gustave","last_name":"Hardbattle","email":"ghardbattlemn@mozilla.com"}
{"id":817,"first_name":"Alaine","last_name":"Dietzler","email":"adietzlermo@timesonline.co.uk"}
{"id":818,"first_name":"Alisa","last_name":"Ghirardi","email":"aghirardimp@blogspot.com"}
{"id":819,"first_name":"Irena","last_name":"Goskar","email":"igoskarmq@archive.org"}
{"id":820,"first_name":"Eugenius","last_name":"Taillant","email":"etaillantmr@linkedin.com"}
{"id":821,"first_name":"Patton","last_name":"Garbert","email":"pgarbertms@drupal.org"}
{"id":822,"first_name":"Callie","last_name":"Kubera","email":"ckuberamt@ed.gov"}
{"id":823,"first_name":"Carrissa","last_name":"Duplain","email":"cduplainmu@bing.com"}
{"id":824,"first_name":"Rena","last_name":"Thominga","email":"rthomingamv@cocolog-nifty.com"}
{"id":825,"first_name":"Adriaens","last_name":"Lye","email":"alyemw@wikipedia.org"}
{"id":826,"first_name":"Robena","last_name":"Tackett","email":"rtackettmx@360.cn"}
{"id":827,"first_name":"Yvon","last_name":"Emanuele","email":"yemanuelemy@odnoklassniki.ru"}
{"id":828,"first_name":"Marcel","last_name":"Beckinsall","email":"mbeckinsallmz@blinklist.com"}
{"id":829,"first_name":"Donaugh","last_name":"Gaitskill","email":"dgaitskilln0@cyberchimps.com"}
{"id":830,"first_name":"Daloris","last_name":"Leman","email":"dlemann1@etsy.com"}
{"id":831,"first_name":"Cad","last_name":"Fermin","email":"cferminn2@blogs.com"}
{"id":832,"first_name":"Brigida","last_name":"Hurry","email":"bhurryn3@wunderground.com"}
{"id":833,"first_name":"Carlene","last_name":"Duns","email":"cdunsn4@timesonline.co.uk"}
{"id":834,"first_name":"King","last_name":"Giblett","email":"kgiblettn5@bbc.co.uk"}
{"id":835,"first_name":"Emelita","last_name":"Benito","email":"ebeniton6@dell.com"}
{"id":836,"first_name":"Valentine","last_name":"MacCaughey","email":"vmaccaugheyn7@dropbox.com"}
{"id":837,"first_name":"Donnell","last_name":"Pitcock","email":"dpitcockn8@eepurl.com"}
{"id":838,"first_name":"Dasie","last_name":"Goburn","email":"dgoburnn9@sciencedirect.com"}
{"id":839,"first_name":"Berty","last_name":"Klulicek","email":"bklulicekna@artisteer.com"}
{"id":840,"first_name":"Franzen","last_name":"Pindred","email":"fpindrednb@dropbox.com"}
{"id":841,"first_name":"Othilia","last_name":"Mattia","email":"omattianc@hugedomains.com"}
{"id":842,"first_name":"Analise","last_name":"Absolom","email":"aabsolomnd@over-blog.com"}
{"id":843,"first_name":"Bella","last_name":"Cowndley","email":"bcowndleyne@networksolutions.com"}
{"id":844,"first_name":"Rich","last_name":"Sweedland","email":"rsweedlandnf@studiopress.com"}
{"id":845,"first_name":"Sinclair","last_name":"Bonsale","email":"sbonsaleng@icq.com"}
{"id":846,"first_name":"Thurston","last_name":"Blumsom","email":"tblumsomnh@foxnews.com"}
{"id":847,"first_name":"Howey","last_name":"Dufoure","email":"hdufoureni@geocities.jp"}
{"id":848,"first_name":"Hannie","last_name":"Kryzhov","email":"hkryzhovnj@deliciousdays.com"}
{"id":849,"first_name":"Anneliese","last_name":"Winchcum","email":"awinchcumnk@ifeng.com"}
{"id":850,"first_name":"Ronda","last_name":"Chicotti","email":"rchicottinl@liveinternet.ru"}
{"id":851,"first_name":"Lacy","last_name":"Dennis","email":"ldennisnm@paypal.com"}
{"id":852,"first_name":"Chery","last_name":"Leasor","email":"cleasornn@ning.com"}
{"id":853,"first_name":"Melli","last_name":"Gowler","email":"mgowlerno@prlog.org"}
{"id":854,"first_name":"Audi","last_name":"Ratnage","email":"aratnagenp@sbwire.com"}
{"id":855,"first_name":"Marci","last_name":"Cato","email":"mcatonq@vinaora.com"}
{"id":856,"first_name":"Verena","last_name":"de Guerre","email":"vdeguerrenr@latimes.com"}
{"id":857,"first_name":"Guglielmo","last_name":"Wiltshaw","email":"gwiltshawns@macromedia.com"}
{"id":858,"first_name":"Thatch","last_name":"Palin","email":"tpalinnt@elegantthemes.com"}
{"id":859,"first_name":"Amaleta","last_name":"Godthaab","email":"agodthaabnu@yellowpages.com"}
{"id":860,"first_name":"Danna","last_name":"Bertome","email":"dbertomenv@jimdo.com"}
{"id":861,"first_name":"Terrance","last_name":"Lade","email":"tladenw@php.net"}
{"id":862,"first_name":"Arlie","last_name":"Runsey","email":"arunseynx@icq.com"}
{"id":863,"first_name":"Ericha","last_name":"Tamas","email":"etamasny@businesswire.com"}
{"id":864,"first_name":"Annissa","last_name":"Carine","email":"acarinenz@sitemeter.com"}
{"id":865,"first_name":"Isaac","last_name":"Conybear","email":"iconybearo0@imgur.com"}
{"id":866,"first_name":"Susy","last_name":"Perris","email":"sperriso1@patch.com"}
{"id":867,"first_name":"Michele","last_name":"Malcher","email":"mmalchero2@google.com"}
{"id":868,"first_name":"Benn","last_name":"Serot","email":"bseroto3@altervista.org"}
{"id":869,"first_name":"Hewett","last_name":"Smoote","email":"hsmooteo4@dot.gov"}
{"id":870,"first_name":"Renie","last_name":"Rallings","email":"rrallingso5@ox.ac.uk"}
{"id":871,"first_name":"Sammy","last_name":"Trew","email":"strewo6@slideshare.net"}
{"id":872,"first_name":"Enos","last_name":"Fisbburne","email":"efisbburneo7@webs.com"}
{"id":873,"first_name":"Yancy","last_name":"Rookwell","email":"yrookwello8@sina.com.cn"}
{"id":874,"first_name":"Iolande","last_name":"Shillingford","email":"ishillingfordo9@forbes.com"}
{"id":875,"first_name":"Yorker","last_name":"Downes","email":"ydownesoa@addthis.com"}
{"id":876,"first_name":"Laina","last_name":"Jaulme","email":"ljaulmeob@elpais.com"}
{"id":877,"first_name":"Reta","last_name":"Argont","email":"rargontoc@harvard.edu"}
{"id":878,"first_name":"Mirabelle","last_name":"Schach","email":"mschachod@pen.io"}
{"id":879,"first_name":"Nataline","last_name":"Cornish","email":"ncornishoe@bbb.org"}
{"id":880,"first_name":"Rab","last_name":"MacPaden","email":"rmacpadenof@ameblo.jp"}
{"id":881,"first_name":"Cheryl","last_name":"Blaske","email":"cblaskeog@slate.com"}
{"id":882,"first_name":"Walton","last_name":"Fishburn","email":"wfishburnoh@china.com.cn"}
{"id":883,"first_name":"Leoine","last_name":"Habercham","email":"lhaberchamoi@dailymotion.com"}
{"id":884,"first_name":"Caria","last_name":"Lemmers","email":"clemmersoj@prweb.com"}
{"id":885,"first_name":"Ebenezer","last_name":"Renny","email":"erennyok@smugmug.com"}
{"id":886,"first_name":"Max","last_name":"Overy","email":"moveryol@elegantthemes.com"}
{"id":887,"first_name":"Patience","last_name":"Bilyard","email":"pbilyardom@hexun.com"}
{"id":888,"first_name":"Aubree","last_name":"Burdekin","email":"aburdekinon@house.gov"}
{"id":889,"first_name":"Grover","last_name":"Trivett","email":"gtrivettoo@stumbleupon.com"}
{"id":890,"first_name":"Brittani","last_name":"Durkin","email":"bdurkinop@chronoengine.com"}
{"id":891,"first_name":"Mair","last_name":"Denyer","email":"mdenyeroq@livejournal.com"}
{"id":892,"first_name":"Antons","last_name":"Pond-Jones","email":"apondjonesor@netvibes.com"}
{"id":893,"first_name":"Terri","last_name":"Edgeworth","email":"tedgeworthos@youtu.be"}
{"id":894,"first_name":"Rikki","last_name":"Schust","email":"rschustot@hatena.ne.jp"}
{"id":895,"first_name":"Emanuel","last_name":"Magee","email":"emageeou@shutterfly.com"}
{"id":896,"first_name":"Leodora","last_name":"Dewick","email":"ldewickov@ycombinator.com"}
{"id":897,"first_name":"Lani","last_name":"Caskey","email":"lcaskeyow@nyu.edu"}
{"id":898,"first_name":"Ashla","last_name":"Ordemann","email":"aordemannox@shareasale.com"}
{"id":899,"first_name":"Bran","last_name":"Glidder","email":"bglidderoy@dyndns.org"}
{"id":900,"first_name":"Ricardo","last_name":"Sarle","email":"rsarleoz@msu.edu"}
{"id":901,"first_name":"Marcille","last_name":"Strevens","email":"mstrevensp0@house.gov"}
{"id":902,"first_name":"Corbet","last_name":"Thurner","email":"cthurnerp1@theatlantic.com"}
{"id":903,"first_name":"Peirce","last_name":"Poveleye","email":"ppoveleyep2@so-net.ne.jp"}
{"id":904,"first_name":"Berti","last_name":"Baldacco","email":"bbaldaccop3@guardian.co.uk"}
{"id":905,"first_name":"Jemima","last_name":"Menichino","email":"jmenichinop4@mashable.com"}
{"id":906,"first_name":"Hobart","last_name":"Dawtry","email":"hdawtryp5@nationalgeographic.com"}
{"id":907,"first_name":"Tiena","last_name":"Giannazzo","email":"tgiannazzop6@goodreads.com"}
{"id":908,"first_name":"Buck","last_name":"Sturley","email":"bsturleyp7@apache.org"}
{"id":909,"first_name":"Corly","last_name":"Sidgwick","email":"csidgwickp8@elegantthemes.com"}
{"id":910,"first_name":"Lynnea","last_name":"Bezzant","email":"lbezzantp9@rakuten.co.jp"}
{"id":911,"first_name":"Skipp","last_name":"Shepperd","email":"sshepperdpa@apple.com"}
{"id":912,"first_name":"Jeffry","last_name":"Grierson","email":"jgriersonpb@nih.gov"}
{"id":913,"first_name":"Killian","last_name":"Grzegorzewski","email":"kgrzegorzewskipc@homestead.com"}
{"id":914,"first_name":"Phebe","last_name":"Holtaway","email":"pholtawaypd@tinypic.com"}
{"id":915,"first_name":"Morgan","last_name":"Glader","email":"mgladerpe@newsvine.com"}
{"id":916,"first_name":"Dallon","last_name":"Hamshere","email":"dhamsherepf@geocities.com"}
{"id":917,"first_name":"Sullivan","last_name":"Jorden","email":"sjordenpg@umich.edu"}
{"id":918,"first_name":"Barbara","last_name":"Simak","email":"bsimakph@nsw.gov.au"}
{"id":919,"first_name":"Arlyne","last_name":"Guiduzzi","email":"aguiduzzipi@pcworld.com"}
{"id":920,"first_name":"Raff","last_name":"Tremathick","email":"rtremathickpj@webs.com"}
{"id":921,"first_name":"Ailsun","last_name":"Castelain","email":"acastelainpk@engadget.com"}
{"id":922,"first_name":"Zelda","last_name":"Malt","email":"zmaltpl@icio.us"}
{"id":923,"first_name":"Chanda","last_name":"Loram","email":"clorampm@about.me"}
{"id":924,"first_name":"Kiel","last_name":"Binford","email":"kbinfordpn@latimes.com"}
{"id":925,"first_name":"Sawyer","last_name":"Lesslie","email":"slessliepo@webnode.com"}
{"id":926,"first_name":"Billi","last_name":"Hunte","email":"bhuntepp@bravesites.com"}
{"id":927,"first_name":"Thaxter","last_name":"Mellows","email":"tmellowspq@twitpic.com"}
{"id":928,"first_name":"Shani","last_name":"Djokic","email":"sdjokicpr@fastcompany.com"}
{"id":929,"first_name":"Hardy","last_name":"Ambrogelli","email":"hambrogellips@goo.ne.jp"}
{"id":930,"first_name":"Antonie","last_name":"Georgins","email":"ageorginspt@seesaa.net"}
{"id":931,"first_name":"Ennis","last_name":"Schuck","email":"eschuckpu@globo.com"}
{"id":932,"first_name":"Jermayne","last_name":"Reeson","email":"jreesonpv@networkadvertising.org"}
{"id":933,"first_name":"Claudio","last_name":"Stener","email":"cstenerpw@dyndns.org"}
{"id":934,"first_name":"Stella","last_name":"McLeoid","email":"smcleoidpx@bigcartel.com"}
{"id":935,"first_name":"Steven","last_name":"Warby","email":"swarbypy@cnn.com"}
{"id":936,"first_name":"Oby","last_name":"Prangle","email":"opranglepz@dedecms.com"}
{"id":937,"first_name":"Kellsie","last_name":"Roberson","email":"krobersonq0@skyrock.com"}
{"id":938,"first_name":"Chiquia","last_name":"De la croix","email":"cdelacroixq1@virginia.edu"}
{"id":939,"first_name":"Richie","last_name":"Pyett","email":"rpyettq2@hexun.com"}
{"id":940,"first_name":"Darb","last_name":"Pavitt","email":"dpavittq3@bbb.org"}
{"id":941,"first_name":"Gwenneth","last_name":"Champken","email":"gchampkenq4@stanford.edu"}
{"id":942,"first_name":"Roger","last_name":"Lghan","email":"rlghanq5@cdbaby.com"}
{"id":943,"first_name":"Aurelia","last_name":"Golt","email":"agoltq6@opera.com"}
{"id":944,"first_name":"Stefa","last_name":"Polini","email":"spoliniq7@elpais.com"}
{"id":945,"first_name":"Elden","last_name":"Kuschek","email":"ekuschekq8@imageshack.us"}
{"id":946,"first_name":"Lucille","last_name":"Davidy","email":"ldavidyq9@paginegialle.it"}
{"id":947,"first_name":"Amelina","last_name":"Rabson","email":"arabsonqa@ihg.com"}
{"id":948,"first_name":"Rustin","last_name":"Pickrill","email":"rpickrillqb@dedecms.com"}
{"id":949,"first_name":"Nicol","last_name":"Gargett","email":"ngargettqc@mit.edu"}
{"id":950,"first_name":"Malachi","last_name":"Chipman","email":"mchipmanqd@harvard.edu"}
{"id":951,"first_name":"Zebulon","last_name":"Wackly","email":"zwacklyqe@diigo.com"}
{"id":952,"first_name":"Casi","last_name":"Cosans","email":"ccosansqf@pbs.org"}
{"id":953,"first_name":"Gustavo","last_name":"Hampton","email":"ghamptonqg@tinyurl.com"}
{"id":954,"first_name":"Yves","last_name":"Dineen","email":"ydineenqh@godaddy.com"}
{"id":955,"first_name":"Ursala","last_name":"Oller","email":"uollerqi@jigsy.com"}
{"id":956,"first_name":"Emlynn","last_name":"Girardin","email":"egirardinqj@zdnet.com"}
{"id":957,"first_name":"Jarid","last_name":"Fargie","email":"jfargieqk@chicagotribune.com"}
{"id":958,"first_name":"Laurens","last_name":"Danihelka","email":"ldanihelkaql@gmpg.org"}
{"id":959,"first_name":"Ignaz","last_name":"Drinan","email":"idrinanqm@cbslocal.com"}
{"id":960,"first_name":"Michaela","last_name":"Benning","email":"mbenningqn@ocn.ne.jp"}
{"id":961,"first_name":"Anita","last_name":"Dericot","email":"adericotqo@ihg.com"}
{"id":962,"first_name":"Giselbert","last_name":"Grene","email":"ggreneqp@arizona.edu"}
{"id":963,"first_name":"Daphne","last_name":"Deny","email":"ddenyqq@google.co.uk"}
{"id":964,"first_name":"Josefa","last_name":"Scoular","email":"jscoularqr@cargocollective.com"}
{"id":965,"first_name":"Papagena","last_name":"Blatcher","email":"pblatcherqs@time.com"}
{"id":966,"first_name":"Symon","last_name":"Fearneley","email":"sfearneleyqt@usgs.gov"}
{"id":967,"first_name":"Flinn","last_name":"Oak","email":"foakqu@wsj.com"}
{"id":968,"first_name":"Aeriela","last_name":"Ofen","email":"aofenqv@about.me"}
{"id":969,"first_name":"Belia","last_name":"Abdee","email":"babdeeqw@lycos.com"}
{"id":970,"first_name":"Dee","last_name":"Sigg","email":"dsiggqx@360.cn"}
{"id":971,"first_name":"Gilberte","last_name":"Kitchin","email":"gkitchinqy@harvard.edu"}
{"id":972,"first_name":"Adelaide","last_name":"Clinch","email":"aclinchqz@opera.com"}
{"id":973,"first_name":"Lemmie","last_name":"Gonnet","email":"lgonnetr0@geocities.com"}
{"id":974,"first_name":"Redd","last_name":"Cham","email":"rchamr1@mtv.com"}
{"id":975,"first_name":"Hester","last_name":"Belton","email":"hbeltonr2@craigslist.org"}
{"id":976,"first_name":"Barry","last_name":"Sharrard","email":"bsharrardr3@mozilla.com"}
{"id":977,"first_name":"Carney","last_name":"Skepper","email":"cskepperr4@vkontakte.ru"}
{"id":978,"first_name":"Karleen","last_name":"Baigent","email":"kbaigentr5@topsy.com"}
{"id":979,"first_name":"Jany","last_name":"Geraghty","email":"jgeraghtyr6@google.com"}
{"id":980,"first_name":"Valdemar","last_name":"Kleinfeld","email":"vkleinfeldr7@github.io"}
{"id":981,"first_name":"Dierdre","last_name":"Sydenham","email":"dsydenhamr8@uiuc.edu"}
{"id":982,"first_name":"Florella","last_name":"Libermore","email":"flibermorer9@europa.eu"}
{"id":983,"first_name":"Stanley","last_name":"Agron","email":"sagronra@census.gov"}
{"id":984,"first_name":"Estel","last_name":"Guerrieri","email":"eguerrierirb@wikispaces.com"}
{"id":985,"first_name":"Leonie","last_name":"Potebury","email":"lpoteburyrc@ebay.co.uk"}
{"id":986,"first_name":"Freeland","last_name":"Caselli","email":"fcasellird@nydailynews.com"}
{"id":987,"first_name":"Sol","last_name":"Skamell","email":"sskamellre@gmpg.org"}
{"id":988,"first_name":"Jakie","last_name":"Portal","email":"jportalrf@freewebs.com"}
{"id":989,"first_name":"Flory","last_name":"Stothart","email":"fstothartrg@google.co.jp"}
{"id":990,"first_name":"Lacy","last_name":"Scotter","email":"lscotterrh@pagesperso-orange.fr"}
{"id":991,"first_name":"Mauricio","last_name":"Adamthwaite","email":"madamthwaiteri@cloudflare.com"}
{"id":992,"first_name":"Bev","last_name":"Whisson","email":"bwhissonrj@de.vu"}
{"id":993,"first_name":"Eryn","last_name":"Dowbakin","email":"edowbakinrk@salon.com"}
{"id":994,"first_name":"Marlo","last_name":"Craxford","email":"mcraxfordrl@aboutads.info"}
{"id":995,"first_name":"Tracy","last_name":"Dougliss","email":"tdouglissrm@php.net"}
{"id":996,"first_name":"Hermann","last_name":"Frantzen","email":"hfrantzenrn@sitemeter.com"}
{"id":997,"first_name":"Vivien","last_name":"Drewery","email":"vdreweryro@imgur.com"}
{"id":998,"first_name":"Papageno","last_name":"Greenstead","email":"pgreensteadrp@seattletimes.com"}
{"id":999,"first_name":"Freeman","last_name":"Laguerre","email":"flaguerrerq@cisco.com"}
{"id":1000,"first_name":"Cameron","last_name":"Tocque","email":"ctocquerr@newsvine.com"}

================================================
FILE: quickwit/quickwit-doc-mapper/benches/data/simple-routing-expression-bench.json
================================================
{"timestamp": 1698386133268880, "source": "custom_dealercrawl", "vin": "2GCUDDED0R1145310", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133269998, "source": "custom_dealercrawl", "vin": "1GNSKMKT9PR546598", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386133270959, "source": "custom_dealercrawl", "vin": "1GT49PE78PF120870", "vid": "ae45b13a0a0e094a6d02e389bbed910c", "date": "2023-10-26", "domain": "www.basilvw.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386133271875, "source": "custom_dealercrawl", "vin": "1GKS2DKL0MR129721", "vid": "b3504f5c0a0e0a9939aadd20361ee300", "date": "2023-10-26", "domain": "www.basilvw.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386133272644, "source": "custom_dealercrawl", "vin": "1GT49RE75LF325021", "vid": "c4d98e290a0e081d6bd1a3a56ae3316c", "date": "2023-10-26", "domain": "www.basilvw.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133273487, "source": "custom_dealercrawl", "vin": "1GNSKBED9PR545024", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386133274290, "source": "custom_dealercrawl", "vin": "1GNEVKKWXPJ299402", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386133275046, "source": "custom_dealercrawl", "vin": "1GNEVKKW4PJ315044", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133275396, "source": "custom_dealercrawl", "vin": "1GNEVJKW8PJ298811", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386133275696, "source": "custom_dealercrawl", "vin": "3GTU9DED0LG360508", "vid": "f41107ba0a0e0a9a2d62f34c045a09fb", "date": "2023-10-26", "domain": "www.basilvw.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133275998, "source": "custom_dealercrawl", "vin": "1GNEVFKW5PJ303735", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386133276276, "source": "custom_dealercrawl", "vin": "1GNERNKW7PJ296754", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386133276550, "source": "custom_dealercrawl", "vin": "1GCUDJED5RZ165154", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386133276810, "source": "custom_dealercrawl", "vin": "1GCUDJED5RZ152193", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386133277182, "source": "custom_dealercrawl", "vin": "1GCUDGED8RZ138291", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386133277466, "source": "custom_dealercrawl", "vin": "1GCUDGED6PZ120207", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133277734, "source": "custom_dealercrawl", "vin": "1GCUDGE83RZ154188", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386133278077, "source": "custom_dealercrawl", "vin": "1GCUDEEL1RZ134255", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386133278398, "source": "custom_dealercrawl", "vin": "1GCUDEED9PZ113918", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133278656, "source": "custom_dealercrawl", "vin": "1FM5K8GC1LGB34005", "vid": "c4d98aa70a0e081d6bd1a3a56f70d391", "date": "2023-10-26", "domain": "www.basilvw.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133278989, "source": "custom_dealercrawl", "vin": "1GCUDEED7PZ280620", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386133279252, "source": "custom_dealercrawl", "vin": "1GCUDEED2PZ304676", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386133279560, "source": "custom_dealercrawl", "vin": "1GCUDEED1RZ165143", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133279874, "source": "custom_dealercrawl", "vin": "1GCUYEED3LZ335014", "vid": "233aa6af0a0e087f102b3b1d5cd62eea", "date": "2023-10-26", "domain": "www.basilvw.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386133280134, "source": "custom_dealercrawl", "vin": "1GCRDDED3RZ176824", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386133280403, "source": "custom_dealercrawl", "vin": "1FT7W2BT7KEG15697", "vid": "e8ea1e580a0e0a9260e76faa2bd7b4f1", "date": "2023-10-26", "domain": "www.basilvw.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386133280675, "source": "custom_dealercrawl", "vin": "1GCRDAED0PZ185444", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386133281034, "source": "custom_dealercrawl", "vin": "1FTFW1RG4NFB39096", "vid": "195b2dcd0a0e0a9a61540bbc7f86eac8", "date": "2023-10-26", "domain": "www.basilvw.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133281359, "source": "custom_dealercrawl", "vin": "1GTUUHEL3NZ514919", "vid": "ddba2a100a0e081d2e4f88904a3868a5", "date": "2023-10-26", "domain": "www.basilvw.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386133281604, "source": "custom_dealercrawl", "vin": "1GC4YVE74RF172409", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386133281892, "source": "custom_dealercrawl", "vin": "1GYS4EKL5MR400679", "vid": "ce4cf2cf0a0e0a941d829089895c9fae", "date": "2023-10-26", "domain": "www.basilvw.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386133282239, "source": "custom_dealercrawl", "vin": "3C63R3EL0NG159716", "vid": "5e681fd40a0e0a92336a2c1ea2a91f48", "date": "2023-10-26", "domain": "www.basilvw.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386133282533, "source": "custom_dealercrawl", "vin": "1GC3YTE73RF130474", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386133282796, "source": "custom_dealercrawl", "vin": "1GC3YSE7XRF160923", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386133283072, "source": "custom_dealercrawl", "vin": "1GC3YSE78RF160340", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133283390, "source": "custom_dealercrawl", "vin": "ZASPAKBN5N7D33543", "vid": "50f38ef90a0e0a992b96b96b80dfbc36", "date": "2023-10-26", "domain": "www.basilvw.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386133283672, "source": "custom_dealercrawl", "vin": "1GC3YSE76RF160112", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133283988, "source": "custom_dealercrawl", "vin": "ZARFANAN2L7626049", "vid": "faeda5f50a0e0a9a61540bbc6e49a9be", "date": "2023-10-26", "domain": "www.basilvw.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133284302, "source": "custom_dealercrawl", "vin": "WAUVVAFR6AA009328", "vid": "3c5a9bc50a0e087f42924702c68ba470", "date": "2023-10-26", "domain": "www.basilvw.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133284526, "source": "custom_dealercrawl", "vin": "2GCUDAEDXR1145166", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133284799, "source": "custom_dealercrawl", "vin": "2GC4YPEY0R1157790", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133285091, "source": "custom_dealercrawl", "vin": "2GC4YNE70R1120928", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133285352, "source": "custom_dealercrawl", "vin": "2GC4YME7XR1144180", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386133285580, "source": "custom_dealercrawl", "vin": "2GC4YME7XR1144177", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386133285863, "source": "custom_dealercrawl", "vin": "WBA7T4C08NCK38450", "vid": "f42080210a0e0a943a15604b5241a31f", "date": "2023-10-26", "domain": "www.basilvw.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386133286120, "source": "custom_dealercrawl", "vin": "5UXCR6C03L9C58192", "vid": "500a3d1e0a0e094a3883bfc3d8ceccc5", "date": "2023-10-26", "domain": "www.basilvw.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386133286466, "source": "custom_dealercrawl", "vin": "WBXYH9C08P5V63695", "vid": "4184a7810a0e0a9a6585850e913a6837", "date": "2023-10-26", "domain": "www.basilvw.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386133286778, "source": "custom_dealercrawl", "vin": "1HTKJPVK2PH387965", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133287356, "source": "custom_dealercrawl", "vin": "1HTKJPVK0PH598842", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386133287735, "source": "custom_dealercrawl", "vin": "KL4CJESBXLB327918", "vid": "184583ce0a0e0a913c8e19b0dec8f9c7", "date": "2023-10-26", "domain": "www.basilvw.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386133288096, "source": "custom_dealercrawl", "vin": "KL4CJASB6LB010338", "vid": "18469a970a0e0a943b89ecfdcc517607", "date": "2023-10-26", "domain": "www.basilvw.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386133288369, "source": "custom_dealercrawl", "vin": "1GNSKTKL4PR536961", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386133288638, "source": "custom_dealercrawl", "vin": "KL4CJASB0LB340301", "vid": "3c5a94950a0e087f429247026603afc8", "date": "2023-10-26", "domain": "www.basilvw.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133288935, "source": "custom_dealercrawl", "vin": "1GNSKRKD0PR547368", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386133289205, "source": "custom_dealercrawl", "vin": "1GNSKPKD7PR537974", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133289479, "source": "custom_dealercrawl", "vin": "2G1FK1EJ5D9177823", "vid": "71ecfa260a0e0a906df43755e35c073a", "date": "2023-10-26", "domain": "www.basilvw.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386133289771, "source": "custom_dealercrawl", "vin": "2G1FK3DJ5C9187909", "vid": "1845efab0a0e0a9a61540bbc97d89eed", "date": "2023-10-26", "domain": "www.basilvw.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386133290064, "source": "custom_dealercrawl", "vin": "2G1FK3DJ9B9194103", "vid": "1845703e0a0e0a930a4d1cb070747df2", "date": "2023-10-26", "domain": "www.basilvw.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386133290357, "source": "custom_dealercrawl", "vin": "2G1FK3DJXB9171817", "vid": "1bdbf7d00a0e094a62ba84ba2c2466f0", "date": "2023-10-26", "domain": "www.basilvw.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133290657, "source": "custom_dealercrawl", "vin": "1G1ZD5ST5RF108083", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133290954, "source": "custom_dealercrawl", "vin": "2G1FK3DJ8B9188647", "vid": "5d740da40a0e0a171983e9bd0190c4bc", "date": "2023-10-26", "domain": "www.basilvw.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133291291, "source": "custom_dealercrawl", "vin": "2G1FT1EW9B9121678", "vid": "40123a2d0a0e0a992b96b96b5c7f2fa4", "date": "2023-10-26", "domain": "www.basilvw.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133291568, "source": "custom_dealercrawl", "vin": "1G1YC3D49P5139882", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386133291887, "source": "custom_dealercrawl", "vin": "1G1YB3D46P5142225", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386133292167, "source": "custom_dealercrawl", "vin": "1G1FG3D74P0159539", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133292413, "source": "custom_dealercrawl", "vin": "1G1FE1R70P0159072", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386133292656, "source": "custom_dealercrawl", "vin": "1GC3YSE73RF149875", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386133292987, "source": "custom_dealercrawl", "vin": "1GC3YSE71RF154511", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133293285, "source": "custom_dealercrawl", "vin": "1GC3YLE77RF186014", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386133293580, "source": "custom_dealercrawl", "vin": "1GB5YSE72RF248118", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133293836, "source": "custom_dealercrawl", "vin": "1GB3YTE72RF155547", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386133294117, "source": "custom_dealercrawl", "vin": "1GB3YSE76RF219549", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386133294362, "source": "custom_dealercrawl", "vin": "1GB3YSE73RF165997", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133309877, "source": "custom_dealercrawl", "vin": "1GB0GRFP7P1150104", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386133310190, "source": "custom_dealercrawl", "vin": "1G1ZE5ST6PF240800", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386133310465, "source": "custom_dealercrawl", "vin": "1G1ZD5ST8RF108112", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133310752, "source": "custom_dealercrawl", "vin": "KL7CJPSB5JB703730", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133311070, "source": "custom_dealercrawl", "vin": "KL79MUSL9NB055307", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133311423, "source": "custom_dealercrawl", "vin": "3GNAXXEV1KS627838", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386133311695, "source": "custom_dealercrawl", "vin": "3GNAXUEV5LL267497", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133311990, "source": "custom_dealercrawl", "vin": "3GNAXSEV3KS603494", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133312245, "source": "custom_dealercrawl", "vin": "3GCUYEEL3MG247234", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133333811, "source": "custom_dealercrawl", "vin": "3GCUYDED3LG221363", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133334141, "source": "custom_dealercrawl", "vin": "3GCPDFEK1NG501398", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386133334392, "source": "custom_dealercrawl", "vin": "3GCPDCED4NG665390", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386133334642, "source": "custom_dealercrawl", "vin": "2GC4YUEY6N1232937", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386133334946, "source": "custom_dealercrawl", "vin": "1GC4YPE78LF156247", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386133335284, "source": "custom_dealercrawl", "vin": "1GC4YPE71MF258796", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133335565, "source": "custom_dealercrawl", "vin": "1GC1YNE70MF193849", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386133335905, "source": "custom_dealercrawl", "vin": "1GAZGPFG7L1237494", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386133336163, "source": "custom_dealercrawl", "vin": "1G1YY2D73H5103077", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386133351555, "source": "custom_dealercrawl", "vin": "1G1YB3D70K5109322", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133351882, "source": "custom_dealercrawl", "vin": "1G1PE5SB7E7112507", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386133352152, "source": "custom_dealercrawl", "vin": "1G11F5SL4FF195476", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133352432, "source": "custom_dealercrawl", "vin": "5GAEVAKW0LJ217885", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133352711, "source": "custom_dealercrawl", "vin": "3GKALVEV5ML305732", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386133353010, "source": "custom_dealercrawl", "vin": "1GCRYGEL2LZ112522", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386133353345, "source": "custom_dealercrawl", "vin": "1GCRYEED3LZ304173", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133353611, "source": "custom_dealercrawl", "vin": "1GCRYDED7NZ193379", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133353912, "source": "custom_dealercrawl", "vin": "1GCPYFEDXKZ289103", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386133364666, "source": "custom_dealercrawl", "vin": "1GCPYFED6LZ320090", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133365021, "source": "custom_dealercrawl", "vin": "1GCPYFED2LZ129380", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133365308, "source": "custom_dealercrawl", "vin": "1GCPYCEF5MZ451321", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386133365540, "source": "custom_dealercrawl", "vin": "1GCGTDE34G1330583", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386133365853, "source": "custom_dealercrawl", "vin": "1GC5YMEY5PF202554", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133366418, "source": "custom_dealercrawl", "vin": "1GC4YTE70NF180621", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133366723, "source": "custom_dealercrawl", "vin": "2G11Z5S39K9114885", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133367257, "source": "custom_dealercrawl", "vin": "1GNSKRKT7NR323437", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133367625, "source": "custom_dealercrawl", "vin": "1GNSKRKD5MR256750", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133381057, "source": "custom_dealercrawl", "vin": "1GNSKGKLXMR352045", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133381359, "source": "custom_dealercrawl", "vin": "1GNSKCKD7MR476355", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133381609, "source": "custom_dealercrawl", "vin": "1GNEVKKW2LJ237602", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386133381884, "source": "custom_dealercrawl", "vin": "1GCUYGET0MZ323357", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386133382123, "source": "custom_dealercrawl", "vin": "1GCUYEEDXLZ104871", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386133382411, "source": "custom_dealercrawl", "vin": "1GCUYBEF3KZ319717", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386133382722, "source": "custom_dealercrawl", "vin": "1GCUDEE83PZ102870", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386133383062, "source": "custom_dealercrawl", "vin": "SADF12FX3L1Z88367", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386133383382, "source": "custom_dealercrawl", "vin": "NMTKHMBX2MR137493", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133398814, "source": "custom_dealercrawl", "vin": "KNDPNCAC1H7255561", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133399150, "source": "custom_dealercrawl", "vin": "KNDMB5C10L6604551", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386133399443, "source": "custom_dealercrawl", "vin": "KNDCR3LE4P5042602", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386133399745, "source": "custom_dealercrawl", "vin": "KM8J23A49KU969899", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386133400025, "source": "custom_dealercrawl", "vin": "JTHG81F20N5048760", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386133400304, "source": "custom_dealercrawl", "vin": "JTEKU5JR8M5852396", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133400531, "source": "custom_dealercrawl", "vin": "JTEBU5JRXG5358237", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133400909, "source": "custom_dealercrawl", "vin": "JTDKAMFU6N3180730", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133401206, "source": "custom_dealercrawl", "vin": "1GTW7AFP6M1310458", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133401483, "source": "custom_dealercrawl", "vin": "1GTW7AFG9L1268253", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386133405976, "source": "custom_dealercrawl", "vin": "1GTUUDED1NZ643825", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386133406311, "source": "custom_dealercrawl", "vin": "1GTP9EEL4MZ171923", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133406559, "source": "custom_dealercrawl", "vin": "1GTG6CEN1H1223768", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386133406822, "source": "custom_dealercrawl", "vin": "1GKS2JKL6PR311586", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133407094, "source": "custom_dealercrawl", "vin": "1GKKNXLSXJZ113083", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386133422702, "source": "custom_dealercrawl", "vin": "WUAWAAFC9JN902605", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133423065, "source": "custom_dealercrawl", "vin": "WP1AA2A53NLB03425", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386133423422, "source": "custom_dealercrawl", "vin": "WDD1K6JB1KF072204", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386133423698, "source": "custom_dealercrawl", "vin": "WBAJS7C09LCE16859", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133424014, "source": "custom_dealercrawl", "vin": "WBAGV8C03PCL44518", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386133424317, "source": "custom_dealercrawl", "vin": "WAULFAFH8DN013907", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133424629, "source": "custom_dealercrawl", "vin": "WAUC4CF58NA009405", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133424938, "source": "custom_dealercrawl", "vin": "WAUA4CF57MA004024", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133425227, "source": "custom_dealercrawl", "vin": "WA1LAAF76KD007304", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133454121, "source": "custom_dealercrawl", "vin": "WA1CAAFY7M2017816", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386133454595, "source": "custom_dealercrawl", "vin": "WA1BNAFY0L2017008", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133454922, "source": "custom_dealercrawl", "vin": "WA12ABGE0LB035790", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386133455212, "source": "custom_dealercrawl", "vin": "W1K3G4FB9NJ375434", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133455530, "source": "custom_dealercrawl", "vin": "5TDJSKFC3MS005112", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133455947, "source": "custom_dealercrawl", "vin": "5TDGZRBH0LS008662", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133456265, "source": "custom_dealercrawl", "vin": "5TDDZ3DC9LS239674", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133456503, "source": "custom_dealercrawl", "vin": "5NPEF4JA7LH023396", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133456772, "source": "custom_dealercrawl", "vin": "5NMS2CAD5LH250070", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386133478001, "source": "custom_dealercrawl", "vin": "5LMTJ5DZ3NUL28344", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386133478424, "source": "custom_dealercrawl", "vin": "5LMCJ3D93KUL43281", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133478730, "source": "custom_dealercrawl", "vin": "5J8TC2H64ML800234", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386133479015, "source": "custom_dealercrawl", "vin": "5J6RM4H51GL087560", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386133479322, "source": "custom_dealercrawl", "vin": "5FNYF6H59MB014961", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133479594, "source": "custom_dealercrawl", "vin": "5FNRL6H95LB010646", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386133479924, "source": "custom_dealercrawl", "vin": "55SWF8EBXLU325311", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133480181, "source": "custom_dealercrawl", "vin": "4T1G11AKXMU407495", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133480425, "source": "custom_dealercrawl", "vin": "4S4BTGKD7L3186191", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133511190, "source": "custom_dealercrawl", "vin": "4S3GKAV67L3614428", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386133511520, "source": "custom_dealercrawl", "vin": "4S3BNAR67K3009805", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386133511884, "source": "custom_dealercrawl", "vin": "4JGFB4KB8LA042033", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133512133, "source": "custom_dealercrawl", "vin": "4JGFB4JB9LA180908", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386133512416, "source": "custom_dealercrawl", "vin": "3VV2B7AX9LM149646", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133512664, "source": "custom_dealercrawl", "vin": "3VV2B7AX1LM001880", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386133512998, "source": "custom_dealercrawl", "vin": "3VV0B7AXXMM019223", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386133513341, "source": "custom_dealercrawl", "vin": "JM3TCBDY0G0107485", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133513569, "source": "custom_dealercrawl", "vin": "JM3KFBCM3L0848807", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386133554061, "source": "custom_dealercrawl", "vin": "JM1GL1WY8L1511947", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386133554439, "source": "custom_dealercrawl", "vin": "JF2SKADC3MH450456", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386133554813, "source": "custom_dealercrawl", "vin": "JF2SKACC0KH523118", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133555130, "source": "custom_dealercrawl", "vin": "5YFEPMAE6MP244430", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386133555454, "source": "custom_dealercrawl", "vin": "5XXG34J23MG004125", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133555834, "source": "custom_dealercrawl", "vin": "5UXCR6C02N9K75226", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133556136, "source": "custom_dealercrawl", "vin": "5UX53DP02N9K31493", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133556516, "source": "custom_dealercrawl", "vin": "5TFCZ5AN4MX268847", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386133556913, "source": "custom_dealercrawl", "vin": "5TDJZRBH9MS106838", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386133575788, "source": "custom_dealercrawl", "vin": "3C4NJDBB5LT106928", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133576134, "source": "custom_dealercrawl", "vin": "2FMPK4K98LBA22192", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386133576436, "source": "custom_dealercrawl", "vin": "2FMPK4J94NBA51676", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386133576696, "source": "custom_dealercrawl", "vin": "2C4RC1N77KR657719", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386133577029, "source": "custom_dealercrawl", "vin": "2C4RC1EG5LR121448", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386133577341, "source": "custom_dealercrawl", "vin": "2C4RC1BG0MR574995", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386133577629, "source": "custom_dealercrawl", "vin": "2C3CDZBT7HH513223", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133577978, "source": "custom_dealercrawl", "vin": "1V2UR2CAXKC618353", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386133578265, "source": "custom_dealercrawl", "vin": "1N6ED1EK1NN606666", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133591613, "source": "custom_dealercrawl", "vin": "1N6BA1F45KN525158", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386133591993, "source": "custom_dealercrawl", "vin": "1N4AA6EV0LC379776", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386133592308, "source": "custom_dealercrawl", "vin": "1HGCV3F56MA020208", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133592563, "source": "custom_dealercrawl", "vin": "3VWEM7BU5RM006791", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133592968, "source": "custom_dealercrawl", "vin": "3VVEX7B2XRM008059", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386133593294, "source": "custom_dealercrawl", "vin": "3VVEX7B22RM009819", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386133593662, "source": "custom_dealercrawl", "vin": "WVWHA7CDXRW125301", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133594035, "source": "custom_dealercrawl", "vin": "1GYS4JKL2NR104786", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386133594330, "source": "custom_dealercrawl", "vin": "3VV4X7B21RM015803", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133601233, "source": "custom_dealercrawl", "vin": "1GYS4FKL2MR305325", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386133601540, "source": "custom_dealercrawl", "vin": "1GYS4DKJ4LR186629", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386133601975, "source": "custom_dealercrawl", "vin": "1V2KR2CA7RC529308", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386133602258, "source": "custom_dealercrawl", "vin": "1V2KR2CA5RC528464", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386133602584, "source": "custom_dealercrawl", "vin": "WVWAR7AN1PE010224", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133602903, "source": "custom_dealercrawl", "vin": "1V2VMPE8XPC015467", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386133603211, "source": "custom_dealercrawl", "vin": "1G6DH5RL3L0150549", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133603510, "source": "custom_dealercrawl", "vin": "1G6AW5SX8K0107586", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386133603832, "source": "custom_dealercrawl", "vin": "1FTRF3B61KEC64391", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386133620398, "source": "custom_dealercrawl", "vin": "1FTFW1E80MFB98630", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133620725, "source": "custom_dealercrawl", "vin": "1FTEW1EP9MFA96665", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386133621066, "source": "custom_dealercrawl", "vin": "1FT8W3BT7JEC71958", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133621345, "source": "custom_dealercrawl", "vin": "1FT8W2BT6NEC29443", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386133621619, "source": "custom_dealercrawl", "vin": "1FT7W3BT5LEC65056", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386133621963, "source": "custom_dealercrawl", "vin": "3VVMB7AX4RM035085", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386133622372, "source": "custom_dealercrawl", "vin": "1FMSK8DH0LGC55725", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133622679, "source": "custom_dealercrawl", "vin": "1FMJU2ATXKEA77571", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133622982, "source": "custom_dealercrawl", "vin": "3VV8B7AX7RM036670", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386133630960, "source": "custom_dealercrawl", "vin": "WVW2A7CDXRW124459", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133631372, "source": "custom_dealercrawl", "vin": "1V2AE2CA4RC213775", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386133631672, "source": "custom_dealercrawl", "vin": "1V2AE2CA8RC213150", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386133631970, "source": "custom_dealercrawl", "vin": "1V2WNPE89PC046503", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133632242, "source": "custom_dealercrawl", "vin": "1V2WNPE88PC049859", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133632473, "source": "custom_dealercrawl", "vin": "1V2WNPE84PC038521", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386133632831, "source": "custom_dealercrawl", "vin": "1V2FE2CA5RC214603", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386133633138, "source": "custom_dealercrawl", "vin": "1C6SRFFT7NN457229", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386133655734, "source": "custom_dealercrawl", "vin": "1C6SRFFT5LN125674", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133656118, "source": "custom_dealercrawl", "vin": "1V2WNPE88PC047884", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133656416, "source": "custom_dealercrawl", "vin": "1V2WNPE82PC045824", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386133656679, "source": "custom_dealercrawl", "vin": "1V2FR2CA6RC524389", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386133657102, "source": "custom_dealercrawl", "vin": "1V2FR2CA7RC529066", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133657380, "source": "custom_dealercrawl", "vin": "1V2JNPE80PC050319", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386133657630, "source": "custom_dealercrawl", "vin": "3VWBM7BU0RM020102", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386133657919, "source": "custom_dealercrawl", "vin": "3VW7M7BU5RM021963", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133658194, "source": "custom_dealercrawl", "vin": "3VW9T7BU0RM021669", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133669957, "source": "custom_dealercrawl", "vin": "3VV2B7AX2KM060323", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386133670355, "source": "custom_dealercrawl", "vin": "3VV2B7AX3LM144345", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133670736, "source": "custom_dealercrawl", "vin": "1V2RE2CA8MC203553", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386133671100, "source": "custom_dealercrawl", "vin": "3VWGZ7AJXBM076102", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133671448, "source": "custom_dealercrawl", "vin": "3VV2B7AX3KM052120", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386133671731, "source": "custom_dealercrawl", "vin": "3VV2B7AX2MM003719", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133672124, "source": "custom_dealercrawl", "vin": "1V2LR2CA5KC565816", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133672413, "source": "custom_dealercrawl", "vin": "KMHGH4JH4CU052338", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133731015, "source": "custom_dealercrawl", "vin": "KNDEPCAA8M7084818", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133731396, "source": "custom_dealercrawl", "vin": "5N1AT3BB6MC786205", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386133731701, "source": "custom_dealercrawl", "vin": "4T1K61BKXLU010846", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386133732018, "source": "custom_dealercrawl", "vin": "5N1DR2MM5KC649659", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133732301, "source": "custom_dealercrawl", "vin": "19UUB1F39LA016667", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133732565, "source": "custom_dealercrawl", "vin": "JN1BJ1CW0NW683093", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386133732868, "source": "custom_dealercrawl", "vin": "1J4FA54198L519317", "vid": "", "date": "2023-10-26", "domain": "thejeepdepot.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386133733178, "source": "custom_dealercrawl", "vin": "1C4AJWAG6GL152115", "vid": "", "date": "2023-10-26", "domain": "thejeepdepot.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133733415, "source": "custom_dealercrawl", "vin": "1J4AA2D14AL141924", "vid": "", "date": "2023-10-26", "domain": "thejeepdepot.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386133733648, "source": "custom_dealercrawl", "vin": "5N1AT3CBXMC845562", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133773860, "source": "custom_dealercrawl", "vin": "1C4AJWAG5CL215389", "vid": "", "date": "2023-10-26", "domain": "thejeepdepot.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386133774253, "source": "custom_dealercrawl", "vin": "1J4FA24117L218604", "vid": "", "date": "2023-10-26", "domain": "thejeepdepot.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133774574, "source": "custom_dealercrawl", "vin": "1FTEW1EG1FFA18612", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133774999, "source": "custom_dealercrawl", "vin": "1C4GJXAGXLW223308", "vid": "", "date": "2023-10-26", "domain": "thejeepdepot.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386133775330, "source": "custom_dealercrawl", "vin": "1J4AA2D19BL557680", "vid": "", "date": "2023-10-26", "domain": "thejeepdepot.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386133775680, "source": "custom_dealercrawl", "vin": "1FTEW1EG3HFA54823", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386133776001, "source": "custom_dealercrawl", "vin": "2C3CDXJG5NH107400", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386133776318, "source": "custom_dealercrawl", "vin": "1C4RJFBG5KC539748", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386133776560, "source": "custom_dealercrawl", "vin": "1J4FA39S93P344607", "vid": "", "date": "2023-10-26", "domain": "thejeepdepot.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133776906, "source": "custom_dealercrawl", "vin": "1J4AA2D14BL537658", "vid": "", "date": "2023-10-26", "domain": "thejeepdepot.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386133791019, "source": "custom_dealercrawl", "vin": "19UDE4H37PA009583", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133791372, "source": "custom_dealercrawl", "vin": "1C6RR7KG4JS253111", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133791688, "source": "custom_dealercrawl", "vin": "1J4FA39S32P723231", "vid": "", "date": "2023-10-26", "domain": "thejeepdepot.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133791991, "source": "custom_dealercrawl", "vin": "5J8TC2H34KL026652", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386133792307, "source": "custom_dealercrawl", "vin": "2HKRW2H58NH660864", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386133792544, "source": "custom_dealercrawl", "vin": "1C4AJWAG7HL580177", "vid": "", "date": "2023-10-26", "domain": "thejeepdepot.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386133792879, "source": "custom_dealercrawl", "vin": "1C4AJWAG9EL250097", "vid": "", "date": "2023-10-26", "domain": "thejeepdepot.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386133793185, "source": "custom_dealercrawl", "vin": "JN8BT3DD7NW270480", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386133793435, "source": "custom_dealercrawl", "vin": "5N1DR3DK7NC202985", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386133810322, "source": "custom_dealercrawl", "vin": "1J4FA69S73P310361", "vid": "", "date": "2023-10-26", "domain": "thejeepdepot.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133810644, "source": "custom_dealercrawl", "vin": "1C4BJWDG6EL179599", "vid": "", "date": "2023-10-26", "domain": "thejeepdepot.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386133810975, "source": "custom_dealercrawl", "vin": "1C4AJWAG6FL632329", "vid": "", "date": "2023-10-26", "domain": "thejeepdepot.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386133811314, "source": "custom_dealercrawl", "vin": "1C4BJWDG1DL610140", "vid": "", "date": "2023-10-26", "domain": "thejeepdepot.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386133811592, "source": "custom_dealercrawl", "vin": "1C4AJWAG8DL517163", "vid": "", "date": "2023-10-26", "domain": "thejeepdepot.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386133811910, "source": "custom_dealercrawl", "vin": "JM1BM1T7XF1263126", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133812190, "source": "custom_dealercrawl", "vin": "1C4AJWAG0CL126524", "vid": "", "date": "2023-10-26", "domain": "thejeepdepot.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386133812437, "source": "custom_dealercrawl", "vin": "1C4RJKBG8M8173296", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133812684, "source": "custom_dealercrawl", "vin": "5NPEC4ACXBH284871", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133812997, "source": "custom_dealercrawl", "vin": "1C4RJHEG9N8621383", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133818109, "source": "custom_dealercrawl", "vin": "1C4BJWDG9JL838785", "vid": "", "date": "2023-10-26", "domain": "thejeepdepot.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133818418, "source": "custom_dealercrawl", "vin": "1C4RJFLG2LC135600", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386133818675, "source": "custom_dealercrawl", "vin": "1C4RJFCG6LC437438", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386133818983, "source": "custom_dealercrawl", "vin": "1C4RJFBGXLC243352", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133819329, "source": "custom_dealercrawl", "vin": "1C4RJFBGXKC674837", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386133819610, "source": "custom_dealercrawl", "vin": "3N1CP5CV4ML475174", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133819911, "source": "custom_dealercrawl", "vin": "JF1GPAA62E8220984", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133820184, "source": "custom_dealercrawl", "vin": "3N1AB8CVXLY263601", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386133820411, "source": "custom_dealercrawl", "vin": "1C4BJWDG2FL571688", "vid": "", "date": "2023-10-26", "domain": "thejeepdepot.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133826619, "source": "custom_dealercrawl", "vin": "JH4KC1F94EC005217", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133826957, "source": "custom_dealercrawl", "vin": "3N1CN8EV5ML880397", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386133827282, "source": "custom_dealercrawl", "vin": "1J4BA3H13AL218920", "vid": "", "date": "2023-10-26", "domain": "thejeepdepot.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386133827553, "source": "custom_dealercrawl", "vin": "3KPF24AD0ME269643", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133827902, "source": "custom_dealercrawl", "vin": "3FMCR9B63MRA46769", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133828201, "source": "custom_dealercrawl", "vin": "3FA6P0T91LR197271", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386133828433, "source": "custom_dealercrawl", "vin": "3FA6P0SU5LR235414", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133828734, "source": "custom_dealercrawl", "vin": "3FA6P0HD2KR159334", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133829069, "source": "custom_dealercrawl", "vin": "3FA6P0H9XHR192831", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133848546, "source": "custom_dealercrawl", "vin": "3CZRU6H52MM717351", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386133848871, "source": "custom_dealercrawl", "vin": "3C63R3EJ2JG430333", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133849167, "source": "custom_dealercrawl", "vin": "3C4PDCGB8LT268751", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386133849537, "source": "custom_dealercrawl", "vin": "3C4NJDCB2MT511421", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133849814, "source": "custom_dealercrawl", "vin": "1GYS4BKL6MR254436", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133850232, "source": "custom_dealercrawl", "vin": "1GYS4AKJXLR180302", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386133850525, "source": "custom_dealercrawl", "vin": "3N1AB8CV5MY263300", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386133850802, "source": "custom_dealercrawl", "vin": "3N1CP5CV6NL522318", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386133851134, "source": "custom_dealercrawl", "vin": "1GKKNSLS6KZ233905", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386133858634, "source": "custom_dealercrawl", "vin": "JTMDJREVXJD202989", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133858979, "source": "custom_dealercrawl", "vin": "5N1AZ2AS6MC147137", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133859326, "source": "custom_dealercrawl", "vin": "1C4BJWDG1FL518979", "vid": "", "date": "2023-10-26", "domain": "thejeepdepot.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386133859618, "source": "custom_dealercrawl", "vin": "1C4BJWFG2GL180104", "vid": "", "date": "2023-10-26", "domain": "thejeepdepot.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133859934, "source": "custom_dealercrawl", "vin": "1C4BJWDG9GL226000", "vid": "", "date": "2023-10-26", "domain": "thejeepdepot.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386133860238, "source": "custom_dealercrawl", "vin": "WMW13DJ01N2S48557", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386133860494, "source": "custom_dealercrawl", "vin": "1GYKPDRS9MZ151849", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386133860801, "source": "custom_dealercrawl", "vin": "1GYKNHRS1PZ177153", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133861126, "source": "custom_dealercrawl", "vin": "5N1DL1GS1PC352045", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133861387, "source": "custom_dealercrawl", "vin": "1GYKNGRS4KZ256044", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386133870550, "source": "custom_dealercrawl", "vin": "WA1VWBF78ND001041", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386133870906, "source": "custom_dealercrawl", "vin": "19UUB1F55LA012441", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133871236, "source": "custom_dealercrawl", "vin": "19UUB3F39LA001355", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133871537, "source": "custom_dealercrawl", "vin": "1GYKNDRS7MZ110528", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386133871899, "source": "custom_dealercrawl", "vin": "1GYKNDRS4NZ115963", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386133872184, "source": "custom_dealercrawl", "vin": "1GYKNDRS1NZ111403", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133872441, "source": "custom_dealercrawl", "vin": "19UDE4H68PA020232", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386133872689, "source": "custom_dealercrawl", "vin": "1N6AA1E56HN529816", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386133887049, "source": "custom_dealercrawl", "vin": "19UDE4H68PA011188", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386133887400, "source": "custom_dealercrawl", "vin": "1GYFZDR4XLF127072", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133887674, "source": "custom_dealercrawl", "vin": "1GYFZDR4XKF212265", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133887996, "source": "custom_dealercrawl", "vin": "1C4RJFBG0MC565936", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386133888359, "source": "custom_dealercrawl", "vin": "1G6DX5RKXL0135783", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133888666, "source": "custom_dealercrawl", "vin": "5J8TC2H33KL039411", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133888980, "source": "custom_dealercrawl", "vin": "3TMCZ5AN4NM496905", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386133889300, "source": "custom_dealercrawl", "vin": "1G6DS1E38C0117529", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133889537, "source": "custom_dealercrawl", "vin": "5J8YD4H88LL013138", "vid": "", "date": "2023-10-26", "domain": "www.speedcraftvw.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133905875, "source": "custom_dealercrawl", "vin": "1C4RJFBG8LC415281", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386133906219, "source": "custom_dealercrawl", "vin": "1C4RJFBG0LC273797", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133906455, "source": "custom_dealercrawl", "vin": "1C4RJFAGXKC853932", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133906700, "source": "custom_dealercrawl", "vin": "1C4RJFAG4LC242439", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133907041, "source": "custom_dealercrawl", "vin": "1C4PJMDXXKD299938", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386133907382, "source": "custom_dealercrawl", "vin": "1C4HJXEG3MW561939", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386133907659, "source": "custom_dealercrawl", "vin": "1C4HJXAGXPW581986", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386133907962, "source": "custom_dealercrawl", "vin": "19XFL2H86NE014300", "vid": "", "date": "2023-10-26", "domain": "www.blasiuschevrolet.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386133908232, "source": "custom_dealercrawl", "vin": "1C4BJWDG7FL766041", "vid": "", "date": "2023-10-26", "domain": "thejeepdepot.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386133976110, "source": "custom_dealercrawl", "vin": "1C4BJWDG2FL585896", "vid": "", "date": "2023-10-26", "domain": "thejeepdepot.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133976476, "source": "custom_dealercrawl", "vin": "1C4BJWDG5GL110244", "vid": "", "date": "2023-10-26", "domain": "thejeepdepot.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386133976837, "source": "custom_dealercrawl", "vin": "1C4HJWEG4EL203990", "vid": "", "date": "2023-10-26", "domain": "thejeepdepot.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386133977140, "source": "custom_dealercrawl", "vin": "1C4HJWEG0CL201943", "vid": "", "date": "2023-10-26", "domain": "thejeepdepot.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386133977383, "source": "custom_dealercrawl", "vin": "1C4HJWEG6HL502319", "vid": "", "date": "2023-10-26", "domain": "thejeepdepot.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386133977633, "source": "custom_dealercrawl", "vin": "1C4BJWEG4HL631049", "vid": "", "date": "2023-10-26", "domain": "thejeepdepot.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133977956, "source": "custom_dealercrawl", "vin": "1C4BJWEG2DL574683", "vid": "", "date": "2023-10-26", "domain": "thejeepdepot.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386133978248, "source": "custom_dealercrawl", "vin": "1C4BJWDG7GL266690", "vid": "", "date": "2023-10-26", "domain": "thejeepdepot.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386133978473, "source": "custom_dealercrawl", "vin": "1C4BJWDG2EL115933", "vid": "", "date": "2023-10-26", "domain": "thejeepdepot.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386134023945, "source": "custom_dealercrawl", "vin": "1C4BJWDG8GL289248", "vid": "", "date": "2023-10-26", "domain": "thejeepdepot.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386134024319, "source": "custom_dealercrawl", "vin": "1C4HJXDN1MW544542", "vid": "", "date": "2023-10-26", "domain": "thejeepdepot.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386134024610, "source": "custom_dealercrawl", "vin": "1C4BJWDG7HL635002", "vid": "", "date": "2023-10-26", "domain": "thejeepdepot.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386134025015, "source": "custom_dealercrawl", "vin": "1C4HJWDG5CL140882", "vid": "", "date": "2023-10-26", "domain": "thejeepdepot.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386134025300, "source": "custom_dealercrawl", "vin": "1J8GA59138L587270", "vid": "", "date": "2023-10-26", "domain": "thejeepdepot.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386134025560, "source": "custom_dealercrawl", "vin": "1C4BJWDG8FL685517", "vid": "", "date": "2023-10-26", "domain": "thejeepdepot.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386134025847, "source": "custom_dealercrawl", "vin": "1C4BJWEGXFL529140", "vid": "", "date": "2023-10-26", "domain": "thejeepdepot.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386134026152, "source": "custom_dealercrawl", "vin": "1C4BJWDG4FL745289", "vid": "", "date": "2023-10-26", "domain": "thejeepdepot.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386134026519, "source": "custom_dealercrawl", "vin": "1C4BJWEG8HL751694", "vid": "", "date": "2023-10-26", "domain": "thejeepdepot.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386134026777, "source": "custom_dealercrawl", "vin": "1C4BJWDG8DL594924", "vid": "", "date": "2023-10-26", "domain": "thejeepdepot.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386134155775, "source": "custom_dealercrawl", "vin": "1J4BA3H17AL138715", "vid": "", "date": "2023-10-26", "domain": "thejeepdepot.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386134156150, "source": "custom_dealercrawl", "vin": "1C4BJWEG7GL284881", "vid": "", "date": "2023-10-26", "domain": "thejeepdepot.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386134998956, "source": "custom_dealercrawl", "vin": "JTDKAMFU6N3166469", "vid": "dc91a3f80a0e0a995e11ea711d17f70f", "date": "2023-10-26", "domain": "www.shapentoyota.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386135016926, "source": "custom_dealercrawl", "vin": "4T1C11AK3LU369735", "vid": "e6f6f8360a0e0a992cac085c2ced42f5", "date": "2023-10-26", "domain": "www.shapentoyota.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386135017300, "source": "custom_dealercrawl", "vin": "1G1ZD5ST1NF121455", "vid": "e577a5f20a0e0a936891e4acda13017a", "date": "2023-10-26", "domain": "www.shapentoyota.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386135017620, "source": "custom_dealercrawl", "vin": "1G6DB5RK7N0116335", "vid": "32b380bf0a0e0a906c8422562b1409de", "date": "2023-10-26", "domain": "www.shapentoyota.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386135017935, "source": "custom_dealercrawl", "vin": "2T3WFREV4GW288225", "vid": "4dfc33f70a0e094a3883bfc33cd2fa8a", "date": "2023-10-26", "domain": "www.shapentoyota.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386135018250, "source": "custom_dealercrawl", "vin": "3CZRU5H51NM739353", "vid": "dc91a04c0a0e0a995e11ea7109195bb5", "date": "2023-10-26", "domain": "www.shapentoyota.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386135018488, "source": "custom_dealercrawl", "vin": "2HGFC2F54HH533722", "vid": "ae684a6f0a0e0a9057a7066da9769c19", "date": "2023-10-26", "domain": "www.shapentoyota.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386135155940, "source": "custom_dealercrawl", "vin": "5J6RT6H53NL023709", "vid": "dc91a6120a0e0a995e11ea719977e5ab", "date": "2023-10-26", "domain": "www.shapentoyota.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386135156346, "source": "custom_dealercrawl", "vin": "1C6HJTFG9NL120530", "vid": "ff35ad660a0e094a1e8bea621ee5b473", "date": "2023-10-26", "domain": "www.shapentoyota.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386135156658, "source": "custom_dealercrawl", "vin": "1HD1KBM15CB624431", "vid": "306e8c1e0a0e0a90290b5a5cca8f87a3", "date": "2023-10-26", "domain": "www.shapentoyota.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386136305075, "source": "custom_dealercrawl", "vin": "3KPF24AD5RE701490", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386136354464, "source": "custom_dealercrawl", "vin": "5XYK33DF4RG157196", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386136354835, "source": "custom_dealercrawl", "vin": "5XYRL4LC7PG230943", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386136355170, "source": "custom_dealercrawl", "vin": "3KPA24AD3PE621757", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386136355509, "source": "custom_dealercrawl", "vin": "3KPF24AD5RE701974", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386136355870, "source": "custom_dealercrawl", "vin": "5XYK6CDF9RG154740", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386136356173, "source": "custom_dealercrawl", "vin": "3KPA24AD0PE617505", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386136356482, "source": "custom_dealercrawl", "vin": "3KPA24AD2PE622723", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386136356833, "source": "custom_dealercrawl", "vin": "3KPA24AD1PE613530", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386136357142, "source": "custom_dealercrawl", "vin": "3KPA24AD7PE618750", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386136357426, "source": "custom_dealercrawl", "vin": "3KPA24AD7PE621597", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386136381496, "source": "custom_dealercrawl", "vin": "3KPA24AD0PE621926", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386136381837, "source": "custom_dealercrawl", "vin": "3KPF24AD9PE684741", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386136382147, "source": "custom_dealercrawl", "vin": "3KPF24AD5RE706320", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386136382413, "source": "custom_dealercrawl", "vin": "3KPF24ADXPE690516", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386136382675, "source": "custom_dealercrawl", "vin": "3KPF24AD1RE702944", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386136382999, "source": "custom_dealercrawl", "vin": "3KPF24AD9PE690636", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386136383344, "source": "custom_dealercrawl", "vin": "3KPF24AD5RE701358", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386136383655, "source": "custom_dealercrawl", "vin": "3KPF24AD2RE704721", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386136383926, "source": "custom_dealercrawl", "vin": "3KPF24AD2RE695468", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386136384201, "source": "custom_dealercrawl", "vin": "KNDJ23AU9R7900577", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386136398802, "source": "custom_dealercrawl", "vin": "KNDJ23AU1P7894254", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386136399132, "source": "custom_dealercrawl", "vin": "3KPF24AD4PE666194", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386136399497, "source": "custom_dealercrawl", "vin": "3KPF54AD2RE704659", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386136399828, "source": "custom_dealercrawl", "vin": "5XXG64J28RG251896", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386136400111, "source": "custom_dealercrawl", "vin": "5XXG64J2XRG253990", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386136400411, "source": "custom_dealercrawl", "vin": "KNDPU3DF6R7217821", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386136400676, "source": "custom_dealercrawl", "vin": "5XXG64J27RG250822", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386136400986, "source": "custom_dealercrawl", "vin": "5XYK33DF5RG150077", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386136401313, "source": "custom_dealercrawl", "vin": "KNDPUCDF7R7222896", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386136405694, "source": "custom_dealercrawl", "vin": "5XYK33DF6RG161430", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386136406109, "source": "custom_dealercrawl", "vin": "5XYRG4LC6PG237239", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386136406389, "source": "custom_dealercrawl", "vin": "5XYRG4LCXPG238068", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386136406660, "source": "custom_dealercrawl", "vin": "5XYRG4LC8PG230289", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386136407124, "source": "custom_dealercrawl", "vin": "5XYRL4LC2PG231207", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386136421565, "source": "custom_dealercrawl", "vin": "5XYK53DF8RG144509", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386136421909, "source": "custom_dealercrawl", "vin": "5XYK53DF6RG151877", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386136422226, "source": "custom_dealercrawl", "vin": "5XYRH4LF1PG230254", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386136422494, "source": "custom_dealercrawl", "vin": "5XYRH4LF5PG225302", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386136422815, "source": "custom_dealercrawl", "vin": "5XYK7CDF3RG154665", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386136423076, "source": "custom_dealercrawl", "vin": "5XYK7CDF3RG151832", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386136423373, "source": "custom_dealercrawl", "vin": "5XYRH4LF4PG230054", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386136423658, "source": "custom_dealercrawl", "vin": "5XYK7CDF7RG162302", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386136423989, "source": "custom_dealercrawl", "vin": "5XYP64GC0RG444118", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386136451599, "source": "custom_dealercrawl", "vin": "5XYRHDLF4PG226845", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386136451954, "source": "custom_dealercrawl", "vin": "5XYP3DGC3RG450732", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386136452294, "source": "custom_dealercrawl", "vin": "KNDRMDLH4P5217245", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386136452625, "source": "custom_dealercrawl", "vin": "5XYP5DGC4RG456873", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386136452888, "source": "custom_dealercrawl", "vin": "5XYP5DGC2RG452918", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386136453167, "source": "custom_dealercrawl", "vin": "3KPF24AD2RE708154", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386136453393, "source": "custom_dealercrawl", "vin": "3KPF24AD8RE708241", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386136453633, "source": "custom_dealercrawl", "vin": "3KPF24AD6RE708948", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386136453893, "source": "custom_dealercrawl", "vin": "5XXG64J20RG251892", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386136454146, "source": "custom_dealercrawl", "vin": "5XYK33DF5RG160656", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386136471573, "source": "custom_dealercrawl", "vin": "5XXG44J88RG254680", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386136471898, "source": "custom_dealercrawl", "vin": "5XXG34J27RG251333", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386136472169, "source": "custom_dealercrawl", "vin": "5XYRH4LF8PG231983", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386136472398, "source": "custom_dealercrawl", "vin": "5XYRH4LF9PG228638", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386136472652, "source": "custom_dealercrawl", "vin": "5XYP5DGC0RG450892", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386136472984, "source": "custom_dealercrawl", "vin": "5XYPH4A19HG277077", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386136473264, "source": "custom_dealercrawl", "vin": "KNDJN2A2XK7010658", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386136473510, "source": "custom_dealercrawl", "vin": "3KPF24AD8ME324436", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386136473817, "source": "custom_dealercrawl", "vin": "5XXGU4L38JG248299", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386136474118, "source": "custom_dealercrawl", "vin": "KNDJ23AU5L7704613", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386136502735, "source": "custom_dealercrawl", "vin": "KNDJ23AU8N7168307", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386136503071, "source": "custom_dealercrawl", "vin": "KNDJ23AU6M7790693", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386136503394, "source": "custom_dealercrawl", "vin": "3KPF24AD5LE247104", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386136503676, "source": "custom_dealercrawl", "vin": "3KPF44AC5PE525653", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386136503940, "source": "custom_dealercrawl", "vin": "3KPF44AC9NE483050", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386136504224, "source": "custom_dealercrawl", "vin": "3KPF44ACXPE570068", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386136504469, "source": "custom_dealercrawl", "vin": "KNDMA5C14L6583416", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386136504767, "source": "custom_dealercrawl", "vin": "5XXG64J24NG144841", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386136505125, "source": "custom_dealercrawl", "vin": "3KPF54AD5PE662887", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386136505424, "source": "custom_dealercrawl", "vin": "KNDPNCAC5M7891992", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386136516101, "source": "custom_dealercrawl", "vin": "KNDPU3AG4P7059375", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386136516433, "source": "custom_dealercrawl", "vin": "KNDPRCA67L7744778", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386136516736, "source": "custom_dealercrawl", "vin": "5XYP3DHC1MG101186", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386136517054, "source": "custom_dealercrawl", "vin": "5XYK53AF4PG062486", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386136517316, "source": "custom_dealercrawl", "vin": "KNAE35LC3M6092222", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386136517542, "source": "custom_dealercrawl", "vin": "5XYP34HC8NG225957", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386136517788, "source": "custom_dealercrawl", "vin": "5XYRK4LF7NG150987", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386136518127, "source": "custom_dealercrawl", "vin": "5XYK5CDF2RG146465", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386136518383, "source": "custom_dealercrawl", "vin": "5XYP5DGC7PG355453", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386136535933, "source": "custom_dealercrawl", "vin": "2GNALDEK4C6216921", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386136536251, "source": "custom_dealercrawl", "vin": "1N6AD0EV6FN733787", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386136536484, "source": "custom_dealercrawl", "vin": "3C4PDDEG1JT277972", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386136536770, "source": "custom_dealercrawl", "vin": "5NPE34AF6KH820628", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386136537073, "source": "custom_dealercrawl", "vin": "3VV3B7AX7KM131651", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386136537424, "source": "custom_dealercrawl", "vin": "1FMCU9H90LUB85622", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386136537678, "source": "custom_dealercrawl", "vin": "4S4BTADC7M3194424", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386136537963, "source": "custom_dealercrawl", "vin": "KM8J33AL0LU119214", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386136538243, "source": "custom_dealercrawl", "vin": "1C4HJXDG5JW240322", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386136538477, "source": "custom_dealercrawl", "vin": "1FTER4EH9LLA76742", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386136558046, "source": "custom_dealercrawl", "vin": "JTEZU5JR2G5117223", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386136558350, "source": "custom_dealercrawl", "vin": "4T1K61AK8NU717125", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386136558602, "source": "custom_dealercrawl", "vin": "3FMCR9B64NRE22333", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386136558916, "source": "custom_dealercrawl", "vin": "5TDDZRFH4KS976680", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386136559193, "source": "custom_dealercrawl", "vin": "5TFAZ5CN1MX114472", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386136559514, "source": "custom_dealercrawl", "vin": "1C4RJKAG7N8559081", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386136559789, "source": "custom_dealercrawl", "vin": "5TFAY5F18KX849412", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386136560092, "source": "custom_dealercrawl", "vin": "3TMCZ5AN5MM372527", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386136560334, "source": "custom_dealercrawl", "vin": "1GCPYFEDXKZ134891", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386136560558, "source": "custom_dealercrawl", "vin": "1G1FF1R73P0127097", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386136586505, "source": "custom_dealercrawl", "vin": "1GYS4KKJ7LR181476", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386136586847, "source": "custom_dealercrawl", "vin": "1FTFW1E84NFA16705", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386136587129, "source": "custom_dealercrawl", "vin": "1FTFW1RG9NFB37859", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386136587448, "source": "custom_dealercrawl", "vin": "5XYK6CAF2PG015406", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386136587825, "source": "custom_dealercrawl", "vin": "3KPA24ADXPE528749", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386136588097, "source": "custom_dealercrawl", "vin": "KNDNB4H37N6064109", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386136588357, "source": "custom_dealercrawl", "vin": "KNDPU3AF2P7087411", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386136588615, "source": "custom_dealercrawl", "vin": "KNDCC3LCXN5533088", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386136588910, "source": "custom_dealercrawl", "vin": "KNDPRCA6XN7009537", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386136607117, "source": "custom_dealercrawl", "vin": "5XYP5DHC2NG320217", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386136607458, "source": "custom_dealercrawl", "vin": "5XYRGDLC0NG100939", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386136607729, "source": "custom_dealercrawl", "vin": "KNAE55LC2N6120376", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386136608072, "source": "custom_dealercrawl", "vin": "KNDPN3AC2M7853460", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386136608320, "source": "custom_dealercrawl", "vin": "5XYRLDLCXNG094997", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386136608559, "source": "custom_dealercrawl", "vin": "3KPFK4A7XJE194018", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386136608888, "source": "custom_dealercrawl", "vin": "5XXG64J25MG078993", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386136609176, "source": "custom_dealercrawl", "vin": "5XYK6CAF6PG099097", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386136609479, "source": "custom_dealercrawl", "vin": "5XYP34HC1MG122958", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386136609710, "source": "custom_dealercrawl", "vin": "1C4PJMDX5KD476797", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386136655889, "source": "custom_dealercrawl", "vin": "1FTFW1E83NFA67922", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386136656205, "source": "custom_dealercrawl", "vin": "3GNAL3EK9ES607576", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386136656513, "source": "custom_dealercrawl", "vin": "3N1AB8BV6NY210611", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386136656822, "source": "custom_dealercrawl", "vin": "5TFLA5DB8NX002984", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386136657146, "source": "custom_dealercrawl", "vin": "1C4RJKBG3M8109148", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386136657424, "source": "custom_dealercrawl", "vin": "1C4HJXEN9MW634584", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386136657649, "source": "custom_dealercrawl", "vin": "5TFLA5DB2NX013205", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386136696239, "source": "custom_dealercrawl", "vin": "1C4RJKEGXM8111412", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386136696522, "source": "custom_dealercrawl", "vin": "2C3CDZAG8MH560548", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386136696840, "source": "custom_dealercrawl", "vin": "JN8AY2NC8L9621163", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386136697123, "source": "custom_dealercrawl", "vin": "5NMJB3AE6NH123464", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386136697401, "source": "custom_dealercrawl", "vin": "1C4RDHDGXMC626841", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386136697648, "source": "custom_dealercrawl", "vin": "3C4NJCBB2NT187593", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386136697991, "source": "custom_dealercrawl", "vin": "1N6AA1EF4NN105622", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386136698272, "source": "custom_dealercrawl", "vin": "1C4RDHDGXMC608226", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386136698521, "source": "custom_dealercrawl", "vin": "2T3C1RFVXMW105342", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386136726637, "source": "custom_dealercrawl", "vin": "1C6JJTBG3ML597895", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386136726998, "source": "custom_dealercrawl", "vin": "2C4RC1BG8NR138591", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386136727362, "source": "custom_dealercrawl", "vin": "5NPEJ4J23NH134442", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386136727641, "source": "custom_dealercrawl", "vin": "1GKKNMLA7KZ197077", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386136727935, "source": "custom_dealercrawl", "vin": "1N4BL4DV9NN315392", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386136728249, "source": "custom_dealercrawl", "vin": "1C4RJEAG5MC595235", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386136728506, "source": "custom_dealercrawl", "vin": "4T3LWRFV5NU050513", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386136728760, "source": "custom_dealercrawl", "vin": "1C6HJTAG9ML506340", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386136729088, "source": "custom_dealercrawl", "vin": "2C3CDZFJ6MH655209", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386136729337, "source": "custom_dealercrawl", "vin": "3GNAXKEV0NL100567", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386136751446, "source": "custom_dealercrawl", "vin": "5TFJA5DBXNX009152", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386136751760, "source": "custom_dealercrawl", "vin": "JTEBU5JR5L5749774", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386136752117, "source": "custom_dealercrawl", "vin": "1C6RREFT4NN464082", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386136752422, "source": "custom_dealercrawl", "vin": "5N1AT3BA7MC801608", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386136752695, "source": "custom_dealercrawl", "vin": "1FMSK7FH2NGA51809", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386136753002, "source": "custom_dealercrawl", "vin": "JTMC1RFV7LD051915", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386136753311, "source": "custom_dealercrawl", "vin": "1C4HJXDN3LW169980", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386136753608, "source": "custom_dealercrawl", "vin": "1C4PJLMX3ND521279", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386136753904, "source": "custom_dealercrawl", "vin": "1C6RREBT3NN231686", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386136754178, "source": "custom_dealercrawl", "vin": "1HGCV1F42JA018494", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386136794988, "source": "custom_dealercrawl", "vin": "5TFEY5F19MX276542", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386136795383, "source": "custom_dealercrawl", "vin": "1C6RREFT6NN372908", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386136795681, "source": "custom_dealercrawl", "vin": "2FMPK3K93MBA60313", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386136795996, "source": "custom_dealercrawl", "vin": "2FMPK4J93NBA90520", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386136796255, "source": "custom_dealercrawl", "vin": "1C4HJXEN4LW115117", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386136796540, "source": "custom_dealercrawl", "vin": "2C3CDZFJ5NH256907", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386136796849, "source": "custom_dealercrawl", "vin": "3C4NJDDB8NT155217", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386136797162, "source": "custom_dealercrawl", "vin": "5NMS24AJ9NH377743", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386136797405, "source": "custom_dealercrawl", "vin": "5NMS4DALXNH467057", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386136855490, "source": "custom_dealercrawl", "vin": "5TFJC5DB4PX021326", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386136855856, "source": "custom_dealercrawl", "vin": "JTMCY7AJ0M4102192", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386136856165, "source": "custom_dealercrawl", "vin": "5TFNA5ECXNX008866", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386136856414, "source": "custom_dealercrawl", "vin": "KM8J33AL7MU350113", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386136856665, "source": "custom_dealercrawl", "vin": "KMHRC8A33PU227154", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386136856983, "source": "custom_dealercrawl", "vin": "1GCPWDED0KZ231270", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386136857271, "source": "custom_dealercrawl", "vin": "2C4RC1BG9NR109309", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386136857497, "source": "custom_dealercrawl", "vin": "1N6AA1EF4NN103272", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386136857775, "source": "custom_dealercrawl", "vin": "1C4RJKBG8M8135289", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386136858067, "source": "custom_dealercrawl", "vin": "3TMDZ5BN5NM130647", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386136894091, "source": "custom_dealercrawl", "vin": "1C6RR7KG0NS188148", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386136894388, "source": "custom_dealercrawl", "vin": "1LN6L9NP7L5607706", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386136894690, "source": "custom_dealercrawl", "vin": "4T1K61AK5PU151251", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386136895004, "source": "custom_dealercrawl", "vin": "KM8R54HE4MU295193", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386136895303, "source": "custom_dealercrawl", "vin": "1C4RJJDG8M8152293", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386136895597, "source": "custom_dealercrawl", "vin": "1C6RREFT0NN126517", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386136895904, "source": "custom_dealercrawl", "vin": "1GKS2HKJXKR258293", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386136896185, "source": "custom_dealercrawl", "vin": "3N1CP5CV9ML524515", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386136896442, "source": "custom_dealercrawl", "vin": "WBA13AL04N7K04177", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386136896728, "source": "custom_dealercrawl", "vin": "1C6SRFFT9PN642286", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386136906072, "source": "custom_dealercrawl", "vin": "4JGFB4KB4MA375072", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386136906367, "source": "custom_dealercrawl", "vin": "KM8J33A46MU318049", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386136935195, "source": "custom_dealercrawl", "vin": "2T3E6RFV4MW010883", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386136935497, "source": "custom_dealercrawl", "vin": "5LMJJ3LT8MEL05501", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386136935813, "source": "custom_dealercrawl", "vin": "1FMCU0H62LUC34238", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386136936143, "source": "custom_dealercrawl", "vin": "3GKALPEVXML376629", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386136936420, "source": "custom_dealercrawl", "vin": "2LMPJ6J96NBL12115", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386136936697, "source": "custom_dealercrawl", "vin": "5N1DR3CC6NC265344", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386136936999, "source": "custom_dealercrawl", "vin": "5NMS24AJXNH457634", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386136937280, "source": "custom_dealercrawl", "vin": "5NTJDDAF7PH044577", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386136937504, "source": "custom_dealercrawl", "vin": "KM8J33AL5MU389332", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386136978979, "source": "custom_dealercrawl", "vin": "1C6HJTFG5NL131587", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386136979354, "source": "custom_dealercrawl", "vin": "1FTEW1E51LFA62166", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386136979635, "source": "custom_dealercrawl", "vin": "1GKKNXLS9MZ226320", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386136979944, "source": "custom_dealercrawl", "vin": "1N4BL4CV9NN349561", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386136980215, "source": "custom_dealercrawl", "vin": "5NPLM4AG3MH018635", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386136980457, "source": "custom_dealercrawl", "vin": "7FARW2H80KE055200", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386136980719, "source": "custom_dealercrawl", "vin": "WDDUG6GB5JA396421", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386136981037, "source": "custom_dealercrawl", "vin": "1C4HJXFG3LW200787", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386136981337, "source": "custom_dealercrawl", "vin": "1GNSKGKL5MR349036", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386136981562, "source": "custom_dealercrawl", "vin": "5NMS24AJ9PH538482", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386137014586, "source": "custom_dealercrawl", "vin": "1C4HJXDN7MW544609", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386137014937, "source": "custom_dealercrawl", "vin": "1C4PJMMB8PD100719", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386137015218, "source": "custom_dealercrawl", "vin": "1FMJU1LT9MEA29019", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386137015541, "source": "custom_dealercrawl", "vin": "3C4NJDBB6NT120808", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386137015861, "source": "custom_dealercrawl", "vin": "3FMCR9D98NRD55677", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386137016145, "source": "custom_dealercrawl", "vin": "5TFCZ5AN5MX253287", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386137016397, "source": "custom_dealercrawl", "vin": "1C4RJFLG7KC784727", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386137016691, "source": "custom_dealercrawl", "vin": "1C6RREJT3MN625026", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386137017025, "source": "custom_dealercrawl", "vin": "1GNEVNKW3NJ159111", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386137017298, "source": "custom_dealercrawl", "vin": "3GKALVEV3LL191860", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386137047061, "source": "custom_dealercrawl", "vin": "5NMS5DALXMH367441", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386137047364, "source": "custom_dealercrawl", "vin": "1C4JJXR63MW727878", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386137047644, "source": "custom_dealercrawl", "vin": "1FMCU0G66NUA69542", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386137047945, "source": "custom_dealercrawl", "vin": "5N1AT3BA7MC707728", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386137048205, "source": "custom_dealercrawl", "vin": "1G1FB1RX3N0119297", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386137048539, "source": "custom_dealercrawl", "vin": "5TFRM5F18KX139294", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386137048818, "source": "custom_dealercrawl", "vin": "1GKS2HKD8NR106754", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386137049103, "source": "custom_dealercrawl", "vin": "3C4NJDCB6NT203069", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386137049399, "source": "custom_dealercrawl", "vin": "3C4PDCBG1JT476647", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386137049688, "source": "custom_dealercrawl", "vin": "3VWJL7AT8EM608802", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386137092556, "source": "custom_dealercrawl", "vin": "5TFAZ5CN1MX096510", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386137092890, "source": "custom_dealercrawl", "vin": "1C4PJMCB2LD612178", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386137093221, "source": "custom_dealercrawl", "vin": "1C6JJTBM1NL146827", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386137093471, "source": "custom_dealercrawl", "vin": "1GCUYGED2NZ172158", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386137093713, "source": "custom_dealercrawl", "vin": "1N6AA1CF7NN100630", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386137094003, "source": "custom_dealercrawl", "vin": "JTEBU5JR0F5224951", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386137094267, "source": "custom_dealercrawl", "vin": "2C3CDXBG5NH141030", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386137094515, "source": "custom_dealercrawl", "vin": "3GNAXKEV9NS200169", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386137094756, "source": "custom_dealercrawl", "vin": "1C4RJEBG4NC125570", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386137141293, "source": "custom_dealercrawl", "vin": "5NMS64AJ4NH433284", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386137141642, "source": "custom_dealercrawl", "vin": "KM8R74GE7PU583886", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386137141977, "source": "custom_dealercrawl", "vin": "3FTTW8E94NRA67662", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386137142302, "source": "custom_dealercrawl", "vin": "JTEBU5JR0L5768605", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386137142532, "source": "custom_dealercrawl", "vin": "3N1CP5BV5ML516185", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386137142806, "source": "custom_dealercrawl", "vin": "1C4RJFBG9KC746160", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386137143116, "source": "custom_dealercrawl", "vin": "1C6RREHT0NN260957", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386137143415, "source": "custom_dealercrawl", "vin": "3TMCZ5AN6LM301707", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386137143689, "source": "custom_dealercrawl", "vin": "5TFMA5DB3PX079687", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386137144001, "source": "custom_dealercrawl", "vin": "1C4PJMCBXLD626328", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386137155683, "source": "custom_dealercrawl", "vin": "1FA6P8TH5M5101765", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386137156005, "source": "custom_dealercrawl", "vin": "1GCGTCEN3M1134271", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386137156300, "source": "custom_dealercrawl", "vin": "3C6UR5DL2MG652975", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386137406128, "source": "custom_dealercrawl", "vin": "3N1CN8BV7ML878526", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386137497913, "source": "custom_dealercrawl", "vin": "3GCUDFED5RG145371", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386137498223, "source": "custom_dealercrawl", "vin": "3GCNDAEK3RG148565", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386137498538, "source": "custom_dealercrawl", "vin": "3GCNDAED2RG142676", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386137498873, "source": "custom_dealercrawl", "vin": "2GCUDDEDXP1126700", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386137499197, "source": "custom_dealercrawl", "vin": "1GCPDKEKXPZ276927", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386137499491, "source": "custom_dealercrawl", "vin": "1GCRDAED1PZ307454", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386137499824, "source": "custom_dealercrawl", "vin": "1GCUDEED6PZ311131", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386137500075, "source": "custom_dealercrawl", "vin": "3GCUDDED0PG332079", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386137500371, "source": "custom_dealercrawl", "vin": "1GCUDAED3PZ314013", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386137525110, "source": "custom_dealercrawl", "vin": "1GCUDEED8PZ311616", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386137525482, "source": "custom_dealercrawl", "vin": "3GNAXUEG7RL112394", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386137525768, "source": "custom_dealercrawl", "vin": "3GNAXUEG6RL112516", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386137526061, "source": "custom_dealercrawl", "vin": "1GCRDDED0RZ107394", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386137526366, "source": "custom_dealercrawl", "vin": "1GNEVGKW2PJ299648", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386137526601, "source": "custom_dealercrawl", "vin": "1GCPDKEK2RZ114700", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386137526921, "source": "custom_dealercrawl", "vin": "1GCPDKEK8RZ109128", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386137527181, "source": "custom_dealercrawl", "vin": "1GCPSCEK0P1230517", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386137527476, "source": "custom_dealercrawl", "vin": "3GNAXXEG0RL144623", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386137555500, "source": "custom_dealercrawl", "vin": "KL79MTSL8PB216713", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386137555814, "source": "custom_dealercrawl", "vin": "1G1ZE5ST5RF116942", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386137556115, "source": "custom_dealercrawl", "vin": "1GCUDEED2RZ109292", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386137556425, "source": "custom_dealercrawl", "vin": "KL79MMS23RB033154", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386137556694, "source": "custom_dealercrawl", "vin": "1GNEVJKW2PJ314226", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386137557050, "source": "custom_dealercrawl", "vin": "1GCUDEED0RZ138130", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386137557359, "source": "custom_dealercrawl", "vin": "2GC4YME70R1147170", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386137557626, "source": "custom_dealercrawl", "vin": "1GCUDEED5RZ143825", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386137557936, "source": "custom_dealercrawl", "vin": "3GNAXHEG4RL170793", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386137570833, "source": "custom_dealercrawl", "vin": "3GNAXSEG5RL172078", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386137571130, "source": "custom_dealercrawl", "vin": "3GNAXUEG1RS155585", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386137571443, "source": "custom_dealercrawl", "vin": "1GNSKNKD7PR469941", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386137571716, "source": "custom_dealercrawl", "vin": "3GNAXHEG1RL179807", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386137571964, "source": "custom_dealercrawl", "vin": "3GNKBKRS9RS158000", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386137572270, "source": "custom_dealercrawl", "vin": "1GC5YME7XRF229050", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386137572552, "source": "custom_dealercrawl", "vin": "1GCUDJEL0RZ163772", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386137572884, "source": "custom_dealercrawl", "vin": "3GNAXUEG2RS163341", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386137573178, "source": "custom_dealercrawl", "vin": "1GC4YYEY9RF257949", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386137573418, "source": "custom_dealercrawl", "vin": "3GCUDHE88RG140311", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386137589079, "source": "custom_dealercrawl", "vin": "3GCUDEE88PG337006", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386137589386, "source": "custom_dealercrawl", "vin": "3GCNDAED7RG142673", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386137589740, "source": "custom_dealercrawl", "vin": "3GNAXUEG2RL198200", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386137590072, "source": "custom_dealercrawl", "vin": "3GNKBKRS3RS162320", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386137590367, "source": "custom_dealercrawl", "vin": "3GNKBKRS5RS145146", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386137590619, "source": "custom_dealercrawl", "vin": "3GNKDCRJ0RS145448", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386137590937, "source": "custom_dealercrawl", "vin": "KL79MRSLXRB063628", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386137591238, "source": "custom_dealercrawl", "vin": "3GCUDCED0RG147088", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386137591537, "source": "custom_dealercrawl", "vin": "3GNKBJR48RS165726", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386137599682, "source": "custom_dealercrawl", "vin": "1GNSKPKDXPR543753", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386137600042, "source": "custom_dealercrawl", "vin": "3GNKBLRS9RS146922", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386137600325, "source": "custom_dealercrawl", "vin": "1GNSKRKD1PR483812", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386137600607, "source": "custom_dealercrawl", "vin": "3N1CP5DV9LL514774", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386137600976, "source": "custom_dealercrawl", "vin": "5NMJF3AEXPH197347", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386137601261, "source": "custom_dealercrawl", "vin": "5UXTY3C02M9F02255", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386137601521, "source": "custom_dealercrawl", "vin": "KL79MTSL1NB140880", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386137601832, "source": "custom_dealercrawl", "vin": "KL7CJLSB4MB347333", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386137602091, "source": "custom_dealercrawl", "vin": "1C4RJFAG9JC244958", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386137602346, "source": "custom_dealercrawl", "vin": "1C4RJJBG5N8547908", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386137607014, "source": "custom_dealercrawl", "vin": "1N6ED0EBXLN727929", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386137607334, "source": "custom_dealercrawl", "vin": "3TYAX5GN7NT043922", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386137607620, "source": "custom_dealercrawl", "vin": "KL79MMS24RB084260", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386137607965, "source": "custom_dealercrawl", "vin": "KL79MTSL0RB079298", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386137608229, "source": "custom_dealercrawl", "vin": "JTJDY7AX6L4315717", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386137608527, "source": "custom_dealercrawl", "vin": "KM8JFCA1XNU013250", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386137608814, "source": "custom_dealercrawl", "vin": "2GC4YPEY0R1161984", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386137609111, "source": "custom_dealercrawl", "vin": "1GNSKSKD6PR535717", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386137609392, "source": "custom_dealercrawl", "vin": "1GCPDKEK5RZ180187", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386137615588, "source": "custom_dealercrawl", "vin": "1G1FW6S04P4186257", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386137615978, "source": "custom_dealercrawl", "vin": "3C6UR5DL7MG579196", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386137616273, "source": "custom_dealercrawl", "vin": "5NMJE3AE9NH027254", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386137616560, "source": "custom_dealercrawl", "vin": "5NMJF3AE2NH064546", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386137616839, "source": "custom_dealercrawl", "vin": "5NMS2DAJ3NH438519", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386137617233, "source": "custom_dealercrawl", "vin": "5NPEL4JA0MH090061", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386137617530, "source": "custom_dealercrawl", "vin": "JTDS4MCE1MJ064897", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386137617793, "source": "custom_dealercrawl", "vin": "1C4SJVBT0NS110875", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386137618153, "source": "custom_dealercrawl", "vin": "1GCRYDEDXKZ171288", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386137618440, "source": "custom_dealercrawl", "vin": "1GC4YNE79MF312088", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386137627979, "source": "custom_dealercrawl", "vin": "3GCPYFED2MG329385", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386137628288, "source": "custom_dealercrawl", "vin": "1GC4YREY7MF270973", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386137628546, "source": "custom_dealercrawl", "vin": "3GTU2PEJ2JG106243", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386137628878, "source": "custom_dealercrawl", "vin": "JTDKARFP8J3094207", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386137629174, "source": "custom_dealercrawl", "vin": "1C4BJWFG4EL243426", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386137629472, "source": "custom_dealercrawl", "vin": "3GNAXSEV1LS606086", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386137629767, "source": "custom_dealercrawl", "vin": "5TFPC5DB3NX005917", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386137630088, "source": "custom_dealercrawl", "vin": "KL79MUSL8PB026139", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386137630377, "source": "custom_dealercrawl", "vin": "1C6JJTEGXML621380", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386137630660, "source": "custom_dealercrawl", "vin": "1FMJU1HT7MEA04323", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386137655725, "source": "custom_dealercrawl", "vin": "3C6UR5FLXNG161536", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386137656059, "source": "custom_dealercrawl", "vin": "3GCUYDET4LG395966", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386137656329, "source": "custom_dealercrawl", "vin": "1GCUYEEL6LZ229051", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386137656561, "source": "custom_dealercrawl", "vin": "JN8AY2BA4M9375216", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386137675234, "source": "custom_dealercrawl", "vin": "3GNKBBRA6KS615651", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386137675559, "source": "custom_dealercrawl", "vin": "1G1RC6S51JU137784", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386137675959, "source": "custom_dealercrawl", "vin": "1C3CDFBB4FD180883", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386137676253, "source": "custom_dealercrawl", "vin": "1G1RC6S51JU128051", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386137676498, "source": "custom_dealercrawl", "vin": "1G1RC6S56JU127221", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386137676741, "source": "custom_dealercrawl", "vin": "1G1RC6S56JU139174", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386137677064, "source": "custom_dealercrawl", "vin": "1G1RC6S5XJU142885", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386137677345, "source": "custom_dealercrawl", "vin": "1G1RC6S54JU139545", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386137677569, "source": "custom_dealercrawl", "vin": "1G1RC6S56JU140938", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386137703733, "source": "custom_dealercrawl", "vin": "1G1RC6S55JU149906", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386137704069, "source": "custom_dealercrawl", "vin": "1GKKNMLA0KZ286201", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386137704350, "source": "custom_dealercrawl", "vin": "3GTU2PEJ3JG472163", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386137704594, "source": "custom_dealercrawl", "vin": "3N1AB7AP7DL621699", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386137704915, "source": "custom_dealercrawl", "vin": "1FTER4FH4KLA37926", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386137705239, "source": "custom_dealercrawl", "vin": "1FTEW1E85PFB86912", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386137705475, "source": "custom_dealercrawl", "vin": "1GCPWBEK5NZ229232", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386137705733, "source": "custom_dealercrawl", "vin": "1GKS2GKCXKR318195", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386137706008, "source": "custom_dealercrawl", "vin": "1N4AL3AP4GC124621", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386137706295, "source": "custom_dealercrawl", "vin": "2FMGK5C86DBD17093", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386137724231, "source": "custom_dealercrawl", "vin": "2HKRM4H75EH685840", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386137724533, "source": "custom_dealercrawl", "vin": "1G1JC6SH1G4124100", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386137724834, "source": "custom_dealercrawl", "vin": "1C4RJEAG1KC662443", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386137725120, "source": "custom_dealercrawl", "vin": "3GNCJPSB7JL157831", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386137725386, "source": "custom_dealercrawl", "vin": "2C3CDXGJ6MH539835", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386137725631, "source": "custom_dealercrawl", "vin": "3GNTKGE76DG304982", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386137725971, "source": "custom_dealercrawl", "vin": "3C6UR5FL9NG147627", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386137726302, "source": "custom_dealercrawl", "vin": "5GAEVBKW3NJ109995", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386137726528, "source": "custom_dealercrawl", "vin": "5J6RW1H83NA022107", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386137726771, "source": "custom_dealercrawl", "vin": "KM8J33AL0MU283614", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386137744913, "source": "custom_dealercrawl", "vin": "KM8R74HE5NU487492", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386137745217, "source": "custom_dealercrawl", "vin": "1C6SRFET8LN322100", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386137745474, "source": "custom_dealercrawl", "vin": "1G1RA6S57HU178629", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386137745705, "source": "custom_dealercrawl", "vin": "3GNAXSEV2JS570423", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386137746031, "source": "custom_dealercrawl", "vin": "ZACNJDD14MPM38918", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386137746315, "source": "custom_dealercrawl", "vin": "1GC4YUEY9MF202211", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386137746553, "source": "custom_dealercrawl", "vin": "1HGCV1F59KA126704", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386137746870, "source": "custom_dealercrawl", "vin": "3C63RRJL7NG292014", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386137747154, "source": "custom_dealercrawl", "vin": "3FA6P0CD4KR265016", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386137761896, "source": "custom_dealercrawl", "vin": "1C4PJMBX3KD194225", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386137762225, "source": "custom_dealercrawl", "vin": "2C4RC1DG8MR538596", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386137762465, "source": "custom_dealercrawl", "vin": "2C4RC1BG8MR598218", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386137762717, "source": "custom_dealercrawl", "vin": "2C4RC1BG3MR512006", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386137763049, "source": "custom_dealercrawl", "vin": "2GNAXLEX8L6202238", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386137763383, "source": "custom_dealercrawl", "vin": "1FT7W2BT1CEC44876", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386137763665, "source": "custom_dealercrawl", "vin": "2C4RC1BG9MR527707", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386137763991, "source": "custom_dealercrawl", "vin": "2C4RC1BG4MR574627", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386137764258, "source": "custom_dealercrawl", "vin": "2C4RC1BG5MR589377", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386137764487, "source": "custom_dealercrawl", "vin": "1GNSKCKC9KR168480", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386137776577, "source": "custom_dealercrawl", "vin": "7FARW2H90JE064373", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386137776958, "source": "custom_dealercrawl", "vin": "5XYP2DHC1MG189126", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386137777243, "source": "custom_dealercrawl", "vin": "1FTEW1EP1LFB60955", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386137777506, "source": "custom_dealercrawl", "vin": "5NMJF3AE7PH198584", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386137777792, "source": "custom_dealercrawl", "vin": "1GCUYEED5KZ218405", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386137778138, "source": "custom_dealercrawl", "vin": "1C4AJWAG7FL616415", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386137778399, "source": "custom_dealercrawl", "vin": "5YJ3E1EAXLF806293", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386137778681, "source": "custom_dealercrawl", "vin": "JN8AZ2AF8M9718538", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386137778999, "source": "custom_dealercrawl", "vin": "1FMSK8DH7LGB92168", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386137779259, "source": "custom_dealercrawl", "vin": "1G6KJ5RS2GU155131", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386137792080, "source": "custom_dealercrawl", "vin": "1C4BJWEG2HL600141", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386137792375, "source": "custom_dealercrawl", "vin": "1FTEW1E45KFB48523", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386137792639, "source": "custom_dealercrawl", "vin": "1GC2KVEG1JZ244548", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386137792918, "source": "custom_dealercrawl", "vin": "YV4102PK2L1558063", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386137793155, "source": "custom_dealercrawl", "vin": "1FTEW1EG7JKE84707", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386137793422, "source": "custom_dealercrawl", "vin": "1FTFW1E55MFA26101", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386137793664, "source": "custom_dealercrawl", "vin": "1GC4YRE75PF120808", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386137793999, "source": "custom_dealercrawl", "vin": "1GKS2HKJ7KR403287", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386137794260, "source": "custom_dealercrawl", "vin": "1N4AL21E49N555332", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386137815725, "source": "custom_dealercrawl", "vin": "3FADP4DJXKM117260", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386137816049, "source": "custom_dealercrawl", "vin": "3GNAXKEV8MS129576", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386137816338, "source": "custom_dealercrawl", "vin": "1GT42YEY5JF102806", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386137816627, "source": "custom_dealercrawl", "vin": "3GTUUGE88PG169282", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386137816954, "source": "custom_dealercrawl", "vin": "1G1YC3D45N5120114", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386137817237, "source": "custom_dealercrawl", "vin": "3VWD07AJ8FM407391", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386137817481, "source": "custom_dealercrawl", "vin": "4JGFB4JB1NA635690", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386137817768, "source": "custom_dealercrawl", "vin": "3GTP2VE38BG376842", "vid": "", "date": "2023-10-26", "domain": "www.denooyerchevy.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386137818072, "source": "custom_dealercrawl", "vin": "JN8AY2ND5LX015310", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386137818330, "source": "custom_dealercrawl", "vin": "KM8JFCA17PU130559", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386137848345, "source": "custom_dealercrawl", "vin": "1FMSK7DH4LGB11136", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386137848717, "source": "custom_dealercrawl", "vin": "1GKS1JKL2MR493317", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386137849024, "source": "custom_dealercrawl", "vin": "2C3CDZFJ6MH594248", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386137849321, "source": "custom_dealercrawl", "vin": "3C6UR5DJXMG554629", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386137849557, "source": "custom_dealercrawl", "vin": "3GNAXUEV8NL189736", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386137849887, "source": "custom_dealercrawl", "vin": "5NMS24AJ1NH444545", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386137850164, "source": "custom_dealercrawl", "vin": "SHHFK8G73LU200431", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386137850443, "source": "custom_dealercrawl", "vin": "1C6HJTAG4LL126434", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386137850677, "source": "custom_dealercrawl", "vin": "1C6SRFBT0LN253424", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386137850988, "source": "custom_dealercrawl", "vin": "JA4ARUAU7NU008285", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386137879804, "source": "custom_dealercrawl", "vin": "1C4HJXDG6NW181352", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386137880135, "source": "custom_dealercrawl", "vin": "3GCRCSE00AG142879", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386137880396, "source": "custom_dealercrawl", "vin": "5N1AZ2BJ1MC144068", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386137880659, "source": "custom_dealercrawl", "vin": "JTEAAAAH4MJ054957", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386137880997, "source": "custom_dealercrawl", "vin": "KM8SRDHF5HU180607", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386137881289, "source": "custom_dealercrawl", "vin": "1FTEW1CP1NKD56276", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386137881529, "source": "custom_dealercrawl", "vin": "1FTMF1C5XMKE39178", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386137881847, "source": "custom_dealercrawl", "vin": "5TDGY5B15NS189825", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386137882144, "source": "custom_dealercrawl", "vin": "JN8AY2NE1L9781225", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386137882413, "source": "custom_dealercrawl", "vin": "JTEHU5JR7M5960812", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386137905725, "source": "custom_dealercrawl", "vin": "1N4AA6CV7MC506947", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386137906072, "source": "custom_dealercrawl", "vin": "3GCPABEK3NG512100", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386137906358, "source": "custom_dealercrawl", "vin": "3VWDP7AJXCM365815", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386137906590, "source": "custom_dealercrawl", "vin": "JA4J3UA81NZ021668", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386137906881, "source": "custom_dealercrawl", "vin": "SALRRBBV5HA028828", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386137907155, "source": "custom_dealercrawl", "vin": "1C4RJFAG4JC166444", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386137936272, "source": "custom_dealercrawl", "vin": "1C6HJTAG6LL211646", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386137936575, "source": "custom_dealercrawl", "vin": "1GNSCAKC5KR254077", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386137936950, "source": "custom_dealercrawl", "vin": "2T2HZMAA5LC181352", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386137937224, "source": "custom_dealercrawl", "vin": "JM1BL1K6XB1493156", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386137937468, "source": "custom_dealercrawl", "vin": "ZACNJBD15KPJ99803", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386137937696, "source": "custom_dealercrawl", "vin": "1C6RREBG6NN177836", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386137938000, "source": "custom_dealercrawl", "vin": "1FMSK7FH4NGA51990", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386137938288, "source": "custom_dealercrawl", "vin": "1FT7W2BN5LEE33760", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386137938522, "source": "custom_dealercrawl", "vin": "5LMYJ9YY5PNL02646", "vid": "e368e6420a0e0a9350297a7f1dbf8c95", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386137946566, "source": "custom_dealercrawl", "vin": "1G1ZE5ST7GF310885", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386137946881, "source": "custom_dealercrawl", "vin": "5LM5J7XC9PGL22819", "vid": "49043f600a0e0a9448ce3dca6c11e8f1", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386137947182, "source": "custom_dealercrawl", "vin": "5LM5J7XC2PGL21902", "vid": "81007aaf0a0e0a9a31c50ba54c4a67db", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386137947488, "source": "custom_dealercrawl", "vin": "2C3CDXGJ3NH261798", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386137947759, "source": "custom_dealercrawl", "vin": "5GAERBKW3PJ156810", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386137948093, "source": "custom_dealercrawl", "vin": "5TDDZRBH4MS524074", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386137948366, "source": "custom_dealercrawl", "vin": "5LMCJ2DA9PUL22544", "vid": "0e22dc460a0e0a9a61540bbc5594e809", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386137948669, "source": "custom_dealercrawl", "vin": "5LMCJ2DA4PUL23164", "vid": "1b13aae80a0e0a9a61540bbc94781d68", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386137948999, "source": "custom_dealercrawl", "vin": "5LMCJ2DAXPUL25985", "vid": "211188f90a0e0a904cc2c9a75e2fcabc", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386137958532, "source": "custom_dealercrawl", "vin": "1C6RREBT5NN201475", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386137958861, "source": "custom_dealercrawl", "vin": "1FMJK2AT3MEA19567", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386137959106, "source": "custom_dealercrawl", "vin": "1HGCV1F16LA108806", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386137959432, "source": "custom_dealercrawl", "vin": "5LMCJ2DA1PUL22960", "vid": "251ff63a0a0e087f4292470254c06e82", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386137959716, "source": "custom_dealercrawl", "vin": "2LMPJ8K92PBL25585", "vid": "2111862b0a0e0a904cc2c9a7e33f7570", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386137960032, "source": "custom_dealercrawl", "vin": "2LMPJ8K91PBL26842", "vid": "2cd0a5ad0a0e0a92527f8edc2e762e3a", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386137960325, "source": "custom_dealercrawl", "vin": "2LMPJ8K91PBL25884", "vid": "2cd0ac6e0a0e0a940a1dcbad7f6a1d02", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386137960576, "source": "custom_dealercrawl", "vin": "2C3CDZAG5MH534344", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386137960884, "source": "custom_dealercrawl", "vin": "3C4NJCCB4LT231170", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386137975493, "source": "custom_dealercrawl", "vin": "2LMPJ8K9XPBL24152", "vid": "33fa75590a0e0a926c4309f6f6b4334d", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386137975845, "source": "custom_dealercrawl", "vin": "2LMPJ8K9XPBL22997", "vid": "452c43220a0e087f102b3b1d2e421a63", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386137976116, "source": "custom_dealercrawl", "vin": "2LMPJ8K9XPBL24815", "vid": "4eea3f940a0e0a992b96b96bdd79410b", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386137976388, "source": "custom_dealercrawl", "vin": "2LMPJ8K90PBL29702", "vid": "561a30dd0a0e0a992b96b96b83982840", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386137976631, "source": "custom_dealercrawl", "vin": "2LMPJ8K90PBL22166", "vid": "793efd8e0a0e0a912674cfa5ccc05176", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386137976961, "source": "custom_dealercrawl", "vin": "2LMPJ8K99PBL21114", "vid": "7f3139130a0e0a933ddc904ab161b393", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386137977233, "source": "custom_dealercrawl", "vin": "2LMPJ8K98PBL21511", "vid": "7f313edc0a0e0a933ddc904abf73e022", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386137977477, "source": "custom_dealercrawl", "vin": "2LMPJ8K92PBL24372", "vid": "810071490a0e0a946c889dafee59ccca", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386137977705, "source": "custom_dealercrawl", "vin": "5LMCJ1DA2PUL22699", "vid": "4eea45480a0e0a992b96b96b03633e44", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386138008968, "source": "custom_dealercrawl", "vin": "5LMCJ1DA2PUL25571", "vid": "4eea478f0a0e0a9169ea2c186ad93338", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386138009265, "source": "custom_dealercrawl", "vin": "1FTEW1C89MKD57358", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386138009501, "source": "custom_dealercrawl", "vin": "2LMPJ9JP3KBL39106", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386138009768, "source": "custom_dealercrawl", "vin": "5LMCJ1DA2PUL22153", "vid": "636d0e230a0e0a99740e454b907d3269", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386138010085, "source": "custom_dealercrawl", "vin": "4T1K61AKXPU729019", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386138010346, "source": "custom_dealercrawl", "vin": "5LMCJ1DA2PUL20452", "vid": "8da53bab0a0e0a9033941ce1aa090bdb", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386138010684, "source": "custom_dealercrawl", "vin": "5LMCJ1DA1PUL20863", "vid": "9072aaa40a0e0a9157b4dc7f15f2b848", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386138011024, "source": "custom_dealercrawl", "vin": "5LMCJ1DA6PUL20552", "vid": "b6a36f3a0a0e0a934f6f2292ff376a40", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386138011363, "source": "custom_dealercrawl", "vin": "5LMCJ1DA0PUL20692", "vid": "c19953780a0e087f29bc94ace939fba5", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386138033517, "source": "custom_dealercrawl", "vin": "5LMCJ1DA6PUL20759", "vid": "c19958e50a0e087f29bc94ac1d076e00", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386138033868, "source": "custom_dealercrawl", "vin": "1FT7W2BTXGEB94033", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386138034178, "source": "custom_dealercrawl", "vin": "1G1FD1RS6P0133096", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386138034454, "source": "custom_dealercrawl", "vin": "2LMPJ8K96PBL23340", "vid": "0f9c3e9c0a0e0a936ce9110d5b4e5e5b", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386138034726, "source": "custom_dealercrawl", "vin": "2LMPJ8K93PBL23019", "vid": "0f9c412a0a0e0a936ce9110dcb98ca02", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386138035103, "source": "custom_dealercrawl", "vin": "3C4NJDDB2MT598638", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386138035425, "source": "custom_dealercrawl", "vin": "2LMPJ8K99PBL25583", "vid": "2111836d0a0e0a904cc2c9a7906bcb05", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386138035744, "source": "custom_dealercrawl", "vin": "5LMCJ2DA6PUL21061", "vid": "292785750a0e087f102b3b1d73003275", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386138036078, "source": "custom_dealercrawl", "vin": "3N1AB7AP3GY219556", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386138068734, "source": "custom_dealercrawl", "vin": "5LMCJ2DA9PUL26285", "vid": "2f52432c0a0e0a992b96b96b777a9a06", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386138069096, "source": "custom_dealercrawl", "vin": "5LMCJ2DAXPUL07812", "vid": "3eb562b80a0e0a9315b6be49cba0bd43", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386138069336, "source": "custom_dealercrawl", "vin": "5LMJJ2KT7MEL00866", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386138069695, "source": "custom_dealercrawl", "vin": "JTDEPMAE2MJ170203", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386138070030, "source": "custom_dealercrawl", "vin": "5LMCJ2DA8PUL19392", "vid": "70ead7ae0a0e0a931b3f4bbcb6eed50b", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386138070329, "source": "custom_dealercrawl", "vin": "KM8JF3AE0NU144531", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386138070576, "source": "custom_dealercrawl", "vin": "5LMCJ1DA7PUL25517", "vid": "21117ff60a0e0a904cc2c9a7b2539a22", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386138070949, "source": "custom_dealercrawl", "vin": "5LMCJ1DA9PUL21632", "vid": "22d009240a0e0a904cc2c9a7505f6af0", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386138071243, "source": "custom_dealercrawl", "vin": "1C6RR7LT1MS516476", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386138103554, "source": "custom_dealercrawl", "vin": "5LMCJ1DA5PUL23152", "vid": "2cd0a7c30a0e0a940a1dcbadd338bf00", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386138103927, "source": "custom_dealercrawl", "vin": "1GNSKHKC3JR373238", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386138104192, "source": "custom_dealercrawl", "vin": "1GT12TEG5GF124312", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386138104509, "source": "custom_dealercrawl", "vin": "5LMCJ1CA9PUL22135", "vid": "44821d2d0a0e0a90290b5a5c2dd63fdc", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386138104852, "source": "custom_dealercrawl", "vin": "1GTUUDEL2NZ504861", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386138105198, "source": "custom_dealercrawl", "vin": "5LMCJ1DA8PUL22125", "vid": "4eea3c640a0e094a3883bfc37a4a2ae1", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386138105482, "source": "custom_dealercrawl", "vin": "2LMPJ8K95PBL20817", "vid": "ed61e5820a0e081d1b14d1fde2a437d0", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386138105751, "source": "custom_dealercrawl", "vin": "2LMPJ8K99PBL26412", "vid": "f6d8cd970a0e0a9a61540bbca562695a", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386138106058, "source": "custom_dealercrawl", "vin": "2LMPJ8K98PBL25820", "vid": "f6d8d0010a0e0a9a61540bbcb53cb21f", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386138150417, "source": "custom_dealercrawl", "vin": "3C6UR5DL2MG605137", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386138150729, "source": "custom_dealercrawl", "vin": "3C6UR5DL6NG237675", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386138151054, "source": "custom_dealercrawl", "vin": "2LMPJ8J95PBL25047", "vid": "561a32650a0e0a992b96b96b42af7b4f", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386138151373, "source": "custom_dealercrawl", "vin": "5LMJJ2LG9PEL11406", "vid": "070302900a0e0a9a6d5216d69b6254bc", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386138151647, "source": "custom_dealercrawl", "vin": "5LMJJ2LG7PEL08777", "vid": "0b568b240a0e0a934b7bca1ad31a3920", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386138151939, "source": "custom_dealercrawl", "vin": "5LMJJ3LGXPEL05555", "vid": "2c5e74e10a0e081d0793dde267eafd54", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386138152230, "source": "custom_dealercrawl", "vin": "3VWC57BU3MM003966", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386138152499, "source": "custom_dealercrawl", "vin": "2LMPJ8K94PBL20842", "vid": "b6a375830a0e0a9174221517fb8cd624", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386138152765, "source": "custom_dealercrawl", "vin": "5UXCR6C0XLLL65224", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386138153062, "source": "custom_dealercrawl", "vin": "KM8J33A44KU074849", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386138155696, "source": "custom_dealercrawl", "vin": "2LMPJ8K93PBL22890", "vid": "b6a388f90a0e087f1ff43b27278079b0", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386138214559, "source": "custom_dealercrawl", "vin": "2LMPJ8K95PBL21157", "vid": "bae40af70a0e094a74e2589d3e23e58b", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386138214980, "source": "custom_dealercrawl", "vin": "KM8R54HE6LU156987", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386138215337, "source": "custom_dealercrawl", "vin": "WBXYJ3C34JEP75934", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386138215628, "source": "custom_dealercrawl", "vin": "1C6RD7PT3CS211729", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386138216014, "source": "custom_dealercrawl", "vin": "1FT7W2BT6KEC78570", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386138216289, "source": "custom_dealercrawl", "vin": "1FTFW1RG4PFC37774", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386138216549, "source": "custom_dealercrawl", "vin": "1GCGSCEAXK1256106", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386138216863, "source": "custom_dealercrawl", "vin": "1GNSKBKC7JR167420", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386138217153, "source": "custom_dealercrawl", "vin": "2LMPJ8K92PBL23612", "vid": "c3b38a640a0e094a69d51377b6b3ace9", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386138240527, "source": "custom_dealercrawl", "vin": "2LMPJ8K90PBL23608", "vid": "dd6e746f0a0e094a5fad348d5a56227c", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386138240915, "source": "custom_dealercrawl", "vin": "2LMPJ8K96PBL22267", "vid": "e18dc1530a0e0a90625213be23934685", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386138241282, "source": "custom_dealercrawl", "vin": "2FMDK4KC4ABB58167", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386138241540, "source": "custom_dealercrawl", "vin": "2T3C1RFV6NC209362", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386138241814, "source": "custom_dealercrawl", "vin": "2LMPJ8K92PBL19298", "vid": "e64a6d190a0e094a72a865f2c1ca7879", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386138242109, "source": "custom_dealercrawl", "vin": "3C4NJDBN7PT517103", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386138242364, "source": "custom_dealercrawl", "vin": "5LMCJ2D96MUL17206", "vid": "5c888f390a0e0a91701c19688d571fe7", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386138242627, "source": "custom_dealercrawl", "vin": "5LMCJ2D95LUL27062", "vid": "65a7beef0a0e0a9a7139bc36dac452b2", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386138242946, "source": "custom_dealercrawl", "vin": "3VVDX7B25PM339141", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386138272344, "source": "custom_dealercrawl", "vin": "5LMCJ1C90MUL25412", "vid": "510e3d970a0e087f42924702f0854360", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386138272630, "source": "custom_dealercrawl", "vin": "5LMCJ1D92MUL28147", "vid": "65a7c1460a0e0a9a7139bc3601f4e41c", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386138273004, "source": "custom_dealercrawl", "vin": "KL4CJASB8GB664070", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386138273303, "source": "custom_dealercrawl", "vin": "5LMCJ3D90KUL09346", "vid": "e45cee2a0a0e0a9260e76faadbdf3e97", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386138273543, "source": "custom_dealercrawl", "vin": "2LMHJ5AT8ABJ15645", "vid": "e2b6a6e00a0e0a9a0f753ea1d8b4b7ed", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386138273895, "source": "custom_dealercrawl", "vin": "KM8R4DHE2NU483201", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386138274192, "source": "custom_dealercrawl", "vin": "3LN6L2LU7GR617901", "vid": "3c805d3b0a0e081d114b2b417f2f1fbe", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386138274469, "source": "custom_dealercrawl", "vin": "1G6KD57Y69U130623", "vid": "dfbf7a870a0e094a0c1254ea94dd8c80", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386138274705, "source": "custom_dealercrawl", "vin": "2GNALCEK9F1156422", "vid": "e67defb00a0e094a5fad348d839627af", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386138301130, "source": "custom_dealercrawl", "vin": "1G11H5SL6EF247232", "vid": "d7a1a21b0a0e0a9410ae358d62433a35", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386138301464, "source": "custom_dealercrawl", "vin": "KNDME5C17F6028890", "vid": "2d21b0f10a0e0a992b96b96b9b2f9be1", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386138301904, "source": "custom_dealercrawl", "vin": "5XYPGDA36JG388051", "vid": "c26bec1c0a0e0a9a49b1b26ae6a085af", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386138302222, "source": "custom_dealercrawl", "vin": "KNDJP3A55F7147782", "vid": "3c8061bb0a0e094a3883bfc36fecfacb", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386138302523, "source": "custom_dealercrawl", "vin": "WDCGG5HB6DF979212", "vid": "2d21b27f0a0e0a992b96b96b09c73640", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386138302841, "source": "custom_dealercrawl", "vin": "WD4PG2EE6H3316917", "vid": "1cd336bf0a0e087f78ac9134d392d371", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386138303147, "source": "custom_dealercrawl", "vin": "WDDPK4HA1DF055529", "vid": "673f6c4a0a0e081d455631da840515ba", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386138303479, "source": "custom_dealercrawl", "vin": "4A37L3ETXBE002156", "vid": "3c805eb90a0e081d114b2b41d737513c", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386138303764, "source": "custom_dealercrawl", "vin": "JN8AF5MV5CT109129", "vid": "2ec579b80a0e087f102b3b1dc061c674", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386138304085, "source": "custom_dealercrawl", "vin": "LRBFZNR45PD033256", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386138353621, "source": "custom_dealercrawl", "vin": "1C4SJVBT9NS123429", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386138353991, "source": "custom_dealercrawl", "vin": "5XYK6CDF2RG150027", "vid": "", "date": "2023-10-26", "domain": "www.kiaofchattanooga.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386138354304, "source": "custom_dealercrawl", "vin": "5XYK6CDFXRG151927", "vid": "", "date": "2023-10-26", "domain": "www.kiaofchattanooga.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386138354541, "source": "custom_dealercrawl", "vin": "5N1AR2MM6FC703799", "vid": "90ca2b640a0e081d2055119d8144148e", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386138354862, "source": "custom_dealercrawl", "vin": "1C4RJFCG0LC426192", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386138355134, "source": "custom_dealercrawl", "vin": "3C6TRVBG6JE104146", "vid": "e45ce82c0a0e0a9a2d62f34ce9cd30f7", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386138355431, "source": "custom_dealercrawl", "vin": "1GYKPGRSXLZ101512", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386138355709, "source": "custom_dealercrawl", "vin": "5XYRK4LF0PG228710", "vid": "", "date": "2023-10-26", "domain": "www.kiaofchattanooga.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386138356028, "source": "custom_dealercrawl", "vin": "YV4902DZ0D2425320", "vid": "2d21afaa0a0e0a992b96b96bbc5065c9", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386138372630, "source": "custom_dealercrawl", "vin": "5XYRKDLF6PG221339", "vid": "", "date": "2023-10-26", "domain": "www.kiaofchattanooga.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386138372946, "source": "custom_dealercrawl", "vin": "YV4A22PK5G1075263", "vid": "9b0fb40d0a0e0a9209f3bda229b8e03a", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386138373271, "source": "custom_dealercrawl", "vin": "3TMCZ5AN3NM525116", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386138373533, "source": "custom_dealercrawl", "vin": "1FTFW1E8XMFB63514", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386138373853, "source": "custom_dealercrawl", "vin": "KNDC3DLC7P5156664", "vid": "", "date": "2023-10-26", "domain": "www.kiaofchattanooga.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386138374135, "source": "custom_dealercrawl", "vin": "KNDC3DLC5P5150832", "vid": "", "date": "2023-10-26", "domain": "www.kiaofchattanooga.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386138374379, "source": "custom_dealercrawl", "vin": "1GNEVHKW7JJ117763", "vid": "f434a51d0a0e094a5fad348d81d4441b", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386138374638, "source": "custom_dealercrawl", "vin": "1C4RJJDG2P8733437", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386138374898, "source": "custom_dealercrawl", "vin": "3KPA24AD5PE616348", "vid": "", "date": "2023-10-26", "domain": "www.kiaofchattanooga.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386138396113, "source": "custom_dealercrawl", "vin": "3KPA24AD9PE618703", "vid": "", "date": "2023-10-26", "domain": "www.kiaofchattanooga.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386138396502, "source": "custom_dealercrawl", "vin": "4S4BTANC7M3210359", "vid": "", "date": "2023-10-26", "domain": "www.parklinemotors.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386138396890, "source": "custom_dealercrawl", "vin": "5GAEVBKW3KJ119700", "vid": "", "date": "2023-10-26", "domain": "www.parklinemotors.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386138397199, "source": "custom_dealercrawl", "vin": "1FT7W2BT3MED43801", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386138397491, "source": "custom_dealercrawl", "vin": "3KPA24ADXPE611467", "vid": "", "date": "2023-10-26", "domain": "www.kiaofchattanooga.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386138397820, "source": "custom_dealercrawl", "vin": "1FT8W2BT9NED14213", "vid": "", "date": "2023-10-26", "domain": "www.parklinemotors.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386138398112, "source": "custom_dealercrawl", "vin": "3KPA25AD4PE612104", "vid": "", "date": "2023-10-26", "domain": "www.kiaofchattanooga.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386138398394, "source": "custom_dealercrawl", "vin": "3KPA24ADXPE606043", "vid": "", "date": "2023-10-26", "domain": "www.kiaofchattanooga.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386138398636, "source": "custom_dealercrawl", "vin": "3KPA24AD8PE613489", "vid": "", "date": "2023-10-26", "domain": "www.kiaofchattanooga.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386138405847, "source": "custom_dealercrawl", "vin": "3GNEC12078G294611", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386138406131, "source": "custom_dealercrawl", "vin": "3TMCZ5AN0PM543303", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386138406432, "source": "custom_dealercrawl", "vin": "1C4SDJETXCC104326", "vid": "e67df11e0a0e094a5fad348d36a283af", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386138406724, "source": "custom_dealercrawl", "vin": "3TMCZ5AN4PM535009", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386138407008, "source": "custom_dealercrawl", "vin": "JF2GTACC1K8326039", "vid": "", "date": "2023-10-26", "domain": "www.parklinemotors.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386138407312, "source": "custom_dealercrawl", "vin": "3TMCZ5AN5PM542017", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386138417387, "source": "custom_dealercrawl", "vin": "WA1A4AFY3J2176035", "vid": "", "date": "2023-10-26", "domain": "www.parklinemotors.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386138417706, "source": "custom_dealercrawl", "vin": "3VWC57BU3KM100033", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386138418024, "source": "custom_dealercrawl", "vin": "ZFBCFYDT6GP396129", "vid": "673f71400a0e081d455631daa6d41924", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386138418289, "source": "custom_dealercrawl", "vin": "1GCGTEEN5J1207440", "vid": "", "date": "2023-10-26", "domain": "www.parklinemotors.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386138418579, "source": "custom_dealercrawl", "vin": "5XXG64J25RG253556", "vid": "", "date": "2023-10-26", "domain": "www.kiaofchattanooga.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386138418875, "source": "custom_dealercrawl", "vin": "1HGCV2F96JA008617", "vid": "", "date": "2023-10-26", "domain": "www.parklinemotors.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386138419198, "source": "custom_dealercrawl", "vin": "5XYK33DF5RG163332", "vid": "", "date": "2023-10-26", "domain": "www.kiaofchattanooga.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386138419492, "source": "custom_dealercrawl", "vin": "2C3CDZFJ4MH507477", "vid": "", "date": "2023-10-26", "domain": "www.parklinemotors.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386138419782, "source": "custom_dealercrawl", "vin": "5TFDY5F12MX021288", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386138433813, "source": "custom_dealercrawl", "vin": "5XXG64J25RG251287", "vid": "", "date": "2023-10-26", "domain": "www.kiaofchattanooga.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386138434140, "source": "custom_dealercrawl", "vin": "1ZVBP8EM5C5279402", "vid": "3e071cff0a0e0a9169ea2c18c86e2ec6", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386138434404, "source": "custom_dealercrawl", "vin": "1GTV2UEH6FZ350999", "vid": "673f6a8c0a0e081d455631da145b193a", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386138434653, "source": "custom_dealercrawl", "vin": "1FTFW1E5XNKE75685", "vid": "", "date": "2023-10-26", "domain": "www.parklinemotors.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386138434976, "source": "custom_dealercrawl", "vin": "KMHGN4JE6JU225675", "vid": "f434a3ef0a0e094a5fad348dca398bb7", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386138435282, "source": "custom_dealercrawl", "vin": "KMHGH4JH4GU103729", "vid": "0e38c41e0a0e0a92630d01ba2853198a", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386138435554, "source": "custom_dealercrawl", "vin": "5XYK33DF9RG158361", "vid": "", "date": "2023-10-26", "domain": "www.kiaofchattanooga.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386138435891, "source": "custom_dealercrawl", "vin": "19XFA1F5XAE072672", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386138436173, "source": "custom_dealercrawl", "vin": "1C4PJLCB5KD164768", "vid": "673f6de60a0e081d455631da1f15c287", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386138471288, "source": "custom_dealercrawl", "vin": "1FT8W3BT5MED79385", "vid": "", "date": "2023-10-26", "domain": "www.parklinemotors.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386138471606, "source": "custom_dealercrawl", "vin": "3CZRU6H10MM749521", "vid": "", "date": "2023-10-26", "domain": "www.parklinemotors.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386138471891, "source": "custom_dealercrawl", "vin": "1C4RJEAG7JC429648", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386138472178, "source": "custom_dealercrawl", "vin": "1FMJK2AT3KEA77398", "vid": "", "date": "2023-10-26", "domain": "www.parklinemotors.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386138472414, "source": "custom_dealercrawl", "vin": "1C4NJRBB0CD509587", "vid": "d5879ab10a0e0a93227b34edb258601a", "date": "2023-10-26", "domain": "www.southgatelincoln.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386138472675, "source": "custom_dealercrawl", "vin": "1C6SRFMT5NN307686", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "4", "name": "Hendrick Motors of Charlotte", "address": "5201 E INDEPENDENCE BLVD", "zip": "28212"}}
{"timestamp": 1698386138472985, "source": "custom_dealercrawl", "vin": "KNDCR3LE2R5124881", "vid": "", "date": "2023-10-26", "domain": "www.kiaofchattanooga.com", "seller": {"id": "2", "name": "Mercedes-Benz of Spokane", "address": "21802 E GEORGE GEE AVE", "zip": "99019"}}
{"timestamp": 1698386138473286, "source": "custom_dealercrawl", "vin": "1FTFW1ED9PFC02837", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386138473521, "source": "custom_dealercrawl", "vin": "JTKKT624860169672", "vid": "82836027", "date": "2023-10-26", "domain": "www.napletonnissanschererville.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386138483669, "source": "custom_dealercrawl", "vin": "5XYK6CDFXRG164046", "vid": "", "date": "2023-10-26", "domain": "www.kiaofchattanooga.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386138484008, "source": "custom_dealercrawl", "vin": "JF1VA1J6XH9814889", "vid": "", "date": "2023-10-26", "domain": "www.parklinemotors.com", "seller": {"id": "1", "name": "Ozzy's Car Company", "address": "4195 W. Chinden Blvd", "zip": "83714"}}
{"timestamp": 1698386138484314, "source": "custom_dealercrawl", "vin": "YV4952CZ5D1668226", "vid": "82186503", "date": "2023-10-26", "domain": "www.napletonnissanschererville.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}
{"timestamp": 1698386138484591, "source": "custom_dealercrawl", "vin": "3C6UR5CJ9KG619579", "vid": "", "date": "2023-10-26", "domain": "www.parklinemotors.com", "seller": {"id": "3", "name": "Select Auto Imports", "address": "5630 S Van Dorn St", "zip": "22310"}}
{"timestamp": 1698386138484912, "source": "custom_dealercrawl", "vin": "1N6AA1EF1LN505490", "vid": "", "date": "2023-10-26", "domain": "www.kiaofabilene.com", "seller": {"id": "5", "name": "Mercedes-Benz of Draper", "address": "11548 S LONE PEAK PARKWAY", "zip": "84020"}}


================================================
FILE: quickwit/quickwit-doc-mapper/benches/doc_to_json_bench.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use binggan::plugins::*;
use binggan::{BenchRunner, INSTRUMENTED_SYSTEM, PeakMemAlloc, black_box};
use quickwit_doc_mapper::DocMapper;
use tantivy::TantivyDocument;

const SIMPLE_JSON_TEST_DATA: &str = include_str!("data/simple-parse-bench.json");
const ROUTING_TEST_DATA: &str = include_str!("data/simple-routing-expression-bench.json");

const DOC_MAPPER_CONF_SIMPLE_JSON: &str = r#"{
    "type": "default",
    "default_search_fields": [],
    "tag_fields": [],
    "field_mappings": [
        {"name": "id", "type": "u64", "fast": false },
        {"name": "first_name", "type": "text" },
        {"name": "last_name", "type": "text" },
        {"name": "email", "type": "text" }
    ]
}"#;

/// Note that {"name": "date", "type": "datetime", "input_formats": ["%Y-%m-%d"], "output_format":
/// "%Y-%m-%d"}, is removed since tantivy parsing only supports RFC3339
const ROUTING_DOC_MAPPER_CONF: &str = r#"{
    "type": "default",
    "default_search_fields": [],
    "tag_fields": [],
    "field_mappings": [
        {"name": "timestamp", "type": "datetime", "input_formats": ["unix_timestamp"], "output_format": "%Y-%m-%d %H:%M:%S", "output_format": "%Y-%m-%d %H:%M:%S", "fast": true },
        {"name": "source", "type": "text" },
        {"name": "vin", "type": "text" },
        {"name": "vid", "type": "text" },
        {"name": "domain", "type": "text" },
        {"name": "seller", "type": "object", "field_mappings": [
            {"name": "id", "type": "text" },
            {"name": "name", "type": "text" },
            {"name": "address", "type": "text" },
            {"name": "zip", "type": "text" }
        ]}
    ],
    "partition_key": "seller.id"
}"#;

#[global_allocator]
pub static GLOBAL: &PeakMemAlloc<std::alloc::System> = &INSTRUMENTED_SYSTEM;

fn get_test_data(
    name: &'static str,
    raw: &'static str,
    doc_mapper: &'static str,
) -> (&'static str, usize, Vec<&'static str>, Box<DocMapper>) {
    let lines: Vec<&str> = raw.lines().map(|line| line.trim()).collect();
    (
        name,
        raw.len(),
        lines,
        serde_json::from_str(doc_mapper).unwrap(),
    )
}

fn run_bench() {
    let inputs: Vec<(&str, usize, Vec<&str>, Box<DocMapper>)> = vec![
        (get_test_data(
            "flat_json",
            SIMPLE_JSON_TEST_DATA,
            DOC_MAPPER_CONF_SIMPLE_JSON,
        )),
        (get_test_data("routing_json", ROUTING_TEST_DATA, ROUTING_DOC_MAPPER_CONF)),
    ];

    let mut runner: BenchRunner = BenchRunner::new();

    runner.config().set_num_iter_for_bench(1);
    runner.config().set_num_iter_for_group(100);
    runner
        .add_plugin(CacheTrasher::default())
        .add_plugin(BPUTrasher::default())
        .add_plugin(PeakMemAllocPlugin::new(GLOBAL));

    for (input_name, size, data, doc_mapper) in inputs.iter() {
        let dynamic_doc_mapper: DocMapper =
            serde_json::from_str(r#"{ "mode": "dynamic" }"#).unwrap();
        let mut group = runner.new_group();
        group.set_name(input_name);
        group.set_input_size(*size);
        group.register_with_input("doc_mapper", data, |lines| {
            for line in lines {
                black_box(doc_mapper.doc_from_json_str(line).unwrap());
            }
        });

        group.register_with_input("doc_mapper_dynamic", data, |lines| {
            for line in lines {
                black_box(dynamic_doc_mapper.doc_from_json_str(line).unwrap());
            }
        });

        group.register_with_input("tantivy parse json", data, |lines| {
            let schema = doc_mapper.schema();
            for line in lines {
                let _doc = black_box(TantivyDocument::parse_json(&schema, line).unwrap());
            }
        });
        group.run();
    }
}

fn main() {
    run_bench();
}


================================================
FILE: quickwit/quickwit-doc-mapper/benches/routing_expression_bench.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use binggan::plugins::*;
use binggan::{BenchRunner, INSTRUMENTED_SYSTEM, PeakMemAlloc};
use quickwit_doc_mapper::RoutingExpr;
use serde_json::Value as JsonValue;

#[global_allocator]
pub static GLOBAL: &PeakMemAlloc<std::alloc::System> = &INSTRUMENTED_SYSTEM;

const JSON_TEST_DATA: &str = include_str!("data/simple-routing-expression-bench.json");

fn run_bench() {
    let json_lines: Vec<serde_json::Map<String, JsonValue>> = JSON_TEST_DATA
        .lines()
        .map(|line| serde_json::from_str(line).unwrap())
        .collect();

    let mut runner: BenchRunner = BenchRunner::new();

    runner
        .add_plugin(CacheTrasher::default())
        .add_plugin(PeakMemAllocPlugin::new(GLOBAL));

    {
        let (input_name, size, data) = &("routing_expr", JSON_TEST_DATA.len(), &json_lines);
        let mut group = runner.new_group();
        group.set_name(input_name);
        group.set_input_size(*size);
        group.register_with_input("simple-eval-hash", data, |lines| {
            let routing_expr = RoutingExpr::new("seller.id").unwrap();
            for json in lines.iter() {
                routing_expr.eval_hash(json);
            }
        });

        group.run();
    }
}

fn main() {
    run_bench();
}


================================================
FILE: quickwit/quickwit-doc-mapper/src/doc_mapper/date_time_type.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use indexmap::IndexSet;
use quickwit_common::true_fn;
use quickwit_datetime::{DateTimeInputFormat, DateTimeOutputFormat, TantivyDateTime};
use serde::{Deserialize, Deserializer, Serialize};
use serde_json::Value as JsonValue;
use tantivy::schema::{DateTimePrecision, OwnedValue as TantivyValue};

/// A struct holding DateTime field options.
#[derive(Clone, Debug, Eq, PartialEq, Serialize, Deserialize)]
#[serde(deny_unknown_fields)]
pub struct QuickwitDateTimeOptions {
    #[serde(default)]
    #[serde(skip_serializing_if = "Option::is_none")]
    pub description: Option<String>,

    /// Accepted input formats.
    #[serde(default)]
    pub input_formats: InputFormats,

    /// Output format
    #[serde(default)]
    pub output_format: DateTimeOutputFormat,

    /// Internal storage precision.
    #[serde(default)]
    #[serde(alias = "precision")]
    pub fast_precision: DateTimePrecision,

    #[serde(default = "true_fn")]
    pub indexed: bool,

    #[serde(default = "true_fn")]
    pub stored: bool,

    #[serde(default)]
    pub fast: bool,
}

impl Default for QuickwitDateTimeOptions {
    fn default() -> Self {
        Self {
            description: None,
            input_formats: InputFormats::default(),
            output_format: DateTimeOutputFormat::default(),
            fast_precision: DateTimePrecision::default(),
            indexed: true,
            stored: true,
            fast: false,
        }
    }
}

impl QuickwitDateTimeOptions {
    pub(crate) fn validate_json(
        &self,
        json_value: &serde_json_borrow::Value,
    ) -> Result<(), String> {
        match json_value {
            serde_json_borrow::Value::Number(timestamp) => {
                // `.as_f64()` actually converts floats to integers, so we must check for integers
                // first.
                if let Some(timestamp_i64) = timestamp.as_i64() {
                    quickwit_datetime::parse_timestamp_int(timestamp_i64, &self.input_formats.0)?;
                    Ok(())
                } else if let Some(timestamp_f64) = timestamp.as_f64() {
                    quickwit_datetime::parse_timestamp_float(timestamp_f64, &self.input_formats.0)?;
                    Ok(())
                } else {
                    Err(format!(
                        "failed to convert timestamp to f64 ({:?}). this should never happen",
                        serde_json::Number::from(*timestamp)
                    ))
                }
            }
            serde_json_borrow::Value::Str(date_time_str) => {
                quickwit_datetime::parse_date_time_str(date_time_str, &self.input_formats.0)?;
                Ok(())
            }
            _ => Err(format!(
                "failed to parse datetime: expected a float, integer, or string, got \
                 `{json_value}`"
            )),
        }
    }

    pub(crate) fn parse_json(&self, json_value: &JsonValue) -> Result<TantivyValue, String> {
        let date_time = match json_value {
            JsonValue::Number(timestamp) => {
                // `.as_f64()` actually converts floats to integers, so we must check for integers
                // first.
                if let Some(timestamp_i64) = timestamp.as_i64() {
                    quickwit_datetime::parse_timestamp_int(timestamp_i64, &self.input_formats.0)?
                } else if let Some(timestamp_f64) = timestamp.as_f64() {
                    quickwit_datetime::parse_timestamp_float(timestamp_f64, &self.input_formats.0)?
                } else {
                    return Err(format!(
                        "failed to parse datetime `{timestamp:?}`: value is larger than i64::MAX",
                    ));
                }
            }
            JsonValue::String(date_time_str) => {
                quickwit_datetime::parse_date_time_str(date_time_str, &self.input_formats.0)?
            }
            _ => {
                return Err(format!(
                    "failed to parse datetime: expected a float, integer, or string, got \
                     `{json_value}`"
                ));
            }
        };
        Ok(TantivyValue::Date(date_time))
    }

    pub(crate) fn reparse_tantivy_value(
        &self,
        tantivy_value: &TantivyValue,
    ) -> Option<TantivyDateTime> {
        match tantivy_value {
            TantivyValue::Date(date) => Some(*date),
            TantivyValue::Str(date_time_str) => {
                quickwit_datetime::parse_date_time_str(date_time_str, &self.input_formats.0).ok()
            }
            TantivyValue::U64(timestamp_u64) => {
                let timestamp_i64 = (*timestamp_u64).try_into().ok()?;
                quickwit_datetime::parse_timestamp_int(timestamp_i64, &self.input_formats.0).ok()
            }
            TantivyValue::I64(timestamp_i64) => {
                quickwit_datetime::parse_timestamp_int(*timestamp_i64, &self.input_formats.0).ok()
            }
            TantivyValue::F64(timestamp_f64) => {
                quickwit_datetime::parse_timestamp_float(*timestamp_f64, &self.input_formats.0).ok()
            }
            _ => None,
        }
    }
}

#[derive(Clone, Debug, Eq, PartialEq, Serialize)]
pub struct InputFormats(Vec<DateTimeInputFormat>);

impl Default for InputFormats {
    fn default() -> Self {
        Self(vec![
            DateTimeInputFormat::Rfc3339,
            DateTimeInputFormat::Timestamp,
        ])
    }
}

impl<'de> Deserialize<'de> for InputFormats {
    fn deserialize<D>(deserializer: D) -> Result<Self, D::Error>
    where D: Deserializer<'de> {
        let date_time_formats = IndexSet::<DateTimeInputFormat>::deserialize(deserializer)?;

        if date_time_formats.is_empty() {
            return Ok(InputFormats::default());
        }
        Ok(InputFormats(date_time_formats.into_iter().collect()))
    }
}

#[cfg(test)]
mod tests {

    use time::macros::datetime;

    use super::*;
    use crate::doc_mapper::FieldMappingType;
    use crate::{Cardinality, FieldMappingEntry};

    #[test]
    fn test_date_time_options_single_value_deser() {
        let field_mapping_entry = serde_json::from_str::<FieldMappingEntry>(
            r#"
            {
                "name": "updated_at",
                "type": "datetime",
                "description": "When the record was last updated.",
                "input_formats": [
                    "rfc3339"
                ],
                "fast_precision": "milliseconds",
                "indexed": true,
                "fast": true,
                "stored": false
            }
            "#,
        )
        .unwrap();

        assert_eq!(field_mapping_entry.name, "updated_at");

        let date_time_options = match field_mapping_entry.mapping_type {
            FieldMappingType::DateTime(date_time_options, Cardinality::SingleValued) => {
                date_time_options
            }
            _ => panic!("Expected a date time field mapping"),
        };
        let expected_input_formats = InputFormats(vec![DateTimeInputFormat::Rfc3339]);
        let expected_date_time_options = QuickwitDateTimeOptions {
            description: Some("When the record was last updated.".to_string()),
            input_formats: expected_input_formats,
            output_format: DateTimeOutputFormat::Rfc3339,
            fast_precision: DateTimePrecision::Milliseconds,
            indexed: true,
            fast: true,
            stored: false,
        };
        assert_eq!(date_time_options, expected_date_time_options);
    }

    #[test]
    fn test_backward_compatibility_after_fast_precision_rename() {
        let field_mapping_entry: FieldMappingEntry = serde_json::from_str(
            r#"
        {
            "name": "updated_at",
            "type": "datetime",
            "description": "When the record was last updated.",
            "input_formats": ["rfc3339"],
            "precision": "milliseconds",
            "indexed": true,
            "fast": true,
            "stored": false
        }
    "#,
        )
        .unwrap();

        if let FieldMappingType::DateTime(date_time_options, _) = field_mapping_entry.mapping_type {
            assert_eq!(
                date_time_options.fast_precision,
                DateTimePrecision::Milliseconds
            );
        } else {
            panic!("Expected a date time field mapping");
        }
    }

    #[test]
    fn test_date_time_options_multi_values_deser() {
        let field_mapping_entry = serde_json::from_str::<FieldMappingEntry>(
            r#"
            {
                "name": "updated_at",
                "type": "array<datetime>",
                "description": "When the record was last updated.",
                "input_formats": [
                    "rfc3339"
                ],
                "output_format": "unix_timestamp_secs",
                "fast_precision": "milliseconds",
                "indexed": true,
                "fast": true,
                "stored": false
            }
            "#,
        )
        .unwrap();

        assert_eq!(field_mapping_entry.name, "updated_at");

        let date_time_options = match field_mapping_entry.mapping_type {
            FieldMappingType::DateTime(date_time_options, Cardinality::MultiValued) => {
                date_time_options
            }
            _ => panic!("Expected a date time field mapping."),
        };
        let expected_input_formats = InputFormats(vec![DateTimeInputFormat::Rfc3339]);
        let expected_date_time_options = QuickwitDateTimeOptions {
            description: Some("When the record was last updated.".to_string()),
            input_formats: expected_input_formats,
            output_format: DateTimeOutputFormat::TimestampSecs,
            fast_precision: DateTimePrecision::Milliseconds,
            indexed: true,
            fast: true,
            stored: false,
        };
        assert_eq!(date_time_options, expected_date_time_options);
    }

    #[test]
    fn test_date_time_options_deser_default() {
        let date_time_options = serde_json::from_str::<QuickwitDateTimeOptions>("{}").unwrap();
        assert_eq!(date_time_options, QuickwitDateTimeOptions::default());
        assert_eq!(
            date_time_options.input_formats.0,
            &[DateTimeInputFormat::Rfc3339, DateTimeInputFormat::Timestamp]
        );
        assert_eq!(
            date_time_options.output_format,
            DateTimeOutputFormat::Rfc3339
        );
        assert_eq!(date_time_options.fast_precision, DateTimePrecision::Seconds);
        assert!(date_time_options.indexed);
        assert!(date_time_options.stored);
        assert!(!date_time_options.fast);
    }

    #[test]
    fn test_date_time_options_deser_denies_unknown_fields() {
        let error = serde_json::from_str::<QuickwitDateTimeOptions>(
            r#"
            {
                "tokenizer": "raw",
            }
            "#,
        )
        .unwrap_err()
        .to_string();
        assert!(error.contains("unknown field `tokenizer`"));

        let error = serde_json::from_str::<QuickwitDateTimeOptions>(
            r#"
            {
                "fast_precision": "hours",
            }
            "#,
        )
        .unwrap_err()
        .to_string();
        assert!(error.contains("unknown variant `hours`"));
    }

    #[test]
    fn test_test_date_time_options_ser() {
        let field_mapping_entry = serde_json::from_str::<FieldMappingEntry>(
            r#"
            {
                "name": "updated_at",
                "type": "datetime",
                "description": "When the record was last updated.",
                "input_formats": ["iso8601"]
            }"#,
        )
        .unwrap();

        let entry_json = serde_json::to_value(&field_mapping_entry).unwrap();
        assert_eq!(
            entry_json,
            serde_json::json!({
                "name": "updated_at",
                "type": "datetime",
                "description": "When the record was last updated.",
                "input_formats": ["iso8601"],
                "output_format": "rfc3339",
                "fast_precision": "seconds",
                "indexed": true,
                "fast": false,
                "stored": true
            })
        );
    }

    #[test]
    fn test_deserialize_input_formats_deser() {
        {
            let input_formats_json = r#"[]"#;
            let input_formats: InputFormats = serde_json::from_str(input_formats_json).unwrap();
            assert_eq!(
                input_formats.0,
                &[DateTimeInputFormat::Rfc3339, DateTimeInputFormat::Timestamp]
            );
        }
        {
            let input_formats_json = r#"["rfc3339", "unix_timestamp", "unix_timestamp"]"#;
            let input_formats: InputFormats = serde_json::from_str(input_formats_json).unwrap();
            assert_eq!(
                input_formats.0,
                &[DateTimeInputFormat::Rfc3339, DateTimeInputFormat::Timestamp]
            );
        }
    }

    #[test]
    fn test_deserialize_invalid_input_formats_should_error() {
        {
            let input_formats_json = r#"["rfc3339", "%Y-%Q-%d"]"#;
            let error = serde_json::from_str::<InputFormats>(input_formats_json)
                .unwrap_err()
                .to_string();
            assert!(error.contains("invalid strptime format"));
        }
    }

    #[test]
    fn test_date_time_options_parse_json() {
        let date_time_options = QuickwitDateTimeOptions {
            input_formats: InputFormats(vec![
                DateTimeInputFormat::Rfc3339,
                DateTimeInputFormat::Timestamp,
            ]),
            ..Default::default()
        };
        let expected_timestamp = datetime!(2012-05-21 12:09:14 UTC).unix_timestamp();
        {
            let json_value = serde_json::json!("2012-05-21T12:09:14-00:00");
            let tantivy_value = date_time_options.parse_json(&json_value).unwrap();
            let date_time = match tantivy_value {
                TantivyValue::Date(date_time) => date_time,
                other => panic!("Expected a tantivy date time, got `{other:?}`."),
            };
            assert_eq!(date_time.into_timestamp_secs(), expected_timestamp);
        }
        {
            let json_value = serde_json::json!(expected_timestamp);
            let tantivy_value = date_time_options.parse_json(&json_value).unwrap();
            let date_time = match tantivy_value {
                TantivyValue::Date(date_time) => date_time,
                other => panic!("Expected a tantivy date time, got `{other:?}`."),
            };
            assert_eq!(date_time.into_timestamp_secs(), expected_timestamp);
        }
        {
            let json_value = serde_json::json!(expected_timestamp as f64);
            let tantivy_value = date_time_options.parse_json(&json_value).unwrap();
            let date_time = match tantivy_value {
                TantivyValue::Date(date_time) => date_time,
                other => panic!("Expected a tantivy date time, got `{other:?}`."),
            };
            assert_eq!(date_time.into_timestamp_secs(), expected_timestamp);
        }
    }
}


================================================
FILE: quickwit/quickwit-doc-mapper/src/doc_mapper/doc_mapper_builder.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use serde::de::IgnoredAny;
use serde::{Deserialize, Serialize};

use crate::{DocMapper, DocMapping};

/// DocMapperBuilder is here
/// to create a valid DocMapper.
///
/// It is also used to serialize/deserialize a DocMapper.
/// note that this is not the way is the DocMapping is deserialized
/// from the configuration.
#[derive(Clone, Serialize, Deserialize)]
#[serde(deny_unknown_fields)]
pub struct DocMapperBuilder {
    /// Doc mapping.
    #[serde(flatten)]
    pub doc_mapping: DocMapping,
    /// Default search field names.
    #[serde(default)]
    pub default_search_fields: Vec<String>,

    /// Allow the "type" field separately.
    /// This is a residue from when the DocMapper was a trait.
    #[serde(rename = "type", default)]
    #[serde(skip_serializing)]
    pub legacy_type_tag: Option<IgnoredAny>,
}

#[cfg(test)]
impl Default for DocMapperBuilder {
    fn default() -> Self {
        serde_json::from_str("{}").unwrap()
    }
}

impl DocMapperBuilder {
    /// Build a valid `DocMapper`.
    /// This will consume your `DocMapperBuilder`.
    pub fn try_build(self) -> anyhow::Result<DocMapper> {
        self.try_into()
    }
}

#[cfg(test)]
mod tests {
    use super::*;
    use crate::ModeType;

    #[test]
    fn test_default_mapper_builder_deserialize_from_empty_object() {
        let default_doc_mapper_builder: DocMapperBuilder = serde_json::from_str("{}").unwrap();
        assert_eq!(
            default_doc_mapper_builder.doc_mapping.mode.mode_type(),
            ModeType::Dynamic
        );
        assert!(
            default_doc_mapper_builder
                .doc_mapping
                .field_mappings
                .is_empty()
        );
        assert!(
            default_doc_mapper_builder
                .doc_mapping
                .timestamp_field
                .is_none()
        );
        assert!(default_doc_mapper_builder.doc_mapping.tag_fields.is_empty());
        assert_eq!(default_doc_mapper_builder.doc_mapping.store_source, false);
        assert!(default_doc_mapper_builder.default_search_fields.is_empty());
    }

    #[test]
    fn test_default_mapper_builder_extra_field() {
        assert!(serde_json::from_str::<DocMapperBuilder>(r#"{"unknownfield": "blop"}"#).is_err());
    }
}


================================================
FILE: quickwit/quickwit-doc-mapper/src/doc_mapper/doc_mapper_impl.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::{BTreeMap, BTreeSet, HashSet};
use std::num::NonZeroU32;
use std::sync::Arc;

use anyhow::{Context, bail};
use fnv::FnvHashSet;
use quickwit_proto::types::DocMappingUid;
use quickwit_query::create_default_quickwit_tokenizer_manager;
use quickwit_query::query_ast::{BuildTantivyAstContext, QueryAst};
use quickwit_query::tokenizers::TokenizerManager;
use serde::{Deserialize, Serialize};
use serde_json::{self, Value as JsonValue};
use serde_json_borrow::Map as BorrowedJsonMap;
use tantivy::TantivyDocument as Document;
use tantivy::query::Query;
use tantivy::schema::{Field, FieldType, INDEXED, OwnedValue as TantivyValue, STORED, Schema};

use super::DocMapperBuilder;
use super::field_mapping_entry::RAW_TOKENIZER_NAME;
use super::field_presence::populate_field_presence;
use super::tantivy_val_to_json::tantivy_value_to_json;
use crate::doc_mapper::mapping_tree::{
    JsonValueIterator, MappingNode, MappingNodeRoot, build_field_path_from_str, build_mapping_tree,
    map_primitive_json_to_concatenate_value,
};
use crate::doc_mapper::{FieldMappingType, JsonObject, Partition};
use crate::query_builder::build_query;
use crate::routing_expression::RoutingExpr;
use crate::{
    Cardinality, DOCUMENT_SIZE_FIELD_NAME, DYNAMIC_FIELD_NAME, DocMapping, DocParsingError,
    FIELD_PRESENCE_FIELD_NAME, Mode, ModeType, NamedField, QueryParserError, SOURCE_FIELD_NAME,
    TokenizerEntry, WarmupInfo,
};

const FIELD_PRESENCE_FIELD: Field = Field::from_field_id(0u32);

/// which defines a set of rules to map json fields
/// to tantivy index fields.
///
/// The mains rules are defined by the field mappings.
#[derive(Clone, Serialize, Deserialize)]
#[serde(into = "DocMapperBuilder", try_from = "DocMapperBuilder")]
pub struct DocMapper {
    /// The UID of the doc mapping.
    doc_mapping_uid: DocMappingUid,
    /// Field in which the source should be stored.
    /// This field is only valid when using the schema associated with the default
    /// doc mapper, and therefore cannot be used in the `query` method.
    source_field: Option<Field>,
    /// Indexes field presence. It is necessary to enable this in order to run exists
    /// queries.
    index_field_presence: bool,
    /// Field in which the dynamically mapped fields should be stored.
    /// This field is only valid when using the schema associated with the default
    /// doc mapper, and therefore cannot be used in the `query` method.
    dynamic_field: Option<Field>,
    /// Field in which the len of the source document is stored as a fast field.
    document_size_field: Option<Field>,
    /// Default list of field names used for search.
    default_search_field_names: Vec<String>,
    /// Timestamp field name.
    timestamp_field_name: Option<String>,
    /// Timestamp field path (name parsed)
    timestamp_field_path: Option<Vec<String>>,
    /// Root node of the field mapping tree.
    /// See [`MappingNode`].
    field_mappings: MappingNode,
    /// Concat fields which needs to learn about any element put in dynamic_field
    concatenate_dynamic_fields: Vec<Field>,
    /// Schema generated by the store source and field mappings parameters.
    schema: Schema,
    /// List of field names used for tagging.
    tag_field_names: BTreeSet<String>,
    /// The partition key is a DSL used to route documents
    /// into specific splits.
    partition_key: RoutingExpr,
    /// Maximum number of partitions
    max_num_partitions: NonZeroU32,
    /// Defines how unmapped fields should be handle.
    mode: Mode,
    /// User-defined tokenizers.
    tokenizer_entries: Vec<TokenizerEntry>,
    /// Tokenizer manager.
    tokenizer_manager: TokenizerManager,
}

fn validate_timestamp_field(
    timestamp_field_path: &str,
    mapping_root_node: &MappingNode,
) -> anyhow::Result<()> {
    if timestamp_field_path.starts_with('.') || timestamp_field_path.starts_with("\\.") {
        bail!("timestamp field `{timestamp_field_path}` should not start with a `.`");
    }
    if timestamp_field_path.ends_with('.') {
        bail!("timestamp field `{timestamp_field_path}` should not end with a `.`");
    }
    let Some(timestamp_field_type) =
        mapping_root_node.find_field_mapping_type(timestamp_field_path)
    else {
        bail!("could not find timestamp field `{timestamp_field_path}` in field mappings");
    };
    if let FieldMappingType::DateTime(date_time_option, cardinality) = &timestamp_field_type {
        if cardinality != &Cardinality::SingleValued {
            bail!("timestamp field `{timestamp_field_path}` should be single-valued");
        }
        if !date_time_option.fast {
            bail!("timestamp field `{timestamp_field_path}` should be a fast field");
        }
    } else {
        bail!("timestamp field `{timestamp_field_path}` should be a datetime field");
    }
    Ok(())
}

impl From<DocMapper> for DocMapperBuilder {
    fn from(default_doc_mapper: DocMapper) -> Self {
        let partition_key_str = default_doc_mapper.partition_key.to_string();
        let partition_key_opt: Option<String> = if !partition_key_str.is_empty() {
            Some(partition_key_str)
        } else {
            None
        };
        let doc_mapping = DocMapping {
            doc_mapping_uid: default_doc_mapper.doc_mapping_uid,
            mode: default_doc_mapper.mode,
            field_mappings: default_doc_mapper.field_mappings.into(),
            timestamp_field: default_doc_mapper.timestamp_field_name,
            tag_fields: default_doc_mapper.tag_field_names,
            partition_key: partition_key_opt,
            max_num_partitions: default_doc_mapper.max_num_partitions,
            index_field_presence: default_doc_mapper.index_field_presence,
            store_document_size: default_doc_mapper.document_size_field.is_some(),
            store_source: default_doc_mapper.source_field.is_some(),
            tokenizers: default_doc_mapper.tokenizer_entries,
        };
        Self {
            doc_mapping,
            default_search_fields: default_doc_mapper.default_search_field_names,
            legacy_type_tag: None,
        }
    }
}

impl TryFrom<DocMapperBuilder> for DocMapper {
    type Error = anyhow::Error;

    fn try_from(builder: DocMapperBuilder) -> anyhow::Result<DocMapper> {
        let mut schema_builder = Schema::builder();

        // We want the field ID of the field presence field to be 0, so we add it to the schema
        // first.
        let field_presence_field = schema_builder.add_u64_field(FIELD_PRESENCE_FIELD_NAME, INDEXED);
        assert_eq!(field_presence_field, FIELD_PRESENCE_FIELD);

        let doc_mapping = builder.doc_mapping;

        let dynamic_field = if let Mode::Dynamic(json_options) = &doc_mapping.mode {
            Some(schema_builder.add_json_field(DYNAMIC_FIELD_NAME, json_options.clone()))
        } else {
            None
        };
        let document_size_field = if doc_mapping.store_document_size {
            let document_size_field_options = tantivy::schema::NumericOptions::default().set_fast();
            Some(
                schema_builder.add_u64_field(DOCUMENT_SIZE_FIELD_NAME, document_size_field_options),
            )
        } else {
            None
        };
        let source_field = if doc_mapping.store_source {
            Some(schema_builder.add_json_field(SOURCE_FIELD_NAME, STORED))
        } else {
            None
        };
        let MappingNodeRoot {
            field_mappings,
            concatenate_dynamic_fields,
        } = build_mapping_tree(&doc_mapping.field_mappings, &mut schema_builder)?;
        if !concatenate_dynamic_fields.is_empty() && dynamic_field.is_none() {
            bail!("concatenate field has `include_dynamic_fields` set, but index isn't dynamic");
        }
        let timestamp_field_path = if let Some(timestamp_field_name) = &doc_mapping.timestamp_field
        {
            validate_timestamp_field(timestamp_field_name, &field_mappings)?;
            Some(build_field_path_from_str(timestamp_field_name))
        } else {
            None
        };
        let schema = schema_builder.build();

        let tokenizer_manager = create_default_quickwit_tokenizer_manager();
        let mut custom_tokenizer_names = HashSet::new();
        for tokenizer_config_entry in &doc_mapping.tokenizers {
            if custom_tokenizer_names.contains(&tokenizer_config_entry.name) {
                bail!(
                    "duplicated custom tokenizer: `{}`",
                    tokenizer_config_entry.name
                );
            }
            if tokenizer_manager
                .get_tokenizer(&tokenizer_config_entry.name)
                .is_some()
            {
                bail!(
                    "custom tokenizer name `{}` should be different from built-in tokenizer's \
                     names",
                    tokenizer_config_entry.name
                );
            }
            let tokenizer = tokenizer_config_entry
                .config
                .text_analyzer()
                .map_err(|error| {
                    anyhow::anyhow!(
                        "failed to build tokenizer `{}`: {:?}",
                        tokenizer_config_entry.name,
                        error
                    )
                })?;
            let does_lowercasing = tokenizer_config_entry
                .config
                .filters
                .iter()
                .any(|filter| matches!(filter, crate::TokenFilterType::LowerCaser));
            tokenizer_manager.register(&tokenizer_config_entry.name, tokenizer, does_lowercasing);
            custom_tokenizer_names.insert(&tokenizer_config_entry.name);
        }
        validate_fields_tokenizers(&schema, &tokenizer_manager)?;

        // Resolve default search fields
        let mut default_search_field_names = Vec::new();
        for default_search_field_name in &builder.default_search_fields {
            if default_search_field_names.contains(default_search_field_name) {
                bail!(
                    "duplicated default search field: `{}`",
                    default_search_field_name
                )
            }
            let (default_search_field, _json_path) = schema
                .find_field_with_default(default_search_field_name, dynamic_field)
                .with_context(|| {
                    format!("unknown default search field `{default_search_field_name}`")
                })?;
            if !schema.get_field_entry(default_search_field).is_indexed() {
                bail!("default search field `{default_search_field_name}` is not indexed",);
            }
            default_search_field_names.push(default_search_field_name.clone());
        }

        // Resolve tag fields
        for tag_field_name in &doc_mapping.tag_fields {
            validate_tag(tag_field_name, &schema)?;
        }

        let partition_key_expr: &str = doc_mapping.partition_key.as_deref().unwrap_or("");
        let partition_key = RoutingExpr::new(partition_key_expr).with_context(|| {
            format!("failed to interpret the partition key: `{partition_key_expr}`")
        })?;

        // If valid, partition key fields should be considered as tags.
        let mut tag_field_names = doc_mapping.tag_fields;

        for partition_key in partition_key.field_names() {
            if validate_tag(&partition_key, &schema).is_ok() {
                tag_field_names.insert(partition_key);
            }
        }
        Ok(DocMapper {
            doc_mapping_uid: doc_mapping.doc_mapping_uid,
            schema,
            index_field_presence: doc_mapping.index_field_presence,
            source_field,
            dynamic_field,
            document_size_field,
            default_search_field_names,
            timestamp_field_name: doc_mapping.timestamp_field,
            timestamp_field_path,
            field_mappings,
            concatenate_dynamic_fields,
            tag_field_names,
            partition_key,
            max_num_partitions: doc_mapping.max_num_partitions,
            mode: doc_mapping.mode,
            tokenizer_entries: doc_mapping.tokenizers,
            tokenizer_manager,
        })
    }
}

/// Checks that a given field name is a valid candidate for a tag.
///
/// The conditions are:
/// - the field must be str, u64, or i64
/// - if str, the field must use the `raw` tokenizer for indexing.
/// - the field must be indexed.
fn validate_tag(tag_field_name: &str, schema: &Schema) -> Result<(), anyhow::Error> {
    if tag_field_name.starts_with('.') || tag_field_name.starts_with("\\.") {
        bail!("tag field `{tag_field_name}` should not start with a `.`");
    }
    if tag_field_name.ends_with('.') {
        bail!("tag field `{tag_field_name}` should not end with a `.`");
    }
    let field = schema
        .get_field(tag_field_name)
        .with_context(|| format!("unknown tag field: `{tag_field_name}`"))?;
    let field_type = schema.get_field_entry(field).field_type();
    match field_type {
        FieldType::Str(options) => {
            let tokenizer_opt = options
                .get_indexing_options()
                .map(|text_options: &tantivy::schema::TextFieldIndexing| text_options.tokenizer());
            if tokenizer_opt != Some(RAW_TOKENIZER_NAME) {
                bail!("tags collection is only allowed on text fields with the `raw` tokenizer");
            }
        }
        FieldType::U64(_) | FieldType::I64(_) => {
            // u64 and i64 are accepted as tags.
        }
        _ => {
            // We avoid the bytes / bool / f64 types,
            // as they are generally speaking poor tags and we want to avoid
            // bugs associated to the multiplicity of their representation.
            //
            // (Tags are relying heavily on string manipulation and we want to
            // avoid a "ZRP because you searched you searched for 0.100 instead of 0.1",
            // or `myflag:1`, `myflag:True` instead of `myflag:true`.
            bail!(
                "tags collection is not allowed on `{}` fields",
                field_type.value_type().name().to_lowercase()
            )
        }
    }
    if !field_type.is_indexed() {
        bail!(
            "tag fields are required to be indexed. (`{}` is not configured as indexed)",
            tag_field_name
        )
    }
    Ok(())
}

/// Checks that a given text/json field name has a registered tokenizer.
fn validate_fields_tokenizers(
    schema: &Schema,
    tokenizer_manager: &TokenizerManager,
) -> Result<(), anyhow::Error> {
    for (_, field_entry) in schema.fields() {
        let tokenizer_name_opt = match field_entry.field_type() {
            FieldType::Str(options) => options
                .get_indexing_options()
                .map(|text_options: &tantivy::schema::TextFieldIndexing| text_options.tokenizer()),
            FieldType::JsonObject(options) => options
                .get_text_indexing_options()
                .map(|text_options: &tantivy::schema::TextFieldIndexing| text_options.tokenizer()),
            _ => None,
        };
        if let Some(tokenizer_name) = tokenizer_name_opt
            && tokenizer_manager.get_tokenizer(tokenizer_name).is_none()
        {
            bail!(
                "unknown tokenizer `{}` for field `{}`",
                tokenizer_name,
                field_entry.name()
            );
        }
    }
    Ok(())
}

impl std::fmt::Debug for DocMapper {
    fn fmt(&self, formatter: &mut std::fmt::Formatter) -> std::fmt::Result {
        formatter
            .debug_struct("DocMapper")
            .field("store_source", &self.source_field.is_some())
            .field(
                "default_search_field_names",
                &self.default_search_field_names,
            )
            .field("timestamp_field_name", &self.timestamp_field_name())
            // TODO: complete it.
            .finish()
    }
}

fn extract_single_obj(
    doc: &mut BTreeMap<String, Vec<TantivyValue>>,
    key: &str,
) -> anyhow::Result<Option<serde_json::Map<String, JsonValue>>> {
    let mut values = if let Some(values) = doc.remove(key) {
        values
    } else {
        return Ok(None);
    };
    if values.len() > 1 {
        bail!(
            "invalid named document. there are more than 1 value associated to the `{key}` field"
        );
    }
    match values.pop() {
        Some(TantivyValue::Object(dynamic_json_obj)) => Ok(Some(
            dynamic_json_obj
                .into_iter()
                .map(|(key, val)| (key, tantivy_value_to_json(val)))
                .collect(),
        )),
        Some(_) => {
            bail!("the `{key}` value has to be a json object");
        }
        None => Ok(None),
    }
}

impl DocMapper {
    /// Returns the unique identifier of the doc mapping.
    pub fn doc_mapping_uid(&self) -> DocMappingUid {
        self.doc_mapping_uid
    }

    /// Validates a JSON object according to the doc mapper.
    pub fn validate_json_obj(&self, json_obj: &BorrowedJsonMap) -> Result<(), DocParsingError> {
        let is_strict = self.mode.mode_type() == ModeType::Strict;
        let mut field_path = Vec::new();
        self.field_mappings
            .validate_from_json(json_obj, is_strict, &mut field_path)?;
        if let Some(timestamp_field_path) = &self.timestamp_field_path {
            let missing_ts_field =
                || DocParsingError::RequiredField("timestamp field is required".to_string());
            match &timestamp_field_path[..] {
                [] => (), // ?
                [single_part] => {
                    let obj = json_obj.get(single_part).ok_or_else(missing_ts_field)?;
                    if !(obj.is_string() || obj.is_number()) {
                        return Err(missing_ts_field());
                    }
                }
                [first_part, more_part @ ..] => {
                    let mut obj = json_obj.get(first_part).ok_or_else(missing_ts_field)?;
                    for part in more_part {
                        obj = obj
                            .as_object()
                            .ok_or_else(missing_ts_field)?
                            .get(part)
                            .ok_or_else(missing_ts_field)?;
                    }
                    if !(obj.is_string() || obj.is_number()) {
                        return Err(missing_ts_field());
                    }
                }
            };
        }
        Ok(())
    }

    /// Parses a JSON byte slice into a tantivy [`Document`].
    pub fn doc_from_json_bytes(
        &self,
        json_doc: &[u8],
    ) -> Result<(Partition, Document), DocParsingError> {
        let json_obj: JsonObject = serde_json::from_slice(json_doc).map_err(|_| {
            let json_doc_sample: String = std::str::from_utf8(json_doc)
                .map(|doc_str| doc_str.chars().take(20).chain("...".chars()).collect())
                .unwrap_or_else(|_| "document contains some invalid UTF-8 characters".to_string());
            DocParsingError::NotJsonObject(json_doc_sample)
        })?;
        self.doc_from_json_obj(json_obj, json_doc.len() as u64)
    }

    /// Parses a JSON string into a tantivy [`Document`].
    pub fn doc_from_json_str(
        &self,
        json_doc: &str,
    ) -> Result<(Partition, Document), DocParsingError> {
        let json_obj: JsonObject = serde_json::from_str(json_doc).map_err(|_| {
            let json_doc_sample: String = json_doc.chars().take(20).chain("...".chars()).collect();
            DocParsingError::NotJsonObject(json_doc_sample)
        })?;
        self.doc_from_json_obj(json_obj, json_doc.len() as u64)
    }

    /// Transforms a JSON object into a tantivy [`Document`] according to the rules
    /// defined for the `DocMapper`.
    pub fn doc_from_json_obj(
        &self,
        json_obj: JsonObject,
        document_len: u64,
    ) -> Result<(Partition, Document), DocParsingError> {
        let partition: Partition = self.partition_key.eval_hash(&json_obj);

        let mut dynamic_json_obj = serde_json::Map::default();
        let mut field_path = Vec::new();
        let mut document = Document::default();

        if let Some(source_field) = self.source_field {
            document.add_object(
                source_field,
                json_obj
                    .clone()
                    .into_iter()
                    .map(|(key, val)| (key, TantivyValue::from(val)))
                    .collect(),
            );
        }

        let mode = self.mode.mode_type();
        self.field_mappings.doc_from_json(
            json_obj,
            mode,
            &mut document,
            &mut field_path,
            &mut dynamic_json_obj,
        )?;

        if let Some(dynamic_field) = self.dynamic_field
            && !dynamic_json_obj.is_empty()
        {
            if !self.concatenate_dynamic_fields.is_empty() {
                let json_obj_values =
                    JsonValueIterator::new(serde_json::Value::Object(dynamic_json_obj.clone()))
                        .flat_map(map_primitive_json_to_concatenate_value);

                for value in json_obj_values {
                    for concatenate_dynamic_field in self.concatenate_dynamic_fields.iter() {
                        document.add_field_value(*concatenate_dynamic_field, &value);
                    }
                }
            }
            document.add_object(
                dynamic_field,
                dynamic_json_obj
                    .into_iter()
                    .map(|(key, val)| (key, TantivyValue::from(val)))
                    .collect(),
            );
        }

        if let Some(document_size_field) = self.document_size_field {
            document.add_u64(document_size_field, document_len);
        }

        if self.index_field_presence {
            let field_presence_hashes: FnvHashSet<u64> =
                populate_field_presence(&document, &self.schema, true);
            for field_presence_hash in field_presence_hashes {
                document.add_field_value(FIELD_PRESENCE_FIELD, &field_presence_hash);
            }
        }
        Ok((partition, document))
    }

    /// Converts a tantivy named Document to the json format.
    ///
    /// Tantivy does not have any notion of cardinality nor object.
    /// It is therefore up to the `DocMapper` to pick a tantivy named document
    /// and convert it into a final quickwit document.
    ///
    /// Because this operation is dependent on the `DocMapper`, this
    /// method is meant to be called on the root node using the most recent
    /// `DocMapper`. This ensures that the different hits are formatted according
    /// to the same schema.
    pub fn doc_to_json(
        &self,
        mut named_doc: BTreeMap<String, Vec<TantivyValue>>,
    ) -> anyhow::Result<serde_json::Map<String, JsonValue>> {
        let mut doc_json =
            extract_single_obj(&mut named_doc, DYNAMIC_FIELD_NAME)?.unwrap_or_default();
        let mut field_path: Vec<&str> = Vec::new();
        self.field_mappings
            .populate_json(&mut named_doc, &mut field_path, &mut doc_json);
        if let Some(source_json) = extract_single_obj(&mut named_doc, SOURCE_FIELD_NAME)? {
            doc_json.insert(
                SOURCE_FIELD_NAME.to_string(),
                JsonValue::Object(source_json),
            );
        }
        if matches!(
            self.mode,
            Mode::Dynamic(ref opt) if opt.stored
        ) {
            // if we are in dynamic mode and there are other fields lefts, we should print them.
            // They probably come from older schemas when these fields had a dedicated entry
            'field: for (key, mut value) in named_doc {
                if key.starts_with('_') {
                    // this is an internal field, not meant to be shown
                    continue 'field;
                }
                let Ok(path) = crate::routing_expression::parse_field_name(&key) else {
                    continue 'field;
                };
                let Some((last_segment, path)) = path.split_last() else {
                    continue 'field;
                };
                let mut map = &mut doc_json;
                for segment in path {
                    let obj = if map.contains_key(&**segment) {
                        // we have to do this strange dance to please the borrowchecker
                        map.get_mut(&**segment).unwrap()
                    } else {
                        map.insert(segment.to_string(), serde_json::Map::new().into());
                        map.get_mut(&**segment).unwrap()
                    };
                    let JsonValue::Object(inner_map) = obj else {
                        continue 'field;
                    };
                    map = inner_map;
                }
                map.entry(&**last_segment).or_insert_with(|| {
                    if value.len() == 1 {
                        tantivy_value_to_json(value.pop().unwrap())
                    } else {
                        JsonValue::Array(value.into_iter().map(tantivy_value_to_json).collect())
                    }
                });
            }
        }

        Ok(doc_json)
    }

    /// Returns the query.
    ///
    /// Considering schema evolution, splits within an index can have different schema
    /// over time. So `split_schema` is the schema of the split the query is targeting.
    pub fn query(
        &self,
        split_schema: Schema,
        query_ast: QueryAst,
        with_validation: bool,
        cache_context: Option<(Arc<dyn quickwit_query::query_ast::PredicateCache>, String)>,
    ) -> Result<(Box<dyn Query>, WarmupInfo), QueryParserError> {
        build_query(
            query_ast,
            &BuildTantivyAstContext {
                schema: &split_schema,
                tokenizer_manager: self.tokenizer_manager(),
                search_fields: &self.default_search_field_names[..],
                with_validation,
            },
            cache_context,
        )
    }

    /// Returns the list of search fields to search into, when no field is specified.
    /// (See `UserInputQuery`).
    pub fn default_search_fields(&self) -> &[String] {
        &self.default_search_field_names
    }

    /// Returns the schema.
    ///
    /// Considering schema evolution, splits within an index can have different schema
    /// over time. The schema returned here represents the most up-to-date schema of the index.
    pub fn schema(&self) -> Schema {
        self.schema.clone()
    }

    /// Returns the timestamp field name.
    pub fn timestamp_field_name(&self) -> Option<&str> {
        self.timestamp_field_name.as_deref()
    }

    /// Returns the tag `NameField`s on the current schema.
    /// Returns an error if a tag field is not found in this schema.
    pub fn tag_named_fields(&self) -> anyhow::Result<Vec<NamedField>> {
        let index_schema = self.schema();
        self.tag_field_names()
            .iter()
            .map(|field_name| {
                index_schema
                    .get_field(field_name)
                    .context(format!("field `{field_name}` must exist in the schema"))
                    .map(|field| NamedField {
                        name: field_name.clone(),
                        field,
                        field_type: index_schema.get_field_entry(field).field_type().clone(),
                    })
            })
            .collect::<Result<Vec<_>, _>>()
    }

    /// Returns the tag `NameField`s on the current schema.
    /// Returns an error if a tag field is not found in this schema.
    pub fn tag_field_names(&self) -> BTreeSet<String> {
        self.tag_field_names.clone()
    }

    /// Returns the maximum number of partitions.
    pub fn max_num_partitions(&self) -> NonZeroU32 {
        self.max_num_partitions
    }

    /// Returns the tokenizer manager.
    pub fn tokenizer_manager(&self) -> &TokenizerManager {
        &self.tokenizer_manager
    }
}

#[cfg(test)]
mod tests {
    use std::collections::{HashMap, HashSet};
    use std::iter::zip;

    use itertools::Itertools;
    use quickwit_common::PathHasher;
    use quickwit_query::query_ast::query_ast_from_user_text;
    use serde_json::{self, Value as JsonValue, json};
    use tantivy::schema::{
        FieldType, IndexRecordOption, OwnedValue as TantivyValue, OwnedValue, Type, Value,
    };

    use super::DocMapper;
    use crate::doc_mapper::field_mapping_entry::{DEFAULT_TOKENIZER_NAME, RAW_TOKENIZER_NAME};
    use crate::{
        DOCUMENT_SIZE_FIELD_NAME, DYNAMIC_FIELD_NAME, DocMapperBuilder, DocParsingError,
        FIELD_PRESENCE_FIELD_NAME, SOURCE_FIELD_NAME,
    };

    fn example_json_doc_value() -> JsonValue {
        serde_json::json!({
            "timestamp": 1586960586i64,
            "body": "20200415T072306-0700 INFO This is a great log",
            "response_date2": "2021-12-19T16:39:57+00:00",
            "response_date": "2021-12-19T16:39:57Z",
            "response_time": 2.3,
            "response_payload": "YWJj",
            "owner": "foo",
            "isImportant": false,
            "attributes": {
                "server": "ABC",
                "tags": [22, 23],
                "server.status": ["200", "201"],
                "server.payload": ["YQ==", "Yg=="]
            }
        })
    }

    const EXPECTED_JSON_PATHS_AND_VALUES: &str = r#"{
            "timestamp": ["2020-04-15T14:23:06Z"],
            "body": ["20200415T072306-0700 INFO This is a great log"],
            "response_date": ["2021-12-19T16:39:57Z"],
            "response_time": [2.3],
            "response_payload": ["YWJj"],
            "owner": ["foo"],
            "isImportant": [false],
            "body_other_tokenizer": ["20200415T072306-0700 INFO This is a great log"],
            "attributes.server": ["ABC"],
            "attributes.server\\.payload": ["YQ==", "Yg=="],
            "attributes.tags": [22, 23],
            "attributes.server\\.status": ["200", "201"]
        }"#;

    #[test]
    fn test_json_deserialize() -> anyhow::Result<()> {
        let config = crate::default_doc_mapper_for_test();
        assert!(config.source_field.is_some());
        let mut default_search_field_names: Vec<String> = config.default_search_field_names;
        default_search_field_names.sort();
        assert_eq!(
            default_search_field_names,
            ["attributes.server", r"attributes.server\.status", "body"]
        );
        assert_eq!(config.field_mappings.num_fields(), 10);
        Ok(())
    }

    #[test]
    fn test_parsing_document() {
        let json_doc = example_json_doc_value();
        let doc_mapper = crate::default_doc_mapper_for_test();
        let (_, document) = doc_mapper
            .doc_from_json_obj(json_doc.as_object().unwrap().clone(), 0)
            .unwrap();
        let schema = doc_mapper.schema();
        // 9 property entry + 1 field "_source" + 2 fields values for "tags" field
        // + 2 values inf "server.status" field + 2 values in "server.payload" field
        // + 7 values for field presence
        assert_eq!(document.len(), 23);
        let expected_json_paths_and_values: HashMap<String, JsonValue> =
            serde_json::from_str(EXPECTED_JSON_PATHS_AND_VALUES).unwrap();
        let mut field_presences: HashSet<u64> = HashSet::new();
        for (field, value) in document.field_values() {
            let owned_value: OwnedValue = value.into();
            let field_name = schema.get_field_name(field);
            if field_name == SOURCE_FIELD_NAME {
                // some part of aws-sdk enables `preserve_order` on serde_json.
                // to get "normal" equality, we are forced to recreate the json object
                // with sorted keys.
                let sorted_json_values = json_doc
                    .as_object()
                    .unwrap()
                    .clone()
                    .into_iter()
                    .sorted_by(|k1, k2| k1.0.cmp(&k2.0))
                    .collect::<serde_json::Map<_, _>>();
                assert_eq!(
                    tantivy::schema::OwnedValue::from(value.as_value()),
                    tantivy::schema::OwnedValue::from(sorted_json_values)
                );
            } else if field_name == DYNAMIC_FIELD_NAME {
                assert_eq!(
                    serde_json::to_string(&owned_value).unwrap(),
                    r#"{"response_date2":"2021-12-19T16:39:57Z"}"#
                );
            } else if field_name == FIELD_PRESENCE_FIELD_NAME {
                let field_presence_u64 = value.as_u64().unwrap();
                field_presences.insert(field_presence_u64);
            } else {
                let value = serde_json::to_string(&owned_value).unwrap();
                let is_value_in_expected_values = expected_json_paths_and_values
                    .get(field_name)
                    .unwrap()
                    .as_array()
                    .unwrap()
                    .iter()
                    .map(|expected_value| format!("{expected_value}"))
                    .any(|expected_value| expected_value == value);
                if !is_value_in_expected_values {
                    panic!("Could not find: {value:?} in {expected_json_paths_and_values:?}");
                }
            }
        }
        assert_eq!(field_presences.len(), 7);
        let timestamp_field = schema.get_field("timestamp").unwrap();
        let body_field = schema.get_field("body").unwrap();
        let attributes_field = schema.get_field("attributes.server").unwrap();
        assert!(!field_presences.contains(&PathHasher::hash_path(&[
            &timestamp_field.field_id().to_le_bytes()[..]
        ])));
        assert!(field_presences.contains(&PathHasher::hash_path(&[
            &body_field.field_id().to_le_bytes()[..]
        ])));
        assert!(field_presences.contains(&PathHasher::hash_path(&[
            &attributes_field.field_id().to_le_bytes()[..]
        ])));
    }

    #[test]
    fn test_accept_parsing_document_with_unknown_fields_and_missing_fields() {
        let doc_mapper = crate::default_doc_mapper_for_test();
        doc_mapper
            .doc_from_json_str(
                r#"{
                "timestamp": 1586960586000,
                "unknown_field": "20200415T072306-0700 INFO This is a great log",
                "response_date": "2021-12-19T16:39:57+00:00",
                "response_time": 12,
                "response_payload": "YWJj"
            }"#,
            )
            .unwrap();
    }

    #[test]
    fn test_fail_to_parse_document_with_wrong_cardinality() -> anyhow::Result<()> {
        let doc_mapper = crate::default_doc_mapper_for_test();
        let result = doc_mapper.doc_from_json_str(
            r#"{
                "timestamp": 1586960586000,
                "body": ["text 1", "text 2"]
            }"#,
        );
        assert!(result.is_err());
        let error = result.unwrap_err();
        assert_eq!(
            error,
            DocParsingError::MultiValuesNotSupported("body".to_owned())
        );
        Ok(())
    }

    #[test]
    fn test_fail_to_parse_document_with_wrong_value() -> anyhow::Result<()> {
        let doc_mapper = crate::default_doc_mapper_for_test();
        let result = doc_mapper.doc_from_json_str(
            r#"{
                "timestamp": 1586960586000,
                "body": 1
            }"#,
        );
        assert!(result.is_err());
        let error = result.unwrap_err();
        assert_eq!(
            error,
            DocParsingError::ValueError("body".to_owned(), "expected string, got `1`".to_owned())
        );
        Ok(())
    }

    #[test]
    fn test_timestamp_field_in_object_is_valid() {
        serde_json::from_str::<DocMapper>(
            r#"{
            "field_mappings": [
                {
                    "name": "some_obj",
                    "type": "object",
                    "field_mappings": [
                        {
                            "name": "timestamp",
                            "type": "datetime",
                            "fast": true
                        }
                    ]
                }
            ],
            "timestamp_field": "some_obj.timestamp"
        }"#,
        )
        .unwrap();

        serde_yaml::from_str::<DocMapper>(
            r#"
            field_mappings:
              - name: some_obj
                type: object
                field_mappings:
                  - name: timestamp
                    type: datetime
                    fast: true
            timestamp_field: some_obj.timestamp
        "#,
        )
        .unwrap();
    }

    #[test]
    fn test_timestamp_field_with_dots_in_its_name_is_valid() {
        serde_json::from_str::<DocMapper>(
            r#"{
            "field_mappings": [
                {
                    "name": "my.timestamp",
                    "type": "datetime",
                    "fast": true
                }
            ],
            "timestamp_field": "my\\.timestamp"
        }"#,
        )
        .unwrap();

        serde_yaml::from_str::<DocMapper>(
            r#"
            field_mappings:
              - name: my.timestamp
                type: datetime
                fast: true
            timestamp_field: "my\\.timestamp"
        "#,
        )
        .unwrap();
    }

    #[test]
    fn test_timestamp_field_that_start_with_dot_is_invalid() {
        assert_eq!(
            serde_json::from_str::<DocMapper>(
                r#"{
                "field_mappings": [
                    {
                        "name": "my.timestamp",
                        "type": "datetime",
                        "fast": true
                    }
                ],
                "timestamp_field": ".my.timestamp"
            }"#,
            )
            .unwrap_err()
            .to_string(),
            "timestamp field `.my.timestamp` should not start with a `.`",
        );

        assert_eq!(
            serde_json::from_str::<DocMapper>(
                r#"{
                "field_mappings": [
                    {
                        "name": "my.timestamp",
                        "type": "datetime",
                        "fast": true
                    }
                ],
                "timestamp_field": "\\.my\\.timestamp"
            }"#,
            )
            .unwrap_err()
            .to_string(),
            "timestamp field `\\.my\\.timestamp` should not start with a `.`",
        )
    }

    #[test]
    fn test_timestamp_field_that_ends_with_dot_is_invalid() {
        assert_eq!(
            serde_json::from_str::<DocMapper>(
                r#"{
                    "timestamp_field": "my.timestamp."
                }"#,
            )
            .unwrap_err()
            .to_string(),
            "timestamp field `my.timestamp.` should not end with a `.`",
        );

        assert_eq!(
            serde_json::from_str::<DocMapper>(
                r#"{
                    "timestamp_field": "my\\.timestamp\\."
                }"#,
            )
            .unwrap_err()
            .to_string(),
            "timestamp field `my\\.timestamp\\.` should not end with a `.`",
        )
    }

    #[test]
    fn test_tag_field_name_that_starts_with_dot_is_invalid() {
        assert_eq!(
            serde_json::from_str::<DocMapper>(
                r#"{
                    "tag_fields": [".my.tag"]
                }"#,
            )
            .unwrap_err()
            .to_string(),
            "tag field `.my.tag` should not start with a `.`",
        );

        assert_eq!(
            serde_json::from_str::<DocMapper>(
                r#"{
                    "tag_fields": ["\\.my\\.tag"]
                }"#,
            )
            .unwrap_err()
            .to_string(),
            "tag field `\\.my\\.tag` should not start with a `.`",
        )
    }

    #[test]
    fn test_tag_field_name_that_ends_with_dot_is_invalid() {
        assert_eq!(
            serde_json::from_str::<DocMapper>(
                r#"{
                    "tag_fields": ["my.tag."]
                }"#,
            )
            .unwrap_err()
            .to_string(),
            "tag field `my.tag.` should not end with a `.`",
        );

        assert_eq!(
            serde_json::from_str::<DocMapper>(
                r#"{
                    "tag_fields": ["my\\.tag\\."]
                }"#,
            )
            .unwrap_err()
            .to_string(),
            "tag field `my\\.tag\\.` should not end with a `.`",
        )
    }

    #[test]
    fn test_fail_to_build_doc_mapper_with_timestamp_field_with_multivalues_cardinality() {
        let doc_mapper = r#"{
            "timestamp_field": "timestamp",
            "tag_fields": [],
            "field_mappings": [
                {
                    "name": "timestamp",
                    "type": "array<i64>"
                }
            ]
        }"#;
        let builder = serde_json::from_str::<DocMapperBuilder>(doc_mapper).unwrap();
        let expected_msg = "timestamp field `timestamp` should be a datetime field";
        assert_eq!(&builder.try_build().unwrap_err().to_string(), &expected_msg);
    }

    #[test]
    fn test_fail_to_build_doc_mapper_with_non_fast_timestamp_field() {
        let doc_mapper = r#"{
            "default_search_fields": [],
            "timestamp_field": "timestamp",
            "tag_fields": [],
            "field_mappings": [
                {
                    "name": "timestamp",
                    "type": "datetime",
                    "fast": false
                }
            ]
        }"#;
        let builder = serde_json::from_str::<DocMapperBuilder>(doc_mapper).unwrap();
        let expected_msg = "timestamp field `timestamp` should be a fast field";
        assert_eq!(&builder.try_build().unwrap_err().to_string(), &expected_msg);
    }

    #[test]
    fn test_fail_to_build_doc_mapper_with_duplicate_fields() {
        {
            let doc_mapper = r#"{
                "field_mappings": [
                    {"name": "body","type": "text"},
                    {"name": "body","type": "bytes"}
                ]
            }"#;
            let builder = serde_json::from_str::<DocMapperBuilder>(doc_mapper).unwrap();
            let expected_msg = "duplicated field definition `body`";
            assert_eq!(&builder.try_build().unwrap_err().to_string(), expected_msg);
        }

        {
            let doc_mapper = r#"{
                "field_mappings": [
                    {
                        "name": "identity",
                        "type": "object",
                        "field_mappings": [
                            {"type": "text", "name": "username"},
                            {"type": "text", "name": "username"}
                        ]
                    },
                    {"type": "text", "name": "body"}
                ]
            }"#;
            let builder = serde_json::from_str::<DocMapperBuilder>(doc_mapper).unwrap();
            let expected_msg = "duplicated field definition `username`";
            assert_eq!(&builder.try_build().unwrap_err().to_string(), expected_msg);
        }
    }

    #[test]
    fn test_should_build_doc_mapper_with_duplicate_fields_at_different_level() {
        let doc_mapper = r#"{
            "field_mappings": [
                {
                    "name": "identity",
                    "type": "object",
                    "field_mappings": [
                        {"type": "text", "name": "body"},
                        {"type": "text", "name": "username"}
                    ]
                },
                {"type": "text", "name": "body"}
            ]
        }"#;
        let builder = serde_json::from_str::<DocMapperBuilder>(doc_mapper).unwrap();
        assert!(builder.try_build().is_ok());
    }

    #[test]
    fn test_fail_to_build_doc_mapper_with_multivalued_timestamp_field() {
        let doc_mapper = r#"{
            "default_search_fields": [],
            "timestamp_field": "timestamp",
            "tag_fields": [],
            "field_mappings": [
                {
                    "name": "timestamp",
                    "type": "array<datetime>",
                    "fast": true
                }
            ]
        }"#;

        let builder = serde_json::from_str::<DocMapperBuilder>(doc_mapper).unwrap();
        let expected_msg = "timestamp field `timestamp` should be single-valued";
        assert_eq!(&builder.try_build().unwrap_err().to_string(), expected_msg);
    }

    #[test]
    fn test_fail_with_field_name_equal_to_source() {
        let doc_mapper = r#"{
            "default_search_fields": [],
            "tag_fields": [],
            "field_mappings": [
                {
                    "name": "_source",
                    "type": "i64"
                }
            ]
        }"#;
        let deser_err = serde_json::from_str::<DocMapperBuilder>(doc_mapper)
            .err()
            .unwrap();
        assert!(
            deser_err
                .to_string()
                .contains("the following fields are reserved for Quickwit internal usage")
        );
    }

    #[test]
    fn test_fail_to_parse_document_with_wrong_base64_value() -> anyhow::Result<()> {
        let doc_mapper = r#"{
            "default_search_fields": [],
            "timestamp_field": null,
            "tag_fields": [],
            "field_mappings": [
                {
                    "name": "image",
                    "type": "bytes",
                    "stored": true
                }
            ]
        }"#;
        let builder = serde_json::from_str::<DocMapperBuilder>(doc_mapper)?;
        let doc_mapper = builder.try_build()?;
        let result = doc_mapper.doc_from_json_str(
            r#"{
            "image": "invalid base64 data"
        }"#,
        );
        let expected_msg = "the field `image` could not be parsed: expected base64 string, got \
                            `invalid base64 data`: Invalid symbol 32, offset 7.";
        assert_eq!(result.unwrap_err().to_string(), expected_msg);
        Ok(())
    }

    #[test]
    fn test_parse_document_with_tag_fields() {
        let doc_mapper = r#"{
            "default_search_fields": [],
            "index_field_presence": true,
            "timestamp_field": null,
            "tag_fields": ["city"],
            "store_source": true,
            "field_mappings": [
                {
                    "name": "city",
                    "type": "text",
                    "stored": true,
                    "tokenizer": "raw"
                },
                {
                    "name": "image",
                    "type": "bytes",
                    "stored": true
                }
            ]
        }"#;

        let builder = serde_json::from_str::<DocMapperBuilder>(doc_mapper).unwrap();
        let doc_mapper = builder.try_build().unwrap();
        let schema = doc_mapper.schema();
        let json_doc_value: JsonValue = serde_json::json!({
            "city": "tokio",
            "image": "YWJj"
        });
        let (_, document) = doc_mapper
            .doc_from_json_obj(json_doc_value.as_object().unwrap().clone(), 0)
            .unwrap();

        // 2 properties, + 1 value for "_source" + 2 for field presence.
        assert_eq!(document.len(), 5);
        let expected_json_paths_and_values: HashMap<String, JsonValue> = serde_json::from_str(
            r#"{
                "city": ["tokio"],
                "image": ["YWJj"]
            }"#,
        )
        .unwrap();
        let mut field_presences: HashSet<u64> = HashSet::default();
        document.field_values().for_each(|(field, value)| {
            let owned_value: OwnedValue = value.into();
            let field_name = schema.get_field_name(field);
            if field_name == SOURCE_FIELD_NAME {
                assert_eq!(
                    tantivy::schema::OwnedValue::from(value.as_value()),
                    tantivy::schema::OwnedValue::from(json_doc_value.as_object().unwrap().clone())
                );
            } else if field_name == FIELD_PRESENCE_FIELD_NAME {
                let field_value_hash = value.as_u64().unwrap();
                field_presences.insert(field_value_hash);
            } else {
                let value = serde_json::to_string(&owned_value).unwrap();
                let is_value_in_expected_values = expected_json_paths_and_values
                    .get(field_name)
                    .unwrap()
                    .as_array()
                    .unwrap()
                    .iter()
                    .map(|expected_value| format!("{expected_value}"))
                    .any(|expected_value| expected_value == value);
                assert!(is_value_in_expected_values);
            }
        });
        assert_eq!(field_presences.len(), 2);
        let city_field = schema.get_field("city").unwrap();
        let image_field = schema.get_field("image").unwrap();
        assert!(field_presences.contains(&PathHasher::hash_path(&[
            &city_field.field_id().to_le_bytes()
        ])));
        assert!(field_presences.contains(&PathHasher::hash_path(&[
            &image_field.field_id().to_le_bytes()
        ])));
    }

    #[test]
    fn test_partition_key_in_tags() {
        let doc_mapper = r#"{
            "default_search_fields": [],
            "timestamp_field": null,
            "tag_fields": ["city"],
            "store_source": true,
            "partition_key": "hash_mod((service,division,city), 50)",
            "field_mappings": [
                {
                    "name": "city",
                    "type": "text",
                    "stored": true,
                    "tokenizer": "raw"
                },
                {
                    "name": "division",
                    "type": "text",
                    "stored": true,
                    "tokenizer": "raw"
                },
                {
                    "name": "service",
                    "type": "text",
                    "stored": true,
                    "tokenizer": "raw"
                }
            ]
        }"#;

        let builder = serde_json::from_str::<DocMapperBuilder>(doc_mapper).unwrap();
        let doc_mapper = builder.try_build().unwrap();
        let tag_fields: Vec<_> = doc_mapper.tag_field_names.into_iter().collect();
        assert_eq!(tag_fields, vec!["city", "division", "service",]);
    }

    #[test]
    fn test_partition_key_in_tags_without_explicit_tags() {
        let doc_mapper = r#"{
            "default_search_fields": [],
            "timestamp_field": null,
            "store_source": true,
            "partition_key": "service,hash_mod((division,city), 50)",
            "field_mappings": [
                {
                    "name": "city",
                    "type": "text",
                    "stored": true,
                    "tokenizer": "raw"
                },
                {
                    "name": "division",
                    "type": "text",
                    "stored": true,
                    "tokenizer": "raw"
                },
                {
                    "name": "service",
                    "type": "text",
                    "stored": true,
                    "tokenizer": "raw"
                }
            ]
        }"#;

        let builder = serde_json::from_str::<DocMapperBuilder>(doc_mapper).unwrap();
        let doc_mapper = builder.try_build().unwrap();
        let tag_fields: Vec<_> = doc_mapper.tag_field_names.into_iter().collect();
        assert_eq!(tag_fields, vec!["city", "division", "service",]);
    }

    #[test]
    fn test_build_doc_mapper_with_tag_field_with_dots_in_its_name() {
        let doc_mapper = r#"{
            "default_search_fields": [],
            "tag_fields": ["my\\.city\\.id"],
            "field_mappings": [
                {
                    "name": "my.city.id",
                    "type": "u64"
                }
            ]
        }"#;
        serde_json::from_str::<DocMapper>(doc_mapper).unwrap();
    }

    #[test]
    fn test_build_doc_mapper_with_tag_field_in_object() {
        let doc_mapper = r#"{
            "default_search_fields": [],
            "tag_fields": ["location.city"],
            "field_mappings": [
                {
                    "name": "location",
                    "type": "object",
                    "field_mappings": [
                        {
                            "name": "city",
                            "type": "u64"
                        }
                    ]
                }
            ]
        }"#;
        serde_json::from_str::<DocMapper>(doc_mapper).unwrap();
    }

    #[test]
    fn test_fail_to_build_doc_mapper_with_wrong_tag_fields_types() -> anyhow::Result<()> {
        let doc_mapper_one = r#"{
            "default_search_fields": [],
            "tag_fields": ["city"],
            "field_mappings": [
                {
                    "name": "city",
                    "type": "text"
                }
            ]
        }"#;
        assert_eq!(
            serde_json::from_str::<DocMapperBuilder>(doc_mapper_one)?
                .try_build()
                .unwrap_err()
                .to_string(),
            "tags collection is only allowed on text fields with the `raw` tokenizer".to_string(),
        );

        let doc_mapper_two = r#"{
            "default_search_fields": [],
            "tag_fields": ["photo"],
            "field_mappings": [
                {
                    "name": "photo",
                    "type": "bytes"
                }
            ]
        }"#;
        assert_eq!(
            serde_json::from_str::<DocMapperBuilder>(doc_mapper_two)?
                .try_build()
                .unwrap_err()
                .to_string(),
            "tags collection is not allowed on `bytes` fields".to_string(),
        );
        Ok(())
    }

    // See #1132
    #[test]
    fn test_by_default_store_source_is_false_and_fields_are_stored_individually() {
        let doc_mapper = r#"{
            "default_search_fields": [],
            "field_mappings": [
                {
                    "name": "my-field",
                    "type": "u64",
                    "indexed": true
                }
            ]
        }"#;
        let builder = serde_json::from_str::<DocMapperBuilder>(doc_mapper).unwrap();
        let default_doc_mapper = builder.try_build().unwrap();
        assert!(default_doc_mapper.source_field.is_none());
        let schema = default_doc_mapper.schema();
        let field = schema.get_field("my-field").unwrap();
        let field_entry = schema.get_field_entry(field);
        assert!(field_entry.is_stored());
    }

    #[test]
    fn test_lenient_mode_schema() {
        let default_doc_mapper: DocMapper =
            serde_json::from_str(r#"{ "mode": "lenient" }"#).unwrap();
        let schema = default_doc_mapper.schema();
        assert_eq!(schema.num_fields(), 1);
        assert!(default_doc_mapper.default_search_field_names.is_empty());
    }

    #[test]
    fn test_dynamic_mode_schema() {
        let default_doc_mapper: DocMapper =
            serde_json::from_str(r#"{ "mode": "dynamic" }"#).unwrap();
        let schema = default_doc_mapper.schema();
        assert_eq!(schema.num_fields(), 2);
        let dynamic_field = schema.get_field(DYNAMIC_FIELD_NAME).unwrap();
        let dynamic_field_entry = schema.get_field_entry(dynamic_field);
        assert_eq!(dynamic_field_entry.field_type().value_type(), Type::Json);
        // the dynamic field will be added implicitly at search time.
        assert!(default_doc_mapper.default_search_field_names.is_empty());
    }

    #[test]
    fn test_dynamic_mode_schema_not_indexed() {
        let default_doc_mapper: DocMapper = serde_json::from_str(
            r#"{
            "mode": "dynamic",
            "dynamic_mapping": {
                "indexed": false,
                "stored": true
            }
        }"#,
        )
        .unwrap();
        let schema = default_doc_mapper.schema();
        assert_eq!(schema.num_fields(), 2);
        let dynamic_field = schema.get_field(DYNAMIC_FIELD_NAME).unwrap();
        let dynamic_field_entry = schema.get_field_entry(dynamic_field);
        let FieldType::JsonObject(json_opt) = dynamic_field_entry.field_type() else {
            panic!("Expected a json object");
        };
        assert_eq!(json_opt.is_indexed(), false);
        default_doc_mapper.default_search_field_names.is_empty();
    }

    #[test]
    fn test_strict_mode_simple() {
        let default_doc_mapper: DocMapper =
            serde_json::from_str(r#"{ "mode": "strict" }"#).unwrap();
        let parsing_err = default_doc_mapper
            .doc_from_json_str(r#"{ "a": { "b": 5, "c": 6 } }"#)
            .err()
            .unwrap();
        assert!(
            matches!(parsing_err, DocParsingError::NoSuchFieldInSchema(field_name) if field_name == "a")
        );
    }

    #[test]
    fn test_strict_mode_inner() {
        let default_doc_mapper: DocMapper = serde_json::from_str(
            r#"{
            "field_mappings": [
                {
                    "name": "some_obj",
                    "type": "object",
                    "field_mappings": [
                        {
                            "name": "child_a",
                            "type": "text"
                        }
                    ]
                }
            ],
            "mode": "strict"
        }"#,
        )
        .unwrap();
        assert!(
            default_doc_mapper
                .doc_from_json_str(r#"{ "some_obj": { "child_a": "hello" } }"#)
                .is_ok()
        );
        let parsing_err = default_doc_mapper
            .doc_from_json_str(r#"{ "some_obj": { "child_a": "hello", "child_b": 6 } }"#)
            .err()
            .unwrap();
        assert!(
            matches!(parsing_err, DocParsingError::NoSuchFieldInSchema(field_name) if field_name == "some_obj.child_b")
        );
    }

    #[test]
    fn test_lenient_mode_simple() {
        let default_doc_mapper: DocMapper =
            serde_json::from_str(r#"{ "mode": "lenient" }"#).unwrap();
        let (_, doc) = default_doc_mapper
            .doc_from_json_str(r#"{ "a": { "b": 5, "c": 6 } }"#)
            .unwrap();
        assert_eq!(doc.len(), 0);
    }

    #[track_caller]
    fn test_doc_from_json_test_aux(
        doc_mapper_json: &str,
        field: &str,
        document_json: &str,
        expected_values: Vec<TantivyValue>,
    ) {
        let default_doc_mapper: DocMapper = serde_json::from_str(doc_mapper_json).unwrap();
        let schema = default_doc_mapper.schema();
        let field = schema.get_field(field).unwrap();
        let (_, doc) = default_doc_mapper.doc_from_json_str(document_json).unwrap();

        let values: Vec<OwnedValue> = doc.get_all(field).map(|value| value.into()).collect();
        assert_eq!(values.len(), expected_values.len());

        for (value, expected_value) in zip(values, expected_values) {
            assert_eq!(value, expected_value);
        }
    }

    #[test]
    fn test_dymamic_mode_simple() {
        test_doc_from_json_test_aux(
            r#"{ "mode": "dynamic" }"#,
            DYNAMIC_FIELD_NAME,
            r#"{ "a": { "b": 5, "c": 6 } }"#,
            vec![
                json!({
                    "a": {
                        "b": 5,
                        "c": 6
                    }
                })
                .into(),
            ],
        );
    }

    #[test]
    fn test_dymamic_mode_inner() {
        test_doc_from_json_test_aux(
            r#"{
                "field_mappings": [
                    {
                        "name": "some_obj",
                        "type": "object",
                        "field_mappings": [
                            {
                                "name": "child_a",
                                "type": "text"
                            }
                        ]
                    }
                ],
                "mode": "dynamic"
            }"#,
            DYNAMIC_FIELD_NAME,
            r#"{ "some_obj": { "child_a": "", "child_b": {"c": 3} }, "some_obj2": 4 }"#,
            vec![
                json!({
                    "some_obj": {
                        "child_b": {
                            "c": 3
                        }
                    },
                    "some_obj2": 4
                })
                .into(),
            ],
        );
    }

    #[test]
    fn test_json_object_in_mapping() {
        test_doc_from_json_test_aux(
            r#"{
                "field_mappings": [
                    {
                        "name": "some_obj",
                        "type": "object",
                        "field_mappings": [
                            {
                                "name": "json_obj",
                                "type": "json"
                            }
                        ]
                    }
                ],
                "mode": "strict"
            }"#,
            "some_obj.json_obj",
            r#"{ "some_obj": { "json_obj": {"hello": 2} } }"#,
            vec![
                json!({
                    "hello": 2
                })
                .into(),
            ],
        );
    }

    #[test]
    fn test_reject_invalid_concatenate_field() {
        assert!(
            serde_json::from_str::<DocMapper>(
                r#"{
                "field_mappings": [
                    {
                        "name": "concat",
                        "type": "concatenate",
                        "concatenate_fields": ["inexistent_field"]
                    }
                ]
            }"#
            )
            .unwrap_err()
            .to_string()
            .contains("uses an unknown field")
        );
        assert!(
            serde_json::from_str::<DocMapper>(
                r#"{
                "field_mappings": [
                    {
                        "name": "concat",
                        "type": "concatenate",
                        "include_dynamic_fields": true
                    }
                ],
                "mode": "strict"
            }"#
            )
            .unwrap_err()
            .to_string()
            .contains(
                "concatenate field has `include_dynamic_fields` set, but index isn't dynamic"
            )
        );
        assert!(
            serde_json::from_str::<DocMapper>(
                r#"{
                "field_mappings": [
                    {
                        "name": "concat",
                        "type": "concatenate"
                    }
                ]
            }"#
            )
            .unwrap_err()
            .to_string()
            .contains("concatenate type must have at least one sub-field")
        );
    }

    #[test]
    fn test_concatenate_field_in_default_field() {
        serde_json::from_str::<DocMapper>(
            r#"{
                "default_search_fields": ["concat"],
                "field_mappings": [
                    {
                        "name": "some_text",
                        "type": "text"
                    },
                    {
                        "name": "concat",
                        "type": "concatenate",
                        "concatenate_fields": ["some_text"]
                    }
                ],
                "mode": "strict"
            }"#,
        )
        .unwrap();
    }

    #[test]
    fn test_concatenate_field_in_mapping() {
        test_doc_from_json_test_aux(
            r#"{
                "field_mappings": [
                    {
                        "name": "some_text",
                        "type": "text"
                    },
                    {
                        "name": "concat",
                        "type": "concatenate",
                        "concatenate_fields": ["some_text"]
                    }
                ],
                "mode": "strict"
            }"#,
            "concat",
            r#"{"some_text": "this is a text"}"#,
            vec!["this is a text".into()],
        );
    }

    #[test]
    fn test_concatenate_field_in_mapping_dynamic() {
        test_doc_from_json_test_aux(
            r#"{
                "field_mappings": [
                    {
                        "name": "concat",
                        "type": "concatenate",
                        "include_dynamic_fields": true
                    }
                ],
                "mode": "dynamic"
            }"#,
            "concat",
            r#"{"other_field": "this is a text"}"#,
            vec!["this is a text".into()],
        );
        test_doc_from_json_test_aux(
            r#"{
                "field_mappings": [
                    {
                        "name": "concat",
                        "type": "concatenate",
                        "include_dynamic_fields": true
                    }
                ],
                "mode": "dynamic"
            }"#,
            "concat",
            r#"{"first_field": "this is a text", "second_field": "this is a text field too"}"#,
            vec!["this is a text".into(), "this is a text field too".into()],
        );
    }

    #[test]
    fn test_concatenate_field_in_mapping_integer() {
        test_doc_from_json_test_aux(
            r#"{
                "field_mappings": [
                    {
                        "name": "some_int",
                        "type": "u64"
                    },
                    {
                        "name": "concat",
                        "type": "concatenate",
                        "concatenate_fields": ["some_int"]
                    }
                ],
                "mode": "strict"
            }"#,
            "concat",
            r#"{"some_int": 25}"#,
            vec![25_u64.into()],
        );
        test_doc_from_json_test_aux(
            r#"{
                "field_mappings": [
                    {
                        "name": "concat",
                        "type": "concatenate",
                        "include_dynamic_fields": true
                    }
                ],
                "mode": "dynamic"
            }"#,
            "concat",
            r#"{"some_int": 25}"#,
            // i64 comes before u64
            vec![25_i64.into()],
        );
    }

    #[test]
    fn test_concatenate_field_in_mapping_boolean() {
        test_doc_from_json_test_aux(
            r#"{
                "field_mappings": [
                    {
                        "name": "some_bool",
                        "type": "bool"
                    },
                    {
                        "name": "concat",
                        "type": "concatenate",
                        "concatenate_fields": ["some_bool"]
                    }
                ],
                "mode": "strict"
            }"#,
            "concat",
            r#"{"some_bool": false}"#,
            vec![false.into()],
        );
        test_doc_from_json_test_aux(
            r#"{
                "field_mappings": [
                    {
                        "name": "concat",
                        "type": "concatenate",
                        "include_dynamic_fields": true
                    }
                ],
                "mode": "dynamic"
            }"#,
            "concat",
            r#"{"some_bool": true}"#,
            vec![true.into()],
        );
    }

    #[test]
    fn test_concatenate_field_array() {
        test_doc_from_json_test_aux(
            r#"{
                "field_mappings": [
                    {
                        "name": "some_text",
                        "type": "array<text>"
                    },
                    {
                        "name": "concat",
                        "type": "concatenate",
                        "concatenate_fields": ["some_text"]
                    }
                ],
                "mode": "strict"
            }"#,
            "concat",
            r#"{"some_text": ["this is a text", "this is a text too"]}"#,
            vec!["this is a text".into(), "this is a text too".into()],
        );
    }

    #[test]
    fn test_concatenate_multiple_field() {
        test_doc_from_json_test_aux(
            r#"{
                "field_mappings": [
                    {
                        "name": "some_text",
                        "type": "text"
                    },
                    {
                        "name": "other_text",
                        "type": "text"
                    },
                    {
                        "name": "concat",
                        "type": "concatenate",
                        "concatenate_fields": ["some_text", "other_text"]
                    }
                ],
                "mode": "strict"
            }"#,
            "concat",
            r#"{"some_text": "this is a text", "other_text": "this is a text too"}"#,
            vec!["this is a text".into(), "this is a text too".into()],
        );
    }

    #[test]
    fn test_concatenate_field_object() {
        test_doc_from_json_test_aux(
            r#"{
                "field_mappings": [
                    {
                        "name": "some_obj",
                        "type": "object",
                        "field_mappings": [
                            {
                                "name": "json_obj",
                                "type": "json"
                            }
                        ]
                    },
                    {
                        "name": "concat",
                        "type": "concatenate",
                        "concatenate_fields": ["some_obj.json_obj"]
                    }
                ],
                "mode": "strict"
            }"#,
            "concat",
            r#"{ "some_obj": { "json_obj": {"hello": "world"} } }"#,
            vec!["world".into()],
        );
    }

    /*
     * in the future we may want to make this works. Currently it isn't supported and fail at index
     * creation
    #[test]
    fn test_concatenate_field_json_subpath() {
        test_doc_from_json_test_aux(
            r#"{
                "field_mappings": [
                    {
                        "name": "json_obj",
                        "type": "json"
                    },
                    {
                        "name": "concat",
                        "type": "concatenate",
                        "concatenate_fields": ["json_obj.hello"]
                    }
                ],
                "mode": "strict"
            }"#,
            "concat",
            r#"{ "json_obj": { "hello": "1", "world": "2"} }"#,
            vec!["1".into()],
        );
    }
    */

    #[test]
    fn test_concatenate_field_text() {
        test_doc_from_json_test_aux(
            r#"{
                "field_mappings": [
                    {
                        "name": "some_text",
                        "type": "text"
                    },
                    {
                        "name": "concat1",
                        "type": "concatenate",
                        "concatenate_fields": ["some_text"]
                    },
                    {
                        "name": "concat2",
                        "type": "concatenate",
                        "concatenate_fields": ["some_text"]
                    }
                ],
                "mode": "strict"
            }"#,
            "concat1",
            r#"{"some_text": "this is a text"}"#,
            vec!["this is a text".into()],
        );
        test_doc_from_json_test_aux(
            r#"{
                "field_mappings": [
                    {
                        "name": "some_text",
                        "type": "text"
                    },
                    {
                        "name": "concat1",
                        "type": "concatenate",
                        "concatenate_fields": ["some_text"]
                    },
                    {
                        "name": "concat2",
                        "type": "concatenate",
                        "concatenate_fields": ["some_text"]
                    }
                ],
                "mode": "strict"
            }"#,
            "concat2",
            r#"{"some_text": "this is a text"}"#,
            vec!["this is a text".into()],
        );
    }

    #[test]
    fn test_length_field() {
        let raw_doc = r#"{ "some_obj": { "json_obj": {"hello": 2} } }"#;
        test_doc_from_json_test_aux(
            r#"{
                "document_length": true,
                "mode": "dynamic"
            }"#,
            DOCUMENT_SIZE_FIELD_NAME,
            raw_doc,
            vec![(raw_doc.len() as u64).into()],
        );
    }

    fn default_doc_mapper_query_aux(doc_mapper: &DocMapper, query: &str) -> Result<String, String> {
        let query_ast = query_ast_from_user_text(query, None)
            .parse_user_query(doc_mapper.default_search_fields())
            .map_err(|err| err.to_string())?;
        let (query, _) = doc_mapper
            .query(doc_mapper.schema(), query_ast, true, None)
            .map_err(|err| err.to_string())?;
        Ok(format!("{query:?}"))
    }

    #[test]
    fn test_doc_mapper_sub_field_query_on_non_json_field_should_error() {
        let doc_mapper: DocMapper = serde_json::from_str(
            r#"{
            "field_mappings": [{"name": "body", "type": "text"}],
            "mode": "dynamic"
        }"#,
        )
        .unwrap();
        assert_eq!(
            default_doc_mapper_query_aux(&doc_mapper, "body.wrong_field:hello").unwrap_err(),
            "invalid query: field does not exist: `body.wrong_field`"
        );
    }

    #[test]
    fn test_doc_mapper_accept_sub_field_query_on_json_field() {
        let doc_mapper: DocMapper = serde_json::from_str(
            r#"{
            "field_mappings": [{"name": "body", "type": "json"}],
            "mode": "dynamic"
        }"#,
        )
        .unwrap();
        assert_eq!(
            default_doc_mapper_query_aux(&doc_mapper, "body.dynamic_field:hello"),
            Ok(
                r#"TermQuery(Term(field=2, type=Json, path=dynamic_field, type=Str, "hello"))"#
                    .to_string()
            )
        );
    }

    #[test]
    fn test_doc_mapper_object_dot_collision_with_object_field() {
        let doc_mapper: DocMapper = serde_json::from_str(
            r#"{
            "field_mappings": [
                {
                    "name": "identity",
                    "type": "object",
                    "field_mappings": [{"type": "text", "name": "username"}]
                },
                {"type": "text", "name": "identity.username"}
            ]
        }"#,
        )
        .unwrap();
        assert_eq!(
            default_doc_mapper_query_aux(&doc_mapper, "identity.username:toto").unwrap(),
            r#"TermQuery(Term(field=2, type=Str, "toto"))"#
        );
        assert_eq!(
            default_doc_mapper_query_aux(&doc_mapper, r"identity\.username:toto").unwrap(),
            r#"TermQuery(Term(field=3, type=Str, "toto"))"#
        );
    }

    #[test]
    fn test_doc_mapper_object_dot_collision_with_json_field() {
        let doc_mapper: DocMapper = serde_json::from_str(
            r#"{
            "field_mappings": [
                {"name": "identity", "type": "json"},
                {"type": "text", "name": "identity.username"}
            ]
        }"#,
        )
        .unwrap();
        assert_eq!(
            default_doc_mapper_query_aux(&doc_mapper, "identity.username:toto").unwrap(),
            r#"TermQuery(Term(field=2, type=Json, path=username, type=Str, "toto"))"#
        );
        assert_eq!(
            default_doc_mapper_query_aux(&doc_mapper, r"identity\.username:toto").unwrap(),
            r#"TermQuery(Term(field=3, type=Str, "toto"))"#
        );
    }

    #[test]
    fn test_doc_mapper_default_tokenizers() {
        let doc_mapper: DocMapper = serde_json::from_str(
            r#"{
            "field_mappings": [
                {"name": "json_field", "type": "json"},
                {"name": "text_field", "type": "text"}
            ]
        }"#,
        )
        .unwrap();
        let schema = doc_mapper.schema();

        {
            let json_field = schema.get_field("json_field").unwrap();
            let FieldType::JsonObject(json_options) =
                schema.get_field_entry(json_field).field_type()
            else {
                panic!()
            };
            let text_indexing_options = json_options.get_text_indexing_options().unwrap();
            assert_eq!(text_indexing_options.tokenizer(), RAW_TOKENIZER_NAME);
            assert_eq!(
                text_indexing_options.index_option(),
                IndexRecordOption::Basic
            );
        }

        {
            let text_field = schema.get_field("text_field").unwrap();
            let FieldType::Str(text_options) = schema.get_field_entry(text_field).field_type()
            else {
                panic!()
            };
            assert_eq!(
                text_options.get_indexing_options().unwrap().tokenizer(),
                DEFAULT_TOKENIZER_NAME
            );
        }
    }

    #[test]
    fn test_find_field_mapping_type() {
        let mapper = serde_json::from_str::<DocMapper>(
            r#"{
            "field_mappings": [
                {
                    "name": "some_obj",
                    "type": "object",
                    "field_mappings": [
                        {
                            "name": "timestamp",
                            "type": "datetime",
                            "fast": true
                        },
                        {
                            "name": "object2",
                            "type": "object",
                            "field_mappings": [
                                {
                                    "name": "id",
                                    "type": "u64"
                                },
                                {
                                    "name": "my.id",
                                    "type": "u64"
                                }
                            ]
                        }
                    ]
                },
                {
                    "name": "my.timestamp",
                    "type": "datetime",
                    "fast": true
                }
            ]
        }"#,
        )
        .unwrap();
        mapper
            .field_mappings
            .find_field_mapping_type("some_obj.timestamp")
            .unwrap();
        mapper
            .field_mappings
            .find_field_mapping_type("some_obj.object2.id")
            .unwrap();
        mapper
            .field_mappings
            .find_field_mapping_type("some_obj.object2")
            .unwrap();
        mapper
            .field_mappings
            .find_field_mapping_type("some_obj.object2.my\\.id")
            .unwrap();
        mapper
            .field_mappings
            .find_field_mapping_type("my\\.timestamp")
            .unwrap();
    }

    #[test]
    fn test_build_doc_mapper_with_custom_ngram_tokenizer() {
        let mapper = serde_json::from_str::<DocMapper>(
            r#"{
            "tokenizers": [
                {
                    "name": "my_tokenizer",
                    "filters": ["lower_caser", "ascii_folding", "remove_long"],
                    "type": "ngram",
                    "min_gram": 3,
                    "max_gram": 5
                }
            ],
            "field_mappings": [
                {
                    "name": "my_text",
                    "type": "text",
                    "tokenizer": "my_tokenizer"
                }
            ]
        }"#,
        )
        .unwrap();
        let field_mapping_type = mapper
            .field_mappings
            .find_field_mapping_type("my_text")
            .unwrap();
        match &field_mapping_type {
            super::FieldMappingType::Text(options, _) => {
                assert!(options.indexing_options.is_some());
                let tokenizer = &options.indexing_options.as_ref().unwrap().tokenizer;
                assert_eq!(tokenizer.name(), "my_tokenizer");
            }
            _ => panic!("Expected a text field"),
        }
        assert!(
            mapper
                .tokenizer_manager()
                .get_tokenizer("my_tokenizer")
                .is_some()
        );
    }

    #[test]
    fn test_build_doc_mapper_should_fail_with_unknown_tokenizer() {
        let mapper_builder = serde_json::from_str::<DocMapperBuilder>(
            r#"{
            "field_mappings": [
                {
                    "name": "my_text",
                    "type": "text",
                    "tokenizer": "my_tokenizer"
                }
            ]
        }"#,
        )
        .unwrap();
        let mapper = mapper_builder.try_build();
        let error_msg = mapper.unwrap_err().to_string();
        assert!(error_msg.contains("unknown tokenizer"));
    }

    #[test]
    fn test_build_doc_mapper_tokenizer_manager_with_custom_tokenizer() {
        let mapper = serde_json::from_str::<DocMapper>(
            r#"{
            "tokenizers": [
                {
                    "name": "my_tokenizer",
                    "filters": ["lower_caser"],
                    "type": "ngram",
                    "min_gram": 3,
                    "max_gram": 5
                }
            ],
            "field_mappings": [
                {
                    "name": "my_text",
                    "type": "text",
                    "tokenizer": "my_tokenizer"
                }
            ]
        }"#,
        )
        .unwrap();
        let mut tokenizer = mapper
            .tokenizer_manager()
            .get_tokenizer("my_tokenizer")
            .unwrap();
        let mut token_stream = tokenizer.token_stream("HELLO WORLD");
        assert_eq!(token_stream.next().unwrap().text, "hel");
        assert_eq!(token_stream.next().unwrap().text, "hell");
        assert_eq!(token_stream.next().unwrap().text, "hello");
    }

    #[test]
    fn test_build_doc_mapper_with_custom_invalid_regex_tokenizer() {
        let mapper_builder = serde_json::from_str::<DocMapperBuilder>(
            r#"{
            "tokenizers": [
                {
                    "name": "my_tokenizer",
                    "type": "regex",
                    "pattern": "(my_pattern"
                }
            ],
            "field_mappings": [
                {
                    "name": "my_text",
                    "type": "text",
                    "tokenizer": "my_tokenizer"
                }
            ]
        }"#,
        )
        .unwrap();
        let mapper = mapper_builder.try_build();
        assert!(mapper.is_err());
        let error_mesg = mapper.unwrap_err().to_string();
        assert!(error_mesg.contains("invalid regex tokenizer"));
    }

    #[test]
    fn test_doc_mapper_with_custom_tokenizer_equivalent_to_default() {
        let mapper = serde_json::from_str::<DocMapper>(
            r#"{
            "tokenizers": [
                {
                    "name": "my_tokenizer",
                    "filters": ["remove_long", "lower_caser"],
                    "type": "simple",
                    "min_gram": 3,
                    "max_gram": 5
                }
            ],
            "field_mappings": [
                {
                    "name": "my_text",
                    "type": "text",
                    "tokenizer": "my_tokenizer"
                }
            ]
        }"#,
        )
        .unwrap();
        let mut default_tokenizer = mapper.tokenizer_manager().get_tokenizer("default").unwrap();
        let mut tokenizer = mapper
            .tokenizer_manager()
            .get_tokenizer("my_tokenizer")
            .unwrap();
        let text = "I've seen things... seen things you little people wouldn't believe.";
        let mut default_token_stream = default_tokenizer.token_stream(text);
        let mut token_stream = tokenizer.token_stream(text);
        for _ in 0..10 {
            assert_eq!(
                default_token_stream.next().unwrap().text,
                token_stream.next().unwrap().text
            );
        }
    }

    #[test]
    fn test_deserialize_doc_after_mapping_change_json_to_obj() {
        use serde::Deserialize;
        use tantivy::Document;

        let old_mapper = json!({
            "field_mappings": [
                {"name": "body", "type": "json"}
            ]
        });

        let builder = DocMapperBuilder::deserialize(old_mapper.clone()).unwrap();
        let old_mapper = builder.try_build().unwrap();

        let JsonValue::Object(doc) = json!({
            "body": {
                "field.1": "hola",
                "field2": {
                    "key": "val",
                    "arr": [1,"abc", {"k": "v"}],
                },
                "field3": ["a", "b"]
            }
        }) else {
            panic!();
        };
        let tantivy_doc = old_mapper.doc_from_json_obj(doc.clone(), 0).unwrap().1;
        let named_doc = tantivy_doc.to_named_doc(&old_mapper.schema());

        let new_mapper = json!({
            "field_mappings": [
                {
                    "name": "body",
                    "type": "object",
                    "field_mappings": [
                        {"name": "field.1", "type": "text"},
                        {"name": "field2", "type": "json"},
                        {"name": "field3", "type": "array<text>"},
                    ]
                }
            ]
        });
        let builder = DocMapperBuilder::deserialize(new_mapper).unwrap();
        let new_mapper = builder.try_build().unwrap();

        assert_eq!(new_mapper.doc_to_json(named_doc.0).unwrap(), doc);
    }

    #[test]
    fn test_deserialize_doc_after_mapping_change_obj_to_json() {
        use serde::Deserialize;
        use tantivy::Document;

        let old_mapper = json!({
            "field_mappings": [
                {
                    "name": "body",
                    "type": "object",
                    "field_mappings": [
                        {"name": "field.1", "type": "text"},
                        {"name": "field2", "type": "json"},
                        {"name": "field3", "type": "array<text>"},
                    ]
                }
            ]
        });

        let builder = DocMapperBuilder::deserialize(old_mapper.clone()).unwrap();
        let old_mapper = builder.try_build().unwrap();

        let JsonValue::Object(doc) = json!({
            "body": {
                "field.1": "hola",
                "field2": {
                    "key": "val",
                    "arr": [1,"abc", {"k": "v"}],
                },
                "field3": ["a", "b"]
            }
        }) else {
            panic!();
        };
        let tantivy_doc = old_mapper.doc_from_json_obj(doc.clone(), 0).unwrap().1;
        let named_doc = tantivy_doc.to_named_doc(&old_mapper.schema());

        let new_mapper = json!({
            "field_mappings": [
                {"name": "body", "type": "json"}
            ]
        });
        let builder = DocMapperBuilder::deserialize(new_mapper).unwrap();
        let new_mapper = builder.try_build().unwrap();

        assert_eq!(new_mapper.doc_to_json(named_doc.0).unwrap(), doc);
    }
}


================================================
FILE: quickwit/quickwit-doc-mapper/src/doc_mapper/field_mapping_entry.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::borrow::Cow;
use std::convert::TryFrom;

use anyhow::bail;
use base64::prelude::{BASE64_STANDARD, Engine};
use once_cell::sync::Lazy;
use quickwit_common::true_fn;
use regex::Regex;
use serde::{Deserialize, Serialize};
use serde_json::Value as JsonValue;
use tantivy::schema::{
    IndexRecordOption, JsonObjectOptions, OwnedValue as TantivyValue, TextFieldIndexing,
    TextOptions, Type,
};

use super::FieldMappingType;
use super::date_time_type::QuickwitDateTimeOptions;
use crate::doc_mapper::field_mapping_type::QuickwitFieldType;
use crate::{Cardinality, QW_RESERVED_FIELD_NAMES};

#[derive(Serialize, Deserialize, Default, Clone, Debug, PartialEq)]
pub struct QuickwitObjectOptions {
    pub field_mappings: Vec<FieldMappingEntry>,
}

/// A `FieldMappingEntry` defines how a field is indexed, stored,
/// and mapped from a JSON document to the related index fields.
#[derive(Clone, Debug, PartialEq, Serialize, Deserialize)]
#[serde(
    try_from = "FieldMappingEntryForSerialization",
    into = "FieldMappingEntryForSerialization"
)]
pub struct FieldMappingEntry {
    /// Field name in the index schema.
    pub name: String,
    /// Property parameters which define the type and the way the value must be indexed.
    pub mapping_type: FieldMappingType,
}

// Struct used for serialization and deserialization
// Main advantage: having a flat structure and gain flexibility
// if we want to add some syntactic sugar in the mapping.
// Main drawback: we have a bunch of mixed parameters in it but
// seems to be reasonable.
//
// We do not rely on enum with inline tagging and flatten because
// - serde does not support it in combination with `deny_unknown_field`
// - it is clumsy to handle `array<type>` keys.

// Docs bellow used for OpenAPI generation:
/// A `FieldMappingEntry` defines how a field is indexed, stored,
/// and mapped from a JSON document to the related index fields.
///
/// Property parameters which defines the way the value must be indexed.
///
/// Properties are determined by the specified type, for more information
/// please see: <https://quickwit.io/docs/configuration/index-config#field-types>
#[derive(Clone, Serialize, Deserialize, Debug, utoipa::ToSchema)]
pub(crate) struct FieldMappingEntryForSerialization {
    /// Field name in the index schema.
    name: String,
    #[serde(rename = "type")]
    type_id: String,
    #[serde(flatten)]
    #[schema(value_type = HashMap<String, Object>)]
    pub field_mapping_json: serde_json::Map<String, JsonValue>,
}

#[derive(Clone, Serialize, Deserialize, Debug, PartialEq, utoipa::ToSchema)]
#[serde(deny_unknown_fields)]
pub struct QuickwitNumericOptions {
    #[serde(default)]
    #[serde(skip_serializing_if = "Option::is_none")]
    pub description: Option<String>,
    #[serde(default = "true_fn")]
    pub stored: bool,
    #[serde(default = "true_fn")]
    pub indexed: bool,
    #[serde(default)]
    pub fast: bool,
    #[serde(default = "true_fn")]
    pub coerce: bool,
    #[serde(default)]
    pub output_format: NumericOutputFormat,
}

impl Default for QuickwitNumericOptions {
    fn default() -> Self {
        Self {
            description: None,
            indexed: true,
            stored: true,
            fast: false,
            coerce: true,
            output_format: NumericOutputFormat::default(),
        }
    }
}

#[derive(Clone, Serialize, Deserialize, Debug, PartialEq, utoipa::ToSchema)]
#[serde(deny_unknown_fields)]
pub struct QuickwitBoolOptions {
    #[serde(default)]
    #[serde(skip_serializing_if = "Option::is_none")]
    pub description: Option<String>,
    #[serde(default = "true_fn")]
    pub stored: bool,
    #[serde(default = "true_fn")]
    pub indexed: bool,
    #[serde(default)]
    pub fast: bool,
}

impl Default for QuickwitBoolOptions {
    fn default() -> Self {
        Self {
            description: None,
            indexed: true,
            stored: true,
            fast: false,
        }
    }
}

/// Options associated to a bytes field.
#[derive(Clone, Serialize, Deserialize, Debug, PartialEq, utoipa::ToSchema)]
#[serde(deny_unknown_fields)]
pub struct QuickwitBytesOptions {
    /// Optional description of the bytes field.
    #[serde(default)]
    #[serde(skip_serializing_if = "Option::is_none")]
    pub description: Option<String>,
    /// If true, the field will be stored in the doc store.
    #[serde(default = "true_fn")]
    pub stored: bool,
    /// If true, the field will be indexed.
    #[serde(default = "true_fn")]
    pub indexed: bool,
    /// If true, the field will be stored in columnar format.
    #[serde(default)]
    pub fast: bool,
    /// Input format of the bytes field.
    #[serde(default)]
    pub input_format: BinaryFormat,
    /// Output format of the bytes field.
    #[serde(default)]
    pub output_format: BinaryFormat,
}

impl Default for QuickwitBytesOptions {
    fn default() -> Self {
        Self {
            description: None,
            indexed: true,
            stored: true,
            fast: false,
            input_format: BinaryFormat::default(),
            output_format: BinaryFormat::default(),
        }
    }
}

/// Available binary formats.
#[derive(Clone, Copy, Debug, Eq, PartialEq, Hash, Default, Serialize, Deserialize)]
#[serde(rename_all = "snake_case")]
pub enum BinaryFormat {
    /// Base64 format.
    #[default]
    Base64,
    /// Hexadecimal format.
    Hex,
}

impl BinaryFormat {
    /// Returns the string representation of the format.
    pub fn as_str(&self) -> &str {
        match self {
            Self::Base64 => "base64",
            Self::Hex => "hex",
        }
    }

    /// Returns representation of the format in `serde_json::Value`.
    pub fn format_to_json(&self, value: &[u8]) -> JsonValue {
        match self {
            Self::Base64 => BASE64_STANDARD.encode(value).into(),
            Self::Hex => hex::encode(value).into(),
        }
    }

    /// Parses the `serde_json::Value` into `tantivy::schema::Value`.
    pub fn parse_str(&self, byte_str: &str) -> Result<Vec<u8>, String> {
        let payload = match self {
            Self::Base64 => BASE64_STANDARD
                .decode(byte_str)
                .map_err(|base64_decode_err| {
                    format!("expected base64 string, got `{byte_str}`: {base64_decode_err}")
                })?,
            Self::Hex => hex::decode(byte_str).map_err(|hex_decode_err| {
                format!("expected hex string, got `{byte_str}`: {hex_decode_err}")
            })?,
        };
        Ok(payload)
    }

    /// Parses the `serde_json::Value` into `tantivy::schema::Value`.
    pub fn parse_json(&self, json_val: &JsonValue) -> Result<TantivyValue, String> {
        let byte_str = if let JsonValue::String(byte_str) = json_val {
            byte_str
        } else {
            return Err(format!(
                "expected {} string, got `{json_val}`",
                self.as_str()
            ));
        };
        let payload = self.parse_str(byte_str)?;
        Ok(TantivyValue::Bytes(payload))
    }
}

#[derive(Clone, Copy, Debug, Eq, PartialEq, Hash, Default, Serialize, Deserialize)]
#[serde(rename_all = "snake_case")]
pub enum NumericOutputFormat {
    #[default]
    Number,
    String,
}

#[derive(Clone, Debug, Serialize, Deserialize, PartialEq, utoipa::ToSchema)]
#[serde(deny_unknown_fields)]
pub struct QuickwitIpAddrOptions {
    #[serde(default)]
    #[serde(skip_serializing_if = "Option::is_none")]
    pub description: Option<String>,
    #[serde(default = "true_fn")]
    pub stored: bool,
    #[serde(default = "true_fn")]
    pub indexed: bool,
    #[serde(default)]
    pub fast: bool,
}

impl Default for QuickwitIpAddrOptions {
    fn default() -> Self {
        Self {
            description: None,
            indexed: true,
            stored: true,
            fast: false,
        }
    }
}

#[derive(Clone, PartialEq, Debug, Eq, Serialize, Deserialize, utoipa::ToSchema)]
pub struct QuickwitTextTokenizer(Cow<'static, str>);

pub(crate) const DEFAULT_TOKENIZER_NAME: &str = "default";

pub(crate) const RAW_TOKENIZER_NAME: &str = "raw";

impl Default for QuickwitTextTokenizer {
    fn default() -> Self {
        Self::from_static(DEFAULT_TOKENIZER_NAME)
    }
}

impl QuickwitTextTokenizer {
    pub const fn from_static(name: &'static str) -> Self {
        Self(Cow::Borrowed(name))
    }
    pub(crate) fn name(&self) -> &str {
        &self.0
    }
    pub fn raw() -> Self {
        Self::from_static(RAW_TOKENIZER_NAME)
    }
}

#[derive(Clone, Debug, Eq, PartialEq, Serialize, Deserialize, utoipa::ToSchema)]
#[serde(rename_all = "snake_case")]
pub enum QuickwitTextNormalizer {
    Raw,
    Lowercase,
}

impl QuickwitTextNormalizer {
    pub fn get_name(&self) -> &str {
        match self {
            QuickwitTextNormalizer::Raw => "raw",
            QuickwitTextNormalizer::Lowercase => "lowercase",
        }
    }
}

#[derive(Clone, PartialEq, Debug)]
pub struct TextIndexingOptions {
    pub tokenizer: QuickwitTextTokenizer,
    pub record: IndexRecordOption,
    pub fieldnorms: bool,
}

impl TextIndexingOptions {
    fn from_parts_text(
        indexed: bool,
        tokenizer: Option<QuickwitTextTokenizer>,
        record: Option<IndexRecordOption>,
        fieldnorms: bool,
    ) -> anyhow::Result<Option<Self>> {
        if indexed {
            Ok(Some(TextIndexingOptions {
                tokenizer: tokenizer.unwrap_or_default(),
                record: record.unwrap_or(IndexRecordOption::Basic),
                fieldnorms,
            }))
        } else {
            if tokenizer.is_some() || record.is_some() || fieldnorms {
                bail!(
                    "`record`, `tokenizer`, and `fieldnorms` parameters are allowed only if \
                     indexed is true"
                )
            }
            Ok(None)
        }
    }

    fn from_parts_json(
        indexed: bool,
        tokenizer: Option<QuickwitTextTokenizer>,
        record: Option<IndexRecordOption>,
    ) -> anyhow::Result<Option<Self>> {
        if indexed {
            Ok(Some(TextIndexingOptions {
                tokenizer: tokenizer.unwrap_or_else(QuickwitTextTokenizer::raw),
                record: record.unwrap_or(IndexRecordOption::Basic),
                fieldnorms: false,
            }))
        } else {
            if tokenizer.is_some() || record.is_some() {
                bail!("`record` and `tokenizer` parameters are allowed only if indexed is true")
            }
            Ok(None)
        }
    }

    fn from_parts_concatenate(
        tokenizer: Option<QuickwitTextTokenizer>,
        record: Option<IndexRecordOption>,
    ) -> anyhow::Result<Self> {
        let text_index_options_opt = Self::from_parts_text(true, tokenizer, record, false)?;
        let text_index_options = text_index_options_opt.expect("concatenate field must be indexed");
        Ok(text_index_options)
    }

    fn to_parts_text(
        this: Option<Self>,
    ) -> (
        bool, // indexed
        Option<QuickwitTextTokenizer>,
        Option<IndexRecordOption>,
        bool, // fieldnorms
    ) {
        match this {
            Some(this) => (
                true,
                Some(this.tokenizer),
                Some(this.record),
                this.fieldnorms,
            ),
            None => (false, None, None, false),
        }
    }

    fn to_parts_json(
        this: Option<Self>,
    ) -> (
        bool, // indexed
        Option<QuickwitTextTokenizer>,
        Option<IndexRecordOption>,
    ) {
        let (indexed, tokenizer, record, _fieldorm) = TextIndexingOptions::to_parts_text(this);
        (indexed, tokenizer, record)
    }

    fn to_parts_concatenate(
        this: Self,
    ) -> (Option<QuickwitTextTokenizer>, Option<IndexRecordOption>) {
        let (_indexed, tokenizer, record, _fieldorm) =
            TextIndexingOptions::to_parts_text(Some(this));
        (tokenizer, record)
    }

    fn default_json() -> Self {
        TextIndexingOptions {
            tokenizer: QuickwitTextTokenizer::raw(),
            record: IndexRecordOption::Basic,
            fieldnorms: false,
        }
    }
}

impl Default for TextIndexingOptions {
    fn default() -> Self {
        TextIndexingOptions {
            tokenizer: QuickwitTextTokenizer::default(),
            record: IndexRecordOption::Basic,
            fieldnorms: false,
        }
    }
}

#[quickwit_macros::serde_multikey]
#[derive(Clone, PartialEq, Serialize, Deserialize, Debug, utoipa::ToSchema)]
#[serde(deny_unknown_fields)]
pub struct QuickwitTextOptions {
    #[schema(value_type = String)]
    #[serde(default)]
    #[serde(skip_serializing_if = "Option::is_none")]
    pub description: Option<String>,
    #[serde_multikey(
        deserializer = TextIndexingOptions::from_parts_text,
        serializer = TextIndexingOptions::to_parts_text,
        fields = (
            #[serde(default = "true_fn")]
            pub indexed: bool,
            #[serde(default)]
            #[serde(skip_serializing_if = "Option::is_none")]
            pub tokenizer: Option<QuickwitTextTokenizer>,
            #[schema(value_type = IndexRecordOptionSchema)]
            #[serde(default)]
            #[serde(skip_serializing_if = "Option::is_none")]
            pub record: Option<IndexRecordOption>,
            #[serde(default)]
            pub fieldnorms: bool,
        ),
    )]
    pub indexing_options: Option<TextIndexingOptions>,
    #[serde(default = "true_fn")]
    pub stored: bool,
    #[serde(default)]
    pub fast: FastFieldOptions,
}

#[derive(Default, Clone, Debug, PartialEq, Serialize, Deserialize, utoipa::ToSchema)]
#[serde(
    into = "FastFieldOptionsForSerialization",
    from = "FastFieldOptionsForSerialization"
)]
pub enum FastFieldOptions {
    #[default]
    Disabled,
    EnabledWithNormalizer {
        normalizer: QuickwitTextNormalizer,
    },
}

impl FastFieldOptions {
    pub fn default_enabled() -> Self {
        FastFieldOptions::EnabledWithNormalizer {
            normalizer: QuickwitTextNormalizer::Raw,
        }
    }
}

#[derive(Serialize, Deserialize)]
#[serde(untagged)]
enum FastFieldOptionsForSerialization {
    IsEnabled(bool),
    EnabledWithNormalizer { normalizer: QuickwitTextNormalizer },
}

impl From<FastFieldOptionsForSerialization> for FastFieldOptions {
    fn from(fast_field_options: FastFieldOptionsForSerialization) -> Self {
        match fast_field_options {
            FastFieldOptionsForSerialization::IsEnabled(is_enabled) => {
                if is_enabled {
                    FastFieldOptions::default_enabled()
                } else {
                    FastFieldOptions::Disabled
                }
            }
            FastFieldOptionsForSerialization::EnabledWithNormalizer { normalizer } => {
                FastFieldOptions::EnabledWithNormalizer { normalizer }
            }
        }
    }
}

impl From<FastFieldOptions> for FastFieldOptionsForSerialization {
    fn from(fast_field_options: FastFieldOptions) -> Self {
        match fast_field_options {
            FastFieldOptions::Disabled => FastFieldOptionsForSerialization::IsEnabled(false),
            FastFieldOptions::EnabledWithNormalizer { normalizer } => {
                FastFieldOptionsForSerialization::EnabledWithNormalizer { normalizer }
            }
        }
    }
}

impl Default for QuickwitTextOptions {
    fn default() -> Self {
        Self {
            description: None,
            indexing_options: Some(TextIndexingOptions::default()),
            stored: true,
            fast: FastFieldOptions::default(),
        }
    }
}

impl From<QuickwitTextOptions> for TextOptions {
    fn from(quickwit_text_options: QuickwitTextOptions) -> Self {
        let mut text_options = TextOptions::default();
        if quickwit_text_options.stored {
            text_options = text_options.set_stored();
        }
        match &quickwit_text_options.fast {
            FastFieldOptions::EnabledWithNormalizer { normalizer } => {
                text_options = text_options.set_fast(Some(normalizer.get_name()));
            }
            FastFieldOptions::Disabled => {}
        }
        if let Some(indexing_options) = quickwit_text_options.indexing_options {
            let text_field_indexing = TextFieldIndexing::default()
                .set_index_option(indexing_options.record)
                .set_fieldnorms(indexing_options.fieldnorms)
                .set_tokenizer(indexing_options.tokenizer.name());

            text_options = text_options.set_indexing_options(text_field_indexing);
        }
        text_options
    }
}

#[allow(unused)]
#[derive(utoipa::ToSchema)]
pub enum IndexRecordOptionSchema {
    /// records only the `DocId`s
    #[schema(rename = "basic")]
    Basic,
    /// records the document ids as well as the term frequency.
    /// The term frequency can help giving better scoring of the documents.
    #[schema(rename = "freq")]
    WithFreqs,
    /// records the document id, the term frequency and the positions of
    /// the occurrences in the document.
    #[schema(rename = "position")]
    WithFreqsAndPositions,
}

/// Options associated to a json field.
///
/// `QuickwitJsonOptions` is also used to configure
/// the dynamic mapping.
#[quickwit_macros::serde_multikey]
#[derive(Clone, Debug, PartialEq, Serialize, Deserialize, utoipa::ToSchema)]
#[serde(deny_unknown_fields)]
pub struct QuickwitJsonOptions {
    /// Optional description of JSON object.
    #[serde(default)]
    #[serde(skip_serializing_if = "Option::is_none")]
    pub description: Option<String>,
    #[serde_multikey(
        deserializer = TextIndexingOptions::from_parts_json,
        serializer = TextIndexingOptions::to_parts_json,
        fields = (
            /// If true, all of the element in the json object will be indexed.
            #[serde(default = "true_fn")]
            pub indexed: bool,
            /// Sets the tokenize that should be used with the text fields in the
            /// json object.
            #[serde(default)]
            #[serde(skip_serializing_if = "Option::is_none")]
            pub tokenizer: Option<QuickwitTextTokenizer>,
            /// Sets how much information should be added in the index
            /// with each token.
            ///
            /// Setting `record` is only allowed if indexed == true.
            #[schema(value_type = IndexRecordOptionSchema)]
            #[serde(default)]
            #[serde(skip_serializing_if = "Option::is_none")]
            pub record: Option<IndexRecordOption>,
        ),
    )]
    /// Options for indexing text in a Json field.
    pub indexing_options: Option<TextIndexingOptions>,
    /// If true, the field will be stored in the doc store.
    #[serde(default = "true_fn")]
    pub stored: bool,
    /// If true, the '.' in json keys will be expanded.
    #[serde(default = "true_fn")]
    pub expand_dots: bool,
    /// If true, the json object will be stored in columnar format.
    #[serde(default)]
    pub fast: FastFieldOptions,
}

impl QuickwitJsonOptions {
    /// Build a default QuickwitJsonOptions for dynamic fields.
    pub fn default_dynamic() -> Self {
        QuickwitJsonOptions {
            fast: FastFieldOptions::default_enabled(),
            ..Default::default()
        }
    }
}

impl Default for QuickwitJsonOptions {
    fn default() -> Self {
        QuickwitJsonOptions {
            description: None,
            indexing_options: Some(TextIndexingOptions::default_json()),
            stored: true,
            expand_dots: true,
            fast: FastFieldOptions::default(),
        }
    }
}

impl From<QuickwitJsonOptions> for JsonObjectOptions {
    fn from(quickwit_json_options: QuickwitJsonOptions) -> Self {
        let mut json_options = JsonObjectOptions::default();
        if quickwit_json_options.stored {
            json_options = json_options.set_stored();
        }
        if let Some(indexing_options) = quickwit_json_options.indexing_options {
            let text_field_indexing = TextFieldIndexing::default()
                .set_tokenizer(indexing_options.tokenizer.name())
                .set_index_option(indexing_options.record);
            json_options = json_options.set_indexing_options(text_field_indexing);
        }
        if quickwit_json_options.expand_dots {
            json_options = json_options.set_expand_dots_enabled();
        }
        match &quickwit_json_options.fast {
            FastFieldOptions::EnabledWithNormalizer { normalizer } => {
                json_options = json_options.set_fast(Some(normalizer.get_name()));
            }
            FastFieldOptions::Disabled => {}
        }
        json_options
    }
}

/// Options associated to a concatenate field.
#[quickwit_macros::serde_multikey]
#[derive(Clone, Debug, PartialEq, Serialize, Deserialize, utoipa::ToSchema)]
#[serde(deny_unknown_fields)]
pub struct QuickwitConcatenateOptions {
    /// Optional description of JSON object.
    #[serde(default)]
    #[serde(skip_serializing_if = "Option::is_none")]
    pub description: Option<String>,
    /// Fields to concatenate
    #[serde(default)]
    pub concatenate_fields: Vec<String>,
    #[serde(default)]
    pub include_dynamic_fields: bool,
    #[serde_multikey(
        deserializer = TextIndexingOptions::from_parts_concatenate,
        serializer = TextIndexingOptions::to_parts_concatenate,
        fields = (
            /// Sets the tokenize that should be used with the text fields in the
            /// concatenate field.
            #[serde(default)]
            #[serde(skip_serializing_if = "Option::is_none")]
            pub tokenizer: Option<QuickwitTextTokenizer>,
            /// Sets how much information should be added in the index
            /// with each token.
            #[schema(value_type = IndexRecordOptionSchema)]
            #[serde(default)]
            #[serde(skip_serializing_if = "Option::is_none")]
            pub record: Option<IndexRecordOption>,
        ),
    )]
    /// Options for indexing text in a concatenate field.
    pub indexing_options: TextIndexingOptions,
}

impl Default for QuickwitConcatenateOptions {
    fn default() -> Self {
        QuickwitConcatenateOptions {
            description: None,
            concatenate_fields: Vec::new(),
            include_dynamic_fields: false,
            indexing_options: TextIndexingOptions {
                tokenizer: QuickwitTextTokenizer::default(),
                record: IndexRecordOption::Basic,
                fieldnorms: false,
            },
        }
    }
}

impl From<QuickwitConcatenateOptions> for JsonObjectOptions {
    fn from(quickwit_text_options: QuickwitConcatenateOptions) -> Self {
        let mut text_options = JsonObjectOptions::default();
        let text_field_indexing = TextFieldIndexing::default()
            .set_index_option(quickwit_text_options.indexing_options.record)
            .set_fieldnorms(quickwit_text_options.indexing_options.fieldnorms)
            .set_tokenizer(quickwit_text_options.indexing_options.tokenizer.name());

        text_options = text_options.set_indexing_options(text_field_indexing);
        text_options
    }
}

fn deserialize_mapping_type(
    quickwit_field_type: QuickwitFieldType,
    json: JsonValue,
) -> anyhow::Result<FieldMappingType> {
    let (typ, cardinality) = match quickwit_field_type {
        QuickwitFieldType::Simple(typ) => (typ, Cardinality::SingleValued),
        QuickwitFieldType::Array(typ) => (typ, Cardinality::MultiValued),
        QuickwitFieldType::Object => {
            let object_options: QuickwitObjectOptions = serde_json::from_value(json)?;
            if object_options.field_mappings.is_empty() {
                anyhow::bail!("object type must have at least one field mapping");
            }
            return Ok(FieldMappingType::Object(object_options));
        }
        QuickwitFieldType::Concatenate => {
            let concatenate_options: QuickwitConcatenateOptions = serde_json::from_value(json)?;
            if concatenate_options.concatenate_fields.is_empty()
                && !concatenate_options.include_dynamic_fields
            {
                anyhow::bail!("concatenate type must have at least one sub-field");
            }
            return Ok(FieldMappingType::Concatenate(concatenate_options));
        }
    };
    match typ {
        Type::Str => {
            let text_options: QuickwitTextOptions = serde_json::from_value(json)?;
            Ok(FieldMappingType::Text(text_options, cardinality))
        }
        Type::U64 => {
            let numeric_options: QuickwitNumericOptions = serde_json::from_value(json)?;
            Ok(FieldMappingType::U64(numeric_options, cardinality))
        }
        Type::I64 => {
            let numeric_options: QuickwitNumericOptions = serde_json::from_value(json)?;
            Ok(FieldMappingType::I64(numeric_options, cardinality))
        }
        Type::F64 => {
            let numeric_options: QuickwitNumericOptions = serde_json::from_value(json)?;
            Ok(FieldMappingType::F64(numeric_options, cardinality))
        }
        Type::Bool => {
            let bool_options: QuickwitBoolOptions = serde_json::from_value(json)?;
            Ok(FieldMappingType::Bool(bool_options, cardinality))
        }
        Type::IpAddr => {
            let ip_addr_options: QuickwitIpAddrOptions = serde_json::from_value(json)?;
            Ok(FieldMappingType::IpAddr(ip_addr_options, cardinality))
        }
        Type::Date => {
            let date_time_options = serde_json::from_value::<QuickwitDateTimeOptions>(json)?;
            Ok(FieldMappingType::DateTime(date_time_options, cardinality))
        }
        Type::Facet => unimplemented!("Facet are not supported in quickwit yet."),
        Type::Bytes => {
            let numeric_options: QuickwitBytesOptions = serde_json::from_value(json)?;
            if numeric_options.fast && cardinality == Cardinality::MultiValued {
                bail!("fast field is not allowed for array<bytes>");
            }
            Ok(FieldMappingType::Bytes(numeric_options, cardinality))
        }
        Type::Json => {
            let json_options: QuickwitJsonOptions = serde_json::from_value(json)?;
            Ok(FieldMappingType::Json(json_options, cardinality))
        }
    }
}

impl TryFrom<FieldMappingEntryForSerialization> for FieldMappingEntry {
    type Error = String;

    fn try_from(value: FieldMappingEntryForSerialization) -> Result<Self, String> {
        validate_field_mapping_name(&value.name).map_err(|err| err.to_string())?;
        let quickwit_field_type =
            QuickwitFieldType::parse_type_id(&value.type_id).ok_or_else(|| {
                format!(
                    "field `{}` has an unknown type: `{}`",
                    &value.name, &value.type_id
                )
            })?;
        let mapping_type = deserialize_mapping_type(
            quickwit_field_type,
            JsonValue::Object(value.field_mapping_json),
        )
        .map_err(|err| format!("error while parsing field `{}`: {}", value.name, err))?;
        Ok(FieldMappingEntry {
            name: value.name,
            mapping_type,
        })
    }
}

/// Serialize object into a `Map` of json values.
fn serialize_to_map<S: Serialize>(val: &S) -> Option<serde_json::Map<String, JsonValue>> {
    let json_val = serde_json::to_value(val).ok()?;
    if let JsonValue::Object(map) = json_val {
        Some(map)
    } else {
        None
    }
}

fn typed_mapping_to_json_params(
    field_mapping_type: FieldMappingType,
) -> serde_json::Map<String, JsonValue> {
    match field_mapping_type {
        FieldMappingType::Text(text_options, _) => serialize_to_map(&text_options),
        FieldMappingType::U64(options, _)
        | FieldMappingType::I64(options, _)
        | FieldMappingType::F64(options, _) => serialize_to_map(&options),
        FieldMappingType::Bool(options, _) => serialize_to_map(&options),
        FieldMappingType::Bytes(options, _) => serialize_to_map(&options),
        FieldMappingType::IpAddr(options, _) => serialize_to_map(&options),
        FieldMappingType::DateTime(date_time_options, _) => serialize_to_map(&date_time_options),
        FieldMappingType::Json(json_options, _) => serialize_to_map(&json_options),
        FieldMappingType::Object(object_options) => serialize_to_map(&object_options),
        FieldMappingType::Concatenate(concatenate_options) => {
            serialize_to_map(&concatenate_options)
        }
    }
    .unwrap()
}

impl From<FieldMappingEntry> for FieldMappingEntryForSerialization {
    fn from(field_mapping_entry: FieldMappingEntry) -> FieldMappingEntryForSerialization {
        let type_id = field_mapping_entry
            .mapping_type
            .quickwit_field_type()
            .to_type_id();
        let field_mapping_json = typed_mapping_to_json_params(field_mapping_entry.mapping_type);
        FieldMappingEntryForSerialization {
            name: field_mapping_entry.name,
            type_id,
            field_mapping_json,
        }
    }
}

/// Regular expression validating a field mapping name.
pub const FIELD_MAPPING_NAME_PATTERN: &str = r"^[@$_\-a-zA-Z][@$_/\.\-a-zA-Z0-9]{0,254}$";

/// Validates a field mapping name.
/// Returns `Ok(())` if the name can be used for a field mapping.
///
/// A field mapping name:
/// - can only contain uppercase and lowercase ASCII letters `[a-zA-Z]`, digits `[0-9]`, `.`,
///   hyphens `-`, underscores `_`, at `@` and dollar `$` signs;
/// - must not start with a dot or a digit;
/// - must be different from Quickwit's reserved field mapping names `_source`, `_dynamic`,
///   `_field_presence`;
/// - must not be longer than 255 characters.
pub fn validate_field_mapping_name(field_mapping_name: &str) -> anyhow::Result<()> {
    static FIELD_MAPPING_NAME_PTN: Lazy<Regex> =
        Lazy::new(|| Regex::new(FIELD_MAPPING_NAME_PATTERN).unwrap());

    if QW_RESERVED_FIELD_NAMES.contains(&field_mapping_name) {
        bail!(
            "field name `{field_mapping_name}` is reserved. the following fields are reserved for \
             Quickwit internal usage: {}",
            QW_RESERVED_FIELD_NAMES.join(", "),
        );
    }
    if FIELD_MAPPING_NAME_PTN.is_match(field_mapping_name) {
        return Ok(());
    }
    if field_mapping_name.is_empty() {
        bail!("field name is empty");
    }
    if field_mapping_name.starts_with('.') {
        bail!(
            "field name `{}` must not start with a dot `.`",
            field_mapping_name
        );
    }
    if field_mapping_name.len() > 255 {
        bail!(
            "field name `{}` is too long. field names must not be longer than 255 characters",
            field_mapping_name
        )
    }
    let first_char = field_mapping_name.chars().next().unwrap();
    if !first_char.is_ascii_alphabetic() {
        bail!(
            "field name `{}` is invalid. field names must start with an uppercase or lowercase \
             ASCII letter, or an underscore `_`",
            field_mapping_name
        )
    }
    bail!(
        "field name `{}` contains illegal characters. field names must only contain uppercase and \
         lowercase ASCII letters, digits, hyphens `-`, periods `.`, and underscores `_`",
        field_mapping_name
    );
}

#[cfg(test)]
mod tests {
    use anyhow::bail;
    use matches::matches;
    use serde_json::json;
    use tantivy::schema::{IndexRecordOption, JsonObjectOptions, TextOptions};

    use super::*;
    use crate::Cardinality;
    use crate::doc_mapper::{FastFieldOptions, FieldMappingType};

    #[test]
    fn test_validate_field_mapping_name() {
        assert!(
            validate_field_mapping_name("")
                .unwrap_err()
                .to_string()
                .contains("is empty")
        );
        assert!(
            validate_field_mapping_name(&"a".repeat(256))
                .unwrap_err()
                .to_string()
                .contains("is too long")
        );
        assert!(
            validate_field_mapping_name("0")
                .unwrap_err()
                .to_string()
                .contains("must start with")
        );
        assert!(
            validate_field_mapping_name(".my-field")
                .unwrap_err()
                .to_string()
                .contains("must not start with")
        );
        assert!(
            validate_field_mapping_name("_source")
                .unwrap_err()
                .to_string()
                .contains("are reserved for Quickwit")
        );
        assert!(
            validate_field_mapping_name("_dynamic")
                .unwrap_err()
                .to_string()
                .contains("are reserved for Quickwit")
        );
        assert!(
            validate_field_mapping_name("my-field!")
                .unwrap_err()
                .to_string()
                .contains("illegal characters")
        );
        assert!(validate_field_mapping_name("_my_field").is_ok());
        assert!(validate_field_mapping_name("-my-field").is_ok());
        assert!(validate_field_mapping_name("my-field").is_ok());
        assert!(validate_field_mapping_name("my.field").is_ok());
        assert!(validate_field_mapping_name("my_field").is_ok());
        assert!(validate_field_mapping_name("$my_field@").is_ok());
        assert!(validate_field_mapping_name("my/field").is_ok());
        assert!(validate_field_mapping_name(&"a".repeat(255)).is_ok());
    }

    #[test]
    fn test_quickwit_json_options_default() {
        let serde_default_json_options: QuickwitJsonOptions = serde_json::from_str("{}").unwrap();
        assert_eq!(serde_default_json_options, QuickwitJsonOptions::default())
    }

    #[test]
    fn test_tantivy_text_options_from_quickwit_text_options() {
        let tantivy_text_option = TextOptions::from(QuickwitTextOptions::default());

        assert_eq!(tantivy_text_option.is_stored(), true);
        assert_eq!(tantivy_text_option.is_fast(), false);

        match tantivy_text_option.get_indexing_options() {
            Some(text_field_indexing) => {
                assert_eq!(text_field_indexing.index_option(), IndexRecordOption::Basic);
                assert_eq!(text_field_indexing.fieldnorms(), false);
                assert_eq!(text_field_indexing.tokenizer(), "default");
            }
            _ => panic!("text field indexing is None"),
        }
    }

    #[test]
    fn test_tantivy_json_options_from_quickwit_json_options() {
        let tantivy_json_option = JsonObjectOptions::from(QuickwitJsonOptions::default());
        assert_eq!(tantivy_json_option.is_stored(), true);
        match tantivy_json_option.get_text_indexing_options() {
            Some(text_field_indexing) => {
                assert_eq!(text_field_indexing.index_option(), IndexRecordOption::Basic);
                assert_eq!(text_field_indexing.tokenizer(), "raw");
            }
            _ => panic!("text field indexing is None"),
        }
    }

    #[test]
    fn test_deserialize_text_mapping_entry_not_indexed() -> anyhow::Result<()> {
        let mapping_entry = serde_json::from_str::<FieldMappingEntry>(
            r#"
            {
                "name": "data_binary",
                "type": "text",
                "indexed": false,
                "stored": true
            }"#,
        )?;
        assert_eq!(mapping_entry.name, "data_binary");
        match mapping_entry.mapping_type {
            FieldMappingType::Text(options, _) => {
                assert_eq!(options.stored, true);
                assert!(options.indexing_options.is_none());
            }
            _ => panic!("wrong property type"),
        }
        Ok(())
    }

    #[test]
    fn test_deserialize_text_mapping_entry_not_indexed_invalid() {
        let result = serde_json::from_str::<FieldMappingEntry>(
            r#"
            {
                "name": "data_binary",
                "type": "text",
                "indexed": false,
                "record": "basic"
            }
            "#,
        );
        assert!(result.is_err());
        let error = result.unwrap_err();
        assert_eq!(
            error.to_string(),
            "error while parsing field `data_binary`: `record`, `tokenizer`, and `fieldnorms` \
             parameters are allowed only if indexed is true"
        );
    }

    #[test]
    fn test_deserialize_json_mapping_entry_not_indexed() -> anyhow::Result<()> {
        let mapping_entry = serde_json::from_str::<FieldMappingEntry>(
            r#"
            {
                "name": "data_binary",
                "type": "json",
                "indexed": false,
                "stored": true
            }"#,
        )?;
        assert_eq!(mapping_entry.name, "data_binary");
        match mapping_entry.mapping_type {
            FieldMappingType::Json(options, _) => {
                assert_eq!(options.stored, true);
                assert!(options.indexing_options.is_none());
            }
            _ => panic!("wrong property type"),
        }
        Ok(())
    }

    #[test]
    fn test_deserialize_json_mapping_entry_not_indexed_invalid() {
        let result = serde_json::from_str::<FieldMappingEntry>(
            r#"
            {
                "name": "data_binary",
                "type": "json",
                "indexed": false,
                "record": "basic"
            }
            "#,
        );
        assert!(result.is_err());
        let error = result.unwrap_err();
        assert_eq!(
            error.to_string(),
            "error while parsing field `data_binary`: `record` and `tokenizer` parameters are \
             allowed only if indexed is true"
        );
    }

    #[test]
    fn test_deserialize_invalid_text_mapping_entry() -> anyhow::Result<()> {
        let mapping_entry = serde_json::from_str::<FieldMappingEntry>(
            r#"
            {
                "name": "my_field_name",
                "type": "text",
                "stored": true,
                "record": "notexist"
            }
            "#,
        );
        assert!(mapping_entry.is_err());
        assert_eq!(
            mapping_entry.unwrap_err().to_string(),
            "error while parsing field `my_field_name`: unknown variant `notexist`, expected one \
             of `basic`, `freq`, `position`"
                .to_string()
        );
        Ok(())
    }

    #[test]
    fn test_deserialize_invalid_json_mapping_entry() -> anyhow::Result<()> {
        let mapping_entry = serde_json::from_str::<FieldMappingEntry>(
            r#"
        {
            "name": "my_field_name",
            "type": "json",
            "blub": true
        }
    "#,
        );
        assert!(mapping_entry.is_err());
        assert!(
            mapping_entry
                .unwrap_err()
                .to_string()
                .contains("error while parsing field `my_field_name`: unknown field `blub`")
        );
        Ok(())
    }

    #[test]
    fn test_deserialize_text_mapping_entry() -> anyhow::Result<()> {
        let mapping_entry = serde_json::from_str::<FieldMappingEntry>(
            r#"
        {
            "name": "my_field_name",
            "type": "text",
            "stored": true,
            "record": "basic",
            "tokenizer": "lowercase"
        }
        "#,
        )?;
        assert_eq!(mapping_entry.name, "my_field_name");
        match mapping_entry.mapping_type {
            FieldMappingType::Text(options, _) => {
                assert_eq!(options.stored, true);
                let indexing_options = options.indexing_options.unwrap();
                assert_eq!(indexing_options.tokenizer.name(), "lowercase");
                assert_eq!(indexing_options.record, IndexRecordOption::Basic);
            }
            _ => panic!("wrong property type"),
        }
        Ok(())
    }

    #[test]
    fn test_deserialize_valid_fieldnorms() -> anyhow::Result<()> {
        let result = serde_json::from_str::<FieldMappingEntry>(
            r#"
        {
            "name": "my_field_name",
            "type": "text",
            "stored": true,
            "indexed": true,
            "fieldnorms": true,
            "record": "basic",
            "tokenizer": "en_stem"
        }"#,
        );
        match result.unwrap().mapping_type {
            FieldMappingType::Text(options, _) => {
                assert_eq!(options.stored, true);
                let indexing_options = options.indexing_options.unwrap();
                assert_eq!(indexing_options.fieldnorms, true);
            }
            _ => panic!("wrong property type"),
        }

        Ok(())
    }

    #[test]
    fn test_error_on_text_with_invalid_options() {
        let result = serde_json::from_str::<FieldMappingEntry>(
            r#"
            {
                "name": "my_field_name",
                "type": "text",
                "indexed": false,
                "tokenizer": "default",
                "record": "position"
            }
            "#,
        );
        assert!(result.is_err());
        let error = result.unwrap_err();
        assert_eq!(
            error.to_string(),
            "error while parsing field `my_field_name`: `record`, `tokenizer`, and `fieldnorms` \
             parameters are allowed only if indexed is true"
        );
    }

    #[test]
    fn test_error_on_unknown_fields() -> anyhow::Result<()> {
        let result = serde_json::from_str::<FieldMappingEntry>(
            r#"
            {
                "name": "my_field_name",
                "type": "text",
                "indexing": false,
                "tokenizer": "default",
                "record": "position"
            }
            "#,
        );
        assert!(result.is_err());
        let error = result.unwrap_err();
        assert!(error.to_string().contains("unknown field `indexing`"));
        Ok(())
    }

    #[test]
    fn test_deserialize_object_mapping_entry() {
        let mapping_entry = serde_json::from_str::<FieldMappingEntry>(
            r#"
            {
            "name": "my_field_name",
            "type": "object",
            "field_mappings": [
                {
                    "name": "my_field_name",
                    "type": "text"
                }
            ]
            }
            "#,
        )
        .unwrap();
        assert_eq!(mapping_entry.name, "my_field_name");
        match mapping_entry.mapping_type {
            FieldMappingType::Object(options) => {
                assert_eq!(options.field_mappings.len(), 1);
            }
            _ => panic!("wrong property type"),
        }
    }

    #[test]
    fn test_deserialize_object_mapping_with_no_field_mappings() {
        let result = serde_json::from_str::<FieldMappingEntry>(
            r#"
            {
                "name": "my_field_name",
                "type": "object",
                "field_mappings": []
            }
            "#,
        );
        assert!(result.is_err());
        let error = result.unwrap_err();
        assert_eq!(
            error.to_string(),
            "error while parsing field `my_field_name`: object type must have at least one field \
             mapping"
        );
    }

    #[test]
    fn test_deserialize_mapping_with_unknown_type() {
        let result = serde_json::from_str::<FieldMappingEntry>(
            r#"
            {
                "name": "my_field_name",
                "type": "my custom type"
            }
            "#,
        );
        assert!(result.is_err());
        let error = result.unwrap_err();
        assert_eq!(
            error.to_string(),
            "field `my_field_name` has an unknown type: `my custom type`"
        );
    }

    #[test]
    fn test_deserialize_i64_mapping_with_invalid_name() {
        assert!(
            serde_json::from_str::<FieldMappingEntry>(
                r#"
            {
                "name": "this is not ok",
                "type": "i64"
            }
            "#,
            )
            .unwrap_err()
            .to_string()
            .contains("illegal characters")
        );
    }

    #[test]
    fn test_deserialize_i64_parsing_error_with_text_options() {
        let error = serde_json::from_str::<FieldMappingEntry>(
            r#"
            {
                "name": "my_field_name",
                "type": "i64",
                "tokenizer": "basic"
            }
            "#,
        )
        .unwrap_err();

        assert_eq!(
            error.to_string(),
            "error while parsing field `my_field_name`: unknown field `tokenizer`, expected one \
             of `description`, `stored`, `indexed`, `fast`, `coerce`, `output_format`"
        );
    }

    #[test]
    fn test_deserialize_i64_mapping_multivalued() -> anyhow::Result<()> {
        let result = serde_json::from_str::<FieldMappingEntry>(
            r#"
            {
                "name": "my_field_name",
                "type": "array<i64>"
            }
            "#,
        )?;

        match result.mapping_type {
            FieldMappingType::I64(options, cardinality) => {
                assert_eq!(options.indexed, true); // default
                assert_eq!(options.fast, false); // default
                assert_eq!(options.stored, true); // default
                assert_eq!(cardinality, Cardinality::MultiValued);
            }
            _ => bail!("Wrong type"),
        }

        Ok(())
    }

    #[test]
    fn test_deserialize_i64_mapping_singlevalued() -> anyhow::Result<()> {
        let result = serde_json::from_str::<FieldMappingEntry>(
            r#"
            {
                "name": "my_field_name",
                "type": "i64"
            }
            "#,
        )?;

        match result.mapping_type {
            FieldMappingType::I64(options, cardinality) => {
                assert_eq!(options.indexed, true); // default
                assert_eq!(options.fast, false); // default
                assert_eq!(options.stored, true); // default
                assert_eq!(cardinality, Cardinality::SingleValued);
            }
            _ => bail!("Wrong type"),
        }

        Ok(())
    }

    #[test]
    fn test_serialize_i64_mapping() -> anyhow::Result<()> {
        let entry = serde_json::from_str::<FieldMappingEntry>(
            r#"
            {
                "name": "my_field_name",
                "type": "i64"
            }
            "#,
        )?;
        let entry_str = serde_json::to_value(&entry)?;
        assert_eq!(
            entry_str,
            serde_json::json!({
                "name": "my_field_name",
                "type": "i64",
                "stored": true,
                "fast": false,
                "indexed": true,
                "coerce": true,
                "output_format": "number"
            })
        );
        Ok(())
    }

    #[test]
    fn test_deserialize_u64_mapping_with_wrong_options() {
        assert_eq!(
            serde_json::from_str::<FieldMappingEntry>(
                r#"
            {
                "name": "my_field_name",
                "type": "u64",
                "tokenizer": "basic"
            }"#
            )
            .unwrap_err()
            .to_string(),
            "error while parsing field `my_field_name`: unknown field `tokenizer`, expected one \
             of `description`, `stored`, `indexed`, `fast`, `coerce`, `output_format`"
        );
    }

    #[test]
    fn test_deserialize_u64_u64_mapping_multivalued() {
        let result = serde_json::from_str::<FieldMappingEntry>(
            r#"
            {
                "name": "my_field_name",
                "type": "array<u64>"
            }
            "#,
        )
        .unwrap();

        if let FieldMappingType::U64(options, cardinality) = result.mapping_type {
            assert_eq!(options.indexed, true); // default
            assert_eq!(options.fast, false); // default
            assert_eq!(options.stored, true); // default
            assert_eq!(cardinality, Cardinality::MultiValued);
        } else {
            panic!("Wrong type");
        }
    }

    #[test]
    fn test_deserialize_u64_mapping_singlevalued() {
        let result = serde_json::from_str::<FieldMappingEntry>(
            r#"
            {
                "name": "my_field_name",
                "type": "u64"
            }
            "#,
        )
        .unwrap();
        if let FieldMappingType::U64(options, cardinality) = result.mapping_type {
            assert_eq!(options.indexed, true); // default
            assert_eq!(options.fast, false); // default
            assert_eq!(options.stored, true); // default
            assert_eq!(cardinality, Cardinality::SingleValued);
        } else {
            panic!("Wrong type");
        }
    }

    #[test]
    fn test_serialize_u64_mapping() {
        let entry = serde_json::from_str::<FieldMappingEntry>(
            r#"
            {
                "name": "my_field_name",
                "type": "u64"
            }
            "#,
        )
        .unwrap();
        let entry_str = serde_json::to_value(&entry).unwrap();
        assert_eq!(
            entry_str,
            serde_json::json!({
                "name": "my_field_name",
                "type":"u64",
                "stored": true,
                "fast": false,
                "indexed": true,
                "coerce": true,
                "output_format": "number"
            })
        );
    }

    #[test]
    fn test_parse_f64_mapping() {
        let entry = serde_json::from_str::<FieldMappingEntry>(
            r#"
            {
                "name": "my_field_name",
                "type": "f64"
            }
            "#,
        )
        .unwrap();
        let entry_deserser = serde_json::to_value(&entry).unwrap();
        assert_eq!(
            entry_deserser,
            json!({
                "name": "my_field_name",
                "type":"f64",
                "stored": true,
                "fast": false,
                "indexed": true,
                "coerce": true,
                "output_format": "number"
            })
        );
    }

    #[test]
    fn test_parse_bool_mapping() {
        let entry = serde_json::from_str::<FieldMappingEntry>(
            r#"
            {
                "name": "my_field_name",
                "type": "bool"
            }
            "#,
        )
        .unwrap();
        let entry_deserser = serde_json::to_value(&entry).unwrap();
        assert_eq!(
            entry_deserser,
            json!({
                "name": "my_field_name",
                "type": "bool",
                "stored": true,
                "fast": false,
                "indexed": true,
            })
        );
    }

    #[test]
    fn test_parse_ip_addr_mapping() {
        let entry = serde_json::from_str::<FieldMappingEntry>(
            r#"
            {
                "name": "ip_address",
                "description": "Client IP address",
                "type": "ip"
            }
            "#,
        )
        .unwrap();
        let entry_str = serde_json::to_value(&entry).unwrap();
        assert_eq!(
            entry_str,
            serde_json::json!({
                "name": "ip_address",
                "description": "Client IP address",
                "type": "ip",
                "stored": true,
                "fast": false,
                "indexed": true
            })
        );
    }

    #[test]
    fn test_parse_text_mapping() {
        let entry = serde_json::from_str::<FieldMappingEntry>(
            r#"
            {
                "name": "my_field_name",
                "type": "text"
            }
            "#,
        )
        .unwrap();
        let entry_deserser = serde_json::to_value(&entry).unwrap();
        assert_eq!(
            entry_deserser,
            json!({
                "name": "my_field_name",
                "type": "text",
                "fast": false,
                "stored": true,
                "indexed": true,
                "record": "basic",
                "tokenizer": "default",
                "fieldnorms": false,
            })
        );
    }

    #[test]
    fn test_parse_text_fast_field_normalizer() {
        let entry = serde_json::from_str::<FieldMappingEntry>(
            r#"
            {
                "name": "my_field_name",
                "type": "text",
                "fast": {"normalizer": "lowercase"}
            }
            "#,
        )
        .unwrap();
        let entry_deserser = serde_json::to_value(&entry).unwrap();
        assert_eq!(
            entry_deserser,
            json!({
                "name": "my_field_name",
                "type": "text",
                "fast": {"normalizer": "lowercase"},
                "stored": true,
                "indexed": true,
                "record": "basic",
                "tokenizer": "default",
                "fieldnorms": false,
            })
        );
    }

    #[test]
    fn test_parse_text_mapping_multivalued() {
        let entry = serde_json::from_str::<FieldMappingEntry>(
            r#"
            {
                "name": "my_field_name",
                "type": "array<text>"
            }
            "#,
        )
        .unwrap();
        let entry_deserser = serde_json::to_value(&entry).unwrap();
        assert_eq!(
            entry_deserser,
            json!({
                "name": "my_field_name",
                "type": "array<text>",
                "stored": true,
                "indexed": true,
                "record": "basic",
                "tokenizer": "default",
                "fieldnorms": false,
                "fast": false,
            })
        );
    }

    #[test]
    fn test_parse_date_mapping() {
        let entry = serde_json::from_str::<FieldMappingEntry>(
            r#"
            {
                "name": "my_field_name",
                "type": "datetime"
            }
            "#,
        )
        .unwrap();
        let entry_deserser = serde_json::to_value(&entry).unwrap();
        assert_eq!(
            entry_deserser,
            json!({
                "name": "my_field_name",
                "type": "datetime",
                "input_formats": ["rfc3339", "unix_timestamp"],
                "output_format": "rfc3339",
                "fast_precision": "seconds",
                "stored": true,
                "indexed": true,
                "fast": false,
            })
        );
    }

    #[test]
    fn test_parse_date_arr_mapping() {
        let entry = serde_json::from_str::<FieldMappingEntry>(
            r#"
            {
                "name": "my_field_name",
                "type": "array<datetime>",
                "fast_precision": "milliseconds"
            }
            "#,
        )
        .unwrap();
        let entry_deserser = serde_json::to_value(&entry).unwrap();
        assert_eq!(
            entry_deserser,
            json!({
                "name": "my_field_name",
                "type": "array<datetime>",
                "input_formats": ["rfc3339", "unix_timestamp"],
                "output_format": "rfc3339",
                "fast_precision": "milliseconds",
                "stored": true,
                "indexed": true,
                "fast": false,
            })
        );
    }

    #[test]
    fn test_parse_bytes_mapping() {
        let entry = serde_json::from_str::<FieldMappingEntry>(
            r#"
            {
                "name": "my_field_name",
                "type": "bytes",
                "input_format": "hex",
                "output_format": "base64"
            }
            "#,
        )
        .unwrap();
        let entry_deserser = serde_json::to_value(&entry).unwrap();
        assert_eq!(
            entry_deserser,
            json!({
                "name": "my_field_name",
                "type": "bytes",
                "stored": true,
                "indexed": true,
                "fast": false,
                "input_format": "hex",
                "output_format": "base64"
            })
        );
    }

    #[test]
    fn test_parse_bytes_mapping_arr() {
        let entry = serde_json::from_str::<FieldMappingEntry>(
            r#"
            {
                "name": "my_field_name",
                "type": "array<bytes>"
            }
            "#,
        )
        .unwrap();
        let entry_deserser = serde_json::to_value(&entry).unwrap();
        assert_eq!(
            entry_deserser,
            json!({
                "name": "my_field_name",
                "type": "array<bytes>",
                "stored": true,
                "indexed": true,
                "fast": false,
                "input_format": "base64",
                "output_format": "base64"
            })
        );
    }

    #[test]
    fn test_parse_bytes_mapping_arr_and_fast_forbidden() {
        let err = serde_json::from_str::<FieldMappingEntry>(
            r#"
            {
                "name": "my_field_name",
                "type": "array<bytes>",
                "fast": true
            }
            "#,
        )
        .err()
        .unwrap();
        assert_eq!(
            err.to_string(),
            "error while parsing field `my_field_name`: fast field is not allowed for array<bytes>",
        );
    }

    #[test]
    fn test_parse_json_mapping_singlevalue() {
        let field_mapping_entry = serde_json::from_str::<FieldMappingEntry>(
            r#"
            {
                "type": "json",
                "name": "my_json_field",
                "stored": true
            }
            "#,
        )
        .unwrap();
        let expected_json_options = QuickwitJsonOptions {
            description: None,
            indexing_options: Some(TextIndexingOptions::default_json()),
            stored: true,
            fast: FastFieldOptions::Disabled,
            expand_dots: true,
        };
        assert_eq!(&field_mapping_entry.name, "my_json_field");
        assert!(
            matches!(field_mapping_entry.mapping_type, FieldMappingType::Json(json_config,
            Cardinality::SingleValued) if json_config == expected_json_options)
        );
    }

    #[test]
    fn test_quickwit_json_options_default_tokenizer_is_raw() {
        let quickwit_json_options = QuickwitJsonOptions::default();
        assert_eq!(
            quickwit_json_options
                .indexing_options
                .unwrap()
                .tokenizer
                .name(),
            "raw"
        );
    }

    #[test]
    fn test_quickwit_json_options_default_fast_is_false() {
        let quickwit_json_options = QuickwitJsonOptions::default();
        assert_eq!(quickwit_json_options.fast, FastFieldOptions::Disabled);
    }

    #[test]
    fn test_quickwit_json_options_default_consistent_with_default() {
        let quickwit_json_options: QuickwitJsonOptions = serde_json::from_str("{}").unwrap();
        assert_eq!(quickwit_json_options, QuickwitJsonOptions::default());
    }

    #[test]
    fn test_parse_json_mapping_multivalued() {
        let field_mapping_entry = serde_json::from_str::<FieldMappingEntry>(
            r#"
            {
                "type": "array<json>",
                "name": "my_json_field_multi",
                "tokenizer": "raw",
                "stored": false,
                "fast": false
            }
            "#,
        )
        .unwrap();
        let expected_json_options = QuickwitJsonOptions {
            description: None,
            indexing_options: Some(TextIndexingOptions::default_json()),
            stored: false,
            expand_dots: true,
            fast: FastFieldOptions::Disabled,
        };
        assert_eq!(&field_mapping_entry.name, "my_json_field_multi");
        assert!(
            matches!(field_mapping_entry.mapping_type, FieldMappingType::Json(json_config,
    Cardinality::MultiValued) if json_config == expected_json_options)
        );
    }

    #[test]
    fn test_serialize_i64_with_description_field() {
        let entry = serde_json::from_str::<FieldMappingEntry>(
            r#"
            {
                "name": "my_field_name",
                "description": "If you see this description, your test is failed",
                "type": "i64"
            }"#,
        )
        .unwrap();

        let entry_str = serde_json::to_value(&entry).unwrap();
        assert_eq!(
            entry_str,
            serde_json::json!({
                "name": "my_field_name",
                "description": "If you see this description, your test is failed",
                "type": "i64",
                "stored": true,
                "fast": false,
                "indexed": true,
                "coerce": true,
                "output_format": "number"
            })
        );
    }

    #[test]
    fn test_serialize_text_with_description_field() {
        let entry = serde_json::from_str::<FieldMappingEntry>(
            r#"
            {
                "name": "my_field_name",
                "description": "If you see this description, your test is failed",
                "type": "text"
            }"#,
        )
        .unwrap();

        let entry_str = serde_json::to_value(&entry).unwrap();
        assert_eq!(
            entry_str,
            serde_json::json!({
                "name": "my_field_name",
                "description": "If you see this description, your test is failed",
                "type": "text",
                "fast": false,
                "stored": true,
                "indexed": true,
                "record": "basic",
                "tokenizer": "default",
                "fieldnorms": false,
            })
        );
    }
    #[test]
    fn test_serialize_json_with_description_field() {
        let entry = serde_json::from_str::<FieldMappingEntry>(
            r#"
            {
                "name": "my_field_name",
                "description": "If you see this description, your test failed",
                "type": "json"
            }"#,
        )
        .unwrap();

        let entry_str = serde_json::to_value(&entry).unwrap();
        assert_eq!(
            entry_str,
            serde_json::json!({
                "name": "my_field_name",
                "description": "If you see this description, your test failed",
                "type": "json",
                "stored": true,
                "indexed": true,
                "tokenizer": "raw",
                "record": "basic",
                "fast": false,
                "expand_dots": true,
            })
        );
    }
}


================================================
FILE: quickwit/quickwit-doc-mapper/src/doc_mapper/field_mapping_type.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use tantivy::schema::Type;

use super::date_time_type::QuickwitDateTimeOptions;
use super::field_mapping_entry::QuickwitBoolOptions;
use crate::Cardinality;
use crate::doc_mapper::field_mapping_entry::{
    QuickwitBytesOptions, QuickwitConcatenateOptions, QuickwitIpAddrOptions, QuickwitJsonOptions,
    QuickwitNumericOptions, QuickwitObjectOptions, QuickwitTextOptions,
};

/// A `FieldMappingType` defines the type and indexing options
/// of a mapping field.
#[derive(Clone, Debug, PartialEq)]
pub enum FieldMappingType {
    /// String mapping type configuration.
    Text(QuickwitTextOptions, Cardinality),
    /// Signed 64-bit integer mapping type configuration.
    I64(QuickwitNumericOptions, Cardinality),
    /// Unsigned 64-bit integer mapping type configuration.
    U64(QuickwitNumericOptions, Cardinality),
    /// DateTime mapping type configuration
    DateTime(QuickwitDateTimeOptions, Cardinality),
    /// 64-bit float mapping type configuration.
    F64(QuickwitNumericOptions, Cardinality),
    /// Bool mapping type configuration.
    Bool(QuickwitBoolOptions, Cardinality),
    /// IP Address mapping type configuration.
    IpAddr(QuickwitIpAddrOptions, Cardinality),
    /// Bytes mapping type configuration.
    Bytes(QuickwitBytesOptions, Cardinality),
    /// Json mapping type configuration.
    Json(QuickwitJsonOptions, Cardinality),
    /// Object mapping type configuration.
    Object(QuickwitObjectOptions),
    /// Concatenate field mapping type configuration.
    Concatenate(QuickwitConcatenateOptions),
}

impl FieldMappingType {
    /// Returns the field mapping type name.
    pub fn quickwit_field_type(&self) -> QuickwitFieldType {
        let (primitive_type, cardinality) = match self {
            FieldMappingType::Text(_, cardinality) => (Type::Str, *cardinality),
            FieldMappingType::I64(_, cardinality) => (Type::I64, *cardinality),
            FieldMappingType::U64(_, cardinality) => (Type::U64, *cardinality),
            FieldMappingType::F64(_, cardinality) => (Type::F64, *cardinality),
            FieldMappingType::Bool(_, cardinality) => (Type::Bool, *cardinality),
            FieldMappingType::IpAddr(_, cardinality) => (Type::IpAddr, *cardinality),
            FieldMappingType::DateTime(_, cardinality) => (Type::Date, *cardinality),
            FieldMappingType::Bytes(_, cardinality) => (Type::Bytes, *cardinality),
            FieldMappingType::Json(_, cardinality) => (Type::Json, *cardinality),
            FieldMappingType::Object(_) => {
                return QuickwitFieldType::Object;
            }
            FieldMappingType::Concatenate(_) => return QuickwitFieldType::Concatenate,
        };
        match cardinality {
            Cardinality::SingleValued => QuickwitFieldType::Simple(primitive_type),
            Cardinality::MultiValued => QuickwitFieldType::Array(primitive_type),
        }
    }
}

#[derive(Debug, Eq, PartialEq)]
pub enum QuickwitFieldType {
    Simple(Type),
    Object,
    Concatenate,
    Array(Type),
}

impl QuickwitFieldType {
    pub fn to_type_id(&self) -> String {
        match self {
            QuickwitFieldType::Simple(typ) => primitive_type_to_str(typ).to_string(),
            QuickwitFieldType::Object => "object".to_string(),
            QuickwitFieldType::Array(typ) => format!("array<{}>", primitive_type_to_str(typ)),
            QuickwitFieldType::Concatenate => "concatenate".to_string(),
        }
    }

    pub fn parse_type_id(type_str: &str) -> Option<QuickwitFieldType> {
        if type_str == "object" {
            return Some(QuickwitFieldType::Object);
        }
        if type_str == "concatenate" {
            return Some(QuickwitFieldType::Concatenate);
        }
        if type_str.starts_with("array<") && type_str.ends_with('>') {
            let parsed_type_str = parse_primitive_type(&type_str[6..type_str.len() - 1])?;
            return Some(QuickwitFieldType::Array(parsed_type_str));
        }
        let parsed_type_str = parse_primitive_type(type_str)?;
        Some(QuickwitFieldType::Simple(parsed_type_str))
    }
}

fn parse_primitive_type(primitive_type_str: &str) -> Option<Type> {
    match primitive_type_str {
        "text" => Some(Type::Str),
        "u64" => Some(Type::U64),
        "i64" => Some(Type::I64),
        "f64" => Some(Type::F64),
        "bool" => Some(Type::Bool),
        "ip" => Some(Type::IpAddr),
        "datetime" => Some(Type::Date),
        "bytes" => Some(Type::Bytes),
        "json" => Some(Type::Json),
        _unknown_type => None,
    }
}

fn primitive_type_to_str(primitive_type: &Type) -> &'static str {
    match primitive_type {
        Type::Str => "text",
        Type::U64 => "u64",
        Type::I64 => "i64",
        Type::F64 => "f64",
        Type::Bool => "bool",
        Type::IpAddr => "ip",
        Type::Date => "datetime",
        Type::Bytes => "bytes",
        Type::Json => "json",
        Type::Facet => {
            unimplemented!("Facets are not supported by quickwit at the moment.")
        }
    }
}

#[cfg(test)]
mod tests {
    use tantivy::schema::Type;

    use super::QuickwitFieldType;

    #[track_caller]
    fn test_parse_type_aux(type_str: &str, expected: Option<QuickwitFieldType>) {
        let quickwit_field_type = QuickwitFieldType::parse_type_id(type_str);
        assert_eq!(quickwit_field_type, expected);
    }

    #[test]
    fn test_parse_type() {
        test_parse_type_aux("array<i64>", Some(QuickwitFieldType::Array(Type::I64)));
        test_parse_type_aux("array<text>", Some(QuickwitFieldType::Array(Type::Str)));
        test_parse_type_aux("array<texto>", None);
        test_parse_type_aux("text", Some(QuickwitFieldType::Simple(Type::Str)));
        test_parse_type_aux("object", Some(QuickwitFieldType::Object));
        test_parse_type_aux("object2", None);
        test_parse_type_aux("bool", Some(QuickwitFieldType::Simple(Type::Bool)));
        test_parse_type_aux("ip", Some(QuickwitFieldType::Simple(Type::IpAddr)));
    }
}


================================================
FILE: quickwit/quickwit-doc-mapper/src/doc_mapper/field_presence.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use fnv::FnvHashSet;
use quickwit_common::PathHasher;
use tantivy::Document;
use tantivy::schema::document::{ReferenceValue, ReferenceValueLeaf};
use tantivy::schema::{FieldType, Schema, Value};

/// Populates the field presence for a document.
///
/// The field presence is a set of hashes that represent the fields that are present in the
/// document. Each hash is computed from the field path.
///
/// It is only added if the field is indexed and not fast.
pub(crate) fn populate_field_presence<D: Document>(
    document: &D,
    schema: &Schema,
    populate_object_fields: bool,
) -> FnvHashSet<u64> {
    let mut field_presence_hashes: FnvHashSet<u64> =
        FnvHashSet::with_capacity_and_hasher(schema.num_fields(), Default::default());
    for (field, value) in document.iter_fields_and_values() {
        let field_entry = schema.get_field_entry(field);
        if !field_entry.is_indexed() || field_entry.is_fast() {
            // We are using an tantivy's ExistsQuery for fast fields.
            continue;
        }
        let mut path_hasher: PathHasher = PathHasher::default();
        path_hasher.append(&field.field_id().to_le_bytes()[..]);
        if let Some(json_obj) = value.as_object() {
            let is_expand_dots_enabled: bool =
                if let FieldType::JsonObject(json_options) = field_entry.field_type() {
                    json_options.is_expand_dots_enabled()
                } else {
                    false
                };
            let mut subfields_populator = SubfieldsPopulator {
                populate_object_fields,
                is_expand_dots_enabled,
                field_presence_hashes,
            };
            subfields_populator.populate_field_presence_for_json_obj(path_hasher, json_obj);
            field_presence_hashes = subfields_populator.field_presence_hashes;
        } else {
            field_presence_hashes.insert(path_hasher.finish_leaf());
        }
    }
    field_presence_hashes
}

/// A struct to help populate field presence hashes for nested JSON field.
struct SubfieldsPopulator {
    populate_object_fields: bool,
    is_expand_dots_enabled: bool,
    field_presence_hashes: FnvHashSet<u64>,
}

impl SubfieldsPopulator {
    #[inline]
    fn populate_field_presence_for_json_value<'a>(
        &mut self,
        path_hasher: PathHasher,
        json_value: impl Value<'a>,
    ) {
        match json_value.as_value() {
            ReferenceValue::Leaf(ReferenceValueLeaf::Null) => {}
            ReferenceValue::Leaf(_) => {
                self.field_presence_hashes.insert(path_hasher.finish_leaf());
            }
            ReferenceValue::Array(items) => {
                for item in items {
                    self.populate_field_presence_for_json_value(path_hasher.clone(), item);
                }
            }
            ReferenceValue::Object(json_obj) => {
                self.populate_field_presence_for_json_obj(path_hasher, json_obj);
            }
        }
    }

    fn populate_field_presence_for_json_obj<'a, I, V>(
        &mut self,
        path_hasher: PathHasher,
        json_obj: I,
    ) where
        I: Iterator<Item = (&'a str, V)>,
        V: Value<'a>,
    {
        if self.populate_object_fields {
            self.field_presence_hashes
                .insert(path_hasher.finish_intermediate());
        }
        for (field_key, field_value) in json_obj {
            let mut child_path_hasher = path_hasher.clone();
            if self.is_expand_dots_enabled {
                let mut expanded_key = field_key.split('.').peekable();
                while let Some(segment) = expanded_key.next() {
                    child_path_hasher.append(segment.as_bytes());
                    if self.populate_object_fields && expanded_key.peek().is_some() {
                        self.field_presence_hashes
                            .insert(child_path_hasher.finish_intermediate());
                    }
                }
            } else {
                child_path_hasher.append(field_key.as_bytes());
            };
            self.populate_field_presence_for_json_value(child_path_hasher, field_value);
        }
    }
}

#[cfg(test)]
mod tests {
    use tantivy::TantivyDocument;
    use tantivy::schema::*;

    use super::*;

    #[test]
    fn test_populate_field_presence_basic() {
        let mut schema_builder = Schema::builder();
        schema_builder.add_text_field("indexed_text", TEXT);
        schema_builder.add_text_field("text_not_indexed", STORED);
        let schema = schema_builder.build();
        let json_doc = r#"{"indexed_text": "hello", "text_not_indexed": "world"}"#;
        let document = TantivyDocument::parse_json(&schema, json_doc).unwrap();

        let field_presence = populate_field_presence(&document, &schema, true);
        assert_eq!(field_presence.len(), 1);
    }

    #[test]
    fn test_populate_field_presence_with_array() {
        let mut schema_builder = Schema::builder();
        schema_builder.add_text_field("list", TEXT);
        let schema = schema_builder.build();
        let json_doc = r#"{"list": ["value1", "value2"]}"#;
        let document = TantivyDocument::parse_json(&schema, json_doc).unwrap();

        let field_presence = populate_field_presence(&document, &schema, true);
        assert_eq!(field_presence.len(), 1);
    }

    #[test]
    fn test_populate_field_presence_with_json() {
        let mut schema_builder = Schema::builder();
        schema_builder.add_json_field("json", TEXT);
        let schema = schema_builder.build();
        let json_doc = r#"{"json": {"subfield": "a"}}"#;
        let document = TantivyDocument::parse_json(&schema, json_doc).unwrap();

        let field_presence = populate_field_presence(&document, &schema, false);
        assert_eq!(field_presence.len(), 1);
        let field_presence = populate_field_presence(&document, &schema, true);
        assert_eq!(field_presence.len(), 2);
    }

    #[test]
    fn test_populate_field_presence_with_nested_jsons() {
        let mut schema_builder = Schema::builder();
        schema_builder.add_json_field("json", TEXT);
        let schema = schema_builder.build();
        let json_doc = r#"{"json": {"subfield": {"subsubfield": "a"}}}"#;
        let document = TantivyDocument::parse_json(&schema, json_doc).unwrap();

        let field_presence = populate_field_presence(&document, &schema, false);
        assert_eq!(field_presence.len(), 1);
        let field_presence = populate_field_presence(&document, &schema, true);
        assert_eq!(field_presence.len(), 3);
    }

    #[test]
    fn test_populate_field_presence_with_array_of_objects() {
        let mut schema_builder = Schema::builder();
        schema_builder.add_json_field("json", TEXT);
        let schema = schema_builder.build();
        let json_doc = r#"{"json": {"list": [{"key1":"value1"}, {"key2":"value2"}]}}"#;
        let document = TantivyDocument::parse_json(&schema, json_doc).unwrap();

        let field_presence = populate_field_presence(&document, &schema, false);
        assert_eq!(field_presence.len(), 2);
        let field_presence = populate_field_presence(&document, &schema, true);
        assert_eq!(field_presence.len(), 4);
    }

    #[test]
    fn test_populate_field_presence_with_expand_dots() {
        let mut schema_builder = Schema::builder();
        schema_builder.add_json_field(
            "json",
            Into::<JsonObjectOptions>::into(TEXT).set_expand_dots_enabled(),
        );
        let schema = schema_builder.build();
        let json_doc = r#"{"json": {"key.with.dots": "value"}}"#;
        let document = TantivyDocument::parse_json(&schema, json_doc).unwrap();

        let field_presence = populate_field_presence(&document, &schema, false);
        assert_eq!(field_presence.len(), 1);
        let field_presence = populate_field_presence(&document, &schema, true);
        assert_eq!(field_presence.len(), 4);
    }
}


================================================
FILE: quickwit/quickwit-doc-mapper/src/doc_mapper/mapping_tree.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::any::type_name;
use std::collections::BTreeMap;
use std::net::IpAddr;
use std::str::FromStr;

use anyhow::bail;
use itertools::Itertools;
use serde_json::Value as JsonValue;
use serde_json_borrow::{Map as BorrowedJsonMap, Value as BorrowedJsonValue};
use tantivy::TantivyDocument as Document;
use tantivy::schema::{
    BytesOptions, DateOptions, Field, IntoIpv6Addr, IpAddrOptions, JsonObjectOptions,
    NumericOptions, OwnedValue as TantivyValue, SchemaBuilder, TextOptions,
};

use super::date_time_type::QuickwitDateTimeOptions;
use super::field_mapping_entry::QuickwitBoolOptions;
use super::tantivy_val_to_json::formatted_tantivy_value_to_json;
use crate::doc_mapper::field_mapping_entry::{
    QuickwitBytesOptions, QuickwitIpAddrOptions, QuickwitNumericOptions, QuickwitObjectOptions,
    QuickwitTextOptions,
};
use crate::doc_mapper::{FieldMappingType, QuickwitJsonOptions};
use crate::{Cardinality, DocParsingError, FieldMappingEntry, ModeType};

#[derive(Clone, Debug)]
pub enum LeafType {
    Bool(QuickwitBoolOptions),
    Bytes(QuickwitBytesOptions),
    DateTime(QuickwitDateTimeOptions),
    F64(QuickwitNumericOptions),
    I64(QuickwitNumericOptions),
    U64(QuickwitNumericOptions),
    IpAddr(QuickwitIpAddrOptions),
    Json(QuickwitJsonOptions),
    Text(QuickwitTextOptions),
}

enum MapOrArrayIter {
    Array(std::vec::IntoIter<JsonValue>),
    Map(serde_json::map::IntoIter),
    Value(JsonValue),
}

impl Iterator for MapOrArrayIter {
    type Item = JsonValue;

    fn next(&mut self) -> Option<JsonValue> {
        match self {
            MapOrArrayIter::Array(iter) => iter.next(),
            MapOrArrayIter::Map(iter) => iter.next().map(|(_, val)| val),
            MapOrArrayIter::Value(val) => {
                if val.is_null() {
                    None
                } else {
                    Some(std::mem::take(val))
                }
            }
        }
    }
}

/// Iterate over all primitive values inside the provided JsonValue, ignoring Nulls, and opening
/// arrays and objects.
pub(crate) struct JsonValueIterator {
    currently_itered: Vec<MapOrArrayIter>,
}

impl JsonValueIterator {
    pub fn new(source: JsonValue) -> JsonValueIterator {
        let base_value = match source {
            JsonValue::Array(array) => MapOrArrayIter::Array(array.into_iter()),
            JsonValue::Object(map) => MapOrArrayIter::Map(map.into_iter()),
            other => MapOrArrayIter::Value(other),
        };
        JsonValueIterator {
            currently_itered: vec![base_value],
        }
    }
}

impl Iterator for JsonValueIterator {
    type Item = JsonValue;

    fn next(&mut self) -> Option<JsonValue> {
        loop {
            let currently_itered = self.currently_itered.last_mut()?;
            match currently_itered.next() {
                Some(JsonValue::Array(array)) => self
                    .currently_itered
                    .push(MapOrArrayIter::Array(array.into_iter())),
                Some(JsonValue::Object(map)) => self
                    .currently_itered
                    .push(MapOrArrayIter::Map(map.into_iter())),
                Some(JsonValue::Null) => continue,
                Some(other) => return Some(other),
                None => {
                    self.currently_itered.pop();
                    continue;
                }
            }
        }
    }
}

enum OneOrIter<T, I: Iterator<Item = T>> {
    One(Option<T>),
    Iter(I),
}

impl<T, I: Iterator<Item = T>> OneOrIter<T, I> {
    pub fn one(item: T) -> Self {
        OneOrIter::One(Some(item))
    }
}

impl<T, I: Iterator<Item = T>> Iterator for OneOrIter<T, I> {
    type Item = T;

    fn next(&mut self) -> Option<T> {
        match self {
            OneOrIter::Iter(iter) => iter.next(),
            OneOrIter::One(item) => std::mem::take(item),
        }
    }
}

/// Similar to the native `From<JsonValue> for TantivyValue` implementation, with a
/// subtle difference: no automatic parsing to DateTime is performed when the string
/// is a valid RFC3339 date. This enables some level of range querying through prefix
/// queries despite concatenate fields not supporting fast fields.
pub(crate) fn map_primitive_json_to_concatenate_value(value: JsonValue) -> Option<TantivyValue> {
    match value {
        JsonValue::Array(_) | JsonValue::Object(_) | JsonValue::Null => None,
        JsonValue::String(text) => Some(TantivyValue::Str(text)),
        JsonValue::Bool(val) => Some((val).into()),
        JsonValue::Number(number) => {
            if let Some(val) = i64::from_json_number(&number) {
                Some((val).into())
            } else if let Some(val) = u64::from_json_number(&number) {
                Some((val).into())
            } else {
                f64::from_json_number(&number).map(|val| (val).into())
            }
        }
    }
}

impl LeafType {
    fn validate_from_json(&self, json_val: &BorrowedJsonValue) -> Result<(), String> {
        match self {
            LeafType::Text(_) => {
                if json_val.is_string() {
                    Ok(())
                } else {
                    Err(format!("expected string, got `{json_val}`"))
                }
            }
            LeafType::I64(numeric_options) => {
                i64::validate_json(json_val, numeric_options.coerce).map(|_| ())
            }
            LeafType::U64(numeric_options) => {
                u64::validate_json(json_val, numeric_options.coerce).map(|_| ())
            }
            LeafType::F64(numeric_options) => {
                f64::validate_json(json_val, numeric_options.coerce).map(|_| ())
            }
            LeafType::Bool(_) => {
                if json_val.is_bool() {
                    Ok(())
                } else {
                    Err(format!("expected boolean, got `{json_val}`"))
                }
            }
            LeafType::IpAddr(_) => {
                let Some(ip_address) = json_val.as_str() else {
                    return Err(format!("expected string, got `{json_val}`"));
                };
                IpAddr::from_str(ip_address)
                    .map_err(|err| format!("failed to parse IP address `{ip_address}`: {err}"))?;
                Ok(())
            }
            LeafType::DateTime(date_time_options) => {
                date_time_options.validate_json(json_val).map(|_| ())
            }
            LeafType::Bytes(binary_options) => {
                if let Some(byte_str) = json_val.as_str() {
                    binary_options.input_format.parse_str(byte_str)?;
                    Ok(())
                } else {
                    Err(format!(
                        "expected {} string, got `{json_val}`",
                        binary_options.input_format.as_str()
                    ))
                }
            }
            LeafType::Json(_) => {
                if json_val.is_object() {
                    Ok(())
                } else {
                    Err(format!("expected object, got `{json_val}`"))
                }
            }
        }
    }

    fn value_from_json(&self, json_val: JsonValue) -> Result<TantivyValue, String> {
        match self {
            LeafType::Text(_) => {
                if let JsonValue::String(text) = json_val {
                    Ok(TantivyValue::Str(text))
                } else {
                    Err(format!("expected string, got `{json_val}`"))
                }
            }
            LeafType::I64(numeric_options) => i64::from_json(json_val, numeric_options.coerce),
            LeafType::U64(numeric_options) => u64::from_json(json_val, numeric_options.coerce),
            LeafType::F64(numeric_options) => f64::from_json(json_val, numeric_options.coerce),
            LeafType::Bool(_) => {
                if let JsonValue::Bool(val) = json_val {
                    Ok(TantivyValue::Bool(val))
                } else {
                    Err(format!("expected boolean, got `{json_val}`"))
                }
            }
            LeafType::IpAddr(_) => {
                if let JsonValue::String(ip_address) = json_val {
                    let ipv6_value = IpAddr::from_str(ip_address.as_str())
                        .map_err(|err| format!("failed to parse IP address `{ip_address}`: {err}"))?
                        .into_ipv6_addr();
                    Ok(TantivyValue::IpAddr(ipv6_value))
                } else {
                    Err(format!("expected string, got `{json_val}`"))
                }
            }
            LeafType::DateTime(date_time_options) => date_time_options.parse_json(&json_val),
            LeafType::Bytes(binary_options) => binary_options.input_format.parse_json(&json_val),
            LeafType::Json(_) => {
                if let JsonValue::Object(json_obj) = json_val {
                    Ok(TantivyValue::Object(
                        json_obj
                            .into_iter()
                            .map(|(key, val)| (key, val.into()))
                            .collect(),
                    ))
                } else {
                    Err(format!("expected object, got `{json_val}`"))
                }
            }
        }
    }

    fn concatenate_values_from_json(
        &self,
        json_val: JsonValue,
    ) -> Result<impl Iterator<Item = TantivyValue>, String> {
        match self {
            LeafType::Text(_) => {
                if let JsonValue::String(text) = json_val {
                    Ok(OneOrIter::one(TantivyValue::Str(text)))
                } else {
                    Err(format!("expected string, got `{json_val}`"))
                }
            }
            LeafType::I64(numeric_options) => {
                let val = i64::from_json_to_self(&json_val, numeric_options.coerce)?;
                Ok(OneOrIter::one((val).into()))
            }
            LeafType::U64(numeric_options) => {
                let val = u64::from_json_to_self(&json_val, numeric_options.coerce)?;
                Ok(OneOrIter::one((val).into()))
            }
            LeafType::F64(numeric_options) => {
                let val = f64::from_json_to_self(&json_val, numeric_options.coerce)?;
                Ok(OneOrIter::one((val).into()))
            }
            LeafType::Bool(_) => {
                if let JsonValue::Bool(val) = json_val {
                    Ok(OneOrIter::one((val).into()))
                } else {
                    Err(format!("expected boolean, got `{json_val}`"))
                }
            }
            LeafType::IpAddr(_) => Err("unsupported concat type: IpAddr".to_string()),
            LeafType::DateTime(_date_time_options) => {
                Err("unsupported concat type: DateTime".to_string())
            }
            LeafType::Bytes(_binary_options) => Err("unsupported concat type: Bytes".to_string()),
            LeafType::Json(_) => {
                if let JsonValue::Object(json_obj) = json_val {
                    Ok(OneOrIter::Iter(
                        json_obj
                            .into_iter()
                            .flat_map(|(_key, val)| JsonValueIterator::new(val))
                            .flat_map(map_primitive_json_to_concatenate_value),
                    ))
                } else {
                    Err(format!("expected object, got `{json_val}`"))
                }
            }
        }
    }

    fn supported_for_concat(&self) -> bool {
        use LeafType::*;
        matches!(self, Text(_) | U64(_) | I64(_) | F64(_) | Bool(_) | Json(_))
        /*
            // Since concat is a JSON field, anything that JSON supports can be supported
            DateTime(_), // Could be supported if the date is converted to Rfc3339
            IpAddr(_),
            // won't be supported
            Bytes(_),
        */
    }
}

#[derive(Clone)]
pub(crate) struct MappingLeaf {
    field: Field,
    typ: LeafType,
    cardinality: Cardinality,
    // concatenate fields this field is part of
    concatenate: Vec<Field>,
}

impl MappingLeaf {
    fn validate_from_json(
        &self,
        json_value: &BorrowedJsonValue,
        path: &[&str],
    ) -> Result<(), DocParsingError> {
        if json_value.is_null() {
            // We just ignore `null`.
            return Ok(());
        }
        if let BorrowedJsonValue::Array(els) = json_value {
            if self.cardinality == Cardinality::SingleValued {
                return Err(DocParsingError::MultiValuesNotSupported(path.join(".")));
            }
            for el_json_val in els {
                if el_json_val.is_null() {
                    // We just ignore `null`.
                    continue;
                }
                self.typ
                    .validate_from_json(el_json_val)
                    .map_err(|err_msg| DocParsingError::ValueError(path.join("."), err_msg))?;
            }
            return Ok(());
        }

        self.typ
            .validate_from_json(json_value)
            .map_err(|err_msg| DocParsingError::ValueError(path.join("."), err_msg))?;

        Ok(())
    }

    pub fn doc_from_json(
        &self,
        json_val: JsonValue,
        document: &mut Document,
        path: &mut [String],
    ) -> Result<(), DocParsingError> {
        if json_val.is_null() {
            // We just ignore `null`.
            return Ok(());
        }
        if let JsonValue::Array(els) = json_val {
            if self.cardinality == Cardinality::SingleValued {
                return Err(DocParsingError::MultiValuesNotSupported(path.join(".")));
            }
            for el_json_val in els {
                if el_json_val.is_null() {
                    // We just ignore `null`.
                    continue;
                }
                if !self.concatenate.is_empty() {
                    let concat_values = self
                        .typ
                        .concatenate_values_from_json(el_json_val.clone())
                        .map_err(|err_msg| DocParsingError::ValueError(path.join("."), err_msg))?;
                    for concat_value in concat_values {
                        for field in &self.concatenate {
                            document.add_field_value(*field, &concat_value);
                        }
                    }
                }
                let value = self
                    .typ
                    .value_from_json(el_json_val)
                    .map_err(|err_msg| DocParsingError::ValueError(path.join("."), err_msg))?;
                document.add_field_value(self.field, &value);
            }
            return Ok(());
        }

        if !self.concatenate.is_empty() {
            let concat_values = self
                .typ
                .concatenate_values_from_json(json_val.clone())
                .map_err(|err_msg| DocParsingError::ValueError(path.join("."), err_msg))?;
            for concat_value in concat_values {
                for field in &self.concatenate {
                    document.add_field_value(*field, &concat_value);
                }
            }
        }
        let value = self
            .typ
            .value_from_json(json_val)
            .map_err(|err_msg| DocParsingError::ValueError(path.join("."), err_msg))?;
        document.add_field_value(self.field, &value);
        Ok(())
    }

    fn populate_json<'a>(
        &'a self,
        named_doc: &mut BTreeMap<String, Vec<TantivyValue>>,
        field_path: &[&'a str],
        doc_json: &mut serde_json::Map<String, JsonValue>,
    ) {
        if let Some(json_val) =
            extract_json_val(self.get_type(), named_doc, field_path, self.cardinality)
        {
            insert_json_val(field_path, json_val, doc_json);
        }
    }

    pub fn get_type(&self) -> &LeafType {
        &self.typ
    }
}

fn extract_json_val(
    leaf_type: &LeafType,
    named_doc: &mut BTreeMap<String, Vec<TantivyValue>>,
    field_path: &[&str],
    cardinality: Cardinality,
) -> Option<JsonValue> {
    let mut full_path = field_path.join(".");
    let vals: Vec<TantivyValue> = if let Some(vals) = named_doc.remove(&full_path) {
        // we have our value directly
        vals
    } else {
        let mut end_range = full_path.clone();
        full_path.push('.');
        // '/' is the character directly after . lexicographically
        end_range.push('/');

        // TODO use BTreeMap::drain once it exists and is stable
        let matches = named_doc
            .range::<String, _>(&full_path..&end_range)
            .map(|(k, _)| k.clone())
            .collect::<Vec<_>>();

        if !matches.is_empty() {
            let mut map = Vec::new();
            for match_ in matches {
                let Some(suffix) = match_.strip_prefix(&full_path) else {
                    // this should never happen
                    continue;
                };
                let Some(tantivy_values) = named_doc.remove(&match_) else {
                    continue;
                };

                add_key_to_vec_map(&mut map, suffix, tantivy_values);
            }
            vec![TantivyValue::Object(map)]
        } else {
            // we didn't find our value, or any child of it, but maybe what we search is actually a
            // json field closer to the root?
            let mut split_point_iter = (1..(field_path.len())).rev();
            loop {
                let split_point = split_point_iter.next()?;
                let (doc_path, json_path) = field_path.split_at(split_point);
                let prefix_path = doc_path.join(".");
                if let Some(vals) = named_doc.get_mut(&prefix_path) {
                    // if we found a possible json field, there is no point in searching higher, our
                    // result would have been in it.
                    break extract_val_from_tantivy_val(json_path, vals);
                }
            }
        }
    };
    let mut vals_with_correct_type_it = vals
        .into_iter()
        .flat_map(|value| formatted_tantivy_value_to_json(value, leaf_type));
    match cardinality {
        Cardinality::SingleValued => vals_with_correct_type_it.next(),
        Cardinality::MultiValued => Some(JsonValue::Array(vals_with_correct_type_it.collect())),
    }
}

/// extract a subfield from a TantivyValue. The path must be non-empty
fn extract_val_from_tantivy_val(
    full_path: &[&str],
    tantivy_values: &mut [TantivyValue],
) -> Vec<TantivyValue> {
    // return *objects* matching path
    fn extract_val_aux<'a>(
        path: &[&str],
        tantivy_values: &'a mut [TantivyValue],
    ) -> Vec<&'a mut Vec<(String, TantivyValue)>> {
        let mut maps: Vec<&'a mut Vec<(String, TantivyValue)>> = tantivy_values
            .iter_mut()
            .filter_map(|value| {
                if let TantivyValue::Object(map) = value {
                    Some(map)
                } else {
                    None
                }
            })
            .collect();
        let mut scratch_buffer = Vec::new();
        for path_segment in path {
            scratch_buffer.extend(
                maps.drain(..)
                    .flatten()
                    .filter(|(key, _)| key == path_segment)
                    .filter_map(|(_, value)| {
                        if let TantivyValue::Object(map) = value {
                            Some(map)
                        } else {
                            None
                        }
                    }),
            );
            std::mem::swap(&mut maps, &mut scratch_buffer);
        }
        maps
    }

    let Some((last_segment, path)) = full_path.split_last() else {
        return Vec::new();
    };

    let mut results = Vec::new();
    for object in extract_val_aux(path, tantivy_values) {
        // TODO use extract_if once it's stable
        let mut i = 0;
        while i < object.len() {
            if object[i].0 == *last_segment {
                let (_, val) = object.swap_remove(i);
                match val {
                    TantivyValue::Array(mut vals) => results.append(&mut vals),
                    _ => results.push(val),
                }
            } else {
                i += 1;
            }
        }
    }

    results
}

fn add_key_to_vec_map(
    mut map: &mut Vec<(String, TantivyValue)>,
    suffix: &str,
    mut tantivy_value: Vec<TantivyValue>,
) {
    let Ok(full_inner_path) = crate::routing_expression::parse_field_name(suffix) else {
        return;
    };
    let Some((last_segment, inner_path)) = full_inner_path.split_last() else {
        return;
    };
    for path_segment in inner_path {
        // there is a cleaner way with find(), but the borrow checker is unhappy for no real reason
        // thinking there are lifetime issues between two exclusive branches
        map = if let Some(pos) = map.iter().position(|(key, _)| key == path_segment) {
            if let (_, TantivyValue::Object(ref mut value)) = map[pos] {
                value
            } else {
                // there is already a key before the end of the path ?!
                return;
            }
        } else {
            map.push((path_segment.to_string(), TantivyValue::Object(Vec::new())));
            let TantivyValue::Object(ref mut new_map) = map.last_mut().unwrap().1 else {
                unreachable!();
            };
            new_map
        }
    }
    // if we are here the doc mapping was changed from obj to json. We don't really know if the
    // field of that obj was multivalued or not. As a best effort, we say it was multivalued
    // if we have !=1 value. We could always return a vec, but then *every* field would be
    // transformed into an array of itself.
    if tantivy_value.len() == 1 {
        map.push((last_segment.to_string(), tantivy_value.pop().unwrap()));
    } else {
        map.push((last_segment.to_string(), TantivyValue::Array(tantivy_value)));
    }
}

fn insert_json_val(
    field_path: &[&str], //< may not be empty
    json_val: JsonValue,
    mut doc_json: &mut serde_json::Map<String, JsonValue>,
) {
    let (last_field_name, up_to_last) = field_path.split_last().expect("Empty path is forbidden");
    for &field_name in up_to_last {
        let entry = doc_json
            .entry(field_name.to_string())
            .or_insert_with(|| JsonValue::Object(Default::default()));
        if let JsonValue::Object(child_json_obj) = entry {
            doc_json = child_json_obj;
        } else {
            return;
        }
    }
    doc_json.insert(last_field_name.to_string(), json_val);
}

pub(crate) trait NumVal: Sized + FromStr + ToString + Into<TantivyValue> {
    fn from_json_number(num: &serde_json::Number) -> Option<Self>;

    fn validate_json(json_val: &BorrowedJsonValue, coerce: bool) -> Result<(), String> {
        match json_val {
            BorrowedJsonValue::Number(num_val) => {
                let num_val = serde_json::Number::from(*num_val);
                Self::from_json_number(&num_val).ok_or_else(|| {
                    format!(
                        "expected {}, got inconvertible JSON number `{}`",
                        type_name::<Self>(),
                        num_val
                    )
                })?;
                Ok(())
            }
            BorrowedJsonValue::Str(str_val) => {
                if coerce {
                    str_val.parse::<Self>().map_err(|_| {
                        format!(
                            "failed to coerce JSON string `\"{str_val}\"` to {}",
                            type_name::<Self>()
                        )
                    })?;
                    Ok(())
                } else {
                    Err(format!(
                        "expected JSON number, got string `\"{str_val}\"`. enable coercion to {} \
                         with the `coerce` parameter in the field mapping",
                        type_name::<Self>()
                    ))
                }
            }
            _ => {
                let message = if coerce {
                    format!("expected JSON number or string, got `{json_val}`")
                } else {
                    format!("expected JSON number, got `{json_val}`")
                };
                Err(message)
            }
        }
    }

    fn from_json_to_self(json_val: &JsonValue, coerce: bool) -> Result<Self, String> {
        match json_val {
            JsonValue::Number(num_val) => Self::from_json_number(num_val).ok_or_else(|| {
                format!(
                    "expected {}, got inconvertible JSON number `{}`",
                    type_name::<Self>(),
                    num_val
                )
            }),
            JsonValue::String(str_val) => {
                if coerce {
                    str_val.parse::<Self>().map_err(|_| {
                        format!(
                            "failed to coerce JSON string `\"{str_val}\"` to {}",
                            type_name::<Self>()
                        )
                    })
                } else {
                    Err(format!(
                        "expected JSON number, got string `\"{str_val}\"`. enable coercion to {} \
                         with the `coerce` parameter in the field mapping",
                        type_name::<Self>()
                    ))
                }
            }
            _ => {
                let message = if coerce {
                    format!("expected JSON number or string, got `{json_val}`")
                } else {
                    format!("expected JSON number, got `{json_val}`")
                };
                Err(message)
            }
        }
    }

    fn from_json(json_val: JsonValue, coerce: bool) -> Result<TantivyValue, String> {
        Self::from_json_to_self(&json_val, coerce).map(Self::into)
    }
}

impl NumVal for u64 {
    fn from_json_number(num: &serde_json::Number) -> Option<Self> {
        num.as_u64()
    }
}

impl NumVal for i64 {
    fn from_json_number(num: &serde_json::Number) -> Option<Self> {
        num.as_i64()
    }
}
impl NumVal for f64 {
    fn from_json_number(num: &serde_json::Number) -> Option<Self> {
        num.as_f64()
    }
}

#[derive(Clone, Default)]
pub(crate) struct MappingNode {
    pub branches: fnv::FnvHashMap<String, MappingTree>,
    branches_order: Vec<String>,
}

fn get_or_insert_path<'a>(
    path: &[String],
    mut dynamic_json_obj: &'a mut serde_json::Map<String, JsonValue>,
) -> &'a mut serde_json::Map<String, JsonValue> {
    for field_name in path {
        let child_json_val = dynamic_json_obj
            .entry(field_name.clone())
            .or_insert_with(|| JsonValue::Object(Default::default()));
        dynamic_json_obj = if let JsonValue::Object(child_map) = child_json_val {
            child_map
        } else {
            panic!("Expected Json object.");
        };
    }
    dynamic_json_obj
}

impl MappingNode {
    /// Finds the field mapping type for a given field path in the mapping tree.
    /// Dots in `field_path_as_str` define the boundaries between field names.
    /// If a dot is part of a field name, it must be escaped with '\'.
    pub fn find_field_mapping_type(&self, field_path_as_str: &str) -> Option<FieldMappingType> {
        let field_path = build_field_path_from_str(field_path_as_str);
        self.internal_find_field_mapping_type(&field_path)
    }

    fn internal_find_field_mapping_type(&self, field_path: &[String]) -> Option<FieldMappingType> {
        let (first_path_fragment, sub_field_path) = field_path.split_first()?;
        let child_tree = self.branches.get(first_path_fragment)?;
        match (child_tree, sub_field_path.is_empty()) {
            (_, true) => Some(child_tree.clone().into()),
            (MappingTree::Leaf(_), false) => None,
            (MappingTree::Node(child_node), false) => {
                child_node.internal_find_field_mapping_type(sub_field_path)
            }
        }
    }

    /// Finds the field mapping type for a given field path in the mapping tree.
    /// Dots in `field_path_as_str` define the boundaries between field names.
    /// If a dot is part of a field name, it must be escaped with '\'.
    pub fn find_field_mapping_leaf<'a>(
        &'a mut self,
        field_path_as_str: &str,
    ) -> Option<impl Iterator<Item = &'a mut MappingLeaf> + use<'a>> {
        let field_path = build_field_path_from_str(field_path_as_str);
        self.internal_find_field_mapping_leaf(&field_path)
    }

    fn internal_find_field_mapping_leaf<'a>(
        &'a mut self,
        field_path: &[String],
    ) -> Option<impl Iterator<Item = &'a mut MappingLeaf> + use<'a>> {
        let (first_path_fragment, sub_field_path) = field_path.split_first()?;
        let child_tree = self.branches.get_mut(first_path_fragment)?;
        match (child_tree, sub_field_path.is_empty()) {
            (MappingTree::Leaf(_), false) => None,
            (MappingTree::Node(child_node), false) => {
                child_node.internal_find_field_mapping_leaf(sub_field_path)
            }
            (MappingTree::Leaf(leaf), true) => Some([leaf].into_iter()),
            (MappingTree::Node(_), true) => None,
        }
    }

    #[cfg(test)]
    pub fn num_fields(&self) -> usize {
        self.branches.len()
    }

    pub fn insert(&mut self, path: &str, node: MappingTree) {
        self.branches_order.push(path.to_string());
        self.branches.insert(path.to_string(), node);
    }

    pub fn ordered_field_mapping_entries(&self) -> Vec<FieldMappingEntry> {
        assert_eq!(self.branches.len(), self.branches_order.len());
        let mut field_mapping_entries = Vec::new();
        for field_name in &self.branches_order {
            let child_tree = self.branches.get(field_name).expect("Missing field");
            let field_mapping_entry = FieldMappingEntry {
                name: field_name.clone(),
                mapping_type: child_tree.clone().into(),
            };
            field_mapping_entries.push(field_mapping_entry);
        }
        field_mapping_entries
    }

    pub fn validate_from_json<'a>(
        &self,
        json_obj: &'a BorrowedJsonMap,
        strict_mode: bool,
        path: &mut Vec<&'a str>,
    ) -> Result<(), DocParsingError> {
        for (field_name, json_val) in json_obj.iter() {
            if let Some(child_tree) = self.branches.get(field_name) {
                path.push(field_name);
                child_tree.validate_from_json(json_val, path, strict_mode)?;
                path.pop();
            } else if strict_mode {
                path.push(field_name);
                let field_path = path.join(".");
                return Err(DocParsingError::NoSuchFieldInSchema(field_path));
            }
        }
        Ok(())
    }

    pub fn doc_from_json(
        &self,
        json_obj: serde_json::Map<String, JsonValue>,
        mode: ModeType,
        document: &mut Document,
        path: &mut Vec<String>,
        dynamic_json_obj: &mut serde_json::Map<String, JsonValue>,
    ) -> Result<(), DocParsingError> {
        for (field_name, val) in json_obj {
            if let Some(child_tree) = self.branches.get(&field_name) {
                path.push(field_name);
                child_tree.doc_from_json(val, mode, document, path, dynamic_json_obj)?;
                path.pop();
            } else {
                match mode {
                    ModeType::Lenient => {
                        // In lenient mode we simply ignore these unmapped fields.
                    }
                    ModeType::Dynamic => {
                        let dynamic_json_obj_after_path =
                            get_or_insert_path(path, dynamic_json_obj);
                        dynamic_json_obj_after_path.insert(field_name, val);
                    }
                    ModeType::Strict => {
                        path.push(field_name);
                        let field_path = path.join(".");
                        return Err(DocParsingError::NoSuchFieldInSchema(field_path));
                    }
                }
            }
        }
        Ok(())
    }

    pub fn populate_json<'a>(
        &'a self,
        named_doc: &mut BTreeMap<String, Vec<TantivyValue>>,
        field_path: &mut Vec<&'a str>,
        doc_json: &mut serde_json::Map<String, JsonValue>,
    ) {
        for (field_name, field_mapping) in &self.branches {
            field_path.push(field_name);
            field_mapping.populate_json(named_doc, field_path, doc_json);
            field_path.pop();
        }
    }
}

impl From<MappingTree> for FieldMappingType {
    fn from(mapping_tree: MappingTree) -> Self {
        match mapping_tree {
            MappingTree::Leaf(leaf) => leaf.into(),
            MappingTree::Node(node) => FieldMappingType::Object(QuickwitObjectOptions {
                field_mappings: node.into(),
            }),
        }
    }
}

impl From<MappingLeaf> for FieldMappingType {
    fn from(leaf: MappingLeaf) -> Self {
        match leaf.typ {
            LeafType::Text(opt) => FieldMappingType::Text(opt, leaf.cardinality),
            LeafType::I64(opt) => FieldMappingType::I64(opt, leaf.cardinality),
            LeafType::U64(opt) => FieldMappingType::U64(opt, leaf.cardinality),
            LeafType::F64(opt) => FieldMappingType::F64(opt, leaf.cardinality),
            LeafType::Bool(opt) => FieldMappingType::Bool(opt, leaf.cardinality),
            LeafType::IpAddr(opt) => FieldMappingType::IpAddr(opt, leaf.cardinality),
            LeafType::DateTime(opt) => FieldMappingType::DateTime(opt, leaf.cardinality),
            LeafType::Bytes(opt) => FieldMappingType::Bytes(opt, leaf.cardinality),
            LeafType::Json(opt) => FieldMappingType::Json(opt, leaf.cardinality),
        }
    }
}

impl From<MappingNode> for Vec<FieldMappingEntry> {
    fn from(node: MappingNode) -> Self {
        node.ordered_field_mapping_entries()
    }
}

#[derive(Clone)]
pub(crate) enum MappingTree {
    Leaf(MappingLeaf),
    Node(MappingNode),
}

impl MappingTree {
    fn validate_from_json<'a>(
        &self,
        json_value: &'a BorrowedJsonValue<'a>,
        field_path: &mut Vec<&'a str>,
        strict_mode: bool,
    ) -> Result<(), DocParsingError> {
        match self {
            MappingTree::Leaf(mapping_leaf) => {
                mapping_leaf.validate_from_json(json_value, field_path)
            }
            MappingTree::Node(mapping_node) => {
                if let Some(json_obj) = json_value.as_object() {
                    mapping_node.validate_from_json(json_obj, strict_mode, field_path)
                } else {
                    Err(DocParsingError::ValueError(
                        field_path.join("."),
                        format!("expected an JSON object, got {json_value}"),
                    ))
                }
            }
        }
    }

    fn doc_from_json(
        &self,
        json_value: JsonValue,
        mode: ModeType,
        document: &mut Document,
        path: &mut Vec<String>,
        dynamic_json_obj: &mut serde_json::Map<String, JsonValue>,
    ) -> Result<(), DocParsingError> {
        match self {
            MappingTree::Leaf(mapping_leaf) => {
                mapping_leaf.doc_from_json(json_value, document, path)
            }
            MappingTree::Node(mapping_node) => {
                if let JsonValue::Object(json_obj) = json_value {
                    mapping_node.doc_from_json(json_obj, mode, document, path, dynamic_json_obj)
                } else {
                    Err(DocParsingError::ValueError(
                        path.join("."),
                        format!("expected an JSON object, got {json_value}"),
                    ))
                }
            }
        }
    }

    fn populate_json<'a>(
        &'a self,
        named_doc: &mut BTreeMap<String, Vec<TantivyValue>>,
        field_path: &mut Vec<&'a str>,
        doc_json: &mut serde_json::Map<String, JsonValue>,
    ) {
        match self {
            MappingTree::Leaf(mapping_leaf) => {
                mapping_leaf.populate_json(named_doc, field_path, doc_json)
            }
            MappingTree::Node(mapping_node) => {
                mapping_node.populate_json(named_doc, field_path, doc_json);
            }
        }
    }
}

pub(crate) struct MappingNodeRoot {
    /// The root of a mapping tree
    pub field_mappings: MappingNode,
    /// The list of concatenate fields which includes the dynamic field
    pub concatenate_dynamic_fields: Vec<Field>,
}

pub(crate) fn build_mapping_tree(
    entries: &[FieldMappingEntry],
    schema: &mut SchemaBuilder,
) -> anyhow::Result<MappingNodeRoot> {
    let mut field_path = Vec::new();
    build_mapping_tree_from_entries(entries, &mut field_path, schema)
}

fn build_mapping_tree_from_entries<'a>(
    entries: &'a [FieldMappingEntry],
    field_path: &mut Vec<&'a str>,
    schema: &mut SchemaBuilder,
) -> anyhow::Result<MappingNodeRoot> {
    let mut mapping_node = MappingNode::default();
    let mut concatenate_fields = Vec::new();
    let mut concatenate_dynamic_fields = Vec::new();
    for entry in entries {
        if let FieldMappingType::Concatenate(_) = &entry.mapping_type {
            concatenate_fields.push(entry);
        } else {
            field_path.push(&entry.name);
            if mapping_node.branches.contains_key(&entry.name) {
                bail!("duplicated field definition `{}`", entry.name);
            }
            let (child_tree, mut dynamic_fields) =
                build_mapping_from_field_type(&entry.mapping_type, field_path, schema)?;
            field_path.pop();
            mapping_node.insert(&entry.name, child_tree);
            concatenate_dynamic_fields.append(&mut dynamic_fields);
        }
    }
    for concatenate_field_entry in concatenate_fields {
        let FieldMappingType::Concatenate(options) = &concatenate_field_entry.mapping_type else {
            // we only pushed Concatenate fields in `concatenate_fields`
            unreachable!();
        };
        let name = &concatenate_field_entry.name;
        if mapping_node.branches.contains_key(name) {
            bail!("duplicated field definition `{}`", name);
        }
        let text_options: JsonObjectOptions = options.clone().into();
        let field = schema.add_json_field(name, text_options);
        for sub_field in &options.concatenate_fields {
            for matched_field in
                mapping_node
                    .find_field_mapping_leaf(sub_field)
                    .ok_or_else(|| {
                        anyhow::anyhow!("concatenate field uses an unknown field `{sub_field}`")
                    })?
            {
                if !matched_field.typ.supported_for_concat() {
                    bail!(
                        "subfield `{}` not supported inside a concatenate field",
                        sub_field
                    );
                }
                matched_field.concatenate.push(field);
            }
        }
        if options.include_dynamic_fields {
            concatenate_dynamic_fields.push(field);
        }
    }
    Ok(MappingNodeRoot {
        field_mappings: mapping_node,
        concatenate_dynamic_fields,
    })
}

fn get_numeric_options_for_bool_field(
    quickwit_bool_options: &QuickwitBoolOptions,
) -> NumericOptions {
    let mut numeric_options = NumericOptions::default();
    if quickwit_bool_options.stored {
        numeric_options = numeric_options.set_stored();
    }
    if quickwit_bool_options.indexed {
        numeric_options = numeric_options.set_indexed();
    }
    if quickwit_bool_options.fast {
        numeric_options = numeric_options.set_fast();
    }
    numeric_options
}

fn get_numeric_options_for_numeric_field(
    quickwit_numeric_options: &QuickwitNumericOptions,
) -> NumericOptions {
    let mut numeric_options = NumericOptions::default();
    if quickwit_numeric_options.stored {
        numeric_options = numeric_options.set_stored();
    }
    if quickwit_numeric_options.indexed {
        numeric_options = numeric_options.set_indexed();
    }
    if quickwit_numeric_options.fast {
        numeric_options = numeric_options.set_fast();
    }
    numeric_options
}

fn get_date_time_options(quickwit_date_time_options: &QuickwitDateTimeOptions) -> DateOptions {
    let mut date_time_options = DateOptions::default();
    if quickwit_date_time_options.stored {
        date_time_options = date_time_options.set_stored();
    }
    if quickwit_date_time_options.indexed {
        date_time_options = date_time_options.set_indexed();
    }
    if quickwit_date_time_options.fast {
        date_time_options = date_time_options.set_fast();
    }
    date_time_options.set_precision(quickwit_date_time_options.fast_precision)
}

fn get_bytes_options(quickwit_numeric_options: &QuickwitBytesOptions) -> BytesOptions {
    let mut bytes_options = BytesOptions::default();
    if quickwit_numeric_options.indexed {
        bytes_options = bytes_options.set_indexed();
    }
    if quickwit_numeric_options.fast {
        bytes_options = bytes_options.set_fast();
    }
    if quickwit_numeric_options.stored {
        bytes_options = bytes_options.set_stored();
    }
    bytes_options
}

fn get_ip_address_options(quickwit_ip_address_options: &QuickwitIpAddrOptions) -> IpAddrOptions {
    let mut ip_address_options = IpAddrOptions::default();
    if quickwit_ip_address_options.stored {
        ip_address_options = ip_address_options.set_stored();
    }
    if quickwit_ip_address_options.indexed {
        ip_address_options = ip_address_options.set_indexed();
    }
    if quickwit_ip_address_options.fast {
        ip_address_options = ip_address_options.set_fast();
    }
    ip_address_options
}

/// Creates a tantivy field name for a given field path.
///
/// By field path, we mean the list of `field_name` that are crossed
/// to reach the field starting from the root of the document.
/// There can be more than one due to quickwit object type.
///
/// We simply concatenate these field names, interleaving them with '.'.
/// If a fieldname itself contains a '.', we escape it with '\'.
/// ('\' itself is forbidden).
fn field_name_for_field_path(field_path: &[&str]) -> String {
    field_path.iter().cloned().map(escape_dots).join(".")
}

/// Builds the sequence of field names crossed to reach the field
/// starting from the root of the document.
/// Dots '.' define the boundaries between field names.
/// If a dot is part of a field name, it must be escaped with '\'.
pub(crate) fn build_field_path_from_str(field_path_as_str: &str) -> Vec<String> {
    let mut field_path = Vec::new();
    let mut current_path_fragment = String::new();
    let mut escaped = false;
    for char in field_path_as_str.chars() {
        if escaped {
            current_path_fragment.push(char);
            escaped = false;
        } else if char == '\\' {
            escaped = true;
        } else if char == '.' {
            let path_fragment = std::mem::take(&mut current_path_fragment);
            field_path.push(path_fragment);
        } else {
            current_path_fragment.push(char);
        }
    }
    if !current_path_fragment.is_empty() {
        field_path.push(current_path_fragment);
    }
    field_path
}

fn escape_dots(field_name: &str) -> String {
    let mut escaped_field_name = String::new();
    for chr in field_name.chars() {
        if chr == '.' {
            escaped_field_name.push('\\');
        }
        escaped_field_name.push(chr);
    }
    escaped_field_name
}

/// build a sub-mapping tree from the fields it contains.
///
/// also returns the list of concatenate fields which consume the dynamic field
fn build_mapping_from_field_type<'a>(
    field_mapping_type: &'a FieldMappingType,
    field_path: &mut Vec<&'a str>,
    schema_builder: &mut SchemaBuilder,
) -> anyhow::Result<(MappingTree, Vec<Field>)> {
    let field_name = field_name_for_field_path(field_path);
    match field_mapping_type {
        FieldMappingType::Text(options, cardinality) => {
            let text_options: TextOptions = options.clone().into();
            let field = schema_builder.add_text_field(&field_name, text_options);
            let mapping_leaf = MappingLeaf {
                field,
                typ: LeafType::Text(options.clone()),
                cardinality: *cardinality,
                concatenate: Vec::new(),
            };
            Ok((MappingTree::Leaf(mapping_leaf), Vec::new()))
        }
        FieldMappingType::I64(options, cardinality) => {
            let numeric_options = get_numeric_options_for_numeric_field(options);
            let field = schema_builder.add_i64_field(&field_name, numeric_options);
            let mapping_leaf = MappingLeaf {
                field,
                typ: LeafType::I64(options.clone()),
                cardinality: *cardinality,
                concatenate: Vec::new(),
            };
            Ok((MappingTree::Leaf(mapping_leaf), Vec::new()))
        }
        FieldMappingType::U64(options, cardinality) => {
            let numeric_options = get_numeric_options_for_numeric_field(options);
            let field = schema_builder.add_u64_field(&field_name, numeric_options);
            let mapping_leaf = MappingLeaf {
                field,
                typ: LeafType::U64(options.clone()),
                cardinality: *cardinality,
                concatenate: Vec::new(),
            };
            Ok((MappingTree::Leaf(mapping_leaf), Vec::new()))
        }
        FieldMappingType::F64(options, cardinality) => {
            let numeric_options = get_numeric_options_for_numeric_field(options);
            let field = schema_builder.add_f64_field(&field_name, numeric_options);
            let mapping_leaf = MappingLeaf {
                field,
                typ: LeafType::F64(options.clone()),
                cardinality: *cardinality,
                concatenate: Vec::new(),
            };
            Ok((MappingTree::Leaf(mapping_leaf), Vec::new()))
        }
        FieldMappingType::Bool(options, cardinality) => {
            let numeric_options = get_numeric_options_for_bool_field(options);
            let field = schema_builder.add_bool_field(&field_name, numeric_options);
            let mapping_leaf = MappingLeaf {
                field,
                typ: LeafType::Bool(options.clone()),
                cardinality: *cardinality,
                concatenate: Vec::new(),
            };
            Ok((MappingTree::Leaf(mapping_leaf), Vec::new()))
        }
        FieldMappingType::IpAddr(options, cardinality) => {
            let ip_addr_options = get_ip_address_options(options);
            let field = schema_builder.add_ip_addr_field(&field_name, ip_addr_options);
            let mapping_leaf = MappingLeaf {
                field,
                typ: LeafType::IpAddr(options.clone()),
                cardinality: *cardinality,
                concatenate: Vec::new(),
            };
            Ok((MappingTree::Leaf(mapping_leaf), Vec::new()))
        }
        FieldMappingType::DateTime(options, cardinality) => {
            let date_time_options = get_date_time_options(options);
            let field = schema_builder.add_date_field(&field_name, date_time_options);
            let mapping_leaf = MappingLeaf {
                field,
                typ: LeafType::DateTime(options.clone()),
                cardinality: *cardinality,
                concatenate: Vec::new(),
            };
            Ok((MappingTree::Leaf(mapping_leaf), Vec::new()))
        }
        FieldMappingType::Bytes(options, cardinality) => {
            let bytes_options = get_bytes_options(options);
            let field = schema_builder.add_bytes_field(&field_name, bytes_options);
            let mapping_leaf = MappingLeaf {
                field,
                typ: LeafType::Bytes(options.clone()),
                cardinality: *cardinality,
                concatenate: Vec::new(),
            };
            Ok((MappingTree::Leaf(mapping_leaf), Vec::new()))
        }
        FieldMappingType::Json(options, cardinality) => {
            let json_options = JsonObjectOptions::from(options.clone());
            let field = schema_builder.add_json_field(&field_name, json_options);
            let mapping_leaf = MappingLeaf {
                field,
                typ: LeafType::Json(options.clone()),
                cardinality: *cardinality,
                concatenate: Vec::new(),
            };
            Ok((MappingTree::Leaf(mapping_leaf), Vec::new()))
        }
        FieldMappingType::Object(entries) => {
            let MappingNodeRoot {
                field_mappings,
                concatenate_dynamic_fields,
            } = build_mapping_tree_from_entries(
                &entries.field_mappings,
                field_path,
                schema_builder,
            )?;
            Ok((
                MappingTree::Node(field_mappings),
                concatenate_dynamic_fields,
            ))
        }
        FieldMappingType::Concatenate(_) => {
            bail!("Concatenate shouldn't reach build_mapping_from_field_type: this is a bug")
        }
    }
}

#[cfg(test)]
mod tests {
    use std::net::IpAddr;

    use serde_json::{Value as JsonValue, json};
    use tantivy::schema::{Field, IntoIpv6Addr, OwnedValue as TantivyValue, Value};
    use tantivy::{DateTime, TantivyDocument as Document};
    use time::OffsetDateTime;
    use time::macros::datetime;

    use super::{
        JsonValueIterator, LeafType, MapOrArrayIter, MappingLeaf, add_key_to_vec_map,
        extract_val_from_tantivy_val,
    };
    use crate::Cardinality;
    use crate::doc_mapper::date_time_type::QuickwitDateTimeOptions;
    use crate::doc_mapper::field_mapping_entry::{
        BinaryFormat, QuickwitBoolOptions, QuickwitBytesOptions, QuickwitIpAddrOptions,
        QuickwitNumericOptions, QuickwitTextOptions,
    };

    #[test]
    fn test_field_name_from_field_path() {
        // not really a possibility, but still, let's test it.
        assert_eq!(super::field_name_for_field_path(&[]), "");
        assert_eq!(super::field_name_for_field_path(&["hello"]), "hello");
        assert_eq!(
            super::field_name_for_field_path(&["one", "two", "three"]),
            "one.two.three"
        );
        assert_eq!(
            super::field_name_for_field_path(&["one", "two", "three"]),
            "one.two.three"
        );
        assert_eq!(super::field_name_for_field_path(&["one.two"]), r"one\.two");
        assert_eq!(
            super::field_name_for_field_path(&["one.two", "three"]),
            r"one\.two.three"
        );
    }

    #[test]
    fn test_get_or_insert_path() {
        let mut map = Default::default();
        super::get_or_insert_path(&["a".to_string(), "b".to_string()], &mut map)
            .insert("c".to_string(), JsonValue::from(3u64));
        assert_eq!(
            &serde_json::to_value(&map).unwrap(),
            &serde_json::json!({
                "a": {
                    "b": {
                        "c": 3u64
                    }
                }
            })
        );
        super::get_or_insert_path(&["a".to_string(), "b".to_string()], &mut map)
            .insert("d".to_string(), JsonValue::from(2u64));
        assert_eq!(
            &serde_json::to_value(&map).unwrap(),
            &serde_json::json!({
                "a": {
                    "b": {
                        "c": 3u64,
                        "d": 2u64
                    }
                }
            })
        );
        super::get_or_insert_path(&["e".to_string()], &mut map)
            .insert("f".to_string(), JsonValue::from(5u64));
        assert_eq!(
            &serde_json::to_value(&map).unwrap(),
            &serde_json::json!({
                "a": {
                    "b": {
                        "c": 3u64,
                        "d": 2u64
                    }
                },
                "e": { "f": 5u64 }
            })
        );
        super::get_or_insert_path(&[], &mut map).insert("g".to_string(), JsonValue::from(6u64));
        assert_eq!(
            &serde_json::to_value(&map).unwrap(),
            &serde_json::json!({
                "a": {
                    "b": {
                        "c": 3u64,
                        "d": 2u64
                    }
                },
                "e": { "f": 5u64 },
                "g": 6u64
            })
        );
    }

    #[test]
    fn test_parse_u64_mapping() {
        let leaf = LeafType::U64(QuickwitNumericOptions::default());
        assert_eq!(
            leaf.value_from_json(json!(20i64)).unwrap(),
            TantivyValue::U64(20u64)
        );
    }

    #[test]
    fn test_parse_u64_coercion() {
        let leaf = LeafType::U64(QuickwitNumericOptions::default());
        assert_eq!(
            leaf.value_from_json(json!("20")).unwrap(),
            TantivyValue::U64(20u64)
        );
        assert_eq!(
            leaf.value_from_json(json!("foo")).unwrap_err(),
            "failed to coerce JSON string `\"foo\"` to u64"
        );

        let numeric_options = QuickwitNumericOptions {
            coerce: false,
            ..Default::default()
        };
        let leaf = LeafType::U64(numeric_options);
        assert_eq!(
            leaf.value_from_json(json!("20")).unwrap_err(),
            "expected JSON number, got string `\"20\"`. enable coercion to u64 with the `coerce` \
             parameter in the field mapping"
        );
    }

    #[test]
    fn test_parse_u64_negative_should_error() {
        let leaf = LeafType::U64(QuickwitNumericOptions::default());
        assert_eq!(
            leaf.value_from_json(json!(-20i64)).unwrap_err(),
            "expected u64, got inconvertible JSON number `-20`"
        );
    }

    #[test]
    fn test_parse_i64_mapping() {
        let leaf = LeafType::I64(QuickwitNumericOptions::default());
        assert_eq!(
            leaf.value_from_json(json!(20u64)).unwrap(),
            TantivyValue::I64(20i64)
        );
    }

    #[test]
    fn test_parse_i64_from_f64_should_error() {
        let leaf = LeafType::I64(QuickwitNumericOptions::default());
        assert_eq!(
            leaf.value_from_json(json!(20.2f64)).unwrap_err(),
            "expected i64, got inconvertible JSON number `20.2`"
        );
    }

    #[test]
    fn test_parse_i64_too_large() {
        let leaf = LeafType::I64(QuickwitNumericOptions::default());
        let err = leaf.value_from_json(json!(u64::MAX)).err().unwrap();
        assert_eq!(
            err,
            "expected i64, got inconvertible JSON number `18446744073709551615`"
        );
    }

    #[test]
    fn test_parse_f64_from_u64() {
        let leaf = LeafType::F64(QuickwitNumericOptions::default());
        assert_eq!(
            leaf.value_from_json(json!(4_000u64)).unwrap(),
            TantivyValue::F64(4_000f64)
        );
    }

    #[test]
    fn test_parse_bool_mapping() {
        let leaf = LeafType::Bool(QuickwitBoolOptions::default());
        assert_eq!(
            leaf.value_from_json(json!(true)).unwrap(),
            TantivyValue::Bool(true)
        );
    }

    #[test]
    fn test_parse_bool_multivalued() {
        let typ = LeafType::Bool(QuickwitBoolOptions::default());
        let field = Field::from_field_id(10);
        let leaf_entry = MappingLeaf {
            field,
            typ,
            cardinality: Cardinality::MultiValued,
            concatenate: Vec::new(),
        };
        let mut document = Document::default();
        let mut path = Vec::new();
        leaf_entry
            .doc_from_json(json!([true, false, true]), &mut document, &mut path)
            .unwrap();
        assert_eq!(document.len(), 3);
        let values: Vec<bool> = document
            .get_all(field)
            .flat_map(|val| val.as_bool())
            .collect();
        assert_eq!(&values, &[true, false, true])
    }

    #[test]
    fn test_parse_ip_addr_from_str() {
        let leaf = LeafType::IpAddr(QuickwitIpAddrOptions::default());
        let ips = vec![
            "127.0.0.0",
            "2605:2700:0:3::4713:93e3",
            "::afff:4567:890a",
            "10.10.12.123",
            "192.168.0.1",
            "2001:db8::1:0:0:1",
        ];
        for ip_str in ips {
            let parsed_ip_addr = leaf.value_from_json(json!(ip_str)).unwrap();
            let expected_ip_addr =
                TantivyValue::IpAddr(ip_str.parse::<IpAddr>().unwrap().into_ipv6_addr());
            assert_eq!(parsed_ip_addr, expected_ip_addr);
        }
    }

    #[test]
    fn test_parse_ip_addr_should_error() {
        let typ = LeafType::IpAddr(QuickwitIpAddrOptions::default());
        let err = typ.value_from_json(json!("foo")).err().unwrap();
        assert!(err.contains("failed to parse IP address `foo`"));

        let err = typ.value_from_json(json!(1200)).err().unwrap();
        assert!(err.contains("expected string, got `1200`"));
    }

    #[test]
    fn test_parse_i64_mutivalued() {
        let typ = LeafType::I64(QuickwitNumericOptions::default());
        let field = Field::from_field_id(10);
        let leaf_entry = MappingLeaf {
            field,
            typ,
            cardinality: Cardinality::MultiValued,
            concatenate: Vec::new(),
        };
        let mut document = Document::default();
        let mut path = Vec::new();
        leaf_entry
            .doc_from_json(serde_json::json!([10u64, 20u64]), &mut document, &mut path)
            .unwrap();
        assert_eq!(document.len(), 2);
        let values: Vec<i64> = document
            .get_all(field)
            .flat_map(|val| val.as_i64())
            .collect();
        assert_eq!(&values, &[10i64, 20i64]);
    }

    #[test]
    fn test_parse_null_is_just_ignored() {
        let typ = LeafType::I64(QuickwitNumericOptions::default());
        let field = Field::from_field_id(10);
        let leaf_entry = MappingLeaf {
            field,
            typ,
            cardinality: Cardinality::MultiValued,
            concatenate: Vec::new(),
        };
        let mut document = Document::default();
        let mut path = Vec::new();
        leaf_entry
            .doc_from_json(serde_json::json!(null), &mut document, &mut path)
            .unwrap();
        assert_eq!(document.len(), 0);
    }

    #[test]
    fn test_parse_i64_mutivalued_accepts_scalar() {
        let typ = LeafType::I64(QuickwitNumericOptions::default());
        let field = Field::from_field_id(10);
        let leaf_entry = MappingLeaf {
            field,
            typ,
            cardinality: Cardinality::MultiValued,
            concatenate: Vec::new(),
        };
        let mut document = Document::default();
        let mut path = Vec::new();
        leaf_entry
            .doc_from_json(serde_json::json!(10u64), &mut document, &mut path)
            .unwrap();
        assert_eq!(document.len(), 1);
        assert_eq!(document.get_first(field).unwrap().as_i64().unwrap(), 10i64);
    }

    #[test]
    fn test_parse_u64_mutivalued_nested_array_forbidden() {
        let typ = LeafType::I64(QuickwitNumericOptions::default());
        let field = Field::from_field_id(10);
        let leaf_entry = MappingLeaf {
            field,
            typ,
            cardinality: Cardinality::MultiValued,
            concatenate: Vec::new(),
        };
        let mut document = Document::default();
        let mut path = vec!["root".to_string(), "my_field".to_string()];
        let parse_err = leaf_entry
            .doc_from_json(
                serde_json::json!([10u64, [1u64, 2u64]]),
                &mut document,
                &mut path,
            )
            .unwrap_err();
        assert_eq!(
            parse_err.to_string(),
            "the field `root.my_field` could not be parsed: expected JSON number or string, got \
             `[1,2]`"
        );
    }

    #[test]
    fn test_parse_text() {
        let typ = LeafType::Text(QuickwitTextOptions::default());
        let parsed_value = typ.value_from_json(json!("bacon and eggs")).unwrap();
        assert_eq!(
            parsed_value,
            TantivyValue::Str("bacon and eggs".to_string())
        );
    }

    #[test]
    fn test_parse_text_number_should_error() {
        let typ = LeafType::Text(QuickwitTextOptions::default());
        let err = typ.value_from_json(json!(2u64)).err().unwrap();
        assert_eq!(err, "expected string, got `2`");
    }

    #[test]
    fn test_parse_date_time_str() {
        let typ = LeafType::DateTime(QuickwitDateTimeOptions::default());
        let value = typ
            .value_from_json(json!("2021-12-19T16:39:57-01:00"))
            .unwrap();
        let date_time = datetime!(2021-12-19 17:39:57 UTC);
        assert_eq!(value, TantivyValue::Date(DateTime::from_utc(date_time)));
    }

    #[test]
    fn test_parse_timestamp_float() {
        let typ = LeafType::DateTime(QuickwitDateTimeOptions::default());
        let unix_ts_secs = OffsetDateTime::now_utc().unix_timestamp();
        let value = typ
            .value_from_json(json!(unix_ts_secs as f64 + 0.1))
            .unwrap();
        let date_time = match value {
            TantivyValue::Date(date_time) => date_time,
            other => panic!("Expected a tantivy date time, got `{other:?}`."),
        };
        assert!((date_time.into_timestamp_millis() - (unix_ts_secs * 1_000 + 100)).abs() <= 1);
    }

    #[test]
    fn test_parse_timestamp_int() {
        let typ = LeafType::DateTime(QuickwitDateTimeOptions::default());
        let unix_ts_secs = OffsetDateTime::now_utc().unix_timestamp();
        let value = typ.value_from_json(json!(unix_ts_secs)).unwrap();
        assert_eq!(
            value,
            TantivyValue::Date(DateTime::from_timestamp_secs(unix_ts_secs))
        );
    }

    #[test]
    fn test_parse_date_number_should_error() {
        let typ = LeafType::DateTime(QuickwitDateTimeOptions::default());
        let err = typ.value_from_json(json!("foo-datetime")).unwrap_err();
        assert_eq!(
            err,
            "failed to parse datetime `foo-datetime` using the following formats: `rfc3339`, \
             `unix_timestamp`"
        );
    }

    #[test]
    fn test_parse_date_array_should_error() {
        let typ = LeafType::DateTime(QuickwitDateTimeOptions::default());
        let err = typ.value_from_json(json!(["foo", "bar"])).err().unwrap();
        assert_eq!(
            err,
            "failed to parse datetime: expected a float, integer, or string, got \
             `[\"foo\",\"bar\"]`"
        );
    }

    #[test]
    fn test_parse_bytes() {
        let typ = LeafType::Bytes(QuickwitBytesOptions::default());
        let value = typ
            .value_from_json(json!("dGhpcyBpcyBhIGJhc2U2NCBlbmNvZGVkIHN0cmluZw=="))
            .unwrap();
        assert_eq!(
            (&value).as_bytes().unwrap(),
            b"this is a base64 encoded string"
        );
    }

    #[test]
    fn test_parse_bytes_hex() {
        let typ = LeafType::Bytes(QuickwitBytesOptions {
            input_format: BinaryFormat::Hex,
            ..QuickwitBytesOptions::default()
        });
        let value = typ
            .value_from_json(json!(
                "7468697320697320612068657820656e636f64656420737472696e67"
            ))
            .unwrap();
        assert_eq!(
            (&value).as_bytes().unwrap(),
            b"this is a hex encoded string"
        );
    }

    #[test]
    fn test_parse_bytes_number_should_err() {
        let typ = LeafType::Bytes(QuickwitBytesOptions::default());
        let error = typ.value_from_json(json!(2u64)).err().unwrap();
        assert_eq!(error, "expected base64 string, got `2`");
    }

    #[test]
    fn test_parse_bytes_invalid_base64() {
        let typ = LeafType::Bytes(QuickwitBytesOptions::default());
        let error = typ.value_from_json(json!("dEwerwer#!%")).err().unwrap();
        assert_eq!(
            error,
            "expected base64 string, got `dEwerwer#!%`: Invalid symbol 35, offset 8."
        );
    }

    #[test]
    fn test_parse_array_of_bytes() {
        let typ = LeafType::Bytes(QuickwitBytesOptions::default());
        let field = Field::from_field_id(10);
        let leaf_entry = MappingLeaf {
            field,
            typ,
            cardinality: Cardinality::MultiValued,
            concatenate: Vec::new(),
        };
        let mut document = Document::default();
        let mut path = vec!["root".to_string(), "my_field".to_string()];
        leaf_entry
            .doc_from_json(
                serde_json::json!([
                    "dGhpcyBpcyBhIGJhc2U2NCBlbmNvZGVkIHN0cmluZw==",
                    "dGhpcyBpcyBhIGJhc2U2NCBlbmNvZGVkIHN0cmluZw=="
                ]),
                &mut document,
                &mut path,
            )
            .unwrap();
        assert_eq!(document.len(), 2);
        let bytes_vec: Vec<&[u8]> = document
            .get_all(field)
            .flat_map(|val| val.as_bytes())
            .collect();
        assert_eq!(
            &bytes_vec[..],
            &[
                b"this is a base64 encoded string",
                b"this is a base64 encoded string"
            ]
        )
    }

    #[test]
    fn test_field_path_for_field_name() {
        assert_eq!(super::build_field_path_from_str(""), Vec::<String>::new());
        assert_eq!(super::build_field_path_from_str("hello"), vec!["hello"]);
        assert_eq!(
            super::build_field_path_from_str("one.two.three"),
            vec!["one", "two", "three"]
        );
        assert_eq!(
            super::build_field_path_from_str(r"one\.two"),
            vec!["one.two"]
        );
        assert_eq!(
            super::build_field_path_from_str(r"one\.two.three"),
            vec!["one.two", "three"]
        );
        assert_eq!(super::build_field_path_from_str(r#"one."#), vec!["one"]);
        // Those are invalid field paths, but we check that it does not panic.
        // Issue #3538 is about validating field paths before trying to build the path.
        assert_eq!(super::build_field_path_from_str("\\."), vec!["."]);
        assert_eq!(super::build_field_path_from_str("a."), vec!["a"]);
        assert_eq!(super::build_field_path_from_str(".a"), vec!["", "a"]);
    }

    #[test]
    fn test_map_or_array_iter() {
        // single element
        let single_value = MapOrArrayIter::Value(json!({"a": "b", "c": 4}));
        let res: Vec<_> = single_value.collect();
        assert_eq!(res, vec![json!({"a": "b", "c": 4})]);

        // array of elements
        let multiple_values =
            MapOrArrayIter::Array(vec![json!({"a": "b", "c": 4}), json!(5)].into_iter());
        let res: Vec<_> = multiple_values.collect();
        assert_eq!(res, vec![json!({"a": "b", "c": 4}), json!(5)]);

        // map of elements
        let multiple_values = MapOrArrayIter::Map(
            json!({"a": {"a": "b", "c": 4}, "b":5})
                .as_object()
                .unwrap()
                .clone()
                .into_iter(),
        );
        let res: Vec<_> = multiple_values.collect();
        assert_eq!(res, vec![json!({"a": "b", "c": 4}), json!(5)]);
    }

    #[test]
    fn test_json_value_iterator() {
        assert_eq!(
            JsonValueIterator::new(json!(5)).collect::<Vec<_>>(),
            vec![json!(5)]
        );
        assert_eq!(
            JsonValueIterator::new(json!([5, "a"])).collect::<Vec<_>>(),
            vec![json!(5), json!("a")]
        );
        assert_eq!(
            JsonValueIterator::new(json!({"a":1, "b": 2})).collect::<Vec<_>>(),
            vec![json!(1), json!(2)]
        );
        assert_eq!(
            JsonValueIterator::new(json!([{"a":1, "b": 2}, "a"])).collect::<Vec<_>>(),
            vec![json!(1), json!(2), json!("a")]
        );
        assert_eq!(
            JsonValueIterator::new(json!([{"a":1, "b": 2}, {"a": {"b": [3, 4]}}]))
                .collect::<Vec<_>>(),
            vec![json!(1), json!(2), json!(3), json!(4)]
        );
    }

    #[test]
    fn test_extract_val_from_tantivy_val() {
        let obj = TantivyValue::Object;
        fn array(val: impl IntoIterator<Item = impl Into<TantivyValue>>) -> TantivyValue {
            TantivyValue::Array(val.into_iter().map(Into::into).collect())
        }

        let mut sample = vec![obj(vec![
            (
                "some".to_string(),
                obj(vec![
                    (
                        "path".to_string(),
                        obj(vec![("with.dots".to_string(), 1u64.into())]),
                    ),
                    (
                        "other".to_string(),
                        obj(vec![("path".to_string(), array([2u64, 3]))]),
                    ),
                ]),
            ),
            ("short".to_string(), 4u64.into()),
        ])];

        assert_eq!(
            extract_val_from_tantivy_val(&["some", "other"], &mut sample),
            vec![obj(vec![("path".to_string(), array([2u64, 3]))])]
        );
        assert_eq!(
            extract_val_from_tantivy_val(&["some", "other"], &mut sample),
            Vec::new()
        );
        assert_eq!(
            extract_val_from_tantivy_val(&["some", "path", "with.dots"], &mut sample),
            vec![1u64.into()]
        );
        assert_eq!(
            extract_val_from_tantivy_val(&["some", "path", "with.dots"], &mut sample),
            Vec::new()
        );
        assert_eq!(
            extract_val_from_tantivy_val(&["short"], &mut sample),
            vec![4u64.into()]
        );
        assert_eq!(
            extract_val_from_tantivy_val(&["short"], &mut sample),
            Vec::new()
        );
    }

    #[test]
    fn test_add_key_to_vec_map() {
        let obj = TantivyValue::Object;
        fn array(val: impl IntoIterator<Item = impl Into<TantivyValue>>) -> TantivyValue {
            TantivyValue::Array(val.into_iter().map(Into::into).collect())
        }

        let mut map = Vec::new();

        add_key_to_vec_map(&mut map, "some.path.with\\.dots", vec![1u64.into()]);
        assert_eq!(
            map,
            &[(
                "some".to_string(),
                obj(vec![(
                    "path".to_string(),
                    obj(vec![("with.dots".to_string(), 1u64.into())])
                )])
            )]
        );

        add_key_to_vec_map(&mut map, "some.other.path", vec![2u64.into(), 3u64.into()]);
        assert_eq!(
            map,
            &[(
                "some".to_string(),
                obj(vec![
                    (
                        "path".to_string(),
                        obj(vec![("with.dots".to_string(), 1u64.into())])
                    ),
                    (
                        "other".to_string(),
                        obj(vec![("path".to_string(), array([2u64, 3]))])
                    ),
                ])
            )]
        );

        add_key_to_vec_map(&mut map, "short", vec![4u64.into()]);
        assert_eq!(
            map,
            &[
                (
                    "some".to_string(),
                    obj(vec![
                        (
                            "path".to_string(),
                            obj(vec![("with.dots".to_string(), 1u64.into())])
                        ),
                        (
                            "other".to_string(),
                            obj(vec![("path".to_string(), array([2u64, 3]))])
                        ),
                    ])
                ),
                ("short".to_string(), 4u64.into())
            ]
        );
    }
}


================================================
FILE: quickwit/quickwit-doc-mapper/src/doc_mapper/mod.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

mod date_time_type;
mod doc_mapper_builder;
mod doc_mapper_impl;
mod field_mapping_entry;
mod field_mapping_type;
mod field_presence;
mod mapping_tree;
mod tantivy_val_to_json;
mod tokenizer_entry;

use std::collections::{HashMap, HashSet};
use std::fmt::Debug;
use std::ops::Bound;

pub use doc_mapper_builder::DocMapperBuilder;
pub use doc_mapper_impl::DocMapper;
pub use field_mapping_entry::{
    BinaryFormat, FastFieldOptions, FieldMappingEntry, QuickwitBytesOptions, QuickwitJsonOptions,
    QuickwitTextNormalizer,
};
pub(crate) use field_mapping_entry::{
    FieldMappingEntryForSerialization, IndexRecordOptionSchema, QuickwitTextTokenizer,
};
#[cfg(test)]
pub(crate) use field_mapping_entry::{QuickwitNumericOptions, QuickwitTextOptions};
pub use field_mapping_type::FieldMappingType;
use serde_json::Value as JsonValue;
use tantivy::Term;
use tantivy::schema::{Field, FieldType};
pub(crate) use tokenizer_entry::{
    NgramTokenizerOption, RegexTokenizerOption, TokenFilterType, TokenizerType,
};
pub use tokenizer_entry::{TokenizerConfig, TokenizerEntry, analyze_text};

pub type Partition = u64;

/// An alias for serde_json's object type.
pub type JsonObject = serde_json::Map<String, JsonValue>;

/// A struct to wrap a tantivy field with its name.
#[derive(Clone, Debug)]
pub struct NamedField {
    /// Name of the field.
    pub name: String,
    /// Tantivy schema field.
    pub field: Field,
    /// Tantivy schema field type.
    pub field_type: FieldType,
}

/// Bounds for a range of terms, with an optional max count of terms being matched.
#[derive(Debug, Clone, PartialEq, Eq, Hash)]
pub struct TermRange {
    /// Start of the range
    pub start: Bound<Term>,
    /// End of the range
    pub end: Bound<Term>,
    /// Max number of matched terms
    pub limit: Option<u64>,
}

#[derive(Debug, Clone, PartialEq, Eq, Hash)]
/// Supported automaton types to warmup
pub enum Automaton {
    /// A regex in it's str representation as tantivy_fst::Regex isn't PartialEq, and the path if
    /// inside a json field
    Regex(Option<Vec<u8>>, String),
    // we could add termset query here, instead of downloading the whole dictionary
}

/// Description of how a fast field should be warmed up
#[derive(Debug, Clone, PartialEq, Eq, Hash)]
pub struct FastFieldWarmupInfo {
    /// Name of the fast field
    pub name: String,
    /// Whether subfields should also be loaded for warmup
    pub with_subfields: bool,
}

/// Information about what a DocMapper think should be warmed up before
/// running the query.
#[derive(Debug, Default, Clone, PartialEq, Eq)]
pub struct WarmupInfo {
    /// Name of fields from the term dictionary and posting list which needs to
    /// be entirely loaded
    pub term_dict_fields: HashSet<Field>,
    /// Fast fields which needs to be loaded
    pub fast_fields: HashSet<FastFieldWarmupInfo>,
    /// Whether to warmup field norms. Used mostly for scoring.
    pub field_norms: bool,
    /// Terms to warmup, and whether their position is needed too.
    pub terms_grouped_by_field: HashMap<Field, HashMap<Term, bool>>,
    /// Term ranges to warmup, and whether their position is needed too.
    pub term_ranges_grouped_by_field: HashMap<Field, HashMap<TermRange, bool>>,
    /// Automatons to warmup
    pub automatons_grouped_by_field: HashMap<Field, HashSet<Automaton>>,
}

impl WarmupInfo {
    /// Merge other WarmupInfo into self.
    pub fn merge(&mut self, other: WarmupInfo) {
        self.term_dict_fields.extend(other.term_dict_fields);
        self.field_norms |= other.field_norms;

        for fast_field_warmup_info in other.fast_fields.into_iter() {
            // avoid overwriting with a less demanding warmup
            if !self.fast_fields.contains(&FastFieldWarmupInfo {
                name: fast_field_warmup_info.name.clone(),
                with_subfields: true,
            }) {
                self.fast_fields.insert(fast_field_warmup_info);
            }
        }

        for (field, term_and_pos) in other.terms_grouped_by_field.into_iter() {
            let sub_map = self.terms_grouped_by_field.entry(field).or_default();

            for (term, include_position) in term_and_pos.into_iter() {
                *sub_map.entry(term).or_default() |= include_position;
            }
        }

        // this merge is suboptimal in case of overlapping range with no limit.
        for (field, term_range_and_pos) in other.term_ranges_grouped_by_field.into_iter() {
            let sub_map = self.term_ranges_grouped_by_field.entry(field).or_default();

            for (term_range, include_position) in term_range_and_pos.into_iter() {
                *sub_map.entry(term_range).or_default() |= include_position;
            }
        }

        for (field, automatons) in other.automatons_grouped_by_field.into_iter() {
            let sub_map = self.automatons_grouped_by_field.entry(field).or_default();
            sub_map.extend(automatons);
        }
    }

    /// Simplify a WarmupInfo, removing some redundant tasks
    pub fn simplify(&mut self) {
        self.terms_grouped_by_field.retain(|field, terms| {
            if self.term_dict_fields.contains(field) {
                // we are already about to full-load this dictionary. We only care about terms
                // which needs additional position
                terms.retain(|_term, include_position| *include_position);
            }
            // if no term is left, remove the entry from the hashmap
            !terms.is_empty()
        });
        self.term_ranges_grouped_by_field.retain(|field, terms| {
            if self.term_dict_fields.contains(field) {
                terms.retain(|_term, include_position| *include_position);
            }
            !terms.is_empty()
        });
        // TODO we could remove from terms_grouped_by_field for ranges with no `limit` in
        // term_ranges_grouped_by_field
    }
}

#[cfg(test)]
mod tests {
    use std::collections::{HashMap, HashSet};
    use std::ops::Bound;

    use quickwit_query::BooleanOperand;
    use quickwit_query::query_ast::{UserInputQuery, query_ast_from_user_text};
    use tantivy::schema::{Field, FieldType, Term};

    use super::*;
    use crate::{
        Cardinality, DYNAMIC_FIELD_NAME, DocMapper, DocMapperBuilder, DocParsingError,
        FieldMappingEntry, TermRange, WarmupInfo,
    };

    const JSON_DEFAULT_DOC_MAPPER: &str = r#"
        {
            "type": "default",
            "default_search_fields": [],
            "tag_fields": [],
            "field_mappings": []
        }"#;

    #[test]
    fn test_doc_from_json_bytes() {
        let doc_mapper = DocMapperBuilder::default().try_build().unwrap();
        let json_doc = br#"{"title": "hello", "body": "world"}"#;
        doc_mapper.doc_from_json_bytes(json_doc).unwrap();

        let DocParsingError::NotJsonObject(json_doc_sample) = doc_mapper
            .doc_from_json_bytes(br#"Not a JSON object"#)
            .unwrap_err()
        else {
            panic!("Expected `DocParsingError::NotJsonObject` error");
        };
        assert_eq!(json_doc_sample, "Not a JSON object...");
    }

    #[test]
    fn test_doc_from_json_str() {
        let doc_mapper = DocMapperBuilder::default().try_build().unwrap();
        let json_doc = r#"{"title": "hello", "body": "world"}"#;
        doc_mapper.doc_from_json_str(json_doc).unwrap();

        let DocParsingError::NotJsonObject(json_doc_sample) = doc_mapper
            .doc_from_json_str(r#"Not a JSON object"#)
            .unwrap_err()
        else {
            panic!("Expected `DocParsingError::NotJsonObject` error");
        };
        assert_eq!(json_doc_sample, "Not a JSON object...");
    }

    #[test]
    fn test_deserialize_doc_mapper() -> anyhow::Result<()> {
        let deserialized_default_doc_mapper =
            serde_json::from_str::<Box<DocMapper>>(JSON_DEFAULT_DOC_MAPPER)?;
        let expected_default_doc_mapper = DocMapperBuilder::default().try_build()?;
        assert_eq!(
            format!("{deserialized_default_doc_mapper:?}"),
            format!("{expected_default_doc_mapper:?}"),
        );
        Ok(())
    }

    #[test]
    fn test_deserialize_minimal_doc_mapper() -> anyhow::Result<()> {
        let deserialized_default_doc_mapper =
            serde_json::from_str::<Box<DocMapper>>(r#"{"type": "default"}"#)?;
        let expected_default_doc_mapper = DocMapperBuilder::default().try_build()?;
        assert_eq!(
            format!("{deserialized_default_doc_mapper:?}"),
            format!("{expected_default_doc_mapper:?}"),
        );
        Ok(())
    }

    #[test]
    fn test_deserialize_doc_mapper_default_dynamic_tokenizer() {
        let doc_mapper =
            serde_json::from_str::<Box<DocMapper>>(r#"{"type": "default", "mode": "dynamic"}"#)
                .unwrap();
        let tantivy_schema = doc_mapper.schema();
        let dynamic_field = tantivy_schema.get_field(DYNAMIC_FIELD_NAME).unwrap();
        if let FieldType::JsonObject(json_options) =
            tantivy_schema.get_field_entry(dynamic_field).field_type()
        {
            let text_opt = json_options.get_text_indexing_options().unwrap();
            assert_eq!(text_opt.tokenizer(), "raw");
        } else {
            panic!("dynamic field should be of JSON type");
        }
    }

    #[test]
    fn test_doc_mapper_query_with_json_field() {
        let mut doc_mapper_builder = DocMapperBuilder::default();
        doc_mapper_builder
            .doc_mapping
            .field_mappings
            .push(FieldMappingEntry {
                name: "json_field".to_string(),
                mapping_type: FieldMappingType::Json(
                    QuickwitJsonOptions::default(),
                    Cardinality::SingleValued,
                ),
            });
        let doc_mapper = doc_mapper_builder.try_build().unwrap();
        let schema = doc_mapper.schema();
        let query_ast = UserInputQuery {
            user_text: "json_field.toto.titi:hello".to_string(),
            default_fields: None,
            default_operator: BooleanOperand::And,
            lenient: false,
        }
        .parse_user_query(&[])
        .unwrap();
        let (query, _) = doc_mapper.query(schema, query_ast, true, None).unwrap();
        assert_eq!(
            format!("{query:?}"),
            r#"TermQuery(Term(field=2, type=Json, path=toto.titi, type=Str, "hello"))"#
        );
    }

    #[test]
    fn test_doc_mapper_query_with_json_field_default_search_fields() {
        let doc_mapper = DocMapperBuilder::default().try_build().unwrap();
        let schema = doc_mapper.schema();
        let query_ast = query_ast_from_user_text("toto.titi:hello", None)
            .parse_user_query(doc_mapper.default_search_fields())
            .unwrap();
        let (query, _) = doc_mapper.query(schema, query_ast, true, None).unwrap();
        assert_eq!(
            format!("{query:?}"),
            r#"TermQuery(Term(field=1, type=Json, path=toto.titi, type=Str, "hello"))"#
        );
    }

    #[test]
    fn test_doc_mapper_query_with_json_field_ambiguous_term() {
        let doc_mapper = DocMapperBuilder::default().try_build().unwrap();
        let schema = doc_mapper.schema();
        let query_ast = query_ast_from_user_text("toto:5", None)
            .parse_user_query(&[])
            .unwrap();
        let (query, _) = doc_mapper.query(schema, query_ast, true, None).unwrap();
        assert_eq!(
            format!("{query:?}"),
            r#"BooleanQuery { subqueries: [(Should, TermQuery(Term(field=1, type=Json, path=toto, type=I64, 5))), (Should, TermQuery(Term(field=1, type=Json, path=toto, type=Str, "5")))], minimum_number_should_match: 1 }"#
        );
    }

    #[track_caller]
    fn test_validate_doc_aux(
        doc_mapper: &DocMapper,
        doc_json: &str,
    ) -> Result<(), DocParsingError> {
        let json_val: serde_json_borrow::Value = serde_json::from_str(doc_json).unwrap();
        let json_obj = json_val.as_object().unwrap();
        doc_mapper.validate_json_obj(json_obj)
    }

    #[test]
    fn test_validate_doc() {
        const JSON_CONFIG_VALUE: &str = r#"{
            "timestamp_field": "timestamp",
            "field_mappings": [
            {
                "name": "timestamp",
                "type": "datetime",
                "fast": true
            },
            {
                "name": "body",
                "type": "text"
            },
            {
                "name": "response_date",
                "type": "datetime",
                "input_formats": ["rfc3339", "unix_timestamp"]
            },
            {
                "name": "response_time",
                "type": "f64"
            },
            {
                "name": "response_time_no_coercion",
                "type": "f64",
                "coerce": false
            },
            {
                "name": "response_payload",
                "type": "bytes"
            },
            {
                "name": "is_important",
                "type": "bool"
            },
            {
                "name": "properties",
                "type": "json"
            },
            {
                "name": "attributes",
                "type": "object",
                "field_mappings": [
                    {
                        "name": "numbers",
                        "type": "array<i64>"
                    }
                ]
            }]
        }"#;
        let doc_mapper = serde_json::from_str::<DocMapper>(JSON_CONFIG_VALUE).unwrap();
        {
            assert!(
                test_validate_doc_aux(
                    &doc_mapper,
                    r#"{ "body": "toto", "timestamp": "2024-01-01T01:01:01Z"}"#
                )
                .is_ok()
            );
        }
        {
            assert!(matches!(
                test_validate_doc_aux(
                    &doc_mapper,
                    r#"{ "response_time": "toto", "timestamp": "2024-01-01T01:01:01Z"}"#
                )
                .unwrap_err(),
                DocParsingError::ValueError(_, _)
            ));
        }
        {
            assert!(
                test_validate_doc_aux(
                    &doc_mapper,
                    r#"{ "response_time": "2.3", "timestamp": "2024-01-01T01:01:01Z"}"#
                )
                .is_ok(),
            );
        }
        {
            // coercion disabled
            assert!(matches!(
                test_validate_doc_aux(
                    &doc_mapper,
                    r#"{"response_time_no_coercion": "2.3", "timestamp": "2024-01-01T01:01:01Z"}"#
                )
                .unwrap_err(),
                DocParsingError::ValueError(_, _)
            ));
        }
        {
            assert!(matches!(
                test_validate_doc_aux(
                    &doc_mapper,
                    r#"{"response_time": [2.3], "timestamp": "2024-01-01T01:01:01Z"}"#
                )
                .unwrap_err(),
                DocParsingError::MultiValuesNotSupported(_)
            ));
        }
        {
            assert!(
                test_validate_doc_aux(
                    &doc_mapper,
                    r#"{"attributes": {"numbers": [-2]}, "timestamp": "2024-01-01T01:01:01Z"}"#
                )
                .is_ok()
            );
        }
    }

    #[test]
    fn test_validate_doc_timestamp() {
        const JSON_CONFIG_TS_AT_ROOT: &str = r#"{
            "timestamp_field": "timestamp",
            "field_mappings": [
            {
                "name": "timestamp",
                "type": "datetime",
                "fast": true
            },
            {
                "name": "body",
                "type": "text"
            }
            ]
        }"#;
        const JSON_CONFIG_TS_WITH_DOT: &str = r#"{
            "timestamp_field": "timestamp\\.now",
            "field_mappings": [
            {
                "name": "timestamp.now",
                "type": "datetime",
                "fast": true
            },
            {
                "name": "body",
                "type": "text"
            }
            ]
        }"#;
        const JSON_CONFIG_TS_NESTED: &str = r#"{
            "timestamp_field": "doc.timestamp",
            "field_mappings": [
            {
                "name": "doc",
                "type": "object",
                "field_mappings": [
                    {
                        "name": "timestamp",
                        "type": "datetime",
                        "fast": true
                    }
                ]
            },
            {
                "name": "body",
                "type": "text"
            }
            ]
        }"#;
        let doc_mapper = serde_json::from_str::<DocMapper>(JSON_CONFIG_TS_AT_ROOT).unwrap();
        {
            assert!(
                test_validate_doc_aux(
                    &doc_mapper,
                    r#"{ "body": "toto", "timestamp": "2024-01-01T01:01:01Z"}"#
                )
                .is_ok()
            );
        }
        {
            assert!(matches!(
                test_validate_doc_aux(
                    &doc_mapper,
                    r#"{ "body": "toto", "timestamp": "invalid timestamp"}"#
                )
                .unwrap_err(),
                DocParsingError::ValueError(_, _),
            ));
        }
        {
            assert!(matches!(
                test_validate_doc_aux(&doc_mapper, r#"{ "body": "toto", "timestamp": null}"#)
                    .unwrap_err(),
                DocParsingError::RequiredField(_),
            ));
        }
        {
            assert!(matches!(
                test_validate_doc_aux(&doc_mapper, r#"{ "body": "toto"}"#).unwrap_err(),
                DocParsingError::RequiredField(_),
            ));
        }

        let doc_mapper = serde_json::from_str::<DocMapper>(JSON_CONFIG_TS_WITH_DOT).unwrap();
        {
            assert!(
                test_validate_doc_aux(
                    &doc_mapper,
                    r#"{ "body": "toto", "timestamp.now": "2024-01-01T01:01:01Z"}"#
                )
                .is_ok()
            );
        }
        {
            assert!(matches!(
                test_validate_doc_aux(
                    &doc_mapper,
                    r#"{ "body": "toto", "timestamp.now": "invalid timestamp"}"#
                )
                .unwrap_err(),
                DocParsingError::ValueError(_, _),
            ));
        }
        {
            assert!(matches!(
                test_validate_doc_aux(
                    &doc_mapper,
                    r#"{ "body": "toto", "timestamp": {"now": "2024-01-01T01:01:01Z"}}"#
                )
                .unwrap_err(),
                DocParsingError::RequiredField(_),
            ));
        }

        let doc_mapper = serde_json::from_str::<DocMapper>(JSON_CONFIG_TS_NESTED).unwrap();
        {
            assert!(
                test_validate_doc_aux(
                    &doc_mapper,
                    r#"{ "body": "toto", "doc":{"timestamp": "2024-01-01T01:01:01Z"}}"#
                )
                .is_ok()
            );
        }
        {
            assert!(matches!(
                test_validate_doc_aux(
                    &doc_mapper,
                    r#"{ "body": "toto", "doc.timestamp": "2024-01-01T01:01:01Z"}"#
                )
                .unwrap_err(),
                DocParsingError::RequiredField(_),
            ));
        }
    }

    #[test]
    fn test_validate_doc_mode() {
        const DOC: &str = r#"{ "whatever": "blop" }"#;
        {
            const JSON_CONFIG_VALUE: &str = r#"{ "mode": "strict", "field_mappings": [] }"#;
            let doc_mapper = serde_json::from_str::<DocMapper>(JSON_CONFIG_VALUE).unwrap();
            assert!(matches!(
                test_validate_doc_aux(&doc_mapper, DOC).unwrap_err(),
                DocParsingError::NoSuchFieldInSchema(_)
            ));
        }
        {
            const JSON_CONFIG_VALUE: &str = r#"{ "mode": "lenient", "field_mappings": [] }"#;
            let doc_mapper = serde_json::from_str::<DocMapper>(JSON_CONFIG_VALUE).unwrap();
            assert!(test_validate_doc_aux(&doc_mapper, DOC).is_ok());
        }
        {
            const JSON_CONFIG_VALUE: &str = r#"{ "mode": "dynamic", "field_mappings": [] }"#;
            let doc_mapper = serde_json::from_str::<DocMapper>(JSON_CONFIG_VALUE).unwrap();
            assert!(test_validate_doc_aux(&doc_mapper, DOC).is_ok());
        }
    }

    fn hashset_fast(elements: &[&str]) -> HashSet<FastFieldWarmupInfo> {
        elements
            .iter()
            .map(|elem| FastFieldWarmupInfo {
                name: elem.to_string(),
                with_subfields: false,
            })
            .collect()
    }

    fn automaton_hashset(elements: &[&str]) -> HashSet<Automaton> {
        elements
            .iter()
            .map(|elem| Automaton::Regex(None, elem.to_string()))
            .collect()
    }

    fn hashset_field(elements: &[u32]) -> HashSet<Field> {
        elements
            .iter()
            .map(|elem| Field::from_field_id(*elem))
            .collect()
    }

    fn hashmap(elements: &[(u32, &str, bool)]) -> HashMap<Field, HashMap<Term, bool>> {
        let mut result: HashMap<Field, HashMap<Term, bool>> = HashMap::new();
        for (field, term, pos) in elements {
            let field = Field::from_field_id(*field);
            *result
                .entry(field)
                .or_default()
                .entry(Term::from_field_text(field, term))
                .or_default() |= pos;
        }

        result
    }

    fn hashmap_ranges(elements: &[(u32, &str, bool)]) -> HashMap<Field, HashMap<TermRange, bool>> {
        let mut result: HashMap<Field, HashMap<TermRange, bool>> = HashMap::new();
        for (field, term, pos) in elements {
            let field = Field::from_field_id(*field);
            let term = Term::from_field_text(field, term);
            // this is a 1 element bound, but it's enough for testing.
            let range = TermRange {
                start: Bound::Included(term.clone()),
                end: Bound::Included(term),
                limit: None,
            };
            *result.entry(field).or_default().entry(range).or_default() |= pos;
        }

        result
    }

    #[test]
    fn test_warmup_info_merge() {
        let wi_base = WarmupInfo {
            term_dict_fields: hashset_field(&[1, 2]),
            fast_fields: hashset_fast(&["fast1", "fast2"]),
            field_norms: false,
            terms_grouped_by_field: hashmap(&[(1, "term1", false), (1, "term2", false)]),
            term_ranges_grouped_by_field: hashmap_ranges(&[
                (2, "term1", false),
                (2, "term2", false),
            ]),
            automatons_grouped_by_field: [(
                Field::from_field_id(1),
                automaton_hashset(&["my_reg.*ex"]),
            )]
            .into_iter()
            .collect(),
        };

        // merging with default has no impact
        let mut wi_cloned = wi_base.clone();
        wi_cloned.merge(WarmupInfo::default());
        assert_eq!(wi_cloned, wi_base);

        let mut wi_base = wi_base;
        let wi_2 = WarmupInfo {
            term_dict_fields: hashset_field(&[2, 3]),
            fast_fields: hashset_fast(&["fast2", "fast3"]),
            field_norms: true,
            terms_grouped_by_field: hashmap(&[(2, "term1", false), (1, "term2", true)]),
            term_ranges_grouped_by_field: hashmap_ranges(&[
                (3, "term1", false),
                (2, "term2", true),
            ]),
            automatons_grouped_by_field: [
                (Field::from_field_id(1), automaton_hashset(&["other-re.ex"])),
                (Field::from_field_id(2), automaton_hashset(&["my_reg.*ex"])),
            ]
            .into_iter()
            .collect(),
        };
        wi_base.merge(wi_2.clone());

        assert_eq!(wi_base.term_dict_fields, hashset_field(&[1, 2, 3]));
        assert_eq!(
            wi_base.fast_fields,
            hashset_fast(&["fast1", "fast2", "fast3"])
        );
        assert!(wi_base.field_norms);

        let expected_terms = [(1, "term1", false), (1, "term2", true), (2, "term1", false)];
        for (field, term, pos) in expected_terms {
            let field = Field::from_field_id(field);
            let term = Term::from_field_text(field, term);

            assert_eq!(
                *wi_base
                    .terms_grouped_by_field
                    .get(&field)
                    .unwrap()
                    .get(&term)
                    .unwrap(),
                pos
            );
        }

        let expected_ranges = [(2, "term1", false), (2, "term2", true), (3, "term1", false)];
        for (field, term, pos) in expected_ranges {
            let field = Field::from_field_id(field);
            let term = Term::from_field_text(field, term);
            let range = TermRange {
                start: Bound::Included(term.clone()),
                end: Bound::Included(term),
                limit: None,
            };

            assert_eq!(
                *wi_base
                    .term_ranges_grouped_by_field
                    .get(&field)
                    .unwrap()
                    .get(&range)
                    .unwrap(),
                pos
            );
        }

        let expected_automatons = [(1, "my_reg.*ex"), (1, "other-re.ex"), (2, "my_reg.*ex")];
        for (field, regex) in expected_automatons {
            let field = Field::from_field_id(field);
            let automaton = Automaton::Regex(None, regex.to_string());
            assert!(
                wi_base
                    .automatons_grouped_by_field
                    .get(&field)
                    .unwrap()
                    .contains(&automaton)
            );
        }

        // merge is idempotent
        let mut wi_cloned = wi_base.clone();
        wi_cloned.merge(wi_2);
        assert_eq!(wi_cloned, wi_base);
    }

    #[test]
    fn test_warmup_info_simplify() {
        let mut warmup_info = WarmupInfo {
            term_dict_fields: hashset_field(&[1]),
            fast_fields: hashset_fast(&["fast1", "fast2"]),
            field_norms: false,
            terms_grouped_by_field: hashmap(&[
                (1, "term1", false),
                (1, "term2", true),
                (2, "term3", false),
            ]),
            term_ranges_grouped_by_field: hashmap_ranges(&[
                (1, "term1", false),
                (1, "term2", true),
                (2, "term3", false),
            ]),
            automatons_grouped_by_field: [
                (Field::from_field_id(1), automaton_hashset(&["other-re.ex"])),
                (Field::from_field_id(1), automaton_hashset(&["other-re.ex"])),
                (Field::from_field_id(2), automaton_hashset(&["my_reg.ex"])),
            ]
            .into_iter()
            .collect(),
        };
        let expected = WarmupInfo {
            term_dict_fields: hashset_field(&[1]),
            fast_fields: hashset_fast(&["fast1", "fast2"]),
            field_norms: false,
            terms_grouped_by_field: hashmap(&[(1, "term2", true), (2, "term3", false)]),
            term_ranges_grouped_by_field: hashmap_ranges(&[
                (1, "term2", true),
                (2, "term3", false),
            ]),
            automatons_grouped_by_field: [
                (Field::from_field_id(1), automaton_hashset(&["other-re.ex"])),
                (Field::from_field_id(2), automaton_hashset(&["my_reg.ex"])),
            ]
            .into_iter()
            .collect(),
        };

        warmup_info.simplify();
        assert_eq!(warmup_info, expected);
    }
}


================================================
FILE: quickwit/quickwit-doc-mapper/src/doc_mapper/tantivy_val_to_json.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use serde_json::Value as JsonValue;
use tantivy::schema::OwnedValue as TantivyValue;

use super::BinaryFormat;
use super::field_mapping_entry::{NumericOutputFormat, QuickwitNumericOptions};
use super::mapping_tree::LeafType;

pub(crate) trait NumToJson {
    fn to_json(&self, output_format: NumericOutputFormat) -> Option<JsonValue>;
}

impl NumToJson for u64 {
    fn to_json(&self, output_format: NumericOutputFormat) -> Option<JsonValue> {
        let json_value = match output_format {
            NumericOutputFormat::String => JsonValue::String(self.to_string()),
            NumericOutputFormat::Number => JsonValue::Number(serde_json::Number::from(*self)),
        };
        Some(json_value)
    }
}

impl NumToJson for i64 {
    fn to_json(&self, output_format: NumericOutputFormat) -> Option<JsonValue> {
        let json_value = match output_format {
            NumericOutputFormat::String => JsonValue::String(self.to_string()),
            NumericOutputFormat::Number => JsonValue::Number(serde_json::Number::from(*self)),
        };
        Some(json_value)
    }
}
impl NumToJson for f64 {
    fn to_json(&self, output_format: NumericOutputFormat) -> Option<JsonValue> {
        match output_format {
            NumericOutputFormat::String => Some(JsonValue::String(self.to_string())),
            NumericOutputFormat::Number => {
                serde_json::Number::from_f64(*self).map(JsonValue::Number)
            }
        }
    }
}

fn value_to_string(value: TantivyValue) -> Result<JsonValue, TantivyValue> {
    match value {
        TantivyValue::Str(s) => return Ok(JsonValue::String(s)),
        TantivyValue::U64(number) => Some(number.to_string()),
        TantivyValue::I64(number) => Some(number.to_string()),
        TantivyValue::F64(number) => Some(number.to_string()),
        TantivyValue::Bool(b) => Some(b.to_string()),
        TantivyValue::Date(date) => {
            return quickwit_datetime::DateTimeOutputFormat::default()
                .format_to_json(date)
                .map_err(|_| value);
        }
        TantivyValue::IpAddr(ip) => Some(ip.to_string()),
        _ => None,
    }
    .map(JsonValue::String)
    .ok_or(value)
}

fn value_to_bool(value: TantivyValue) -> Result<JsonValue, TantivyValue> {
    match &value {
        TantivyValue::Str(s) => s.parse().ok(),
        TantivyValue::U64(number) => match number {
            0 => Some(false),
            1 => Some(true),
            _ => None,
        },
        TantivyValue::I64(number) => match number {
            0 => Some(false),
            1 => Some(true),
            _ => None,
        },
        TantivyValue::F64(number) => match number {
            0.0 => Some(false),
            1.0 => Some(true),
            _ => None,
        },
        TantivyValue::Bool(b) => Some(*b),
        _ => None,
    }
    .map(JsonValue::Bool)
    .ok_or(value)
}

fn value_to_ip(value: TantivyValue) -> Result<JsonValue, TantivyValue> {
    match &value {
        TantivyValue::Str(s) => s
            .parse::<std::net::Ipv6Addr>()
            .or_else(|_| {
                s.parse::<std::net::Ipv4Addr>()
                    .map(|ip| ip.to_ipv6_mapped())
            })
            .ok(),
        TantivyValue::IpAddr(ip) => Some(*ip),
        _ => None,
    }
    .map(|ip| {
        serde_json::to_value(TantivyValue::IpAddr(ip))
            .expect("Json serialization should never fail.")
    })
    .ok_or(value)
}

fn value_to_float(
    value: TantivyValue,
    numeric_options: &QuickwitNumericOptions,
) -> Result<JsonValue, TantivyValue> {
    match &value {
        TantivyValue::Str(s) => s.parse().ok(),
        TantivyValue::U64(number) => Some(*number as f64),
        TantivyValue::I64(number) => Some(*number as f64),
        TantivyValue::F64(number) => Some(*number),
        TantivyValue::Bool(b) => Some(if *b { 1.0 } else { 0.0 }),
        _ => None,
    }
    .and_then(|f64_val| f64_val.to_json(numeric_options.output_format))
    .ok_or(value)
}

fn value_to_u64(
    value: TantivyValue,
    numeric_options: &QuickwitNumericOptions,
) -> Result<JsonValue, TantivyValue> {
    match &value {
        TantivyValue::Str(s) => s.parse().ok(),
        TantivyValue::U64(number) => Some(*number),
        TantivyValue::I64(number) => (*number).try_into().ok(),
        TantivyValue::F64(number) => {
            if (0.0..=(u64::MAX as f64)).contains(number) {
                Some(*number as u64)
            } else {
                None
            }
        }
        TantivyValue::Bool(b) => Some(*b as u64),
        _ => None,
    }
    .and_then(|u64_val| u64_val.to_json(numeric_options.output_format))
    .ok_or(value)
}

fn value_to_i64(
    value: TantivyValue,
    numeric_options: &QuickwitNumericOptions,
) -> Result<JsonValue, TantivyValue> {
    match &value {
        TantivyValue::Str(s) => s.parse().ok(),
        TantivyValue::U64(number) => (*number).try_into().ok(),
        TantivyValue::I64(number) => Some(*number),
        TantivyValue::F64(number) => {
            if ((i64::MIN as f64)..=(i64::MAX as f64)).contains(number) {
                Some(*number as i64)
            } else {
                None
            }
        }
        TantivyValue::Bool(b) => Some(*b as i64),
        _ => None,
    }
    .and_then(|u64_val| u64_val.to_json(numeric_options.output_format))
    .ok_or(value)
}

/// Transforms a tantivy object into a serde_json one, without cloning strings.
/// It still allocates maps.
// TODO we should probably move this to tantivy, it has the opposite conversion already
pub fn tantivy_object_to_json_value(object: Vec<(String, TantivyValue)>) -> JsonValue {
    JsonValue::Object(
        object
            .into_iter()
            .map(|(key, value)| (key, tantivy_value_to_json(value)))
            .collect(),
    )
}

/// Converts Tantivy::Value into Json Value.
///
/// Formatting by defaults, e.g. Rfc3339 for dates.
pub fn tantivy_value_to_json(value: TantivyValue) -> JsonValue {
    match value {
        TantivyValue::Null => JsonValue::Null,
        TantivyValue::Str(s) => JsonValue::String(s),
        TantivyValue::U64(number) => JsonValue::Number(number.into()),
        TantivyValue::I64(number) => JsonValue::Number(number.into()),
        TantivyValue::F64(f) => {
            JsonValue::Number(serde_json::Number::from_f64(f).expect("expected finite f64"))
        }
        TantivyValue::Bool(b) => JsonValue::Bool(b),
        TantivyValue::Array(array) => {
            JsonValue::Array(array.into_iter().map(tantivy_value_to_json).collect())
        }
        TantivyValue::Object(object) => tantivy_object_to_json_value(object),
        // we shouldn't have these types inside a json field in quickwit
        TantivyValue::PreTokStr(pretok) => JsonValue::String(pretok.text),
        TantivyValue::Date(date) => quickwit_datetime::DateTimeOutputFormat::Rfc3339
            .format_to_json(date)
            .expect("Invalid datetime is not allowed."),
        TantivyValue::Facet(facet) => JsonValue::String(facet.to_string()),
        TantivyValue::Bytes(bytes) => BinaryFormat::Base64.format_to_json(&bytes),
        TantivyValue::IpAddr(ip_v6) => {
            let ip_str = if let Some(ip_v4) = ip_v6.to_ipv4_mapped() {
                ip_v4.to_string()
            } else {
                ip_v6.to_string()
            };
            JsonValue::String(ip_str)
        }
    }
}

/// Converts TantivyValue into Json Value and formats according to the LeafType.
///
/// Makes sure the type and value are consistent before converting.
/// For certain LeafType, we use the type options to format the output.
pub fn formatted_tantivy_value_to_json(
    value: TantivyValue,
    leaf_type: &LeafType,
) -> Option<JsonValue> {
    let res = match leaf_type {
        LeafType::Text(_) => value_to_string(value),
        LeafType::Bool(_) => value_to_bool(value),
        LeafType::IpAddr(_) => value_to_ip(value),
        LeafType::F64(numeric_options) => value_to_float(value, numeric_options),
        LeafType::U64(numeric_options) => value_to_u64(value, numeric_options),
        LeafType::I64(numeric_options) => value_to_i64(value, numeric_options),
        LeafType::Json(_) => {
            if let TantivyValue::Object(obj) = value {
                // TODO do we want to allow almost everything here?
                return Some(tantivy_object_to_json_value(obj));
            } else {
                Err(value)
            }
        }
        LeafType::Bytes(bytes_options) => {
            if let TantivyValue::Bytes(ref bytes) = value {
                // TODO we could cast str to bytes
                let json_value = bytes_options.output_format.format_to_json(bytes);
                Ok(json_value)
            } else {
                Err(value)
            }
        }
        LeafType::DateTime(date_time_options) => date_time_options
            .reparse_tantivy_value(&value)
            .map(|date_time| {
                date_time_options
                    .output_format
                    .format_to_json(date_time)
                    .expect("Invalid datetime is not allowed.")
            })
            .ok_or(value),
    };
    match res {
        Ok(res) => Some(res),
        Err(value) => {
            quickwit_common::rate_limited_warn!(
                limit_per_min = 2,
                "the value type `{:?}` doesn't match the requested type `{:?}`",
                value,
                leaf_type
            );
            None
        }
    }
}

#[cfg(test)]
mod tests {

    use tantivy::schema::OwnedValue as TantivyValue;

    use super::*;
    use crate::doc_mapper::field_mapping_entry::{
        BinaryFormat, NumericOutputFormat, QuickwitBytesOptions, QuickwitNumericOptions,
    };
    use crate::doc_mapper::mapping_tree::LeafType;

    #[test]
    fn test_tantivy_value_to_json_value_bytes() {
        let bytes_options_base64 = QuickwitBytesOptions::default();
        assert_eq!(
            formatted_tantivy_value_to_json(
                TantivyValue::Bytes(vec![1, 2, 3]),
                &LeafType::Bytes(bytes_options_base64)
            )
            .unwrap(),
            serde_json::json!("AQID")
        );

        let bytes_options_hex = QuickwitBytesOptions {
            output_format: BinaryFormat::Hex,
            ..Default::default()
        };
        assert_eq!(
            formatted_tantivy_value_to_json(
                TantivyValue::Bytes(vec![1, 2, 3]),
                &LeafType::Bytes(bytes_options_hex)
            )
            .unwrap(),
            serde_json::json!("010203")
        );
    }

    #[test]
    fn test_tantivy_value_to_json_value_f64() {
        let numeric_options_number = QuickwitNumericOptions::default();
        assert_eq!(
            formatted_tantivy_value_to_json(
                TantivyValue::F64(0.1),
                &LeafType::F64(numeric_options_number.clone())
            )
            .unwrap(),
            serde_json::json!(0.1)
        );
        assert_eq!(
            formatted_tantivy_value_to_json(
                TantivyValue::U64(1),
                &LeafType::F64(numeric_options_number.clone())
            )
            .unwrap(),
            serde_json::json!(1.0)
        );
        assert_eq!(
            formatted_tantivy_value_to_json(
                TantivyValue::Str("0.1".to_string()),
                &LeafType::F64(numeric_options_number.clone())
            )
            .unwrap(),
            serde_json::json!(0.1)
        );

        let numeric_options_str = QuickwitNumericOptions {
            output_format: NumericOutputFormat::String,
            ..Default::default()
        };
        assert_eq!(
            formatted_tantivy_value_to_json(
                TantivyValue::F64(0.1),
                &LeafType::F64(numeric_options_str)
            )
            .unwrap(),
            serde_json::json!("0.1")
        );
    }

    #[test]
    fn test_tantivy_value_to_json_value_i64() {
        let numeric_options_number = QuickwitNumericOptions::default();
        assert_eq!(
            formatted_tantivy_value_to_json(
                TantivyValue::I64(-1),
                &LeafType::I64(numeric_options_number.clone())
            )
            .unwrap(),
            serde_json::json!(-1)
        );
        assert_eq!(
            formatted_tantivy_value_to_json(
                TantivyValue::I64(1),
                &LeafType::I64(numeric_options_number)
            )
            .unwrap(),
            serde_json::json!(1)
        );

        let numeric_options_str = QuickwitNumericOptions {
            output_format: NumericOutputFormat::String,
            ..Default::default()
        };
        assert_eq!(
            formatted_tantivy_value_to_json(
                TantivyValue::I64(-1),
                &LeafType::I64(numeric_options_str)
            )
            .unwrap(),
            serde_json::json!("-1")
        );
    }

    #[test]
    fn test_tantivy_value_to_json_value_u64() {
        let numeric_options_number = QuickwitNumericOptions::default();
        assert_eq!(
            formatted_tantivy_value_to_json(
                TantivyValue::U64(1),
                &LeafType::U64(numeric_options_number.clone())
            )
            .unwrap(),
            serde_json::json!(1u64)
        );
        assert_eq!(
            formatted_tantivy_value_to_json(
                TantivyValue::I64(1),
                &LeafType::U64(numeric_options_number)
            )
            .unwrap(),
            serde_json::json!(1u64)
        );

        let numeric_options_str = QuickwitNumericOptions {
            output_format: NumericOutputFormat::String,
            ..Default::default()
        };
        assert_eq!(
            formatted_tantivy_value_to_json(
                TantivyValue::U64(1),
                &LeafType::U64(numeric_options_str)
            )
            .unwrap(),
            serde_json::json!("1")
        );
    }
}


================================================
FILE: quickwit/quickwit-doc-mapper/src/doc_mapper/tokenizer_entry.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use anyhow::Context;
use quickwit_query::{CodeTokenizer, DEFAULT_REMOVE_TOKEN_LENGTH};
use serde::{Deserialize, Serialize};
use tantivy::tokenizer::{
    AsciiFoldingFilter, LowerCaser, NgramTokenizer, RegexTokenizer, RemoveLongFilter,
    SimpleTokenizer, TextAnalyzer, Token,
};

/// A `TokenizerEntry` defines a custom tokenizer with its name and configuration.
#[derive(Clone, Serialize, Deserialize, Debug, PartialEq, Eq, Hash, utoipa::ToSchema)]
pub struct TokenizerEntry {
    /// Tokenizer name.
    pub name: String,
    /// Tokenizer configuration.
    #[serde(flatten)]
    pub(crate) config: TokenizerConfig,
}

/// Tokenizer configuration.
#[derive(Clone, Serialize, Deserialize, Debug, PartialEq, Eq, Hash, utoipa::ToSchema)]
pub struct TokenizerConfig {
    #[serde(flatten)]
    pub(crate) tokenizer_type: TokenizerType,
    #[serde(default)]
    pub(crate) filters: Vec<TokenFilterType>,
}

impl TokenizerConfig {
    /// Build a `TextAnalyzer` from a `TokenizerConfig`.
    pub fn text_analyzer(&self) -> anyhow::Result<TextAnalyzer> {
        let mut text_analyzer_builder = match &self.tokenizer_type {
            TokenizerType::Simple => TextAnalyzer::builder(SimpleTokenizer::default()).dynamic(),
            TokenizerType::SourceCode => TextAnalyzer::builder(CodeTokenizer::default()).dynamic(),
            TokenizerType::Ngram(options) => {
                let tokenizer =
                    NgramTokenizer::new(options.min_gram, options.max_gram, options.prefix_only)
                        .with_context(|| "invalid ngram tokenizer".to_string())?;
                TextAnalyzer::builder(tokenizer).dynamic()
            }
            TokenizerType::Regex(options) => {
                let tokenizer = RegexTokenizer::new(&options.pattern)
                    .with_context(|| "invalid regex tokenizer".to_string())?;
                TextAnalyzer::builder(tokenizer).dynamic()
            }
        };
        for filter in &self.filters {
            match filter.tantivy_token_filter_enum() {
                TantivyTokenFilterEnum::RemoveLong(token_filter) => {
                    text_analyzer_builder = text_analyzer_builder.filter_dynamic(token_filter);
                }
                TantivyTokenFilterEnum::LowerCaser(token_filter) => {
                    text_analyzer_builder = text_analyzer_builder.filter_dynamic(token_filter);
                }
                TantivyTokenFilterEnum::AsciiFolding(token_filter) => {
                    text_analyzer_builder = text_analyzer_builder.filter_dynamic(token_filter);
                }
            }
        }
        Ok(text_analyzer_builder.build())
    }
}

/// Helper function to analyze a text with a given `TokenizerConfig`.
pub fn analyze_text(text: &str, tokenizer: &TokenizerConfig) -> anyhow::Result<Vec<Token>> {
    let mut text_analyzer = tokenizer.text_analyzer()?;
    let mut token_stream = text_analyzer.token_stream(text);
    let mut tokens = Vec::new();
    token_stream.process(&mut |token| {
        tokens.push(token.clone());
    });
    Ok(tokens)
}

#[derive(Clone, Debug, PartialEq, Eq, Hash, Serialize, Deserialize, utoipa::ToSchema)]
#[serde(rename_all = "snake_case")]
pub enum TokenFilterType {
    RemoveLong,
    LowerCaser,
    AsciiFolding,
}

/// Tantivy token filter enum to build
/// a `TextAnalyzer` with dynamic token filters.
enum TantivyTokenFilterEnum {
    RemoveLong(RemoveLongFilter),
    LowerCaser(LowerCaser),
    AsciiFolding(AsciiFoldingFilter),
}

impl TokenFilterType {
    fn tantivy_token_filter_enum(&self) -> TantivyTokenFilterEnum {
        match &self {
            Self::RemoveLong => TantivyTokenFilterEnum::RemoveLong(RemoveLongFilter::limit(
                DEFAULT_REMOVE_TOKEN_LENGTH,
            )),
            Self::LowerCaser => TantivyTokenFilterEnum::LowerCaser(LowerCaser),
            Self::AsciiFolding => TantivyTokenFilterEnum::AsciiFolding(AsciiFoldingFilter),
        }
    }
}

#[derive(Clone, Debug, PartialEq, Eq, Hash, Serialize, Deserialize, utoipa::ToSchema)]
#[serde(tag = "type", rename_all = "snake_case")]
pub enum TokenizerType {
    Ngram(NgramTokenizerOption),
    Regex(RegexTokenizerOption),
    Simple,
    SourceCode,
}

#[derive(Clone, Serialize, Deserialize, Debug, PartialEq, Eq, Hash, utoipa::ToSchema)]
#[serde(deny_unknown_fields)]
pub struct NgramTokenizerOption {
    pub min_gram: usize,
    pub max_gram: usize,
    #[serde(default)]
    pub prefix_only: bool,
}

#[derive(Clone, Serialize, Deserialize, Debug, PartialEq, Eq, Hash, utoipa::ToSchema)]
#[serde(deny_unknown_fields)]
pub struct RegexTokenizerOption {
    pub pattern: String,
}

#[cfg(test)]
mod tests {
    use super::{NgramTokenizerOption, TokenizerType};
    use crate::TokenizerEntry;
    use crate::doc_mapper::RegexTokenizerOption;

    #[test]
    fn test_deserialize_tokenizer_entry() {
        let result: Result<TokenizerEntry, serde_json::Error> =
            serde_json::from_str::<TokenizerEntry>(
                r#"
            {
                "name": "my_tokenizer",
                "type": "ngram",
                "min_gram": 1,
                "max_gram": 3,
                "filters": [
                    "remove_long",
                    "lower_caser",
                    "ascii_folding"
                ]
            }
            "#,
            );
        assert!(result.is_ok());
        let tokenizer_config_entry = result.unwrap();
        assert_eq!(tokenizer_config_entry.config.filters.len(), 3);
        match tokenizer_config_entry.config.tokenizer_type {
            TokenizerType::Ngram(options) => {
                assert_eq!(
                    options,
                    NgramTokenizerOption {
                        min_gram: 1,
                        max_gram: 3,
                        prefix_only: false,
                    }
                )
            }
            _ => panic!("Unexpected tokenizer type"),
        }
    }

    #[test]
    fn test_deserialize_tokenizer_entry_failed_with_wrong_key() {
        let result: Result<TokenizerEntry, serde_json::Error> =
            serde_json::from_str::<TokenizerEntry>(
                r#"
            {
                "name": "my_tokenizer",
                "type": "ngram",
                "min_gram": 1,
                "max_gram": 3,
                "filters": [
                    "remove_long",
                    "lower_caser",
                    "ascii_folding"
                ],
                "abc": 123
            }
            "#,
            );
        assert!(result.is_err());
        assert!(
            result
                .unwrap_err()
                .to_string()
                .contains("unknown field `abc`")
        );
    }

    #[test]
    fn test_tokenizer_entry_regex() {
        let result: Result<TokenizerEntry, serde_json::Error> =
            serde_json::from_str::<TokenizerEntry>(
                r#"
            {
                "name": "my_tokenizer",
                "type": "regex",
                "pattern": "(my_pattern)"
            }
            "#,
            );
        assert!(result.is_ok());
        let tokenizer_config_entry = result.unwrap();
        assert_eq!(tokenizer_config_entry.config.filters.len(), 0);
        match tokenizer_config_entry.config.tokenizer_type {
            TokenizerType::Regex(options) => {
                assert_eq!(
                    options,
                    RegexTokenizerOption {
                        pattern: "(my_pattern)".to_string(),
                    }
                )
            }
            _ => panic!("Unexpected tokenizer type"),
        }
    }
}


================================================
FILE: quickwit/quickwit-doc-mapper/src/doc_mapping.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::BTreeSet;
use std::num::NonZeroU32;

use quickwit_proto::types::DocMappingUid;
use serde::{Deserialize, Serialize};

use crate::{FieldMappingEntry, QuickwitJsonOptions, TokenizerEntry};

/// Defines how unmapped fields should be handled.
#[derive(Clone, Copy, Default, Debug, Eq, PartialEq, Serialize, Deserialize, utoipa::ToSchema)]
#[serde(rename_all = "lowercase")]
pub enum ModeType {
    /// Lenient mode: ignores unmapped fields.
    Lenient,
    /// Strict mode: returns an error when an unmapped field is encountered.
    Strict,
    /// Dynamic mode: captures and handles unmapped fields according to the dynamic field
    /// configuration.
    #[default]
    Dynamic,
}

/// Defines how unmapped fields should be handled.
#[derive(Clone, Debug, Serialize, Deserialize, PartialEq)]
pub enum Mode {
    /// Lenient mode: ignores unmapped fields.
    Lenient,
    /// Strict mode: returns an error when an unmapped field is encountered.
    Strict,
    /// Dynamic mode: captures and handles unmapped fields according to the dynamic field
    /// configuration.
    Dynamic(QuickwitJsonOptions),
}

impl Mode {
    /// Extracts the [`ModeType`] of this [`Mode`]
    pub fn mode_type(&self) -> ModeType {
        match self {
            Self::Lenient => ModeType::Lenient,
            Self::Strict => ModeType::Strict,
            Self::Dynamic(_) => ModeType::Dynamic,
        }
    }

    /// Builds a [`Mode`] from its type and optional dynamic mapping options.
    pub fn from_parts(
        mode: ModeType,
        dynamic_mapping: Option<QuickwitJsonOptions>,
    ) -> anyhow::Result<Mode> {
        Ok(match (mode, dynamic_mapping) {
            (ModeType::Lenient, None) => Self::Lenient,
            (ModeType::Strict, None) => Self::Strict,
            (ModeType::Dynamic, Some(dynamic_mapping)) => Self::Dynamic(dynamic_mapping),
            (ModeType::Dynamic, None) => Self::default(), // Dynamic with default options
            (_, Some(_)) => anyhow::bail!(
                "`dynamic_mapping` is only allowed with mode=dynamic. (here mode=`{:?}`)",
                mode
            ),
        })
    }

    /// Obtains the mode type and dynamic options from a [`Mode`].
    pub fn into_parts(self) -> (ModeType, Option<QuickwitJsonOptions>) {
        match self {
            Self::Lenient => (ModeType::Lenient, None),
            Self::Strict => (ModeType::Strict, None),
            Self::Dynamic(json_options) => (ModeType::Dynamic, Some(json_options)),
        }
    }
}

impl Default for Mode {
    fn default() -> Self {
        Self::Dynamic(QuickwitJsonOptions::default_dynamic())
    }
}

/// Defines how the document of an index should be parsed, tokenized, partitioned, indexed, and
/// stored.
#[quickwit_macros::serde_multikey]
#[derive(Clone, Debug, PartialEq, Serialize, Deserialize, utoipa::ToSchema)]
#[serde(deny_unknown_fields)]
pub struct DocMapping {
    /// Doc mapping UID.
    ///
    /// Splits with the same doc mapping UID share the same schema and should use the same doc
    /// mapper during indexing and querying.
    #[serde(default = "DocMappingUid::random")]
    pub doc_mapping_uid: DocMappingUid,

    /// Defines how unmapped fields should be handled.
    #[serde_multikey(
        deserializer = Mode::from_parts,
        serializer = Mode::into_parts,
        fields = (
            #[serde(default)]
            mode: ModeType,
            #[serde(skip_serializing_if = "Option::is_none")]
            dynamic_mapping: Option<QuickwitJsonOptions>
        ),
    )]
    pub mode: Mode,

    /// Defines the schema of ingested documents and describes how each field value should be
    /// parsed, tokenized, indexed, and stored.
    #[serde(default)]
    #[schema(value_type = Vec<FieldMappingEntryForSerialization>)]
    pub field_mappings: Vec<FieldMappingEntry>,

    /// Declares the field which contains the date or timestamp at which the document
    /// was emitted.
    #[serde(default)]
    pub timestamp_field: Option<String>,

    /// Declares the low cardinality fields for which the values ​​are recorded directly in the
    /// splits metadata.
    #[schema(value_type = Vec<String>)]
    #[serde(default)]
    pub tag_fields: BTreeSet<String>,

    /// Expresses via a "mini-DSL" how to route documents to split partitions.
    #[serde(default)]
    #[serde(skip_serializing_if = "Option::is_none")]
    pub partition_key: Option<String>,

    /// The maximum number of partitions that an indexer can generate.
    #[schema(value_type = u32)]
    #[serde(default = "DocMapping::default_max_num_partitions")]
    pub max_num_partitions: NonZeroU32,

    /// Whether to record the presence of the fields of each indexed document to allow `exists`
    /// queries.
    #[serde(default)]
    pub index_field_presence: bool,

    /// Whether to record and store the size (bytes) of each ingested document in a fast field.
    #[serde(alias = "document_length")]
    #[serde(default)]
    pub store_document_size: bool,

    /// Whether to store the original source documents in the doc store.
    #[serde(default)]
    pub store_source: bool,

    /// A set of additional user-defined tokenizers to be used during indexing.
    #[serde(default)]
    pub tokenizers: Vec<TokenizerEntry>,
}

impl DocMapping {
    /// Returns the default value for `max_num_partitions`.
    pub fn default_max_num_partitions() -> NonZeroU32 {
        NonZeroU32::new(200).unwrap()
    }
}

#[cfg(test)]
mod tests {
    use super::*;
    use crate::doc_mapper::{QuickwitNumericOptions, QuickwitTextOptions};
    use crate::{
        Cardinality, FieldMappingType, RegexTokenizerOption, TokenFilterType, TokenizerConfig,
        TokenizerType,
    };

    #[test]
    fn test_doc_mapping_serde_roundtrip() {
        let doc_mapping = DocMapping {
            doc_mapping_uid: DocMappingUid::random(),
            mode: Mode::Strict,
            field_mappings: vec![
                FieldMappingEntry {
                    name: "timestamp".to_string(),
                    mapping_type: FieldMappingType::U64(
                        QuickwitNumericOptions::default(),
                        Cardinality::SingleValued,
                    ),
                },
                FieldMappingEntry {
                    name: "message".to_string(),
                    mapping_type: FieldMappingType::Text(
                        QuickwitTextOptions::default(),
                        Cardinality::SingleValued,
                    ),
                },
            ],
            timestamp_field: Some("timestamp".to_string()),
            tag_fields: BTreeSet::from_iter(["level".to_string()]),
            partition_key: Some("tenant_id".to_string()),
            max_num_partitions: NonZeroU32::new(100).unwrap(),
            index_field_presence: true,
            store_document_size: true,
            store_source: true,
            tokenizers: vec![TokenizerEntry {
                name: "whitespace".to_string(),
                config: TokenizerConfig {
                    tokenizer_type: TokenizerType::Regex(RegexTokenizerOption {
                        pattern: r"\s+".to_string(),
                    }),
                    filters: vec![TokenFilterType::LowerCaser],
                },
            }],
        };
        let serialized = serde_json::to_string(&doc_mapping).unwrap();
        let deserialized: DocMapping = serde_json::from_str(&serialized).unwrap();
        assert_eq!(deserialized, doc_mapping);
    }

    #[test]
    fn test_doc_mapping_serde_default_values() {
        let doc_mapping: DocMapping = serde_json::from_str("{}").unwrap();
        assert_eq!(
            doc_mapping.mode,
            Mode::Dynamic(QuickwitJsonOptions::default_dynamic())
        );
        assert!(doc_mapping.field_mappings.is_empty());
        assert_eq!(doc_mapping.timestamp_field, None);
        assert!(doc_mapping.tag_fields.is_empty());
        assert_eq!(doc_mapping.partition_key, None);
        assert_eq!(
            doc_mapping.max_num_partitions,
            NonZeroU32::new(200).unwrap()
        );
        assert_eq!(doc_mapping.index_field_presence, false);
        assert_eq!(doc_mapping.store_document_size, false);
        assert_eq!(doc_mapping.store_source, false);
    }
}


================================================
FILE: quickwit/quickwit-doc-mapper/src/error.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use quickwit_query::InvalidQuery;
use tantivy::schema::DocParsingError as TantivyDocParsingError;
use thiserror::Error;

/// Failed to parse query.
#[derive(Error, Debug)]
#[allow(missing_docs)]
pub enum QueryParserError {
    #[error("invalid json: {0}")]
    InvalidJson(#[from] serde_json::Error),
    #[error("invalid query: {0}")]
    InvalidQuery(#[from] InvalidQuery),
    #[error("invalid default search field: `{field_name}` {cause}")]
    InvalidDefaultField {
        cause: &'static str,
        field_name: String,
    },
    #[error("{0}")]
    Other(#[from] anyhow::Error),
}

/// Error that may happen when parsing
/// a document from JSON.
#[derive(Debug, Error, Eq, PartialEq)]
pub enum DocParsingError {
    /// The provided string is not a syntactically valid JSON object.
    #[error("the provided string is not a syntactically valid JSON object: {0}")]
    NotJsonObject(String),
    /// One of the value could not be parsed.
    #[error("the field `{0}` could not be parsed: {1}")]
    ValueError(String, String),
    /// The json-document contains a field that is not declared in the schema.
    #[error("the document contains a field that is not declared in the schema: {0:?}")]
    NoSuchFieldInSchema(String),
    /// The document contains a array of values but a single value is expected.
    #[error("the document contains an array of values but a single value is expected: {0:?}")]
    MultiValuesNotSupported(String),
    /// The document does not contain a field that is required.
    #[error("the document must contain field {0:?}")]
    RequiredField(String),
}

impl From<TantivyDocParsingError> for DocParsingError {
    fn from(value: TantivyDocParsingError) -> Self {
        match value {
            TantivyDocParsingError::InvalidJson(text) => DocParsingError::NoSuchFieldInSchema(text),
            TantivyDocParsingError::ValueError(text, error) => {
                DocParsingError::ValueError(text, format!("{error:?}"))
            }
        }
    }
}


================================================
FILE: quickwit/quickwit-doc-mapper/src/lib.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#![warn(missing_docs)]
#![allow(clippy::bool_assert_comparison)]
#![deny(clippy::disallowed_methods)]

//! Index config defines how to configure an index and especially how
//! to convert a json like documents to a document indexable by tantivy
//! engine, aka tantivy::Document.

mod doc_mapper;
mod doc_mapping;
mod error;
mod query_builder;
mod routing_expression;

/// Pruning tags manipulation.
pub mod tag_pruning;

pub use doc_mapper::{
    Automaton, BinaryFormat, DocMapper, DocMapperBuilder, FastFieldWarmupInfo, FieldMappingEntry,
    FieldMappingType, JsonObject, NamedField, QuickwitBytesOptions, QuickwitJsonOptions, TermRange,
    TokenizerConfig, TokenizerEntry, WarmupInfo, analyze_text,
};
use doc_mapper::{
    FastFieldOptions, FieldMappingEntryForSerialization, IndexRecordOptionSchema,
    NgramTokenizerOption, QuickwitTextNormalizer, QuickwitTextTokenizer, RegexTokenizerOption,
    TokenFilterType, TokenizerType,
};
pub use doc_mapping::{DocMapping, Mode, ModeType};
pub use error::{DocParsingError, QueryParserError};
use quickwit_common::shared_consts::FIELD_PRESENCE_FIELD_NAME;
use quickwit_proto::types::DocMappingUid;
pub use routing_expression::RoutingExpr;

/// Field name reserved for storing the source document.
pub const SOURCE_FIELD_NAME: &str = "_source";

/// Field name reserved for storing the dynamically indexed fields.
pub const DYNAMIC_FIELD_NAME: &str = "_dynamic";

/// Field name reserved for storing the length of source document.
pub const DOCUMENT_SIZE_FIELD_NAME: &str = "_doc_length";

/// Quickwit reserved field names.
const QW_RESERVED_FIELD_NAMES: &[&str] = &[
    DOCUMENT_SIZE_FIELD_NAME,
    DYNAMIC_FIELD_NAME,
    FIELD_PRESENCE_FIELD_NAME,
    SOURCE_FIELD_NAME,
];

/// Cardinality of a field.
#[derive(Debug, Clone, Copy, PartialEq, Eq, PartialOrd, Ord, Hash)]
pub enum Cardinality {
    /// Single-valued field.
    SingleValued,
    /// Multivalued field.
    MultiValued,
}

#[derive(utoipa::OpenApi)]
#[openapi(components(schemas(
    DocMappingUid,
    FastFieldOptions,
    FieldMappingEntryForSerialization,
    IndexRecordOptionSchema,
    ModeType,
    NgramTokenizerOption,
    QuickwitJsonOptions,
    QuickwitTextNormalizer,
    QuickwitTextTokenizer,
    RegexTokenizerOption,
    TokenFilterType,
    TokenizerConfig,
    TokenizerEntry,
    TokenizerType,
)))]
/// Schema used for the OpenAPI generation which are apart of this crate.
pub struct DocMapperApiSchemas;

/// Returns a default `DefaultIndexConfig` for unit tests.
#[cfg(any(test, feature = "testsuite"))]
pub fn default_doc_mapper_for_test() -> DocMapper {
    const JSON_CONFIG_VALUE: &str = r#"
        {
            "store_source": true,
            "index_field_presence": true,
            "default_search_fields": [
                "body", "attributes.server", "attributes.server\\.status"
            ],
            "timestamp_field": "timestamp",
            "tag_fields": ["owner"],
            "field_mappings": [
                {
                    "name": "timestamp",
                    "type": "datetime",
                    "output_format": "unix_timestamp_secs",
                    "fast": true
                },
                {
                    "name": "body",
                    "type": "text",
                    "stored": true
                },
                {
                    "name": "response_date",
                    "type": "datetime",
                    "input_formats": ["rfc3339", "unix_timestamp"],
                    "fast": true
                },
                {
                    "name": "response_time",
                    "type": "f64",
                    "fast": true
                },
                {
                    "name": "response_payload",
                    "type": "bytes",
                    "fast": true
                },
                {
                    "name": "owner",
                    "type": "text",
                    "tokenizer": "raw"
                },
                {
                    "name": "isImportant",
                    "type": "bool"
                },
                {
                    "name": "properties",
                    "type": "json"
                },
                {
                    "name": "children",
                    "type": "array<json>"
                },
                {
                    "name": "attributes",
                    "type": "object",
                    "field_mappings": [
                        {
                            "name": "tags",
                            "type": "array<i64>"
                        },
                        {
                            "name": "server",
                            "type": "text"
                        },
                        {
                            "name": "server.status",
                            "type": "array<text>"
                        },
                        {
                            "name": "server.payload",
                            "type": "array<bytes>"
                        }
                    ]
                }
            ]
        }"#;
    serde_json::from_str::<DocMapper>(JSON_CONFIG_VALUE).unwrap()
}


================================================
FILE: quickwit/quickwit-doc-mapper/src/query_builder.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::{HashMap, HashSet};
use std::convert::Infallible;
use std::ops::Bound;
use std::sync::Arc;

use quickwit_proto::types::SplitId;
use quickwit_query::query_ast::{
    BuildTantivyAstContext, FieldPresenceQuery, FullTextQuery, PhrasePrefixQuery, QueryAst,
    QueryAstTransformer, QueryAstVisitor, RangeQuery, RegexQuery, TermSetQuery, WildcardQuery,
};
use quickwit_query::tokenizers::TokenizerManager;
use quickwit_query::{InvalidQuery, find_field_or_hit_dynamic};
use tantivy::Term;
use tantivy::query::Query;
use tantivy::schema::{Field, Schema};
use tracing::error;

use crate::doc_mapper::FastFieldWarmupInfo;
use crate::{Automaton, QueryParserError, TermRange, WarmupInfo};

#[derive(Default)]
struct RangeQueryFields {
    range_query_field_names: HashSet<String>,
}

impl<'a> QueryAstVisitor<'a> for RangeQueryFields {
    type Err = Infallible;

    fn visit_range(&mut self, range_query: &'a RangeQuery) -> Result<(), Infallible> {
        self.range_query_field_names
            .insert(range_query.field.to_string());
        Ok(())
    }
}

/// Term Queries on fields which are fast but not indexed.
struct TermSearchOnColumnar<'f> {
    fields: &'f mut HashSet<FastFieldWarmupInfo>,
    schema: Schema,
}
impl<'a, 'f> QueryAstVisitor<'a> for TermSearchOnColumnar<'f> {
    type Err = Infallible;

    fn visit_term_set(&mut self, term_set_query: &'a TermSetQuery) -> Result<(), Infallible> {
        for field in term_set_query.terms_per_field.keys() {
            if let Some((_field, field_entry, path)) =
                find_field_or_hit_dynamic(field, &self.schema)
                && field_entry.is_fast()
                && !field_entry.is_indexed()
            {
                self.fields.insert(FastFieldWarmupInfo {
                    name: if path.is_empty() {
                        field_entry.name().to_string()
                    } else {
                        format!("{}.{}", field_entry.name(), path)
                    },
                    with_subfields: false,
                });
            }
        }
        Ok(())
    }

    fn visit_term(
        &mut self,
        term_query: &'a quickwit_query::query_ast::TermQuery,
    ) -> Result<(), Infallible> {
        if let Some((_field, field_entry, path)) =
            find_field_or_hit_dynamic(&term_query.field, &self.schema)
            && field_entry.is_fast()
            && !field_entry.is_indexed()
        {
            self.fields.insert(FastFieldWarmupInfo {
                name: if path.is_empty() {
                    field_entry.name().to_string()
                } else {
                    format!("{}.{}", field_entry.name(), path)
                },
                with_subfields: false,
            });
        }
        Ok(())
    }
    /// We also need to visit full text queries because they can be converted to term queries
    /// on fast fields. We only care about the field being fast and not indexed AND the tokenizer
    /// being `raw` or None.
    fn visit_full_text(&mut self, full_text_query: &'a FullTextQuery) -> Result<(), Infallible> {
        if let Some((_field, field_entry, path)) =
            find_field_or_hit_dynamic(&full_text_query.field, &self.schema)
            && field_entry.is_fast()
            && !field_entry.is_indexed()
            && (full_text_query.params.tokenizer.is_none()
                || full_text_query.params.tokenizer.as_deref() == Some("raw"))
        {
            self.fields.insert(FastFieldWarmupInfo {
                name: if path.is_empty() {
                    field_entry.name().to_string()
                } else {
                    format!("{}.{}", field_entry.name(), path)
                },
                with_subfields: false,
            });
        }
        Ok(())
    }
}

struct ExistsQueryFastFields<'f> {
    fields: &'f mut HashSet<FastFieldWarmupInfo>,
    schema: Schema,
}

impl<'a, 'f> QueryAstVisitor<'a> for ExistsQueryFastFields<'f> {
    type Err = Infallible;

    fn visit_exists(&mut self, exists_query: &'a FieldPresenceQuery) -> Result<(), Infallible> {
        let fields = exists_query.find_field_and_subfields(&self.schema);
        for (_, field_entry, path) in fields {
            if field_entry.is_fast() {
                if field_entry.field_type().is_json() {
                    let full_path = format!("{}.{}", field_entry.name(), path);
                    self.fields.insert(FastFieldWarmupInfo {
                        name: full_path,
                        with_subfields: true,
                    });
                } else if path.is_empty() {
                    self.fields.insert(FastFieldWarmupInfo {
                        name: field_entry.name().to_string(),
                        with_subfields: false,
                    });
                } else {
                    error!(
                        field_entry = field_entry.name(),
                        path, "only JSON type supports subfields"
                    );
                }
            }
        }
        Ok(())
    }
}

/// Build a `Query` with field resolution & forbidding range clauses.
pub(crate) fn build_query(
    query_ast: QueryAst,
    context: &BuildTantivyAstContext,
    cache_context: Option<(Arc<dyn quickwit_query::query_ast::PredicateCache>, SplitId)>,
) -> Result<(Box<dyn Query>, WarmupInfo), QueryParserError> {
    let mut fast_fields: HashSet<FastFieldWarmupInfo> = HashSet::new();

    let query_ast = if let Some((cache, split_id)) = cache_context {
        let Ok(query_ast) = quickwit_query::query_ast::PredicateCacheInjector { cache, split_id }
            .transform(query_ast);
        // this transformer isn't supposed to ever remove a node
        query_ast.unwrap_or(QueryAst::MatchAll)
    } else {
        query_ast
    };

    let mut range_query_fields = RangeQueryFields::default();
    // This cannot fail. The error type is Infallible.
    let Ok(_) = range_query_fields.visit(&query_ast);
    let range_query_fast_fields =
        range_query_fields
            .range_query_field_names
            .into_iter()
            .map(|name| FastFieldWarmupInfo {
                name,
                with_subfields: false,
            });
    fast_fields.extend(range_query_fast_fields);

    let Ok(_) = TermSearchOnColumnar {
        fields: &mut fast_fields,
        schema: context.schema.clone(),
    }
    .visit(&query_ast);

    let Ok(_) = ExistsQueryFastFields {
        fields: &mut fast_fields,
        schema: context.schema.clone(),
    }
    .visit(&query_ast);

    let query = query_ast.build_tantivy_query(context)?;

    let term_set_query_fields = extract_term_set_query_fields(&query_ast, context.schema)?;
    let (term_ranges_grouped_by_field, automatons_grouped_by_field) =
        extract_prefix_term_ranges_and_automaton(
            &query_ast,
            context.schema,
            context.tokenizer_manager,
        )?;

    let mut terms_grouped_by_field: HashMap<Field, HashMap<_, bool>> = Default::default();
    query.query_terms(&mut |term, need_position| {
        let field = term.field();
        if !context.schema.get_field_entry(field).is_indexed() {
            return;
        }
        *terms_grouped_by_field
            .entry(field)
            .or_default()
            .entry(term.clone())
            .or_default() |= need_position;
    });

    let warmup_info = WarmupInfo {
        term_dict_fields: term_set_query_fields,
        terms_grouped_by_field,
        term_ranges_grouped_by_field,
        fast_fields,
        automatons_grouped_by_field,
        ..WarmupInfo::default()
    };

    Ok((query, warmup_info))
}

struct ExtractTermSetFields<'a> {
    term_dict_fields_to_warm_up: HashSet<Field>,
    schema: &'a Schema,
}

impl<'a> ExtractTermSetFields<'a> {
    fn new(schema: &'a Schema) -> Self {
        ExtractTermSetFields {
            term_dict_fields_to_warm_up: HashSet::new(),
            schema,
        }
    }
}

impl<'a> QueryAstVisitor<'a> for ExtractTermSetFields<'_> {
    type Err = anyhow::Error;

    fn visit_term_set(&mut self, term_set_query: &'a TermSetQuery) -> anyhow::Result<()> {
        for field in term_set_query.terms_per_field.keys() {
            if let Some((field, _field_entry, _path)) =
                find_field_or_hit_dynamic(field, self.schema)
            {
                self.term_dict_fields_to_warm_up.insert(field);
            } else {
                anyhow::bail!("field does not exist: {}", field);
            }
        }
        Ok(())
    }
}

fn extract_term_set_query_fields(
    query_ast: &QueryAst,
    schema: &Schema,
) -> anyhow::Result<HashSet<Field>> {
    let mut visitor = ExtractTermSetFields::new(schema);
    visitor.visit(query_ast)?;
    Ok(visitor.term_dict_fields_to_warm_up)
}

/// Converts a `prefix` term into the equivalent term range.
///
/// The resulting range is `[prefix, next_prefix)`, that is:
/// - start bound: `Included(prefix)`
/// - end bound: `Excluded(next lexicographic term after the prefix)`
///
/// "abc"    -> start: "abc", end: "abd" (excluded)
/// "ab\xFF" -> start: "ab\xFF", end: "ac" (excluded)
/// "\xFF\xFF" -> start: "\xFF\xFF", end: Unbounded
fn prefix_term_to_range(prefix: Term) -> (Bound<Term>, Bound<Term>) {
    // Start from the given prefix and try to find the successor
    let mut end_bound = prefix.clone();
    let mut end_bound_value_bytes = prefix.serialized_value_bytes().to_vec();
    while !end_bound_value_bytes.is_empty() {
        let last_byte = end_bound_value_bytes.last_mut().unwrap();
        if *last_byte != u8::MAX {
            *last_byte += 1;
            // The last non-`u8::MAX` byte incremented
            // gives us the exclusive upper bound.
            end_bound.set_bytes(&end_bound_value_bytes);
            return (Bound::Included(prefix), Bound::Excluded(end_bound));
        }
        // pop u8::MAX byte and try next
        end_bound_value_bytes.pop();
    }
    // All bytes were `u8::MAX`: there is no successor, so the upper bound is unbounded.
    (Bound::Included(prefix), Bound::Unbounded)
}

type PositionNeeded = bool;

struct ExtractPrefixTermRanges<'a> {
    schema: &'a Schema,
    tokenizer_manager: &'a TokenizerManager,
    term_ranges_to_warm_up: HashMap<Field, HashMap<TermRange, PositionNeeded>>,
    automatons_to_warm_up: HashMap<Field, HashSet<Automaton>>,
}

impl<'a> ExtractPrefixTermRanges<'a> {
    fn with_schema(schema: &'a Schema, tokenizer_manager: &'a TokenizerManager) -> Self {
        ExtractPrefixTermRanges {
            schema,
            tokenizer_manager,
            term_ranges_to_warm_up: HashMap::new(),
            automatons_to_warm_up: HashMap::new(),
        }
    }

    fn add_prefix_term(
        &mut self,
        term: Term,
        max_expansions: u32,
        position_needed: PositionNeeded,
    ) {
        let field = term.field();
        let (start, end) = prefix_term_to_range(term);
        let term_range = TermRange {
            start,
            end,
            limit: Some(max_expansions as u64),
        };
        *self
            .term_ranges_to_warm_up
            .entry(field)
            .or_default()
            .entry(term_range)
            .or_default() |= position_needed;
    }

    fn add_automaton(&mut self, field: Field, automaton: Automaton) {
        self.automatons_to_warm_up
            .entry(field)
            .or_default()
            .insert(automaton);
    }
}

impl<'a, 'b: 'a> QueryAstVisitor<'a> for ExtractPrefixTermRanges<'b> {
    type Err = InvalidQuery;

    fn visit_full_text(&mut self, full_text_query: &'a FullTextQuery) -> Result<(), Self::Err> {
        if let Some(prefix_term) =
            full_text_query.get_prefix_term(self.schema, self.tokenizer_manager)
        {
            // the max_expansion expansion of a bool prefix query is used for the fuzzy part of the
            // query, not for the expension to a range request.
            // see https://github.com/elastic/elasticsearch/blob/6ad48306d029e6e527c0481e2e9880bd2f06b239/docs/reference/query-dsl/match-bool-prefix-query.asciidoc#parameters
            self.add_prefix_term(prefix_term, u32::MAX, false);
        }
        Ok(())
    }

    fn visit_phrase_prefix(
        &mut self,
        phrase_prefix: &'a PhrasePrefixQuery,
    ) -> Result<(), Self::Err> {
        let terms = match phrase_prefix.get_terms(self.schema, self.tokenizer_manager) {
            Ok((_, terms)) => terms,
            Err(InvalidQuery::SchemaError(_)) | Err(InvalidQuery::FieldDoesNotExist { .. }) => {
                return Ok(());
            } /* the query will be nullified when casting to a tantivy ast */
            Err(e) => return Err(e),
        };
        if let Some((_, term)) = terms.last() {
            self.add_prefix_term(term.clone(), phrase_prefix.max_expansions, terms.len() > 1);
        }
        Ok(())
    }

    fn visit_wildcard(&mut self, wildcard_query: &'a WildcardQuery) -> Result<(), Self::Err> {
        let (field, path, regex) =
            match wildcard_query.to_regex(self.schema, self.tokenizer_manager) {
                Ok(res) => res,
                /* the query will be nullified when casting to a tantivy ast */
                Err(InvalidQuery::FieldDoesNotExist { .. }) => return Ok(()),
                Err(e) => return Err(e),
            };

        self.add_automaton(field, Automaton::Regex(path, regex));
        Ok(())
    }

    fn visit_regex(&mut self, regex_query: &'a RegexQuery) -> Result<(), Self::Err> {
        let (field, path, regex) = match regex_query.to_field_and_regex(self.schema) {
            Ok(res) => res,
            /* the query will be nullified when casting to a tantivy ast */
            Err(InvalidQuery::FieldDoesNotExist { .. }) => return Ok(()),
            Err(e) => return Err(e),
        };
        self.add_automaton(field, Automaton::Regex(path, regex));
        Ok(())
    }
}

type TermRangeWarmupInfo = HashMap<Field, HashMap<TermRange, PositionNeeded>>;
type AutomatonWarmupInfo = HashMap<Field, HashSet<Automaton>>;

fn extract_prefix_term_ranges_and_automaton(
    query_ast: &QueryAst,
    schema: &Schema,
    tokenizer_manager: &TokenizerManager,
) -> anyhow::Result<(TermRangeWarmupInfo, AutomatonWarmupInfo)> {
    let mut visitor = ExtractPrefixTermRanges::with_schema(schema, tokenizer_manager);
    visitor.visit(query_ast)?;
    Ok((
        visitor.term_ranges_to_warm_up,
        visitor.automatons_to_warm_up,
    ))
}

#[cfg(test)]
mod test {
    use std::ops::Bound;

    use quickwit_common::shared_consts::FIELD_PRESENCE_FIELD_NAME;
    use quickwit_query::query_ast::{
        BuildTantivyAstContext, FullTextMode, FullTextParams, PhrasePrefixQuery, QueryAstVisitor,
        UserInputQuery, query_ast_from_user_text,
    };
    use quickwit_query::{
        BooleanOperand, MatchAllOrNone, create_default_quickwit_tokenizer_manager,
    };
    use tantivy::Term;
    use tantivy::schema::{DateOptions, DateTimePrecision, FAST, INDEXED, STORED, Schema, TEXT};

    use super::{ExtractPrefixTermRanges, build_query};
    use crate::{DYNAMIC_FIELD_NAME, SOURCE_FIELD_NAME, TermRange};

    enum TestExpectation<'a> {
        Err(&'a str),
        Ok(&'a str),
    }

    fn make_schema(dynamic_mode: bool) -> Schema {
        let mut schema_builder = Schema::builder();
        schema_builder.add_i64_field(FIELD_PRESENCE_FIELD_NAME, INDEXED);
        schema_builder.add_text_field("title", TEXT);
        schema_builder.add_text_field("desc", TEXT | STORED);
        schema_builder.add_text_field("server.name", TEXT | STORED);
        schema_builder.add_text_field("server.mem", TEXT);
        schema_builder.add_bool_field("server.running", FAST | STORED | INDEXED);
        schema_builder.add_text_field(SOURCE_FIELD_NAME, TEXT);
        schema_builder.add_ip_addr_field("ip", FAST | STORED);
        schema_builder.add_ip_addr_field("ips", FAST);
        schema_builder.add_ip_addr_field("ip_notff", STORED);
        let date_options = DateOptions::default()
            .set_fast()
            .set_precision(DateTimePrecision::Milliseconds);
        schema_builder.add_date_field("dt", date_options);
        schema_builder.add_u64_field("u64_fast", FAST | STORED);
        schema_builder.add_i64_field("i64_fast", FAST | STORED);
        schema_builder.add_f64_field("f64_fast", FAST | STORED);
        schema_builder.add_json_field("json_fast", FAST);
        schema_builder.add_json_field("json_text", TEXT);
        if dynamic_mode {
            schema_builder.add_json_field(DYNAMIC_FIELD_NAME, TEXT);
        }
        schema_builder.build()
    }

    #[track_caller]
    fn check_build_query_dynamic_mode(
        user_query: &str,
        search_fields: Vec<String>,
        expected: TestExpectation,
    ) {
        check_build_query(user_query, search_fields, expected, true, false);
    }

    #[track_caller]
    fn check_build_query_static_mode(
        user_query: &str,
        search_fields: Vec<String>,
        expected: TestExpectation,
    ) {
        check_build_query(user_query, search_fields, expected, false, false);
    }

    #[track_caller]
    fn check_build_query_static_lenient_mode(
        user_query: &str,
        search_fields: Vec<String>,
        expected: TestExpectation,
    ) {
        check_build_query(user_query, search_fields, expected, false, true);
    }

    fn test_build_query(
        user_query: &str,
        search_fields: Vec<String>,
        dynamic_mode: bool,
        lenient: bool,
    ) -> Result<String, String> {
        let user_input_query = UserInputQuery {
            user_text: user_query.to_string(),
            default_fields: Some(search_fields),
            default_operator: BooleanOperand::And,
            lenient,
        };
        let query_ast = user_input_query
            .parse_user_query(&[])
            .map_err(|err| err.to_string())?;
        let schema = make_schema(dynamic_mode);
        let query_result = build_query(query_ast, &BuildTantivyAstContext::for_test(&schema), None);
        query_result
            .map(|query| format!("{query:?}"))
            .map_err(|err| err.to_string())
    }

    #[track_caller]
    fn check_build_query(
        user_query: &str,
        search_fields: Vec<String>,
        expected: TestExpectation,
        dynamic_mode: bool,
        lenient: bool,
    ) {
        let query_result = test_build_query(user_query, search_fields, dynamic_mode, lenient);
        match (query_result, expected) {
            (Err(query_err_msg), TestExpectation::Err(sub_str)) => {
                assert!(
                    query_err_msg.contains(sub_str),
                    "query error received is {query_err_msg}. it should contain {sub_str}"
                );
            }
            (Ok(query_str), TestExpectation::Ok(sub_str)) => {
                assert!(
                    query_str.contains(sub_str),
                    "error query parsing {query_str} should contain {sub_str}"
                );
            }
            (Err(error_msg), TestExpectation::Ok(expectation)) => {
                panic!("Expected `{expectation}` but got an error `{error_msg}`.");
            }
            (Ok(query_str), TestExpectation::Err(expected_error)) => {
                panic!("Expected the error `{expected_error}`, but got a success `{query_str}`");
            }
        }
    }

    #[test]
    fn test_build_query_dynamic_field() {
        check_build_query_dynamic_mode("*", Vec::new(), TestExpectation::Ok("All"));
        check_build_query_dynamic_mode(
            "foo:bar",
            Vec::new(),
            TestExpectation::Ok(
                r#"TermQuery(Term(field=16, type=Json, path=foo, type=Str, "bar"))"#,
            ),
        );
        check_build_query_dynamic_mode(
            "server.type:hpc server.mem:4GB",
            Vec::new(),
            TestExpectation::Ok("server.type"),
        );
        check_build_query_dynamic_mode(
            "title:[a TO b]",
            Vec::new(),
            TestExpectation::Err(
                "range queries are only supported for fast fields. (`title` is not a fast field)",
            ),
        );
        check_build_query_dynamic_mode(
            "title:{a TO b} desc:foo",
            Vec::new(),
            TestExpectation::Err(
                "range queries are only supported for fast fields. (`title` is not a fast field)",
            ),
        );
    }

    #[test]
    fn test_build_query_not_dynamic_mode() {
        check_build_query_static_mode("*", Vec::new(), TestExpectation::Ok("All"));
        check_build_query_static_mode(
            "foo:bar",
            Vec::new(),
            TestExpectation::Err("invalid query: field does not exist: `foo`"),
        );
        check_build_query_static_lenient_mode(
            "foo:bar",
            Vec::new(),
            TestExpectation::Ok("EmptyQuery"),
        );
        check_build_query_static_mode(
            "title:bar",
            Vec::new(),
            TestExpectation::Ok(r#"TermQuery(Term(field=1, type=Str, "bar"))"#),
        );
        check_build_query_static_mode(
            "bar",
            vec!["fieldnotinschema".to_string()],
            TestExpectation::Err("invalid query: field does not exist: `fieldnotinschema`"),
        );
        check_build_query_static_lenient_mode(
            "bar",
            vec!["fieldnotinschema".to_string()],
            TestExpectation::Ok("EmptyQuery"),
        );
        check_build_query_static_mode(
            "title:[a TO b]",
            Vec::new(),
            TestExpectation::Err(
                "range queries are only supported for fast fields. (`title` is not a fast field)",
            ),
        );
        check_build_query_static_mode(
            "title:{a TO b} desc:foo",
            Vec::new(),
            TestExpectation::Err(
                "range queries are only supported for fast fields. (`title` is not a fast field)",
            ),
        );
        check_build_query_static_mode(
            "title:>foo",
            Vec::new(),
            TestExpectation::Err(
                "range queries are only supported for fast fields. (`title` is not a fast field)",
            ),
        );
        check_build_query_static_mode(
            "title:foo desc:bar _source:baz",
            Vec::new(),
            TestExpectation::Ok("TermQuery"),
        );
        check_build_query_static_mode(
            "server.name:\".bar:\" server.mem:4GB",
            vec!["server.name".to_string()],
            TestExpectation::Ok("TermQuery"),
        );
        check_build_query_static_mode(
            "server.name:\"for.bar:b\" server.mem:4GB",
            Vec::new(),
            TestExpectation::Ok("TermQuery"),
        );
        check_build_query_static_mode(
            "foo",
            Vec::new(),
            TestExpectation::Err("query requires a default search field and none was supplied"),
        );
        check_build_query_static_mode(
            "bar",
            Vec::new(),
            TestExpectation::Err("query requires a default search field and none was supplied"),
        );
        check_build_query_static_mode(
            "title:hello AND (Jane OR desc:world)",
            Vec::new(),
            TestExpectation::Err("query requires a default search field and none was supplied"),
        );
        check_build_query_static_mode(
            "server.running:true",
            Vec::new(),
            TestExpectation::Ok("TermQuery"),
        );
        check_build_query_static_mode(
            "title: IN [hello]",
            Vec::new(),
            TestExpectation::Ok("TermSetQuery"),
        );
        check_build_query_static_mode(
            "IN [hello]",
            Vec::new(),
            TestExpectation::Err("set query need to target a specific field"),
        );
    }

    #[test]
    fn test_wildcard_query() {
        check_build_query_static_mode("title:hello*", Vec::new(), TestExpectation::Ok("Regex"));
        check_build_query_static_mode(
            "title:\"hello world\"*",
            Vec::new(),
            TestExpectation::Ok("PhrasePrefixQuery"),
        );
        // the tokenizer removes '*' chars, making it a simple PhraseQuery (not RegexPhraseQuery)
        check_build_query_static_mode(
            "title:\"hello* world*\"",
            Vec::new(),
            TestExpectation::Ok("PhraseQuery"),
        );
        check_build_query_static_mode(
            "foo:bar*",
            Vec::new(),
            TestExpectation::Err("invalid query: field does not exist: `foo`"),
        );
        check_build_query_static_mode("title:hello*yo", Vec::new(), TestExpectation::Ok("Regex"));
    }

    #[test]
    fn test_existence_query() {
        check_build_query_static_mode(
            "title:*",
            Vec::new(),
            TestExpectation::Ok("TermQuery(Term(field=0, type=U64"),
        );

        check_build_query_static_mode(
            "ip:*",
            Vec::new(),
            TestExpectation::Ok("ExistsQuery { field_name: \"ip\", json_subpaths: true }"),
        );
        check_build_query_static_mode(
            "json_text:*",
            Vec::new(),
            TestExpectation::Ok("TermSetQuery"),
        );
        check_build_query_static_mode(
            "json_fast:*",
            Vec::new(),
            TestExpectation::Ok("ExistsQuery { field_name: \"json_fast\", json_subpaths: true }"),
        );
        check_build_query_static_mode(
            "foo:*",
            Vec::new(),
            TestExpectation::Err("invalid query: field does not exist: `foo`"),
        );
        check_build_query_static_mode(
            "server:*",
            Vec::new(),
            TestExpectation::Ok("BooleanQuery { subqueries: [(Should, TermQuery(Term"),
        );
    }

    #[test]
    fn test_datetime_range_query() {
        {
            // Check range on datetime in millisecond, precision has no impact as it is in
            // milliseconds.
            let start_date_time_str = "2023-01-10T08:38:51.150Z";
            let end_date_time_str = "2023-01-10T08:38:51.160Z";
            check_build_query_static_mode(
                &format!("dt:[{start_date_time_str} TO {end_date_time_str}]"),
                Vec::new(),
                TestExpectation::Ok("2023-01-10T08:38:51.15Z"),
            );
            check_build_query_static_mode(
                &format!("dt:[{start_date_time_str} TO {end_date_time_str}]"),
                Vec::new(),
                TestExpectation::Ok("RangeQuery"),
            );
            check_build_query_static_mode(
                &format!("dt:<{end_date_time_str}"),
                Vec::new(),
                TestExpectation::Ok("lower_bound: Unbounded"),
            );
            check_build_query_static_mode(
                &format!("dt:<{end_date_time_str}"),
                Vec::new(),
                TestExpectation::Ok("upper_bound: Excluded"),
            );
            check_build_query_static_mode(
                &format!("dt:<{end_date_time_str}"),
                Vec::new(),
                TestExpectation::Ok("2023-01-10T08:38:51.16Z"),
            );
        }

        // Check range on datetime in microseconds and truncation to milliseconds.
        {
            let start_date_time_str = "2023-01-10T08:38:51.000150Z";
            let end_date_time_str = "2023-01-10T08:38:51.000151Z";
            check_build_query_static_mode(
                &format!("dt:[{start_date_time_str} TO {end_date_time_str}]"),
                Vec::new(),
                TestExpectation::Ok("2023-01-10T08:38:51Z"),
            );
        }
    }

    #[test]
    fn test_ip_range_query() {
        check_build_query_static_mode(
            "ip:[127.0.0.1 TO 127.1.1.1]",
            Vec::new(),
            TestExpectation::Ok(
                "RangeQuery { bounds: BoundsRange { lower_bound: Included(Term(field=7, \
                 type=IpAddr, ::ffff:127.0.0.1)), upper_bound: Included(Term(field=7, \
                 type=IpAddr, ::ffff:127.1.1.1)) } }",
            ),
        );
        check_build_query_static_mode(
            "ip:>127.0.0.1",
            Vec::new(),
            TestExpectation::Ok(
                "RangeQuery { bounds: BoundsRange { lower_bound: Excluded(Term(field=7, \
                 type=IpAddr, ::ffff:127.0.0.1)), upper_bound: Unbounded } }",
            ),
        );
    }

    #[test]
    fn test_f64_range_query() {
        check_build_query_static_mode(
            "f64_fast:[7.7 TO 77.7]",
            Vec::new(),
            TestExpectation::Ok(
                r#"RangeQuery { bounds: BoundsRange { lower_bound: Included(Term(field=13, type=F64, 7.7)), upper_bound: Included(Term(field=13, type=F64, 77.7)) } }"#,
            ),
        );
        check_build_query_static_mode(
            "f64_fast:>7",
            Vec::new(),
            TestExpectation::Ok(
                r#"RangeQuery { bounds: BoundsRange { lower_bound: Excluded(Term(field=13, type=F64, 7.0)), upper_bound: Unbounded } }"#,
            ),
        );
    }

    #[test]
    fn test_i64_range_query() {
        check_build_query_static_mode(
            "i64_fast:[-7 TO 77]",
            Vec::new(),
            TestExpectation::Ok(r#"field=12"#),
        );
        check_build_query_static_mode(
            "i64_fast:>7",
            Vec::new(),
            TestExpectation::Ok(r#"field=12"#),
        );
    }

    #[test]
    fn test_u64_range_query() {
        check_build_query_static_mode(
            "u64_fast:[7 TO 77]",
            Vec::new(),
            TestExpectation::Ok(r#"field=11,"#),
        );
        check_build_query_static_mode(
            "u64_fast:>7",
            Vec::new(),
            TestExpectation::Ok(r#"field=11,"#),
        );
    }

    #[test]
    fn test_range_query_ip_fields_multivalued() {
        check_build_query_static_mode(
            "ips:[127.0.0.1 TO 127.1.1.1]",
            Vec::new(),
            TestExpectation::Ok(
                "RangeQuery { bounds: BoundsRange { lower_bound: Included(Term(field=8, \
                 type=IpAddr, ::ffff:127.0.0.1)), upper_bound: Included(Term(field=8, \
                 type=IpAddr, ::ffff:127.1.1.1)) } }",
            ),
        );
    }

    #[test]
    fn test_range_query_no_fast_field() {
        check_build_query_static_mode(
            "ip_notff:[127.0.0.1 TO 127.1.1.1]",
            Vec::new(),
            TestExpectation::Err("`ip_notff` is not a fast field"),
        );
    }

    #[test]
    fn test_build_query_not_bool_should_fail() {
        check_build_query_static_mode(
            "server.running:notabool",
            Vec::new(),
            TestExpectation::Err("expected a `bool` search value for field `server.running`"),
        );
    }

    #[test]
    fn test_build_query_warmup_info() {
        let query_with_set = query_ast_from_user_text("desc: IN [hello]", None)
            .parse_user_query(&[])
            .unwrap();
        let query_without_set = query_ast_from_user_text("desc:hello", None)
            .parse_user_query(&[])
            .unwrap();

        let schema = make_schema(true);
        let context = BuildTantivyAstContext::for_test(&schema);

        let (_, warmup_info) = build_query(query_with_set, &context, None).unwrap();
        assert_eq!(warmup_info.term_dict_fields.len(), 1);
        assert!(
            warmup_info
                .term_dict_fields
                .contains(&tantivy::schema::Field::from_field_id(2))
        );

        let (_, warmup_info) = build_query(query_without_set, &context, None).unwrap();
        assert!(warmup_info.term_dict_fields.is_empty());
    }

    #[test]
    fn test_extract_phrase_prefix_position_required() {
        let schema = make_schema(false);
        let tokenizer_manager = create_default_quickwit_tokenizer_manager();

        let params = FullTextParams {
            tokenizer: None,
            mode: FullTextMode::Phrase { slop: 0 },
            zero_terms_query: MatchAllOrNone::MatchNone,
        };
        let short = PhrasePrefixQuery {
            field: "title".to_string(),
            phrase: "short".to_string(),
            max_expansions: 50,
            params: params.clone(),
            lenient: false,
        };
        let long = PhrasePrefixQuery {
            field: "title".to_string(),
            phrase: "not so short".to_string(),
            max_expansions: 50,
            params: params.clone(),
            lenient: false,
        };
        let mut extractor1 = ExtractPrefixTermRanges::with_schema(&schema, &tokenizer_manager);
        extractor1.visit_phrase_prefix(&short).unwrap();
        extractor1.visit_phrase_prefix(&long).unwrap();

        let mut extractor2 = ExtractPrefixTermRanges::with_schema(&schema, &tokenizer_manager);
        extractor2.visit_phrase_prefix(&long).unwrap();
        extractor2.visit_phrase_prefix(&short).unwrap();

        assert_eq!(
            extractor1.term_ranges_to_warm_up,
            extractor2.term_ranges_to_warm_up
        );

        let field = tantivy::schema::Field::from_field_id(1);
        let mut expected_inner = std::collections::HashMap::new();
        expected_inner.insert(
            TermRange {
                start: Bound::Included(Term::from_field_text(field, "short")),
                end: Bound::Excluded(Term::from_field_text(field, "shoru")),
                limit: Some(50),
            },
            true,
        );
        let mut expected = std::collections::HashMap::new();
        expected.insert(field, expected_inner);
        assert_eq!(extractor1.term_ranges_to_warm_up, expected);
    }
}


================================================
FILE: quickwit/quickwit-doc-mapper/src/routing_expression/mod.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::borrow::Cow;
use std::fmt::{self, Display};
use std::hash::{Hash, Hasher};
use std::str::FromStr;
use std::sync::Arc;

pub(crate) use expression_dsl::parse_field_name;
use serde_json::Value as JsonValue;
use siphasher::sip::SipHasher;

pub trait RoutingExprContext {
    fn hash_attribute<H: Hasher>(&self, attr_name: &[String], hasher: &mut H);
}

/// This is a bit overkill but this function has the merit of
/// ensuring that the data that is sent to the hasher is unique
/// to the value, so we do not lose injectivity there.
fn hash_json_val<H: Hasher>(json_val: &JsonValue, hasher: &mut H) {
    match json_val {
        JsonValue::Null => {
            hasher.write_u8(0u8);
        }
        JsonValue::Bool(bool_val) => {
            hasher.write_u8(1u8);
            bool_val.hash(hasher);
        }
        JsonValue::Number(num) => {
            hasher.write_u8(2u8);
            num.hash(hasher);
        }
        JsonValue::String(s) => {
            hasher.write_u8(3u8);
            hasher.write_u64(s.len() as u64);
            hasher.write(s.as_bytes());
        }
        JsonValue::Array(arr) => {
            hasher.write_u8(4u8);
            hasher.write_u64(arr.len() as u64);
            for el in arr {
                hash_json_val(el, hasher);
            }
        }
        JsonValue::Object(obj) => {
            hasher.write_u8(5u8);
            hasher.write_u64(obj.len() as u64);
            for (key, val) in obj.iter() {
                hasher.write_u64(key.len() as u64);
                hasher.write(key.as_bytes());
                hash_json_val(val, hasher);
            }
        }
    }
}

fn find_value<'a>(mut root: &'a JsonValue, keys: &[String]) -> Option<&'a JsonValue> {
    for key in keys {
        match root {
            JsonValue::Object(obj) => {
                root = obj.get(key)?;
            }
            _ => return None,
        }
    }
    Some(root)
}

fn find_value_in_map<'a>(
    obj: &'a serde_json::Map<String, JsonValue>,
    keys: &[String],
) -> Option<&'a JsonValue> {
    // we can't have an empty path and this is used only for the root map, so there is no risk of
    // out of bound
    if let Some(value) = obj.get(&keys[0]) {
        find_value(value, &keys[1..])
    } else {
        None
    }
}

impl RoutingExprContext for serde_json::Map<String, JsonValue> {
    fn hash_attribute<H: Hasher>(&self, attr_name: &[String], hasher: &mut H) {
        if let Some(json_val) = find_value_in_map(self, attr_name) {
            hasher.write_u8(1u8);
            hash_json_val(json_val, hasher);
        } else {
            hasher.write_u8(0u8);
        }
    }
}

/// which defines a routing expression
#[derive(Clone, Default)]
pub struct RoutingExpr {
    inner_opt: Option<Arc<InnerRoutingExpr>>,
    salted_hasher: SipHasher,
}

impl RoutingExpr {
    /// Construct a routing expression from a expression dsl string
    pub fn new(expr_dsl_str: &str) -> anyhow::Result<Self> {
        let expr_dsl_str = expr_dsl_str.trim();
        if expr_dsl_str.is_empty() {
            return Ok(RoutingExpr::default());
        }

        let mut salted_hasher: SipHasher = SipHasher::new();

        let inner: InnerRoutingExpr = InnerRoutingExpr::from_str(expr_dsl_str)?;
        // We hash the expression tree here instead of hashing the str, or
        // hash the display of the tree, in order to make the partition id less brittle to
        // a minor change in formatting, or a change in the DSL itself.
        //
        // We do not use the standard library DefaultHasher to make sure we
        // get the same hash values.
        inner.hash(&mut salted_hasher);

        Ok(RoutingExpr {
            inner_opt: Some(Arc::new(inner)),
            salted_hasher,
        })
    }

    /// Evaluates the expression applied to the given
    /// context and returns a u64 hash.
    ///
    /// Obviously this function is not perfectly injective.
    pub fn eval_hash<Ctx: RoutingExprContext>(&self, ctx: &Ctx) -> u64 {
        if let Some(inner) = self.inner_opt.as_ref() {
            let mut hasher: SipHasher = self.salted_hasher;
            inner.eval_hash(ctx, &mut hasher);
            hasher.finish()
        } else {
            0u64
        }
    }

    /// return all fields in a vector
    pub fn field_names(&self) -> Vec<String> {
        if let Some(inner) = self.inner_opt.as_ref() {
            inner.field_names()
        } else {
            Vec::new()
        }
    }
}

impl Display for RoutingExpr {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        if let Some(inner_expr) = self.inner_opt.as_ref() {
            inner_expr.fmt(f)
        } else {
            write!(f, "")
        }
    }
}

#[derive(Clone, Debug, Eq, PartialEq)]
enum InnerRoutingExpr {
    Field(Vec<String>),
    Composite(Vec<InnerRoutingExpr>),
    Modulo(Box<InnerRoutingExpr>, u64),
    // TODO Enrich me! Map / ...
}

impl InnerRoutingExpr {
    fn eval_hash<Ctx: RoutingExprContext, H: Hasher + Default>(&self, ctx: &Ctx, hasher: &mut H) {
        match self {
            InnerRoutingExpr::Field(field_name) => {
                ExprType::Field.hash(hasher);
                ctx.hash_attribute(field_name, hasher);
            }
            InnerRoutingExpr::Composite(children) => {
                ExprType::Composite.hash(hasher);
                for child in children {
                    child.eval_hash(ctx, hasher);
                }
            }
            InnerRoutingExpr::Modulo(inner_expr, modulo) => {
                ExprType::Modulo.hash(hasher);

                let mut sub_hasher = H::default();
                inner_expr.eval_hash(ctx, &mut sub_hasher);
                hasher.write_u64(sub_hasher.finish() % modulo);
            }
        }
    }

    // return all fields in a vector
    fn field_names(&self) -> Vec<String> {
        match self {
            InnerRoutingExpr::Field(field_name) => vec![field_name.join(".")],
            InnerRoutingExpr::Composite(children) => {
                let mut fields = Vec::new();
                for child in children {
                    fields.extend(child.field_names());
                }
                fields
            }
            InnerRoutingExpr::Modulo(inner_expr, _) => inner_expr.field_names(),
        }
    }
}

// We don't rely on Derive here to make it easier to keep the
// implementation stable.
#[allow(clippy::derived_hash_with_manual_eq)]
impl Hash for InnerRoutingExpr {
    fn hash<H: Hasher>(&self, hasher: &mut H) {
        match self {
            InnerRoutingExpr::Field(field_name) => {
                ExprType::Field.hash(hasher);
                hasher.write_u64(field_name.len() as u64);
                for (index, field) in field_name.iter().enumerate() {
                    if index != 0 {
                        hasher.write_u8(b'.');
                    }
                    hasher.write(field.as_bytes());
                }
            }
            InnerRoutingExpr::Composite(children) => {
                ExprType::Composite.hash(hasher);
                for child in children {
                    child.hash(hasher);
                }
            }
            InnerRoutingExpr::Modulo(inner_expr, modulo) => {
                ExprType::Modulo.hash(hasher);
                inner_expr.hash(hasher);
                hasher.write_u64(*modulo);
            }
        }
    }
}

impl Default for InnerRoutingExpr {
    fn default() -> InnerRoutingExpr {
        InnerRoutingExpr::Composite(Vec::new())
    }
}

impl FromStr for InnerRoutingExpr {
    type Err = anyhow::Error;

    fn from_str(expr_dsl_str: &str) -> anyhow::Result<Self> {
        let ast = expression_dsl::parse_expression(expr_dsl_str)?;

        convert_ast(ast)
    }
}

fn convert_ast(ast: Vec<expression_dsl::ExpressionAst>) -> anyhow::Result<InnerRoutingExpr> {
    use expression_dsl::{Argument, ExpressionAst};

    let mut result = ast
        .into_iter()
        .map(|ast_elem| match ast_elem {
            ExpressionAst::Field(field_name) => {
                let field_path = expression_dsl::parse_field_name(&field_name)?
                    .into_iter()
                    .map(Cow::into_owned)
                    .collect();
                Ok(InnerRoutingExpr::Field(field_path))
            }
            ExpressionAst::Function { name, mut args } => match &*name {
                "hash_mod" => {
                    if args.len() != 2 {
                        anyhow::bail!(
                            "invalid arguments for `hash_mod`: expected 2 arguments, found {}",
                            args.len()
                        );
                    }

                    let Argument::Expression(fields) = args.remove(0) else {
                        anyhow::bail!("invalid 1st argument for `hash_mod`: expected expression");
                    };

                    let Argument::Number(modulo) = args.remove(0) else {
                        anyhow::bail!("invalid 2nd argument for `hash_mod`: expected number");
                    };

                    Ok(InnerRoutingExpr::Modulo(
                        Box::new(convert_ast(fields)?),
                        modulo,
                    ))
                }
                _ => anyhow::bail!("unknown function `{}`", name),
            },
        })
        .collect::<Result<Vec<_>, _>>()?;
    if result.is_empty() {
        Ok(InnerRoutingExpr::default())
    } else if result.len() == 1 {
        Ok(result.remove(0))
    } else {
        Ok(InnerRoutingExpr::Composite(result))
    }
}

// The display implementation should be consistent with `FromString`.
impl Display for InnerRoutingExpr {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        match &self {
            InnerRoutingExpr::Field(field) => {
                for (index, part) in field.iter().enumerate() {
                    if index != 0 {
                        f.write_str(".")?;
                    }
                    f.write_str(&part.replace('.', r"\."))?;
                }
            }
            InnerRoutingExpr::Composite(children) => {
                if children.is_empty() {
                    return Ok(());
                }
                children[0].fmt(f)?;
                for child in &children[1..] {
                    write!(f, ",{child}")?;
                }
            }
            InnerRoutingExpr::Modulo(inner_expr, modulo) => {
                write!(f, "hash_mod(({inner_expr}), {modulo})")?;
            }
        }
        Ok(())
    }
}

#[derive(Hash)]
#[repr(u8)]
enum ExprType {
    Field,
    Composite,
    Modulo,
}

mod expression_dsl {
    use std::borrow::Cow;

    use nom::bytes::complete::{escaped, tag};
    use nom::character::complete::multispace0;
    use nom::combinator::{eof, map, opt};
    use nom::error::ErrorKind;
    use nom::multi::separated_list0;
    use nom::sequence::delimited;
    use nom::{AsChar, Finish, IResult, Input, Parser};

    // this is a RoutingSubExpr in our DSL.
    #[derive(Debug, PartialEq, Eq, Clone)]
    pub(crate) enum ExpressionAst {
        Field(String),
        Function { name: String, args: Vec<Argument> },
    }

    #[derive(Debug, PartialEq, Eq, Clone)]
    pub(crate) enum Argument {
        Expression(Vec<ExpressionAst>),
        Number(u64),
    }

    pub(crate) fn parse_expression(expr_dsl_str: &str) -> anyhow::Result<Vec<ExpressionAst>> {
        let (i, res) = routing_expr(expr_dsl_str)
            .finish()
            .map_err(|e| anyhow::anyhow!("error parsing routing expression: {e}"))?;
        eof::<_, ()>(i)?;

        Ok(res)
    }

    // tag, but ignore leading and trailing whitespaces
    pub fn wtag<'a, Error: nom::error::ParseError<&'a str>>(
        t: &'a str,
    ) -> impl Parser<&'a str, Output = &'a str, Error = Error> {
        delimited(multispace0, tag(t), multispace0)
    }

    // DSL:
    //
    // RoutingExpr := RoutingSubExpr [ , RoutingExpr ]
    // RougingSubExpr := Identifier [ \( Arguments \) ]
    // Identifier := FieldChar [ Identifier ]
    // FieldChar := { a..z | A..Z | 0..9 | _ | . | \ | / | @ | $ }
    // Arguments := Argument [ , Arguments ]
    // Argument := { \( RoutingExpr \) | RoutingSubExpr | DirectValue }
    // # We may want other DirectValue in the future
    // DirectValue := Number
    // Number := { 0..9 } [ Number ]

    /// An entire routing expression, containing comma separated routing sub-expressions
    fn routing_expr(input: &str) -> IResult<&str, Vec<ExpressionAst>> {
        separated_list0(wtag(","), routing_sub_expr).parse(input)
    }

    /// A sub-part of a routing expression
    fn routing_sub_expr(input: &str) -> IResult<&str, ExpressionAst> {
        let (input, identifier) = identifier(input)?;
        let (input, args) = opt((wtag("("), arguments, wtag(")"))).parse(input)?;
        let res = if let Some((_, args, _)) = args {
            ExpressionAst::Function {
                name: identifier.to_owned(),
                args,
            }
        } else {
            ExpressionAst::Field(identifier.to_owned())
        };
        Ok((input, res))
    }

    /// An identifier, it can be either a field name, or a function name. It's returned as is,
    /// without de-escaping.
    fn identifier(input: &str) -> IResult<&str, &str> {
        input.split_at_position1_complete(
            |item| !(item.is_alphanum() || ['_', '-', '.', '\\', '/', '@', '$'].contains(&item)),
            ErrorKind::AlphaNumeric,
        )
    }

    /// Arguments for a function
    fn arguments(input: &str) -> IResult<&str, Vec<Argument>> {
        separated_list0(wtag(","), argument).parse(input)
    }

    /// A single argument for a function
    fn argument(input: &str) -> IResult<&str, Argument> {
        if let Ok((input, number)) = number(input) {
            Ok((input, Argument::Number(number)))
        } else if let Ok((input, (_, arg, _))) = (wtag("("), routing_expr, wtag(")")).parse(input) {
            Ok((input, Argument::Expression(arg)))
        } else {
            routing_sub_expr(input).map(|(input, arg)| (input, Argument::Expression(vec![arg])))
        }
    }

    /// A number
    fn number(input: &str) -> IResult<&str, u64> {
        nom::character::complete::u64(input)
    }

    // functions after this are meant to parse a field into its path component, de-escaping where
    // appropriate

    /// Parse part of a path component, stop at the first . or \
    fn key_identifier(input: &str) -> IResult<&str, &str> {
        input.split_at_position1_complete(
            |item| !(item.is_alphanum() || ['_', '-', '/', '@', '$'].contains(&item)),
            ErrorKind::Fail,
        )
    }

    /// Parse a single path component, separated by dots. De-escape any escaped dot it may contain.
    fn escaped_key(input: &str) -> IResult<&str, Cow<'_, str>> {
        map(escaped(key_identifier, '\\', tag(".")), |s: &str| {
            if s.contains("\\.") {
                Cow::Owned(s.replace("\\.", "."))
            } else {
                Cow::Borrowed(s)
            }
        })
        .parse(input)
    }

    /// Parse a field name into a path, de-escaping where appropriate.
    pub(crate) fn parse_field_name(input: &str) -> anyhow::Result<Vec<Cow<'_, str>>> {
        let (i, res) = separated_list0(tag("."), escaped_key)
            .parse(input)
            .finish()
            .map_err(|e| anyhow::anyhow!("error parsing key expression: {e}"))?;
        eof::<_, ()>(i)?;
        Ok(res)
    }
}

#[cfg(test)]
mod tests {
    use std::collections::HashSet;

    use super::*;

    #[track_caller]
    fn test_ser_deser(expr: &InnerRoutingExpr) {
        let ser = expr.to_string();
        assert_eq!(&InnerRoutingExpr::from_str(&ser).unwrap(), expr);
    }

    #[track_caller]
    fn deser_util(expr_dsl: &str) -> InnerRoutingExpr {
        let expr = InnerRoutingExpr::from_str(expr_dsl).unwrap();
        test_ser_deser(&expr);
        expr
    }

    #[test]
    fn test_routing_expr_empty() {
        let routing_expr = deser_util("");
        assert!(matches!(routing_expr, InnerRoutingExpr::Composite(leaves) if leaves.is_empty()));
    }

    #[test]
    fn test_routing_expr_empty_hashes_to_0() {
        let expr = RoutingExpr::new("").unwrap();
        let ctx: serde_json::Map<String, JsonValue> = Default::default();
        assert_eq!(expr.eval_hash(&ctx), 0u64);
    }

    #[test]
    fn test_routing_expr_single_field() {
        let routing_expr = deser_util("tenant_id");
        assert_eq!(
            routing_expr,
            InnerRoutingExpr::Field(vec!["tenant_id".to_owned()])
        );
    }

    #[test]
    fn test_routing_expr_single_field_special_char() {
        let routing_expr = deser_util(r"abCD01-_/@$\.a.bc");
        assert_eq!(
            routing_expr,
            InnerRoutingExpr::Field(vec![r"abCD01-_/@$.a".to_owned(), "bc".to_string()])
        );
    }

    #[test]
    fn test_routing_expr_single_field_with_dot() {
        let routing_expr = deser_util("app.id");
        assert_eq!(
            routing_expr,
            InnerRoutingExpr::Field(vec!["app".to_owned(), "id".to_owned()])
        );
    }

    #[test]
    fn test_routing_expr_modulo_field() {
        let routing_expr = deser_util("hash_mod(tenant_id, 4)");
        assert_eq!(
            routing_expr,
            InnerRoutingExpr::Modulo(
                Box::new(InnerRoutingExpr::Field(vec!["tenant_id".to_owned()])),
                4
            )
        );
    }

    #[test]
    fn test_routing_expr_modulo_complexe() {
        let routing_expr = deser_util("hash_mod((tenant_id,hash_mod(app_id, 3)), 8),cluster_id");
        assert_eq!(
            routing_expr,
            InnerRoutingExpr::Composite(vec![
                InnerRoutingExpr::Modulo(
                    Box::new(InnerRoutingExpr::Composite(vec![
                        InnerRoutingExpr::Field(vec!["tenant_id".to_owned()]),
                        InnerRoutingExpr::Modulo(
                            Box::new(InnerRoutingExpr::Field(vec!["app_id".to_owned()]),),
                            3
                        ),
                    ])),
                    8
                ),
                InnerRoutingExpr::Field(vec!["cluster_id".to_owned()]),
            ])
        );
    }

    #[test]
    fn test_routing_expr_multiple_field() {
        let routing_expr = deser_util("tenant_id,app_id");

        assert_eq!(
            routing_expr,
            InnerRoutingExpr::Composite(vec![
                InnerRoutingExpr::Field(vec!["tenant_id".to_owned()]),
                InnerRoutingExpr::Field(vec!["app_id".to_owned()]),
            ])
        );
    }

    #[test]
    fn test_routing_expr_multiple_field_with_dot() {
        let routing_expr = deser_util("tenant.id,app.id");

        assert_eq!(
            routing_expr,
            InnerRoutingExpr::Composite(vec![
                InnerRoutingExpr::Field(vec!["tenant".to_owned(), "id".to_owned()]),
                InnerRoutingExpr::Field(vec!["app".to_owned(), "id".to_owned()]),
            ])
        );
    }

    #[test]
    fn test_parse_field_name() {
        let keys = expression_dsl::parse_field_name("abc").unwrap();
        assert_eq!(keys, vec![String::from("abc")]);
    }

    #[test]
    fn test_parse_field_name_multiple() {
        let keys = expression_dsl::parse_field_name("abc.def").unwrap();
        assert_eq!(keys, vec![String::from("abc"), String::from("def")]);
    }

    #[test]
    fn test_parse_field_name_with_escaped_dot() {
        let keys = expression_dsl::parse_field_name("abc\\.def.hij").unwrap();
        assert_eq!(keys, vec![String::from("abc.def"), String::from("hij")]);
    }

    #[test]
    fn test_parse_field_name_with_special_char() {
        let keys = expression_dsl::parse_field_name("abCD01-_/@$").unwrap();
        assert_eq!(keys, vec![String::from("abCD01-_/@$")]);
    }

    #[test]
    fn test_find_value_with_escaped_dot() {
        let ctx = serde_json::from_str(r#"{"tenant.id": "happy", "app": "happy"}"#).unwrap();
        let keys: Vec<_> = expression_dsl::parse_field_name("tenant\\.id")
            .unwrap()
            .into_iter()
            .map(Cow::into_owned)
            .collect();
        assert_eq!(keys, vec![String::from("tenant.id")]);
        let value = find_value(&ctx, &keys).unwrap();
        assert_eq!(value, &JsonValue::String(String::from("happy")));
    }

    #[test]
    fn test_find_value_with_nested_keys() {
        let ctx = serde_json::from_str(
            r#"{"tenant_id": "happy", "app": {"name": "happy", "id": "123"}}"#,
        )
        .unwrap();
        let keys: Vec<_> = expression_dsl::parse_field_name("app.id")
            .unwrap()
            .into_iter()
            .map(Cow::into_owned)
            .collect();
        assert_eq!(keys, vec!["app", "id"]);
        let value = find_value(&ctx, &keys).unwrap();
        assert_eq!(value, &JsonValue::String(String::from("123")));
    }
    // This unit test is here to ensure that the routing expr hash depends on
    // the expression itself as well as the expression value.
    #[test]
    fn test_routing_expr_depends_on_both_expr_and_value() {
        let routing_expr = RoutingExpr::new("tenant_id").unwrap();
        let routing_expr2 = RoutingExpr::new("app").unwrap();
        let ctx: serde_json::Map<String, JsonValue> =
            serde_json::from_str(r#"{"tenant_id": "happy", "app": "happy"}"#).unwrap();
        let ctx2: serde_json::Map<String, JsonValue> =
            serde_json::from_str(r#"{"tenant_id": "happy2"}"#).unwrap();
        // This assert is important.
        assert_ne!(routing_expr.eval_hash(&ctx), routing_expr2.eval_hash(&ctx),);
        assert_ne!(routing_expr.eval_hash(&ctx), routing_expr.eval_hash(&ctx2),);
    }

    // This unit test is here to detect a change in the hash logic.
    // Breaking it is not catastrophic but it should not happen too often.
    #[test]
    fn test_routing_expr_change_detection() {
        let routing_expr = RoutingExpr::new("tenant_id").unwrap();
        let ctx: serde_json::Map<String, JsonValue> =
            serde_json::from_str(r#"{"tenant_id": "happy-tenant", "app": "happy"}"#).unwrap();
        assert_eq!(routing_expr.eval_hash(&ctx), 13914409176935416182);
    }

    #[test]
    fn test_routing_expr_missing_value_does_not_panic() {
        let routing_expr = RoutingExpr::new("tenant_id").unwrap();
        let ctx: serde_json::Map<String, JsonValue> = Default::default();
        assert_eq!(routing_expr.eval_hash(&ctx), 12482849403534986143);
    }

    #[test]
    fn test_routing_expr_mod() {
        let mut seen = HashSet::new();
        let routing_expr = RoutingExpr::new("hash_mod(tenant_id, 10)").unwrap();

        for i in 0..1000 {
            let ctx: serde_json::Map<String, JsonValue> =
                serde_json::from_str(&format!(r#"{{"tenant_id": "happy{i}"}}"#)).unwrap();
            seen.insert(routing_expr.eval_hash(&ctx));
        }

        assert_eq!(seen.len(), 10);
    }
}


================================================
FILE: quickwit/quickwit-doc-mapper/src/tag_pruning.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::BTreeSet;
use std::fmt::Display;

use quickwit_query::query_ast::QueryAst;
use serde::{Deserialize, Serialize};
use tantivy::query_grammar::Occur;

/// Returns true if and only if tag is of form `{field_name}:any_value`.
pub fn match_tag_field_name(field_name: &str, tag: &str) -> bool {
    tag.len() > field_name.len()
        && tag.as_bytes()[field_name.len()] == b':'
        && tag.starts_with(field_name)
}

/// Tags a user query and returns a TagFilterAst that
/// represents a filtering predicate over a set of tags.
///
/// If the predicate evaluates to false for a given set of tags
/// associated with a split, we are guaranteed that no documents
/// in the split matches the query.
pub fn extract_tags_from_query(query_ast: QueryAst) -> Option<TagFilterAst> {
    let unsimplified_tag_filter_ast = extract_unsimplified_tags_filter_ast(query_ast);
    let term_filters_ast = simplify_ast(unsimplified_tag_filter_ast)?;
    Some(expand_to_tag_ast(term_filters_ast))
}

fn extract_unsimplified_tags_filter_ast(query_ast: QueryAst) -> UnsimplifiedTagFilterAst {
    match query_ast {
        QueryAst::Bool(bool_query) => {
            let mut clause_with_resolved_occur: Vec<(Occur, UnsimplifiedTagFilterAst)> = Vec::new();
            for (occur, children) in [
                (Occur::Must, bool_query.must),
                (Occur::Must, bool_query.filter),
                (Occur::Should, bool_query.should),
                (Occur::MustNot, bool_query.must_not),
            ] {
                for child_ast in children {
                    let child_unsimplified_tag_ast =
                        extract_unsimplified_tags_filter_ast(child_ast);
                    clause_with_resolved_occur.push((occur, child_unsimplified_tag_ast));
                }
            }
            collect_tag_filters_for_clause(clause_with_resolved_occur)
        }
        QueryAst::Term(term_query) => UnsimplifiedTagFilterAst::Tag {
            is_present: true,
            field: term_query.field,
            value: term_query.value,
        },
        QueryAst::MatchAll | QueryAst::MatchNone => UnsimplifiedTagFilterAst::Uninformative,
        QueryAst::Range(_) => {
            // We could technically add support for range over some quantitive tag value (like we do
            // for timestamps). This is not supported at this point.
            UnsimplifiedTagFilterAst::Uninformative
        }
        QueryAst::TermSet(term_set) => {
            let children: Vec<UnsimplifiedTagFilterAst> = term_set
                .terms_per_field
                .into_iter()
                .flat_map(|(field, terms)| {
                    terms
                        .into_iter()
                        .map(move |term| UnsimplifiedTagFilterAst::Tag {
                            is_present: true,
                            field: field.clone(),
                            value: term,
                        })
                })
                .collect();
            UnsimplifiedTagFilterAst::Or(children)
        }
        QueryAst::FullText(full_text_query) => {
            // TODO This is a bug in a sense.
            // A phrase is supposed to go through the tokenizer.
            UnsimplifiedTagFilterAst::Tag {
                is_present: true,
                field: full_text_query.field,
                value: full_text_query.text,
            }
        }
        QueryAst::PhrasePrefix(phrase_prefix_query) => {
            // TODO same as FullText above.
            UnsimplifiedTagFilterAst::Tag {
                is_present: true,
                field: phrase_prefix_query.field,
                value: phrase_prefix_query.phrase,
            }
        }
        QueryAst::Wildcard(wildcard_query) => {
            // TODO same as FullText above.
            UnsimplifiedTagFilterAst::Tag {
                is_present: true,
                field: wildcard_query.field,
                value: wildcard_query.value,
            }
        }
        QueryAst::Boost { underlying, .. } => extract_unsimplified_tags_filter_ast(*underlying),
        QueryAst::UserInput(_user_text_query) => {
            panic!("Extract unsimplified should only be called on AST without UserInputQuery.");
        }
        QueryAst::FieldPresence(_) => UnsimplifiedTagFilterAst::Uninformative,
        QueryAst::Regex(_) => UnsimplifiedTagFilterAst::Uninformative,
        QueryAst::Cache(cache_node) => extract_unsimplified_tags_filter_ast(*cache_node.inner),
    }
}

/// Intermediary AST that may contain leaf that are
/// equivalent to the "Uninformative" predicate.
#[derive(Clone, Debug, Eq, PartialEq)]
enum UnsimplifiedTagFilterAst {
    And(Vec<UnsimplifiedTagFilterAst>),
    Or(Vec<UnsimplifiedTagFilterAst>),
    Tag {
        is_present: bool,
        field: String,
        value: String,
    },
    /// Uninformative represents a node which could be
    /// True or False regardless of the tag values.
    ///
    /// Any subnode of the `UserInputAST` can be
    /// replaced by `Uninformative` while still being correct.
    Uninformative,
}

/// Represents a tag filter used for split pruning.
#[derive(Debug, PartialEq, Clone)]
enum TermFilterAst {
    And(Vec<TermFilterAst>),
    Or(Vec<TermFilterAst>),
    Term { field: String, value: String },
}

/// Records terms into a set of tags.
///
/// A special tag `{field_name}!` is always added to the tag set.
/// It indicates that `{field_name}` is in the list of the
/// `DocMapper` attribute `tag_fields`.
///
/// See `SplitMetadata` in `quickwit_metastore` for more detail.
pub fn append_to_tag_set(field_name: &str, values: &[String], tag_set: &mut BTreeSet<String>) {
    tag_set.insert(field_tag(field_name));
    for value in values {
        tag_set.insert(term_tag(field_name, value));
    }
}

/// Represents a predicate over the set of tags associated with a given split.
#[allow(missing_docs)]
#[derive(Debug, PartialEq, Clone, Serialize, Deserialize)]
pub enum TagFilterAst {
    And(Vec<TagFilterAst>),
    Or(Vec<TagFilterAst>),
    Tag {
        /// If set to false, the predicate tests for the absence of the tag.
        is_present: bool,
        tag: String,
    },
}

impl Display for TagFilterAst {
    fn fmt(&self, f: &mut std::fmt::Formatter) -> std::fmt::Result {
        let (is_or, children) = match self {
            TagFilterAst::And(children) => (false, children),
            TagFilterAst::Or(children) => (true, children),
            TagFilterAst::Tag { is_present, tag } => {
                if !is_present {
                    write!(f, "¬")?;
                }
                write!(f, "{tag}")?;
                return Ok(());
            }
        };
        if children.is_empty() {
            return Ok(());
        }
        if children.len() == 1 {
            write!(f, "{}", children[0])?;
            return Ok(());
        }
        if is_or {
            write!(f, "(")?;
        }
        let mut children_it = children.iter();
        write!(f, "{}", children_it.next().unwrap())?;
        for child in children_it {
            if is_or {
                write!(f, " ∨ {child}")?;
            } else {
                write!(f, " ∧ {child}")?;
            }
        }
        if is_or {
            write!(f, ")")?;
        }
        Ok(())
    }
}

impl TagFilterAst {
    /// Evaluates the tag filter predicate over a set of tags.
    pub fn evaluate(&self, tag_set: &BTreeSet<String>) -> bool {
        match self {
            TagFilterAst::And(children) => {
                children.iter().all(|child_ast| child_ast.evaluate(tag_set))
            }
            TagFilterAst::Or(children) => {
                children.iter().any(|child_ast| child_ast.evaluate(tag_set))
            }
            TagFilterAst::Tag { is_present, tag } => tag_set.contains(tag) == *is_present,
        }
    }
}

// Takes a tag AST and simplify it.
//
// The resulting AST does not contain any uninformative leaves.
//
// Returning None here, is to be interpreted as returning `True`.
fn simplify_ast(ast: UnsimplifiedTagFilterAst) -> Option<TermFilterAst> {
    match ast {
        UnsimplifiedTagFilterAst::And(conditions) => {
            let mut pruned_conditions: Vec<TermFilterAst> =
                conditions.into_iter().filter_map(simplify_ast).collect();
            match pruned_conditions.len() {
                0 => None,
                1 => pruned_conditions.pop().unwrap().into(),
                _ => TermFilterAst::And(pruned_conditions).into(),
            }
        }
        UnsimplifiedTagFilterAst::Or(conditions) => {
            let mut pruned_conditions: Vec<TermFilterAst> = Vec::new();
            for condition in conditions {
                // If we get None as part of the condition here, we return None
                // directly. (Remember None means True).
                pruned_conditions.push(simplify_ast(condition)?);
            }
            match pruned_conditions.len() {
                0 => None,
                1 => pruned_conditions.pop().unwrap().into(),
                _ => TermFilterAst::Or(pruned_conditions).into(),
            }
        }
        UnsimplifiedTagFilterAst::Tag {
            is_present,
            field,
            value,
        } => {
            if is_present {
                Some(TermFilterAst::Term { field, value })
            } else {
                // we can't do tag pruning on negative filters. If `field` can be one of 1 or 2,
                // and we search for not(1), we don't want to remove a split where
                // tags=[1,2] (which is_present: false does). It's even more problematic if some
                // documents have `field` unset, because we don't record that at all, so can't
                // even reject a split based on it having tags=[1].
                None
            }
        }
        UnsimplifiedTagFilterAst::Uninformative => None,
    }
}

/// Special tag to indicate that a field is listed in the
/// `DocMapper` `tag_fields` attribute.
pub fn field_tag(field_name: &str) -> String {
    format!("{field_name}!")
}

fn term_tag(field: &str, value: &str) -> String {
    format!("{field}:{value}")
}

fn expand_to_tag_ast(terms_filter_ast: TermFilterAst) -> TagFilterAst {
    match terms_filter_ast {
        TermFilterAst::And(children) => {
            TagFilterAst::And(children.into_iter().map(expand_to_tag_ast).collect())
        }
        TermFilterAst::Or(children) => {
            TagFilterAst::Or(children.into_iter().map(expand_to_tag_ast).collect())
        }
        TermFilterAst::Term { field, value } => {
            let field_is_tag = TagFilterAst::Tag {
                is_present: false,
                tag: field_tag(&field),
            };
            let term_tag = TagFilterAst::Tag {
                is_present: true,
                tag: term_tag(&field, &value),
            };
            TagFilterAst::Or(vec![field_is_tag, term_tag])
        }
    }
}

fn collect_tag_filters_for_clause(
    clause: Vec<(Occur, UnsimplifiedTagFilterAst)>,
) -> UnsimplifiedTagFilterAst {
    if clause.is_empty() {
        return UnsimplifiedTagFilterAst::Uninformative;
    }
    if clause.iter().any(|(occur, _)| occur == &Occur::Must) {
        let removed_should_clause: Vec<UnsimplifiedTagFilterAst> = clause
            .into_iter()
            .filter_map(|(occur, ast)| match occur {
                Occur::Must => Some(ast),
                Occur::MustNot => Some(negate_ast(ast)),
                Occur::Should => None,
            })
            .collect();
        // We will handle the case where removed_should_clause.len() == 1 in the simplify
        // phase.
        return UnsimplifiedTagFilterAst::And(removed_should_clause);
    }
    let converted_not_clause = clause
        .into_iter()
        .map(|(occur, ast)| match occur {
            Occur::MustNot => negate_ast(ast),
            Occur::Should => ast,
            Occur::Must => {
                unreachable!("This should never happen due to check above.")
            }
        })
        .collect();
    UnsimplifiedTagFilterAst::Or(converted_not_clause)
}

/// Negate the unsimplified ast, pushing the negation to the leaf
/// using De Morgan's law
/// - NOT( A AND B )=> NOT(A) OR NOT(B)
/// - NOT( A OR B )=> NOT(A) AND NOT(B)
/// - NOT( Tag ) => NotTag
/// - NOT( NotTag ) => Tag
/// - NOT( Uninformative ) => Uninformative.
fn negate_ast(clause: UnsimplifiedTagFilterAst) -> UnsimplifiedTagFilterAst {
    match clause {
        UnsimplifiedTagFilterAst::And(leaves) => {
            UnsimplifiedTagFilterAst::Or(leaves.into_iter().map(negate_ast).collect())
        }
        UnsimplifiedTagFilterAst::Or(leaves) => {
            UnsimplifiedTagFilterAst::And(leaves.into_iter().map(negate_ast).collect())
        }
        UnsimplifiedTagFilterAst::Tag {
            is_present,
            field,
            value,
        } => UnsimplifiedTagFilterAst::Tag {
            is_present: !is_present,
            field,
            value,
        },
        UnsimplifiedTagFilterAst::Uninformative => UnsimplifiedTagFilterAst::Uninformative,
    }
}

/// Helper to build a TagFilterAst checking for the presence of a tag.
pub fn tag(tag: impl ToString) -> TagFilterAst {
    TagFilterAst::Tag {
        is_present: true,
        tag: tag.to_string(),
    }
}

/// Helper to build a TagFilterAst checking for the absence of a tag.
pub fn no_tag(tag: impl ToString) -> TagFilterAst {
    TagFilterAst::Tag {
        is_present: false,
        tag: tag.to_string(),
    }
}
#[cfg(test)]
mod test {
    use quickwit_query::BooleanOperand;
    use quickwit_query::query_ast::{QueryAst, UserInputQuery};

    use super::extract_tags_from_query;
    use crate::tag_pruning::TagFilterAst;

    fn extract_tags_from_query_helper(user_query: &str) -> Option<TagFilterAst> {
        let query_ast: QueryAst = UserInputQuery {
            user_text: user_query.to_string(),
            default_fields: None,
            default_operator: BooleanOperand::Or,
            lenient: false,
        }
        .into();
        let parsed_query_ast = query_ast.parse_user_query(&[]).unwrap();
        extract_tags_from_query(parsed_query_ast)
    }

    #[test]
    fn test_extract_tags_from_query_all() {
        assert_eq!(extract_tags_from_query_helper("*"), None);
    }

    #[test]
    fn test_extract_tags_from_query_range_query() {
        assert_eq!(extract_tags_from_query_helper("title:>foo lang:fr"), None);
    }

    #[test]
    fn test_extract_tags_from_query_range_query_conjunction() {
        assert_eq!(
            &extract_tags_from_query_helper("title:>foo AND lang:fr")
                .unwrap()
                .to_string(),
            "(¬lang! ∨ lang:fr)"
        );
    }

    #[test]
    fn test_extract_tags_from_query_mixed_disjunction() -> anyhow::Result<()> {
        assert_eq!(
            &extract_tags_from_query_helper("title:foo user:bart lang:fr")
                .unwrap()
                .to_string(),
            "((¬title! ∨ title:foo) ∨ (¬user! ∨ user:bart) ∨ (¬lang! ∨ lang:fr))"
        );
        Ok(())
    }

    #[test]
    fn test_extract_tags_from_query_and_or() -> anyhow::Result<()> {
        assert_eq!(
            &extract_tags_from_query_helper("title:foo AND (user:bart OR lang:fr)")
                .unwrap()
                .to_string(),
            "(¬title! ∨ title:foo) ∧ ((¬user! ∨ user:bart) ∨ (¬lang! ∨ lang:fr))"
        );
        Ok(())
    }

    #[test]
    fn test_conjunction_of_tags() {
        assert_eq!(
            &extract_tags_from_query_helper("(user:bart AND lang:fr)")
                .unwrap()
                .to_string(),
            "(¬user! ∨ user:bart) ∧ (¬lang! ∨ lang:fr)"
        );
    }

    #[test]
    fn test_disjunction_of_tags() {
        assert_eq!(
            &extract_tags_from_query_helper("(user:bart OR lang:fr)")
                .unwrap()
                .to_string(),
            "((¬user! ∨ user:bart) ∨ (¬lang! ∨ lang:fr))"
        );
    }

    #[test]
    fn test_disjunction_of_tag_disjunction_with_not_clause() {
        // ORed negative tags make the result inconclusive. See simplify_ast() for details
        assert!(extract_tags_from_query_helper("(user:bart -lang:fr)").is_none());
    }

    #[test]
    fn test_disjunction_of_tag_conjunction_with_not_clause() {
        // negative tags are removed from AND clauses. See simplify_ast() for details
        assert_eq!(
            &extract_tags_from_query_helper("user:bart AND NOT lang:fr")
                .unwrap()
                .to_string(),
            "(¬user! ∨ user:bart)"
        );
    }

    #[test]
    fn test_disjunction_of_tag_must_should() {
        assert_eq!(
            &extract_tags_from_query_helper("(+user:bart lang:fr)")
                .unwrap()
                .to_string(),
            "(¬user! ∨ user:bart)"
        );
    }

    #[test]
    fn test_match_tag_field_name() {
        assert!(super::match_tag_field_name("tagfield", "tagfield:val"));
        assert!(super::match_tag_field_name("tagfield", "tagfield:"));
        assert!(!super::match_tag_field_name("tagfield", "tagfield"));
        assert!(!super::match_tag_field_name("tagfield", "tag:val"));
        assert!(!super::match_tag_field_name("tagfield", "tagfiele:val"));
        assert!(!super::match_tag_field_name("tagfield", "t:val"));
    }
}


================================================
FILE: quickwit/quickwit-index-management/Cargo.toml
================================================
[package]
name = "quickwit-index-management"
description = "Create and manage Quickwit indexes, sources, templates, etc."

version.workspace = true
edition.workspace = true
homepage.workspace = true
documentation.workspace = true
repository.workspace = true
authors.workspace = true
license.workspace = true

[dependencies]
anyhow = { workspace = true }
futures = { workspace = true }
futures-util = { workspace = true }
itertools = { workspace = true }
thiserror = { workspace = true }
time = { workspace = true }
tokio = { workspace = true }
tracing = { workspace = true }

quickwit-common = { workspace = true }
quickwit-config = { workspace = true }
quickwit-indexing = { workspace = true }
quickwit-metastore = { workspace = true }
quickwit-proto = { workspace = true }
quickwit-storage = { workspace = true }

[dev-dependencies]

quickwit-common = { workspace = true, features = ["testsuite"] }
quickwit-metastore = { workspace = true, features = ["testsuite"] }
quickwit-proto = { workspace = true, features = ["testsuite"] }
quickwit-storage = { workspace = true, features = ["testsuite"] }


================================================
FILE: quickwit/quickwit-index-management/src/garbage_collection.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::{HashMap, HashSet};
use std::path::{Path, PathBuf};
use std::sync::{Arc, OnceLock};
use std::time::Duration;

use anyhow::Context;
use futures::{Future, StreamExt};
use itertools::Itertools;
use quickwit_common::metrics::IntCounter;
use quickwit_common::pretty::PrettySample;
use quickwit_common::{Progress, rate_limited_info};
use quickwit_metastore::{
    ListSplitsQuery, ListSplitsRequestExt, MetastoreServiceStreamSplitsExt, SplitInfo,
    SplitMetadata, SplitState,
};
use quickwit_proto::metastore::{
    DeleteSplitsRequest, ListSplitsRequest, MarkSplitsForDeletionRequest, MetastoreError,
    MetastoreService, MetastoreServiceClient,
};
use quickwit_proto::types::{IndexUid, SplitId};
use quickwit_storage::{BulkDeleteError, Storage};
use thiserror::Error;
use time::OffsetDateTime;
use tracing::{error, instrument};

/// The maximum number of splits that the GC should delete per attempt.
const DELETE_SPLITS_BATCH_SIZE: usize = 10_000;

pub struct GcMetrics {
    pub deleted_splits: IntCounter,
    pub deleted_bytes: IntCounter,
    pub failed_splits: IntCounter,
}

trait RecordGcMetrics {
    fn record(&self, num_delete_splits: usize, num_deleted_bytes: u64, num_failed_splits: usize);
}

impl RecordGcMetrics for Option<GcMetrics> {
    fn record(&self, num_deleted_splits: usize, num_deleted_bytes: u64, num_failed_splits: usize) {
        if let Some(metrics) = self {
            metrics.deleted_splits.inc_by(num_deleted_splits as u64);
            metrics.deleted_bytes.inc_by(num_deleted_bytes);
            metrics.failed_splits.inc_by(num_failed_splits as u64);
        }
    }
}

/// [`DeleteSplitsError`] describes the errors that occurred during the deletion of splits from
/// storage and metastore.
#[derive(Error, Debug)]
#[error("failed to delete splits from storage and/or metastore")]
pub struct DeleteSplitsError {
    successes: Vec<SplitInfo>,
    storage_error: Option<BulkDeleteError>,
    storage_failures: Vec<SplitInfo>,
    metastore_error: Option<MetastoreError>,
    metastore_failures: Vec<SplitInfo>,
}

async fn protect_future<Fut, T>(progress: Option<&Progress>, future: Fut) -> T
where Fut: Future<Output = T> {
    match progress {
        None => future.await,
        Some(progress) => {
            let _guard = progress.protect_zone();
            future.await
        }
    }
}

/// Information on what splits have and have not been cleaned up by the GC.
#[derive(Debug, Default)]
pub struct SplitRemovalInfo {
    /// The set of splits that have been removed.
    pub removed_split_entries: Vec<SplitInfo>,
    /// The set of split ids that were attempted to be removed, but were unsuccessful.
    pub failed_splits: Vec<SplitInfo>,
}

/// Detect all dangling splits and associated files from the index and removes them.
///
/// * `indexes` - The target index uids and storages.
/// * `storage - The storage managing the target index.
/// * `metastore` - The metastore managing the target index.
/// * `staged_grace_period` -  Threshold period after which a staged split can be safely garbage
///   collected.
/// * `deletion_grace_period` -  Threshold period after which a marked as deleted split can be
///   safely deleted.
/// * `dry_run` - Should this only return a list of affected files without performing deletion.
/// * `progress` - For reporting progress (useful when called from within a quickwit actor).
pub async fn run_garbage_collect(
    indexes: HashMap<IndexUid, Arc<dyn Storage>>,
    metastore: MetastoreServiceClient,
    staged_grace_period: Duration,
    deletion_grace_period: Duration,
    dry_run: bool,
    progress_opt: Option<&Progress>,
    metrics: Option<GcMetrics>,
) -> anyhow::Result<SplitRemovalInfo> {
    let grace_period_timestamp =
        OffsetDateTime::now_utc().unix_timestamp() - staged_grace_period.as_secs() as i64;

    let index_uids: Vec<IndexUid> = indexes.keys().cloned().collect();

    // TODO maybe we want to do a ListSplitsQuery::for_all_indexes and post-filter ourselves here
    let Some(list_splits_query_for_index_uids) = ListSplitsQuery::try_from_index_uids(index_uids)
    else {
        return Ok(SplitRemovalInfo::default());
    };
    let list_splits_query = list_splits_query_for_index_uids
        .clone()
        .with_split_state(SplitState::Staged)
        .with_update_timestamp_lte(grace_period_timestamp);

    let list_deletable_staged_request =
        ListSplitsRequest::try_from_list_splits_query(&list_splits_query)?;
    let deletable_staged_splits: Vec<SplitMetadata> = protect_future(
        progress_opt,
        metastore.list_splits(list_deletable_staged_request),
    )
    .await?
    .collect_splits_metadata()
    .await?;

    if dry_run {
        let marked_for_deletion_query =
            list_splits_query_for_index_uids.with_split_state(SplitState::MarkedForDeletion);
        let marked_for_deletion_request =
            ListSplitsRequest::try_from_list_splits_query(&marked_for_deletion_query)?;
        let mut splits_marked_for_deletion: Vec<SplitMetadata> = protect_future(
            progress_opt,
            metastore.list_splits(marked_for_deletion_request),
        )
        .await?
        .collect_splits_metadata()
        .await?;
        splits_marked_for_deletion.extend(deletable_staged_splits);

        let candidate_entries: Vec<SplitInfo> = splits_marked_for_deletion
            .into_iter()
            .map(|split| split.as_split_info())
            .collect();
        return Ok(SplitRemovalInfo {
            removed_split_entries: candidate_entries,
            failed_splits: Vec::new(),
        });
    }

    // Schedule all eligible staged splits for delete
    let split_ids: HashMap<IndexUid, Vec<SplitId>> = deletable_staged_splits
        .into_iter()
        .map(|split| (split.index_uid, split.split_id))
        .into_group_map();
    for (index_uid, split_ids) in split_ids {
        let mark_splits_for_deletion_request =
            MarkSplitsForDeletionRequest::new(index_uid, split_ids);
        protect_future(
            progress_opt,
            metastore.mark_splits_for_deletion(mark_splits_for_deletion_request),
        )
        .await?;
    }

    // We delete splits marked for deletion that have an update timestamp anterior
    // to `now - deletion_grace_period`.
    let updated_before_timestamp =
        OffsetDateTime::now_utc().unix_timestamp() - deletion_grace_period.as_secs() as i64;

    Ok(delete_splits_marked_for_deletion_several_indexes(
        updated_before_timestamp,
        metastore,
        indexes,
        progress_opt,
        metrics,
    )
    .await)
}

async fn delete_splits(
    splits_metadata_to_delete_per_index: HashMap<IndexUid, Vec<SplitMetadata>>,
    storages: &HashMap<IndexUid, Arc<dyn Storage>>,
    metastore: MetastoreServiceClient,
    progress_opt: Option<&Progress>,
    metrics: &Option<GcMetrics>,
    split_removal_info: &mut SplitRemovalInfo,
) -> Result<(), ()> {
    let mut delete_split_from_index_res_stream =
        futures::stream::iter(splits_metadata_to_delete_per_index)
            .map(|(index_uid, splits_metadata_to_delete)| {
                let storage = storages.get(&index_uid).cloned();
                let metastore = metastore.clone();
                async move {
                    if let Some(storage) = storage {
                        delete_splits_from_storage_and_metastore(
                            index_uid,
                            storage,
                            metastore,
                            splits_metadata_to_delete,
                            progress_opt,
                        )
                        .await
                    } else {
                        // in practice this can happen if the index was created between the start of
                        // the run and now, and one of its splits has already expired, which likely
                        // means a very long gc run, or if we run gc on a single index from the cli.
                        quickwit_common::rate_limited_warn!(
                            limit_per_min = 2,
                            index_uid=%index_uid,
                            "we are trying to GC without knowing the storage",
                        );
                        Ok(Vec::new())
                    }
                }
            })
            .buffer_unordered(get_index_gc_concurrency().unwrap_or(10));

    let mut error_encountered = false;
    while let Some(delete_split_result) = delete_split_from_index_res_stream.next().await {
        match delete_split_result {
            Ok(entries) => {
                let deleted_bytes = entries
                    .iter()
                    .map(|entry| entry.file_size_bytes.as_u64())
                    .sum::<u64>();
                let deleted_splits_count = entries.len();

                metrics.record(deleted_splits_count, deleted_bytes, 0);
                split_removal_info.removed_split_entries.extend(entries);
            }
            Err(delete_split_error) => {
                let deleted_bytes = delete_split_error
                    .successes
                    .iter()
                    .map(|entry| entry.file_size_bytes.as_u64())
                    .sum::<u64>();
                let deleted_splits_count = delete_split_error.successes.len();
                let failed_splits_count = delete_split_error.storage_failures.len()
                    + delete_split_error.metastore_failures.len();

                metrics.record(deleted_splits_count, deleted_bytes, failed_splits_count);
                split_removal_info
                    .removed_split_entries
                    .extend(delete_split_error.successes);
                split_removal_info
                    .failed_splits
                    .extend(delete_split_error.storage_failures);
                split_removal_info
                    .failed_splits
                    .extend(delete_split_error.metastore_failures);
                error_encountered = true;
            }
        }
    }
    if error_encountered { Err(()) } else { Ok(()) }
}

/// Fetch the list metadata from the metastore and returns them as a Vec.
async fn list_splits_metadata(
    metastore: &MetastoreServiceClient,
    query: &ListSplitsQuery,
) -> anyhow::Result<Vec<SplitMetadata>> {
    let list_splits_request = ListSplitsRequest::try_from_list_splits_query(query)
        .context("failed to build list splits request")?;
    let splits_to_delete_stream = metastore
        .list_splits(list_splits_request)
        .await
        .context("failed to fetch stream splits")?;
    let splits = splits_to_delete_stream
        .collect_splits_metadata()
        .await
        .context("failed to collect splits")?;
    Ok(splits)
}

/// In order to avoid hammering the load on the metastore, we can throttle the rate of split
/// deletion by setting this environment variable.
fn get_maximum_split_deletion_rate_per_sec() -> Option<usize> {
    static MAX_SPLIT_DELETION_RATE_PER_SEC: OnceLock<Option<usize>> = OnceLock::new();
    *MAX_SPLIT_DELETION_RATE_PER_SEC.get_or_init(|| {
        quickwit_common::get_from_env_opt::<usize>("QW_MAX_SPLIT_DELETION_RATE_PER_SEC", false)
    })
}

fn get_index_gc_concurrency() -> Option<usize> {
    static INDEX_GC_CONCURRENCY: OnceLock<Option<usize>> = OnceLock::new();
    *INDEX_GC_CONCURRENCY.get_or_init(|| {
        quickwit_common::get_from_env_opt::<usize>("QW_INDEX_GC_CONCURRENCY", false)
    })
}

/// Removes any splits marked for deletion which haven't been
/// updated after `updated_before_timestamp` in batches of 1,000 splits.
///
/// Only splits from index_uids in the `storages` map will be deleted.
///
/// The aim of this is to spread the load out across a longer period
/// rather than short, heavy bursts on the metastore and storage system itself.
#[instrument(skip(storages, metastore, progress_opt, metrics), fields(num_indexes=%storages.len()))]
async fn delete_splits_marked_for_deletion_several_indexes(
    updated_before_timestamp: i64,
    metastore: MetastoreServiceClient,
    storages: HashMap<IndexUid, Arc<dyn Storage>>,
    progress_opt: Option<&Progress>,
    metrics: Option<GcMetrics>,
) -> SplitRemovalInfo {
    let mut split_removal_info = SplitRemovalInfo::default();

    // we ask for all indexes because the query is more efficient and we almost always want all
    // indexes anyway. The exception is when garbage collecting a single index from the commandline.
    // In this case, we will log a bunch of warn. i (trinity) consider it worth the more generic
    // code which needs fewer special case while testing, but we could check index_uids len if we
    // think it's a better idea.
    let list_splits_query = ListSplitsQuery::for_all_indexes();

    let mut list_splits_query = list_splits_query
        .with_split_state(SplitState::MarkedForDeletion)
        .with_update_timestamp_lte(updated_before_timestamp)
        .with_limit(DELETE_SPLITS_BATCH_SIZE)
        .sort_by_index_uid();

    loop {
        let sleep_duration: Duration = if let Some(maximum_split_deletion_per_sec) =
            get_maximum_split_deletion_rate_per_sec()
        {
            Duration::from_secs(
                DELETE_SPLITS_BATCH_SIZE.div_ceil(maximum_split_deletion_per_sec) as u64,
            )
        } else {
            Duration::default()
        };
        let sleep_future = tokio::time::sleep(sleep_duration);

        let splits_metadata_to_delete: Vec<SplitMetadata> = match protect_future(
            progress_opt,
            list_splits_metadata(&metastore, &list_splits_query),
        )
        .await
        {
            Ok(splits) => splits,
            Err(list_splits_err) => {
                error!(error=?list_splits_err, "failed to list splits");
                break;
            }
        };

        // We page through the list of splits to delete using a limit and a `search_after` trick.
        // To detect if this is the last page, we check if the number of splits is less than the
        // limit.
        assert!(splits_metadata_to_delete.len() <= DELETE_SPLITS_BATCH_SIZE);
        let splits_to_delete_possibly_remaining =
            splits_metadata_to_delete.len() == DELETE_SPLITS_BATCH_SIZE;

        // set split after which to search for the next loop
        let Some(last_split_metadata) = splits_metadata_to_delete.last() else {
            break;
        };
        list_splits_query = list_splits_query.after_split(last_split_metadata);

        let mut splits_metadata_to_delete_per_index: HashMap<IndexUid, Vec<SplitMetadata>> =
            HashMap::with_capacity(storages.len());

        for meta in splits_metadata_to_delete {
            if !storages.contains_key(&meta.index_uid) {
                rate_limited_info!(limit_per_min=6, index_uid=?meta.index_uid, "split not listed in storage map: skipping");
                continue;
            }
            splits_metadata_to_delete_per_index
                .entry(meta.index_uid.clone())
                .or_default()
                .push(meta);
        }

        // ignore return we continue either way
        let _: Result<(), ()> = delete_splits(
            splits_metadata_to_delete_per_index,
            &storages,
            metastore.clone(),
            progress_opt,
            &metrics,
            &mut split_removal_info,
        )
        .await;

        if splits_to_delete_possibly_remaining {
            sleep_future.await;
        } else {
            // stop the gc if this was the last batch
            // we are guaranteed to make progress due to .after_split()
            break;
        }
    }

    split_removal_info
}

/// Delete a list of splits from the storage and the metastore.
/// It should leave the index and the metastore in good state.
///
/// * `index_id` - The target index id.
/// * `storage - The storage managing the target index.
/// * `metastore` - The metastore managing the target index.
/// * `splits`  - The list of splits to delete.
/// * `progress` - For reporting progress (useful when called from within a quickwit actor).
pub async fn delete_splits_from_storage_and_metastore(
    index_uid: IndexUid,
    storage: Arc<dyn Storage>,
    metastore: MetastoreServiceClient,
    splits: Vec<SplitMetadata>,
    progress_opt: Option<&Progress>,
) -> Result<Vec<SplitInfo>, DeleteSplitsError> {
    let mut split_infos: HashMap<PathBuf, SplitInfo> = HashMap::with_capacity(splits.len());

    for split in splits {
        let split_info = split.as_split_info();
        split_infos.insert(split_info.file_name.clone(), split_info);
    }
    let split_paths = split_infos
        .keys()
        .map(|split_path_buf| split_path_buf.as_path())
        .collect::<Vec<&Path>>();
    let delete_result = protect_future(progress_opt, storage.bulk_delete(&split_paths)).await;

    if let Some(progress) = progress_opt {
        progress.record_progress();
    }
    let mut successes = Vec::with_capacity(split_infos.len());
    let mut storage_error: Option<BulkDeleteError> = None;
    let mut storage_failures = Vec::new();

    match delete_result {
        Ok(_) => successes.extend(split_infos.into_values()),
        Err(bulk_delete_error) => {
            let success_split_paths: HashSet<&PathBuf> =
                bulk_delete_error.successes.iter().collect();
            for (split_path, split_info) in split_infos {
                if success_split_paths.contains(&split_path) {
                    successes.push(split_info);
                } else {
                    storage_failures.push(split_info);
                }
            }
            let failed_split_paths = storage_failures
                .iter()
                .map(|split_info| split_info.file_name.as_path())
                .collect::<Vec<_>>();
            error!(
                error=?bulk_delete_error.error,
                index_id=index_uid.index_id,
                "failed to delete split file(s) {:?} from storage",
                PrettySample::new(&failed_split_paths, 5),
            );
            storage_error = Some(bulk_delete_error);
        }
    };
    if !successes.is_empty() {
        let split_ids: Vec<SplitId> = successes
            .iter()
            .map(|split_info| split_info.split_id.to_string())
            .collect();
        let delete_splits_request = DeleteSplitsRequest {
            index_uid: Some(index_uid.clone()),
            split_ids: split_ids.clone(),
        };
        let metastore_result =
            protect_future(progress_opt, metastore.delete_splits(delete_splits_request)).await;

        if let Err(metastore_error) = metastore_result {
            error!(
                error=?metastore_error,
                index_id=index_uid.index_id,
                "failed to delete split(s) {:?} from metastore",
                PrettySample::new(&split_ids, 5),
            );
            let delete_splits_error = DeleteSplitsError {
                successes: Vec::new(),
                storage_error,
                storage_failures,
                metastore_error: Some(metastore_error),
                metastore_failures: successes,
            };
            return Err(delete_splits_error);
        }
    }
    if !storage_failures.is_empty() {
        let delete_splits_error = DeleteSplitsError {
            successes,
            storage_error,
            storage_failures,
            metastore_error: None,
            metastore_failures: Vec::new(),
        };
        return Err(delete_splits_error);
    }
    Ok(successes)
}

#[cfg(test)]
mod tests {
    use std::time::Duration;

    use itertools::Itertools;
    use quickwit_common::ServiceStream;
    use quickwit_config::IndexConfig;
    use quickwit_metastore::{
        CreateIndexRequestExt, ListSplitsQuery, MetastoreServiceStreamSplitsExt, SplitMetadata,
        SplitState, StageSplitsRequestExt, metastore_for_test,
    };
    use quickwit_proto::metastore::{
        CreateIndexRequest, EntityKind, MockMetastoreService, StageSplitsRequest,
    };
    use quickwit_proto::types::IndexUid;
    use quickwit_storage::{
        BulkDeleteError, DeleteFailure, MockStorage, PutPayload, storage_for_test,
    };

    use super::*;
    use crate::run_garbage_collect;

    fn hashmap<K: Eq + std::hash::Hash, V>(key: K, value: V) -> HashMap<K, V> {
        let mut map = HashMap::new();
        map.insert(key, value);
        map
    }

    #[tokio::test]
    async fn test_run_gc_marks_stale_staged_splits_for_deletion_after_grace_period() {
        let storage = storage_for_test();
        let metastore = metastore_for_test();

        let index_id = "test-run-gc--index";
        let index_uri = format!("ram:///indexes/{index_id}");
        let index_config = IndexConfig::for_test(index_id, &index_uri);
        let create_index_request =
            CreateIndexRequest::try_from_index_config(&index_config).unwrap();
        let index_uid: IndexUid = metastore
            .create_index(create_index_request)
            .await
            .unwrap()
            .index_uid()
            .clone();

        let split_id = "test-run-gc--split";
        let split_metadata = SplitMetadata {
            split_id: split_id.to_string(),
            index_uid: index_uid.clone(),
            ..Default::default()
        };
        let stage_splits_request =
            StageSplitsRequest::try_from_split_metadata(index_uid.clone(), &split_metadata)
                .unwrap();
        metastore.stage_splits(stage_splits_request).await.unwrap();

        let query =
            ListSplitsQuery::for_index(index_uid.clone()).with_split_state(SplitState::Staged);
        let list_splits_request = ListSplitsRequest::try_from_list_splits_query(&query).unwrap();
        assert_eq!(
            metastore
                .list_splits(list_splits_request)
                .await
                .unwrap()
                .collect_splits()
                .await
                .unwrap()
                .len(),
            1
        );

        // The staging grace period hasn't passed yet so the split remains staged.
        run_garbage_collect(
            hashmap(index_uid.clone(), storage.clone()),
            metastore.clone(),
            Duration::from_secs(30),
            Duration::from_secs(30),
            false,
            None,
            None,
        )
        .await
        .unwrap();

        let query =
            ListSplitsQuery::for_index(index_uid.clone()).with_split_state(SplitState::Staged);
        let list_splits_request = ListSplitsRequest::try_from_list_splits_query(&query).unwrap();
        assert_eq!(
            metastore
                .list_splits(list_splits_request)
                .await
                .unwrap()
                .collect_splits()
                .await
                .unwrap()
                .len(),
            1
        );

        // The staging grace period has passed so the split is marked for deletion.
        run_garbage_collect(
            hashmap(index_uid.clone(), storage.clone()),
            metastore.clone(),
            Duration::from_secs(0),
            Duration::from_secs(30),
            false,
            None,
            None,
        )
        .await
        .unwrap();

        let query =
            ListSplitsQuery::for_index(index_uid).with_split_state(SplitState::MarkedForDeletion);
        let list_splits_request = ListSplitsRequest::try_from_list_splits_query(&query).unwrap();
        assert_eq!(
            metastore
                .list_splits(list_splits_request)
                .await
                .unwrap()
                .collect_splits()
                .await
                .unwrap()
                .len(),
            1
        );
    }

    #[tokio::test]
    async fn test_run_gc_deletes_splits_marked_for_deletion_after_grace_period() {
        let storage = storage_for_test();
        let metastore = metastore_for_test();

        let index_id = "test-run-gc--index";
        let index_uri = format!("ram:///indexes/{index_id}");
        let index_config = IndexConfig::for_test(index_id, &index_uri);
        let create_index_request =
            CreateIndexRequest::try_from_index_config(&index_config).unwrap();
        let index_uid: IndexUid = metastore
            .create_index(create_index_request)
            .await
            .unwrap()
            .index_uid()
            .clone();

        let split_id = "test-run-gc--split";
        let split_metadata = SplitMetadata {
            split_id: split_id.to_string(),
            index_uid: index_uid.clone(),
            ..Default::default()
        };
        let stage_splits_request =
            StageSplitsRequest::try_from_split_metadata(index_uid.clone(), &split_metadata)
                .unwrap();
        metastore.stage_splits(stage_splits_request).await.unwrap();
        let mark_splits_for_deletion_request =
            MarkSplitsForDeletionRequest::new(index_uid.clone(), vec![split_id.to_string()]);
        metastore
            .mark_splits_for_deletion(mark_splits_for_deletion_request)
            .await
            .unwrap();

        let query = ListSplitsQuery::for_index(index_uid.clone())
            .with_split_state(SplitState::MarkedForDeletion);
        let list_splits_request = ListSplitsRequest::try_from_list_splits_query(&query).unwrap();
        assert_eq!(
            metastore
                .list_splits(list_splits_request)
                .await
                .unwrap()
                .collect_splits()
                .await
                .unwrap()
                .len(),
            1
        );

        // The delete grace period hasn't passed yet so the split remains marked for deletion.
        run_garbage_collect(
            hashmap(index_uid.clone(), storage.clone()),
            metastore.clone(),
            Duration::from_secs(30),
            Duration::from_secs(30),
            false,
            None,
            None,
        )
        .await
        .unwrap();

        let query = ListSplitsQuery::for_index(index_uid.clone())
            .with_split_state(SplitState::MarkedForDeletion);
        let list_splits_request = ListSplitsRequest::try_from_list_splits_query(&query).unwrap();
        assert_eq!(
            metastore
                .list_splits(list_splits_request)
                .await
                .unwrap()
                .collect_splits()
                .await
                .unwrap()
                .len(),
            1
        );

        // The delete grace period has passed so the split is deleted.
        run_garbage_collect(
            hashmap(index_uid.clone(), storage.clone()),
            metastore.clone(),
            Duration::from_secs(30),
            Duration::from_secs(0),
            false,
            None,
            None,
        )
        .await
        .unwrap();

        let query = ListSplitsQuery::for_index(index_uid);
        let list_splits_request = ListSplitsRequest::try_from_list_splits_query(&query).unwrap();
        assert_eq!(
            metastore
                .list_splits(list_splits_request)
                .await
                .unwrap()
                .collect_splits()
                .await
                .unwrap()
                .len(),
            0
        );
    }

    #[tokio::test]
    async fn test_run_gc_deletes_splits_with_no_split() {
        // Test that we make only 2 calls to the metastore.
        let storage = storage_for_test();
        let mut mock_metastore = MockMetastoreService::new();
        mock_metastore
            .expect_list_splits()
            .times(2)
            .returning(|_| Ok(ServiceStream::empty()));
        run_garbage_collect(
            hashmap(
                IndexUid::new_with_random_ulid("index-test-gc-deletes"),
                storage.clone(),
            ),
            MetastoreServiceClient::from_mock(mock_metastore),
            Duration::from_secs(30),
            Duration::from_secs(30),
            false,
            None,
            None,
        )
        .await
        .unwrap();
    }

    #[tokio::test]
    async fn test_delete_splits_from_storage_and_metastore_happy_path() {
        let storage = storage_for_test();
        let metastore = metastore_for_test();

        let index_id = "test-delete-splits-happy--index";
        let index_uri = format!("ram:///indexes/{index_id}");
        let index_config = IndexConfig::for_test(index_id, &index_uri);
        let create_index_request =
            CreateIndexRequest::try_from_index_config(&index_config).unwrap();
        let index_uid: IndexUid = metastore
            .create_index(create_index_request)
            .await
            .unwrap()
            .index_uid()
            .clone();

        let split_id = "test-delete-splits-happy--split";
        let split_metadata = SplitMetadata {
            split_id: split_id.to_string(),
            index_uid: IndexUid::new_with_random_ulid(index_id),
            ..Default::default()
        };
        let stage_splits_request =
            StageSplitsRequest::try_from_split_metadata(index_uid.clone(), &split_metadata.clone())
                .unwrap();
        metastore.stage_splits(stage_splits_request).await.unwrap();
        let mark_splits_for_deletion =
            MarkSplitsForDeletionRequest::new(index_uid.clone(), vec![split_id.to_string()]);
        metastore
            .mark_splits_for_deletion(mark_splits_for_deletion)
            .await
            .unwrap();

        let split_path_str = format!("{split_id}.split");
        let split_path = Path::new(&split_path_str);
        let payload: Box<dyn PutPayload> = Box::new(vec![0]);
        storage.put(split_path, payload).await.unwrap();
        assert!(storage.exists(split_path).await.unwrap());

        let splits = metastore
            .list_splits(ListSplitsRequest::try_from_index_uid(index_uid.clone()).unwrap())
            .await
            .unwrap()
            .collect_splits()
            .await
            .unwrap();
        assert_eq!(splits.len(), 1);

        let deleted_split_infos = delete_splits_from_storage_and_metastore(
            index_uid.clone(),
            storage.clone(),
            metastore.clone(),
            vec![split_metadata],
            None,
        )
        .await
        .unwrap();

        assert_eq!(deleted_split_infos.len(), 1);
        assert_eq!(deleted_split_infos[0].split_id, split_id,);
        assert_eq!(
            deleted_split_infos[0].file_name,
            Path::new(&format!("{split_id}.split"))
        );
        assert!(!storage.exists(split_path).await.unwrap());
        assert!(
            metastore
                .list_splits(ListSplitsRequest::try_from_index_uid(index_uid).unwrap())
                .await
                .unwrap()
                .collect_splits()
                .await
                .unwrap()
                .is_empty()
        );
    }

    #[tokio::test]
    async fn test_delete_splits_from_storage_and_metastore_storage_error() {
        let mut mock_storage = MockStorage::new();
        mock_storage
            .expect_bulk_delete()
            .return_once(|split_paths| {
                assert_eq!(split_paths.len(), 2);

                let split_paths: Vec<PathBuf> = split_paths
                    .iter()
                    .map(|split_path| split_path.to_path_buf())
                    .sorted()
                    .collect();
                let split_path = split_paths[0].to_path_buf();
                let successes = vec![split_path];

                let split_path = split_paths[1].to_path_buf();
                let delete_failure = DeleteFailure {
                    code: Some("AccessDenied".to_string()),
                    ..Default::default()
                };
                let failures = HashMap::from_iter([(split_path, delete_failure)]);
                let bulk_delete_error = BulkDeleteError {
                    successes,
                    failures,
                    ..Default::default()
                };
                Err(bulk_delete_error)
            });
        let storage = Arc::new(mock_storage);
        let metastore = metastore_for_test();

        let index_id = "test-delete-splits-storage-error--index";
        let index_uri = format!("ram:///indexes/{index_id}");
        let index_config = IndexConfig::for_test(index_id, &index_uri);
        let create_index_request =
            CreateIndexRequest::try_from_index_config(&index_config).unwrap();
        let index_uid: IndexUid = metastore
            .create_index(create_index_request)
            .await
            .unwrap()
            .index_uid()
            .clone();

        let split_id_0 = "test-delete-splits-storage-error--split-0";
        let split_metadata_0 = SplitMetadata {
            split_id: split_id_0.to_string(),
            index_uid: index_uid.clone(),
            ..Default::default()
        };
        let split_id_1 = "test-delete-splits-storage-error--split-1";
        let split_metadata_1 = SplitMetadata {
            split_id: split_id_1.to_string(),
            index_uid: index_uid.clone(),
            ..Default::default()
        };
        let stage_splits_request = StageSplitsRequest::try_from_splits_metadata(
            index_uid.clone(),
            [split_metadata_0.clone(), split_metadata_1.clone()],
        )
        .unwrap();
        metastore.stage_splits(stage_splits_request).await.unwrap();
        let mark_splits_for_deletion_request = MarkSplitsForDeletionRequest::new(
            index_uid.clone(),
            vec![split_id_0.to_string(), split_id_1.to_string()],
        );
        metastore
            .mark_splits_for_deletion(mark_splits_for_deletion_request)
            .await
            .unwrap();

        let error = delete_splits_from_storage_and_metastore(
            index_uid.clone(),
            storage.clone(),
            metastore.clone(),
            vec![split_metadata_0, split_metadata_1],
            None,
        )
        .await
        .unwrap_err();

        assert_eq!(error.successes.len(), 1);
        assert_eq!(error.storage_failures.len(), 1);
        assert_eq!(error.metastore_failures.len(), 0);

        let splits = metastore
            .list_splits(ListSplitsRequest::try_from_index_uid(index_uid).unwrap())
            .await
            .unwrap()
            .collect_splits()
            .await
            .unwrap();
        assert_eq!(splits.len(), 1);
        assert_eq!(splits[0].split_id(), split_id_1);
    }

    #[tokio::test]
    async fn test_delete_splits_from_storage_and_metastore_metastore_error() {
        let mut mock_storage = MockStorage::new();
        mock_storage
            .expect_bulk_delete()
            .return_once(|split_paths| {
                assert_eq!(split_paths.len(), 2);

                let split_path = split_paths[0].to_path_buf();
                let successes = vec![split_path];

                let split_path = split_paths[1].to_path_buf();
                let delete_failure = DeleteFailure {
                    code: Some("AccessDenied".to_string()),
                    ..Default::default()
                };
                let failures = HashMap::from_iter([(split_path, delete_failure)]);
                let bulk_delete_error = BulkDeleteError {
                    successes,
                    failures,
                    ..Default::default()
                };
                Err(bulk_delete_error)
            });
        let storage = Arc::new(mock_storage);

        let index_id = "test-delete-splits-storage-error--index";
        let index_uid = IndexUid::new_with_random_ulid(index_id);

        let mut mock_metastore = MockMetastoreService::new();
        mock_metastore.expect_delete_splits().return_once(|_| {
            Err(MetastoreError::NotFound(EntityKind::Index {
                index_id: index_id.to_string(),
            }))
        });

        let split_id_0 = "test-delete-splits-storage-error--split-0";
        let split_metadata_0 = SplitMetadata {
            split_id: split_id_0.to_string(),
            index_uid: index_uid.clone(),
            ..Default::default()
        };
        let split_id_1 = "test-delete-splits-storage-error--split-1";
        let split_metadata_1 = SplitMetadata {
            split_id: split_id_1.to_string(),
            index_uid: index_uid.clone(),
            ..Default::default()
        };
        let error = delete_splits_from_storage_and_metastore(
            index_uid.clone(),
            storage.clone(),
            MetastoreServiceClient::from_mock(mock_metastore),
            vec![split_metadata_0, split_metadata_1],
            None,
        )
        .await
        .unwrap_err();

        assert!(error.successes.is_empty());
        assert_eq!(error.storage_failures.len(), 1);
        assert_eq!(error.metastore_failures.len(), 1);
    }
}


================================================
FILE: quickwit/quickwit-index-management/src/index.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::{HashMap, HashSet};
use std::path::Path;
use std::time::Duration;

use futures_util::StreamExt;
use itertools::Itertools;
use quickwit_common::fs::{empty_dir, get_cache_directory_path};
use quickwit_common::pretty::PrettySample;
use quickwit_common::rate_limited_error;
use quickwit_config::{IndexConfig, SourceConfig, validate_identifier};
use quickwit_indexing::check_source_connectivity;
use quickwit_metastore::{
    AddSourceRequestExt, CreateIndexResponseExt, IndexMetadata, IndexMetadataResponseExt,
    ListIndexesMetadataResponseExt, ListSplitsQuery, ListSplitsRequestExt,
    MetastoreServiceStreamSplitsExt, SplitInfo, SplitMetadata, SplitState, UpdateIndexRequestExt,
    UpdateSourceRequestExt,
};
use quickwit_proto::metastore::{
    AddSourceRequest, CreateIndexRequest, DeleteIndexRequest, EntityKind, IndexMetadataRequest,
    ListIndexesMetadataRequest, ListSplitsRequest, MarkSplitsForDeletionRequest, MetastoreError,
    MetastoreService, MetastoreServiceClient, ResetSourceCheckpointRequest, UpdateIndexRequest,
    UpdateSourceRequest, serde_utils,
};
use quickwit_proto::types::{IndexUid, SplitId};
use quickwit_proto::{ServiceError, ServiceErrorCode};
use quickwit_storage::{StorageResolver, StorageResolverError};
use thiserror::Error;
use tracing::{error, info};

use crate::garbage_collection::{
    DeleteSplitsError, SplitRemovalInfo, delete_splits_from_storage_and_metastore,
    run_garbage_collect,
};

#[derive(Error, Debug)]
pub enum IndexServiceError {
    #[error("failed to resolve the storage `{0}`")]
    Storage(#[from] StorageResolverError),
    #[error("metastore error `{0}`")]
    Metastore(#[from] MetastoreError),
    #[error("split deletion error `{0}`")]
    SplitDeletion(#[from] DeleteSplitsError),
    #[error("invalid config: {0:#}")]
    InvalidConfig(anyhow::Error),
    #[error("invalid identifier: {0}")]
    InvalidIdentifier(String),
    #[error("operation not allowed: {0}")]
    OperationNotAllowed(String),
    #[error("internal error: {0}")]
    Internal(String),
}

impl ServiceError for IndexServiceError {
    fn error_code(&self) -> ServiceErrorCode {
        match self {
            Self::Internal(err_msg) => {
                rate_limited_error!(limit_per_min = 6, err_msg);
                ServiceErrorCode::Internal
            }
            Self::InvalidConfig(_) => ServiceErrorCode::BadRequest,
            Self::InvalidIdentifier(_) => ServiceErrorCode::BadRequest,
            Self::Metastore(error) => error.error_code(),
            Self::OperationNotAllowed(_) => ServiceErrorCode::Forbidden,
            Self::SplitDeletion(delete_splits_error) => {
                rate_limited_error!(
                    limit_per_min = 6,
                    "index service internal error/split deletion: {delete_splits_error:?}"
                );
                ServiceErrorCode::Internal
            }
            Self::Storage(storage_error) => {
                rate_limited_error!(
                    limit_per_min = 6,
                    "index service internal error/storage {storage_error:?}"
                );
                ServiceErrorCode::Internal
            }
        }
    }
}

/// Index service responsible for creating, updating and deleting indexes.
#[derive(Clone)]
pub struct IndexService {
    metastore: MetastoreServiceClient,
    storage_resolver: StorageResolver,
}

impl IndexService {
    /// Creates an `IndexService`.
    pub fn new(metastore: MetastoreServiceClient, storage_resolver: StorageResolver) -> Self {
        Self {
            metastore,
            storage_resolver,
        }
    }

    pub fn metastore(&self) -> MetastoreServiceClient {
        self.metastore.clone()
    }

    /// Creates an index from `IndexConfig`.
    pub async fn create_index(
        &mut self,
        index_config: IndexConfig,
        overwrite: bool,
    ) -> Result<IndexMetadata, IndexServiceError> {
        validate_storage_uri(&self.storage_resolver, &index_config)
            .await
            .map_err(IndexServiceError::InvalidConfig)?;

        // Delete existing index if it exists.
        if overwrite {
            match self.delete_index(&index_config.index_id, false).await {
                Ok(_)
                | Err(IndexServiceError::Metastore(MetastoreError::NotFound(
                    EntityKind::Index { .. },
                ))) => {
                    // Ignore index not found error.
                }
                Err(error) => {
                    return Err(error);
                }
            }
        }
        let metastore = self.metastore.clone();

        let index_config_json = serde_utils::to_json_str(&index_config)?;

        // Add default sources.
        let source_configs_json = vec![
            serde_utils::to_json_str(&SourceConfig::ingest_api_default())?,
            serde_utils::to_json_str(&SourceConfig::ingest_v2())?,
            serde_utils::to_json_str(&SourceConfig::cli())?,
        ];
        let create_index_request = CreateIndexRequest {
            index_config_json,
            source_configs_json,
        };
        let create_index_response = metastore.create_index(create_index_request).await?;
        let index_metadata = create_index_response.deserialize_index_metadata()?;
        Ok(index_metadata)
    }

    /// Returns the index metadata for the given index ID if it exists.
    pub async fn index_metadata_opt(
        &self,
        index_metadata_request: IndexMetadataRequest,
    ) -> Result<Option<IndexMetadata>, IndexServiceError> {
        let index_metadata_response = self.metastore.index_metadata(index_metadata_request).await;
        match index_metadata_response {
            Ok(index_metadata_response) => {
                let index_metadata = index_metadata_response.deserialize_index_metadata()?;
                Ok(Some(index_metadata))
            }
            Err(MetastoreError::NotFound(_)) => Ok(None),
            Err(error) => Err(IndexServiceError::Metastore(error)),
        }
    }

    /// Updates an index with the given index config.
    pub async fn update_index(
        &self,
        index_uid: IndexUid,
        index_config: IndexConfig,
    ) -> Result<IndexMetadata, IndexServiceError> {
        let update_index_request = UpdateIndexRequest::try_from_updates(
            index_uid,
            &index_config.doc_mapping,
            &index_config.indexing_settings,
            &index_config.ingest_settings,
            &index_config.search_settings,
            &index_config.retention_policy_opt,
        )?;
        let update_index_response = self.metastore.update_index(update_index_request).await?;
        let index_metadata = update_index_response.deserialize_index_metadata()?;
        Ok(index_metadata)
    }

    /// Deletes the index specified with `index_id`.
    /// This is equivalent to running `rm -rf <index path>` for a local index or
    /// `aws s3 rm --recursive <index path>` for a remote Amazon S3 index.
    ///
    /// * `index_id` - The target index Id.
    /// * `dry_run` - Should this only return a list of affected files without performing deletion.
    pub async fn delete_index(
        &mut self,
        index_id: &str,
        dry_run: bool,
    ) -> Result<Vec<SplitInfo>, IndexServiceError> {
        let index_metadata_request = IndexMetadataRequest::for_index_id(index_id.to_string());
        let index_metadata = self
            .metastore
            .index_metadata(index_metadata_request)
            .await?
            .deserialize_index_metadata()?;
        let index_uid = index_metadata.index_uid.clone();
        let index_uri = index_metadata.into_index_config().index_uri.clone();
        let storage = self.storage_resolver.resolve(&index_uri).await?;

        if dry_run {
            let list_splits_request = ListSplitsRequest::try_from_index_uid(index_uid)?;
            let splits_to_delete: Vec<SplitInfo> = self
                .metastore
                .list_splits(list_splits_request)
                .await?
                .collect_splits()
                .await?
                .into_iter()
                .map(|split| split.split_metadata.as_split_info())
                .collect();
            return Ok(splits_to_delete);
        }
        // Schedule staged and published splits for deletion.
        let query = ListSplitsQuery::for_index(index_uid.clone())
            .with_split_states([SplitState::Staged, SplitState::Published]);
        let list_splits_request = ListSplitsRequest::try_from_list_splits_query(&query)?;
        let split_ids: Vec<SplitId> = self
            .metastore
            .list_splits(list_splits_request)
            .await?
            .collect_split_ids()
            .await?;
        let mark_splits_for_deletion_request =
            MarkSplitsForDeletionRequest::new(index_uid.clone(), split_ids);
        self.metastore
            .mark_splits_for_deletion(mark_splits_for_deletion_request)
            .await?;

        // Select splits to delete
        let query = ListSplitsQuery::for_index(index_uid.clone())
            .with_split_state(SplitState::MarkedForDeletion);
        let list_splits_request = ListSplitsRequest::try_from_list_splits_query(&query)?;
        let splits_metadata_to_delete: Vec<SplitMetadata> = self
            .metastore
            .list_splits(list_splits_request)
            .await?
            .collect_splits_metadata()
            .await?;

        let deleted_splits = delete_splits_from_storage_and_metastore(
            index_uid.clone(),
            storage,
            self.metastore.clone(),
            splits_metadata_to_delete,
            None,
        )
        .await?;
        let delete_index_request = DeleteIndexRequest {
            index_uid: Some(index_uid),
        };
        self.metastore.delete_index(delete_index_request).await?;

        Ok(deleted_splits)
    }

    /// Deletes the indexes specified with `index_id_patterns`.
    /// This is a wrapper of delete_index, and support index delete with index pattern
    ///
    /// * `index_id_patterns` - The targeted index ID patterns.
    /// * `dry_run` - Should this only return a list of affected files without performing deletion.
    pub async fn delete_indexes(
        &self,
        index_id_patterns: Vec<String>,
        ignore_missing: bool,
        dry_run: bool,
    ) -> Result<Vec<SplitInfo>, IndexServiceError> {
        let list_indexes_metadatas_request = ListIndexesMetadataRequest {
            index_id_patterns: index_id_patterns.to_owned(),
        };
        // disallow index_id patterns
        for index_id_pattern in &index_id_patterns {
            if index_id_pattern.contains('*') {
                return Err(IndexServiceError::Metastore(
                    MetastoreError::InvalidArgument {
                        message: format!("index_id pattern {index_id_pattern} contains *"),
                    },
                ));
            }
            if index_id_pattern == "_all" {
                return Err(IndexServiceError::Metastore(
                    MetastoreError::InvalidArgument {
                        message: "index_id pattern _all not supported".to_string(),
                    },
                ));
            }
        }

        let metastore = self.metastore.clone();
        let indexes_metadata = metastore
            .list_indexes_metadata(list_indexes_metadatas_request)
            .await?
            .deserialize_indexes_metadata()
            .await?;

        if !ignore_missing && indexes_metadata.len() != index_id_patterns.len() {
            let found_index_ids: HashSet<&str> = indexes_metadata
                .iter()
                .map(|index_metadata| index_metadata.index_id())
                .collect();
            let missing_index_ids: Vec<String> = index_id_patterns
                .iter()
                .filter(|index_id| !found_index_ids.contains(index_id.as_str()))
                .map(|index_id| index_id.to_string())
                .collect_vec();
            return Err(IndexServiceError::Metastore(MetastoreError::NotFound(
                EntityKind::Indexes {
                    index_ids: missing_index_ids.to_vec(),
                },
            )));
        }
        let index_ids = indexes_metadata
            .iter()
            .map(|index_metadata| index_metadata.index_id())
            .collect_vec();
        info!(index_ids = ?PrettySample::new(&index_ids, 5), "delete indexes");

        // setup delete index tasks
        let mut delete_index_tasks = Vec::new();
        for index_id in index_ids {
            let task = async move {
                let result = self.clone().delete_index(index_id, dry_run).await;
                (index_id, result)
            };
            delete_index_tasks.push(task);
        }
        let mut delete_responses: HashMap<String, Vec<SplitInfo>> = HashMap::new();
        let mut delete_errors: HashMap<String, IndexServiceError> = HashMap::new();
        let mut stream = futures::stream::iter(delete_index_tasks).buffer_unordered(5);
        while let Some((index_id, delete_response)) = stream.next().await {
            match delete_response {
                Ok(split_infos) => {
                    delete_responses.insert(index_id.to_string(), split_infos);
                }
                Err(error) => {
                    delete_errors.insert(index_id.to_string(), error);
                }
            }
        }

        if delete_errors.is_empty() {
            let mut concatenated_split_infos = Vec::new();
            for (_, split_info_vec) in delete_responses.into_iter() {
                concatenated_split_infos.extend(split_info_vec);
            }
            Ok(concatenated_split_infos)
        } else {
            Err(IndexServiceError::Metastore(MetastoreError::Internal {
                message: format!("errors occurred when deleting indexes: {index_id_patterns:?}"),
                cause: format!("errors: {delete_errors:?}\ndeleted indexes: {delete_responses:?}"),
            }))
        }
    }
    /// Detect all dangling splits and associated files from the index and removes them.
    ///
    /// * `index_id` - The target index Id.
    /// * `grace_period` -  Threshold period after which a staged split can be garbage collected.
    /// * `dry_run` - Should this only return a list of affected files without performing deletion.
    pub async fn garbage_collect_index(
        &mut self,
        index_id: &str,
        grace_period: Duration,
        dry_run: bool,
    ) -> anyhow::Result<SplitRemovalInfo> {
        let index_metadata_request = IndexMetadataRequest::for_index_id(index_id.to_string());
        let index_metadata = self
            .metastore
            .index_metadata(index_metadata_request)
            .await?
            .deserialize_index_metadata()?;
        let index_uid = index_metadata.index_uid.clone();
        let index_config = index_metadata.into_index_config();
        let storage = self
            .storage_resolver
            .resolve(&index_config.index_uri)
            .await?;

        let deleted_entries = run_garbage_collect(
            [(index_uid, storage)].into_iter().collect(),
            self.metastore.clone(),
            grace_period,
            // deletion_grace_period of zero, so that a cli call directly deletes splits after
            // marking to be deleted.
            Duration::ZERO,
            dry_run,
            None,
            None,
        )
        .await?;

        Ok(deleted_entries)
    }

    /// Clears the index by applying the following actions:
    /// - mark all splits for deletion in the metastore.
    /// - delete the files of all splits marked for deletion using garbage collection.
    /// - delete the splits from the metastore.
    /// - reset all the source checkpoints.
    ///
    /// * `metastore` - A metastore object for interacting with the metastore.
    /// * `index_id` - The target index Id.
    /// * `storage_resolver` - A storage resolver object to access the storage.
    pub async fn clear_index(&mut self, index_id: &str) -> Result<(), IndexServiceError> {
        let index_metadata_request = IndexMetadataRequest::for_index_id(index_id.to_string());
        let index_metadata = self
            .metastore
            .index_metadata(index_metadata_request)
            .await?
            .deserialize_index_metadata()?;
        let index_uid = index_metadata.index_uid.clone();
        let storage = self
            .storage_resolver
            .resolve(index_metadata.index_uri())
            .await?;
        let list_splits_request = ListSplitsRequest::try_from_index_uid(index_uid.clone())?;
        let splits_metadata: Vec<SplitMetadata> = self
            .metastore
            .list_splits(list_splits_request)
            .await?
            .collect_splits_metadata()
            .await?;
        let split_ids: Vec<SplitId> = splits_metadata
            .iter()
            .map(|split| split.split_id.to_string())
            .collect();
        let mark_splits_for_deletion_request =
            MarkSplitsForDeletionRequest::new(index_uid.clone(), split_ids.clone());
        self.metastore
            .mark_splits_for_deletion(mark_splits_for_deletion_request)
            .await?;
        // FIXME: return an error.
        if let Err(err) = delete_splits_from_storage_and_metastore(
            index_uid.clone(),
            storage,
            self.metastore.clone(),
            splits_metadata,
            None,
        )
        .await
        {
            error!(metastore_endpoints=?self.metastore.endpoints(), index_id=%index_id, error=?err, "failed to delete all the split files during garbage collection");
        }
        for source_id in index_metadata.sources.keys() {
            let reset_source_checkpoint_request = ResetSourceCheckpointRequest {
                index_uid: Some(index_uid.clone()),
                source_id: source_id.to_string(),
            };
            self.metastore
                .reset_source_checkpoint(reset_source_checkpoint_request)
                .await?;
        }
        Ok(())
    }

    /// Adds a source to an index identified by its UID.
    pub async fn add_source(
        &mut self,
        index_uid: IndexUid,
        source_config: SourceConfig,
    ) -> Result<SourceConfig, IndexServiceError> {
        let source_id = source_config.source_id.clone();
        // This is a bit redundant, as SourceConfig deserialization also checks
        // that the identifier is valid. However it authorizes the special
        // private names internal to quickwit, so we do an extra check.
        validate_identifier("source", &source_id).map_err(|_| {
            IndexServiceError::InvalidIdentifier(format!("invalid source ID: `{source_id}`"))
        })?;
        check_source_connectivity(&self.storage_resolver, &source_config)
            .await
            .map_err(IndexServiceError::InvalidConfig)?;
        let add_source_request =
            AddSourceRequest::try_from_source_config(index_uid.clone(), &source_config)?;
        self.metastore.add_source(add_source_request).await?;
        info!(
            "source `{}` successfully created for index `{}`",
            source_id, index_uid.index_id,
        );
        let index_metadata_request = IndexMetadataRequest::for_index_id(index_uid.index_id);
        let source = self
            .metastore
            .index_metadata(index_metadata_request)
            .await?
            .deserialize_index_metadata()?
            .sources
            .get(&source_id)
            .ok_or_else(|| {
                IndexServiceError::Internal(
                    "created source is not in index metadata, this should never happen".to_string(),
                )
            })?
            .clone();
        Ok(source)
    }

    /// Updates a source from an index identified by its UID.
    pub async fn update_source(
        &mut self,
        index_uid: IndexUid,
        source_config: SourceConfig,
    ) -> Result<SourceConfig, IndexServiceError> {
        let source_id = source_config.source_id.clone();
        check_source_connectivity(&self.storage_resolver, &source_config)
            .await
            .map_err(IndexServiceError::InvalidConfig)?;
        let update_source_request =
            UpdateSourceRequest::try_from_source_config(index_uid.clone(), &source_config)?;
        self.metastore.update_source(update_source_request).await?;
        info!(
            "source `{source_id}` successfully updated for index `{}`",
            index_uid.index_id
        );
        let index_metadata_request = IndexMetadataRequest::for_index_id(index_uid.index_id);
        let source = self
            .metastore
            .index_metadata(index_metadata_request)
            .await?
            .deserialize_index_metadata()?
            .sources
            .get(&source_id)
            .ok_or_else(|| {
                IndexServiceError::Internal(
                    "created source is not in index metadata, this should never happen".to_string(),
                )
            })?
            .clone();
        Ok(source)
    }

    pub async fn get_source(
        &mut self,
        index_id: &str,
        source_id: &str,
    ) -> Result<SourceConfig, IndexServiceError> {
        let index_metadata_request = IndexMetadataRequest::for_index_id(index_id.to_string());
        let source_config = self
            .metastore
            .index_metadata(index_metadata_request)
            .await?
            .deserialize_index_metadata()?
            .sources
            .get(source_id)
            .ok_or_else(|| {
                IndexServiceError::Metastore(MetastoreError::NotFound(EntityKind::Source {
                    index_id: index_id.to_string(),
                    source_id: source_id.to_string(),
                }))
            })?
            .clone();

        Ok(source_config)
    }
}

/// Clears the cache directory of a given source.
///
/// * `data_dir_path` - Path to directory where data (tmp data, splits kept for caching purpose) is
///   persisted.
pub async fn clear_cache_directory(data_dir_path: &Path) -> anyhow::Result<()> {
    let cache_directory_path = get_cache_directory_path(data_dir_path);
    info!(path = %cache_directory_path.display(), "clearing cache directory");
    empty_dir(&cache_directory_path).await?;
    Ok(())
}

/// Validates the storage URI by effectively resolving it.
pub async fn validate_storage_uri(
    storage_resolver: &StorageResolver,
    index_config: &IndexConfig,
) -> anyhow::Result<()> {
    storage_resolver.resolve(&index_config.index_uri).await?;
    Ok(())
}

#[cfg(test)]
mod tests {

    use quickwit_common::uri::Uri;
    use quickwit_config::{
        CLI_SOURCE_ID, INGEST_API_SOURCE_ID, INGEST_V2_SOURCE_ID, IndexConfig, RetentionPolicy,
    };
    use quickwit_metastore::{
        MetastoreServiceExt, SplitMetadata, StageSplitsRequestExt, metastore_for_test,
    };
    use quickwit_proto::metastore::StageSplitsRequest;
    use quickwit_storage::PutPayload;

    use super::*;

    #[tokio::test]
    async fn test_create_index() {
        let metastore = metastore_for_test();
        let storage_resolver = StorageResolver::for_test();
        let mut index_service = IndexService::new(metastore.clone(), storage_resolver);
        let index_id = "test-index";
        let index_uri = "ram://indexes/test-index";
        let index_config = IndexConfig::for_test(index_id, index_uri);
        let index_metadata_0 = index_service
            .create_index(index_config.clone(), false)
            .await
            .unwrap();
        assert_eq!(index_metadata_0.index_id(), index_id);
        assert_eq!(index_metadata_0.index_uri(), &index_uri);

        assert_eq!(index_metadata_0.sources.len(), 3);
        assert!(index_metadata_0.sources.contains_key(CLI_SOURCE_ID));
        assert!(index_metadata_0.sources.contains_key(INGEST_API_SOURCE_ID));
        assert!(index_metadata_0.sources.contains_key(INGEST_V2_SOURCE_ID));

        assert!(
            metastore
                .index_metadata(IndexMetadataRequest::for_index_id(index_id.to_string()))
                .await
                .is_ok()
        );

        let error = index_service
            .create_index(index_config.clone(), false)
            .await
            .unwrap_err();
        let IndexServiceError::Metastore(inner_error) = error else {
            panic!("expected `MetastoreError` variant, got {error:?}")
        };
        assert!(
            matches!(inner_error, MetastoreError::AlreadyExists(EntityKind::Index { index_id }) if index_id == index_metadata_0.index_id())
        );

        let index_metadata_1 = index_service
            .create_index(index_config, true)
            .await
            .unwrap();
        assert_eq!(index_metadata_1.index_id(), index_id);
        assert_eq!(index_metadata_1.index_uri(), &index_uri);
        assert!(index_metadata_0.index_uid != index_metadata_1.index_uid);
    }

    #[tokio::test]
    async fn test_index_metadata_opt() {
        let metastore = metastore_for_test();
        let storage_resolver = StorageResolver::for_test();
        let mut index_service = IndexService::new(metastore.clone(), storage_resolver);

        let index_id = "test-index";
        let index_metadata_request = IndexMetadataRequest::for_index_id(index_id.to_string());
        let index_metadata = index_service
            .index_metadata_opt(index_metadata_request)
            .await
            .unwrap();
        assert!(index_metadata.is_none());

        let index_uri = "ram://indexes/test-index";
        let index_config = IndexConfig::for_test(index_id, index_uri);
        let index_uid = index_service
            .create_index(index_config.clone(), false)
            .await
            .unwrap()
            .index_uid;
        let index_metadata_request = IndexMetadataRequest::for_index_uid(index_uid.clone());
        let index_metadata = index_service
            .index_metadata_opt(index_metadata_request)
            .await
            .unwrap()
            .unwrap();
        assert_eq!(index_metadata.index_uid, index_uid);
    }

    #[tokio::test]
    async fn test_update_index() {
        let metastore = metastore_for_test();
        let storage_resolver = StorageResolver::for_test();
        let mut index_service = IndexService::new(metastore.clone(), storage_resolver);

        let index_id = "test-index";
        let index_uri = "ram://indexes/test-index";
        let mut index_config = IndexConfig::for_test(index_id, index_uri);
        let index_uid = index_service
            .create_index(index_config.clone(), false)
            .await
            .unwrap()
            .index_uid;

        let retention_policy = RetentionPolicy {
            retention_period: "42 hours".to_string(),
            evaluation_schedule: "hourly".to_string(),
        };
        index_config.retention_policy_opt = Some(retention_policy.clone());

        let updated_index_metadata = index_service
            .update_index(index_uid, index_config)
            .await
            .unwrap();
        let updated_retention_policy = updated_index_metadata
            .index_config
            .retention_policy_opt
            .unwrap();
        assert_eq!(updated_retention_policy, retention_policy);
    }

    #[tokio::test]
    async fn test_delete_index() {
        let mut metastore = metastore_for_test();
        let storage_resolver = StorageResolver::for_test();
        let storage = storage_resolver
            .resolve(&Uri::for_test("ram://indexes/test-index"))
            .await
            .unwrap();
        let mut index_service = IndexService::new(metastore.clone(), storage_resolver);
        let index_id = "test-index";
        let index_uri = "ram://indexes/test-index";
        let index_config = IndexConfig::for_test(index_id, index_uri);
        let index_uid = index_service
            .create_index(index_config.clone(), false)
            .await
            .unwrap()
            .index_uid;

        let split_id = "test-split";
        let split_metadata = SplitMetadata {
            split_id: split_id.to_string(),
            index_uid: index_uid.clone(),
            ..Default::default()
        };
        let stage_splits_request = StageSplitsRequest::try_from_splits_metadata(
            index_uid.clone(),
            vec![split_metadata.clone()],
        )
        .unwrap();
        metastore.stage_splits(stage_splits_request).await.unwrap();

        let splits = metastore
            .list_splits(ListSplitsRequest::try_from_index_uid(index_uid.clone()).unwrap())
            .await
            .unwrap()
            .collect_splits()
            .await
            .unwrap();
        assert_eq!(splits.len(), 1);

        let split_path_str = format!("{split_id}.split");
        let split_path = Path::new(&split_path_str);
        let payload: Box<dyn PutPayload> = Box::new(vec![0]);
        storage.put(split_path, payload).await.unwrap();
        assert!(storage.exists(split_path).await.unwrap());

        let split_infos = index_service.delete_index(index_id, false).await.unwrap();
        assert_eq!(split_infos.len(), 1);

        assert!(!metastore.index_exists(index_id).await.unwrap());
        let splits = metastore
            .list_splits(ListSplitsRequest::try_from_index_uid(index_uid.clone()).unwrap())
            .await
            .unwrap()
            .collect_splits()
            .await
            .unwrap();
        assert!(splits.is_empty());
        assert!(!storage.exists(split_path).await.unwrap());
    }
}


================================================
FILE: quickwit/quickwit-index-management/src/lib.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

mod garbage_collection;
mod index;

pub use garbage_collection::{GcMetrics, run_garbage_collect};
pub use index::{IndexService, IndexServiceError, clear_cache_directory, validate_storage_uri};


================================================
FILE: quickwit/quickwit-indexing/Cargo.toml
================================================
[package]
name = "quickwit-indexing"
description = "Indexing service implementation"

version.workspace = true
edition.workspace = true
homepage.workspace = true
documentation.workspace = true
repository.workspace = true
authors.workspace = true
license.workspace = true

[dependencies]
anyhow = { workspace = true }
arc-swap = { workspace = true }
async-compression = { workspace = true }
async-trait = { workspace = true }
aws-sdk-kinesis = { workspace = true, optional = true }
aws-sdk-sqs = { workspace = true, optional = true }
bytes = { workspace = true }
bytesize = { workspace = true }
fail = { workspace = true }
flume = { workspace = true }
fnv = { workspace = true }
futures = { workspace = true }
google-cloud-auth = { workspace = true, optional = true }
google-cloud-gax = { workspace = true, optional = true }
google-cloud-googleapis = { workspace = true, optional = true }
google-cloud-pubsub = { workspace = true, optional = true }
itertools = { workspace = true }
libz-sys = { workspace = true, optional = true }
once_cell = { workspace = true }
oneshot = { workspace = true }
openssl = { workspace = true, optional = true }
percent-encoding = { workspace = true }
pulsar = { workspace = true, optional = true }
quickwit-query = { workspace = true }
regex = { workspace = true }
rdkafka = { workspace = true, optional = true }
serde = { workspace = true }
serde_json = { workspace = true }
tantivy = { workspace = true }
tempfile = { workspace = true }
thiserror = { workspace = true }
time = { workspace = true }
tokio = { workspace = true }
tracing = { workspace = true }
ulid = { workspace = true }
utoipa = { workspace = true }
vrl = { workspace = true, optional = true }
warp = { workspace = true, optional = true }

quickwit-actors = { workspace = true }
quickwit-aws = { workspace = true }
quickwit-cluster = { workspace = true }
quickwit-common = { workspace = true }
quickwit-config = { workspace = true }
quickwit-directories = { workspace = true }
quickwit-doc-mapper = { workspace = true }
quickwit-ingest = { workspace = true }
quickwit-metastore = { workspace = true }
quickwit-opentelemetry = { workspace = true }
quickwit-proto = { workspace = true }
quickwit-storage = { workspace = true }

[features]
gcp-pubsub = [
  "dep:google-cloud-auth",
  "dep:google-cloud-gax",
  "dep:google-cloud-googleapis",
  "dep:google-cloud-pubsub",
]
gcp-pubsub-emulator-tests = []
kafka = ["rdkafka"]
kafka-broker-tests = []
kinesis = [
  "aws-sdk-kinesis",
  "quickwit-aws/kinesis",
]
kinesis-localstack-tests = []
pulsar = ["dep:pulsar"]
pulsar-broker-tests = []
queue-sources = []
sqs = [
  "aws-sdk-sqs",
  "queue-sources",
  "quickwit-aws/sqs",
]
sqs-test-helpers = ["warp"]
sqs-localstack-tests = ["sqs-test-helpers"]
vendored-kafka = [
  "kafka",
  "libz-sys/static",
  "openssl/vendored",
  "rdkafka/gssapi-vendored",
]
vendored-kafka-macos = ["kafka", "libz-sys/static", "openssl/vendored"]
testsuite = [
  "quickwit-actors/testsuite",
  "quickwit-cluster/testsuite",
  "quickwit-common/testsuite",
  "quickwit-config/testsuite",
  "quickwit-proto/testsuite",
  "quickwit-storage/testsuite"
]
vrl = ["dep:vrl", "quickwit-config/vrl"]
ci-test = []

[dev-dependencies]
bytes = { workspace = true }
criterion = { workspace = true, features = ["async_tokio"] }
mockall = { workspace = true }
proptest = { workspace = true }
prost = { workspace = true }
rand = { workspace = true }
reqwest = { workspace = true }
tempfile = { workspace = true }

quickwit-actors = { workspace = true, features = ["testsuite"] }
quickwit-cluster = { workspace = true, features = ["testsuite"] }
quickwit-common = { workspace = true, features = ["testsuite"] }
quickwit-config = { workspace = true, features = ["testsuite"] }
quickwit-doc-mapper = { workspace = true, features = ["testsuite"] }
quickwit-indexing = { workspace = true, features = ["testsuite"] }
quickwit-ingest = { workspace = true, features = ["testsuite"] }
quickwit-metastore = { workspace = true, features = ["testsuite"] }
quickwit-proto = { workspace = true, features = ["testsuite"] }
quickwit-storage = { workspace = true, features = ["testsuite"] }

[[test]]
name = "failpoints"
path = "failpoints/mod.rs"
required-features = ["fail/failpoints"]

[[bench]]
name = "doc_process_vrl_bench"
harness = false

[package.metadata.cargo-machete]
# used to vendor/static build native dependencies
ignored = ["libz-sys", "openssl"]


================================================
FILE: quickwit/quickwit-indexing/README.md
================================================
```mermaid
flowchart LR
    subgraph Indexing pipeline
        direction LR
        publisher --inf--> source
        source[Source] --10--> doc_processor
        doc_processor[DocProcessor] --10--> indexer
        indexer[Indexer] --1--> serializer
        serializer[IndexSerializer] --1--> packager
        packager[Packager] --0--> uploader
        uploader[Uploader] --2--> sequencer
        sequencer[Sequencer] --1--> publisher
    end
    subgraph Merge pipeline
        direction LR
        merge_downloader[MergeDownloader] --1--> merge_executor
        merge_executor[MergeExecutor] --1--> merge_packager
        merge_packager[MergePackager] --0--> merge_uploader
        merge_uploader[MergeUploader] --inf--> merge_publisher
    end
    merge_planner[MergePlanner] --1--> merge_downloader
    merge_publisher[MergePublisher] --1--> merge_planner
    publisher[Publisher] --1--> merge_planner
```


================================================
FILE: quickwit/quickwit-indexing/benches/data/bench_data.json
================================================
{"id":1,"first_name":"Kearney","last_name":"Paunsford","email":"kpaunsford0@springer.com","job":"VP Sales","timestamp":"2022-07-19T21:48:45Z"}
{"id":2,"first_name":"Robinia","last_name":"Hapgood","email":"rhapgood1@google.co.jp","job":"Recruiter","timestamp":"2022-05-28T01:40:07Z"}
{"id":3,"first_name":"Patrizius","last_name":"O'Henery","email":"pohenery2@narod.ru","job":"VP Quality Control","timestamp":"2022-09-28T02:48:31Z"}
{"id":4,"first_name":"Natalina","last_name":"Jimeno","email":"njimeno3@vimeo.com","job":"Quality Engineer","timestamp":"2022-10-17T07:06:14Z"}
{"id":5,"first_name":"Jerrylee","last_name":"Clemont","email":"jclemont4@nbcnews.com","job":"Geologist IV","timestamp":"2022-03-16T11:22:02Z"}
{"id":6,"first_name":"Alphonse","last_name":"Andrejevic","email":"aandrejevic5@csmonitor.com","job":"Automation Specialist IV","timestamp":"2022-09-25T16:06:30Z"}
{"id":7,"first_name":"Jessamine","last_name":"Sumshon","email":"jsumshon6@buzzfeed.com","job":"Administrative Assistant I","timestamp":"2022-04-19T14:49:00Z"}
{"id":8,"first_name":"Eloisa","last_name":"Mowen","email":"emowen7@mediafire.com","job":"VP Sales","timestamp":"2022-11-28T13:04:32Z"}
{"id":9,"first_name":"Millie","last_name":"Gooda","email":"mgooda8@tinypic.com","job":"Administrative Officer","timestamp":"2022-07-24T06:56:27Z"}
{"id":10,"first_name":"Tarrah","last_name":"Crucitti","email":"tcrucitti9@engadget.com","job":"Chemical Engineer","timestamp":"2022-01-13T20:45:27Z"}
{"id":11,"first_name":"Micaela","last_name":"Giottini","email":"mgiottinia@globo.com","job":"Director of Sales","timestamp":"2022-10-17T12:49:19Z"}
{"id":12,"first_name":"Shannah","last_name":"Goodlet","email":"sgoodletb@i2i.jp","job":"Senior Financial Analyst","timestamp":"2022-09-10T21:24:23Z"}
{"id":13,"first_name":"Carley","last_name":"Gloy","email":"cgloyc@github.io","job":"Sales Representative","timestamp":"2022-06-11T07:20:14Z"}
{"id":14,"first_name":"Eba","last_name":"Simionato","email":"esimionatod@bigcartel.com","job":"VP Sales","timestamp":"2022-04-04T02:02:43Z"}
{"id":15,"first_name":"Camey","last_name":"Walklett","email":"cwalklette@youku.com","job":"Assistant Media Planner","timestamp":"2022-11-21T10:34:51Z"}
{"id":16,"first_name":"Leonore","last_name":"Cowland","email":"lcowlandf@arizona.edu","job":"Administrative Officer","timestamp":"2021-12-13T00:18:33Z"}
{"id":17,"first_name":"Kit","last_name":"Domenici","email":"kdomenicig@icq.com","job":"Chemical Engineer","timestamp":"2022-03-22T10:25:46Z"}
{"id":18,"first_name":"Jewel","last_name":"McGillacoell","email":"jmcgillacoellh@sbwire.com","job":"Software Consultant","timestamp":"2022-09-06T12:27:03Z"}
{"id":19,"first_name":"Arabela","last_name":"Lillicrop","email":"alillicropi@tamu.edu","job":"Biostatistician III","timestamp":"2022-10-22T03:31:14Z"}
{"id":20,"first_name":"Deborah","last_name":"Ridd","email":"driddj@issuu.com","job":"Account Executive","timestamp":"2022-07-26T09:31:38Z"}
{"id":21,"first_name":"Cordula","last_name":"Borthwick","email":"cborthwickk@bloomberg.com","job":"Senior Sales Associate","timestamp":"2022-09-28T18:04:21Z"}
{"id":22,"first_name":"Vincents","last_name":"Fitzjohn","email":"vfitzjohnl@a8.net","job":"Sales Associate","timestamp":"2022-09-17T00:38:00Z"}
{"id":23,"first_name":"Cam","last_name":"Wadworth","email":"cwadworthm@prweb.com","job":"Developer IV","timestamp":"2021-12-28T15:12:11Z"}
{"id":24,"first_name":"Dennison","last_name":"Hedlestone","email":"dhedlestonen@so-net.ne.jp","job":"Clinical Specialist","timestamp":"2022-05-18T20:46:28Z"}
{"id":25,"first_name":"Ibby","last_name":"Stetson","email":"istetsono@aboutads.info","job":"Assistant Media Planner","timestamp":"2022-08-14T02:30:12Z"}
{"id":26,"first_name":"Herc","last_name":"Eivers","email":"heiversp@bloglovin.com","job":"Media Manager IV","timestamp":"2022-03-05T13:51:08Z"}
{"id":27,"first_name":"Christy","last_name":"Brundrett","email":"cbrundrettq@statcounter.com","job":"Budget/Accounting Analyst II","timestamp":"2022-03-08T03:10:55Z"}
{"id":28,"first_name":"Tyler","last_name":"Gregersen","email":"tgregersenr@prnewswire.com","job":"Assistant Professor","timestamp":"2022-10-16T14:14:06Z"}
{"id":29,"first_name":"Karole","last_name":"Worvell","email":"kworvells@fotki.com","job":"Marketing Assistant","timestamp":"2022-06-10T13:21:11Z"}
{"id":30,"first_name":"Lonnard","last_name":"Myton","email":"lmytont@unesco.org","job":"Nuclear Power Engineer","timestamp":"2022-07-25T06:32:06Z"}
{"id":31,"first_name":"Elsey","last_name":"Mingotti","email":"emingottiu@flickr.com","job":"Actuary","timestamp":"2022-09-06T23:11:13Z"}
{"id":32,"first_name":"Coral","last_name":"Roscoe","email":"croscoev@thetimes.co.uk","job":"Food Chemist","timestamp":"2022-03-17T08:08:12Z"}
{"id":33,"first_name":"Clare","last_name":"McErlaine","email":"cmcerlainew@mozilla.org","job":"Senior Quality Engineer","timestamp":"2022-11-06T13:36:06Z"}
{"id":34,"first_name":"Johnny","last_name":"Cattlemull","email":"jcattlemullx@gravatar.com","job":"Registered Nurse","timestamp":"2022-02-22T12:56:06Z"}
{"id":35,"first_name":"Hersch","last_name":"Andreaccio","email":"handreaccioy@hostgator.com","job":"Sales Representative","timestamp":"2022-05-15T11:29:06Z"}
{"id":36,"first_name":"Becky","last_name":"Frentz","email":"bfrentzz@psu.edu","job":"Paralegal","timestamp":"2022-04-15T18:31:28Z"}
{"id":37,"first_name":"Katheryn","last_name":"Gunbie","email":"kgunbie10@feedburner.com","job":"Design Engineer","timestamp":"2022-08-29T10:07:17Z"}
{"id":38,"first_name":"Antonino","last_name":"Reeder","email":"areeder11@ted.com","job":"Paralegal","timestamp":"2022-02-16T14:25:49Z"}
{"id":39,"first_name":"Meghan","last_name":"Pladen","email":"mpladen12@t.co","job":"Business Systems Development Analyst","timestamp":"2022-01-10T12:43:07Z"}
{"id":40,"first_name":"Melloney","last_name":"Nys","email":"mnys13@wix.com","job":"Professor","timestamp":"2022-03-11T23:21:46Z"}
{"id":41,"first_name":"Hilliard","last_name":"McGilben","email":"hmcgilben14@wunderground.com","job":"Junior Executive","timestamp":"2022-10-28T14:13:52Z"}
{"id":42,"first_name":"Olivero","last_name":"Ladson","email":"oladson15@aboutads.info","job":"Dental Hygienist","timestamp":"2022-04-27T15:37:45Z"}
{"id":43,"first_name":"Angelico","last_name":"Cregeen","email":"acregeen16@blog.com","job":"Clinical Specialist","timestamp":"2022-04-24T19:18:44Z"}
{"id":44,"first_name":"Redd","last_name":"Lowseley","email":"rlowseley17@cbsnews.com","job":"Accounting Assistant I","timestamp":"2022-05-06T20:20:58Z"}
{"id":45,"first_name":"Ida","last_name":"Colebrook","email":"icolebrook18@prnewswire.com","job":"Human Resources Assistant III","timestamp":"2022-12-05T14:57:45Z"}
{"id":46,"first_name":"Fritz","last_name":"Corbert","email":"fcorbert19@yelp.com","job":"Financial Analyst","timestamp":"2022-09-07T09:54:05Z"}
{"id":47,"first_name":"Fleming","last_name":"Woodeson","email":"fwoodeson1a@yolasite.com","job":"Speech Pathologist","timestamp":"2022-09-30T13:32:24Z"}
{"id":48,"first_name":"Layney","last_name":"Dispencer","email":"ldispencer1b@bizjournals.com","job":"Research Nurse","timestamp":"2022-09-22T19:15:54Z"}
{"id":49,"first_name":"Chen","last_name":"Glandfield","email":"cglandfield1c@jiathis.com","job":"Statistician III","timestamp":"2022-09-14T17:26:49Z"}
{"id":50,"first_name":"Maurise","last_name":"Braunle","email":"mbraunle1d@craigslist.org","job":"Research Assistant II","timestamp":"2022-12-01T06:05:42Z"}
{"id":51,"first_name":"Nevin","last_name":"McNeely","email":"nmcneely1e@webnode.com","job":"Marketing Assistant","timestamp":"2021-12-10T05:46:45Z"}
{"id":52,"first_name":"Antonie","last_name":"McBean","email":"amcbean1f@nyu.edu","job":"Design Engineer","timestamp":"2021-12-18T14:27:47Z"}
{"id":53,"first_name":"Alonzo","last_name":"Jordin","email":"ajordin1g@printfriendly.com","job":"Administrative Assistant III","timestamp":"2022-03-19T22:48:55Z"}
{"id":54,"first_name":"Laverna","last_name":"McCurtain","email":"lmccurtain1h@guardian.co.uk","job":"Software Test Engineer III","timestamp":"2022-07-20T12:24:51Z"}
{"id":55,"first_name":"Krishna","last_name":"Gerrett","email":"kgerrett1i@slashdot.org","job":"Internal Auditor","timestamp":"2021-12-19T12:20:00Z"}
{"id":56,"first_name":"Jethro","last_name":"Tomkys","email":"jtomkys1j@auda.org.au","job":"Automation Specialist III","timestamp":"2022-06-07T13:54:51Z"}
{"id":57,"first_name":"Blinni","last_name":"Rumgay","email":"brumgay1k@unicef.org","job":"Product Engineer","timestamp":"2022-04-12T05:12:19Z"}
{"id":58,"first_name":"Victoria","last_name":"Booi","email":"vbooi1l@forbes.com","job":"Environmental Specialist","timestamp":"2022-10-14T00:31:26Z"}
{"id":59,"first_name":"Hube","last_name":"Sheers","email":"hsheers1m@behance.net","job":"Payment Adjustment Coordinator","timestamp":"2022-05-30T04:44:02Z"}
{"id":60,"first_name":"Trip","last_name":"Twidle","email":"ttwidle1n@npr.org","job":"Design Engineer","timestamp":"2022-05-31T15:17:27Z"}
{"id":61,"first_name":"Brigida","last_name":"Simony","email":"bsimony1o@about.com","job":"VP Marketing","timestamp":"2022-02-07T21:30:51Z"}
{"id":62,"first_name":"Raynard","last_name":"Prati","email":"rprati1p@digg.com","job":"Recruiter","timestamp":"2022-01-27T06:13:13Z"}
{"id":63,"first_name":"Sylvan","last_name":"Brookes","email":"sbrookes1q@google.ca","job":"Statistician II","timestamp":"2022-10-28T04:52:16Z"}
{"id":64,"first_name":"Adrienne","last_name":"Geeve","email":"ageeve1r@google.com.br","job":"Social Worker","timestamp":"2022-06-08T13:20:30Z"}
{"id":65,"first_name":"Giorgia","last_name":"Tuddenham","email":"gtuddenham1s@nps.gov","job":"Account Executive","timestamp":"2022-07-11T14:53:45Z"}
{"id":66,"first_name":"Flss","last_name":"Ibel","email":"fibel1t@bandcamp.com","job":"Assistant Professor","timestamp":"2021-12-13T18:56:38Z"}
{"id":67,"first_name":"Rubina","last_name":"Seymer","email":"rseymer1u@ted.com","job":"Senior Editor","timestamp":"2022-03-25T08:18:09Z"}
{"id":68,"first_name":"Torie","last_name":"Shorton","email":"tshorton1v@theglobeandmail.com","job":"Data Coordiator","timestamp":"2022-03-02T04:07:55Z"}
{"id":69,"first_name":"Gale","last_name":"Nealand","email":"gnealand1w@usda.gov","job":"Assistant Manager","timestamp":"2022-09-22T04:08:11Z"}
{"id":70,"first_name":"Berkeley","last_name":"Riggey","email":"briggey1x@thetimes.co.uk","job":"Assistant Professor","timestamp":"2022-08-28T05:05:07Z"}
{"id":71,"first_name":"Noelani","last_name":"Guilliland","email":"nguilliland1y@ihg.com","job":"Structural Analysis Engineer","timestamp":"2022-06-02T22:38:23Z"}
{"id":72,"first_name":"Patsy","last_name":"Straniero","email":"pstraniero1z@wisc.edu","job":"Quality Control Specialist","timestamp":"2021-12-27T05:29:04Z"}
{"id":73,"first_name":"Trisha","last_name":"D'Angeli","email":"tdangeli20@networkadvertising.org","job":"Account Executive","timestamp":"2022-01-29T11:16:44Z"}
{"id":74,"first_name":"Arlen","last_name":"Matyja","email":"amatyja21@51.la","job":"Software Engineer I","timestamp":"2022-07-25T17:48:22Z"}
{"id":75,"first_name":"Garvey","last_name":"East","email":"geast22@github.io","job":"Recruiting Manager","timestamp":"2022-01-31T04:47:31Z"}
{"id":76,"first_name":"Pepillo","last_name":"Stigers","email":"pstigers23@va.gov","job":"Web Designer II","timestamp":"2022-04-03T01:00:18Z"}
{"id":77,"first_name":"Channa","last_name":"Johnke","email":"cjohnke24@blogspot.com","job":"Accounting Assistant II","timestamp":"2022-05-20T23:59:39Z"}
{"id":78,"first_name":"Marget","last_name":"Hymer","email":"mhymer25@cam.ac.uk","job":"Paralegal","timestamp":"2022-09-01T11:39:39Z"}
{"id":79,"first_name":"Arthur","last_name":"Leveridge","email":"aleveridge26@bing.com","job":"Structural Analysis Engineer","timestamp":"2021-12-09T22:58:01Z"}
{"id":80,"first_name":"Tiebout","last_name":"Sharples","email":"tsharples27@instagram.com","job":"Software Consultant","timestamp":"2022-03-13T04:09:09Z"}
{"id":81,"first_name":"Trixie","last_name":"O'Mullaney","email":"tomullaney28@redcross.org","job":"Mechanical Systems Engineer","timestamp":"2022-09-03T22:54:46Z"}
{"id":82,"first_name":"Karmen","last_name":"Baline","email":"kbaline29@uol.com.br","job":"Design Engineer","timestamp":"2022-02-05T02:43:57Z"}
{"id":83,"first_name":"Bonnee","last_name":"Whorall","email":"bwhorall2a@skype.com","job":"Junior Executive","timestamp":"2022-11-11T11:49:13Z"}
{"id":84,"first_name":"Tony","last_name":"Slafford","email":"tslafford2b@tripadvisor.com","job":"Assistant Professor","timestamp":"2022-08-28T11:45:10Z"}
{"id":85,"first_name":"Janifer","last_name":"Mixer","email":"jmixer2c@pagesperso-orange.fr","job":"Office Assistant II","timestamp":"2022-07-25T14:56:19Z"}
{"id":86,"first_name":"Haroun","last_name":"Diddams","email":"hdiddams2d@nasa.gov","job":"Analog Circuit Design manager","timestamp":"2022-07-13T04:39:35Z"}
{"id":87,"first_name":"Kelcey","last_name":"Fardell","email":"kfardell2e@dropbox.com","job":"Software Test Engineer I","timestamp":"2022-11-18T00:20:54Z"}
{"id":88,"first_name":"Ricard","last_name":"Scotti","email":"rscotti2f@live.com","job":"Nurse Practicioner","timestamp":"2022-06-09T19:59:33Z"}
{"id":89,"first_name":"Noell","last_name":"Tremathack","email":"ntremathack2g@nih.gov","job":"Food Chemist","timestamp":"2022-10-11T05:03:53Z"}
{"id":90,"first_name":"Jorge","last_name":"McIlhagga","email":"jmcilhagga2h@eventbrite.com","job":"Media Manager II","timestamp":"2022-04-03T20:52:05Z"}
{"id":91,"first_name":"Clerc","last_name":"Geraud","email":"cgeraud2i@answers.com","job":"Chemical Engineer","timestamp":"2022-06-11T22:00:49Z"}
{"id":92,"first_name":"Waverley","last_name":"Patnelli","email":"wpatnelli2j@cyberchimps.com","job":"Software Engineer III","timestamp":"2022-08-31T13:44:36Z"}
{"id":93,"first_name":"Angele","last_name":"Kenzie","email":"akenzie2k@vimeo.com","job":"Database Administrator III","timestamp":"2022-10-30T00:24:41Z"}
{"id":94,"first_name":"Mikkel","last_name":"Faveryear","email":"mfaveryear2l@com.com","job":"Occupational Therapist","timestamp":"2022-11-01T05:50:01Z"}
{"id":95,"first_name":"Hadleigh","last_name":"Selvey","email":"hselvey2m@liveinternet.ru","job":"Accounting Assistant IV","timestamp":"2022-01-12T07:45:38Z"}
{"id":96,"first_name":"Witty","last_name":"Shapira","email":"wshapira2n@behance.net","job":"Senior Cost Accountant","timestamp":"2022-02-27T01:22:32Z"}
{"id":97,"first_name":"Wynn","last_name":"Tamplin","email":"wtamplin2o@liveinternet.ru","job":"General Manager","timestamp":"2022-07-27T17:19:59Z"}
{"id":98,"first_name":"Thacher","last_name":"Greenhough","email":"tgreenhough2p@pbs.org","job":"Registered Nurse","timestamp":"2022-03-23T20:34:04Z"}
{"id":99,"first_name":"Gerladina","last_name":"Kirby","email":"gkirby2q@prweb.com","job":"Web Designer III","timestamp":"2022-08-12T13:15:37Z"}
{"id":100,"first_name":"Leanna","last_name":"Wallbutton","email":"lwallbutton2r@independent.co.uk","job":"Pharmacist","timestamp":"2022-11-19T12:42:02Z"}
{"id":101,"first_name":"Sheela","last_name":"Kepe","email":"skepe2s@addtoany.com","job":"Help Desk Technician","timestamp":"2022-08-02T10:51:10Z"}
{"id":102,"first_name":"Clo","last_name":"Ronan","email":"cronan2t@scribd.com","job":"Help Desk Operator","timestamp":"2022-09-13T21:04:16Z"}
{"id":103,"first_name":"Lurlene","last_name":"Adame","email":"ladame2u@soup.io","job":"Clinical Specialist","timestamp":"2022-08-19T05:41:48Z"}
{"id":104,"first_name":"Pebrook","last_name":"Balshaw","email":"pbalshaw2v@who.int","job":"Office Assistant IV","timestamp":"2022-10-17T00:17:21Z"}
{"id":105,"first_name":"Tadd","last_name":"Monsey","email":"tmonsey2w@spiegel.de","job":"Senior Editor","timestamp":"2022-07-28T18:03:25Z"}
{"id":106,"first_name":"Mireille","last_name":"Milkin","email":"mmilkin2x@theatlantic.com","job":"GIS Technical Architect","timestamp":"2022-09-22T05:28:48Z"}
{"id":107,"first_name":"Bunni","last_name":"Prowting","email":"bprowting2y@t.co","job":"Geological Engineer","timestamp":"2022-03-15T18:58:57Z"}
{"id":108,"first_name":"Tandie","last_name":"Buddle","email":"tbuddle2z@vk.com","job":"Nurse","timestamp":"2022-05-13T10:10:46Z"}
{"id":109,"first_name":"Sheryl","last_name":"Blair","email":"sblair30@discuz.net","job":"Administrative Assistant III","timestamp":"2022-08-16T15:44:54Z"}
{"id":110,"first_name":"Daveen","last_name":"Liebmann","email":"dliebmann31@nationalgeographic.com","job":"Professor","timestamp":"2022-10-22T09:16:28Z"}
{"id":111,"first_name":"Udall","last_name":"Essel","email":"uessel32@canalblog.com","job":"Speech Pathologist","timestamp":"2022-07-09T11:08:07Z"}
{"id":112,"first_name":"Nev","last_name":"Cromarty","email":"ncromarty33@army.mil","job":"Structural Analysis Engineer","timestamp":"2022-10-16T22:56:59Z"}
{"id":113,"first_name":"Lara","last_name":"Pundy","email":"lpundy34@pbs.org","job":"Environmental Tech","timestamp":"2021-12-30T22:19:17Z"}
{"id":114,"first_name":"Llywellyn","last_name":"Stockman","email":"lstockman35@senate.gov","job":"VP Product Management","timestamp":"2022-07-10T22:41:56Z"}
{"id":115,"first_name":"Ingrim","last_name":"Arkow","email":"iarkow36@jiathis.com","job":"Speech Pathologist","timestamp":"2022-07-25T03:36:14Z"}
{"id":116,"first_name":"Jamima","last_name":"Hedley","email":"jhedley37@epa.gov","job":"Legal Assistant","timestamp":"2022-07-08T02:00:55Z"}
{"id":117,"first_name":"Kippie","last_name":"Danilchev","email":"kdanilchev38@reddit.com","job":"Payment Adjustment Coordinator","timestamp":"2022-03-26T23:52:43Z"}
{"id":118,"first_name":"Dacie","last_name":"Basnall","email":"dbasnall39@cnn.com","job":"Electrical Engineer","timestamp":"2022-11-04T17:52:54Z"}
{"id":119,"first_name":"Frazer","last_name":"McVeighty","email":"fmcveighty3a@soundcloud.com","job":"Research Assistant IV","timestamp":"2021-12-16T11:04:03Z"}
{"id":120,"first_name":"Dynah","last_name":"Cecely","email":"dcecely3b@icq.com","job":"Research Associate","timestamp":"2022-05-14T03:58:47Z"}
{"id":121,"first_name":"Hermie","last_name":"Conlaund","email":"hconlaund3c@timesonline.co.uk","job":"Help Desk Technician","timestamp":"2022-01-19T11:35:16Z"}
{"id":122,"first_name":"Lindi","last_name":"Newling","email":"lnewling3d@gmpg.org","job":"Programmer I","timestamp":"2022-11-27T08:23:47Z"}
{"id":123,"first_name":"Oralia","last_name":"Ballefant","email":"oballefant3e@wiley.com","job":"Research Nurse","timestamp":"2022-11-01T06:10:30Z"}
{"id":124,"first_name":"Ava","last_name":"Monks","email":"amonks3f@google.es","job":"Senior Cost Accountant","timestamp":"2022-07-19T18:58:10Z"}
{"id":125,"first_name":"Donnamarie","last_name":"Tattersfield","email":"dtattersfield3g@constantcontact.com","job":"Chief Design Engineer","timestamp":"2022-08-14T22:55:33Z"}
{"id":126,"first_name":"Ketti","last_name":"Peealess","email":"kpeealess3h@woothemes.com","job":"Financial Advisor","timestamp":"2022-03-21T13:31:34Z"}
{"id":127,"first_name":"Gerti","last_name":"Pearlman","email":"gpearlman3i@constantcontact.com","job":"GIS Technical Architect","timestamp":"2022-01-19T08:47:13Z"}
{"id":128,"first_name":"Verna","last_name":"Thynne","email":"vthynne3j@opera.com","job":"Structural Engineer","timestamp":"2022-05-31T01:48:56Z"}
{"id":129,"first_name":"Arlen","last_name":"Coit","email":"acoit3k@apache.org","job":"Software Engineer IV","timestamp":"2022-09-08T06:29:36Z"}
{"id":130,"first_name":"Agna","last_name":"Oliveti","email":"aoliveti3l@imageshack.us","job":"Sales Representative","timestamp":"2022-10-24T20:06:30Z"}
{"id":131,"first_name":"Ellette","last_name":"Aggott","email":"eaggott3m@myspace.com","job":"Structural Engineer","timestamp":"2022-09-03T16:17:21Z"}
{"id":132,"first_name":"Candice","last_name":"Tembridge","email":"ctembridge3n@csmonitor.com","job":"Tax Accountant","timestamp":"2022-10-24T09:30:41Z"}
{"id":133,"first_name":"Vinnie","last_name":"Duffie","email":"vduffie3o@pcworld.com","job":"Occupational Therapist","timestamp":"2022-02-04T17:03:25Z"}
{"id":134,"first_name":"Fifine","last_name":"O'Dogherty","email":"fodogherty3p@behance.net","job":"Registered Nurse","timestamp":"2022-03-28T23:59:44Z"}
{"id":135,"first_name":"Raine","last_name":"Kerins","email":"rkerins3q@economist.com","job":"Database Administrator III","timestamp":"2022-01-19T03:25:36Z"}
{"id":136,"first_name":"Arabel","last_name":"McUre","email":"amcure3r@wired.com","job":"Speech Pathologist","timestamp":"2021-12-23T21:06:54Z"}
{"id":137,"first_name":"Cissy","last_name":"Olligan","email":"colligan3s@mysql.com","job":"Compensation Analyst","timestamp":"2021-12-12T22:19:29Z"}
{"id":138,"first_name":"Pierson","last_name":"Kornilyev","email":"pkornilyev3t@hp.com","job":"Information Systems Manager","timestamp":"2022-01-08T23:17:36Z"}
{"id":139,"first_name":"Eve","last_name":"Bostock","email":"ebostock3u@answers.com","job":"Human Resources Assistant IV","timestamp":"2022-04-09T22:00:21Z"}
{"id":140,"first_name":"Franciskus","last_name":"Bakesef","email":"fbakesef3v@yellowpages.com","job":"Structural Analysis Engineer","timestamp":"2022-03-09T04:42:58Z"}
{"id":141,"first_name":"Junette","last_name":"Bathersby","email":"jbathersby3w@baidu.com","job":"Programmer Analyst I","timestamp":"2022-05-08T16:10:27Z"}
{"id":142,"first_name":"Lyda","last_name":"Marchi","email":"lmarchi3x@digg.com","job":"Media Manager I","timestamp":"2022-11-27T04:28:38Z"}
{"id":143,"first_name":"Alasdair","last_name":"Kahler","email":"akahler3y@wisc.edu","job":"Assistant Manager","timestamp":"2022-02-07T13:51:07Z"}
{"id":144,"first_name":"Nessie","last_name":"Stockdale","email":"nstockdale3z@vinaora.com","job":"GIS Technical Architect","timestamp":"2021-12-11T07:04:34Z"}
{"id":145,"first_name":"Bastien","last_name":"Syalvester","email":"bsyalvester40@nationalgeographic.com","job":"Administrative Assistant III","timestamp":"2022-11-06T09:08:18Z"}
{"id":146,"first_name":"Ranique","last_name":"Youson","email":"ryouson41@simplemachines.org","job":"Nurse","timestamp":"2022-03-05T23:16:26Z"}
{"id":147,"first_name":"Ruddy","last_name":"Koop","email":"rkoop42@webnode.com","job":"Programmer IV","timestamp":"2022-06-23T11:31:40Z"}
{"id":148,"first_name":"Midge","last_name":"Trengove","email":"mtrengove43@lulu.com","job":"Director of Sales","timestamp":"2022-05-14T08:08:26Z"}
{"id":149,"first_name":"Hally","last_name":"Pettendrich","email":"hpettendrich44@washington.edu","job":"Operator","timestamp":"2022-01-17T00:32:17Z"}
{"id":150,"first_name":"Elfrieda","last_name":"Sorey","email":"esorey45@hc360.com","job":"Operator","timestamp":"2022-03-25T05:03:24Z"}
{"id":151,"first_name":"Arnuad","last_name":"Cridlin","email":"acridlin46@yandex.ru","job":"Design Engineer","timestamp":"2022-07-23T22:58:32Z"}
{"id":152,"first_name":"Cati","last_name":"Dunkersley","email":"cdunkersley47@umich.edu","job":"Financial Analyst","timestamp":"2022-09-09T12:53:00Z"}
{"id":153,"first_name":"Phillis","last_name":"Hollow","email":"phollow48@printfriendly.com","job":"Assistant Manager","timestamp":"2022-07-18T16:51:18Z"}
{"id":154,"first_name":"Annadiana","last_name":"Stovold","email":"astovold49@uiuc.edu","job":"Staff Scientist","timestamp":"2022-01-29T17:31:28Z"}
{"id":155,"first_name":"Shurwood","last_name":"Jurewicz","email":"sjurewicz4a@bloglovin.com","job":"Senior Financial Analyst","timestamp":"2022-02-05T22:03:30Z"}
{"id":156,"first_name":"Sibelle","last_name":"Wordesworth","email":"swordesworth4b@msn.com","job":"Financial Advisor","timestamp":"2022-05-26T04:44:42Z"}
{"id":157,"first_name":"Sandy","last_name":"Bau","email":"sbau4c@tinyurl.com","job":"Professor","timestamp":"2022-07-16T21:47:35Z"}
{"id":158,"first_name":"Moise","last_name":"Habens","email":"mhabens4d@nationalgeographic.com","job":"Internal Auditor","timestamp":"2022-03-01T13:48:25Z"}
{"id":159,"first_name":"Hoyt","last_name":"Measom","email":"hmeasom4e@github.io","job":"Administrative Assistant I","timestamp":"2022-05-10T17:51:28Z"}
{"id":160,"first_name":"Skell","last_name":"Siene","email":"ssiene4f@networkadvertising.org","job":"Physical Therapy Assistant","timestamp":"2022-10-20T12:11:04Z"}
{"id":161,"first_name":"Abbey","last_name":"Sainte Paul","email":"asaintepaul4g@howstuffworks.com","job":"Systems Administrator III","timestamp":"2022-03-04T12:17:58Z"}
{"id":162,"first_name":"Adriana","last_name":"Mault","email":"amault4h@ted.com","job":"Occupational Therapist","timestamp":"2021-12-15T16:58:31Z"}
{"id":163,"first_name":"Nerty","last_name":"Cullin","email":"ncullin4i@geocities.com","job":"Junior Executive","timestamp":"2022-06-02T04:14:19Z"}
{"id":164,"first_name":"Monroe","last_name":"Conlon","email":"mconlon4j@cnn.com","job":"Web Designer I","timestamp":"2022-07-05T16:54:18Z"}
{"id":165,"first_name":"Rena","last_name":"Penticost","email":"rpenticost4k@spiegel.de","job":"Assistant Media Planner","timestamp":"2021-12-15T19:04:42Z"}
{"id":166,"first_name":"Letisha","last_name":"Kitchingman","email":"lkitchingman4l@sphinn.com","job":"Structural Engineer","timestamp":"2022-12-05T04:33:23Z"}
{"id":167,"first_name":"Denney","last_name":"Playdon","email":"dplaydon4m@google.cn","job":"Systems Administrator IV","timestamp":"2022-06-17T08:30:54Z"}
{"id":168,"first_name":"Aprilette","last_name":"Ruffles","email":"aruffles4n@meetup.com","job":"Budget/Accounting Analyst III","timestamp":"2022-01-13T19:32:29Z"}
{"id":169,"first_name":"Rosalie","last_name":"Strutz","email":"rstrutz4o@guardian.co.uk","job":"Teacher","timestamp":"2022-02-21T22:44:51Z"}
{"id":170,"first_name":"Paxon","last_name":"Snoden","email":"psnoden4p@examiner.com","job":"Biostatistician II","timestamp":"2022-01-01T02:59:32Z"}
{"id":171,"first_name":"Son","last_name":"Clifforth","email":"sclifforth4q@wordpress.org","job":"Physical Therapy Assistant","timestamp":"2022-07-01T02:10:25Z"}
{"id":172,"first_name":"Pebrook","last_name":"Rollinshaw","email":"prollinshaw4r@gizmodo.com","job":"Help Desk Technician","timestamp":"2022-11-29T05:24:36Z"}
{"id":173,"first_name":"Harrison","last_name":"Steade","email":"hsteade4s@creativecommons.org","job":"Web Developer II","timestamp":"2022-10-18T08:29:27Z"}
{"id":174,"first_name":"Ardra","last_name":"MacConnal","email":"amacconnal4t@telegraph.co.uk","job":"Systems Administrator IV","timestamp":"2022-07-04T09:04:39Z"}
{"id":175,"first_name":"Donnajean","last_name":"Carabine","email":"dcarabine4u@de.vu","job":"Quality Control Specialist","timestamp":"2022-04-30T00:46:50Z"}
{"id":176,"first_name":"Jamey","last_name":"MacLardie","email":"jmaclardie4v@hp.com","job":"Community Outreach Specialist","timestamp":"2022-07-16T17:25:21Z"}
{"id":177,"first_name":"Jarrad","last_name":"Stockall","email":"jstockall4w@google.cn","job":"Actuary","timestamp":"2022-08-21T17:39:00Z"}
{"id":178,"first_name":"Eolande","last_name":"Tchir","email":"etchir4x@amazon.co.uk","job":"Research Nurse","timestamp":"2022-10-31T17:01:24Z"}
{"id":179,"first_name":"Carilyn","last_name":"Bindon","email":"cbindon4y@t.co","job":"Engineer III","timestamp":"2022-11-27T12:30:07Z"}
{"id":180,"first_name":"Lenore","last_name":"Davidescu","email":"ldavidescu4z@nytimes.com","job":"Legal Assistant","timestamp":"2022-09-18T15:32:28Z"}
{"id":181,"first_name":"Catherina","last_name":"Gowdie","email":"cgowdie50@smh.com.au","job":"Statistician IV","timestamp":"2022-09-23T15:13:19Z"}
{"id":182,"first_name":"Reena","last_name":"Elgram","email":"relgram51@etsy.com","job":"Geologist IV","timestamp":"2022-09-10T05:24:05Z"}
{"id":183,"first_name":"Vergil","last_name":"Saice","email":"vsaice52@domainmarket.com","job":"Project Manager","timestamp":"2022-04-01T12:59:25Z"}
{"id":184,"first_name":"Brose","last_name":"Titterell","email":"btitterell53@arizona.edu","job":"Community Outreach Specialist","timestamp":"2022-08-01T18:28:09Z"}
{"id":185,"first_name":"Waiter","last_name":"Slimon","email":"wslimon54@tuttocitta.it","job":"Research Associate","timestamp":"2022-08-04T22:18:40Z"}
{"id":186,"first_name":"Dawna","last_name":"Avard","email":"davard55@nhs.uk","job":"Electrical Engineer","timestamp":"2021-12-08T08:41:45Z"}
{"id":187,"first_name":"Geoff","last_name":"Erickson","email":"gerickson56@meetup.com","job":"Research Assistant I","timestamp":"2022-07-29T02:19:03Z"}
{"id":188,"first_name":"Orsa","last_name":"Wapples","email":"owapples57@unesco.org","job":"Engineer IV","timestamp":"2022-08-15T23:47:42Z"}
{"id":189,"first_name":"Lana","last_name":"Rawlin","email":"lrawlin58@surveymonkey.com","job":"Speech Pathologist","timestamp":"2022-02-15T21:01:49Z"}
{"id":190,"first_name":"Nydia","last_name":"Minet","email":"nminet59@umn.edu","job":"Engineer III","timestamp":"2022-10-24T09:35:38Z"}
{"id":191,"first_name":"Eadith","last_name":"Kornes","email":"ekornes5a@deliciousdays.com","job":"Biostatistician IV","timestamp":"2022-03-25T15:57:40Z"}
{"id":192,"first_name":"Kessia","last_name":"Spavins","email":"kspavins5b@mtv.com","job":"Speech Pathologist","timestamp":"2022-07-29T06:08:11Z"}
{"id":193,"first_name":"Lana","last_name":"Van Hesteren","email":"lvanhesteren5c@booking.com","job":"Director of Sales","timestamp":"2022-03-16T16:39:52Z"}
{"id":194,"first_name":"Sol","last_name":"McRill","email":"smcrill5d@buzzfeed.com","job":"Administrative Assistant I","timestamp":"2022-03-31T19:40:50Z"}
{"id":195,"first_name":"Layla","last_name":"Melling","email":"lmelling5e@skyrock.com","job":"Analyst Programmer","timestamp":"2022-05-19T05:55:38Z"}
{"id":196,"first_name":"Erhard","last_name":"Hendrik","email":"ehendrik5f@smugmug.com","job":"VP Sales","timestamp":"2021-12-26T20:22:51Z"}
{"id":197,"first_name":"Ailbert","last_name":"Quarles","email":"aquarles5g@seattletimes.com","job":"Speech Pathologist","timestamp":"2022-10-09T04:40:12Z"}
{"id":198,"first_name":"Tabby","last_name":"Colt","email":"tcolt5h@theglobeandmail.com","job":"Senior Financial Analyst","timestamp":"2022-02-01T04:06:23Z"}
{"id":199,"first_name":"Andee","last_name":"Longbone","email":"alongbone5i@istockphoto.com","job":"Budget/Accounting Analyst II","timestamp":"2022-05-10T17:39:08Z"}
{"id":200,"first_name":"Marlowe","last_name":"Camsey","email":"mcamsey5j@earthlink.net","job":"Recruiter","timestamp":"2022-01-12T17:12:21Z"}
{"id":201,"first_name":"Gregorius","last_name":"Mincini","email":"gmincini5k@sakura.ne.jp","job":"Automation Specialist II","timestamp":"2022-08-02T17:15:49Z"}
{"id":202,"first_name":"Kath","last_name":"Minci","email":"kminci5l@mozilla.org","job":"Nuclear Power Engineer","timestamp":"2022-06-14T16:37:46Z"}
{"id":203,"first_name":"Harmonie","last_name":"Dorricott","email":"hdorricott5m@pagesperso-orange.fr","job":"Administrative Officer","timestamp":"2022-02-28T08:11:46Z"}
{"id":204,"first_name":"Isidro","last_name":"Hillum","email":"ihillum5n@telegraph.co.uk","job":"Account Representative II","timestamp":"2022-06-01T20:52:51Z"}
{"id":205,"first_name":"Gabie","last_name":"McEniry","email":"gmceniry5o@wikispaces.com","job":"Financial Analyst","timestamp":"2022-01-05T15:30:32Z"}
{"id":206,"first_name":"Wynne","last_name":"Amorts","email":"wamorts5p@thetimes.co.uk","job":"Editor","timestamp":"2022-05-13T00:02:48Z"}
{"id":207,"first_name":"Timothee","last_name":"O'Finan","email":"tofinan5q@tripod.com","job":"Research Associate","timestamp":"2022-01-08T21:30:02Z"}
{"id":208,"first_name":"Alfreda","last_name":"Kures","email":"akures5r@hhs.gov","job":"Automation Specialist II","timestamp":"2022-04-11T12:16:06Z"}
{"id":209,"first_name":"Diannne","last_name":"Tiesman","email":"dtiesman5s@pen.io","job":"Environmental Specialist","timestamp":"2022-07-06T01:41:13Z"}
{"id":210,"first_name":"Leisha","last_name":"Peasee","email":"lpeasee5t@bloomberg.com","job":"Associate Professor","timestamp":"2022-10-22T08:35:54Z"}
{"id":211,"first_name":"Demetri","last_name":"Broom","email":"dbroom5u@oaic.gov.au","job":"Director of Sales","timestamp":"2022-12-06T07:28:25Z"}
{"id":212,"first_name":"Simone","last_name":"Chisholm","email":"schisholm5v@go.com","job":"Paralegal","timestamp":"2022-09-05T09:33:00Z"}
{"id":213,"first_name":"Siobhan","last_name":"Ironmonger","email":"sironmonger5w@mit.edu","job":"Database Administrator I","timestamp":"2022-08-29T19:18:51Z"}
{"id":214,"first_name":"Candra","last_name":"Tern","email":"ctern5x@hud.gov","job":"Chief Design Engineer","timestamp":"2021-12-30T13:10:59Z"}
{"id":215,"first_name":"Charla","last_name":"Bearward","email":"cbearward5y@dyndns.org","job":"Paralegal","timestamp":"2022-11-14T00:49:58Z"}
{"id":216,"first_name":"Flynn","last_name":"Waring","email":"fwaring5z@disqus.com","job":"Mechanical Systems Engineer","timestamp":"2022-06-12T12:06:46Z"}
{"id":217,"first_name":"Laetitia","last_name":"Haggleton","email":"lhaggleton60@reverbnation.com","job":"Software Test Engineer I","timestamp":"2021-12-16T04:43:32Z"}
{"id":218,"first_name":"Robin","last_name":"Garritley","email":"rgarritley61@hexun.com","job":"Structural Analysis Engineer","timestamp":"2022-02-11T00:24:01Z"}
{"id":219,"first_name":"Rosie","last_name":"Ladyman","email":"rladyman62@mashable.com","job":"Structural Engineer","timestamp":"2022-08-07T13:55:28Z"}
{"id":220,"first_name":"Asia","last_name":"Ellerman","email":"aellerman63@arstechnica.com","job":"Food Chemist","timestamp":"2022-01-23T06:14:00Z"}
{"id":221,"first_name":"Christye","last_name":"McWhan","email":"cmcwhan64@github.com","job":"Recruiter","timestamp":"2022-05-24T01:03:07Z"}
{"id":222,"first_name":"Johanna","last_name":"Khotler","email":"jkhotler65@thetimes.co.uk","job":"Help Desk Technician","timestamp":"2022-04-23T20:21:02Z"}
{"id":223,"first_name":"Angil","last_name":"Carress","email":"acarress66@i2i.jp","job":"Electrical Engineer","timestamp":"2022-03-19T06:35:10Z"}
{"id":224,"first_name":"Joyce","last_name":"Beaglehole","email":"jbeaglehole67@sfgate.com","job":"Design Engineer","timestamp":"2021-12-13T13:06:10Z"}
{"id":225,"first_name":"Pip","last_name":"Escudier","email":"pescudier68@globo.com","job":"Junior Executive","timestamp":"2021-12-16T23:35:43Z"}
{"id":226,"first_name":"Isadore","last_name":"O'Longain","email":"iolongain69@sbwire.com","job":"Product Engineer","timestamp":"2022-08-06T10:15:09Z"}
{"id":227,"first_name":"Gilburt","last_name":"Bowbrick","email":"gbowbrick6a@ezinearticles.com","job":"Safety Technician III","timestamp":"2022-01-16T04:22:33Z"}
{"id":228,"first_name":"Renault","last_name":"Frammingham","email":"rframmingham6b@ox.ac.uk","job":"Financial Advisor","timestamp":"2022-09-02T13:10:17Z"}
{"id":229,"first_name":"Tam","last_name":"Nangle","email":"tnangle6c@t-online.de","job":"Professor","timestamp":"2022-04-16T21:51:58Z"}
{"id":230,"first_name":"Ardelle","last_name":"Coultous","email":"acoultous6d@wix.com","job":"Statistician I","timestamp":"2022-11-27T05:43:01Z"}
{"id":231,"first_name":"Demetra","last_name":"Mabson","email":"dmabson6e@sciencedirect.com","job":"Analyst Programmer","timestamp":"2022-01-09T08:43:12Z"}
{"id":232,"first_name":"Avis","last_name":"Laverenz","email":"alaverenz6f@wikia.com","job":"Biostatistician IV","timestamp":"2022-03-12T02:41:08Z"}
{"id":233,"first_name":"Scarface","last_name":"Gurnett","email":"sgurnett6g@bigcartel.com","job":"Accounting Assistant I","timestamp":"2022-11-30T00:57:31Z"}
{"id":234,"first_name":"Hermon","last_name":"Overil","email":"hoveril6h@yolasite.com","job":"Senior Sales Associate","timestamp":"2022-09-08T19:07:46Z"}
{"id":235,"first_name":"Eduard","last_name":"Nasey","email":"enasey6i@buzzfeed.com","job":"Environmental Specialist","timestamp":"2022-03-09T00:20:19Z"}
{"id":236,"first_name":"Elle","last_name":"Golt","email":"egolt6j@dion.ne.jp","job":"Computer Systems Analyst III","timestamp":"2022-08-20T16:30:40Z"}
{"id":237,"first_name":"Gwyn","last_name":"Asaaf","email":"gasaaf6k@webnode.com","job":"Financial Advisor","timestamp":"2022-02-02T03:45:52Z"}
{"id":238,"first_name":"Cullie","last_name":"Pala","email":"cpala6l@google.co.jp","job":"Marketing Manager","timestamp":"2022-10-17T10:54:32Z"}
{"id":239,"first_name":"Torie","last_name":"Drinkall","email":"tdrinkall6m@go.com","job":"Account Coordinator","timestamp":"2022-01-07T19:42:33Z"}
{"id":240,"first_name":"Petronella","last_name":"Reimer","email":"preimer6n@creativecommons.org","job":"Sales Associate","timestamp":"2022-11-15T22:51:02Z"}
{"id":241,"first_name":"Dun","last_name":"Gamett","email":"dgamett6o@yahoo.com","job":"Tax Accountant","timestamp":"2022-09-24T13:16:14Z"}
{"id":242,"first_name":"Fritz","last_name":"Jeannet","email":"fjeannet6p@wunderground.com","job":"Actuary","timestamp":"2022-04-23T04:52:39Z"}
{"id":243,"first_name":"Joby","last_name":"Gouny","email":"jgouny6q@last.fm","job":"Associate Professor","timestamp":"2022-04-11T10:01:24Z"}
{"id":244,"first_name":"Priscilla","last_name":"Hagard","email":"phagard6r@blog.com","job":"Assistant Manager","timestamp":"2022-10-24T01:59:01Z"}
{"id":245,"first_name":"Chadd","last_name":"Runnett","email":"crunnett6s@irs.gov","job":"Human Resources Manager","timestamp":"2022-10-19T14:04:54Z"}
{"id":246,"first_name":"Pansy","last_name":"Coan","email":"pcoan6t@4shared.com","job":"Help Desk Operator","timestamp":"2022-07-26T13:19:39Z"}
{"id":247,"first_name":"Bobby","last_name":"Bothbie","email":"bbothbie6u@youku.com","job":"Analog Circuit Design manager","timestamp":"2022-08-09T02:08:24Z"}
{"id":248,"first_name":"Deidre","last_name":"Guillart","email":"dguillart6v@rakuten.co.jp","job":"Statistician III","timestamp":"2022-06-25T03:36:25Z"}
{"id":249,"first_name":"Corine","last_name":"Garnham","email":"cgarnham6w@typepad.com","job":"Editor","timestamp":"2022-09-19T02:45:29Z"}
{"id":250,"first_name":"Ag","last_name":"Franiak","email":"afraniak6x@alibaba.com","job":"Research Associate","timestamp":"2022-07-28T04:44:05Z"}
{"id":251,"first_name":"Ben","last_name":"Scramage","email":"bscramage6y@sina.com.cn","job":"Nurse Practicioner","timestamp":"2022-09-12T04:05:39Z"}
{"id":252,"first_name":"Edlin","last_name":"Bishell","email":"ebishell6z@de.vu","job":"Tax Accountant","timestamp":"2022-03-31T23:36:47Z"}
{"id":253,"first_name":"Opaline","last_name":"Soden","email":"osoden70@utexas.edu","job":"Project Manager","timestamp":"2022-01-22T23:13:02Z"}
{"id":254,"first_name":"Meredithe","last_name":"Hiscocks","email":"mhiscocks71@reuters.com","job":"Paralegal","timestamp":"2022-05-19T10:29:21Z"}
{"id":255,"first_name":"Georgeanne","last_name":"Donhardt","email":"gdonhardt72@tamu.edu","job":"Speech Pathologist","timestamp":"2022-06-21T07:31:28Z"}
{"id":256,"first_name":"Bridgette","last_name":"Obin","email":"bobin73@hubpages.com","job":"Software Test Engineer IV","timestamp":"2022-03-04T04:51:56Z"}
{"id":257,"first_name":"Livvy","last_name":"Shorten","email":"lshorten74@slate.com","job":"Sales Representative","timestamp":"2022-07-02T07:44:35Z"}
{"id":258,"first_name":"Isabelita","last_name":"Hannaby","email":"ihannaby75@exblog.jp","job":"Human Resources Assistant III","timestamp":"2021-12-14T20:08:16Z"}
{"id":259,"first_name":"Elisabetta","last_name":"Kisar","email":"ekisar76@yelp.com","job":"Legal Assistant","timestamp":"2022-07-13T05:43:49Z"}
{"id":260,"first_name":"Pattie","last_name":"Skeggs","email":"pskeggs77@smugmug.com","job":"Developer II","timestamp":"2022-09-21T23:30:44Z"}
{"id":261,"first_name":"Von","last_name":"Plaide","email":"vplaide78@163.com","job":"Financial Analyst","timestamp":"2022-01-17T18:18:40Z"}
{"id":262,"first_name":"Aurie","last_name":"Fones","email":"afones79@craigslist.org","job":"Statistician I","timestamp":"2022-06-25T21:03:25Z"}
{"id":263,"first_name":"Sue","last_name":"Peacocke","email":"speacocke7a@amazonaws.com","job":"Quality Engineer","timestamp":"2022-05-21T11:51:33Z"}
{"id":264,"first_name":"Lorrin","last_name":"Dallemore","email":"ldallemore7b@jigsy.com","job":"Tax Accountant","timestamp":"2022-06-16T21:10:49Z"}
{"id":265,"first_name":"Heloise","last_name":"Dober","email":"hdober7c@seesaa.net","job":"Dental Hygienist","timestamp":"2021-12-29T01:17:53Z"}
{"id":266,"first_name":"Scotti","last_name":"Layson","email":"slayson7d@accuweather.com","job":"Desktop Support Technician","timestamp":"2022-04-26T19:46:46Z"}
{"id":267,"first_name":"Clementia","last_name":"Weepers","email":"cweepers7e@list-manage.com","job":"Assistant Manager","timestamp":"2022-06-01T21:45:12Z"}
{"id":268,"first_name":"Cullan","last_name":"Liebmann","email":"cliebmann7f@dmoz.org","job":"Financial Advisor","timestamp":"2022-08-03T01:34:18Z"}
{"id":269,"first_name":"Althea","last_name":"Boutell","email":"aboutell7g@seattletimes.com","job":"Health Coach III","timestamp":"2022-07-24T17:30:47Z"}
{"id":270,"first_name":"Karoly","last_name":"Girdwood","email":"kgirdwood7h@webs.com","job":"Senior Quality Engineer","timestamp":"2022-10-17T11:54:59Z"}
{"id":271,"first_name":"Farrel","last_name":"Blackney","email":"fblackney7i@ed.gov","job":"Research Assistant IV","timestamp":"2022-10-25T20:27:01Z"}
{"id":272,"first_name":"Tynan","last_name":"Bleas","email":"tbleas7j@hhs.gov","job":"Compensation Analyst","timestamp":"2022-04-17T03:22:37Z"}
{"id":273,"first_name":"Cybill","last_name":"Caple","email":"ccaple7k@about.me","job":"Payment Adjustment Coordinator","timestamp":"2022-07-26T23:54:40Z"}
{"id":274,"first_name":"Rasla","last_name":"Rameau","email":"rrameau7l@nbcnews.com","job":"Help Desk Technician","timestamp":"2022-06-29T12:22:48Z"}
{"id":275,"first_name":"Harry","last_name":"Sculpher","email":"hsculpher7m@apple.com","job":"Business Systems Development Analyst","timestamp":"2022-07-04T15:07:45Z"}
{"id":276,"first_name":"Dell","last_name":"Higgonet","email":"dhiggonet7n@jalbum.net","job":"Sales Representative","timestamp":"2022-06-27T03:19:01Z"}
{"id":277,"first_name":"Yorke","last_name":"Newstead","email":"ynewstead7o@uol.com.br","job":"Registered Nurse","timestamp":"2022-08-12T07:47:07Z"}
{"id":278,"first_name":"Germaine","last_name":"Polland","email":"gpolland7p@go.com","job":"Developer I","timestamp":"2022-04-01T16:12:57Z"}
{"id":279,"first_name":"Asher","last_name":"Sollett","email":"asollett7q@slashdot.org","job":"VP Sales","timestamp":"2022-01-06T23:20:17Z"}
{"id":280,"first_name":"Marion","last_name":"Armit","email":"marmit7r@meetup.com","job":"Quality Engineer","timestamp":"2022-02-13T02:17:16Z"}
{"id":281,"first_name":"Thomas","last_name":"Clewlow","email":"tclewlow7s@51.la","job":"Executive Secretary","timestamp":"2022-05-29T12:22:11Z"}
{"id":282,"first_name":"Turner","last_name":"Karchowski","email":"tkarchowski7t@elpais.com","job":"Automation Specialist I","timestamp":"2022-04-06T08:23:05Z"}
{"id":283,"first_name":"Ketty","last_name":"Costain","email":"kcostain7u@latimes.com","job":"Structural Engineer","timestamp":"2022-04-30T06:20:06Z"}
{"id":284,"first_name":"Heath","last_name":"Palser","email":"hpalser7v@aol.com","job":"Structural Engineer","timestamp":"2022-04-05T02:10:42Z"}
{"id":285,"first_name":"Gaspar","last_name":"Van den Bosch","email":"gvandenbosch7w@bloomberg.com","job":"Mechanical Systems Engineer","timestamp":"2021-12-22T16:35:11Z"}
{"id":286,"first_name":"Adeline","last_name":"Pacher","email":"apacher7x@e-recht24.de","job":"General Manager","timestamp":"2022-01-19T03:53:17Z"}
{"id":287,"first_name":"Emyle","last_name":"Cookes","email":"ecookes7y@statcounter.com","job":"Nurse Practicioner","timestamp":"2022-11-04T05:52:43Z"}
{"id":288,"first_name":"Eugine","last_name":"Vell","email":"evell7z@webs.com","job":"Sales Representative","timestamp":"2022-04-25T21:53:59Z"}
{"id":289,"first_name":"Ogden","last_name":"Outridge","email":"ooutridge80@epa.gov","job":"Web Designer II","timestamp":"2022-02-02T01:01:16Z"}
{"id":290,"first_name":"Krystalle","last_name":"Esposi","email":"kesposi81@github.io","job":"Editor","timestamp":"2022-05-21T05:46:12Z"}
{"id":291,"first_name":"Fremont","last_name":"Poge","email":"fpoge82@addtoany.com","job":"Software Consultant","timestamp":"2022-11-23T05:50:15Z"}
{"id":292,"first_name":"Mamie","last_name":"Aery","email":"maery83@sciencedirect.com","job":"Professor","timestamp":"2022-08-21T16:38:20Z"}
{"id":293,"first_name":"Andra","last_name":"Iles","email":"ailes84@guardian.co.uk","job":"Biostatistician III","timestamp":"2022-07-07T19:37:01Z"}
{"id":294,"first_name":"Ardith","last_name":"Gemnett","email":"agemnett85@apache.org","job":"Design Engineer","timestamp":"2022-11-29T09:49:25Z"}
{"id":295,"first_name":"Carlie","last_name":"Mulderrig","email":"cmulderrig86@time.com","job":"Developer III","timestamp":"2022-08-30T03:38:10Z"}
{"id":296,"first_name":"Eadie","last_name":"Hain","email":"ehain87@live.com","job":"VP Quality Control","timestamp":"2022-02-14T01:21:52Z"}
{"id":297,"first_name":"Kellen","last_name":"McFall","email":"kmcfall88@engadget.com","job":"Librarian","timestamp":"2022-05-20T11:47:09Z"}
{"id":298,"first_name":"Lianna","last_name":"Weerdenburg","email":"lweerdenburg89@free.fr","job":"Nuclear Power Engineer","timestamp":"2022-04-20T06:32:55Z"}
{"id":299,"first_name":"Ciro","last_name":"Slainey","email":"cslainey8a@angelfire.com","job":"Office Assistant I","timestamp":"2022-06-29T22:41:59Z"}
{"id":300,"first_name":"Kenna","last_name":"Cecchi","email":"kcecchi8b@joomla.org","job":"Executive Secretary","timestamp":"2022-11-25T21:17:24Z"}
{"id":301,"first_name":"Corry","last_name":"Crean","email":"ccrean8c@admin.ch","job":"Biostatistician I","timestamp":"2022-04-14T16:28:03Z"}
{"id":302,"first_name":"Kylie","last_name":"Boylund","email":"kboylund8d@blog.com","job":"Accounting Assistant III","timestamp":"2022-07-16T20:44:59Z"}
{"id":303,"first_name":"Venita","last_name":"Tate","email":"vtate8e@parallels.com","job":"Account Representative III","timestamp":"2022-01-16T07:51:28Z"}
{"id":304,"first_name":"Alain","last_name":"Rustedge","email":"arustedge8f@arizona.edu","job":"Tax Accountant","timestamp":"2022-06-12T19:47:12Z"}
{"id":305,"first_name":"Emilio","last_name":"Ellul","email":"eellul8g@cbslocal.com","job":"Sales Representative","timestamp":"2022-12-01T16:49:33Z"}
{"id":306,"first_name":"Malissia","last_name":"Caspell","email":"mcaspell8h@spiegel.de","job":"Research Assistant IV","timestamp":"2022-08-14T21:19:45Z"}
{"id":307,"first_name":"Gavin","last_name":"Marvel","email":"gmarvel8i@upenn.edu","job":"Research Assistant II","timestamp":"2022-06-16T01:30:19Z"}
{"id":308,"first_name":"Demetri","last_name":"Jumel","email":"djumel8j@weibo.com","job":"Teacher","timestamp":"2022-07-27T03:12:46Z"}
{"id":309,"first_name":"Elia","last_name":"Stovell","email":"estovell8k@quantcast.com","job":"Web Designer III","timestamp":"2022-11-21T00:23:57Z"}
{"id":310,"first_name":"Mab","last_name":"Aleksich","email":"maleksich8l@hhs.gov","job":"Clinical Specialist","timestamp":"2022-07-20T13:14:20Z"}
{"id":311,"first_name":"Mord","last_name":"Klawi","email":"mklawi8m@blogspot.com","job":"Internal Auditor","timestamp":"2022-11-13T15:52:38Z"}
{"id":312,"first_name":"Cale","last_name":"Fante","email":"cfante8n@unesco.org","job":"Editor","timestamp":"2022-09-06T10:13:30Z"}
{"id":313,"first_name":"Samantha","last_name":"Whistlecraft","email":"swhistlecraft8o@dion.ne.jp","job":"Staff Accountant III","timestamp":"2022-04-15T15:47:01Z"}
{"id":314,"first_name":"Wallache","last_name":"Meach","email":"wmeach8p@soundcloud.com","job":"Recruiting Manager","timestamp":"2022-10-18T22:27:16Z"}
{"id":315,"first_name":"York","last_name":"MacRorie","email":"ymacrorie8q@mysql.com","job":"Software Engineer III","timestamp":"2021-12-12T17:51:57Z"}
{"id":316,"first_name":"Eugen","last_name":"Claus","email":"eclaus8r@google.it","job":"Computer Systems Analyst IV","timestamp":"2022-03-28T19:33:23Z"}
{"id":317,"first_name":"Karlotta","last_name":"Geck","email":"kgeck8s@psu.edu","job":"Senior Editor","timestamp":"2022-05-17T14:01:31Z"}
{"id":318,"first_name":"Cherry","last_name":"Gillyett","email":"cgillyett8t@cornell.edu","job":"VP Product Management","timestamp":"2022-05-28T08:17:39Z"}
{"id":319,"first_name":"Estrellita","last_name":"Brient","email":"ebrient8u@clickbank.net","job":"Account Executive","timestamp":"2022-01-08T01:17:56Z"}
{"id":320,"first_name":"Ly","last_name":"Svanetti","email":"lsvanetti8v@sina.com.cn","job":"Desktop Support Technician","timestamp":"2022-05-26T17:19:42Z"}
{"id":321,"first_name":"Ronica","last_name":"Bloys","email":"rbloys8w@elegantthemes.com","job":"Environmental Tech","timestamp":"2022-04-09T15:25:24Z"}
{"id":322,"first_name":"Tallie","last_name":"Wanless","email":"twanless8x@w3.org","job":"Graphic Designer","timestamp":"2022-01-22T15:01:09Z"}
{"id":323,"first_name":"Karola","last_name":"Scotland","email":"kscotland8y@wired.com","job":"Analyst Programmer","timestamp":"2022-11-19T18:36:41Z"}
{"id":324,"first_name":"Albrecht","last_name":"De Bruyn","email":"adebruyn8z@hatena.ne.jp","job":"VP Sales","timestamp":"2021-12-09T22:57:42Z"}
{"id":325,"first_name":"Boniface","last_name":"Lampl","email":"blampl90@slate.com","job":"Analog Circuit Design manager","timestamp":"2022-05-30T23:52:01Z"}
{"id":326,"first_name":"Paxton","last_name":"Garritley","email":"pgarritley91@imdb.com","job":"Recruiter","timestamp":"2022-08-17T08:47:51Z"}
{"id":327,"first_name":"Em","last_name":"Pierrepont","email":"epierrepont92@t.co","job":"Research Assistant II","timestamp":"2022-06-21T06:48:47Z"}
{"id":328,"first_name":"Odele","last_name":"Weymouth","email":"oweymouth93@dot.gov","job":"Financial Analyst","timestamp":"2022-07-21T18:13:46Z"}
{"id":329,"first_name":"Karlik","last_name":"Casely","email":"kcasely94@vimeo.com","job":"Statistician II","timestamp":"2022-01-01T15:51:47Z"}
{"id":330,"first_name":"Marisa","last_name":"Christon","email":"mchriston95@unicef.org","job":"Electrical Engineer","timestamp":"2022-07-22T00:41:36Z"}
{"id":331,"first_name":"Norrie","last_name":"Peotz","email":"npeotz96@ftc.gov","job":"Senior Developer","timestamp":"2022-11-07T15:28:00Z"}
{"id":332,"first_name":"Derby","last_name":"Pover","email":"dpover97@statcounter.com","job":"Technical Writer","timestamp":"2022-04-29T02:37:02Z"}
{"id":333,"first_name":"Miranda","last_name":"Beartup","email":"mbeartup98@barnesandnoble.com","job":"Dental Hygienist","timestamp":"2021-12-13T12:54:56Z"}
{"id":334,"first_name":"Euell","last_name":"Bittlestone","email":"ebittlestone99@google.es","job":"Sales Associate","timestamp":"2022-12-03T03:42:46Z"}
{"id":335,"first_name":"Hewie","last_name":"McConnal","email":"hmcconnal9a@globo.com","job":"Media Manager I","timestamp":"2022-11-12T14:58:30Z"}
{"id":336,"first_name":"Maryanna","last_name":"Blackburne","email":"mblackburne9b@nbcnews.com","job":"Payment Adjustment Coordinator","timestamp":"2022-10-07T19:58:13Z"}
{"id":337,"first_name":"Vicki","last_name":"Wicks","email":"vwicks9c@skype.com","job":"Computer Systems Analyst III","timestamp":"2022-10-28T11:22:21Z"}
{"id":338,"first_name":"Camel","last_name":"Slader","email":"cslader9d@wufoo.com","job":"Sales Representative","timestamp":"2022-01-26T15:37:10Z"}
{"id":339,"first_name":"Alvan","last_name":"Kehoe","email":"akehoe9e@illinois.edu","job":"Staff Scientist","timestamp":"2022-06-01T01:34:48Z"}
{"id":340,"first_name":"Daniella","last_name":"Schapero","email":"dschapero9f@usnews.com","job":"Database Administrator II","timestamp":"2022-04-02T23:01:40Z"}
{"id":341,"first_name":"Roslyn","last_name":"Bortoletti","email":"rbortoletti9g@icio.us","job":"VP Marketing","timestamp":"2022-12-01T16:25:31Z"}
{"id":342,"first_name":"Tonya","last_name":"Largan","email":"tlargan9h@ft.com","job":"Project Manager","timestamp":"2022-03-04T06:31:36Z"}
{"id":343,"first_name":"Elisabeth","last_name":"Sudran","email":"esudran9i@wikimedia.org","job":"VP Product Management","timestamp":"2022-08-11T09:40:53Z"}
{"id":344,"first_name":"Sukey","last_name":"Stopper","email":"sstopper9j@cdbaby.com","job":"Nuclear Power Engineer","timestamp":"2022-09-03T10:25:28Z"}
{"id":345,"first_name":"Merwin","last_name":"Fuentez","email":"mfuentez9k@hp.com","job":"Food Chemist","timestamp":"2022-01-13T00:48:55Z"}
{"id":346,"first_name":"Alden","last_name":"Hariot","email":"ahariot9l@meetup.com","job":"Senior Financial Analyst","timestamp":"2022-11-27T11:30:45Z"}
{"id":347,"first_name":"Persis","last_name":"Jasik","email":"pjasik9m@behance.net","job":"Executive Secretary","timestamp":"2022-09-16T02:54:51Z"}
{"id":348,"first_name":"Quinn","last_name":"Pickavance","email":"qpickavance9n@java.com","job":"Human Resources Assistant I","timestamp":"2022-09-16T17:58:06Z"}
{"id":349,"first_name":"Jules","last_name":"Le Franc","email":"jlefranc9o@kickstarter.com","job":"Administrative Officer","timestamp":"2021-12-15T22:58:34Z"}
{"id":350,"first_name":"Darn","last_name":"Stoate","email":"dstoate9p@umich.edu","job":"Chief Design Engineer","timestamp":"2022-10-03T06:16:31Z"}
{"id":351,"first_name":"Cecilius","last_name":"Deane","email":"cdeane9q@nature.com","job":"Developer I","timestamp":"2022-04-20T02:13:21Z"}
{"id":352,"first_name":"Liane","last_name":"Meredyth","email":"lmeredyth9r@t-online.de","job":"Developer II","timestamp":"2022-12-04T10:09:36Z"}
{"id":353,"first_name":"Elbertina","last_name":"Rogier","email":"erogier9s@hp.com","job":"Accountant IV","timestamp":"2022-01-03T07:33:20Z"}
{"id":354,"first_name":"Isaac","last_name":"Takle","email":"itakle9t@wikispaces.com","job":"Safety Technician I","timestamp":"2022-06-21T02:00:17Z"}
{"id":355,"first_name":"Blondelle","last_name":"Reiner","email":"breiner9u@hp.com","job":"Civil Engineer","timestamp":"2022-10-14T05:55:57Z"}
{"id":356,"first_name":"Hermy","last_name":"Spraging","email":"hspraging9v@geocities.jp","job":"Administrative Officer","timestamp":"2022-03-23T05:46:21Z"}
{"id":357,"first_name":"Skyler","last_name":"Bavister","email":"sbavister9w@cyberchimps.com","job":"Financial Analyst","timestamp":"2021-12-20T01:19:37Z"}
{"id":358,"first_name":"Ruby","last_name":"Hebden","email":"rhebden9x@nba.com","job":"Payment Adjustment Coordinator","timestamp":"2022-02-24T02:38:01Z"}
{"id":359,"first_name":"Jethro","last_name":"Lammerding","email":"jlammerding9y@mac.com","job":"Human Resources Assistant IV","timestamp":"2022-03-21T04:48:37Z"}
{"id":360,"first_name":"Kean","last_name":"Whitticks","email":"kwhitticks9z@economist.com","job":"Financial Advisor","timestamp":"2021-12-17T13:13:36Z"}
{"id":361,"first_name":"Talia","last_name":"Desforges","email":"tdesforgesa0@phpbb.com","job":"Developer IV","timestamp":"2022-04-04T19:29:49Z"}
{"id":362,"first_name":"Colin","last_name":"Cleyburn","email":"ccleyburna1@rakuten.co.jp","job":"Database Administrator III","timestamp":"2022-04-23T03:14:04Z"}
{"id":363,"first_name":"Hube","last_name":"Ells","email":"hellsa2@smugmug.com","job":"Biostatistician I","timestamp":"2022-08-22T16:06:47Z"}
{"id":364,"first_name":"Deloria","last_name":"Coiley","email":"dcoileya3@plala.or.jp","job":"Teacher","timestamp":"2022-04-21T19:30:19Z"}
{"id":365,"first_name":"Lissi","last_name":"Whiteland","email":"lwhitelanda4@addthis.com","job":"Engineer III","timestamp":"2022-05-24T05:21:21Z"}
{"id":366,"first_name":"Kathryn","last_name":"Simek","email":"ksimeka5@washingtonpost.com","job":"Pharmacist","timestamp":"2022-03-03T01:23:04Z"}
{"id":367,"first_name":"Alex","last_name":"Lammenga","email":"alammengaa6@symantec.com","job":"Nuclear Power Engineer","timestamp":"2022-04-24T09:48:47Z"}
{"id":368,"first_name":"Marabel","last_name":"Reilingen","email":"mreilingena7@upenn.edu","job":"Help Desk Technician","timestamp":"2022-07-01T09:26:53Z"}
{"id":369,"first_name":"Zolly","last_name":"Cooney","email":"zcooneya8@discovery.com","job":"Desktop Support Technician","timestamp":"2022-03-01T18:21:42Z"}
{"id":370,"first_name":"Ali","last_name":"Fairlaw","email":"afairlawa9@walmart.com","job":"Environmental Specialist","timestamp":"2022-01-22T12:52:35Z"}
{"id":371,"first_name":"Reilly","last_name":"Langston","email":"rlangstonaa@intel.com","job":"Software Engineer II","timestamp":"2022-10-25T07:16:41Z"}
{"id":372,"first_name":"Chantal","last_name":"Ingram","email":"cingramab@bizjournals.com","job":"Web Designer IV","timestamp":"2022-02-18T23:11:52Z"}
{"id":373,"first_name":"Pembroke","last_name":"Coltart","email":"pcoltartac@examiner.com","job":"VP Accounting","timestamp":"2022-09-13T01:48:41Z"}
{"id":374,"first_name":"Irwin","last_name":"Spain-Gower","email":"ispaingowerad@imageshack.us","job":"Senior Financial Analyst","timestamp":"2022-09-30T11:02:23Z"}
{"id":375,"first_name":"Graig","last_name":"Chastan","email":"gchastanae@geocities.jp","job":"Teacher","timestamp":"2022-08-03T03:42:11Z"}
{"id":376,"first_name":"Leanora","last_name":"Quincee","email":"lquinceeaf@tinyurl.com","job":"Information Systems Manager","timestamp":"2022-04-23T16:46:27Z"}
{"id":377,"first_name":"Kele","last_name":"Cubley","email":"kcubleyag@harvard.edu","job":"Software Engineer III","timestamp":"2022-04-04T14:35:24Z"}
{"id":378,"first_name":"Chariot","last_name":"Minchin","email":"cminchinah@ucla.edu","job":"Senior Developer","timestamp":"2022-09-07T07:00:13Z"}
{"id":379,"first_name":"Ellyn","last_name":"Loggie","email":"eloggieai@washington.edu","job":"Compensation Analyst","timestamp":"2022-05-12T12:07:36Z"}
{"id":380,"first_name":"Dmitri","last_name":"Geleman","email":"dgelemanaj@gizmodo.com","job":"Account Coordinator","timestamp":"2022-07-26T15:41:05Z"}
{"id":381,"first_name":"Steve","last_name":"Lemmer","email":"slemmerak@eepurl.com","job":"Database Administrator IV","timestamp":"2022-07-19T21:11:14Z"}
{"id":382,"first_name":"Tillie","last_name":"Dodle","email":"tdodleal@sciencedirect.com","job":"Geologist III","timestamp":"2022-05-01T16:47:01Z"}
{"id":383,"first_name":"Deirdre","last_name":"Southcombe","email":"dsouthcombeam@trellian.com","job":"Administrative Officer","timestamp":"2022-06-02T00:35:13Z"}
{"id":384,"first_name":"Harman","last_name":"Cino","email":"hcinoan@yahoo.co.jp","job":"Tax Accountant","timestamp":"2022-08-12T09:34:14Z"}
{"id":385,"first_name":"Hy","last_name":"Chittim","email":"hchittimao@scientificamerican.com","job":"Biostatistician IV","timestamp":"2022-07-03T00:37:30Z"}
{"id":386,"first_name":"Cordula","last_name":"Pendlebury","email":"cpendleburyap@cnbc.com","job":"Research Assistant II","timestamp":"2022-05-26T10:47:16Z"}
{"id":387,"first_name":"Murvyn","last_name":"Kuhnwald","email":"mkuhnwaldaq@fotki.com","job":"Senior Financial Analyst","timestamp":"2022-11-02T18:35:53Z"}
{"id":388,"first_name":"King","last_name":"Guilbert","email":"kguilbertar@ycombinator.com","job":"Executive Secretary","timestamp":"2022-03-03T18:22:09Z"}
{"id":389,"first_name":"Emlyn","last_name":"Stanislaw","email":"estanislawas@soup.io","job":"Developer I","timestamp":"2022-04-14T04:40:47Z"}
{"id":390,"first_name":"Talyah","last_name":"Glanester","email":"tglanesterat@nasa.gov","job":"GIS Technical Architect","timestamp":"2022-02-27T06:00:35Z"}
{"id":391,"first_name":"Lou","last_name":"Mockler","email":"lmocklerau@liveinternet.ru","job":"Administrative Assistant III","timestamp":"2022-06-14T09:55:20Z"}
{"id":392,"first_name":"Faulkner","last_name":"Kiddie","email":"fkiddieav@last.fm","job":"Speech Pathologist","timestamp":"2022-11-20T20:38:11Z"}
{"id":393,"first_name":"Fabio","last_name":"Brimner","email":"fbrimneraw@g.co","job":"Geologist I","timestamp":"2022-05-09T23:09:20Z"}
{"id":394,"first_name":"Melisa","last_name":"Piotrowski","email":"mpiotrowskiax@posterous.com","job":"Information Systems Manager","timestamp":"2022-10-08T09:12:54Z"}
{"id":395,"first_name":"Celinda","last_name":"Blodget","email":"cblodgetay@indiatimes.com","job":"Dental Hygienist","timestamp":"2022-07-10T03:04:56Z"}
{"id":396,"first_name":"Haywood","last_name":"Padfield","email":"hpadfieldaz@joomla.org","job":"Registered Nurse","timestamp":"2021-12-09T07:07:51Z"}
{"id":397,"first_name":"Jane","last_name":"Rasor","email":"jrasorb0@soundcloud.com","job":"Editor","timestamp":"2022-01-19T18:10:29Z"}
{"id":398,"first_name":"Rance","last_name":"Hambric","email":"rhambricb1@sciencedirect.com","job":"Human Resources Manager","timestamp":"2022-04-11T18:18:00Z"}
{"id":399,"first_name":"Lincoln","last_name":"Challenger","email":"lchallengerb2@icq.com","job":"Senior Financial Analyst","timestamp":"2022-05-24T13:24:16Z"}
{"id":400,"first_name":"Elnore","last_name":"Pickervance","email":"epickervanceb3@opera.com","job":"Data Coordiator","timestamp":"2022-10-26T04:10:45Z"}
{"id":401,"first_name":"Reidar","last_name":"Cradock","email":"rcradockb4@nature.com","job":"VP Marketing","timestamp":"2022-09-20T14:35:56Z"}
{"id":402,"first_name":"Tarah","last_name":"Binford","email":"tbinfordb5@psu.edu","job":"VP Sales","timestamp":"2022-11-26T12:05:40Z"}
{"id":403,"first_name":"Cinda","last_name":"Trevithick","email":"ctrevithickb6@ustream.tv","job":"Sales Representative","timestamp":"2022-02-02T13:15:47Z"}
{"id":404,"first_name":"Lara","last_name":"Lovel","email":"llovelb7@cocolog-nifty.com","job":"Analyst Programmer","timestamp":"2022-07-11T00:41:53Z"}
{"id":405,"first_name":"Janina","last_name":"Gossart","email":"jgossartb8@cpanel.net","job":"Sales Associate","timestamp":"2022-05-06T08:33:35Z"}
{"id":406,"first_name":"Stefan","last_name":"Bowdrey","email":"sbowdreyb9@oaic.gov.au","job":"Internal Auditor","timestamp":"2022-10-20T14:21:53Z"}
{"id":407,"first_name":"Meryl","last_name":"Shorthouse","email":"mshorthouseba@macromedia.com","job":"Assistant Manager","timestamp":"2022-11-14T11:44:59Z"}
{"id":408,"first_name":"Whittaker","last_name":"Vela","email":"wvelabb@answers.com","job":"Account Coordinator","timestamp":"2021-12-13T11:34:38Z"}
{"id":409,"first_name":"Cheston","last_name":"Ruffli","email":"crufflibc@usnews.com","job":"Data Coordiator","timestamp":"2022-04-08T14:59:45Z"}
{"id":410,"first_name":"Daven","last_name":"Mulryan","email":"dmulryanbd@aboutads.info","job":"Teacher","timestamp":"2022-10-09T00:18:34Z"}
{"id":411,"first_name":"Gusta","last_name":"Goldstraw","email":"ggoldstrawbe@alibaba.com","job":"Sales Representative","timestamp":"2022-01-24T21:37:08Z"}
{"id":412,"first_name":"Chase","last_name":"Kenworthey","email":"ckenwortheybf@indiatimes.com","job":"Nurse","timestamp":"2022-09-17T13:33:39Z"}
{"id":413,"first_name":"Lynn","last_name":"Poluzzi","email":"lpoluzzibg@cocolog-nifty.com","job":"Automation Specialist II","timestamp":"2022-03-23T12:46:38Z"}
{"id":414,"first_name":"Mal","last_name":"Snawden","email":"msnawdenbh@netvibes.com","job":"Business Systems Development Analyst","timestamp":"2022-02-21T09:45:03Z"}
{"id":415,"first_name":"Charin","last_name":"Pennyman","email":"cpennymanbi@bizjournals.com","job":"Account Executive","timestamp":"2022-03-10T18:16:19Z"}
{"id":416,"first_name":"Berkeley","last_name":"Plaster","email":"bplasterbj@technorati.com","job":"Account Coordinator","timestamp":"2022-11-18T14:10:21Z"}
{"id":417,"first_name":"Fransisco","last_name":"Flanner","email":"fflannerbk@cisco.com","job":"Human Resources Assistant III","timestamp":"2022-03-16T22:27:36Z"}
{"id":418,"first_name":"Burt","last_name":"Casajuana","email":"bcasajuanabl@techcrunch.com","job":"Electrical Engineer","timestamp":"2022-09-14T02:08:34Z"}
{"id":419,"first_name":"Tulley","last_name":"Gwinn","email":"tgwinnbm@dell.com","job":"Senior Quality Engineer","timestamp":"2022-11-27T16:15:10Z"}
{"id":420,"first_name":"Anneliese","last_name":"Richie","email":"arichiebn@imageshack.us","job":"Software Test Engineer I","timestamp":"2021-12-17T08:26:36Z"}
{"id":421,"first_name":"Mack","last_name":"Ariss","email":"marissbo@patch.com","job":"Operator","timestamp":"2022-11-26T18:35:09Z"}
{"id":422,"first_name":"Carlin","last_name":"O'Keenan","email":"cokeenanbp@amazon.co.jp","job":"Graphic Designer","timestamp":"2022-05-31T11:18:22Z"}
{"id":423,"first_name":"Cointon","last_name":"Wride","email":"cwridebq@bloomberg.com","job":"Information Systems Manager","timestamp":"2022-10-12T14:19:52Z"}
{"id":424,"first_name":"Quillan","last_name":"Betun","email":"qbetunbr@cnet.com","job":"Junior Executive","timestamp":"2022-06-03T11:49:22Z"}
{"id":425,"first_name":"Dolly","last_name":"Loren","email":"dlorenbs@t.co","job":"Help Desk Operator","timestamp":"2022-06-13T09:31:29Z"}
{"id":426,"first_name":"Helli","last_name":"Whiteoak","email":"hwhiteoakbt@bbb.org","job":"Software Engineer IV","timestamp":"2022-09-10T05:16:50Z"}
{"id":427,"first_name":"Babb","last_name":"Aiton","email":"baitonbu@artisteer.com","job":"Research Associate","timestamp":"2022-03-25T23:13:53Z"}
{"id":428,"first_name":"Ryon","last_name":"Klimkin","email":"rklimkinbv@istockphoto.com","job":"Programmer Analyst I","timestamp":"2022-01-31T10:29:35Z"}
{"id":429,"first_name":"Ignacius","last_name":"Wragge","email":"iwraggebw@dot.gov","job":"Database Administrator IV","timestamp":"2021-12-30T17:50:24Z"}
{"id":430,"first_name":"Orren","last_name":"Janovsky","email":"ojanovskybx@ucoz.com","job":"Help Desk Operator","timestamp":"2022-08-18T17:04:35Z"}
{"id":431,"first_name":"Teddie","last_name":"Sayward","email":"tsaywardby@springer.com","job":"Geologist III","timestamp":"2022-10-17T23:55:12Z"}
{"id":432,"first_name":"Linc","last_name":"Deeming","email":"ldeemingbz@privacy.gov.au","job":"Programmer Analyst III","timestamp":"2022-07-05T12:33:47Z"}
{"id":433,"first_name":"Arin","last_name":"McConnulty","email":"amcconnultyc0@example.com","job":"General Manager","timestamp":"2022-03-26T08:26:10Z"}
{"id":434,"first_name":"Wainwright","last_name":"Majury","email":"wmajuryc1@nasa.gov","job":"Nurse","timestamp":"2022-02-16T03:48:15Z"}
{"id":435,"first_name":"Rogerio","last_name":"Siddens","email":"rsiddensc2@bing.com","job":"Financial Advisor","timestamp":"2022-05-23T14:39:00Z"}
{"id":436,"first_name":"Alyce","last_name":"Kort","email":"akortc3@craigslist.org","job":"Biostatistician II","timestamp":"2022-11-17T12:36:43Z"}
{"id":437,"first_name":"Tiphany","last_name":"Savory","email":"tsavoryc4@sohu.com","job":"Structural Analysis Engineer","timestamp":"2022-04-28T20:22:51Z"}
{"id":438,"first_name":"Colan","last_name":"Gissop","email":"cgissopc5@unicef.org","job":"Quality Engineer","timestamp":"2022-06-15T12:53:13Z"}
{"id":439,"first_name":"Almira","last_name":"MacPike","email":"amacpikec6@multiply.com","job":"Chemical Engineer","timestamp":"2022-09-22T08:14:24Z"}
{"id":440,"first_name":"Jae","last_name":"Jelks","email":"jjelksc7@nasa.gov","job":"Marketing Assistant","timestamp":"2022-02-23T15:12:22Z"}
{"id":441,"first_name":"Ruthe","last_name":"Armatidge","email":"rarmatidgec8@huffingtonpost.com","job":"Human Resources Manager","timestamp":"2022-01-30T13:08:16Z"}
{"id":442,"first_name":"Graehme","last_name":"Mullin","email":"gmullinc9@netscape.com","job":"Account Coordinator","timestamp":"2022-01-31T13:57:36Z"}
{"id":443,"first_name":"Maude","last_name":"Conlon","email":"mconlonca@time.com","job":"Staff Accountant I","timestamp":"2022-04-10T08:37:13Z"}
{"id":444,"first_name":"Elonore","last_name":"Westmore","email":"ewestmorecb@netvibes.com","job":"Registered Nurse","timestamp":"2022-10-17T01:52:09Z"}
{"id":445,"first_name":"Yorker","last_name":"Merrell","email":"ymerrellcc@cornell.edu","job":"Account Representative IV","timestamp":"2022-04-01T17:28:42Z"}
{"id":446,"first_name":"Billi","last_name":"Sammars","email":"bsammarscd@sogou.com","job":"Physical Therapy Assistant","timestamp":"2022-05-23T09:25:27Z"}
{"id":447,"first_name":"Angel","last_name":"Leader","email":"aleaderce@multiply.com","job":"Editor","timestamp":"2022-12-06T20:41:05Z"}
{"id":448,"first_name":"Juana","last_name":"Bellward","email":"jbellwardcf@geocities.com","job":"Executive Secretary","timestamp":"2022-06-10T21:03:40Z"}
{"id":449,"first_name":"Talia","last_name":"Adin","email":"tadincg@angelfire.com","job":"Internal Auditor","timestamp":"2022-01-15T05:23:52Z"}
{"id":450,"first_name":"Bryn","last_name":"Ibell","email":"bibellch@oracle.com","job":"Dental Hygienist","timestamp":"2022-01-15T21:38:04Z"}
{"id":451,"first_name":"Marlowe","last_name":"Gauge","email":"mgaugeci@foxnews.com","job":"Senior Developer","timestamp":"2022-06-21T14:29:23Z"}
{"id":452,"first_name":"Roxane","last_name":"Pernell","email":"rpernellcj@163.com","job":"Director of Sales","timestamp":"2022-05-25T16:10:44Z"}
{"id":453,"first_name":"Renado","last_name":"Sheekey","email":"rsheekeyck@amazon.de","job":"VP Accounting","timestamp":"2022-01-07T02:59:37Z"}
{"id":454,"first_name":"Adria","last_name":"Causer","email":"acausercl@yale.edu","job":"Tax Accountant","timestamp":"2022-10-13T23:57:39Z"}
{"id":455,"first_name":"Reese","last_name":"Sclater","email":"rsclatercm@patch.com","job":"VP Product Management","timestamp":"2021-12-22T05:29:22Z"}
{"id":456,"first_name":"Pail","last_name":"Uzielli","email":"puziellicn@hhs.gov","job":"Recruiting Manager","timestamp":"2022-01-09T10:05:30Z"}
{"id":457,"first_name":"Sadella","last_name":"Fiander","email":"sfianderco@webs.com","job":"Budget/Accounting Analyst II","timestamp":"2022-04-18T18:09:34Z"}
{"id":458,"first_name":"Clint","last_name":"Thirwell","email":"cthirwellcp@comsenz.com","job":"VP Marketing","timestamp":"2022-06-21T21:54:28Z"}
{"id":459,"first_name":"Lamar","last_name":"July","email":"ljulycq@reverbnation.com","job":"Budget/Accounting Analyst II","timestamp":"2022-10-02T14:08:53Z"}
{"id":460,"first_name":"Meg","last_name":"Deschlein","email":"mdeschleincr@networkadvertising.org","job":"Web Developer I","timestamp":"2022-04-03T11:15:05Z"}
{"id":461,"first_name":"Stephine","last_name":"Gorry","email":"sgorrycs@naver.com","job":"Food Chemist","timestamp":"2021-12-09T11:30:53Z"}
{"id":462,"first_name":"Beilul","last_name":"Merrett","email":"bmerrettct@soup.io","job":"Administrative Officer","timestamp":"2022-02-15T18:27:04Z"}
{"id":463,"first_name":"Perren","last_name":"Doni","email":"pdonicu@google.co.uk","job":"Accounting Assistant II","timestamp":"2022-08-20T15:13:36Z"}
{"id":464,"first_name":"Cullie","last_name":"Skarman","email":"cskarmancv@rambler.ru","job":"Administrative Assistant II","timestamp":"2022-08-03T23:13:37Z"}
{"id":465,"first_name":"Matthieu","last_name":"Simonato","email":"msimonatocw@icq.com","job":"Civil Engineer","timestamp":"2022-09-14T13:30:09Z"}
{"id":466,"first_name":"Thea","last_name":"Deer","email":"tdeercx@slate.com","job":"Nurse","timestamp":"2022-05-22T17:37:39Z"}
{"id":467,"first_name":"Nicolina","last_name":"Deyes","email":"ndeyescy@etsy.com","job":"Professor","timestamp":"2022-08-27T09:03:04Z"}
{"id":468,"first_name":"Katalin","last_name":"Bryan","email":"kbryancz@addthis.com","job":"Health Coach III","timestamp":"2022-04-30T15:05:37Z"}
{"id":469,"first_name":"Reggis","last_name":"Daffern","email":"rdaffernd0@odnoklassniki.ru","job":"Senior Developer","timestamp":"2022-02-24T16:58:16Z"}
{"id":470,"first_name":"Westbrook","last_name":"Cockroft","email":"wcockroftd1@uiuc.edu","job":"Research Associate","timestamp":"2022-11-27T21:04:57Z"}
{"id":471,"first_name":"Tomaso","last_name":"Bellon","email":"tbellond2@sakura.ne.jp","job":"Business Systems Development Analyst","timestamp":"2022-07-25T06:37:11Z"}
{"id":472,"first_name":"Jonathan","last_name":"Marfe","email":"jmarfed3@naver.com","job":"Help Desk Operator","timestamp":"2022-01-21T07:39:22Z"}
{"id":473,"first_name":"Dane","last_name":"Duro","email":"ddurod4@google.com.br","job":"Developer III","timestamp":"2022-10-03T05:05:38Z"}
{"id":474,"first_name":"Celine","last_name":"Cartner","email":"ccartnerd5@is.gd","job":"Developer I","timestamp":"2022-07-10T15:56:19Z"}
{"id":475,"first_name":"Atlante","last_name":"Leads","email":"aleadsd6@yellowbook.com","job":"Structural Analysis Engineer","timestamp":"2022-03-13T07:18:55Z"}
{"id":476,"first_name":"Pail","last_name":"Jurgenson","email":"pjurgensond7@newyorker.com","job":"Recruiter","timestamp":"2021-12-19T10:30:18Z"}
{"id":477,"first_name":"Roslyn","last_name":"Bazylets","email":"rbazyletsd8@networksolutions.com","job":"Research Associate","timestamp":"2022-02-28T10:34:48Z"}
{"id":478,"first_name":"Rube","last_name":"Cona","email":"rconad9@opensource.org","job":"Mechanical Systems Engineer","timestamp":"2022-06-03T02:50:16Z"}
{"id":479,"first_name":"Pansie","last_name":"Waistell","email":"pwaistellda@elegantthemes.com","job":"Account Representative IV","timestamp":"2022-08-03T10:25:55Z"}
{"id":480,"first_name":"Uri","last_name":"Duerden","email":"uduerdendb@sourceforge.net","job":"Web Developer IV","timestamp":"2022-12-03T14:11:59Z"}
{"id":481,"first_name":"Kerianne","last_name":"Pipping","email":"kpippingdc@arizona.edu","job":"Operator","timestamp":"2022-09-13T05:25:50Z"}
{"id":482,"first_name":"Blaine","last_name":"Kop","email":"bkopdd@ucla.edu","job":"Geologist III","timestamp":"2022-05-23T16:22:18Z"}
{"id":483,"first_name":"Ana","last_name":"Orringe","email":"aorringede@flickr.com","job":"Dental Hygienist","timestamp":"2022-04-28T11:21:02Z"}
{"id":484,"first_name":"Carine","last_name":"Rawsthorne","email":"crawsthornedf@gmpg.org","job":"Registered Nurse","timestamp":"2022-04-21T04:20:56Z"}
{"id":485,"first_name":"Wilburt","last_name":"Liley","email":"wlileydg@unicef.org","job":"Health Coach IV","timestamp":"2022-05-14T23:43:51Z"}
{"id":486,"first_name":"Cory","last_name":"Winscom","email":"cwinscomdh@hp.com","job":"Tax Accountant","timestamp":"2022-01-08T06:38:08Z"}
{"id":487,"first_name":"Pris","last_name":"Greenley","email":"pgreenleydi@ted.com","job":"Design Engineer","timestamp":"2022-05-04T19:18:30Z"}
{"id":488,"first_name":"Kath","last_name":"Danet","email":"kdanetdj@acquirethisname.com","job":"Help Desk Operator","timestamp":"2022-06-17T01:19:36Z"}
{"id":489,"first_name":"Cindi","last_name":"Isac","email":"cisacdk@patch.com","job":"Database Administrator IV","timestamp":"2022-09-11T21:21:36Z"}
{"id":490,"first_name":"Eduardo","last_name":"Rozzell","email":"erozzelldl@si.edu","job":"Cost Accountant","timestamp":"2022-06-29T05:11:51Z"}
{"id":491,"first_name":"Carmita","last_name":"Siggins","email":"csigginsdm@webeden.co.uk","job":"Project Manager","timestamp":"2022-05-05T17:20:09Z"}
{"id":492,"first_name":"Friederike","last_name":"Wileman","email":"fwilemandn@discovery.com","job":"Human Resources Manager","timestamp":"2022-07-25T18:07:09Z"}
{"id":493,"first_name":"Art","last_name":"Glas","email":"aglasdo@yolasite.com","job":"Dental Hygienist","timestamp":"2022-05-29T18:53:16Z"}
{"id":494,"first_name":"Nevin","last_name":"Twinning","email":"ntwinningdp@g.co","job":"Senior Financial Analyst","timestamp":"2022-10-03T16:43:45Z"}
{"id":495,"first_name":"Anderea","last_name":"Soots","email":"asootsdq@photobucket.com","job":"Senior Sales Associate","timestamp":"2022-04-10T06:00:14Z"}
{"id":496,"first_name":"Jehanna","last_name":"Collishaw","email":"jcollishawdr@latimes.com","job":"Account Coordinator","timestamp":"2022-09-13T00:49:41Z"}
{"id":497,"first_name":"Markos","last_name":"Dunley","email":"mdunleyds@over-blog.com","job":"Executive Secretary","timestamp":"2022-09-30T22:27:56Z"}
{"id":498,"first_name":"Marysa","last_name":"Lebond","email":"mlebonddt@nationalgeographic.com","job":"Chief Design Engineer","timestamp":"2022-07-03T09:53:16Z"}
{"id":499,"first_name":"Washington","last_name":"Nutton","email":"wnuttondu@godaddy.com","job":"Software Consultant","timestamp":"2022-01-15T12:19:31Z"}
{"id":500,"first_name":"Donny","last_name":"Matteo","email":"dmatteodv@comsenz.com","job":"Programmer I","timestamp":"2022-06-13T22:13:41Z"}
{"id":501,"first_name":"Alan","last_name":"Drummond","email":"adrummonddw@google.de","job":"Engineer II","timestamp":"2021-12-17T20:17:04Z"}
{"id":502,"first_name":"Tedmund","last_name":"Dorricott","email":"tdorricottdx@huffingtonpost.com","job":"Office Assistant III","timestamp":"2022-01-17T16:29:48Z"}
{"id":503,"first_name":"Dene","last_name":"Lammers","email":"dlammersdy@wiley.com","job":"Professor","timestamp":"2022-04-16T09:41:42Z"}
{"id":504,"first_name":"Town","last_name":"Leman","email":"tlemandz@amazon.co.uk","job":"Computer Systems Analyst II","timestamp":"2022-02-07T23:47:26Z"}
{"id":505,"first_name":"Bendix","last_name":"Applewhaite","email":"bapplewhaitee0@unc.edu","job":"Professor","timestamp":"2022-01-13T02:07:26Z"}
{"id":506,"first_name":"Paige","last_name":"Mcsarry","email":"pmcsarrye1@furl.net","job":"Librarian","timestamp":"2022-10-08T21:52:03Z"}
{"id":507,"first_name":"Nahum","last_name":"Sweeny","email":"nsweenye2@nifty.com","job":"Teacher","timestamp":"2022-05-03T19:18:43Z"}
{"id":508,"first_name":"Odelle","last_name":"Crosson","email":"ocrossone3@time.com","job":"Senior Developer","timestamp":"2022-07-19T01:56:54Z"}
{"id":509,"first_name":"Carny","last_name":"Hunter","email":"chuntere4@goodreads.com","job":"Human Resources Assistant IV","timestamp":"2022-06-01T04:40:16Z"}
{"id":510,"first_name":"Jarad","last_name":"Rogez","email":"jrogeze5@weather.com","job":"Media Manager IV","timestamp":"2022-11-04T13:41:35Z"}
{"id":511,"first_name":"Iggie","last_name":"Gainsburgh","email":"igainsburghe6@ehow.com","job":"Data Coordiator","timestamp":"2022-11-25T18:42:36Z"}
{"id":512,"first_name":"Meredeth","last_name":"Gealy","email":"mgealye7@va.gov","job":"Environmental Specialist","timestamp":"2022-07-06T12:34:03Z"}
{"id":513,"first_name":"Arluene","last_name":"Hallifax","email":"ahallifaxe8@narod.ru","job":"Environmental Tech","timestamp":"2022-11-01T18:57:22Z"}
{"id":514,"first_name":"Yehudit","last_name":"Leyfield","email":"yleyfielde9@clickbank.net","job":"Recruiting Manager","timestamp":"2022-07-02T07:24:27Z"}
{"id":515,"first_name":"Ezra","last_name":"Blabey","email":"eblabeyea@google.ca","job":"Librarian","timestamp":"2022-06-12T02:22:15Z"}
{"id":516,"first_name":"Gus","last_name":"Leipnik","email":"gleipnikeb@nytimes.com","job":"VP Product Management","timestamp":"2022-01-16T10:36:47Z"}
{"id":517,"first_name":"Benjamin","last_name":"Choak","email":"bchoakec@tumblr.com","job":"VP Product Management","timestamp":"2022-07-25T05:51:24Z"}
{"id":518,"first_name":"Reider","last_name":"Fisby","email":"rfisbyed@cdbaby.com","job":"Information Systems Manager","timestamp":"2022-07-16T17:19:04Z"}
{"id":519,"first_name":"Urbano","last_name":"Barr","email":"ubarree@ihg.com","job":"Data Coordiator","timestamp":"2022-08-16T09:11:02Z"}
{"id":520,"first_name":"Heinrik","last_name":"Courvert","email":"hcourvertef@plala.or.jp","job":"Software Test Engineer I","timestamp":"2022-05-13T03:16:39Z"}
{"id":521,"first_name":"Johann","last_name":"Schlagtmans","email":"jschlagtmanseg@over-blog.com","job":"Software Test Engineer I","timestamp":"2022-08-20T19:57:12Z"}
{"id":522,"first_name":"Brendan","last_name":"MacFadden","email":"bmacfaddeneh@vkontakte.ru","job":"Media Manager II","timestamp":"2022-08-01T22:39:44Z"}
{"id":523,"first_name":"Brittaney","last_name":"Kissock","email":"bkissockei@state.gov","job":"Compensation Analyst","timestamp":"2022-11-17T12:39:14Z"}
{"id":524,"first_name":"Hy","last_name":"Osmant","email":"hosmantej@hibu.com","job":"Help Desk Operator","timestamp":"2022-05-31T11:21:37Z"}
{"id":525,"first_name":"Christean","last_name":"Okell","email":"cokellek@sphinn.com","job":"VP Sales","timestamp":"2022-06-11T06:54:34Z"}
{"id":526,"first_name":"Catharina","last_name":"Onians","email":"coniansel@seesaa.net","job":"Structural Analysis Engineer","timestamp":"2022-12-02T18:12:53Z"}
{"id":527,"first_name":"Murry","last_name":"Gillings","email":"mgillingsem@vinaora.com","job":"Associate Professor","timestamp":"2022-10-29T18:22:04Z"}
{"id":528,"first_name":"Eunice","last_name":"Cottisford","email":"ecottisforden@ebay.co.uk","job":"Executive Secretary","timestamp":"2022-03-05T20:38:13Z"}
{"id":529,"first_name":"Brigg","last_name":"Earie","email":"bearieeo@printfriendly.com","job":"Staff Scientist","timestamp":"2022-09-02T02:50:14Z"}
{"id":530,"first_name":"Pavla","last_name":"Gooder","email":"pgooderep@sphinn.com","job":"Biostatistician II","timestamp":"2022-08-14T11:30:27Z"}
{"id":531,"first_name":"Vite","last_name":"Hendrichs","email":"vhendrichseq@wikia.com","job":"Payment Adjustment Coordinator","timestamp":"2022-10-22T09:52:12Z"}
{"id":532,"first_name":"Genovera","last_name":"Hucker","email":"ghuckerer@diigo.com","job":"Actuary","timestamp":"2022-08-31T22:16:03Z"}
{"id":533,"first_name":"Kristofor","last_name":"Gee","email":"kgeees@unblog.fr","job":"Software Consultant","timestamp":"2021-12-30T22:01:09Z"}
{"id":534,"first_name":"Rozanne","last_name":"Killoran","email":"rkilloranet@sun.com","job":"Social Worker","timestamp":"2022-07-10T01:32:57Z"}
{"id":535,"first_name":"Maurizio","last_name":"Whitby","email":"mwhitbyeu@reference.com","job":"Senior Editor","timestamp":"2021-12-31T05:35:45Z"}
{"id":536,"first_name":"Gerard","last_name":"Yukhnev","email":"gyukhnevev@merriam-webster.com","job":"Environmental Tech","timestamp":"2022-09-21T02:01:45Z"}
{"id":537,"first_name":"Abe","last_name":"Fleg","email":"aflegew@acquirethisname.com","job":"Database Administrator III","timestamp":"2022-03-19T11:41:21Z"}
{"id":538,"first_name":"Roseanna","last_name":"Lovewell","email":"rlovewellex@weebly.com","job":"Account Representative II","timestamp":"2022-04-10T19:30:59Z"}
{"id":539,"first_name":"Joya","last_name":"Makin","email":"jmakiney@dmoz.org","job":"Help Desk Operator","timestamp":"2022-05-22T09:39:40Z"}
{"id":540,"first_name":"Otto","last_name":"Kinneir","email":"okinneirez@mysql.com","job":"Biostatistician III","timestamp":"2022-06-05T12:49:16Z"}
{"id":541,"first_name":"Candy","last_name":"Pedrol","email":"cpedrolf0@sina.com.cn","job":"Social Worker","timestamp":"2022-02-08T15:10:50Z"}
{"id":542,"first_name":"Margarita","last_name":"Hembling","email":"mhemblingf1@cpanel.net","job":"Quality Engineer","timestamp":"2022-07-02T03:09:59Z"}
{"id":543,"first_name":"Claribel","last_name":"Pirouet","email":"cpirouetf2@apache.org","job":"Software Engineer II","timestamp":"2022-04-27T19:40:05Z"}
{"id":544,"first_name":"Jerrold","last_name":"Anglish","email":"janglishf3@unblog.fr","job":"Web Designer III","timestamp":"2022-10-13T04:12:21Z"}
{"id":545,"first_name":"Barr","last_name":"Humberston","email":"bhumberstonf4@etsy.com","job":"Statistician II","timestamp":"2022-05-04T01:15:05Z"}
{"id":546,"first_name":"Elbertine","last_name":"Fellnee","email":"efellneef5@reuters.com","job":"Health Coach II","timestamp":"2022-05-04T21:05:03Z"}
{"id":547,"first_name":"Edithe","last_name":"Hackin","email":"ehackinf6@uol.com.br","job":"Senior Sales Associate","timestamp":"2022-09-22T06:50:43Z"}
{"id":548,"first_name":"Lyndsay","last_name":"Bartoli","email":"lbartolif7@slate.com","job":"Staff Scientist","timestamp":"2021-12-10T17:25:16Z"}
{"id":549,"first_name":"Mason","last_name":"Furney","email":"mfurneyf8@si.edu","job":"Web Designer II","timestamp":"2022-11-29T08:36:41Z"}
{"id":550,"first_name":"Barbey","last_name":"Mindenhall","email":"bmindenhallf9@dailymotion.com","job":"Nuclear Power Engineer","timestamp":"2022-06-23T05:29:44Z"}
{"id":551,"first_name":"Jodi","last_name":"Olekhov","email":"jolekhovfa@oakley.com","job":"General Manager","timestamp":"2022-02-19T14:46:26Z"}
{"id":552,"first_name":"Jillayne","last_name":"Newis","email":"jnewisfb@e-recht24.de","job":"Research Associate","timestamp":"2022-11-13T17:04:16Z"}
{"id":553,"first_name":"Juliet","last_name":"Ridsdale","email":"jridsdalefc@loc.gov","job":"Software Engineer III","timestamp":"2021-12-22T08:30:46Z"}
{"id":554,"first_name":"Der","last_name":"Troth","email":"dtrothfd@samsung.com","job":"Software Test Engineer IV","timestamp":"2022-12-05T05:25:54Z"}
{"id":555,"first_name":"Sibley","last_name":"Aldin","email":"saldinfe@sogou.com","job":"Financial Analyst","timestamp":"2022-10-19T12:41:24Z"}
{"id":556,"first_name":"Dorris","last_name":"Blizard","email":"dblizardff@umich.edu","job":"Database Administrator I","timestamp":"2022-04-07T23:05:04Z"}
{"id":557,"first_name":"Blake","last_name":"Whates","email":"bwhatesfg@1688.com","job":"Marketing Manager","timestamp":"2022-05-23T17:32:50Z"}
{"id":558,"first_name":"Codi","last_name":"Marke","email":"cmarkefh@wsj.com","job":"Research Assistant III","timestamp":"2022-02-02T22:23:33Z"}
{"id":559,"first_name":"Stanislas","last_name":"Brafield","email":"sbrafieldfi@timesonline.co.uk","job":"Assistant Manager","timestamp":"2021-12-21T16:11:21Z"}
{"id":560,"first_name":"Lottie","last_name":"Sperring","email":"lsperringfj@salon.com","job":"Cost Accountant","timestamp":"2022-06-21T13:48:13Z"}
{"id":561,"first_name":"Alvina","last_name":"Beausang","email":"abeausangfk@blogspot.com","job":"Biostatistician I","timestamp":"2022-11-20T19:04:41Z"}
{"id":562,"first_name":"Barton","last_name":"Spencelayh","email":"bspencelayhfl@histats.com","job":"Product Engineer","timestamp":"2022-10-20T00:46:24Z"}
{"id":563,"first_name":"Allayne","last_name":"Treasure","email":"atreasurefm@xrea.com","job":"Accountant III","timestamp":"2022-10-09T13:55:39Z"}
{"id":564,"first_name":"Odey","last_name":"Van der Velde","email":"ovanderveldefn@t-online.de","job":"Recruiting Manager","timestamp":"2022-02-10T08:44:33Z"}
{"id":565,"first_name":"Eleanora","last_name":"Luchelli","email":"eluchellifo@livejournal.com","job":"Engineer I","timestamp":"2022-06-08T22:10:32Z"}
{"id":566,"first_name":"Gerta","last_name":"Iskowitz","email":"giskowitzfp@bravesites.com","job":"Nurse","timestamp":"2021-12-14T18:48:43Z"}
{"id":567,"first_name":"Asa","last_name":"Gregorin","email":"agregorinfq@addtoany.com","job":"Professor","timestamp":"2022-08-14T23:21:12Z"}
{"id":568,"first_name":"Marion","last_name":"MacManus","email":"mmacmanusfr@cdc.gov","job":"Marketing Manager","timestamp":"2022-06-03T08:50:13Z"}
{"id":569,"first_name":"Dionis","last_name":"Klimowski","email":"dklimowskifs@constantcontact.com","job":"Automation Specialist III","timestamp":"2022-02-14T12:33:54Z"}
{"id":570,"first_name":"Katherine","last_name":"McCarle","email":"kmccarleft@sogou.com","job":"Office Assistant II","timestamp":"2022-03-31T12:05:36Z"}
{"id":571,"first_name":"Evelyn","last_name":"MacCarrane","email":"emaccarranefu@cam.ac.uk","job":"Technical Writer","timestamp":"2022-11-06T20:16:28Z"}
{"id":572,"first_name":"Carolynn","last_name":"Forsaith","email":"cforsaithfv@blogs.com","job":"Health Coach IV","timestamp":"2022-02-08T14:49:50Z"}
{"id":573,"first_name":"Pancho","last_name":"Grealish","email":"pgrealishfw@fc2.com","job":"Senior Developer","timestamp":"2022-01-22T03:02:35Z"}
{"id":574,"first_name":"Royall","last_name":"Watson-Brown","email":"rwatsonbrownfx@a8.net","job":"Marketing Assistant","timestamp":"2022-03-15T23:38:10Z"}
{"id":575,"first_name":"Derk","last_name":"Carvill","email":"dcarvillfy@marriott.com","job":"Nurse","timestamp":"2021-12-13T14:15:47Z"}
{"id":576,"first_name":"Siffre","last_name":"Poston","email":"spostonfz@creativecommons.org","job":"Librarian","timestamp":"2022-07-03T08:01:40Z"}
{"id":577,"first_name":"Layla","last_name":"Monckton","email":"lmoncktong0@constantcontact.com","job":"Civil Engineer","timestamp":"2022-08-07T22:49:41Z"}
{"id":578,"first_name":"Ellyn","last_name":"Masse","email":"emasseg1@archive.org","job":"Sales Representative","timestamp":"2022-11-11T21:31:00Z"}
{"id":579,"first_name":"Gilbertina","last_name":"Younglove","email":"gyoungloveg2@omniture.com","job":"Design Engineer","timestamp":"2022-05-16T22:24:11Z"}
{"id":580,"first_name":"Hansiain","last_name":"Eddisford","email":"heddisfordg3@newsvine.com","job":"Design Engineer","timestamp":"2022-12-06T18:22:45Z"}
{"id":581,"first_name":"Sydney","last_name":"Writer","email":"swriterg4@yahoo.co.jp","job":"Media Manager I","timestamp":"2022-10-06T10:57:14Z"}
{"id":582,"first_name":"Stuart","last_name":"Jimeno","email":"sjimenog5@nifty.com","job":"Safety Technician IV","timestamp":"2022-01-03T22:49:27Z"}
{"id":583,"first_name":"Averill","last_name":"Leuchars","email":"aleucharsg6@g.co","job":"GIS Technical Architect","timestamp":"2022-05-17T04:29:13Z"}
{"id":584,"first_name":"Ruddie","last_name":"Bickerdicke","email":"rbickerdickeg7@earthlink.net","job":"Cost Accountant","timestamp":"2022-10-03T06:19:29Z"}
{"id":585,"first_name":"Krissie","last_name":"Walford","email":"kwalfordg8@a8.net","job":"Financial Analyst","timestamp":"2022-06-26T23:22:59Z"}
{"id":586,"first_name":"Zarah","last_name":"Ingleton","email":"zingletong9@si.edu","job":"Assistant Professor","timestamp":"2022-04-27T12:56:33Z"}
{"id":587,"first_name":"Ira","last_name":"Jaxon","email":"ijaxonga@virginia.edu","job":"Graphic Designer","timestamp":"2022-01-24T07:33:08Z"}
{"id":588,"first_name":"Gusella","last_name":"Musla","email":"gmuslagb@dmoz.org","job":"Web Designer III","timestamp":"2022-11-22T01:03:00Z"}
{"id":589,"first_name":"Hildegarde","last_name":"Breem","email":"hbreemgc@goo.gl","job":"Web Designer I","timestamp":"2022-04-01T05:45:18Z"}
{"id":590,"first_name":"Thaddeus","last_name":"Scouller","email":"tscoullergd@bloglovin.com","job":"Geological Engineer","timestamp":"2022-04-02T08:13:20Z"}
{"id":591,"first_name":"Martainn","last_name":"Fevers","email":"mfeversge@example.com","job":"Research Associate","timestamp":"2022-08-24T03:11:38Z"}
{"id":592,"first_name":"Edd","last_name":"Veasey","email":"eveaseygf@ameblo.jp","job":"Administrative Assistant II","timestamp":"2022-05-26T08:06:04Z"}
{"id":593,"first_name":"Elihu","last_name":"Redgewell","email":"eredgewellgg@nationalgeographic.com","job":"Clinical Specialist","timestamp":"2022-04-26T02:56:31Z"}
{"id":594,"first_name":"Renault","last_name":"Smye","email":"rsmyegh@wunderground.com","job":"Analog Circuit Design manager","timestamp":"2022-01-30T22:12:02Z"}
{"id":595,"first_name":"Leeland","last_name":"Hendricks","email":"lhendricksgi@foxnews.com","job":"Pharmacist","timestamp":"2022-05-30T02:24:30Z"}
{"id":596,"first_name":"Collin","last_name":"Arent","email":"carentgj@liveinternet.ru","job":"Mechanical Systems Engineer","timestamp":"2021-12-31T21:09:33Z"}
{"id":597,"first_name":"Kameko","last_name":"Pierce","email":"kpiercegk@china.com.cn","job":"Payment Adjustment Coordinator","timestamp":"2022-11-16T07:31:05Z"}
{"id":598,"first_name":"Mei","last_name":"Pigne","email":"mpignegl@ihg.com","job":"Technical Writer","timestamp":"2022-04-23T10:59:50Z"}
{"id":599,"first_name":"Jenni","last_name":"Skeggs","email":"jskeggsgm@wikipedia.org","job":"Assistant Manager","timestamp":"2022-05-25T06:30:40Z"}
{"id":600,"first_name":"Carver","last_name":"Rivalland","email":"crivallandgn@cornell.edu","job":"Internal Auditor","timestamp":"2022-01-31T17:19:48Z"}
{"id":601,"first_name":"Ciro","last_name":"MacLaverty","email":"cmaclavertygo@usda.gov","job":"VP Quality Control","timestamp":"2022-05-10T19:41:08Z"}
{"id":602,"first_name":"Brook","last_name":"Stickells","email":"bstickellsgp@prnewswire.com","job":"Help Desk Technician","timestamp":"2021-12-12T18:23:13Z"}
{"id":603,"first_name":"Morty","last_name":"Varfolomeev","email":"mvarfolomeevgq@toplist.cz","job":"Administrative Officer","timestamp":"2022-01-03T17:52:59Z"}
{"id":604,"first_name":"Ilario","last_name":"Silman","email":"isilmangr@princeton.edu","job":"Programmer I","timestamp":"2021-12-16T15:24:55Z"}
{"id":605,"first_name":"Lemar","last_name":"Groll","email":"lgrollgs@dyndns.org","job":"Cost Accountant","timestamp":"2022-01-19T15:59:40Z"}
{"id":606,"first_name":"Titos","last_name":"Thorrington","email":"tthorringtongt@cafepress.com","job":"Dental Hygienist","timestamp":"2022-10-06T23:19:20Z"}
{"id":607,"first_name":"Ivonne","last_name":"Yakov","email":"iyakovgu@alibaba.com","job":"Programmer Analyst I","timestamp":"2022-09-02T09:44:39Z"}
{"id":608,"first_name":"Cherish","last_name":"Poinsett","email":"cpoinsettgv@latimes.com","job":"Chemical Engineer","timestamp":"2022-01-23T21:57:24Z"}
{"id":609,"first_name":"Conrad","last_name":"Edmondson","email":"cedmondsongw@bravesites.com","job":"Marketing Assistant","timestamp":"2022-06-02T08:27:23Z"}
{"id":610,"first_name":"Zachary","last_name":"Debney","email":"zdebneygx@squidoo.com","job":"Software Consultant","timestamp":"2022-05-16T03:14:27Z"}
{"id":611,"first_name":"Candy","last_name":"Mc Harg","email":"cmcharggy@wikimedia.org","job":"Account Executive","timestamp":"2022-06-24T22:49:07Z"}
{"id":612,"first_name":"Stormi","last_name":"Stockford","email":"sstockfordgz@thetimes.co.uk","job":"Cost Accountant","timestamp":"2022-06-02T06:18:14Z"}
{"id":613,"first_name":"Robin","last_name":"Antalffy","email":"rantalffyh0@blinklist.com","job":"Design Engineer","timestamp":"2022-10-30T16:07:38Z"}
{"id":614,"first_name":"Elaina","last_name":"Dunkinson","email":"edunkinsonh1@istockphoto.com","job":"Director of Sales","timestamp":"2022-08-12T01:26:15Z"}
{"id":615,"first_name":"Merilyn","last_name":"Annable","email":"mannableh2@sourceforge.net","job":"Pharmacist","timestamp":"2022-11-13T10:13:18Z"}
{"id":616,"first_name":"Ferris","last_name":"Swetmore","email":"fswetmoreh3@mediafire.com","job":"Junior Executive","timestamp":"2022-07-01T14:36:04Z"}
{"id":617,"first_name":"Alf","last_name":"Ozintsev","email":"aozintsevh4@businessweek.com","job":"Internal Auditor","timestamp":"2022-11-19T03:10:43Z"}
{"id":618,"first_name":"Franky","last_name":"Ralton","email":"fraltonh5@weather.com","job":"VP Sales","timestamp":"2022-01-30T19:17:00Z"}
{"id":619,"first_name":"Hedvige","last_name":"Rowlands","email":"hrowlandsh6@comcast.net","job":"Financial Advisor","timestamp":"2022-09-09T11:04:09Z"}
{"id":620,"first_name":"Tynan","last_name":"Crippell","email":"tcrippellh7@berkeley.edu","job":"Nurse Practicioner","timestamp":"2022-09-21T03:11:14Z"}
{"id":621,"first_name":"Alexine","last_name":"Rawlinson","email":"arawlinsonh8@boston.com","job":"Pharmacist","timestamp":"2022-10-18T23:38:56Z"}
{"id":622,"first_name":"Yehudit","last_name":"Couldwell","email":"ycouldwellh9@scientificamerican.com","job":"Safety Technician I","timestamp":"2022-03-28T18:53:05Z"}
{"id":623,"first_name":"Eleanora","last_name":"Bromont","email":"ebromontha@tinyurl.com","job":"Teacher","timestamp":"2022-05-20T03:41:08Z"}
{"id":624,"first_name":"Vincenty","last_name":"Rackham","email":"vrackhamhb@blogtalkradio.com","job":"Senior Financial Analyst","timestamp":"2022-05-10T00:44:21Z"}
{"id":625,"first_name":"Rozella","last_name":"Stent","email":"rstenthc@so-net.ne.jp","job":"Actuary","timestamp":"2022-04-16T06:16:59Z"}
{"id":626,"first_name":"Kerwinn","last_name":"Possel","email":"kposselhd@umn.edu","job":"Analyst Programmer","timestamp":"2022-07-30T17:35:49Z"}
{"id":627,"first_name":"Griffie","last_name":"Quibell","email":"gquibellhe@newyorker.com","job":"Executive Secretary","timestamp":"2022-06-14T19:28:57Z"}
{"id":628,"first_name":"Anatola","last_name":"Mallion","email":"amallionhf@upenn.edu","job":"Sales Associate","timestamp":"2022-03-15T17:11:58Z"}
{"id":629,"first_name":"Dalila","last_name":"Christaeas","email":"dchristaeashg@bandcamp.com","job":"Automation Specialist II","timestamp":"2022-02-03T01:42:06Z"}
{"id":630,"first_name":"Gina","last_name":"Franses","email":"gfranseshh@hao123.com","job":"Clinical Specialist","timestamp":"2022-09-02T08:10:09Z"}
{"id":631,"first_name":"Clio","last_name":"Richardt","email":"crichardthi@joomla.org","job":"Nurse","timestamp":"2021-12-31T19:05:01Z"}
{"id":632,"first_name":"Aryn","last_name":"Hofler","email":"ahoflerhj@free.fr","job":"Quality Control Specialist","timestamp":"2021-12-31T02:58:46Z"}
{"id":633,"first_name":"Berthe","last_name":"Pecht","email":"bpechthk@soundcloud.com","job":"Safety Technician III","timestamp":"2022-11-28T13:33:39Z"}
{"id":634,"first_name":"Marty","last_name":"Crichten","email":"mcrichtenhl@joomla.org","job":"Technical Writer","timestamp":"2022-11-20T17:22:51Z"}
{"id":635,"first_name":"Costanza","last_name":"Grigorushkin","email":"cgrigorushkinhm@seesaa.net","job":"Nurse","timestamp":"2022-07-23T11:29:41Z"}
{"id":636,"first_name":"Janet","last_name":"Northidge","email":"jnorthidgehn@elpais.com","job":"Civil Engineer","timestamp":"2022-05-29T19:03:17Z"}
{"id":637,"first_name":"Charo","last_name":"Esp","email":"cespho@google.com.au","job":"Assistant Media Planner","timestamp":"2022-11-07T00:24:12Z"}
{"id":638,"first_name":"Livvy","last_name":"Grzelewski","email":"lgrzelewskihp@alibaba.com","job":"Administrative Officer","timestamp":"2022-02-06T05:24:56Z"}
{"id":639,"first_name":"Hernando","last_name":"Bryde","email":"hbrydehq@a8.net","job":"Professor","timestamp":"2022-11-01T19:40:15Z"}
{"id":640,"first_name":"Biddy","last_name":"Vine","email":"bvinehr@yahoo.co.jp","job":"Assistant Professor","timestamp":"2022-04-10T06:19:06Z"}
{"id":641,"first_name":"Base","last_name":"Friend","email":"bfriendhs@blogs.com","job":"Legal Assistant","timestamp":"2022-09-03T07:38:34Z"}
{"id":642,"first_name":"Marian","last_name":"Basek","email":"mbasekht@shop-pro.jp","job":"Teacher","timestamp":"2022-09-08T13:13:12Z"}
{"id":643,"first_name":"Ketty","last_name":"Clowney","email":"kclowneyhu@illinois.edu","job":"Research Assistant I","timestamp":"2022-02-20T17:55:16Z"}
{"id":644,"first_name":"Thurston","last_name":"Bossom","email":"tbossomhv@netvibes.com","job":"Statistician III","timestamp":"2022-07-08T06:19:02Z"}
{"id":645,"first_name":"Laure","last_name":"Durrad","email":"ldurradhw@google.pl","job":"Staff Scientist","timestamp":"2022-03-04T04:48:35Z"}
{"id":646,"first_name":"Mildrid","last_name":"Gloy","email":"mgloyhx@themeforest.net","job":"Information Systems Manager","timestamp":"2022-01-08T22:58:28Z"}
{"id":647,"first_name":"Johannah","last_name":"Dorward","email":"jdorwardhy@ovh.net","job":"Analyst Programmer","timestamp":"2022-08-31T07:35:18Z"}
{"id":648,"first_name":"Breena","last_name":"Sidebottom","email":"bsidebottomhz@networksolutions.com","job":"Data Coordiator","timestamp":"2021-12-22T03:36:41Z"}
{"id":649,"first_name":"Jemie","last_name":"Bunch","email":"jbunchi0@cnet.com","job":"Senior Sales Associate","timestamp":"2022-06-03T16:40:56Z"}
{"id":650,"first_name":"Daphna","last_name":"Matchett","email":"dmatchetti1@lulu.com","job":"Information Systems Manager","timestamp":"2022-09-14T16:03:23Z"}
{"id":651,"first_name":"Aymer","last_name":"Lamb-shine","email":"alambshinei2@miibeian.gov.cn","job":"Executive Secretary","timestamp":"2022-05-14T06:33:03Z"}
{"id":652,"first_name":"Brady","last_name":"O'Cuddie","email":"bocuddiei3@google.nl","job":"Research Assistant III","timestamp":"2022-10-28T18:25:01Z"}
{"id":653,"first_name":"Orion","last_name":"Scane","email":"oscanei4@ed.gov","job":"Payment Adjustment Coordinator","timestamp":"2022-07-31T08:16:20Z"}
{"id":654,"first_name":"Bord","last_name":"Cundy","email":"bcundyi5@va.gov","job":"Chief Design Engineer","timestamp":"2022-05-14T12:57:30Z"}
{"id":655,"first_name":"Claudio","last_name":"Fowls","email":"cfowlsi6@1688.com","job":"Director of Sales","timestamp":"2022-01-02T16:42:42Z"}
{"id":656,"first_name":"Leif","last_name":"Inkster","email":"linksteri7@yolasite.com","job":"Assistant Manager","timestamp":"2022-10-24T14:04:24Z"}
{"id":657,"first_name":"Giacinta","last_name":"Wiley","email":"gwileyi8@1688.com","job":"Director of Sales","timestamp":"2022-09-26T16:26:19Z"}
{"id":658,"first_name":"Karylin","last_name":"Allcock","email":"kallcocki9@unesco.org","job":"Accounting Assistant II","timestamp":"2022-05-23T22:15:24Z"}
{"id":659,"first_name":"Krisha","last_name":"Cadden","email":"kcaddenia@purevolume.com","job":"Design Engineer","timestamp":"2022-03-13T05:30:02Z"}
{"id":660,"first_name":"Darnall","last_name":"Grayer","email":"dgrayerib@cargocollective.com","job":"Quality Control Specialist","timestamp":"2022-05-26T11:19:15Z"}
{"id":661,"first_name":"Vin","last_name":"Brinsden","email":"vbrinsdenic@cnet.com","job":"Administrative Officer","timestamp":"2022-10-27T11:50:28Z"}
{"id":662,"first_name":"Lori","last_name":"Hartzogs","email":"lhartzogsid@admin.ch","job":"Senior Editor","timestamp":"2021-12-23T05:37:47Z"}
{"id":663,"first_name":"Kim","last_name":"MacAlinden","email":"kmacalindenie@cornell.edu","job":"Sales Representative","timestamp":"2022-07-09T04:11:04Z"}
{"id":664,"first_name":"Trever","last_name":"Pirnie","email":"tpirnieif@msu.edu","job":"Software Consultant","timestamp":"2022-06-15T21:46:38Z"}
{"id":665,"first_name":"Deidre","last_name":"Kinloch","email":"dkinlochig@salon.com","job":"Health Coach I","timestamp":"2022-10-24T05:33:17Z"}
{"id":666,"first_name":"Christabella","last_name":"Vecard","email":"cvecardih@nydailynews.com","job":"Social Worker","timestamp":"2022-11-13T22:26:59Z"}
{"id":667,"first_name":"Bobbye","last_name":"Kanzler","email":"bkanzlerii@cdbaby.com","job":"Food Chemist","timestamp":"2022-09-23T19:25:44Z"}
{"id":668,"first_name":"Ellen","last_name":"O'Monahan","email":"eomonahanij@mapquest.com","job":"Budget/Accounting Analyst III","timestamp":"2022-08-24T01:54:47Z"}
{"id":669,"first_name":"Nickolaus","last_name":"Bilbie","email":"nbilbieik@ucoz.ru","job":"Junior Executive","timestamp":"2022-02-04T07:50:33Z"}
{"id":670,"first_name":"Brooks","last_name":"Mableson","email":"bmablesonil@toplist.cz","job":"Editor","timestamp":"2022-05-17T16:53:27Z"}
{"id":671,"first_name":"Joyann","last_name":"Tavinor","email":"jtavinorim@tamu.edu","job":"Nuclear Power Engineer","timestamp":"2022-09-06T03:01:20Z"}
{"id":672,"first_name":"Mathe","last_name":"Valerius","email":"mvaleriusin@squarespace.com","job":"GIS Technical Architect","timestamp":"2022-03-08T15:41:18Z"}
{"id":673,"first_name":"Donalt","last_name":"Sainz","email":"dsainzio@biglobe.ne.jp","job":"Nurse","timestamp":"2022-03-19T11:31:30Z"}
{"id":674,"first_name":"Tobey","last_name":"Semeradova","email":"tsemeradovaip@google.ru","job":"Senior Cost Accountant","timestamp":"2022-07-29T04:18:03Z"}
{"id":675,"first_name":"Hendrik","last_name":"Patman","email":"hpatmaniq@zdnet.com","job":"Research Associate","timestamp":"2022-02-03T16:16:17Z"}
{"id":676,"first_name":"Trina","last_name":"Whopples","email":"twhopplesir@who.int","job":"Librarian","timestamp":"2022-07-07T17:52:03Z"}
{"id":677,"first_name":"Merrick","last_name":"Ussher","email":"mussheris@oakley.com","job":"Software Test Engineer III","timestamp":"2022-01-21T05:56:03Z"}
{"id":678,"first_name":"Jennine","last_name":"Mielnik","email":"jmielnikit@ocn.ne.jp","job":"Software Test Engineer III","timestamp":"2022-07-25T19:09:52Z"}
{"id":679,"first_name":"Kenny","last_name":"Greeve","email":"kgreeveiu@ow.ly","job":"Community Outreach Specialist","timestamp":"2022-10-16T20:23:43Z"}
{"id":680,"first_name":"Hasheem","last_name":"Franklyn","email":"hfranklyniv@typepad.com","job":"Quality Control Specialist","timestamp":"2022-05-26T01:47:42Z"}
{"id":681,"first_name":"Wendel","last_name":"Dicken","email":"wdickeniw@ft.com","job":"Automation Specialist IV","timestamp":"2022-06-23T02:50:42Z"}
{"id":682,"first_name":"Harlene","last_name":"Semaine","email":"hsemaineix@odnoklassniki.ru","job":"Recruiting Manager","timestamp":"2022-05-31T14:10:40Z"}
{"id":683,"first_name":"Timothea","last_name":"Kilminster","email":"tkilminsteriy@ning.com","job":"Operator","timestamp":"2022-07-28T21:06:36Z"}
{"id":684,"first_name":"Ram","last_name":"Lindelof","email":"rlindelofiz@mail.ru","job":"Nuclear Power Engineer","timestamp":"2022-01-11T12:40:10Z"}
{"id":685,"first_name":"Marven","last_name":"Wollen","email":"mwollenj0@printfriendly.com","job":"Automation Specialist I","timestamp":"2022-05-24T11:30:18Z"}
{"id":686,"first_name":"Nikoletta","last_name":"Shimmin","email":"nshimminj1@taobao.com","job":"Product Engineer","timestamp":"2022-01-02T14:01:08Z"}
{"id":687,"first_name":"Wheeler","last_name":"Beincken","email":"wbeinckenj2@symantec.com","job":"Professor","timestamp":"2022-12-05T15:00:24Z"}
{"id":688,"first_name":"Mufi","last_name":"Slimon","email":"mslimonj3@arizona.edu","job":"Junior Executive","timestamp":"2022-02-17T18:27:49Z"}
{"id":689,"first_name":"Debee","last_name":"Heavyside","email":"dheavysidej4@ftc.gov","job":"Accounting Assistant II","timestamp":"2022-04-21T20:06:43Z"}
{"id":690,"first_name":"Lois","last_name":"Choules","email":"lchoulesj5@sbwire.com","job":"Computer Systems Analyst IV","timestamp":"2022-04-23T05:50:57Z"}
{"id":691,"first_name":"Issie","last_name":"Rosenberg","email":"irosenbergj6@spotify.com","job":"Analyst Programmer","timestamp":"2022-05-06T21:27:41Z"}
{"id":692,"first_name":"Cicely","last_name":"Costen","email":"ccostenj7@goo.gl","job":"Staff Scientist","timestamp":"2021-12-21T02:39:27Z"}
{"id":693,"first_name":"Barbe","last_name":"Kinneir","email":"bkinneirj8@artisteer.com","job":"Sales Associate","timestamp":"2022-06-11T10:08:55Z"}
{"id":694,"first_name":"Emlyn","last_name":"Adamski","email":"eadamskij9@hubpages.com","job":"Programmer I","timestamp":"2022-10-03T15:22:54Z"}
{"id":695,"first_name":"Rebeca","last_name":"Lorenzini","email":"rlorenzinija@auda.org.au","job":"Analyst Programmer","timestamp":"2022-01-25T17:06:52Z"}
{"id":696,"first_name":"Burke","last_name":"Dalzell","email":"bdalzelljb@bing.com","job":"Programmer I","timestamp":"2022-06-25T11:26:32Z"}
{"id":697,"first_name":"Danila","last_name":"Munton","email":"dmuntonjc@oracle.com","job":"Administrative Assistant III","timestamp":"2022-02-07T19:08:39Z"}
{"id":698,"first_name":"Pablo","last_name":"Ritchman","email":"pritchmanjd@virginia.edu","job":"Research Associate","timestamp":"2022-01-10T02:21:15Z"}
{"id":699,"first_name":"Jillana","last_name":"Welden","email":"jweldenje@vistaprint.com","job":"Recruiter","timestamp":"2022-10-14T01:12:35Z"}
{"id":700,"first_name":"Quintilla","last_name":"McDonagh","email":"qmcdonaghjf@biblegateway.com","job":"Food Chemist","timestamp":"2021-12-09T23:20:44Z"}
{"id":701,"first_name":"Gladys","last_name":"Schoenfisch","email":"gschoenfischjg@google.com.br","job":"VP Accounting","timestamp":"2022-01-20T10:39:38Z"}
{"id":702,"first_name":"Hallie","last_name":"Gery","email":"hgeryjh@blinklist.com","job":"Senior Editor","timestamp":"2022-07-28T15:09:46Z"}
{"id":703,"first_name":"Iorgos","last_name":"Skea","email":"iskeaji@wikia.com","job":"Chemical Engineer","timestamp":"2022-11-22T18:08:01Z"}
{"id":704,"first_name":"Lennard","last_name":"Jolliman","email":"ljollimanjj@walmart.com","job":"Executive Secretary","timestamp":"2021-12-23T00:39:05Z"}
{"id":705,"first_name":"Barde","last_name":"Dixie","email":"bdixiejk@java.com","job":"GIS Technical Architect","timestamp":"2022-02-03T12:21:25Z"}
{"id":706,"first_name":"Catherin","last_name":"Jain","email":"cjainjl@flavors.me","job":"Internal Auditor","timestamp":"2022-09-04T12:46:16Z"}
{"id":707,"first_name":"Dwight","last_name":"Axston","email":"daxstonjm@taobao.com","job":"Marketing Assistant","timestamp":"2021-12-11T13:11:12Z"}
{"id":708,"first_name":"Gerhardine","last_name":"More","email":"gmorejn@liveinternet.ru","job":"Junior Executive","timestamp":"2022-05-08T03:43:14Z"}
{"id":709,"first_name":"Gabe","last_name":"Dominy","email":"gdominyjo@nba.com","job":"Physical Therapy Assistant","timestamp":"2022-04-08T18:45:30Z"}
{"id":710,"first_name":"Lena","last_name":"Abbis","email":"labbisjp@nps.gov","job":"Editor","timestamp":"2022-03-09T21:30:34Z"}
{"id":711,"first_name":"Viola","last_name":"Filgate","email":"vfilgatejq@altervista.org","job":"Project Manager","timestamp":"2022-11-08T00:41:42Z"}
{"id":712,"first_name":"Rolfe","last_name":"Ranahan","email":"rranahanjr@sakura.ne.jp","job":"Software Engineer III","timestamp":"2022-10-23T12:04:16Z"}
{"id":713,"first_name":"Victoria","last_name":"Zanni","email":"vzannijs@google.de","job":"Accountant IV","timestamp":"2022-03-24T07:57:40Z"}
{"id":714,"first_name":"Scarlet","last_name":"Linay","email":"slinayjt@admin.ch","job":"Food Chemist","timestamp":"2022-06-20T04:04:22Z"}
{"id":715,"first_name":"Odella","last_name":"Nursey","email":"onurseyju@fema.gov","job":"Computer Systems Analyst I","timestamp":"2022-09-06T07:57:03Z"}
{"id":716,"first_name":"Gretta","last_name":"Crasswell","email":"gcrasswelljv@i2i.jp","job":"Media Manager IV","timestamp":"2022-12-06T23:09:00Z"}
{"id":717,"first_name":"Lorna","last_name":"Stanman","email":"lstanmanjw@spiegel.de","job":"Physical Therapy Assistant","timestamp":"2022-04-17T12:42:27Z"}
{"id":718,"first_name":"Emilio","last_name":"Gercken","email":"egerckenjx@addthis.com","job":"Editor","timestamp":"2022-08-25T06:39:00Z"}
{"id":719,"first_name":"Bailey","last_name":"Tournay","email":"btournayjy@discuz.net","job":"Editor","timestamp":"2022-03-19T15:02:39Z"}
{"id":720,"first_name":"Magdalen","last_name":"Gavriel","email":"mgavrieljz@indiatimes.com","job":"Assistant Manager","timestamp":"2022-08-05T17:45:49Z"}
{"id":721,"first_name":"Gretel","last_name":"Tinkler","email":"gtinklerk0@51.la","job":"Occupational Therapist","timestamp":"2022-07-27T12:40:20Z"}
{"id":722,"first_name":"Rona","last_name":"Caldecutt","email":"rcaldecuttk1@edublogs.org","job":"Human Resources Manager","timestamp":"2022-07-23T14:54:32Z"}
{"id":723,"first_name":"Lynne","last_name":"Crinidge","email":"lcrinidgek2@google.nl","job":"Financial Analyst","timestamp":"2022-05-26T17:40:55Z"}
{"id":724,"first_name":"Pace","last_name":"Ambrogio","email":"pambrogiok3@ehow.com","job":"Accountant II","timestamp":"2022-02-01T23:19:50Z"}
{"id":725,"first_name":"Alaine","last_name":"Durgan","email":"adurgank4@cmu.edu","job":"Chemical Engineer","timestamp":"2022-06-13T08:59:43Z"}
{"id":726,"first_name":"Teddie","last_name":"Nealon","email":"tnealonk5@qq.com","job":"Community Outreach Specialist","timestamp":"2022-05-12T16:32:14Z"}
{"id":727,"first_name":"Lorelei","last_name":"Lindstrom","email":"llindstromk6@nyu.edu","job":"Nuclear Power Engineer","timestamp":"2022-02-28T06:36:27Z"}
{"id":728,"first_name":"Marena","last_name":"Treleaven","email":"mtreleavenk7@answers.com","job":"Occupational Therapist","timestamp":"2022-07-31T18:58:00Z"}
{"id":729,"first_name":"Trace","last_name":"Mouth","email":"tmouthk8@about.me","job":"Environmental Tech","timestamp":"2022-04-04T08:48:58Z"}
{"id":730,"first_name":"Terry","last_name":"Dorant","email":"tdorantk9@vkontakte.ru","job":"Accountant III","timestamp":"2022-03-28T09:01:58Z"}
{"id":731,"first_name":"De witt","last_name":"Tilbury","email":"dtilburyka@istockphoto.com","job":"Mechanical Systems Engineer","timestamp":"2022-08-08T21:56:03Z"}
{"id":732,"first_name":"Mel","last_name":"Kilalea","email":"mkilaleakb@java.com","job":"Developer III","timestamp":"2022-01-22T22:44:51Z"}
{"id":733,"first_name":"Albertina","last_name":"Eagles","email":"aeagleskc@typepad.com","job":"Accounting Assistant IV","timestamp":"2022-03-23T22:17:56Z"}
{"id":734,"first_name":"Berthe","last_name":"De Hailes","email":"bdehaileskd@biblegateway.com","job":"Associate Professor","timestamp":"2021-12-13T10:46:15Z"}
{"id":735,"first_name":"Muffin","last_name":"MacCawley","email":"mmaccawleyke@yahoo.com","job":"General Manager","timestamp":"2022-07-04T09:03:49Z"}
{"id":736,"first_name":"Glynnis","last_name":"Petz","email":"gpetzkf@infoseek.co.jp","job":"Data Coordiator","timestamp":"2022-08-26T16:14:41Z"}
{"id":737,"first_name":"Davis","last_name":"Loyns","email":"dloynskg@phpbb.com","job":"VP Quality Control","timestamp":"2022-02-26T22:11:32Z"}
{"id":738,"first_name":"Rayshell","last_name":"Whittenbury","email":"rwhittenburykh@ucoz.ru","job":"Staff Scientist","timestamp":"2022-08-25T13:30:55Z"}
{"id":739,"first_name":"Adrien","last_name":"Wellfare","email":"awellfareki@unblog.fr","job":"Registered Nurse","timestamp":"2022-08-11T06:20:29Z"}
{"id":740,"first_name":"Atlanta","last_name":"Piccop","email":"apiccopkj@vistaprint.com","job":"Sales Representative","timestamp":"2022-02-22T09:26:48Z"}
{"id":741,"first_name":"Glad","last_name":"Boolsen","email":"gboolsenkk@dailymail.co.uk","job":"Budget/Accounting Analyst IV","timestamp":"2022-06-15T06:48:27Z"}
{"id":742,"first_name":"Marlo","last_name":"Schenfisch","email":"mschenfischkl@businessinsider.com","job":"Programmer I","timestamp":"2022-04-21T15:15:56Z"}
{"id":743,"first_name":"Nadine","last_name":"Lomb","email":"nlombkm@theguardian.com","job":"Senior Editor","timestamp":"2022-10-28T11:10:07Z"}
{"id":744,"first_name":"Hartley","last_name":"Kemetz","email":"hkemetzkn@histats.com","job":"Internal Auditor","timestamp":"2022-01-13T20:49:23Z"}
{"id":745,"first_name":"Wayland","last_name":"Murch","email":"wmurchko@yellowbook.com","job":"Nurse","timestamp":"2022-01-19T12:11:01Z"}
{"id":746,"first_name":"Chuck","last_name":"Shama","email":"cshamakp@noaa.gov","job":"Occupational Therapist","timestamp":"2022-08-17T03:48:57Z"}
{"id":747,"first_name":"Maximilien","last_name":"Hender","email":"mhenderkq@squarespace.com","job":"Analog Circuit Design manager","timestamp":"2022-10-09T00:31:21Z"}
{"id":748,"first_name":"Hoyt","last_name":"Sains","email":"hsainskr@patch.com","job":"Project Manager","timestamp":"2022-11-02T08:21:21Z"}
{"id":749,"first_name":"Raychel","last_name":"Marsham","email":"rmarshamks@eepurl.com","job":"Database Administrator III","timestamp":"2022-08-14T01:54:32Z"}
{"id":750,"first_name":"Meriel","last_name":"Slowley","email":"mslowleykt@mail.ru","job":"Information Systems Manager","timestamp":"2022-07-07T00:41:12Z"}
{"id":751,"first_name":"Meara","last_name":"Rawcliff","email":"mrawcliffku@t.co","job":"Tax Accountant","timestamp":"2022-08-10T04:38:07Z"}
{"id":752,"first_name":"Mignon","last_name":"Klee","email":"mkleekv@usatoday.com","job":"Staff Scientist","timestamp":"2022-10-02T13:43:33Z"}
{"id":753,"first_name":"Dulci","last_name":"Simonou","email":"dsimonoukw@i2i.jp","job":"Operator","timestamp":"2022-10-11T17:09:14Z"}
{"id":754,"first_name":"Candis","last_name":"Letford","email":"cletfordkx@cyberchimps.com","job":"Accountant I","timestamp":"2022-03-30T08:46:25Z"}
{"id":755,"first_name":"Carmen","last_name":"Crighton","email":"ccrightonky@prlog.org","job":"Assistant Professor","timestamp":"2022-09-26T06:42:14Z"}
{"id":756,"first_name":"Warner","last_name":"Sinott","email":"wsinottkz@dropbox.com","job":"Staff Scientist","timestamp":"2022-05-20T22:40:55Z"}
{"id":757,"first_name":"Viv","last_name":"Moylan","email":"vmoylanl0@jimdo.com","job":"Account Representative II","timestamp":"2021-12-08T21:43:10Z"}
{"id":758,"first_name":"Heddie","last_name":"Beynke","email":"hbeynkel1@amazon.com","job":"Physical Therapy Assistant","timestamp":"2021-12-16T14:39:59Z"}
{"id":759,"first_name":"Roberto","last_name":"Bottle","email":"rbottlel2@mlb.com","job":"Sales Associate","timestamp":"2021-12-23T04:18:27Z"}
{"id":760,"first_name":"Krysta","last_name":"Malzard","email":"kmalzardl3@hp.com","job":"Administrative Assistant III","timestamp":"2022-11-03T17:41:14Z"}
{"id":761,"first_name":"Aurea","last_name":"Povall","email":"apovalll4@wikispaces.com","job":"Editor","timestamp":"2021-12-27T03:17:49Z"}
{"id":762,"first_name":"Burt","last_name":"Phillott","email":"bphillottl5@opensource.org","job":"Programmer II","timestamp":"2022-02-11T00:22:12Z"}
{"id":763,"first_name":"Elnar","last_name":"Smorthit","email":"esmorthitl6@timesonline.co.uk","job":"Research Nurse","timestamp":"2022-01-05T14:47:09Z"}
{"id":764,"first_name":"Linnell","last_name":"Ilyushkin","email":"lilyushkinl7@bloglovin.com","job":"Senior Financial Analyst","timestamp":"2022-01-30T02:30:52Z"}
{"id":765,"first_name":"Lee","last_name":"Waeland","email":"lwaelandl8@mapy.cz","job":"Accounting Assistant I","timestamp":"2022-04-17T05:28:49Z"}
{"id":766,"first_name":"Clotilda","last_name":"Litterick","email":"clitterickl9@gmpg.org","job":"Research Associate","timestamp":"2022-10-13T02:50:59Z"}
{"id":767,"first_name":"Shepherd","last_name":"Furmonger","email":"sfurmongerla@opensource.org","job":"Junior Executive","timestamp":"2022-10-24T12:54:10Z"}
{"id":768,"first_name":"Boycey","last_name":"Halversen","email":"bhalversenlb@fastcompany.com","job":"Editor","timestamp":"2021-12-09T13:50:42Z"}
{"id":769,"first_name":"Lamar","last_name":"Dressell","email":"ldresselllc@instagram.com","job":"Web Developer IV","timestamp":"2022-04-27T08:39:18Z"}
{"id":770,"first_name":"Davita","last_name":"Jolin","email":"djolinld@is.gd","job":"Food Chemist","timestamp":"2021-12-21T15:03:35Z"}
{"id":771,"first_name":"Teddie","last_name":"Heinrici","email":"theinricile@guardian.co.uk","job":"Desktop Support Technician","timestamp":"2022-03-14T17:43:34Z"}
{"id":772,"first_name":"Catherin","last_name":"Egle of Germany","email":"cegleofgermanylf@yahoo.com","job":"Senior Quality Engineer","timestamp":"2022-06-13T23:32:57Z"}
{"id":773,"first_name":"Birgit","last_name":"Vasyukhin","email":"bvasyukhinlg@freewebs.com","job":"Human Resources Manager","timestamp":"2022-01-31T18:54:27Z"}
{"id":774,"first_name":"Rory","last_name":"Bohman","email":"rbohmanlh@goo.gl","job":"Actuary","timestamp":"2022-01-02T22:02:28Z"}
{"id":775,"first_name":"Ezechiel","last_name":"Bransdon","email":"ebransdonli@blogtalkradio.com","job":"Information Systems Manager","timestamp":"2022-03-22T18:51:52Z"}
{"id":776,"first_name":"Hillie","last_name":"Athowe","email":"hathowelj@google.pl","job":"Sales Representative","timestamp":"2021-12-16T07:47:18Z"}
{"id":777,"first_name":"Edwina","last_name":"Verry","email":"everrylk@trellian.com","job":"Staff Accountant IV","timestamp":"2022-04-29T04:08:45Z"}
{"id":778,"first_name":"Alyce","last_name":"Pulham","email":"apulhamll@samsung.com","job":"Health Coach II","timestamp":"2022-12-06T01:14:54Z"}
{"id":779,"first_name":"Estele","last_name":"Cullimore","email":"ecullimorelm@indiatimes.com","job":"Actuary","timestamp":"2022-01-21T10:00:05Z"}
{"id":780,"first_name":"Iver","last_name":"Jeannenet","email":"ijeannenetln@nifty.com","job":"Accountant II","timestamp":"2022-11-16T09:38:28Z"}
{"id":781,"first_name":"Olimpia","last_name":"Coulsen","email":"ocoulsenlo@xing.com","job":"Research Associate","timestamp":"2022-02-24T09:11:20Z"}
{"id":782,"first_name":"Noel","last_name":"Ludlem","email":"nludlemlp@desdev.cn","job":"Speech Pathologist","timestamp":"2022-04-25T11:57:38Z"}
{"id":783,"first_name":"Enoch","last_name":"Goddman","email":"egoddmanlq@imdb.com","job":"Staff Scientist","timestamp":"2021-12-19T13:34:15Z"}
{"id":784,"first_name":"Heinrik","last_name":"McGee","email":"hmcgeelr@marriott.com","job":"Technical Writer","timestamp":"2022-03-25T07:45:03Z"}
{"id":785,"first_name":"Rosella","last_name":"Arent","email":"rarentls@mysql.com","job":"Chief Design Engineer","timestamp":"2022-08-27T06:07:40Z"}
{"id":786,"first_name":"Gerard","last_name":"Heathfield","email":"gheathfieldlt@bloomberg.com","job":"Health Coach II","timestamp":"2022-01-11T18:42:53Z"}
{"id":787,"first_name":"Davie","last_name":"Di Biaggi","email":"ddibiaggilu@yelp.com","job":"Director of Sales","timestamp":"2022-06-05T18:40:22Z"}
{"id":788,"first_name":"Meredith","last_name":"Hatchell","email":"mhatchelllv@google.ca","job":"Biostatistician IV","timestamp":"2022-05-26T14:28:05Z"}
{"id":789,"first_name":"Haven","last_name":"Coppeard","email":"hcoppeardlw@virginia.edu","job":"Structural Engineer","timestamp":"2022-04-02T23:43:01Z"}
{"id":790,"first_name":"Marietta","last_name":"MacTrustey","email":"mmactrusteylx@pinterest.com","job":"Graphic Designer","timestamp":"2022-03-16T13:38:59Z"}
{"id":791,"first_name":"Chrisse","last_name":"Sargerson","email":"csargersonly@dell.com","job":"VP Sales","timestamp":"2022-07-16T21:03:21Z"}
{"id":792,"first_name":"Barri","last_name":"Danilevich","email":"bdanilevichlz@dmoz.org","job":"Community Outreach Specialist","timestamp":"2022-11-12T05:56:51Z"}
{"id":793,"first_name":"Eleanore","last_name":"Dallemore","email":"edallemorem0@globo.com","job":"Paralegal","timestamp":"2022-09-29T14:34:42Z"}
{"id":794,"first_name":"Skye","last_name":"Southerill","email":"ssoutherillm1@weebly.com","job":"Database Administrator I","timestamp":"2022-06-08T18:20:11Z"}
{"id":795,"first_name":"Trueman","last_name":"Layfield","email":"tlayfieldm2@live.com","job":"Structural Analysis Engineer","timestamp":"2022-02-26T21:26:01Z"}
{"id":796,"first_name":"Nollie","last_name":"Allanson","email":"nallansonm3@un.org","job":"Sales Associate","timestamp":"2022-02-26T05:40:49Z"}
{"id":797,"first_name":"Shay","last_name":"Marder","email":"smarderm4@chronoengine.com","job":"Data Coordiator","timestamp":"2022-05-25T12:31:14Z"}
{"id":798,"first_name":"Jolee","last_name":"Danit","email":"jdanitm5@princeton.edu","job":"VP Product Management","timestamp":"2022-08-21T12:50:15Z"}
{"id":799,"first_name":"Neile","last_name":"Pottiphar","email":"npottipharm6@nsw.gov.au","job":"Research Nurse","timestamp":"2022-06-30T15:02:03Z"}
{"id":800,"first_name":"Pen","last_name":"Garrattley","email":"pgarrattleym7@ucoz.ru","job":"Registered Nurse","timestamp":"2022-12-05T16:06:07Z"}
{"id":801,"first_name":"Duffie","last_name":"Morrow","email":"dmorrowm8@weebly.com","job":"Research Associate","timestamp":"2022-10-27T20:27:59Z"}
{"id":802,"first_name":"Garland","last_name":"Dunnet","email":"gdunnetm9@microsoft.com","job":"Graphic Designer","timestamp":"2022-04-06T05:47:47Z"}
{"id":803,"first_name":"Bianka","last_name":"Escott","email":"bescottma@netlog.com","job":"Statistician II","timestamp":"2022-02-05T07:13:30Z"}
{"id":804,"first_name":"Ebonee","last_name":"Bown","email":"ebownmb@nasa.gov","job":"Paralegal","timestamp":"2022-07-03T08:24:49Z"}
{"id":805,"first_name":"Katherina","last_name":"Marciskewski","email":"kmarciskewskimc@cdbaby.com","job":"Mechanical Systems Engineer","timestamp":"2022-07-01T19:22:29Z"}
{"id":806,"first_name":"Matti","last_name":"Cadwaladr","email":"mcadwaladrmd@163.com","job":"Senior Sales Associate","timestamp":"2022-05-06T00:33:03Z"}
{"id":807,"first_name":"Kiel","last_name":"Castellet","email":"kcastelletme@washingtonpost.com","job":"Environmental Specialist","timestamp":"2022-02-18T09:24:22Z"}
{"id":808,"first_name":"Lothario","last_name":"Gingle","email":"lginglemf@seattletimes.com","job":"Software Engineer IV","timestamp":"2022-10-18T10:17:11Z"}
{"id":809,"first_name":"Thadeus","last_name":"Caine","email":"tcainemg@google.co.jp","job":"Programmer Analyst I","timestamp":"2022-09-25T02:58:47Z"}
{"id":810,"first_name":"Debor","last_name":"Membry","email":"dmembrymh@flavors.me","job":"GIS Technical Architect","timestamp":"2022-06-20T09:00:42Z"}
{"id":811,"first_name":"Bronson","last_name":"Grassi","email":"bgrassimi@reverbnation.com","job":"Accountant II","timestamp":"2022-05-24T07:30:50Z"}
{"id":812,"first_name":"Corey","last_name":"Cheley","email":"ccheleymj@cafepress.com","job":"Environmental Specialist","timestamp":"2022-08-17T04:44:36Z"}
{"id":813,"first_name":"Faydra","last_name":"Wason","email":"fwasonmk@sphinn.com","job":"Software Engineer I","timestamp":"2022-10-14T11:57:26Z"}
{"id":814,"first_name":"Lulu","last_name":"Kluger","email":"lklugerml@google.cn","job":"Accounting Assistant IV","timestamp":"2022-02-11T06:23:54Z"}
{"id":815,"first_name":"Micky","last_name":"Urch","email":"murchmm@yellowbook.com","job":"Office Assistant II","timestamp":"2022-09-12T14:35:45Z"}
{"id":816,"first_name":"Hinze","last_name":"Buglass","email":"hbuglassmn@biglobe.ne.jp","job":"GIS Technical Architect","timestamp":"2022-09-09T07:07:58Z"}
{"id":817,"first_name":"Bernette","last_name":"Wikey","email":"bwikeymo@issuu.com","job":"Graphic Designer","timestamp":"2022-08-06T03:02:20Z"}
{"id":818,"first_name":"Gav","last_name":"Starbucke","email":"gstarbuckemp@ox.ac.uk","job":"Registered Nurse","timestamp":"2022-10-24T06:45:21Z"}
{"id":819,"first_name":"Karleen","last_name":"Taffie","email":"ktaffiemq@acquirethisname.com","job":"Speech Pathologist","timestamp":"2022-08-26T14:37:04Z"}
{"id":820,"first_name":"Aldon","last_name":"Margerison","email":"amargerisonmr@de.vu","job":"Business Systems Development Analyst","timestamp":"2022-02-13T18:06:07Z"}
{"id":821,"first_name":"Gerrie","last_name":"O'Lenechan","email":"golenechanms@nytimes.com","job":"Sales Associate","timestamp":"2022-09-06T17:38:15Z"}
{"id":822,"first_name":"Ronny","last_name":"Woodage","email":"rwoodagemt@cbc.ca","job":"Graphic Designer","timestamp":"2022-01-24T01:06:27Z"}
{"id":823,"first_name":"Kippie","last_name":"Stone","email":"kstonemu@nih.gov","job":"Sales Associate","timestamp":"2022-07-31T21:58:11Z"}
{"id":824,"first_name":"Alvis","last_name":"Cranidge","email":"acranidgemv@cmu.edu","job":"Database Administrator III","timestamp":"2021-12-15T21:10:22Z"}
{"id":825,"first_name":"Irv","last_name":"Mycroft","email":"imycroftmw@walmart.com","job":"Web Developer II","timestamp":"2022-07-23T17:09:26Z"}
{"id":826,"first_name":"Salome","last_name":"McGourty","email":"smcgourtymx@techcrunch.com","job":"Data Coordiator","timestamp":"2022-10-15T12:52:05Z"}
{"id":827,"first_name":"Querida","last_name":"Dall","email":"qdallmy@home.pl","job":"Librarian","timestamp":"2022-04-02T23:34:41Z"}
{"id":828,"first_name":"Ailee","last_name":"Clemmensen","email":"aclemmensenmz@webs.com","job":"Human Resources Manager","timestamp":"2022-03-04T22:47:54Z"}
{"id":829,"first_name":"Merwyn","last_name":"MacVaugh","email":"mmacvaughn0@msn.com","job":"VP Accounting","timestamp":"2022-09-16T15:33:45Z"}
{"id":830,"first_name":"Hilary","last_name":"Ostridge","email":"hostridgen1@apache.org","job":"Librarian","timestamp":"2022-07-01T12:51:19Z"}
{"id":831,"first_name":"Jose","last_name":"Willder","email":"jwilldern2@hc360.com","job":"Information Systems Manager","timestamp":"2022-06-16T19:41:35Z"}
{"id":832,"first_name":"Rozalie","last_name":"Crowcher","email":"rcrowchern3@economist.com","job":"Accountant IV","timestamp":"2022-05-03T15:17:59Z"}
{"id":833,"first_name":"Heidi","last_name":"Tuny","email":"htunyn4@timesonline.co.uk","job":"Research Associate","timestamp":"2022-10-19T14:35:46Z"}
{"id":834,"first_name":"Inge","last_name":"Raun","email":"iraunn5@slideshare.net","job":"Financial Analyst","timestamp":"2022-10-26T19:33:59Z"}
{"id":835,"first_name":"Sibelle","last_name":"Cours","email":"scoursn6@themeforest.net","job":"VP Sales","timestamp":"2022-11-13T04:22:18Z"}
{"id":836,"first_name":"Arden","last_name":"Algie","email":"aalgien7@photobucket.com","job":"Safety Technician III","timestamp":"2022-09-17T06:44:05Z"}
{"id":837,"first_name":"Irvin","last_name":"Scroyton","email":"iscroytonn8@auda.org.au","job":"Editor","timestamp":"2021-12-19T13:18:04Z"}
{"id":838,"first_name":"Waring","last_name":"Van Dalen","email":"wvandalenn9@addtoany.com","job":"Chemical Engineer","timestamp":"2022-01-13T10:19:40Z"}
{"id":839,"first_name":"Mata","last_name":"McAulay","email":"mmcaulayna@ucla.edu","job":"Marketing Assistant","timestamp":"2022-08-30T06:04:43Z"}
{"id":840,"first_name":"Elsa","last_name":"Vickery","email":"evickerynb@si.edu","job":"Operator","timestamp":"2022-09-30T00:48:09Z"}
{"id":841,"first_name":"Hedda","last_name":"Erat","email":"heratnc@amazon.de","job":"Administrative Officer","timestamp":"2022-06-20T14:36:55Z"}
{"id":842,"first_name":"Belicia","last_name":"Eddow","email":"beddownd@cnn.com","job":"Chief Design Engineer","timestamp":"2022-01-10T05:33:16Z"}
{"id":843,"first_name":"Jenn","last_name":"Maidstone","email":"jmaidstonene@theglobeandmail.com","job":"Senior Editor","timestamp":"2022-03-02T23:23:36Z"}
{"id":844,"first_name":"Boycie","last_name":"Cordes","email":"bcordesnf@baidu.com","job":"Clinical Specialist","timestamp":"2022-06-23T03:06:33Z"}
{"id":845,"first_name":"Sanderson","last_name":"Breffitt","email":"sbreffittng@aboutads.info","job":"Software Engineer II","timestamp":"2022-10-05T00:17:08Z"}
{"id":846,"first_name":"Renell","last_name":"Eldred","email":"reldrednh@histats.com","job":"Analog Circuit Design manager","timestamp":"2022-07-25T23:38:06Z"}
{"id":847,"first_name":"Flory","last_name":"Castagnier","email":"fcastagnierni@studiopress.com","job":"Safety Technician I","timestamp":"2022-10-26T16:38:48Z"}
{"id":848,"first_name":"Susette","last_name":"Runnacles","email":"srunnaclesnj@wisc.edu","job":"Assistant Media Planner","timestamp":"2022-04-17T08:23:24Z"}
{"id":849,"first_name":"Camila","last_name":"Tweedell","email":"ctweedellnk@bizjournals.com","job":"Administrative Assistant IV","timestamp":"2022-02-21T08:17:01Z"}
{"id":850,"first_name":"Perry","last_name":"Obey","email":"pobeynl@omniture.com","job":"Biostatistician III","timestamp":"2022-10-06T13:30:56Z"}
{"id":851,"first_name":"Ertha","last_name":"Elleray","email":"eelleraynm@github.io","job":"Teacher","timestamp":"2022-08-04T23:19:13Z"}
{"id":852,"first_name":"Wallie","last_name":"Hamlett","email":"whamlettnn@hexun.com","job":"Media Manager III","timestamp":"2022-08-30T06:54:56Z"}
{"id":853,"first_name":"Marchelle","last_name":"De la Yglesia","email":"mdelayglesiano@nbcnews.com","job":"Engineer III","timestamp":"2022-03-30T09:10:19Z"}
{"id":854,"first_name":"Eugen","last_name":"Kirk","email":"ekirknp@ezinearticles.com","job":"Community Outreach Specialist","timestamp":"2021-12-16T02:14:06Z"}
{"id":855,"first_name":"Mable","last_name":"Bickerton","email":"mbickertonnq@zdnet.com","job":"Food Chemist","timestamp":"2022-01-07T16:19:09Z"}
{"id":856,"first_name":"Ricki","last_name":"Lalevee","email":"rlaleveenr@msu.edu","job":"VP Sales","timestamp":"2022-07-16T03:33:06Z"}
{"id":857,"first_name":"Karylin","last_name":"Allport","email":"kallportns@time.com","job":"Paralegal","timestamp":"2022-04-22T13:30:34Z"}
{"id":858,"first_name":"Sisile","last_name":"Burkin","email":"sburkinnt@google.com.br","job":"Senior Editor","timestamp":"2022-08-12T00:46:45Z"}
{"id":859,"first_name":"Maxi","last_name":"Carl","email":"mcarlnu@illinois.edu","job":"Internal Auditor","timestamp":"2022-04-07T15:15:14Z"}
{"id":860,"first_name":"Ediva","last_name":"McFarlan","email":"emcfarlannv@google.cn","job":"Quality Engineer","timestamp":"2022-05-15T14:40:42Z"}
{"id":861,"first_name":"Rosco","last_name":"Gregoretti","email":"rgregorettinw@bravesites.com","job":"Account Coordinator","timestamp":"2022-07-01T10:19:08Z"}
{"id":862,"first_name":"Denise","last_name":"Trimmell","email":"dtrimmellnx@163.com","job":"Assistant Professor","timestamp":"2022-06-03T15:07:57Z"}
{"id":863,"first_name":"Penny","last_name":"Dahlman","email":"pdahlmanny@apache.org","job":"Account Representative III","timestamp":"2022-05-18T11:27:11Z"}
{"id":864,"first_name":"Brant","last_name":"Billes","email":"bbillesnz@kickstarter.com","job":"Data Coordiator","timestamp":"2022-10-28T10:54:26Z"}
{"id":865,"first_name":"Lorne","last_name":"Stanbridge","email":"lstanbridgeo0@vistaprint.com","job":"Compensation Analyst","timestamp":"2022-02-15T09:00:19Z"}
{"id":866,"first_name":"Rodger","last_name":"Vedeniktov","email":"rvedeniktovo1@ycombinator.com","job":"Software Consultant","timestamp":"2022-08-03T14:49:52Z"}
{"id":867,"first_name":"Selma","last_name":"Twitching","email":"stwitchingo2@meetup.com","job":"Help Desk Operator","timestamp":"2022-04-30T22:24:30Z"}
{"id":868,"first_name":"Templeton","last_name":"Yakebovich","email":"tyakebovicho3@fc2.com","job":"Internal Auditor","timestamp":"2022-02-24T01:33:50Z"}
{"id":869,"first_name":"Reidar","last_name":"Dudding","email":"rduddingo4@ucoz.com","job":"Statistician III","timestamp":"2022-01-08T12:26:12Z"}
{"id":870,"first_name":"Lammond","last_name":"Dunnion","email":"ldunniono5@miibeian.gov.cn","job":"Actuary","timestamp":"2022-10-02T01:22:33Z"}
{"id":871,"first_name":"Pren","last_name":"Baraclough","email":"pbaraclougho6@artisteer.com","job":"Software Consultant","timestamp":"2022-06-27T19:19:01Z"}
{"id":872,"first_name":"Stacie","last_name":"Grunnell","email":"sgrunnello7@aol.com","job":"Social Worker","timestamp":"2022-03-13T04:54:57Z"}
{"id":873,"first_name":"Grata","last_name":"Karlsen","email":"gkarlseno8@google.com.hk","job":"Software Test Engineer II","timestamp":"2022-08-08T09:17:55Z"}
{"id":874,"first_name":"Stirling","last_name":"Lohan","email":"slohano9@yale.edu","job":"Quality Control Specialist","timestamp":"2022-02-25T07:55:43Z"}
{"id":875,"first_name":"Samuele","last_name":"Evason","email":"sevasonoa@va.gov","job":"Software Engineer II","timestamp":"2022-03-23T04:00:01Z"}
{"id":876,"first_name":"Jerome","last_name":"Sherlock","email":"jsherlockob@4shared.com","job":"Community Outreach Specialist","timestamp":"2022-11-23T09:46:58Z"}
{"id":877,"first_name":"Iseabal","last_name":"Titmuss","email":"ititmussoc@pen.io","job":"Teacher","timestamp":"2022-05-19T11:43:40Z"}
{"id":878,"first_name":"Farr","last_name":"Duignan","email":"fduignanod@nbcnews.com","job":"Business Systems Development Analyst","timestamp":"2022-11-16T07:29:52Z"}
{"id":879,"first_name":"Julita","last_name":"Alster","email":"jalsteroe@altervista.org","job":"Marketing Assistant","timestamp":"2022-07-19T19:16:33Z"}
{"id":880,"first_name":"Modestia","last_name":"Aldrin","email":"maldrinof@slideshare.net","job":"Media Manager III","timestamp":"2022-08-22T15:07:30Z"}
{"id":881,"first_name":"Elset","last_name":"Bilston","email":"ebilstonog@gizmodo.com","job":"Nurse Practicioner","timestamp":"2022-01-28T19:35:10Z"}
{"id":882,"first_name":"Fidole","last_name":"Deverell","email":"fdeverelloh@issuu.com","job":"Environmental Specialist","timestamp":"2021-12-29T09:20:43Z"}
{"id":883,"first_name":"Aloysia","last_name":"Napier","email":"anapieroi@rediff.com","job":"Staff Accountant IV","timestamp":"2022-06-07T06:02:41Z"}
{"id":884,"first_name":"Rustin","last_name":"Teliga","email":"rteligaoj@chronoengine.com","job":"Physical Therapy Assistant","timestamp":"2022-07-05T08:34:42Z"}
{"id":885,"first_name":"Debor","last_name":"Kester","email":"dkesterok@ca.gov","job":"Recruiter","timestamp":"2022-09-01T03:43:02Z"}
{"id":886,"first_name":"Morna","last_name":"Davidzon","email":"mdavidzonol@altervista.org","job":"Media Manager II","timestamp":"2022-06-23T05:24:01Z"}
{"id":887,"first_name":"Joan","last_name":"Aldcorn","email":"jaldcornom@phpbb.com","job":"Internal Auditor","timestamp":"2022-07-06T02:23:55Z"}
{"id":888,"first_name":"Luciana","last_name":"Mousley","email":"lmousleyon@ehow.com","job":"Data Coordiator","timestamp":"2021-12-17T12:48:48Z"}
{"id":889,"first_name":"Laney","last_name":"Sharman","email":"lsharmanoo@omniture.com","job":"Executive Secretary","timestamp":"2021-12-07T15:02:25Z"}
{"id":890,"first_name":"Chancey","last_name":"Andover","email":"candoverop@irs.gov","job":"Project Manager","timestamp":"2022-08-04T23:53:09Z"}
{"id":891,"first_name":"Jilly","last_name":"Remirez","email":"jremirezoq@sakura.ne.jp","job":"Programmer Analyst III","timestamp":"2021-12-31T17:59:35Z"}
{"id":892,"first_name":"Darin","last_name":"Ivanuschka","email":"divanuschkaor@guardian.co.uk","job":"Accountant III","timestamp":"2022-05-03T05:25:56Z"}
{"id":893,"first_name":"Griselda","last_name":"Cordeau]","email":"gcordeauos@illinois.edu","job":"Legal Assistant","timestamp":"2021-12-16T18:09:52Z"}
{"id":894,"first_name":"Peta","last_name":"Ramsier","email":"pramsierot@thetimes.co.uk","job":"Nurse","timestamp":"2022-09-26T04:28:02Z"}
{"id":895,"first_name":"Ferrell","last_name":"Quinnelly","email":"fquinnellyou@technorati.com","job":"Legal Assistant","timestamp":"2022-02-09T15:26:30Z"}
{"id":896,"first_name":"Buffy","last_name":"Osgodby","email":"bosgodbyov@blogger.com","job":"Chief Design Engineer","timestamp":"2022-02-26T01:21:35Z"}
{"id":897,"first_name":"Shannen","last_name":"Village","email":"svillageow@cloudflare.com","job":"Marketing Manager","timestamp":"2022-07-05T14:31:29Z"}
{"id":898,"first_name":"Randy","last_name":"Wickliffe","email":"rwickliffeox@trellian.com","job":"Actuary","timestamp":"2022-02-11T06:57:45Z"}
{"id":899,"first_name":"Elayne","last_name":"Maurice","email":"emauriceoy@economist.com","job":"Research Associate","timestamp":"2022-04-24T10:22:55Z"}
{"id":900,"first_name":"Erda","last_name":"Babonau","email":"ebabonauoz@topsy.com","job":"Senior Financial Analyst","timestamp":"2022-11-28T04:40:49Z"}
{"id":901,"first_name":"Jehu","last_name":"Mullard","email":"jmullardp0@chicagotribune.com","job":"Marketing Manager","timestamp":"2022-08-02T04:25:00Z"}
{"id":902,"first_name":"Chrissie","last_name":"Clacey","email":"cclaceyp1@domainmarket.com","job":"Software Test Engineer IV","timestamp":"2022-03-27T12:28:06Z"}
{"id":903,"first_name":"Michaela","last_name":"Streeting","email":"mstreetingp2@epa.gov","job":"Human Resources Manager","timestamp":"2022-03-08T11:02:27Z"}
{"id":904,"first_name":"Stearn","last_name":"Kiernan","email":"skiernanp3@google.pl","job":"Payment Adjustment Coordinator","timestamp":"2022-08-23T15:42:08Z"}
{"id":905,"first_name":"Cory","last_name":"Athowe","email":"cathowep4@unblog.fr","job":"Actuary","timestamp":"2022-09-13T15:53:22Z"}
{"id":906,"first_name":"Vonni","last_name":"Goby","email":"vgobyp5@nifty.com","job":"Compensation Analyst","timestamp":"2021-12-11T08:40:28Z"}
{"id":907,"first_name":"Englebert","last_name":"Glaister","email":"eglaisterp6@independent.co.uk","job":"Human Resources Manager","timestamp":"2022-11-20T00:02:17Z"}
{"id":908,"first_name":"Barris","last_name":"Mosson","email":"bmossonp7@statcounter.com","job":"Nurse","timestamp":"2022-07-15T10:29:25Z"}
{"id":909,"first_name":"Konstantin","last_name":"Furphy","email":"kfurphyp8@oakley.com","job":"Legal Assistant","timestamp":"2022-08-16T13:16:54Z"}
{"id":910,"first_name":"Loria","last_name":"Carratt","email":"lcarrattp9@ow.ly","job":"Structural Engineer","timestamp":"2022-01-11T20:48:34Z"}
{"id":911,"first_name":"Torrey","last_name":"Richings","email":"trichingspa@indiatimes.com","job":"Computer Systems Analyst III","timestamp":"2022-04-28T05:05:01Z"}
{"id":912,"first_name":"Merissa","last_name":"Jorioz","email":"mjoriozpb@ebay.com","job":"Senior Developer","timestamp":"2022-04-12T00:47:48Z"}
{"id":913,"first_name":"Abraham","last_name":"Fairbard","email":"afairbardpc@intel.com","job":"Assistant Professor","timestamp":"2022-01-11T00:48:04Z"}
{"id":914,"first_name":"Sidnee","last_name":"McCreery","email":"smccreerypd@forbes.com","job":"Registered Nurse","timestamp":"2022-11-23T23:12:08Z"}
{"id":915,"first_name":"Elspeth","last_name":"Kollatsch","email":"ekollatschpe@rediff.com","job":"Account Representative I","timestamp":"2022-01-20T06:08:10Z"}
{"id":916,"first_name":"Gherardo","last_name":"Waitland","email":"gwaitlandpf@businessinsider.com","job":"Cost Accountant","timestamp":"2022-07-04T05:08:04Z"}
{"id":917,"first_name":"Alick","last_name":"Olczak","email":"aolczakpg@stumbleupon.com","job":"VP Product Management","timestamp":"2022-10-22T14:53:06Z"}
{"id":918,"first_name":"Eolanda","last_name":"Scarfe","email":"escarfeph@e-recht24.de","job":"Cost Accountant","timestamp":"2022-05-14T07:33:31Z"}
{"id":919,"first_name":"Gilberto","last_name":"Shatford","email":"gshatfordpi@digg.com","job":"Chemical Engineer","timestamp":"2022-09-04T13:51:44Z"}
{"id":920,"first_name":"Vincent","last_name":"Andreopolos","email":"vandreopolospj@cbslocal.com","job":"Office Assistant II","timestamp":"2022-07-25T09:43:30Z"}
{"id":921,"first_name":"Kat","last_name":"Gaylard","email":"kgaylardpk@nydailynews.com","job":"Pharmacist","timestamp":"2022-01-07T13:41:26Z"}
{"id":922,"first_name":"Kettie","last_name":"Downing","email":"kdowningpl@odnoklassniki.ru","job":"Software Test Engineer IV","timestamp":"2022-04-28T01:05:46Z"}
{"id":923,"first_name":"Dolores","last_name":"Ellif","email":"dellifpm@craigslist.org","job":"Chief Design Engineer","timestamp":"2022-05-28T08:11:26Z"}
{"id":924,"first_name":"Baillie","last_name":"Aymerich","email":"baymerichpn@posterous.com","job":"Financial Advisor","timestamp":"2022-08-19T21:42:32Z"}
{"id":925,"first_name":"Fidelia","last_name":"Latour","email":"flatourpo@weebly.com","job":"Senior Financial Analyst","timestamp":"2022-07-09T04:32:59Z"}
{"id":926,"first_name":"Fraser","last_name":"Hinchon","email":"fhinchonpp@nydailynews.com","job":"Structural Engineer","timestamp":"2022-03-07T21:17:55Z"}
{"id":927,"first_name":"Eryn","last_name":"Gosnall","email":"egosnallpq@lulu.com","job":"Actuary","timestamp":"2022-07-24T19:40:39Z"}
{"id":928,"first_name":"Doria","last_name":"Coumbe","email":"dcoumbepr@nymag.com","job":"Cost Accountant","timestamp":"2022-01-27T05:05:20Z"}
{"id":929,"first_name":"Mei","last_name":"Cusick","email":"mcusickps@gizmodo.com","job":"Librarian","timestamp":"2022-06-13T19:46:16Z"}
{"id":930,"first_name":"Hernando","last_name":"Prestie","email":"hprestiept@disqus.com","job":"Product Engineer","timestamp":"2022-03-28T11:48:59Z"}
{"id":931,"first_name":"Stefanie","last_name":"Wonham","email":"swonhampu@liveinternet.ru","job":"Accountant I","timestamp":"2022-01-09T11:17:35Z"}
{"id":932,"first_name":"Addy","last_name":"Kemell","email":"akemellpv@sina.com.cn","job":"Sales Representative","timestamp":"2022-09-15T01:17:27Z"}
{"id":933,"first_name":"Delainey","last_name":"Laver","email":"dlaverpw@usa.gov","job":"Junior Executive","timestamp":"2022-07-13T19:59:51Z"}
{"id":934,"first_name":"Ewart","last_name":"Doe","email":"edoepx@zdnet.com","job":"Electrical Engineer","timestamp":"2022-07-10T20:15:41Z"}
{"id":935,"first_name":"Gabriela","last_name":"Marmyon","email":"gmarmyonpy@blinklist.com","job":"Junior Executive","timestamp":"2022-06-06T14:42:33Z"}
{"id":936,"first_name":"Amabelle","last_name":"Vassie","email":"avassiepz@sitemeter.com","job":"Statistician IV","timestamp":"2022-10-17T15:35:37Z"}
{"id":937,"first_name":"Haley","last_name":"Paddon","email":"hpaddonq0@google.ru","job":"Engineer II","timestamp":"2022-01-24T08:25:00Z"}
{"id":938,"first_name":"Kurt","last_name":"Sandaver","email":"ksandaverq1@bluehost.com","job":"Structural Engineer","timestamp":"2022-06-29T14:55:21Z"}
{"id":939,"first_name":"Almire","last_name":"Wearne","email":"awearneq2@tmall.com","job":"General Manager","timestamp":"2022-01-08T01:56:40Z"}
{"id":940,"first_name":"Norina","last_name":"Pacey","email":"npaceyq3@cyberchimps.com","job":"VP Product Management","timestamp":"2022-07-26T04:44:14Z"}
{"id":941,"first_name":"Irwin","last_name":"Barrett","email":"ibarrettq4@icio.us","job":"Editor","timestamp":"2022-06-06T22:52:44Z"}
{"id":942,"first_name":"Cornie","last_name":"Pasquale","email":"cpasqualeq5@xing.com","job":"Actuary","timestamp":"2022-05-26T04:39:40Z"}
{"id":943,"first_name":"Heda","last_name":"Behling","email":"hbehlingq6@noaa.gov","job":"Senior Quality Engineer","timestamp":"2022-08-31T20:17:15Z"}
{"id":944,"first_name":"Cariotta","last_name":"Luberti","email":"clubertiq7@sphinn.com","job":"Accounting Assistant II","timestamp":"2022-06-22T05:02:39Z"}
{"id":945,"first_name":"Saraann","last_name":"Clew","email":"sclewq8@geocities.jp","job":"Quality Control Specialist","timestamp":"2022-10-09T03:37:41Z"}
{"id":946,"first_name":"Reynold","last_name":"Lean","email":"rleanq9@facebook.com","job":"Product Engineer","timestamp":"2022-05-01T01:08:01Z"}
{"id":947,"first_name":"Dorree","last_name":"McKevin","email":"dmckevinqa@odnoklassniki.ru","job":"Budget/Accounting Analyst IV","timestamp":"2022-07-06T20:09:43Z"}
{"id":948,"first_name":"Redford","last_name":"Mancell","email":"rmancellqb@techcrunch.com","job":"Research Assistant I","timestamp":"2022-07-08T21:45:19Z"}
{"id":949,"first_name":"Ricky","last_name":"Gilstoun","email":"rgilstounqc@boston.com","job":"Software Consultant","timestamp":"2022-03-12T08:04:21Z"}
{"id":950,"first_name":"Jessamyn","last_name":"Canlin","email":"jcanlinqd@jimdo.com","job":"Structural Analysis Engineer","timestamp":"2022-08-17T17:20:42Z"}
{"id":951,"first_name":"Donaugh","last_name":"Goodson","email":"dgoodsonqe@reference.com","job":"Internal Auditor","timestamp":"2022-03-10T10:29:27Z"}
{"id":952,"first_name":"Yehudi","last_name":"Truggian","email":"ytruggianqf@fc2.com","job":"Project Manager","timestamp":"2022-05-25T21:02:33Z"}
{"id":953,"first_name":"Alister","last_name":"Drust","email":"adrustqg@techcrunch.com","job":"Quality Engineer","timestamp":"2022-01-04T10:05:09Z"}
{"id":954,"first_name":"Cosette","last_name":"Fawdrie","email":"cfawdrieqh@statcounter.com","job":"Assistant Manager","timestamp":"2022-03-27T19:08:56Z"}
{"id":955,"first_name":"Jayne","last_name":"Crosio","email":"jcrosioqi@webs.com","job":"Biostatistician IV","timestamp":"2021-12-28T22:15:22Z"}
{"id":956,"first_name":"Sawyere","last_name":"Brompton","email":"sbromptonqj@imdb.com","job":"Recruiting Manager","timestamp":"2022-05-02T22:03:03Z"}
{"id":957,"first_name":"Timmie","last_name":"Farrow","email":"tfarrowqk@hexun.com","job":"Safety Technician II","timestamp":"2022-07-31T05:14:18Z"}
{"id":958,"first_name":"Courtney","last_name":"Gleave","email":"cgleaveql@squidoo.com","job":"Information Systems Manager","timestamp":"2022-10-01T22:12:55Z"}
{"id":959,"first_name":"Justis","last_name":"Mauditt","email":"jmaudittqm@wikispaces.com","job":"Structural Engineer","timestamp":"2022-07-03T02:48:32Z"}
{"id":960,"first_name":"Ambrosius","last_name":"Taffs","email":"ataffsqn@house.gov","job":"Geologist II","timestamp":"2022-10-19T20:32:22Z"}
{"id":961,"first_name":"Pren","last_name":"Bountiff","email":"pbountiffqo@redcross.org","job":"Electrical Engineer","timestamp":"2022-07-28T14:25:59Z"}
{"id":962,"first_name":"Zack","last_name":"Kubal","email":"zkubalqp@phoca.cz","job":"Data Coordiator","timestamp":"2022-03-20T13:57:34Z"}
{"id":963,"first_name":"Jaquenetta","last_name":"MacGilfoyle","email":"jmacgilfoyleqq@weebly.com","job":"Web Developer I","timestamp":"2022-10-17T19:19:52Z"}
{"id":964,"first_name":"Sarajane","last_name":"Kampshell","email":"skampshellqr@examiner.com","job":"Pharmacist","timestamp":"2022-08-19T15:18:34Z"}
{"id":965,"first_name":"Zorine","last_name":"Franc","email":"zfrancqs@slideshare.net","job":"Quality Control Specialist","timestamp":"2022-11-01T20:57:31Z"}
{"id":966,"first_name":"Milissent","last_name":"Tristram","email":"mtristramqt@va.gov","job":"Sales Representative","timestamp":"2021-12-22T08:28:56Z"}
{"id":967,"first_name":"Finley","last_name":"Hughf","email":"fhughfqu@cbsnews.com","job":"Payment Adjustment Coordinator","timestamp":"2021-12-26T09:12:05Z"}
{"id":968,"first_name":"Fionnula","last_name":"McSporrin","email":"fmcsporrinqv@senate.gov","job":"Occupational Therapist","timestamp":"2022-10-03T10:44:53Z"}
{"id":969,"first_name":"Marcelline","last_name":"Hartington","email":"mhartingtonqw@unblog.fr","job":"Desktop Support Technician","timestamp":"2022-10-11T20:39:44Z"}
{"id":970,"first_name":"Maurizio","last_name":"MacBean","email":"mmacbeanqx@hhs.gov","job":"Operator","timestamp":"2022-08-04T13:28:13Z"}
{"id":971,"first_name":"Jeannie","last_name":"Muzzall","email":"jmuzzallqy@bbc.co.uk","job":"Account Representative III","timestamp":"2022-08-23T13:31:39Z"}
{"id":972,"first_name":"Fredia","last_name":"Hitchens","email":"fhitchensqz@chronoengine.com","job":"General Manager","timestamp":"2022-01-01T15:22:41Z"}
{"id":973,"first_name":"Karim","last_name":"Fossitt","email":"kfossittr0@csmonitor.com","job":"Engineer IV","timestamp":"2022-03-05T15:37:38Z"}
{"id":974,"first_name":"Heindrick","last_name":"Bird","email":"hbirdr1@ehow.com","job":"Computer Systems Analyst II","timestamp":"2022-03-13T18:22:09Z"}
{"id":975,"first_name":"Carolann","last_name":"Dunphy","email":"cdunphyr2@mozilla.com","job":"VP Product Management","timestamp":"2022-04-23T23:07:14Z"}
{"id":976,"first_name":"Herman","last_name":"Ciubutaro","email":"hciubutaror3@alibaba.com","job":"Nurse Practicioner","timestamp":"2022-03-08T21:50:13Z"}
{"id":977,"first_name":"Konrad","last_name":"Gregon","email":"kgregonr4@npr.org","job":"Research Assistant IV","timestamp":"2022-11-24T16:44:53Z"}
{"id":978,"first_name":"Sansone","last_name":"O'Regan","email":"soreganr5@wordpress.org","job":"Compensation Analyst","timestamp":"2022-07-26T04:39:39Z"}
{"id":979,"first_name":"Edi","last_name":"Shevelin","email":"eshevelinr6@reverbnation.com","job":"Programmer Analyst III","timestamp":"2022-02-21T21:29:55Z"}
{"id":980,"first_name":"Putnem","last_name":"Muldoon","email":"pmuldoonr7@webs.com","job":"Registered Nurse","timestamp":"2022-11-17T10:38:54Z"}
{"id":981,"first_name":"Clair","last_name":"Durtnell","email":"cdurtnellr8@theglobeandmail.com","job":"VP Sales","timestamp":"2022-09-03T05:07:03Z"}
{"id":982,"first_name":"Mellisa","last_name":"Stillmann","email":"mstillmannr9@yelp.com","job":"Actuary","timestamp":"2022-06-01T10:13:00Z"}
{"id":983,"first_name":"Alyce","last_name":"Caron","email":"acaronra@mysql.com","job":"Marketing Assistant","timestamp":"2022-03-08T11:48:23Z"}
{"id":984,"first_name":"Elnora","last_name":"Perell","email":"eperellrb@com.com","job":"Database Administrator II","timestamp":"2022-01-23T07:00:30Z"}
{"id":985,"first_name":"Ximenez","last_name":"Soppit","email":"xsoppitrc@marriott.com","job":"Design Engineer","timestamp":"2022-09-04T01:28:57Z"}
{"id":986,"first_name":"Wallie","last_name":"DeSousa","email":"wdesousard@nps.gov","job":"VP Sales","timestamp":"2022-01-13T10:38:52Z"}
{"id":987,"first_name":"Ruddy","last_name":"Michel","email":"rmichelre@gravatar.com","job":"Recruiter","timestamp":"2022-02-06T04:05:07Z"}
{"id":988,"first_name":"Mariel","last_name":"Gooderick","email":"mgooderickrf@joomla.org","job":"Analyst Programmer","timestamp":"2022-04-07T06:43:49Z"}
{"id":989,"first_name":"Adria","last_name":"Kinkaid","email":"akinkaidrg@slate.com","job":"Business Systems Development Analyst","timestamp":"2022-09-28T19:22:58Z"}
{"id":990,"first_name":"Ashley","last_name":"Easey","email":"aeaseyrh@themeforest.net","job":"Product Engineer","timestamp":"2022-03-05T02:20:09Z"}
{"id":991,"first_name":"Mikkel","last_name":"Greiswood","email":"mgreiswoodri@hao123.com","job":"Speech Pathologist","timestamp":"2022-12-04T12:31:00Z"}
{"id":992,"first_name":"Nissy","last_name":"Titmuss","email":"ntitmussrj@si.edu","job":"Software Engineer IV","timestamp":"2022-02-18T04:52:53Z"}
{"id":993,"first_name":"Maddi","last_name":"Pimmocke","email":"mpimmockerk@canalblog.com","job":"GIS Technical Architect","timestamp":"2022-02-11T08:34:43Z"}
{"id":994,"first_name":"Rossy","last_name":"Draco","email":"rdracorl@goodreads.com","job":"Marketing Assistant","timestamp":"2022-07-02T04:23:06Z"}
{"id":995,"first_name":"Travus","last_name":"Babber","email":"tbabberrm@shareasale.com","job":"VP Quality Control","timestamp":"2022-02-18T19:54:19Z"}
{"id":996,"first_name":"Clayton","last_name":"Nancarrow","email":"cnancarrowrn@hao123.com","job":"Web Developer III","timestamp":"2022-05-05T22:18:27Z"}
{"id":997,"first_name":"Cami","last_name":"Jimmes","email":"cjimmesro@webeden.co.uk","job":"Financial Advisor","timestamp":"2022-08-23T18:13:14Z"}
{"id":998,"first_name":"Eirena","last_name":"Darling","email":"edarlingrp@altervista.org","job":"Mechanical Systems Engineer","timestamp":"2022-07-15T22:39:00Z"}
{"id":999,"first_name":"Anne-marie","last_name":"Dober","email":"adoberrq@nyu.edu","job":"Software Engineer I","timestamp":"2022-10-04T07:37:09Z"}
{"id":1000,"first_name":"Calla","last_name":"Handrock","email":"chandrockrr@seesaa.net","job":"Systems Administrator II","timestamp":"2022-11-18T22:33:30Z"}


================================================
FILE: quickwit/quickwit-indexing/benches/data/bench_data_heavy_transform.json
================================================
{ "body": "{\"id\":1,\"first_name\":\"Darcey\",\"email\":\"dzammett0@gizmodo.com\",\"job\":\"Mechanical Systems Engineer\"}"}
{ "body": "{\"id\":2,\"first_name\":\"Wilmette\",\"email\":\"wvsanelli1@yellowpages.com\",\"job\":\"Web Designer II\"}"}
{ "body": "{\"id\":3,\"first_name\":\"Inez\",\"email\":\"igirardet2@vkontakte.ru\",\"job\":\"Design Engineer\"}"}
{ "body": "{\"id\":4,\"first_name\":\"Nickie\",\"email\":\"nranyell3@vistaprint.com\",\"job\":\"Senior Cost Accountant\"}"}
{ "body": "{\"id\":5,\"first_name\":\"Shanon\",\"email\":\"spritchett4@buzzfeed.com\",\"job\":\"Tax Accountant\"}"}
{ "body": "{\"id\":6,\"first_name\":\"Warren\",\"email\":\"wpicknett5@oaic.gov.au\",\"job\":\"Mechanical Systems Engineer\"}"}
{ "body": "{\"id\":7,\"first_name\":\"Nedda\",\"email\":\"nstoad6@geocities.com\",\"job\":\"Assistant Media Planner\"}"}
{ "body": "{\"id\":8,\"first_name\":\"Devonne\",\"email\":\"dbrisse7@cdc.gov\",\"job\":\"Assistant Manager\"}"}
{ "body": "{\"id\":9,\"first_name\":\"Cassondra\",\"email\":\"cbackshall8@senate.gov\",\"job\":\"Recruiter\"}"}
{ "body": "{\"id\":10,\"first_name\":\"Maurise\",\"email\":\"mciottoi9@vistaprint.com\",\"job\":\"Technical Writer\"}"}
{ "body": "{\"id\":11,\"first_name\":\"Alida\",\"email\":\"alathwella@godaddy.com\",\"job\":\"Human Resources Assistant III\"}"}
{ "body": "{\"id\":12,\"first_name\":\"Lynna\",\"email\":\"lbulstrodeb@businesswire.com\",\"job\":\"Senior Editor\"}"}
{ "body": "{\"id\":13,\"first_name\":\"Bordy\",\"email\":\"bwethersc@weebly.com\",\"job\":\"Financial Analyst\"}"}
{ "body": "{\"id\":14,\"first_name\":\"Jilly\",\"email\":\"jscanesd@dagondesign.com\",\"job\":\"Community Outreach Specialist\"}"}
{ "body": "{\"id\":15,\"first_name\":\"Benedicto\",\"email\":\"bglantone@europa.eu\",\"job\":\"Internal Auditor\"}"}
{ "body": "{\"id\":16,\"first_name\":\"Hedda\",\"email\":\"hcaddingf@angelfire.com\",\"job\":\"Help Desk Technician\"}"}
{ "body": "{\"id\":17,\"first_name\":\"Tammara\",\"email\":\"tgrigoriog@ycombinator.com\",\"job\":\"Product Engineer\"}"}
{ "body": "{\"id\":18,\"first_name\":\"Lindsey\",\"email\":\"lgiraldezh@pen.io\",\"job\":\"Librarian\"}"}
{ "body": "{\"id\":19,\"first_name\":\"Putnam\",\"email\":\"pdunnetti@hhs.gov\",\"job\":\"Geologist III\"}"}
{ "body": "{\"id\":20,\"first_name\":\"Dennie\",\"email\":\"dmcilvorayj@auda.org.au\",\"job\":\"Sales Representative\"}"}
{ "body": "{\"id\":21,\"first_name\":\"Ilene\",\"email\":\"iheighok@friendfeed.com\",\"job\":\"Food Chemist\"}"}
{ "body": "{\"id\":22,\"first_name\":\"Orville\",\"email\":\"olanahanl@purevolume.com\",\"job\":\"VP Product Management\"}"}
{ "body": "{\"id\":23,\"first_name\":\"Marcella\",\"email\":\"mfavellem@foxnews.com\",\"job\":\"Analyst Programmer\"}"}
{ "body": "{\"id\":24,\"first_name\":\"Liliane\",\"email\":\"lsommervillen@goo.ne.jp\",\"job\":\"Speech Pathologist\"}"}
{ "body": "{\"id\":25,\"first_name\":\"Ruperta\",\"email\":\"rbrightwello@webnode.com\",\"job\":\"Geologist III\"}"}
{ "body": "{\"id\":26,\"first_name\":\"Dwight\",\"email\":\"dcraigmilep@blinklist.com\",\"job\":\"Account Coordinator\"}"}
{ "body": "{\"id\":27,\"first_name\":\"Lory\",\"email\":\"ltemperleyq@imdb.com\",\"job\":\"Environmental Tech\"}"}
{ "body": "{\"id\":28,\"first_name\":\"Abelard\",\"email\":\"amaseresr@pcworld.com\",\"job\":\"Data Coordiator\"}"}
{ "body": "{\"id\":29,\"first_name\":\"Minetta\",\"email\":\"mcobleys@squarespace.com\",\"job\":\"Environmental Tech\"}"}
{ "body": "{\"id\":30,\"first_name\":\"Caesar\",\"email\":\"cshadboltt@imdb.com\",\"job\":\"Account Executive\"}"}
{ "body": "{\"id\":31,\"first_name\":\"Patti\",\"email\":\"pperonu@bravesites.com\",\"job\":\"Project Manager\"}"}
{ "body": "{\"id\":32,\"first_name\":\"Louisa\",\"email\":\"lpynerv@hubpages.com\",\"job\":\"Community Outreach Specialist\"}"}
{ "body": "{\"id\":33,\"first_name\":\"Cordi\",\"email\":\"cpetrowskyw@privacy.gov.au\",\"job\":\"Internal Auditor\"}"}
{ "body": "{\"id\":34,\"first_name\":\"Meir\",\"email\":\"mearthfieldx@biglobe.ne.jp\",\"job\":\"Marketing Assistant\"}"}
{ "body": "{\"id\":35,\"first_name\":\"Lark\",\"email\":\"lcasay@craigslist.org\",\"job\":\"Social Worker\"}"}
{ "body": "{\"id\":36,\"first_name\":\"Sayer\",\"email\":\"scrummyz@answers.com\",\"job\":\"Structural Analysis Engineer\"}"}
{ "body": "{\"id\":37,\"first_name\":\"Alec\",\"email\":\"alahive10@ow.ly\",\"job\":\"Mechanical Systems Engineer\"}"}
{ "body": "{\"id\":38,\"first_name\":\"Helyn\",\"email\":\"hcarbry11@aol.com\",\"job\":\"Engineer I\"}"}
{ "body": "{\"id\":39,\"first_name\":\"Ansley\",\"email\":\"abartolozzi12@wikia.com\",\"job\":\"Social Worker\"}"}
{ "body": "{\"id\":40,\"first_name\":\"Lucretia\",\"email\":\"lalbertson13@unc.edu\",\"job\":\"Biostatistician I\"}"}
{ "body": "{\"id\":41,\"first_name\":\"Guthrie\",\"email\":\"gpencost14@amazon.co.uk\",\"job\":\"Business Systems Development Analyst\"}"}
{ "body": "{\"id\":42,\"first_name\":\"Misty\",\"email\":\"mmulberry15@fotki.com\",\"job\":\"Dental Hygienist\"}"}
{ "body": "{\"id\":43,\"first_name\":\"Dante\",\"email\":\"dbellringer16@amazon.com\",\"job\":\"GIS Technical Architect\"}"}
{ "body": "{\"id\":44,\"first_name\":\"Josefa\",\"email\":\"jkinane17@pinterest.com\",\"job\":\"Project Manager\"}"}
{ "body": "{\"id\":45,\"first_name\":\"Mathilda\",\"email\":\"mgoldin18@msu.edu\",\"job\":\"Sales Representative\"}"}
{ "body": "{\"id\":46,\"first_name\":\"Dinny\",\"email\":\"dbirdwhistell19@pinterest.com\",\"job\":\"VP Marketing\"}"}
{ "body": "{\"id\":47,\"first_name\":\"Sig\",\"email\":\"srabl1a@soup.io\",\"job\":\"Legal Assistant\"}"}
{ "body": "{\"id\":48,\"first_name\":\"Aggie\",\"email\":\"awychard1b@sitemeter.com\",\"job\":\"Business Systems Development Analyst\"}"}
{ "body": "{\"id\":49,\"first_name\":\"Isadora\",\"email\":\"itaplow1c@issuu.com\",\"job\":\"Teacher\"}"}
{ "body": "{\"id\":50,\"first_name\":\"Celine\",\"email\":\"cbruneton1d@cbslocal.com\",\"job\":\"Speech Pathologist\"}"}
{ "body": "{\"id\":51,\"first_name\":\"Orelia\",\"email\":\"ozavattiero1e@delicious.com\",\"job\":\"Human Resources Manager\"}"}
{ "body": "{\"id\":52,\"first_name\":\"Orson\",\"email\":\"oarp1f@hhs.gov\",\"job\":\"General Manager\"}"}
{ "body": "{\"id\":53,\"first_name\":\"Cathyleen\",\"email\":\"cmcgannon1g@lycos.com\",\"job\":\"Software Engineer II\"}"}
{ "body": "{\"id\":54,\"first_name\":\"Tabitha\",\"email\":\"teich1h@comsenz.com\",\"job\":\"Dental Hygienist\"}"}
{ "body": "{\"id\":55,\"first_name\":\"Fabe\",\"email\":\"fnewband1i@cnet.com\",\"job\":\"Nuclear Power Engineer\"}"}
{ "body": "{\"id\":56,\"first_name\":\"Liesa\",\"email\":\"lkingsbury1j@hp.com\",\"job\":\"Web Developer IV\"}"}
{ "body": "{\"id\":57,\"first_name\":\"Rochette\",\"email\":\"rbenedetti1k@mysql.com\",\"job\":\"Physical Therapy Assistant\"}"}
{ "body": "{\"id\":58,\"first_name\":\"Andonis\",\"email\":\"alydon1l@wp.com\",\"job\":\"Statistician I\"}"}
{ "body": "{\"id\":59,\"first_name\":\"Philis\",\"email\":\"pbaldick1m@about.com\",\"job\":\"General Manager\"}"}
{ "body": "{\"id\":60,\"first_name\":\"Arleen\",\"email\":\"alongmore1n@wikimedia.org\",\"job\":\"Biostatistician II\"}"}
{ "body": "{\"id\":61,\"first_name\":\"Hastie\",\"email\":\"htitterell1o@examiner.com\",\"job\":\"Research Nurse\"}"}
{ "body": "{\"id\":62,\"first_name\":\"Willow\",\"email\":\"wfillon1p@msu.edu\",\"job\":\"Executive Secretary\"}"}
{ "body": "{\"id\":63,\"first_name\":\"Babara\",\"email\":\"bwaycot1q@opera.com\",\"job\":\"GIS Technical Architect\"}"}
{ "body": "{\"id\":64,\"first_name\":\"Ibby\",\"email\":\"ihansbury1r@buzzfeed.com\",\"job\":\"Editor\"}"}
{ "body": "{\"id\":65,\"first_name\":\"Rhodie\",\"email\":\"rganforth1s@angelfire.com\",\"job\":\"Nurse Practicioner\"}"}
{ "body": "{\"id\":66,\"first_name\":\"Dorice\",\"email\":\"disack1t@example.com\",\"job\":\"VP Sales\"}"}
{ "body": "{\"id\":67,\"first_name\":\"Rossy\",\"email\":\"rbeadle1u@nsw.gov.au\",\"job\":\"Sales Representative\"}"}
{ "body": "{\"id\":68,\"first_name\":\"Helena\",\"email\":\"hmennell1v@shinystat.com\",\"job\":\"Analyst Programmer\"}"}
{ "body": "{\"id\":69,\"first_name\":\"Tremayne\",\"email\":\"trosenblad1w@technorati.com\",\"job\":\"Biostatistician III\"}"}
{ "body": "{\"id\":70,\"first_name\":\"Case\",\"email\":\"cbranston1x@fc2.com\",\"job\":\"Environmental Specialist\"}"}
{ "body": "{\"id\":71,\"first_name\":\"Misti\",\"email\":\"mwiddop1y@columbia.edu\",\"job\":\"Chemical Engineer\"}"}
{ "body": "{\"id\":72,\"first_name\":\"Constancia\",\"email\":\"cedwinson1z@bandcamp.com\",\"job\":\"Software Consultant\"}"}
{ "body": "{\"id\":73,\"first_name\":\"John\",\"email\":\"jprobart20@google.es\",\"job\":\"Occupational Therapist\"}"}
{ "body": "{\"id\":74,\"first_name\":\"Ruddie\",\"email\":\"rfelton21@pagesperso-orange.fr\",\"job\":\"Financial Advisor\"}"}
{ "body": "{\"id\":75,\"first_name\":\"Rasia\",\"email\":\"rlawland22@tumblr.com\",\"job\":\"Administrative Officer\"}"}
{ "body": "{\"id\":76,\"first_name\":\"Ara\",\"email\":\"astatersfield23@eepurl.com\",\"job\":\"Cost Accountant\"}"}
{ "body": "{\"id\":77,\"first_name\":\"Aurlie\",\"email\":\"abispo24@ycombinator.com\",\"job\":\"Safety Technician III\"}"}
{ "body": "{\"id\":78,\"first_name\":\"Marsh\",\"email\":\"mniven25@dailymotion.com\",\"job\":\"Analyst Programmer\"}"}
{ "body": "{\"id\":79,\"first_name\":\"Lee\",\"email\":\"lsmalls26@alibaba.com\",\"job\":\"Account Coordinator\"}"}
{ "body": "{\"id\":80,\"first_name\":\"Eloisa\",\"email\":\"estanney27@ovh.net\",\"job\":\"Staff Accountant II\"}"}
{ "body": "{\"id\":81,\"first_name\":\"Michale\",\"email\":\"mdurston28@yellowbook.com\",\"job\":\"VP Accounting\"}"}
{ "body": "{\"id\":82,\"first_name\":\"Idette\",\"email\":\"ibenedikt29@themeforest.net\",\"job\":\"Statistician IV\"}"}
{ "body": "{\"id\":83,\"first_name\":\"Rhianna\",\"email\":\"rbodimeade2a@google.ru\",\"job\":\"Junior Executive\"}"}
{ "body": "{\"id\":84,\"first_name\":\"Lydie\",\"email\":\"lesherwood2b@fotki.com\",\"job\":\"Developer IV\"}"}
{ "body": "{\"id\":85,\"first_name\":\"Jack\",\"email\":\"jsiddon2c@cam.ac.uk\",\"job\":\"Payment Adjustment Coordinator\"}"}
{ "body": "{\"id\":86,\"first_name\":\"Augie\",\"email\":\"asiggin2d@webmd.com\",\"job\":\"Automation Specialist I\"}"}
{ "body": "{\"id\":87,\"first_name\":\"Verina\",\"email\":\"vhurry2e@miibeian.gov.cn\",\"job\":\"Clinical Specialist\"}"}
{ "body": "{\"id\":88,\"first_name\":\"Layton\",\"email\":\"lvasilechko2f@shutterfly.com\",\"job\":\"Media Manager I\"}"}
{ "body": "{\"id\":89,\"first_name\":\"Joana\",\"email\":\"jpinilla2g@blinklist.com\",\"job\":\"Analog Circuit Design manager\"}"}
{ "body": "{\"id\":90,\"first_name\":\"Astra\",\"email\":\"aesom2h@google.it\",\"job\":\"Senior Cost Accountant\"}"}
{ "body": "{\"id\":91,\"first_name\":\"Cassandry\",\"email\":\"cjerrolt2i@tumblr.com\",\"job\":\"Senior Quality Engineer\"}"}
{ "body": "{\"id\":92,\"first_name\":\"Dedie\",\"email\":\"dleprovest2j@chron.com\",\"job\":\"Accountant IV\"}"}
{ "body": "{\"id\":93,\"first_name\":\"Alleen\",\"email\":\"aickovitz2k@sciencedaily.com\",\"job\":\"Compensation Analyst\"}"}
{ "body": "{\"id\":94,\"first_name\":\"Lorilee\",\"email\":\"lborlease2l@1und1.de\",\"job\":\"Administrative Assistant IV\"}"}
{ "body": "{\"id\":95,\"first_name\":\"Rem\",\"email\":\"rwerlock2m@shareasale.com\",\"job\":\"VP Product Management\"}"}
{ "body": "{\"id\":96,\"first_name\":\"Cathe\",\"email\":\"clevecque2n@engadget.com\",\"job\":\"Office Assistant III\"}"}
{ "body": "{\"id\":97,\"first_name\":\"Kelsey\",\"email\":\"kpatershall2o@scientificamerican.com\",\"job\":\"Recruiting Manager\"}"}
{ "body": "{\"id\":98,\"first_name\":\"Percy\",\"email\":\"pjery2p@mac.com\",\"job\":\"Operator\"}"}
{ "body": "{\"id\":99,\"first_name\":\"Cathee\",\"email\":\"csconce2q@blinklist.com\",\"job\":\"Staff Scientist\"}"}
{ "body": "{\"id\":100,\"first_name\":\"Michaeline\",\"email\":\"mcuel2r@ted.com\",\"job\":\"Environmental Tech\"}"}
{ "body": "{\"id\":101,\"first_name\":\"Prescott\",\"email\":\"plivingstone2s@ask.com\",\"job\":\"VP Product Management\"}"}
{ "body": "{\"id\":102,\"first_name\":\"Broddy\",\"email\":\"bgiacopazzi2t@goo.ne.jp\",\"job\":\"Actuary\"}"}
{ "body": "{\"id\":103,\"first_name\":\"Errol\",\"email\":\"ecasino2u@surveymonkey.com\",\"job\":\"Quality Engineer\"}"}
{ "body": "{\"id\":104,\"first_name\":\"Correy\",\"email\":\"cchamberlin2v@creativecommons.org\",\"job\":\"Junior Executive\"}"}
{ "body": "{\"id\":105,\"first_name\":\"Randall\",\"email\":\"rrenshell2w@seattletimes.com\",\"job\":\"Analog Circuit Design manager\"}"}
{ "body": "{\"id\":106,\"first_name\":\"Darbie\",\"email\":\"dchantillon2x@tamu.edu\",\"job\":\"Payment Adjustment Coordinator\"}"}
{ "body": "{\"id\":107,\"first_name\":\"Benny\",\"email\":\"bpeert2y@arstechnica.com\",\"job\":\"Marketing Manager\"}"}
{ "body": "{\"id\":108,\"first_name\":\"Leigh\",\"email\":\"lalchin2z@oaic.gov.au\",\"job\":\"Human Resources Assistant IV\"}"}
{ "body": "{\"id\":109,\"first_name\":\"Demetri\",\"email\":\"dobin30@blog.com\",\"job\":\"Electrical Engineer\"}"}
{ "body": "{\"id\":110,\"first_name\":\"Gilberto\",\"email\":\"glewsie31@nps.gov\",\"job\":\"Speech Pathologist\"}"}
{ "body": "{\"id\":111,\"first_name\":\"Ruthi\",\"email\":\"rmacconachy32@yelp.com\",\"job\":\"VP Quality Control\"}"}
{ "body": "{\"id\":112,\"first_name\":\"Gard\",\"email\":\"glancley33@comcast.net\",\"job\":\"General Manager\"}"}
{ "body": "{\"id\":113,\"first_name\":\"Storm\",\"email\":\"sdufray34@drupal.org\",\"job\":\"Senior Cost Accountant\"}"}
{ "body": "{\"id\":114,\"first_name\":\"Jillian\",\"email\":\"jgegg35@eepurl.com\",\"job\":\"Community Outreach Specialist\"}"}
{ "body": "{\"id\":115,\"first_name\":\"Valentina\",\"email\":\"vthorlby36@macromedia.com\",\"job\":\"Quality Engineer\"}"}
{ "body": "{\"id\":116,\"first_name\":\"Paxon\",\"email\":\"pscrewton37@odnoklassniki.ru\",\"job\":\"Administrative Officer\"}"}
{ "body": "{\"id\":117,\"first_name\":\"Cariotta\",\"email\":\"cbrik38@t.co\",\"job\":\"Quality Engineer\"}"}
{ "body": "{\"id\":118,\"first_name\":\"Franchot\",\"email\":\"fgrzelczyk39@xrea.com\",\"job\":\"Software Consultant\"}"}
{ "body": "{\"id\":119,\"first_name\":\"Skip\",\"email\":\"shathaway3a@e-recht24.de\",\"job\":\"Environmental Tech\"}"}
{ "body": "{\"id\":120,\"first_name\":\"Tripp\",\"email\":\"ttrippitt3b@rambler.ru\",\"job\":\"Financial Advisor\"}"}
{ "body": "{\"id\":121,\"first_name\":\"Etienne\",\"email\":\"ecoldrick3c@huffingtonpost.com\",\"job\":\"Civil Engineer\"}"}
{ "body": "{\"id\":122,\"first_name\":\"Adara\",\"email\":\"agurnett3d@lycos.com\",\"job\":\"Accounting Assistant III\"}"}
{ "body": "{\"id\":123,\"first_name\":\"Spence\",\"email\":\"sions3e@nifty.com\",\"job\":\"VP Accounting\"}"}
{ "body": "{\"id\":124,\"first_name\":\"Hadrian\",\"email\":\"hemlin3f@eventbrite.com\",\"job\":\"VP Accounting\"}"}
{ "body": "{\"id\":125,\"first_name\":\"Dulci\",\"email\":\"dletham3g@com.com\",\"job\":\"Professor\"}"}
{ "body": "{\"id\":126,\"first_name\":\"Nolana\",\"email\":\"nwelham3h@weebly.com\",\"job\":\"Pharmacist\"}"}
{ "body": "{\"id\":127,\"first_name\":\"Barnard\",\"email\":\"bwaplinton3i@bbc.co.uk\",\"job\":\"Senior Quality Engineer\"}"}
{ "body": "{\"id\":128,\"first_name\":\"Cati\",\"email\":\"cnorthbridge3j@ebay.com\",\"job\":\"Desktop Support Technician\"}"}
{ "body": "{\"id\":129,\"first_name\":\"Elle\",\"email\":\"elester3k@mozilla.com\",\"job\":\"Research Nurse\"}"}
{ "body": "{\"id\":130,\"first_name\":\"Dareen\",\"email\":\"dpossel3l@hc360.com\",\"job\":\"Dental Hygienist\"}"}
{ "body": "{\"id\":131,\"first_name\":\"Bertram\",\"email\":\"bphettis3m@imdb.com\",\"job\":\"Geologist I\"}"}
{ "body": "{\"id\":132,\"first_name\":\"Kittie\",\"email\":\"ksharville3n@shop-pro.jp\",\"job\":\"Health Coach IV\"}"}
{ "body": "{\"id\":133,\"first_name\":\"Inesita\",\"email\":\"ihofton3o@wsj.com\",\"job\":\"Accountant III\"}"}
{ "body": "{\"id\":134,\"first_name\":\"Charin\",\"email\":\"cbartomeu3p@wikipedia.org\",\"job\":\"Professor\"}"}
{ "body": "{\"id\":135,\"first_name\":\"Kristi\",\"email\":\"kidenden3q@so-net.ne.jp\",\"job\":\"Research Associate\"}"}
{ "body": "{\"id\":136,\"first_name\":\"Torey\",\"email\":\"ttoner3r@bandcamp.com\",\"job\":\"Associate Professor\"}"}
{ "body": "{\"id\":137,\"first_name\":\"Lockwood\",\"email\":\"ldunne3s@slideshare.net\",\"job\":\"VP Sales\"}"}
{ "body": "{\"id\":138,\"first_name\":\"Filberto\",\"email\":\"fstrang3t@state.gov\",\"job\":\"Research Assistant IV\"}"}
{ "body": "{\"id\":139,\"first_name\":\"Rhody\",\"email\":\"rbridgwater3u@typepad.com\",\"job\":\"Graphic Designer\"}"}
{ "body": "{\"id\":140,\"first_name\":\"Kesley\",\"email\":\"kkepling3v@reference.com\",\"job\":\"Payment Adjustment Coordinator\"}"}
{ "body": "{\"id\":141,\"first_name\":\"Lombard\",\"email\":\"lmasterman3w@youku.com\",\"job\":\"Software Test Engineer I\"}"}
{ "body": "{\"id\":142,\"first_name\":\"Ferdinanda\",\"email\":\"fsandsallan3x@photobucket.com\",\"job\":\"Staff Scientist\"}"}
{ "body": "{\"id\":143,\"first_name\":\"Grier\",\"email\":\"gandriveaux3y@mtv.com\",\"job\":\"Social Worker\"}"}
{ "body": "{\"id\":144,\"first_name\":\"Evonne\",\"email\":\"emayho3z@google.es\",\"job\":\"Dental Hygienist\"}"}
{ "body": "{\"id\":145,\"first_name\":\"Jarrod\",\"email\":\"jgadault40@themeforest.net\",\"job\":\"Staff Accountant IV\"}"}
{ "body": "{\"id\":146,\"first_name\":\"Cassondra\",\"email\":\"ccunio41@ihg.com\",\"job\":\"Computer Systems Analyst II\"}"}
{ "body": "{\"id\":147,\"first_name\":\"Jule\",\"email\":\"jbilam42@illinois.edu\",\"job\":\"Web Developer II\"}"}
{ "body": "{\"id\":148,\"first_name\":\"Elianora\",\"email\":\"ehallede43@miibeian.gov.cn\",\"job\":\"Physical Therapy Assistant\"}"}
{ "body": "{\"id\":149,\"first_name\":\"Addi\",\"email\":\"abanishevitz44@usnews.com\",\"job\":\"Marketing Manager\"}"}
{ "body": "{\"id\":150,\"first_name\":\"Carin\",\"email\":\"carndell45@purevolume.com\",\"job\":\"Cost Accountant\"}"}
{ "body": "{\"id\":151,\"first_name\":\"Buddy\",\"email\":\"btwydell46@sogou.com\",\"job\":\"Research Associate\"}"}
{ "body": "{\"id\":152,\"first_name\":\"Parker\",\"email\":\"ppriestland47@hubpages.com\",\"job\":\"Senior Editor\"}"}
{ "body": "{\"id\":153,\"first_name\":\"Anthony\",\"email\":\"asallnow48@globo.com\",\"job\":\"Account Coordinator\"}"}
{ "body": "{\"id\":154,\"first_name\":\"Barri\",\"email\":\"btollfree49@symantec.com\",\"job\":\"Executive Secretary\"}"}
{ "body": "{\"id\":155,\"first_name\":\"Ernesta\",\"email\":\"ebeech4a@google.com\",\"job\":\"Safety Technician I\"}"}
{ "body": "{\"id\":156,\"first_name\":\"Claudian\",\"email\":\"civushkin4b@sciencedirect.com\",\"job\":\"Chemical Engineer\"}"}
{ "body": "{\"id\":157,\"first_name\":\"Tova\",\"email\":\"townsworth4c@godaddy.com\",\"job\":\"Senior Cost Accountant\"}"}
{ "body": "{\"id\":158,\"first_name\":\"Stephanus\",\"email\":\"slarkkem4d@cnn.com\",\"job\":\"Computer Systems Analyst IV\"}"}
{ "body": "{\"id\":159,\"first_name\":\"Adiana\",\"email\":\"atorregiani4e@who.int\",\"job\":\"Sales Representative\"}"}
{ "body": "{\"id\":160,\"first_name\":\"Tabor\",\"email\":\"ttrevorrow4f@uol.com.br\",\"job\":\"Structural Engineer\"}"}
{ "body": "{\"id\":161,\"first_name\":\"Richmound\",\"email\":\"rfawkes4g@dropbox.com\",\"job\":\"Speech Pathologist\"}"}
{ "body": "{\"id\":162,\"first_name\":\"Evelyn\",\"email\":\"ebaggaley4h@google.it\",\"job\":\"Web Developer II\"}"}
{ "body": "{\"id\":163,\"first_name\":\"Gypsy\",\"email\":\"gknudsen4i@domainmarket.com\",\"job\":\"Quality Control Specialist\"}"}
{ "body": "{\"id\":164,\"first_name\":\"Patsy\",\"email\":\"plouthe4j@opensource.org\",\"job\":\"Help Desk Technician\"}"}
{ "body": "{\"id\":165,\"first_name\":\"Davita\",\"email\":\"dciotto4k@mayoclinic.com\",\"job\":\"Professor\"}"}
{ "body": "{\"id\":166,\"first_name\":\"Jorey\",\"email\":\"jmassingberd4l@topsy.com\",\"job\":\"Software Engineer IV\"}"}
{ "body": "{\"id\":167,\"first_name\":\"Cash\",\"email\":\"cclelland4m@columbia.edu\",\"job\":\"Assistant Professor\"}"}
{ "body": "{\"id\":168,\"first_name\":\"Thorny\",\"email\":\"tlavell4n@fotki.com\",\"job\":\"Research Assistant IV\"}"}
{ "body": "{\"id\":169,\"first_name\":\"Cassandra\",\"email\":\"ccapron4o@yellowpages.com\",\"job\":\"Administrative Assistant II\"}"}
{ "body": "{\"id\":170,\"first_name\":\"Marylynne\",\"email\":\"mredparth4p@marriott.com\",\"job\":\"Accountant I\"}"}
{ "body": "{\"id\":171,\"first_name\":\"Udale\",\"email\":\"ugarard4q@spiegel.de\",\"job\":\"Actuary\"}"}
{ "body": "{\"id\":172,\"first_name\":\"Annamarie\",\"email\":\"ahammerton4r@who.int\",\"job\":\"Dental Hygienist\"}"}
{ "body": "{\"id\":173,\"first_name\":\"Haskell\",\"email\":\"hstollwerck4s@comsenz.com\",\"job\":\"VP Accounting\"}"}
{ "body": "{\"id\":174,\"first_name\":\"Townsend\",\"email\":\"tnewnham4t@merriam-webster.com\",\"job\":\"Systems Administrator III\"}"}
{ "body": "{\"id\":175,\"first_name\":\"Amargo\",\"email\":\"abaish4u@netlog.com\",\"job\":\"Computer Systems Analyst II\"}"}
{ "body": "{\"id\":176,\"first_name\":\"Euphemia\",\"email\":\"eflaunders4v@spotify.com\",\"job\":\"Teacher\"}"}
{ "body": "{\"id\":177,\"first_name\":\"Addy\",\"email\":\"amuspratt4w@aol.com\",\"job\":\"Nurse Practicioner\"}"}
{ "body": "{\"id\":178,\"first_name\":\"Mellisa\",\"email\":\"mchiddy4x@sciencedirect.com\",\"job\":\"Account Coordinator\"}"}
{ "body": "{\"id\":179,\"first_name\":\"Zara\",\"email\":\"zyuill4y@gov.uk\",\"job\":\"Assistant Manager\"}"}
{ "body": "{\"id\":180,\"first_name\":\"Gaven\",\"email\":\"gvaszoly4z@bravesites.com\",\"job\":\"Systems Administrator I\"}"}
{ "body": "{\"id\":181,\"first_name\":\"Drugi\",\"email\":\"dshowt50@liveinternet.ru\",\"job\":\"Mechanical Systems Engineer\"}"}
{ "body": "{\"id\":182,\"first_name\":\"Frederick\",\"email\":\"fhurlston51@indiatimes.com\",\"job\":\"Dental Hygienist\"}"}
{ "body": "{\"id\":183,\"first_name\":\"Darin\",\"email\":\"dmaulin52@samsung.com\",\"job\":\"Geologist I\"}"}
{ "body": "{\"id\":184,\"first_name\":\"Wallis\",\"email\":\"wscurrer53@nbcnews.com\",\"job\":\"Cost Accountant\"}"}
{ "body": "{\"id\":185,\"first_name\":\"Susann\",\"email\":\"skingsley54@yale.edu\",\"job\":\"Project Manager\"}"}
{ "body": "{\"id\":186,\"first_name\":\"Bree\",\"email\":\"blieber55@furl.net\",\"job\":\"Accountant IV\"}"}
{ "body": "{\"id\":187,\"first_name\":\"Nonnah\",\"email\":\"ngutteridge56@dailymail.co.uk\",\"job\":\"Software Consultant\"}"}
{ "body": "{\"id\":188,\"first_name\":\"Chrysler\",\"email\":\"cvarnham57@google.nl\",\"job\":\"Software Test Engineer IV\"}"}
{ "body": "{\"id\":189,\"first_name\":\"Otha\",\"email\":\"odargavel58@phpbb.com\",\"job\":\"Administrative Assistant I\"}"}
{ "body": "{\"id\":190,\"first_name\":\"Reynold\",\"email\":\"rbirdsall59@devhub.com\",\"job\":\"Safety Technician IV\"}"}
{ "body": "{\"id\":191,\"first_name\":\"Cati\",\"email\":\"calcott5a@smh.com.au\",\"job\":\"VP Sales\"}"}
{ "body": "{\"id\":192,\"first_name\":\"Yale\",\"email\":\"ymcguffog5b@seattletimes.com\",\"job\":\"Structural Analysis Engineer\"}"}
{ "body": "{\"id\":193,\"first_name\":\"Berkly\",\"email\":\"bdutteridge5c@bbb.org\",\"job\":\"Junior Executive\"}"}
{ "body": "{\"id\":194,\"first_name\":\"Delinda\",\"email\":\"dhans5d@cbslocal.com\",\"job\":\"Chemical Engineer\"}"}
{ "body": "{\"id\":195,\"first_name\":\"Fayre\",\"email\":\"fmeachen5e@vinaora.com\",\"job\":\"Financial Advisor\"}"}
{ "body": "{\"id\":196,\"first_name\":\"Damaris\",\"email\":\"dlimbrick5f@biglobe.ne.jp\",\"job\":\"Automation Specialist III\"}"}
{ "body": "{\"id\":197,\"first_name\":\"Adam\",\"email\":\"awintour5g@dyndns.org\",\"job\":\"Assistant Manager\"}"}
{ "body": "{\"id\":198,\"first_name\":\"Phedra\",\"email\":\"ptuttle5h@wsj.com\",\"job\":\"Executive Secretary\"}"}
{ "body": "{\"id\":199,\"first_name\":\"Cindie\",\"email\":\"cwenderott5i@sfgate.com\",\"job\":\"Staff Accountant I\"}"}
{ "body": "{\"id\":200,\"first_name\":\"Stesha\",\"email\":\"sbatrip5j@mlb.com\",\"job\":\"Design Engineer\"}"}
{ "body": "{\"id\":201,\"first_name\":\"Gale\",\"email\":\"gcraythorn5k@wikispaces.com\",\"job\":\"Executive Secretary\"}"}
{ "body": "{\"id\":202,\"first_name\":\"Pincas\",\"email\":\"psilvester5l@purevolume.com\",\"job\":\"Cost Accountant\"}"}
{ "body": "{\"id\":203,\"first_name\":\"Colly\",\"email\":\"crubinow5m@behance.net\",\"job\":\"Professor\"}"}
{ "body": "{\"id\":204,\"first_name\":\"Evy\",\"email\":\"ealkins5n@sogou.com\",\"job\":\"Nuclear Power Engineer\"}"}
{ "body": "{\"id\":205,\"first_name\":\"Brana\",\"email\":\"bmelson5o@umn.edu\",\"job\":\"Information Systems Manager\"}"}
{ "body": "{\"id\":206,\"first_name\":\"Jobina\",\"email\":\"jshivlin5p@merriam-webster.com\",\"job\":\"Junior Executive\"}"}
{ "body": "{\"id\":207,\"first_name\":\"Lanny\",\"email\":\"lbediss5q@illinois.edu\",\"job\":\"Accounting Assistant I\"}"}
{ "body": "{\"id\":208,\"first_name\":\"Myrilla\",\"email\":\"mbuesnel5r@cisco.com\",\"job\":\"General Manager\"}"}
{ "body": "{\"id\":209,\"first_name\":\"Karleen\",\"email\":\"kbullerwell5s@go.com\",\"job\":\"Help Desk Operator\"}"}
{ "body": "{\"id\":210,\"first_name\":\"Dulcie\",\"email\":\"dniaves5t@issuu.com\",\"job\":\"Analog Circuit Design manager\"}"}
{ "body": "{\"id\":211,\"first_name\":\"Clay\",\"email\":\"cmarguerite5u@washingtonpost.com\",\"job\":\"Associate Professor\"}"}
{ "body": "{\"id\":212,\"first_name\":\"Celeste\",\"email\":\"cradeliffe5v@sourceforge.net\",\"job\":\"Assistant Professor\"}"}
{ "body": "{\"id\":213,\"first_name\":\"Calypso\",\"email\":\"claite5w@mashable.com\",\"job\":\"Director of Sales\"}"}
{ "body": "{\"id\":214,\"first_name\":\"Jessika\",\"email\":\"jmagne5x@ebay.co.uk\",\"job\":\"Junior Executive\"}"}
{ "body": "{\"id\":215,\"first_name\":\"Celka\",\"email\":\"ctomsa5y@addthis.com\",\"job\":\"Staff Scientist\"}"}
{ "body": "{\"id\":216,\"first_name\":\"Ashla\",\"email\":\"amathouse5z@alibaba.com\",\"job\":\"Staff Accountant III\"}"}
{ "body": "{\"id\":217,\"first_name\":\"Ameline\",\"email\":\"agibbens60@qq.com\",\"job\":\"Database Administrator III\"}"}
{ "body": "{\"id\":218,\"first_name\":\"Kerri\",\"email\":\"ktrowl61@google.co.jp\",\"job\":\"Technical Writer\"}"}
{ "body": "{\"id\":219,\"first_name\":\"Dill\",\"email\":\"dbrittan62@opera.com\",\"job\":\"Staff Accountant III\"}"}
{ "body": "{\"id\":220,\"first_name\":\"Nikos\",\"email\":\"nyoull63@bloomberg.com\",\"job\":\"Geologist III\"}"}
{ "body": "{\"id\":221,\"first_name\":\"Tyler\",\"email\":\"tosbaldstone64@noaa.gov\",\"job\":\"VP Accounting\"}"}
{ "body": "{\"id\":222,\"first_name\":\"Antonetta\",\"email\":\"asinnett65@state.tx.us\",\"job\":\"Desktop Support Technician\"}"}
{ "body": "{\"id\":223,\"first_name\":\"Ramsay\",\"email\":\"rlagneaux66@senate.gov\",\"job\":\"Graphic Designer\"}"}
{ "body": "{\"id\":224,\"first_name\":\"Webb\",\"email\":\"wceney67@indiatimes.com\",\"job\":\"Web Developer I\"}"}
{ "body": "{\"id\":225,\"first_name\":\"Karyl\",\"email\":\"knicholson68@exblog.jp\",\"job\":\"Technical Writer\"}"}
{ "body": "{\"id\":226,\"first_name\":\"Pietro\",\"email\":\"pclaybourn69@wikispaces.com\",\"job\":\"Help Desk Technician\"}"}
{ "body": "{\"id\":227,\"first_name\":\"Dinah\",\"email\":\"dsandal6a@trellian.com\",\"job\":\"Associate Professor\"}"}
{ "body": "{\"id\":228,\"first_name\":\"Britta\",\"email\":\"bferri6b@home.pl\",\"job\":\"Research Assistant IV\"}"}
{ "body": "{\"id\":229,\"first_name\":\"Filberto\",\"email\":\"fshireff6c@163.com\",\"job\":\"Computer Systems Analyst II\"}"}
{ "body": "{\"id\":230,\"first_name\":\"Eberto\",\"email\":\"etunaclift6d@booking.com\",\"job\":\"Physical Therapy Assistant\"}"}
{ "body": "{\"id\":231,\"first_name\":\"Martainn\",\"email\":\"mchuck6e@craigslist.org\",\"job\":\"Quality Engineer\"}"}
{ "body": "{\"id\":232,\"first_name\":\"Lory\",\"email\":\"lolenichev6f@arizona.edu\",\"job\":\"Assistant Media Planner\"}"}
{ "body": "{\"id\":233,\"first_name\":\"Blinnie\",\"email\":\"bwhelband6g@lulu.com\",\"job\":\"VP Sales\"}"}
{ "body": "{\"id\":234,\"first_name\":\"Candide\",\"email\":\"cdresse6h@sciencedaily.com\",\"job\":\"Payment Adjustment Coordinator\"}"}
{ "body": "{\"id\":235,\"first_name\":\"Birgitta\",\"email\":\"bhue6i@dell.com\",\"job\":\"Internal Auditor\"}"}
{ "body": "{\"id\":236,\"first_name\":\"Emyle\",\"email\":\"ecommander6j@dion.ne.jp\",\"job\":\"Budget/Accounting Analyst III\"}"}
{ "body": "{\"id\":237,\"first_name\":\"Rosanne\",\"email\":\"rkrystek6k@washington.edu\",\"job\":\"VP Quality Control\"}"}
{ "body": "{\"id\":238,\"first_name\":\"Dottie\",\"email\":\"dbyas6l@scribd.com\",\"job\":\"Food Chemist\"}"}
{ "body": "{\"id\":239,\"first_name\":\"Theda\",\"email\":\"thugk6m@kickstarter.com\",\"job\":\"Senior Sales Associate\"}"}
{ "body": "{\"id\":240,\"first_name\":\"Joceline\",\"email\":\"jgregoraci6n@omniture.com\",\"job\":\"Budget/Accounting Analyst IV\"}"}
{ "body": "{\"id\":241,\"first_name\":\"Hannis\",\"email\":\"hquarrell6o@domainmarket.com\",\"job\":\"Senior Cost Accountant\"}"}
{ "body": "{\"id\":242,\"first_name\":\"Percival\",\"email\":\"psharper6p@blog.com\",\"job\":\"Actuary\"}"}
{ "body": "{\"id\":243,\"first_name\":\"Theodora\",\"email\":\"tsangwin6q@infoseek.co.jp\",\"job\":\"Environmental Tech\"}"}
{ "body": "{\"id\":244,\"first_name\":\"Sherri\",\"email\":\"swilcher6r@pagesperso-orange.fr\",\"job\":\"Sales Associate\"}"}
{ "body": "{\"id\":245,\"first_name\":\"Cheryl\",\"email\":\"cedwicke6s@mlb.com\",\"job\":\"Health Coach I\"}"}
{ "body": "{\"id\":246,\"first_name\":\"Floyd\",\"email\":\"fharbottle6t@tiny.cc\",\"job\":\"Registered Nurse\"}"}
{ "body": "{\"id\":247,\"first_name\":\"Merrilee\",\"email\":\"mcuesta6u@so-net.ne.jp\",\"job\":\"Financial Analyst\"}"}
{ "body": "{\"id\":248,\"first_name\":\"Anestassia\",\"email\":\"amorshead6v@joomla.org\",\"job\":\"Graphic Designer\"}"}
{ "body": "{\"id\":249,\"first_name\":\"Coralyn\",\"email\":\"cdrynan6w@github.com\",\"job\":\"Occupational Therapist\"}"}
{ "body": "{\"id\":250,\"first_name\":\"Kory\",\"email\":\"kdevaney6x@theglobeandmail.com\",\"job\":\"Occupational Therapist\"}"}
{ "body": "{\"id\":251,\"first_name\":\"Orazio\",\"email\":\"obraddon6y@jimdo.com\",\"job\":\"Data Coordiator\"}"}
{ "body": "{\"id\":252,\"first_name\":\"Ajay\",\"email\":\"acoushe6z@icio.us\",\"job\":\"Help Desk Technician\"}"}
{ "body": "{\"id\":253,\"first_name\":\"Elnore\",\"email\":\"eallsopp70@aboutads.info\",\"job\":\"Chemical Engineer\"}"}
{ "body": "{\"id\":254,\"first_name\":\"Laughton\",\"email\":\"lgoodee71@booking.com\",\"job\":\"Civil Engineer\"}"}
{ "body": "{\"id\":255,\"first_name\":\"Donn\",\"email\":\"dgianni72@boston.com\",\"job\":\"Social Worker\"}"}
{ "body": "{\"id\":256,\"first_name\":\"Millie\",\"email\":\"mcogman73@skype.com\",\"job\":\"Senior Financial Analyst\"}"}
{ "body": "{\"id\":257,\"first_name\":\"Elvira\",\"email\":\"elampet74@ibm.com\",\"job\":\"Compensation Analyst\"}"}
{ "body": "{\"id\":258,\"first_name\":\"Tanny\",\"email\":\"tkeilloh75@bbb.org\",\"job\":\"Operator\"}"}
{ "body": "{\"id\":259,\"first_name\":\"Toiboid\",\"email\":\"tgennerich76@hibu.com\",\"job\":\"Physical Therapy Assistant\"}"}
{ "body": "{\"id\":260,\"first_name\":\"Bram\",\"email\":\"blackie77@godaddy.com\",\"job\":\"Staff Accountant I\"}"}
{ "body": "{\"id\":261,\"first_name\":\"Rozella\",\"email\":\"rantonov78@ca.gov\",\"job\":\"Human Resources Assistant I\"}"}
{ "body": "{\"id\":262,\"first_name\":\"Ilene\",\"email\":\"ibattie79@deviantart.com\",\"job\":\"Clinical Specialist\"}"}
{ "body": "{\"id\":263,\"first_name\":\"Nobe\",\"email\":\"nhayhurst7a@drupal.org\",\"job\":\"Sales Associate\"}"}
{ "body": "{\"id\":264,\"first_name\":\"Reggy\",\"email\":\"rdomican7b@archive.org\",\"job\":\"Biostatistician I\"}"}
{ "body": "{\"id\":265,\"first_name\":\"Pru\",\"email\":\"patcherley7c@sina.com.cn\",\"job\":\"Teacher\"}"}
{ "body": "{\"id\":266,\"first_name\":\"Jeremiah\",\"email\":\"jjiranek7d@bloglovin.com\",\"job\":\"Senior Quality Engineer\"}"}
{ "body": "{\"id\":267,\"first_name\":\"Ivor\",\"email\":\"irudledge7e@businessinsider.com\",\"job\":\"Staff Scientist\"}"}
{ "body": "{\"id\":268,\"first_name\":\"Marys\",\"email\":\"mtarbert7f@ebay.com\",\"job\":\"Actuary\"}"}
{ "body": "{\"id\":269,\"first_name\":\"Joshuah\",\"email\":\"jwitty7g@creativecommons.org\",\"job\":\"Programmer IV\"}"}
{ "body": "{\"id\":270,\"first_name\":\"Gilberte\",\"email\":\"gmccall7h@delicious.com\",\"job\":\"Quality Control Specialist\"}"}
{ "body": "{\"id\":271,\"first_name\":\"Clayborne\",\"email\":\"clecointe7i@twitpic.com\",\"job\":\"Social Worker\"}"}
{ "body": "{\"id\":272,\"first_name\":\"Karole\",\"email\":\"kteodori7j@twitter.com\",\"job\":\"Speech Pathologist\"}"}
{ "body": "{\"id\":273,\"first_name\":\"Kaiser\",\"email\":\"kyglesias7k@purevolume.com\",\"job\":\"Project Manager\"}"}
{ "body": "{\"id\":274,\"first_name\":\"Lek\",\"email\":\"lmacci7l@prlog.org\",\"job\":\"Environmental Specialist\"}"}
{ "body": "{\"id\":275,\"first_name\":\"Ellyn\",\"email\":\"eculpen7m@umich.edu\",\"job\":\"Recruiter\"}"}
{ "body": "{\"id\":276,\"first_name\":\"Mavis\",\"email\":\"mfurlonge7n@yellowbook.com\",\"job\":\"Editor\"}"}
{ "body": "{\"id\":277,\"first_name\":\"Arlyne\",\"email\":\"afullegar7o@howstuffworks.com\",\"job\":\"Graphic Designer\"}"}
{ "body": "{\"id\":278,\"first_name\":\"Joy\",\"email\":\"jgristwood7p@myspace.com\",\"job\":\"Geological Engineer\"}"}
{ "body": "{\"id\":279,\"first_name\":\"Genni\",\"email\":\"gvoak7q@wufoo.com\",\"job\":\"Research Associate\"}"}
{ "body": "{\"id\":280,\"first_name\":\"Ermina\",\"email\":\"eforseith7r@indiegogo.com\",\"job\":\"Structural Engineer\"}"}
{ "body": "{\"id\":281,\"first_name\":\"Ruddie\",\"email\":\"rbranson7s@ezinearticles.com\",\"job\":\"Electrical Engineer\"}"}
{ "body": "{\"id\":282,\"first_name\":\"Wendye\",\"email\":\"wcasiero7t@adobe.com\",\"job\":\"Quality Engineer\"}"}
{ "body": "{\"id\":283,\"first_name\":\"Harman\",\"email\":\"htevlin7u@dailymail.co.uk\",\"job\":\"Director of Sales\"}"}
{ "body": "{\"id\":284,\"first_name\":\"Zeb\",\"email\":\"zpiatkow7v@tamu.edu\",\"job\":\"Financial Advisor\"}"}
{ "body": "{\"id\":285,\"first_name\":\"Sidoney\",\"email\":\"sdawson7w@etsy.com\",\"job\":\"Web Developer II\"}"}
{ "body": "{\"id\":286,\"first_name\":\"Maude\",\"email\":\"marnholz7x@flickr.com\",\"job\":\"Statistician III\"}"}
{ "body": "{\"id\":287,\"first_name\":\"Ennis\",\"email\":\"epietranek7y@jimdo.com\",\"job\":\"Actuary\"}"}
{ "body": "{\"id\":288,\"first_name\":\"Rutter\",\"email\":\"rlockart7z@devhub.com\",\"job\":\"Quality Engineer\"}"}
{ "body": "{\"id\":289,\"first_name\":\"Shauna\",\"email\":\"sproctor80@studiopress.com\",\"job\":\"Actuary\"}"}
{ "body": "{\"id\":290,\"first_name\":\"Ingunna\",\"email\":\"ikermon81@google.es\",\"job\":\"Account Representative II\"}"}
{ "body": "{\"id\":291,\"first_name\":\"Wynnie\",\"email\":\"wliddiard82@51.la\",\"job\":\"Health Coach IV\"}"}
{ "body": "{\"id\":292,\"first_name\":\"Lydon\",\"email\":\"lkanwell83@mysql.com\",\"job\":\"Financial Advisor\"}"}
{ "body": "{\"id\":293,\"first_name\":\"Richart\",\"email\":\"rdoone84@cisco.com\",\"job\":\"Registered Nurse\"}"}
{ "body": "{\"id\":294,\"first_name\":\"Zeb\",\"email\":\"ziacovelli85@baidu.com\",\"job\":\"Marketing Assistant\"}"}
{ "body": "{\"id\":295,\"first_name\":\"Emlen\",\"email\":\"eroly86@goodreads.com\",\"job\":\"Business Systems Development Analyst\"}"}
{ "body": "{\"id\":296,\"first_name\":\"Whitaker\",\"email\":\"wkingstne87@oracle.com\",\"job\":\"Analog Circuit Design manager\"}"}
{ "body": "{\"id\":297,\"first_name\":\"Karlis\",\"email\":\"kworssam88@freewebs.com\",\"job\":\"Help Desk Operator\"}"}
{ "body": "{\"id\":298,\"first_name\":\"Shurlocke\",\"email\":\"szorzenoni89@cmu.edu\",\"job\":\"Software Consultant\"}"}
{ "body": "{\"id\":299,\"first_name\":\"Myrtle\",\"email\":\"mmccrillis8a@google.fr\",\"job\":\"Financial Analyst\"}"}
{ "body": "{\"id\":300,\"first_name\":\"Marillin\",\"email\":\"msara8b@alexa.com\",\"job\":\"Accounting Assistant III\"}"}
{ "body": "{\"id\":301,\"first_name\":\"Nadia\",\"email\":\"nsantarelli8c@netvibes.com\",\"job\":\"Librarian\"}"}
{ "body": "{\"id\":302,\"first_name\":\"Kendal\",\"email\":\"kgerbl8d@un.org\",\"job\":\"Programmer Analyst IV\"}"}
{ "body": "{\"id\":303,\"first_name\":\"Ayn\",\"email\":\"apinck8e@theglobeandmail.com\",\"job\":\"Marketing Assistant\"}"}
{ "body": "{\"id\":304,\"first_name\":\"Mort\",\"email\":\"mfyndon8f@nydailynews.com\",\"job\":\"Structural Engineer\"}"}
{ "body": "{\"id\":305,\"first_name\":\"Pauletta\",\"email\":\"pllopis8g@blogtalkradio.com\",\"job\":\"Systems Administrator III\"}"}
{ "body": "{\"id\":306,\"first_name\":\"Bartel\",\"email\":\"bjosephs8h@unblog.fr\",\"job\":\"Software Consultant\"}"}
{ "body": "{\"id\":307,\"first_name\":\"Ezri\",\"email\":\"ebricksey8i@networksolutions.com\",\"job\":\"Product Engineer\"}"}
{ "body": "{\"id\":308,\"first_name\":\"Roarke\",\"email\":\"rreymers8j@instagram.com\",\"job\":\"Recruiter\"}"}
{ "body": "{\"id\":309,\"first_name\":\"Danya\",\"email\":\"dmilillo8k@ow.ly\",\"job\":\"Social Worker\"}"}
{ "body": "{\"id\":310,\"first_name\":\"Anatol\",\"email\":\"aokey8l@latimes.com\",\"job\":\"Quality Control Specialist\"}"}
{ "body": "{\"id\":311,\"first_name\":\"Kirsti\",\"email\":\"kwormell8m@noaa.gov\",\"job\":\"Research Assistant II\"}"}
{ "body": "{\"id\":312,\"first_name\":\"Chrisy\",\"email\":\"cupstell8n@wsj.com\",\"job\":\"Civil Engineer\"}"}
{ "body": "{\"id\":313,\"first_name\":\"Tudor\",\"email\":\"tsunshine8o@weebly.com\",\"job\":\"Mechanical Systems Engineer\"}"}
{ "body": "{\"id\":314,\"first_name\":\"Gaspar\",\"email\":\"gdollimore8p@squarespace.com\",\"job\":\"Product Engineer\"}"}
{ "body": "{\"id\":315,\"first_name\":\"Amata\",\"email\":\"adaville8q@ow.ly\",\"job\":\"Environmental Tech\"}"}
{ "body": "{\"id\":316,\"first_name\":\"Gal\",\"email\":\"gbaltrushaitis8r@bbc.co.uk\",\"job\":\"Senior Sales Associate\"}"}
{ "body": "{\"id\":317,\"first_name\":\"Jinny\",\"email\":\"jmccoughan8s@list-manage.com\",\"job\":\"Automation Specialist III\"}"}
{ "body": "{\"id\":318,\"first_name\":\"Rina\",\"email\":\"rlabbey8t@cdc.gov\",\"job\":\"Environmental Specialist\"}"}
{ "body": "{\"id\":319,\"first_name\":\"Quinn\",\"email\":\"qgarrold8u@dailymail.co.uk\",\"job\":\"Civil Engineer\"}"}
{ "body": "{\"id\":320,\"first_name\":\"Jozef\",\"email\":\"jyanin8v@purevolume.com\",\"job\":\"Dental Hygienist\"}"}
{ "body": "{\"id\":321,\"first_name\":\"Lynea\",\"email\":\"lspitaro8w@cdc.gov\",\"job\":\"Software Engineer IV\"}"}
{ "body": "{\"id\":322,\"first_name\":\"Page\",\"email\":\"pyeliashev8x@si.edu\",\"job\":\"Staff Accountant II\"}"}
{ "body": "{\"id\":323,\"first_name\":\"Katerina\",\"email\":\"khuygen8y@wikispaces.com\",\"job\":\"Cost Accountant\"}"}
{ "body": "{\"id\":324,\"first_name\":\"Conan\",\"email\":\"cjelly8z@yellowpages.com\",\"job\":\"Compensation Analyst\"}"}
{ "body": "{\"id\":325,\"first_name\":\"Paula\",\"email\":\"pridgers90@paypal.com\",\"job\":\"Quality Control Specialist\"}"}
{ "body": "{\"id\":326,\"first_name\":\"Lilyan\",\"email\":\"ltuft91@quantcast.com\",\"job\":\"Librarian\"}"}
{ "body": "{\"id\":327,\"first_name\":\"Kore\",\"email\":\"kquincey92@mediafire.com\",\"job\":\"Senior Developer\"}"}
{ "body": "{\"id\":328,\"first_name\":\"Dorice\",\"email\":\"dfargie93@t-online.de\",\"job\":\"Media Manager IV\"}"}
{ "body": "{\"id\":329,\"first_name\":\"Archer\",\"email\":\"apoints94@bbb.org\",\"job\":\"GIS Technical Architect\"}"}
{ "body": "{\"id\":330,\"first_name\":\"Hyacinth\",\"email\":\"hcathcart95@taobao.com\",\"job\":\"Occupational Therapist\"}"}
{ "body": "{\"id\":331,\"first_name\":\"Gerome\",\"email\":\"gstrain96@free.fr\",\"job\":\"Quality Engineer\"}"}
{ "body": "{\"id\":332,\"first_name\":\"Annie\",\"email\":\"apollastrino97@msn.com\",\"job\":\"VP Product Management\"}"}
{ "body": "{\"id\":333,\"first_name\":\"Catharina\",\"email\":\"ccallendar98@sbwire.com\",\"job\":\"Director of Sales\"}"}
{ "body": "{\"id\":334,\"first_name\":\"Lanie\",\"email\":\"lackroyd99@cdbaby.com\",\"job\":\"Recruiting Manager\"}"}
{ "body": "{\"id\":335,\"first_name\":\"Liuka\",\"email\":\"ltowns9a@wufoo.com\",\"job\":\"Executive Secretary\"}"}
{ "body": "{\"id\":336,\"first_name\":\"Julianna\",\"email\":\"jgrassick9b@ocn.ne.jp\",\"job\":\"Clinical Specialist\"}"}
{ "body": "{\"id\":337,\"first_name\":\"Jaimie\",\"email\":\"jforgie9c@plala.or.jp\",\"job\":\"Geological Engineer\"}"}
{ "body": "{\"id\":338,\"first_name\":\"Amye\",\"email\":\"ashortall9d@booking.com\",\"job\":\"Technical Writer\"}"}
{ "body": "{\"id\":339,\"first_name\":\"Laurie\",\"email\":\"lwiddows9e@blogspot.com\",\"job\":\"VP Accounting\"}"}
{ "body": "{\"id\":340,\"first_name\":\"Belva\",\"email\":\"barmour9f@msu.edu\",\"job\":\"Food Chemist\"}"}
{ "body": "{\"id\":341,\"first_name\":\"Vida\",\"email\":\"vdorgon9g@printfriendly.com\",\"job\":\"Data Coordiator\"}"}
{ "body": "{\"id\":342,\"first_name\":\"Sherlock\",\"email\":\"silyinykh9h@accuweather.com\",\"job\":\"Financial Advisor\"}"}
{ "body": "{\"id\":343,\"first_name\":\"Erhard\",\"email\":\"edranfield9i@pagesperso-orange.fr\",\"job\":\"Teacher\"}"}
{ "body": "{\"id\":344,\"first_name\":\"Roxi\",\"email\":\"rjerdein9j@google.fr\",\"job\":\"Registered Nurse\"}"}
{ "body": "{\"id\":345,\"first_name\":\"Carl\",\"email\":\"ctutill9k@youtu.be\",\"job\":\"Social Worker\"}"}
{ "body": "{\"id\":346,\"first_name\":\"Alana\",\"email\":\"astangoe9l@tamu.edu\",\"job\":\"Compensation Analyst\"}"}
{ "body": "{\"id\":347,\"first_name\":\"Lura\",\"email\":\"lcosgry9m@typepad.com\",\"job\":\"Speech Pathologist\"}"}
{ "body": "{\"id\":348,\"first_name\":\"Eve\",\"email\":\"earkin9n@usda.gov\",\"job\":\"Assistant Manager\"}"}
{ "body": "{\"id\":349,\"first_name\":\"Claiborn\",\"email\":\"cmcellen9o@bbb.org\",\"job\":\"VP Marketing\"}"}
{ "body": "{\"id\":350,\"first_name\":\"Cindy\",\"email\":\"csellor9p@ow.ly\",\"job\":\"Chief Design Engineer\"}"}
{ "body": "{\"id\":351,\"first_name\":\"Torey\",\"email\":\"tkasperski9q@bing.com\",\"job\":\"Help Desk Operator\"}"}
{ "body": "{\"id\":352,\"first_name\":\"Baird\",\"email\":\"bdillet9r@mac.com\",\"job\":\"Budget/Accounting Analyst I\"}"}
{ "body": "{\"id\":353,\"first_name\":\"Lesley\",\"email\":\"lavramow9s@wsj.com\",\"job\":\"Assistant Media Planner\"}"}
{ "body": "{\"id\":354,\"first_name\":\"Claire\",\"email\":\"cpattenden9t@sohu.com\",\"job\":\"Software Test Engineer I\"}"}
{ "body": "{\"id\":355,\"first_name\":\"Bernardina\",\"email\":\"bfazakerley9u@springer.com\",\"job\":\"Automation Specialist II\"}"}
{ "body": "{\"id\":356,\"first_name\":\"Humfried\",\"email\":\"harrighini9v@barnesandnoble.com\",\"job\":\"Senior Sales Associate\"}"}
{ "body": "{\"id\":357,\"first_name\":\"Didi\",\"email\":\"dhullock9w@foxnews.com\",\"job\":\"Operator\"}"}
{ "body": "{\"id\":358,\"first_name\":\"Morlee\",\"email\":\"mosmint9x@goo.gl\",\"job\":\"Analog Circuit Design manager\"}"}
{ "body": "{\"id\":359,\"first_name\":\"Jethro\",\"email\":\"jjessett9y@usgs.gov\",\"job\":\"Account Coordinator\"}"}
{ "body": "{\"id\":360,\"first_name\":\"Aurelia\",\"email\":\"aeveriss9z@china.com.cn\",\"job\":\"Data Coordiator\"}"}
{ "body": "{\"id\":361,\"first_name\":\"Cornelius\",\"email\":\"czanettinia0@xinhuanet.com\",\"job\":\"Software Test Engineer II\"}"}
{ "body": "{\"id\":362,\"first_name\":\"Giovanni\",\"email\":\"ghuddlestona1@bloomberg.com\",\"job\":\"Environmental Tech\"}"}
{ "body": "{\"id\":363,\"first_name\":\"Perla\",\"email\":\"pjirouteka2@yahoo.co.jp\",\"job\":\"Senior Quality Engineer\"}"}
{ "body": "{\"id\":364,\"first_name\":\"Hayes\",\"email\":\"hjorgensena3@ucla.edu\",\"job\":\"Desktop Support Technician\"}"}
{ "body": "{\"id\":365,\"first_name\":\"Vitia\",\"email\":\"vpischofa4@tamu.edu\",\"job\":\"Structural Analysis Engineer\"}"}
{ "body": "{\"id\":366,\"first_name\":\"Becki\",\"email\":\"bsimkissa5@drupal.org\",\"job\":\"VP Marketing\"}"}
{ "body": "{\"id\":367,\"first_name\":\"Bary\",\"email\":\"blemmensa6@gmpg.org\",\"job\":\"Financial Analyst\"}"}
{ "body": "{\"id\":368,\"first_name\":\"Jolyn\",\"email\":\"jlemarquanda7@fc2.com\",\"job\":\"Engineer II\"}"}
{ "body": "{\"id\":369,\"first_name\":\"Margette\",\"email\":\"mrentenbecka8@jugem.jp\",\"job\":\"Electrical Engineer\"}"}
{ "body": "{\"id\":370,\"first_name\":\"Yoshi\",\"email\":\"ybinleya9@un.org\",\"job\":\"Internal Auditor\"}"}
{ "body": "{\"id\":371,\"first_name\":\"Skipton\",\"email\":\"stheodorisaa@pinterest.com\",\"job\":\"Editor\"}"}
{ "body": "{\"id\":372,\"first_name\":\"Crin\",\"email\":\"cdrezzerab@tmall.com\",\"job\":\"Executive Secretary\"}"}
{ "body": "{\"id\":373,\"first_name\":\"Kendra\",\"email\":\"ksabatheac@istockphoto.com\",\"job\":\"Help Desk Operator\"}"}
{ "body": "{\"id\":374,\"first_name\":\"Alica\",\"email\":\"aglaisnerad@bbc.co.uk\",\"job\":\"Chemical Engineer\"}"}
{ "body": "{\"id\":375,\"first_name\":\"Penelopa\",\"email\":\"pgiovannilliae@123-reg.co.uk\",\"job\":\"Quality Engineer\"}"}
{ "body": "{\"id\":376,\"first_name\":\"Julie\",\"email\":\"jcuttenaf@yandex.ru\",\"job\":\"Sales Associate\"}"}
{ "body": "{\"id\":377,\"first_name\":\"Scot\",\"email\":\"smidgelyag@imdb.com\",\"job\":\"Chief Design Engineer\"}"}
{ "body": "{\"id\":378,\"first_name\":\"Almira\",\"email\":\"ajelkah@foxnews.com\",\"job\":\"Editor\"}"}
{ "body": "{\"id\":379,\"first_name\":\"Diannne\",\"email\":\"dtallonai@imgur.com\",\"job\":\"Senior Editor\"}"}
{ "body": "{\"id\":380,\"first_name\":\"Cyrus\",\"email\":\"cdunlopaj@miibeian.gov.cn\",\"job\":\"Financial Analyst\"}"}
{ "body": "{\"id\":381,\"first_name\":\"Ronny\",\"email\":\"rtriggak@edublogs.org\",\"job\":\"Senior Quality Engineer\"}"}
{ "body": "{\"id\":382,\"first_name\":\"Archaimbaud\",\"email\":\"alushal@dedecms.com\",\"job\":\"Accountant I\"}"}
{ "body": "{\"id\":383,\"first_name\":\"Matthew\",\"email\":\"mcashinam@sfgate.com\",\"job\":\"Senior Financial Analyst\"}"}
{ "body": "{\"id\":384,\"first_name\":\"Abramo\",\"email\":\"ahentzeleran@istockphoto.com\",\"job\":\"Editor\"}"}
{ "body": "{\"id\":385,\"first_name\":\"Farah\",\"email\":\"flarventao@1688.com\",\"job\":\"Professor\"}"}
{ "body": "{\"id\":386,\"first_name\":\"Jackquelin\",\"email\":\"jdevericksap@ted.com\",\"job\":\"VP Quality Control\"}"}
{ "body": "{\"id\":387,\"first_name\":\"Leonhard\",\"email\":\"lbasfordaq@odnoklassniki.ru\",\"job\":\"Engineer II\"}"}
{ "body": "{\"id\":388,\"first_name\":\"Dixie\",\"email\":\"dbouchar@instagram.com\",\"job\":\"Senior Financial Analyst\"}"}
{ "body": "{\"id\":389,\"first_name\":\"Tanitansy\",\"email\":\"ttamburoas@twitter.com\",\"job\":\"Programmer II\"}"}
{ "body": "{\"id\":390,\"first_name\":\"Olivier\",\"email\":\"ohighnamat@amazonaws.com\",\"job\":\"Systems Administrator II\"}"}
{ "body": "{\"id\":391,\"first_name\":\"Seumas\",\"email\":\"scalladineau@aol.com\",\"job\":\"Mechanical Systems Engineer\"}"}
{ "body": "{\"id\":392,\"first_name\":\"Vinni\",\"email\":\"vstidworthyav@comcast.net\",\"job\":\"General Manager\"}"}
{ "body": "{\"id\":393,\"first_name\":\"Lorri\",\"email\":\"lvennartaw@linkedin.com\",\"job\":\"Paralegal\"}"}
{ "body": "{\"id\":394,\"first_name\":\"Gelya\",\"email\":\"gcotesax@nydailynews.com\",\"job\":\"Account Representative II\"}"}
{ "body": "{\"id\":395,\"first_name\":\"Ximenez\",\"email\":\"xkermonay@github.io\",\"job\":\"Assistant Professor\"}"}
{ "body": "{\"id\":396,\"first_name\":\"Blythe\",\"email\":\"blandsmanaz@deliciousdays.com\",\"job\":\"Research Assistant II\"}"}
{ "body": "{\"id\":397,\"first_name\":\"Noak\",\"email\":\"nmourgeb0@purevolume.com\",\"job\":\"Quality Control Specialist\"}"}
{ "body": "{\"id\":398,\"first_name\":\"Mallissa\",\"email\":\"mbradmoreb1@adobe.com\",\"job\":\"Information Systems Manager\"}"}
{ "body": "{\"id\":399,\"first_name\":\"Malissa\",\"email\":\"mdjorevicb2@cafepress.com\",\"job\":\"Director of Sales\"}"}
{ "body": "{\"id\":400,\"first_name\":\"Vern\",\"email\":\"vrobroeb3@squarespace.com\",\"job\":\"Financial Analyst\"}"}
{ "body": "{\"id\":401,\"first_name\":\"Willette\",\"email\":\"wgawthorpb4@fotki.com\",\"job\":\"Web Designer I\"}"}
{ "body": "{\"id\":402,\"first_name\":\"Joseito\",\"email\":\"jmuatb5@vkontakte.ru\",\"job\":\"Geological Engineer\"}"}
{ "body": "{\"id\":403,\"first_name\":\"Roger\",\"email\":\"rtunstallb6@fotki.com\",\"job\":\"Software Test Engineer III\"}"}
{ "body": "{\"id\":404,\"first_name\":\"Welsh\",\"email\":\"wringerb7@cam.ac.uk\",\"job\":\"Recruiter\"}"}
{ "body": "{\"id\":405,\"first_name\":\"Consolata\",\"email\":\"csmallwoodb8@springer.com\",\"job\":\"Budget/Accounting Analyst IV\"}"}
{ "body": "{\"id\":406,\"first_name\":\"Bern\",\"email\":\"bgascarb9@networksolutions.com\",\"job\":\"VP Product Management\"}"}
{ "body": "{\"id\":407,\"first_name\":\"Giusto\",\"email\":\"gfoottitba@reuters.com\",\"job\":\"Geologist III\"}"}
{ "body": "{\"id\":408,\"first_name\":\"Alfie\",\"email\":\"awingbb@uiuc.edu\",\"job\":\"Database Administrator II\"}"}
{ "body": "{\"id\":409,\"first_name\":\"Tilda\",\"email\":\"tchiecobc@dyndns.org\",\"job\":\"Civil Engineer\"}"}
{ "body": "{\"id\":410,\"first_name\":\"Gilburt\",\"email\":\"gbacherbd@samsung.com\",\"job\":\"Accountant IV\"}"}
{ "body": "{\"id\":411,\"first_name\":\"Carolyne\",\"email\":\"ckaretbe@arizona.edu\",\"job\":\"Mechanical Systems Engineer\"}"}
{ "body": "{\"id\":412,\"first_name\":\"Bastian\",\"email\":\"bpoebf@si.edu\",\"job\":\"Systems Administrator I\"}"}
{ "body": "{\"id\":413,\"first_name\":\"Shem\",\"email\":\"smartlewbg@cafepress.com\",\"job\":\"Administrative Officer\"}"}
{ "body": "{\"id\":414,\"first_name\":\"Lauryn\",\"email\":\"lwardropbh@nydailynews.com\",\"job\":\"Design Engineer\"}"}
{ "body": "{\"id\":415,\"first_name\":\"Sondra\",\"email\":\"sboschmannbi@fastcompany.com\",\"job\":\"Director of Sales\"}"}
{ "body": "{\"id\":416,\"first_name\":\"Adham\",\"email\":\"awroughtbj@cpanel.net\",\"job\":\"Quality Engineer\"}"}
{ "body": "{\"id\":417,\"first_name\":\"Cornall\",\"email\":\"cbreacherbk@businessweek.com\",\"job\":\"Occupational Therapist\"}"}
{ "body": "{\"id\":418,\"first_name\":\"Vilma\",\"email\":\"vsamsinbl@toplist.cz\",\"job\":\"Technical Writer\"}"}
{ "body": "{\"id\":419,\"first_name\":\"Ollie\",\"email\":\"omannockbm@wsj.com\",\"job\":\"Associate Professor\"}"}
{ "body": "{\"id\":420,\"first_name\":\"Carie\",\"email\":\"ckernaghanbn@last.fm\",\"job\":\"Environmental Specialist\"}"}
{ "body": "{\"id\":421,\"first_name\":\"Wells\",\"email\":\"wkalinowskybo@discuz.net\",\"job\":\"VP Accounting\"}"}
{ "body": "{\"id\":422,\"first_name\":\"Boothe\",\"email\":\"bjoontjesbp@people.com.cn\",\"job\":\"Account Executive\"}"}
{ "body": "{\"id\":423,\"first_name\":\"Dominick\",\"email\":\"dweekesbq@networkadvertising.org\",\"job\":\"Executive Secretary\"}"}
{ "body": "{\"id\":424,\"first_name\":\"Jeanie\",\"email\":\"jveldebr@ovh.net\",\"job\":\"Research Associate\"}"}
{ "body": "{\"id\":425,\"first_name\":\"Shayne\",\"email\":\"stipplebs@amazon.co.jp\",\"job\":\"Senior Sales Associate\"}"}
{ "body": "{\"id\":426,\"first_name\":\"Romola\",\"email\":\"rrylettbt@paginegialle.it\",\"job\":\"Accountant I\"}"}
{ "body": "{\"id\":427,\"first_name\":\"Onida\",\"email\":\"omenpesbu@gnu.org\",\"job\":\"Financial Advisor\"}"}
{ "body": "{\"id\":428,\"first_name\":\"Margareta\",\"email\":\"mwolteringbv@list-manage.com\",\"job\":\"Web Developer IV\"}"}
{ "body": "{\"id\":429,\"first_name\":\"Erastus\",\"email\":\"eschwandbw@fastcompany.com\",\"job\":\"Budget/Accounting Analyst I\"}"}
{ "body": "{\"id\":430,\"first_name\":\"Michail\",\"email\":\"mlauritsenbx@webeden.co.uk\",\"job\":\"Physical Therapy Assistant\"}"}
{ "body": "{\"id\":431,\"first_name\":\"Allissa\",\"email\":\"amaddocksby@de.vu\",\"job\":\"Editor\"}"}
{ "body": "{\"id\":432,\"first_name\":\"Jerrylee\",\"email\":\"jwannesbz@redcross.org\",\"job\":\"Human Resources Manager\"}"}
{ "body": "{\"id\":433,\"first_name\":\"Nadeen\",\"email\":\"nsamplesc0@github.io\",\"job\":\"Legal Assistant\"}"}
{ "body": "{\"id\":434,\"first_name\":\"Lucilia\",\"email\":\"lalveyc1@latimes.com\",\"job\":\"Mechanical Systems Engineer\"}"}
{ "body": "{\"id\":435,\"first_name\":\"Neille\",\"email\":\"ncoldhamc2@ebay.com\",\"job\":\"Director of Sales\"}"}
{ "body": "{\"id\":436,\"first_name\":\"Alick\",\"email\":\"abidgodc3@arstechnica.com\",\"job\":\"Senior Editor\"}"}
{ "body": "{\"id\":437,\"first_name\":\"Myrah\",\"email\":\"mtrailc4@wunderground.com\",\"job\":\"Software Engineer II\"}"}
{ "body": "{\"id\":438,\"first_name\":\"Jacquelyn\",\"email\":\"jdearnleyc5@ebay.co.uk\",\"job\":\"Graphic Designer\"}"}
{ "body": "{\"id\":439,\"first_name\":\"Gloriane\",\"email\":\"glehemannc6@wisc.edu\",\"job\":\"Structural Analysis Engineer\"}"}
{ "body": "{\"id\":440,\"first_name\":\"Genni\",\"email\":\"gbaddamc7@istockphoto.com\",\"job\":\"Financial Advisor\"}"}
{ "body": "{\"id\":441,\"first_name\":\"Fairlie\",\"email\":\"fdepperc8@ft.com\",\"job\":\"Actuary\"}"}
{ "body": "{\"id\":442,\"first_name\":\"Honoria\",\"email\":\"hchokec9@seesaa.net\",\"job\":\"Information Systems Manager\"}"}
{ "body": "{\"id\":443,\"first_name\":\"Enos\",\"email\":\"ehoweyca@mediafire.com\",\"job\":\"Pharmacist\"}"}
{ "body": "{\"id\":444,\"first_name\":\"Corney\",\"email\":\"caguirrecb@bizjournals.com\",\"job\":\"VP Sales\"}"}
{ "body": "{\"id\":445,\"first_name\":\"Ced\",\"email\":\"cfoulkscc@reference.com\",\"job\":\"Compensation Analyst\"}"}
{ "body": "{\"id\":446,\"first_name\":\"Vivianna\",\"email\":\"vplailcd@ycombinator.com\",\"job\":\"Geologist III\"}"}
{ "body": "{\"id\":447,\"first_name\":\"Daffy\",\"email\":\"dingarfieldce@xrea.com\",\"job\":\"Project Manager\"}"}
{ "body": "{\"id\":448,\"first_name\":\"Barrie\",\"email\":\"bdowyercf@newyorker.com\",\"job\":\"General Manager\"}"}
{ "body": "{\"id\":449,\"first_name\":\"Ema\",\"email\":\"ekediecg@dailymotion.com\",\"job\":\"Programmer Analyst III\"}"}
{ "body": "{\"id\":450,\"first_name\":\"Caty\",\"email\":\"ckordingch@theguardian.com\",\"job\":\"VP Marketing\"}"}
{ "body": "{\"id\":451,\"first_name\":\"Annmarie\",\"email\":\"ablockci@about.com\",\"job\":\"Legal Assistant\"}"}
{ "body": "{\"id\":452,\"first_name\":\"Otis\",\"email\":\"ofassecj@themeforest.net\",\"job\":\"Social Worker\"}"}
{ "body": "{\"id\":453,\"first_name\":\"Perla\",\"email\":\"pfassck@yandex.ru\",\"job\":\"Statistician I\"}"}
{ "body": "{\"id\":454,\"first_name\":\"Issy\",\"email\":\"ithatchercl@vk.com\",\"job\":\"Administrative Officer\"}"}
{ "body": "{\"id\":455,\"first_name\":\"Kerby\",\"email\":\"koscanloncm@npr.org\",\"job\":\"Human Resources Manager\"}"}
{ "body": "{\"id\":456,\"first_name\":\"Randy\",\"email\":\"rchetwyndcn@google.com.au\",\"job\":\"Research Associate\"}"}
{ "body": "{\"id\":457,\"first_name\":\"Findley\",\"email\":\"fwillasco@loc.gov\",\"job\":\"Web Developer IV\"}"}
{ "body": "{\"id\":458,\"first_name\":\"Cristobal\",\"email\":\"cmacgibboncp@washington.edu\",\"job\":\"Analog Circuit Design manager\"}"}
{ "body": "{\"id\":459,\"first_name\":\"Neille\",\"email\":\"nscrauniagecq@nasa.gov\",\"job\":\"Health Coach IV\"}"}
{ "body": "{\"id\":460,\"first_name\":\"Dennison\",\"email\":\"dsacazecr@barnesandnoble.com\",\"job\":\"Physical Therapy Assistant\"}"}
{ "body": "{\"id\":461,\"first_name\":\"Harcourt\",\"email\":\"hhawkridgecs@ted.com\",\"job\":\"Nuclear Power Engineer\"}"}
{ "body": "{\"id\":462,\"first_name\":\"Ceciley\",\"email\":\"cridouttct@xinhuanet.com\",\"job\":\"VP Sales\"}"}
{ "body": "{\"id\":463,\"first_name\":\"Ginnifer\",\"email\":\"gbartlettcu@livejournal.com\",\"job\":\"VP Accounting\"}"}
{ "body": "{\"id\":464,\"first_name\":\"Livvy\",\"email\":\"lbranncv@microsoft.com\",\"job\":\"Biostatistician II\"}"}
{ "body": "{\"id\":465,\"first_name\":\"Marjory\",\"email\":\"mwimpresscw@microsoft.com\",\"job\":\"Software Consultant\"}"}
{ "body": "{\"id\":466,\"first_name\":\"Manya\",\"email\":\"mcianicx@usda.gov\",\"job\":\"Health Coach III\"}"}
{ "body": "{\"id\":467,\"first_name\":\"Hobart\",\"email\":\"hhakecy@boston.com\",\"job\":\"Business Systems Development Analyst\"}"}
{ "body": "{\"id\":468,\"first_name\":\"Drona\",\"email\":\"dstylescz@amazon.co.uk\",\"job\":\"Structural Engineer\"}"}
{ "body": "{\"id\":469,\"first_name\":\"Cathryn\",\"email\":\"cpollockd0@prlog.org\",\"job\":\"Data Coordiator\"}"}
{ "body": "{\"id\":470,\"first_name\":\"Arvie\",\"email\":\"apowlesd1@apache.org\",\"job\":\"Nuclear Power Engineer\"}"}
{ "body": "{\"id\":471,\"first_name\":\"Elisha\",\"email\":\"erableaud2@latimes.com\",\"job\":\"Community Outreach Specialist\"}"}
{ "body": "{\"id\":472,\"first_name\":\"Stanton\",\"email\":\"sdinehartd3@engadget.com\",\"job\":\"Structural Engineer\"}"}
{ "body": "{\"id\":473,\"first_name\":\"Athena\",\"email\":\"amignotd4@123-reg.co.uk\",\"job\":\"VP Accounting\"}"}
{ "body": "{\"id\":474,\"first_name\":\"Fredericka\",\"email\":\"fbrannod5@gov.uk\",\"job\":\"Help Desk Operator\"}"}
{ "body": "{\"id\":475,\"first_name\":\"Rois\",\"email\":\"rlesperd6@slideshare.net\",\"job\":\"Occupational Therapist\"}"}
{ "body": "{\"id\":476,\"first_name\":\"Devlin\",\"email\":\"dsaleryd7@prlog.org\",\"job\":\"Research Nurse\"}"}
{ "body": "{\"id\":477,\"first_name\":\"Chandal\",\"email\":\"clearmonthd8@jimdo.com\",\"job\":\"Registered Nurse\"}"}
{ "body": "{\"id\":478,\"first_name\":\"Gordy\",\"email\":\"gzanicchellid9@nydailynews.com\",\"job\":\"Structural Analysis Engineer\"}"}
{ "body": "{\"id\":479,\"first_name\":\"Kaye\",\"email\":\"kklimasda@smh.com.au\",\"job\":\"Chemical Engineer\"}"}
{ "body": "{\"id\":480,\"first_name\":\"Anthiathia\",\"email\":\"acorwooddb@networksolutions.com\",\"job\":\"Product Engineer\"}"}
{ "body": "{\"id\":481,\"first_name\":\"Bertina\",\"email\":\"bgoddarddc@ocn.ne.jp\",\"job\":\"Tax Accountant\"}"}
{ "body": "{\"id\":482,\"first_name\":\"Alexandre\",\"email\":\"aliteldd@tripadvisor.com\",\"job\":\"Community Outreach Specialist\"}"}
{ "body": "{\"id\":483,\"first_name\":\"Sutton\",\"email\":\"skhidrde@techcrunch.com\",\"job\":\"Research Assistant II\"}"}
{ "body": "{\"id\":484,\"first_name\":\"Elsinore\",\"email\":\"eairddf@taobao.com\",\"job\":\"Analog Circuit Design manager\"}"}
{ "body": "{\"id\":485,\"first_name\":\"Branden\",\"email\":\"bgraundissondg@cam.ac.uk\",\"job\":\"Nuclear Power Engineer\"}"}
{ "body": "{\"id\":486,\"first_name\":\"Mic\",\"email\":\"mcooledh@sciencedaily.com\",\"job\":\"Geologist III\"}"}
{ "body": "{\"id\":487,\"first_name\":\"Wain\",\"email\":\"wtinklindi@deliciousdays.com\",\"job\":\"Engineer III\"}"}
{ "body": "{\"id\":488,\"first_name\":\"Cody\",\"email\":\"cliledj@earthlink.net\",\"job\":\"Editor\"}"}
{ "body": "{\"id\":489,\"first_name\":\"Clevie\",\"email\":\"cmcglauddk@virginia.edu\",\"job\":\"Nurse Practicioner\"}"}
{ "body": "{\"id\":490,\"first_name\":\"Renato\",\"email\":\"rchildrensdl@wufoo.com\",\"job\":\"Biostatistician I\"}"}
{ "body": "{\"id\":491,\"first_name\":\"Erna\",\"email\":\"ekleinbaumdm@weather.com\",\"job\":\"Accounting Assistant IV\"}"}
{ "body": "{\"id\":492,\"first_name\":\"Kanya\",\"email\":\"kwimmsdn@vimeo.com\",\"job\":\"Biostatistician III\"}"}
{ "body": "{\"id\":493,\"first_name\":\"Corilla\",\"email\":\"cgrobdo@infoseek.co.jp\",\"job\":\"Engineer III\"}"}
{ "body": "{\"id\":494,\"first_name\":\"Shell\",\"email\":\"schardindp@i2i.jp\",\"job\":\"Help Desk Technician\"}"}
{ "body": "{\"id\":495,\"first_name\":\"Maury\",\"email\":\"msywelldq@rambler.ru\",\"job\":\"Electrical Engineer\"}"}
{ "body": "{\"id\":496,\"first_name\":\"Towny\",\"email\":\"tburwelldr@wix.com\",\"job\":\"Quality Control Specialist\"}"}
{ "body": "{\"id\":497,\"first_name\":\"Giff\",\"email\":\"gbrenardds@fda.gov\",\"job\":\"Human Resources Assistant III\"}"}
{ "body": "{\"id\":498,\"first_name\":\"Maisey\",\"email\":\"mlanpheredt@slideshare.net\",\"job\":\"Assistant Media Planner\"}"}
{ "body": "{\"id\":499,\"first_name\":\"Ulrich\",\"email\":\"uwhiteleydu@jugem.jp\",\"job\":\"Associate Professor\"}"}
{ "body": "{\"id\":500,\"first_name\":\"Lisha\",\"email\":\"lcharvilledv@wufoo.com\",\"job\":\"Accounting Assistant III\"}"}
{ "body": "{\"id\":501,\"first_name\":\"Conrad\",\"email\":\"cmatteaudw@who.int\",\"job\":\"Staff Scientist\"}"}
{ "body": "{\"id\":502,\"first_name\":\"Joaquin\",\"email\":\"jbrolechandx@homestead.com\",\"job\":\"Dental Hygienist\"}"}
{ "body": "{\"id\":503,\"first_name\":\"Gusti\",\"email\":\"gpinchbeckdy@gizmodo.com\",\"job\":\"Graphic Designer\"}"}
{ "body": "{\"id\":504,\"first_name\":\"Flossi\",\"email\":\"fbrettonerdz@cargocollective.com\",\"job\":\"Administrative Assistant II\"}"}
{ "body": "{\"id\":505,\"first_name\":\"Rollo\",\"email\":\"rrougee0@cocolog-nifty.com\",\"job\":\"Technical Writer\"}"}
{ "body": "{\"id\":506,\"first_name\":\"Estella\",\"email\":\"ewallase1@businessinsider.com\",\"job\":\"GIS Technical Architect\"}"}
{ "body": "{\"id\":507,\"first_name\":\"Karna\",\"email\":\"krobotthame2@cnn.com\",\"job\":\"Engineer I\"}"}
{ "body": "{\"id\":508,\"first_name\":\"Doroteya\",\"email\":\"dtinnere3@ameblo.jp\",\"job\":\"Assistant Media Planner\"}"}
{ "body": "{\"id\":509,\"first_name\":\"Esme\",\"email\":\"emarfelle4@google.cn\",\"job\":\"VP Product Management\"}"}
{ "body": "{\"id\":510,\"first_name\":\"Pren\",\"email\":\"ptuffelle5@artisteer.com\",\"job\":\"Associate Professor\"}"}
{ "body": "{\"id\":511,\"first_name\":\"Enos\",\"email\":\"ekarolyie6@cmu.edu\",\"job\":\"Human Resources Manager\"}"}
{ "body": "{\"id\":512,\"first_name\":\"Edvard\",\"email\":\"ebrindlee7@narod.ru\",\"job\":\"Account Representative II\"}"}
{ "body": "{\"id\":513,\"first_name\":\"Kimberlee\",\"email\":\"kguihene8@phoca.cz\",\"job\":\"Structural Engineer\"}"}
{ "body": "{\"id\":514,\"first_name\":\"Ginevra\",\"email\":\"ghammeriche9@taobao.com\",\"job\":\"Occupational Therapist\"}"}
{ "body": "{\"id\":515,\"first_name\":\"Dolph\",\"email\":\"dmarquisea@webs.com\",\"job\":\"Librarian\"}"}
{ "body": "{\"id\":516,\"first_name\":\"Kienan\",\"email\":\"kgeareb@loc.gov\",\"job\":\"Senior Sales Associate\"}"}
{ "body": "{\"id\":517,\"first_name\":\"Nonnah\",\"email\":\"nhenfreec@cpanel.net\",\"job\":\"VP Quality Control\"}"}
{ "body": "{\"id\":518,\"first_name\":\"Yoko\",\"email\":\"ybarnetted@prweb.com\",\"job\":\"Account Executive\"}"}
{ "body": "{\"id\":519,\"first_name\":\"Sandor\",\"email\":\"sfaireyee@behance.net\",\"job\":\"Budget/Accounting Analyst I\"}"}
{ "body": "{\"id\":520,\"first_name\":\"Gretel\",\"email\":\"govendenef@xrea.com\",\"job\":\"Help Desk Operator\"}"}
{ "body": "{\"id\":521,\"first_name\":\"Karyn\",\"email\":\"kclaywortheg@ed.gov\",\"job\":\"Physical Therapy Assistant\"}"}
{ "body": "{\"id\":522,\"first_name\":\"Darsie\",\"email\":\"ddeieh@cmu.edu\",\"job\":\"Professor\"}"}
{ "body": "{\"id\":523,\"first_name\":\"Lynnell\",\"email\":\"lellerbeckei@lulu.com\",\"job\":\"Occupational Therapist\"}"}
{ "body": "{\"id\":524,\"first_name\":\"Cissiee\",\"email\":\"cbabonauej@admin.ch\",\"job\":\"Safety Technician I\"}"}
{ "body": "{\"id\":525,\"first_name\":\"Natalina\",\"email\":\"npilipyakek@surveymonkey.com\",\"job\":\"Clinical Specialist\"}"}
{ "body": "{\"id\":526,\"first_name\":\"Kristien\",\"email\":\"ksangel@nsw.gov.au\",\"job\":\"Research Assistant IV\"}"}
{ "body": "{\"id\":527,\"first_name\":\"Fred\",\"email\":\"ffealeyem@usgs.gov\",\"job\":\"Desktop Support Technician\"}"}
{ "body": "{\"id\":528,\"first_name\":\"Tilda\",\"email\":\"tshelmerdineen@ask.com\",\"job\":\"Pharmacist\"}"}
{ "body": "{\"id\":529,\"first_name\":\"Kassandra\",\"email\":\"kburdikineo@macromedia.com\",\"job\":\"Help Desk Technician\"}"}
{ "body": "{\"id\":530,\"first_name\":\"Reginauld\",\"email\":\"rmittenep@samsung.com\",\"job\":\"Dental Hygienist\"}"}
{ "body": "{\"id\":531,\"first_name\":\"Elberta\",\"email\":\"egrosiereq@pen.io\",\"job\":\"Graphic Designer\"}"}
{ "body": "{\"id\":532,\"first_name\":\"Ring\",\"email\":\"rtunnacliffeer@booking.com\",\"job\":\"Desktop Support Technician\"}"}
{ "body": "{\"id\":533,\"first_name\":\"Eleanora\",\"email\":\"eflugeres@fema.gov\",\"job\":\"Database Administrator III\"}"}
{ "body": "{\"id\":534,\"first_name\":\"Duane\",\"email\":\"ddunmoreet@comcast.net\",\"job\":\"Environmental Tech\"}"}
{ "body": "{\"id\":535,\"first_name\":\"Geoff\",\"email\":\"ggardnereu@ted.com\",\"job\":\"Geological Engineer\"}"}
{ "body": "{\"id\":536,\"first_name\":\"Karrie\",\"email\":\"kquickev@xrea.com\",\"job\":\"Financial Analyst\"}"}
{ "body": "{\"id\":537,\"first_name\":\"Erna\",\"email\":\"egaytonew@phoca.cz\",\"job\":\"Paralegal\"}"}
{ "body": "{\"id\":538,\"first_name\":\"Diannne\",\"email\":\"draithbieex@chicagotribune.com\",\"job\":\"Graphic Designer\"}"}
{ "body": "{\"id\":539,\"first_name\":\"Glenn\",\"email\":\"gfraneey@china.com.cn\",\"job\":\"Food Chemist\"}"}
{ "body": "{\"id\":540,\"first_name\":\"Claudio\",\"email\":\"chugliez@ifeng.com\",\"job\":\"Food Chemist\"}"}
{ "body": "{\"id\":541,\"first_name\":\"Addie\",\"email\":\"astanmerf0@sourceforge.net\",\"job\":\"Analyst Programmer\"}"}
{ "body": "{\"id\":542,\"first_name\":\"Katherina\",\"email\":\"kwenzelf1@goo.ne.jp\",\"job\":\"Administrative Assistant IV\"}"}
{ "body": "{\"id\":543,\"first_name\":\"Shannon\",\"email\":\"sluskf2@engadget.com\",\"job\":\"Junior Executive\"}"}
{ "body": "{\"id\":544,\"first_name\":\"Hetty\",\"email\":\"hoxenburyf3@biglobe.ne.jp\",\"job\":\"Senior Editor\"}"}
{ "body": "{\"id\":545,\"first_name\":\"Jemimah\",\"email\":\"jdelgardillof4@theatlantic.com\",\"job\":\"Web Developer II\"}"}
{ "body": "{\"id\":546,\"first_name\":\"Marlee\",\"email\":\"mconlaundf5@nifty.com\",\"job\":\"Account Representative I\"}"}
{ "body": "{\"id\":547,\"first_name\":\"Libbi\",\"email\":\"lkiftf6@etsy.com\",\"job\":\"Product Engineer\"}"}
{ "body": "{\"id\":548,\"first_name\":\"Uta\",\"email\":\"usmithenf7@bluehost.com\",\"job\":\"Senior Sales Associate\"}"}
{ "body": "{\"id\":549,\"first_name\":\"Barny\",\"email\":\"bibarraf8@freewebs.com\",\"job\":\"Research Nurse\"}"}
{ "body": "{\"id\":550,\"first_name\":\"Maximilianus\",\"email\":\"mconanf9@stumbleupon.com\",\"job\":\"Developer I\"}"}
{ "body": "{\"id\":551,\"first_name\":\"Erinna\",\"email\":\"ecaskiefa@answers.com\",\"job\":\"Actuary\"}"}
{ "body": "{\"id\":552,\"first_name\":\"Brantley\",\"email\":\"barnsonfb@weebly.com\",\"job\":\"Engineer III\"}"}
{ "body": "{\"id\":553,\"first_name\":\"Sharron\",\"email\":\"sfatherfc@hao123.com\",\"job\":\"Civil Engineer\"}"}
{ "body": "{\"id\":554,\"first_name\":\"Andre\",\"email\":\"achapelhowfd@dagondesign.com\",\"job\":\"Project Manager\"}"}
{ "body": "{\"id\":555,\"first_name\":\"Raimondo\",\"email\":\"rrapinfe@europa.eu\",\"job\":\"Marketing Assistant\"}"}
{ "body": "{\"id\":556,\"first_name\":\"Dwight\",\"email\":\"dduligallff@virginia.edu\",\"job\":\"Engineer III\"}"}
{ "body": "{\"id\":557,\"first_name\":\"Jae\",\"email\":\"joswalfg@cdc.gov\",\"job\":\"Computer Systems Analyst I\"}"}
{ "body": "{\"id\":558,\"first_name\":\"Nels\",\"email\":\"nblindermannfh@sogou.com\",\"job\":\"Civil Engineer\"}"}
{ "body": "{\"id\":559,\"first_name\":\"Natala\",\"email\":\"nseebrightfi@sciencedaily.com\",\"job\":\"Senior Quality Engineer\"}"}
{ "body": "{\"id\":560,\"first_name\":\"Ilaire\",\"email\":\"igiottofj@reverbnation.com\",\"job\":\"VP Sales\"}"}
{ "body": "{\"id\":561,\"first_name\":\"Caron\",\"email\":\"ccarverhillfk@cdc.gov\",\"job\":\"Administrative Officer\"}"}
{ "body": "{\"id\":562,\"first_name\":\"Jojo\",\"email\":\"jloomesfl@ftc.gov\",\"job\":\"Computer Systems Analyst III\"}"}
{ "body": "{\"id\":563,\"first_name\":\"Hollis\",\"email\":\"hcoultarfm@elegantthemes.com\",\"job\":\"Marketing Manager\"}"}
{ "body": "{\"id\":564,\"first_name\":\"Charita\",\"email\":\"cracefn@sakura.ne.jp\",\"job\":\"VP Quality Control\"}"}
{ "body": "{\"id\":565,\"first_name\":\"Norean\",\"email\":\"npenimanfo@last.fm\",\"job\":\"Electrical Engineer\"}"}
{ "body": "{\"id\":566,\"first_name\":\"Arv\",\"email\":\"asherrocksfp@ted.com\",\"job\":\"Environmental Tech\"}"}
{ "body": "{\"id\":567,\"first_name\":\"Editha\",\"email\":\"emottersheadfq@webeden.co.uk\",\"job\":\"Clinical Specialist\"}"}
{ "body": "{\"id\":568,\"first_name\":\"Mallissa\",\"email\":\"mgreedyfr@nifty.com\",\"job\":\"Media Manager II\"}"}
{ "body": "{\"id\":569,\"first_name\":\"Sax\",\"email\":\"sbischoffs@networkadvertising.org\",\"job\":\"Database Administrator I\"}"}
{ "body": "{\"id\":570,\"first_name\":\"Arlin\",\"email\":\"ahowickft@yellowbook.com\",\"job\":\"Accountant II\"}"}
{ "body": "{\"id\":571,\"first_name\":\"Corry\",\"email\":\"cportmanfu@gmpg.org\",\"job\":\"Professor\"}"}
{ "body": "{\"id\":572,\"first_name\":\"Beau\",\"email\":\"bbettesworthfv@w3.org\",\"job\":\"Administrative Assistant III\"}"}
{ "body": "{\"id\":573,\"first_name\":\"Tersina\",\"email\":\"tandrellifw@people.com.cn\",\"job\":\"Marketing Manager\"}"}
{ "body": "{\"id\":574,\"first_name\":\"Jacklyn\",\"email\":\"jpaeckmeyerfx@rambler.ru\",\"job\":\"Assistant Professor\"}"}
{ "body": "{\"id\":575,\"first_name\":\"Robena\",\"email\":\"rlylefy@dropbox.com\",\"job\":\"Account Coordinator\"}"}
{ "body": "{\"id\":576,\"first_name\":\"Jo\",\"email\":\"jdewfz@nasa.gov\",\"job\":\"Structural Analysis Engineer\"}"}
{ "body": "{\"id\":577,\"first_name\":\"Carrol\",\"email\":\"cdrohang0@utexas.edu\",\"job\":\"Programmer Analyst I\"}"}
{ "body": "{\"id\":578,\"first_name\":\"Hedda\",\"email\":\"hberreclothg1@csmonitor.com\",\"job\":\"Registered Nurse\"}"}
{ "body": "{\"id\":579,\"first_name\":\"Matty\",\"email\":\"mbullerg2@typepad.com\",\"job\":\"Accountant IV\"}"}
{ "body": "{\"id\":580,\"first_name\":\"Tito\",\"email\":\"tlarkbyg3@google.com\",\"job\":\"Clinical Specialist\"}"}
{ "body": "{\"id\":581,\"first_name\":\"Culver\",\"email\":\"ccarloneg4@cbsnews.com\",\"job\":\"VP Accounting\"}"}
{ "body": "{\"id\":582,\"first_name\":\"Isidore\",\"email\":\"ipecholdg5@ebay.com\",\"job\":\"Office Assistant III\"}"}
{ "body": "{\"id\":583,\"first_name\":\"Babette\",\"email\":\"bspooleg6@issuu.com\",\"job\":\"Financial Analyst\"}"}
{ "body": "{\"id\":584,\"first_name\":\"Aarika\",\"email\":\"ajeannenetg7@berkeley.edu\",\"job\":\"Systems Administrator IV\"}"}
{ "body": "{\"id\":585,\"first_name\":\"Buddie\",\"email\":\"bveitchg8@cpanel.net\",\"job\":\"Senior Sales Associate\"}"}
{ "body": "{\"id\":586,\"first_name\":\"Silvio\",\"email\":\"seslieg9@tumblr.com\",\"job\":\"Marketing Assistant\"}"}
{ "body": "{\"id\":587,\"first_name\":\"Alie\",\"email\":\"abehninckga@nymag.com\",\"job\":\"Nurse\"}"}
{ "body": "{\"id\":588,\"first_name\":\"Fanny\",\"email\":\"flevenskygb@addthis.com\",\"job\":\"Database Administrator II\"}"}
{ "body": "{\"id\":589,\"first_name\":\"Rycca\",\"email\":\"rbeamesgc@live.com\",\"job\":\"Internal Auditor\"}"}
{ "body": "{\"id\":590,\"first_name\":\"Oralla\",\"email\":\"ogriffithgd@adobe.com\",\"job\":\"Community Outreach Specialist\"}"}
{ "body": "{\"id\":591,\"first_name\":\"Cordelie\",\"email\":\"cbrattange@twitpic.com\",\"job\":\"Database Administrator I\"}"}
{ "body": "{\"id\":592,\"first_name\":\"Caryl\",\"email\":\"ctommasuzzigf@ow.ly\",\"job\":\"Project Manager\"}"}
{ "body": "{\"id\":593,\"first_name\":\"Belle\",\"email\":\"bbouchergg@delicious.com\",\"job\":\"Geologist I\"}"}
{ "body": "{\"id\":594,\"first_name\":\"Joshuah\",\"email\":\"jpiccopgh@nifty.com\",\"job\":\"Graphic Designer\"}"}
{ "body": "{\"id\":595,\"first_name\":\"Dean\",\"email\":\"dmalyangi@deviantart.com\",\"job\":\"Nurse Practicioner\"}"}
{ "body": "{\"id\":596,\"first_name\":\"Alberto\",\"email\":\"agatleygj@craigslist.org\",\"job\":\"Accountant III\"}"}
{ "body": "{\"id\":597,\"first_name\":\"Emerson\",\"email\":\"eohalleghanegk@foxnews.com\",\"job\":\"VP Sales\"}"}
{ "body": "{\"id\":598,\"first_name\":\"Jasmin\",\"email\":\"jcreebergl@photobucket.com\",\"job\":\"Cost Accountant\"}"}
{ "body": "{\"id\":599,\"first_name\":\"Leslie\",\"email\":\"lyepiskovgm@simplemachines.org\",\"job\":\"Engineer III\"}"}
{ "body": "{\"id\":600,\"first_name\":\"Kassie\",\"email\":\"kbantongn@abc.net.au\",\"job\":\"Human Resources Manager\"}"}
{ "body": "{\"id\":601,\"first_name\":\"Gottfried\",\"email\":\"gsummerlygo@google.com.hk\",\"job\":\"Environmental Tech\"}"}
{ "body": "{\"id\":602,\"first_name\":\"Thaxter\",\"email\":\"tlandsburygp@myspace.com\",\"job\":\"Librarian\"}"}
{ "body": "{\"id\":603,\"first_name\":\"Celinka\",\"email\":\"churlgq@oakley.com\",\"job\":\"Statistician I\"}"}
{ "body": "{\"id\":604,\"first_name\":\"Alex\",\"email\":\"acanepegr@youtube.com\",\"job\":\"Executive Secretary\"}"}
{ "body": "{\"id\":605,\"first_name\":\"Clerc\",\"email\":\"cwesthofergs@dion.ne.jp\",\"job\":\"Software Engineer I\"}"}
{ "body": "{\"id\":606,\"first_name\":\"Harwell\",\"email\":\"hlandmangt@marriott.com\",\"job\":\"Quality Control Specialist\"}"}
{ "body": "{\"id\":607,\"first_name\":\"Lennard\",\"email\":\"lpillingtongu@bloglovin.com\",\"job\":\"Nurse Practicioner\"}"}
{ "body": "{\"id\":608,\"first_name\":\"Nadia\",\"email\":\"nshewongv@marriott.com\",\"job\":\"Software Test Engineer II\"}"}
{ "body": "{\"id\":609,\"first_name\":\"Felic\",\"email\":\"fkidsongw@photobucket.com\",\"job\":\"Sales Associate\"}"}
{ "body": "{\"id\":610,\"first_name\":\"Amandie\",\"email\":\"abarocgx@nps.gov\",\"job\":\"Senior Sales Associate\"}"}
{ "body": "{\"id\":611,\"first_name\":\"Cosme\",\"email\":\"cfogtgy@umich.edu\",\"job\":\"Account Representative II\"}"}
{ "body": "{\"id\":612,\"first_name\":\"Roanne\",\"email\":\"rrobathamgz@jigsy.com\",\"job\":\"Health Coach IV\"}"}
{ "body": "{\"id\":613,\"first_name\":\"Mar\",\"email\":\"mtilmouthh0@flavors.me\",\"job\":\"Sales Associate\"}"}
{ "body": "{\"id\":614,\"first_name\":\"Arabele\",\"email\":\"amcallisterh1@google.com.au\",\"job\":\"Staff Accountant II\"}"}
{ "body": "{\"id\":615,\"first_name\":\"Kynthia\",\"email\":\"ktithecoteh2@princeton.edu\",\"job\":\"Engineer II\"}"}
{ "body": "{\"id\":616,\"first_name\":\"Denys\",\"email\":\"dcarloneh3@123-reg.co.uk\",\"job\":\"General Manager\"}"}
{ "body": "{\"id\":617,\"first_name\":\"Christabella\",\"email\":\"csaggsh4@narod.ru\",\"job\":\"Project Manager\"}"}
{ "body": "{\"id\":618,\"first_name\":\"Gay\",\"email\":\"ghawkeridgeh5@posterous.com\",\"job\":\"Tax Accountant\"}"}
{ "body": "{\"id\":619,\"first_name\":\"Quincy\",\"email\":\"qlissimoreh6@nps.gov\",\"job\":\"Statistician IV\"}"}
{ "body": "{\"id\":620,\"first_name\":\"Cody\",\"email\":\"cpontinh7@addthis.com\",\"job\":\"General Manager\"}"}
{ "body": "{\"id\":621,\"first_name\":\"Mildrid\",\"email\":\"mdomelowh8@edublogs.org\",\"job\":\"VP Quality Control\"}"}
{ "body": "{\"id\":622,\"first_name\":\"Luciano\",\"email\":\"lzornh9@china.com.cn\",\"job\":\"Staff Scientist\"}"}
{ "body": "{\"id\":623,\"first_name\":\"Carmita\",\"email\":\"criccardha@blogtalkradio.com\",\"job\":\"Systems Administrator III\"}"}
{ "body": "{\"id\":624,\"first_name\":\"Cally\",\"email\":\"cstainerhb@123-reg.co.uk\",\"job\":\"Senior Financial Analyst\"}"}
{ "body": "{\"id\":625,\"first_name\":\"Carmella\",\"email\":\"ckeaysellhc@amazon.co.uk\",\"job\":\"Biostatistician III\"}"}
{ "body": "{\"id\":626,\"first_name\":\"Ernestus\",\"email\":\"erumboldhd@walmart.com\",\"job\":\"Systems Administrator II\"}"}
{ "body": "{\"id\":627,\"first_name\":\"Dena\",\"email\":\"dgrishechkinhe@sitemeter.com\",\"job\":\"Junior Executive\"}"}
{ "body": "{\"id\":628,\"first_name\":\"Karrie\",\"email\":\"kheldhf@chron.com\",\"job\":\"Director of Sales\"}"}
{ "body": "{\"id\":629,\"first_name\":\"Alfonso\",\"email\":\"aclinnickhg@i2i.jp\",\"job\":\"Associate Professor\"}"}
{ "body": "{\"id\":630,\"first_name\":\"Pren\",\"email\":\"pavannhh@digg.com\",\"job\":\"Assistant Manager\"}"}
{ "body": "{\"id\":631,\"first_name\":\"Dulcy\",\"email\":\"dsallyhi@sciencedaily.com\",\"job\":\"Recruiter\"}"}
{ "body": "{\"id\":632,\"first_name\":\"Chalmers\",\"email\":\"cjirsahj@theglobeandmail.com\",\"job\":\"Systems Administrator I\"}"}
{ "body": "{\"id\":633,\"first_name\":\"Hoyt\",\"email\":\"hwhitesonhk@epa.gov\",\"job\":\"VP Marketing\"}"}
{ "body": "{\"id\":634,\"first_name\":\"Theressa\",\"email\":\"tstinchcombehl@wunderground.com\",\"job\":\"Web Developer IV\"}"}
{ "body": "{\"id\":635,\"first_name\":\"Tiertza\",\"email\":\"tcatterickhm@un.org\",\"job\":\"Safety Technician III\"}"}
{ "body": "{\"id\":636,\"first_name\":\"Kathleen\",\"email\":\"kgreesonhn@i2i.jp\",\"job\":\"Assistant Media Planner\"}"}
{ "body": "{\"id\":637,\"first_name\":\"Alwin\",\"email\":\"athurbonho@fotki.com\",\"job\":\"Financial Advisor\"}"}
{ "body": "{\"id\":638,\"first_name\":\"Linet\",\"email\":\"lbedenhamhp@so-net.ne.jp\",\"job\":\"Account Coordinator\"}"}
{ "body": "{\"id\":639,\"first_name\":\"Hubie\",\"email\":\"hlivenshq@geocities.com\",\"job\":\"Chief Design Engineer\"}"}
{ "body": "{\"id\":640,\"first_name\":\"Fergus\",\"email\":\"frablenhr@patch.com\",\"job\":\"Quality Engineer\"}"}
{ "body": "{\"id\":641,\"first_name\":\"Rozelle\",\"email\":\"rcameratihs@amazon.co.jp\",\"job\":\"Speech Pathologist\"}"}
{ "body": "{\"id\":642,\"first_name\":\"Paco\",\"email\":\"pgaitunght@hc360.com\",\"job\":\"Social Worker\"}"}
{ "body": "{\"id\":643,\"first_name\":\"Raymond\",\"email\":\"rkarlowiczhu@gnu.org\",\"job\":\"Help Desk Operator\"}"}
{ "body": "{\"id\":644,\"first_name\":\"Brody\",\"email\":\"bbaberhv@sfgate.com\",\"job\":\"Senior Cost Accountant\"}"}
{ "body": "{\"id\":645,\"first_name\":\"Forster\",\"email\":\"fhuncotehw@dmoz.org\",\"job\":\"Chemical Engineer\"}"}
{ "body": "{\"id\":646,\"first_name\":\"Anabelle\",\"email\":\"abenardettehx@gmpg.org\",\"job\":\"Information Systems Manager\"}"}
{ "body": "{\"id\":647,\"first_name\":\"Atlante\",\"email\":\"atabernerhy@istockphoto.com\",\"job\":\"Computer Systems Analyst III\"}"}
{ "body": "{\"id\":648,\"first_name\":\"Gretta\",\"email\":\"gcampeyhz@blinklist.com\",\"job\":\"Programmer Analyst II\"}"}
{ "body": "{\"id\":649,\"first_name\":\"Grethel\",\"email\":\"ggheeraerti0@fda.gov\",\"job\":\"Community Outreach Specialist\"}"}
{ "body": "{\"id\":650,\"first_name\":\"Meggy\",\"email\":\"mstringfellowi1@whitehouse.gov\",\"job\":\"Payment Adjustment Coordinator\"}"}
{ "body": "{\"id\":651,\"first_name\":\"Quintina\",\"email\":\"qondrichi2@marriott.com\",\"job\":\"Senior Sales Associate\"}"}
{ "body": "{\"id\":652,\"first_name\":\"Dylan\",\"email\":\"drentenbecki3@netscape.com\",\"job\":\"Dental Hygienist\"}"}
{ "body": "{\"id\":653,\"first_name\":\"Donovan\",\"email\":\"dalcidei4@sciencedirect.com\",\"job\":\"Compensation Analyst\"}"}
{ "body": "{\"id\":654,\"first_name\":\"Rhiamon\",\"email\":\"rkenderi5@rediff.com\",\"job\":\"Professor\"}"}
{ "body": "{\"id\":655,\"first_name\":\"Genovera\",\"email\":\"ggorvini6@trellian.com\",\"job\":\"Health Coach III\"}"}
{ "body": "{\"id\":656,\"first_name\":\"Warren\",\"email\":\"wsaccoi7@ask.com\",\"job\":\"Analog Circuit Design manager\"}"}
{ "body": "{\"id\":657,\"first_name\":\"Marcellina\",\"email\":\"mkerini8@yale.edu\",\"job\":\"Programmer Analyst II\"}"}
{ "body": "{\"id\":658,\"first_name\":\"Pennie\",\"email\":\"prolinsoni9@pen.io\",\"job\":\"Compensation Analyst\"}"}
{ "body": "{\"id\":659,\"first_name\":\"Padraic\",\"email\":\"pgrigoria@goo.ne.jp\",\"job\":\"Computer Systems Analyst III\"}"}
{ "body": "{\"id\":660,\"first_name\":\"Boonie\",\"email\":\"bboundsib@virginia.edu\",\"job\":\"Data Coordiator\"}"}
{ "body": "{\"id\":661,\"first_name\":\"Sela\",\"email\":\"sdudmeshic@reverbnation.com\",\"job\":\"Media Manager IV\"}"}
{ "body": "{\"id\":662,\"first_name\":\"Gunilla\",\"email\":\"ggissingid@china.com.cn\",\"job\":\"Structural Engineer\"}"}
{ "body": "{\"id\":663,\"first_name\":\"Diannne\",\"email\":\"djirusie@epa.gov\",\"job\":\"General Manager\"}"}
{ "body": "{\"id\":664,\"first_name\":\"Cybill\",\"email\":\"cpennif@google.com.br\",\"job\":\"Paralegal\"}"}
{ "body": "{\"id\":665,\"first_name\":\"Roland\",\"email\":\"rtrippackig@answers.com\",\"job\":\"Research Assistant I\"}"}
{ "body": "{\"id\":666,\"first_name\":\"Van\",\"email\":\"vlyokhinih@slate.com\",\"job\":\"Automation Specialist I\"}"}
{ "body": "{\"id\":667,\"first_name\":\"Kevina\",\"email\":\"kprickettii@marriott.com\",\"job\":\"Marketing Manager\"}"}
{ "body": "{\"id\":668,\"first_name\":\"Freemon\",\"email\":\"fmckinneyij@i2i.jp\",\"job\":\"Cost Accountant\"}"}
{ "body": "{\"id\":669,\"first_name\":\"Kevin\",\"email\":\"kmaccorkellik@tripadvisor.com\",\"job\":\"Database Administrator IV\"}"}
{ "body": "{\"id\":670,\"first_name\":\"Fayina\",\"email\":\"fbarneveldil@yahoo.co.jp\",\"job\":\"Senior Financial Analyst\"}"}
{ "body": "{\"id\":671,\"first_name\":\"Carmelle\",\"email\":\"cblakerim@bbc.co.uk\",\"job\":\"Business Systems Development Analyst\"}"}
{ "body": "{\"id\":672,\"first_name\":\"Rosie\",\"email\":\"rmattheusin@tinyurl.com\",\"job\":\"Sales Representative\"}"}
{ "body": "{\"id\":673,\"first_name\":\"Sheryl\",\"email\":\"sbowdenio@home.pl\",\"job\":\"Human Resources Assistant IV\"}"}
{ "body": "{\"id\":674,\"first_name\":\"Dannye\",\"email\":\"diddensip@cnbc.com\",\"job\":\"Chemical Engineer\"}"}
{ "body": "{\"id\":675,\"first_name\":\"Pasquale\",\"email\":\"pcolhouniq@vkontakte.ru\",\"job\":\"Senior Sales Associate\"}"}
{ "body": "{\"id\":676,\"first_name\":\"Betta\",\"email\":\"bcaffreyir@prnewswire.com\",\"job\":\"Teacher\"}"}
{ "body": "{\"id\":677,\"first_name\":\"Carolan\",\"email\":\"cdickmanis@sciencedirect.com\",\"job\":\"VP Product Management\"}"}
{ "body": "{\"id\":678,\"first_name\":\"Olwen\",\"email\":\"okirkamit@mtv.com\",\"job\":\"Nuclear Power Engineer\"}"}
{ "body": "{\"id\":679,\"first_name\":\"Marmaduke\",\"email\":\"myaneziu@lycos.com\",\"job\":\"Tax Accountant\"}"}
{ "body": "{\"id\":680,\"first_name\":\"Elisha\",\"email\":\"edurtneliv@symantec.com\",\"job\":\"Health Coach IV\"}"}
{ "body": "{\"id\":681,\"first_name\":\"Lind\",\"email\":\"lrediw@engadget.com\",\"job\":\"Help Desk Operator\"}"}
{ "body": "{\"id\":682,\"first_name\":\"Ruby\",\"email\":\"rhedgecockix@webeden.co.uk\",\"job\":\"Desktop Support Technician\"}"}
{ "body": "{\"id\":683,\"first_name\":\"Arch\",\"email\":\"areynaultiy@networkadvertising.org\",\"job\":\"Compensation Analyst\"}"}
{ "body": "{\"id\":684,\"first_name\":\"Garold\",\"email\":\"gcolthurstiz@cocolog-nifty.com\",\"job\":\"Professor\"}"}
{ "body": "{\"id\":685,\"first_name\":\"Seward\",\"email\":\"sapplegatej0@miibeian.gov.cn\",\"job\":\"Physical Therapy Assistant\"}"}
{ "body": "{\"id\":686,\"first_name\":\"Fionnula\",\"email\":\"fcunahj1@auda.org.au\",\"job\":\"Human Resources Manager\"}"}
{ "body": "{\"id\":687,\"first_name\":\"Clarke\",\"email\":\"ccambridgej2@dropbox.com\",\"job\":\"Account Executive\"}"}
{ "body": "{\"id\":688,\"first_name\":\"Therine\",\"email\":\"tjacombj3@nba.com\",\"job\":\"Senior Sales Associate\"}"}
{ "body": "{\"id\":689,\"first_name\":\"Forest\",\"email\":\"fsearsj4@ed.gov\",\"job\":\"Human Resources Manager\"}"}
{ "body": "{\"id\":690,\"first_name\":\"Nicky\",\"email\":\"nruselinj5@tripadvisor.com\",\"job\":\"Software Test Engineer IV\"}"}
{ "body": "{\"id\":691,\"first_name\":\"Jilly\",\"email\":\"jkegleyj6@privacy.gov.au\",\"job\":\"Senior Quality Engineer\"}"}
{ "body": "{\"id\":692,\"first_name\":\"Paulie\",\"email\":\"ppollicotej7@unicef.org\",\"job\":\"Nuclear Power Engineer\"}"}
{ "body": "{\"id\":693,\"first_name\":\"Bette-ann\",\"email\":\"bselbiej8@blog.com\",\"job\":\"Registered Nurse\"}"}
{ "body": "{\"id\":694,\"first_name\":\"Revkah\",\"email\":\"rgonsalvezj9@xrea.com\",\"job\":\"VP Sales\"}"}
{ "body": "{\"id\":695,\"first_name\":\"Warren\",\"email\":\"wearpeja@dot.gov\",\"job\":\"Marketing Manager\"}"}
{ "body": "{\"id\":696,\"first_name\":\"Luce\",\"email\":\"ldousejb@deliciousdays.com\",\"job\":\"Staff Accountant I\"}"}
{ "body": "{\"id\":697,\"first_name\":\"Clem\",\"email\":\"cgablejc@hugedomains.com\",\"job\":\"GIS Technical Architect\"}"}
{ "body": "{\"id\":698,\"first_name\":\"Sofie\",\"email\":\"sgoldfinchjd@gravatar.com\",\"job\":\"Quality Control Specialist\"}"}
{ "body": "{\"id\":699,\"first_name\":\"Sheffy\",\"email\":\"sacklandsje@squidoo.com\",\"job\":\"Clinical Specialist\"}"}
{ "body": "{\"id\":700,\"first_name\":\"Aili\",\"email\":\"acastellettojf@aol.com\",\"job\":\"Accountant I\"}"}
{ "body": "{\"id\":701,\"first_name\":\"Araldo\",\"email\":\"alippinijg@microsoft.com\",\"job\":\"Staff Accountant IV\"}"}
{ "body": "{\"id\":702,\"first_name\":\"Devon\",\"email\":\"dsallerjh@sina.com.cn\",\"job\":\"Design Engineer\"}"}
{ "body": "{\"id\":703,\"first_name\":\"Morgana\",\"email\":\"mharfordji@dyndns.org\",\"job\":\"Help Desk Operator\"}"}
{ "body": "{\"id\":704,\"first_name\":\"Genevra\",\"email\":\"gjubbjj@redcross.org\",\"job\":\"Assistant Manager\"}"}
{ "body": "{\"id\":705,\"first_name\":\"Cam\",\"email\":\"cbewshirejk@arstechnica.com\",\"job\":\"Help Desk Technician\"}"}
{ "body": "{\"id\":706,\"first_name\":\"Aldon\",\"email\":\"akempejl@nih.gov\",\"job\":\"Research Nurse\"}"}
{ "body": "{\"id\":707,\"first_name\":\"Ferne\",\"email\":\"fdoellejm@github.io\",\"job\":\"Compensation Analyst\"}"}
{ "body": "{\"id\":708,\"first_name\":\"Aymer\",\"email\":\"aesbergerjn@issuu.com\",\"job\":\"Human Resources Manager\"}"}
{ "body": "{\"id\":709,\"first_name\":\"Jacynth\",\"email\":\"joddajo@ed.gov\",\"job\":\"Editor\"}"}
{ "body": "{\"id\":710,\"first_name\":\"Gerrie\",\"email\":\"gwatmanjp@dailymail.co.uk\",\"job\":\"Desktop Support Technician\"}"}
{ "body": "{\"id\":711,\"first_name\":\"Dagmar\",\"email\":\"doshevlinjq@webmd.com\",\"job\":\"Analyst Programmer\"}"}
{ "body": "{\"id\":712,\"first_name\":\"Lilia\",\"email\":\"lcastilljojr@wsj.com\",\"job\":\"Web Developer I\"}"}
{ "body": "{\"id\":713,\"first_name\":\"Charyl\",\"email\":\"cmacilwrickjs@howstuffworks.com\",\"job\":\"Programmer Analyst III\"}"}
{ "body": "{\"id\":714,\"first_name\":\"Olivier\",\"email\":\"omoulsdalejt@ocn.ne.jp\",\"job\":\"Legal Assistant\"}"}
{ "body": "{\"id\":715,\"first_name\":\"Sully\",\"email\":\"scourtju@shop-pro.jp\",\"job\":\"Marketing Assistant\"}"}
{ "body": "{\"id\":716,\"first_name\":\"Cathryn\",\"email\":\"celverstonejv@weather.com\",\"job\":\"Recruiter\"}"}
{ "body": "{\"id\":717,\"first_name\":\"Rochette\",\"email\":\"rclemenzojw@wikipedia.org\",\"job\":\"Research Associate\"}"}
{ "body": "{\"id\":718,\"first_name\":\"Jasen\",\"email\":\"jcorainijx@ox.ac.uk\",\"job\":\"Geologist IV\"}"}
{ "body": "{\"id\":719,\"first_name\":\"Kalle\",\"email\":\"kgiacobazzijy@networkadvertising.org\",\"job\":\"Operator\"}"}
{ "body": "{\"id\":720,\"first_name\":\"Gaye\",\"email\":\"gmccalisterjz@gnu.org\",\"job\":\"Director of Sales\"}"}
{ "body": "{\"id\":721,\"first_name\":\"Hyacinthe\",\"email\":\"hcovillk0@constantcontact.com\",\"job\":\"Data Coordiator\"}"}
{ "body": "{\"id\":722,\"first_name\":\"Vicky\",\"email\":\"vgibbingsk1@yellowbook.com\",\"job\":\"Engineer I\"}"}
{ "body": "{\"id\":723,\"first_name\":\"Ransell\",\"email\":\"rtreecek2@mozilla.com\",\"job\":\"Assistant Manager\"}"}
{ "body": "{\"id\":724,\"first_name\":\"Arnoldo\",\"email\":\"ajerroltk3@scientificamerican.com\",\"job\":\"Staff Scientist\"}"}
{ "body": "{\"id\":725,\"first_name\":\"Ailyn\",\"email\":\"aprendergastk4@networkadvertising.org\",\"job\":\"Financial Analyst\"}"}
{ "body": "{\"id\":726,\"first_name\":\"Chrystel\",\"email\":\"chorbathk5@wix.com\",\"job\":\"Community Outreach Specialist\"}"}
{ "body": "{\"id\":727,\"first_name\":\"Billy\",\"email\":\"bboritk6@arstechnica.com\",\"job\":\"Software Consultant\"}"}
{ "body": "{\"id\":728,\"first_name\":\"Wendy\",\"email\":\"wborelandk7@hao123.com\",\"job\":\"VP Quality Control\"}"}
{ "body": "{\"id\":729,\"first_name\":\"Verile\",\"email\":\"vcroadk8@rediff.com\",\"job\":\"Data Coordiator\"}"}
{ "body": "{\"id\":730,\"first_name\":\"Abdul\",\"email\":\"acamblink9@paypal.com\",\"job\":\"Junior Executive\"}"}
{ "body": "{\"id\":731,\"first_name\":\"Thorsten\",\"email\":\"tturevilleka@hatena.ne.jp\",\"job\":\"Financial Advisor\"}"}
{ "body": "{\"id\":732,\"first_name\":\"Gaby\",\"email\":\"gdovidaitiskb@prlog.org\",\"job\":\"Director of Sales\"}"}
{ "body": "{\"id\":733,\"first_name\":\"Harli\",\"email\":\"hcarstairskc@goo.gl\",\"job\":\"Media Manager I\"}"}
{ "body": "{\"id\":734,\"first_name\":\"Netta\",\"email\":\"nbrieretonkd@cornell.edu\",\"job\":\"Safety Technician II\"}"}
{ "body": "{\"id\":735,\"first_name\":\"Dillie\",\"email\":\"dtrimbleke@ucla.edu\",\"job\":\"Geologist III\"}"}
{ "body": "{\"id\":736,\"first_name\":\"Nicoli\",\"email\":\"nbristerkf@dyndns.org\",\"job\":\"Compensation Analyst\"}"}
{ "body": "{\"id\":737,\"first_name\":\"Dasha\",\"email\":\"dtulleykg@t.co\",\"job\":\"Statistician I\"}"}
{ "body": "{\"id\":738,\"first_name\":\"Salomone\",\"email\":\"skindlesidekh@mashable.com\",\"job\":\"Biostatistician I\"}"}
{ "body": "{\"id\":739,\"first_name\":\"Andras\",\"email\":\"acissonki@bbb.org\",\"job\":\"Assistant Professor\"}"}
{ "body": "{\"id\":740,\"first_name\":\"Chaim\",\"email\":\"cbettinsonkj@lulu.com\",\"job\":\"Budget/Accounting Analyst I\"}"}
{ "body": "{\"id\":741,\"first_name\":\"Tammara\",\"email\":\"tallinkk@sfgate.com\",\"job\":\"Recruiter\"}"}
{ "body": "{\"id\":742,\"first_name\":\"Leora\",\"email\":\"lkiffinkl@odnoklassniki.ru\",\"job\":\"Executive Secretary\"}"}
{ "body": "{\"id\":743,\"first_name\":\"Emogene\",\"email\":\"ecoodekm@accuweather.com\",\"job\":\"VP Accounting\"}"}
{ "body": "{\"id\":744,\"first_name\":\"Hobart\",\"email\":\"hlarrattkn@discuz.net\",\"job\":\"Speech Pathologist\"}"}
{ "body": "{\"id\":745,\"first_name\":\"Daren\",\"email\":\"dnavarroko@answers.com\",\"job\":\"Biostatistician III\"}"}
{ "body": "{\"id\":746,\"first_name\":\"Sondra\",\"email\":\"sroakekp@bigcartel.com\",\"job\":\"Senior Sales Associate\"}"}
{ "body": "{\"id\":747,\"first_name\":\"Vinnie\",\"email\":\"vdullaghankq@guardian.co.uk\",\"job\":\"Electrical Engineer\"}"}
{ "body": "{\"id\":748,\"first_name\":\"Margie\",\"email\":\"mboomekr@nhs.uk\",\"job\":\"GIS Technical Architect\"}"}
{ "body": "{\"id\":749,\"first_name\":\"Emma\",\"email\":\"evidgenks@meetup.com\",\"job\":\"Geological Engineer\"}"}
{ "body": "{\"id\":750,\"first_name\":\"Marlo\",\"email\":\"mgrastyekt@baidu.com\",\"job\":\"Professor\"}"}
{ "body": "{\"id\":751,\"first_name\":\"Jorry\",\"email\":\"jaldhouseku@icio.us\",\"job\":\"Research Assistant II\"}"}
{ "body": "{\"id\":752,\"first_name\":\"Hagen\",\"email\":\"hjorgensenkv@nbcnews.com\",\"job\":\"VP Product Management\"}"}
{ "body": "{\"id\":753,\"first_name\":\"Jacinthe\",\"email\":\"jguwerkw@gizmodo.com\",\"job\":\"GIS Technical Architect\"}"}
{ "body": "{\"id\":754,\"first_name\":\"Velvet\",\"email\":\"vwyantkx@google.co.uk\",\"job\":\"Teacher\"}"}
{ "body": "{\"id\":755,\"first_name\":\"Lilias\",\"email\":\"lkitleeky@bloglovin.com\",\"job\":\"Product Engineer\"}"}
{ "body": "{\"id\":756,\"first_name\":\"Kacey\",\"email\":\"kdemcikkz@google.es\",\"job\":\"Quality Control Specialist\"}"}
{ "body": "{\"id\":757,\"first_name\":\"Bearnard\",\"email\":\"bcordell0@wunderground.com\",\"job\":\"Chief Design Engineer\"}"}
{ "body": "{\"id\":758,\"first_name\":\"Fanechka\",\"email\":\"fgosdinl1@house.gov\",\"job\":\"Occupational Therapist\"}"}
{ "body": "{\"id\":759,\"first_name\":\"Maryanna\",\"email\":\"mmaughanl2@dion.ne.jp\",\"job\":\"Human Resources Assistant II\"}"}
{ "body": "{\"id\":760,\"first_name\":\"Robinette\",\"email\":\"rhedditchl3@sohu.com\",\"job\":\"Systems Administrator II\"}"}
{ "body": "{\"id\":761,\"first_name\":\"Aliza\",\"email\":\"adurwardl4@wikimedia.org\",\"job\":\"Teacher\"}"}
{ "body": "{\"id\":762,\"first_name\":\"Minni\",\"email\":\"mjedraszekl5@businesswire.com\",\"job\":\"Quality Engineer\"}"}
{ "body": "{\"id\":763,\"first_name\":\"Fitz\",\"email\":\"farnetl6@seesaa.net\",\"job\":\"Community Outreach Specialist\"}"}
{ "body": "{\"id\":764,\"first_name\":\"Priscella\",\"email\":\"pjaherl7@marriott.com\",\"job\":\"Food Chemist\"}"}
{ "body": "{\"id\":765,\"first_name\":\"Marja\",\"email\":\"mdingleyl8@rambler.ru\",\"job\":\"Engineer I\"}"}
{ "body": "{\"id\":766,\"first_name\":\"Franni\",\"email\":\"flafayettel9@wix.com\",\"job\":\"Structural Engineer\"}"}
{ "body": "{\"id\":767,\"first_name\":\"Fayina\",\"email\":\"fduckla@scribd.com\",\"job\":\"Technical Writer\"}"}
{ "body": "{\"id\":768,\"first_name\":\"Maggi\",\"email\":\"mgriffittslb@deviantart.com\",\"job\":\"Cost Accountant\"}"}
{ "body": "{\"id\":769,\"first_name\":\"Homere\",\"email\":\"hmanterfieldlc@howstuffworks.com\",\"job\":\"Civil Engineer\"}"}
{ "body": "{\"id\":770,\"first_name\":\"Raoul\",\"email\":\"rwickeyld@google.fr\",\"job\":\"Research Nurse\"}"}
{ "body": "{\"id\":771,\"first_name\":\"Kermie\",\"email\":\"kskeermerle@tamu.edu\",\"job\":\"Accountant II\"}"}
{ "body": "{\"id\":772,\"first_name\":\"Steffane\",\"email\":\"sbrendishlf@live.com\",\"job\":\"Software Consultant\"}"}
{ "body": "{\"id\":773,\"first_name\":\"Lisle\",\"email\":\"lhattlg@weibo.com\",\"job\":\"Teacher\"}"}
{ "body": "{\"id\":774,\"first_name\":\"Pearle\",\"email\":\"poakdenlh@cnbc.com\",\"job\":\"Associate Professor\"}"}
{ "body": "{\"id\":775,\"first_name\":\"Herold\",\"email\":\"hmusicoli@loc.gov\",\"job\":\"Internal Auditor\"}"}
{ "body": "{\"id\":776,\"first_name\":\"Archambault\",\"email\":\"ahawkridgelj@sitemeter.com\",\"job\":\"Financial Analyst\"}"}
{ "body": "{\"id\":777,\"first_name\":\"Emmy\",\"email\":\"emandellk@japanpost.jp\",\"job\":\"Software Test Engineer IV\"}"}
{ "body": "{\"id\":778,\"first_name\":\"Colas\",\"email\":\"cheavyll@sciencedirect.com\",\"job\":\"Marketing Manager\"}"}
{ "body": "{\"id\":779,\"first_name\":\"Mikkel\",\"email\":\"mdrummerlm@amazon.co.jp\",\"job\":\"Systems Administrator IV\"}"}
{ "body": "{\"id\":780,\"first_name\":\"Ewart\",\"email\":\"esurmeyerln@rambler.ru\",\"job\":\"Clinical Specialist\"}"}
{ "body": "{\"id\":781,\"first_name\":\"Jere\",\"email\":\"jcapslo@epa.gov\",\"job\":\"Office Assistant IV\"}"}
{ "body": "{\"id\":782,\"first_name\":\"Ceil\",\"email\":\"cbygottlp@state.gov\",\"job\":\"Safety Technician II\"}"}
{ "body": "{\"id\":783,\"first_name\":\"Mabelle\",\"email\":\"mcornwalllq@xinhuanet.com\",\"job\":\"Chief Design Engineer\"}"}
{ "body": "{\"id\":784,\"first_name\":\"Nolie\",\"email\":\"npirrilr@devhub.com\",\"job\":\"Media Manager III\"}"}
{ "body": "{\"id\":785,\"first_name\":\"Mara\",\"email\":\"mderwinls@spiegel.de\",\"job\":\"Electrical Engineer\"}"}
{ "body": "{\"id\":786,\"first_name\":\"Hill\",\"email\":\"hattwilllt@dedecms.com\",\"job\":\"Community Outreach Specialist\"}"}
{ "body": "{\"id\":787,\"first_name\":\"Ralina\",\"email\":\"rcloustonlu@reference.com\",\"job\":\"Electrical Engineer\"}"}
{ "body": "{\"id\":788,\"first_name\":\"Cy\",\"email\":\"cfehnerslv@ebay.com\",\"job\":\"Database Administrator I\"}"}
{ "body": "{\"id\":789,\"first_name\":\"Lind\",\"email\":\"ldargavellw@ft.com\",\"job\":\"Associate Professor\"}"}
{ "body": "{\"id\":790,\"first_name\":\"Zara\",\"email\":\"zpereslx@cmu.edu\",\"job\":\"Web Developer III\"}"}
{ "body": "{\"id\":791,\"first_name\":\"Nonie\",\"email\":\"ntealely@independent.co.uk\",\"job\":\"Human Resources Assistant I\"}"}
{ "body": "{\"id\":792,\"first_name\":\"Gabriello\",\"email\":\"gcoetzeelz@archive.org\",\"job\":\"Senior Quality Engineer\"}"}
{ "body": "{\"id\":793,\"first_name\":\"Brynna\",\"email\":\"bborrowsm0@flavors.me\",\"job\":\"Physical Therapy Assistant\"}"}
{ "body": "{\"id\":794,\"first_name\":\"Guntar\",\"email\":\"gduerdenm1@icio.us\",\"job\":\"Account Executive\"}"}
{ "body": "{\"id\":795,\"first_name\":\"Boigie\",\"email\":\"battwaterm2@ed.gov\",\"job\":\"Occupational Therapist\"}"}
{ "body": "{\"id\":796,\"first_name\":\"Guinevere\",\"email\":\"gverrickm3@eventbrite.com\",\"job\":\"Speech Pathologist\"}"}
{ "body": "{\"id\":797,\"first_name\":\"Kimbra\",\"email\":\"krozalskim4@studiopress.com\",\"job\":\"Mechanical Systems Engineer\"}"}
{ "body": "{\"id\":798,\"first_name\":\"Alisha\",\"email\":\"afeym5@wikispaces.com\",\"job\":\"Senior Cost Accountant\"}"}
{ "body": "{\"id\":799,\"first_name\":\"Tarrance\",\"email\":\"ttallboym6@skype.com\",\"job\":\"Software Consultant\"}"}
{ "body": "{\"id\":800,\"first_name\":\"Neale\",\"email\":\"ndodingm7@auda.org.au\",\"job\":\"Geologist IV\"}"}
{ "body": "{\"id\":801,\"first_name\":\"Jorge\",\"email\":\"jstearnsm8@princeton.edu\",\"job\":\"Database Administrator III\"}"}
{ "body": "{\"id\":802,\"first_name\":\"George\",\"email\":\"gdresserm9@nationalgeographic.com\",\"job\":\"Social Worker\"}"}
{ "body": "{\"id\":803,\"first_name\":\"Susanne\",\"email\":\"sburridgema@fda.gov\",\"job\":\"Occupational Therapist\"}"}
{ "body": "{\"id\":804,\"first_name\":\"Giraud\",\"email\":\"gpaulsenmb@sphinn.com\",\"job\":\"Safety Technician II\"}"}
{ "body": "{\"id\":805,\"first_name\":\"Conni\",\"email\":\"ckeepingmc@mozilla.org\",\"job\":\"Data Coordiator\"}"}
{ "body": "{\"id\":806,\"first_name\":\"Mirabella\",\"email\":\"mknapmanmd@constantcontact.com\",\"job\":\"Data Coordiator\"}"}
{ "body": "{\"id\":807,\"first_name\":\"Joel\",\"email\":\"jmaccoleme@cdc.gov\",\"job\":\"Assistant Manager\"}"}
{ "body": "{\"id\":808,\"first_name\":\"Merrily\",\"email\":\"mmussardmf@yandex.ru\",\"job\":\"Web Designer IV\"}"}
{ "body": "{\"id\":809,\"first_name\":\"Ermanno\",\"email\":\"ewinspiremg@gizmodo.com\",\"job\":\"Graphic Designer\"}"}
{ "body": "{\"id\":810,\"first_name\":\"Fonsie\",\"email\":\"frieplmh@unc.edu\",\"job\":\"Financial Advisor\"}"}
{ "body": "{\"id\":811,\"first_name\":\"Latrina\",\"email\":\"lbridgermi@house.gov\",\"job\":\"Compensation Analyst\"}"}
{ "body": "{\"id\":812,\"first_name\":\"Jehanna\",\"email\":\"jmacaughtriemj@i2i.jp\",\"job\":\"Nurse Practicioner\"}"}
{ "body": "{\"id\":813,\"first_name\":\"Sancho\",\"email\":\"swhiskinmk@devhub.com\",\"job\":\"Engineer IV\"}"}
{ "body": "{\"id\":814,\"first_name\":\"Addy\",\"email\":\"amatzenml@arstechnica.com\",\"job\":\"Paralegal\"}"}
{ "body": "{\"id\":815,\"first_name\":\"Gav\",\"email\":\"ghowsegomm@geocities.com\",\"job\":\"Accountant IV\"}"}
{ "body": "{\"id\":816,\"first_name\":\"Thedric\",\"email\":\"tchealemn@360.cn\",\"job\":\"Business Systems Development Analyst\"}"}
{ "body": "{\"id\":817,\"first_name\":\"Suellen\",\"email\":\"smoodycliffemo@tinyurl.com\",\"job\":\"Community Outreach Specialist\"}"}
{ "body": "{\"id\":818,\"first_name\":\"Andrei\",\"email\":\"ayarkermp@nydailynews.com\",\"job\":\"Biostatistician I\"}"}
{ "body": "{\"id\":819,\"first_name\":\"Hermina\",\"email\":\"helderkinmq@howstuffworks.com\",\"job\":\"Design Engineer\"}"}
{ "body": "{\"id\":820,\"first_name\":\"Skye\",\"email\":\"swellummr@imdb.com\",\"job\":\"VP Accounting\"}"}
{ "body": "{\"id\":821,\"first_name\":\"Frasquito\",\"email\":\"fdunkinsonms@washington.edu\",\"job\":\"Web Developer IV\"}"}
{ "body": "{\"id\":822,\"first_name\":\"Lin\",\"email\":\"ldarleymt@dion.ne.jp\",\"job\":\"Senior Editor\"}"}
{ "body": "{\"id\":823,\"first_name\":\"Lorettalorna\",\"email\":\"lfeyermu@quantcast.com\",\"job\":\"Chief Design Engineer\"}"}
{ "body": "{\"id\":824,\"first_name\":\"Debera\",\"email\":\"dmellingmv@imdb.com\",\"job\":\"Pharmacist\"}"}
{ "body": "{\"id\":825,\"first_name\":\"Gardener\",\"email\":\"gmitchardmw@skyrock.com\",\"job\":\"Chemical Engineer\"}"}
{ "body": "{\"id\":826,\"first_name\":\"Adora\",\"email\":\"abernadonmx@quantcast.com\",\"job\":\"Editor\"}"}
{ "body": "{\"id\":827,\"first_name\":\"Laural\",\"email\":\"lshilitomy@cargocollective.com\",\"job\":\"Executive Secretary\"}"}
{ "body": "{\"id\":828,\"first_name\":\"Daniel\",\"email\":\"dstantonmz@google.com.hk\",\"job\":\"Senior Editor\"}"}
{ "body": "{\"id\":829,\"first_name\":\"Tomasina\",\"email\":\"tmccawn0@howstuffworks.com\",\"job\":\"Technical Writer\"}"}
{ "body": "{\"id\":830,\"first_name\":\"Ferne\",\"email\":\"fgagern1@nih.gov\",\"job\":\"Software Consultant\"}"}
{ "body": "{\"id\":831,\"first_name\":\"Laural\",\"email\":\"lmaturan2@mysql.com\",\"job\":\"Media Manager III\"}"}
{ "body": "{\"id\":832,\"first_name\":\"Christoph\",\"email\":\"cgoldhilln3@com.com\",\"job\":\"Registered Nurse\"}"}
{ "body": "{\"id\":833,\"first_name\":\"Julissa\",\"email\":\"jmcmorlandn4@simplemachines.org\",\"job\":\"Safety Technician II\"}"}
{ "body": "{\"id\":834,\"first_name\":\"Rosa\",\"email\":\"ryoungen5@sun.com\",\"job\":\"Geologist II\"}"}
{ "body": "{\"id\":835,\"first_name\":\"Paulo\",\"email\":\"pdallowayn6@unblog.fr\",\"job\":\"Office Assistant IV\"}"}
{ "body": "{\"id\":836,\"first_name\":\"Aurlie\",\"email\":\"amoulesn7@squidoo.com\",\"job\":\"Computer Systems Analyst I\"}"}
{ "body": "{\"id\":837,\"first_name\":\"Rosanne\",\"email\":\"rbrixeyn8@va.gov\",\"job\":\"Legal Assistant\"}"}
{ "body": "{\"id\":838,\"first_name\":\"Benedicto\",\"email\":\"bharcen9@irs.gov\",\"job\":\"Associate Professor\"}"}
{ "body": "{\"id\":839,\"first_name\":\"Huntington\",\"email\":\"hshuttleworthna@answers.com\",\"job\":\"Teacher\"}"}
{ "body": "{\"id\":840,\"first_name\":\"Leupold\",\"email\":\"lcapounnb@bbb.org\",\"job\":\"Marketing Manager\"}"}
{ "body": "{\"id\":841,\"first_name\":\"Austine\",\"email\":\"adielhennnc@rediff.com\",\"job\":\"GIS Technical Architect\"}"}
{ "body": "{\"id\":842,\"first_name\":\"Tristam\",\"email\":\"tfranceschellind@ibm.com\",\"job\":\"Clinical Specialist\"}"}
{ "body": "{\"id\":843,\"first_name\":\"Marjie\",\"email\":\"mpendrene@reuters.com\",\"job\":\"Sales Associate\"}"}
{ "body": "{\"id\":844,\"first_name\":\"Barth\",\"email\":\"bskirlingnf@ezinearticles.com\",\"job\":\"GIS Technical Architect\"}"}
{ "body": "{\"id\":845,\"first_name\":\"Zackariah\",\"email\":\"ztrippickng@canalblog.com\",\"job\":\"Account Representative III\"}"}
{ "body": "{\"id\":846,\"first_name\":\"Chandler\",\"email\":\"cdemorenanh@biglobe.ne.jp\",\"job\":\"Human Resources Manager\"}"}
{ "body": "{\"id\":847,\"first_name\":\"Grayce\",\"email\":\"gvidoni@taobao.com\",\"job\":\"Senior Cost Accountant\"}"}
{ "body": "{\"id\":848,\"first_name\":\"Ryann\",\"email\":\"rbrittennj@furl.net\",\"job\":\"Sales Representative\"}"}
{ "body": "{\"id\":849,\"first_name\":\"Findlay\",\"email\":\"fmabbittnk@youtube.com\",\"job\":\"Geological Engineer\"}"}
{ "body": "{\"id\":850,\"first_name\":\"Remington\",\"email\":\"rdundonnl@nyu.edu\",\"job\":\"Health Coach I\"}"}
{ "body": "{\"id\":851,\"first_name\":\"Raynell\",\"email\":\"rballardnm@dmoz.org\",\"job\":\"Biostatistician I\"}"}
{ "body": "{\"id\":852,\"first_name\":\"Merrili\",\"email\":\"mciccettinn@quantcast.com\",\"job\":\"VP Quality Control\"}"}
{ "body": "{\"id\":853,\"first_name\":\"Bogey\",\"email\":\"btargetterno@blogspot.com\",\"job\":\"VP Accounting\"}"}
{ "body": "{\"id\":854,\"first_name\":\"Gordan\",\"email\":\"gkemmetnp@angelfire.com\",\"job\":\"Geological Engineer\"}"}
{ "body": "{\"id\":855,\"first_name\":\"Kipp\",\"email\":\"kscotchbrooknq@posterous.com\",\"job\":\"Structural Engineer\"}"}
{ "body": "{\"id\":856,\"first_name\":\"Brande\",\"email\":\"bparradyenr@home.pl\",\"job\":\"Administrative Officer\"}"}
{ "body": "{\"id\":857,\"first_name\":\"Gabriella\",\"email\":\"gdegoixns@163.com\",\"job\":\"Structural Analysis Engineer\"}"}
{ "body": "{\"id\":858,\"first_name\":\"Ruddy\",\"email\":\"rprysnt@ted.com\",\"job\":\"Sales Representative\"}"}
{ "body": "{\"id\":859,\"first_name\":\"Fredrick\",\"email\":\"fmcnabbnu@buzzfeed.com\",\"job\":\"Tax Accountant\"}"}
{ "body": "{\"id\":860,\"first_name\":\"Bertram\",\"email\":\"bnolinnv@hibu.com\",\"job\":\"Biostatistician IV\"}"}
{ "body": "{\"id\":861,\"first_name\":\"Marylee\",\"email\":\"mlaidlernw@kickstarter.com\",\"job\":\"Office Assistant III\"}"}
{ "body": "{\"id\":862,\"first_name\":\"Gerda\",\"email\":\"gsmiznx@live.com\",\"job\":\"Pharmacist\"}"}
{ "body": "{\"id\":863,\"first_name\":\"Theressa\",\"email\":\"tluneyny@statcounter.com\",\"job\":\"VP Marketing\"}"}
{ "body": "{\"id\":864,\"first_name\":\"Caron\",\"email\":\"ctraillnz@geocities.jp\",\"job\":\"Graphic Designer\"}"}
{ "body": "{\"id\":865,\"first_name\":\"Jorie\",\"email\":\"jgreensideo0@purevolume.com\",\"job\":\"Librarian\"}"}
{ "body": "{\"id\":866,\"first_name\":\"Fleming\",\"email\":\"flinggoodo1@slate.com\",\"job\":\"Quality Control Specialist\"}"}
{ "body": "{\"id\":867,\"first_name\":\"Kennan\",\"email\":\"kpinchino2@hubpages.com\",\"job\":\"Desktop Support Technician\"}"}
{ "body": "{\"id\":868,\"first_name\":\"Cacilia\",\"email\":\"cfishbyo3@altervista.org\",\"job\":\"Environmental Specialist\"}"}
{ "body": "{\"id\":869,\"first_name\":\"Filberte\",\"email\":\"feverwino4@weebly.com\",\"job\":\"Assistant Professor\"}"}
{ "body": "{\"id\":870,\"first_name\":\"Tess\",\"email\":\"tkennewayo5@woothemes.com\",\"job\":\"GIS Technical Architect\"}"}
{ "body": "{\"id\":871,\"first_name\":\"Vite\",\"email\":\"visakseno6@ovh.net\",\"job\":\"Dental Hygienist\"}"}
{ "body": "{\"id\":872,\"first_name\":\"Mauricio\",\"email\":\"mgrzelczako7@rediff.com\",\"job\":\"Engineer III\"}"}
{ "body": "{\"id\":873,\"first_name\":\"Daven\",\"email\":\"dhaslewoodo8@ovh.net\",\"job\":\"Accounting Assistant IV\"}"}
{ "body": "{\"id\":874,\"first_name\":\"Maddi\",\"email\":\"mmaskallo9@intel.com\",\"job\":\"Tax Accountant\"}"}
{ "body": "{\"id\":875,\"first_name\":\"Amalea\",\"email\":\"aismayoa@apache.org\",\"job\":\"Human Resources Manager\"}"}
{ "body": "{\"id\":876,\"first_name\":\"Wren\",\"email\":\"wcoyob@discuz.net\",\"job\":\"Assistant Manager\"}"}
{ "body": "{\"id\":877,\"first_name\":\"Kareem\",\"email\":\"kairetonoc@quantcast.com\",\"job\":\"Electrical Engineer\"}"}
{ "body": "{\"id\":878,\"first_name\":\"Felicdad\",\"email\":\"fbiddwellod@pinterest.com\",\"job\":\"Nurse Practicioner\"}"}
{ "body": "{\"id\":879,\"first_name\":\"Hube\",\"email\":\"hmaniloveoe@behance.net\",\"job\":\"Senior Developer\"}"}
{ "body": "{\"id\":880,\"first_name\":\"Lowrance\",\"email\":\"lmabbittof@wiley.com\",\"job\":\"Structural Analysis Engineer\"}"}
{ "body": "{\"id\":881,\"first_name\":\"Geraldine\",\"email\":\"gleirmonthog@jigsy.com\",\"job\":\"Sales Associate\"}"}
{ "body": "{\"id\":882,\"first_name\":\"Reese\",\"email\":\"rmathiesonoh@telegraph.co.uk\",\"job\":\"Software Consultant\"}"}
{ "body": "{\"id\":883,\"first_name\":\"Mariel\",\"email\":\"medinborooi@github.io\",\"job\":\"Actuary\"}"}
{ "body": "{\"id\":884,\"first_name\":\"Darnell\",\"email\":\"dgrzegoreckioj@umich.edu\",\"job\":\"Database Administrator I\"}"}
{ "body": "{\"id\":885,\"first_name\":\"Samson\",\"email\":\"spondeok@xing.com\",\"job\":\"Environmental Tech\"}"}
{ "body": "{\"id\":886,\"first_name\":\"Marv\",\"email\":\"mgargettol@nature.com\",\"job\":\"Data Coordiator\"}"}
{ "body": "{\"id\":887,\"first_name\":\"Desmond\",\"email\":\"dlazellom@goo.ne.jp\",\"job\":\"Legal Assistant\"}"}
{ "body": "{\"id\":888,\"first_name\":\"Perren\",\"email\":\"preineron@list-manage.com\",\"job\":\"Analog Circuit Design manager\"}"}
{ "body": "{\"id\":889,\"first_name\":\"Branden\",\"email\":\"blawteyoo@t.co\",\"job\":\"Cost Accountant\"}"}
{ "body": "{\"id\":890,\"first_name\":\"Roy\",\"email\":\"rdiggesop@dagondesign.com\",\"job\":\"Web Developer II\"}"}
{ "body": "{\"id\":891,\"first_name\":\"Stillman\",\"email\":\"sdarkinsoq@disqus.com\",\"job\":\"Nurse Practicioner\"}"}
{ "body": "{\"id\":892,\"first_name\":\"Spense\",\"email\":\"solcotor@ezinearticles.com\",\"job\":\"Data Coordiator\"}"}
{ "body": "{\"id\":893,\"first_name\":\"Will\",\"email\":\"wisardos@kickstarter.com\",\"job\":\"Graphic Designer\"}"}
{ "body": "{\"id\":894,\"first_name\":\"Millie\",\"email\":\"mbuttwellot@prweb.com\",\"job\":\"Systems Administrator I\"}"}
{ "body": "{\"id\":895,\"first_name\":\"Rickie\",\"email\":\"rgogieou@paypal.com\",\"job\":\"Human Resources Assistant IV\"}"}
{ "body": "{\"id\":896,\"first_name\":\"Ardene\",\"email\":\"aboristonov@princeton.edu\",\"job\":\"Systems Administrator II\"}"}
{ "body": "{\"id\":897,\"first_name\":\"Irwin\",\"email\":\"irentelllow@wix.com\",\"job\":\"Analog Circuit Design manager\"}"}
{ "body": "{\"id\":898,\"first_name\":\"Padriac\",\"email\":\"pkremerox@reuters.com\",\"job\":\"Nurse\"}"}
{ "body": "{\"id\":899,\"first_name\":\"Franciskus\",\"email\":\"fokelloy@ft.com\",\"job\":\"Pharmacist\"}"}
{ "body": "{\"id\":900,\"first_name\":\"Marillin\",\"email\":\"mmacclureoz@bing.com\",\"job\":\"Software Consultant\"}"}
{ "body": "{\"id\":901,\"first_name\":\"Eberhard\",\"email\":\"egrigoliisp0@1688.com\",\"job\":\"Research Associate\"}"}
{ "body": "{\"id\":902,\"first_name\":\"Colin\",\"email\":\"chammerichp1@japanpost.jp\",\"job\":\"Administrative Officer\"}"}
{ "body": "{\"id\":903,\"first_name\":\"Dorolice\",\"email\":\"dglovesp2@soup.io\",\"job\":\"Electrical Engineer\"}"}
{ "body": "{\"id\":904,\"first_name\":\"Matteo\",\"email\":\"mhickfordp3@google.com.au\",\"job\":\"Staff Scientist\"}"}
{ "body": "{\"id\":905,\"first_name\":\"Abagail\",\"email\":\"asallierp4@typepad.com\",\"job\":\"Occupational Therapist\"}"}
{ "body": "{\"id\":906,\"first_name\":\"Ina\",\"email\":\"igeevep5@diigo.com\",\"job\":\"Sales Associate\"}"}
{ "body": "{\"id\":907,\"first_name\":\"Tommi\",\"email\":\"tbridgestockp6@nydailynews.com\",\"job\":\"Human Resources Assistant IV\"}"}
{ "body": "{\"id\":908,\"first_name\":\"Hugo\",\"email\":\"hgregoracip7@t.co\",\"job\":\"Senior Financial Analyst\"}"}
{ "body": "{\"id\":909,\"first_name\":\"Nathanil\",\"email\":\"nmillsonp8@cocolog-nifty.com\",\"job\":\"Senior Developer\"}"}
{ "body": "{\"id\":910,\"first_name\":\"Inesita\",\"email\":\"isootp9@studiopress.com\",\"job\":\"Biostatistician I\"}"}
{ "body": "{\"id\":911,\"first_name\":\"Beatriz\",\"email\":\"bdmytrykpa@taobao.com\",\"job\":\"Research Assistant II\"}"}
{ "body": "{\"id\":912,\"first_name\":\"Brigit\",\"email\":\"btinnerpb@rediff.com\",\"job\":\"Financial Advisor\"}"}
{ "body": "{\"id\":913,\"first_name\":\"Free\",\"email\":\"fkollachpc@narod.ru\",\"job\":\"Senior Cost Accountant\"}"}
{ "body": "{\"id\":914,\"first_name\":\"Barron\",\"email\":\"bklossmannpd@europa.eu\",\"job\":\"Research Associate\"}"}
{ "body": "{\"id\":915,\"first_name\":\"Mommy\",\"email\":\"mskoggingspe@adobe.com\",\"job\":\"Software Engineer I\"}"}
{ "body": "{\"id\":916,\"first_name\":\"Whittaker\",\"email\":\"wpanswickpf@amazon.com\",\"job\":\"Chemical Engineer\"}"}
{ "body": "{\"id\":917,\"first_name\":\"Clementina\",\"email\":\"cbradbornepg@live.com\",\"job\":\"Chemical Engineer\"}"}
{ "body": "{\"id\":918,\"first_name\":\"Feodor\",\"email\":\"fbodemeaidph@businessweek.com\",\"job\":\"Professor\"}"}
{ "body": "{\"id\":919,\"first_name\":\"Esteban\",\"email\":\"emacrurypi@mozilla.com\",\"job\":\"Human Resources Manager\"}"}
{ "body": "{\"id\":920,\"first_name\":\"Suzanne\",\"email\":\"sgotterpj@noaa.gov\",\"job\":\"Senior Editor\"}"}
{ "body": "{\"id\":921,\"first_name\":\"Sheila-kathryn\",\"email\":\"shubanpk@hhs.gov\",\"job\":\"Geologist IV\"}"}
{ "body": "{\"id\":922,\"first_name\":\"Minette\",\"email\":\"mleakpl@nps.gov\",\"job\":\"Community Outreach Specialist\"}"}
{ "body": "{\"id\":923,\"first_name\":\"Jordana\",\"email\":\"jhousemanpm@aboutads.info\",\"job\":\"Geologist II\"}"}
{ "body": "{\"id\":924,\"first_name\":\"Izak\",\"email\":\"ibaloghpn@smh.com.au\",\"job\":\"Project Manager\"}"}
{ "body": "{\"id\":925,\"first_name\":\"Carita\",\"email\":\"cbeekepo@lulu.com\",\"job\":\"Librarian\"}"}
{ "body": "{\"id\":926,\"first_name\":\"Rowney\",\"email\":\"rgronoupp@blogtalkradio.com\",\"job\":\"Statistician III\"}"}
{ "body": "{\"id\":927,\"first_name\":\"Skipper\",\"email\":\"sraffonpq@prweb.com\",\"job\":\"Quality Control Specialist\"}"}
{ "body": "{\"id\":928,\"first_name\":\"Bettine\",\"email\":\"briddioughpr@bloomberg.com\",\"job\":\"Internal Auditor\"}"}
{ "body": "{\"id\":929,\"first_name\":\"Cherice\",\"email\":\"chovendenps@diigo.com\",\"job\":\"Desktop Support Technician\"}"}
{ "body": "{\"id\":930,\"first_name\":\"Eb\",\"email\":\"ewoodcraftpt@jigsy.com\",\"job\":\"Administrative Officer\"}"}
{ "body": "{\"id\":931,\"first_name\":\"Trixie\",\"email\":\"tscutchinpu@simplemachines.org\",\"job\":\"Recruiter\"}"}
{ "body": "{\"id\":932,\"first_name\":\"Kattie\",\"email\":\"kaxtellpv@w3.org\",\"job\":\"Programmer Analyst III\"}"}
{ "body": "{\"id\":933,\"first_name\":\"Marnia\",\"email\":\"mwehnerrpw@technorati.com\",\"job\":\"Sales Associate\"}"}
{ "body": "{\"id\":934,\"first_name\":\"Bessy\",\"email\":\"bwahnckepx@businessweek.com\",\"job\":\"Database Administrator IV\"}"}
{ "body": "{\"id\":935,\"first_name\":\"Parry\",\"email\":\"pseyfartpy@techcrunch.com\",\"job\":\"Senior Sales Associate\"}"}
{ "body": "{\"id\":936,\"first_name\":\"Jonie\",\"email\":\"jsteptoepz@ask.com\",\"job\":\"Nurse\"}"}
{ "body": "{\"id\":937,\"first_name\":\"Creight\",\"email\":\"cbutfieldq0@is.gd\",\"job\":\"Developer II\"}"}
{ "body": "{\"id\":938,\"first_name\":\"Kendell\",\"email\":\"kkyrkemanq1@ted.com\",\"job\":\"Director of Sales\"}"}
{ "body": "{\"id\":939,\"first_name\":\"Stanly\",\"email\":\"swherryq2@cdc.gov\",\"job\":\"Developer II\"}"}
{ "body": "{\"id\":940,\"first_name\":\"Valerie\",\"email\":\"vramirezq3@ucla.edu\",\"job\":\"Technical Writer\"}"}
{ "body": "{\"id\":941,\"first_name\":\"Margalo\",\"email\":\"mspruceq4@nps.gov\",\"job\":\"Chemical Engineer\"}"}
{ "body": "{\"id\":942,\"first_name\":\"Saundra\",\"email\":\"stretterq5@phoca.cz\",\"job\":\"Research Associate\"}"}
{ "body": "{\"id\":943,\"first_name\":\"Jenda\",\"email\":\"jalexsandrowiczq6@hhs.gov\",\"job\":\"Senior Cost Accountant\"}"}
{ "body": "{\"id\":944,\"first_name\":\"Orazio\",\"email\":\"oelvyq7@odnoklassniki.ru\",\"job\":\"Actuary\"}"}
{ "body": "{\"id\":945,\"first_name\":\"Caitlin\",\"email\":\"cledgewayq8@infoseek.co.jp\",\"job\":\"Junior Executive\"}"}
{ "body": "{\"id\":946,\"first_name\":\"Hobard\",\"email\":\"htomkowiczq9@intel.com\",\"job\":\"Teacher\"}"}
{ "body": "{\"id\":947,\"first_name\":\"Vitia\",\"email\":\"vgaviniqa@ezinearticles.com\",\"job\":\"Structural Engineer\"}"}
{ "body": "{\"id\":948,\"first_name\":\"Karissa\",\"email\":\"klannonqb@studiopress.com\",\"job\":\"Staff Scientist\"}"}
{ "body": "{\"id\":949,\"first_name\":\"Beverley\",\"email\":\"bshreveqc@go.com\",\"job\":\"Actuary\"}"}
{ "body": "{\"id\":950,\"first_name\":\"Lisette\",\"email\":\"lcasebourneqd@4shared.com\",\"job\":\"Civil Engineer\"}"}
{ "body": "{\"id\":951,\"first_name\":\"Ashil\",\"email\":\"akonkeqe@admin.ch\",\"job\":\"Software Engineer IV\"}"}
{ "body": "{\"id\":952,\"first_name\":\"Lauraine\",\"email\":\"lbleakleyqf@xing.com\",\"job\":\"Statistician IV\"}"}
{ "body": "{\"id\":953,\"first_name\":\"Timothea\",\"email\":\"tpetfordqg@icq.com\",\"job\":\"Accountant III\"}"}
{ "body": "{\"id\":954,\"first_name\":\"Ancell\",\"email\":\"aabbittqh@craigslist.org\",\"job\":\"Programmer III\"}"}
{ "body": "{\"id\":955,\"first_name\":\"Jarid\",\"email\":\"jhardwareqi@spotify.com\",\"job\":\"Financial Advisor\"}"}
{ "body": "{\"id\":956,\"first_name\":\"Sheff\",\"email\":\"sbwyqj@vkontakte.ru\",\"job\":\"Actuary\"}"}
{ "body": "{\"id\":957,\"first_name\":\"Archie\",\"email\":\"abassoqk@google.com.br\",\"job\":\"Assistant Professor\"}"}
{ "body": "{\"id\":958,\"first_name\":\"Ber\",\"email\":\"bspargoql@thetimes.co.uk\",\"job\":\"Analog Circuit Design manager\"}"}
{ "body": "{\"id\":959,\"first_name\":\"Josefa\",\"email\":\"jhuffyqm@blog.com\",\"job\":\"Dental Hygienist\"}"}
{ "body": "{\"id\":960,\"first_name\":\"Rivalee\",\"email\":\"rknowlmanqn@domainmarket.com\",\"job\":\"GIS Technical Architect\"}"}
{ "body": "{\"id\":961,\"first_name\":\"Kean\",\"email\":\"kbegginiqo@eventbrite.com\",\"job\":\"Programmer IV\"}"}
{ "body": "{\"id\":962,\"first_name\":\"Jacklin\",\"email\":\"jlaxtonqp@yandex.ru\",\"job\":\"Structural Analysis Engineer\"}"}
{ "body": "{\"id\":963,\"first_name\":\"Lynda\",\"email\":\"ldeluzeqq@blogger.com\",\"job\":\"Quality Control Specialist\"}"}
{ "body": "{\"id\":964,\"first_name\":\"Kaile\",\"email\":\"kjefferdqr@shareasale.com\",\"job\":\"Administrative Officer\"}"}
{ "body": "{\"id\":965,\"first_name\":\"Tamar\",\"email\":\"tjoreauqs@nature.com\",\"job\":\"Office Assistant IV\"}"}
{ "body": "{\"id\":966,\"first_name\":\"Reg\",\"email\":\"rcorssqt@uol.com.br\",\"job\":\"Account Coordinator\"}"}
{ "body": "{\"id\":967,\"first_name\":\"Alastair\",\"email\":\"abranneyqu@ustream.tv\",\"job\":\"Staff Scientist\"}"}
{ "body": "{\"id\":968,\"first_name\":\"Astrix\",\"email\":\"acushqv@liveinternet.ru\",\"job\":\"Food Chemist\"}"}
{ "body": "{\"id\":969,\"first_name\":\"Brendan\",\"email\":\"branceqw@oaic.gov.au\",\"job\":\"Food Chemist\"}"}
{ "body": "{\"id\":970,\"first_name\":\"Rosita\",\"email\":\"rminchellaqx@indiatimes.com\",\"job\":\"Junior Executive\"}"}
{ "body": "{\"id\":971,\"first_name\":\"Alexina\",\"email\":\"acurrmqy@1und1.de\",\"job\":\"Staff Scientist\"}"}
{ "body": "{\"id\":972,\"first_name\":\"Jeanna\",\"email\":\"jdawneyqz@nba.com\",\"job\":\"Community Outreach Specialist\"}"}
{ "body": "{\"id\":973,\"first_name\":\"Donavon\",\"email\":\"dvogeler0@cam.ac.uk\",\"job\":\"Nurse\"}"}
{ "body": "{\"id\":974,\"first_name\":\"Salim\",\"email\":\"smilberryr1@amazon.co.jp\",\"job\":\"Payment Adjustment Coordinator\"}"}
{ "body": "{\"id\":975,\"first_name\":\"Theo\",\"email\":\"trosendorfr2@illinois.edu\",\"job\":\"Senior Developer\"}"}
{ "body": "{\"id\":976,\"first_name\":\"Ford\",\"email\":\"fmachansr3@deliciousdays.com\",\"job\":\"Research Nurse\"}"}
{ "body": "{\"id\":977,\"first_name\":\"Ernesto\",\"email\":\"eternaultr4@hp.com\",\"job\":\"Cost Accountant\"}"}
{ "body": "{\"id\":978,\"first_name\":\"Travis\",\"email\":\"tcloneyr5@jigsy.com\",\"job\":\"Recruiting Manager\"}"}
{ "body": "{\"id\":979,\"first_name\":\"Tynan\",\"email\":\"tcreusr6@alibaba.com\",\"job\":\"Design Engineer\"}"}
{ "body": "{\"id\":980,\"first_name\":\"Samuele\",\"email\":\"shumbertr7@indiatimes.com\",\"job\":\"Software Engineer II\"}"}
{ "body": "{\"id\":981,\"first_name\":\"Molli\",\"email\":\"mbenboughr8@bravesites.com\",\"job\":\"Nurse\"}"}
{ "body": "{\"id\":982,\"first_name\":\"Sampson\",\"email\":\"scrasswellr9@storify.com\",\"job\":\"Marketing Assistant\"}"}
{ "body": "{\"id\":983,\"first_name\":\"Jerad\",\"email\":\"jdacksra@bizjournals.com\",\"job\":\"Systems Administrator IV\"}"}
{ "body": "{\"id\":984,\"first_name\":\"Marcelline\",\"email\":\"mvenmorerb@t.co\",\"job\":\"Senior Editor\"}"}
{ "body": "{\"id\":985,\"first_name\":\"Beryle\",\"email\":\"bemersonrc@people.com.cn\",\"job\":\"Librarian\"}"}
{ "body": "{\"id\":986,\"first_name\":\"Rosemary\",\"email\":\"rmeddickrd@apple.com\",\"job\":\"Environmental Tech\"}"}
{ "body": "{\"id\":987,\"first_name\":\"Lars\",\"email\":\"lgillbardre@gov.uk\",\"job\":\"Tax Accountant\"}"}
{ "body": "{\"id\":988,\"first_name\":\"Barnaby\",\"email\":\"bgrishukovrf@geocities.jp\",\"job\":\"Tax Accountant\"}"}
{ "body": "{\"id\":989,\"first_name\":\"Staci\",\"email\":\"sloryrg@pcworld.com\",\"job\":\"Civil Engineer\"}"}
{ "body": "{\"id\":990,\"first_name\":\"Vassily\",\"email\":\"vfarfullrh@51.la\",\"job\":\"VP Marketing\"}"}
{ "body": "{\"id\":991,\"first_name\":\"Robbert\",\"email\":\"rpinckstoneri@unblog.fr\",\"job\":\"Pharmacist\"}"}
{ "body": "{\"id\":992,\"first_name\":\"Simeon\",\"email\":\"shrishchenkorj@gizmodo.com\",\"job\":\"Nurse\"}"}
{ "body": "{\"id\":993,\"first_name\":\"Silvan\",\"email\":\"slinkierk@elpais.com\",\"job\":\"Engineer III\"}"}
{ "body": "{\"id\":994,\"first_name\":\"Doralin\",\"email\":\"dfinbyrl@xing.com\",\"job\":\"Statistician I\"}"}
{ "body": "{\"id\":995,\"first_name\":\"Katine\",\"email\":\"kgilmartinrm@ezinearticles.com\",\"job\":\"Systems Administrator IV\"}"}
{ "body": "{\"id\":996,\"first_name\":\"Deanne\",\"email\":\"drentonrn@example.com\",\"job\":\"Quality Control Specialist\"}"}
{ "body": "{\"id\":997,\"first_name\":\"Abdul\",\"email\":\"amccreeryro@tiny.cc\",\"job\":\"VP Quality Control\"}"}
{ "body": "{\"id\":998,\"first_name\":\"Lalo\",\"email\":\"ljeevesrp@furl.net\",\"job\":\"Senior Financial Analyst\"}"}
{ "body": "{\"id\":999,\"first_name\":\"Randal\",\"email\":\"rhancellrq@instagram.com\",\"job\":\"Staff Scientist\"}"}
{ "body": "{\"id\":1000,\"first_name\":\"Ramsay\",\"email\":\"rprujeanrr@whitehouse.gov\",\"job\":\"Internal Auditor\"}"}


================================================
FILE: quickwit/quickwit-indexing/benches/data/bench_data_light_transform.json
================================================
{"id":1,"first_name":"Alia","email":"aingleston0@twitpic.com","job":"Civil Engineer","timestamp":"2022-01-25T09:26:29Z"}
{"id":2,"first_name":"Erl","email":"ebegwell1@google.com.br","job":"Data Coordiator","timestamp":"2022-04-21T23:08:59Z"}
{"id":3,"first_name":"Drona","email":"dranyell2@ehow.com","job":"Desktop Support Technician","timestamp":"2022-10-20T03:43:51Z"}
{"id":4,"first_name":"Jackie","email":"jkingsley3@squidoo.com","job":"GIS Technical Architect","timestamp":"2022-02-02T21:54:48Z"}
{"id":5,"first_name":"Ginny","email":"glangman4@hud.gov","job":"Senior Sales Associate","timestamp":"2022-07-08T22:55:59Z"}
{"id":6,"first_name":"Lorenzo","email":"ltempleman5@pen.io","job":"Financial Advisor","timestamp":"2022-07-08T09:29:57Z"}
{"id":7,"first_name":"Kyle","email":"kkundt6@soup.io","job":"Sales Representative","timestamp":"2022-04-04T09:20:18Z"}
{"id":8,"first_name":"Miof mela","email":"mcamelin7@github.io","job":"Marketing Manager","timestamp":"2022-04-10T17:52:47Z"}
{"id":9,"first_name":"Shelden","email":"ssarson8@networkadvertising.org","job":"Biostatistician IV","timestamp":"2022-02-21T04:11:00Z"}
{"id":10,"first_name":"Evey","email":"estrang9@hostgator.com","job":"Programmer II","timestamp":"2022-09-21T02:54:44Z"}
{"id":11,"first_name":"Dav","email":"davrasina@trellian.com","job":"Accounting Assistant I","timestamp":"2022-11-10T13:00:59Z"}
{"id":12,"first_name":"Ignacio","email":"iduhamelb@desdev.cn","job":"Research Associate","timestamp":"2022-01-09T14:19:37Z"}
{"id":13,"first_name":"Lottie","email":"lfouchc@amazon.co.uk","job":"Help Desk Technician","timestamp":"2022-01-17T07:07:32Z"}
{"id":14,"first_name":"Moira","email":"menrigod@narod.ru","job":"Software Test Engineer IV","timestamp":"2022-05-28T04:42:48Z"}
{"id":15,"first_name":"Jori","email":"jeverille@ed.gov","job":"Senior Financial Analyst","timestamp":"2022-02-03T15:27:09Z"}
{"id":16,"first_name":"Markos","email":"mpostansf@4shared.com","job":"Tax Accountant","timestamp":"2022-05-15T15:57:34Z"}
{"id":17,"first_name":"Bryana","email":"bpokerg@printfriendly.com","job":"Physical Therapy Assistant","timestamp":"2022-04-21T13:20:12Z"}
{"id":18,"first_name":"Reiko","email":"rtunsleyh@arstechnica.com","job":"Recruiter","timestamp":"2022-10-30T21:27:31Z"}
{"id":19,"first_name":"Dedie","email":"dcouttsi@alibaba.com","job":"Human Resources Assistant II","timestamp":"2022-10-17T03:12:12Z"}
{"id":20,"first_name":"Sigfrid","email":"sfriattj@google.ru","job":"Help Desk Operator","timestamp":"2022-06-06T22:56:02Z"}
{"id":21,"first_name":"Sheilah","email":"stuitek@baidu.com","job":"VP Product Management","timestamp":"2022-08-04T05:08:19Z"}
{"id":22,"first_name":"Colan","email":"cbeardselll@drupal.org","job":"Structural Engineer","timestamp":"2022-07-11T05:12:49Z"}
{"id":23,"first_name":"Loise","email":"lminifiem@whitehouse.gov","job":"Research Assistant IV","timestamp":"2022-03-31T17:55:15Z"}
{"id":24,"first_name":"Imogen","email":"imckelveyn@hibu.com","job":"Accountant I","timestamp":"2022-06-19T23:39:31Z"}
{"id":25,"first_name":"Richy","email":"rcoultharto@mozilla.com","job":"Senior Cost Accountant","timestamp":"2022-05-01T02:00:34Z"}
{"id":26,"first_name":"Henrieta","email":"hkermittp@huffingtonpost.com","job":"Engineer III","timestamp":"2022-01-24T14:18:00Z"}
{"id":27,"first_name":"Matty","email":"msawoodq@goodreads.com","job":"Payment Adjustment Coordinator","timestamp":"2022-01-03T14:34:46Z"}
{"id":28,"first_name":"Lane","email":"ltownsleyr@ustream.tv","job":"General Manager","timestamp":"2022-06-06T22:51:21Z"}
{"id":29,"first_name":"Matias","email":"mbangss@dagondesign.com","job":"Paralegal","timestamp":"2022-09-05T18:38:43Z"}
{"id":30,"first_name":"Nita","email":"nmcsheat@flickr.com","job":"Professor","timestamp":"2022-10-06T06:00:26Z"}
{"id":31,"first_name":"Paul","email":"pmotherwellu@google.ru","job":"Sales Associate","timestamp":"2021-12-13T05:11:20Z"}
{"id":32,"first_name":"Hercules","email":"hdeattav@jimdo.com","job":"Pharmacist","timestamp":"2022-10-15T23:26:33Z"}
{"id":33,"first_name":"Beckie","email":"bcorradiniw@flickr.com","job":"Paralegal","timestamp":"2022-09-06T19:00:34Z"}
{"id":34,"first_name":"Roldan","email":"rvannix@ftc.gov","job":"Senior Quality Engineer","timestamp":"2022-12-04T17:22:04Z"}
{"id":35,"first_name":"Garwin","email":"gprucknery@dagondesign.com","job":"Sales Associate","timestamp":"2022-01-20T19:46:44Z"}
{"id":36,"first_name":"Sarine","email":"sfrantzenz@answers.com","job":"Data Coordiator","timestamp":"2022-10-23T21:34:29Z"}
{"id":37,"first_name":"Darby","email":"dberthot10@ocn.ne.jp","job":"Nurse Practicioner","timestamp":"2022-11-29T04:04:16Z"}
{"id":38,"first_name":"Virgil","email":"vpeltzer11@bloglovin.com","job":"Dental Hygienist","timestamp":"2022-05-30T03:34:01Z"}
{"id":39,"first_name":"Jennette","email":"jrenney12@businessinsider.com","job":"VP Product Management","timestamp":"2022-07-19T21:12:26Z"}
{"id":40,"first_name":"Marylee","email":"mbedell13@senate.gov","job":"VP Sales","timestamp":"2022-10-08T00:05:14Z"}
{"id":41,"first_name":"Randi","email":"racedo14@nymag.com","job":"Statistician III","timestamp":"2022-01-09T05:52:30Z"}
{"id":42,"first_name":"Bertrand","email":"bloxly15@bluehost.com","job":"Assistant Professor","timestamp":"2022-11-05T12:33:19Z"}
{"id":43,"first_name":"Maddy","email":"mscathard16@cyberchimps.com","job":"Actuary","timestamp":"2022-01-25T10:18:29Z"}
{"id":44,"first_name":"Gayla","email":"glidgate17@mediafire.com","job":"Dental Hygienist","timestamp":"2021-12-24T18:53:23Z"}
{"id":45,"first_name":"Omero","email":"omaxstead18@gravatar.com","job":"Civil Engineer","timestamp":"2022-09-16T18:24:37Z"}
{"id":46,"first_name":"Jaimie","email":"jtalby19@yahoo.co.jp","job":"Research Associate","timestamp":"2022-09-18T08:51:35Z"}
{"id":47,"first_name":"Vonni","email":"vpude1a@drupal.org","job":"Information Systems Manager","timestamp":"2022-05-16T09:53:18Z"}
{"id":48,"first_name":"Nikaniki","email":"nsurmeyers1b@accuweather.com","job":"Business Systems Development Analyst","timestamp":"2022-01-22T12:22:46Z"}
{"id":49,"first_name":"Colin","email":"cphuprate1c@reference.com","job":"GIS Technical Architect","timestamp":"2022-06-02T09:18:14Z"}
{"id":50,"first_name":"Vevay","email":"vlipson1d@illinois.edu","job":"Biostatistician II","timestamp":"2022-06-02T08:34:03Z"}
{"id":51,"first_name":"Maudie","email":"mluckcock1e@behance.net","job":"Staff Scientist","timestamp":"2022-04-20T12:44:22Z"}
{"id":52,"first_name":"Raymund","email":"rlewnden1f@tripadvisor.com","job":"Librarian","timestamp":"2022-08-13T23:17:51Z"}
{"id":53,"first_name":"Leonelle","email":"lwellum1g@buzzfeed.com","job":"Assistant Manager","timestamp":"2022-02-24T05:57:17Z"}
{"id":54,"first_name":"Merrill","email":"mdominico1h@netlog.com","job":"Nuclear Power Engineer","timestamp":"2022-02-13T16:40:32Z"}
{"id":55,"first_name":"Maura","email":"mjarman1i@ucoz.com","job":"Community Outreach Specialist","timestamp":"2022-08-02T04:15:09Z"}
{"id":56,"first_name":"Archambault","email":"aalcorn1j@posterous.com","job":"Nurse Practicioner","timestamp":"2022-02-07T03:03:27Z"}
{"id":57,"first_name":"Murray","email":"mwharfe1k@bloglovin.com","job":"Compensation Analyst","timestamp":"2022-11-17T11:46:01Z"}
{"id":58,"first_name":"Fawne","email":"froston1l@bloglines.com","job":"Computer Systems Analyst III","timestamp":"2022-03-27T06:42:55Z"}
{"id":59,"first_name":"Trudey","email":"tberinger1m@github.io","job":"Food Chemist","timestamp":"2022-03-05T15:02:41Z"}
{"id":60,"first_name":"Mureil","email":"malloway1n@purevolume.com","job":"Marketing Assistant","timestamp":"2022-09-05T23:29:03Z"}
{"id":61,"first_name":"Norine","email":"npennetta1o@bloglovin.com","job":"Director of Sales","timestamp":"2022-02-08T11:56:03Z"}
{"id":62,"first_name":"Lucinda","email":"ldemetz1p@tripadvisor.com","job":"Civil Engineer","timestamp":"2022-03-07T23:09:35Z"}
{"id":63,"first_name":"Hulda","email":"hhaville1q@mashable.com","job":"Paralegal","timestamp":"2022-01-22T07:03:36Z"}
{"id":64,"first_name":"Valenka","email":"vtorpie1r@netscape.com","job":"Design Engineer","timestamp":"2022-01-13T11:26:42Z"}
{"id":65,"first_name":"Farleigh","email":"fdantoni1s@mayoclinic.com","job":"Nurse Practicioner","timestamp":"2022-03-27T14:07:23Z"}
{"id":66,"first_name":"Demetra","email":"dtabourier1t@nytimes.com","job":"Senior Financial Analyst","timestamp":"2022-06-13T05:56:48Z"}
{"id":67,"first_name":"Austine","email":"ableas1u@jiathis.com","job":"Quality Control Specialist","timestamp":"2022-02-07T04:51:56Z"}
{"id":68,"first_name":"Amie","email":"alanchbury1v@hc360.com","job":"Operator","timestamp":"2022-05-09T15:29:00Z"}
{"id":69,"first_name":"Normie","email":"nwardall1w@gnu.org","job":"Professor","timestamp":"2022-10-14T09:26:18Z"}
{"id":70,"first_name":"Lowe","email":"ledelman1x@mediafire.com","job":"Operator","timestamp":"2022-02-06T12:42:05Z"}
{"id":71,"first_name":"Agretha","email":"awelchman1y@deviantart.com","job":"Product Engineer","timestamp":"2022-07-04T03:37:27Z"}
{"id":72,"first_name":"Marleah","email":"mwale1z@youtube.com","job":"Nurse Practicioner","timestamp":"2022-10-07T01:50:50Z"}
{"id":73,"first_name":"Tammi","email":"tcallow20@quantcast.com","job":"Registered Nurse","timestamp":"2022-06-10T20:24:59Z"}
{"id":74,"first_name":"Wye","email":"wkidner21@themeforest.net","job":"Tax Accountant","timestamp":"2021-12-20T08:54:36Z"}
{"id":75,"first_name":"Katherine","email":"kburnep22@histats.com","job":"Analyst Programmer","timestamp":"2022-07-02T18:17:33Z"}
{"id":76,"first_name":"Charita","email":"cmuccino23@usatoday.com","job":"Staff Scientist","timestamp":"2022-10-14T20:40:12Z"}
{"id":77,"first_name":"Brook","email":"btoquet24@cmu.edu","job":"Structural Analysis Engineer","timestamp":"2022-02-24T07:42:26Z"}
{"id":78,"first_name":"Lexine","email":"lface25@telegraph.co.uk","job":"Health Coach III","timestamp":"2022-08-14T05:15:07Z"}
{"id":79,"first_name":"Corri","email":"cdavidy26@tiny.cc","job":"Food Chemist","timestamp":"2022-11-16T00:04:23Z"}
{"id":80,"first_name":"Kelcey","email":"ksargeaunt27@sakura.ne.jp","job":"Associate Professor","timestamp":"2022-11-24T13:06:33Z"}
{"id":81,"first_name":"Tracy","email":"tbennetto28@goo.ne.jp","job":"VP Quality Control","timestamp":"2022-11-20T11:49:26Z"}
{"id":82,"first_name":"Edmon","email":"ehuxtable29@rambler.ru","job":"Environmental Specialist","timestamp":"2022-07-31T23:16:51Z"}
{"id":83,"first_name":"Tessy","email":"tsargeant2a@shop-pro.jp","job":"Desktop Support Technician","timestamp":"2022-05-15T12:07:04Z"}
{"id":84,"first_name":"Chev","email":"ctenbrug2b@topsy.com","job":"Senior Quality Engineer","timestamp":"2021-12-09T09:41:20Z"}
{"id":85,"first_name":"Olivero","email":"oseebright2c@nba.com","job":"Structural Analysis Engineer","timestamp":"2022-09-19T23:40:16Z"}
{"id":86,"first_name":"Oswald","email":"oswash2d@fotki.com","job":"Occupational Therapist","timestamp":"2022-08-06T13:17:22Z"}
{"id":87,"first_name":"Laurent","email":"lsineath2e@a8.net","job":"Web Designer IV","timestamp":"2022-09-29T13:15:18Z"}
{"id":88,"first_name":"Mehetabel","email":"mfendt2f@bing.com","job":"Assistant Media Planner","timestamp":"2021-12-31T08:22:47Z"}
{"id":89,"first_name":"Jaime","email":"jrichfield2g@europa.eu","job":"Staff Scientist","timestamp":"2022-10-30T10:50:50Z"}
{"id":90,"first_name":"Grissel","email":"ggell2h@bluehost.com","job":"Speech Pathologist","timestamp":"2022-02-26T08:04:19Z"}
{"id":91,"first_name":"Fanchette","email":"fgooderham2i@123-reg.co.uk","job":"Professor","timestamp":"2022-02-04T06:06:20Z"}
{"id":92,"first_name":"Dov","email":"dcurston2j@jigsy.com","job":"Payment Adjustment Coordinator","timestamp":"2022-02-18T00:39:48Z"}
{"id":93,"first_name":"Fawn","email":"fcazin2k@mac.com","job":"Legal Assistant","timestamp":"2022-10-06T14:22:24Z"}
{"id":94,"first_name":"Emilio","email":"esaphin2l@china.com.cn","job":"Systems Administrator III","timestamp":"2022-05-18T14:52:18Z"}
{"id":95,"first_name":"Lisabeth","email":"lgarrand2m@mlb.com","job":"Recruiter","timestamp":"2022-08-13T12:08:41Z"}
{"id":96,"first_name":"Stanwood","email":"sschruur2n@phpbb.com","job":"Senior Editor","timestamp":"2022-06-08T15:49:39Z"}
{"id":97,"first_name":"Elke","email":"eoliverpaull2o@msu.edu","job":"Research Assistant II","timestamp":"2022-11-26T20:49:01Z"}
{"id":98,"first_name":"Daisey","email":"dpadfield2p@chronoengine.com","job":"VP Marketing","timestamp":"2022-09-22T13:51:47Z"}
{"id":99,"first_name":"Hirsch","email":"htrembley2q@hibu.com","job":"Environmental Specialist","timestamp":"2022-06-11T18:27:56Z"}
{"id":100,"first_name":"Karlee","email":"kgates2r@vistaprint.com","job":"Media Manager III","timestamp":"2022-04-18T22:02:59Z"}
{"id":101,"first_name":"Kylie","email":"kklimov2s@cmu.edu","job":"Senior Financial Analyst","timestamp":"2022-03-20T06:18:08Z"}
{"id":102,"first_name":"Lorrie","email":"lsmewings2t@weibo.com","job":"Mechanical Systems Engineer","timestamp":"2022-11-22T01:27:34Z"}
{"id":103,"first_name":"Lilli","email":"lsanto2u@wired.com","job":"Research Nurse","timestamp":"2022-02-25T04:53:03Z"}
{"id":104,"first_name":"Julieta","email":"jdyers2v@un.org","job":"Associate Professor","timestamp":"2022-08-17T09:32:36Z"}
{"id":105,"first_name":"Uriel","email":"uqualtro2w@mlb.com","job":"Budget/Accounting Analyst II","timestamp":"2022-08-09T14:45:37Z"}
{"id":106,"first_name":"Irvine","email":"ikleinschmidt2x@weather.com","job":"Operator","timestamp":"2022-03-29T18:17:15Z"}
{"id":107,"first_name":"Elaine","email":"eglennon2y@jigsy.com","job":"Speech Pathologist","timestamp":"2022-09-08T11:23:44Z"}
{"id":108,"first_name":"Gaspar","email":"gmaass2z@sfgate.com","job":"Community Outreach Specialist","timestamp":"2022-04-10T07:49:11Z"}
{"id":109,"first_name":"Josy","email":"jchick30@merriam-webster.com","job":"Electrical Engineer","timestamp":"2022-06-22T22:33:43Z"}
{"id":110,"first_name":"Dawna","email":"ddinsale31@nydailynews.com","job":"Associate Professor","timestamp":"2022-12-02T13:10:31Z"}
{"id":111,"first_name":"Aldo","email":"alindsell32@ow.ly","job":"Engineer IV","timestamp":"2022-05-03T01:50:41Z"}
{"id":112,"first_name":"Wade","email":"wparkyns33@cpanel.net","job":"Project Manager","timestamp":"2022-03-31T20:28:42Z"}
{"id":113,"first_name":"Aundrea","email":"ahaggith34@prnewswire.com","job":"Engineer I","timestamp":"2022-11-05T23:37:37Z"}
{"id":114,"first_name":"Tuck","email":"tnasi35@netvibes.com","job":"Staff Scientist","timestamp":"2022-03-16T15:50:38Z"}
{"id":115,"first_name":"Kirby","email":"kworsalls36@cargocollective.com","job":"Recruiting Manager","timestamp":"2022-06-25T06:27:40Z"}
{"id":116,"first_name":"Lauren","email":"lmenghi37@rambler.ru","job":"Software Engineer III","timestamp":"2022-01-25T07:16:48Z"}
{"id":117,"first_name":"Pearce","email":"pgleed38@hubpages.com","job":"Tax Accountant","timestamp":"2022-05-05T18:33:52Z"}
{"id":118,"first_name":"Vlad","email":"vbensley39@prweb.com","job":"Help Desk Operator","timestamp":"2022-05-12T17:41:17Z"}
{"id":119,"first_name":"Uriah","email":"ustaniford3a@timesonline.co.uk","job":"Staff Accountant III","timestamp":"2022-05-23T06:37:31Z"}
{"id":120,"first_name":"Frederic","email":"fchataignier3b@utexas.edu","job":"Cost Accountant","timestamp":"2022-08-21T19:45:23Z"}
{"id":121,"first_name":"Nell","email":"ngniewosz3c@cnn.com","job":"Librarian","timestamp":"2022-01-04T15:59:26Z"}
{"id":122,"first_name":"Baxy","email":"bcockings3d@dmoz.org","job":"Product Engineer","timestamp":"2022-12-04T03:13:12Z"}
{"id":123,"first_name":"Shadow","email":"squade3e@sciencedaily.com","job":"Research Assistant I","timestamp":"2021-12-14T07:33:10Z"}
{"id":124,"first_name":"Selene","email":"ssammut3f@51.la","job":"Nurse Practicioner","timestamp":"2021-12-23T23:00:29Z"}
{"id":125,"first_name":"Wendye","email":"wsimons3g@phpbb.com","job":"Internal Auditor","timestamp":"2021-12-31T22:20:21Z"}
{"id":126,"first_name":"Cobby","email":"cmanton3h@rediff.com","job":"Analyst Programmer","timestamp":"2022-05-03T06:36:31Z"}
{"id":127,"first_name":"Sharyl","email":"sdowner3i@wikipedia.org","job":"Help Desk Technician","timestamp":"2022-11-18T09:17:46Z"}
{"id":128,"first_name":"Sallyanne","email":"slinley3j@woothemes.com","job":"VP Marketing","timestamp":"2022-03-03T20:52:39Z"}
{"id":129,"first_name":"Christophe","email":"cvelti3k@youku.com","job":"Director of Sales","timestamp":"2022-08-18T14:15:52Z"}
{"id":130,"first_name":"Dion","email":"dcoburn3l@booking.com","job":"Junior Executive","timestamp":"2022-10-16T14:04:46Z"}
{"id":131,"first_name":"Terencio","email":"thandmore3m@utexas.edu","job":"Director of Sales","timestamp":"2022-08-15T01:47:28Z"}
{"id":132,"first_name":"Tiler","email":"tvala3n@godaddy.com","job":"Geologist III","timestamp":"2022-10-18T05:08:00Z"}
{"id":133,"first_name":"Lelia","email":"lleddie3o@youku.com","job":"VP Accounting","timestamp":"2022-11-08T09:30:26Z"}
{"id":134,"first_name":"Dawna","email":"dcamellini3p@hibu.com","job":"Environmental Tech","timestamp":"2022-06-26T10:52:54Z"}
{"id":135,"first_name":"Nickolas","email":"ngosling3q@ox.ac.uk","job":"Director of Sales","timestamp":"2021-12-28T16:28:31Z"}
{"id":136,"first_name":"Mufinella","email":"mkleiner3r@51.la","job":"Automation Specialist III","timestamp":"2022-04-26T08:05:51Z"}
{"id":137,"first_name":"Hoebart","email":"hharses3s@cbc.ca","job":"Business Systems Development Analyst","timestamp":"2022-05-16T14:01:59Z"}
{"id":138,"first_name":"Brier","email":"bstivey3t@hatena.ne.jp","job":"Electrical Engineer","timestamp":"2022-08-17T04:40:43Z"}
{"id":139,"first_name":"Hynda","email":"hbloore3u@shareasale.com","job":"Media Manager III","timestamp":"2022-01-26T18:01:30Z"}
{"id":140,"first_name":"Maure","email":"mfrankis3v@mashable.com","job":"Software Engineer I","timestamp":"2022-10-12T16:15:44Z"}
{"id":141,"first_name":"Kendra","email":"kgrisenthwaite3w@yandex.ru","job":"Environmental Tech","timestamp":"2022-08-20T21:52:08Z"}
{"id":142,"first_name":"Rand","email":"rrowledge3x@themeforest.net","job":"Librarian","timestamp":"2022-05-30T11:46:14Z"}
{"id":143,"first_name":"Paulie","email":"pmerit3y@hud.gov","job":"Financial Analyst","timestamp":"2022-04-01T18:06:45Z"}
{"id":144,"first_name":"Lynn","email":"lcrannach3z@weibo.com","job":"Software Test Engineer II","timestamp":"2022-03-24T14:41:03Z"}
{"id":145,"first_name":"Petronella","email":"pjanic40@infoseek.co.jp","job":"Chief Design Engineer","timestamp":"2022-06-19T21:29:51Z"}
{"id":146,"first_name":"Alberik","email":"abodleigh41@uiuc.edu","job":"Nurse","timestamp":"2022-06-17T03:57:06Z"}
{"id":147,"first_name":"Joshuah","email":"jcecchi42@businessinsider.com","job":"Budget/Accounting Analyst III","timestamp":"2022-03-27T02:57:33Z"}
{"id":148,"first_name":"Chicky","email":"cbraxton43@utexas.edu","job":"Senior Quality Engineer","timestamp":"2022-10-15T12:21:30Z"}
{"id":149,"first_name":"Glyn","email":"ggauvin44@ezinearticles.com","job":"Software Consultant","timestamp":"2021-12-11T23:15:12Z"}
{"id":150,"first_name":"Barnabe","email":"bemery45@bluehost.com","job":"Marketing Manager","timestamp":"2022-06-11T14:14:01Z"}
{"id":151,"first_name":"Paulina","email":"pchettle46@cornell.edu","job":"Geologist III","timestamp":"2022-01-07T14:29:30Z"}
{"id":152,"first_name":"Clarisse","email":"csharer47@indiegogo.com","job":"Junior Executive","timestamp":"2022-01-12T21:10:23Z"}
{"id":153,"first_name":"Mona","email":"mlakeland48@globo.com","job":"Accountant I","timestamp":"2022-12-04T20:07:31Z"}
{"id":154,"first_name":"Emogene","email":"ewillison49@cam.ac.uk","job":"Food Chemist","timestamp":"2022-06-28T15:40:59Z"}
{"id":155,"first_name":"Dael","email":"dbryns4a@nydailynews.com","job":"Geological Engineer","timestamp":"2022-09-24T00:17:27Z"}
{"id":156,"first_name":"Mel","email":"mbahl4b@tumblr.com","job":"VP Marketing","timestamp":"2022-06-12T01:10:19Z"}
{"id":157,"first_name":"Marlene","email":"mferrao4c@seesaa.net","job":"Systems Administrator IV","timestamp":"2022-01-13T07:40:49Z"}
{"id":158,"first_name":"Guenna","email":"gpalethorpe4d@whitehouse.gov","job":"Senior Sales Associate","timestamp":"2022-07-21T04:39:45Z"}
{"id":159,"first_name":"Keri","email":"kgionettitti4e@bravesites.com","job":"Operator","timestamp":"2022-09-03T00:08:51Z"}
{"id":160,"first_name":"Collen","email":"cmacterrelly4f@theatlantic.com","job":"Assistant Professor","timestamp":"2022-09-30T06:34:38Z"}
{"id":161,"first_name":"Arabelle","email":"adoree4g@blinklist.com","job":"Analyst Programmer","timestamp":"2022-04-18T00:16:37Z"}
{"id":162,"first_name":"Aridatha","email":"aalcido4h@xrea.com","job":"Programmer Analyst IV","timestamp":"2022-05-31T04:17:35Z"}
{"id":163,"first_name":"Roxine","email":"rwarbeys4i@paypal.com","job":"Biostatistician IV","timestamp":"2022-11-17T07:13:36Z"}
{"id":164,"first_name":"Elga","email":"ewelsby4j@parallels.com","job":"Financial Advisor","timestamp":"2022-08-09T11:01:09Z"}
{"id":165,"first_name":"Anna","email":"astovine4k@wikispaces.com","job":"Marketing Assistant","timestamp":"2022-04-18T20:09:47Z"}
{"id":166,"first_name":"Ailyn","email":"aquick4l@wordpress.com","job":"VP Marketing","timestamp":"2022-10-16T06:58:38Z"}
{"id":167,"first_name":"Robinet","email":"reddington4m@dailymotion.com","job":"Help Desk Technician","timestamp":"2021-12-17T13:53:29Z"}
{"id":168,"first_name":"Berty","email":"bhauxley4n@sun.com","job":"Safety Technician III","timestamp":"2022-09-09T17:16:53Z"}
{"id":169,"first_name":"Hedwiga","email":"hmassen4o@1und1.de","job":"Senior Developer","timestamp":"2022-06-18T19:08:16Z"}
{"id":170,"first_name":"Marlow","email":"mugo4p@time.com","job":"Assistant Manager","timestamp":"2022-11-21T09:02:51Z"}
{"id":171,"first_name":"Lindsay","email":"llangthorne4q@ameblo.jp","job":"Health Coach II","timestamp":"2022-05-24T18:16:34Z"}
{"id":172,"first_name":"Katie","email":"kdorney4r@soundcloud.com","job":"Staff Accountant I","timestamp":"2022-01-30T18:38:41Z"}
{"id":173,"first_name":"Hilary","email":"hcattach4s@meetup.com","job":"VP Product Management","timestamp":"2022-04-08T21:28:37Z"}
{"id":174,"first_name":"Ardine","email":"aparram4t@irs.gov","job":"Legal Assistant","timestamp":"2022-07-27T14:12:56Z"}
{"id":175,"first_name":"Mable","email":"mriccardo4u@aboutads.info","job":"Assistant Media Planner","timestamp":"2022-10-03T22:14:39Z"}
{"id":176,"first_name":"Cairistiona","email":"csparwell4v@instagram.com","job":"VP Sales","timestamp":"2022-10-02T20:22:11Z"}
{"id":177,"first_name":"Gunther","email":"gbradden4w@google.com.hk","job":"Research Associate","timestamp":"2022-08-07T06:19:07Z"}
{"id":178,"first_name":"Filide","email":"fkingswood4x@narod.ru","job":"Associate Professor","timestamp":"2022-09-14T02:24:37Z"}
{"id":179,"first_name":"Jacinda","email":"jgribbins4y@quantcast.com","job":"Nurse Practicioner","timestamp":"2022-02-21T19:24:53Z"}
{"id":180,"first_name":"Fay","email":"fizakson4z@i2i.jp","job":"Tax Accountant","timestamp":"2022-01-06T01:57:09Z"}
{"id":181,"first_name":"Trish","email":"tgurko50@dropbox.com","job":"Research Associate","timestamp":"2022-08-26T15:02:51Z"}
{"id":182,"first_name":"Chrotoem","email":"claviss51@bluehost.com","job":"VP Product Management","timestamp":"2022-10-14T17:04:29Z"}
{"id":183,"first_name":"Drusilla","email":"dvern52@upenn.edu","job":"Web Designer II","timestamp":"2022-10-13T00:54:08Z"}
{"id":184,"first_name":"Kent","email":"kleahair53@theglobeandmail.com","job":"Recruiter","timestamp":"2022-01-07T05:32:42Z"}
{"id":185,"first_name":"Abagail","email":"aparadin54@netlog.com","job":"Editor","timestamp":"2022-06-02T00:24:32Z"}
{"id":186,"first_name":"Agosto","email":"atwinberrow55@answers.com","job":"Editor","timestamp":"2022-01-29T09:42:02Z"}
{"id":187,"first_name":"Danyette","email":"dbecker56@jigsy.com","job":"Legal Assistant","timestamp":"2022-05-07T01:24:37Z"}
{"id":188,"first_name":"Waverly","email":"wspinelli57@umn.edu","job":"Environmental Tech","timestamp":"2022-09-29T06:05:36Z"}
{"id":189,"first_name":"Basil","email":"bdobel58@twitpic.com","job":"Senior Financial Analyst","timestamp":"2022-01-21T06:37:20Z"}
{"id":190,"first_name":"Catharine","email":"cconnew59@xing.com","job":"Clinical Specialist","timestamp":"2022-02-17T07:17:47Z"}
{"id":191,"first_name":"Edd","email":"edezamudio5a@intel.com","job":"Chief Design Engineer","timestamp":"2022-09-17T12:49:36Z"}
{"id":192,"first_name":"Aura","email":"aserris5b@google.it","job":"Internal Auditor","timestamp":"2022-02-24T22:25:08Z"}
{"id":193,"first_name":"Tomi","email":"tyarnton5c@g.co","job":"Project Manager","timestamp":"2022-09-14T23:50:00Z"}
{"id":194,"first_name":"Claudianus","email":"cskerratt5d@va.gov","job":"Environmental Tech","timestamp":"2022-11-11T06:48:47Z"}
{"id":195,"first_name":"Christine","email":"cmiliffe5e@fda.gov","job":"Environmental Specialist","timestamp":"2021-12-30T16:41:26Z"}
{"id":196,"first_name":"Neda","email":"nlicciardello5f@ameblo.jp","job":"Database Administrator III","timestamp":"2022-11-26T02:35:02Z"}
{"id":197,"first_name":"Avram","email":"abeeston5g@acquirethisname.com","job":"Health Coach III","timestamp":"2022-11-20T12:15:09Z"}
{"id":198,"first_name":"Murry","email":"madamkiewicz5h@time.com","job":"Developer II","timestamp":"2022-04-04T04:01:09Z"}
{"id":199,"first_name":"Oralia","email":"odener5i@amazon.de","job":"Financial Advisor","timestamp":"2022-06-08T15:04:48Z"}
{"id":200,"first_name":"Pearce","email":"pabramovitz5j@sciencedirect.com","job":"Assistant Professor","timestamp":"2022-01-04T10:36:44Z"}
{"id":201,"first_name":"Jesse","email":"jseares5k@elegantthemes.com","job":"Civil Engineer","timestamp":"2022-03-28T14:24:48Z"}
{"id":202,"first_name":"Jedediah","email":"jconstantinou5l@wsj.com","job":"Assistant Manager","timestamp":"2022-03-05T20:32:52Z"}
{"id":203,"first_name":"Prescott","email":"pmatuska5m@miitbeian.gov.cn","job":"Quality Engineer","timestamp":"2021-12-24T15:53:01Z"}
{"id":204,"first_name":"Germaine","email":"ghadny5n@sakura.ne.jp","job":"Nuclear Power Engineer","timestamp":"2022-11-23T20:50:04Z"}
{"id":205,"first_name":"Merle","email":"mgillmore5o@nsw.gov.au","job":"Sales Associate","timestamp":"2022-07-17T06:35:23Z"}
{"id":206,"first_name":"Tiphanie","email":"tjekel5p@msn.com","job":"Financial Advisor","timestamp":"2022-09-17T06:38:25Z"}
{"id":207,"first_name":"Abbott","email":"adauney5q@wsj.com","job":"Business Systems Development Analyst","timestamp":"2022-02-26T17:55:00Z"}
{"id":208,"first_name":"Flor","email":"fbuche5r@kickstarter.com","job":"Account Representative II","timestamp":"2022-06-30T12:59:37Z"}
{"id":209,"first_name":"Kandace","email":"kgavin5s@ovh.net","job":"Professor","timestamp":"2022-06-15T22:27:43Z"}
{"id":210,"first_name":"Raimund","email":"rmcpeck5t@weibo.com","job":"GIS Technical Architect","timestamp":"2021-12-25T09:56:17Z"}
{"id":211,"first_name":"Archibold","email":"atunmore5u@privacy.gov.au","job":"VP Accounting","timestamp":"2022-01-30T06:27:36Z"}
{"id":212,"first_name":"Don","email":"docrigane5v@squidoo.com","job":"Speech Pathologist","timestamp":"2022-03-28T05:37:07Z"}
{"id":213,"first_name":"Zuzana","email":"zreynard5w@google.it","job":"Desktop Support Technician","timestamp":"2022-08-09T01:13:52Z"}
{"id":214,"first_name":"Grantley","email":"glapley5x@youtube.com","job":"Product Engineer","timestamp":"2022-05-21T22:28:10Z"}
{"id":215,"first_name":"Granthem","email":"gdrover5y@technorati.com","job":"VP Product Management","timestamp":"2022-03-09T21:39:04Z"}
{"id":216,"first_name":"Shaina","email":"sgrinnov5z@usa.gov","job":"Developer III","timestamp":"2022-07-01T13:50:43Z"}
{"id":217,"first_name":"Giovanna","email":"gleeburn60@kickstarter.com","job":"Senior Developer","timestamp":"2022-09-03T13:08:03Z"}
{"id":218,"first_name":"Dehlia","email":"dguinness61@hc360.com","job":"Associate Professor","timestamp":"2021-12-15T19:00:10Z"}
{"id":219,"first_name":"Cinda","email":"cdunklee62@topsy.com","job":"Actuary","timestamp":"2022-04-11T05:24:27Z"}
{"id":220,"first_name":"Kimball","email":"kbortolutti63@unicef.org","job":"Data Coordiator","timestamp":"2022-07-02T21:45:40Z"}
{"id":221,"first_name":"Daffie","email":"dlivingstone64@pbs.org","job":"Graphic Designer","timestamp":"2022-02-21T10:00:07Z"}
{"id":222,"first_name":"Hermina","email":"hmacglory65@360.cn","job":"Geological Engineer","timestamp":"2022-09-17T07:01:59Z"}
{"id":223,"first_name":"Robinet","email":"rcook66@fema.gov","job":"Web Developer I","timestamp":"2021-12-25T06:48:04Z"}
{"id":224,"first_name":"Cedric","email":"cgeroldini67@arizona.edu","job":"Engineer III","timestamp":"2022-10-19T01:36:02Z"}
{"id":225,"first_name":"Daune","email":"dalgar68@creativecommons.org","job":"Assistant Media Planner","timestamp":"2022-01-15T03:59:23Z"}
{"id":226,"first_name":"Susanne","email":"sgeist69@nsw.gov.au","job":"Structural Analysis Engineer","timestamp":"2022-02-03T18:50:39Z"}
{"id":227,"first_name":"Sibelle","email":"skenion6a@sciencedaily.com","job":"Community Outreach Specialist","timestamp":"2021-12-20T23:39:47Z"}
{"id":228,"first_name":"Tabb","email":"tcubbit6b@shinystat.com","job":"Programmer IV","timestamp":"2022-04-06T22:19:21Z"}
{"id":229,"first_name":"Shirley","email":"shardstaff6c@furl.net","job":"Developer II","timestamp":"2022-09-03T18:49:43Z"}
{"id":230,"first_name":"Sigvard","email":"smaffia6d@uol.com.br","job":"Software Test Engineer II","timestamp":"2022-11-06T03:16:32Z"}
{"id":231,"first_name":"Maryjo","email":"mcamblin6e@symantec.com","job":"Paralegal","timestamp":"2022-09-27T18:02:30Z"}
{"id":232,"first_name":"Jdavie","email":"jishaki6f@mozilla.org","job":"Computer Systems Analyst III","timestamp":"2022-10-13T21:42:19Z"}
{"id":233,"first_name":"Louie","email":"lmoresby6g@zdnet.com","job":"Nuclear Power Engineer","timestamp":"2022-09-15T23:17:28Z"}
{"id":234,"first_name":"Merla","email":"mpietraszek6h@twitpic.com","job":"Accounting Assistant I","timestamp":"2022-09-04T11:29:39Z"}
{"id":235,"first_name":"Nealon","email":"ntertre6i@free.fr","job":"Safety Technician IV","timestamp":"2022-10-25T01:34:35Z"}
{"id":236,"first_name":"Riordan","email":"rhark6j@hhs.gov","job":"Account Representative III","timestamp":"2022-08-28T09:49:55Z"}
{"id":237,"first_name":"Borg","email":"bwettern6k@fastcompany.com","job":"Engineer I","timestamp":"2022-11-06T21:22:23Z"}
{"id":238,"first_name":"Micki","email":"mgange6l@live.com","job":"Dental Hygienist","timestamp":"2022-10-23T03:47:59Z"}
{"id":239,"first_name":"Werner","email":"wledgeway6m@vistaprint.com","job":"Payment Adjustment Coordinator","timestamp":"2022-06-27T08:29:47Z"}
{"id":240,"first_name":"Aundrea","email":"agirt6n@sbwire.com","job":"Electrical Engineer","timestamp":"2022-07-23T13:19:16Z"}
{"id":241,"first_name":"Benedetto","email":"bharmon6o@google.pl","job":"Technical Writer","timestamp":"2022-11-19T14:02:05Z"}
{"id":242,"first_name":"Cristal","email":"cellington6p@ask.com","job":"Editor","timestamp":"2022-07-01T23:57:52Z"}
{"id":243,"first_name":"Ebonee","email":"ebartolomeo6q@goo.ne.jp","job":"Account Executive","timestamp":"2022-01-28T09:49:08Z"}
{"id":244,"first_name":"Bern","email":"bturrell6r@topsy.com","job":"Research Associate","timestamp":"2022-03-06T14:31:58Z"}
{"id":245,"first_name":"Kenny","email":"kruggs6s@nba.com","job":"Software Test Engineer III","timestamp":"2022-05-23T21:28:39Z"}
{"id":246,"first_name":"Wilhelmina","email":"wfandrey6t@flavors.me","job":"Actuary","timestamp":"2022-08-29T02:19:02Z"}
{"id":247,"first_name":"Aurelea","email":"acoverdill6u@furl.net","job":"Community Outreach Specialist","timestamp":"2022-06-09T09:59:42Z"}
{"id":248,"first_name":"Aaren","email":"asautter6v@chicagotribune.com","job":"GIS Technical Architect","timestamp":"2022-09-06T22:52:21Z"}
{"id":249,"first_name":"Alva","email":"achillingsworth6w@salon.com","job":"Community Outreach Specialist","timestamp":"2022-02-15T03:57:24Z"}
{"id":250,"first_name":"Coretta","email":"cdenormanville6x@nbcnews.com","job":"Graphic Designer","timestamp":"2022-11-17T23:47:28Z"}
{"id":251,"first_name":"Lem","email":"lcarlesso6y@hibu.com","job":"Clinical Specialist","timestamp":"2022-08-18T16:41:37Z"}
{"id":252,"first_name":"Alejandro","email":"aloughlin6z@hibu.com","job":"Operator","timestamp":"2022-10-15T01:17:03Z"}
{"id":253,"first_name":"Benetta","email":"bbuttrey70@lulu.com","job":"Speech Pathologist","timestamp":"2022-03-02T20:29:32Z"}
{"id":254,"first_name":"Ralina","email":"rsterte71@sun.com","job":"Environmental Specialist","timestamp":"2022-11-21T02:40:25Z"}
{"id":255,"first_name":"Serena","email":"smoulds72@globo.com","job":"VP Marketing","timestamp":"2022-07-20T12:10:53Z"}
{"id":256,"first_name":"Bonnie","email":"bthreader73@over-blog.com","job":"Financial Analyst","timestamp":"2022-04-26T20:51:46Z"}
{"id":257,"first_name":"Joelynn","email":"jlangham74@discovery.com","job":"Chemical Engineer","timestamp":"2022-01-07T19:00:00Z"}
{"id":258,"first_name":"Otha","email":"ocaselli75@wikispaces.com","job":"Actuary","timestamp":"2022-07-04T17:16:53Z"}
{"id":259,"first_name":"Maryann","email":"mbenn76@clickbank.net","job":"Office Assistant III","timestamp":"2022-06-19T05:43:08Z"}
{"id":260,"first_name":"Ryun","email":"rgwalter77@about.me","job":"Quality Control Specialist","timestamp":"2022-06-18T08:19:32Z"}
{"id":261,"first_name":"Letisha","email":"linns78@tinypic.com","job":"Operator","timestamp":"2022-03-27T08:33:52Z"}
{"id":262,"first_name":"Anni","email":"awhale79@sciencedirect.com","job":"Graphic Designer","timestamp":"2022-03-02T13:47:31Z"}
{"id":263,"first_name":"Erek","email":"ekoppen7a@cafepress.com","job":"Geological Engineer","timestamp":"2021-12-29T08:26:09Z"}
{"id":264,"first_name":"Guendolen","email":"gharvatt7b@abc.net.au","job":"Software Engineer I","timestamp":"2022-06-05T16:59:36Z"}
{"id":265,"first_name":"Byram","email":"bfarn7c@icq.com","job":"VP Quality Control","timestamp":"2022-06-27T09:53:33Z"}
{"id":266,"first_name":"Carine","email":"cshallo7d@telegraph.co.uk","job":"Environmental Tech","timestamp":"2022-05-02T19:02:15Z"}
{"id":267,"first_name":"Nina","email":"nmiguet7e@g.co","job":"Office Assistant II","timestamp":"2022-06-13T09:15:28Z"}
{"id":268,"first_name":"Anni","email":"ademschke7f@acquirethisname.com","job":"Sales Representative","timestamp":"2022-08-03T09:56:07Z"}
{"id":269,"first_name":"Leilah","email":"lhorrod7g@nps.gov","job":"Marketing Manager","timestamp":"2022-04-06T00:10:25Z"}
{"id":270,"first_name":"Emmit","email":"elobbe7h@liveinternet.ru","job":"Dental Hygienist","timestamp":"2022-02-22T10:18:21Z"}
{"id":271,"first_name":"Caprice","email":"ccaldairou7i@behance.net","job":"Web Developer III","timestamp":"2022-11-10T18:43:09Z"}
{"id":272,"first_name":"Delly","email":"djefferys7j@comsenz.com","job":"Accounting Assistant III","timestamp":"2022-07-06T00:39:58Z"}
{"id":273,"first_name":"Ninnetta","email":"ngarton7k@cargocollective.com","job":"Web Designer IV","timestamp":"2022-04-29T12:06:43Z"}
{"id":274,"first_name":"Gweneth","email":"gdowell7l@timesonline.co.uk","job":"Internal Auditor","timestamp":"2021-12-13T07:25:58Z"}
{"id":275,"first_name":"Tuckie","email":"tpailin7m@bandcamp.com","job":"Accounting Assistant IV","timestamp":"2022-10-05T08:08:07Z"}
{"id":276,"first_name":"Dorian","email":"ddrews7n@marriott.com","job":"Design Engineer","timestamp":"2022-07-13T22:58:08Z"}
{"id":277,"first_name":"Sadella","email":"stofanini7o@so-net.ne.jp","job":"Graphic Designer","timestamp":"2022-04-27T23:58:37Z"}
{"id":278,"first_name":"Kerby","email":"klarrett7p@slideshare.net","job":"Environmental Tech","timestamp":"2022-09-18T11:27:04Z"}
{"id":279,"first_name":"Roberto","email":"rbrabbs7q@nationalgeographic.com","job":"Programmer Analyst II","timestamp":"2022-01-31T08:57:00Z"}
{"id":280,"first_name":"Avery","email":"aweatherdon7r@soundcloud.com","job":"Quality Control Specialist","timestamp":"2022-09-04T01:22:07Z"}
{"id":281,"first_name":"Ammamaria","email":"awaddie7s@msu.edu","job":"Sales Representative","timestamp":"2022-05-20T12:28:49Z"}
{"id":282,"first_name":"Atalanta","email":"awonter7t@miibeian.gov.cn","job":"Information Systems Manager","timestamp":"2022-08-07T12:32:10Z"}
{"id":283,"first_name":"Matilde","email":"mgarric7u@zimbio.com","job":"Account Representative III","timestamp":"2022-07-11T20:38:19Z"}
{"id":284,"first_name":"Sibylle","email":"starbett7v@chicagotribune.com","job":"Recruiter","timestamp":"2022-02-06T16:23:04Z"}
{"id":285,"first_name":"Honey","email":"hobrian7w@latimes.com","job":"Account Executive","timestamp":"2022-05-18T19:12:26Z"}
{"id":286,"first_name":"Ulysses","email":"uhutson7x@walmart.com","job":"Sales Representative","timestamp":"2021-12-09T23:19:28Z"}
{"id":287,"first_name":"Jasper","email":"jmacpaik7y@zdnet.com","job":"Information Systems Manager","timestamp":"2022-08-02T21:42:22Z"}
{"id":288,"first_name":"Bessy","email":"bburker7z@theglobeandmail.com","job":"Quality Control Specialist","timestamp":"2022-03-24T08:24:07Z"}
{"id":289,"first_name":"Belle","email":"bhasnney80@japanpost.jp","job":"Health Coach I","timestamp":"2022-10-18T10:42:23Z"}
{"id":290,"first_name":"Elia","email":"emcilwain81@sfgate.com","job":"Research Associate","timestamp":"2022-09-09T02:42:53Z"}
{"id":291,"first_name":"Ed","email":"ejorczyk82@t-online.de","job":"Graphic Designer","timestamp":"2022-06-13T11:22:03Z"}
{"id":292,"first_name":"Sandor","email":"smeller83@cafepress.com","job":"Dental Hygienist","timestamp":"2022-06-17T00:53:01Z"}
{"id":293,"first_name":"Wallie","email":"wroe84@gravatar.com","job":"Occupational Therapist","timestamp":"2022-05-28T21:53:57Z"}
{"id":294,"first_name":"Ladonna","email":"lhearst85@tiny.cc","job":"Automation Specialist IV","timestamp":"2022-07-25T13:50:29Z"}
{"id":295,"first_name":"Michael","email":"mgilardi86@chicagotribune.com","job":"Graphic Designer","timestamp":"2022-11-29T12:09:37Z"}
{"id":296,"first_name":"Marion","email":"mbusfield87@ifeng.com","job":"Sales Associate","timestamp":"2022-01-12T02:10:19Z"}
{"id":297,"first_name":"Ode","email":"ocoxon88@csmonitor.com","job":"Environmental Specialist","timestamp":"2022-06-28T05:16:21Z"}
{"id":298,"first_name":"Bink","email":"bcrossan89@t.co","job":"Chemical Engineer","timestamp":"2022-03-19T19:09:19Z"}
{"id":299,"first_name":"Royce","email":"rduffie8a@de.vu","job":"Office Assistant II","timestamp":"2022-04-26T13:21:14Z"}
{"id":300,"first_name":"Thain","email":"tannakin8b@addtoany.com","job":"Business Systems Development Analyst","timestamp":"2022-09-18T22:11:03Z"}
{"id":301,"first_name":"Clarine","email":"ccheal8c@alibaba.com","job":"Marketing Manager","timestamp":"2022-01-08T20:37:46Z"}
{"id":302,"first_name":"Garrard","email":"ggobat8d@toplist.cz","job":"Staff Accountant II","timestamp":"2022-07-27T23:50:41Z"}
{"id":303,"first_name":"Kare","email":"kingliby8e@ycombinator.com","job":"Associate Professor","timestamp":"2022-08-17T01:56:29Z"}
{"id":304,"first_name":"Les","email":"ledis8f@yahoo.co.jp","job":"Mechanical Systems Engineer","timestamp":"2022-01-06T20:01:59Z"}
{"id":305,"first_name":"Jessie","email":"jcherrett8g@paginegialle.it","job":"VP Product Management","timestamp":"2022-07-03T06:55:11Z"}
{"id":306,"first_name":"Coreen","email":"cedmund8h@ask.com","job":"Software Test Engineer I","timestamp":"2021-12-12T07:49:12Z"}
{"id":307,"first_name":"Courtnay","email":"clowre8i@lycos.com","job":"Desktop Support Technician","timestamp":"2022-10-12T09:42:23Z"}
{"id":308,"first_name":"Isacco","email":"iesslemont8j@google.co.uk","job":"Help Desk Operator","timestamp":"2022-07-10T22:34:28Z"}
{"id":309,"first_name":"Tades","email":"tandrat8k@patch.com","job":"Accounting Assistant II","timestamp":"2022-04-14T12:38:29Z"}
{"id":310,"first_name":"Mitchael","email":"mlermouth8l@weather.com","job":"Senior Sales Associate","timestamp":"2022-03-12T21:48:44Z"}
{"id":311,"first_name":"Kurt","email":"kfleet8m@cisco.com","job":"Business Systems Development Analyst","timestamp":"2022-06-23T20:47:09Z"}
{"id":312,"first_name":"Miriam","email":"mchestney8n@un.org","job":"Statistician IV","timestamp":"2022-01-21T02:23:11Z"}
{"id":313,"first_name":"Galven","email":"gkennifick8o@4shared.com","job":"Quality Engineer","timestamp":"2022-11-18T01:30:03Z"}
{"id":314,"first_name":"Robinet","email":"restabrook8p@amazon.com","job":"Occupational Therapist","timestamp":"2022-03-23T20:24:42Z"}
{"id":315,"first_name":"Bren","email":"bmaase8q@privacy.gov.au","job":"Actuary","timestamp":"2022-03-30T13:52:45Z"}
{"id":316,"first_name":"Perl","email":"pmcglew8r@auda.org.au","job":"Paralegal","timestamp":"2022-02-21T15:31:21Z"}
{"id":317,"first_name":"Sada","email":"shartas8s@foxnews.com","job":"Associate Professor","timestamp":"2022-09-20T04:49:11Z"}
{"id":318,"first_name":"Trixie","email":"tgeydon8t@intel.com","job":"VP Sales","timestamp":"2022-01-23T05:52:12Z"}
{"id":319,"first_name":"Sauveur","email":"sgiscken8u@ezinearticles.com","job":"Engineer I","timestamp":"2022-08-10T04:16:30Z"}
{"id":320,"first_name":"Megan","email":"mlawleff8v@dyndns.org","job":"Developer II","timestamp":"2022-10-28T17:54:31Z"}
{"id":321,"first_name":"Gail","email":"gswalough8w@dagondesign.com","job":"Media Manager II","timestamp":"2022-08-23T09:04:46Z"}
{"id":322,"first_name":"Bradan","email":"bellinor8x@gov.uk","job":"Engineer IV","timestamp":"2022-05-09T21:16:31Z"}
{"id":323,"first_name":"Nan","email":"nlindeboom8y@apple.com","job":"Payment Adjustment Coordinator","timestamp":"2022-05-22T20:57:54Z"}
{"id":324,"first_name":"Horatia","email":"hgounard8z@mediafire.com","job":"VP Sales","timestamp":"2022-10-07T14:31:33Z"}
{"id":325,"first_name":"Thomasine","email":"tgoodlake90@amazon.com","job":"Budget/Accounting Analyst I","timestamp":"2022-09-02T05:15:30Z"}
{"id":326,"first_name":"Odetta","email":"odoige91@java.com","job":"VP Sales","timestamp":"2022-11-25T13:05:15Z"}
{"id":327,"first_name":"Ronda","email":"rblandford92@wisc.edu","job":"Biostatistician I","timestamp":"2022-04-19T23:39:29Z"}
{"id":328,"first_name":"Rhianon","email":"rgillett93@arstechnica.com","job":"Sales Associate","timestamp":"2022-02-20T10:38:28Z"}
{"id":329,"first_name":"Cordell","email":"cjannings94@chronoengine.com","job":"Geological Engineer","timestamp":"2022-05-23T02:44:43Z"}
{"id":330,"first_name":"Puff","email":"pmaylard95@g.co","job":"Clinical Specialist","timestamp":"2022-01-20T13:50:09Z"}
{"id":331,"first_name":"Mahalia","email":"mmanifield96@ca.gov","job":"Actuary","timestamp":"2022-06-13T07:10:18Z"}
{"id":332,"first_name":"Amalie","email":"apfleger97@shareasale.com","job":"VP Sales","timestamp":"2022-05-03T07:14:03Z"}
{"id":333,"first_name":"Hayden","email":"hsparkes98@prlog.org","job":"Human Resources Assistant I","timestamp":"2022-11-25T09:10:49Z"}
{"id":334,"first_name":"Penelope","email":"pmctavish99@earthlink.net","job":"Graphic Designer","timestamp":"2022-10-17T00:08:59Z"}
{"id":335,"first_name":"Malory","email":"mlogsdail9a@github.io","job":"Cost Accountant","timestamp":"2022-10-21T00:25:47Z"}
{"id":336,"first_name":"Bibbie","email":"bcutchie9b@yahoo.co.jp","job":"Chief Design Engineer","timestamp":"2022-04-19T16:36:54Z"}
{"id":337,"first_name":"Codie","email":"ccoundley9c@instagram.com","job":"Occupational Therapist","timestamp":"2022-08-29T03:37:02Z"}
{"id":338,"first_name":"Alick","email":"ahaggleton9d@moonfruit.com","job":"Statistician III","timestamp":"2021-12-28T21:14:48Z"}
{"id":339,"first_name":"Phil","email":"pmowatt9e@cocolog-nifty.com","job":"Help Desk Operator","timestamp":"2022-05-30T14:19:42Z"}
{"id":340,"first_name":"Agace","email":"askeats9f@nationalgeographic.com","job":"Web Designer III","timestamp":"2022-11-19T07:35:23Z"}
{"id":341,"first_name":"Maria","email":"maleksashin9g@tmall.com","job":"Information Systems Manager","timestamp":"2022-02-21T07:40:14Z"}
{"id":342,"first_name":"Coreen","email":"cchampley9h@economist.com","job":"Biostatistician I","timestamp":"2022-07-20T05:23:22Z"}
{"id":343,"first_name":"Ariel","email":"adolder9i@nytimes.com","job":"Automation Specialist II","timestamp":"2022-08-17T02:56:53Z"}
{"id":344,"first_name":"Mathilde","email":"mtheml9j@unesco.org","job":"Environmental Tech","timestamp":"2022-09-16T10:25:30Z"}
{"id":345,"first_name":"Thorndike","email":"twyd9k@nyu.edu","job":"Speech Pathologist","timestamp":"2022-05-14T09:10:54Z"}
{"id":346,"first_name":"Hilario","email":"hivanchenkov9l@spiegel.de","job":"Human Resources Assistant III","timestamp":"2022-07-26T00:37:05Z"}
{"id":347,"first_name":"Jessa","email":"jdavidek9m@youtu.be","job":"Technical Writer","timestamp":"2022-08-25T16:04:23Z"}
{"id":348,"first_name":"Taylor","email":"tzavattieri9n@nba.com","job":"Account Coordinator","timestamp":"2022-05-17T17:07:33Z"}
{"id":349,"first_name":"Tobiah","email":"tcescot9o@symantec.com","job":"VP Product Management","timestamp":"2022-09-01T21:53:33Z"}
{"id":350,"first_name":"Natalie","email":"nspinks9p@bbc.co.uk","job":"Cost Accountant","timestamp":"2022-03-27T07:20:50Z"}
{"id":351,"first_name":"Penny","email":"pjiggins9q@tinyurl.com","job":"Community Outreach Specialist","timestamp":"2022-08-15T12:37:50Z"}
{"id":352,"first_name":"Burnaby","email":"bbrookton9r@shareasale.com","job":"Biostatistician I","timestamp":"2022-06-28T12:28:50Z"}
{"id":353,"first_name":"Ted","email":"twalhedd9s@foxnews.com","job":"Research Associate","timestamp":"2022-01-22T21:56:51Z"}
{"id":354,"first_name":"Christie","email":"ccrangle9t@baidu.com","job":"Mechanical Systems Engineer","timestamp":"2022-09-08T07:07:25Z"}
{"id":355,"first_name":"Skipper","email":"sminett9u@cam.ac.uk","job":"Help Desk Operator","timestamp":"2022-05-05T20:18:23Z"}
{"id":356,"first_name":"Robbie","email":"rcloake9v@rediff.com","job":"Office Assistant I","timestamp":"2022-08-31T05:21:10Z"}
{"id":357,"first_name":"Winny","email":"wlooney9w@gmpg.org","job":"General Manager","timestamp":"2022-03-26T06:45:14Z"}
{"id":358,"first_name":"Meghan","email":"mguslon9x@ca.gov","job":"Health Coach III","timestamp":"2022-09-21T01:54:06Z"}
{"id":359,"first_name":"Ignatius","email":"igergolet9y@gmpg.org","job":"Research Assistant II","timestamp":"2022-08-12T03:08:44Z"}
{"id":360,"first_name":"Dalenna","email":"dkinig9z@seesaa.net","job":"Software Engineer II","timestamp":"2022-07-18T12:00:37Z"}
{"id":361,"first_name":"Tasha","email":"tredmirea0@typepad.com","job":"Business Systems Development Analyst","timestamp":"2022-10-08T04:47:15Z"}
{"id":362,"first_name":"Olenolin","email":"ofogartya1@sbwire.com","job":"Environmental Tech","timestamp":"2022-02-15T14:35:15Z"}
{"id":363,"first_name":"Toiboid","email":"tjanesa2@sfgate.com","job":"Cost Accountant","timestamp":"2022-07-10T21:41:01Z"}
{"id":364,"first_name":"Flem","email":"fjentona3@amazon.co.jp","job":"Desktop Support Technician","timestamp":"2022-01-26T00:20:34Z"}
{"id":365,"first_name":"Bab","email":"bvaleka4@nydailynews.com","job":"Clinical Specialist","timestamp":"2022-03-12T10:26:20Z"}
{"id":366,"first_name":"Juli","email":"jcuniama5@fotki.com","job":"Tax Accountant","timestamp":"2022-04-10T09:07:47Z"}
{"id":367,"first_name":"Anatollo","email":"ableakleya6@fda.gov","job":"Help Desk Operator","timestamp":"2021-12-13T05:04:59Z"}
{"id":368,"first_name":"Shina","email":"smeggisona7@europa.eu","job":"Research Nurse","timestamp":"2022-08-05T03:34:02Z"}
{"id":369,"first_name":"Malva","email":"mpeizera8@vimeo.com","job":"Design Engineer","timestamp":"2022-03-26T15:22:50Z"}
{"id":370,"first_name":"Filbert","email":"fdominya9@theguardian.com","job":"Marketing Assistant","timestamp":"2021-12-15T02:49:47Z"}
{"id":371,"first_name":"Dana","email":"dcasswellaa@studiopress.com","job":"Web Designer I","timestamp":"2022-10-22T09:24:45Z"}
{"id":372,"first_name":"Merle","email":"mpetersonab@sciencedirect.com","job":"Account Executive","timestamp":"2022-02-22T10:27:38Z"}
{"id":373,"first_name":"Allan","email":"abuntingac@dot.gov","job":"Data Coordiator","timestamp":"2022-08-03T08:18:11Z"}
{"id":374,"first_name":"Bram","email":"bverniad@chronoengine.com","job":"Community Outreach Specialist","timestamp":"2022-08-02T22:06:32Z"}
{"id":375,"first_name":"Leonelle","email":"lyvensae@dailymotion.com","job":"Graphic Designer","timestamp":"2022-04-16T02:55:02Z"}
{"id":376,"first_name":"Liane","email":"lrabbittaf@house.gov","job":"Project Manager","timestamp":"2022-08-06T19:07:53Z"}
{"id":377,"first_name":"Bartholemy","email":"bsemarkeag@slashdot.org","job":"Assistant Professor","timestamp":"2022-01-28T21:04:03Z"}
{"id":378,"first_name":"Lee","email":"ldocwraah@diigo.com","job":"Senior Editor","timestamp":"2022-02-27T02:10:23Z"}
{"id":379,"first_name":"Gorden","email":"gtalmadgeai@yolasite.com","job":"Graphic Designer","timestamp":"2022-03-30T03:03:19Z"}
{"id":380,"first_name":"Brody","email":"bmedgewickaj@soup.io","job":"Senior Cost Accountant","timestamp":"2022-09-29T19:39:00Z"}
{"id":381,"first_name":"Rebekah","email":"rgossageak@mapquest.com","job":"Software Test Engineer I","timestamp":"2022-04-22T17:40:15Z"}
{"id":382,"first_name":"Josselyn","email":"jmilneral@timesonline.co.uk","job":"Project Manager","timestamp":"2022-02-07T18:32:26Z"}
{"id":383,"first_name":"Padriac","email":"psmalecombeam@bandcamp.com","job":"Programmer Analyst I","timestamp":"2021-12-11T22:06:01Z"}
{"id":384,"first_name":"Flossy","email":"fwhitehornean@indiegogo.com","job":"Analyst Programmer","timestamp":"2022-09-09T15:01:19Z"}
{"id":385,"first_name":"Chantal","email":"cvaughanao@sciencedaily.com","job":"Financial Advisor","timestamp":"2022-01-23T20:15:13Z"}
{"id":386,"first_name":"Jacquette","email":"jlamballap@xinhuanet.com","job":"Community Outreach Specialist","timestamp":"2022-02-13T01:40:24Z"}
{"id":387,"first_name":"Jerrome","email":"jbruckmannaq@homestead.com","job":"Dental Hygienist","timestamp":"2022-05-29T18:49:31Z"}
{"id":388,"first_name":"Edik","email":"ecoughlanar@moonfruit.com","job":"Developer III","timestamp":"2022-12-05T11:10:08Z"}
{"id":389,"first_name":"Jonis","email":"jdallmannas@51.la","job":"VP Product Management","timestamp":"2022-11-17T01:01:20Z"}
{"id":390,"first_name":"Pryce","email":"pchaliceat@yellowbook.com","job":"Budget/Accounting Analyst II","timestamp":"2021-12-12T03:37:34Z"}
{"id":391,"first_name":"Katheryn","email":"kfleoteau@nps.gov","job":"Nuclear Power Engineer","timestamp":"2022-10-21T03:25:23Z"}
{"id":392,"first_name":"Bent","email":"bblacklerav@merriam-webster.com","job":"Paralegal","timestamp":"2022-01-17T10:38:38Z"}
{"id":393,"first_name":"Farly","email":"fcowingaw@youku.com","job":"Director of Sales","timestamp":"2022-06-12T00:06:35Z"}
{"id":394,"first_name":"Ninon","email":"nreinaax@chicagotribune.com","job":"Director of Sales","timestamp":"2022-04-02T17:18:46Z"}
{"id":395,"first_name":"Lyndsay","email":"lbrandtsay@cargocollective.com","job":"Assistant Media Planner","timestamp":"2022-03-22T12:47:37Z"}
{"id":396,"first_name":"Elaina","email":"emccloughlinaz@usda.gov","job":"Structural Engineer","timestamp":"2022-09-14T12:34:04Z"}
{"id":397,"first_name":"Hillery","email":"hgilhoolyb0@alexa.com","job":"Physical Therapy Assistant","timestamp":"2022-03-23T21:50:41Z"}
{"id":398,"first_name":"Garth","email":"gabbotsb1@wordpress.com","job":"Account Executive","timestamp":"2022-09-28T23:38:07Z"}
{"id":399,"first_name":"Sinclair","email":"sboyerb2@usda.gov","job":"Developer II","timestamp":"2022-08-08T21:24:47Z"}
{"id":400,"first_name":"Jody","email":"jgetshamb3@vinaora.com","job":"Software Test Engineer I","timestamp":"2022-03-17T14:23:39Z"}
{"id":401,"first_name":"Melamie","email":"mmatulab4@amazonaws.com","job":"Dental Hygienist","timestamp":"2021-12-14T08:21:43Z"}
{"id":402,"first_name":"Adina","email":"aapedaileb5@paginegialle.it","job":"Environmental Tech","timestamp":"2022-09-12T14:59:41Z"}
{"id":403,"first_name":"Carmencita","email":"cnolanb6@shareasale.com","job":"Teacher","timestamp":"2021-12-17T03:12:30Z"}
{"id":404,"first_name":"Marion","email":"mmcfetridgeb7@csmonitor.com","job":"Recruiter","timestamp":"2022-11-21T06:37:22Z"}
{"id":405,"first_name":"Kelley","email":"kcouchb8@smugmug.com","job":"VP Marketing","timestamp":"2022-07-19T15:59:16Z"}
{"id":406,"first_name":"Aluino","email":"adeeryb9@jigsy.com","job":"Junior Executive","timestamp":"2022-01-02T14:05:55Z"}
{"id":407,"first_name":"Chantal","email":"cvannsba@ehow.com","job":"Assistant Media Planner","timestamp":"2022-11-22T10:16:54Z"}
{"id":408,"first_name":"Neville","email":"nlacasebb@vistaprint.com","job":"Legal Assistant","timestamp":"2022-06-07T04:19:30Z"}
{"id":409,"first_name":"Babette","email":"blandebc@is.gd","job":"Help Desk Operator","timestamp":"2022-06-30T17:27:16Z"}
{"id":410,"first_name":"Zarah","email":"zcasellabd@github.io","job":"Social Worker","timestamp":"2022-04-11T01:56:29Z"}
{"id":411,"first_name":"Hendrick","email":"hlawrencebe@rediff.com","job":"GIS Technical Architect","timestamp":"2022-05-18T23:39:22Z"}
{"id":412,"first_name":"Miles","email":"mtollbf@so-net.ne.jp","job":"Staff Accountant III","timestamp":"2022-10-07T11:26:47Z"}
{"id":413,"first_name":"Antonino","email":"aiskowbg@umn.edu","job":"Internal Auditor","timestamp":"2022-05-28T14:03:33Z"}
{"id":414,"first_name":"Mehetabel","email":"mjiroudekbh@wikispaces.com","job":"Senior Quality Engineer","timestamp":"2021-12-08T12:30:46Z"}
{"id":415,"first_name":"Babb","email":"bkembrybi@cocolog-nifty.com","job":"Mechanical Systems Engineer","timestamp":"2022-10-12T06:41:10Z"}
{"id":416,"first_name":"Theresina","email":"tcastagnebj@spiegel.de","job":"Help Desk Operator","timestamp":"2022-01-03T13:36:12Z"}
{"id":417,"first_name":"Aaron","email":"afazakerleybk@webeden.co.uk","job":"Payment Adjustment Coordinator","timestamp":"2022-10-03T06:22:19Z"}
{"id":418,"first_name":"Bartie","email":"bkettlestringesbl@pcworld.com","job":"Budget/Accounting Analyst II","timestamp":"2022-04-14T04:23:27Z"}
{"id":419,"first_name":"Amelie","email":"abesantiebm@bloglines.com","job":"Social Worker","timestamp":"2022-10-17T08:14:30Z"}
{"id":420,"first_name":"Harrison","email":"hrollesbn@twitter.com","job":"Graphic Designer","timestamp":"2022-05-18T06:25:09Z"}
{"id":421,"first_name":"Siward","email":"smarquisbo@nydailynews.com","job":"Librarian","timestamp":"2022-02-01T11:52:44Z"}
{"id":422,"first_name":"Millard","email":"misonbp@issuu.com","job":"Health Coach I","timestamp":"2022-08-24T03:53:59Z"}
{"id":423,"first_name":"Daniella","email":"dfaransbq@mysql.com","job":"Sales Representative","timestamp":"2022-08-10T13:25:10Z"}
{"id":424,"first_name":"Raimund","email":"rsteptoebr@wordpress.com","job":"Analyst Programmer","timestamp":"2022-06-07T16:45:17Z"}
{"id":425,"first_name":"Ingmar","email":"ifeldmanbs@1und1.de","job":"Computer Systems Analyst II","timestamp":"2022-01-05T14:01:15Z"}
{"id":426,"first_name":"Zack","email":"zbarnwellbt@msu.edu","job":"Staff Accountant IV","timestamp":"2022-06-28T17:14:21Z"}
{"id":427,"first_name":"Mozelle","email":"mstuchburybu@kickstarter.com","job":"Geologist IV","timestamp":"2022-07-13T19:58:35Z"}
{"id":428,"first_name":"Wallie","email":"wflurybv@hc360.com","job":"Environmental Tech","timestamp":"2022-03-24T07:28:36Z"}
{"id":429,"first_name":"Annis","email":"abenettolobw@cpanel.net","job":"Recruiter","timestamp":"2022-01-26T05:18:04Z"}
{"id":430,"first_name":"Martainn","email":"mbeedenbx@wikipedia.org","job":"Geologist I","timestamp":"2022-03-28T12:59:52Z"}
{"id":431,"first_name":"Ara","email":"akeachby@ebay.co.uk","job":"Product Engineer","timestamp":"2022-03-24T19:33:33Z"}
{"id":432,"first_name":"Sully","email":"sbomanbz@scientificamerican.com","job":"Accounting Assistant III","timestamp":"2022-04-20T00:28:36Z"}
{"id":433,"first_name":"Alley","email":"aboeckec0@youtube.com","job":"Social Worker","timestamp":"2022-12-06T11:01:24Z"}
{"id":434,"first_name":"Ignace","email":"ibullonc1@engadget.com","job":"Geological Engineer","timestamp":"2022-07-16T19:26:35Z"}
{"id":435,"first_name":"Gretta","email":"gpavelinc2@cbslocal.com","job":"Design Engineer","timestamp":"2022-01-13T19:58:02Z"}
{"id":436,"first_name":"Godiva","email":"gnarramorec3@barnesandnoble.com","job":"Sales Associate","timestamp":"2021-12-29T16:34:57Z"}
{"id":437,"first_name":"Erskine","email":"ebillingc4@ning.com","job":"Account Representative III","timestamp":"2022-10-09T12:03:38Z"}
{"id":438,"first_name":"Otha","email":"omcdowallc5@hugedomains.com","job":"Speech Pathologist","timestamp":"2022-10-25T06:57:20Z"}
{"id":439,"first_name":"Annabal","email":"ajerrardc6@ca.gov","job":"Research Nurse","timestamp":"2022-02-28T20:54:44Z"}
{"id":440,"first_name":"Helenka","email":"hwillougheyc7@51.la","job":"Teacher","timestamp":"2022-11-27T13:25:13Z"}
{"id":441,"first_name":"Frederic","email":"flaversc8@ox.ac.uk","job":"Chief Design Engineer","timestamp":"2022-10-22T08:43:20Z"}
{"id":442,"first_name":"Shel","email":"sjeffcoatec9@e-recht24.de","job":"Senior Cost Accountant","timestamp":"2022-10-18T22:44:57Z"}
{"id":443,"first_name":"Gisele","email":"gplenderleithca@hibu.com","job":"Environmental Tech","timestamp":"2022-11-15T06:20:33Z"}
{"id":444,"first_name":"Devland","email":"dthamescb@ebay.co.uk","job":"Data Coordiator","timestamp":"2022-09-08T21:56:53Z"}
{"id":445,"first_name":"Leonardo","email":"lbalazotcc@seesaa.net","job":"Information Systems Manager","timestamp":"2022-09-10T05:34:02Z"}
{"id":446,"first_name":"Evanne","email":"epeyntuecd@smh.com.au","job":"Developer IV","timestamp":"2022-06-21T05:01:58Z"}
{"id":447,"first_name":"Bran","email":"beastmeadce@dot.gov","job":"Assistant Media Planner","timestamp":"2022-05-06T08:08:38Z"}
{"id":448,"first_name":"Edmon","email":"egoldbourncf@digg.com","job":"Account Representative III","timestamp":"2022-04-30T09:53:46Z"}
{"id":449,"first_name":"Dud","email":"dmoscropcg@hexun.com","job":"Payment Adjustment Coordinator","timestamp":"2022-10-20T22:52:50Z"}
{"id":450,"first_name":"Emilia","email":"ethorroldch@multiply.com","job":"Product Engineer","timestamp":"2022-04-28T08:39:13Z"}
{"id":451,"first_name":"Jinny","email":"jrosenwasserci@yelp.com","job":"Director of Sales","timestamp":"2022-08-04T03:14:57Z"}
{"id":452,"first_name":"Kerry","email":"kfaltincj@techcrunch.com","job":"Associate Professor","timestamp":"2022-03-18T15:12:10Z"}
{"id":453,"first_name":"Moore","email":"mclellck@amazon.de","job":"Research Assistant I","timestamp":"2022-11-15T22:30:36Z"}
{"id":454,"first_name":"Aida","email":"acrandoncl@nationalgeographic.com","job":"Developer IV","timestamp":"2022-07-17T20:29:10Z"}
{"id":455,"first_name":"Appolonia","email":"abragancacm@elegantthemes.com","job":"Internal Auditor","timestamp":"2022-11-28T09:14:18Z"}
{"id":456,"first_name":"Alberik","email":"afountiancn@github.com","job":"Financial Advisor","timestamp":"2022-02-07T14:48:02Z"}
{"id":457,"first_name":"Dew","email":"dimpettco@unesco.org","job":"Research Nurse","timestamp":"2022-03-11T09:31:20Z"}
{"id":458,"first_name":"Abner","email":"amacdougalcp@example.com","job":"Physical Therapy Assistant","timestamp":"2022-07-17T03:37:51Z"}
{"id":459,"first_name":"Riordan","email":"rgeecq@ustream.tv","job":"Chemical Engineer","timestamp":"2022-07-15T08:22:35Z"}
{"id":460,"first_name":"Lutero","email":"lembletoncr@de.vu","job":"Information Systems Manager","timestamp":"2022-06-11T06:31:58Z"}
{"id":461,"first_name":"Maia","email":"mdelaceycs@google.es","job":"VP Product Management","timestamp":"2022-01-18T03:03:17Z"}
{"id":462,"first_name":"Milka","email":"mquenellct@reuters.com","job":"VP Quality Control","timestamp":"2022-09-05T04:42:07Z"}
{"id":463,"first_name":"Shannen","email":"smcevoycu@surveymonkey.com","job":"Assistant Media Planner","timestamp":"2022-11-01T00:56:44Z"}
{"id":464,"first_name":"Ruby","email":"rkantercv@twitter.com","job":"Nuclear Power Engineer","timestamp":"2022-07-21T07:23:51Z"}
{"id":465,"first_name":"Ewan","email":"eshellumcw@apple.com","job":"Paralegal","timestamp":"2022-01-26T17:12:30Z"}
{"id":466,"first_name":"Randie","email":"rkiernancx@freewebs.com","job":"Software Test Engineer III","timestamp":"2022-04-06T07:32:00Z"}
{"id":467,"first_name":"Gwendolyn","email":"gtattoocy@miitbeian.gov.cn","job":"Administrative Assistant IV","timestamp":"2022-04-13T22:40:15Z"}
{"id":468,"first_name":"Pierson","email":"phussycz@java.com","job":"GIS Technical Architect","timestamp":"2021-12-16T03:01:44Z"}
{"id":469,"first_name":"Clare","email":"cgrinikhinovd0@blogspot.com","job":"Office Assistant I","timestamp":"2022-01-22T12:28:11Z"}
{"id":470,"first_name":"Lucie","email":"lkillbyd1@e-recht24.de","job":"Technical Writer","timestamp":"2022-05-03T06:52:32Z"}
{"id":471,"first_name":"Wynn","email":"warndtd2@ucoz.ru","job":"Structural Analysis Engineer","timestamp":"2022-11-30T03:02:47Z"}
{"id":472,"first_name":"Homerus","email":"hclemitsd3@japanpost.jp","job":"Research Associate","timestamp":"2022-08-19T04:53:40Z"}
{"id":473,"first_name":"Trefor","email":"tmulberyd4@wordpress.com","job":"Accounting Assistant III","timestamp":"2021-12-10T12:00:52Z"}
{"id":474,"first_name":"Adan","email":"aattridged5@hc360.com","job":"Administrative Assistant I","timestamp":"2022-03-25T14:25:46Z"}
{"id":475,"first_name":"Gal","email":"gfourcaded6@washington.edu","job":"Junior Executive","timestamp":"2022-01-21T23:49:44Z"}
{"id":476,"first_name":"Jasun","email":"jchaveyd7@myspace.com","job":"Paralegal","timestamp":"2022-06-20T22:15:39Z"}
{"id":477,"first_name":"Lanita","email":"lpithied8@home.pl","job":"Mechanical Systems Engineer","timestamp":"2022-01-18T21:49:32Z"}
{"id":478,"first_name":"Blancha","email":"bcarswelld9@cnbc.com","job":"VP Marketing","timestamp":"2022-02-26T13:05:07Z"}
{"id":479,"first_name":"Stormie","email":"splimmerda@earthlink.net","job":"Programmer Analyst III","timestamp":"2022-02-14T19:55:10Z"}
{"id":480,"first_name":"Jan","email":"jlinklaterdb@ocn.ne.jp","job":"Occupational Therapist","timestamp":"2022-12-06T21:55:37Z"}
{"id":481,"first_name":"Aggy","email":"atargetterdc@amazon.com","job":"Nurse","timestamp":"2022-09-07T03:22:50Z"}
{"id":482,"first_name":"Alfy","email":"abernotdd@newsvine.com","job":"Structural Analysis Engineer","timestamp":"2022-05-18T01:35:03Z"}
{"id":483,"first_name":"Orelee","email":"oferrandde@tumblr.com","job":"Recruiting Manager","timestamp":"2022-08-23T22:05:49Z"}
{"id":484,"first_name":"Jeana","email":"jkhristyukhindf@purevolume.com","job":"Nurse","timestamp":"2022-10-09T17:35:26Z"}
{"id":485,"first_name":"Carline","email":"cllewelyndg@wikipedia.org","job":"Clinical Specialist","timestamp":"2022-08-05T01:00:13Z"}
{"id":486,"first_name":"Etta","email":"educhandh@oaic.gov.au","job":"Administrative Officer","timestamp":"2022-10-09T11:36:54Z"}
{"id":487,"first_name":"Alphonso","email":"astockoedi@last.fm","job":"Marketing Manager","timestamp":"2022-08-01T13:27:06Z"}
{"id":488,"first_name":"Hunfredo","email":"hrheltondj@163.com","job":"Clinical Specialist","timestamp":"2022-01-17T01:23:28Z"}
{"id":489,"first_name":"Cob","email":"cellingforddk@princeton.edu","job":"Health Coach I","timestamp":"2022-05-27T15:03:10Z"}
{"id":490,"first_name":"Catlee","email":"calennikovdl@so-net.ne.jp","job":"Help Desk Technician","timestamp":"2022-07-14T16:37:24Z"}
{"id":491,"first_name":"Renato","email":"rsauntondm@google.ru","job":"VP Product Management","timestamp":"2022-04-10T15:32:28Z"}
{"id":492,"first_name":"Theodor","email":"tbatissedn@dropbox.com","job":"Automation Specialist III","timestamp":"2022-02-08T14:25:15Z"}
{"id":493,"first_name":"Freedman","email":"fantonopoulosdo@vk.com","job":"Human Resources Assistant IV","timestamp":"2022-09-26T10:35:50Z"}
{"id":494,"first_name":"Hendrick","email":"hhazelgreavedp@wikispaces.com","job":"Technical Writer","timestamp":"2022-06-07T00:51:55Z"}
{"id":495,"first_name":"Rosella","email":"rweatheydq@oaic.gov.au","job":"Automation Specialist III","timestamp":"2022-08-30T15:14:52Z"}
{"id":496,"first_name":"Bradly","email":"bkylesdr@pinterest.com","job":"VP Accounting","timestamp":"2021-12-13T16:34:39Z"}
{"id":497,"first_name":"Nannette","email":"nsileyds@va.gov","job":"Research Associate","timestamp":"2022-02-02T08:57:22Z"}
{"id":498,"first_name":"Virgilio","email":"vgarforthdt@exblog.jp","job":"Nurse","timestamp":"2022-08-24T12:03:17Z"}
{"id":499,"first_name":"Talyah","email":"tverrechiadu@seesaa.net","job":"Junior Executive","timestamp":"2022-11-28T03:41:52Z"}
{"id":500,"first_name":"Melisent","email":"mwhooleydv@rakuten.co.jp","job":"Project Manager","timestamp":"2022-02-08T06:19:33Z"}
{"id":501,"first_name":"Langston","email":"lingerfielddw@jugem.jp","job":"Media Manager II","timestamp":"2022-01-31T18:38:45Z"}
{"id":502,"first_name":"Chase","email":"clangdx@clickbank.net","job":"Engineer IV","timestamp":"2022-03-10T07:05:47Z"}
{"id":503,"first_name":"Tobiah","email":"tmughaldy@domainmarket.com","job":"Structural Analysis Engineer","timestamp":"2022-07-06T18:49:01Z"}
{"id":504,"first_name":"Laird","email":"lsalladz@vistaprint.com","job":"Pharmacist","timestamp":"2022-11-19T14:59:08Z"}
{"id":505,"first_name":"Rozamond","email":"rwalerane0@soup.io","job":"Developer I","timestamp":"2022-06-15T04:38:16Z"}
{"id":506,"first_name":"Eugine","email":"emaccartane1@dedecms.com","job":"Assistant Manager","timestamp":"2022-03-12T12:49:39Z"}
{"id":507,"first_name":"Norrie","email":"nfeasleye2@networkadvertising.org","job":"Human Resources Assistant III","timestamp":"2022-07-12T04:43:23Z"}
{"id":508,"first_name":"Lanny","email":"lsnape3@discuz.net","job":"Compensation Analyst","timestamp":"2022-11-11T15:50:09Z"}
{"id":509,"first_name":"Othilia","email":"ochaneye4@tmall.com","job":"Media Manager I","timestamp":"2022-11-16T12:51:48Z"}
{"id":510,"first_name":"Rosette","email":"rbauckhame5@de.vu","job":"Office Assistant IV","timestamp":"2021-12-19T06:17:48Z"}
{"id":511,"first_name":"Shepperd","email":"sburehille6@ed.gov","job":"Media Manager I","timestamp":"2022-05-22T21:52:36Z"}
{"id":512,"first_name":"Leese","email":"lparagreene7@mashable.com","job":"Senior Developer","timestamp":"2022-05-09T16:08:14Z"}
{"id":513,"first_name":"Nina","email":"njiroutkae8@fema.gov","job":"Information Systems Manager","timestamp":"2022-10-20T10:17:19Z"}
{"id":514,"first_name":"Dianne","email":"dshrubshalle9@so-net.ne.jp","job":"Recruiter","timestamp":"2022-10-29T06:12:38Z"}
{"id":515,"first_name":"Melissa","email":"mcourtierea@eepurl.com","job":"Professor","timestamp":"2022-11-04T13:37:54Z"}
{"id":516,"first_name":"Fairlie","email":"fbargeryeb@seesaa.net","job":"Physical Therapy Assistant","timestamp":"2022-06-08T14:28:16Z"}
{"id":517,"first_name":"Lonnie","email":"lclaigeec@over-blog.com","job":"Sales Associate","timestamp":"2022-10-29T19:10:59Z"}
{"id":518,"first_name":"Rik","email":"rtedmaned@ask.com","job":"Design Engineer","timestamp":"2022-02-11T01:58:13Z"}
{"id":519,"first_name":"Frankie","email":"fgreenrodee@theguardian.com","job":"Research Assistant III","timestamp":"2022-02-14T18:52:01Z"}
{"id":520,"first_name":"Gib","email":"gdurranef@state.tx.us","job":"Accounting Assistant III","timestamp":"2022-07-08T08:39:29Z"}
{"id":521,"first_name":"Philippa","email":"pchattoeg@opensource.org","job":"General Manager","timestamp":"2022-11-25T11:36:17Z"}
{"id":522,"first_name":"Eugenio","email":"eblundoneh@shinystat.com","job":"Programmer II","timestamp":"2022-09-21T15:58:17Z"}
{"id":523,"first_name":"Rona","email":"rhowsanei@newyorker.com","job":"Recruiting Manager","timestamp":"2022-11-15T19:29:13Z"}
{"id":524,"first_name":"Elise","email":"ealgoreej@hao123.com","job":"Professor","timestamp":"2022-10-11T12:57:44Z"}
{"id":525,"first_name":"Ertha","email":"ewoofek@princeton.edu","job":"Analyst Programmer","timestamp":"2022-06-02T07:23:49Z"}
{"id":526,"first_name":"Marietta","email":"mlawrieel@jalbum.net","job":"Human Resources Manager","timestamp":"2022-09-09T15:08:59Z"}
{"id":527,"first_name":"Meryl","email":"mzupoem@github.io","job":"Associate Professor","timestamp":"2022-05-26T05:33:16Z"}
{"id":528,"first_name":"Jehanna","email":"jastburyen@hp.com","job":"Director of Sales","timestamp":"2022-07-10T23:08:44Z"}
{"id":529,"first_name":"Rock","email":"rsnowdoneo@mashable.com","job":"Research Associate","timestamp":"2022-09-10T07:52:36Z"}
{"id":530,"first_name":"Genovera","email":"gdemichettiep@weather.com","job":"Account Coordinator","timestamp":"2022-11-07T19:52:34Z"}
{"id":531,"first_name":"Merlina","email":"mwillinghameq@blog.com","job":"Marketing Assistant","timestamp":"2022-09-26T16:53:26Z"}
{"id":532,"first_name":"Susan","email":"shundeller@flickr.com","job":"Staff Scientist","timestamp":"2022-02-28T07:56:11Z"}
{"id":533,"first_name":"Dannye","email":"dsheivelses@plala.or.jp","job":"VP Accounting","timestamp":"2021-12-15T21:11:19Z"}
{"id":534,"first_name":"Jenn","email":"jellumet@buzzfeed.com","job":"Desktop Support Technician","timestamp":"2022-05-21T04:32:34Z"}
{"id":535,"first_name":"Giana","email":"gfulfordeu@imdb.com","job":"Marketing Manager","timestamp":"2022-07-21T04:57:09Z"}
{"id":536,"first_name":"Jere","email":"jcavnorev@cisco.com","job":"Help Desk Operator","timestamp":"2022-07-08T14:36:50Z"}
{"id":537,"first_name":"Emiline","email":"ekoschkeew@bbb.org","job":"Analog Circuit Design manager","timestamp":"2022-08-12T06:30:27Z"}
{"id":538,"first_name":"Gaylene","email":"gdinnegesex@dagondesign.com","job":"Clinical Specialist","timestamp":"2022-06-10T16:56:18Z"}
{"id":539,"first_name":"Oberon","email":"obougeney@devhub.com","job":"Senior Sales Associate","timestamp":"2022-10-02T23:50:51Z"}
{"id":540,"first_name":"Stephine","email":"seusticeez@boston.com","job":"Programmer III","timestamp":"2022-04-24T01:38:58Z"}
{"id":541,"first_name":"Lulita","email":"lmunbyf0@redcross.org","job":"Librarian","timestamp":"2022-07-19T05:43:05Z"}
{"id":542,"first_name":"Lemmie","email":"lmcphelimeyf1@unc.edu","job":"Media Manager II","timestamp":"2022-09-22T21:24:25Z"}
{"id":543,"first_name":"Kimbra","email":"kbarthroppf2@illinois.edu","job":"Operator","timestamp":"2022-07-01T19:30:08Z"}
{"id":544,"first_name":"Clerkclaude","email":"ccrasswellerf3@yandex.ru","job":"Health Coach I","timestamp":"2022-06-17T21:08:02Z"}
{"id":545,"first_name":"Lucilia","email":"lraratyf4@shop-pro.jp","job":"Programmer Analyst III","timestamp":"2022-03-01T05:56:13Z"}
{"id":546,"first_name":"Karla","email":"ksabbinsf5@phoca.cz","job":"General Manager","timestamp":"2022-10-10T04:07:44Z"}
{"id":547,"first_name":"Angelica","email":"acuninghamf6@hibu.com","job":"Computer Systems Analyst III","timestamp":"2022-09-17T05:20:49Z"}
{"id":548,"first_name":"Verine","email":"vpriverf7@constantcontact.com","job":"Automation Specialist III","timestamp":"2022-11-02T21:38:47Z"}
{"id":549,"first_name":"Meridel","email":"malesof8@g.co","job":"Analyst Programmer","timestamp":"2022-09-28T22:57:26Z"}
{"id":550,"first_name":"Giulietta","email":"gconeybearef9@bluehost.com","job":"Information Systems Manager","timestamp":"2022-04-01T17:06:32Z"}
{"id":551,"first_name":"Bartlet","email":"bvisefa@nih.gov","job":"Computer Systems Analyst III","timestamp":"2022-03-26T23:42:57Z"}
{"id":552,"first_name":"Coriss","email":"clorrymanfb@posterous.com","job":"Account Representative III","timestamp":"2021-12-31T22:46:51Z"}
{"id":553,"first_name":"Eran","email":"ecellifc@pinterest.com","job":"Quality Control Specialist","timestamp":"2022-07-30T08:12:57Z"}
{"id":554,"first_name":"Zacharia","email":"zvillaronfd@godaddy.com","job":"Systems Administrator III","timestamp":"2022-01-23T08:52:15Z"}
{"id":555,"first_name":"Nico","email":"nbirdwistlefe@noaa.gov","job":"Nurse Practicioner","timestamp":"2022-01-07T13:13:02Z"}
{"id":556,"first_name":"Yardley","email":"ygiannasiff@addthis.com","job":"Registered Nurse","timestamp":"2022-08-14T09:08:06Z"}
{"id":557,"first_name":"Nina","email":"nfeirnfg@icq.com","job":"Librarian","timestamp":"2022-08-30T00:25:37Z"}
{"id":558,"first_name":"Kenna","email":"krichinfh@ucoz.ru","job":"Mechanical Systems Engineer","timestamp":"2021-12-27T08:39:15Z"}
{"id":559,"first_name":"Murray","email":"masplenfi@soup.io","job":"Chief Design Engineer","timestamp":"2022-06-06T21:51:39Z"}
{"id":560,"first_name":"Maribeth","email":"mbroschkefj@drupal.org","job":"Assistant Media Planner","timestamp":"2022-04-22T14:35:45Z"}
{"id":561,"first_name":"Shae","email":"sstorerfk@berkeley.edu","job":"Community Outreach Specialist","timestamp":"2022-07-29T13:17:56Z"}
{"id":562,"first_name":"Edik","email":"esawreyfl@marketwatch.com","job":"Speech Pathologist","timestamp":"2021-12-19T16:35:17Z"}
{"id":563,"first_name":"Annabela","email":"acowenfm@home.pl","job":"Speech Pathologist","timestamp":"2022-03-31T12:06:02Z"}
{"id":564,"first_name":"Barr","email":"bgilmartinfn@walmart.com","job":"Biostatistician IV","timestamp":"2022-10-03T01:25:41Z"}
{"id":565,"first_name":"Marten","email":"mbothiefo@ameblo.jp","job":"Mechanical Systems Engineer","timestamp":"2022-04-02T20:32:33Z"}
{"id":566,"first_name":"Merle","email":"mmahoodfp@de.vu","job":"VP Sales","timestamp":"2022-03-20T01:29:18Z"}
{"id":567,"first_name":"Vere","email":"vlapthornefq@uiuc.edu","job":"Media Manager III","timestamp":"2021-12-11T03:57:21Z"}
{"id":568,"first_name":"Falkner","email":"fbrucksteinfr@mozilla.com","job":"Account Representative III","timestamp":"2022-03-11T12:52:49Z"}
{"id":569,"first_name":"Cullie","email":"cswallowfs@de.vu","job":"Paralegal","timestamp":"2022-02-01T10:37:02Z"}
{"id":570,"first_name":"Vaclav","email":"vtrowlft@stanford.edu","job":"Software Consultant","timestamp":"2022-04-07T18:15:57Z"}
{"id":571,"first_name":"Joanne","email":"jmaccomiskeyfu@discovery.com","job":"Analyst Programmer","timestamp":"2022-08-10T15:01:00Z"}
{"id":572,"first_name":"Britt","email":"bnairefv@utexas.edu","job":"Geological Engineer","timestamp":"2022-06-26T09:45:46Z"}
{"id":573,"first_name":"Bunnie","email":"bdafyddfw@tinyurl.com","job":"Programmer I","timestamp":"2022-04-10T01:54:26Z"}
{"id":574,"first_name":"Janean","email":"jpinkardfx@jimdo.com","job":"Senior Sales Associate","timestamp":"2022-11-22T06:59:53Z"}
{"id":575,"first_name":"Abbey","email":"aagnewfy@independent.co.uk","job":"Desktop Support Technician","timestamp":"2022-03-06T08:48:48Z"}
{"id":576,"first_name":"Aleen","email":"atripeanfz@reuters.com","job":"Office Assistant IV","timestamp":"2022-05-16T06:52:18Z"}
{"id":577,"first_name":"Crissie","email":"ctiversg0@sakura.ne.jp","job":"Office Assistant III","timestamp":"2022-07-08T04:07:16Z"}
{"id":578,"first_name":"Audra","email":"alisciandrig1@acquirethisname.com","job":"Professor","timestamp":"2022-07-19T23:58:30Z"}
{"id":579,"first_name":"Jasmina","email":"jgillowg2@mozilla.org","job":"Marketing Manager","timestamp":"2022-02-21T10:07:20Z"}
{"id":580,"first_name":"Wendi","email":"wtolandg3@deliciousdays.com","job":"Administrative Assistant I","timestamp":"2022-09-26T02:02:11Z"}
{"id":581,"first_name":"Marilee","email":"mlejeang4@noaa.gov","job":"Sales Associate","timestamp":"2022-07-08T14:40:55Z"}
{"id":582,"first_name":"Rochelle","email":"rrubinlichtg5@topsy.com","job":"Quality Engineer","timestamp":"2022-01-25T04:10:30Z"}
{"id":583,"first_name":"Carolann","email":"ctremonteg6@mtv.com","job":"Structural Analysis Engineer","timestamp":"2021-12-22T06:05:34Z"}
{"id":584,"first_name":"Marika","email":"mzumfeldeg7@hhs.gov","job":"Engineer II","timestamp":"2022-08-22T07:44:12Z"}
{"id":585,"first_name":"Claiborn","email":"crasherg8@bbc.co.uk","job":"Computer Systems Analyst II","timestamp":"2022-09-22T17:51:53Z"}
{"id":586,"first_name":"Nonie","email":"nitzcovichg9@npr.org","job":"Computer Systems Analyst IV","timestamp":"2022-11-02T11:37:11Z"}
{"id":587,"first_name":"Ddene","email":"dkeighlyga@alexa.com","job":"Human Resources Assistant II","timestamp":"2021-12-11T03:50:29Z"}
{"id":588,"first_name":"Arlyn","email":"amaystongb@timesonline.co.uk","job":"Librarian","timestamp":"2022-11-14T19:00:02Z"}
{"id":589,"first_name":"Aaron","email":"agallymoregc@taobao.com","job":"Associate Professor","timestamp":"2022-11-06T06:54:00Z"}
{"id":590,"first_name":"Jermaine","email":"jdelwatergd@phoca.cz","job":"Sales Associate","timestamp":"2022-04-02T22:52:38Z"}
{"id":591,"first_name":"Robinetta","email":"rmilingtonge@bizjournals.com","job":"Human Resources Assistant III","timestamp":"2021-12-08T04:09:29Z"}
{"id":592,"first_name":"Hedi","email":"htapsellgf@miibeian.gov.cn","job":"Sales Representative","timestamp":"2022-01-24T20:10:52Z"}
{"id":593,"first_name":"Cookie","email":"ckmieciakgg@aol.com","job":"Account Representative IV","timestamp":"2022-01-06T02:34:26Z"}
{"id":594,"first_name":"Othilie","email":"obredeegh@unblog.fr","job":"Teacher","timestamp":"2022-03-22T04:28:22Z"}
{"id":595,"first_name":"Temp","email":"tbenfordgi@disqus.com","job":"Quality Engineer","timestamp":"2022-08-04T07:54:26Z"}
{"id":596,"first_name":"Noreen","email":"nhawgj@timesonline.co.uk","job":"Desktop Support Technician","timestamp":"2022-08-16T02:03:26Z"}
{"id":597,"first_name":"Gaylene","email":"gdurbingk@myspace.com","job":"Senior Sales Associate","timestamp":"2022-01-05T01:43:57Z"}
{"id":598,"first_name":"Katha","email":"kbaumbergl@whitehouse.gov","job":"Accounting Assistant IV","timestamp":"2022-09-19T07:13:54Z"}
{"id":599,"first_name":"Sisile","email":"sgregangm@sbwire.com","job":"Librarian","timestamp":"2022-02-15T23:30:09Z"}
{"id":600,"first_name":"Flynn","email":"feyckelberggn@prnewswire.com","job":"General Manager","timestamp":"2022-02-15T10:12:52Z"}
{"id":601,"first_name":"Erda","email":"elattingo@people.com.cn","job":"Chief Design Engineer","timestamp":"2022-04-25T00:18:55Z"}
{"id":602,"first_name":"Annabelle","email":"amulchronegp@diigo.com","job":"Sales Associate","timestamp":"2022-07-27T02:47:06Z"}
{"id":603,"first_name":"Etienne","email":"ealmeidagq@ocn.ne.jp","job":"VP Marketing","timestamp":"2022-01-01T19:43:33Z"}
{"id":604,"first_name":"Kerrie","email":"kproudmangr@tumblr.com","job":"Payment Adjustment Coordinator","timestamp":"2021-12-18T07:32:44Z"}
{"id":605,"first_name":"Tilda","email":"tlandsmangs@angelfire.com","job":"General Manager","timestamp":"2022-01-27T10:53:51Z"}
{"id":606,"first_name":"Arabella","email":"arobinsgt@prnewswire.com","job":"Account Representative III","timestamp":"2022-02-16T16:13:51Z"}
{"id":607,"first_name":"Alaster","email":"arosewellgu@tuttocitta.it","job":"Nuclear Power Engineer","timestamp":"2022-05-10T00:05:46Z"}
{"id":608,"first_name":"Devin","email":"dbannergv@parallels.com","job":"Human Resources Assistant III","timestamp":"2022-08-09T19:53:47Z"}
{"id":609,"first_name":"Nonah","email":"nhallfordgw@bloglines.com","job":"Director of Sales","timestamp":"2022-09-02T16:04:31Z"}
{"id":610,"first_name":"Alberik","email":"amceacherngx@fda.gov","job":"Structural Engineer","timestamp":"2021-12-12T13:48:05Z"}
{"id":611,"first_name":"Chadd","email":"caarongy@alibaba.com","job":"Developer III","timestamp":"2022-08-31T00:09:29Z"}
{"id":612,"first_name":"Jammal","email":"jdavydochkingz@flavors.me","job":"Sales Associate","timestamp":"2022-10-04T14:58:25Z"}
{"id":613,"first_name":"Bridie","email":"bdebeauchamph0@dailymail.co.uk","job":"Marketing Manager","timestamp":"2022-07-04T01:26:31Z"}
{"id":614,"first_name":"Nona","email":"nobeneyh1@theguardian.com","job":"Office Assistant III","timestamp":"2021-12-31T06:38:53Z"}
{"id":615,"first_name":"Mia","email":"mswannellh2@blog.com","job":"Senior Quality Engineer","timestamp":"2022-05-07T10:17:45Z"}
{"id":616,"first_name":"Salem","email":"stissingtonh3@gmpg.org","job":"Assistant Media Planner","timestamp":"2022-08-21T23:43:20Z"}
{"id":617,"first_name":"Harli","email":"hlanegranh4@trellian.com","job":"Geological Engineer","timestamp":"2022-08-25T16:34:25Z"}
{"id":618,"first_name":"Corliss","email":"ceuelsh5@ed.gov","job":"Help Desk Technician","timestamp":"2022-11-18T03:47:20Z"}
{"id":619,"first_name":"Clemens","email":"cphebeeh6@constantcontact.com","job":"Librarian","timestamp":"2022-10-08T08:47:23Z"}
{"id":620,"first_name":"Maren","email":"mscarreh7@aol.com","job":"Account Executive","timestamp":"2022-07-22T15:02:12Z"}
{"id":621,"first_name":"Cad","email":"cdivinyh8@cbc.ca","job":"Assistant Manager","timestamp":"2021-12-15T05:30:37Z"}
{"id":622,"first_name":"Carrissa","email":"ceverallh9@amazon.com","job":"Paralegal","timestamp":"2022-11-12T21:35:59Z"}
{"id":623,"first_name":"Alejandra","email":"askamalha@mashable.com","job":"Marketing Manager","timestamp":"2022-10-09T22:22:14Z"}
{"id":624,"first_name":"Kip","email":"kconnachanhb@apache.org","job":"Senior Developer","timestamp":"2022-05-03T18:43:02Z"}
{"id":625,"first_name":"Orland","email":"orowenhc@eventbrite.com","job":"Compensation Analyst","timestamp":"2022-04-10T09:38:40Z"}
{"id":626,"first_name":"Victor","email":"vleadleyhd@1688.com","job":"Administrative Assistant I","timestamp":"2022-06-22T19:00:46Z"}
{"id":627,"first_name":"Elfrida","email":"ebygravehe@diigo.com","job":"Information Systems Manager","timestamp":"2022-03-01T08:38:49Z"}
{"id":628,"first_name":"Stanislas","email":"srandlesomehf@istockphoto.com","job":"Physical Therapy Assistant","timestamp":"2022-10-09T04:54:10Z"}
{"id":629,"first_name":"Jake","email":"jberkleyhg@smh.com.au","job":"Executive Secretary","timestamp":"2022-08-29T16:34:06Z"}
{"id":630,"first_name":"Lissa","email":"llourenshh@mit.edu","job":"Operator","timestamp":"2022-03-31T02:56:51Z"}
{"id":631,"first_name":"Fidelia","email":"fmendoncahi@cafepress.com","job":"Analyst Programmer","timestamp":"2022-10-10T17:58:04Z"}
{"id":632,"first_name":"Magdaia","email":"mpartingtonhj@cbsnews.com","job":"Nurse","timestamp":"2022-05-22T11:17:36Z"}
{"id":633,"first_name":"Saunderson","email":"sarnfieldhk@icq.com","job":"Environmental Tech","timestamp":"2022-03-17T04:16:50Z"}
{"id":634,"first_name":"Morie","email":"mnearyhl@shop-pro.jp","job":"Geological Engineer","timestamp":"2022-12-06T19:53:49Z"}
{"id":635,"first_name":"Ulrick","email":"umellhuishhm@a8.net","job":"Software Test Engineer II","timestamp":"2022-10-10T04:34:01Z"}
{"id":636,"first_name":"Netta","email":"nlamswoodhn@mail.ru","job":"Human Resources Assistant IV","timestamp":"2021-12-16T01:49:11Z"}
{"id":637,"first_name":"Amelina","email":"aravenscroftho@godaddy.com","job":"Office Assistant II","timestamp":"2022-09-17T20:31:27Z"}
{"id":638,"first_name":"Marybeth","email":"mfrenzlhp@ed.gov","job":"Nuclear Power Engineer","timestamp":"2022-09-19T23:47:19Z"}
{"id":639,"first_name":"Viva","email":"vdonsonhq@hubpages.com","job":"Senior Financial Analyst","timestamp":"2022-08-24T14:49:26Z"}
{"id":640,"first_name":"Zea","email":"zbercherhr@accuweather.com","job":"VP Marketing","timestamp":"2022-03-30T19:15:59Z"}
{"id":641,"first_name":"Sonia","email":"sjoreths@joomla.org","job":"Paralegal","timestamp":"2022-12-06T16:14:12Z"}
{"id":642,"first_name":"Foster","email":"fblaxlandeht@google.co.uk","job":"Administrative Officer","timestamp":"2022-06-30T05:18:46Z"}
{"id":643,"first_name":"Ema","email":"etorresehu@globo.com","job":"Software Test Engineer I","timestamp":"2022-08-13T07:21:00Z"}
{"id":644,"first_name":"Venus","email":"vminchellahv@woothemes.com","job":"Senior Cost Accountant","timestamp":"2022-05-07T02:11:33Z"}
{"id":645,"first_name":"Cherilyn","email":"cjenesshw@so-net.ne.jp","job":"Financial Advisor","timestamp":"2022-12-02T11:35:03Z"}
{"id":646,"first_name":"Carolee","email":"cwyehx@miibeian.gov.cn","job":"Business Systems Development Analyst","timestamp":"2022-11-06T02:43:51Z"}
{"id":647,"first_name":"Tybi","email":"tburrhy@geocities.jp","job":"Electrical Engineer","timestamp":"2022-02-13T08:57:59Z"}
{"id":648,"first_name":"Karoly","email":"kmangeonhz@github.com","job":"Librarian","timestamp":"2022-11-01T03:32:14Z"}
{"id":649,"first_name":"Wandie","email":"wklimentyevi0@redcross.org","job":"Associate Professor","timestamp":"2022-09-15T12:54:45Z"}
{"id":650,"first_name":"Bonny","email":"bsneesbyi1@tinyurl.com","job":"Financial Analyst","timestamp":"2022-05-16T02:52:09Z"}
{"id":651,"first_name":"Minna","email":"mmcgluei2@meetup.com","job":"Developer III","timestamp":"2022-10-11T11:00:55Z"}
{"id":652,"first_name":"Cleo","email":"cbillsoni3@php.net","job":"Developer III","timestamp":"2022-03-23T02:20:12Z"}
{"id":653,"first_name":"Glendon","email":"gwrankmorei4@japanpost.jp","job":"Senior Developer","timestamp":"2022-01-06T01:37:38Z"}
{"id":654,"first_name":"Darn","email":"ddunsirei5@businessweek.com","job":"Programmer Analyst I","timestamp":"2022-05-17T11:14:20Z"}
{"id":655,"first_name":"Bernice","email":"bhrachoveci6@guardian.co.uk","job":"Marketing Assistant","timestamp":"2022-06-12T01:14:43Z"}
{"id":656,"first_name":"Benoite","email":"bgregoni7@bbc.co.uk","job":"Staff Scientist","timestamp":"2022-05-14T20:00:31Z"}
{"id":657,"first_name":"Nicol","email":"nogleviei8@nps.gov","job":"Quality Engineer","timestamp":"2022-07-30T12:09:37Z"}
{"id":658,"first_name":"Desmond","email":"desleyi9@craigslist.org","job":"Safety Technician III","timestamp":"2022-07-29T10:46:51Z"}
{"id":659,"first_name":"Simone","email":"sdonaghieia@yelp.com","job":"Health Coach II","timestamp":"2022-10-27T09:06:51Z"}
{"id":660,"first_name":"Lynn","email":"lmctrustamib@mail.ru","job":"Software Test Engineer I","timestamp":"2022-08-24T03:37:20Z"}
{"id":661,"first_name":"Jerri","email":"jledekeric@mail.ru","job":"Senior Developer","timestamp":"2022-09-06T19:35:20Z"}
{"id":662,"first_name":"Cristal","email":"cjochananyid@wp.com","job":"Sales Representative","timestamp":"2022-06-12T06:52:58Z"}
{"id":663,"first_name":"Caye","email":"cbirdseyie@amazon.de","job":"Chief Design Engineer","timestamp":"2022-06-02T00:42:50Z"}
{"id":664,"first_name":"Tamma","email":"tredheadif@friendfeed.com","job":"Pharmacist","timestamp":"2022-11-27T20:41:48Z"}
{"id":665,"first_name":"Delaney","email":"dabbettig@umich.edu","job":"Financial Analyst","timestamp":"2022-09-05T10:44:54Z"}
{"id":666,"first_name":"Henka","email":"hvondrasekih@prweb.com","job":"Recruiting Manager","timestamp":"2022-04-09T19:42:27Z"}
{"id":667,"first_name":"Martie","email":"mjandourekii@sphinn.com","job":"Nurse Practicioner","timestamp":"2022-11-02T22:27:58Z"}
{"id":668,"first_name":"Adelle","email":"ariddlesdenij@netlog.com","job":"Dental Hygienist","timestamp":"2022-10-12T03:05:23Z"}
{"id":669,"first_name":"Andee","email":"abandeyik@guardian.co.uk","job":"Librarian","timestamp":"2022-08-07T13:11:22Z"}
{"id":670,"first_name":"Hollis","email":"hmacgrueril@wired.com","job":"Recruiting Manager","timestamp":"2022-10-06T05:09:28Z"}
{"id":671,"first_name":"Dona","email":"dselesnickim@yandex.ru","job":"Senior Sales Associate","timestamp":"2022-07-18T09:15:16Z"}
{"id":672,"first_name":"Siffre","email":"smaliffein@hugedomains.com","job":"VP Sales","timestamp":"2022-07-19T13:05:02Z"}
{"id":673,"first_name":"Gwenny","email":"gfeighryio@go.com","job":"Automation Specialist IV","timestamp":"2022-03-07T03:15:33Z"}
{"id":674,"first_name":"Paxon","email":"pcoplandip@blogs.com","job":"Data Coordiator","timestamp":"2022-09-10T10:45:06Z"}
{"id":675,"first_name":"Fredric","email":"fohanneniq@livejournal.com","job":"Director of Sales","timestamp":"2022-10-30T18:56:02Z"}
{"id":676,"first_name":"Enoch","email":"ekenningleyir@sciencedaily.com","job":"Account Coordinator","timestamp":"2022-01-11T16:42:07Z"}
{"id":677,"first_name":"Farand","email":"ffassonis@theglobeandmail.com","job":"GIS Technical Architect","timestamp":"2022-08-17T01:48:24Z"}
{"id":678,"first_name":"Gypsy","email":"gbristoeit@tumblr.com","job":"VP Marketing","timestamp":"2022-02-02T15:22:39Z"}
{"id":679,"first_name":"Lewie","email":"lskiltoniu@yolasite.com","job":"Executive Secretary","timestamp":"2022-11-02T17:38:40Z"}
{"id":680,"first_name":"Elnora","email":"evogeliv@geocities.com","job":"Administrative Officer","timestamp":"2022-05-14T16:28:29Z"}
{"id":681,"first_name":"Humfrey","email":"htethacotiw@springer.com","job":"Compensation Analyst","timestamp":"2022-01-18T00:36:58Z"}
{"id":682,"first_name":"Eadith","email":"eespadasix@mit.edu","job":"Web Designer III","timestamp":"2021-12-19T13:39:40Z"}
{"id":683,"first_name":"Winne","email":"wdunrigeiy@zdnet.com","job":"Help Desk Operator","timestamp":"2022-03-12T11:35:51Z"}
{"id":684,"first_name":"Ewell","email":"ewestbyiz@cargocollective.com","job":"Research Assistant III","timestamp":"2022-05-24T04:23:15Z"}
{"id":685,"first_name":"Johan","email":"jjoej0@mac.com","job":"Developer I","timestamp":"2022-11-14T13:44:24Z"}
{"id":686,"first_name":"Palmer","email":"phassenj1@pagesperso-orange.fr","job":"Data Coordiator","timestamp":"2022-04-11T09:12:42Z"}
{"id":687,"first_name":"Gabriel","email":"gwyllcocksj2@ox.ac.uk","job":"Nurse Practicioner","timestamp":"2022-02-21T15:51:39Z"}
{"id":688,"first_name":"Gustavus","email":"gwardropj3@ca.gov","job":"Librarian","timestamp":"2021-12-23T05:56:10Z"}
{"id":689,"first_name":"Sharl","email":"srabbagej4@artisteer.com","job":"Marketing Manager","timestamp":"2022-02-07T10:20:00Z"}
{"id":690,"first_name":"Lexi","email":"ldumphryj5@vistaprint.com","job":"Accountant III","timestamp":"2022-09-23T07:06:14Z"}
{"id":691,"first_name":"Garrot","email":"gfydoej6@ucla.edu","job":"Geological Engineer","timestamp":"2022-01-26T10:00:47Z"}
{"id":692,"first_name":"Aida","email":"akissackj7@delicious.com","job":"Senior Cost Accountant","timestamp":"2022-03-12T19:37:00Z"}
{"id":693,"first_name":"Quillan","email":"qibesonj8@marriott.com","job":"Geological Engineer","timestamp":"2022-08-07T09:42:27Z"}
{"id":694,"first_name":"Ailey","email":"awimmersj9@dion.ne.jp","job":"VP Accounting","timestamp":"2022-04-20T23:12:01Z"}
{"id":695,"first_name":"Corbett","email":"ctancockja@prlog.org","job":"Executive Secretary","timestamp":"2022-09-26T06:28:39Z"}
{"id":696,"first_name":"Aubry","email":"agarrudjb@sphinn.com","job":"VP Accounting","timestamp":"2022-07-08T15:40:52Z"}
{"id":697,"first_name":"Lyndsay","email":"lbarrelljc@aboutads.info","job":"Administrative Assistant III","timestamp":"2022-11-14T23:43:47Z"}
{"id":698,"first_name":"Ezekiel","email":"espeedinjd@who.int","job":"Human Resources Manager","timestamp":"2022-06-07T23:27:06Z"}
{"id":699,"first_name":"Monah","email":"mwittmanje@forbes.com","job":"Executive Secretary","timestamp":"2022-02-27T22:07:29Z"}
{"id":700,"first_name":"Tammi","email":"tpetticrewjf@yandex.ru","job":"Programmer Analyst III","timestamp":"2022-03-21T08:41:59Z"}
{"id":701,"first_name":"Brynne","email":"bbondleyjg@admin.ch","job":"Analyst Programmer","timestamp":"2022-08-08T19:25:12Z"}
{"id":702,"first_name":"Mirilla","email":"mrollinsonjh@twitter.com","job":"Geological Engineer","timestamp":"2022-05-23T06:08:30Z"}
{"id":703,"first_name":"Archibald","email":"aandricji@icq.com","job":"Chemical Engineer","timestamp":"2022-08-01T05:10:36Z"}
{"id":704,"first_name":"Mozes","email":"mcawoodjj@flickr.com","job":"VP Sales","timestamp":"2022-05-01T22:55:12Z"}
{"id":705,"first_name":"Delcine","email":"dcornickjk@amazon.de","job":"Director of Sales","timestamp":"2022-11-23T10:16:23Z"}
{"id":706,"first_name":"Jill","email":"jhandesjl@netscape.com","job":"Programmer IV","timestamp":"2022-05-04T07:01:23Z"}
{"id":707,"first_name":"Eleonore","email":"ecoxenjm@histats.com","job":"Human Resources Manager","timestamp":"2022-09-17T04:17:56Z"}
{"id":708,"first_name":"Gabrila","email":"gkeilingjn@zdnet.com","job":"Legal Assistant","timestamp":"2021-12-12T09:11:37Z"}
{"id":709,"first_name":"Nalani","email":"nleathesjo@yandex.ru","job":"Quality Engineer","timestamp":"2022-07-17T15:32:26Z"}
{"id":710,"first_name":"Brittany","email":"battenbarrowjp@cocolog-nifty.com","job":"Graphic Designer","timestamp":"2022-07-20T13:14:17Z"}
{"id":711,"first_name":"Nickola","email":"nnormanvillejq@seesaa.net","job":"Electrical Engineer","timestamp":"2022-02-05T08:16:47Z"}
{"id":712,"first_name":"Gian","email":"gneelyjr@de.vu","job":"Desktop Support Technician","timestamp":"2022-03-01T08:02:02Z"}
{"id":713,"first_name":"Merill","email":"mgaveltonejs@cbslocal.com","job":"Quality Engineer","timestamp":"2022-01-04T05:48:29Z"}
{"id":714,"first_name":"Salomon","email":"sambrogijt@exblog.jp","job":"Geological Engineer","timestamp":"2022-03-03T16:21:14Z"}
{"id":715,"first_name":"Mamie","email":"myaninju@clickbank.net","job":"Payment Adjustment Coordinator","timestamp":"2022-03-02T06:21:14Z"}
{"id":716,"first_name":"Arel","email":"acushejv@usnews.com","job":"VP Quality Control","timestamp":"2022-03-13T18:33:20Z"}
{"id":717,"first_name":"Benjamin","email":"bromanskijw@pinterest.com","job":"Electrical Engineer","timestamp":"2022-07-08T14:39:45Z"}
{"id":718,"first_name":"Woody","email":"wfrancesconejx@friendfeed.com","job":"Account Representative III","timestamp":"2022-02-02T21:45:59Z"}
{"id":719,"first_name":"Annabal","email":"atrewhittjy@ameblo.jp","job":"Teacher","timestamp":"2022-09-17T16:09:41Z"}
{"id":720,"first_name":"Kasper","email":"kweightjz@wikia.com","job":"Financial Advisor","timestamp":"2022-08-06T22:31:35Z"}
{"id":721,"first_name":"Sylvan","email":"stumasiank0@theglobeandmail.com","job":"Recruiting Manager","timestamp":"2022-03-17T18:22:35Z"}
{"id":722,"first_name":"Helga","email":"hcocklek1@slate.com","job":"Help Desk Operator","timestamp":"2022-10-27T22:15:09Z"}
{"id":723,"first_name":"Dottie","email":"dpiggottk2@adobe.com","job":"Nurse Practicioner","timestamp":"2022-05-01T14:02:18Z"}
{"id":724,"first_name":"Brant","email":"bwookeyk3@ucsd.edu","job":"Help Desk Operator","timestamp":"2022-08-10T08:04:15Z"}
{"id":725,"first_name":"Jojo","email":"jbeurichk4@linkedin.com","job":"Professor","timestamp":"2022-03-29T06:28:53Z"}
{"id":726,"first_name":"Daryl","email":"dcromlyk5@spotify.com","job":"Tax Accountant","timestamp":"2022-02-11T22:39:20Z"}
{"id":727,"first_name":"Eadmund","email":"emelmethk6@google.com.au","job":"Environmental Specialist","timestamp":"2022-04-19T04:20:44Z"}
{"id":728,"first_name":"Gaston","email":"gjaneczekk7@mashable.com","job":"VP Marketing","timestamp":"2022-02-09T19:01:05Z"}
{"id":729,"first_name":"Jody","email":"jhansleyk8@edublogs.org","job":"Mechanical Systems Engineer","timestamp":"2022-04-19T23:15:14Z"}
{"id":730,"first_name":"Chelsy","email":"cdimblebeek9@vk.com","job":"Quality Control Specialist","timestamp":"2022-02-18T17:49:47Z"}
{"id":731,"first_name":"Lilias","email":"lburchka@oaic.gov.au","job":"Nuclear Power Engineer","timestamp":"2022-05-19T21:46:19Z"}
{"id":732,"first_name":"Godiva","email":"gmolloykb@ibm.com","job":"Systems Administrator II","timestamp":"2022-05-17T17:39:48Z"}
{"id":733,"first_name":"Faye","email":"fbucknillkc@hc360.com","job":"Web Developer IV","timestamp":"2022-02-22T20:39:11Z"}
{"id":734,"first_name":"Rickie","email":"rdemezakd@tiny.cc","job":"General Manager","timestamp":"2022-06-09T10:15:05Z"}
{"id":735,"first_name":"Jessi","email":"jkingsnoadke@aboutads.info","job":"Programmer II","timestamp":"2022-08-19T22:15:39Z"}
{"id":736,"first_name":"Marice","email":"mmacdaidkf@omniture.com","job":"Clinical Specialist","timestamp":"2021-12-10T07:04:23Z"}
{"id":737,"first_name":"Sig","email":"sbarffordkg@wufoo.com","job":"Account Coordinator","timestamp":"2022-06-20T01:48:52Z"}
{"id":738,"first_name":"Ashia","email":"ahulettkh@pcworld.com","job":"Cost Accountant","timestamp":"2022-07-18T11:58:34Z"}
{"id":739,"first_name":"Alisa","email":"ascandrickki@businessinsider.com","job":"Accountant III","timestamp":"2022-10-05T04:12:34Z"}
{"id":740,"first_name":"Janella","email":"jfranzelinikj@jimdo.com","job":"Help Desk Operator","timestamp":"2022-01-21T13:47:46Z"}
{"id":741,"first_name":"Bondie","email":"bhryskiewiczkk@ucla.edu","job":"Safety Technician II","timestamp":"2022-10-15T19:50:53Z"}
{"id":742,"first_name":"Vivyan","email":"vcardnellkl@shareasale.com","job":"Senior Sales Associate","timestamp":"2022-04-18T16:31:43Z"}
{"id":743,"first_name":"Mylo","email":"miviekm@hhs.gov","job":"Analog Circuit Design manager","timestamp":"2022-06-08T12:03:06Z"}
{"id":744,"first_name":"Thomas","email":"tshawekn@cnbc.com","job":"Senior Quality Engineer","timestamp":"2021-12-11T11:54:22Z"}
{"id":745,"first_name":"Jessalin","email":"jgarthlandko@canalblog.com","job":"Chemical Engineer","timestamp":"2022-11-23T08:39:58Z"}
{"id":746,"first_name":"Joannes","email":"jwhitcombkp@odnoklassniki.ru","job":"Food Chemist","timestamp":"2022-01-22T22:10:33Z"}
{"id":747,"first_name":"Morlee","email":"mellisskq@virginia.edu","job":"VP Quality Control","timestamp":"2022-01-07T13:48:52Z"}
{"id":748,"first_name":"Karalynn","email":"koshevlinkr@japanpost.jp","job":"VP Product Management","timestamp":"2022-11-28T08:30:42Z"}
{"id":749,"first_name":"Phedra","email":"pgrigoriscuks@mayoclinic.com","job":"VP Accounting","timestamp":"2021-12-19T22:37:59Z"}
{"id":750,"first_name":"Denna","email":"ddeluzekt@freewebs.com","job":"Sales Associate","timestamp":"2022-09-01T10:42:32Z"}
{"id":751,"first_name":"Audrye","email":"aburghallku@behance.net","job":"Civil Engineer","timestamp":"2022-02-22T05:02:58Z"}
{"id":752,"first_name":"Dane","email":"dsharpekv@comcast.net","job":"VP Sales","timestamp":"2022-11-14T11:52:28Z"}
{"id":753,"first_name":"Nye","email":"nmulcasterkw@wikia.com","job":"Environmental Specialist","timestamp":"2022-08-09T11:06:13Z"}
{"id":754,"first_name":"Dame","email":"dmacenellykx@technorati.com","job":"Compensation Analyst","timestamp":"2022-03-16T13:16:49Z"}
{"id":755,"first_name":"Nevsa","email":"nkurdaniky@moonfruit.com","job":"Associate Professor","timestamp":"2022-07-30T09:04:58Z"}
{"id":756,"first_name":"Ronni","email":"rstarfordkz@aboutads.info","job":"Payment Adjustment Coordinator","timestamp":"2022-06-21T05:54:44Z"}
{"id":757,"first_name":"Hyacintha","email":"hcallabyl0@ask.com","job":"Social Worker","timestamp":"2022-03-09T00:34:02Z"}
{"id":758,"first_name":"Obidiah","email":"odougherl1@eventbrite.com","job":"Financial Analyst","timestamp":"2022-05-12T12:34:37Z"}
{"id":759,"first_name":"Terrill","email":"thaddacksl2@businesswire.com","job":"Accounting Assistant II","timestamp":"2022-12-02T04:29:19Z"}
{"id":760,"first_name":"Robby","email":"rhurdl3@i2i.jp","job":"Budget/Accounting Analyst IV","timestamp":"2022-09-28T12:20:36Z"}
{"id":761,"first_name":"Blayne","email":"bbebbelll4@dailymotion.com","job":"Administrative Assistant II","timestamp":"2022-10-22T13:16:00Z"}
{"id":762,"first_name":"Viki","email":"vmcmylerl5@mtv.com","job":"General Manager","timestamp":"2022-09-24T05:32:27Z"}
{"id":763,"first_name":"Erhard","email":"epengellyl6@slate.com","job":"Database Administrator I","timestamp":"2022-12-02T07:39:09Z"}
{"id":764,"first_name":"Weylin","email":"wpesekl7@moonfruit.com","job":"Accounting Assistant IV","timestamp":"2022-08-18T01:40:24Z"}
{"id":765,"first_name":"Garwin","email":"gspikinsl8@hhs.gov","job":"Computer Systems Analyst III","timestamp":"2022-03-01T04:22:37Z"}
{"id":766,"first_name":"Frederique","email":"fpellingl9@unc.edu","job":"Internal Auditor","timestamp":"2022-06-24T21:08:43Z"}
{"id":767,"first_name":"Terence","email":"tbardsleyla@i2i.jp","job":"Teacher","timestamp":"2022-09-12T16:41:01Z"}
{"id":768,"first_name":"Reynold","email":"rgiovanninilb@fotki.com","job":"Information Systems Manager","timestamp":"2022-04-12T21:15:43Z"}
{"id":769,"first_name":"Ethel","email":"ewhightmanlc@scribd.com","job":"Tax Accountant","timestamp":"2022-04-22T18:35:04Z"}
{"id":770,"first_name":"Larry","email":"lchavezld@amazon.co.uk","job":"Business Systems Development Analyst","timestamp":"2022-07-15T05:25:54Z"}
{"id":771,"first_name":"Tessy","email":"tbenle@wisc.edu","job":"VP Sales","timestamp":"2022-03-16T21:30:37Z"}
{"id":772,"first_name":"Dane","email":"dmatterfacelf@deliciousdays.com","job":"Mechanical Systems Engineer","timestamp":"2022-11-25T10:41:02Z"}
{"id":773,"first_name":"Kleon","email":"ksurgenerlg@tinypic.com","job":"Food Chemist","timestamp":"2022-02-13T20:28:16Z"}
{"id":774,"first_name":"Nicolea","email":"nnequestlh@dmoz.org","job":"VP Marketing","timestamp":"2022-03-31T01:03:41Z"}
{"id":775,"first_name":"Bevvy","email":"bsavellli@ucoz.ru","job":"Electrical Engineer","timestamp":"2022-10-25T06:01:02Z"}
{"id":776,"first_name":"Joel","email":"jnottilj@amazonaws.com","job":"Chief Design Engineer","timestamp":"2022-07-15T05:05:24Z"}
{"id":777,"first_name":"Mindy","email":"mpinnockelk@squidoo.com","job":"Marketing Assistant","timestamp":"2022-06-30T00:26:25Z"}
{"id":778,"first_name":"Jerad","email":"jgallierll@digg.com","job":"Sales Associate","timestamp":"2022-01-21T20:28:29Z"}
{"id":779,"first_name":"Milissent","email":"mbackslm@spotify.com","job":"Research Assistant I","timestamp":"2022-01-19T06:38:59Z"}
{"id":780,"first_name":"Callean","email":"cradborneln@ft.com","job":"VP Sales","timestamp":"2022-08-20T09:47:35Z"}
{"id":781,"first_name":"Gilbertina","email":"gzorzonilo@alibaba.com","job":"Cost Accountant","timestamp":"2022-01-09T19:52:20Z"}
{"id":782,"first_name":"Thain","email":"tlevenslp@zimbio.com","job":"Media Manager II","timestamp":"2022-05-31T00:22:07Z"}
{"id":783,"first_name":"Lem","email":"lrylattlq@yellowpages.com","job":"Marketing Assistant","timestamp":"2022-05-12T17:04:30Z"}
{"id":784,"first_name":"Lillian","email":"ltanslylr@sourceforge.net","job":"Human Resources Assistant III","timestamp":"2022-07-02T03:01:56Z"}
{"id":785,"first_name":"Smith","email":"smeinls@biglobe.ne.jp","job":"Junior Executive","timestamp":"2022-02-07T00:50:30Z"}
{"id":786,"first_name":"Meris","email":"mterbruggenlt@livejournal.com","job":"Structural Analysis Engineer","timestamp":"2022-07-27T16:40:12Z"}
{"id":787,"first_name":"Leesa","email":"lraeburnlu@tmall.com","job":"Operator","timestamp":"2022-02-22T06:34:25Z"}
{"id":788,"first_name":"Brennen","email":"bbowartlv@cdc.gov","job":"GIS Technical Architect","timestamp":"2022-11-08T23:11:20Z"}
{"id":789,"first_name":"Fabian","email":"fravenslw@linkedin.com","job":"Project Manager","timestamp":"2022-07-18T23:53:45Z"}
{"id":790,"first_name":"Amelina","email":"alandmanlx@ted.com","job":"Internal Auditor","timestamp":"2022-01-13T23:18:20Z"}
{"id":791,"first_name":"Mozelle","email":"meldertonly@ezinearticles.com","job":"Media Manager II","timestamp":"2022-11-03T14:12:26Z"}
{"id":792,"first_name":"Tobit","email":"tserjentlz@elegantthemes.com","job":"Database Administrator I","timestamp":"2022-07-01T12:08:46Z"}
{"id":793,"first_name":"Tanner","email":"tpauleym0@stumbleupon.com","job":"Senior Cost Accountant","timestamp":"2022-01-29T14:16:25Z"}
{"id":794,"first_name":"Kristin","email":"kdukerm1@sohu.com","job":"Administrative Assistant IV","timestamp":"2022-02-07T10:44:11Z"}
{"id":795,"first_name":"Ware","email":"wchellm2@rediff.com","job":"Social Worker","timestamp":"2022-02-17T13:59:09Z"}
{"id":796,"first_name":"Berrie","email":"begglem3@surveymonkey.com","job":"Accounting Assistant I","timestamp":"2022-06-19T18:52:37Z"}
{"id":797,"first_name":"Andros","email":"asprullsm4@ifeng.com","job":"Account Executive","timestamp":"2022-01-17T22:42:36Z"}
{"id":798,"first_name":"Saidee","email":"swiffillm5@blogspot.com","job":"VP Quality Control","timestamp":"2022-05-25T02:52:49Z"}
{"id":799,"first_name":"Susanna","email":"sbrentnallm6@vistaprint.com","job":"VP Product Management","timestamp":"2022-04-17T11:27:28Z"}
{"id":800,"first_name":"Micheline","email":"mwalbrookm7@nih.gov","job":"Statistician II","timestamp":"2022-08-07T03:20:05Z"}
{"id":801,"first_name":"Putnem","email":"pnevillm8@studiopress.com","job":"Professor","timestamp":"2022-03-05T15:31:28Z"}
{"id":802,"first_name":"Hinze","email":"hboocockm9@amazon.co.jp","job":"Human Resources Assistant II","timestamp":"2022-02-05T09:35:18Z"}
{"id":803,"first_name":"Ketti","email":"kbritcherma@instagram.com","job":"Administrative Officer","timestamp":"2022-07-17T06:02:28Z"}
{"id":804,"first_name":"Nevins","email":"nyanshinmb@surveymonkey.com","job":"Operator","timestamp":"2022-08-07T10:38:06Z"}
{"id":805,"first_name":"Scott","email":"sgallafantmc@amazonaws.com","job":"Statistician III","timestamp":"2022-08-26T17:02:44Z"}
{"id":806,"first_name":"Lacie","email":"lsplavenmd@addtoany.com","job":"Quality Engineer","timestamp":"2022-01-17T19:39:07Z"}
{"id":807,"first_name":"Renado","email":"rleijsme@discuz.net","job":"Executive Secretary","timestamp":"2022-04-14T21:12:21Z"}
{"id":808,"first_name":"Goldia","email":"gbumphreymf@senate.gov","job":"Editor","timestamp":"2022-06-27T04:37:50Z"}
{"id":809,"first_name":"Corri","email":"ctonkinsonmg@slate.com","job":"Dental Hygienist","timestamp":"2022-11-25T08:45:37Z"}
{"id":810,"first_name":"Barry","email":"bondramh@sciencedaily.com","job":"Project Manager","timestamp":"2022-02-27T10:13:39Z"}
{"id":811,"first_name":"Duffy","email":"dvandersonmi@blinklist.com","job":"Recruiting Manager","timestamp":"2022-04-26T20:13:47Z"}
{"id":812,"first_name":"Sande","email":"sphairmj@live.com","job":"Associate Professor","timestamp":"2022-07-30T13:56:11Z"}
{"id":813,"first_name":"Marissa","email":"mkisbymk@hud.gov","job":"Mechanical Systems Engineer","timestamp":"2022-11-13T13:55:16Z"}
{"id":814,"first_name":"Timmy","email":"twoloschinml@army.mil","job":"Environmental Tech","timestamp":"2022-04-12T01:37:40Z"}
{"id":815,"first_name":"Early","email":"ehaukeymm@tamu.edu","job":"Executive Secretary","timestamp":"2022-01-17T16:13:19Z"}
{"id":816,"first_name":"Maynard","email":"mmajormn@google.ru","job":"Database Administrator II","timestamp":"2022-10-30T01:30:43Z"}
{"id":817,"first_name":"Geordie","email":"gspiermo@rambler.ru","job":"Administrative Assistant I","timestamp":"2022-10-28T08:13:24Z"}
{"id":818,"first_name":"Trula","email":"tcustmp@drupal.org","job":"Database Administrator II","timestamp":"2022-01-23T22:50:14Z"}
{"id":819,"first_name":"Vale","email":"vrammemq@prlog.org","job":"Desktop Support Technician","timestamp":"2021-12-25T03:53:38Z"}
{"id":820,"first_name":"Winny","email":"wmcgallmr@edublogs.org","job":"Media Manager IV","timestamp":"2022-06-22T03:47:41Z"}
{"id":821,"first_name":"Laraine","email":"lfortems@tamu.edu","job":"Social Worker","timestamp":"2022-07-17T05:32:39Z"}
{"id":822,"first_name":"Nathanil","email":"nchamleymt@altervista.org","job":"Administrative Assistant II","timestamp":"2022-05-28T11:05:26Z"}
{"id":823,"first_name":"Jarib","email":"jspinettimu@cnbc.com","job":"Internal Auditor","timestamp":"2022-09-04T22:57:50Z"}
{"id":824,"first_name":"Betsey","email":"bbolgarmv@google.nl","job":"Librarian","timestamp":"2022-05-14T19:20:02Z"}
{"id":825,"first_name":"Tadd","email":"tnoellmw@walmart.com","job":"Structural Engineer","timestamp":"2022-08-24T02:35:22Z"}
{"id":826,"first_name":"Puff","email":"pgerokmx@gizmodo.com","job":"Teacher","timestamp":"2022-09-12T07:28:33Z"}
{"id":827,"first_name":"Yasmin","email":"yfippmy@reverbnation.com","job":"Programmer Analyst III","timestamp":"2022-12-02T19:47:38Z"}
{"id":828,"first_name":"Bernadette","email":"bleganmz@telegraph.co.uk","job":"Civil Engineer","timestamp":"2022-03-31T12:49:01Z"}
{"id":829,"first_name":"Berni","email":"bgloucestern0@gov.uk","job":"Research Assistant I","timestamp":"2022-06-25T03:32:48Z"}
{"id":830,"first_name":"Karlotte","email":"kmartignonin1@cocolog-nifty.com","job":"Health Coach I","timestamp":"2022-02-20T11:58:30Z"}
{"id":831,"first_name":"Bernadine","email":"bspavonn2@liveinternet.ru","job":"Structural Analysis Engineer","timestamp":"2021-12-11T21:39:43Z"}
{"id":832,"first_name":"Lela","email":"lnoenn3@redcross.org","job":"Human Resources Assistant IV","timestamp":"2022-05-29T13:49:27Z"}
{"id":833,"first_name":"Aurora","email":"amendenhalln4@delicious.com","job":"Food Chemist","timestamp":"2022-07-31T00:29:00Z"}
{"id":834,"first_name":"Florian","email":"fstrowthern5@scribd.com","job":"Data Coordiator","timestamp":"2022-10-09T13:32:16Z"}
{"id":835,"first_name":"Audy","email":"aoveralln6@dell.com","job":"Editor","timestamp":"2022-04-11T14:56:31Z"}
{"id":836,"first_name":"Lyndsay","email":"ldecavillen7@cdc.gov","job":"Nuclear Power Engineer","timestamp":"2022-05-27T07:08:15Z"}
{"id":837,"first_name":"Pail","email":"plewcockn8@github.com","job":"Administrative Officer","timestamp":"2022-01-20T04:13:27Z"}
{"id":838,"first_name":"Kevan","email":"kbarkleyn9@seesaa.net","job":"Assistant Media Planner","timestamp":"2022-08-07T06:05:54Z"}
{"id":839,"first_name":"Kimmi","email":"kmunnionna@newsvine.com","job":"Safety Technician III","timestamp":"2022-08-14T04:25:45Z"}
{"id":840,"first_name":"Esmaria","email":"eairenb@ox.ac.uk","job":"Account Coordinator","timestamp":"2022-03-10T21:54:53Z"}
{"id":841,"first_name":"Klarika","email":"kpennettinc@oakley.com","job":"Senior Quality Engineer","timestamp":"2022-09-17T15:56:15Z"}
{"id":842,"first_name":"Minetta","email":"mkornackind@discovery.com","job":"GIS Technical Architect","timestamp":"2022-07-11T11:26:43Z"}
{"id":843,"first_name":"Emmit","email":"eboylinne@storify.com","job":"Sales Associate","timestamp":"2022-10-16T12:23:15Z"}
{"id":844,"first_name":"Chaim","email":"credmaynenf@wiley.com","job":"Mechanical Systems Engineer","timestamp":"2022-05-14T03:30:45Z"}
{"id":845,"first_name":"Orazio","email":"owitcherleyng@amazon.de","job":"VP Accounting","timestamp":"2022-10-18T20:52:32Z"}
{"id":846,"first_name":"Egbert","email":"ejordannh@surveymonkey.com","job":"Graphic Designer","timestamp":"2021-12-28T17:52:15Z"}
{"id":847,"first_name":"Clemens","email":"cblackebyni@livejournal.com","job":"Design Engineer","timestamp":"2022-03-30T10:36:40Z"}
{"id":848,"first_name":"Brooke","email":"bleedernj@godaddy.com","job":"Senior Sales Associate","timestamp":"2022-11-26T13:38:37Z"}
{"id":849,"first_name":"Batholomew","email":"baceynk@jigsy.com","job":"Information Systems Manager","timestamp":"2022-11-20T08:57:31Z"}
{"id":850,"first_name":"Reinhold","email":"rcubberleynl@de.vu","job":"Software Consultant","timestamp":"2022-07-09T19:38:46Z"}
{"id":851,"first_name":"Bel","email":"bshavenm@miitbeian.gov.cn","job":"Recruiting Manager","timestamp":"2022-01-28T17:24:18Z"}
{"id":852,"first_name":"Glenden","email":"ghumbienn@princeton.edu","job":"Project Manager","timestamp":"2022-05-16T07:45:40Z"}
{"id":853,"first_name":"Lorie","email":"ljeannotno@examiner.com","job":"Dental Hygienist","timestamp":"2022-10-15T03:52:40Z"}
{"id":854,"first_name":"Garrot","email":"gjepsonnp@marriott.com","job":"Editor","timestamp":"2022-04-10T04:24:08Z"}
{"id":855,"first_name":"Henrieta","email":"hfarrownq@ezinearticles.com","job":"Programmer Analyst III","timestamp":"2022-01-27T23:19:22Z"}
{"id":856,"first_name":"Luis","email":"ldiboldinr@aboutads.info","job":"Director of Sales","timestamp":"2022-02-21T08:33:27Z"}
{"id":857,"first_name":"Maurie","email":"medgettns@linkedin.com","job":"Clinical Specialist","timestamp":"2022-02-20T13:04:26Z"}
{"id":858,"first_name":"Kalie","email":"klemmennt@webs.com","job":"VP Sales","timestamp":"2022-02-07T04:55:05Z"}
{"id":859,"first_name":"Nadeen","email":"naldwichnu@java.com","job":"VP Sales","timestamp":"2022-06-06T09:30:36Z"}
{"id":860,"first_name":"Codie","email":"cdeclairmontnv@indiegogo.com","job":"Accountant III","timestamp":"2022-02-07T06:29:46Z"}
{"id":861,"first_name":"Fanny","email":"fdemanchenw@parallels.com","job":"Paralegal","timestamp":"2022-08-14T16:49:12Z"}
{"id":862,"first_name":"Dev","email":"ddongallnx@globo.com","job":"Health Coach III","timestamp":"2022-10-09T10:42:24Z"}
{"id":863,"first_name":"Anette","email":"alestorny@independent.co.uk","job":"Quality Engineer","timestamp":"2022-05-05T09:17:14Z"}
{"id":864,"first_name":"Alfy","email":"atindallnz@wordpress.com","job":"Web Developer II","timestamp":"2022-04-03T15:01:04Z"}
{"id":865,"first_name":"Malissa","email":"mdorseto0@umich.edu","job":"Research Assistant II","timestamp":"2022-01-18T08:08:14Z"}
{"id":866,"first_name":"Raychel","email":"rfolko1@hubpages.com","job":"Mechanical Systems Engineer","timestamp":"2022-10-01T03:04:36Z"}
{"id":867,"first_name":"Deloria","email":"dtraharo2@freewebs.com","job":"Paralegal","timestamp":"2022-04-22T11:25:15Z"}
{"id":868,"first_name":"Jayme","email":"jhardbattleo3@indiatimes.com","job":"Quality Control Specialist","timestamp":"2022-07-22T11:02:53Z"}
{"id":869,"first_name":"Brina","email":"bsherryo4@marketwatch.com","job":"Librarian","timestamp":"2022-01-05T17:11:02Z"}
{"id":870,"first_name":"Christal","email":"cloisio5@ehow.com","job":"Programmer II","timestamp":"2022-10-22T01:30:55Z"}
{"id":871,"first_name":"Nonna","email":"nneumanno6@dailymotion.com","job":"Nurse Practicioner","timestamp":"2022-02-21T08:46:46Z"}
{"id":872,"first_name":"Reiko","email":"rwordeno7@techcrunch.com","job":"Registered Nurse","timestamp":"2022-12-06T17:34:34Z"}
{"id":873,"first_name":"Michaeline","email":"mballantineo8@goo.ne.jp","job":"Associate Professor","timestamp":"2022-11-22T06:13:48Z"}
{"id":874,"first_name":"Flossie","email":"fdaylyo9@java.com","job":"Engineer III","timestamp":"2022-04-23T11:41:09Z"}
{"id":875,"first_name":"Kathleen","email":"kroblouoa@baidu.com","job":"Associate Professor","timestamp":"2021-12-26T18:03:46Z"}
{"id":876,"first_name":"Renaud","email":"rgookesob@mediafire.com","job":"Help Desk Technician","timestamp":"2022-12-03T02:45:25Z"}
{"id":877,"first_name":"Rollo","email":"rdericutoc@businesswire.com","job":"Research Assistant IV","timestamp":"2022-10-31T18:36:20Z"}
{"id":878,"first_name":"Faber","email":"fsimioniod@alibaba.com","job":"GIS Technical Architect","timestamp":"2022-12-01T21:20:46Z"}
{"id":879,"first_name":"Malynda","email":"mgresoe@furl.net","job":"Systems Administrator I","timestamp":"2022-05-31T05:31:01Z"}
{"id":880,"first_name":"Eldridge","email":"everdonof@hexun.com","job":"Data Coordiator","timestamp":"2022-03-27T14:39:55Z"}
{"id":881,"first_name":"Maxy","email":"mmooneyog@businessweek.com","job":"Data Coordiator","timestamp":"2022-11-06T17:31:25Z"}
{"id":882,"first_name":"Kevina","email":"kpericooh@google.de","job":"Nurse Practicioner","timestamp":"2022-03-27T13:04:10Z"}
{"id":883,"first_name":"Roberto","email":"ralloneoi@over-blog.com","job":"Assistant Media Planner","timestamp":"2022-10-19T17:41:28Z"}
{"id":884,"first_name":"Reeta","email":"rmatlockoj@ow.ly","job":"Legal Assistant","timestamp":"2022-05-16T05:22:12Z"}
{"id":885,"first_name":"Romonda","email":"rpinckneyok@list-manage.com","job":"Financial Analyst","timestamp":"2022-02-02T20:15:20Z"}
{"id":886,"first_name":"Barnett","email":"bhedlestoneol@ifeng.com","job":"Chief Design Engineer","timestamp":"2021-12-14T08:29:47Z"}
{"id":887,"first_name":"Jemie","email":"jmatousekom@zimbio.com","job":"Junior Executive","timestamp":"2022-11-10T23:11:53Z"}
{"id":888,"first_name":"Sianna","email":"sriddioughon@usatoday.com","job":"Product Engineer","timestamp":"2021-12-25T07:59:10Z"}
{"id":889,"first_name":"Mort","email":"mhamshawoo@qq.com","job":"Accountant III","timestamp":"2022-10-08T06:32:44Z"}
{"id":890,"first_name":"Raff","email":"rdareyop@quantcast.com","job":"Sales Associate","timestamp":"2022-11-06T01:09:57Z"}
{"id":891,"first_name":"Josias","email":"jstimsonoq@drupal.org","job":"Civil Engineer","timestamp":"2022-01-28T21:36:02Z"}
{"id":892,"first_name":"Cello","email":"cbonyor@jugem.jp","job":"Information Systems Manager","timestamp":"2022-06-27T05:23:17Z"}
{"id":893,"first_name":"Johann","email":"jlampos@facebook.com","job":"Recruiter","timestamp":"2022-04-20T08:29:47Z"}
{"id":894,"first_name":"Grazia","email":"ggoverot@people.com.cn","job":"Environmental Tech","timestamp":"2022-08-22T23:23:20Z"}
{"id":895,"first_name":"Davon","email":"dteligaou@weibo.com","job":"Senior Sales Associate","timestamp":"2022-07-01T00:54:36Z"}
{"id":896,"first_name":"Ichabod","email":"ikobierraov@dion.ne.jp","job":"GIS Technical Architect","timestamp":"2022-04-03T21:08:09Z"}
{"id":897,"first_name":"Sandor","email":"scotaow@reference.com","job":"Assistant Media Planner","timestamp":"2022-03-27T14:52:14Z"}
{"id":898,"first_name":"Doy","email":"dstiffkinsox@toplist.cz","job":"Financial Advisor","timestamp":"2022-07-02T16:07:19Z"}
{"id":899,"first_name":"Carla","email":"cstorckeoy@mlb.com","job":"Recruiter","timestamp":"2022-08-13T18:25:56Z"}
{"id":900,"first_name":"Nicolais","email":"nharceoz@soup.io","job":"Financial Advisor","timestamp":"2022-05-10T18:45:14Z"}
{"id":901,"first_name":"Ab","email":"abrinep0@google.co.uk","job":"Assistant Manager","timestamp":"2022-05-01T05:27:10Z"}
{"id":902,"first_name":"Blake","email":"bmackinderp1@ed.gov","job":"VP Quality Control","timestamp":"2022-08-23T16:12:10Z"}
{"id":903,"first_name":"Thurston","email":"tcarncrossp2@wikia.com","job":"Biostatistician III","timestamp":"2021-12-10T09:23:49Z"}
{"id":904,"first_name":"Montague","email":"mreinp3@java.com","job":"Staff Scientist","timestamp":"2022-04-27T05:05:08Z"}
{"id":905,"first_name":"Thomas","email":"tcahernyp4@oracle.com","job":"Geologist I","timestamp":"2021-12-14T13:45:34Z"}
{"id":906,"first_name":"Beitris","email":"beslandp5@xing.com","job":"GIS Technical Architect","timestamp":"2022-10-30T12:45:54Z"}
{"id":907,"first_name":"Tristam","email":"tbyardp6@army.mil","job":"Senior Developer","timestamp":"2022-07-11T22:57:40Z"}
{"id":908,"first_name":"Romona","email":"rrashleighp7@cnet.com","job":"Environmental Specialist","timestamp":"2022-07-22T21:54:19Z"}
{"id":909,"first_name":"Gardener","email":"gcalowp8@furl.net","job":"Recruiting Manager","timestamp":"2022-02-21T20:44:18Z"}
{"id":910,"first_name":"Westleigh","email":"wlegerwoodp9@moonfruit.com","job":"Web Developer III","timestamp":"2022-04-17T17:12:19Z"}
{"id":911,"first_name":"Korrie","email":"kwightpa@tamu.edu","job":"Office Assistant II","timestamp":"2022-08-02T16:12:44Z"}
{"id":912,"first_name":"Elliot","email":"epeschetpb@fastcompany.com","job":"Budget/Accounting Analyst IV","timestamp":"2022-09-01T10:23:33Z"}
{"id":913,"first_name":"Fax","email":"feichpc@delicious.com","job":"Food Chemist","timestamp":"2022-07-25T01:56:13Z"}
{"id":914,"first_name":"Erastus","email":"eblaypd@paypal.com","job":"Professor","timestamp":"2022-09-18T23:35:46Z"}
{"id":915,"first_name":"Oralla","email":"omccorleype@umich.edu","job":"VP Marketing","timestamp":"2022-09-09T03:24:55Z"}
{"id":916,"first_name":"Urbano","email":"ukingstnepf@narod.ru","job":"Engineer III","timestamp":"2022-07-13T10:14:55Z"}
{"id":917,"first_name":"Ethel","email":"elonerganpg@discovery.com","job":"Operator","timestamp":"2022-02-28T13:40:14Z"}
{"id":918,"first_name":"Grove","email":"gathridgeph@springer.com","job":"Dental Hygienist","timestamp":"2022-05-19T00:14:03Z"}
{"id":919,"first_name":"Junette","email":"jbaupi@amazon.co.jp","job":"Physical Therapy Assistant","timestamp":"2022-06-05T15:40:44Z"}
{"id":920,"first_name":"Elbert","email":"elernerpj@examiner.com","job":"Environmental Tech","timestamp":"2022-02-23T02:05:59Z"}
{"id":921,"first_name":"Juditha","email":"jternouthpk@people.com.cn","job":"Marketing Assistant","timestamp":"2022-11-17T11:21:10Z"}
{"id":922,"first_name":"Madeleine","email":"mskallypl@pen.io","job":"Community Outreach Specialist","timestamp":"2022-07-18T05:12:34Z"}
{"id":923,"first_name":"Merill","email":"mmerrienpm@1und1.de","job":"Help Desk Operator","timestamp":"2022-05-21T02:24:56Z"}
{"id":924,"first_name":"Lois","email":"lcadoganpn@dyndns.org","job":"Marketing Assistant","timestamp":"2022-10-24T01:25:17Z"}
{"id":925,"first_name":"Bendix","email":"bchenepo@dailymotion.com","job":"Administrative Officer","timestamp":"2022-03-24T15:17:47Z"}
{"id":926,"first_name":"Isis","email":"iseekspp@usgs.gov","job":"Actuary","timestamp":"2022-10-12T05:56:55Z"}
{"id":927,"first_name":"Eda","email":"edartpq@godaddy.com","job":"Mechanical Systems Engineer","timestamp":"2022-02-26T05:06:30Z"}
{"id":928,"first_name":"Rhys","email":"rszachpr@instagram.com","job":"Recruiter","timestamp":"2022-02-18T06:27:48Z"}
{"id":929,"first_name":"Gerianna","email":"ggladbeckps@nifty.com","job":"Compensation Analyst","timestamp":"2022-06-11T13:07:20Z"}
{"id":930,"first_name":"Merrill","email":"mclutterhampt@tripod.com","job":"Engineer III","timestamp":"2022-02-24T21:42:32Z"}
{"id":931,"first_name":"Sheree","email":"sdeamayapu@bravesites.com","job":"Financial Advisor","timestamp":"2022-10-17T23:12:59Z"}
{"id":932,"first_name":"Dane","email":"djarmanpv@constantcontact.com","job":"Financial Analyst","timestamp":"2022-07-22T11:17:02Z"}
{"id":933,"first_name":"Corney","email":"cmccroriepw@va.gov","job":"Structural Analysis Engineer","timestamp":"2022-05-24T01:47:23Z"}
{"id":934,"first_name":"Candace","email":"cflacknellpx@php.net","job":"VP Quality Control","timestamp":"2022-09-07T11:36:27Z"}
{"id":935,"first_name":"Corrinne","email":"ccardenaspy@wunderground.com","job":"Compensation Analyst","timestamp":"2022-01-31T11:37:46Z"}
{"id":936,"first_name":"Meade","email":"mpetrashkovpz@booking.com","job":"Account Representative III","timestamp":"2022-01-18T15:57:19Z"}
{"id":937,"first_name":"Sauveur","email":"sfinnanq0@indiatimes.com","job":"Account Coordinator","timestamp":"2022-09-23T10:05:56Z"}
{"id":938,"first_name":"Tammy","email":"tgrasq1@blogger.com","job":"Engineer I","timestamp":"2022-04-15T01:39:44Z"}
{"id":939,"first_name":"Teodoor","email":"tmacgraithq2@sfgate.com","job":"Engineer IV","timestamp":"2022-12-03T22:35:35Z"}
{"id":940,"first_name":"Fae","email":"fgalgeyq3@google.fr","job":"Dental Hygienist","timestamp":"2022-08-21T19:01:24Z"}
{"id":941,"first_name":"Joell","email":"jkochlq4@lulu.com","job":"Chief Design Engineer","timestamp":"2022-01-11T09:35:21Z"}
{"id":942,"first_name":"Aldwin","email":"arosenbloomq5@msn.com","job":"Community Outreach Specialist","timestamp":"2022-06-19T10:51:49Z"}
{"id":943,"first_name":"Tracee","email":"tlymbourneq6@bing.com","job":"Staff Accountant II","timestamp":"2022-03-09T09:48:29Z"}
{"id":944,"first_name":"Peyton","email":"phardsonq7@nifty.com","job":"Civil Engineer","timestamp":"2022-06-15T02:15:23Z"}
{"id":945,"first_name":"Larina","email":"lleckieq8@weather.com","job":"Web Designer III","timestamp":"2022-11-24T04:15:27Z"}
{"id":946,"first_name":"Emelia","email":"ejarnellq9@nyu.edu","job":"Geologist III","timestamp":"2022-05-09T02:19:47Z"}
{"id":947,"first_name":"Andrus","email":"amarquisqa@seesaa.net","job":"Staff Scientist","timestamp":"2022-08-27T04:02:30Z"}
{"id":948,"first_name":"Vernen","email":"vlockeqb@ucsd.edu","job":"Developer IV","timestamp":"2022-03-05T01:12:55Z"}
{"id":949,"first_name":"Wyndham","email":"wbroadwayqc@github.io","job":"Pharmacist","timestamp":"2022-05-11T07:26:10Z"}
{"id":950,"first_name":"Amye","email":"ahellinqd@stumbleupon.com","job":"Clinical Specialist","timestamp":"2022-05-27T04:52:14Z"}
{"id":951,"first_name":"Valera","email":"vreemeqe@wordpress.com","job":"Account Coordinator","timestamp":"2022-08-14T18:45:26Z"}
{"id":952,"first_name":"Kipp","email":"kgulstonqf@guardian.co.uk","job":"Help Desk Technician","timestamp":"2021-12-28T08:31:34Z"}
{"id":953,"first_name":"Sayer","email":"sstifeqg@squidoo.com","job":"Quality Engineer","timestamp":"2022-08-16T09:11:02Z"}
{"id":954,"first_name":"Yancey","email":"yculliganqh@mediafire.com","job":"Data Coordiator","timestamp":"2022-05-28T22:17:43Z"}
{"id":955,"first_name":"Yoshi","email":"yprofferqi@mapquest.com","job":"Speech Pathologist","timestamp":"2022-05-04T02:45:51Z"}
{"id":956,"first_name":"Madison","email":"mimortsqj@discovery.com","job":"Staff Scientist","timestamp":"2022-04-08T00:37:08Z"}
{"id":957,"first_name":"Eziechiele","email":"efollinqk@weebly.com","job":"Physical Therapy Assistant","timestamp":"2022-05-02T21:05:48Z"}
{"id":958,"first_name":"Barrie","email":"bwalaronql@newyorker.com","job":"Technical Writer","timestamp":"2022-09-09T10:56:49Z"}
{"id":959,"first_name":"Reggie","email":"rcahnqm@google.com.hk","job":"Graphic Designer","timestamp":"2022-02-04T05:10:00Z"}
{"id":960,"first_name":"Conny","email":"celleswortheqn@jalbum.net","job":"Design Engineer","timestamp":"2022-11-08T10:58:05Z"}
{"id":961,"first_name":"Roselia","email":"rhurranqo@eventbrite.com","job":"Environmental Specialist","timestamp":"2022-03-31T15:47:33Z"}
{"id":962,"first_name":"Vera","email":"vgowlandqp@homestead.com","job":"Geologist IV","timestamp":"2022-09-24T08:20:45Z"}
{"id":963,"first_name":"Sheeree","email":"smundowqq@artisteer.com","job":"Health Coach I","timestamp":"2022-09-07T03:54:28Z"}
{"id":964,"first_name":"Becky","email":"bspurriarqr@diigo.com","job":"Social Worker","timestamp":"2022-11-09T01:46:54Z"}
{"id":965,"first_name":"Tan","email":"tbatyqs@wikimedia.org","job":"Occupational Therapist","timestamp":"2022-10-25T09:43:54Z"}
{"id":966,"first_name":"Kalila","email":"kdowersqt@cyberchimps.com","job":"GIS Technical Architect","timestamp":"2022-02-04T19:00:56Z"}
{"id":967,"first_name":"Morrie","email":"mjesticoqu@army.mil","job":"Associate Professor","timestamp":"2022-12-04T22:25:48Z"}
{"id":968,"first_name":"Abelard","email":"asmewinqv@arizona.edu","job":"Financial Advisor","timestamp":"2022-06-24T19:19:09Z"}
{"id":969,"first_name":"Shelby","email":"sropckeqw@census.gov","job":"Account Coordinator","timestamp":"2022-05-30T09:49:34Z"}
{"id":970,"first_name":"Jaynell","email":"jmarvelleyqx@princeton.edu","job":"Food Chemist","timestamp":"2022-08-18T20:04:49Z"}
{"id":971,"first_name":"Jori","email":"jdibsdaleqy@last.fm","job":"Database Administrator III","timestamp":"2022-05-12T19:28:48Z"}
{"id":972,"first_name":"Cari","email":"credittqz@addthis.com","job":"Safety Technician I","timestamp":"2022-10-08T19:43:07Z"}
{"id":973,"first_name":"Edee","email":"ezylberdikr0@ning.com","job":"Staff Accountant IV","timestamp":"2022-05-23T09:04:15Z"}
{"id":974,"first_name":"Kaiser","email":"kbaggallayr1@slashdot.org","job":"Dental Hygienist","timestamp":"2022-01-07T20:11:41Z"}
{"id":975,"first_name":"Christalle","email":"cbuzekr2@istockphoto.com","job":"Senior Financial Analyst","timestamp":"2022-04-10T22:36:11Z"}
{"id":976,"first_name":"Otha","email":"oaluardr3@deliciousdays.com","job":"Project Manager","timestamp":"2022-07-11T21:01:49Z"}
{"id":977,"first_name":"Imogene","email":"iharwoodr4@geocities.jp","job":"Executive Secretary","timestamp":"2021-12-29T14:21:12Z"}
{"id":978,"first_name":"Valentijn","email":"vsouterr5@mtv.com","job":"Senior Editor","timestamp":"2022-01-13T07:30:20Z"}
{"id":979,"first_name":"Danielle","email":"dharrowayr6@hugedomains.com","job":"Biostatistician II","timestamp":"2022-08-03T09:35:36Z"}
{"id":980,"first_name":"Griff","email":"gdoyleyr7@qq.com","job":"Marketing Assistant","timestamp":"2022-07-02T10:23:43Z"}
{"id":981,"first_name":"Claudelle","email":"cthompsonr8@wikispaces.com","job":"Financial Advisor","timestamp":"2022-08-22T17:13:02Z"}
{"id":982,"first_name":"Marla","email":"mcaulketr9@usnews.com","job":"Quality Control Specialist","timestamp":"2022-05-15T23:29:39Z"}
{"id":983,"first_name":"Lorne","email":"llabellra@g.co","job":"Pharmacist","timestamp":"2022-03-01T00:37:57Z"}
{"id":984,"first_name":"Mar","email":"mrispinrb@networkadvertising.org","job":"Design Engineer","timestamp":"2022-07-09T01:55:58Z"}
{"id":985,"first_name":"Townie","email":"tbusrc@guardian.co.uk","job":"Director of Sales","timestamp":"2022-10-06T16:48:30Z"}
{"id":986,"first_name":"Darcey","email":"dwillerstonerd@diigo.com","job":"Assistant Media Planner","timestamp":"2022-08-04T00:05:16Z"}
{"id":987,"first_name":"Joann","email":"jschwandnerre@theglobeandmail.com","job":"Account Representative I","timestamp":"2022-11-08T05:48:40Z"}
{"id":988,"first_name":"Katerine","email":"kuttleyrf@japanpost.jp","job":"Nuclear Power Engineer","timestamp":"2022-05-13T12:35:36Z"}
{"id":989,"first_name":"Audie","email":"akeemsrg@chron.com","job":"Analog Circuit Design manager","timestamp":"2022-10-22T02:14:29Z"}
{"id":990,"first_name":"Findlay","email":"fjaggersrh@time.com","job":"Human Resources Manager","timestamp":"2022-05-12T08:41:24Z"}
{"id":991,"first_name":"Jonis","email":"jjedrasikri@google.co.uk","job":"Clinical Specialist","timestamp":"2022-06-05T11:49:21Z"}
{"id":992,"first_name":"Erhart","email":"eszymonowiczrj@washingtonpost.com","job":"Software Engineer IV","timestamp":"2022-03-16T03:49:43Z"}
{"id":993,"first_name":"Ulysses","email":"umadenrk@walmart.com","job":"Research Assistant III","timestamp":"2022-11-17T14:27:14Z"}
{"id":994,"first_name":"Vannie","email":"vallsoprl@github.com","job":"Executive Secretary","timestamp":"2022-08-19T15:25:28Z"}
{"id":995,"first_name":"Rory","email":"rballstonrm@oaic.gov.au","job":"Project Manager","timestamp":"2022-05-23T10:42:53Z"}
{"id":996,"first_name":"Korrie","email":"kbeneditrn@constantcontact.com","job":"Safety Technician II","timestamp":"2021-12-30T08:56:55Z"}
{"id":997,"first_name":"Vlad","email":"vendlero@storify.com","job":"Dental Hygienist","timestamp":"2022-01-15T17:01:19Z"}
{"id":998,"first_name":"Jenelle","email":"jsteinerrp@technorati.com","job":"Safety Technician III","timestamp":"2022-02-23T20:35:11Z"}
{"id":999,"first_name":"Elwood","email":"eengehamrq@fda.gov","job":"Occupational Therapist","timestamp":"2022-04-27T20:29:45Z"}
{"id":1000,"first_name":"Donnie","email":"dshiptonrr@slideshare.net","job":"Developer II","timestamp":"2022-03-10T21:39:22Z"}


================================================
FILE: quickwit/quickwit-indexing/benches/doc_process_vrl_bench.rs
================================================
use std::sync::Arc;

use bytes::Bytes;
use criterion::{BenchmarkId, Criterion, criterion_group, criterion_main};
use quickwit_actors::{ActorHandle, Mailbox, Universe};
use quickwit_config::{SourceInputFormat, TransformConfig};
use quickwit_doc_mapper::DocMapper;
use quickwit_indexing::actors::DocProcessor;
use quickwit_indexing::models::RawDocBatch;
use quickwit_metastore::checkpoint::SourceCheckpointDelta;

const JSON_NORMAL: &str = include_str!("data/bench_data.json");
const JSON_LIGHT_TRANSFORM: &str = include_str!("data/bench_data_light_transform.json");
const JSON_HEAVY_TRANSFORM: &str = include_str!("data/bench_data_heavy_transform.json");

macro_rules! bench_func {
    ($input:expr, $group:expr, $name:expr, $param:expr, $func:expr) => {{
        let lines: Vec<&str> = $input.lines().map(|line| line.trim()).collect();
        $group.throughput(criterion::Throughput::Bytes($input.len() as u64));

        let runtime = tokio::runtime::Runtime::new().unwrap();
        let checkpoint_delta = SourceCheckpointDelta::from_range(0..$input.len() as u64);

        $group.bench_function(BenchmarkId::new($name, $param), |b| {
            b.to_async(&runtime).iter_batched(
                || {
                    lines
                        .iter()
                        .map(|line| Bytes::from(*line))
                        .collect::<Vec<_>>()
                },
                |docs| async {
                    let (mailbox, handle, universe) = $func;
                    mailbox
                        .send_message(RawDocBatch::new(docs, checkpoint_delta.clone(), false))
                        .await
                        .unwrap();

                    universe.send_exit_with_success(&mailbox).await.unwrap();
                    handle.join().await;
                },
                criterion::BatchSize::SmallInput,
            )
        });
    }};
}

pub fn default_doc_mapper_for_bench() -> DocMapper {
    const JSON_CONFIG_VALUE: &str = r#"
        {
            "store_source": true,
            "default_search_fields": [],
            "timestamp_field": "timestamp",
            "tag_fields": ["id"],
            "field_mappings": [
                {
                    "name": "timestamp",
                    "type": "datetime",
                    "output_format": "unix_timestamp_secs",
                    "fast": true,
                    "input_formats": ["iso8601"]
                },
                {
                    "name": "first_name",
                    "type": "text",
                    "stored": true
                },
                {
                    "name": "last_name",
                    "type": "text",
                    "stored": true
                },
                {
                    "name": "id",
                    "type": "u64",
                    "stored": true
                },
                {
                    "name": "email",
                    "type": "text",
                    "stored": true
                },
                {
                    "name": "job",
                    "type": "text",
                    "stored": true
                }
            ]
        }"#;
    serde_json::from_str::<DocMapper>(JSON_CONFIG_VALUE).unwrap()
}

fn doc_processor_no_transform() -> (Mailbox<DocProcessor>, ActorHandle<DocProcessor>, Universe) {
    create_doc_processor(None)
}

fn doc_processor_light_transform() -> (Mailbox<DocProcessor>, ActorHandle<DocProcessor>, Universe) {
    let vrl_script = r#"
        .last_name = "Doe"
        .job = upcase(string!(.job))
    "#;
    let transform_config = TransformConfig::for_test(vrl_script);
    create_doc_processor(Some(transform_config))
}

fn doc_processor_heavy_transform() -> (Mailbox<DocProcessor>, ActorHandle<DocProcessor>, Universe) {
    let vrl_script = r#"
        . = parse_json!(.body)
        .last_name = "Doe"
        .job = upcase(string!(.job))
        .timestamp = to_string(to_timestamp(now()))
    "#;
    let transform_config = TransformConfig::for_test(vrl_script);
    create_doc_processor(Some(transform_config))
}

fn create_doc_processor(
    transform_config_opt: Option<TransformConfig>,
) -> (Mailbox<DocProcessor>, ActorHandle<DocProcessor>, Universe) {
    let index_id = "my-index".to_string();
    let source_id = "my-source".to_string();
    let doc_mapper = Arc::new(default_doc_mapper_for_bench());
    let universe = Universe::new();
    let (indexer_mailbox, _) = universe.create_test_mailbox();
    let doc_processor = DocProcessor::try_new(
        index_id,
        source_id,
        doc_mapper,
        indexer_mailbox,
        transform_config_opt,
        SourceInputFormat::Json,
    )
    .unwrap();
    let (mailbox, handle) = universe.spawn_builder().spawn(doc_processor);
    (mailbox, handle, universe)
}

fn bench_simple_json(c: &mut Criterion) {
    let mut group = c.benchmark_group("Simple Json");
    bench_func!(
        JSON_NORMAL,
        group,
        "No VRL",
        "Simple JSON",
        doc_processor_no_transform()
    );
    bench_func!(
        JSON_NORMAL,
        group,
        "Light VRL",
        "Simple JSON",
        doc_processor_light_transform()
    );
}

fn bench_light_json(c: &mut Criterion) {
    let mut group = c.benchmark_group("Simple/Light Json");
    bench_func!(
        JSON_NORMAL,
        group,
        "No VRL",
        "Simple JSON",
        doc_processor_no_transform()
    );
    bench_func!(
        JSON_LIGHT_TRANSFORM,
        group,
        "Light VRL",
        "Light JSON",
        doc_processor_light_transform()
    );
}

fn bench_heavy_json(c: &mut Criterion) {
    let mut group = c.benchmark_group("Simple/Light Json");
    bench_func!(
        JSON_NORMAL,
        group,
        "No VRL",
        "Simple JSON",
        doc_processor_no_transform()
    );
    bench_func!(
        JSON_HEAVY_TRANSFORM,
        group,
        "Heavy VRL",
        "Heavy JSON",
        doc_processor_heavy_transform()
    );
}

criterion_group!(
    benches,
    bench_simple_json,
    bench_light_json,
    bench_heavy_json
);
criterion_main!(benches);


================================================
FILE: quickwit/quickwit-indexing/data/test_corpus.json
================================================
{"timestamp":1375457457,"body":"hello","response_date":141436123,"response_time":141436123,"response_payload":"data","owner":"","properties":{},"children":[],"attributes":{"tags":[12,34],"server":"foo","server.status":["down","up"],"server.payload":"data"}}
{"timestamp":1375457457,"body":"happy","response_date":141436123,"response_time":141436123,"response_payload":"data","owner":"","properties":{},"children":{},"attributes":{"tags":[12,34],"server":"foo","server.status":["down","up"],"server.payload":"data"}}
{"timestamp":1375457457,"body":"tax","response_date":141436123,"response_time":141436123,"response_payload":"data","owner":"","properties":{},"children":{},"attributes":{"tags":[12,34],"server":"foo","server.status":["down","up"],"server.payload":"data"}}
{"timestamp":1375457457,"body":"payer","response_date":141436123,"response_time":141436123,"response_payload":"data","owner":"","properties":{},"children":[],"attributes":{"tags":[12,34],"server":"foo","server.status":["down","up"],"server.payload":"data"}}


================================================
FILE: quickwit/quickwit-indexing/failpoints/mod.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

//! Fail points are a form of code instrumentation that allow errors and other behaviors
//! to be injected dynamically at runtime, primarily for testing purposes. Fail
//! points are flexible and can be configured to exhibit a variety of behaviors,
//! including panics, early returns, and sleeps. They can be controlled both
//! programmatically and via the environment, and can be triggered conditionally
//! and probabilistically.
//!
//! They rely on a global variable, which requires them to be executed in a single
//! thread.
//! For this reason, we isolate them from the other unit tests and define an
//! independent binary target.
//!
//! They are not executed by default.
//! They are executed in CI and can be executed locally
//! `cargo test --features fail/failpoints test_failpoint -- --test-threads`
//!
//! Below we test panics at different steps in the indexing pipeline.

use std::path::Path;
use std::sync::{Arc, Barrier, Mutex};
use std::time::Duration;

use fail::FailScenario;
use quickwit_common::io::IoControls;
use quickwit_common::rand::append_random_suffix;
use quickwit_common::split_file;
use quickwit_common::temp_dir::TempDirectory;
use quickwit_indexing::actors::MergeExecutor;
use quickwit_indexing::merge_policy::{MergeOperation, MergeTask};
use quickwit_indexing::models::MergeScratch;
use quickwit_indexing::{TestSandbox, get_tantivy_directory_from_split_bundle};
use quickwit_metastore::{
    ListSplitsQuery, ListSplitsRequestExt, MetastoreServiceStreamSplitsExt, SplitMetadata,
    SplitState,
};
use quickwit_proto::indexing::MergePipelineId;
use quickwit_proto::metastore::{ListSplitsRequest, MetastoreService};
use quickwit_proto::types::{IndexUid, NodeId};
use serde_json::Value as JsonValue;
use tantivy::Directory;

#[tokio::test]
async fn test_failpoint_no_failure() -> anyhow::Result<()> {
    let scenario = FailScenario::setup();
    aux_test_failpoints().await?;
    scenario.teardown();
    Ok(())
}

fn deterministic_panic_sequence(mut panics: Vec<bool>) -> impl Fn() + Send + Sync {
    panics.reverse();
    let panics = Mutex::new(panics);
    move || {
        let should_panic = panics.lock().unwrap().pop().unwrap_or(false);
        if should_panic {
            panic!("panicked");
        }
    }
}

#[tokio::test]
async fn test_failpoint_packager_panics_right_away() -> anyhow::Result<()> {
    let scenario = FailScenario::setup();
    fail::cfg_callback("packager:before", deterministic_panic_sequence(vec![true])).unwrap();
    aux_test_failpoints().await?;
    scenario.teardown();
    Ok(())
}

#[tokio::test]
async fn test_failpoint_packager_panics_after_one_success() -> anyhow::Result<()> {
    let scenario = FailScenario::setup();
    fail::cfg_callback(
        "packager:before",
        deterministic_panic_sequence(vec![false, true]),
    )
    .unwrap();
    aux_test_failpoints().await?;
    scenario.teardown();
    Ok(())
}

#[tokio::test]
async fn test_failpoint_publisher_panics_after_one_success() -> anyhow::Result<()> {
    let scenario = FailScenario::setup();
    fail::cfg_callback(
        "publisher:before",
        deterministic_panic_sequence(vec![false, true]),
    )
    .unwrap();
    aux_test_failpoints().await?;
    scenario.teardown();
    Ok(())
}

#[tokio::test]
async fn test_failpoint_publisher_panics_right_away() -> anyhow::Result<()> {
    let scenario = FailScenario::setup();
    fail::cfg_callback("publisher:before", deterministic_panic_sequence(vec![true])).unwrap();
    aux_test_failpoints().await?;
    scenario.teardown();
    Ok(())
}

#[tokio::test]
async fn test_failpoint_publisher_after_panics_right_away() -> anyhow::Result<()> {
    let scenario = FailScenario::setup();
    fail::cfg_callback("publisher:after", deterministic_panic_sequence(vec![true])).unwrap();
    aux_test_failpoints().await?;
    scenario.teardown();
    Ok(())
}

#[tokio::test]
async fn test_failpoint_uploader_panics_right_away() -> anyhow::Result<()> {
    let scenario = FailScenario::setup();
    fail::cfg_callback(
        "uploader:before",
        deterministic_panic_sequence(vec![false, true]),
    )
    .unwrap();
    aux_test_failpoints().await?;
    scenario.teardown();
    Ok(())
}

#[tokio::test]
async fn test_failpoint_uploader_panics_after_one_success() -> anyhow::Result<()> {
    let scenario = FailScenario::setup();
    fail::cfg_callback("uploader:before", deterministic_panic_sequence(vec![true])).unwrap();
    aux_test_failpoints().await?;
    scenario.teardown();
    Ok(())
}

#[tokio::test]
async fn test_failpoint_uploader_after_panics_right_away() -> anyhow::Result<()> {
    let scenario = FailScenario::setup();
    fail::cfg_callback("uploader:after", deterministic_panic_sequence(vec![true])).unwrap();
    aux_test_failpoints().await?;
    scenario.teardown();
    Ok(())
}

async fn aux_test_failpoints() -> anyhow::Result<()> {
    let doc_mapper_yaml = r#"
        field_mappings:
          - name: body
            type: text
          - name: ts
            type: datetime
            fast: true
        timestamp_field: ts
        "#;
    let search_fields = ["body"];
    let index_id = append_random_suffix("test-index");
    let test_index_builder =
        TestSandbox::create(&index_id, doc_mapper_yaml, "", &search_fields).await?;
    let batch_1: Vec<JsonValue> = vec![
        serde_json::json!({"body ": "1", "ts": 1629889530 }),
        serde_json::json!({"body ": "2", "ts": 1629889531 }),
    ];
    let batch_2: Vec<JsonValue> = vec![
        serde_json::json!({"body ": "3", "ts": 1629889532 }),
        serde_json::json!({"body ": "4", "ts": 1629889533 }),
    ];
    test_index_builder.add_documents(batch_1).await?;
    test_index_builder.add_documents(batch_2).await?;
    let query = ListSplitsQuery::for_index(test_index_builder.index_uid())
        .with_split_state(SplitState::Published);
    let list_splits_request = ListSplitsRequest::try_from_list_splits_query(&query).unwrap();
    let mut splits = test_index_builder
        .metastore()
        .list_splits(list_splits_request)
        .await
        .unwrap()
        .collect_splits()
        .await
        .unwrap();
    splits.sort_by_key(|split| *split.split_metadata.time_range.clone().unwrap().start());
    assert_eq!(splits.len(), 2);
    assert_eq!(
        splits[0].split_metadata.time_range.clone().unwrap(),
        1629889530..=1629889531
    );
    assert_eq!(
        splits[1].split_metadata.time_range.clone().unwrap(),
        1629889532..=1629889533
    );
    test_index_builder.universe().quit().await;
    Ok(())
}

const TEST_TEXT: &str = r#"His sole child, my lord, and bequeathed to my
overlooking. I have those hopes of her good that
her education promises; her dispositions she
inherits, which makes fair gifts fairer; for where
an unclean mind carries virtuous qualities, there
commendations go with pity; they are virtues and
traitors too; in her they are the better for their
simpleness; she derives her honesty and achieves her goodness."#;

#[tokio::test]
async fn test_merge_executor_controlled_directory_kill_switch() -> anyhow::Result<()> {
    // This tests checks that if a merger is killed in a middle of
    // a merge, then the controlled directory makes it possible to
    // abort the merging operation and return quickly.
    // NOTE(fmassot): This test is working but not as exactly we would want.
    // Ideally we want the actor to stop while merging which is a long task and we
    // don't want to wait until it's finished. But... the merging phase is
    // currently in a protected zone and thus there will be not kill switch activated
    // during this period. We added the protected zone because without we observe from
    // time to time a kill switch activation because the ControlledDirectory did not
    // do any write during a HEARTBEAT... Before removing the protect zone, we need
    // to investigate this instability. Then this test will finally be really helpful.
    quickwit_common::setup_logging_for_tests();
    let doc_mapper_yaml = r#"
        field_mappings:
          - name: body
            type: text
          - name: ts
            type: datetime
            fast: true
        timestamp_field: ts
        "#;
    let indexing_setting_yaml = r#"
        split_num_docs_target: 1000
        merge_policy:
          type: "no_merge"
    "#;
    let search_fields = ["body"];
    let index_id = "test-index-merge-executory-kill-switch";
    let test_index_builder = TestSandbox::create(
        index_id,
        doc_mapper_yaml,
        indexing_setting_yaml,
        &search_fields,
    )
    .await?;

    let doc_mapper = test_index_builder.doc_mapper();
    let batch: Vec<JsonValue> =
        std::iter::repeat_with(|| serde_json::json!({"body ": TEST_TEXT, "ts": 1631072713 }))
            .take(500)
            .collect();
    for _ in 0..2 {
        test_index_builder.add_documents(batch.clone()).await?;
    }
    tokio::time::sleep(Duration::from_millis(10)).await;

    let metastore = test_index_builder.metastore();
    let split_metadatas: Vec<SplitMetadata> = metastore
        .list_splits(ListSplitsRequest::try_from_index_uid(test_index_builder.index_uid()).unwrap())
        .await?
        .collect_splits_metadata()
        .await
        .unwrap();
    let merge_scratch_directory = TempDirectory::for_test();

    let downloaded_splits_directory =
        merge_scratch_directory.named_temp_child("downloaded-splits-")?;
    let storage = test_index_builder.storage();
    let mut tantivy_dirs: Vec<Box<dyn Directory>> = Vec::new();
    for split in &split_metadatas {
        let split_filename = split_file(split.split_id());
        let dest_filepath = downloaded_splits_directory.path().join(&split_filename);
        storage
            .copy_to_file(Path::new(&split_filename), &dest_filepath)
            .await?;

        tantivy_dirs.push(get_tantivy_directory_from_split_bundle(&dest_filepath).unwrap());
    }
    let merge_operation = MergeOperation::new_merge_operation(split_metadatas);
    let merge_task = MergeTask::from_merge_operation_for_test(merge_operation);
    let merge_scratch = MergeScratch {
        merge_task,
        merge_scratch_directory,
        downloaded_splits_directory,
        tantivy_dirs,
    };
    let pipeline_id = MergePipelineId {
        node_id: NodeId::from("test-node"),
        index_uid: IndexUid::new_with_random_ulid(index_id),
        source_id: "test-source".to_string(),
    };

    let universe = test_index_builder.universe();
    let (merge_packager_mailbox, _merge_packager_inbox) = universe.create_test_mailbox();
    let io_controls = IoControls::default();
    let merge_executor = MergeExecutor::new(
        pipeline_id,
        metastore,
        doc_mapper,
        io_controls,
        merge_packager_mailbox,
    );

    let (merge_executor_mailbox, _merge_executor_handle) =
        universe.spawn_builder().spawn(merge_executor);

    // We want to make sure that the processing of the message gets
    // aborted not by the actor framework, before the message is being processed.
    //
    // To do so, we
    // - set two barrier so the actor pauses right upon entering the process_merge function
    // - send the merge message
    // - wait on the first barrier to ensure that the actor has reached the process_merge function
    // - kill the universe
    // - wait and release the second barrier so the actor can continue processing the merge message
    //
    // Before the controlled directory, the merge operation would have continued until it
    // finished, taking hundreds of millisecs to terminate.
    let before_universe_kill = Arc::new(Barrier::new(2));
    let after_universe_kill = Arc::new(Barrier::new(2));
    let before_universe_kill_clone = before_universe_kill.clone();
    let after_universe_kill_clone = after_universe_kill.clone();
    fail::cfg_callback("before-merge-split", move || {
        before_universe_kill_clone.wait();
        after_universe_kill_clone.wait();
    })
    .unwrap();
    fail::cfg(
        "after-merge-split",
        "panic(merge should be failed by directory kill switch)",
    )
    .unwrap();
    merge_executor_mailbox.send_message(merge_scratch).await?;
    before_universe_kill.wait();
    universe.kill();
    after_universe_kill.wait();
    universe.quit().await;

    Ok(())
}


================================================
FILE: quickwit/quickwit-indexing/src/actors/cooperative_indexing.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::hash::{DefaultHasher, Hash, Hasher};
use std::sync::Arc;
use std::time::Duration;

use once_cell::sync::Lazy;
use quickwit_proto::indexing::{CpuCapacity, PIPELINE_FULL_CAPACITY, PipelineMetrics};
use tokio::sync::{OwnedSemaphorePermit, Semaphore};
use tokio::time::Instant;

/// We allow ourselves to adjust the sleep time by at most `NUDGE_TOLERANCE`
/// in order to steer a pipeline to its phase.
const NUDGE_TOLERANCE: Duration = Duration::from_secs(5);

// Origin of time. It is used to compute the phase of the pipeline.
static ORIGIN_OF_TIME: Lazy<Instant> = Lazy::new(Instant::now);

/// Cooperative indexing is a mechanism to deal with a large amount of pipelines.
///
/// Instead of having all pipelines index concurrently, cooperative indexing:
/// - have them take turn, making sure that at most only N pipelines are indexing at the same time.
///   This has the benefit is reducing RAM using (by having a limited number of `IndexWriter` at the
///   same time), reducing context switching.
/// - keeps the different pipelines work uniformously spread in time. If the system is not at
///   capacity, we prefer to have the indexing pipeline as desynchronized as possible to make sure
///   they don't all use the same resources (disk/cpu/network) at the same time.
///
/// It works by:
/// - a semaphore is used to restrict the number of pipelines indexing at the same time.
/// - in the indexer when `on_drain` is called, the indexer will cut a split and "go to sleep" for a
///   given amount of time.
///
/// The key logic is in the computation of that sleep time.
///
/// We want to set it in order to steer the pipeline toward an ideal cycle with a period
/// of `commit_timeout`,
///
/// A period in this ideal cycle should, for some k,
/// - start at `t0 + k * commit_timeout + target_phase`
/// - end at `t0 + (k+1)*commit_timeout + target_phase`.
///
/// `target_phase` is computed using a hash over the pipeline id, and meant to follow
/// a uniform distribution over the interval [0, commit_timeout).
///
/// Each period of this cycle is divided into three phases.
/// - waking [t_wake..t_work_start) acquisition of the period guard (this is instantaneous)
///   acquisition of the semaphore
/// - working [t_work_start..t_work_end)
/// - sleeping [t=t_work_end..t_sleep_end)
///
/// The idea is to first pick the sleep time to to create a cycle of period
/// `commit_timeout`.
///   sleep_time := max(0, commit_timeout - (t_workend - t_wake))
///
/// If the work phase is too long, the regular commit timeout mechanism
/// kicks in an the pipeline will create a split without waiting for the
/// mailbox to be drained.
///
/// We then allow ourselves to tweak the sleep time one way or another by at
/// most two seconds to eventually nudge the system toward the desired phase.
pub(crate) struct CooperativeIndexingCycle {
    target_phase: Duration,
    commit_timeout: Duration,
    indexing_permits: Arc<Semaphore>,
}

impl CooperativeIndexingCycle {
    /// Creates a new cooperative indexing cycle object.
    /// `phase_id` is hashed to compute the target phase.
    pub fn new(
        phase_id: &(impl Hash + ?Sized),
        commit_timeout: Duration,
        indexing_permits: Arc<Semaphore>,
    ) -> CooperativeIndexingCycle {
        assert!(commit_timeout.as_millis() > 0);
        let mut hasher = DefaultHasher::new();
        phase_id.hash(&mut hasher);
        let target_phase_millis: u64 = hasher.finish() % commit_timeout.as_millis() as u64;
        Self::new_with_phase(
            Duration::from_millis(target_phase_millis),
            commit_timeout,
            indexing_permits,
        )
    }

    fn new_with_phase(
        target_phase: Duration,
        commit_timeout: Duration,
        indexing_permits: Arc<Semaphore>,
    ) -> CooperativeIndexingCycle {
        // Force the initial of the origin of time.
        let _t0 = *ORIGIN_OF_TIME;
        CooperativeIndexingCycle {
            target_phase,
            commit_timeout,
            indexing_permits,
        }
    }

    pub fn initial_sleep_duration(&self) -> Duration {
        let t0 = *ORIGIN_OF_TIME;
        let commit_timeout_millis = self.commit_timeout.as_millis() as u64;
        let current_phase_millis: u64 = t0.elapsed().as_millis() as u64 % commit_timeout_millis;
        let target_phase_millis: u64 = self.target_phase.as_millis() as u64 % commit_timeout_millis;
        let initial_sleep_millis: u64 = (commit_timeout_millis + target_phase_millis
            - current_phase_millis)
            % commit_timeout_millis;
        if initial_sleep_millis + 2 * NUDGE_TOLERANCE.as_millis() as u64 > commit_timeout_millis {
            // We are reasonably close to the target phase. No need to sleep. The nudge
            // will be enough.
            return Duration::default();
        }
        Duration::from_millis(initial_sleep_millis)
    }

    pub async fn cooperative_indexing_period(&self) -> CooperativeIndexingPeriod {
        let t_wake = Instant::now();
        let permit = Semaphore::acquire_owned(self.indexing_permits.clone())
            .await
            .unwrap();
        let t_work_start = Instant::now();
        CooperativeIndexingPeriod {
            t_wake,
            t_work_start,
            commit_timeout: self.commit_timeout,
            target_phase: self.target_phase,
            _permit: permit,
        }
    }
}

pub(crate) struct CooperativeIndexingPeriod {
    // measured right before the acquisition of the indexing semaphore
    t_wake: Instant,
    // measured after the acquisition of the semaphore.
    t_work_start: Instant,
    commit_timeout: Duration,
    target_phase: Duration,
    _permit: OwnedSemaphorePermit,
}

impl CooperativeIndexingPeriod {
    fn compute_pipeline_metrics(
        &self,
        end: Instant,
        uncompressed_num_bytes: u64,
    ) -> PipelineMetrics {
        let elapsed = end - self.t_work_start;
        let throughput_mb_per_sec: u64 =
            uncompressed_num_bytes / (1u64 + elapsed.as_micros() as u64);
        let commit_timeout = self.commit_timeout;
        let pipeline_throughput_fraction =
            (elapsed.as_micros() as f32 / commit_timeout.as_micros() as f32).min(1.0f32);
        let cpu_load: CpuCapacity = PIPELINE_FULL_CAPACITY * pipeline_throughput_fraction;
        PipelineMetrics {
            cpu_load,
            throughput_mb_per_sec: throughput_mb_per_sec as u16,
        }
    }

    fn compute_sleep_duration(&self, t_work_end: Instant) -> Duration {
        let commit_timeout_millis = self.commit_timeout.as_millis() as u64;
        let phase_millis: u64 =
            ((t_work_end - *ORIGIN_OF_TIME).as_millis() as u64) % commit_timeout_millis;
        let delta_phase: i64 = phase_millis as i64 - self.target_phase.as_millis() as i64;
        // delta phase is within (-commit_timeout_millis, commit_timeout_millis)
        // We fold it back to [-commit_timeout_millis/2, commit_timeout_millis/2)
        let half_commit_timeout_millis = commit_timeout_millis as i64 / 2;
        let delta_phase = if delta_phase >= half_commit_timeout_millis {
            delta_phase - commit_timeout_millis as i64
        } else if delta_phase < -half_commit_timeout_millis {
            delta_phase + commit_timeout_millis as i64
        } else {
            delta_phase
        };
        let nudge_tolerance_millis = NUDGE_TOLERANCE.as_millis() as i64;
        let nudge_millis: i64 = delta_phase.clamp(-nudge_tolerance_millis, nudge_tolerance_millis);
        let sleep_duration_millis = self.commit_timeout.as_millis() as i64
            - (t_work_end - self.t_wake).as_millis() as i64
            - nudge_millis;
        if sleep_duration_millis > 0 {
            Duration::from_millis(sleep_duration_millis as u64)
        } else {
            Duration::ZERO
        }
    }

    /// This drops the indexing permit, allowing another indexer to start indexing.
    /// This function also returns the amount of time to sleep until the next period.
    pub fn end_of_work(self, uncompressed_num_bytes: u64) -> (Duration, PipelineMetrics) {
        let end = Instant::now();
        let sleep_duration = self.compute_sleep_duration(end);
        let metrics = self.compute_pipeline_metrics(end, uncompressed_num_bytes);
        (sleep_duration, metrics)
    }
}

#[cfg(test)]
mod tests {
    use super::*;

    #[track_caller]
    fn assert_approx_equal_sleep_time(left: Duration, right: Duration) {
        let delta = (left.as_millis() as i128 - right.as_millis() as i128).unsigned_abs();
        if delta >= NUDGE_TOLERANCE.mul_f32(1.1).as_millis() {
            panic!("{left:?} and {right:?} are not approximately equal.");
        }
    }

    #[track_caller]
    fn assert_approx_equal(left: u32, right: u32) {
        assert!(
            left.abs_diff(right) * 10 <= (left + right),
            "inequal values {left} != {right}"
        );
    }

    #[track_caller]
    fn assert_approx_metrics(left_metrics: &PipelineMetrics, right_metrics: &PipelineMetrics) {
        assert_approx_equal(
            left_metrics.throughput_mb_per_sec as u32,
            right_metrics.throughput_mb_per_sec as u32,
        );
        assert_approx_equal(
            left_metrics.cpu_load.cpu_millis(),
            right_metrics.cpu_load.cpu_millis(),
        );
    }

    #[tokio::test]
    async fn test_initial_sleep_time() {
        tokio::time::pause();
        let t0 = *ORIGIN_OF_TIME;
        for target_phase_secs in [0, 1, 2, 5, 10, 15, 20, 25, 29, 30, 1_000] {
            for start_time_secs in [0, 1, 2, 5, 10, 15, 20, 25, 29, 30] {
                let target_phase = Duration::from_secs(target_phase_secs);
                let semaphore = Arc::new(Semaphore::new(1));
                tokio::time::sleep(Duration::from_secs(start_time_secs)).await;
                let cooperative_indexing = CooperativeIndexingCycle::new_with_phase(
                    target_phase,
                    Duration::from_secs(30),
                    semaphore.clone(),
                );
                let initial_sleep_duration: Duration =
                    cooperative_indexing.initial_sleep_duration();
                tokio::time::sleep(initial_sleep_duration).await;
                let target_phase_millis = cooperative_indexing.target_phase.as_millis() as i64;
                let commit_timeout_ms = cooperative_indexing.commit_timeout.as_millis() as i64;
                let phase_millis =
                    (t0.elapsed().as_millis() as i64 - target_phase_millis) % commit_timeout_ms;
                assert!(phase_millis >= -100, "{phase_millis}");
                assert!(phase_millis <= (NUDGE_TOLERANCE.as_millis() as i64) * 2 + 100);
            }
        }
    }

    #[tokio::test]
    async fn test_cooperative_indexing_simple() {
        tokio::time::pause();
        let semaphore = Arc::new(Semaphore::new(1));
        let cooperative_indexing =
            CooperativeIndexingCycle::new("id", Duration::from_secs(30), semaphore.clone());
        let guard = cooperative_indexing.cooperative_indexing_period().await;
        tokio::time::advance(Duration::from_secs(10)).await;
        let (sleep_time, metrics) = guard.end_of_work(100_000_000);
        assert_approx_equal_sleep_time(sleep_time, Duration::from_secs(20));
        let expected_metrics = PipelineMetrics {
            cpu_load: CpuCapacity::from_cpu_millis(PIPELINE_FULL_CAPACITY.cpu_millis() * 10 / 30),
            throughput_mb_per_sec: 10u16,
        };
        assert_approx_metrics(&metrics, &expected_metrics)
    }

    fn drop_after<T: Send + 'static>(guard: T, duration: Duration) {
        tokio::task::spawn(async move {
            tokio::time::sleep(duration).await;
            drop(guard);
        });
    }

    #[tokio::test]
    async fn test_cooperative_indexing_maximum_throughput() {
        tokio::time::pause();
        let semaphore = Arc::new(Semaphore::new(1));
        let cooperative_indexing =
            CooperativeIndexingCycle::new("id", Duration::from_secs(30), semaphore.clone());
        let semaphore_guard = Semaphore::acquire_owned(semaphore).await;
        drop_after(semaphore_guard, Duration::from_secs(30));
        let cycle_guard = cooperative_indexing.cooperative_indexing_period().await;
        tokio::time::advance(Duration::from_secs(15)).await;
        let (sleep_time, metrics) = cycle_guard.end_of_work(30_000_000);
        let expected_metrics = PipelineMetrics {
            cpu_load: CpuCapacity::from_cpu_millis(PIPELINE_FULL_CAPACITY.cpu_millis() * 15 / 30),
            throughput_mb_per_sec: 1u16,
        };
        assert_approx_metrics(&metrics, &expected_metrics);
        assert!(sleep_time.is_zero());
    }

    #[tokio::test]
    async fn test_cooperative_indexing_simple_contention() {
        tokio::time::pause();
        let semaphore = Arc::new(Semaphore::new(1));
        let cooperative_indexing =
            CooperativeIndexingCycle::new("id", Duration::from_secs(30), semaphore.clone());
        let semaphore_guard = Semaphore::acquire_owned(semaphore).await;
        drop_after(semaphore_guard, Duration::from_secs(10));
        let cycle_guard = cooperative_indexing.cooperative_indexing_period().await;
        tokio::time::advance(Duration::from_secs(10)).await;
        let (sleep_time, metrics) = cycle_guard.end_of_work(100_000_000);
        assert_approx_equal_sleep_time(sleep_time, Duration::from_secs(10));
        let expected_metrics = PipelineMetrics {
            cpu_load: CpuCapacity::from_cpu_millis(PIPELINE_FULL_CAPACITY.cpu_millis() * 10 / 30),
            throughput_mb_per_sec: 10u16,
        };
        assert_approx_metrics(&metrics, &expected_metrics);
    }

    #[tokio::test]
    async fn test_cooperative_indexing_nudge_to_phase() {
        tokio::time::pause();
        let num_threads = 10;
        let num_pipelines = 100;
        let num_steps = 15;
        let semaphore = Arc::new(Semaphore::new(num_threads));
        let commit_timeout = Duration::from_secs(30);
        let t0 = Instant::now();
        let mut handles = Vec::new();
        for i in 0..num_pipelines {
            let target_phase =
                Duration::from_millis(commit_timeout.as_millis() as u64 * i / num_pipelines);
            let cooperative_indexing = CooperativeIndexingCycle::new_with_phase(
                target_phase,
                commit_timeout,
                semaphore.clone(),
            );
            let join_handle = tokio::task::spawn(async move {
                let mut last_phase = 0;
                for _ in 0..num_steps {
                    let cycle_guard = cooperative_indexing.cooperative_indexing_period().await;
                    let work_time = Duration::from_millis(10);
                    tokio::time::sleep(work_time).await;
                    last_phase =
                        t0.elapsed().as_millis() as u64 % commit_timeout.as_millis() as u64;
                    let (sleep_time, _) = cycle_guard.end_of_work(1_000_000);
                    tokio::time::sleep(sleep_time).await;
                }
                last_phase
            });
            handles.push(join_handle);
        }
        for (i, phase_handle) in handles.into_iter().enumerate() {
            let phase = phase_handle.await.unwrap() as u32;
            let expected_phase_millis: u32 =
                commit_timeout.as_millis() as u32 * i as u32 / num_pipelines as u32;
            assert!(phase.abs_diff(expected_phase_millis) < 3);
        }
    }
}


================================================
FILE: quickwit/quickwit-indexing/src/actors/doc_processor.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::string::FromUtf8Error;
use std::sync::Arc;
use std::sync::atomic::{AtomicU64, Ordering};

use anyhow::{Context, bail};
use async_trait::async_trait;
use bytes::Bytes;
use quickwit_actors::{Actor, ActorContext, ActorExitStatus, Handler, Mailbox, QueueCapacity};
use quickwit_common::metrics::IntCounter;
use quickwit_common::rate_limited_tracing::rate_limited_warn;
use quickwit_common::runtimes::RuntimeType;
use quickwit_config::{SourceInputFormat, TransformConfig};
use quickwit_doc_mapper::{DocMapper, DocParsingError, JsonObject};
use quickwit_opentelemetry::otlp::{
    JsonLogIterator, JsonSpanIterator, OtlpLogsError, OtlpTracesError, parse_otlp_logs_json,
    parse_otlp_logs_protobuf, parse_otlp_spans_json, parse_otlp_spans_protobuf,
};
use quickwit_proto::types::{IndexId, SourceId};
use serde::Serialize;
use serde_json::Value as JsonValue;
use tantivy::schema::{Field, Value};
use tantivy::{DateTime, TantivyDocument};
use thiserror::Error;
use tokio::runtime::Handle;

#[cfg(feature = "vrl")]
use super::vrl_processing::*;
use crate::actors::Indexer;
use crate::models::{
    NewPublishLock, NewPublishToken, ProcessedDoc, ProcessedDocBatch, PublishLock, RawDocBatch,
};

const PLAIN_TEXT: &str = "plain_text";

pub(super) struct JsonDoc {
    json_obj: JsonObject,
    num_bytes: usize,
}

impl JsonDoc {
    pub fn new(json_obj: JsonObject, num_bytes: usize) -> Self {
        Self {
            json_obj,
            num_bytes,
        }
    }

    pub fn try_from_json_value(
        json_value: JsonValue,
        num_bytes: usize,
    ) -> Result<Self, DocProcessorError> {
        match json_value {
            JsonValue::Object(json_obj) => Ok(Self::new(json_obj, num_bytes)),
            _ => Err(DocProcessorError::JsonParsing(
                "document is not an object".to_string(),
            )),
        }
    }

    #[cfg(feature = "vrl")]
    pub fn try_from_vrl_doc(vrl_doc: VrlDoc) -> Result<Self, DocProcessorError> {
        let json_value = serde_json::to_value(vrl_doc.vrl_value)?;
        Self::try_from_json_value(json_value, vrl_doc.num_bytes)
    }
}

#[allow(clippy::enum_variant_names)]
#[derive(Error, Debug)]
pub enum DocProcessorError {
    #[error("doc mapper parse error: {0}")]
    DocMapperParsing(DocParsingError),
    #[error("JSON parse error: {0}")]
    JsonParsing(String),
    #[error("OLTP log records parse error: {0}")]
    OltpLogsParsing(OtlpLogsError),
    #[error("OLTP traces parse error: {0}")]
    OltpTracesParsing(OtlpTracesError),
    #[cfg(feature = "vrl")]
    #[error("VRL transform error: {0}")]
    Transform(VrlTerminate),
}

impl From<OtlpLogsError> for DocProcessorError {
    fn from(error: OtlpLogsError) -> Self {
        Self::OltpLogsParsing(error)
    }
}

impl From<OtlpTracesError> for DocProcessorError {
    fn from(error: OtlpTracesError) -> Self {
        Self::OltpTracesParsing(error)
    }
}

impl From<DocParsingError> for DocProcessorError {
    fn from(error: DocParsingError) -> Self {
        Self::DocMapperParsing(error)
    }
}

impl From<serde_json::Error> for DocProcessorError {
    fn from(error: serde_json::Error) -> Self {
        Self::JsonParsing(error.to_string())
    }
}

impl From<FromUtf8Error> for DocProcessorError {
    fn from(error: FromUtf8Error) -> Self {
        Self::JsonParsing(error.to_string())
    }
}

#[cfg(feature = "vrl")]
fn try_into_vrl_doc(
    input_format: SourceInputFormat,
    raw_doc: Bytes,
    num_bytes: usize,
) -> Result<VrlDoc, DocProcessorError> {
    let vrl_value = match input_format {
        SourceInputFormat::Json => serde_json::from_slice::<VrlValue>(&raw_doc)?,
        SourceInputFormat::PlainText => {
            let mut map = std::collections::BTreeMap::new();
            let key = vrl::value::KeyString::from(PLAIN_TEXT);
            let value = VrlValue::Bytes(raw_doc);
            map.insert(key, value);
            VrlValue::Object(map)
        }
        SourceInputFormat::OtlpLogsJson
        | SourceInputFormat::OtlpLogsProtobuf
        | SourceInputFormat::OtlpTracesJson
        | SourceInputFormat::OtlpTracesProtobuf => {
            panic!("OTP logs or traces do not support VRL transforms")
        }
    };
    let vrl_doc = VrlDoc::new(vrl_value, num_bytes);
    Ok(vrl_doc)
}

fn try_into_json_docs(
    input_format: SourceInputFormat,
    raw_doc: Bytes,
    num_bytes: usize,
) -> JsonDocIterator {
    match input_format {
        SourceInputFormat::Json => {
            let json_doc_result = serde_json::from_slice::<JsonObject>(&raw_doc)
                .map(|json_obj| JsonDoc::new(json_obj, num_bytes));
            JsonDocIterator::from(json_doc_result)
        }
        SourceInputFormat::OtlpLogsJson => {
            let logs = parse_otlp_logs_json(&raw_doc);
            JsonDocIterator::from(logs)
        }
        SourceInputFormat::OtlpLogsProtobuf => {
            let logs = parse_otlp_logs_protobuf(&raw_doc);
            JsonDocIterator::from(logs)
        }
        SourceInputFormat::OtlpTracesJson => {
            let spans = parse_otlp_spans_json(&raw_doc);
            JsonDocIterator::from(spans)
        }
        SourceInputFormat::OtlpTracesProtobuf => {
            let spans = parse_otlp_spans_protobuf(&raw_doc);
            JsonDocIterator::from(spans)
        }
        SourceInputFormat::PlainText => {
            let json_doc_result = String::from_utf8(raw_doc.to_vec()).map(|value| {
                let mut json_obj = serde_json::Map::with_capacity(1);
                let key = PLAIN_TEXT.to_string();
                json_obj.insert(key, JsonValue::String(value));
                JsonDoc::new(json_obj, num_bytes)
            });
            JsonDocIterator::from(json_doc_result)
        }
    }
}

#[cfg(feature = "vrl")]
fn parse_raw_doc(
    input_format: SourceInputFormat,
    raw_doc: Bytes,
    num_bytes: usize,
    vrl_program_opt: Option<&mut VrlProgram>,
) -> JsonDocIterator {
    let Some(vrl_program) = vrl_program_opt else {
        return try_into_json_docs(input_format, raw_doc, num_bytes);
    };
    let json_doc_result = try_into_vrl_doc(input_format, raw_doc, num_bytes)
        .and_then(|vrl_doc| vrl_program.transform_doc(vrl_doc))
        .and_then(JsonDoc::try_from_vrl_doc);

    JsonDocIterator::from(json_doc_result)
}

#[cfg(not(feature = "vrl"))]
fn parse_raw_doc(
    input_format: SourceInputFormat,
    raw_doc: Bytes,
    num_bytes: usize,
    _vrl_program_opt: Option<&mut VrlProgram>,
) -> JsonDocIterator {
    try_into_json_docs(input_format, raw_doc, num_bytes)
}

enum JsonDocIterator {
    One(Option<Result<JsonDoc, DocProcessorError>>),
    Logs(JsonLogIterator),
    Spans(JsonSpanIterator),
}

impl Iterator for JsonDocIterator {
    type Item = Result<JsonDoc, DocProcessorError>;

    fn next(&mut self) -> Option<Self::Item> {
        match self {
            Self::One(opt) => opt.take(),
            Self::Logs(logs) => logs
                .next()
                .map(|(json_value, num_bytes)| JsonDoc::try_from_json_value(json_value, num_bytes)),
            Self::Spans(spans) => spans
                .next()
                .map(|(json_value, num_bytes)| JsonDoc::try_from_json_value(json_value, num_bytes)),
        }
    }
}

impl<E> From<Result<JsonDoc, E>> for JsonDocIterator
where E: Into<DocProcessorError>
{
    fn from(result: Result<JsonDoc, E>) -> Self {
        match result {
            Ok(json_doc) => Self::One(Some(Ok(json_doc))),
            Err(error) => Self::One(Some(Err(error.into()))),
        }
    }
}

impl From<Result<JsonLogIterator, OtlpLogsError>> for JsonDocIterator {
    fn from(result: Result<JsonLogIterator, OtlpLogsError>) -> Self {
        match result {
            Ok(logs) => Self::Logs(logs),
            Err(error) => Self::One(Some(Err(DocProcessorError::from(error)))),
        }
    }
}

impl From<Result<JsonSpanIterator, OtlpTracesError>> for JsonDocIterator {
    fn from(result: Result<JsonSpanIterator, OtlpTracesError>) -> Self {
        match result {
            Ok(spans) => Self::Spans(spans),
            Err(error) => Self::One(Some(Err(DocProcessorError::from(error)))),
        }
    }
}

#[derive(Debug)]
pub struct DocProcessorCounter {
    pub num_docs: AtomicU64,
    pub num_docs_metric: IntCounter,
    pub num_bytes_metric: IntCounter,
}

impl Serialize for DocProcessorCounter {
    fn serialize<S>(&self, serializer: S) -> Result<S::Ok, S::Error>
    where S: serde::Serializer {
        serializer.serialize_u64(self.get_num_docs())
    }
}

impl DocProcessorCounter {
    fn for_index_and_doc_processor_outcome(index: &str, outcome: &str) -> DocProcessorCounter {
        let index_label = quickwit_common::metrics::index_label(index);
        let labels = [index_label, outcome];
        DocProcessorCounter {
            num_docs: Default::default(),
            num_docs_metric: crate::metrics::INDEXER_METRICS
                .processed_docs_total
                .with_label_values(labels),
            num_bytes_metric: crate::metrics::INDEXER_METRICS
                .processed_bytes
                .with_label_values(labels),
        }
    }

    #[inline(always)]
    fn get_num_docs(&self) -> u64 {
        self.num_docs.load(Ordering::Relaxed)
    }

    fn record_doc(&self, num_bytes: u64) {
        self.num_docs.fetch_add(1, Ordering::Relaxed);
        self.num_docs_metric.inc();
        self.num_bytes_metric.inc_by(num_bytes);
    }
}

#[derive(Debug, Serialize)]
pub struct DocProcessorCounters {
    index_id: IndexId,
    source_id: SourceId,

    /// Overall number of documents received, partitioned
    /// into 5 categories:
    /// - valid documents
    /// - number of docs that could not be parsed.
    /// - number of docs that were not valid json.
    /// - number of docs that could not be transformed.
    /// - number of docs for which the doc mapper returned an error.
    /// - number of valid docs.
    pub valid: DocProcessorCounter,
    pub doc_mapper_errors: DocProcessorCounter,
    pub transform_errors: DocProcessorCounter,
    pub json_parse_errors: DocProcessorCounter,
    pub otlp_parse_errors: DocProcessorCounter,

    /// Number of bytes that went through the indexer
    /// during its entire lifetime.
    ///
    /// Includes both valid and invalid documents.
    pub num_bytes_total: AtomicU64,
}

impl DocProcessorCounters {
    pub fn new(index_id: IndexId, source_id: SourceId) -> Self {
        let valid_docs =
            DocProcessorCounter::for_index_and_doc_processor_outcome(&index_id, "valid");
        let doc_mapper_errors =
            DocProcessorCounter::for_index_and_doc_processor_outcome(&index_id, "doc_mapper_error");
        let transform_errors =
            DocProcessorCounter::for_index_and_doc_processor_outcome(&index_id, "transform_error");
        let json_parse_errors =
            DocProcessorCounter::for_index_and_doc_processor_outcome(&index_id, "json_parse_error");
        let otlp_parse_errors =
            DocProcessorCounter::for_index_and_doc_processor_outcome(&index_id, "otlp_parse_error");
        DocProcessorCounters {
            index_id,
            source_id,

            valid: valid_docs,
            doc_mapper_errors,
            transform_errors,
            json_parse_errors,
            otlp_parse_errors,
            num_bytes_total: Default::default(),
        }
    }

    /// Returns the overall number of docs that went through the indexer (valid or not).
    pub fn num_processed_docs(&self) -> u64 {
        self.valid.get_num_docs()
            + self.doc_mapper_errors.get_num_docs()
            + self.json_parse_errors.get_num_docs()
            + self.otlp_parse_errors.get_num_docs()
            + self.transform_errors.get_num_docs()
    }

    /// Returns the overall number of docs that were sent to the indexer but were invalid.
    /// (For instance, because they were missing a required field or because their because
    /// their format was invalid)
    pub fn num_invalid_docs(&self) -> u64 {
        self.doc_mapper_errors.get_num_docs()
            + self.json_parse_errors.get_num_docs()
            + self.otlp_parse_errors.get_num_docs()
            + self.transform_errors.get_num_docs()
    }

    pub fn record_valid(&self, num_bytes: u64) {
        self.num_bytes_total.fetch_add(num_bytes, Ordering::Relaxed);
        self.valid.record_doc(num_bytes);
    }

    pub fn record_error(&self, error: DocProcessorError, num_bytes: u64) {
        self.num_bytes_total.fetch_add(num_bytes, Ordering::Relaxed);
        match error {
            DocProcessorError::DocMapperParsing(_) => {
                self.doc_mapper_errors.record_doc(num_bytes);
            }
            DocProcessorError::JsonParsing(_) => {
                self.json_parse_errors.record_doc(num_bytes);
            }
            DocProcessorError::OltpLogsParsing(_) | DocProcessorError::OltpTracesParsing(_) => {
                self.otlp_parse_errors.record_doc(num_bytes);
            }
            #[cfg(feature = "vrl")]
            DocProcessorError::Transform(_) => {
                self.transform_errors.record_doc(num_bytes);
            }
        };
    }
}

pub struct DocProcessor {
    doc_mapper: Arc<DocMapper>,
    indexer_mailbox: Mailbox<Indexer>,
    timestamp_field_opt: Option<Field>,
    counters: Arc<DocProcessorCounters>,
    publish_lock: PublishLock,
    #[cfg(feature = "vrl")]
    transform_opt: Option<VrlProgram>,
    input_format: SourceInputFormat,
}

impl DocProcessor {
    pub fn try_new(
        index_id: IndexId,
        source_id: SourceId,
        doc_mapper: Arc<DocMapper>,
        indexer_mailbox: Mailbox<Indexer>,
        transform_config_opt: Option<TransformConfig>,
        input_format: SourceInputFormat,
    ) -> anyhow::Result<Self> {
        let timestamp_field_opt = extract_timestamp_field(&doc_mapper)?;
        if cfg!(not(feature = "vrl")) && transform_config_opt.is_some() {
            bail!("VRL is not enabled: please recompile with the `vrl` feature")
        }
        Ok(DocProcessor {
            doc_mapper,
            indexer_mailbox,
            timestamp_field_opt,
            counters: Arc::new(DocProcessorCounters::new(index_id, source_id)),
            publish_lock: PublishLock::default(),
            #[cfg(feature = "vrl")]
            transform_opt: transform_config_opt
                .map(VrlProgram::try_from_transform_config)
                .transpose()?,
            input_format,
        })
    }

    // Extract a timestamp from a tantivy document.
    //
    // If the timestamp is set up in the docmapper and the timestamp is missing,
    // returns an PrepareDocumentError::MissingField error.
    fn extract_timestamp(
        &self,
        doc: &TantivyDocument,
    ) -> Result<Option<DateTime>, DocProcessorError> {
        let Some(timestamp_field) = self.timestamp_field_opt else {
            return Ok(None);
        };
        let timestamp = doc
            .get_first(timestamp_field)
            .and_then(|val| val.as_datetime())
            .ok_or(DocProcessorError::from(DocParsingError::RequiredField(
                "timestamp field is required".to_string(),
            )))?;
        Ok(Some(timestamp))
    }

    fn process_raw_doc(&mut self, raw_doc: Bytes, processed_docs: &mut Vec<ProcessedDoc>) {
        let num_bytes = raw_doc.len();

        #[cfg(feature = "vrl")]
        let transform_opt = self.transform_opt.as_mut();
        #[cfg(not(feature = "vrl"))]
        let transform_opt: Option<&mut VrlProgram> = None;

        for json_doc_result in parse_raw_doc(self.input_format, raw_doc, num_bytes, transform_opt) {
            let processed_doc_result =
                json_doc_result.and_then(|json_doc| self.process_json_doc(json_doc));

            match processed_doc_result {
                Ok(processed_doc) => {
                    self.counters.record_valid(processed_doc.num_bytes as u64);
                    processed_docs.push(processed_doc);
                }
                Err(error) => {
                    rate_limited_warn!(
                        limit_per_min = 10,
                        index_id = self.counters.index_id,
                        source_id = self.counters.source_id,
                        "{error}",
                    );
                    self.counters.record_error(error, num_bytes as u64);
                }
            }
        }
    }

    fn process_json_doc(&self, json_doc: JsonDoc) -> Result<ProcessedDoc, DocProcessorError> {
        let num_bytes = json_doc.num_bytes;

        let (partition, doc) = self
            .doc_mapper
            .doc_from_json_obj(json_doc.json_obj, json_doc.num_bytes as u64)?;
        let timestamp_opt = self.extract_timestamp(&doc)?;
        Ok(ProcessedDoc {
            doc,
            timestamp_opt,
            partition,
            num_bytes,
        })
    }
}

fn extract_timestamp_field(doc_mapper: &DocMapper) -> anyhow::Result<Option<Field>> {
    let schema = doc_mapper.schema();
    let Some(timestamp_field_name) = doc_mapper.timestamp_field_name() else {
        return Ok(None);
    };
    let timestamp_field = schema
        .get_field(timestamp_field_name)
        .context("failed to find timestamp field in schema")?;
    Ok(Some(timestamp_field))
}

#[cfg(not(feature = "vrl"))]
struct VrlProgram {}

#[async_trait]
impl Actor for DocProcessor {
    type ObservableState = Arc<DocProcessorCounters>;

    fn observable_state(&self) -> Self::ObservableState {
        self.counters.clone()
    }

    fn queue_capacity(&self) -> QueueCapacity {
        QueueCapacity::Bounded(10)
    }

    fn runtime_handle(&self) -> Handle {
        RuntimeType::Blocking.get_runtime_handle()
    }

    #[inline]
    fn yield_after_each_message(&self) -> bool {
        false
    }

    async fn finalize(
        &mut self,
        exit_status: &ActorExitStatus,
        ctx: &ActorContext<Self>,
    ) -> anyhow::Result<()> {
        match exit_status {
            ActorExitStatus::DownstreamClosed
            | ActorExitStatus::Killed
            | ActorExitStatus::Failure(_)
            | ActorExitStatus::Panicked => return Ok(()),
            ActorExitStatus::Quit | ActorExitStatus::Success => {
                let _ = ctx.send_exit_with_success(&self.indexer_mailbox).await;
            }
        }
        Ok(())
    }
}

#[async_trait]
impl Handler<RawDocBatch> for DocProcessor {
    type Reply = ();

    async fn handle(
        &mut self,
        raw_doc_batch: RawDocBatch,
        ctx: &ActorContext<Self>,
    ) -> Result<(), ActorExitStatus> {
        if self.publish_lock.is_dead() {
            return Ok(());
        }
        let mut processed_docs: Vec<ProcessedDoc> = Vec::with_capacity(raw_doc_batch.docs.len());

        for raw_doc in raw_doc_batch.docs {
            let _protected_zone_guard = ctx.protect_zone();
            self.process_raw_doc(raw_doc, &mut processed_docs);
            ctx.record_progress();
        }
        let processed_doc_batch = ProcessedDocBatch::new(
            processed_docs,
            raw_doc_batch.checkpoint_delta,
            raw_doc_batch.force_commit,
        );
        ctx.send_message(&self.indexer_mailbox, processed_doc_batch)
            .await?;
        Ok(())
    }
}

#[async_trait]
impl Handler<NewPublishLock> for DocProcessor {
    type Reply = ();

    async fn handle(
        &mut self,
        message: NewPublishLock,
        ctx: &ActorContext<Self>,
    ) -> Result<(), ActorExitStatus> {
        let NewPublishLock(publish_lock) = &message;
        self.publish_lock = publish_lock.clone();
        ctx.send_message(&self.indexer_mailbox, message).await?;
        Ok(())
    }
}

#[async_trait]
impl Handler<NewPublishToken> for DocProcessor {
    type Reply = ();

    async fn handle(
        &mut self,
        message: NewPublishToken,
        ctx: &ActorContext<Self>,
    ) -> Result<(), ActorExitStatus> {
        ctx.send_message(&self.indexer_mailbox, message).await?;
        Ok(())
    }
}

#[cfg(test)]
mod tests {
    use std::sync::Arc;

    use prost::Message;
    use quickwit_actors::Universe;
    use quickwit_common::uri::Uri;
    use quickwit_config::{SearchSettings, build_doc_mapper};
    use quickwit_doc_mapper::{DocMapper, default_doc_mapper_for_test};
    use quickwit_metastore::checkpoint::SourceCheckpointDelta;
    use quickwit_opentelemetry::otlp::{OtlpGrpcLogsService, OtlpGrpcTracesService};
    use quickwit_proto::opentelemetry::proto::collector::logs::v1::ExportLogsServiceRequest;
    use quickwit_proto::opentelemetry::proto::collector::trace::v1::ExportTraceServiceRequest;
    use quickwit_proto::opentelemetry::proto::common::v1::AnyValue as OtlpAnyValue;
    use quickwit_proto::opentelemetry::proto::common::v1::any_value::Value as OtlpAnyValueValue;
    use quickwit_proto::opentelemetry::proto::logs::v1::{LogRecord, ResourceLogs, ScopeLogs};
    use quickwit_proto::opentelemetry::proto::trace::v1::{ResourceSpans, ScopeSpans, Span};
    use serde_json::Value as JsonValue;
    use tantivy::Document;
    use tantivy::schema::NamedFieldDocument;

    use super::*;
    use crate::models::{PublishLock, RawDocBatch};

    #[tokio::test]
    async fn test_doc_processor_simple() {
        let index_id = "my-index";
        let source_id = "my-source";
        let universe = Universe::with_accelerated_time();
        let doc_mapper = Arc::new(default_doc_mapper_for_test());
        let (indexer_mailbox, indexer_inbox) = universe.create_test_mailbox();
        let doc_processor = DocProcessor::try_new(
            index_id.to_string(),
            source_id.to_string(),
            doc_mapper.clone(),
            indexer_mailbox,
            None,
            SourceInputFormat::Json,
        )
        .unwrap();
        let (doc_processor_mailbox, doc_processor_handle) =
            universe.spawn_builder().spawn(doc_processor);
        let checkpoint_delta = SourceCheckpointDelta::from_range(0..4);
        doc_processor_mailbox
            .send_message(RawDocBatch::for_test(
                &[
                    br#"{"body": "happy", "response_date": "2021-12-19T16:39:57+00:00", "response_time": 12, "response_payload": "YWJj"}"#, // missing timestamp
                    br#"{"body": "happy", "timestamp": 1628837062, "response_date": "2021-12-19T16:39:59+00:00", "response_time": 2, "response_payload": "YWJj"}"#, // ok
                    br#"{"body": "happy2", "timestamp": 1628837062, "response_date": "2021-12-19T16:40:57+00:00", "response_time": 13, "response_payload": "YWJj"}"#, // ok
                    b"{", // invalid json
                ],
                0..4,
            ))
            .await.unwrap();

        let counters = doc_processor_handle
            .process_pending_and_observe()
            .await
            .state;
        assert_eq!(counters.index_id, index_id);
        assert_eq!(counters.source_id, source_id);
        assert_eq!(counters.doc_mapper_errors.get_num_docs(), 1);
        assert_eq!(counters.json_parse_errors.get_num_docs(), 1);
        assert_eq!(counters.transform_errors.get_num_docs(), 0);
        assert_eq!(counters.otlp_parse_errors.get_num_docs(), 0);
        assert_eq!(counters.valid.get_num_docs(), 2);
        assert_eq!(counters.num_bytes_total.load(Ordering::Relaxed), 387);

        let output_messages = indexer_inbox.drain_for_test();
        assert_eq!(output_messages.len(), 1);
        let batch = *(output_messages
            .into_iter()
            .next()
            .unwrap()
            .downcast::<ProcessedDocBatch>()
            .unwrap());
        assert_eq!(batch.docs.len(), 2);
        assert_eq!(batch.checkpoint_delta, checkpoint_delta);

        let schema = doc_mapper.schema();
        let NamedFieldDocument(named_field_doc_map) = batch.docs[0].doc.to_named_doc(&schema);
        let doc_json = JsonValue::Object(doc_mapper.doc_to_json(named_field_doc_map).unwrap());
        assert_eq!(
            doc_json,
            serde_json::json!({
                "_source": {
                    "body": "happy",
                    "response_date": "2021-12-19T16:39:59Z",
                    "response_payload": "YWJj",
                    "response_time": 2,
                    "timestamp": 1628837062
                },
                "body": "happy",
                "response_date": "2021-12-19T16:39:59Z",
                "response_payload": "YWJj",
                "response_time": 2.0,
                "timestamp": 1628837062
            })
        );
        universe.assert_quit().await;
    }

    const DOCMAPPER_WITH_PARTITION_JSON: &str = r#"
        {
            "tag_fields": ["tenant"],
            "partition_key": "tenant",
            "field_mappings": [
                { "name": "tenant", "type": "text", "tokenizer": "raw", "indexed": true },
                { "name": "body", "type": "text" }
            ]
        }"#;

    #[tokio::test]
    async fn test_doc_processor_partitioning() {
        let doc_mapper: Arc<DocMapper> =
            Arc::new(serde_json::from_str::<DocMapper>(DOCMAPPER_WITH_PARTITION_JSON).unwrap());
        let universe = Universe::with_accelerated_time();
        let (indexer_mailbox, indexer_inbox) = universe.create_test_mailbox();
        let doc_processor = DocProcessor::try_new(
            "my-index".to_string(),
            "my-source".to_string(),
            doc_mapper,
            indexer_mailbox,
            None,
            SourceInputFormat::Json,
        )
        .unwrap();
        let (doc_processor_mailbox, doc_processor_handle) =
            universe.spawn_builder().spawn(doc_processor);
        doc_processor_mailbox
            .send_message(RawDocBatch::for_test(
                &[
                    br#"{"tenant": "tenant_1", "body": "first doc for tenant 1"}"#,
                    br#"{"tenant": "tenant_2", "body": "first doc for tenant 2"}"#,
                    br#"{"tenant": "tenant_1", "body": "second doc for tenant 1"}"#,
                    br#"{"tenant": "tenant_2", "body": "second doc for tenant 2"}"#,
                ],
                0..2,
            ))
            .await
            .unwrap();

        universe
            .send_exit_with_success(&doc_processor_mailbox)
            .await
            .unwrap();
        let (exit_status, _) = doc_processor_handle.join().await;
        assert!(matches!(exit_status, ActorExitStatus::Success));
        let processed_doc_batches: Vec<ProcessedDocBatch> = indexer_inbox.drain_for_test_typed();
        assert_eq!(processed_doc_batches.len(), 1);
        let partition_ids: Vec<u64> = processed_doc_batches[0]
            .docs
            .iter()
            .map(|doc| doc.partition)
            .collect();
        assert_eq!(partition_ids[0], partition_ids[2]);
        assert_eq!(partition_ids[1], partition_ids[3]);
        assert_ne!(partition_ids[0], partition_ids[1]);
        universe.assert_quit().await;
    }

    #[tokio::test]
    async fn test_doc_processor_forward_publish_lock() {
        let doc_mapper = Arc::new(default_doc_mapper_for_test());
        let universe = Universe::with_accelerated_time();
        let (indexer_mailbox, indexer_inbox) = universe.create_test_mailbox();
        let doc_processor = DocProcessor::try_new(
            "my-index".to_string(),
            "my-source".to_string(),
            doc_mapper,
            indexer_mailbox,
            None,
            SourceInputFormat::Json,
        )
        .unwrap();
        let (doc_processor_mailbox, doc_processor_handle) =
            universe.spawn_builder().spawn(doc_processor);
        let publish_lock = PublishLock::default();
        doc_processor_mailbox
            .send_message(NewPublishLock(publish_lock.clone()))
            .await
            .unwrap();
        universe
            .send_exit_with_success(&doc_processor_mailbox)
            .await
            .unwrap();
        let (exit_status, _) = doc_processor_handle.join().await;
        assert!(matches!(exit_status, ActorExitStatus::Success));
        let publish_locks: Vec<NewPublishLock> = indexer_inbox.drain_for_test_typed();
        assert_eq!(&publish_locks, &[NewPublishLock(publish_lock)]);
        universe.assert_quit().await;
    }

    #[tokio::test]
    async fn test_doc_processor_ignores_messages_when_publish_lock_is_dead() {
        let universe = Universe::with_accelerated_time();
        let (indexer_mailbox, indexer_inbox) = universe.create_test_mailbox();
        let doc_mapper = Arc::new(default_doc_mapper_for_test());
        let doc_processor = DocProcessor::try_new(
            "my-index".to_string(),
            "my-source".to_string(),
            doc_mapper,
            indexer_mailbox,
            None,
            SourceInputFormat::Json,
        )
        .unwrap();
        let (doc_processor_mailbox, doc_processor_handle) =
            universe.spawn_builder().spawn(doc_processor);
        let publish_lock = PublishLock::default();
        doc_processor_mailbox
            .send_message(NewPublishLock(publish_lock.clone()))
            .await
            .unwrap();
        doc_processor_handle.process_pending_and_observe().await;
        publish_lock.kill().await;
        doc_processor_mailbox
            .send_message(RawDocBatch::for_test(
                &[
                    br#"{"body": "happy", "timestamp": 1628837062, "response_date": "2021-12-19T16:39:59+00:00", "response_time": 2, "response_payload": "YWJj"}"#,
                ],
                0..1,
            ))
            .await.unwrap();
        universe
            .send_exit_with_success(&doc_processor_mailbox)
            .await
            .unwrap();
        let (exit_status, _indexer_counters) = doc_processor_handle.join().await;
        assert!(matches!(exit_status, ActorExitStatus::Success));
        let indexer_messages: Vec<ProcessedDocBatch> = indexer_inbox.drain_for_test_typed();
        assert!(indexer_messages.is_empty());
        universe.assert_quit().await;
    }

    #[tokio::test]
    async fn test_doc_processor_otlp_logs_json() {
        let root_uri = Uri::for_test("ram:///indexes");
        let index_config = OtlpGrpcLogsService::index_config(&root_uri).unwrap();
        let doc_mapper =
            build_doc_mapper(&index_config.doc_mapping, &SearchSettings::default()).unwrap();

        let universe = Universe::with_accelerated_time();
        let (indexer_mailbox, indexer_inbox) = universe.create_test_mailbox();
        let doc_processor = DocProcessor::try_new(
            "my-index".to_string(),
            "my-source".to_string(),
            doc_mapper,
            indexer_mailbox,
            None,
            SourceInputFormat::OtlpLogsJson,
        )
        .unwrap();

        let (doc_processor_mailbox, doc_processor_handle) =
            universe.spawn_builder().spawn(doc_processor);

        let scope_logs = vec![ScopeLogs {
            log_records: vec![
                LogRecord {
                    time_unix_nano: 1_000_000_000,
                    body: Some(OtlpAnyValue {
                        value: Some(OtlpAnyValueValue::StringValue(
                            "foo log message".to_string(),
                        )),
                    }),
                    ..Default::default()
                },
                LogRecord {
                    time_unix_nano: 1_000_000_001,
                    body: Some(OtlpAnyValue {
                        value: Some(OtlpAnyValueValue::StringValue(
                            "bar log message".to_string(),
                        )),
                    }),
                    ..Default::default()
                },
            ],
            ..Default::default()
        }];
        let resource_logs = vec![ResourceLogs {
            scope_logs,
            ..Default::default()
        }];
        let request = ExportLogsServiceRequest { resource_logs };
        let raw_doc_json = serde_json::to_vec(&request).unwrap();
        let raw_doc_batch = RawDocBatch::for_test(&[&raw_doc_json], 0..2);
        doc_processor_mailbox
            .send_message(raw_doc_batch)
            .await
            .unwrap();

        universe
            .send_exit_with_success(&doc_processor_mailbox)
            .await
            .unwrap();

        let counters = doc_processor_handle
            .process_pending_and_observe()
            .await
            .state;
        assert_eq!(counters.valid.get_num_docs(), 2);

        let batch = indexer_inbox.drain_for_test_typed::<ProcessedDocBatch>();
        assert_eq!(batch.len(), 1);
        assert_eq!(batch[0].docs.len(), 2);

        let (exit_status, _) = doc_processor_handle.join().await;
        assert!(matches!(exit_status, ActorExitStatus::Success));
        universe.assert_quit().await;
    }

    #[tokio::test]
    async fn test_doc_processor_otlp_logs_proto() {
        let root_uri = Uri::for_test("ram:///indexes");
        let index_config = OtlpGrpcLogsService::index_config(&root_uri).unwrap();
        let doc_mapper =
            build_doc_mapper(&index_config.doc_mapping, &SearchSettings::default()).unwrap();

        let universe = Universe::with_accelerated_time();
        let (indexer_mailbox, indexer_inbox) = universe.create_test_mailbox();
        let doc_processor = DocProcessor::try_new(
            "my-index".to_string(),
            "my-source".to_string(),
            doc_mapper,
            indexer_mailbox,
            None,
            SourceInputFormat::OtlpLogsProtobuf,
        )
        .unwrap();

        let (doc_processor_mailbox, doc_processor_handle) =
            universe.spawn_builder().spawn(doc_processor);

        let scope_logs = vec![ScopeLogs {
            log_records: vec![
                LogRecord {
                    time_unix_nano: 1_000_000_000,
                    body: Some(OtlpAnyValue {
                        value: Some(OtlpAnyValueValue::StringValue(
                            "foo log message".to_string(),
                        )),
                    }),
                    ..Default::default()
                },
                LogRecord {
                    time_unix_nano: 1_000_000_001,
                    body: Some(OtlpAnyValue {
                        value: Some(OtlpAnyValueValue::StringValue(
                            "bar log message".to_string(),
                        )),
                    }),
                    ..Default::default()
                },
            ],
            ..Default::default()
        }];
        let resource_logs = vec![ResourceLogs {
            scope_logs,
            ..Default::default()
        }];
        let request = ExportLogsServiceRequest { resource_logs };
        let mut raw_doc_buffer = Vec::new();
        request.encode(&mut raw_doc_buffer).unwrap();

        let raw_doc_batch = RawDocBatch::for_test(&[&raw_doc_buffer], 0..2);
        doc_processor_mailbox
            .send_message(raw_doc_batch)
            .await
            .unwrap();

        universe
            .send_exit_with_success(&doc_processor_mailbox)
            .await
            .unwrap();

        let counters = doc_processor_handle
            .process_pending_and_observe()
            .await
            .state;
        assert_eq!(counters.valid.get_num_docs(), 2);

        let batch = indexer_inbox.drain_for_test_typed::<ProcessedDocBatch>();
        assert_eq!(batch.len(), 1);
        assert_eq!(batch[0].docs.len(), 2);

        let (exit_status, _) = doc_processor_handle.join().await;
        assert!(matches!(exit_status, ActorExitStatus::Success));
        universe.assert_quit().await;
    }

    #[tokio::test]
    async fn test_doc_processor_otlp_traces_json() {
        let root_uri = Uri::for_test("ram:///indexes");
        let index_config = OtlpGrpcTracesService::index_config(&root_uri).unwrap();
        let doc_mapper =
            build_doc_mapper(&index_config.doc_mapping, &SearchSettings::default()).unwrap();

        let universe = Universe::with_accelerated_time();
        let (indexer_mailbox, indexer_inbox) = universe.create_test_mailbox();
        let doc_processor = DocProcessor::try_new(
            "my-index".to_string(),
            "my-source".to_string(),
            doc_mapper,
            indexer_mailbox,
            None,
            SourceInputFormat::OtlpTracesJson,
        )
        .unwrap();

        let (doc_processor_mailbox, doc_processor_handle) =
            universe.spawn_builder().spawn(doc_processor);

        let scope_spans = vec![ScopeSpans {
            spans: vec![
                Span {
                    trace_id: vec![1; 16],
                    span_id: vec![2; 8],
                    start_time_unix_nano: 1_000_000_001,
                    end_time_unix_nano: 1_000_000_002,
                    ..Default::default()
                },
                Span {
                    trace_id: vec![3; 16],
                    span_id: vec![4; 8],
                    start_time_unix_nano: 2_000_000_001,
                    end_time_unix_nano: 2_000_000_002,
                    ..Default::default()
                },
            ],
            ..Default::default()
        }];
        let resource_spans = vec![ResourceSpans {
            scope_spans,
            ..Default::default()
        }];
        let request = ExportTraceServiceRequest { resource_spans };
        let raw_doc_json = serde_json::to_vec(&request).unwrap();
        let raw_doc_batch = RawDocBatch::for_test(&[&raw_doc_json], 0..2);
        doc_processor_mailbox
            .send_message(raw_doc_batch)
            .await
            .unwrap();

        universe
            .send_exit_with_success(&doc_processor_mailbox)
            .await
            .unwrap();

        let counters = doc_processor_handle
            .process_pending_and_observe()
            .await
            .state;
        assert_eq!(counters.valid.get_num_docs(), 2);

        let batch = indexer_inbox.drain_for_test_typed::<ProcessedDocBatch>();
        assert_eq!(batch.len(), 1);
        assert_eq!(batch[0].docs.len(), 2);

        let (exit_status, _) = doc_processor_handle.join().await;
        assert!(matches!(exit_status, ActorExitStatus::Success));
        universe.assert_quit().await;
    }

    #[tokio::test]
    async fn test_doc_processor_otlp_traces_proto() {
        let root_uri = Uri::for_test("ram:///indexes");
        let index_config = OtlpGrpcTracesService::index_config(&root_uri).unwrap();
        let doc_mapper =
            build_doc_mapper(&index_config.doc_mapping, &SearchSettings::default()).unwrap();

        let universe = Universe::with_accelerated_time();
        let (indexer_mailbox, indexer_inbox) = universe.create_test_mailbox();
        let doc_processor = DocProcessor::try_new(
            "my-index".to_string(),
            "my-source".to_string(),
            doc_mapper,
            indexer_mailbox,
            None,
            SourceInputFormat::OtlpTracesProtobuf,
        )
        .unwrap();

        let (doc_processor_mailbox, doc_processor_handle) =
            universe.spawn_builder().spawn(doc_processor);

        let scope_spans = vec![ScopeSpans {
            spans: vec![
                Span {
                    trace_id: vec![1; 16],
                    span_id: vec![2; 8],
                    start_time_unix_nano: 1_000_000_001,
                    end_time_unix_nano: 1_000_000_002,
                    ..Default::default()
                },
                Span {
                    trace_id: vec![3; 16],
                    span_id: vec![4; 8],
                    start_time_unix_nano: 2_000_000_001,
                    end_time_unix_nano: 2_000_000_002,
                    ..Default::default()
                },
            ],
            ..Default::default()
        }];
        let resource_spans = vec![ResourceSpans {
            scope_spans,
            ..Default::default()
        }];
        let request = ExportTraceServiceRequest { resource_spans };
        let mut raw_doc_buffer = Vec::new();
        request.encode(&mut raw_doc_buffer).unwrap();

        let raw_doc_batch = RawDocBatch::for_test(&[&raw_doc_buffer], 0..2);
        doc_processor_mailbox
            .send_message(raw_doc_batch)
            .await
            .unwrap();

        universe
            .send_exit_with_success(&doc_processor_mailbox)
            .await
            .unwrap();

        let counters = doc_processor_handle
            .process_pending_and_observe()
            .await
            .state;
        assert_eq!(counters.valid.get_num_docs(), 2);

        let batch = indexer_inbox.drain_for_test_typed::<ProcessedDocBatch>();
        assert_eq!(batch.len(), 1);
        assert_eq!(batch[0].docs.len(), 2);

        let (exit_status, _) = doc_processor_handle.join().await;
        assert!(matches!(exit_status, ActorExitStatus::Success));
        universe.assert_quit().await;
    }
}

#[cfg(feature = "vrl")]
#[cfg(test)]
mod tests_vrl {
    use quickwit_actors::Universe;
    use quickwit_doc_mapper::default_doc_mapper_for_test;
    use quickwit_metastore::checkpoint::SourceCheckpointDelta;
    use tantivy::Document;
    use tantivy::schema::NamedFieldDocument;

    use super::*;

    #[tokio::test]
    async fn test_doc_processor_simple_vrl() -> anyhow::Result<()> {
        let index_id = "my-index";
        let source_id = "my-source";
        let universe = Universe::with_accelerated_time();
        let (indexer_mailbox, indexer_inbox) = universe.create_test_mailbox();
        let doc_mapper = Arc::new(default_doc_mapper_for_test());
        let transform_config = TransformConfig::for_test(".body = upcase(string!(.body))");
        let doc_processor = DocProcessor::try_new(
            index_id.to_string(),
            source_id.to_string(),
            doc_mapper.clone(),
            indexer_mailbox,
            Some(transform_config),
            SourceInputFormat::Json,
        )
        .unwrap();
        let (doc_processor_mailbox, doc_processor_handle) =
            universe.spawn_builder().spawn(doc_processor);
        doc_processor_mailbox
            .send_message(RawDocBatch::for_test(
                &[
                    br#"{"body": "happy", "response_date": "2021-12-19T16:39:57+00:00", "response_time": 12, "response_payload": "YWJj"}"#, // missing timestamp
                    br#"{"body": "happy using VRL", "timestamp": 1628837062, "response_date": "2021-12-19T16:39:59+00:00", "response_time": 2, "response_payload": "YWJj"}"#, // ok
                    br#"{"body": "happy2", "timestamp": 1628837062, "response_date": "2021-12-19T16:40:57+00:00", "response_time": 13, "response_payload": "YWJj"}"#, // ok
                    b"{", // invalid json
                ],
                0..4,
            ))
            .await?;
        let counters = doc_processor_handle
            .process_pending_and_observe()
            .await
            .state;
        assert_eq!(counters.index_id, index_id.to_string());
        assert_eq!(counters.source_id, source_id.to_string());
        assert_eq!(counters.doc_mapper_errors.get_num_docs(), 1);
        assert_eq!(counters.json_parse_errors.get_num_docs(), 1);
        assert_eq!(counters.transform_errors.get_num_docs(), 0);
        assert_eq!(counters.otlp_parse_errors.get_num_docs(), 0);
        assert_eq!(counters.valid.get_num_docs(), 2);
        assert_eq!(counters.num_bytes_total.load(Ordering::Relaxed), 397);

        let output_messages = indexer_inbox.drain_for_test();
        assert_eq!(output_messages.len(), 1);
        let batch = *(output_messages
            .into_iter()
            .next()
            .unwrap()
            .downcast::<ProcessedDocBatch>()
            .unwrap());
        assert_eq!(batch.docs.len(), 2);
        assert_eq!(
            batch.checkpoint_delta,
            SourceCheckpointDelta::from_range(0..4)
        );

        let schema = doc_mapper.schema();
        let NamedFieldDocument(named_field_doc_map) = batch.docs[0].doc.to_named_doc(&schema);
        let doc_json = JsonValue::Object(doc_mapper.doc_to_json(named_field_doc_map)?);
        assert_eq!(
            doc_json,
            serde_json::json!({
                "_source": {
                    "body": "HAPPY USING VRL",
                    "response_date": "2021-12-19T16:39:59Z",
                    "response_payload": "YWJj",
                    "response_time": 2,
                    "timestamp": 1628837062
                },
                "body": "HAPPY USING VRL",
                "response_date": "2021-12-19T16:39:59Z",
                 "response_payload": "YWJj",
                 "response_time": 2.0,
                 "timestamp": 1628837062
            })
        );
        universe.assert_quit().await;
        Ok(())
    }

    #[tokio::test]
    async fn test_doc_processor_with_plain_text_input() {
        let index_id = "my-index";
        let source_id = "my-source";
        let universe = Universe::with_accelerated_time();
        let (indexer_mailbox, indexer_inbox) = universe.create_test_mailbox();
        let doc_mapper = Arc::new(default_doc_mapper_for_test());
        let vrl_script = r#"
            values = parse_csv!(.plain_text)
            .body = upcase(string!(values[0]))
            .timestamp = to_int!(values[1])
            .response_date = values[2]
            .response_time = to_int!(values[3])
            .response_payload = values[4]
            del(.plain_text)
        "#;

        let transform_config = TransformConfig::for_test(vrl_script);
        let doc_processor = DocProcessor::try_new(
            index_id.to_string(),
            source_id.to_string(),
            doc_mapper.clone(),
            indexer_mailbox,
            Some(transform_config),
            SourceInputFormat::PlainText,
        )
        .unwrap();
        let (doc_processor_mailbox, doc_processor_handle) =
            universe.spawn_builder().spawn(doc_processor);
        doc_processor_mailbox
            .send_message(RawDocBatch::for_test(
                &[
                    // body,timestamp,response_date,response_time,response_payload
                    br#""happy using VRL",1628837062,"2021-12-19T16:39:59+00:00",2,"YWJj""#,
                    br#""happy2",1628837062,"2021-12-19T16:40:57+00:00",13,"YWJj""#,
                    br#""happy2",1628837062,"2021-12-19T16:40:57+00:00","invalid-response_time","YWJj""#,
                ],
                0..4,
            ))
            .await.unwrap();
        let counters = doc_processor_handle
            .process_pending_and_observe()
            .await
            .state;
        assert_eq!(counters.index_id, index_id);
        assert_eq!(counters.source_id, source_id);
        assert_eq!(counters.doc_mapper_errors.get_num_docs(), 0,);
        assert_eq!(counters.transform_errors.get_num_docs(), 1,);
        assert_eq!(counters.otlp_parse_errors.get_num_docs(), 0,);
        assert_eq!(counters.valid.get_num_docs(), 2,);
        assert_eq!(counters.num_bytes_total.load(Ordering::Relaxed), 200,);

        let output_messages = indexer_inbox.drain_for_test();
        assert_eq!(output_messages.len(), 1);
        let batch = *(output_messages
            .into_iter()
            .next()
            .unwrap()
            .downcast::<ProcessedDocBatch>()
            .unwrap());
        assert_eq!(batch.docs.len(), 2);
        assert_eq!(
            batch.checkpoint_delta,
            SourceCheckpointDelta::from_range(0..4)
        );

        let schema = doc_mapper.schema();
        let NamedFieldDocument(named_field_doc_map) = batch.docs[0].doc.to_named_doc(&schema);
        let doc_json = JsonValue::Object(doc_mapper.doc_to_json(named_field_doc_map).unwrap());
        assert_eq!(
            doc_json,
            serde_json::json!({
                "_source": {
                    "body": "HAPPY USING VRL",
                    "response_date": "2021-12-19T16:39:59Z",
                    "response_payload": "YWJj",
                    "response_time": 2,
                    "timestamp": 1628837062
                },
                "body": "HAPPY USING VRL",
                "response_date": "2021-12-19T16:39:59Z",
                "response_payload": "YWJj",
                "response_time": 2.0,
                "timestamp": 1628837062
            })
        );
        universe.assert_quit().await;
    }
}


================================================
FILE: quickwit/quickwit-indexing/src/actors/index_serializer.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use async_trait::async_trait;
use quickwit_actors::{Actor, ActorContext, ActorExitStatus, Handler, Mailbox, QueueCapacity};
use quickwit_common::io::IoControls;
use quickwit_common::runtimes::RuntimeType;
use tokio::runtime::Handle;
use tracing::instrument;

use crate::actors::Packager;
use crate::models::{EmptySplit, IndexedSplit, IndexedSplitBatch, IndexedSplitBatchBuilder};

/// The index serializer takes a non-serialized split,
/// and serializes it before passing it to the packager.
///
/// This is usually a CPU heavy operation.
///
/// Depending on the data
/// (terms cardinality) and the index settings (sorted or not)
/// it can range from medium IO to IO heavy.
pub struct IndexSerializer {
    packager_mailbox: Mailbox<Packager>,
}

impl IndexSerializer {
    pub fn new(packager_mailbox: Mailbox<Packager>) -> Self {
        Self { packager_mailbox }
    }
}

#[async_trait]
impl Actor for IndexSerializer {
    type ObservableState = ();

    fn observable_state(&self) -> Self::ObservableState {}

    fn queue_capacity(&self) -> QueueCapacity {
        QueueCapacity::Bounded(0)
    }

    fn runtime_handle(&self) -> Handle {
        RuntimeType::Blocking.get_runtime_handle()
    }
}

#[async_trait]
impl Handler<IndexedSplitBatchBuilder> for IndexSerializer {
    type Reply = ();

    #[instrument(
        name="serialize_split_batch"
        parent=batch_builder.batch_parent_span.id(),
        skip_all,
    )]
    async fn handle(
        &mut self,
        batch_builder: IndexedSplitBatchBuilder,
        ctx: &ActorContext<Self>,
    ) -> Result<(), ActorExitStatus> {
        let mut splits: Vec<IndexedSplit> = Vec::with_capacity(batch_builder.splits.len());
        for split_builder in batch_builder.splits {
            // TODO Consider & test removing this protect guard.
            //
            // In theory the controlled directory should be sufficient.
            let _protect_guard = ctx.protect_zone();
            if let Some(controlled_directory) = &split_builder.controlled_directory_opt {
                let io_controls = IoControls::default()
                    .set_progress(ctx.progress().clone())
                    .set_kill_switch(ctx.kill_switch().clone())
                    .set_component("index_serializer");
                controlled_directory.set_io_controls(io_controls);
            }
            let split = split_builder.finalize()?;
            splits.push(split);
        }
        let indexed_split_batch = IndexedSplitBatch {
            splits,
            checkpoint_delta_opt: batch_builder.checkpoint_delta_opt,
            publish_lock: batch_builder.publish_lock,
            publish_token_opt: batch_builder.publish_token_opt,
            merge_task_opt: None,
            batch_parent_span: batch_builder.batch_parent_span,
        };
        ctx.send_message(&self.packager_mailbox, indexed_split_batch)
            .await?;
        Ok(())
    }
}

#[async_trait]
impl Handler<EmptySplit> for IndexSerializer {
    type Reply = ();

    #[instrument(
        name="serialize_empty_split"
        parent=empty_split.batch_parent_span.id(),
        skip_all,
    )]
    async fn handle(
        &mut self,
        empty_split: EmptySplit,
        ctx: &ActorContext<Self>,
    ) -> Result<(), ActorExitStatus> {
        ctx.send_message(&self.packager_mailbox, empty_split)
            .await?;
        Ok(())
    }
}


================================================
FILE: quickwit/quickwit-indexing/src/actors/indexer.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::hash_map::Entry;
use std::num::NonZeroU32;
use std::ops::RangeInclusive;
use std::sync::Arc;

use anyhow::Context;
use async_trait::async_trait;
use bytesize::ByteSize;
use fail::fail_point;
use fnv::FnvHashMap;
use itertools::Itertools;
use quickwit_actors::{
    Actor, ActorContext, ActorExitStatus, Command, Handler, Mailbox, QueueCapacity,
};
use quickwit_common::io::IoControls;
use quickwit_common::metrics::GaugeGuard;
use quickwit_common::runtimes::RuntimeType;
use quickwit_common::temp_dir::TempDirectory;
use quickwit_config::IndexingSettings;
use quickwit_doc_mapper::DocMapper;
use quickwit_metastore::checkpoint::{IndexCheckpointDelta, SourceCheckpointDelta};
use quickwit_proto::indexing::{IndexingPipelineId, PipelineMetrics};
use quickwit_proto::metastore::{
    LastDeleteOpstampRequest, MetastoreService, MetastoreServiceClient,
};
use quickwit_proto::types::{DocMappingUid, PublishToken};
use quickwit_query::get_quickwit_fastfield_normalizer_manager;
use serde::Serialize;
use tantivy::schema::Schema;
use tantivy::store::{Compressor, ZstdCompressor};
use tantivy::tokenizer::TokenizerManager;
use tantivy::{DateTime, IndexBuilder, IndexSettings};
use tokio::runtime::Handle;
use tokio::sync::Semaphore;
use tracing::{Span, info, info_span, warn};
use ulid::Ulid;

use crate::actors::IndexSerializer;
use crate::actors::cooperative_indexing::{CooperativeIndexingCycle, CooperativeIndexingPeriod};
use crate::models::{
    CommitTrigger, EmptySplit, IndexedSplitBatchBuilder, IndexedSplitBuilder, NewPublishLock,
    NewPublishToken, ProcessedDoc, ProcessedDocBatch, PublishLock,
};

// Random partition ID used to gather partitions exceeding the maximum number of partitions.
const OTHER_PARTITION_ID: u64 = 3264326757911759461u64;

#[derive(Debug)]
struct CommitTimeout {
    workbench_id: Ulid,
}

#[derive(Clone, Debug, Default, Eq, PartialEq, Serialize)]
pub struct IndexerCounters {
    /// Number of splits that were emitted by the indexer.
    pub num_splits_emitted: u64,

    /// Number of split batches that were emitted by the indexer.
    pub num_split_batches_emitted: u64,

    /// Number of (valid) documents in the current workbench.
    /// This value is used to trigger commit and for observation.
    pub num_docs_in_workbench: u64,

    /// Number of ProcessDocBatch received by the indexer to
    /// build this split.
    pub num_doc_batches_in_workbench: u64,

    /// Metrics describing the load and indexing performance of the
    /// pipeline. This is only updated for cooperative indexers.
    pub pipeline_metrics_opt: Option<PipelineMetrics>,
}

struct IndexerState {
    pipeline_id: IndexingPipelineId,
    metastore: MetastoreServiceClient,
    indexing_directory: TempDirectory,
    indexing_settings: IndexingSettings,
    publish_lock: PublishLock,
    publish_token_opt: Option<PublishToken>,
    schema: Schema,
    doc_mapping_uid: DocMappingUid,
    tokenizer_manager: TokenizerManager,
    max_num_partitions: NonZeroU32,
    index_settings: IndexSettings,
    cooperative_indexing_opt: Option<CooperativeIndexingCycle>,
}

impl IndexerState {
    fn create_indexed_split_builder(
        &self,
        partition_id: u64,
        last_delete_opstamp: u64,
        ctx: &ActorContext<Indexer>,
    ) -> anyhow::Result<IndexedSplitBuilder> {
        let index_builder = IndexBuilder::new()
            .settings(self.index_settings.clone())
            .schema(self.schema.clone())
            .tokenizers(self.tokenizer_manager.clone())
            .fast_field_tokenizers(
                get_quickwit_fastfield_normalizer_manager()
                    .tantivy_manager()
                    .clone(),
            );

        let io_controls = IoControls::default()
            .set_progress(ctx.progress().clone())
            .set_kill_switch(ctx.kill_switch().clone())
            .set_component("indexer");

        let indexed_split = IndexedSplitBuilder::new_in_dir(
            self.pipeline_id.clone(),
            partition_id,
            last_delete_opstamp,
            self.doc_mapping_uid,
            self.indexing_directory.clone(),
            index_builder,
            io_controls,
        )?;
        info!(
            split_id=%indexed_split.split_id(),
            partition_id=%partition_id,
            "new-split"
        );
        Ok(indexed_split)
    }

    fn get_or_create_indexed_split<'a>(
        &self,
        partition_id: u64,
        last_delete_opstamp: u64,
        splits: &'a mut FnvHashMap<u64, IndexedSplitBuilder>,
        other_split_opt: &'a mut Option<IndexedSplitBuilder>,
        counter: &'a mut IndexerCounters,
        ctx: &ActorContext<Indexer>,
    ) -> anyhow::Result<(&'a mut IndexedSplitBuilder, bool)> {
        let num_splits = splits.len();
        match splits.entry(partition_id) {
            Entry::Occupied(indexed_split) => Ok((indexed_split.into_mut(), false)),
            Entry::Vacant(vacant_entry) => {
                if num_splits as u32 >= self.max_num_partitions.get() {
                    // In order to avoid exceeding max_num_partitions, we map the document to the
                    // `OTHER` special partition.
                    if other_split_opt.is_none() {
                        warn!(
                            num_docs_in_workbench = counter.num_docs_in_workbench,
                            max_num_partition = self.max_num_partitions.get(),
                            "Exceeding max_num_partition"
                        );
                        let new_other_split = self.create_indexed_split_builder(
                            OTHER_PARTITION_ID,
                            last_delete_opstamp,
                            ctx,
                        )?;
                        *other_split_opt = Some(new_other_split);
                    }
                    Ok((other_split_opt.as_mut().unwrap(), true))
                } else {
                    let indexed_split =
                        self.create_indexed_split_builder(partition_id, last_delete_opstamp, ctx)?;
                    Ok((vacant_entry.insert(indexed_split), true))
                }
            }
        }
    }

    async fn create_workbench(
        &self,
        ctx: &ActorContext<Indexer>,
    ) -> anyhow::Result<IndexingWorkbench> {
        let workbench_id = Ulid::new();
        let batch_parent_span = info_span!(target: "quickwit-indexing", "index-doc-batches",
            index_id=%self.pipeline_id.index_uid.index_id,
            source_id=%self.pipeline_id.source_id,
            pipeline_uid=%self.pipeline_id.pipeline_uid,
            workbench_id=%workbench_id,
        );
        let indexing_span = info_span!(parent: batch_parent_span.id(), "indexer");
        let cooperative_indexing_period =
            if let Some(cooperative_indexing) = &self.cooperative_indexing_opt {
                Some(
                    ctx.protect_future(cooperative_indexing.cooperative_indexing_period())
                        .await,
                )
            } else {
                None
            };

        let last_delete_opstamp_request = LastDeleteOpstampRequest {
            index_uid: Some(self.pipeline_id.index_uid.clone()),
        };
        let last_delete_opstamp_response = ctx
            .protect_future(
                self.metastore
                    .clone()
                    .last_delete_opstamp(last_delete_opstamp_request),
            )
            .await?;
        let last_delete_opstamp = last_delete_opstamp_response.last_delete_opstamp;

        let checkpoint_delta = IndexCheckpointDelta {
            source_id: self.pipeline_id.source_id.clone(),
            source_delta: SourceCheckpointDelta::default(),
        };
        let publish_lock = self.publish_lock.clone();
        let publish_token_opt = self.publish_token_opt.clone();

        let mut split_builders_guard =
            GaugeGuard::from_gauge(&crate::metrics::INDEXER_METRICS.split_builders);
        split_builders_guard.add(1);

        let workbench = IndexingWorkbench {
            workbench_id,
            batch_parent_span,
            _indexing_span: indexing_span,
            indexed_splits: FnvHashMap::with_capacity_and_hasher(250, Default::default()),
            other_indexed_split_opt: None,
            checkpoint_delta,
            publish_lock,
            publish_token_opt,
            last_delete_opstamp,
            memory_usage: GaugeGuard::from_gauge(
                &quickwit_common::metrics::MEMORY_METRICS
                    .in_flight
                    .index_writer,
            ),
            cooperative_indexing_period,
            split_builders_guard,
        };
        Ok(workbench)
    }

    /// Returns the current_indexed_split. If this is the first message, then
    /// the indexed_split does not exist yet.
    ///
    /// This function will then create it, and can hence return an Error.
    async fn get_or_create_workbench<'a>(
        &'a self,
        indexing_workbench_opt: &'a mut Option<IndexingWorkbench>,
        ctx: &'a ActorContext<Indexer>,
    ) -> anyhow::Result<&'a mut IndexingWorkbench> {
        if indexing_workbench_opt.is_none() {
            let indexing_workbench = self.create_workbench(ctx).await?;
            let commit_timeout_message = CommitTimeout {
                workbench_id: indexing_workbench.workbench_id,
            };
            ctx.schedule_self_msg(
                self.indexing_settings.commit_timeout(),
                commit_timeout_message,
            );
            *indexing_workbench_opt = Some(indexing_workbench);
        }
        let current_indexing_workbench = indexing_workbench_opt.as_mut().context(
            "no index writer available. this should never happen! please, report on https://github.com/quickwit-oss/quickwit/issues"
        )?;
        Ok(current_indexing_workbench)
    }

    async fn index_batch(
        &self,
        batch: ProcessedDocBatch,
        indexing_workbench_opt: &mut Option<IndexingWorkbench>,
        counters: &mut IndexerCounters,
        ctx: &ActorContext<Indexer>,
    ) -> Result<(), ActorExitStatus> {
        let IndexingWorkbench {
            checkpoint_delta,
            indexed_splits,
            other_indexed_split_opt,
            publish_lock,
            last_delete_opstamp,
            memory_usage,
            ..
        } = self
            .get_or_create_workbench(indexing_workbench_opt, ctx)
            .await?;
        if publish_lock.is_dead() {
            // Release indexing permit early.
            indexing_workbench_opt.take();
            return Ok(());
        }
        checkpoint_delta
            .source_delta
            .extend(batch.checkpoint_delta)
            .context("batch delta does not follow indexer checkpoint")?;
        let mut memory_usage_delta: i64 = 0;
        counters.num_doc_batches_in_workbench += 1;
        for doc in batch.docs {
            let ProcessedDoc {
                doc,
                timestamp_opt,
                partition,
                num_bytes,
            } = doc;
            counters.num_docs_in_workbench += 1;
            let (indexed_split, split_created) = self.get_or_create_indexed_split(
                partition,
                *last_delete_opstamp,
                indexed_splits,
                other_indexed_split_opt,
                counters,
                ctx,
            )?;
            let mem_usage_before = indexed_split.index_writer.mem_usage() as u64;
            if split_created {
                // The split was just created. We need to account for the initial index writer's
                // memory usage.
                memory_usage_delta += mem_usage_before as i64;
            }
            indexed_split.split_attrs.uncompressed_docs_size_in_bytes += num_bytes as u64;
            indexed_split.split_attrs.num_docs += 1;
            if let Some(timestamp) = timestamp_opt {
                record_timestamp(timestamp, &mut indexed_split.split_attrs.time_range);
            }
            let _protect_guard = ctx.protect_zone();
            indexed_split
                .index_writer
                .add_document(doc)
                .context("failed to add document")?;
            let mem_usage_after = indexed_split.index_writer.mem_usage() as u64;
            memory_usage_delta += mem_usage_after as i64 - mem_usage_before as i64;
            ctx.record_progress();
        }
        memory_usage.add(memory_usage_delta);
        Ok(())
    }
}

/// A workbench hosts the set of `IndexedSplit` that are being built.
struct IndexingWorkbench {
    workbench_id: Ulid,
    // This span is meant to be passed through the pipeline.
    batch_parent_span: Span,
    // Span for the in-memory indexing (done in the Indexer actor).
    _indexing_span: Span,

    indexed_splits: FnvHashMap<u64, IndexedSplitBuilder>,
    other_indexed_split_opt: Option<IndexedSplitBuilder>,

    checkpoint_delta: IndexCheckpointDelta,
    publish_lock: PublishLock,
    publish_token_opt: Option<PublishToken>,
    // On workbench creation, we fetch from the metastore the last delete task opstamp.
    // We use this value to set the `delete_opstamp` of the workbench splits.
    last_delete_opstamp: u64,
    // Number of bytes declared as used by tantivy.
    memory_usage: GaugeGuard<'static>,
    split_builders_guard: GaugeGuard<'static>,
    cooperative_indexing_period: Option<CooperativeIndexingPeriod>,
}

pub struct Indexer {
    indexer_state: IndexerState,
    index_serializer_mailbox: Mailbox<IndexSerializer>,
    indexing_workbench_opt: Option<IndexingWorkbench>,
    counters: IndexerCounters,
}

#[async_trait]
impl Actor for Indexer {
    type ObservableState = IndexerCounters;

    fn observable_state(&self) -> Self::ObservableState {
        self.counters.clone()
    }

    fn queue_capacity(&self) -> QueueCapacity {
        QueueCapacity::Bounded(10)
    }

    fn name(&self) -> String {
        "Indexer".to_string()
    }

    fn runtime_handle(&self) -> Handle {
        RuntimeType::Blocking.get_runtime_handle()
    }

    #[inline]
    fn yield_after_each_message(&self) -> bool {
        false
    }

    async fn initialize(&mut self, ctx: &ActorContext<Self>) -> Result<(), ActorExitStatus> {
        if let Some(cooperative_indexing_cycle) = &self.indexer_state.cooperative_indexing_opt {
            let initial_sleep_duration = cooperative_indexing_cycle.initial_sleep_duration();
            ctx.pause();
            ctx.schedule_self_msg(initial_sleep_duration, Command::Resume);
        }
        Ok(())
    }

    async fn on_drained_messages(
        &mut self,
        ctx: &ActorContext<Self>,
    ) -> Result<(), ActorExitStatus> {
        let Some(indexing_workbench) = &mut self.indexing_workbench_opt else {
            return Ok(());
        };

        let Some(cooperative_indexing_period) =
            indexing_workbench.cooperative_indexing_period.take()
        else {
            return Ok(());
        };

        let uncompressed_num_bytes = indexing_workbench
            .indexed_splits
            .values()
            .map(|split| split.split_attrs.uncompressed_docs_size_in_bytes)
            .sum::<u64>();

        // This also drops the indexing permit.
        let (sleep_duration, pipeline_metrics) =
            cooperative_indexing_period.end_of_work(uncompressed_num_bytes);

        self.counters.pipeline_metrics_opt = Some(pipeline_metrics);

        self.send_to_serializer(CommitTrigger::Drained, ctx).await?;

        if !sleep_duration.is_zero() {
            ctx.pause();
            ctx.schedule_self_msg(sleep_duration, Command::Resume);
        }

        Ok(())
    }

    async fn finalize(
        &mut self,
        exit_status: &ActorExitStatus,
        ctx: &ActorContext<Self>,
    ) -> anyhow::Result<()> {
        match exit_status {
            ActorExitStatus::DownstreamClosed
            | ActorExitStatus::Killed
            | ActorExitStatus::Failure(_)
            | ActorExitStatus::Panicked => return Ok(()),
            ActorExitStatus::Quit | ActorExitStatus::Success => {
                let _ = self
                    .send_to_serializer(CommitTrigger::NoMoreDocs, ctx)
                    .await;
            }
        }
        Ok(())
    }
}

fn record_timestamp(timestamp: DateTime, time_range: &mut Option<RangeInclusive<DateTime>>) {
    let new_timestamp_range = match time_range {
        Some(range) => timestamp.min(*range.start())..=timestamp.max(*range.end()),
        None => timestamp..=timestamp,
    };
    *time_range = Some(new_timestamp_range);
}

#[async_trait]
impl Handler<CommitTimeout> for Indexer {
    type Reply = ();

    async fn handle(
        &mut self,
        commit_timeout: CommitTimeout,
        ctx: &ActorContext<Self>,
    ) -> Result<(), ActorExitStatus> {
        if let Some(indexing_workbench) = &self.indexing_workbench_opt {
            // If this is a timeout for a different workbench, we must ignore it.
            if indexing_workbench.workbench_id != commit_timeout.workbench_id {
                return Ok(());
            }
        }
        self.send_to_serializer(CommitTrigger::Timeout, ctx).await?;
        Ok(())
    }
}

#[async_trait]
impl Handler<ProcessedDocBatch> for Indexer {
    type Reply = ();

    async fn handle(
        &mut self,
        doc_batch: ProcessedDocBatch,
        ctx: &ActorContext<Self>,
    ) -> Result<(), ActorExitStatus> {
        self.index_batch(doc_batch, ctx).await
    }
}

#[async_trait]
impl Handler<NewPublishLock> for Indexer {
    type Reply = ();

    async fn handle(
        &mut self,
        message: NewPublishLock,
        _ctx: &ActorContext<Self>,
    ) -> Result<(), ActorExitStatus> {
        let NewPublishLock(publish_lock) = message;
        self.indexing_workbench_opt = None;
        self.indexer_state.publish_lock = publish_lock;
        Ok(())
    }
}

#[async_trait]
impl Handler<NewPublishToken> for Indexer {
    type Reply = ();

    async fn handle(
        &mut self,
        message: NewPublishToken,
        _ctx: &ActorContext<Self>,
    ) -> Result<(), ActorExitStatus> {
        let NewPublishToken(publish_token) = message;
        self.indexer_state.publish_token_opt = Some(publish_token);
        Ok(())
    }
}

impl Indexer {
    pub fn new(
        pipeline_id: IndexingPipelineId,
        doc_mapper: Arc<DocMapper>,
        metastore: MetastoreServiceClient,
        indexing_directory: TempDirectory,
        indexing_settings: IndexingSettings,
        cooperative_indexing_permits_opt: Option<Arc<Semaphore>>,
        index_serializer_mailbox: Mailbox<IndexSerializer>,
    ) -> Self {
        let schema = doc_mapper.schema();
        let tokenizer_manager = doc_mapper.tokenizer_manager().clone();
        let docstore_compression = Compressor::Zstd(ZstdCompressor {
            compression_level: Some(indexing_settings.docstore_compression_level),
        });
        let index_settings = IndexSettings {
            docstore_blocksize: indexing_settings.docstore_blocksize,
            docstore_compression,
            docstore_compress_dedicated_thread: true,
        };
        let cooperative_indexing_opt: Option<CooperativeIndexingCycle> =
            cooperative_indexing_permits_opt.map(|cooperative_indexing_permits| {
                CooperativeIndexingCycle::new(
                    &pipeline_id,
                    indexing_settings.commit_timeout(),
                    cooperative_indexing_permits,
                )
            });
        Self {
            indexer_state: IndexerState {
                pipeline_id,
                metastore: metastore.clone(),
                indexing_directory,
                indexing_settings,
                publish_lock: PublishLock::default(),
                publish_token_opt: None,
                schema,
                doc_mapping_uid: doc_mapper.doc_mapping_uid(),
                tokenizer_manager: tokenizer_manager.tantivy_manager().clone(),
                index_settings,
                max_num_partitions: doc_mapper.max_num_partitions(),
                cooperative_indexing_opt,
            },
            index_serializer_mailbox,
            indexing_workbench_opt: None,
            counters: IndexerCounters::default(),
        }
    }

    fn memory_usage(&self) -> ByteSize {
        if let Some(workbench) = &self.indexing_workbench_opt {
            ByteSize(workbench.memory_usage.get() as u64)
        } else {
            ByteSize(0u64)
        }
    }

    async fn index_batch(
        &mut self,
        batch: ProcessedDocBatch,
        ctx: &ActorContext<Self>,
    ) -> Result<(), ActorExitStatus> {
        fail_point!("indexer:batch:before");
        let force_commit = batch.force_commit;
        self.indexer_state
            .index_batch(
                batch,
                &mut self.indexing_workbench_opt,
                &mut self.counters,
                ctx,
            )
            .await?;
        let memory_usage = self.memory_usage();
        if memory_usage >= self.indexer_state.indexing_settings.resources.heap_size {
            self.send_to_serializer(CommitTrigger::MemoryLimit, ctx)
                .await?;
        }
        if self.counters.num_docs_in_workbench
            >= self.indexer_state.indexing_settings.split_num_docs_target as u64
        {
            self.send_to_serializer(CommitTrigger::NumDocsLimit, ctx)
                .await?;
        }
        if force_commit {
            self.send_to_serializer(CommitTrigger::ForceCommit, ctx)
                .await?;
        }
        fail_point!("indexer:batch:after");
        Ok(())
    }

    /// Extract the indexed split and send it to the IndexSerializer.
    async fn send_to_serializer(
        &mut self,
        commit_trigger: CommitTrigger,
        ctx: &ActorContext<Self>,
    ) -> anyhow::Result<()> {
        let Some(IndexingWorkbench {
            indexed_splits,
            other_indexed_split_opt,
            checkpoint_delta,
            publish_lock,
            publish_token_opt,
            batch_parent_span,
            memory_usage,
            split_builders_guard,
            ..
        }) = self.indexing_workbench_opt.take()
        else {
            return Ok(());
        };

        let mut splits: Vec<IndexedSplitBuilder> = indexed_splits.into_values().collect();

        if let Some(other_split) = other_indexed_split_opt {
            splits.push(other_split)
        }

        // Avoid producing empty split, but still update the checkpoint if it is not empty to avoid
        // reprocessing the same faulty documents.
        if splits.is_empty() {
            if !checkpoint_delta.is_empty() {
                ctx.send_message(
                    &self.index_serializer_mailbox,
                    EmptySplit {
                        index_uid: self.indexer_state.pipeline_id.index_uid.clone(),
                        checkpoint_delta,
                        publish_lock,
                        publish_token_opt,
                        batch_parent_span,
                    },
                )
                .await?;
            }
            return Ok(());
        }
        let num_splits = splits.len() as u64;
        let split_ids = splits.iter().map(|split| split.split_id()).join(",");
        info!(
            index=%self.indexer_state.pipeline_id.index_uid,
            source=self.indexer_state.pipeline_id.source_id.as_str(),
            pipeline_uid=%self.indexer_state.pipeline_id.pipeline_uid,
            commit_trigger=?commit_trigger,
            num_batches=%self.counters.num_doc_batches_in_workbench,
            split_ids=%split_ids,
            num_docs=self.counters.num_docs_in_workbench, "send-to-index-serializer");
        ctx.send_message(
            &self.index_serializer_mailbox,
            IndexedSplitBatchBuilder {
                splits,
                checkpoint_delta_opt: Some(checkpoint_delta),
                publish_lock,
                publish_token_opt,
                commit_trigger,
                batch_parent_span,
                memory_usage,
                _split_builders_guard: split_builders_guard,
            },
        )
        .await?;
        self.counters.num_docs_in_workbench = 0;
        self.counters.num_doc_batches_in_workbench = 0;
        self.counters.num_splits_emitted += num_splits;
        self.counters.num_split_batches_emitted += 1;
        Ok(())
    }
}

#[cfg(test)]
mod tests {
    use std::fmt::Write;
    use std::sync::Arc;
    use std::time::Duration;

    use quickwit_actors::Universe;
    use quickwit_doc_mapper::{DocMapper, default_doc_mapper_for_test};
    use quickwit_metastore::checkpoint::SourceCheckpointDelta;
    use quickwit_proto::metastore::{
        EmptyResponse, LastDeleteOpstampResponse, MockMetastoreService,
    };
    use quickwit_proto::types::{IndexUid, NodeId, PipelineUid};
    use tantivy::{DateTime, doc};

    use super::*;
    use crate::actors::indexer::{IndexerCounters, record_timestamp};

    #[test]
    fn test_record_timestamp() {
        let mut time_range = None;
        record_timestamp(DateTime::from_timestamp_secs(1628664679), &mut time_range);
        assert_eq!(
            time_range,
            Some(
                DateTime::from_timestamp_secs(1628664679)
                    ..=DateTime::from_timestamp_secs(1628664679)
            )
        );
        record_timestamp(DateTime::from_timestamp_secs(1628664112), &mut time_range);
        assert_eq!(
            time_range,
            Some(
                DateTime::from_timestamp_secs(1628664112)
                    ..=DateTime::from_timestamp_secs(1628664679)
            )
        );
        record_timestamp(DateTime::from_timestamp_secs(1628665112), &mut time_range);
        assert_eq!(
            time_range,
            Some(
                DateTime::from_timestamp_secs(1628664112)
                    ..=DateTime::from_timestamp_secs(1628665112)
            )
        )
    }

    #[tokio::test]
    async fn test_indexer_triggers_commit_on_target_num_docs() -> anyhow::Result<()> {
        let index_uid = IndexUid::new_with_random_ulid("test-index");
        let pipeline_id = IndexingPipelineId {
            index_uid: index_uid.clone(),
            source_id: "test-source".to_string(),
            node_id: NodeId::from("test-node"),
            pipeline_uid: PipelineUid::default(),
        };
        let doc_mapper = Arc::new(default_doc_mapper_for_test());
        let last_delete_opstamp = 10;
        let schema = doc_mapper.schema();
        let body_field = schema.get_field("body").unwrap();
        let timestamp_field = schema.get_field("timestamp").unwrap();
        let indexing_directory = TempDirectory::for_test();
        let mut indexing_settings = IndexingSettings::for_test();
        indexing_settings.split_num_docs_target = 3;
        let universe = Universe::with_accelerated_time();
        let (index_serializer_mailbox, index_serializer_inbox) = universe.create_test_mailbox();
        let mut mock_metastore = MockMetastoreService::new();
        mock_metastore.expect_publish_splits().never();
        mock_metastore
            .expect_last_delete_opstamp()
            .times(2)
            .returning(move |delete_opstamp_request| {
                assert_eq!(delete_opstamp_request.index_uid(), &index_uid);
                Ok(LastDeleteOpstampResponse::new(last_delete_opstamp))
            });
        mock_metastore.expect_publish_splits().never();
        let indexer = Indexer::new(
            pipeline_id,
            doc_mapper,
            MetastoreServiceClient::from_mock(mock_metastore),
            indexing_directory,
            indexing_settings,
            None,
            index_serializer_mailbox,
        );
        let (indexer_mailbox, indexer_handle) = universe.spawn_builder().spawn(indexer);
        indexer_mailbox
            .send_message(ProcessedDocBatch::new(
                vec![
                    ProcessedDoc {
                        doc: doc!(
                            body_field=>"this is a test document",
                            timestamp_field=>DateTime::from_timestamp_secs(1_662_529_435)
                        ),
                        timestamp_opt: Some(DateTime::from_timestamp_secs(1_662_529_435)),
                        partition: 1,
                        num_bytes: 30,
                    },
                    ProcessedDoc {
                        doc: doc!(
                            body_field=>"this is a test document 2",
                            timestamp_field=>DateTime::from_timestamp_secs(1_662_529_435)
                        ),
                        timestamp_opt: Some(DateTime::from_timestamp_secs(1_662_529_435)),
                        partition: 1,
                        num_bytes: 30,
                    },
                ],
                SourceCheckpointDelta::from_range(4..6),
                false,
            ))
            .await?;
        indexer_mailbox
            .send_message(ProcessedDocBatch::new(
                vec![
                    ProcessedDoc {
                        doc: doc!(
                            body_field=>"this is a test document 3",
                            timestamp_field=>DateTime::from_timestamp_secs(1_662_529_435i64)
                        ),
                        timestamp_opt: Some(DateTime::from_timestamp_secs(1_662_529_435i64)),
                        partition: 1,
                        num_bytes: 30,
                    },
                    ProcessedDoc {
                        doc: doc!(
                            body_field=>"this is a test document 4",
                            timestamp_field=>DateTime::from_timestamp_secs(1_662_529_435)
                        ),
                        timestamp_opt: Some(DateTime::from_timestamp_secs(1_662_529_435)),
                        partition: 1,
                        num_bytes: 30,
                    },
                ],
                SourceCheckpointDelta::from_range(6..8),
                false,
            ))
            .await?;
        indexer_mailbox
            .send_message(ProcessedDocBatch::new(
                vec![ProcessedDoc {
                    doc: doc!(
                        body_field=>"this is a test document 5",
                        timestamp_field=>DateTime::from_timestamp_secs(1_662_529_435)
                    ),
                    timestamp_opt: Some(DateTime::from_timestamp_secs(1_662_529_435)),
                    partition: 1,
                    num_bytes: 30,
                }],
                SourceCheckpointDelta::from_range(8..9),
                false,
            ))
            .await?;
        let indexer_counters = indexer_handle.process_pending_and_observe().await.state;
        assert_eq!(
            indexer_counters,
            IndexerCounters {
                num_splits_emitted: 1,
                num_split_batches_emitted: 1,
                num_docs_in_workbench: 1, //< the num docs in split counter has been reset.
                num_doc_batches_in_workbench: 1, //< the num docs in split counter has been reset.
                pipeline_metrics_opt: None,
            }
        );
        let messages: Vec<IndexedSplitBatchBuilder> = index_serializer_inbox.drain_for_test_typed();
        assert_eq!(messages.len(), 1);
        let batch = messages.into_iter().next().unwrap();
        assert_eq!(batch.commit_trigger, CommitTrigger::NumDocsLimit);
        assert_eq!(batch.splits[0].split_attrs.num_docs, 4);
        for split in batch.splits.iter() {
            assert_eq!(split.split_attrs.delete_opstamp, last_delete_opstamp);
        }
        let index_checkpoint = batch.checkpoint_delta_opt.unwrap();
        assert_eq!(index_checkpoint.source_id, "test-source");
        assert_eq!(
            index_checkpoint.source_delta,
            SourceCheckpointDelta::from_range(4..8)
        );
        batch.splits.into_iter().next().unwrap().finalize()?;
        universe.assert_quit().await;
        Ok(())
    }

    #[tokio::test]
    async fn test_indexer_triggers_commit_on_memory_limit() -> anyhow::Result<()> {
        let universe = Universe::new();
        let index_uid = IndexUid::new_with_random_ulid("test-index");
        let pipeline_id = IndexingPipelineId {
            index_uid: index_uid.clone(),
            source_id: "test-source".to_string(),
            node_id: NodeId::from("test-node"),
            pipeline_uid: PipelineUid::default(),
        };
        let doc_mapper = Arc::new(default_doc_mapper_for_test());
        let last_delete_opstamp = 10;
        let schema = doc_mapper.schema();
        let body_field = schema.get_field("body").unwrap();
        let indexing_directory = TempDirectory::for_test();
        let mut indexing_settings = IndexingSettings::for_test();
        indexing_settings.resources.heap_size = ByteSize::mb(16);
        let (index_serializer_mailbox, index_serializer_inbox) = universe.create_test_mailbox();
        let mut mock_metastore = MockMetastoreService::new();
        mock_metastore.expect_publish_splits().never();
        mock_metastore
            .expect_last_delete_opstamp()
            .times(1..=2)
            .returning(move |last_delete_opstamp_request| {
                assert_eq!(last_delete_opstamp_request.index_uid(), &index_uid);
                Ok(LastDeleteOpstampResponse::new(last_delete_opstamp))
            });
        mock_metastore.expect_publish_splits().never();
        let indexer = Indexer::new(
            pipeline_id,
            doc_mapper,
            MetastoreServiceClient::from_mock(mock_metastore),
            indexing_directory,
            indexing_settings,
            None,
            index_serializer_mailbox,
        );
        let (indexer_mailbox, _indexer_handle) = universe.spawn_builder().spawn(indexer);

        let make_doc = |i: u64| {
            let mut body = String::new();
            for val in 100 * i..100 * (i + 1) {
                write!(&mut body, "{val} ").unwrap();
            }
            let num_bytes = body.len() * 2;
            ProcessedDoc {
                doc: doc!(body_field=>body),
                timestamp_opt: None,
                partition: 0,
                num_bytes,
            }
        };
        for i in 0..10_000 {
            indexer_mailbox
                .send_message(ProcessedDocBatch::new(
                    vec![make_doc(i)],
                    SourceCheckpointDelta::from_range(i..i + 1),
                    false,
                ))
                .await?;
            let output_messages: Vec<IndexedSplitBatchBuilder> =
                index_serializer_inbox.drain_for_test_typed();
            if !output_messages.is_empty() {
                assert_eq!(output_messages.len(), 1);
                assert_eq!(
                    output_messages[0].commit_trigger,
                    CommitTrigger::MemoryLimit
                );
                // The following assert is not a strict one. It should help detect large
                // regression in memory usage.
                assert!((500..3_000).contains(&i));
                break;
            }
        }
        universe.assert_quit().await;
        Ok(())
    }

    #[tokio::test]
    async fn test_indexer_triggers_commit_on_timeout() -> anyhow::Result<()> {
        let universe = Universe::new();
        let pipeline_id = IndexingPipelineId {
            index_uid: IndexUid::new_with_random_ulid("test-index"),
            source_id: "test-source".to_string(),
            node_id: NodeId::from("test-node"),
            pipeline_uid: PipelineUid::default(),
        };
        let doc_mapper = Arc::new(default_doc_mapper_for_test());
        let last_delete_opstamp = 10;
        let schema = doc_mapper.schema();
        let body_field = schema.get_field("body").unwrap();
        let timestamp_field = schema.get_field("timestamp").unwrap();
        let indexing_directory = TempDirectory::for_test();
        let mut indexing_settings = IndexingSettings::for_test();
        indexing_settings.commit_timeout_secs = 1;
        let (index_serializer_mailbox, index_serializer_inbox) = universe.create_test_mailbox();
        let mut mock_metastore = MockMetastoreService::new();
        mock_metastore.expect_publish_splits().never();
        mock_metastore.expect_last_delete_opstamp().returning(
            move |_last_delete_opstamp_request| {
                Ok(LastDeleteOpstampResponse::new(last_delete_opstamp))
            },
        );
        mock_metastore.expect_publish_splits().never();
        let indexer = Indexer::new(
            pipeline_id,
            doc_mapper,
            MetastoreServiceClient::from_mock(mock_metastore),
            indexing_directory,
            indexing_settings,
            None,
            index_serializer_mailbox,
        );
        let (indexer_mailbox, indexer_handle) = universe.spawn_builder().spawn(indexer);
        tokio::task::spawn({
            let indexer_mailbox = indexer_mailbox.clone();
            async move {
                let mut position = 0;
                while indexer_mailbox
                    .send_message(ProcessedDocBatch::new(
                        vec![ProcessedDoc {
                            doc: doc!(
                                body_field=>"this is a test document",
                                timestamp_field=>DateTime::from_timestamp_secs(1_662_529_435)
                            ),
                            timestamp_opt: Some(DateTime::from_timestamp_secs(1_662_529_435)),
                            partition: 1,
                            num_bytes: 30,
                        }],
                        SourceCheckpointDelta::from_range(position..position + 1),
                        false,
                    ))
                    .await
                    .is_ok()
                {
                    position += 1;
                }
            }
        });
        universe.sleep(Duration::from_secs(3)).await;

        let indexer_counters = indexer_handle.process_pending_and_observe().await.state;
        assert!(indexer_counters.num_splits_emitted > 0);
        assert!(indexer_counters.num_split_batches_emitted > 0);

        let indexed_serializer_messages: Vec<IndexedSplitBatchBuilder> =
            index_serializer_inbox.drain_for_test_typed();
        assert!(!indexed_serializer_messages.is_empty());
        assert_eq!(
            indexed_serializer_messages[0].commit_trigger,
            CommitTrigger::Timeout
        );
        assert!(
            indexed_serializer_messages[0].splits[0]
                .split_attrs
                .num_docs
                > 0
        );
        universe.assert_quit().await;
        Ok(())
    }

    #[tokio::test]
    async fn test_indexer_triggers_commit_on_drained_mailbox() -> anyhow::Result<()> {
        let universe = Universe::new();
        let pipeline_id = IndexingPipelineId {
            index_uid: IndexUid::new_with_random_ulid("test-index"),
            source_id: "test-source".to_string(),
            node_id: NodeId::from("test-node"),
            pipeline_uid: PipelineUid::default(),
        };
        let doc_mapper = Arc::new(default_doc_mapper_for_test());
        let last_delete_opstamp = 10;
        let schema = doc_mapper.schema();
        let body_field = schema.get_field("body").unwrap();
        let timestamp_field = schema.get_field("timestamp").unwrap();
        let indexing_directory = TempDirectory::for_test();
        let indexing_settings = IndexingSettings::for_test();
        let (index_serializer_mailbox, index_serializer_inbox) = universe.create_test_mailbox();
        let mut mock_metastore = MockMetastoreService::new();
        mock_metastore.expect_publish_splits().never();
        mock_metastore.expect_last_delete_opstamp().returning(
            move |_last_delete_opstamp_request| {
                Ok(LastDeleteOpstampResponse::new(last_delete_opstamp))
            },
        );
        let indexer = Indexer::new(
            pipeline_id,
            doc_mapper,
            MetastoreServiceClient::from_mock(mock_metastore),
            indexing_directory,
            indexing_settings,
            Some(Arc::new(Semaphore::new(1))),
            index_serializer_mailbox,
        );
        let (indexer_mailbox, indexer_handle) = universe.spawn_builder().spawn(indexer);
        indexer_mailbox
            .send_message(ProcessedDocBatch::new(
                vec![ProcessedDoc {
                    doc: doc!(
                        body_field=>"this is a test document 5",
                        timestamp_field=>DateTime::from_timestamp_secs(1_662_529_435)
                    ),
                    timestamp_opt: Some(DateTime::from_timestamp_secs(1_662_529_435)),
                    partition: 1,
                    num_bytes: 30,
                }],
                SourceCheckpointDelta::from_range(8..9),
                false,
            ))
            .await
            .unwrap();
        let mut indexer_counters: IndexerCounters = Default::default();
        for _ in 0..100 {
            // When a lot of unit tests are running concurrently we have a race condition here.
            // It is very difficult to assess when drain will actually be called.
            //
            // Therefore we check that it happens "eventually".
            universe.sleep(Duration::from_secs(1)).await;
            tokio::task::yield_now().await;
            indexer_counters = indexer_handle.observe().await.state;
            indexer_counters.pipeline_metrics_opt = None;
            // drain was called at least once.
            if indexer_counters.num_splits_emitted > 0 {
                break;
            }
        }

        assert_eq!(
            &indexer_counters,
            &IndexerCounters {
                num_splits_emitted: 1,
                num_split_batches_emitted: 1,
                num_docs_in_workbench: 0,
                num_doc_batches_in_workbench: 0,
                pipeline_metrics_opt: None,
            }
        );
        let indexed_split_batches: Vec<IndexedSplitBatchBuilder> =
            index_serializer_inbox.drain_for_test_typed();
        assert_eq!(indexed_split_batches.len(), 1);
        assert_eq!(
            indexed_split_batches[0].commit_trigger,
            CommitTrigger::Drained
        );
        assert_eq!(indexed_split_batches[0].splits[0].split_attrs.num_docs, 1);
        universe.assert_quit().await;
        Ok(())
    }

    #[tokio::test]
    async fn test_indexer_triggers_commit_on_quit() -> anyhow::Result<()> {
        let universe = Universe::with_accelerated_time();
        let pipeline_id = IndexingPipelineId {
            index_uid: IndexUid::new_with_random_ulid("test-index"),
            source_id: "test-source".to_string(),
            node_id: NodeId::from("test-node"),
            pipeline_uid: PipelineUid::default(),
        };
        let doc_mapper = Arc::new(default_doc_mapper_for_test());
        let schema = doc_mapper.schema();
        let body_field = schema.get_field("body").unwrap();
        let timestamp_field = schema.get_field("timestamp").unwrap();
        let indexing_directory = TempDirectory::for_test();
        let indexing_settings = IndexingSettings::for_test();
        let (index_serializer_mailbox, index_serializer_inbox) = universe.create_test_mailbox();
        let mut mock_metastore = MockMetastoreService::new();
        mock_metastore.expect_publish_splits().never();
        mock_metastore
            .expect_last_delete_opstamp()
            .once()
            .returning(move |_last_delete_opstamp_request| Ok(LastDeleteOpstampResponse::new(10)));
        mock_metastore.expect_publish_splits().never();
        let indexer = Indexer::new(
            pipeline_id,
            doc_mapper,
            MetastoreServiceClient::from_mock(mock_metastore),
            indexing_directory,
            indexing_settings,
            None,
            index_serializer_mailbox,
        );
        let (indexer_mailbox, indexer_handle) = universe.spawn_builder().spawn(indexer);
        indexer_mailbox
            .send_message(ProcessedDocBatch::new(
                vec![ProcessedDoc {
                    doc: doc!(
                        body_field=>"this is a test document 5",
                        timestamp_field=> DateTime::from_timestamp_secs(1_662_529_435)
                    ),
                    timestamp_opt: Some(DateTime::from_timestamp_secs(1_662_529_435)),
                    partition: 1,
                    num_bytes: 30,
                }],
                SourceCheckpointDelta::from_range(8..9),
                false,
            ))
            .await
            .unwrap();
        universe.send_exit_with_success(&indexer_mailbox).await?;
        let (exit_status, indexer_counters) = indexer_handle.join().await;
        assert!(exit_status.is_success());
        assert_eq!(
            indexer_counters,
            IndexerCounters {
                num_splits_emitted: 1,
                num_split_batches_emitted: 1,
                num_docs_in_workbench: 0,
                num_doc_batches_in_workbench: 0,
                pipeline_metrics_opt: None,
            }
        );
        let output_messages: Vec<IndexedSplitBatchBuilder> =
            index_serializer_inbox.drain_for_test_typed();
        assert_eq!(output_messages.len(), 1);
        assert_eq!(output_messages[0].commit_trigger, CommitTrigger::NoMoreDocs);
        assert_eq!(output_messages[0].splits[0].split_attrs.num_docs, 1);
        universe.assert_quit().await;
        Ok(())
    }

    const DOCMAPPER_WITH_PARTITION_JSON: &str = r#"{
        "tag_fields": ["tenant"],
        "partition_key": "tenant",
        "field_mappings": [
            { "name": "tenant", "type": "text", "tokenizer": "raw", "indexed": true },
            { "name": "body", "type": "text" }
        ]
    }"#;

    #[tokio::test]
    async fn test_indexer_partitioning() -> anyhow::Result<()> {
        let universe = Universe::with_accelerated_time();
        let pipeline_id = IndexingPipelineId {
            index_uid: IndexUid::new_with_random_ulid("test-index"),
            source_id: "test-source".to_string(),
            node_id: NodeId::from("test-node"),
            pipeline_uid: PipelineUid::default(),
        };
        let doc_mapper: Arc<DocMapper> =
            Arc::new(serde_json::from_str::<DocMapper>(DOCMAPPER_WITH_PARTITION_JSON).unwrap());
        let schema = doc_mapper.schema();
        let tenant_field = schema.get_field("tenant").unwrap();
        let body_field = schema.get_field("body").unwrap();

        let indexing_directory = TempDirectory::for_test();
        let mut indexing_settings = IndexingSettings::for_test();
        indexing_settings.resources.heap_size = ByteSize::mb(100);
        let (index_serializer_mailbox, index_serializer_inbox) = universe.create_test_mailbox();
        let mut mock_metastore = MockMetastoreService::new();
        mock_metastore.expect_publish_splits().never();
        mock_metastore
            .expect_last_delete_opstamp()
            .once()
            .returning(move |_last_delete_opstamp_request| Ok(LastDeleteOpstampResponse::new(10)));
        mock_metastore.expect_publish_splits().never();
        let indexer = Indexer::new(
            pipeline_id,
            doc_mapper,
            MetastoreServiceClient::from_mock(mock_metastore),
            indexing_directory,
            indexing_settings,
            None,
            index_serializer_mailbox,
        );
        let (indexer_mailbox, indexer_handle) = universe.spawn_builder().spawn(indexer);
        indexer_mailbox
            .send_message(ProcessedDocBatch::new(
                vec![
                    ProcessedDoc {
                        doc: doc!(
                            body_field=>"doc 2",
                            tenant_field=>"tenant_1",
                        ),
                        timestamp_opt: None,
                        partition: 1,
                        num_bytes: 30,
                    },
                    ProcessedDoc {
                        doc: doc!(
                            body_field=>"doc 2",
                            tenant_field=>"tenant_2",
                        ),
                        timestamp_opt: None,
                        partition: 3,
                        num_bytes: 30,
                    },
                ],
                SourceCheckpointDelta::from_range(8..9),
                false,
            ))
            .await?;

        let indexer_counters = indexer_handle.process_pending_and_observe().await.state;
        assert_eq!(
            indexer_counters,
            IndexerCounters {
                num_docs_in_workbench: 2,
                num_doc_batches_in_workbench: 1,
                num_splits_emitted: 0,
                num_split_batches_emitted: 0,
                pipeline_metrics_opt: None,
            }
        );
        universe.send_exit_with_success(&indexer_mailbox).await?;
        let (exit_status, indexer_counters) = indexer_handle.join().await;
        assert!(matches!(exit_status, ActorExitStatus::Success));
        assert_eq!(
            indexer_counters,
            IndexerCounters {
                num_docs_in_workbench: 0,
                num_doc_batches_in_workbench: 0,
                num_splits_emitted: 2,
                num_split_batches_emitted: 1,
                pipeline_metrics_opt: None,
            }
        );
        let split_batches: Vec<IndexedSplitBatchBuilder> =
            index_serializer_inbox.drain_for_test_typed();
        assert_eq!(split_batches.len(), 1);
        assert_eq!(split_batches[0].splits.len(), 2);
        universe.assert_quit().await;
        Ok(())
    }

    const DOCMAPPER_SIMPLE_JSON: &str = r#"{
        "field_mappings": [{"name": "body", "type": "text"}],
        "max_num_partitions": 10
    }"#;

    #[tokio::test]
    async fn test_indexer_exceeding_max_num_partitions() {
        let universe = Universe::with_accelerated_time();
        let pipeline_id = IndexingPipelineId {
            index_uid: IndexUid::new_with_random_ulid("test-index"),
            source_id: "test-source".to_string(),
            node_id: NodeId::from("test-node"),
            pipeline_uid: PipelineUid::default(),
        };
        let doc_mapper: Arc<DocMapper> =
            Arc::new(serde_json::from_str::<DocMapper>(DOCMAPPER_SIMPLE_JSON).unwrap());
        let body_field = doc_mapper.schema().get_field("body").unwrap();
        let indexing_directory = TempDirectory::for_test();
        let mut indexing_settings = IndexingSettings::for_test();
        indexing_settings.resources.heap_size = ByteSize::gb(5);
        let mut mock_metastore = MockMetastoreService::new();
        mock_metastore
            .expect_last_delete_opstamp()
            .times(1)
            .returning(move |_last_delete_opstamp_request| Ok(LastDeleteOpstampResponse::new(10)));
        mock_metastore.expect_publish_splits().never();
        let (index_serializer_mailbox, index_serializer_inbox) = universe.create_test_mailbox();
        let indexer = Indexer::new(
            pipeline_id,
            doc_mapper,
            MetastoreServiceClient::from_mock(mock_metastore),
            indexing_directory,
            indexing_settings,
            None,
            index_serializer_mailbox,
        );
        let (indexer_mailbox, indexer_handle) = universe.spawn_builder().spawn(indexer);

        for partition in 0..100 {
            indexer_mailbox
                .send_message(ProcessedDocBatch::new(
                    vec![ProcessedDoc {
                        doc: doc!(body_field=>"doc {i}"),
                        timestamp_opt: None,
                        partition,
                        num_bytes: 30,
                    }],
                    SourceCheckpointDelta::from_range(partition..partition + 1),
                    false,
                ))
                .await
                .unwrap();
        }
        universe
            .send_exit_with_success(&indexer_mailbox)
            .await
            .unwrap();

        let (exit_status, _indexer_counters) = indexer_handle.join().await;
        assert!(matches!(exit_status, ActorExitStatus::Success));

        let index_serializer_msgs: Vec<IndexedSplitBatchBuilder> =
            index_serializer_inbox.drain_for_test_typed();
        assert_eq!(index_serializer_msgs.len(), 1);
        let msg = index_serializer_msgs.into_iter().next().unwrap();
        assert_eq!(msg.splits.len(), 11);
        for split in msg.splits {
            if split.split_attrs.partition_id == OTHER_PARTITION_ID {
                assert_eq!(split.split_attrs.num_docs, 90);
            } else {
                assert_eq!(split.split_attrs.num_docs, 1);
            }
        }
        universe.assert_quit().await;
    }

    #[tokio::test]
    async fn test_indexer_propagates_publish_lock() {
        let universe = Universe::with_accelerated_time();
        let pipeline_id = IndexingPipelineId {
            index_uid: IndexUid::new_with_random_ulid("test-index"),
            source_id: "test-source".to_string(),
            node_id: NodeId::from("test-node"),
            pipeline_uid: PipelineUid::default(),
        };
        let doc_mapper: Arc<DocMapper> =
            Arc::new(serde_json::from_str::<DocMapper>(DOCMAPPER_SIMPLE_JSON).unwrap());
        let body_field = doc_mapper.schema().get_field("body").unwrap();
        let indexing_directory = TempDirectory::for_test();
        let mut indexing_settings = IndexingSettings::for_test();
        indexing_settings.split_num_docs_target = 1;
        let mut mock_metastore = MockMetastoreService::new();
        mock_metastore
            .expect_last_delete_opstamp()
            .times(2)
            .returning(move |_last_delete_opstamp_request| Ok(LastDeleteOpstampResponse::new(10)));
        mock_metastore.expect_publish_splits().never();
        let (index_serializer_mailbox, index_serializer_inbox) = universe.create_test_mailbox();
        let indexer = Indexer::new(
            pipeline_id,
            doc_mapper,
            MetastoreServiceClient::from_mock(mock_metastore),
            indexing_directory,
            indexing_settings,
            None,
            index_serializer_mailbox,
        );
        let (indexer_mailbox, indexer_handle) = universe.spawn_builder().spawn(indexer);

        let first_lock = PublishLock::default();
        let second_lock = PublishLock::default();

        for lock in [&first_lock, &second_lock] {
            indexer_mailbox
                .send_message(NewPublishLock(lock.clone()))
                .await
                .unwrap();
            indexer_mailbox
                .send_message(ProcessedDocBatch::new(
                    vec![ProcessedDoc {
                        doc: doc!(body_field=>"doc 1"),
                        timestamp_opt: None,
                        partition: 0,
                        num_bytes: 30,
                    }],
                    SourceCheckpointDelta::from_range(0..1),
                    false,
                ))
                .await
                .unwrap();
        }
        universe
            .send_exit_with_success(&indexer_mailbox)
            .await
            .unwrap();
        let (exit_status, _indexer_counters) = indexer_handle.join().await;
        assert!(matches!(exit_status, ActorExitStatus::Success));

        let index_serializer_messages: Vec<IndexedSplitBatchBuilder> =
            index_serializer_inbox.drain_for_test_typed();
        assert_eq!(index_serializer_messages.len(), 2);
        assert_eq!(index_serializer_messages[0].splits.len(), 1);
        assert_eq!(index_serializer_messages[0].publish_lock, first_lock);
        assert_eq!(index_serializer_messages[1].splits.len(), 1);
        assert_eq!(index_serializer_messages[1].publish_lock, second_lock);
        universe.assert_quit().await;
    }

    #[tokio::test]
    async fn test_indexer_ignores_messages_when_publish_lock_is_dead() {
        let universe = Universe::with_accelerated_time();
        let pipeline_id = IndexingPipelineId {
            index_uid: IndexUid::new_with_random_ulid("test-index"),
            source_id: "test-source".to_string(),
            node_id: NodeId::from("test-node"),
            pipeline_uid: PipelineUid::default(),
        };
        let doc_mapper: Arc<DocMapper> =
            Arc::new(serde_json::from_str::<DocMapper>(DOCMAPPER_SIMPLE_JSON).unwrap());
        let body_field = doc_mapper.schema().get_field("body").unwrap();
        let indexing_directory = TempDirectory::for_test();
        let mut indexing_settings = IndexingSettings::for_test();
        indexing_settings.split_num_docs_target = 1;
        let mut mock_metastore = MockMetastoreService::new();
        mock_metastore
            .expect_last_delete_opstamp()
            .times(1)
            .returning(move |_last_delete_opstamp_request| Ok(LastDeleteOpstampResponse::new(10)));
        mock_metastore.expect_publish_splits().never();
        let (index_serializer_mailbox, index_serializer_inbox) = universe.create_test_mailbox();
        let indexer = Indexer::new(
            pipeline_id,
            doc_mapper,
            MetastoreServiceClient::from_mock(mock_metastore),
            indexing_directory,
            indexing_settings,
            None,
            index_serializer_mailbox,
        );
        let (indexer_mailbox, indexer_handle) = universe.spawn_builder().spawn(indexer);

        let publish_lock = PublishLock::default();
        indexer_mailbox
            .send_message(NewPublishLock(publish_lock.clone()))
            .await
            .unwrap();
        indexer_handle.process_pending_and_observe().await;
        publish_lock.kill().await;
        indexer_mailbox
            .send_message(ProcessedDocBatch::new(
                vec![ProcessedDoc {
                    doc: doc!(body_field=>"doc 1"),
                    timestamp_opt: None,
                    partition: 0,
                    num_bytes: 30,
                }],
                SourceCheckpointDelta::from_range(0..1),
                false,
            ))
            .await
            .unwrap();
        universe
            .send_exit_with_success(&indexer_mailbox)
            .await
            .unwrap();
        let (exit_status, _indexer_counters) = indexer_handle.join().await;
        assert!(matches!(exit_status, ActorExitStatus::Success));

        let index_serializer_messages = index_serializer_inbox.drain_for_test();
        assert!(index_serializer_messages.is_empty());
        universe.assert_quit().await;
    }

    #[tokio::test]
    async fn test_indexer_honors_batch_commit_request() {
        let universe = Universe::with_accelerated_time();
        let pipeline_id = IndexingPipelineId {
            index_uid: IndexUid::new_with_random_ulid("test-index"),
            source_id: "test-source".to_string(),
            node_id: NodeId::from("test-node"),
            pipeline_uid: PipelineUid::default(),
        };
        let doc_mapper: Arc<DocMapper> =
            Arc::new(serde_json::from_str::<DocMapper>(DOCMAPPER_SIMPLE_JSON).unwrap());
        let body_field = doc_mapper.schema().get_field("body").unwrap();
        let indexing_directory = TempDirectory::for_test();
        let indexing_settings = IndexingSettings::for_test();
        let mut mock_metastore = MockMetastoreService::new();
        mock_metastore
            .expect_last_delete_opstamp()
            .times(1)
            .returning(move |_last_delete_opstamp_request| Ok(LastDeleteOpstampResponse::new(10)));
        mock_metastore.expect_publish_splits().never();
        let (index_serializer_mailbox, index_serializer_inbox) = universe.create_test_mailbox();
        let indexer = Indexer::new(
            pipeline_id,
            doc_mapper,
            MetastoreServiceClient::from_mock(mock_metastore),
            indexing_directory,
            indexing_settings,
            None,
            index_serializer_mailbox,
        );
        let (indexer_mailbox, indexer_handle) = universe.spawn_builder().spawn(indexer);
        indexer_mailbox
            .send_message(ProcessedDocBatch::new(
                vec![ProcessedDoc {
                    doc: doc!(body_field=>"doc 1"),
                    timestamp_opt: None,
                    partition: 0,
                    num_bytes: 30,
                }],
                SourceCheckpointDelta::from_range(0..1),
                true,
            ))
            .await
            .unwrap();
        universe
            .send_exit_with_success(&indexer_mailbox)
            .await
            .unwrap();
        let (exit_status, _indexer_counters) = indexer_handle.join().await;
        assert!(matches!(exit_status, ActorExitStatus::Success));
        let output_messages: Vec<IndexedSplitBatchBuilder> =
            index_serializer_inbox.drain_for_test_typed();

        assert_eq!(output_messages.len(), 1);
        assert_eq!(
            output_messages[0].commit_trigger,
            CommitTrigger::ForceCommit
        );
        assert_eq!(output_messages[0].splits[0].split_attrs.num_docs, 1);
        universe.assert_quit().await;
    }

    #[tokio::test]
    async fn test_indexer_checkpoint_on_all_failed_docs() -> anyhow::Result<()> {
        let pipeline_id = IndexingPipelineId {
            index_uid: IndexUid::new_with_random_ulid("test-index"),
            source_id: "test-source".to_string(),
            node_id: NodeId::from("test-node"),
            pipeline_uid: PipelineUid::default(),
        };
        let doc_mapper = Arc::new(default_doc_mapper_for_test());
        let last_delete_opstamp = 10;
        let indexing_directory = TempDirectory::for_test();
        let indexing_settings = IndexingSettings::for_test();
        let commit_timeout = indexing_settings.commit_timeout();
        let universe = Universe::with_accelerated_time();
        let (index_serializer_mailbox, index_serializer_inbox) = universe.create_test_mailbox();
        let mut mock_metastore = MockMetastoreService::new();
        mock_metastore
            .expect_publish_splits()
            .returning(move |publish_splits_request| {
                assert!(publish_splits_request.replaced_split_ids.is_empty());
                Ok(EmptyResponse {})
            });
        mock_metastore.expect_last_delete_opstamp().returning(
            move |_last_delete_opstamp_request| {
                Ok(LastDeleteOpstampResponse::new(last_delete_opstamp))
            },
        );
        let indexer = Indexer::new(
            pipeline_id,
            doc_mapper,
            MetastoreServiceClient::from_mock(mock_metastore),
            indexing_directory,
            indexing_settings,
            None,
            index_serializer_mailbox,
        );
        let (indexer_mailbox, indexer_handle) = universe.spawn_builder().spawn(indexer);
        indexer_mailbox
            .send_message(ProcessedDocBatch::new(
                Vec::new(),
                SourceCheckpointDelta::from_range(4..6),
                false,
            ))
            .await?;
        indexer_mailbox
            .send_message(ProcessedDocBatch::new(
                Vec::new(),
                SourceCheckpointDelta::from_range(6..8),
                false,
            ))
            .await?;
        universe
            .sleep(commit_timeout + Duration::from_secs(2))
            .await;
        let indexer_counters = indexer_handle.process_pending_and_observe().await.state;
        assert_eq!(
            indexer_counters,
            IndexerCounters {
                num_splits_emitted: 0,
                num_split_batches_emitted: 0,
                num_docs_in_workbench: 0, //< the num docs in split counter has been reset.
                num_doc_batches_in_workbench: 2, //< the num docs in split counter has been reset.
                pipeline_metrics_opt: None,
            }
        );

        let index_serializer_messages: Vec<EmptySplit> =
            index_serializer_inbox.drain_for_test_typed();
        assert_eq!(index_serializer_messages.len(), 1);
        let update = index_serializer_messages.into_iter().next().unwrap();
        assert_eq!(update.index_uid.index_id, "test-index");
        assert_eq!(
            update.checkpoint_delta,
            IndexCheckpointDelta::for_test("test-source", 4..8)
        );

        universe.assert_quit().await;
        Ok(())
    }
}


================================================
FILE: quickwit/quickwit-indexing/src/actors/indexing_pipeline.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::BTreeSet;
use std::path::PathBuf;
use std::sync::Arc;
use std::time::{Duration, Instant};

use async_trait::async_trait;
use quickwit_actors::{
    Actor, ActorContext, ActorExitStatus, ActorHandle, HEARTBEAT, Handler, Health, Mailbox,
    QueueCapacity, Supervisable,
};
use quickwit_common::KillSwitch;
use quickwit_common::metrics::OwnedGaugeGuard;
use quickwit_common::pubsub::EventBroker;
use quickwit_common::temp_dir::TempDirectory;
use quickwit_config::{IndexingSettings, RetentionPolicy, SourceConfig};
use quickwit_doc_mapper::DocMapper;
use quickwit_ingest::IngesterPool;
use quickwit_proto::indexing::IndexingPipelineId;
use quickwit_proto::metastore::{MetastoreError, MetastoreServiceClient};
use quickwit_proto::types::ShardId;
use quickwit_storage::{Storage, StorageResolver};
use tokio::sync::Semaphore;
use tracing::{debug, error, info, instrument};

use super::MergePlanner;
use crate::SplitsUpdateMailbox;
use crate::actors::doc_processor::DocProcessor;
use crate::actors::index_serializer::IndexSerializer;
use crate::actors::publisher::PublisherType;
use crate::actors::sequencer::Sequencer;
use crate::actors::uploader::UploaderType;
use crate::actors::{Indexer, Packager, Publisher, Uploader};
use crate::merge_policy::MergePolicy;
use crate::models::IndexingStatistics;
use crate::source::{
    AssignShards, Assignment, SourceActor, SourceRuntime, quickwit_supported_sources,
};
use crate::split_store::IndexingSplitStore;

const SUPERVISE_INTERVAL: Duration = Duration::from_secs(1);

const MAX_RETRY_DELAY: Duration = Duration::from_secs(600); // 10 min.

#[derive(Debug)]
struct SuperviseLoop;

/// Calculates the wait time based on retry count.
// retry_count, wait_time
// 0   1s
// 1   2s
// 2   4s
// 3   8s
// ...
// >=8   5mn
pub(crate) fn wait_duration_before_retry(retry_count: usize) -> Duration {
    // Protect against a `retry_count` that will lead to an overflow.
    let max_power = (retry_count as u32).min(31);
    Duration::from_secs(2u64.pow(max_power)).min(MAX_RETRY_DELAY)
}

/// Spawning an indexing pipeline puts a lot of pressure on the file system, metastore, etc. so
/// we rely on this semaphore to limit the number of indexing pipelines that can be spawned
/// concurrently.
/// See also <https://github.com/quickwit-oss/quickwit/issues/1638>.
static SPAWN_PIPELINE_SEMAPHORE: Semaphore = Semaphore::const_new(10);

struct IndexingPipelineHandles {
    source_mailbox: Mailbox<SourceActor>,
    source_handle: ActorHandle<SourceActor>,
    doc_processor: ActorHandle<DocProcessor>,
    indexer: ActorHandle<Indexer>,
    index_serializer: ActorHandle<IndexSerializer>,
    packager: ActorHandle<Packager>,
    uploader: ActorHandle<Uploader>,
    sequencer: ActorHandle<Sequencer<Publisher>>,
    publisher: ActorHandle<Publisher>,
    next_check_for_progress: Instant,
}

impl IndexingPipelineHandles {
    fn should_check_for_progress(&mut self) -> bool {
        let now = Instant::now();
        let check_for_progress = now > self.next_check_for_progress;
        if check_for_progress {
            self.next_check_for_progress = now + *HEARTBEAT;
        }
        check_for_progress
    }
}

// Messages

#[derive(Clone, Copy, Debug, Default)]
pub struct Spawn {
    retry_count: usize,
}

pub struct IndexingPipeline {
    params: IndexingPipelineParams,
    previous_generations_statistics: IndexingStatistics,
    statistics: IndexingStatistics,
    handles_opt: Option<IndexingPipelineHandles>,
    // Killswitch used for the actors in the pipeline. This is not the supervisor killswitch.
    kill_switch: KillSwitch,

    // The set of shard is something that can change dynamically without necessarily
    // requiring a respawn of the pipeline.
    // We keep the list of shards here however, to reassign them after a respawn.
    shard_ids: BTreeSet<ShardId>,
    _indexing_pipelines_gauge_guard: OwnedGaugeGuard,
}

#[async_trait]
impl Actor for IndexingPipeline {
    type ObservableState = IndexingStatistics;

    fn observable_state(&self) -> Self::ObservableState {
        self.statistics.clone()
    }

    fn name(&self) -> String {
        "IndexingPipeline".to_string()
    }

    async fn initialize(&mut self, ctx: &ActorContext<Self>) -> Result<(), ActorExitStatus> {
        self.handle(Spawn::default(), ctx).await?;
        self.handle(SuperviseLoop, ctx).await?;
        Ok(())
    }

    async fn finalize(
        &mut self,
        _exit_status: &ActorExitStatus,
        ctx: &ActorContext<Self>,
    ) -> anyhow::Result<()> {
        // We update the observation to ensure our last "black box" observation
        // is up to date.
        self.perform_observe(ctx);
        Ok(())
    }
}

impl IndexingPipeline {
    pub fn new(params: IndexingPipelineParams) -> Self {
        let indexing_pipelines_gauge = crate::metrics::INDEXER_METRICS
            .indexing_pipelines
            .with_label_values([&params.pipeline_id.index_uid.index_id]);
        let indexing_pipelines_gauge_guard = OwnedGaugeGuard::from_gauge(indexing_pipelines_gauge);
        let params_fingerprint = params.params_fingerprint;
        IndexingPipeline {
            params,
            previous_generations_statistics: Default::default(),
            handles_opt: None,
            kill_switch: KillSwitch::default(),
            statistics: IndexingStatistics {
                params_fingerprint,
                ..Default::default()
            },
            shard_ids: Default::default(),
            _indexing_pipelines_gauge_guard: indexing_pipelines_gauge_guard,
        }
    }

    fn supervisables(&self) -> Vec<&dyn Supervisable> {
        if let Some(handles) = &self.handles_opt {
            let supervisables: Vec<&dyn Supervisable> = vec![
                &handles.source_handle,
                &handles.doc_processor,
                &handles.indexer,
                &handles.index_serializer,
                &handles.packager,
                &handles.uploader,
                &handles.sequencer,
                &handles.publisher,
            ];
            supervisables
        } else {
            Vec::new()
        }
    }

    /// Performs healthcheck on all of the actors in the pipeline,
    /// and consolidates the result.
    fn healthcheck(&self, check_for_progress: bool) -> Health {
        let mut healthy_actors: Vec<&str> = Default::default();
        let mut failure_or_unhealthy_actors: Vec<&str> = Default::default();
        let mut success_actors: Vec<&str> = Default::default();
        for supervisable in self.supervisables() {
            match supervisable.check_health(check_for_progress) {
                Health::Healthy => {
                    // At least one other actor is running.
                    healthy_actors.push(supervisable.name());
                }
                Health::FailureOrUnhealthy => {
                    failure_or_unhealthy_actors.push(supervisable.name());
                }
                Health::Success => {
                    success_actors.push(supervisable.name());
                }
            }
        }

        if !failure_or_unhealthy_actors.is_empty() {
            error!(
                pipeline_id=?self.params.pipeline_id,
                generation=self.generation(),
                healthy_actors=?healthy_actors,
                failed_or_unhealthy_actors=?failure_or_unhealthy_actors,
                success_actors=?success_actors,
                "Indexing pipeline failure."
            );
            return Health::FailureOrUnhealthy;
        }
        if healthy_actors.is_empty() {
            // All the actors finished successfully.
            info!(
                pipeline_id=?self.params.pipeline_id,
                generation=self.generation(),
                "Indexing pipeline success."
            );
            return Health::Success;
        }
        // No error at this point and there are still some actors running.
        debug!(
            pipeline_id=?self.params.pipeline_id,
            generation=self.generation(),
            healthy_actors=?healthy_actors,
            failed_or_unhealthy_actors=?failure_or_unhealthy_actors,
            success_actors=?success_actors,
            "Indexing pipeline running."
        );
        Health::Healthy
    }

    fn generation(&self) -> usize {
        self.statistics.generation
    }

    fn perform_observe(&mut self, ctx: &ActorContext<Self>) {
        let Some(handles) = &self.handles_opt else {
            return;
        };
        handles.doc_processor.refresh_observe();
        handles.indexer.refresh_observe();
        handles.uploader.refresh_observe();
        handles.publisher.refresh_observe();
        self.statistics = self
            .previous_generations_statistics
            .clone()
            .add_actor_counters(
                &handles.doc_processor.last_observation(),
                &handles.indexer.last_observation(),
                &handles.uploader.last_observation(),
                &handles.publisher.last_observation(),
            )
            .set_generation(self.statistics.generation)
            .set_num_spawn_attempts(self.statistics.num_spawn_attempts);
        let pipeline_metrics_opt = handles.indexer.last_observation().pipeline_metrics_opt;
        self.statistics.pipeline_metrics_opt = pipeline_metrics_opt;
        self.statistics.params_fingerprint = self.params.params_fingerprint;
        self.statistics.shard_ids.clone_from(&self.shard_ids);
        ctx.observe(self);
    }

    /// Checks if some actors have terminated.
    async fn perform_health_check(
        &mut self,
        ctx: &ActorContext<Self>,
    ) -> Result<(), ActorExitStatus> {
        let Some(handles) = self.handles_opt.as_mut() else {
            return Ok(());
        };

        // While we check if the actor has terminated or not, we do not check for progress
        // at every single loop. Instead, we wait for the `HEARTBEAT` duration to have elapsed,
        // since our last check.
        let check_for_progress = handles.should_check_for_progress();
        let health = self.healthcheck(check_for_progress);
        match health {
            Health::Healthy => {}
            Health::FailureOrUnhealthy => {
                self.terminate().await;
                let first_retry_delay = wait_duration_before_retry(0);
                ctx.schedule_self_msg(first_retry_delay, Spawn { retry_count: 0 });
            }
            Health::Success => {
                return Err(ActorExitStatus::Success);
            }
        }
        Ok(())
    }

    // TODO this should return an error saying whether we can retry or not.
    #[instrument(
        name="spawn_pipeline",
        level="info",
        skip_all,
        fields(
            index=%self.params.pipeline_id.index_uid.index_id,
            r#gen=self.generation()
        ))]
    async fn spawn_pipeline(&mut self, ctx: &ActorContext<Self>) -> anyhow::Result<()> {
        let _spawn_pipeline_permit = ctx
            .protect_future(SPAWN_PIPELINE_SEMAPHORE.acquire())
            .await
            .expect("semaphore should not be closed");

        self.statistics.num_spawn_attempts += 1;
        self.kill_switch = ctx.kill_switch().child();

        let index_id = &self.params.pipeline_id.index_uid.index_id;
        let source_id = &self.params.pipeline_id.source_id;

        info!(
            index_id,
            source_id,
            pipeline_uid=%self.params.pipeline_id.pipeline_uid,
            root_dir=%self.params.indexing_directory.path().display(),
            "spawning indexing pipeline",
        );
        let (source_mailbox, source_inbox) = ctx
            .spawn_ctx()
            .create_mailbox::<SourceActor>("SourceActor", QueueCapacity::Unbounded);

        // Publisher
        let publisher = Publisher::new(
            PublisherType::MainPublisher,
            self.params.metastore.clone(),
            Some(self.params.merge_planner_mailbox.clone()),
            Some(source_mailbox.clone()),
        );
        let (publisher_mailbox, publisher_handle) = ctx
            .spawn_actor()
            .set_kill_switch(self.kill_switch.clone())
            .set_backpressure_micros_counter(
                crate::metrics::INDEXER_METRICS
                    .backpressure_micros
                    .with_label_values(["publisher"]),
            )
            .spawn(publisher);

        let sequencer = Sequencer::new(publisher_mailbox);
        let (sequencer_mailbox, sequencer_handle) = ctx
            .spawn_actor()
            .set_backpressure_micros_counter(
                crate::metrics::INDEXER_METRICS
                    .backpressure_micros
                    .with_label_values(["sequencer"]),
            )
            .set_kill_switch(self.kill_switch.clone())
            .spawn(sequencer);

        // Uploader
        let uploader = Uploader::new(
            UploaderType::IndexUploader,
            self.params.metastore.clone(),
            self.params.merge_policy.clone(),
            self.params.retention_policy.clone(),
            self.params.split_store.clone(),
            SplitsUpdateMailbox::Sequencer(sequencer_mailbox),
            self.params.max_concurrent_split_uploads_index,
            self.params.event_broker.clone(),
        );
        let (uploader_mailbox, uploader_handle) = ctx
            .spawn_actor()
            .set_backpressure_micros_counter(
                crate::metrics::INDEXER_METRICS
                    .backpressure_micros
                    .with_label_values(["uploader"]),
            )
            .set_kill_switch(self.kill_switch.clone())
            .spawn(uploader);

        // Packager
        let tag_fields = self.params.doc_mapper.tag_named_fields()?;
        let packager = Packager::new("Packager", tag_fields, uploader_mailbox);
        let (packager_mailbox, packager_handle) = ctx
            .spawn_actor()
            .set_kill_switch(self.kill_switch.clone())
            .spawn(packager);

        // Index Serializer
        let index_serializer = IndexSerializer::new(packager_mailbox);
        let (index_serializer_mailbox, index_serializer_handle) = ctx
            .spawn_actor()
            .set_kill_switch(self.kill_switch.clone())
            .spawn(index_serializer);

        // Indexer
        let indexer = Indexer::new(
            self.params.pipeline_id.clone(),
            self.params.doc_mapper.clone(),
            self.params.metastore.clone(),
            self.params.indexing_directory.clone(),
            self.params.indexing_settings.clone(),
            self.params.cooperative_indexing_permits.clone(),
            index_serializer_mailbox,
        );
        let (indexer_mailbox, indexer_handle) = ctx
            .spawn_actor()
            .set_backpressure_micros_counter(
                crate::metrics::INDEXER_METRICS
                    .backpressure_micros
                    .with_label_values(["indexer"]),
            )
            .set_kill_switch(self.kill_switch.clone())
            .spawn(indexer);

        let doc_processor = DocProcessor::try_new(
            index_id.to_string(),
            source_id.to_string(),
            self.params.doc_mapper.clone(),
            indexer_mailbox,
            self.params.source_config.transform_config.clone(),
            self.params.source_config.input_format,
        )?;
        let (doc_processor_mailbox, doc_processor_handle) = ctx
            .spawn_actor()
            .set_backpressure_micros_counter(
                crate::metrics::INDEXER_METRICS
                    .backpressure_micros
                    .with_label_values(["doc_processor"]),
            )
            .set_kill_switch(self.kill_switch.clone())
            .spawn(doc_processor);
        let source_runtime = SourceRuntime {
            pipeline_id: self.params.pipeline_id.clone(),
            source_config: self.params.source_config.clone(),
            metastore: self.params.metastore.clone(),
            ingester_pool: self.params.ingester_pool.clone(),
            queues_dir_path: self.params.queues_dir_path.clone(),
            storage_resolver: self.params.source_storage_resolver.clone(),
            event_broker: self.params.event_broker.clone(),
            indexing_setting: self.params.indexing_settings.clone(),
        };
        let source = ctx
            .protect_future(quickwit_supported_sources().load_source(source_runtime))
            .await?;
        let actor_source = SourceActor {
            source,
            doc_processor_mailbox,
        };
        let (source_mailbox, source_handle) = ctx
            .spawn_actor()
            .set_mailboxes(source_mailbox, source_inbox)
            .set_kill_switch(self.kill_switch.clone())
            .spawn(actor_source);
        let assign_shards_message = AssignShards(Assignment {
            shard_ids: self.shard_ids.clone(),
        });
        source_mailbox.send_message(assign_shards_message).await?;

        // Increment generation once we are sure there will be no spawning error.
        self.previous_generations_statistics = self.statistics.clone();
        self.statistics.generation += 1;
        self.handles_opt = Some(IndexingPipelineHandles {
            source_mailbox,
            source_handle,
            doc_processor: doc_processor_handle,
            indexer: indexer_handle,
            index_serializer: index_serializer_handle,
            packager: packager_handle,
            uploader: uploader_handle,
            sequencer: sequencer_handle,
            publisher: publisher_handle,
            next_check_for_progress: Instant::now() + *HEARTBEAT,
        });
        Ok(())
    }

    async fn terminate(&mut self) {
        self.kill_switch.kill();
        if let Some(handles) = self.handles_opt.take() {
            tokio::join!(
                handles.source_handle.kill(),
                handles.indexer.kill(),
                handles.packager.kill(),
                handles.uploader.kill(),
                handles.publisher.kill(),
            );
        }
    }
}

#[async_trait]
impl Handler<SuperviseLoop> for IndexingPipeline {
    type Reply = ();
    async fn handle(
        &mut self,
        supervise_loop_token: SuperviseLoop,
        ctx: &ActorContext<Self>,
    ) -> Result<(), ActorExitStatus> {
        self.perform_observe(ctx);
        self.perform_health_check(ctx).await?;
        ctx.schedule_self_msg(SUPERVISE_INTERVAL, supervise_loop_token);
        Ok(())
    }
}

#[async_trait]
impl Handler<Spawn> for IndexingPipeline {
    type Reply = ();

    async fn handle(
        &mut self,
        spawn: Spawn,
        ctx: &ActorContext<Self>,
    ) -> Result<(), ActorExitStatus> {
        if self.handles_opt.is_some() {
            return Ok(());
        }
        self.previous_generations_statistics.num_spawn_attempts = 1 + spawn.retry_count;
        if let Err(spawn_error) = self.spawn_pipeline(ctx).await {
            if let Some(MetastoreError::NotFound { .. }) =
                spawn_error.downcast_ref::<MetastoreError>()
            {
                info!(error = ?spawn_error, "could not spawn pipeline, index might have been deleted");
                return Err(ActorExitStatus::Success);
            }
            let retry_delay = wait_duration_before_retry(spawn.retry_count + 1);
            error!(error = ?spawn_error, retry_count = spawn.retry_count, retry_delay = ?retry_delay, "error while spawning indexing pipeline, retrying after some time");
            ctx.schedule_self_msg(
                retry_delay,
                Spawn {
                    retry_count: spawn.retry_count + 1,
                },
            );
        }
        Ok(())
    }
}

#[async_trait]
impl Handler<AssignShards> for IndexingPipeline {
    type Reply = ();

    async fn handle(
        &mut self,
        assign_shards_message: AssignShards,
        ctx: &ActorContext<Self>,
    ) -> Result<(), ActorExitStatus> {
        self.shard_ids
            .clone_from(&assign_shards_message.0.shard_ids);
        // If the pipeline is running, we forward the message to its source.
        // If it is not, it will be respawned soon, and the shards will be assigned afterward.
        if let Some(handles) = &mut self.handles_opt {
            info!(
                shard_ids=?assign_shards_message.0.shard_ids,
                "assigning shards to indexing pipeline"
            );
            handles
                .source_mailbox
                .send_message(assign_shards_message)
                .await?;
        }
        // We perform observe to make sure the set of shard ids is up to date.
        self.perform_observe(ctx);
        Ok(())
    }
}

pub struct IndexingPipelineParams {
    pub pipeline_id: IndexingPipelineId,
    pub metastore: MetastoreServiceClient,
    pub storage: Arc<dyn Storage>,

    // Indexing-related parameters
    pub doc_mapper: Arc<DocMapper>,
    pub indexing_directory: TempDirectory,
    pub indexing_settings: IndexingSettings,
    pub split_store: IndexingSplitStore,
    pub max_concurrent_split_uploads_index: usize,
    pub cooperative_indexing_permits: Option<Arc<Semaphore>>,

    // Merge-related parameters
    pub merge_policy: Arc<dyn MergePolicy>,
    pub retention_policy: Option<RetentionPolicy>,
    pub merge_planner_mailbox: Mailbox<MergePlanner>,
    pub max_concurrent_split_uploads_merge: usize,

    // Source-related parameters
    pub source_config: SourceConfig,
    pub source_storage_resolver: StorageResolver,
    pub ingester_pool: IngesterPool,
    pub queues_dir_path: PathBuf,
    pub params_fingerprint: u64,

    pub event_broker: EventBroker,
}

#[cfg(test)]
mod tests {
    use std::num::NonZeroUsize;
    use std::path::PathBuf;
    use std::sync::Arc;

    use quickwit_actors::{Command, Universe};
    use quickwit_common::ServiceStream;
    use quickwit_config::{IndexingSettings, SourceInputFormat, SourceParams};
    use quickwit_doc_mapper::{DocMapper, default_doc_mapper_for_test};
    use quickwit_metastore::checkpoint::IndexCheckpointDelta;
    use quickwit_metastore::{IndexMetadata, IndexMetadataResponseExt, PublishSplitsRequestExt};
    use quickwit_proto::metastore::{
        EmptyResponse, IndexMetadataResponse, LastDeleteOpstampResponse, MetastoreError,
        MockMetastoreService,
    };
    use quickwit_proto::types::{IndexUid, NodeId, PipelineUid};
    use quickwit_storage::RamStorage;

    use super::{IndexingPipeline, *};
    use crate::actors::merge_pipeline::{MergePipeline, MergePipelineParams};
    use crate::merge_policy::default_merge_policy;

    #[test]
    fn test_wait_duration() {
        assert_eq!(wait_duration_before_retry(0), Duration::from_secs(1));
        assert_eq!(wait_duration_before_retry(1), Duration::from_secs(2));
        assert_eq!(wait_duration_before_retry(2), Duration::from_secs(4));
        assert_eq!(wait_duration_before_retry(3), Duration::from_secs(8));
        assert_eq!(wait_duration_before_retry(9), Duration::from_secs(512));
        assert_eq!(wait_duration_before_retry(10), MAX_RETRY_DELAY);
    }

    async fn test_indexing_pipeline_num_fails_before_success(
        mut num_fails: usize,
        test_file: &str,
    ) -> anyhow::Result<()> {
        let node_id = NodeId::from("test-node");
        let index_uid = IndexUid::for_test("test-index", 2);
        let pipeline_id = IndexingPipelineId {
            node_id,
            index_uid,
            source_id: "test-source".to_string(),
            pipeline_uid: PipelineUid::for_test(0u128),
        };
        let source_config = SourceConfig {
            source_id: "test-source".to_string(),
            num_pipelines: NonZeroUsize::MIN,
            enabled: true,
            source_params: SourceParams::file_from_str(test_file).unwrap(),
            transform_config: None,
            input_format: SourceInputFormat::Json,
        };
        let source_config_clone = source_config.clone();

        let mut mock_metastore = MockMetastoreService::new();
        mock_metastore
            .expect_index_metadata()
            .withf(|index_metadata_request| {
                index_metadata_request.index_uid.as_ref().unwrap() == &("test-index", 2)
            })
            .returning(move |_| {
                if num_fails == 0 {
                    let mut index_metadata =
                        IndexMetadata::for_test("test-index", "ram:///indexes/test-index");
                    index_metadata
                        .add_source(source_config_clone.clone())
                        .unwrap();
                    let response =
                        IndexMetadataResponse::try_from_index_metadata(&index_metadata).unwrap();
                    return Ok(response);
                }
                num_fails -= 1;
                Err(MetastoreError::Timeout("timeout error".to_string()))
            });
        mock_metastore
            .expect_last_delete_opstamp()
            .returning(move |_last_delete_opstamp_request| Ok(LastDeleteOpstampResponse::new(10)));
        mock_metastore
            .expect_mark_splits_for_deletion()
            .returning(|_| Ok(EmptyResponse {}));
        mock_metastore
            .expect_stage_splits()
            .withf(|stage_splits_request| -> bool {
                stage_splits_request.index_uid() == &("test-index", 2)
            })
            .returning(|_| Ok(EmptyResponse {}));
        mock_metastore
            .expect_publish_splits()
            .withf(|publish_splits_request| -> bool {
                let checkpoint_delta: IndexCheckpointDelta = publish_splits_request
                    .deserialize_index_checkpoint()
                    .unwrap()
                    .unwrap();
                publish_splits_request.index_uid() == &("test-index", 2)
                    && checkpoint_delta.source_id == "test-source"
                    && publish_splits_request.staged_split_ids.len() == 1
                    && publish_splits_request.replaced_split_ids.is_empty()
                    && format!("{:?}", checkpoint_delta.source_delta)
                        .ends_with(":(00000000000000000000..~00000000000000001030])")
            })
            .returning(|_| Ok(EmptyResponse {}));

        let universe = Universe::new();
        let (merge_planner_mailbox, _) = universe.create_test_mailbox();
        let storage = Arc::new(RamStorage::default());
        let split_store = IndexingSplitStore::create_without_local_store_for_test(storage.clone());
        let pipeline_params = IndexingPipelineParams {
            pipeline_id,
            doc_mapper: Arc::new(default_doc_mapper_for_test()),
            source_config,
            source_storage_resolver: StorageResolver::for_test(),
            indexing_directory: TempDirectory::for_test(),
            indexing_settings: IndexingSettings::for_test(),
            ingester_pool: IngesterPool::default(),
            metastore: MetastoreServiceClient::from_mock(mock_metastore),
            storage,
            split_store,
            merge_policy: default_merge_policy(),
            retention_policy: None,
            queues_dir_path: PathBuf::from("./queues"),
            max_concurrent_split_uploads_index: 4,
            max_concurrent_split_uploads_merge: 5,
            cooperative_indexing_permits: None,
            merge_planner_mailbox,
            event_broker: EventBroker::default(),
            params_fingerprint: 42u64,
        };
        let pipeline = IndexingPipeline::new(pipeline_params);
        let (_pipeline_mailbox, pipeline_handle) = universe.spawn_builder().spawn(pipeline);
        let (pipeline_exit_status, pipeline_statistics) = pipeline_handle.join().await;
        assert_eq!(
            pipeline_statistics.generation, 1,
            "generation is {}, expected 1",
            pipeline_statistics.generation
        );
        assert_eq!(
            pipeline_statistics.num_spawn_attempts,
            1 + num_fails,
            "num spawn attempts is {}, expected 1 + {}",
            pipeline_statistics.num_spawn_attempts,
            1 + num_fails
        );
        assert!(pipeline_exit_status.is_success());
        Ok(())
    }

    #[tokio::test]
    async fn test_indexing_pipeline_retry_0() -> anyhow::Result<()> {
        test_indexing_pipeline_num_fails_before_success(0, "data/test_corpus.json").await
    }

    #[tokio::test]
    async fn test_indexing_pipeline_retry_1() -> anyhow::Result<()> {
        test_indexing_pipeline_num_fails_before_success(1, "data/test_corpus.json").await
    }

    #[tokio::test]
    async fn test_indexing_pipeline_retry_0_gz() -> anyhow::Result<()> {
        test_indexing_pipeline_num_fails_before_success(0, "data/test_corpus.json.gz").await
    }

    #[tokio::test]
    async fn test_indexing_pipeline_retry_1_gz() -> anyhow::Result<()> {
        test_indexing_pipeline_num_fails_before_success(1, "data/test_corpus.json.gz").await
    }

    async fn indexing_pipeline_simple(test_file: &str) -> anyhow::Result<()> {
        let node_id = NodeId::from("test-node");
        let index_uid: IndexUid = IndexUid::for_test("test-index", 1);
        let pipeline_id = IndexingPipelineId {
            node_id,
            index_uid: index_uid.clone(),
            source_id: "test-source".to_string(),
            pipeline_uid: PipelineUid::for_test(0u128),
        };
        let source_config = SourceConfig {
            source_id: "test-source".to_string(),
            num_pipelines: NonZeroUsize::MIN,
            enabled: true,
            source_params: SourceParams::file_from_str(test_file).unwrap(),
            transform_config: None,
            input_format: SourceInputFormat::Json,
        };
        let source_config_clone = source_config.clone();

        let mut mock_metastore = MockMetastoreService::new();
        mock_metastore
            .expect_index_metadata()
            .withf(|index_metadata_request| {
                index_metadata_request.index_uid.as_ref().unwrap() == &("test-index", 1)
            })
            .returning(move |_| {
                let mut index_metadata =
                    IndexMetadata::for_test("test-index", "ram:///indexes/test-index");
                index_metadata
                    .add_source(source_config_clone.clone())
                    .unwrap();
                Ok(IndexMetadataResponse::try_from_index_metadata(&index_metadata).unwrap())
            });
        let index_uid_clone = index_uid.clone();
        mock_metastore
            .expect_last_delete_opstamp()
            .withf(move |last_delete_opstamp| last_delete_opstamp.index_uid() == &index_uid_clone)
            .returning(move |_| Ok(LastDeleteOpstampResponse::new(10)));
        let index_uid_clone = index_uid.clone();
        mock_metastore
            .expect_stage_splits()
            .withf(move |stage_splits_request| stage_splits_request.index_uid() == &index_uid_clone)
            .returning(|_| Ok(EmptyResponse {}));
        let index_uid_clone = index_uid.clone();
        mock_metastore
            .expect_publish_splits()
            .withf(move |publish_splits_request| -> bool {
                let checkpoint_delta: IndexCheckpointDelta = publish_splits_request
                    .deserialize_index_checkpoint()
                    .unwrap()
                    .unwrap();
                publish_splits_request.index_uid() == &index_uid_clone
                    && publish_splits_request.staged_split_ids.len() == 1
                    && publish_splits_request.replaced_split_ids.is_empty()
                    && checkpoint_delta.source_id == "test-source"
                    && format!("{:?}", checkpoint_delta.source_delta)
                        .ends_with(":(00000000000000000000..~00000000000000001030])")
            })
            .returning(|_| Ok(EmptyResponse {}));

        let universe = Universe::new();
        let storage = Arc::new(RamStorage::default());
        let split_store = IndexingSplitStore::create_without_local_store_for_test(storage.clone());
        let (merge_planner_mailbox, _) = universe.create_test_mailbox();
        let pipeline_params = IndexingPipelineParams {
            pipeline_id,
            doc_mapper: Arc::new(default_doc_mapper_for_test()),
            source_config,
            source_storage_resolver: StorageResolver::for_test(),
            indexing_directory: TempDirectory::for_test(),
            indexing_settings: IndexingSettings::for_test(),
            ingester_pool: IngesterPool::default(),
            metastore: MetastoreServiceClient::from_mock(mock_metastore),
            queues_dir_path: PathBuf::from("./queues"),
            storage,
            split_store,
            merge_policy: default_merge_policy(),
            retention_policy: None,
            max_concurrent_split_uploads_index: 4,
            max_concurrent_split_uploads_merge: 5,
            cooperative_indexing_permits: None,
            merge_planner_mailbox,
            event_broker: Default::default(),
            params_fingerprint: 42u64,
        };
        let pipeline = IndexingPipeline::new(pipeline_params);
        let (_pipeline_mailbox, pipeline_handler) = universe.spawn_builder().spawn(pipeline);
        let (pipeline_exit_status, pipeline_statistics) = pipeline_handler.join().await;
        assert!(pipeline_exit_status.is_success());
        assert_eq!(pipeline_statistics.generation, 1);
        assert_eq!(pipeline_statistics.num_spawn_attempts, 1);
        assert_eq!(pipeline_statistics.num_published_splits, 1);
        universe.assert_quit().await;
        Ok(())
    }

    #[tokio::test]
    async fn test_indexing_pipeline_simple() -> anyhow::Result<()> {
        indexing_pipeline_simple("data/test_corpus.json").await
    }

    #[tokio::test]
    async fn test_indexing_pipeline_simple_gz() -> anyhow::Result<()> {
        indexing_pipeline_simple("data/test_corpus.json.gz").await
    }

    #[tokio::test]
    async fn test_merge_pipeline_does_not_stop_on_indexing_pipeline_failure() {
        let node_id = NodeId::from("test-node");
        let pipeline_id = IndexingPipelineId {
            node_id,
            index_uid: IndexUid::new_with_random_ulid("test-index"),
            source_id: "test-source".to_string(),
            pipeline_uid: PipelineUid::for_test(0u128),
        };
        let source_config = SourceConfig {
            source_id: "test-source".to_string(),
            num_pipelines: NonZeroUsize::MIN,
            enabled: true,
            source_params: SourceParams::void(),
            transform_config: None,
            input_format: SourceInputFormat::Json,
        };
        let source_config_clone = source_config.clone();

        let mut mock_metastore = MockMetastoreService::new();
        mock_metastore
            .expect_index_metadata()
            .withf(|index_metadata_request| {
                index_metadata_request.index_uid.as_ref().unwrap() == &("test-index", 2)
            })
            .returning(move |_| {
                let mut index_metadata =
                    IndexMetadata::for_test("test-index", "ram:///indexes/test-index");
                index_metadata
                    .add_source(source_config_clone.clone())
                    .unwrap();
                Ok(IndexMetadataResponse::try_from_index_metadata(&index_metadata).unwrap())
            });
        mock_metastore
            .expect_list_splits()
            .returning(|_| Ok(ServiceStream::empty()));
        let metastore = MetastoreServiceClient::from_mock(mock_metastore);

        let universe = Universe::with_accelerated_time();
        let doc_mapper = Arc::new(default_doc_mapper_for_test());
        let storage = Arc::new(RamStorage::default());
        let split_store = IndexingSplitStore::create_without_local_store_for_test(storage.clone());
        let merge_pipeline_params = MergePipelineParams {
            pipeline_id: pipeline_id.merge_pipeline_id(),
            doc_mapper: doc_mapper.clone(),
            indexing_directory: TempDirectory::for_test(),
            metastore: metastore.clone(),
            split_store: split_store.clone(),
            merge_policy: default_merge_policy(),
            retention_policy: None,
            max_concurrent_split_uploads: 2,
            merge_io_throughput_limiter_opt: None,
            merge_scheduler_service: universe.get_or_spawn_one(),
            event_broker: Default::default(),
        };
        let merge_pipeline = MergePipeline::new(merge_pipeline_params, None, universe.spawn_ctx());
        let merge_planner_mailbox = merge_pipeline.merge_planner_mailbox().clone();
        let (_merge_pipeline_mailbox, merge_pipeline_handler) =
            universe.spawn_builder().spawn(merge_pipeline);
        let indexing_pipeline_params = IndexingPipelineParams {
            pipeline_id,
            doc_mapper,
            source_config,
            source_storage_resolver: StorageResolver::for_test(),
            indexing_directory: TempDirectory::for_test(),
            indexing_settings: IndexingSettings::for_test(),
            ingester_pool: IngesterPool::default(),
            metastore,
            queues_dir_path: PathBuf::from("./queues"),
            storage,
            split_store,
            merge_policy: default_merge_policy(),
            retention_policy: None,
            max_concurrent_split_uploads_index: 4,
            max_concurrent_split_uploads_merge: 5,
            cooperative_indexing_permits: None,
            merge_planner_mailbox: merge_planner_mailbox.clone(),
            event_broker: Default::default(),
            params_fingerprint: 42u64,
        };
        let indexing_pipeline = IndexingPipeline::new(indexing_pipeline_params);
        let (_indexing_pipeline_mailbox, indexing_pipeline_handler) =
            universe.spawn_builder().spawn(indexing_pipeline);
        let obs = indexing_pipeline_handler
            .process_pending_and_observe()
            .await;
        assert_eq!(obs.generation, 1);
        // Let's shutdown the indexer, this will trigger the indexing pipeline failure and the
        // restart.
        let indexer = universe.get::<Indexer>().into_iter().next().unwrap();
        let _ = indexer.ask(Command::Quit).await;
        for _ in 0..10 {
            universe.sleep(*quickwit_actors::HEARTBEAT).await;
            // Check indexing pipeline has restarted.
            let obs = indexing_pipeline_handler
                .process_pending_and_observe()
                .await;
            if obs.generation == 2 {
                assert_eq!(merge_pipeline_handler.check_health(true), Health::Healthy);
                universe.quit().await;
                return;
            }
        }
        panic!("Pipeline was apparently not restarted.");
    }

    async fn indexing_pipeline_all_failures_handling(test_file: &str) -> anyhow::Result<()> {
        let node_id = NodeId::from("test-node");
        let index_uid: IndexUid = IndexUid::for_test("test-index", 2);
        let pipeline_id = IndexingPipelineId {
            node_id,
            index_uid: index_uid.clone(),
            source_id: "test-source".to_string(),
            pipeline_uid: PipelineUid::for_test(0u128),
        };
        let source_config = SourceConfig {
            source_id: "test-source".to_string(),
            num_pipelines: NonZeroUsize::MIN,
            enabled: true,
            source_params: SourceParams::file_from_str(test_file).unwrap(),
            transform_config: None,
            input_format: SourceInputFormat::Json,
        };
        let source_config_clone = source_config.clone();

        let mut mock_metastore = MockMetastoreService::new();
        mock_metastore
            .expect_index_metadata()
            .withf(|index_metadata_request| {
                index_metadata_request.index_uid.as_ref().unwrap() == &("test-index", 2)
            })
            .returning(move |_| {
                let mut index_metadata =
                    IndexMetadata::for_test("test-index", "ram:///indexes/test-index");
                index_metadata
                    .add_source(source_config_clone.clone())
                    .unwrap();

                Ok(IndexMetadataResponse::try_from_index_metadata(&index_metadata).unwrap())
            });
        let index_uid_clone = index_uid.clone();
        mock_metastore
            .expect_last_delete_opstamp()
            .withf(move |last_delete_opstamp| last_delete_opstamp.index_uid() == &index_uid_clone)
            .returning(move |_| Ok(LastDeleteOpstampResponse::new(10)));
        mock_metastore
            .expect_stage_splits()
            .never()
            .returning(|_| Ok(EmptyResponse {}));
        let index_uid_clone = index_uid.clone();
        mock_metastore
            .expect_publish_splits()
            .withf(move |publish_splits_request| -> bool {
                let checkpoint_delta: IndexCheckpointDelta = publish_splits_request
                    .deserialize_index_checkpoint()
                    .unwrap()
                    .unwrap();
                publish_splits_request.index_uid() == &index_uid_clone
                    && publish_splits_request.staged_split_ids.is_empty()
                    && publish_splits_request.replaced_split_ids.is_empty()
                    && checkpoint_delta.source_id == "test-source"
                    && format!("{:?}", checkpoint_delta.source_delta)
                        .ends_with(":(00000000000000000000..~00000000000000001030])")
            })
            .returning(|_| Ok(EmptyResponse {}));
        let universe = Universe::new();
        let storage = Arc::new(RamStorage::default());
        let split_store = IndexingSplitStore::create_without_local_store_for_test(storage.clone());
        let (merge_planner_mailbox, _) = universe.create_test_mailbox();
        // Create a minimal mapper with wrong date format to ensure that all documents will fail
        let broken_mapper = serde_json::from_str::<DocMapper>(
            r#"
                {
                    "store_source": true,
                    "timestamp_field": "timestamp",
                    "field_mappings": [
                        {
                            "name": "timestamp",
                            "type": "datetime",
                            "input_formats": ["iso8601"],
                            "fast": true
                        }
                    ]
                }"#,
        )
        .unwrap();

        let pipeline_params = IndexingPipelineParams {
            pipeline_id,
            doc_mapper: Arc::new(broken_mapper),
            source_config,
            source_storage_resolver: StorageResolver::for_test(),
            indexing_directory: TempDirectory::for_test(),
            indexing_settings: IndexingSettings::for_test(),
            ingester_pool: IngesterPool::default(),
            metastore: MetastoreServiceClient::from_mock(mock_metastore),
            queues_dir_path: PathBuf::from("./queues"),
            storage,
            split_store,
            merge_policy: default_merge_policy(),
            retention_policy: None,
            max_concurrent_split_uploads_index: 4,
            max_concurrent_split_uploads_merge: 5,
            cooperative_indexing_permits: None,
            merge_planner_mailbox,
            params_fingerprint: 42u64,
            event_broker: Default::default(),
        };
        let pipeline = IndexingPipeline::new(pipeline_params);
        let (_pipeline_mailbox, pipeline_handler) = universe.spawn_builder().spawn(pipeline);
        let (pipeline_exit_status, pipeline_statistics) = pipeline_handler.join().await;
        assert!(pipeline_exit_status.is_success());
        // flaky. Sometimes generations is 2.
        assert_eq!(pipeline_statistics.generation, 1);
        assert_eq!(pipeline_statistics.num_spawn_attempts, 1);
        assert_eq!(pipeline_statistics.num_published_splits, 0);
        assert_eq!(pipeline_statistics.num_empty_splits, 1);
        assert_eq!(
            pipeline_statistics.num_docs,
            pipeline_statistics.num_invalid_docs
        );
        universe.assert_quit().await;
        Ok(())
    }

    #[tokio::test]
    async fn test_indexing_pipeline_all_failures_handling() -> anyhow::Result<()> {
        indexing_pipeline_all_failures_handling("data/test_corpus.json").await
    }

    #[tokio::test]
    async fn test_indexing_pipeline_all_failures_handling_gz() -> anyhow::Result<()> {
        indexing_pipeline_all_failures_handling("data/test_corpus.json.gz").await
    }
}


================================================
FILE: quickwit/quickwit-indexing/src/actors/indexing_service.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::{HashMap, HashSet};
use std::fmt::{Debug, Formatter};
use std::path::PathBuf;
use std::sync::Arc;

use anyhow::Context;
use async_trait::async_trait;
use futures::TryStreamExt;
use itertools::Itertools;
use quickwit_actors::{
    Actor, ActorContext, ActorExitStatus, ActorHandle, ActorState, Handler, Healthz, Mailbox,
    Observation,
};
use quickwit_cluster::Cluster;
use quickwit_common::fs::get_cache_directory_path;
use quickwit_common::io::Limiter;
use quickwit_common::pubsub::EventBroker;
use quickwit_common::{io, temp_dir};
use quickwit_config::{
    INGEST_API_SOURCE_ID, IndexConfig, IndexerConfig, SourceConfig, build_doc_mapper,
    indexing_pipeline_params_fingerprint,
};
use quickwit_ingest::{
    DropQueueRequest, GetPartitionId, IngestApiService, IngesterPool, ListQueuesRequest,
    QUEUES_DIR_NAME,
};
use quickwit_metastore::{
    IndexMetadata, IndexMetadataResponseExt, IndexesMetadataResponseExt,
    ListIndexesMetadataResponseExt, ListSplitsQuery, ListSplitsRequestExt, ListSplitsResponseExt,
    SplitMetadata, SplitState,
};
use quickwit_proto::indexing::{
    ApplyIndexingPlanRequest, ApplyIndexingPlanResponse, IndexingError, IndexingPipelineId,
    IndexingTask, MergePipelineId, PipelineMetrics,
};
use quickwit_proto::metastore::{
    IndexMetadataRequest, IndexMetadataSubrequest, IndexesMetadataRequest,
    ListIndexesMetadataRequest, ListSplitsRequest, MetastoreResult, MetastoreService,
    MetastoreServiceClient,
};
use quickwit_proto::types::{IndexId, IndexUid, NodeId, PipelineUid, ShardId};
use quickwit_storage::StorageResolver;
use serde::{Deserialize, Serialize};
use time::OffsetDateTime;
use tokio::sync::Semaphore;
use tracing::{debug, error, info, warn};

use super::merge_pipeline::{MergePipeline, MergePipelineParams};
use super::{MergePlanner, MergeSchedulerService};
use crate::actors::merge_pipeline::FinishPendingMergesAndShutdownPipeline;
use crate::models::{DetachIndexingPipeline, DetachMergePipeline, ObservePipeline, SpawnPipeline};
use crate::source::{AssignShards, Assignment};
use crate::split_store::{IndexingSplitCache, SplitStoreQuota};
use crate::{IndexingPipeline, IndexingPipelineParams, IndexingSplitStore, IndexingStatistics};

/// Name of the indexing directory, usually located at `<data_dir_path>/indexing`.
pub const INDEXING_DIR_NAME: &str = "indexing";

#[derive(Clone, Debug, Default, Eq, PartialEq, Serialize, Deserialize)]
pub struct IndexingServiceCounters {
    pub num_running_pipelines: usize,
    pub num_successful_pipelines: usize,
    pub num_failed_pipelines: usize,
    pub num_running_merge_pipelines: usize,
    pub num_deleted_queues: usize,
    pub num_delete_queue_failures: usize,
}

struct MergePipelineHandle {
    mailbox: Mailbox<MergePlanner>,
    handle: ActorHandle<MergePipeline>,
}

struct PipelineHandle {
    mailbox: Mailbox<IndexingPipeline>,
    handle: ActorHandle<IndexingPipeline>,
    indexing_pipeline_id: IndexingPipelineId,
}

/// The indexing service is (single) actor service running on indexer and in charge
/// of executing the indexing plans received from the control plane.
///
/// Concretely this means receiving new plans, comparing the current situation
/// with the target situation, and spawning/shutting down the  indexing pipelines that
/// are respectively missing or extranumerous.
pub struct IndexingService {
    node_id: NodeId,
    indexing_root_directory: PathBuf,
    queue_dir_path: PathBuf,
    cluster: Cluster,
    metastore: MetastoreServiceClient,
    ingest_api_service_opt: Option<Mailbox<IngestApiService>>,
    merge_scheduler_service: Mailbox<MergeSchedulerService>,
    ingester_pool: IngesterPool,
    storage_resolver: StorageResolver,
    indexing_pipelines: HashMap<PipelineUid, PipelineHandle>,
    counters: IndexingServiceCounters,
    local_split_store: Arc<IndexingSplitCache>,
    max_concurrent_split_uploads: usize,
    merge_pipeline_handles: HashMap<MergePipelineId, MergePipelineHandle>,
    cooperative_indexing_permits: Option<Arc<Semaphore>>,
    merge_io_throughput_limiter_opt: Option<Limiter>,
    event_broker: EventBroker,
}

impl Debug for IndexingService {
    fn fmt(&self, formatter: &mut Formatter) -> std::fmt::Result {
        formatter
            .debug_struct("IndexingService")
            .field("cluster_id", &self.cluster.cluster_id())
            .field("self_node_id", &self.node_id)
            .field("indexing_root_directory", &self.indexing_root_directory)
            .finish()
    }
}

impl IndexingService {
    #[allow(clippy::too_many_arguments)]
    pub async fn new(
        node_id: NodeId,
        data_dir_path: PathBuf,
        indexer_config: IndexerConfig,
        num_blocking_threads: usize,
        cluster: Cluster,
        metastore: MetastoreServiceClient,
        ingest_api_service_opt: Option<Mailbox<IngestApiService>>,
        merge_scheduler_service: Mailbox<MergeSchedulerService>,
        ingester_pool: IngesterPool,
        storage_resolver: StorageResolver,
        event_broker: EventBroker,
    ) -> anyhow::Result<IndexingService> {
        let split_store_space_quota = SplitStoreQuota::try_new(
            indexer_config.split_store_max_num_splits,
            indexer_config.split_store_max_num_bytes,
        )?;
        let merge_io_throughput_limiter_opt =
            indexer_config.max_merge_write_throughput.map(io::limiter);
        let split_cache_dir_path = get_cache_directory_path(&data_dir_path);
        let local_split_store =
            IndexingSplitCache::open(split_cache_dir_path, split_store_space_quota).await?;
        let indexing_root_directory =
            temp_dir::create_or_purge_directory(&data_dir_path.join(INDEXING_DIR_NAME)).await?;
        let queue_dir_path = data_dir_path.join(QUEUES_DIR_NAME);
        let cooperative_indexing_permits = if indexer_config.enable_cooperative_indexing {
            Some(Arc::new(Semaphore::new(num_blocking_threads)))
        } else {
            None
        };
        Ok(IndexingService {
            node_id,
            indexing_root_directory,
            queue_dir_path,
            cluster,
            metastore,
            ingest_api_service_opt,
            merge_scheduler_service,
            ingester_pool,
            storage_resolver,
            local_split_store: Arc::new(local_split_store),
            indexing_pipelines: Default::default(),
            counters: Default::default(),
            max_concurrent_split_uploads: indexer_config.max_concurrent_split_uploads,
            merge_pipeline_handles: HashMap::new(),
            merge_io_throughput_limiter_opt,
            cooperative_indexing_permits,
            event_broker,
        })
    }

    async fn detach_indexing_pipeline(
        &mut self,
        pipeline_uid: &PipelineUid,
    ) -> Result<ActorHandle<IndexingPipeline>, IndexingError> {
        let pipeline_handle = self
            .indexing_pipelines
            .remove(pipeline_uid)
            .ok_or_else(|| {
                let message = format!("could not find indexing pipeline `{pipeline_uid}`");
                IndexingError::Internal(message)
            })?;
        self.counters.num_running_pipelines -= 1;
        Ok(pipeline_handle.handle)
    }

    async fn detach_merge_pipeline(
        &mut self,
        pipeline_id: &MergePipelineId,
    ) -> Result<ActorHandle<MergePipeline>, IndexingError> {
        let pipeline_handle = self
            .merge_pipeline_handles
            .remove(pipeline_id)
            .ok_or_else(|| {
                let message = format!("could not find merge pipeline `{pipeline_id}`");
                IndexingError::Internal(message)
            })?;
        self.counters.num_running_merge_pipelines -= 1;
        Ok(pipeline_handle.handle)
    }

    async fn observe_pipeline(
        &mut self,
        pipeline_uid: &PipelineUid,
    ) -> Result<Observation<IndexingStatistics>, IndexingError> {
        let pipeline_handle = &self
            .indexing_pipelines
            .get(pipeline_uid)
            .ok_or_else(|| {
                let message = format!("could not find indexing pipeline `{pipeline_uid}`");
                IndexingError::Internal(message)
            })?
            .handle;
        let observation = pipeline_handle.observe().await;
        Ok(observation)
    }

    async fn spawn_pipeline(
        &mut self,
        ctx: &ActorContext<Self>,
        index_id: IndexId,
        source_config: SourceConfig,
        pipeline_uid: PipelineUid,
    ) -> Result<IndexingPipelineId, IndexingError> {
        let index_metadata = self.index_metadata(ctx, &index_id).await?;
        let pipeline_id = IndexingPipelineId {
            index_uid: index_metadata.index_uid.clone(),
            source_id: source_config.source_id.clone(),
            node_id: self.node_id.clone(),
            pipeline_uid,
        };
        let index_config = index_metadata.into_index_config();
        self.spawn_pipeline_inner(
            ctx,
            pipeline_id.clone(),
            index_config,
            source_config,
            None,
            None,
        )
        .await?;
        Ok(pipeline_id)
    }

    async fn spawn_pipeline_inner(
        &mut self,
        ctx: &ActorContext<Self>,
        indexing_pipeline_id: IndexingPipelineId,
        index_config: IndexConfig,
        source_config: SourceConfig,
        immature_splits_opt: Option<Vec<SplitMetadata>>,
        expected_params_fingerprint: Option<u64>,
    ) -> Result<(), IndexingError> {
        if self
            .indexing_pipelines
            .contains_key(&indexing_pipeline_id.pipeline_uid)
        {
            let message = format!("pipeline `{indexing_pipeline_id}` already exists");
            return Err(IndexingError::Internal(message));
        }
        let pipeline_uid_str = indexing_pipeline_id.pipeline_uid.to_string();
        let indexing_directory = temp_dir::Builder::default()
            .join(&indexing_pipeline_id.index_uid.index_id)
            .join(&indexing_pipeline_id.index_uid.incarnation_id.to_string())
            .join(&indexing_pipeline_id.source_id)
            .join(&pipeline_uid_str)
            .tempdir_in(&self.indexing_root_directory)
            .map_err(|error| {
                let message = format!("failed to create indexing directory: {error}");
                IndexingError::Internal(message)
            })?;
        let storage = self
            .storage_resolver
            .resolve(&index_config.index_uri)
            .await
            .map_err(|error| {
                let message = format!("failed to spawn indexing pipeline: {error}");
                IndexingError::Internal(message)
            })?;
        let merge_policy =
            crate::merge_policy::merge_policy_from_settings(&index_config.indexing_settings);
        let retention_policy = index_config.retention_policy_opt.clone();
        let split_store = IndexingSplitStore::new(storage.clone(), self.local_split_store.clone());

        let doc_mapper = build_doc_mapper(&index_config.doc_mapping, &index_config.search_settings)
            .map_err(|error| IndexingError::Internal(error.to_string()))?;

        let merge_pipeline_id = indexing_pipeline_id.merge_pipeline_id();
        let merge_pipeline_params = MergePipelineParams {
            pipeline_id: merge_pipeline_id.clone(),
            doc_mapper: doc_mapper.clone(),
            indexing_directory: indexing_directory.clone(),
            metastore: self.metastore.clone(),
            split_store: split_store.clone(),
            merge_scheduler_service: self.merge_scheduler_service.clone(),
            merge_policy: merge_policy.clone(),
            retention_policy: retention_policy.clone(),
            merge_io_throughput_limiter_opt: self.merge_io_throughput_limiter_opt.clone(),
            max_concurrent_split_uploads: self.max_concurrent_split_uploads,
            event_broker: self.event_broker.clone(),
        };
        let merge_planner_mailbox =
            self.get_or_create_merge_pipeline(merge_pipeline_params, immature_splits_opt, ctx)?;
        // The concurrent uploads budget is split in 2: 1/2 for the indexing pipeline, 1/2 for the
        // merge pipeline.
        let max_concurrent_split_uploads_index = (self.max_concurrent_split_uploads / 2).max(1);
        let max_concurrent_split_uploads_merge =
            (self.max_concurrent_split_uploads - max_concurrent_split_uploads_index).max(1);

        let params_fingerprint =
            indexing_pipeline_params_fingerprint(&index_config, &source_config);
        if let Some(expected_params_fingerprint) = expected_params_fingerprint {
            // If the fingerprint of the config freshly fetched from the
            // metastore is different from that received from the control plane,
            // it means that the config changed again since the last indexing
            // plan was built. In this case, postpone the pipeline creation.
            if params_fingerprint != expected_params_fingerprint {
                info!(
                    index_id = indexing_pipeline_id.index_uid.index_id,
                    source_id = indexing_pipeline_id.source_id,
                    expected = expected_params_fingerprint,
                    actual = params_fingerprint,
                    "pipeline fingerprint mismatch, postponing pipeline creation"
                );
                return Ok(());
            }
        }
        let pipeline_params = IndexingPipelineParams {
            pipeline_id: indexing_pipeline_id.clone(),
            metastore: self.metastore.clone(),
            storage,

            // Indexing-related parameters
            doc_mapper,
            indexing_directory,
            indexing_settings: index_config.indexing_settings.clone(),
            split_store,
            max_concurrent_split_uploads_index,
            cooperative_indexing_permits: self.cooperative_indexing_permits.clone(),

            // Merge-related parameters
            merge_policy,
            retention_policy,
            max_concurrent_split_uploads_merge,
            merge_planner_mailbox,

            // Source-related parameters
            source_config,
            ingester_pool: self.ingester_pool.clone(),
            queues_dir_path: self.queue_dir_path.clone(),
            source_storage_resolver: self.storage_resolver.clone(),
            params_fingerprint,

            event_broker: self.event_broker.clone(),
        };
        let pipeline = IndexingPipeline::new(pipeline_params);
        let (pipeline_mailbox, pipeline_handle) = ctx.spawn_actor().spawn(pipeline);
        let pipeline_handle = PipelineHandle {
            mailbox: pipeline_mailbox,
            handle: pipeline_handle,
            indexing_pipeline_id: indexing_pipeline_id.clone(),
        };
        self.indexing_pipelines
            .insert(indexing_pipeline_id.pipeline_uid, pipeline_handle);
        self.counters.num_running_pipelines += 1;
        Ok(())
    }

    async fn index_metadata(
        &mut self,
        ctx: &ActorContext<Self>,
        index_id: &str,
    ) -> Result<IndexMetadata, IndexingError> {
        let _protected_zone_guard = ctx.protect_zone();
        let index_metadata_response = self
            .metastore
            .index_metadata(IndexMetadataRequest::for_index_id(index_id.to_string()))
            .await?;
        let index_metadata = index_metadata_response.deserialize_index_metadata()?;
        Ok(index_metadata)
    }

    async fn indexes_metadata(
        &mut self,
        ctx: &ActorContext<Self>,
        indexing_pipeline_ids: &[IndexingPipelineId],
    ) -> Result<Vec<IndexMetadata>, IndexingError> {
        let index_metadata_subrequests: Vec<IndexMetadataSubrequest> = indexing_pipeline_ids
            .iter()
            // Remove duplicate subrequests
            .unique_by(|pipeline_id| &pipeline_id.index_uid)
            .map(|pipeline_id| IndexMetadataSubrequest {
                index_id: None,
                index_uid: Some(pipeline_id.index_uid.clone()),
            })
            .collect();
        let indexes_metadata_request = IndexesMetadataRequest {
            subrequests: index_metadata_subrequests,
        };
        let _protected_zone_guard = ctx.protect_zone();

        let indexes_metadata_response = self
            .metastore
            .indexes_metadata(indexes_metadata_request)
            .await?;
        let indexes_metadata = indexes_metadata_response
            .deserialize_indexes_metadata()
            .await?;
        Ok(indexes_metadata)
    }

    /// Fetches the immature splits candidates for merge for all the indexing pipelines for which a
    /// merge pipeline is not running.
    async fn fetch_immature_splits_for_new_merge_pipelines(
        &mut self,
        indexing_pipeline_ids: &[IndexingPipelineId],
        ctx: &ActorContext<Self>,
    ) -> MetastoreResult<HashMap<MergePipelineId, Vec<SplitMetadata>>> {
        let mut index_uids = Vec::new();

        for indexing_pipeline_id in indexing_pipeline_ids {
            let merge_pipeline_id = indexing_pipeline_id.merge_pipeline_id();

            if !self.merge_pipeline_handles.contains_key(&merge_pipeline_id) {
                index_uids.push(merge_pipeline_id.index_uid);
            }
        }
        if index_uids.is_empty() {
            return Ok(Default::default());
        }
        index_uids.sort_unstable();
        index_uids.dedup();

        let list_splits_query = ListSplitsQuery::try_from_index_uids(index_uids)
            .expect("`index_uids` should not be empty")
            .with_node_id(self.node_id.clone())
            .with_split_state(SplitState::Published)
            .retain_immature(OffsetDateTime::now_utc());
        let list_splits_request =
            ListSplitsRequest::try_from_list_splits_query(&list_splits_query)?;

        let mut immature_splits_stream = ctx
            .protect_future(self.metastore.list_splits(list_splits_request))
            .await?;

        let mut per_merge_pipeline_immature_splits: HashMap<MergePipelineId, Vec<SplitMetadata>> =
            indexing_pipeline_ids
                .iter()
                .map(|indexing_pipeline_id| (indexing_pipeline_id.merge_pipeline_id(), Vec::new()))
                .collect();

        let mut num_immature_splits = 0usize;

        while let Some(list_splits_response) = immature_splits_stream.try_next().await? {
            for split_metadata in list_splits_response.deserialize_splits_metadata().await? {
                num_immature_splits += 1;

                let merge_pipeline_id = MergePipelineId {
                    node_id: self.node_id.clone(),
                    index_uid: split_metadata.index_uid.clone(),
                    source_id: split_metadata.source_id.clone(),
                };
                per_merge_pipeline_immature_splits
                    .entry(merge_pipeline_id)
                    .or_default()
                    .push(split_metadata);
            }
        }
        info!("fetched {num_immature_splits} splits candidates for merge");
        Ok(per_merge_pipeline_immature_splits)
    }

    async fn handle_supervise(&mut self) -> Result<(), ActorExitStatus> {
        self.indexing_pipelines
            .retain(|pipeline_uid, pipeline_handle| {
                match pipeline_handle.handle.state() {
                    ActorState::Paused | ActorState::Running => true,
                    ActorState::Success => {
                        info!(
                            pipeline_uid=%pipeline_uid,
                            "indexing pipeline exited successfully"
                        );
                        self.counters.num_successful_pipelines += 1;
                        self.counters.num_running_pipelines -= 1;
                        false
                    }
                    ActorState::Failure => {
                        // This should never happen: Indexing Pipelines are not supposed to fail,
                        // and are themselves in charge of supervising the pipeline actors.
                        error!(
                            pipeline_uid=%pipeline_uid,
                            "indexing pipeline exited with failure: this should never happen, please report"
                        );
                        self.counters.num_failed_pipelines += 1;
                        self.counters.num_running_pipelines -= 1;
                        false
                    }
                }
            });
        let merge_pipelines_to_retain: HashSet<MergePipelineId> = self
            .indexing_pipelines
            .values()
            .map(|pipeline_handle| pipeline_handle.indexing_pipeline_id.merge_pipeline_id())
            .collect();

        let merge_pipelines_to_shutdown: Vec<MergePipelineId> = self
            .merge_pipeline_handles
            .keys()
            .filter(|running_merge_pipeline_id| {
                !merge_pipelines_to_retain.contains(running_merge_pipeline_id)
            })
            .cloned()
            .collect();

        for merge_pipeline_to_shutdown in merge_pipelines_to_shutdown {
            if let Some((_, merge_pipeline_handle)) = self
                .merge_pipeline_handles
                .remove_entry(&merge_pipeline_to_shutdown)
            {
                // We gracefully shutdown the merge pipeline, so we can complete the in-flight
                // merges.
                info!(
                    index_uid=%merge_pipeline_to_shutdown.index_uid,
                    source_id=%merge_pipeline_to_shutdown.source_id,
                    "shutting down orphan merge pipeline"
                );
                // The queue capacity of the merge pipeline is unbounded, so `.send_message(...)`
                // should not block.
                // We avoid using `.quit()` here because it waits for the actor to exit.
                merge_pipeline_handle
                    .handle
                    .mailbox()
                    .send_message(FinishPendingMergesAndShutdownPipeline)
                    .await
                    .expect("merge pipeline mailbox should not be full");
            }
        }
        // Finally, we remove the completed or failed merge pipelines.
        self.merge_pipeline_handles
            .retain(|_, merge_pipeline_handle| merge_pipeline_handle.handle.state().is_running());
        self.counters.num_running_merge_pipelines = self.merge_pipeline_handles.len();
        self.update_chitchat_running_plan().await;

        let pipeline_metrics: HashMap<&IndexingPipelineId, PipelineMetrics> = self
            .indexing_pipelines
            .values()
            .filter_map(|pipeline_handle| {
                let indexing_statistics = pipeline_handle.handle.last_observation();
                let pipeline_metrics = indexing_statistics.pipeline_metrics_opt?;
                Some((&pipeline_handle.indexing_pipeline_id, pipeline_metrics))
            })
            .collect();
        self.cluster
            .update_self_node_pipeline_metrics(&pipeline_metrics)
            .await;
        Ok(())
    }

    fn get_or_create_merge_pipeline(
        &mut self,
        merge_pipeline_params: MergePipelineParams,
        immature_splits_opt: Option<Vec<SplitMetadata>>,
        ctx: &ActorContext<Self>,
    ) -> Result<Mailbox<MergePlanner>, IndexingError> {
        if let Some(merge_pipeline_handle) = self
            .merge_pipeline_handles
            .get(&merge_pipeline_params.pipeline_id)
        {
            return Ok(merge_pipeline_handle.mailbox.clone());
        }
        let merge_pipeline_id = merge_pipeline_params.pipeline_id.clone();
        let merge_pipeline =
            MergePipeline::new(merge_pipeline_params, immature_splits_opt, ctx.spawn_ctx());
        let merge_planner_mailbox = merge_pipeline.merge_planner_mailbox().clone();
        let (_pipeline_mailbox, pipeline_handle) = ctx.spawn_actor().spawn(merge_pipeline);
        let merge_pipeline_handle = MergePipelineHandle {
            mailbox: merge_planner_mailbox.clone(),
            handle: pipeline_handle,
        };
        self.merge_pipeline_handles
            .insert(merge_pipeline_id, merge_pipeline_handle);
        self.counters.num_running_merge_pipelines += 1;
        Ok(merge_planner_mailbox)
    }

    /// For all Ingest V2 pipelines, assigns the set of shards they should be working on.
    /// This is done regardless of whether there has been a change in their shard list
    /// or not.
    ///
    /// If a pipeline actor has failed, this function just logs an error.
    async fn assign_shards_to_pipelines(&mut self, tasks: &[IndexingTask]) {
        for task in tasks {
            if task.shard_ids.is_empty() {
                continue;
            }
            let pipeline_uid = task.pipeline_uid();
            let Some(pipeline_handle) = self.indexing_pipelines.get(&pipeline_uid) else {
                continue;
            };
            let assignment = Assignment {
                shard_ids: task.shard_ids.iter().cloned().collect(),
            };
            let message = AssignShards(assignment);

            if let Err(error) = pipeline_handle.mailbox.send_message(message).await {
                error!(%error, "failed to assign shards to indexing pipeline");
            }
        }
    }

    /// Applies the indexing plan by:
    /// - Stopping the running pipelines not present in the provided plan.
    /// - Starting the pipelines that are not running.
    async fn apply_indexing_plan(
        &mut self,
        tasks: &[IndexingTask],
        ctx: &ActorContext<Self>,
    ) -> Result<(), IndexingError> {
        let pipeline_diff = self.compute_pipeline_diff(tasks);

        if !pipeline_diff.pipelines_to_shutdown.is_empty() {
            self.shutdown_pipelines(&pipeline_diff.pipelines_to_shutdown)
                .await;
        }
        let mut spawn_pipeline_failures: Vec<IndexingPipelineId> = Vec::new();

        if !pipeline_diff.pipelines_to_spawn.is_empty() {
            spawn_pipeline_failures = self
                .spawn_pipelines(&pipeline_diff.pipelines_to_spawn, ctx)
                .await?;
        }
        self.assign_shards_to_pipelines(tasks).await;
        self.update_chitchat_running_plan().await;

        if !spawn_pipeline_failures.is_empty() {
            let message =
                format!("failed to spawn indexing pipelines: {spawn_pipeline_failures:?}");
            return Err(IndexingError::Internal(message));
        }
        Ok(())
    }

    /// Identifies the pipelines to spawn and shutdown by comparing the scheduled plan with the
    /// current running plan.
    fn compute_pipeline_diff(&self, tasks: &[IndexingTask]) -> IndexingPipelineDiff {
        let mut pipelines_to_spawn: Vec<IndexingTask> = Vec::new();
        let mut scheduled_pipeline_uids: HashSet<PipelineUid> = HashSet::with_capacity(tasks.len());

        for task in tasks {
            let pipeline_uid = task.pipeline_uid();

            if !self.indexing_pipelines.contains_key(&pipeline_uid) {
                pipelines_to_spawn.push(task.clone());
            }
            scheduled_pipeline_uids.insert(pipeline_uid);
        }
        let pipelines_to_shutdown: Vec<PipelineUid> = self
            .indexing_pipelines
            .keys()
            .filter(|pipeline_uid| !scheduled_pipeline_uids.contains(pipeline_uid))
            .copied()
            .collect();

        IndexingPipelineDiff {
            pipelines_to_shutdown,
            pipelines_to_spawn,
        }
    }

    /// Spawns the pipelines with supplied ids and returns a list of failed pipelines.
    async fn spawn_pipelines(
        &mut self,
        pipelines_to_spawn: &[IndexingTask],
        ctx: &ActorContext<Self>,
    ) -> Result<Vec<IndexingPipelineId>, IndexingError> {
        let pipelines_to_spawn_ids: Vec<_> = pipelines_to_spawn
            .iter()
            .map(|task| IndexingPipelineId {
                node_id: self.node_id.clone(),
                index_uid: task.index_uid().clone(),
                pipeline_uid: task.pipeline_uid(),
                source_id: task.source_id.clone(),
            })
            .collect();
        let indexes_metadata = self.indexes_metadata(ctx, &pipelines_to_spawn_ids).await?;

        let per_index_uid_indexes_metadata: HashMap<IndexUid, IndexMetadata> = indexes_metadata
            .into_iter()
            .map(|index_metadata| (index_metadata.index_uid.clone(), index_metadata))
            .collect();

        let mut per_merge_pipeline_immature_splits: HashMap<MergePipelineId, Vec<SplitMetadata>> =
            self.fetch_immature_splits_for_new_merge_pipelines(&pipelines_to_spawn_ids, ctx)
                .await?;

        let mut spawn_pipeline_failures: Vec<IndexingPipelineId> = Vec::new();

        for (task_to_spawn, id_to_spawn) in pipelines_to_spawn.iter().zip(pipelines_to_spawn_ids) {
            if let Some(index_metadata) =
                per_index_uid_indexes_metadata.get(task_to_spawn.index_uid())
            {
                if let Some(source_config) = index_metadata.sources.get(&task_to_spawn.source_id) {
                    let merge_pipeline_id = id_to_spawn.merge_pipeline_id();
                    let immature_splits_opt =
                        per_merge_pipeline_immature_splits.remove(&merge_pipeline_id);

                    if let Err(error) = self
                        .spawn_pipeline_inner(
                            ctx,
                            id_to_spawn.clone(),
                            index_metadata.index_config.clone(),
                            source_config.clone(),
                            immature_splits_opt,
                            Some(task_to_spawn.params_fingerprint),
                        )
                        .await
                    {
                        error!(pipeline_id=?id_to_spawn, %error, "failed to spawn pipeline");
                        spawn_pipeline_failures.push(id_to_spawn.clone());
                    }
                } else {
                    error!(pipeline_id=?id_to_spawn, "failed to spawn pipeline: source not found");
                    spawn_pipeline_failures.push(id_to_spawn.clone());
                }
            } else {
                error!(
                    "failed to spawn pipeline: index `{}` no longer exists",
                    id_to_spawn.index_uid
                );
                spawn_pipeline_failures.push(id_to_spawn.clone());
            }
        }
        Ok(spawn_pipeline_failures)
    }

    /// Shuts down the pipelines with supplied ids and performs necessary cleanup.
    async fn shutdown_pipelines(&mut self, pipelines_to_shutdown: &[PipelineUid]) {
        info!(
            pipeline_uids=?pipelines_to_shutdown,
            "shutdown indexing pipelines"
        );
        let should_gc_ingest_api_queues = pipelines_to_shutdown
            .iter()
            .flat_map(|pipeline_uid| self.indexing_pipelines.get(pipeline_uid))
            .any(|pipeline_handle| {
                pipeline_handle.indexing_pipeline_id.source_id == INGEST_API_SOURCE_ID
            });

        for pipeline_to_shutdown in pipelines_to_shutdown {
            match self.detach_indexing_pipeline(pipeline_to_shutdown).await {
                Ok(pipeline_handle) => {
                    // Killing the pipeline ensures that all the pipeline actors will stop.
                    pipeline_handle.kill().await;
                }
                Err(error) => {
                    // Just log the detach error, it can only come from a missing pipeline in the
                    // `indexing_pipeline_handles`.
                    error!(
                        pipeline_uid=%pipeline_to_shutdown,
                        ?error,
                        "failed to detach indexing pipeline",
                    );
                }
            }
        }
        // If at least one ingest source has been removed, the related index has possibly been
        // deleted. Thus we run a garbage collect to remove queues of potentially deleted
        // indexes.
        if should_gc_ingest_api_queues && let Err(error) = self.run_ingest_api_queues_gc().await {
            warn!(
                %error,
                "failed to garbage collect ingest API queues",
            );
        }
    }

    /// Broadcasts the current running plan via chitchat.
    async fn update_chitchat_running_plan(&self) {
        let mut indexing_tasks: Vec<IndexingTask> = self
            .indexing_pipelines
            .values()
            .map(|pipeline_handle| {
                let assignment = pipeline_handle.handle.last_observation();
                let shard_ids: Vec<ShardId> = assignment.shard_ids.iter().cloned().collect();
                IndexingTask {
                    index_uid: Some(pipeline_handle.indexing_pipeline_id.index_uid.clone()),
                    source_id: pipeline_handle.indexing_pipeline_id.source_id.clone(),
                    pipeline_uid: Some(pipeline_handle.indexing_pipeline_id.pipeline_uid),
                    shard_ids,
                    params_fingerprint: assignment.params_fingerprint,
                }
            })
            .collect();

        // TODO: Does anybody why we sort the indexing tasks by pipeline_uid here?
        indexing_tasks.sort_unstable_by_key(|task| task.pipeline_uid);

        self.cluster
            .update_self_node_indexing_tasks(&indexing_tasks)
            .await;
    }

    /// Garbage collects ingest API queues of deleted indexes.
    async fn run_ingest_api_queues_gc(&mut self) -> anyhow::Result<()> {
        let Some(ingest_api_service) = &self.ingest_api_service_opt else {
            return Ok(());
        };
        let queues: HashSet<String> = ingest_api_service
            .ask_for_res(ListQueuesRequest {})
            .await
            .context("failed to list queues")?
            .queues
            .into_iter()
            .collect();
        debug!(queues=?queues, "list ingest API queues");

        if queues.is_empty() {
            return Ok(());
        }
        let indexes_metadata = self
            .metastore
            .list_indexes_metadata(ListIndexesMetadataRequest::all())
            .await?
            .deserialize_indexes_metadata()
            .await?;
        let index_ids: HashSet<String> = indexes_metadata
            .into_iter()
            .map(|index_metadata| index_metadata.index_id().to_string())
            .collect();
        debug!(index_ids=?index_ids, "list indexes");

        let partition_id = ingest_api_service.ask(GetPartitionId).await?;
        let queue_ids_to_delete = queues.difference(&index_ids);

        for queue_id in queue_ids_to_delete {
            let delete_queue_res = ingest_api_service
                .ask_for_res(DropQueueRequest {
                    queue_id: queue_id.to_string(),
                })
                .await;
            if let Err(delete_queue_error) = delete_queue_res {
                error!(
                    index_id = %queue_id,
                    partition_id,
                    error = %delete_queue_error,
                    "failed to delete queue"
                );
                self.counters.num_delete_queue_failures += 1;
            } else {
                info!(
                    index_id = %queue_id,
                    partition_id,
                    "deleted queue successfully"
                );
                self.counters.num_deleted_queues += 1;
            }
        }
        Ok(())
    }
}

#[async_trait]
impl Handler<ObservePipeline> for IndexingService {
    type Reply = Result<Observation<IndexingStatistics>, IndexingError>;

    async fn handle(
        &mut self,
        msg: ObservePipeline,
        _ctx: &ActorContext<Self>,
    ) -> Result<Self::Reply, ActorExitStatus> {
        let pipeline_uid = msg.pipeline_id.pipeline_uid;
        let observation = self.observe_pipeline(&pipeline_uid).await;
        Ok(observation)
    }
}

#[async_trait]
impl Handler<DetachIndexingPipeline> for IndexingService {
    type Reply = Result<ActorHandle<IndexingPipeline>, IndexingError>;

    async fn handle(
        &mut self,
        msg: DetachIndexingPipeline,
        _ctx: &ActorContext<Self>,
    ) -> Result<Self::Reply, ActorExitStatus> {
        let pipeline_uid = msg.pipeline_id.pipeline_uid;
        let detach_pipeline_result = self.detach_indexing_pipeline(&pipeline_uid).await;
        Ok(detach_pipeline_result)
    }
}

#[async_trait]
impl Handler<DetachMergePipeline> for IndexingService {
    type Reply = Result<ActorHandle<MergePipeline>, IndexingError>;

    async fn handle(
        &mut self,
        msg: DetachMergePipeline,
        _ctx: &ActorContext<Self>,
    ) -> Result<Self::Reply, ActorExitStatus> {
        Ok(self.detach_merge_pipeline(&msg.pipeline_id).await)
    }
}

#[derive(Debug)]
struct SuperviseLoop;

#[async_trait]
impl Handler<SuperviseLoop> for IndexingService {
    type Reply = ();

    async fn handle(
        &mut self,
        _message: SuperviseLoop,
        ctx: &ActorContext<Self>,
    ) -> Result<(), ActorExitStatus> {
        self.handle_supervise().await?;
        ctx.schedule_self_msg(*quickwit_actors::HEARTBEAT, SuperviseLoop);
        Ok(())
    }
}

#[async_trait]
impl Actor for IndexingService {
    type ObservableState = IndexingServiceCounters;

    fn observable_state(&self) -> Self::ObservableState {
        self.counters.clone()
    }

    async fn initialize(&mut self, ctx: &ActorContext<Self>) -> Result<(), ActorExitStatus> {
        self.run_ingest_api_queues_gc().await?;
        self.handle(SuperviseLoop, ctx).await
    }
}

#[async_trait]
impl Handler<SpawnPipeline> for IndexingService {
    type Reply = Result<IndexingPipelineId, IndexingError>;
    async fn handle(
        &mut self,
        message: SpawnPipeline,
        ctx: &ActorContext<Self>,
    ) -> Result<Result<IndexingPipelineId, IndexingError>, ActorExitStatus> {
        Ok(self
            .spawn_pipeline(
                ctx,
                message.index_id,
                message.source_config,
                message.pipeline_uid,
            )
            .await)
    }
}

#[async_trait]
impl Handler<ApplyIndexingPlanRequest> for IndexingService {
    type Reply = Result<ApplyIndexingPlanResponse, IndexingError>;

    async fn handle(
        &mut self,
        plan_request: ApplyIndexingPlanRequest,
        ctx: &ActorContext<Self>,
    ) -> Result<Self::Reply, ActorExitStatus> {
        Ok(self
            .apply_indexing_plan(&plan_request.indexing_tasks, ctx)
            .await
            .map(|_| ApplyIndexingPlanResponse {}))
    }
}

#[async_trait]
impl Handler<Healthz> for IndexingService {
    type Reply = bool;

    async fn handle(
        &mut self,
        _msg: Healthz,
        _ctx: &ActorContext<Self>,
    ) -> Result<bool, ActorExitStatus> {
        // In the future, check metrics such as available disk space.
        Ok(true)
    }
}

#[derive(Debug)]
struct IndexingPipelineDiff {
    pipelines_to_shutdown: Vec<PipelineUid>,
    pipelines_to_spawn: Vec<IndexingTask>,
}

#[cfg(test)]
mod tests {
    use std::num::NonZeroUsize;
    use std::path::Path;
    use std::time::Duration;

    use quickwit_actors::{HEARTBEAT, Health, ObservationType, Supervisable, Universe};
    use quickwit_cluster::{ChannelTransport, create_cluster_for_test};
    use quickwit_common::ServiceStream;
    use quickwit_common::rand::append_random_suffix;
    use quickwit_config::{
        IngestApiConfig, KafkaSourceParams, SourceConfig, SourceInputFormat, SourceParams,
        VecSourceParams,
    };
    use quickwit_ingest::{CreateQueueIfNotExistsRequest, init_ingest_api};
    use quickwit_metastore::{
        AddSourceRequestExt, CreateIndexRequestExt, ListIndexesMetadataResponseExt, Split,
        metastore_for_test,
    };
    use quickwit_proto::indexing::IndexingTask;
    use quickwit_proto::metastore::{
        AddSourceRequest, CreateIndexRequest, DeleteIndexRequest, IndexMetadataResponse,
        IndexesMetadataResponse, ListIndexesMetadataResponse, ListSplitsResponse,
        MockMetastoreService,
    };

    use super::*;
    use crate::actors::merge_pipeline::SUPERVISE_LOOP_INTERVAL;

    async fn spawn_indexing_service_for_test(
        data_dir_path: &Path,
        universe: &Universe,
        metastore: MetastoreServiceClient,
        cluster: Cluster,
    ) -> (Mailbox<IndexingService>, ActorHandle<IndexingService>) {
        let indexer_config = IndexerConfig::for_test().unwrap();
        let num_blocking_threads = 1;
        let storage_resolver = StorageResolver::unconfigured();
        let queues_dir_path = data_dir_path.join(QUEUES_DIR_NAME);
        let ingest_api_service =
            init_ingest_api(universe, &queues_dir_path, &IngestApiConfig::default())
                .await
                .unwrap();
        let merge_scheduler_mailbox: Mailbox<MergeSchedulerService> = universe.get_or_spawn_one();
        let indexing_server = IndexingService::new(
            NodeId::from("test-node"),
            data_dir_path.to_path_buf(),
            indexer_config,
            num_blocking_threads,
            cluster,
            metastore,
            Some(ingest_api_service),
            merge_scheduler_mailbox,
            IngesterPool::default(),
            storage_resolver.clone(),
            EventBroker::default(),
        )
        .await
        .unwrap();
        universe.spawn_builder().spawn(indexing_server)
    }

    #[tokio::test]
    async fn test_indexing_service_spawn_observe_detach() {
        quickwit_common::setup_logging_for_tests();
        let transport = ChannelTransport::default();
        let cluster = create_cluster_for_test(Vec::new(), &["indexer"], &transport, true)
            .await
            .unwrap();
        let metastore = metastore_for_test();

        let index_id = append_random_suffix("test-indexing-service");
        let index_uri = format!("ram:///indexes/{index_id}");
        let index_config = IndexConfig::for_test(&index_id, &index_uri);

        let create_index_request =
            CreateIndexRequest::try_from_index_config(&index_config).unwrap();
        let index_uid: IndexUid = metastore
            .create_index(create_index_request)
            .await
            .unwrap()
            .index_uid()
            .clone();
        let create_source_request = AddSourceRequest::try_from_source_config(
            index_uid.clone(),
            &SourceConfig::ingest_api_default(),
        )
        .unwrap();
        metastore.add_source(create_source_request).await.unwrap();

        let universe = Universe::with_accelerated_time();
        let temp_dir = tempfile::tempdir().unwrap();
        let (indexing_service, indexing_service_handle) =
            spawn_indexing_service_for_test(temp_dir.path(), &universe, metastore, cluster).await;
        let observation = indexing_service_handle.observe().await;
        assert_eq!(observation.num_running_pipelines, 0);
        assert_eq!(observation.num_failed_pipelines, 0);
        assert_eq!(observation.num_successful_pipelines, 0);

        // Test `spawn_pipeline`.
        let source_config_0 = SourceConfig {
            source_id: "test-indexing-service--source-0".to_string(),
            num_pipelines: NonZeroUsize::MIN,
            enabled: true,
            source_params: SourceParams::void(),
            transform_config: None,
            input_format: SourceInputFormat::Json,
        };
        let spawn_pipeline_msg = SpawnPipeline {
            index_id: index_id.clone(),
            pipeline_uid: PipelineUid::for_test(1111u128),
            source_config: source_config_0.clone(),
        };
        let pipeline_id: IndexingPipelineId = indexing_service
            .ask_for_res(spawn_pipeline_msg.clone())
            .await
            .unwrap();
        indexing_service
            .ask_for_res(spawn_pipeline_msg)
            .await
            .unwrap_err();
        assert_eq!(pipeline_id.index_uid.index_id, index_id);
        assert_eq!(pipeline_id.source_id, source_config_0.source_id);
        assert_eq!(pipeline_id.node_id, "test-node");
        assert_eq!(pipeline_id.pipeline_uid, PipelineUid::for_test(1111u128));
        assert_eq!(
            indexing_service_handle
                .observe()
                .await
                .num_running_pipelines,
            1
        );

        // Test `observe_pipeline`.
        let observation = indexing_service
            .ask_for_res(ObservePipeline {
                pipeline_id: pipeline_id.clone(),
            })
            .await
            .unwrap();
        assert_eq!(observation.obs_type, ObservationType::Alive);
        assert_eq!(observation.generation, 1);
        assert_eq!(observation.num_spawn_attempts, 1);

        // Test detach.
        let pipeline_handle = indexing_service
            .ask_for_res(DetachIndexingPipeline {
                pipeline_id: pipeline_id.clone(),
            })
            .await
            .unwrap();
        pipeline_handle.kill().await;
        let _merge_pipeline = indexing_service
            .ask_for_res(DetachMergePipeline {
                pipeline_id: pipeline_id.merge_pipeline_id(),
            })
            .await
            .unwrap();
        let observation = indexing_service_handle.process_pending_and_observe().await;
        assert_eq!(observation.num_running_pipelines, 0);
        assert_eq!(observation.num_running_merge_pipelines, 0);
        universe.assert_quit().await;
    }

    #[tokio::test]
    async fn test_indexing_service_supervise_pipelines() {
        quickwit_common::setup_logging_for_tests();
        let transport = ChannelTransport::default();
        let cluster = create_cluster_for_test(Vec::new(), &["indexer"], &transport, true)
            .await
            .unwrap();
        let metastore = metastore_for_test();

        let index_id = append_random_suffix("test-indexing-service");
        let index_uri = format!("ram:///indexes/{index_id}");
        let index_config = IndexConfig::for_test(&index_id, &index_uri);

        let source_config = SourceConfig {
            source_id: "test-indexing-service--source".to_string(),
            num_pipelines: NonZeroUsize::MIN,
            enabled: true,
            source_params: SourceParams::Vec(VecSourceParams {
                docs: Vec::new(),
                batch_num_docs: 10,
                partition: "0".to_string(),
            }),
            transform_config: None,
            input_format: SourceInputFormat::Json,
        };
        let create_index_request = CreateIndexRequest::try_from_index_and_source_configs(
            &index_config,
            std::slice::from_ref(&source_config),
        )
        .unwrap();
        metastore.create_index(create_index_request).await.unwrap();

        let universe = Universe::new();
        let temp_dir = tempfile::tempdir().unwrap();
        let (indexing_service, indexing_server_handle) =
            spawn_indexing_service_for_test(temp_dir.path(), &universe, metastore, cluster).await;

        indexing_service
            .ask_for_res(SpawnPipeline {
                index_id: index_id.clone(),
                source_config,
                pipeline_uid: PipelineUid::default(),
            })
            .await
            .unwrap();
        for _ in 0..2000 {
            let obs = indexing_server_handle.observe().await;
            if obs.num_successful_pipelines == 1 {
                // It may or may not panic
                universe.quit().await;
                return;
            }
            universe.sleep(Duration::from_millis(100)).await;
        }
        panic!("Pipeline not exited successfully.");
    }

    #[tokio::test]
    async fn test_indexing_service_apply_plan() {
        const PARAMS_FINGERPRINT_INGEST_API: u64 = 1637744865450232394;
        const PARAMS_FINGERPRINT_SOURCE_1: u64 = 1705211905504908791;
        const PARAMS_FINGERPRINT_SOURCE_2: u64 = 8706667372658059428;

        quickwit_common::setup_logging_for_tests();
        let transport = ChannelTransport::default();
        let cluster = create_cluster_for_test(Vec::new(), &["indexer"], &transport, true)
            .await
            .unwrap();
        let metastore = metastore_for_test();

        let index_id = append_random_suffix("test-indexing-service");
        let index_uri = format!("ram:///indexes/{index_id}");
        let index_config = IndexConfig::for_test(&index_id, &index_uri);

        let create_index_request =
            CreateIndexRequest::try_from_index_config(&index_config).unwrap();
        let index_uid: IndexUid = metastore
            .create_index(create_index_request)
            .await
            .unwrap()
            .index_uid()
            .clone();
        let add_source_request = AddSourceRequest::try_from_source_config(
            index_uid.clone(),
            &SourceConfig::ingest_api_default(),
        )
        .unwrap();
        metastore.add_source(add_source_request).await.unwrap();
        let universe = Universe::new();
        let temp_dir = tempfile::tempdir().unwrap();
        let (indexing_service, indexing_service_handle) = spawn_indexing_service_for_test(
            temp_dir.path(),
            &universe,
            metastore.clone(),
            cluster.clone(),
        )
        .await;
        let metadata = metastore
            .index_metadata(IndexMetadataRequest::for_index_id(index_id.clone()))
            .await
            .unwrap()
            .deserialize_index_metadata()
            .unwrap();

        let source_config_1 = SourceConfig {
            source_id: "test-indexing-service--source-1".to_string(),
            num_pipelines: NonZeroUsize::MIN,
            enabled: true,
            source_params: SourceParams::void(),
            transform_config: None,
            input_format: SourceInputFormat::Json,
        };
        {
            // Assign 2 indexing tasks
            // -> total: 1 source * 2 pipelines
            let add_source_request =
                AddSourceRequest::try_from_source_config(index_uid.clone(), &source_config_1)
                    .unwrap();
            metastore.add_source(add_source_request).await.unwrap();
            let indexing_tasks = vec![
                IndexingTask {
                    index_uid: Some(metadata.index_uid.clone()),
                    source_id: source_config_1.source_id.clone(),
                    shard_ids: Vec::new(),
                    pipeline_uid: Some(PipelineUid::for_test(0u128)),
                    params_fingerprint: PARAMS_FINGERPRINT_SOURCE_1,
                },
                IndexingTask {
                    index_uid: Some(metadata.index_uid.clone()),
                    source_id: source_config_1.source_id.clone(),
                    shard_ids: Vec::new(),
                    pipeline_uid: Some(PipelineUid::for_test(1u128)),
                    params_fingerprint: PARAMS_FINGERPRINT_SOURCE_1,
                },
            ];
            indexing_service
                .ask_for_res(ApplyIndexingPlanRequest { indexing_tasks })
                .await
                .unwrap();
            assert_eq!(
                indexing_service_handle
                    .observe()
                    .await
                    .num_running_pipelines,
                2
            );
        }
        let kafka_params = KafkaSourceParams {
            topic: "my-topic".to_string(),
            client_log_level: None,
            client_params: serde_json::Value::Null,
            enable_backfill_mode: false,
        };
        let source_config_2 = SourceConfig {
            source_id: "test-indexing-service--source-2".to_string(),
            num_pipelines: NonZeroUsize::new(2).unwrap(),
            enabled: true,
            source_params: SourceParams::Kafka(kafka_params),
            transform_config: None,
            input_format: SourceInputFormat::Json,
        };
        {
            // Assign 2 more indexing tasks (1 new source + activate ingest API source)
            // -> total: 2 source * 1 pipeline + 1 source * 2 pipelines
            let add_source_request_2 =
                AddSourceRequest::try_from_source_config(index_uid.clone(), &source_config_2)
                    .unwrap();
            metastore.add_source(add_source_request_2).await.unwrap();

            let indexing_tasks = vec![
                IndexingTask {
                    index_uid: Some(metadata.index_uid.clone()),
                    source_id: INGEST_API_SOURCE_ID.to_string(),
                    shard_ids: Vec::new(),
                    pipeline_uid: Some(PipelineUid::for_test(3u128)),
                    params_fingerprint: PARAMS_FINGERPRINT_INGEST_API,
                },
                IndexingTask {
                    index_uid: Some(metadata.index_uid.clone()),
                    source_id: source_config_1.source_id.clone(),
                    shard_ids: Vec::new(),
                    pipeline_uid: Some(PipelineUid::for_test(1u128)),
                    params_fingerprint: PARAMS_FINGERPRINT_SOURCE_1,
                },
                IndexingTask {
                    index_uid: Some(metadata.index_uid.clone()),
                    source_id: source_config_1.source_id.clone(),
                    shard_ids: Vec::new(),
                    pipeline_uid: Some(PipelineUid::for_test(2u128)),
                    params_fingerprint: PARAMS_FINGERPRINT_SOURCE_1,
                },
                IndexingTask {
                    index_uid: Some(metadata.index_uid.clone()),
                    source_id: source_config_2.source_id.clone(),
                    shard_ids: Vec::new(),
                    pipeline_uid: Some(PipelineUid::for_test(4u128)),
                    params_fingerprint: PARAMS_FINGERPRINT_SOURCE_2,
                },
            ];
            indexing_service
                .ask_for_res(ApplyIndexingPlanRequest {
                    indexing_tasks: indexing_tasks.clone(),
                })
                .await
                .unwrap();
            assert_eq!(
                indexing_service_handle
                    .observe()
                    .await
                    .num_running_pipelines,
                4
            );
            cluster
                .wait_for_ready_members(
                    |members| {
                        members
                            .iter()
                            .any(|member| member.indexing_tasks.len() == indexing_tasks.len())
                    },
                    Duration::from_secs(5),
                )
                .await
                .unwrap();
            let self_member = &cluster.ready_members().await[0];
            assert_eq!(
                HashSet::<_>::from_iter(self_member.indexing_tasks.iter()),
                HashSet::from_iter(indexing_tasks.iter())
            );
        }
        {
            // Remove 1 task (source_1 runs only 1 pipeline)
            // -> total = 3 sources x 1 pipeline each
            let indexing_tasks = vec![
                IndexingTask {
                    index_uid: Some(metadata.index_uid.clone()),
                    source_id: INGEST_API_SOURCE_ID.to_string(),
                    shard_ids: Vec::new(),
                    pipeline_uid: Some(PipelineUid::for_test(3u128)),
                    params_fingerprint: PARAMS_FINGERPRINT_INGEST_API,
                },
                IndexingTask {
                    index_uid: Some(metadata.index_uid.clone()),
                    source_id: source_config_1.source_id.clone(),
                    shard_ids: Vec::new(),
                    pipeline_uid: Some(PipelineUid::for_test(1u128)),
                    params_fingerprint: PARAMS_FINGERPRINT_SOURCE_1,
                },
                IndexingTask {
                    index_uid: Some(metadata.index_uid.clone()),
                    source_id: source_config_2.source_id.clone(),
                    shard_ids: Vec::new(),
                    pipeline_uid: Some(PipelineUid::for_test(4u128)),
                    params_fingerprint: PARAMS_FINGERPRINT_SOURCE_2,
                },
            ];
            indexing_service
                .ask_for_res(ApplyIndexingPlanRequest {
                    indexing_tasks: indexing_tasks.clone(),
                })
                .await
                .unwrap();
            let indexing_service_obs = indexing_service_handle.observe().await;
            assert_eq!(indexing_service_obs.num_running_pipelines, 3);
            assert_eq!(indexing_service_obs.num_deleted_queues, 0);
            assert_eq!(indexing_service_obs.num_delete_queue_failures, 0);

            indexing_service_handle.process_pending_and_observe().await;

            cluster
                .wait_for_ready_members(
                    |members| {
                        members
                            .iter()
                            .any(|member| member.indexing_tasks.len() == indexing_tasks.len())
                    },
                    Duration::from_secs(5),
                )
                .await
                .unwrap();

            let self_member = &cluster.ready_members().await[0];

            assert_eq!(
                HashSet::<_>::from_iter(self_member.indexing_tasks.iter()),
                HashSet::from_iter(indexing_tasks.iter())
            );
        }
        {
            // Rescheduling a task (source_1) with an unexpected fingerprint
            // removes the existing pipeline but doesn't start a new one.
            // -> total: 2 sources x 1 pipeline
            let indexing_tasks = vec![
                IndexingTask {
                    index_uid: Some(metadata.index_uid.clone()),
                    source_id: INGEST_API_SOURCE_ID.to_string(),
                    shard_ids: Vec::new(),
                    pipeline_uid: Some(PipelineUid::for_test(3u128)),
                    params_fingerprint: PARAMS_FINGERPRINT_INGEST_API,
                },
                IndexingTask {
                    index_uid: Some(metadata.index_uid.clone()),
                    source_id: source_config_1.source_id.clone(),
                    shard_ids: Vec::new(),
                    pipeline_uid: Some(PipelineUid::for_test(7u128)),
                    params_fingerprint: 42,
                },
                IndexingTask {
                    index_uid: Some(metadata.index_uid.clone()),
                    source_id: source_config_2.source_id.clone(),
                    shard_ids: Vec::new(),
                    pipeline_uid: Some(PipelineUid::for_test(4u128)),
                    params_fingerprint: PARAMS_FINGERPRINT_SOURCE_2,
                },
            ];
            indexing_service
                .ask_for_res(ApplyIndexingPlanRequest {
                    indexing_tasks: indexing_tasks.clone(),
                })
                .await
                .unwrap();
            let indexing_service_obs = indexing_service_handle.observe().await;
            assert_eq!(indexing_service_obs.num_running_pipelines, 2);
            assert_eq!(indexing_service_obs.num_deleted_queues, 0);
            assert_eq!(indexing_service_obs.num_delete_queue_failures, 0);
        }

        // Delete index and apply empty plan
        metastore
            .delete_index(DeleteIndexRequest {
                index_uid: Some(index_uid.clone()),
            })
            .await
            .unwrap();
        indexing_service
            .ask_for_res(ApplyIndexingPlanRequest {
                indexing_tasks: Vec::new(),
            })
            .await
            .unwrap();
        let indexing_service_obs = indexing_service_handle.observe().await;
        assert_eq!(indexing_service_obs.num_running_pipelines, 0);
        assert_eq!(indexing_service_obs.num_deleted_queues, 1);
        assert_eq!(indexing_service_obs.num_delete_queue_failures, 0);
        indexing_service_handle.quit().await;
        universe.assert_quit().await;
    }

    #[tokio::test]
    async fn test_indexing_service_shutdown_merge_pipeline_when_no_indexing_pipeline() {
        quickwit_common::setup_logging_for_tests();
        let transport = ChannelTransport::default();
        let cluster = create_cluster_for_test(Vec::new(), &["indexer"], &transport, true)
            .await
            .unwrap();
        let metastore = metastore_for_test();

        let index_id = append_random_suffix("test-indexing-service");
        let index_uri = format!("ram:///indexes/{index_id}");
        let index_config = IndexConfig::for_test(&index_id, &index_uri);

        let source_config = SourceConfig {
            source_id: "test-indexing-service--source".to_string(),
            num_pipelines: NonZeroUsize::MIN,
            enabled: true,
            source_params: SourceParams::void(),
            transform_config: None,
            input_format: SourceInputFormat::Json,
        };
        let create_index_request =
            CreateIndexRequest::try_from_index_config(&index_config).unwrap();
        let index_uid: IndexUid = metastore
            .create_index(create_index_request)
            .await
            .unwrap()
            .index_uid()
            .clone();
        let add_source_request =
            AddSourceRequest::try_from_source_config(index_uid.clone(), &source_config).unwrap();
        metastore.add_source(add_source_request).await.unwrap();

        // Test `IndexingService::new`.
        let temp_dir = tempfile::tempdir().unwrap();
        let data_dir_path = temp_dir.path().to_path_buf();
        let indexer_config = IndexerConfig::for_test().unwrap();
        let num_blocking_threads = 1;
        let storage_resolver = StorageResolver::unconfigured();
        let universe = Universe::with_accelerated_time();
        let queues_dir_path = data_dir_path.join(QUEUES_DIR_NAME);
        let ingest_api_service =
            init_ingest_api(&universe, &queues_dir_path, &IngestApiConfig::default())
                .await
                .unwrap();
        let merge_scheduler_service = universe.get_or_spawn_one();
        let indexing_server = IndexingService::new(
            NodeId::from("test-node"),
            data_dir_path,
            indexer_config,
            num_blocking_threads,
            cluster.clone(),
            metastore.clone(),
            Some(ingest_api_service),
            merge_scheduler_service,
            IngesterPool::default(),
            storage_resolver.clone(),
            EventBroker::default(),
        )
        .await
        .unwrap();
        let (indexing_server_mailbox, indexing_server_handle) =
            universe.spawn_builder().spawn(indexing_server);
        let pipeline_id = indexing_server_mailbox
            .ask_for_res(SpawnPipeline {
                index_id: index_id.clone(),
                source_config,
                pipeline_uid: PipelineUid::default(),
            })
            .await
            .unwrap();
        let observation = indexing_server_handle.observe().await;
        assert_eq!(observation.num_running_pipelines, 1);
        assert_eq!(observation.num_failed_pipelines, 0);
        assert_eq!(observation.num_successful_pipelines, 0);
        assert_eq!(observation.num_running_merge_pipelines, 1);

        // Test `shutdown_pipeline`
        let pipeline = indexing_server_mailbox
            .ask_for_res(DetachIndexingPipeline { pipeline_id })
            .await
            .unwrap();
        pipeline.quit().await;

        // Let the service cleanup the merge pipelines.
        universe.sleep(*HEARTBEAT).await;

        let observation = indexing_server_handle.process_pending_and_observe().await;
        assert_eq!(observation.num_running_pipelines, 0);
        assert_eq!(observation.num_running_merge_pipelines, 0);
        universe.sleep(SUPERVISE_LOOP_INTERVAL).await;
        // Check that the merge pipeline is also shut down as they are no more indexing pipeilne on
        // the index.
        assert!(universe.get_one::<MergePipeline>().is_none());
        // It may or may not panic
        universe.quit().await;
    }

    #[derive(Debug)]
    struct FreezePipeline;
    #[async_trait]
    impl Handler<FreezePipeline> for IndexingPipeline {
        type Reply = ();
        async fn handle(
            &mut self,
            _: FreezePipeline,
            _ctx: &ActorContext<Self>,
        ) -> Result<Self::Reply, ActorExitStatus> {
            tokio::time::sleep(*HEARTBEAT * 5).await;
            Ok(())
        }
    }

    #[derive(Debug)]
    struct ObservePipelineHealth(IndexingPipelineId);
    #[async_trait]
    impl Handler<ObservePipelineHealth> for IndexingService {
        type Reply = Health;
        async fn handle(
            &mut self,
            message: ObservePipelineHealth,
            _ctx: &ActorContext<Self>,
        ) -> Result<Self::Reply, ActorExitStatus> {
            Ok(self
                .indexing_pipelines
                .get(&message.0.pipeline_uid)
                .unwrap()
                .handle
                .check_health(true))
        }
    }

    #[tokio::test]
    async fn test_indexing_service_does_not_shutdown_pipelines_on_indexing_pipeline_freeze() {
        quickwit_common::setup_logging_for_tests();
        let transport = ChannelTransport::default();
        let cluster = create_cluster_for_test(Vec::new(), &["indexer"], &transport, true)
            .await
            .unwrap();
        let index_id = append_random_suffix("test-indexing-service-indexing-pipeline-timeout");
        let index_uri = format!("ram:///indexes/{index_id}");
        let mut index_metadata = IndexMetadata::for_test(&index_id, &index_uri);
        let source_config = SourceConfig {
            source_id: "test-indexing-service--source".to_string(),
            num_pipelines: NonZeroUsize::MIN,
            enabled: true,
            source_params: SourceParams::void(),
            transform_config: None,
            input_format: SourceInputFormat::Json,
        };
        index_metadata
            .sources
            .insert(source_config.source_id.clone(), source_config.clone());
        let mut mock_metastore = MockMetastoreService::new();
        let index_metadata_clone = index_metadata.clone();
        mock_metastore
            .expect_list_indexes_metadata()
            .return_once(move |_request| {
                Ok(ListIndexesMetadataResponse::for_test(vec![
                    index_metadata_clone,
                ]))
            });
        mock_metastore.expect_index_metadata().returning(move |_| {
            Ok(IndexMetadataResponse::try_from_index_metadata(&index_metadata).unwrap())
        });
        mock_metastore
            .expect_list_splits()
            .returning(|_| Ok(ServiceStream::empty()));
        let universe = Universe::new();
        let temp_dir = tempfile::tempdir().unwrap();
        let (indexing_service, indexing_service_handle) = spawn_indexing_service_for_test(
            temp_dir.path(),
            &universe,
            MetastoreServiceClient::from_mock(mock_metastore),
            cluster,
        )
        .await;
        let _pipeline_id = indexing_service
            .ask_for_res(SpawnPipeline {
                index_id: index_id.clone(),
                source_config,
                pipeline_uid: PipelineUid::default(),
            })
            .await
            .unwrap();
        let observation = indexing_service_handle.observe().await;
        assert_eq!(observation.num_running_pipelines, 1);
        assert_eq!(observation.num_failed_pipelines, 0);
        assert_eq!(observation.num_successful_pipelines, 0);

        let indexing_pipeline = universe.get_one::<IndexingPipeline>().unwrap();

        // Freeze pipeline during 5 heartbeats.
        indexing_pipeline
            .send_message(FreezePipeline)
            .await
            .unwrap();
        universe.sleep(*HEARTBEAT * 5).await;
        // Check that indexing and merge pipelines are still running.
        let observation = indexing_service_handle.observe().await;
        assert_eq!(observation.num_running_pipelines, 1);
        assert_eq!(observation.num_failed_pipelines, 0);
        assert_eq!(observation.num_running_merge_pipelines, 1);
        // Might generate panics
        universe.quit().await;
    }

    #[tokio::test]
    async fn test_indexing_service_ingest_api_gc() {
        let index_id = "test-ingest-api-gc-index".to_string();
        let index_uri = format!("ram:///indexes/{index_id}");
        let index_config = IndexConfig::for_test(&index_id, &index_uri);
        let transport = ChannelTransport::default();
        let cluster = create_cluster_for_test(Vec::new(), &["indexer"], &transport, true)
            .await
            .unwrap();
        let metastore = metastore_for_test();
        let create_index_request =
            CreateIndexRequest::try_from_index_config(&index_config).unwrap();
        let index_uid: IndexUid = metastore
            .create_index(create_index_request)
            .await
            .unwrap()
            .index_uid()
            .clone();

        // Setup ingest api objects
        let universe = Universe::with_accelerated_time();
        let temp_dir = tempfile::tempdir().unwrap();
        let queues_dir_path = temp_dir.path().join(QUEUES_DIR_NAME);
        let ingest_api_service =
            init_ingest_api(&universe, &queues_dir_path, &IngestApiConfig::default())
                .await
                .unwrap();
        let create_queue_req = CreateQueueIfNotExistsRequest {
            queue_id: index_id.clone(),
        };
        ingest_api_service
            .ask_for_res(create_queue_req)
            .await
            .unwrap();

        // Setup `IndexingService`
        let data_dir_path = temp_dir.path().to_path_buf();
        let indexer_config = IndexerConfig::for_test().unwrap();
        let num_blocking_threads = 1;
        let storage_resolver = StorageResolver::unconfigured();
        let merge_scheduler_service: Mailbox<MergeSchedulerService> = universe.get_or_spawn_one();
        let mut indexing_server = IndexingService::new(
            NodeId::from("test-ingest-api-gc-node"),
            data_dir_path,
            indexer_config,
            num_blocking_threads,
            cluster.clone(),
            metastore.clone(),
            Some(ingest_api_service.clone()),
            merge_scheduler_service,
            IngesterPool::default(),
            storage_resolver.clone(),
            EventBroker::default(),
        )
        .await
        .unwrap();

        indexing_server.run_ingest_api_queues_gc().await.unwrap();
        assert_eq!(indexing_server.counters.num_deleted_queues, 0);

        metastore
            .delete_index(DeleteIndexRequest {
                index_uid: Some(index_uid.clone()),
            })
            .await
            .unwrap();

        indexing_server.run_ingest_api_queues_gc().await.unwrap();
        assert_eq!(indexing_server.counters.num_deleted_queues, 1);

        universe.assert_quit().await;
    }

    #[tokio::test]
    async fn test_indexing_service_apply_indexing_plan_batches_metastore_calls() {
        let temp_dir = tempfile::tempdir().unwrap();
        let universe = Universe::new();

        let mut mock_metastore = MockMetastoreService::new();
        mock_metastore
            .expect_index_metadata()
            .withf(|request| request.index_id.as_ref().unwrap() == "test-index-0")
            .return_once(|_request| {
                let index_metadata_0 =
                    IndexMetadata::for_test("test-index-0", "ram:///indexes/test-index-0");
                let response =
                    IndexMetadataResponse::try_from_index_metadata(&index_metadata_0).unwrap();
                Ok(response)
            });
        mock_metastore
            .expect_indexes_metadata()
            .withf(|request| {
                let index_uids: Vec<&IndexUid> = request
                    .subrequests
                    .iter()
                    .flat_map(|subrequest| &subrequest.index_uid)
                    .sorted()
                    .collect();

                index_uids == [&("test-index-1", 0), &("test-index-2", 0)]
            })
            .return_once(|_request| {
                let source_config = SourceConfig::for_test("test-source", SourceParams::void());

                let mut index_metadata_1 =
                    IndexMetadata::for_test("test-index-1", "ram:///indexes/test-index-1");
                index_metadata_1.add_source(source_config.clone()).unwrap();

                let mut index_metadata_2 =
                    IndexMetadata::for_test("test-index-2", "ram:///indexes/test-index-2");
                index_metadata_2.add_source(source_config).unwrap();

                let indexes_metadata = vec![index_metadata_1, index_metadata_2];
                let failures = Vec::new();
                let response = IndexesMetadataResponse::for_test(indexes_metadata, failures);
                Ok(response)
            });
        mock_metastore
            .expect_list_splits()
            .withf(|request| {
                let list_splits_query = request.deserialize_list_splits_query().unwrap();
                list_splits_query.index_uids.unwrap() == [("test-index-0", 0)]
            })
            .return_once(|_request| Ok(ServiceStream::empty()));
        mock_metastore
            .expect_list_splits()
            .withf(|request| {
                let list_splits_query = request.deserialize_list_splits_query().unwrap();
                list_splits_query.index_uids.unwrap() == [("test-index-1", 0), ("test-index-2", 0)]
            })
            .return_once(|_request| {
                let splits = vec![Split {
                    split_metadata: SplitMetadata::for_test("test-split".to_string()),
                    split_state: SplitState::Published,
                    update_timestamp: 0,
                    publish_timestamp: Some(0),
                }];
                let list_splits_response = ListSplitsResponse::try_from_splits(splits).unwrap();
                let response = ServiceStream::from(vec![Ok(list_splits_response)]);
                Ok(response)
            });

        let transport = ChannelTransport::default();
        let cluster = create_cluster_for_test(Vec::new(), &["indexer"], &transport, true)
            .await
            .unwrap();
        let (indexing_service, _indexing_service_handle) = spawn_indexing_service_for_test(
            temp_dir.path(),
            &universe,
            MetastoreServiceClient::from_mock(mock_metastore),
            cluster,
        )
        .await;

        let source_config = SourceConfig::for_test("test-source", SourceParams::void());

        indexing_service
            .ask_for_res(SpawnPipeline {
                index_id: "test-index-0".to_string(),
                source_config,
                pipeline_uid: PipelineUid::for_test(0),
            })
            .await
            .unwrap();

        indexing_service
            .ask_for_res(ApplyIndexingPlanRequest {
                indexing_tasks: vec![
                    IndexingTask {
                        index_uid: Some(IndexUid::for_test("test-index-0", 0)),
                        source_id: "test-source".to_string(),
                        shard_ids: Vec::new(),
                        pipeline_uid: Some(PipelineUid::for_test(0)),
                        params_fingerprint: 0,
                    },
                    IndexingTask {
                        index_uid: Some(IndexUid::for_test("test-index-1", 0)),
                        source_id: "test-source".to_string(),
                        shard_ids: Vec::new(),
                        pipeline_uid: Some(PipelineUid::for_test(1)),
                        params_fingerprint: 0,
                    },
                    IndexingTask {
                        index_uid: Some(IndexUid::for_test("test-index-2", 0)),
                        source_id: "test-source".to_string(),
                        shard_ids: Vec::new(),
                        pipeline_uid: Some(PipelineUid::for_test(2)),
                        params_fingerprint: 0,
                    },
                ],
            })
            .await
            .unwrap();

        universe.assert_quit().await;
    }
}


================================================
FILE: quickwit/quickwit-indexing/src/actors/merge_executor.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::BTreeSet;
use std::ops::RangeInclusive;
use std::path::Path;
use std::sync::Arc;
use std::time::Instant;

use anyhow::{Context, anyhow};
use async_trait::async_trait;
use fail::fail_point;
use itertools::Itertools;
use quickwit_actors::{Actor, ActorContext, ActorExitStatus, Handler, Mailbox, QueueCapacity};
use quickwit_common::io::IoControls;
use quickwit_common::runtimes::RuntimeType;
use quickwit_common::temp_dir::TempDirectory;
use quickwit_directories::UnionDirectory;
use quickwit_doc_mapper::DocMapper;
use quickwit_metastore::SplitMetadata;
use quickwit_proto::indexing::MergePipelineId;
use quickwit_proto::metastore::{
    DeleteTask, ListDeleteTasksRequest, MarkSplitsForDeletionRequest, MetastoreService,
    MetastoreServiceClient,
};
use quickwit_proto::types::{NodeId, SplitId};
use quickwit_query::get_quickwit_fastfield_normalizer_manager;
use quickwit_query::query_ast::QueryAst;
use tantivy::directory::{Advice, DirectoryClone, MmapDirectory, RamDirectory};
use tantivy::index::SegmentId;
use tantivy::tokenizer::TokenizerManager;
use tantivy::{DateTime, Directory, Index, IndexMeta, IndexWriter, SegmentReader};
use tokio::runtime::Handle;
use tracing::{debug, error, info, instrument, warn};

use crate::actors::Packager;
use crate::controlled_directory::ControlledDirectory;
use crate::merge_policy::MergeOperationType;
use crate::models::{IndexedSplit, IndexedSplitBatch, MergeScratch, PublishLock, SplitAttrs};

#[derive(Clone)]
pub struct MergeExecutor {
    pipeline_id: MergePipelineId,
    metastore: MetastoreServiceClient,
    doc_mapper: Arc<DocMapper>,
    io_controls: IoControls,
    merge_packager_mailbox: Mailbox<Packager>,
}

#[async_trait]
impl Actor for MergeExecutor {
    type ObservableState = ();

    fn runtime_handle(&self) -> Handle {
        RuntimeType::Blocking.get_runtime_handle()
    }

    fn observable_state(&self) -> Self::ObservableState {}

    fn queue_capacity(&self) -> QueueCapacity {
        QueueCapacity::Bounded(1)
    }

    fn name(&self) -> String {
        "MergeExecutor".to_string()
    }
}

#[async_trait]
impl Handler<MergeScratch> for MergeExecutor {
    type Reply = ();

    #[instrument(level = "info", name = "merge_executor", parent = merge_scratch.merge_task.merge_parent_span.id(), skip_all)]
    async fn handle(
        &mut self,
        merge_scratch: MergeScratch,
        ctx: &ActorContext<Self>,
    ) -> Result<(), ActorExitStatus> {
        let start = Instant::now();
        let merge_task = merge_scratch.merge_task;
        let indexed_split_opt: Option<IndexedSplit> = match merge_task.operation_type {
            MergeOperationType::Merge => {
                let merge_res = self
                    .process_merge(
                        merge_task.merge_split_id.clone(),
                        merge_task.splits.clone(),
                        merge_scratch.tantivy_dirs,
                        merge_scratch.merge_scratch_directory,
                        ctx,
                    )
                    .await;
                match merge_res {
                    Ok(indexed_split) => Some(indexed_split),
                    Err(err) => {
                        // A failure in a merge is a bit special.
                        //
                        // Instead of failing the pipeline, we just log it.
                        // The idea is to limit the risk associated with a potential split of death.
                        //
                        // Such a split is now not tracked by the merge planner and won't undergo a
                        // merge until the merge pipeline is restarted.
                        //
                        // With a merge policy that marks splits as mature after a day or so, this
                        // limits the noise associated to those failed
                        // merges.
                        error!(task=?merge_task, err=?err, "failed to merge splits");
                        return Ok(());
                    }
                }
            }
            MergeOperationType::DeleteAndMerge => {
                assert_eq!(
                    merge_task.splits.len(),
                    1,
                    "Delete tasks can be applied only on one split."
                );
                assert_eq!(merge_scratch.tantivy_dirs.len(), 1);
                let split_with_docs_to_delete = merge_task.splits[0].clone();
                self.process_delete_and_merge(
                    merge_task.merge_split_id.clone(),
                    split_with_docs_to_delete,
                    merge_scratch.tantivy_dirs,
                    merge_scratch.merge_scratch_directory,
                    ctx,
                )
                .await?
            }
        };
        if let Some(indexed_split) = indexed_split_opt {
            info!(
                merged_num_docs = %indexed_split.split_attrs.num_docs,
                elapsed_secs = %start.elapsed().as_secs_f32(),
                operation_type = %merge_task.operation_type,
                "merge-operation-success"
            );
            ctx.send_message(
                &self.merge_packager_mailbox,
                IndexedSplitBatch {
                    splits: vec![indexed_split],
                    checkpoint_delta_opt: Default::default(),
                    publish_lock: PublishLock::default(),
                    publish_token_opt: None,
                    batch_parent_span: merge_task.merge_parent_span.clone(),
                    merge_task_opt: Some(merge_task),
                },
            )
            .await?;
        } else {
            info!("no-splits-merged");
        }
        Ok(())
    }
}

fn combine_index_meta(mut index_metas: Vec<IndexMeta>) -> anyhow::Result<IndexMeta> {
    let mut union_index_meta = index_metas.pop().with_context(|| "only one IndexMeta")?;
    for index_meta in index_metas {
        union_index_meta.segments.extend(index_meta.segments);
    }
    Ok(union_index_meta)
}

fn open_split_directories(
    // Directories containing the splits to merge
    tantivy_dirs: &[Box<dyn Directory>],
    tokenizer_manager: &TokenizerManager,
) -> anyhow::Result<(IndexMeta, Vec<Box<dyn Directory>>)> {
    let mut directories: Vec<Box<dyn Directory>> = Vec::new();
    let mut index_metas = Vec::new();
    for tantivy_dir in tantivy_dirs {
        directories.push(tantivy_dir.clone());

        let index_meta = open_index(tantivy_dir.clone(), tokenizer_manager)?.load_metas()?;
        index_metas.push(index_meta);
    }
    let union_index_meta = combine_index_meta(index_metas)?;
    Ok((union_index_meta, directories))
}

/// Creates a directory with a single `meta.json` file describe in `index_meta`
fn create_shadowing_meta_json_directory(index_meta: IndexMeta) -> anyhow::Result<RamDirectory> {
    let union_index_meta_json = serde_json::to_string_pretty(&index_meta)?;
    let ram_directory = RamDirectory::default();
    ram_directory.atomic_write(Path::new("meta.json"), union_index_meta_json.as_bytes())?;
    Ok(ram_directory)
}

fn merge_time_range(splits: &[SplitMetadata]) -> Option<RangeInclusive<DateTime>> {
    splits
        .iter()
        .flat_map(|split| split.time_range.clone())
        .flat_map(|time_range| vec![*time_range.start(), *time_range.end()].into_iter())
        .minmax()
        .into_option()
        .map(|(min_timestamp, max_timestamp)| {
            DateTime::from_timestamp_secs(min_timestamp)
                ..=DateTime::from_timestamp_secs(max_timestamp)
        })
}

fn sum_doc_sizes_in_bytes(splits: &[SplitMetadata]) -> u64 {
    splits
        .iter()
        .map(|split| split.uncompressed_docs_size_in_bytes)
        .sum::<u64>()
}

fn sum_num_docs(splits: &[SplitMetadata]) -> u64 {
    splits.iter().map(|split| split.num_docs as u64).sum()
}

/// Following Boost's hash_combine.
fn combine_two_hashes(lhs: u64, rhs: u64) -> u64 {
    let update_to_xor = rhs
        .wrapping_add(0x9e3779b9)
        .wrapping_add(lhs << 6)
        .wrapping_add(lhs >> 2);
    lhs ^ update_to_xor
}

fn combine_partition_ids_aux(partition_ids: impl IntoIterator<Item = u64>) -> u64 {
    let sorted_unique_partition_ids: BTreeSet<u64> = partition_ids.into_iter().collect();
    let mut sorted_unique_partition_ids_it = sorted_unique_partition_ids.into_iter();
    if let Some(partition_id) = sorted_unique_partition_ids_it.next() {
        sorted_unique_partition_ids_it.fold(partition_id, |acc, partition_id| {
            combine_two_hashes(acc, partition_id)
        })
    } else {
        // This is not forbidden but this should never happen.
        0u64
    }
}

pub fn combine_partition_ids(splits: &[SplitMetadata]) -> u64 {
    combine_partition_ids_aux(splits.iter().map(|split| split.partition_id))
}

pub fn merge_split_attrs(
    pipeline_id: MergePipelineId,
    merge_split_id: SplitId,
    splits: &[SplitMetadata],
) -> anyhow::Result<SplitAttrs> {
    let partition_id = combine_partition_ids_aux(splits.iter().map(|split| split.partition_id));
    let time_range: Option<RangeInclusive<DateTime>> = merge_time_range(splits);
    let uncompressed_docs_size_in_bytes = sum_doc_sizes_in_bytes(splits);
    let num_docs = sum_num_docs(splits);
    let replaced_split_ids: Vec<SplitId> = splits
        .iter()
        .map(|split| split.split_id().to_string())
        .collect();
    let delete_opstamp = splits
        .iter()
        .map(|split| split.delete_opstamp)
        .min()
        .unwrap_or(0);
    let doc_mapping_uid = splits
        .first()
        .ok_or_else(|| anyhow::anyhow!("attempted to merge zero splits"))?
        .doc_mapping_uid;
    if splits
        .iter()
        .any(|split| split.doc_mapping_uid != doc_mapping_uid)
    {
        anyhow::bail!("attempted to merge splits with different doc mapping uid");
    }
    Ok(SplitAttrs {
        node_id: pipeline_id.node_id.clone(),
        index_uid: pipeline_id.index_uid.clone(),
        source_id: pipeline_id.source_id.clone(),
        doc_mapping_uid,
        split_id: merge_split_id,
        partition_id,
        replaced_split_ids,
        time_range,
        num_docs,
        uncompressed_docs_size_in_bytes,
        delete_opstamp,
        num_merge_ops: max_merge_ops(splits) + 1,
    })
}

fn max_merge_ops(splits: &[SplitMetadata]) -> usize {
    splits
        .iter()
        .map(|split| split.num_merge_ops)
        .max()
        .unwrap_or(0)
}

impl MergeExecutor {
    pub fn new(
        pipeline_id: MergePipelineId,
        metastore: MetastoreServiceClient,
        doc_mapper: Arc<DocMapper>,
        io_controls: IoControls,
        merge_packager_mailbox: Mailbox<Packager>,
    ) -> Self {
        MergeExecutor {
            pipeline_id,
            metastore,
            doc_mapper,
            io_controls,
            merge_packager_mailbox,
        }
    }

    async fn process_merge(
        &mut self,
        merge_split_id: SplitId,
        splits: Vec<SplitMetadata>,
        tantivy_dirs: Vec<Box<dyn Directory>>,
        merge_scratch_directory: TempDirectory,
        ctx: &ActorContext<Self>,
    ) -> anyhow::Result<IndexedSplit> {
        let (union_index_meta, split_directories) = open_split_directories(
            &tantivy_dirs,
            self.doc_mapper.tokenizer_manager().tantivy_manager(),
        )?;
        // TODO it would be nice if tantivy could let us run the merge in the current thread.
        fail_point!("before-merge-split");
        let controlled_directory = self
            .merge_split_directories(
                union_index_meta,
                split_directories,
                Vec::new(),
                None,
                merge_scratch_directory.path(),
                ctx,
            )
            .await?;
        fail_point!("after-merge-split");

        // This will have the side effect of deleting the directory containing the downloaded
        // splits.
        let merged_index = open_index(
            controlled_directory.clone(),
            self.doc_mapper.tokenizer_manager().tantivy_manager(),
        )?;
        ctx.record_progress();

        let split_attrs = merge_split_attrs(self.pipeline_id.clone(), merge_split_id, &splits)?;
        Ok(IndexedSplit {
            split_attrs,
            index: merged_index,
            split_scratch_directory: merge_scratch_directory,
            controlled_directory_opt: Some(controlled_directory),
        })
    }

    async fn process_delete_and_merge(
        &mut self,
        merge_split_id: SplitId,
        split: SplitMetadata,
        tantivy_dirs: Vec<Box<dyn Directory>>,
        merge_scratch_directory: TempDirectory,
        ctx: &ActorContext<Self>,
    ) -> anyhow::Result<Option<IndexedSplit>> {
        let list_delete_tasks_request =
            ListDeleteTasksRequest::new(split.index_uid.clone(), split.delete_opstamp);
        let delete_tasks = ctx
            .protect_future(self.metastore.list_delete_tasks(list_delete_tasks_request))
            .await?
            .delete_tasks;
        if delete_tasks.is_empty() {
            warn!(
                "No delete task found for split `{}` with `delete_optamp` = `{}`.",
                split.split_id(),
                split.delete_opstamp
            );
            return Ok(None);
        }

        let last_delete_opstamp = delete_tasks
            .iter()
            .map(|delete_task| delete_task.opstamp)
            .max()
            .expect("There is at least one delete task.");
        info!(
            delete_opstamp_start = split.delete_opstamp,
            num_delete_tasks = delete_tasks.len()
        );

        let (union_index_meta, split_directories) = open_split_directories(
            &tantivy_dirs,
            self.doc_mapper.tokenizer_manager().tantivy_manager(),
        )?;
        let controlled_directory = self
            .merge_split_directories(
                union_index_meta,
                split_directories,
                delete_tasks,
                Some(self.doc_mapper.clone()),
                merge_scratch_directory.path(),
                ctx,
            )
            .await?;

        // This will have the side effect of deleting the directory containing the downloaded split.
        let mut merged_index = Index::open(controlled_directory.clone())?;
        ctx.record_progress();
        merged_index.set_tokenizers(
            self.doc_mapper
                .tokenizer_manager()
                .tantivy_manager()
                .clone(),
        );
        merged_index.set_fast_field_tokenizers(
            get_quickwit_fastfield_normalizer_manager()
                .tantivy_manager()
                .clone(),
        );

        ctx.record_progress();

        // Compute merged split attributes.
        let merged_segment =
            if let Some(segment) = merged_index.searchable_segments()?.into_iter().next() {
                segment
            } else {
                info!(
                    "All documents from split `{}` were deleted.",
                    split.split_id()
                );
                let mark_splits_for_deletion_request = MarkSplitsForDeletionRequest::new(
                    split.index_uid.clone(),
                    vec![split.split_id.clone()],
                );
                self.metastore
                    .mark_splits_for_deletion(mark_splits_for_deletion_request)
                    .await?;
                return Ok(None);
            };

        let merged_segment_reader = SegmentReader::open(&merged_segment)?;
        let num_docs = merged_segment_reader.num_docs() as u64;
        let uncompressed_docs_size_in_bytes = (num_docs as f32
            * split.uncompressed_docs_size_in_bytes as f32
            / split.num_docs as f32) as u64;
        let time_range = if let Some(timestamp_field_name) = self.doc_mapper.timestamp_field_name()
        {
            let reader = merged_segment_reader
                .fast_fields()
                .date(timestamp_field_name)?;
            Some(reader.min_value()..=reader.max_value())
        } else {
            None
        };
        let indexed_split = IndexedSplit {
            split_attrs: SplitAttrs {
                node_id: NodeId::new(split.node_id),
                index_uid: split.index_uid,
                source_id: split.source_id,
                doc_mapping_uid: split.doc_mapping_uid,
                split_id: merge_split_id,
                partition_id: split.partition_id,
                replaced_split_ids: vec![split.split_id.clone()],
                time_range,
                num_docs,
                uncompressed_docs_size_in_bytes,
                delete_opstamp: last_delete_opstamp,
                num_merge_ops: split.num_merge_ops,
            },
            index: merged_index,
            split_scratch_directory: merge_scratch_directory,
            controlled_directory_opt: Some(controlled_directory),
        };
        Ok(Some(indexed_split))
    }

    async fn merge_split_directories(
        &self,
        union_index_meta: IndexMeta,
        split_directories: Vec<Box<dyn Directory>>,
        delete_tasks: Vec<DeleteTask>,
        doc_mapper_opt: Option<Arc<DocMapper>>,
        output_path: &Path,
        ctx: &ActorContext<MergeExecutor>,
    ) -> anyhow::Result<ControlledDirectory> {
        let shadowing_meta_json_directory = create_shadowing_meta_json_directory(union_index_meta)?;

        // This directory is here to receive the merged split, as well as the final meta.json file.
        let output_directory = ControlledDirectory::new(
            Box::new(MmapDirectory::open_with_madvice(
                output_path,
                Advice::Sequential,
            )?),
            self.io_controls
                .clone()
                .set_kill_switch(ctx.kill_switch().clone())
                .set_progress(ctx.progress().clone()),
        );
        let mut directory_stack: Vec<Box<dyn Directory>> = vec![
            output_directory.box_clone(),
            Box::new(shadowing_meta_json_directory),
        ];
        directory_stack.extend(split_directories.into_iter());
        let union_directory = UnionDirectory::union_of(directory_stack);
        let union_index = open_index(
            union_directory,
            self.doc_mapper.tokenizer_manager().tantivy_manager(),
        )?;

        ctx.record_progress();
        let _protect_guard = ctx.protect_zone();

        let mut index_writer: IndexWriter = union_index.writer_with_num_threads(1, 15_000_000)?;
        let num_delete_tasks = delete_tasks.len();
        if num_delete_tasks > 0 {
            let doc_mapper = doc_mapper_opt
                .ok_or_else(|| anyhow!("doc mapper must be present if there are delete tasks"))?;
            for delete_task in delete_tasks {
                let delete_query = delete_task
                    .delete_query
                    .expect("A delete task must have a delete query.");
                let query_ast: QueryAst = serde_json::from_str(&delete_query.query_ast)
                    .context("invalid query_ast json")?;
                // We ignore the docmapper default fields when we consider delete query.
                // We reparse the query here defensively, but actually, it should already have been
                // done in the delete task rest handler.
                let parsed_query_ast = query_ast.parse_user_query(&[]).context("invalid query")?;
                debug!(
                    "Delete all documents matched by query `{:?}`",
                    parsed_query_ast
                );
                let (query, _) =
                    doc_mapper.query(union_index.schema(), parsed_query_ast, false, None)?;
                index_writer.delete_query(query)?;
            }
            debug!("commit-delete-operations");
            index_writer.commit()?;
        }

        let segment_ids: Vec<SegmentId> = union_index
            .searchable_segment_metas()?
            .into_iter()
            .map(|segment_meta| segment_meta.id())
            .collect();

        // A merge is useless if there is no delete and only one segment.
        if num_delete_tasks == 0 && segment_ids.len() <= 1 {
            return Ok(output_directory);
        }

        // If after deletion there is no longer any document, don't try to merge.
        if num_delete_tasks != 0 && segment_ids.is_empty() {
            return Ok(output_directory);
        }

        debug!(segment_ids=?segment_ids,"merging-segments");
        // TODO it would be nice if tantivy could let us run the merge in the current thread.
        index_writer.merge(&segment_ids).await?;

        Ok(output_directory)
    }
}

fn open_index<T: Into<Box<dyn Directory>>>(
    directory: T,
    tokenizer_manager: &TokenizerManager,
) -> tantivy::Result<Index> {
    let mut index = Index::open(directory)?;
    index.set_tokenizers(tokenizer_manager.clone());
    index.set_fast_field_tokenizers(
        get_quickwit_fastfield_normalizer_manager()
            .tantivy_manager()
            .clone(),
    );
    Ok(index)
}

#[cfg(test)]
mod tests {
    use quickwit_actors::Universe;
    use quickwit_common::split_file;
    use quickwit_metastore::{
        ListSplitsRequestExt, MetastoreServiceStreamSplitsExt, SplitMetadata, StageSplitsRequestExt,
    };
    use quickwit_proto::metastore::{
        DeleteQuery, ListSplitsRequest, PublishSplitsRequest, StageSplitsRequest,
    };
    use serde_json::Value as JsonValue;
    use tantivy::{Document, ReloadPolicy, TantivyDocument};

    use super::*;
    use crate::merge_policy::{MergeOperation, MergeTask};
    use crate::{TestSandbox, get_tantivy_directory_from_split_bundle, new_split_id};

    #[tokio::test]
    async fn test_merge_executor() -> anyhow::Result<()> {
        let doc_mapping_yaml = r#"
            field_mappings:
              - name: body
                type: text
              - name: ts
                type: datetime
                input_formats:
                - unix_timestamp
                fast: true
            timestamp_field: ts
        "#;
        let test_sandbox =
            TestSandbox::create("test-index", doc_mapping_yaml, "", &["body"]).await?;
        for split_id in 0..4 {
            let single_doc = std::iter::once(
                serde_json::json!({"body ": format!("split{split_id}"), "ts": 1631072713u64 + split_id }),
            );
            test_sandbox.add_documents(single_doc).await?;
        }
        let metastore = test_sandbox.metastore();
        let index_uid = test_sandbox.index_uid();
        let list_splits_request = ListSplitsRequest::try_from_index_uid(index_uid.clone()).unwrap();
        let split_metas: Vec<SplitMetadata> = metastore
            .list_splits(list_splits_request)
            .await
            .unwrap()
            .collect_splits_metadata()
            .await
            .unwrap();
        assert_eq!(split_metas.len(), 4);
        let merge_scratch_directory = TempDirectory::for_test();
        let downloaded_splits_directory =
            merge_scratch_directory.named_temp_child("downloaded-splits-")?;
        let mut tantivy_dirs: Vec<Box<dyn Directory>> = Vec::new();
        for split_meta in &split_metas {
            let split_filename = split_file(split_meta.split_id());
            let dest_filepath = downloaded_splits_directory.path().join(&split_filename);
            test_sandbox
                .storage()
                .copy_to_file(Path::new(&split_filename), &dest_filepath)
                .await?;
            tantivy_dirs.push(get_tantivy_directory_from_split_bundle(&dest_filepath).unwrap())
        }
        let merge_operation = MergeOperation::new_merge_operation(split_metas);
        let merge_task = MergeTask::from_merge_operation_for_test(merge_operation);
        let merge_scratch = MergeScratch {
            merge_task,
            tantivy_dirs,
            merge_scratch_directory,
            downloaded_splits_directory,
        };
        let pipeline_id = MergePipelineId {
            node_id: test_sandbox.node_id(),
            index_uid,
            source_id: test_sandbox.source_id(),
        };
        let (merge_packager_mailbox, merge_packager_inbox) =
            test_sandbox.universe().create_test_mailbox();
        let merge_executor = MergeExecutor::new(
            pipeline_id,
            test_sandbox.metastore(),
            test_sandbox.doc_mapper(),
            IoControls::default(),
            merge_packager_mailbox,
        );
        let (merge_executor_mailbox, merge_executor_handle) = test_sandbox
            .universe()
            .spawn_builder()
            .spawn(merge_executor);
        merge_executor_mailbox.send_message(merge_scratch).await?;
        merge_executor_handle.process_pending_and_observe().await;
        let packager_msgs: Vec<IndexedSplitBatch> = merge_packager_inbox.drain_for_test_typed();
        assert_eq!(packager_msgs.len(), 1);
        let split_attrs_after_merge = &packager_msgs[0].splits[0].split_attrs;
        assert_eq!(split_attrs_after_merge.num_docs, 4);
        assert_eq!(split_attrs_after_merge.uncompressed_docs_size_in_bytes, 136);
        assert_eq!(split_attrs_after_merge.num_merge_ops, 1);
        let reader = packager_msgs[0].splits[0]
            .index
            .reader_builder()
            .reload_policy(ReloadPolicy::Manual)
            .try_into()?;
        let searcher = reader.searcher();
        assert_eq!(searcher.segment_readers().len(), 1);
        test_sandbox.assert_quit().await;
        Ok(())
    }

    #[test]
    fn test_combine_partition_ids_singleton_unchanged() {
        assert_eq!(combine_partition_ids_aux([17]), 17);
    }

    #[test]
    fn test_combine_partition_ids_zero_has_an_impact() {
        assert_ne!(
            combine_partition_ids_aux([12u64, 0u64]),
            combine_partition_ids_aux([12u64])
        );
    }

    #[test]
    fn test_combine_partition_ids_depends_on_partition_id_set() {
        assert_eq!(
            combine_partition_ids_aux([12, 16, 12, 13]),
            combine_partition_ids_aux([12, 16, 13])
        );
    }

    #[test]
    fn test_combine_partition_ids_order_does_not_matter() {
        assert_eq!(
            combine_partition_ids_aux([7, 12, 13]),
            combine_partition_ids_aux([12, 13, 7])
        );
    }

    async fn aux_test_delete_and_merge_executor(
        index_id: &str,
        docs: Vec<JsonValue>,
        delete_query: &str,
        result_docs: Vec<JsonValue>,
    ) -> anyhow::Result<()> {
        quickwit_common::setup_logging_for_tests();
        let doc_mapping_yaml = r#"
            field_mappings:
              - name: body
                type: text
              - name: ts
                type: datetime
                input_formats:
                - unix_timestamp
                fast: true
            timestamp_field: ts
        "#;
        let test_sandbox = TestSandbox::create(index_id, doc_mapping_yaml, "", &["body"]).await?;
        test_sandbox.add_documents(docs).await?;
        let metastore = test_sandbox.metastore();
        let index_uid = test_sandbox.index_uid();
        metastore
            .create_delete_task(DeleteQuery {
                index_uid: Some(index_uid.clone()),
                start_timestamp: None,
                end_timestamp: None,
                query_ast: quickwit_query::query_ast::qast_json_helper(delete_query, &["body"]),
            })
            .await?;
        let splits = metastore
            .list_splits(ListSplitsRequest::try_from_index_uid(index_uid.clone()).unwrap())
            .await
            .unwrap()
            .collect_splits()
            .await
            .unwrap();

        // We want to test a delete on a split with num_merge_ops > 0.
        let mut new_split_metadata = splits[0].split_metadata.clone();
        new_split_metadata.split_id = new_split_id();
        new_split_metadata.num_merge_ops = 1;
        let stage_splits_request =
            StageSplitsRequest::try_from_split_metadata(index_uid.clone(), &new_split_metadata)
                .unwrap();
        metastore.stage_splits(stage_splits_request).await.unwrap();
        let publish_splits_request = PublishSplitsRequest {
            index_uid: Some(index_uid.clone()),
            staged_split_ids: vec![new_split_metadata.split_id.to_string()],
            replaced_split_ids: vec![splits[0].split_metadata.split_id.to_string()],
            index_checkpoint_delta_json_opt: None,
            publish_token_opt: None,
        };
        metastore
            .publish_splits(publish_splits_request)
            .await
            .unwrap();
        let expected_uncompressed_docs_size_in_bytes =
            (new_split_metadata.uncompressed_docs_size_in_bytes as f32 / 2_f32) as u64;
        let merge_scratch_directory = TempDirectory::for_test();
        let downloaded_splits_directory =
            merge_scratch_directory.named_temp_child("downloaded-splits-")?;
        let split_filename = split_file(splits[0].split_metadata.split_id());
        let new_split_filename = split_file(new_split_metadata.split_id());
        let dest_filepath = downloaded_splits_directory.path().join(&new_split_filename);
        test_sandbox
            .storage()
            .copy_to_file(Path::new(&split_filename), &dest_filepath)
            .await?;
        let tantivy_dir = get_tantivy_directory_from_split_bundle(&dest_filepath).unwrap();
        let merge_operation = MergeOperation::new_delete_and_merge_operation(new_split_metadata);
        let merge_task = MergeTask::from_merge_operation_for_test(merge_operation);
        let merge_scratch = MergeScratch {
            merge_task,
            tantivy_dirs: vec![tantivy_dir],
            merge_scratch_directory,
            downloaded_splits_directory,
        };
        let pipeline_id = MergePipelineId {
            node_id: test_sandbox.node_id(),
            index_uid: test_sandbox.index_uid(),
            source_id: test_sandbox.source_id(),
        };
        let universe = Universe::with_accelerated_time();
        let (merge_packager_mailbox, merge_packager_inbox) = universe.create_test_mailbox();
        let delete_task_executor = MergeExecutor::new(
            pipeline_id,
            metastore,
            test_sandbox.doc_mapper(),
            IoControls::default(),
            merge_packager_mailbox,
        );
        let (delete_task_executor_mailbox, delete_task_executor_handle) =
            universe.spawn_builder().spawn(delete_task_executor);
        delete_task_executor_mailbox
            .send_message(merge_scratch)
            .await?;
        delete_task_executor_handle
            .process_pending_and_observe()
            .await;

        let packager_msgs: Vec<IndexedSplitBatch> = merge_packager_inbox.drain_for_test_typed();
        if !result_docs.is_empty() {
            assert_eq!(packager_msgs.len(), 1);
            let split = &packager_msgs[0].splits[0];
            assert_eq!(split.split_attrs.num_docs, result_docs.len() as u64);
            assert_eq!(split.split_attrs.delete_opstamp, 1);
            // Delete operations do not update the num_merge_ops value.
            assert_eq!(split.split_attrs.num_merge_ops, 1);
            assert_eq!(
                split.split_attrs.uncompressed_docs_size_in_bytes,
                expected_uncompressed_docs_size_in_bytes,
            );
            let reader = split
                .index
                .reader_builder()
                .reload_policy(ReloadPolicy::Manual)
                .try_into()?;
            let searcher = reader.searcher();
            assert_eq!(searcher.segment_readers().len(), 1);

            let documents_left = searcher
                .search(
                    &tantivy::query::AllQuery,
                    &tantivy::collector::TopDocs::with_limit(result_docs.len() + 1)
                        .order_by_score(),
                )?
                .into_iter()
                .map(|(_, doc_address)| {
                    let doc: TantivyDocument = searcher.doc(doc_address).unwrap();
                    let doc_json = doc.to_json(searcher.schema());
                    serde_json::from_str(&doc_json).unwrap()
                })
                .collect::<Vec<JsonValue>>();

            assert_eq!(documents_left.len(), result_docs.len());
            for doc in &documents_left {
                assert!(result_docs.contains(doc));
            }
            for doc in &result_docs {
                assert!(documents_left.contains(doc));
            }
        } else {
            assert!(packager_msgs.is_empty());
            let metastore = test_sandbox.metastore();
            let index_uid = test_sandbox.index_uid();
            let splits = metastore
                .list_splits(ListSplitsRequest::try_from_index_uid(index_uid).unwrap())
                .await
                .unwrap()
                .collect_splits()
                .await
                .unwrap();
            assert!(splits.iter().all(
                |split| split.split_state == quickwit_metastore::SplitState::MarkedForDeletion
            ));
        }
        test_sandbox.assert_quit().await;
        universe.assert_quit().await;
        Ok(())
    }

    #[tokio::test]
    async fn test_delete_and_merge_executor() -> anyhow::Result<()> {
        aux_test_delete_and_merge_executor(
            "test-delete-and-merge-index",
            vec![
                serde_json::json!({"body": "info", "ts": 1624928208 }),
                serde_json::json!({"body": "delete", "ts": 1634928208 }),
            ],
            "body:delete",
            vec![serde_json::json!({"body": ["info"], "ts": ["2021-06-29T00:56:48Z"] })],
        )
        .await
    }

    #[tokio::test]
    async fn test_delete_termset_and_merge_executor() -> anyhow::Result<()> {
        aux_test_delete_and_merge_executor(
            "test-delete-termset-and-merge-executor",
            vec![
                serde_json::json!({"body": "info", "ts": 1624928208 }),
                serde_json::json!({"body": "info", "ts": 1624928209 }),
                serde_json::json!({"body": "delete", "ts": 1634928208 }),
                serde_json::json!({"body": "delete", "ts": 1634928209 }),
            ],
            "body: IN [delete]",
            vec![
                serde_json::json!({"body": ["info"], "ts": ["2021-06-29T00:56:48Z"] }),
                serde_json::json!({"body": ["info"], "ts": ["2021-06-29T00:56:49Z"] }),
            ],
        )
        .await
    }

    #[tokio::test]
    async fn test_delete_all() -> anyhow::Result<()> {
        aux_test_delete_and_merge_executor(
            "test-delete-all",
            vec![
                serde_json::json!({"body": "delete", "ts": 1634928208 }),
                serde_json::json!({"body": "delete", "ts": 1634928209 }),
            ],
            "body:delete",
            Vec::new(),
        )
        .await
    }
}


================================================
FILE: quickwit/quickwit-indexing/src/actors/merge_pipeline.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::sync::Arc;
use std::time::{Duration, Instant};

use async_trait::async_trait;
use quickwit_actors::{
    Actor, ActorContext, ActorExitStatus, ActorHandle, HEARTBEAT, Handler, Health, Inbox, Mailbox,
    SpawnContext, Supervisable,
};
use quickwit_common::KillSwitch;
use quickwit_common::io::{IoControls, Limiter};
use quickwit_common::pubsub::EventBroker;
use quickwit_common::temp_dir::TempDirectory;
use quickwit_config::RetentionPolicy;
use quickwit_doc_mapper::DocMapper;
use quickwit_metastore::{
    ListSplitsQuery, ListSplitsRequestExt, MetastoreServiceStreamSplitsExt, SplitMetadata,
    SplitState,
};
use quickwit_proto::indexing::MergePipelineId;
use quickwit_proto::metastore::{
    ListSplitsRequest, MetastoreError, MetastoreResult, MetastoreService, MetastoreServiceClient,
};
use time::OffsetDateTime;
use tokio::sync::Semaphore;
use tracing::{debug, error, info, instrument};

use super::publisher::DisconnectMergePlanner;
use super::{MergeSchedulerService, RunFinalizeMergePolicyAndQuit};
use crate::actors::indexing_pipeline::wait_duration_before_retry;
use crate::actors::merge_split_downloader::MergeSplitDownloader;
use crate::actors::publisher::PublisherType;
use crate::actors::{MergeExecutor, MergePlanner, Packager, Publisher, Uploader, UploaderType};
use crate::merge_policy::MergePolicy;
use crate::models::MergeStatistics;
use crate::split_store::IndexingSplitStore;

/// Spawning a merge pipeline puts a lot of pressure on the metastore so
/// we rely on this semaphore to limit the number of merge pipelines that can be spawned
/// concurrently.
static SPAWN_PIPELINE_SEMAPHORE: Semaphore = Semaphore::const_new(10);

/// Instructs the merge pipeline that it should stop itself.
/// Merges that have already been scheduled are not aborted.
///
/// In addition, the finalizer merge policy will be executed to schedule a few
/// additional merges.
///
/// After reception the `FinalizeAndClosePipeline`, the merge pipeline loop will
/// be disconnected. In other words, the connection from the merge publisher to
/// the merge planner will be cut, so that the merge pipeline will terminate naturally.
///
/// Supervisation will still exist. However it will not restart the pipeline
/// in case of failure, it will just kill all of the merge pipeline actors. (for
/// instance, if one of the actor is stuck).
#[derive(Debug, Clone, Copy)]
pub struct FinishPendingMergesAndShutdownPipeline;

pub const SUPERVISE_LOOP_INTERVAL: Duration = Duration::from_secs(1);

struct MergePipelineHandles {
    merge_planner: ActorHandle<MergePlanner>,
    merge_split_downloader: ActorHandle<MergeSplitDownloader>,
    merge_executor: ActorHandle<MergeExecutor>,
    merge_packager: ActorHandle<Packager>,
    merge_uploader: ActorHandle<Uploader>,
    merge_publisher: ActorHandle<Publisher>,
    next_check_for_progress: Instant,
}

impl MergePipelineHandles {
    fn should_check_for_progress(&mut self) -> bool {
        let now = Instant::now();
        let check_for_progress = now > self.next_check_for_progress;
        if check_for_progress {
            self.next_check_for_progress = now + *HEARTBEAT;
        }
        check_for_progress
    }
}

// Messages
#[derive(Debug)]
struct SuperviseLoop;

#[derive(Clone, Copy, Debug, Default)]
struct Spawn {
    retry_count: usize,
}

pub struct MergePipeline {
    params: MergePipelineParams,
    merge_planner_mailbox: Mailbox<MergePlanner>,
    merge_planner_inbox: Inbox<MergePlanner>,
    previous_generations_statistics: MergeStatistics,
    statistics: MergeStatistics,
    handles_opt: Option<MergePipelineHandles>,
    kill_switch: KillSwitch,
    /// Immature splits passed to the merge planner the first time the pipeline is spawned.
    initial_immature_splits_opt: Option<Vec<SplitMetadata>>,
    // After it is set to true, we don't respawn pipeline actors if they fail.
    shutdown_initiated: bool,
}

#[async_trait]
impl Actor for MergePipeline {
    type ObservableState = MergeStatistics;

    fn observable_state(&self) -> Self::ObservableState {
        self.statistics.clone()
    }

    fn name(&self) -> String {
        "MergePipeline".to_string()
    }

    async fn initialize(&mut self, ctx: &ActorContext<Self>) -> Result<(), ActorExitStatus> {
        self.handle(Spawn::default(), ctx).await?;
        self.handle(SuperviseLoop, ctx).await?;
        Ok(())
    }
}

impl MergePipeline {
    /// Creates a new merge pipeline. `initial_immature_splits_opt` is typically "seeded" by the
    /// indexing service who fetches the immature splits from the metastore for all the merge
    /// pipelines it is about to spawn. By issuing a single metastore query instead of one per merge
    /// pipeline, we reduce the load on the metastore. If the merge pipeline crashes and is
    /// respawned by the supervisor, the immature splits are fetched directly from the metastore.
    pub fn new(
        params: MergePipelineParams,
        initial_immature_splits_opt: Option<Vec<SplitMetadata>>,
        spawn_ctx: &SpawnContext,
    ) -> Self {
        // TODO improve API. Maybe it could take a spawnbuilder as argument, hence removing the need
        // for a public create_mailbox / MessageCount.
        let (merge_planner_mailbox, merge_planner_inbox) = spawn_ctx
            .create_mailbox::<MergePlanner>("MergePlanner", MergePlanner::queue_capacity());
        Self {
            params,
            previous_generations_statistics: Default::default(),
            handles_opt: None,
            kill_switch: KillSwitch::default(),
            statistics: MergeStatistics::default(),
            merge_planner_inbox,
            merge_planner_mailbox,
            initial_immature_splits_opt,
            shutdown_initiated: false,
        }
    }

    pub fn merge_planner_mailbox(&self) -> &Mailbox<MergePlanner> {
        &self.merge_planner_mailbox
    }

    fn supervisables(&self) -> Vec<&dyn Supervisable> {
        if let Some(handles) = &self.handles_opt {
            let supervisables: Vec<&dyn Supervisable> = vec![
                &handles.merge_planner,
                &handles.merge_split_downloader,
                &handles.merge_executor,
                &handles.merge_packager,
                &handles.merge_uploader,
                &handles.merge_publisher,
            ];
            supervisables
        } else {
            Vec::new()
        }
    }

    /// Performs healthcheck on all of the actors in the pipeline,
    /// and consolidates the result.
    fn healthcheck(&self, check_for_progress: bool) -> Health {
        let mut healthy_actors: Vec<&str> = Default::default();
        let mut failure_or_unhealthy_actors: Vec<&str> = Default::default();
        let mut success_actors: Vec<&str> = Default::default();

        for supervisable in self.supervisables() {
            match supervisable.check_health(check_for_progress) {
                Health::Healthy => {
                    // At least one other actor is running.
                    healthy_actors.push(supervisable.name());
                }
                Health::FailureOrUnhealthy => {
                    failure_or_unhealthy_actors.push(supervisable.name());
                }
                Health::Success => {
                    success_actors.push(supervisable.name());
                }
            }
        }
        if !failure_or_unhealthy_actors.is_empty() {
            error!(
                index_uid=%self.params.pipeline_id.index_uid,
                source_id=%self.params.pipeline_id.source_id,
                generation=self.generation(),
                healthy_actors=?healthy_actors,
                failed_or_unhealthy_actors=?failure_or_unhealthy_actors,
                success_actors=?success_actors,
                "merge pipeline failed"
            );
            return Health::FailureOrUnhealthy;
        }
        if healthy_actors.is_empty() {
            // All the actors finished successfully.
            info!(
                index_uid=%self.params.pipeline_id.index_uid,
                source_id=%self.params.pipeline_id.source_id,
                generation=self.generation(),
                "merge pipeline completed successfully"
            );
            return Health::Success;
        }
        // No error at this point and there are still some actors running.
        debug!(
            index_uid=%self.params.pipeline_id.index_uid,
            source_id=%self.params.pipeline_id.source_id,
            generation=self.generation(),
            healthy_actors=?healthy_actors,
            failed_or_unhealthy_actors=?failure_or_unhealthy_actors,
            success_actors=?success_actors,
            "merge pipeline is running and healthy"
        );
        Health::Healthy
    }

    fn generation(&self) -> usize {
        self.statistics.generation
    }

    // TODO: Should return an error saying whether we can retry or not.
    #[instrument(name="spawn_merge_pipeline", level="info", skip_all, fields(index_uid=%self.params.pipeline_id.index_uid, generation=self.generation()))]
    async fn spawn_pipeline(&mut self, ctx: &ActorContext<Self>) -> anyhow::Result<()> {
        let _spawn_pipeline_permit = ctx
            .protect_future(SPAWN_PIPELINE_SEMAPHORE.acquire())
            .await
            .expect("semaphore should not be closed");

        self.statistics.num_spawn_attempts += 1;
        self.kill_switch = ctx.kill_switch().child();

        info!(
            index_uid=%self.params.pipeline_id.index_uid,
            source_id=%self.params.pipeline_id.source_id,
            root_dir=%self.params.indexing_directory.path().display(),
            merge_policy=?self.params.merge_policy,
            "spawning merge pipeline",
        );
        let immature_splits = self.fetch_immature_splits(ctx).await?;

        // Merge publisher
        let merge_publisher = Publisher::new(
            PublisherType::MergePublisher,
            self.params.metastore.clone(),
            Some(self.merge_planner_mailbox.clone()),
            None,
        );
        let (merge_publisher_mailbox, merge_publisher_handle) = ctx
            .spawn_actor()
            .set_kill_switch(self.kill_switch.clone())
            .set_backpressure_micros_counter(
                crate::metrics::INDEXER_METRICS
                    .backpressure_micros
                    .with_label_values(["merge_publisher"]),
            )
            .spawn(merge_publisher);

        // Merge uploader
        let merge_uploader = Uploader::new(
            UploaderType::MergeUploader,
            self.params.metastore.clone(),
            self.params.merge_policy.clone(),
            self.params.retention_policy.clone(),
            self.params.split_store.clone(),
            merge_publisher_mailbox.into(),
            self.params.max_concurrent_split_uploads,
            self.params.event_broker.clone(),
        );
        let (merge_uploader_mailbox, merge_uploader_handle) = ctx
            .spawn_actor()
            .set_kill_switch(self.kill_switch.clone())
            .spawn(merge_uploader);

        // Merge Packager
        let tag_fields = self.params.doc_mapper.tag_named_fields()?;
        let merge_packager = Packager::new("MergePackager", tag_fields, merge_uploader_mailbox);
        let (merge_packager_mailbox, merge_packager_handle) = ctx
            .spawn_actor()
            .set_kill_switch(self.kill_switch.clone())
            .spawn(merge_packager);

        let split_downloader_io_controls = IoControls::default()
            .set_throughput_limiter_opt(self.params.merge_io_throughput_limiter_opt.clone())
            .set_component("split_downloader_merge");

        // The merge and split download share the same throughput limiter.
        // This is how cloning the `IoControls` works.
        let merge_executor_io_controls =
            split_downloader_io_controls.clone().set_component("merger");

        let merge_executor = MergeExecutor::new(
            self.params.pipeline_id.clone(),
            self.params.metastore.clone(),
            self.params.doc_mapper.clone(),
            merge_executor_io_controls,
            merge_packager_mailbox,
        );
        let (merge_executor_mailbox, merge_executor_handle) = ctx
            .spawn_actor()
            .set_kill_switch(self.kill_switch.clone())
            .set_backpressure_micros_counter(
                crate::metrics::INDEXER_METRICS
                    .backpressure_micros
                    .with_label_values(["merge_executor"]),
            )
            .spawn(merge_executor);

        let merge_split_downloader = MergeSplitDownloader {
            scratch_directory: self.params.indexing_directory.clone(),
            split_store: self.params.split_store.clone(),
            executor_mailbox: merge_executor_mailbox,
            io_controls: split_downloader_io_controls,
        };
        let (merge_split_downloader_mailbox, merge_split_downloader_handle) = ctx
            .spawn_actor()
            .set_kill_switch(self.kill_switch.clone())
            .set_backpressure_micros_counter(
                crate::metrics::INDEXER_METRICS
                    .backpressure_micros
                    .with_label_values(["merge_split_downloader"]),
            )
            .spawn(merge_split_downloader);

        // Merge planner
        let merge_planner = MergePlanner::new(
            &self.params.pipeline_id,
            immature_splits,
            self.params.merge_policy.clone(),
            merge_split_downloader_mailbox,
            self.params.merge_scheduler_service.clone(),
        );
        let (_, merge_planner_handle) = ctx
            .spawn_actor()
            .set_kill_switch(self.kill_switch.clone())
            .set_mailboxes(
                self.merge_planner_mailbox.clone(),
                self.merge_planner_inbox.clone(),
            )
            .spawn(merge_planner);

        self.previous_generations_statistics = self.statistics.clone();
        self.statistics.generation += 1;
        self.handles_opt = Some(MergePipelineHandles {
            merge_planner: merge_planner_handle,
            merge_split_downloader: merge_split_downloader_handle,
            merge_executor: merge_executor_handle,
            merge_packager: merge_packager_handle,
            merge_uploader: merge_uploader_handle,
            merge_publisher: merge_publisher_handle,
            next_check_for_progress: Instant::now() + *HEARTBEAT,
        });
        Ok(())
    }

    async fn terminate(&mut self) {
        self.kill_switch.kill();
        if let Some(handles) = self.handles_opt.take() {
            tokio::join!(
                handles.merge_planner.kill(),
                handles.merge_split_downloader.kill(),
                handles.merge_executor.kill(),
                handles.merge_packager.kill(),
                handles.merge_uploader.kill(),
                handles.merge_publisher.kill(),
            );
        }
    }

    async fn perform_observe(&mut self) {
        let Some(handles) = &self.handles_opt else {
            return;
        };
        handles.merge_planner.refresh_observe();
        handles.merge_uploader.refresh_observe();
        handles.merge_publisher.refresh_observe();
        let num_ongoing_merges = crate::metrics::INDEXER_METRICS
            .ongoing_merge_operations
            .get();
        self.statistics = self
            .previous_generations_statistics
            .clone()
            .add_actor_counters(
                &handles.merge_uploader.last_observation(),
                &handles.merge_publisher.last_observation(),
            )
            .set_generation(self.statistics.generation)
            .set_num_spawn_attempts(self.statistics.num_spawn_attempts)
            .set_ongoing_merges(usize::try_from(num_ongoing_merges).unwrap_or(0));
    }

    async fn perform_health_check(
        &mut self,
        ctx: &ActorContext<Self>,
    ) -> Result<(), ActorExitStatus> {
        let Some(handles) = self.handles_opt.as_mut() else {
            return Ok(());
        };
        // While we check if the actor has terminated or not, we do not check for progress
        // at every single loop. Instead, we wait for the `HEARTBEAT` duration to have elapsed,
        // since our last check.
        let check_for_progress = handles.should_check_for_progress();
        let health = self.healthcheck(check_for_progress);
        match health {
            Health::Healthy => {}
            Health::FailureOrUnhealthy => {
                self.terminate().await;
                ctx.schedule_self_msg(*quickwit_actors::HEARTBEAT, Spawn { retry_count: 0 });
            }
            Health::Success => {
                info!(index_uid=%self.params.pipeline_id.index_uid, "merge pipeline success, shutting down");
                return Err(ActorExitStatus::Success);
            }
        }
        Ok(())
    }

    async fn fetch_immature_splits(
        &mut self,
        ctx: &ActorContext<Self>,
    ) -> MetastoreResult<Vec<quickwit_metastore::SplitMetadata>> {
        // We consume the initial immature splits provided by the indexing service on the first
        // spawn.
        if let Some(immature_splits) = self.initial_immature_splits_opt.take() {
            return Ok(immature_splits);
        }
        // On subsequent spawns, we fetch the immature splits directly from the metastore.
        let index_uid = self.params.pipeline_id.index_uid.clone();
        let node_id = self.params.pipeline_id.node_id.clone();
        let list_splits_query = ListSplitsQuery::for_index(index_uid)
            .with_node_id(node_id)
            .with_split_state(SplitState::Published)
            .retain_immature(OffsetDateTime::now_utc());
        let list_splits_request =
            ListSplitsRequest::try_from_list_splits_query(&list_splits_query)?;
        let immature_splits_stream = ctx
            .protect_future(self.params.metastore.list_splits(list_splits_request))
            .await?;
        let immature_splits = ctx
            .protect_future(immature_splits_stream.collect_splits_metadata())
            .await?;
        info!(
            index_uid=%self.params.pipeline_id.index_uid,
            source_id=%self.params.pipeline_id.source_id,
            "fetched {} splits candidates for merge",
            immature_splits.len()
        );
        Ok(immature_splits)
    }
}

#[async_trait]
impl Handler<SuperviseLoop> for MergePipeline {
    type Reply = ();
    async fn handle(
        &mut self,
        supervise_loop_token: SuperviseLoop,
        ctx: &ActorContext<Self>,
    ) -> Result<(), ActorExitStatus> {
        self.perform_observe().await;
        self.perform_health_check(ctx).await?;
        ctx.schedule_self_msg(SUPERVISE_LOOP_INTERVAL, supervise_loop_token);
        Ok(())
    }
}

#[async_trait]
impl Handler<FinishPendingMergesAndShutdownPipeline> for MergePipeline {
    type Reply = ();
    async fn handle(
        &mut self,
        _: FinishPendingMergesAndShutdownPipeline,
        _ctx: &ActorContext<Self>,
    ) -> Result<(), ActorExitStatus> {
        info!(index_uid=%self.params.pipeline_id.index_uid, "shutdown merge pipeline initiated");
        // From now on, we will not respawn the pipeline if it fails.
        self.shutdown_initiated = true;
        if let Some(handles) = &self.handles_opt {
            // This disconnects the merge planner from the merge publisher,
            // breaking the merge planner pipeline loop.
            //
            // As a result, the pipeline will naturally terminate
            // once all of the pending / ongoing merge operations are completed.
            let _ = handles
                .merge_publisher
                .mailbox()
                .send_message(DisconnectMergePlanner)
                .await;

            // We also initiate the merge planner finalization routine.
            // Depending on the merge policy, it may emit a few more merge
            // operations.
            let _ = handles
                .merge_planner
                .mailbox()
                .send_message(RunFinalizeMergePolicyAndQuit)
                .await;
        } else {
            // we won't respawn the pipeline in the future, so there is nothing
            // to do here.
        }
        Ok(())
    }
}

#[async_trait]
impl Handler<Spawn> for MergePipeline {
    type Reply = ();

    async fn handle(
        &mut self,
        spawn: Spawn,
        ctx: &ActorContext<Self>,
    ) -> Result<(), ActorExitStatus> {
        if self.shutdown_initiated {
            return Ok(());
        }
        if self.handles_opt.is_some() {
            return Ok(());
        }
        self.previous_generations_statistics.num_spawn_attempts = 1 + spawn.retry_count;
        if let Err(spawn_error) = self.spawn_pipeline(ctx).await {
            if let Some(MetastoreError::NotFound { .. }) =
                spawn_error.downcast_ref::<MetastoreError>()
            {
                info!(error = ?spawn_error, "could not spawn pipeline, index might have been deleted");
                return Err(ActorExitStatus::Success);
            }
            let retry_delay = wait_duration_before_retry(spawn.retry_count);
            error!(error = ?spawn_error, retry_count = spawn.retry_count, retry_delay = ?retry_delay, "error while spawning indexing pipeline, retrying after some time");
            ctx.schedule_self_msg(
                retry_delay,
                Spawn {
                    retry_count: spawn.retry_count + 1,
                },
            );
        }
        Ok(())
    }
}

#[derive(Clone)]
pub struct MergePipelineParams {
    pub pipeline_id: MergePipelineId,
    pub doc_mapper: Arc<DocMapper>,
    pub indexing_directory: TempDirectory,
    pub metastore: MetastoreServiceClient,
    pub merge_scheduler_service: Mailbox<MergeSchedulerService>,
    pub split_store: IndexingSplitStore,
    pub merge_policy: Arc<dyn MergePolicy>,
    pub retention_policy: Option<RetentionPolicy>,
    pub max_concurrent_split_uploads: usize, //< TODO share with the indexing pipeline.
    pub merge_io_throughput_limiter_opt: Option<Limiter>,
    pub event_broker: EventBroker,
}

#[cfg(test)]
mod tests {
    use std::ops::Bound;
    use std::sync::Arc;

    use quickwit_actors::{ActorExitStatus, Universe};
    use quickwit_common::ServiceStream;
    use quickwit_common::temp_dir::TempDirectory;
    use quickwit_doc_mapper::default_doc_mapper_for_test;
    use quickwit_metastore::ListSplitsRequestExt;
    use quickwit_proto::indexing::MergePipelineId;
    use quickwit_proto::metastore::{MetastoreServiceClient, MockMetastoreService};
    use quickwit_proto::types::{IndexUid, NodeId};
    use quickwit_storage::RamStorage;

    use crate::IndexingSplitStore;
    use crate::actors::merge_pipeline::{MergePipeline, MergePipelineParams};
    use crate::actors::{MergePlanner, Publisher};
    use crate::merge_policy::default_merge_policy;

    #[tokio::test]
    async fn test_merge_pipeline_simple() -> anyhow::Result<()> {
        let node_id = NodeId::from("test-node");
        let index_uid = IndexUid::for_test("test-index", 0);
        let source_id = "test-source".to_string();
        let pipeline_id = MergePipelineId {
            index_uid: index_uid.clone(),
            source_id,
            node_id,
        };
        let mut mock_metastore = MockMetastoreService::new();
        mock_metastore
            .expect_list_splits()
            .times(1)
            .withf(move |list_splits_request| {
                let list_split_query = list_splits_request.deserialize_list_splits_query().unwrap();
                assert_eq!(list_split_query.index_uids, Some(vec![index_uid.clone()]));
                assert_eq!(
                    list_split_query.split_states,
                    vec![quickwit_metastore::SplitState::Published]
                );
                let Bound::Excluded(_) = list_split_query.mature else {
                    panic!("expected `Bound::Excluded`");
                };
                true
            })
            .returning(|_| Ok(ServiceStream::empty()));
        let universe = Universe::with_accelerated_time();
        let storage = Arc::new(RamStorage::default());
        let split_store = IndexingSplitStore::create_without_local_store_for_test(storage.clone());
        let pipeline_params = MergePipelineParams {
            pipeline_id,
            doc_mapper: Arc::new(default_doc_mapper_for_test()),
            indexing_directory: TempDirectory::for_test(),
            metastore: MetastoreServiceClient::from_mock(mock_metastore),
            merge_scheduler_service: universe.get_or_spawn_one(),
            split_store,
            merge_policy: default_merge_policy(),
            retention_policy: None,
            max_concurrent_split_uploads: 2,
            merge_io_throughput_limiter_opt: None,
            event_broker: Default::default(),
        };
        let pipeline = MergePipeline::new(pipeline_params, None, universe.spawn_ctx());
        let _merge_planner_mailbox = pipeline.merge_planner_mailbox().clone();
        let (pipeline_mailbox, pipeline_handle) = universe.spawn_builder().spawn(pipeline);
        pipeline_mailbox
            .ask(super::FinishPendingMergesAndShutdownPipeline)
            .await
            .unwrap();

        let (pipeline_exit_status, pipeline_statistics) = pipeline_handle.join().await;
        assert_eq!(pipeline_statistics.generation, 1);
        assert_eq!(pipeline_statistics.num_spawn_attempts, 1);
        assert_eq!(pipeline_statistics.num_published_splits, 0);
        assert!(matches!(pipeline_exit_status, ActorExitStatus::Success));

        // Checking that the merge pipeline actors have been properly cleaned up.
        assert!(universe.get_one::<MergePlanner>().is_none());
        assert!(universe.get_one::<Publisher>().is_none());
        assert!(universe.get_one::<MergePipeline>().is_none());

        universe.assert_quit().await;
        Ok(())
    }
}


================================================
FILE: quickwit/quickwit-indexing/src/actors/merge_planner.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::{HashMap, HashSet};
use std::sync::Arc;
use std::time::Instant;

use async_trait::async_trait;
use quickwit_actors::{Actor, ActorContext, ActorExitStatus, Handler, Mailbox, QueueCapacity};
use quickwit_metastore::{SplitMaturity, SplitMetadata};
use quickwit_proto::indexing::MergePipelineId;
use quickwit_proto::types::DocMappingUid;
use tantivy::Inventory;
use time::OffsetDateTime;
use tracing::{info, warn};

use super::MergeSchedulerService;
use crate::MergePolicy;
use crate::actors::MergeSplitDownloader;
use crate::actors::merge_scheduler_service::schedule_merge;
use crate::merge_policy::MergeOperation;
use crate::models::NewSplits;

#[derive(Debug)]
pub(crate) struct RunFinalizeMergePolicyAndQuit;

#[derive(Debug, Clone, PartialEq, Eq, Hash)]
struct MergePartition {
    partition_id: u64,
    doc_mapping_uid: DocMappingUid,
}

impl MergePartition {
    fn from_split_meta(split_meta: &SplitMetadata) -> MergePartition {
        MergePartition {
            partition_id: split_meta.partition_id,
            doc_mapping_uid: split_meta.doc_mapping_uid,
        }
    }
}

/// The merge planner decides when to start a merge task.
pub struct MergePlanner {
    /// A young split is a split that has not reached maturity
    /// yet and can be candidate to merge operations.
    partitioned_young_splits: HashMap<MergePartition, Vec<SplitMetadata>>,

    /// This set contains all of the split ids that we "acknowledged".
    /// The point of this set is to rapidly dismiss redundant `NewSplit` message.
    ///
    /// Complex scenarii that can result in the reemission of
    /// such messages are described in #3627.
    ///
    /// At any given point in time, the set must contains at least:
    /// - young splits (non-mature)
    /// - splits that are currently in merge.
    ///
    /// It also contain other splits, that have gone through a successful
    /// merge and have been deleted for instance.
    ///
    /// We incrementally build this set, by adding new splits to it.
    /// When it becomes too large, we entirely rebuild it.
    known_split_ids: HashSet<String>,
    known_split_ids_recompute_attempt_id: usize,

    merge_policy: Arc<dyn MergePolicy>,

    merge_split_downloader_mailbox: Mailbox<MergeSplitDownloader>,
    merge_scheduler_service: Mailbox<MergeSchedulerService>,

    /// Inventory of ongoing merge operations. If everything goes well,
    /// a merge operation is dropped after the publish of the merged split.
    ///
    /// It is used to GC the known_split_ids set.
    ongoing_merge_operations_inventory: Inventory<MergeOperation>,

    /// We use the actor start_time as a way to identify incarnations.
    ///
    /// Since we recycle the mailbox of the merge planner, this incarnation
    /// makes it possible to ignore messages that where emitted from the previous
    /// instantiation.
    incarnation_started_at: Instant,
}

#[async_trait]
impl Actor for MergePlanner {
    type ObservableState = ();

    fn observable_state(&self) -> Self::ObservableState {}

    fn name(&self) -> String {
        "MergePlanner".to_string()
    }

    fn queue_capacity(&self) -> QueueCapacity {
        MergePlanner::queue_capacity()
    }

    async fn initialize(&mut self, ctx: &ActorContext<Self>) -> Result<(), ActorExitStatus> {
        // We do not call the handle method directly and instead queue the message in order to drain
        // the recycled mailbox and get a consolidated vision of the set of published
        // splits, before scheduling any merge operation. See #3847 for more details.

        // If the mailbox is full, this send message might fail (the capacity is very low).
        // This is however not much of a problem: it probably contains a NewSplit message.
        // If it does not, we will be losing an opportunity to plan merge right away, but it will
        // happen on the next split publication.
        let _ = ctx.try_send_self_message(PlanMerge {
            incarnation_started_at: self.incarnation_started_at,
        });

        Ok(())
    }
}

#[async_trait]
impl Handler<RunFinalizeMergePolicyAndQuit> for MergePlanner {
    type Reply = ();

    async fn handle(
        &mut self,
        _plan_merge: RunFinalizeMergePolicyAndQuit,
        ctx: &ActorContext<Self>,
    ) -> Result<(), ActorExitStatus> {
        // Note we ignore messages that could be coming from a different incarnation.
        // (See comment on `Self::incarnation_start_at`.)
        self.send_merge_ops(true, ctx).await?;
        Err(ActorExitStatus::Success)
    }
}

#[async_trait]
impl Handler<PlanMerge> for MergePlanner {
    type Reply = ();

    async fn handle(
        &mut self,
        plan_merge: PlanMerge,
        ctx: &ActorContext<Self>,
    ) -> Result<(), ActorExitStatus> {
        if plan_merge.incarnation_started_at == self.incarnation_started_at {
            // Note we ignore messages that could be coming from a different incarnation.
            // (See comment on `Self::incarnation_start_at`.)
            self.send_merge_ops(false, ctx).await?;
        }
        self.recompute_known_splits_if_necessary();
        Ok(())
    }
}

#[async_trait]
impl Handler<NewSplits> for MergePlanner {
    type Reply = ();

    async fn handle(
        &mut self,
        new_splits: NewSplits,
        ctx: &ActorContext<Self>,
    ) -> Result<(), ActorExitStatus> {
        self.record_splits_if_necessary(new_splits.new_splits);
        self.send_merge_ops(false, ctx).await?;
        self.recompute_known_splits_if_necessary();
        Ok(())
    }
}

impl MergePlanner {
    pub fn queue_capacity() -> QueueCapacity {
        // We cannot have a Queue capacity of 0 here because `try_send_self`
        // would never succeed.
        QueueCapacity::Bounded(1)
    }

    pub fn new(
        pipeline_id: &MergePipelineId,
        immature_splits: Vec<SplitMetadata>,
        merge_policy: Arc<dyn MergePolicy>,
        merge_split_downloader_mailbox: Mailbox<MergeSplitDownloader>,
        merge_scheduler_service: Mailbox<MergeSchedulerService>,
    ) -> MergePlanner {
        let immature_splits: Vec<SplitMetadata> = immature_splits
            .into_iter()
            .filter(|split_metadata| belongs_to_pipeline(pipeline_id, split_metadata))
            .collect();
        let mut merge_planner = MergePlanner {
            known_split_ids: Default::default(),
            known_split_ids_recompute_attempt_id: 0,
            partitioned_young_splits: Default::default(),
            merge_policy,
            merge_split_downloader_mailbox,
            merge_scheduler_service,
            ongoing_merge_operations_inventory: Inventory::default(),

            incarnation_started_at: Instant::now(),
        };
        merge_planner.record_splits_if_necessary(immature_splits);
        merge_planner
    }

    fn rebuild_known_split_ids(&self) -> HashSet<String> {
        let mut known_split_ids: HashSet<String> = HashSet::default();
        // Add splits that in `partitioned_young_splits`.
        for young_split_partition in self.partitioned_young_splits.values() {
            for split in young_split_partition {
                known_split_ids.insert(split.split_id().to_string());
            }
        }
        let ongoing_merge_operations = self.ongoing_merge_operations_inventory.list();
        // Add splits that are known as in merge.
        for merge_op in ongoing_merge_operations {
            for split in &merge_op.splits {
                known_split_ids.insert(split.split_id().to_string());
            }
        }
        if known_split_ids.len() * 2 >= self.known_split_ids.len() {
            warn!(
                known_split_ids_len_after = known_split_ids.len(),
                known_split_ids_len_before = self.known_split_ids.len(),
                "Rebuilding the known split ids set ended up not halving its size. Please report. \
                 This is likely a bug, please report."
            );
        }
        known_split_ids
    }

    /// Updates `known_split_ids` and return true if the split was not
    /// previously known and should be recorded.
    fn acknownledge_split(&mut self, split_id: &str) -> bool {
        if self.known_split_ids.contains(split_id) {
            return false;
        }
        self.known_split_ids.insert(split_id.to_string());
        true
    }

    // No need to rebuild every time, we do once out of 100 times.
    fn recompute_known_splits_if_necessary(&mut self) {
        self.known_split_ids_recompute_attempt_id += 1;
        if self
            .known_split_ids_recompute_attempt_id
            .is_multiple_of(100)
        {
            self.known_split_ids = self.rebuild_known_split_ids();
            self.known_split_ids_recompute_attempt_id = 0;
        }
    }

    // Record a split. This function does NOT check if the split is mature or not, or if the split
    // is known or not.
    fn record_split(&mut self, new_split: SplitMetadata) {
        let splits_for_partition: &mut Vec<SplitMetadata> = self
            .partitioned_young_splits
            .entry(MergePartition::from_split_meta(&new_split))
            .or_default();
        splits_for_partition.push(new_split);
    }

    // Records a list of splits.
    //
    // Internally this function will detect and avoid adding the split
    // that are:
    // - already known
    // - mature
    // - do not belong to the current timeline.
    fn record_splits_if_necessary(&mut self, split_metadatas: Vec<SplitMetadata>) {
        for new_split in split_metadatas {
            if let SplitMaturity::Mature = self
                .merge_policy
                .split_maturity(new_split.num_docs, new_split.num_merge_ops)
            {
                // This can happen if the merge policy changed (e.g, decreased
                // split_num_docs_target).
                continue;
            }
            if new_split.is_mature(OffsetDateTime::now_utc()) {
                continue;
            }
            // Due to the recycling of the mailbox of the merge planner, it is possible for
            // a split already in store to be received.
            //
            // See `known_split_ids`.
            if !self.acknownledge_split(new_split.split_id()) {
                continue;
            }
            self.record_split(new_split);
        }
    }
    async fn compute_merge_ops(
        &mut self,
        is_finalize: bool,
        ctx: &ActorContext<Self>,
    ) -> Result<Vec<MergeOperation>, ActorExitStatus> {
        let mut merge_operations = Vec::new();
        for young_splits in self.partitioned_young_splits.values_mut() {
            if !young_splits.is_empty() {
                let operations = if is_finalize {
                    self.merge_policy.finalize_operations(young_splits)
                } else {
                    self.merge_policy.operations(young_splits)
                };
                merge_operations.extend(operations);
            }
            ctx.record_progress();
            ctx.yield_now().await;
        }
        self.partitioned_young_splits
            .retain(|_, splits| !splits.is_empty());
        // We recompute the number of young splits.
        Ok(merge_operations)
    }

    async fn send_merge_ops(
        &mut self,
        is_finalize: bool,
        ctx: &ActorContext<Self>,
    ) -> Result<(), ActorExitStatus> {
        // We identify all of the merge operations we want to run and leave it
        // to the merge scheduler to decide in which order these should be scheduled.
        //
        // The merge scheduler has the merit of knowing about merge operations from other
        // index as well.
        let merge_ops = self.compute_merge_ops(is_finalize, ctx).await?;
        for merge_operation in merge_ops {
            info!(merge_operation=?merge_operation, "schedule merge operation");
            let tracked_merge_operation = self
                .ongoing_merge_operations_inventory
                .track(merge_operation);
            schedule_merge(
                &self.merge_scheduler_service,
                tracked_merge_operation,
                self.merge_split_downloader_mailbox.clone(),
            )
            .await?
        }
        Ok(())
    }
}

/// We can only merge splits with the same (node_id, index_id, source_id).
fn belongs_to_pipeline(pipeline_id: &MergePipelineId, split: &SplitMetadata) -> bool {
    pipeline_id.node_id == split.node_id
        && pipeline_id.index_uid == split.index_uid
        && pipeline_id.source_id == split.source_id
}

#[derive(Debug)]
struct PlanMerge {
    incarnation_started_at: Instant,
}

#[cfg(test)]
mod tests {
    use std::sync::Arc;
    use std::time::Duration;

    use itertools::Itertools;
    use quickwit_actors::{ActorExitStatus, Command, QueueCapacity, Universe};
    use quickwit_config::IndexingSettings;
    use quickwit_config::merge_policy_config::{
        ConstWriteAmplificationMergePolicyConfig, MergePolicyConfig, StableLogMergePolicyConfig,
    };
    use quickwit_metastore::{SplitMaturity, SplitMetadata};
    use quickwit_proto::indexing::MergePipelineId;
    use quickwit_proto::types::{DocMappingUid, IndexUid, NodeId};
    use time::OffsetDateTime;

    use crate::actors::MergePlanner;
    use crate::merge_policy::{
        MergePolicy, MergeTask, StableLogMergePolicy, merge_policy_from_settings,
    };
    use crate::models::NewSplits;

    fn split_metadata_for_test(
        index_uid: &IndexUid,
        split_id: &str,
        partition_id: u64,
        doc_mapping_uid: DocMappingUid,
        num_docs: usize,
        num_merge_ops: usize,
    ) -> SplitMetadata {
        SplitMetadata {
            split_id: split_id.to_string(),
            index_uid: index_uid.clone(),
            source_id: "test-source".to_string(),
            node_id: "test-node".to_string(),
            num_docs,
            partition_id,
            num_merge_ops,
            create_timestamp: OffsetDateTime::now_utc().unix_timestamp(),
            maturity: SplitMaturity::Immature {
                maturation_period: Duration::from_secs(3600),
            },
            doc_mapping_uid,
            ..Default::default()
        }
    }

    #[tokio::test]
    async fn test_merge_planner_with_stable_custom_merge_policy() -> anyhow::Result<()> {
        let node_id = NodeId::from("test-node");
        let index_uid = IndexUid::new_with_random_ulid("test-index");
        let source_id = "test-source".to_string();
        let [doc_mapping_uid1, doc_mapping_uid2] = {
            let mut doc_mappings = [DocMappingUid::random(), DocMappingUid::random()];
            doc_mappings.sort();
            doc_mappings
        };
        let pipeline_id = MergePipelineId {
            node_id,
            index_uid: index_uid.clone(),
            source_id,
        };
        let merge_policy = Arc::new(StableLogMergePolicy::new(
            StableLogMergePolicyConfig {
                min_level_num_docs: 10_000,
                merge_factor: 3,
                max_merge_factor: 5,
                maturation_period: Duration::from_secs(3600),
            },
            50_000,
        ));
        let universe = Universe::with_accelerated_time();
        let (merge_split_downloader_mailbox, merge_split_downloader_inbox) =
            universe.create_test_mailbox();

        let merge_planner = MergePlanner::new(
            &pipeline_id,
            Vec::new(),
            merge_policy,
            merge_split_downloader_mailbox,
            universe.get_or_spawn_one(),
        );
        let (merge_planner_mailbox, merge_planner_handle) =
            universe.spawn_builder().spawn(merge_planner);
        {
            // send one split
            let message = NewSplits {
                new_splits: vec![
                    split_metadata_for_test(&index_uid, "1_1", 1, doc_mapping_uid1, 2500, 0),
                    split_metadata_for_test(&index_uid, "1v2_1", 1, doc_mapping_uid2, 2500, 0),
                    split_metadata_for_test(&index_uid, "1_2", 2, doc_mapping_uid1, 3000, 0),
                ],
            };
            merge_planner_mailbox.send_message(message).await?;
            let merge_ops = merge_split_downloader_inbox.drain_for_test();
            assert_eq!(merge_ops.len(), 0);
        }
        {
            // send two splits with a duplicate
            let message = NewSplits {
                new_splits: vec![
                    split_metadata_for_test(&index_uid, "2_1", 1, doc_mapping_uid1, 2000, 0),
                    split_metadata_for_test(&index_uid, "2v2_1", 1, doc_mapping_uid2, 2500, 0),
                    split_metadata_for_test(&index_uid, "1_2", 2, doc_mapping_uid1, 3000, 0),
                ],
            };
            merge_planner_mailbox.send_message(message).await?;
            let merge_ops = merge_split_downloader_inbox.drain_for_test();
            assert_eq!(merge_ops.len(), 0);
        }
        {
            // send four more splits to generate merge
            let message = NewSplits {
                new_splits: vec![
                    split_metadata_for_test(&index_uid, "3_1", 1, doc_mapping_uid1, 1500, 0),
                    split_metadata_for_test(&index_uid, "4_1", 1, doc_mapping_uid1, 1000, 0),
                    split_metadata_for_test(&index_uid, "3v2_1", 1, doc_mapping_uid2, 1500, 0),
                    split_metadata_for_test(&index_uid, "2_2", 2, doc_mapping_uid1, 2000, 0),
                    split_metadata_for_test(&index_uid, "3_2", 2, doc_mapping_uid1, 4000, 0),
                ],
            };
            merge_planner_mailbox.send_message(message).await?;
            merge_planner_handle.process_pending_and_observe().await;
            let operations = merge_split_downloader_inbox.drain_for_test_typed::<MergeTask>();
            assert_eq!(operations.len(), 3);
            let mut merge_operations = operations
                .into_iter()
                .sorted_by_key(|op| (op.splits[0].partition_id, op.splits[0].doc_mapping_uid));

            let first_merge_operation = merge_operations.next().unwrap();
            assert_eq!(first_merge_operation.splits.len(), 4);
            assert!(
                first_merge_operation
                    .splits
                    .iter()
                    .all(|split| split.partition_id == 1
                        && split.doc_mapping_uid == doc_mapping_uid1)
            );

            let second_merge_operation = merge_operations.next().unwrap();
            assert_eq!(second_merge_operation.splits.len(), 3);
            assert!(
                second_merge_operation
                    .splits
                    .iter()
                    .all(|split| split.partition_id == 1
                        && split.doc_mapping_uid == doc_mapping_uid2)
            );

            let third_merge_operation = merge_operations.next().unwrap();
            assert_eq!(third_merge_operation.splits.len(), 3);
            assert!(
                third_merge_operation
                    .splits
                    .iter()
                    .all(|split| split.partition_id == 2
                        && split.doc_mapping_uid == doc_mapping_uid1)
            );
        }
        universe.assert_quit().await;

        Ok(())
    }

    #[tokio::test]
    async fn test_merge_planner_spawns_merge_over_existing_splits_on_startup() -> anyhow::Result<()>
    {
        let node_id = NodeId::from("test-node");
        let index_uid = IndexUid::new_with_random_ulid("test-index");
        let source_id = "test-source".to_string();
        let doc_mapping_uid = DocMappingUid::random();
        let pipeline_id = MergePipelineId {
            node_id,
            index_uid: index_uid.clone(),
            source_id,
        };
        let universe = Universe::with_accelerated_time();
        let (merge_split_downloader_mailbox, merge_split_downloader_inbox) = universe
            .spawn_ctx()
            .create_mailbox("MergeSplitDownloader", QueueCapacity::Bounded(2));
        let merge_policy_config = ConstWriteAmplificationMergePolicyConfig {
            merge_factor: 2,
            max_merge_factor: 2,
            max_merge_ops: 3,
            ..Default::default()
        };
        let indexing_settings = IndexingSettings {
            merge_policy: MergePolicyConfig::ConstWriteAmplification(merge_policy_config),
            ..Default::default()
        };
        let immature_splits = vec![
            split_metadata_for_test(
                &index_uid,
                "a_small",
                0, // partition_id
                doc_mapping_uid,
                1_000_000,
                2,
            ),
            split_metadata_for_test(
                &index_uid,
                "b_small",
                0, // partition_id
                doc_mapping_uid,
                1_000_000,
                2,
            ),
        ];
        let merge_policy: Arc<dyn MergePolicy> = merge_policy_from_settings(&indexing_settings);
        let merge_planner = MergePlanner::new(
            &pipeline_id,
            immature_splits.clone(),
            merge_policy,
            merge_split_downloader_mailbox,
            universe.get_or_spawn_one(),
        );
        let (merge_planner_mailbox, merge_planner_handle) =
            universe.spawn_builder().spawn(merge_planner);

        // We wait for the first merge ops. If we sent the Quit message right away, it would have
        // been queue before first `PlanMerge` message.
        let merge_task_res = merge_split_downloader_inbox
            .recv_typed_message::<MergeTask>()
            .await;
        assert!(merge_task_res.is_ok());

        // We make sure that the known splits filtering set filters out splits are currently in
        // merge.
        merge_planner_mailbox
            .ask(NewSplits {
                new_splits: immature_splits,
            })
            .await?;

        let _ = merge_planner_handle.process_pending_and_observe().await;

        let merge_ops = merge_split_downloader_inbox.drain_for_test_typed::<MergeTask>();

        assert!(merge_ops.is_empty());

        merge_planner_mailbox.send_message(Command::Quit).await?;

        let (exit_status, _last_state) = merge_planner_handle.join().await;
        assert!(matches!(exit_status, ActorExitStatus::Quit));
        let merge_ops = merge_split_downloader_inbox.drain_for_test_typed::<MergeTask>();
        assert!(merge_ops.is_empty());
        universe.assert_quit().await;
        Ok(())
    }

    #[tokio::test]
    async fn test_merge_planner_dismiss_splits_from_different_pipeline_id() -> anyhow::Result<()> {
        let node_id = NodeId::from("test-node");
        let index_uid = IndexUid::new_with_random_ulid("test-index");
        let source_id = "test-source".to_string();
        let doc_mapping_uid = DocMappingUid::random();
        let pipeline_id = MergePipelineId {
            node_id,
            index_uid,
            source_id,
        };
        // This test makes sure that the merge planner ignores the splits that do not belong
        // to the same pipeline
        let universe = Universe::with_accelerated_time();
        let (merge_split_downloader_mailbox, merge_split_downloader_inbox) = universe
            .spawn_ctx()
            .create_mailbox("MergeSplitDownloader", QueueCapacity::Bounded(2));

        let merge_policy_config = ConstWriteAmplificationMergePolicyConfig {
            merge_factor: 2,
            max_merge_factor: 2,
            max_merge_ops: 3,
            ..Default::default()
        };
        let indexing_settings = IndexingSettings {
            merge_policy: MergePolicyConfig::ConstWriteAmplification(merge_policy_config),
            ..Default::default()
        };

        // It is different from the index_uid because the index uid has a unique suffix.
        let other_index_uid = IndexUid::new_with_random_ulid("test-index");

        let immature_splits = vec![
            split_metadata_for_test(
                &other_index_uid,
                "a_small",
                0, // partition_id
                doc_mapping_uid,
                1_000_000,
                2,
            ),
            split_metadata_for_test(
                &other_index_uid,
                "b_small",
                0, // partition_id
                doc_mapping_uid,
                1_000_000,
                2,
            ),
        ];
        let merge_policy: Arc<dyn MergePolicy> = merge_policy_from_settings(&indexing_settings);
        let merge_planner = MergePlanner::new(
            &pipeline_id,
            immature_splits.clone(),
            merge_policy,
            merge_split_downloader_mailbox,
            universe.get_or_spawn_one(),
        );
        let (merge_planner_mailbox, merge_planner_handle) =
            universe.spawn_builder().spawn(merge_planner);
        universe.sleep(Duration::from_secs(10)).await;
        merge_planner_mailbox.send_message(Command::Quit).await?;
        let (exit_status, _last_state) = merge_planner_handle.join().await;
        assert!(matches!(exit_status, ActorExitStatus::Quit));
        let merge_tasks = merge_split_downloader_inbox.drain_for_test_typed::<MergeTask>();

        assert!(merge_tasks.is_empty());
        universe.assert_quit().await;
        Ok(())
    }

    #[tokio::test]
    async fn test_merge_planner_inherit_mailbox_with_splits_bug_3847() -> anyhow::Result<()> {
        let node_id = NodeId::from("test-node");
        let index_uid = IndexUid::new_with_random_ulid("test-index");
        let source_id = "test-source".to_string();
        let doc_mapping_uid = DocMappingUid::random();
        let pipeline_id = MergePipelineId {
            node_id,
            index_uid: index_uid.clone(),
            source_id,
        };
        let universe = Universe::with_accelerated_time();
        let (merge_split_downloader_mailbox, merge_split_downloader_inbox) = universe
            .spawn_ctx()
            .create_mailbox("MergeSplitDownloader", QueueCapacity::Bounded(2));

        let merge_policy_config = ConstWriteAmplificationMergePolicyConfig {
            merge_factor: 2,
            max_merge_factor: 2,
            max_merge_ops: 3,
            ..Default::default()
        };
        let indexing_settings = IndexingSettings {
            merge_policy: MergePolicyConfig::ConstWriteAmplification(merge_policy_config),
            ..Default::default()
        };
        let immature_splits = vec![
            split_metadata_for_test(
                &index_uid,
                "a_small",
                0, // partition_id
                doc_mapping_uid,
                1_000_000,
                2,
            ),
            split_metadata_for_test(
                &index_uid,
                "b_small",
                0, // partition_id
                doc_mapping_uid,
                1_000_000,
                2,
            ),
        ];
        let merge_policy: Arc<dyn MergePolicy> = merge_policy_from_settings(&indexing_settings);
        let merge_planner = MergePlanner::new(
            &pipeline_id,
            immature_splits.clone(),
            merge_policy,
            merge_split_downloader_mailbox,
            universe.get_or_spawn_one(),
        );
        // We create a fake old mailbox that contains two new splits and a PlanMerge message from an
        // old incarnation. This could happen in real life if the merge pipeline failed
        // right after a `PlanMerge` was pushed to the pipeline. Note that #3847 did not
        // even require the `PlanMerge` to be in the pipeline
        let (merge_planner_mailbox, merge_planner_inbox) =
            universe.create_test_mailbox::<MergePlanner>();

        // We spawn our merge planner with this recycled mailbox.
        let (merge_planner_mailbox, merge_planner_handle) = universe
            .spawn_builder()
            .set_mailboxes(merge_planner_mailbox, merge_planner_inbox)
            .spawn(merge_planner);

        // The low capacity of the queue of the merge planner prevents us from sending a Command in
        // the low priority queue. It would take the single slot and prevent the message
        // sent in the initialize method.

        // Instead, we wait for the first merge ops.
        let merge_task_res = merge_split_downloader_inbox
            .recv_typed_message::<MergeTask>()
            .await;
        assert!(merge_task_res.is_ok());

        // At this point, our merge has been initialized.
        merge_planner_mailbox.send_message(Command::Quit).await?;
        let (exit_status, _last_state) = merge_planner_handle.join().await;

        assert!(matches!(exit_status, ActorExitStatus::Quit));
        let merge_tasks = merge_split_downloader_inbox.drain_for_test_typed::<MergeTask>();
        assert!(merge_tasks.is_empty());

        universe.assert_quit().await;
        Ok(())
    }
}


================================================
FILE: quickwit/quickwit-indexing/src/actors/merge_scheduler_service.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::cmp::Reverse;
use std::collections::BinaryHeap;
use std::collections::binary_heap::PeekMut;
use std::sync::Arc;

use anyhow::Context;
use async_trait::async_trait;
use quickwit_actors::{Actor, ActorContext, ActorExitStatus, Handler, Mailbox};
use tantivy::TrackedObject;
use tokio::sync::{OwnedSemaphorePermit, Semaphore};
use tracing::error;

use super::MergeSplitDownloader;
use crate::merge_policy::{MergeOperation, MergeTask};

pub struct MergePermit {
    _semaphore_permit: Option<OwnedSemaphorePermit>,
    merge_scheduler_mailbox: Option<Mailbox<MergeSchedulerService>>,
}

impl MergePermit {
    #[cfg(any(test, feature = "testsuite"))]
    pub fn for_test() -> MergePermit {
        MergePermit {
            _semaphore_permit: None,
            merge_scheduler_mailbox: None,
        }
    }
}

impl Drop for MergePermit {
    fn drop(&mut self) {
        let Some(merge_scheduler_mailbox) = self.merge_scheduler_mailbox.take() else {
            return;
        };
        if merge_scheduler_mailbox
            .send_message_with_high_priority(PermitReleased)
            .is_err()
        {
            error!("merge scheduler service is dead");
        }
    }
}

pub async fn schedule_merge(
    merge_scheduler_service: &Mailbox<MergeSchedulerService>,
    merge_operation: TrackedObject<MergeOperation>,
    merge_split_downloader_mailbox: Mailbox<MergeSplitDownloader>,
) -> anyhow::Result<()> {
    let schedule_merge = ScheduleMerge::new(merge_operation, merge_split_downloader_mailbox);
    // TODO add backpressure.
    merge_scheduler_service
        .ask(schedule_merge)
        .await
        .context("failed to acquire permit")?;
    Ok(())
}

struct ScheduledMerge {
    score: u64,
    id: u64, //< just for total ordering.
    merge_operation: TrackedObject<MergeOperation>,
    split_downloader_mailbox: Mailbox<MergeSplitDownloader>,
}

impl ScheduledMerge {
    fn order_key(&self) -> (u64, Reverse<u64>) {
        (self.score, std::cmp::Reverse(self.id))
    }
}

impl Eq for ScheduledMerge {}

impl PartialEq for ScheduledMerge {
    fn eq(&self, other: &Self) -> bool {
        self.cmp(other).is_eq()
    }
}

impl PartialOrd for ScheduledMerge {
    fn partial_cmp(&self, other: &Self) -> Option<std::cmp::Ordering> {
        Some(self.cmp(other))
    }
}

impl Ord for ScheduledMerge {
    fn cmp(&self, other: &Self) -> std::cmp::Ordering {
        self.order_key().cmp(&other.order_key())
    }
}

/// The merge scheduler service is in charge of keeping track of all scheduled merge operations,
/// and schedule them in the best possible order, respecting the `merge_concurrency` limit.
///
/// This actor is not supervised and should stay as simple as possible.
/// In particular,
/// - the `ScheduleMerge` handler should reply in microseconds.
/// - the task should never be dropped before reaching its `split_downloader_mailbox` destination as
///   it would break the consistency of `MergePlanner` with the metastore (ie: several splits will
///   never be merged).
pub struct MergeSchedulerService {
    merge_semaphore: Arc<Semaphore>,
    merge_concurrency: usize,
    pending_merge_queue: BinaryHeap<ScheduledMerge>,
    next_merge_id: u64,
    pending_merge_bytes: u64,
}

impl Default for MergeSchedulerService {
    fn default() -> MergeSchedulerService {
        MergeSchedulerService::new(3)
    }
}

impl MergeSchedulerService {
    pub fn new(merge_concurrency: usize) -> MergeSchedulerService {
        let merge_semaphore = Arc::new(Semaphore::new(merge_concurrency));
        MergeSchedulerService {
            merge_semaphore,
            merge_concurrency,
            pending_merge_queue: BinaryHeap::default(),
            next_merge_id: 0,
            pending_merge_bytes: 0,
        }
    }

    fn schedule_pending_merges(&mut self, ctx: &ActorContext<Self>) {
        // We schedule as many pending merges as we can,
        // until there are no permits available or merges to schedule.
        loop {
            let merge_semaphore = self.merge_semaphore.clone();
            let Some(next_merge) = self.pending_merge_queue.peek_mut() else {
                // No merge to schedule.
                break;
            };
            let Ok(semaphore_permit) = Semaphore::try_acquire_owned(merge_semaphore) else {
                // No permit available right away.
                break;
            };
            let merge_permit = MergePermit {
                _semaphore_permit: Some(semaphore_permit),
                merge_scheduler_mailbox: Some(ctx.mailbox().clone()),
            };
            let ScheduledMerge {
                merge_operation,
                split_downloader_mailbox,
                ..
            } = PeekMut::pop(next_merge);
            let merge_task = MergeTask {
                merge_operation,
                _merge_permit: merge_permit,
            };
            self.pending_merge_bytes -= merge_task.merge_operation.total_num_bytes();
            crate::metrics::INDEXER_METRICS
                .pending_merge_operations
                .set(self.pending_merge_queue.len() as i64);
            crate::metrics::INDEXER_METRICS
                .pending_merge_bytes
                .set(self.pending_merge_bytes as i64);
            match split_downloader_mailbox.try_send_message(merge_task) {
                Ok(_) => {}
                Err(quickwit_actors::TrySendError::Full(_)) => {
                    // The split downloader mailbox has an unbounded queue capacity,
                    error!("split downloader queue is full: please report");
                }
                Err(quickwit_actors::TrySendError::Disconnected) => {
                    // It means the split downloader is dead.
                    // This is fine, the merge pipeline has probably been restarted.
                }
            }
        }
        let num_merges =
            self.merge_concurrency as i64 - self.merge_semaphore.available_permits() as i64;
        crate::metrics::INDEXER_METRICS
            .ongoing_merge_operations
            .set(num_merges);
    }
}

#[async_trait]
impl Actor for MergeSchedulerService {
    type ObservableState = ();

    fn observable_state(&self) {}

    async fn initialize(&mut self, _ctx: &ActorContext<Self>) -> Result<(), ActorExitStatus> {
        Ok(())
    }
}

#[derive(Debug)]
struct ScheduleMerge {
    score: u64,
    merge_operation: TrackedObject<MergeOperation>,
    split_downloader_mailbox: Mailbox<MergeSplitDownloader>,
}

/// The higher, the sooner we will execute the merge operation.
/// A good merge operation
/// - strongly reduces the number splits
/// - is light.
fn score_merge_operation(merge_operation: &MergeOperation) -> u64 {
    let total_num_bytes: u64 = merge_operation.total_num_bytes();
    if total_num_bytes == 0 {
        // Silly corner case that should never happen.
        return u64::MAX;
    }
    // We will remove splits.len() and add 1 merge splits.
    let delta_num_splits = (merge_operation.splits.len() - 1) as u64;
    // We use integer arithmetic to avoid `f64 are not ordered` silliness.
    (delta_num_splits << 48)
        .checked_div(total_num_bytes)
        .unwrap_or(1u64)
}

impl ScheduleMerge {
    pub fn new(
        merge_operation: TrackedObject<MergeOperation>,
        split_downloader_mailbox: Mailbox<MergeSplitDownloader>,
    ) -> ScheduleMerge {
        let score = score_merge_operation(&merge_operation);
        ScheduleMerge {
            score,
            merge_operation,
            split_downloader_mailbox,
        }
    }
}

#[async_trait]
impl Handler<ScheduleMerge> for MergeSchedulerService {
    type Reply = ();

    async fn handle(
        &mut self,
        schedule_merge: ScheduleMerge,
        ctx: &ActorContext<Self>,
    ) -> Result<(), ActorExitStatus> {
        let ScheduleMerge {
            score,
            merge_operation,
            split_downloader_mailbox,
        } = schedule_merge;
        let merge_id = self.next_merge_id;
        self.next_merge_id += 1;
        let scheduled_merge = ScheduledMerge {
            score,
            id: merge_id,
            merge_operation,
            split_downloader_mailbox,
        };
        self.pending_merge_bytes += scheduled_merge.merge_operation.total_num_bytes();
        self.pending_merge_queue.push(scheduled_merge);
        crate::metrics::INDEXER_METRICS
            .pending_merge_operations
            .set(self.pending_merge_queue.len() as i64);
        crate::metrics::INDEXER_METRICS
            .pending_merge_bytes
            .set(self.pending_merge_bytes as i64);
        self.schedule_pending_merges(ctx);
        Ok(())
    }
}

#[derive(Debug)]
struct PermitReleased;

#[async_trait]
impl Handler<PermitReleased> for MergeSchedulerService {
    type Reply = ();

    async fn handle(
        &mut self,
        _: PermitReleased,
        ctx: &ActorContext<Self>,
    ) -> Result<(), ActorExitStatus> {
        self.schedule_pending_merges(ctx);
        Ok(())
    }
}

#[cfg(test)]
mod tests {
    use std::time::Duration;

    use quickwit_actors::Universe;
    use quickwit_metastore::SplitMetadata;
    use tantivy::Inventory;
    use tokio::time::timeout;

    use super::*;
    use crate::merge_policy::{MergeOperation, MergeTask};

    fn build_merge_operation(num_splits: usize, num_bytes_per_split: u64) -> MergeOperation {
        let splits: Vec<SplitMetadata> = std::iter::repeat_with(|| SplitMetadata {
            footer_offsets: num_bytes_per_split..num_bytes_per_split,
            ..Default::default()
        })
        .take(num_splits)
        .collect();
        MergeOperation::new_merge_operation(splits)
    }

    #[test]
    fn test_score_merge_operation() {
        let score_merge_operation_aux = |num_splits, num_bytes_per_split| {
            let merge_operation = build_merge_operation(num_splits, num_bytes_per_split);
            score_merge_operation(&merge_operation)
        };
        assert!(score_merge_operation_aux(10, 10_000_000) < score_merge_operation_aux(10, 999_999));
        assert!(
            score_merge_operation_aux(10, 10_000_000) > score_merge_operation_aux(9, 10_000_000)
        );
        assert_eq!(
            // 9 - 1 = 8 splits removed.
            score_merge_operation_aux(9, 10_000_000),
            // 5 - 1  = 4 splits removed.
            score_merge_operation_aux(5, 10_000_000 * 9 / 10)
        );
    }

    #[tokio::test]
    async fn test_merge_schedule_service_prioritize() {
        let universe = Universe::new();
        let (merge_scheduler_service, _) = universe
            .spawn_builder()
            .spawn(MergeSchedulerService::new(2));
        let inventory = Inventory::new();

        let (merge_split_downloader_mailbox, merge_split_downloader_inbox) =
            universe.create_test_mailbox();
        {
            let large_merge_operation = build_merge_operation(10, 4_000_000);
            let tracked_large_merge_operation = inventory.track(large_merge_operation);
            schedule_merge(
                &merge_scheduler_service,
                tracked_large_merge_operation,
                merge_split_downloader_mailbox.clone(),
            )
            .await
            .unwrap();
        }
        {
            let large_merge_operation2 = build_merge_operation(10, 3_000_000);
            let tracked_large_merge_operation2 = inventory.track(large_merge_operation2);
            schedule_merge(
                &merge_scheduler_service,
                tracked_large_merge_operation2,
                merge_split_downloader_mailbox.clone(),
            )
            .await
            .unwrap();
        }
        {
            let large_merge_operation2 = build_merge_operation(10, 5_000_000);
            let tracked_large_merge_operation2 = inventory.track(large_merge_operation2);
            schedule_merge(
                &merge_scheduler_service,
                tracked_large_merge_operation2,
                merge_split_downloader_mailbox.clone(),
            )
            .await
            .unwrap();
        }
        {
            let large_merge_operation2 = build_merge_operation(10, 2_000_000);
            let tracked_large_merge_operation2 = inventory.track(large_merge_operation2);
            schedule_merge(
                &merge_scheduler_service,
                tracked_large_merge_operation2,
                merge_split_downloader_mailbox.clone(),
            )
            .await
            .unwrap();
        }
        {
            let large_merge_operation2 = build_merge_operation(10, 1_000_000);
            let tracked_large_merge_operation2 = inventory.track(large_merge_operation2);
            schedule_merge(
                &merge_scheduler_service,
                tracked_large_merge_operation2,
                merge_split_downloader_mailbox.clone(),
            )
            .await
            .unwrap();
        }
        {
            let merge_task: MergeTask = merge_split_downloader_inbox
                .recv_typed_message::<MergeTask>()
                .await
                .unwrap();
            assert_eq!(
                merge_task.merge_operation.splits[0].footer_offsets.end,
                4_000_000
            );
            let merge_task2: MergeTask = merge_split_downloader_inbox
                .recv_typed_message::<MergeTask>()
                .await
                .unwrap();
            assert_eq!(
                merge_task2.merge_operation.splits[0].footer_offsets.end,
                3_000_000
            );
            assert!(
                timeout(
                    Duration::from_millis(200),
                    merge_split_downloader_inbox.recv_typed_message::<MergeTask>()
                )
                .await
                .is_err()
            );
        }
        {
            let merge_task: MergeTask = merge_split_downloader_inbox
                .recv_typed_message::<MergeTask>()
                .await
                .unwrap();
            assert_eq!(
                merge_task.merge_operation.splits[0].footer_offsets.end,
                1_000_000
            );
        }
        {
            let merge_task: MergeTask = merge_split_downloader_inbox
                .recv_typed_message::<MergeTask>()
                .await
                .unwrap();
            assert_eq!(
                merge_task.merge_operation.splits[0].footer_offsets.end,
                2_000_000
            );
        }
        {
            let merge_task: MergeTask = merge_split_downloader_inbox
                .recv_typed_message::<MergeTask>()
                .await
                .unwrap();
            assert_eq!(
                merge_task.merge_operation.splits[0].footer_offsets.end,
                5_000_000
            );
        }
        universe.assert_quit().await;
    }
}


================================================
FILE: quickwit/quickwit-indexing/src/actors/merge_split_downloader.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::path::Path;

use async_trait::async_trait;
use quickwit_actors::{Actor, ActorContext, ActorExitStatus, Handler, Mailbox, QueueCapacity};
use quickwit_common::io::IoControls;
use quickwit_common::temp_dir::{self, TempDirectory};
use quickwit_metastore::SplitMetadata;
use tantivy::Directory;
use tracing::{debug, info, instrument};

use super::MergeExecutor;
use crate::merge_policy::MergeTask;
use crate::models::MergeScratch;
use crate::split_store::IndexingSplitStore;

#[derive(Clone)]
pub struct MergeSplitDownloader {
    pub scratch_directory: TempDirectory,
    pub split_store: IndexingSplitStore,
    pub executor_mailbox: Mailbox<MergeExecutor>,
    pub io_controls: IoControls,
}

impl Actor for MergeSplitDownloader {
    type ObservableState = ();
    fn observable_state(&self) -> Self::ObservableState {}

    fn queue_capacity(&self) -> QueueCapacity {
        QueueCapacity::Unbounded
    }

    fn name(&self) -> String {
        "MergeSplitDownloader".to_string()
    }
}

#[async_trait]
impl Handler<MergeTask> for MergeSplitDownloader {
    type Reply = ();

    #[instrument(
        name = "merge_split_downloader",
        parent = merge_task.merge_parent_span.id(),
        skip_all,
    )]
    async fn handle(
        &mut self,
        merge_task: MergeTask,
        ctx: &ActorContext<Self>,
    ) -> Result<(), quickwit_actors::ActorExitStatus> {
        let merge_scratch_directory = temp_dir::Builder::default()
            .join("merge")
            .tempdir_in(self.scratch_directory.path())
            .map_err(|error| anyhow::anyhow!(error))?;
        info!(dir=%merge_scratch_directory.path().display(), "download-merge-splits");
        let downloaded_splits_directory = temp_dir::Builder::default()
            .join("downloaded-splits")
            .tempdir_in(merge_scratch_directory.path())
            .map_err(|error| anyhow::anyhow!(error))?;
        let tantivy_dirs = self
            .download_splits(
                merge_task.splits_as_slice(),
                downloaded_splits_directory.path(),
                ctx,
            )
            .await?;
        let msg = MergeScratch {
            merge_task,
            merge_scratch_directory,
            downloaded_splits_directory,
            tantivy_dirs,
        };
        ctx.send_message(&self.executor_mailbox, msg).await?;
        Ok(())
    }
}

impl MergeSplitDownloader {
    async fn download_splits(
        &self,
        splits: &[SplitMetadata],
        download_directory: &Path,
        ctx: &ActorContext<Self>,
    ) -> Result<Vec<Box<dyn Directory>>, quickwit_actors::ActorExitStatus> {
        // we download all of the split files in the scratch directory.
        let mut tantivy_dirs = Vec::new();
        for split in splits {
            if ctx.kill_switch().is_dead() {
                debug!(
                    split_id = split.split_id(),
                    "Kill switch was activated. Cancelling download."
                );
                return Err(ActorExitStatus::Killed);
            }
            let io_controls = self
                .io_controls
                .clone()
                .set_progress(ctx.progress().clone())
                .set_kill_switch(ctx.kill_switch().clone());
            let _protect_guard = ctx.protect_zone();
            let tantivy_dir = self
                .split_store
                .fetch_and_open_split(split.split_id(), download_directory, &io_controls)
                .await
                .map_err(|error| {
                    let split_id = split.split_id();
                    anyhow::anyhow!(error).context(format!("failed to download split `{split_id}`"))
                })?;
            tantivy_dirs.push(tantivy_dir);
        }
        Ok(tantivy_dirs)
    }
}

#[cfg(test)]
mod tests {
    use std::iter;
    use std::sync::Arc;

    use quickwit_actors::Universe;
    use quickwit_common::split_file;
    use quickwit_storage::{PutPayload, RamStorageBuilder, SplitPayloadBuilder};

    use super::*;
    use crate::merge_policy::MergeOperation;
    use crate::new_split_id;

    #[tokio::test]
    async fn test_merge_split_downloader() -> anyhow::Result<()> {
        let scratch_directory = TempDirectory::for_test();
        let splits_to_merge: Vec<SplitMetadata> = iter::repeat_with(|| {
            let split_id = new_split_id();
            SplitMetadata {
                split_id,
                ..Default::default()
            }
        })
        .take(10)
        .collect();

        let split_store = {
            let mut storage_builder = RamStorageBuilder::default();
            for split in &splits_to_merge {
                let buffer = SplitPayloadBuilder::get_split_payload(&[], &[], &[1, 2, 3])?
                    .read_all()
                    .await?;
                storage_builder = storage_builder.put(&split_file(split.split_id()), &buffer);
            }
            let ram_storage = storage_builder.build();
            IndexingSplitStore::create_without_local_store_for_test(Arc::new(ram_storage))
        };

        let universe = Universe::with_accelerated_time();
        let (merge_executor_mailbox, merge_executor_inbox) = universe.create_test_mailbox();
        let merge_split_downloader = MergeSplitDownloader {
            scratch_directory,
            split_store,
            executor_mailbox: merge_executor_mailbox,
            io_controls: IoControls::default(),
        };
        let (merge_split_downloader_mailbox, merge_split_downloader_handler) =
            universe.spawn_builder().spawn(merge_split_downloader);
        let merge_operation: MergeOperation = MergeOperation::new_merge_operation(splits_to_merge);
        let merge_task = MergeTask::from_merge_operation_for_test(merge_operation);
        merge_split_downloader_mailbox
            .send_message(merge_task)
            .await?;
        merge_split_downloader_handler
            .process_pending_and_observe()
            .await;
        let merge_scratches = merge_executor_inbox.drain_for_test();
        assert_eq!(merge_scratches.len(), 1);
        let merge_scratch = merge_scratches
            .into_iter()
            .next()
            .unwrap()
            .downcast::<MergeScratch>()
            .unwrap();
        assert_eq!(merge_scratch.merge_task.splits_as_slice().len(), 10);
        for split in merge_scratch.merge_task.splits_as_slice() {
            let split_filename = split_file(split.split_id());
            let split_filepath = merge_scratch
                .downloaded_splits_directory
                .path()
                .join(split_filename);
            assert!(split_filepath.try_exists().unwrap());
        }
        universe.assert_quit().await;
        Ok(())
    }
}


================================================
FILE: quickwit/quickwit-indexing/src/actors/mod.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

mod cooperative_indexing;
mod doc_processor;
mod index_serializer;
mod indexer;
mod indexing_pipeline;
mod indexing_service;
mod merge_executor;
mod merge_pipeline;
mod merge_planner;
mod merge_scheduler_service;
mod merge_split_downloader;
mod packager;
mod publisher;
mod sequencer;
mod uploader;
#[cfg(feature = "vrl")]
mod vrl_processing;

pub use doc_processor::{DocProcessor, DocProcessorCounters};
pub use index_serializer::IndexSerializer;
pub use indexer::{Indexer, IndexerCounters};
pub use indexing_pipeline::{IndexingPipeline, IndexingPipelineParams};
pub use indexing_service::{INDEXING_DIR_NAME, IndexingService, IndexingServiceCounters};
pub use merge_executor::{MergeExecutor, combine_partition_ids, merge_split_attrs};
pub use merge_pipeline::{FinishPendingMergesAndShutdownPipeline, MergePipeline};
pub(crate) use merge_planner::{MergePlanner, RunFinalizeMergePolicyAndQuit};
pub use merge_scheduler_service::{MergePermit, MergeSchedulerService, schedule_merge};
pub use merge_split_downloader::MergeSplitDownloader;
pub use packager::Packager;
pub use publisher::{Publisher, PublisherCounters, PublisherType};
pub use quickwit_proto::indexing::IndexingError;
pub use sequencer::Sequencer;
pub use uploader::{SplitsUpdateMailbox, Uploader, UploaderCounters, UploaderType};


================================================
FILE: quickwit/quickwit-indexing/src/actors/packager.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::BTreeSet;
use std::io;
use std::path::{Path, PathBuf};
use std::sync::Arc;

use anyhow::{Context, bail};
use async_trait::async_trait;
use fail::fail_point;
use itertools::Itertools;
use quickwit_actors::{Actor, ActorContext, ActorExitStatus, Handler, Mailbox, QueueCapacity};
use quickwit_common::runtimes::RuntimeType;
use quickwit_common::temp_dir::TempDirectory;
use quickwit_directories::write_hotcache;
use quickwit_doc_mapper::NamedField;
use quickwit_doc_mapper::tag_pruning::append_to_tag_set;
use quickwit_proto::search::{
    ListFieldType, ListFields, ListFieldsEntryResponse, serialize_split_fields,
};
use tantivy::index::FieldMetadata;
use tantivy::schema::{FieldType, Type};
use tantivy::{InvertedIndexReader, ReloadPolicy, SegmentMeta};
use tokio::runtime::Handle;
use tracing::{debug, info, instrument, warn};

/// Maximum distinct values allowed for a tag field within a split.
const MAX_VALUES_PER_TAG_FIELD: usize = if cfg!(any(test, feature = "testsuite")) {
    6
} else {
    1000
};

use crate::actors::Uploader;
use crate::models::{
    EmptySplit, IndexedSplit, IndexedSplitBatch, PackagedSplit, PackagedSplitBatch,
};

/// The role of the packager is to get an index writer and
/// produce a split file.
///
/// This includes the following steps:
/// - commit: this step is CPU heavy
/// - identifying the list of tags for the splits, and labelling it accordingly
/// - creating a bundle file
/// - computing the hotcache
/// - appending it to the split file.
///
/// The split format is described in `internals/split-format.md`
#[derive(Clone)]
pub struct Packager {
    actor_name: &'static str,
    uploader_mailbox: Mailbox<Uploader>,
    /// List of tag fields ([`Vec<NamedField>`]) defined in the index config.
    tag_fields: Vec<NamedField>,
}

impl Packager {
    pub fn new(
        actor_name: &'static str,
        tag_fields: Vec<NamedField>,
        uploader_mailbox: Mailbox<Uploader>,
    ) -> Packager {
        Packager {
            actor_name,
            uploader_mailbox,
            tag_fields,
        }
    }

    pub async fn process_indexed_split(
        &self,
        split: IndexedSplit,
        ctx: &ActorContext<Self>,
    ) -> anyhow::Result<PackagedSplit> {
        let segment_metas = split.index.searchable_segment_metas()?;
        assert_eq!(segment_metas.len(), 1);
        let packaged_split =
            create_packaged_split(&segment_metas[..], split, &self.tag_fields, ctx)?;
        Ok(packaged_split)
    }
}

#[async_trait]
impl Actor for Packager {
    type ObservableState = ();

    #[allow(clippy::unused_unit)]
    fn observable_state(&self) -> Self::ObservableState {
        ()
    }

    fn queue_capacity(&self) -> QueueCapacity {
        QueueCapacity::Bounded(1)
    }

    fn name(&self) -> String {
        self.actor_name.to_string()
    }

    fn runtime_handle(&self) -> Handle {
        RuntimeType::Blocking.get_runtime_handle()
    }
}

#[async_trait]
impl Handler<IndexedSplitBatch> for Packager {
    type Reply = ();

    #[instrument(level = "info", name = "packager", parent=batch.batch_parent_span.id(), skip_all)]
    async fn handle(
        &mut self,
        batch: IndexedSplitBatch,
        ctx: &ActorContext<Self>,
    ) -> Result<(), ActorExitStatus> {
        let split_ids: Vec<String> = batch
            .splits
            .iter()
            .map(|split| split.split_id().to_string())
            .collect_vec();
        debug!(
            split_ids=?split_ids,
            "start-packaging-splits"
        );
        fail_point!("packager:before");
        let mut packaged_splits = Vec::with_capacity(batch.splits.len());
        for split in batch.splits {
            if batch.publish_lock.is_dead() {
                // TODO: Remove the junk right away?
                info!(
                    split_ids=?split_ids,
                    "Splits' publish lock is dead."
                );
                return Ok(());
            }
            let packaged_split = self.process_indexed_split(split, ctx).await?;
            packaged_splits.push(packaged_split);
        }
        ctx.send_message(
            &self.uploader_mailbox,
            PackagedSplitBatch::new(
                packaged_splits,
                batch.checkpoint_delta_opt,
                batch.publish_lock,
                batch.publish_token_opt,
                batch.merge_task_opt,
                batch.batch_parent_span,
            ),
        )
        .await?;
        fail_point!("packager:after");
        Ok(())
    }
}

#[async_trait]
impl Handler<EmptySplit> for Packager {
    type Reply = ();

    #[instrument(
        name="package_empty_batch"
        parent=empty_split.batch_parent_span.id(),
        skip_all,
    )]
    async fn handle(
        &mut self,
        empty_split: EmptySplit,
        ctx: &ActorContext<Self>,
    ) -> Result<(), ActorExitStatus> {
        ctx.send_message(&self.uploader_mailbox, empty_split)
            .await?;
        Ok(())
    }
}

fn list_split_files(
    segment_metas: &[SegmentMeta],
    scratch_directory: &TempDirectory,
) -> io::Result<Vec<PathBuf>> {
    let mut index_files = vec![scratch_directory.path().join("meta.json")];

    // list the segment files
    for segment_meta in segment_metas {
        for relative_path in segment_meta.list_files() {
            let filepath = scratch_directory.path().join(relative_path);
            if filepath.try_exists()? {
                // If the file is missing, this is fine.
                // segment_meta.list_files() may actually returns files that
                // may not exist.
                index_files.push(filepath);
            }
        }
    }
    index_files.sort();
    Ok(index_files)
}

fn build_hotcache<W: io::Write>(split_path: &Path, out: &mut W) -> anyhow::Result<()> {
    let mmap_directory = tantivy::directory::MmapDirectory::open(split_path)?;
    write_hotcache(mmap_directory, out)?;
    Ok(())
}

/// Attempts to exhaustively extract the list of terms in a
/// field term dictionary.
///
/// returns None if:
/// - the number of terms exceed MAX_VALUES_PER_TAG_FIELD
/// - some of the terms are not value utf8.
/// - an error occurs.
///
/// Returns None may hurt split pruning and affects performance,
/// but it does not affect Quickwit's result validity.
fn try_extract_terms(
    named_field: &NamedField,
    inv_indexes: &[Arc<InvertedIndexReader>],
    max_terms: usize,
) -> anyhow::Result<Vec<String>> {
    let num_terms = inv_indexes
        .iter()
        .map(|inv_index| inv_index.terms().num_terms())
        .sum::<usize>();
    if num_terms > max_terms {
        bail!(
            "number of unique terms for tag field {} > {}",
            named_field.name,
            max_terms
        );
    }
    let mut terms = Vec::with_capacity(num_terms);
    for inv_index in inv_indexes {
        let mut terms_streamer = inv_index.terms().stream()?;
        while let Some((term_data, _)) = terms_streamer.next() {
            let term = match named_field.field_type {
                FieldType::U64(_) => u64_from_term_data(term_data)?.to_string(),
                FieldType::I64(_) => {
                    tantivy::u64_to_i64(u64_from_term_data(term_data)?).to_string()
                }
                FieldType::F64(_) => {
                    tantivy::u64_to_f64(u64_from_term_data(term_data)?).to_string()
                }
                FieldType::Bool(_) => match u64_from_term_data(term_data)? {
                    0 => false,
                    1 => true,
                    _ => bail!("invalid boolean value"),
                }
                .to_string(),
                FieldType::Bytes(_) => {
                    bail!("tags collection is not allowed on `bytes` fields")
                }
                _ => std::str::from_utf8(term_data)?.to_string(),
            };
            terms.push(term);
        }
    }
    Ok(terms)
}

fn create_packaged_split(
    segment_metas: &[SegmentMeta],
    split: IndexedSplit,
    tag_fields: &[NamedField],
    ctx: &ActorContext<Packager>,
) -> anyhow::Result<PackagedSplit> {
    debug!(split_id = split.split_id(), "create-packaged-split");
    let split_files = list_split_files(segment_metas, &split.split_scratch_directory)?;

    // Extracts tag values from inverted indexes only when a field cardinality is less
    // than `MAX_VALUES_PER_TAG_FIELD`.
    debug!(split_id = split.split_id(), tag_fields =? tag_fields, "extract-tags-values");
    let index_reader = split
        .index
        .reader_builder()
        .reload_policy(ReloadPolicy::Manual)
        .try_into()?;

    let fields_metadata = split.index.fields_metadata()?;

    let mut tags = BTreeSet::default();
    for named_field in tag_fields {
        let inverted_indexes = index_reader
            .searcher()
            .segment_readers()
            .iter()
            .map(|segment| segment.inverted_index(named_field.field))
            .collect::<Result<Vec<_>, _>>()?;

        match try_extract_terms(named_field, &inverted_indexes, MAX_VALUES_PER_TAG_FIELD) {
            Ok(terms) => {
                append_to_tag_set(&named_field.name, &terms, &mut tags);
            }
            Err(tag_extraction_error) => {
                warn!(err=?tag_extraction_error,  "no field values will be registered in the split metadata");
            }
        }
    }

    ctx.record_progress();

    debug!(split_id = split.split_id(), "build-hotcache");
    let mut hotcache_bytes = Vec::new();
    build_hotcache(split.split_scratch_directory.path(), &mut hotcache_bytes)?;
    ctx.record_progress();

    let serialized_split_fields = serialize_field_metadata(&fields_metadata);

    let packaged_split = PackagedSplit {
        serialized_split_fields,
        split_attrs: split.split_attrs,
        split_scratch_directory: split.split_scratch_directory,
        tags,
        split_files,
        hotcache_bytes,
    };
    Ok(packaged_split)
}

/// Serializes the Split fields.
///
/// `fields_metadata` has to be sorted.
fn serialize_field_metadata(fields_metadata: &[FieldMetadata]) -> Vec<u8> {
    let fields = fields_metadata
        .iter()
        .map(field_metadata_to_list_field_serialized)
        .collect::<Vec<_>>();

    serialize_split_fields(ListFields { fields })
}

fn tantivy_type_to_list_field_type(typ: Type) -> ListFieldType {
    match typ {
        Type::Str => ListFieldType::Str,
        Type::U64 => ListFieldType::U64,
        Type::I64 => ListFieldType::I64,
        Type::F64 => ListFieldType::F64,
        Type::Bool => ListFieldType::Bool,
        Type::Date => ListFieldType::Date,
        Type::Facet => ListFieldType::Facet,
        Type::Bytes => ListFieldType::Bytes,
        Type::Json => ListFieldType::Json,
        Type::IpAddr => ListFieldType::IpAddr,
    }
}

fn field_metadata_to_list_field_serialized(
    field_metadata: &FieldMetadata,
) -> ListFieldsEntryResponse {
    ListFieldsEntryResponse {
        field_name: field_metadata.field_name.to_string(),
        field_type: tantivy_type_to_list_field_type(field_metadata.typ) as i32,
        searchable: field_metadata.is_indexed(),
        aggregatable: field_metadata.is_fast(),
        index_ids: Vec::new(),
        non_searchable_index_ids: Vec::new(),
        non_aggregatable_index_ids: Vec::new(),
    }
}

/// Reads u64 from stored term data.
fn u64_from_term_data(data: &[u8]) -> anyhow::Result<u64> {
    let u64_bytes: [u8; 8] = data[0..8]
        .try_into()
        .context("could not interpret term bytes as u64")?;
    Ok(u64::from_be_bytes(u64_bytes))
}

#[cfg(test)]
mod tests {
    use std::ops::RangeInclusive;

    use quickwit_actors::{ObservationType, Universe};
    use quickwit_metastore::checkpoint::IndexCheckpointDelta;
    use quickwit_proto::search::{ListFieldsEntryResponse, deserialize_split_fields};
    use quickwit_proto::types::{DocMappingUid, IndexUid, NodeId};
    use tantivy::directory::MmapDirectory;
    use tantivy::schema::{FAST, NumericOptions, STRING, Schema, TEXT, Type};
    use tantivy::{DateTime, IndexBuilder, IndexSettings, doc};
    use tracing::Span;

    use super::*;
    use crate::models::{PublishLock, SplitAttrs};

    #[test]
    fn serialize_field_metadata_test() {
        let fields_metadata = vec![
            FieldMetadata {
                field_name: "test".to_string(),
                typ: Type::Str,
                stored: true,
                fast_size: Some(10u64.into()),
                term_dictionary_size: Some(10u64.into()),
                postings_size: Some(10u64.into()),
                positions_size: Some(10u64.into()),
            },
            FieldMetadata {
                field_name: "test2".to_string(),
                typ: Type::Str,
                stored: false,
                fast_size: None,
                term_dictionary_size: Some(10u64.into()),
                postings_size: Some(10u64.into()),
                positions_size: Some(10u64.into()),
            },
            FieldMetadata {
                field_name: "test3".to_string(),
                typ: Type::U64,
                stored: false,
                fast_size: Some(10u64.into()),
                term_dictionary_size: Some(10u64.into()),
                postings_size: Some(10u64.into()),
                positions_size: Some(10u64.into()),
            },
        ];

        let out = serialize_field_metadata(&fields_metadata);

        let deserialized: Vec<ListFieldsEntryResponse> =
            deserialize_split_fields(&mut &out[..]).unwrap().fields;

        assert_eq!(fields_metadata.len(), deserialized.len());
        assert_eq!(deserialized[0].field_name, "test");
        assert_eq!(deserialized[0].field_type, ListFieldType::Str as i32);
        assert!(deserialized[0].searchable);
        assert!(deserialized[0].aggregatable);

        assert_eq!(deserialized[1].field_name, "test2");
        assert_eq!(deserialized[1].field_type, ListFieldType::Str as i32);
        assert!(deserialized[1].searchable);
        assert!(!deserialized[1].aggregatable);

        assert_eq!(deserialized[2].field_name, "test3");
        assert_eq!(deserialized[2].field_type, ListFieldType::U64 as i32);
        assert!(deserialized[2].searchable);
        assert!(deserialized[2].aggregatable);
    }

    fn make_indexed_split_for_test(
        segment_timestamps: &[DateTime],
    ) -> anyhow::Result<IndexedSplit> {
        let split_scratch_directory = TempDirectory::for_test();
        let mut schema_builder = Schema::builder();
        let text_field = schema_builder.add_text_field("text", TEXT);
        let timestamp_field = schema_builder.add_u64_field("timestamp", FAST);
        let tag_str = schema_builder.add_text_field("tag_str", STRING);
        let tag_many = schema_builder.add_text_field("tag_many", STRING);
        let tag_u64 =
            schema_builder.add_u64_field("tag_u64", NumericOptions::default().set_indexed());
        let tag_i64 =
            schema_builder.add_i64_field("tag_i64", NumericOptions::default().set_indexed());
        let tag_f64 =
            schema_builder.add_f64_field("tag_f64", NumericOptions::default().set_indexed());
        let tag_bool =
            schema_builder.add_bool_field("tag_bool", NumericOptions::default().set_indexed());
        let schema = schema_builder.build();
        let index_builder = IndexBuilder::new()
            .settings(IndexSettings::default())
            .schema(schema)
            .tokenizers(
                quickwit_query::create_default_quickwit_tokenizer_manager()
                    .tantivy_manager()
                    .clone(),
            )
            .fast_field_tokenizers(
                quickwit_query::get_quickwit_fastfield_normalizer_manager()
                    .tantivy_manager()
                    .clone(),
            );
        let index_directory = MmapDirectory::open(split_scratch_directory.path())?;
        let mut index_writer =
            index_builder.single_segment_index_writer(index_directory, 100_000_000)?;
        let mut timerange_opt: Option<RangeInclusive<DateTime>> = None;
        let mut num_docs = 0;
        for &timestamp in segment_timestamps {
            for num in 1..10 {
                let doc = doc!(
                    text_field => format!("timestamp is {timestamp:?}"),
                    timestamp_field => timestamp,
                    tag_str => "value",
                    tag_many => format!("many-{num}"),
                    tag_u64 => 42u64,
                    tag_i64 => -42i64,
                    tag_f64 => -42.02f64,
                    tag_bool => true,
                );
                index_writer.add_document(doc)?;
                num_docs += 1;
                timerange_opt = Some(
                    timerange_opt
                        .map(|timestamp_range| {
                            let start = timestamp.min(*timestamp_range.start());
                            let end = timestamp.max(*timestamp_range.end());
                            RangeInclusive::new(start, end)
                        })
                        .unwrap_or_else(|| RangeInclusive::new(timestamp, timestamp)),
                )
            }
        }
        let index = index_writer.finalize()?;

        let node_id = NodeId::from("test-node");
        let index_uid = IndexUid::new_with_random_ulid("test-index");
        let source_id = "test-source".to_string();

        // TODO: In the future we would like that kind of segment flush to emit a new split,
        // but this will require work on tantivy.
        let indexed_split = IndexedSplit {
            split_attrs: SplitAttrs {
                node_id,
                index_uid,
                source_id,
                doc_mapping_uid: DocMappingUid::default(),
                split_id: "test-split".to_string(),
                partition_id: 17u64,
                num_docs,
                uncompressed_docs_size_in_bytes: num_docs * 15,
                time_range: timerange_opt,
                replaced_split_ids: Vec::new(),
                delete_opstamp: 0,
                num_merge_ops: 0,
            },
            index,
            split_scratch_directory,
            controlled_directory_opt: None,
        };
        Ok(indexed_split)
    }

    fn get_tag_fields(schema: Schema, field_names: &[&str]) -> Vec<NamedField> {
        field_names
            .iter()
            .map(|field_name| {
                let field = schema.get_field(field_name).unwrap();
                let field_type = schema.get_field_entry(field).field_type().clone();
                NamedField {
                    name: field_name.to_string(),
                    field,
                    field_type,
                }
            })
            .collect()
    }

    #[tokio::test]
    async fn test_packager_simple() -> anyhow::Result<()> {
        quickwit_common::setup_logging_for_tests();
        let universe = Universe::with_accelerated_time();
        let (mailbox, inbox) = universe.create_test_mailbox();
        let indexed_split = make_indexed_split_for_test(&[
            DateTime::from_timestamp_secs(1628203589),
            DateTime::from_timestamp_secs(1628203640),
        ])?;
        let tag_fields = get_tag_fields(
            indexed_split.index.schema(),
            &[
                "tag_str", "tag_many", "tag_u64", "tag_i64", "tag_f64", "tag_bool",
            ],
        );
        let packager = Packager::new("TestPackager", tag_fields, mailbox);
        let (packager_mailbox, packager_handle) = universe.spawn_builder().spawn(packager);
        packager_mailbox
            .send_message(IndexedSplitBatch {
                splits: vec![indexed_split],
                checkpoint_delta_opt: IndexCheckpointDelta::for_test("source_id", 10..20).into(),
                publish_lock: PublishLock::default(),
                publish_token_opt: None,
                merge_task_opt: None,
                batch_parent_span: Span::none(),
            })
            .await?;
        assert_eq!(
            packager_handle.process_pending_and_observe().await.obs_type,
            ObservationType::Alive
        );
        let packaged_splits = inbox.drain_for_test();
        assert_eq!(packaged_splits.len(), 1);
        let packaged_split = packaged_splits[0]
            .downcast_ref::<PackagedSplitBatch>()
            .unwrap();
        let split = &packaged_split.splits[0];
        assert_eq!(
            &split.tags.iter().map(|s| s.as_str()).collect::<Vec<&str>>(),
            &[
                "tag_bool!",
                "tag_bool:true",
                "tag_f64!",
                "tag_f64:-42.02",
                "tag_i64!",
                "tag_i64:-42",
                "tag_str!",
                "tag_str:value",
                "tag_u64!",
                "tag_u64:42"
            ]
        );
        assert_eq!(
            split.split_attrs.time_range,
            Some(
                DateTime::from_timestamp_secs(1628203589)
                    ..=DateTime::from_timestamp_secs(1628203640)
            )
        );
        universe.assert_quit().await;
        Ok(())
    }
}


================================================
FILE: quickwit/quickwit-indexing/src/actors/publisher.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use anyhow::Context;
use async_trait::async_trait;
use fail::fail_point;
use quickwit_actors::{Actor, ActorContext, Handler, Mailbox, QueueCapacity};
use quickwit_proto::metastore::{MetastoreService, MetastoreServiceClient, PublishSplitsRequest};
use serde::Serialize;
use tracing::{info, instrument, warn};

use crate::actors::MergePlanner;
use crate::models::{NewSplits, SplitsUpdate};
use crate::source::{SourceActor, SuggestTruncate};

#[derive(Clone, Debug, Default, Serialize)]
pub struct PublisherCounters {
    pub num_published_splits: u64,
    pub num_replace_operations: u64,
    pub num_empty_splits: u64,
}

#[derive(Clone, Copy, Debug)]
pub enum PublisherType {
    MainPublisher,
    MergePublisher,
}

impl PublisherType {
    pub fn actor_name(&self) -> &'static str {
        match self {
            PublisherType::MainPublisher => "Publisher",
            PublisherType::MergePublisher => "MergePublisher",
        }
    }
}

/// Disconnect the merge planner loop back.
/// This message is used to cut the merge pipeline loop, and let it terminate.
#[derive(Debug)]
pub(crate) struct DisconnectMergePlanner;

#[derive(Clone)]
pub struct Publisher {
    publisher_type: PublisherType,
    metastore: MetastoreServiceClient,
    merge_planner_mailbox_opt: Option<Mailbox<MergePlanner>>,
    source_mailbox_opt: Option<Mailbox<SourceActor>>,
    counters: PublisherCounters,
}

impl Publisher {
    pub fn new(
        publisher_type: PublisherType,
        metastore: MetastoreServiceClient,
        merge_planner_mailbox_opt: Option<Mailbox<MergePlanner>>,
        source_mailbox_opt: Option<Mailbox<SourceActor>>,
    ) -> Publisher {
        Publisher {
            publisher_type,
            metastore,
            merge_planner_mailbox_opt,
            source_mailbox_opt,
            counters: PublisherCounters::default(),
        }
    }
}

#[async_trait]
impl Actor for Publisher {
    type ObservableState = PublisherCounters;

    fn observable_state(&self) -> Self::ObservableState {
        self.counters.clone()
    }

    fn name(&self) -> String {
        self.publisher_type.actor_name().to_string()
    }

    fn queue_capacity(&self) -> QueueCapacity {
        match self.publisher_type {
            PublisherType::MainPublisher => QueueCapacity::Bounded(1),
            PublisherType::MergePublisher => QueueCapacity::Unbounded,
        }
    }
}

#[async_trait]
impl Handler<DisconnectMergePlanner> for Publisher {
    type Reply = ();

    async fn handle(
        &mut self,
        _: DisconnectMergePlanner,
        _ctx: &ActorContext<Self>,
    ) -> Result<(), quickwit_actors::ActorExitStatus> {
        info!("disconnecting merge planner mailbox");
        self.merge_planner_mailbox_opt = None;
        Ok(())
    }
}

#[async_trait]
impl Handler<SplitsUpdate> for Publisher {
    type Reply = ();

    #[instrument(name="publisher", parent=split_update.parent_span.id(),  skip(self, ctx))]
    async fn handle(
        &mut self,
        split_update: SplitsUpdate,
        ctx: &ActorContext<Self>,
    ) -> Result<(), quickwit_actors::ActorExitStatus> {
        fail_point!("publisher:before");

        let SplitsUpdate {
            index_uid,
            new_splits,
            replaced_split_ids,
            checkpoint_delta_opt,
            publish_lock,
            publish_token_opt,
            ..
        } = split_update;

        let index_checkpoint_delta_json_opt = checkpoint_delta_opt
            .as_ref()
            .map(serde_json::to_string)
            .transpose()
            .context("failed to serialize `IndexCheckpointDelta`")?;
        let split_ids: Vec<String> = new_splits
            .iter()
            .map(|split| split.split_id.clone())
            .collect();
        if let Some(_guard) = publish_lock.acquire().await {
            let publish_splits_request = PublishSplitsRequest {
                index_uid: Some(index_uid),
                staged_split_ids: split_ids.clone(),
                replaced_split_ids: replaced_split_ids.clone(),
                index_checkpoint_delta_json_opt,
                publish_token_opt: publish_token_opt.clone(),
            };
            ctx.protect_future(self.metastore.publish_splits(publish_splits_request))
                .await
                .context("failed to publish splits")?;
        } else {
            // TODO: Remove the junk right away?
            info!(
                split_ids=?split_ids,
                "Splits' publish lock is dead."
            );
            return Ok(());
        }
        info!("publish-new-splits");
        if let Some(source_mailbox) = self.source_mailbox_opt.as_ref()
            && let Some(checkpoint) = checkpoint_delta_opt
        {
            // We voluntarily do not log anything here.
            //
            // Not being to send the truncation message is a common event and should not be
            // considered an error. For instance, if the source is a
            // FileSource, it will terminate upon EOF and drop its
            // mailbox.
            let suggest_truncate_res = ctx
                .send_message(
                    source_mailbox,
                    SuggestTruncate(checkpoint.source_delta.get_source_checkpoint()),
                )
                .await;
            if let Err(send_truncate_err) = suggest_truncate_res {
                warn!(error=?send_truncate_err, "failed to send truncate message from publisher to source");
            }
        }

        if !new_splits.is_empty() {
            // The merge planner is not necessarily awake and this is not an error.
            // For instance, when a source reaches its end, and the last "new" split
            // has been packaged, the packager finalizer sends a message to the merge
            // planner in order to stop it.
            if let Some(merge_planner_mailbox) = self.merge_planner_mailbox_opt.as_ref() {
                let _ = ctx
                    .send_message(merge_planner_mailbox, NewSplits { new_splits })
                    .await;
            }

            if replaced_split_ids.is_empty() {
                self.counters.num_published_splits += 1;
            } else {
                self.counters.num_replace_operations += 1;
            }
        } else {
            self.counters.num_empty_splits += 1;
        }
        fail_point!("publisher:after");
        Ok(())
    }
}

#[cfg(test)]
mod tests {
    use quickwit_actors::Universe;
    use quickwit_metastore::checkpoint::{
        IndexCheckpointDelta, PartitionId, SourceCheckpoint, SourceCheckpointDelta,
    };
    use quickwit_metastore::{PublishSplitsRequestExt, SplitMetadata};
    use quickwit_proto::metastore::{EmptyResponse, MockMetastoreService};
    use quickwit_proto::types::{IndexUid, Position};
    use tracing::Span;

    use super::*;
    use crate::models::PublishLock;

    #[tokio::test]
    async fn test_publisher_publish_operation() {
        let universe = Universe::with_accelerated_time();
        let ref_index_uid: IndexUid = IndexUid::for_test("index", 1);
        let mut mock_metastore = MockMetastoreService::new();
        let ref_index_uid_clone = ref_index_uid.clone();
        mock_metastore
            .expect_publish_splits()
            .withf(move |publish_splits_request| {
                let checkpoint_delta: IndexCheckpointDelta = publish_splits_request
                    .deserialize_index_checkpoint()
                    .unwrap()
                    .unwrap();
                publish_splits_request.index_uid() == &ref_index_uid_clone
                    && checkpoint_delta.source_id == "source"
                    && publish_splits_request.staged_split_ids[..] == ["split"]
                    && publish_splits_request.replaced_split_ids.is_empty()
                    && checkpoint_delta.source_delta == SourceCheckpointDelta::from_range(1..3)
            })
            .times(1)
            .returning(|_| Ok(EmptyResponse {}));
        let (merge_planner_mailbox, merge_planner_inbox) = universe.create_test_mailbox();

        let (source_mailbox, source_inbox) = universe.create_test_mailbox();

        let publisher = Publisher::new(
            PublisherType::MainPublisher,
            MetastoreServiceClient::from_mock(mock_metastore),
            Some(merge_planner_mailbox),
            Some(source_mailbox),
        );
        let (publisher_mailbox, publisher_handle) = universe.spawn_builder().spawn(publisher);

        assert!(
            publisher_mailbox
                .send_message(SplitsUpdate {
                    index_uid: ref_index_uid.clone(),
                    new_splits: vec![SplitMetadata {
                        split_id: "split".to_string(),
                        ..Default::default()
                    }],
                    replaced_split_ids: Vec::new(),
                    checkpoint_delta_opt: Some(IndexCheckpointDelta {
                        source_id: "source".to_string(),
                        source_delta: SourceCheckpointDelta::from_range(1..3),
                    }),
                    publish_lock: PublishLock::default(),
                    publish_token_opt: None,
                    merge_task: None,
                    parent_span: tracing::Span::none(),
                })
                .await
                .is_ok()
        );

        let publisher_observation = publisher_handle.process_pending_and_observe().await.state;
        assert_eq!(publisher_observation.num_published_splits, 1);

        let suggest_truncate_checkpoints: Vec<SourceCheckpoint> = source_inbox
            .drain_for_test_typed::<SuggestTruncate>()
            .into_iter()
            .map(|msg| msg.0)
            .collect();

        assert_eq!(suggest_truncate_checkpoints.len(), 1);
        assert_eq!(
            suggest_truncate_checkpoints[0]
                .position_for_partition(&PartitionId::default())
                .unwrap(),
            &Position::offset(2u64)
        );

        let merger_msgs: Vec<NewSplits> = merge_planner_inbox.drain_for_test_typed::<NewSplits>();
        assert_eq!(merger_msgs.len(), 1);
        assert_eq!(merger_msgs[0].new_splits.len(), 1);
        universe.assert_quit().await;
    }

    #[tokio::test]
    async fn test_publisher_publish_operation_with_empty_splits() {
        let universe = Universe::with_accelerated_time();
        let ref_index_uid: IndexUid = IndexUid::for_test("index", 1);
        let mut mock_metastore = MockMetastoreService::new();
        let ref_index_uid_clone = ref_index_uid.clone();
        mock_metastore
            .expect_publish_splits()
            .withf(move |publish_splits_request| {
                let checkpoint_delta: IndexCheckpointDelta = publish_splits_request
                    .deserialize_index_checkpoint()
                    .unwrap()
                    .unwrap();
                publish_splits_request.index_uid() == &ref_index_uid_clone
                    && checkpoint_delta.source_id == "source"
                    && publish_splits_request.staged_split_ids.is_empty()
                    && publish_splits_request.replaced_split_ids.is_empty()
                    && checkpoint_delta.source_delta == SourceCheckpointDelta::from_range(1..3)
            })
            .times(1)
            .returning(|_| Ok(EmptyResponse {}));
        let (merge_planner_mailbox, merge_planner_inbox) = universe.create_test_mailbox();

        let (source_mailbox, source_inbox) = universe.create_test_mailbox();

        let publisher = Publisher::new(
            PublisherType::MainPublisher,
            MetastoreServiceClient::from_mock(mock_metastore),
            Some(merge_planner_mailbox),
            Some(source_mailbox),
        );
        let (publisher_mailbox, publisher_handle) = universe.spawn_builder().spawn(publisher);

        assert!(
            publisher_mailbox
                .send_message(SplitsUpdate {
                    index_uid: ref_index_uid.clone(),
                    new_splits: Vec::new(),
                    replaced_split_ids: Vec::new(),
                    checkpoint_delta_opt: Some(IndexCheckpointDelta {
                        source_id: "source".to_string(),
                        source_delta: SourceCheckpointDelta::from_range(1..3),
                    }),
                    publish_lock: PublishLock::default(),
                    publish_token_opt: None,
                    merge_task: None,
                    parent_span: tracing::Span::none(),
                })
                .await
                .is_ok()
        );

        let publisher_observation = publisher_handle.process_pending_and_observe().await.state;
        assert_eq!(publisher_observation.num_published_splits, 0);
        assert_eq!(publisher_observation.num_replace_operations, 0);
        assert_eq!(publisher_observation.num_empty_splits, 1);

        let suggest_truncate_checkpoints: Vec<SourceCheckpoint> = source_inbox
            .drain_for_test_typed::<SuggestTruncate>()
            .into_iter()
            .map(|msg| msg.0)
            .collect();

        assert_eq!(suggest_truncate_checkpoints.len(), 1);
        assert_eq!(
            suggest_truncate_checkpoints[0]
                .position_for_partition(&PartitionId::default())
                .unwrap(),
            &Position::offset(2u64)
        );

        let merger_msgs: Vec<NewSplits> = merge_planner_inbox.drain_for_test_typed::<NewSplits>();
        assert_eq!(merger_msgs.len(), 0);
        universe.assert_quit().await;
    }

    #[tokio::test]
    async fn test_publisher_replace_operation() {
        let universe = Universe::with_accelerated_time();
        let mut mock_metastore = MockMetastoreService::new();
        let ref_index_uid: IndexUid = IndexUid::for_test("index", 1);
        let ref_index_uid_clone = ref_index_uid.clone();
        mock_metastore
            .expect_publish_splits()
            .withf(move |publish_splits_requests| {
                publish_splits_requests.index_uid() == &ref_index_uid_clone
                    && publish_splits_requests.staged_split_ids[..] == ["split3"]
                    && publish_splits_requests.replaced_split_ids[..] == ["split1", "split2"]
                    && publish_splits_requests
                        .index_checkpoint_delta_json_opt()
                        .is_empty()
            })
            .times(1)
            .returning(|_| Ok(EmptyResponse {}));
        let (merge_planner_mailbox, merge_planner_inbox) = universe.create_test_mailbox();
        let publisher = Publisher::new(
            PublisherType::MainPublisher,
            MetastoreServiceClient::from_mock(mock_metastore),
            Some(merge_planner_mailbox),
            None,
        );
        let (publisher_mailbox, publisher_handle) = universe.spawn_builder().spawn(publisher);
        let publisher_message = SplitsUpdate {
            index_uid: ref_index_uid.clone(),
            new_splits: vec![SplitMetadata {
                split_id: "split3".to_string(),
                ..Default::default()
            }],
            replaced_split_ids: vec!["split1".to_string(), "split2".to_string()],
            checkpoint_delta_opt: None,
            publish_lock: PublishLock::default(),
            publish_token_opt: None,
            merge_task: None,
            parent_span: Span::none(),
        };
        assert!(
            publisher_mailbox
                .send_message(publisher_message)
                .await
                .is_ok()
        );
        let publisher_observation = publisher_handle.process_pending_and_observe().await.state;
        assert_eq!(publisher_observation.num_published_splits, 0);
        assert_eq!(publisher_observation.num_replace_operations, 1);
        let merge_planner_msgs = merge_planner_inbox.drain_for_test_typed::<NewSplits>();
        assert_eq!(merge_planner_msgs.len(), 1);
        assert_eq!(merge_planner_msgs[0].new_splits.len(), 1);
        universe.assert_quit().await;
    }

    #[tokio::test]
    async fn publisher_acquires_publish_lock() {
        let universe = Universe::with_accelerated_time();
        let mut mock_metastore = MockMetastoreService::new();
        mock_metastore.expect_publish_splits().never();
        let (merge_planner_mailbox, merge_planner_inbox) = universe.create_test_mailbox();

        let publisher = Publisher::new(
            PublisherType::MainPublisher,
            MetastoreServiceClient::from_mock(mock_metastore),
            Some(merge_planner_mailbox),
            None,
        );
        let (publisher_mailbox, publisher_handle) = universe.spawn_builder().spawn(publisher);

        let publish_lock = PublishLock::default();
        publish_lock.kill().await;

        publisher_mailbox
            .send_message(SplitsUpdate {
                index_uid: IndexUid::new_with_random_ulid("index"),
                new_splits: vec![SplitMetadata::for_test("test-split".to_string())],
                replaced_split_ids: Vec::new(),
                checkpoint_delta_opt: None,
                publish_lock,
                publish_token_opt: None,
                merge_task: None,
                parent_span: Span::none(),
            })
            .await
            .unwrap();

        let publisher_observation = publisher_handle.process_pending_and_observe().await.state;
        assert_eq!(publisher_observation.num_published_splits, 0);

        let merger_messages = merge_planner_inbox.drain_for_test();
        assert!(merger_messages.is_empty());
        universe.assert_quit().await;
    }
}


================================================
FILE: quickwit/quickwit-indexing/src/actors/sequencer.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::fmt::Debug;

use anyhow::Context;
use async_trait::async_trait;
use quickwit_actors::{Actor, ActorContext, ActorExitStatus, Handler, Mailbox, QueueCapacity};
use tokio::sync::oneshot;

/// The sequencer serves as a proxy to another actor,
/// delivering message in a specific order.
///
/// Producers of message first "reserve" a position in the
/// queue of message by sending `oneshot::Receiver<Message>` to the `Sequencer`.
///
/// The Sequencer then simply resolves these messages and forwards them to the
/// targeted actor.
///
/// It is used by the uploader actor, to run uploads concurrently and yet
/// ensures that publish message are send in the right order.
pub struct Sequencer<A: Actor> {
    mailbox: Mailbox<A>,
}

impl<A: Actor> Sequencer<A> {
    pub fn new(mailbox: Mailbox<A>) -> Self {
        Sequencer { mailbox }
    }
}

#[async_trait]
impl<A: Actor> Actor for Sequencer<A> {
    type ObservableState = ();

    fn queue_capacity(&self) -> QueueCapacity {
        QueueCapacity::Bounded(2)
    }

    fn observable_state(&self) {}
}

#[derive(Debug)]
pub enum SequencerCommand<T: Debug> {
    /// Discard position in the sequence.
    Discard,
    /// Proceed with the enclosed value.
    Proceed(T),
}

#[async_trait]
impl<A, M> Handler<oneshot::Receiver<SequencerCommand<M>>> for Sequencer<A>
where
    A: Actor,
    A: Handler<M>,
    M: Send + Sync + 'static + std::fmt::Debug,
{
    type Reply = ();

    async fn handle(
        &mut self,
        message: oneshot::Receiver<SequencerCommand<M>>,
        ctx: &ActorContext<Self>,
    ) -> Result<(), ActorExitStatus> {
        let command = ctx
            .protect_future(message)
            .await
            .context("failed to receive command from uploader")?;
        if let SequencerCommand::Proceed(msg) = command {
            ctx.send_message(&self.mailbox, msg)
                .await
                .context("failed to send message to publisher")?;
        }
        Ok(())
    }
}

#[cfg(test)]
mod tests {
    use quickwit_actors::Universe;

    use super::*;

    #[derive(Default)]
    struct SequencerTestActor {
        messages: Vec<usize>,
    }

    impl Actor for SequencerTestActor {
        type ObservableState = Vec<usize>;

        fn observable_state(&self) -> Self::ObservableState {
            self.messages.clone()
        }
    }

    #[async_trait]
    impl Handler<usize> for SequencerTestActor {
        type Reply = ();

        async fn handle(
            &mut self,
            message: usize,
            _ctx: &ActorContext<Self>,
        ) -> Result<(), ActorExitStatus> {
            self.messages.push(message);
            Ok(())
        }
    }

    #[tokio::test]
    async fn test_sequencer() {
        let universe = Universe::with_accelerated_time();
        let test_actor = SequencerTestActor::default();
        let (test_mailbox, test_handle) = universe.spawn_builder().spawn(test_actor);
        let sequencer = Sequencer::new(test_mailbox);
        let (sequencer_mailbox, sequencer_handle) = universe.spawn_builder().spawn(sequencer);
        // The sequencer has a capacity of 2.
        // This is the maximum we can do without provoking a deadlock.
        let (fut_tx_1, fut_rx_1) = oneshot::channel();
        let (fut_tx_2, fut_rx_2) = oneshot::channel();
        let (fut_tx_3, fut_rx_3) = oneshot::channel();
        sequencer_mailbox.send_message(fut_rx_1).await.unwrap();
        sequencer_mailbox.send_message(fut_rx_2).await.unwrap();
        fut_tx_3.send(SequencerCommand::<usize>::Discard).unwrap();
        sequencer_mailbox.send_message(fut_rx_3).await.unwrap();
        fut_tx_2.send(SequencerCommand::Proceed(2)).unwrap();
        fut_tx_1.send(SequencerCommand::Proceed(1)).unwrap();
        std::mem::drop(sequencer_mailbox);
        let (exit_status, last_state) = test_handle.join().await;
        assert!(matches!(exit_status, ActorExitStatus::Success));
        assert_eq!(&last_state, &[1, 2]);
        let (sequencer_exit_status, _) = sequencer_handle.join().await;
        assert!(matches!(sequencer_exit_status, ActorExitStatus::Success));
    }
}


================================================
FILE: quickwit/quickwit-indexing/src/actors/uploader.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::HashSet;
use std::iter::FromIterator;
use std::mem;
use std::sync::Arc;
use std::sync::atomic::{AtomicU64, Ordering};

use anyhow::{Context, bail};
use async_trait::async_trait;
use fail::fail_point;
use itertools::Itertools;
use once_cell::sync::OnceCell;
use quickwit_actors::{Actor, ActorContext, ActorExitStatus, Handler, Mailbox, QueueCapacity};
use quickwit_common::pubsub::EventBroker;
use quickwit_common::spawn_named_task;
use quickwit_config::RetentionPolicy;
use quickwit_metastore::checkpoint::IndexCheckpointDelta;
use quickwit_metastore::{SplitMetadata, StageSplitsRequestExt};
use quickwit_proto::metastore::{MetastoreService, MetastoreServiceClient, StageSplitsRequest};
use quickwit_proto::search::{ReportSplit, ReportSplitsRequest};
use quickwit_proto::types::{IndexUid, PublishToken};
use quickwit_storage::SplitPayloadBuilder;
use serde::Serialize;
use tokio::sync::oneshot::Sender;
use tokio::sync::{Semaphore, SemaphorePermit, oneshot};
use tracing::{Instrument, Span, debug, info, instrument, warn};

use crate::actors::Publisher;
use crate::actors::sequencer::{Sequencer, SequencerCommand};
use crate::merge_policy::{MergePolicy, MergeTask};
use crate::metrics::INDEXER_METRICS;
use crate::models::{
    EmptySplit, PackagedSplit, PackagedSplitBatch, PublishLock, SplitsUpdate, create_split_metadata,
};
use crate::split_store::IndexingSplitStore;

/// The following two semaphores ensures that, we have at most `max_concurrent_split_uploads` split
/// uploads can happen at the same time, as configured in the `IndexerConfig`.
///
/// This "budget" is actually split into two semaphores: one for the indexing pipeline and the merge
/// pipeline. The idea is that the merge pipeline is by nature a bit irregular, and we don't want it
/// to stall the indexing pipeline, decreasing its throughput.
static CONCURRENT_UPLOAD_PERMITS_INDEX: OnceCell<Semaphore> = OnceCell::new();
static CONCURRENT_UPLOAD_PERMITS_MERGE: OnceCell<Semaphore> = OnceCell::new();

#[derive(Clone, Copy, Debug)]
pub enum UploaderType {
    IndexUploader,
    MergeUploader,
    DeleteUploader,
}

/// [`SplitsUpdateMailbox`] wraps either a [`Mailbox<Sequencer>`] or [`Mailbox<Publisher>`].
///
/// It makes it possible to send a [`SplitsUpdate`] either to the [`Sequencer`] or directly
/// to [`Publisher`]. It is used in combination with `SplitsUpdateSender` that will do the send.
///
/// This is useful as we have different requirements between the indexing pipeline and
/// the merge/delete task pipelines.
/// 1. In the indexing pipeline, we want to publish splits in the same order as they are produced by
///    the indexer/packager to ensure we are publishing splits without "holes" in checkpoints. We
///    thus send [`SplitsUpdate`] to the [`Sequencer`] to keep the right ordering.
/// 2. In the merge pipeline and the delete task pipeline, we are merging splits and in in this
///    case, publishing order does not matter. In this case, we can just send [`SplitsUpdate`]
///    directly to the [`Publisher`].
#[derive(Clone, Debug)]
pub enum SplitsUpdateMailbox {
    Sequencer(Mailbox<Sequencer<Publisher>>),
    Publisher(Mailbox<Publisher>),
}

impl From<Mailbox<Publisher>> for SplitsUpdateMailbox {
    fn from(publisher_mailbox: Mailbox<Publisher>) -> Self {
        SplitsUpdateMailbox::Publisher(publisher_mailbox)
    }
}

impl From<Mailbox<Sequencer<Publisher>>> for SplitsUpdateMailbox {
    fn from(publisher_sequencer_mailbox: Mailbox<Sequencer<Publisher>>) -> Self {
        SplitsUpdateMailbox::Sequencer(publisher_sequencer_mailbox)
    }
}

impl SplitsUpdateMailbox {
    async fn get_split_update_sender(
        &self,
        ctx: &ActorContext<Uploader>,
    ) -> anyhow::Result<SplitsUpdateSender> {
        match self {
            SplitsUpdateMailbox::Sequencer(sequencer_mailbox) => {
                // We send the future to the sequencer right away.
                // The sequencer will then resolve the future in their arrival order and ensure that
                // the publisher publishes splits in order.
                let (split_uploaded_tx, split_uploaded_rx) =
                    oneshot::channel::<SequencerCommand<SplitsUpdate>>();
                ctx.send_message(sequencer_mailbox, split_uploaded_rx)
                    .await?;
                Ok(SplitsUpdateSender::Sequencer(split_uploaded_tx))
            }
            SplitsUpdateMailbox::Publisher(publisher_mailbox) => {
                // We just need the publisher mailbox to send the split in this case.
                Ok(SplitsUpdateSender::Publisher(publisher_mailbox.clone()))
            }
        }
    }
}

enum SplitsUpdateSender {
    Sequencer(Sender<SequencerCommand<SplitsUpdate>>),
    Publisher(Mailbox<Publisher>),
}

impl SplitsUpdateSender {
    fn discard(self) -> anyhow::Result<()> {
        if let SplitsUpdateSender::Sequencer(split_uploader_tx) = self
            && split_uploader_tx.send(SequencerCommand::Discard).is_err()
        {
            bail!("failed to send cancel command to sequencer. the sequencer is probably dead");
        }
        Ok(())
    }

    async fn send(
        self,
        split_update: SplitsUpdate,
        ctx: &ActorContext<Uploader>,
    ) -> anyhow::Result<()> {
        match self {
            SplitsUpdateSender::Sequencer(split_uploaded_tx) => {
                if let Err(publisher_message) =
                    split_uploaded_tx.send(SequencerCommand::Proceed(split_update))
                {
                    bail!(
                        "failed to send upload split `{:?}`. the publisher is probably dead",
                        &publisher_message
                    );
                }
            }
            SplitsUpdateSender::Publisher(publisher_mailbox) => {
                ctx.send_message(&publisher_mailbox, split_update).await?;
            }
        }
        Ok(())
    }
}

#[derive(Clone)]
pub struct Uploader {
    uploader_type: UploaderType,
    metastore: MetastoreServiceClient,
    merge_policy: Arc<dyn MergePolicy>,
    retention_policy: Option<RetentionPolicy>,
    split_store: IndexingSplitStore,
    split_update_mailbox: SplitsUpdateMailbox,
    max_concurrent_split_uploads: usize,
    counters: UploaderCounters,
    event_broker: EventBroker,
}

impl Uploader {
    #[allow(clippy::too_many_arguments)]
    pub fn new(
        uploader_type: UploaderType,
        metastore: MetastoreServiceClient,
        merge_policy: Arc<dyn MergePolicy>,
        retention_policy: Option<RetentionPolicy>,
        split_store: IndexingSplitStore,
        split_update_mailbox: SplitsUpdateMailbox,
        max_concurrent_split_uploads: usize,
        event_broker: EventBroker,
    ) -> Uploader {
        Uploader {
            uploader_type,
            metastore,
            merge_policy,
            retention_policy,
            split_store,
            split_update_mailbox,
            max_concurrent_split_uploads,
            counters: Default::default(),
            event_broker,
        }
    }
    async fn acquire_semaphore(
        &self,
        ctx: &ActorContext<Self>,
    ) -> anyhow::Result<SemaphorePermit<'static>> {
        let _guard = ctx.protect_zone();
        let (concurrent_upload_permits_once_cell, concurrent_upload_permits_gauge) =
            match self.uploader_type {
                UploaderType::IndexUploader => (
                    &CONCURRENT_UPLOAD_PERMITS_INDEX,
                    INDEXER_METRICS
                        .available_concurrent_upload_permits
                        .with_label_values(["indexer"]),
                ),
                UploaderType::MergeUploader => (
                    &CONCURRENT_UPLOAD_PERMITS_MERGE,
                    INDEXER_METRICS
                        .available_concurrent_upload_permits
                        .with_label_values(["merger"]),
                ),
                UploaderType::DeleteUploader => (
                    &CONCURRENT_UPLOAD_PERMITS_MERGE,
                    INDEXER_METRICS
                        .available_concurrent_upload_permits
                        .with_label_values(["merger"]),
                ),
            };
        let concurrent_upload_permits = concurrent_upload_permits_once_cell
            .get_or_init(|| Semaphore::const_new(self.max_concurrent_split_uploads));
        concurrent_upload_permits_gauge.set(concurrent_upload_permits.available_permits() as i64);
        concurrent_upload_permits
            .acquire()
            .await
            .context("the uploader semaphore is closed. (this should never happen)")
    }
}

#[derive(Clone, Debug, Default, Serialize)]
pub struct UploaderCounters {
    pub num_staged_splits: Arc<AtomicU64>,
    pub num_uploaded_splits: Arc<AtomicU64>,
}

#[async_trait]
impl Actor for Uploader {
    type ObservableState = UploaderCounters;

    #[allow(clippy::unused_unit)]
    fn observable_state(&self) -> Self::ObservableState {
        self.counters.clone()
    }

    fn queue_capacity(&self) -> QueueCapacity {
        // We do not need a large capacity here...
        // The uploader just spawns tasks that are uploading,
        // so that in a sense, the CONCURRENT_UPLOAD_PERMITS semaphore also acts as
        // a queue capacity.
        //
        // Having a large queue is costly too, because each message is a handle over
        // a split directory. We DO need aggressive backpressure here.
        QueueCapacity::Bounded(0)
    }

    fn name(&self) -> String {
        format!("{:?}", self.uploader_type)
    }
}

#[async_trait]
impl Handler<PackagedSplitBatch> for Uploader {
    type Reply = ();

    #[instrument(name = "uploader",
        parent=batch.batch_parent_span.id(),
        skip_all)]
    async fn handle(
        &mut self,
        batch: PackagedSplitBatch,
        ctx: &ActorContext<Self>,
    ) -> Result<(), ActorExitStatus> {
        fail_point!("uploader:before");
        let split_update_sender = self
            .split_update_mailbox
            .get_split_update_sender(ctx)
            .await?;

        // The permit will be added back manually to the semaphore the task after it is finished.
        // This is not a valid usage of protected zone here.
        //
        // Protected zone are supposed to be used when the cause for blocking is
        // outside of the responsibility of the current actor.
        // For instance, when sending a message on a downstream actor with a saturated
        // mailbox.
        // This is meant to be fixed with ParallelActors.
        let permit_guard = self.acquire_semaphore(ctx).await?;
        let kill_switch = ctx.kill_switch().clone();
        let split_ids = batch.split_ids();
        if kill_switch.is_dead() {
            warn!(split_ids=?split_ids,"kill switch was activated, cancelling upload");
            return Err(ActorExitStatus::Killed);
        }
        let metastore = self.metastore.clone();
        let split_store = self.split_store.clone();
        let counters = self.counters.clone();
        let index_uid = batch.index_uid();
        let ctx_clone = ctx.clone();
        let merge_policy = self.merge_policy.clone();
        let retention_policy = self.retention_policy.clone();
        debug!(split_ids=?split_ids, "start-stage-and-store-splits");
        let event_broker = self.event_broker.clone();
        spawn_named_task(
            async move {
                fail_point!("uploader:intask:before");

                let mut split_metadata_list = Vec::with_capacity(batch.splits.len());
                let mut report_splits: Vec<ReportSplit> = Vec::with_capacity(batch.splits.len());

                for packaged_split in batch.splits.iter() {
                    if batch.publish_lock.is_dead() {
                        // TODO: Remove the junk right away?
                        info!("splits' publish lock is dead");
                        if let Err(e) = split_update_sender.discard() {
                            warn!(cause=?e, "could not discard split");
                        }
                        return;
                    }

                    let split_streamer = match SplitPayloadBuilder::get_split_payload(
                        &packaged_split.split_files,
                        &packaged_split.serialized_split_fields,
                        &packaged_split.hotcache_bytes,
                    ) {
                        Ok(split_streamer) => split_streamer,
                        Err(e) => {
                            warn!(cause=?e, split_id=packaged_split.split_id(), "could not create split streamer");
                            return;
                        }
                    };
                    let split_metadata = create_split_metadata(
                        &merge_policy,
                        retention_policy.as_ref(),
                        &packaged_split.split_attrs,
                        packaged_split.tags.clone(),
                        split_streamer.footer_range.start..split_streamer.footer_range.end,
                    );

                    report_splits.push(ReportSplit {
                        storage_uri: split_store.remote_uri().to_string(),
                        split_id: packaged_split.split_id().to_string(),
                    });

                    split_metadata_list.push(split_metadata);

                }

                let stage_splits_request = match StageSplitsRequest::try_from_splits_metadata(index_uid.clone(), split_metadata_list.clone()) {
                    Ok(stage_splits_request) => stage_splits_request,
                    Err(e) => {
                        warn!(cause=?e, "could not create stage splits request");
                        return;
                    }
                };
                if let Err(e) = metastore
                    .clone()
                    .stage_splits(stage_splits_request)
                    .await
                {
                    warn!(cause=?e, "failed to stage splits");
                    return;
                };

                counters.num_staged_splits.fetch_add(split_metadata_list.len() as u64, Ordering::SeqCst);

                let mut packaged_splits_and_metadata = Vec::with_capacity(batch.splits.len());

                event_broker.publish(ReportSplitsRequest { report_splits });

                for (packaged_split, metadata) in batch.splits.into_iter().zip(split_metadata_list) {
                    let upload_result = upload_split(
                        &packaged_split,
                        &metadata,
                        &split_store,
                        counters.clone(),
                    )
                    .await;

                    if let Err(cause) = upload_result {
                        warn!(cause=?cause, split_id=packaged_split.split_id(), "Failed to upload split. Killing!");
                        kill_switch.kill();
                        return;
                    }

                    packaged_splits_and_metadata.push((packaged_split, metadata));
                }

                let splits_update = make_publish_operation(
                    index_uid,
                    packaged_splits_and_metadata,
                    batch.checkpoint_delta_opt,
                    batch.publish_lock,
                    batch.publish_token_opt,
                    batch.merge_task_opt,
                    batch.batch_parent_span,
                );

                let target = match &split_update_sender {
                    SplitsUpdateSender::Sequencer(_) => "sequencer",
                    SplitsUpdateSender::Publisher(_) => "publisher",
                };
                if let Err(e) = split_update_sender.send(splits_update, &ctx_clone).await {
                    warn!(cause=?e, target, "failed to send uploaded split");
                    return;
                }
                // We explicitly drop it in order to force move the permit guard into the async
                // task.
                mem::drop(permit_guard);
            }
            .instrument(Span::current()),
            "upload_single_task"
        );
        fail_point!("uploader:intask:after");
        Ok(())
    }
}

#[async_trait]
impl Handler<EmptySplit> for Uploader {
    type Reply = ();

    #[instrument(
        name="upload_empty_split",
        parent=empty_split.batch_parent_span.id(),
        skip_all,
    )]
    async fn handle(
        &mut self,
        empty_split: EmptySplit,
        ctx: &ActorContext<Self>,
    ) -> Result<(), ActorExitStatus> {
        let split_update_sender = self
            .split_update_mailbox
            .get_split_update_sender(ctx)
            .await?;
        let splits_update = SplitsUpdate {
            index_uid: empty_split.index_uid,
            new_splits: Vec::new(),
            replaced_split_ids: Vec::new(),
            checkpoint_delta_opt: Some(empty_split.checkpoint_delta),
            publish_lock: empty_split.publish_lock,
            publish_token_opt: empty_split.publish_token_opt,
            merge_task: None,
            parent_span: empty_split.batch_parent_span,
        };

        split_update_sender.send(splits_update, ctx).await?;
        Ok(())
    }
}

fn make_publish_operation(
    index_uid: IndexUid,
    packaged_splits_and_metadatas: Vec<(PackagedSplit, SplitMetadata)>,
    checkpoint_delta_opt: Option<IndexCheckpointDelta>,
    publish_lock: PublishLock,
    publish_token_opt: Option<PublishToken>,
    merge_task: Option<MergeTask>,
    parent_span: Span,
) -> SplitsUpdate {
    assert!(!packaged_splits_and_metadatas.is_empty());
    let replaced_split_ids = packaged_splits_and_metadatas
        .iter()
        .flat_map(|(split, _)| split.split_attrs.replaced_split_ids.clone())
        .collect::<HashSet<_>>();
    SplitsUpdate {
        index_uid,
        new_splits: packaged_splits_and_metadatas
            .into_iter()
            .map(|split_and_meta| split_and_meta.1)
            .collect_vec(),
        replaced_split_ids: Vec::from_iter(replaced_split_ids),
        checkpoint_delta_opt,
        publish_lock,
        publish_token_opt,
        merge_task,
        parent_span,
    }
}

#[instrument(
    level = "info"
    name = "upload",
    fields(split = %packaged_split.split_attrs.split_id),
    skip_all
)]
async fn upload_split(
    packaged_split: &PackagedSplit,
    split_metadata: &SplitMetadata,
    split_store: &IndexingSplitStore,
    counters: UploaderCounters,
) -> anyhow::Result<()> {
    let split_streamer = SplitPayloadBuilder::get_split_payload(
        &packaged_split.split_files,
        &packaged_split.serialized_split_fields,
        &packaged_split.hotcache_bytes,
    )?;

    split_store
        .store_split(
            split_metadata,
            packaged_split.split_scratch_directory.path(),
            Box::new(split_streamer),
        )
        .await?;
    counters.num_uploaded_splits.fetch_add(1, Ordering::SeqCst);
    Ok(())
}

#[cfg(test)]
mod tests {
    use std::path::PathBuf;
    use std::time::Duration;

    use quickwit_actors::{ObservationType, Universe};
    use quickwit_common::pubsub::EventSubscriber;
    use quickwit_common::temp_dir::TempDirectory;
    use quickwit_metastore::checkpoint::{IndexCheckpointDelta, SourceCheckpointDelta};
    use quickwit_proto::metastore::{EmptyResponse, MockMetastoreService};
    use quickwit_proto::types::{DocMappingUid, NodeId};
    use quickwit_storage::RamStorage;
    use tantivy::DateTime;
    use tokio::sync::oneshot;

    use super::*;
    use crate::merge_policy::{NopMergePolicy, default_merge_policy};
    use crate::models::{SplitAttrs, SplitsUpdate};

    #[tokio::test]
    async fn test_uploader_with_sequencer() -> anyhow::Result<()> {
        quickwit_common::setup_logging_for_tests();

        let node_id = NodeId::from("test-node");
        let index_uid = IndexUid::new_with_random_ulid("test-index");
        let source_id = "test-source".to_string();

        let event_broker = EventBroker::default();
        let universe = Universe::new();
        let (sequencer_mailbox, sequencer_inbox) =
            universe.create_test_mailbox::<Sequencer<Publisher>>();
        let mut mock_metastore = MockMetastoreService::new();
        mock_metastore
            .expect_stage_splits()
            .withf(move |stage_splits_request| -> bool {
                let splits_metadata = stage_splits_request.deserialize_splits_metadata().unwrap();
                let split_metadata = &splits_metadata[0];
                let index_uid: IndexUid = stage_splits_request.index_uid().clone();
                index_uid.index_id == "test-index"
                    && split_metadata.split_id() == "test-split"
                    && split_metadata.time_range == Some(1628203589..=1628203640)
            })
            .times(1)
            .returning(|_| Ok(EmptyResponse {}));
        let ram_storage = RamStorage::default();
        let split_store =
            IndexingSplitStore::create_without_local_store_for_test(Arc::new(ram_storage.clone()));
        let merge_policy = Arc::new(NopMergePolicy);
        let uploader = Uploader::new(
            UploaderType::IndexUploader,
            MetastoreServiceClient::from_mock(mock_metastore),
            merge_policy,
            None,
            split_store,
            SplitsUpdateMailbox::Sequencer(sequencer_mailbox),
            4,
            event_broker,
        );
        let (uploader_mailbox, uploader_handle) = universe.spawn_builder().spawn(uploader);
        let split_scratch_directory = TempDirectory::for_test();
        let checkpoint_delta_opt: Option<IndexCheckpointDelta> = Some(IndexCheckpointDelta {
            source_id: "test-source".to_string(),
            source_delta: SourceCheckpointDelta::from_range(3..15),
        });
        uploader_mailbox
            .send_message(PackagedSplitBatch::new(
                vec![PackagedSplit {
                    split_attrs: SplitAttrs {
                        node_id,
                        index_uid,
                        source_id,
                        doc_mapping_uid: DocMappingUid::default(),
                        partition_id: 3u64,
                        time_range: Some(
                            DateTime::from_timestamp_secs(1_628_203_589)
                                ..=DateTime::from_timestamp_secs(1_628_203_640),
                        ),
                        uncompressed_docs_size_in_bytes: 1_000,
                        num_docs: 10,
                        replaced_split_ids: Vec::new(),
                        split_id: "test-split".to_string(),
                        delete_opstamp: 10,
                        num_merge_ops: 0,
                    },
                    serialized_split_fields: Vec::new(),
                    split_scratch_directory,
                    tags: Default::default(),
                    hotcache_bytes: Vec::new(),
                    split_files: Vec::new(),
                }],
                checkpoint_delta_opt,
                PublishLock::default(),
                None,
                None,
                Span::none(),
            ))
            .await?;
        assert_eq!(
            uploader_handle.process_pending_and_observe().await.obs_type,
            ObservationType::Alive
        );
        let mut publish_futures: Vec<oneshot::Receiver<SequencerCommand<SplitsUpdate>>> =
            sequencer_inbox.drain_for_test_typed();
        assert_eq!(publish_futures.len(), 1);

        let publisher_message = match publish_futures.pop().unwrap().await? {
            SequencerCommand::Discard => panic!(
                "expected `SequencerCommand::Proceed(SplitUpdate)`, got \
                 `SequencerCommand::Discard`"
            ),
            SequencerCommand::Proceed(publisher_message) => publisher_message,
        };
        let SplitsUpdate {
            index_uid,
            new_splits,
            checkpoint_delta_opt,
            replaced_split_ids,
            ..
        } = publisher_message;

        assert_eq!(index_uid.index_id, "test-index");
        assert_eq!(new_splits.len(), 1);
        assert_eq!(new_splits[0].split_id(), "test-split");
        let checkpoint_delta = checkpoint_delta_opt.unwrap();
        assert_eq!(checkpoint_delta.source_id, "test-source");
        assert_eq!(
            checkpoint_delta.source_delta,
            SourceCheckpointDelta::from_range(3..15)
        );
        assert!(replaced_split_ids.is_empty());
        let mut files = ram_storage.list_files().await;
        files.sort();
        assert_eq!(&files, &[PathBuf::from("test-split.split")]);
        universe.assert_quit().await;
        Ok(())
    }

    #[tokio::test]
    async fn test_uploader_with_sequencer_emits_replace() -> anyhow::Result<()> {
        let node_id = NodeId::from("test-node");
        let index_uid = IndexUid::new_with_random_ulid("test-index");
        let source_id = "test-source".to_string();

        let universe = Universe::new();
        let (sequencer_mailbox, sequencer_inbox) =
            universe.create_test_mailbox::<Sequencer<Publisher>>();
        let mut mock_metastore = MockMetastoreService::new();
        mock_metastore
            .expect_stage_splits()
            .withf(move |stage_splits_request| -> bool {
                let splits_metadata = stage_splits_request.deserialize_splits_metadata().unwrap();
                let is_metadata_valid = splits_metadata.iter().all(|metadata| {
                    ["test-split-1", "test-split-2"].contains(&metadata.split_id())
                        && metadata.time_range == Some(1628203589..=1628203640)
                });
                let index_uid: IndexUid = stage_splits_request.index_uid().clone();
                index_uid.index_id == "test-index" && is_metadata_valid
            })
            .times(1)
            .returning(|_| Ok(EmptyResponse {}));
        let ram_storage = RamStorage::default();
        let split_store =
            IndexingSplitStore::create_without_local_store_for_test(Arc::new(ram_storage.clone()));
        let merge_policy = Arc::new(NopMergePolicy);
        let uploader = Uploader::new(
            UploaderType::IndexUploader,
            MetastoreServiceClient::from_mock(mock_metastore),
            merge_policy,
            None,
            split_store,
            SplitsUpdateMailbox::Sequencer(sequencer_mailbox),
            4,
            EventBroker::default(),
        );
        let (uploader_mailbox, uploader_handle) = universe.spawn_builder().spawn(uploader);
        let split_scratch_directory_1 = TempDirectory::for_test();
        let split_scratch_directory_2 = TempDirectory::for_test();
        let packaged_split_1 = PackagedSplit {
            split_attrs: SplitAttrs {
                node_id: node_id.clone(),
                index_uid: index_uid.clone(),
                source_id: source_id.clone(),
                doc_mapping_uid: DocMappingUid::default(),
                split_id: "test-split-1".to_string(),
                partition_id: 3u64,
                num_docs: 10,
                uncompressed_docs_size_in_bytes: 1_000,
                time_range: Some(
                    DateTime::from_timestamp_secs(1_628_203_589)
                        ..=DateTime::from_timestamp_secs(1_628_203_640),
                ),
                replaced_split_ids: vec![
                    "replaced-split-1".to_string(),
                    "replaced-split-2".to_string(),
                ],
                delete_opstamp: 0,
                num_merge_ops: 0,
            },
            serialized_split_fields: Vec::new(),
            split_scratch_directory: split_scratch_directory_1,
            tags: Default::default(),
            split_files: Vec::new(),
            hotcache_bytes: Vec::new(),
        };
        let package_split_2 = PackagedSplit {
            split_attrs: SplitAttrs {
                node_id,
                index_uid,
                source_id,
                doc_mapping_uid: DocMappingUid::default(),
                split_id: "test-split-2".to_string(),
                partition_id: 3u64,
                num_docs: 10,
                uncompressed_docs_size_in_bytes: 1_000,
                time_range: Some(
                    DateTime::from_timestamp_secs(1_628_203_589)
                        ..=DateTime::from_timestamp_secs(1_628_203_640),
                ),
                replaced_split_ids: vec![
                    "replaced-split-1".to_string(),
                    "replaced-split-2".to_string(),
                ],
                delete_opstamp: 0,
                num_merge_ops: 0,
            },
            serialized_split_fields: Vec::new(),
            split_scratch_directory: split_scratch_directory_2,
            tags: Default::default(),
            split_files: Vec::new(),
            hotcache_bytes: Vec::new(),
        };
        uploader_mailbox
            .send_message(PackagedSplitBatch::new(
                vec![packaged_split_1, package_split_2],
                None,
                PublishLock::default(),
                None,
                None,
                Span::none(),
            ))
            .await?;
        assert_eq!(
            uploader_handle.process_pending_and_observe().await.obs_type,
            ObservationType::Alive
        );
        let mut publish_futures: Vec<oneshot::Receiver<SequencerCommand<SplitsUpdate>>> =
            sequencer_inbox.drain_for_test_typed();
        assert_eq!(publish_futures.len(), 1);

        let publisher_message = match publish_futures.pop().unwrap().await? {
            SequencerCommand::Discard => panic!(
                "Expected `SequencerCommand::Proceed(SplitsUpdate)`, got \
                 `SequencerCommand::Discard`."
            ),
            SequencerCommand::Proceed(publisher_message) => publisher_message,
        };
        let SplitsUpdate {
            index_uid,
            new_splits,
            mut replaced_split_ids,
            checkpoint_delta_opt,
            ..
        } = publisher_message;
        assert_eq!(index_uid.index_id, "test-index");
        // Sort first to avoid test failing.
        replaced_split_ids.sort();
        assert_eq!(new_splits.len(), 2);
        assert_eq!(new_splits[0].split_id(), "test-split-1");
        assert_eq!(new_splits[1].split_id(), "test-split-2");
        assert_eq!(
            &replaced_split_ids,
            &[
                "replaced-split-1".to_string(),
                "replaced-split-2".to_string()
            ]
        );
        assert!(checkpoint_delta_opt.is_none());

        let mut files = ram_storage.list_files().await;
        files.sort();
        assert_eq!(
            &files,
            &[
                PathBuf::from("test-split-1.split"),
                PathBuf::from("test-split-2.split")
            ]
        );
        universe.assert_quit().await;
        Ok(())
    }

    #[tokio::test]
    async fn test_uploader_without_sequencer() -> anyhow::Result<()> {
        let node_id = NodeId::from("test-node");
        let index_uid = IndexUid::for_test("test-index", 0);
        let index_uid_clone = index_uid.clone();
        let source_id = "test-source".to_string();

        let universe = Universe::new();
        let (publisher_mailbox, publisher_inbox) = universe.create_test_mailbox::<Publisher>();
        let mut mock_metastore = MockMetastoreService::new();
        mock_metastore
            .expect_stage_splits()
            .withf(move |stage_splits_request| -> bool {
                stage_splits_request.index_uid() == &index_uid_clone
            })
            .times(1)
            .returning(|_| Ok(EmptyResponse {}));
        let ram_storage = RamStorage::default();
        let split_store =
            IndexingSplitStore::create_without_local_store_for_test(Arc::new(ram_storage.clone()));
        let merge_policy = Arc::new(NopMergePolicy);
        let uploader = Uploader::new(
            UploaderType::IndexUploader,
            MetastoreServiceClient::from_mock(mock_metastore),
            merge_policy,
            None,
            split_store,
            SplitsUpdateMailbox::Publisher(publisher_mailbox),
            4,
            EventBroker::default(),
        );
        let (uploader_mailbox, uploader_handle) = universe.spawn_builder().spawn(uploader);
        let split_scratch_directory = TempDirectory::for_test();
        let checkpoint_delta_opt: Option<IndexCheckpointDelta> = Some(IndexCheckpointDelta {
            source_id: "test-source".to_string(),
            source_delta: SourceCheckpointDelta::from_range(3..15),
        });
        uploader_mailbox
            .send_message(PackagedSplitBatch::new(
                vec![PackagedSplit {
                    split_attrs: SplitAttrs {
                        node_id,
                        index_uid,
                        source_id,
                        doc_mapping_uid: DocMappingUid::default(),
                        split_id: "test-split".to_string(),
                        partition_id: 3u64,
                        time_range: None,
                        uncompressed_docs_size_in_bytes: 1_000,
                        num_docs: 10,
                        replaced_split_ids: Vec::new(),
                        delete_opstamp: 10,
                        num_merge_ops: 0,
                    },
                    serialized_split_fields: Vec::new(),
                    split_scratch_directory,
                    tags: Default::default(),
                    hotcache_bytes: Vec::new(),
                    split_files: Vec::new(),
                }],
                checkpoint_delta_opt,
                PublishLock::default(),
                None,
                None,
                Span::none(),
            ))
            .await?;
        assert_eq!(
            uploader_handle.process_pending_and_observe().await.obs_type,
            ObservationType::Alive
        );
        let SplitsUpdate {
            index_uid,
            new_splits,
            replaced_split_ids,
            ..
        } = publisher_inbox.recv_typed_message().await.unwrap();

        assert_eq!(index_uid.index_id, "test-index");
        assert_eq!(new_splits.len(), 1);
        assert!(replaced_split_ids.is_empty());
        universe.assert_quit().await;
        Ok(())
    }

    #[tokio::test]
    async fn test_uploader_with_empty_splits() -> anyhow::Result<()> {
        let universe = Universe::new();
        let (sequencer_mailbox, sequencer_inbox) =
            universe.create_test_mailbox::<Sequencer<Publisher>>();
        let mut mock_metastore = MockMetastoreService::new();
        mock_metastore.expect_stage_splits().never();
        let ram_storage = RamStorage::default();
        let split_store =
            IndexingSplitStore::create_without_local_store_for_test(Arc::new(ram_storage.clone()));
        let uploader = Uploader::new(
            UploaderType::IndexUploader,
            MetastoreServiceClient::from_mock(mock_metastore),
            default_merge_policy(),
            None,
            split_store,
            SplitsUpdateMailbox::Sequencer(sequencer_mailbox),
            4,
            EventBroker::default(),
        );
        let (uploader_mailbox, uploader_handle) = universe.spawn_builder().spawn(uploader);
        let checkpoint_delta = IndexCheckpointDelta {
            source_id: "test-source".to_string(),
            source_delta: SourceCheckpointDelta::from_range(3..15),
        };
        uploader_mailbox
            .send_message(EmptySplit {
                index_uid: IndexUid::new_with_random_ulid("test-index"),
                checkpoint_delta,
                publish_lock: PublishLock::default(),
                publish_token_opt: None,
                batch_parent_span: Span::none(),
            })
            .await?;
        assert_eq!(
            uploader_handle.process_pending_and_observe().await.obs_type,
            ObservationType::Alive
        );
        let mut publish_futures: Vec<oneshot::Receiver<SequencerCommand<SplitsUpdate>>> =
            sequencer_inbox.drain_for_test_typed();
        assert_eq!(publish_futures.len(), 1);

        let publisher_message = match publish_futures.pop().unwrap().await? {
            SequencerCommand::Discard => panic!(
                "Expected `SequencerCommand::Proceed(SplitUpdate)`, got \
                 `SequencerCommand::Discard`."
            ),
            SequencerCommand::Proceed(publisher_message) => publisher_message,
        };
        let SplitsUpdate {
            index_uid,
            new_splits,
            checkpoint_delta_opt,
            replaced_split_ids,
            ..
        } = publisher_message;

        assert_eq!(index_uid.index_id, "test-index");
        assert_eq!(new_splits.len(), 0);
        let checkpoint_delta = checkpoint_delta_opt.unwrap();
        assert_eq!(checkpoint_delta.source_id, "test-source");
        assert_eq!(
            checkpoint_delta.source_delta,
            SourceCheckpointDelta::from_range(3..15)
        );
        assert!(replaced_split_ids.is_empty());
        let files = ram_storage.list_files().await;
        assert!(files.is_empty());
        universe.assert_quit().await;
        Ok(())
    }

    struct ReportSplitListener {
        report_splits_tx: flume::Sender<ReportSplitsRequest>,
    }

    impl std::fmt::Debug for ReportSplitListener {
        fn fmt(&self, f: &mut std::fmt::Formatter) -> std::fmt::Result {
            f.debug_struct("ReportSplitListener").finish()
        }
    }

    #[async_trait]
    impl EventSubscriber<ReportSplitsRequest> for ReportSplitListener {
        async fn handle_event(&mut self, event: ReportSplitsRequest) {
            self.report_splits_tx.send(event).unwrap();
        }
    }

    #[tokio::test]
    async fn test_uploader_notifies_event_broker() -> anyhow::Result<()> {
        quickwit_common::setup_logging_for_tests();
        const SPLIT_ULID_STR: &str = "01HAV29D4XY3D462FS3D8K5Q2H";
        let event_broker = EventBroker::default();
        let (report_splits_tx, report_splits_rx) = flume::unbounded();
        let report_splits_listener = ReportSplitListener { report_splits_tx };

        // we need to keep the handle alive.
        let _subscribe_handle = event_broker.subscribe(report_splits_listener);

        let node_id = NodeId::from("test-node");
        let index_uid = IndexUid::new_with_random_ulid("test-index");
        let source_id = "test-source".to_string();

        let universe = Universe::new();
        let mut mock_metastore = MockMetastoreService::new();
        mock_metastore
            .expect_stage_splits()
            .times(1)
            .returning(|_| Ok(EmptyResponse {}));
        let ram_storage = RamStorage::default();
        let split_store =
            IndexingSplitStore::create_without_local_store_for_test(Arc::new(ram_storage.clone()));
        let merge_policy = Arc::new(NopMergePolicy);
        let (publisher_mailbox, _publisher_inbox) = universe.create_test_mailbox();
        let uploader = Uploader::new(
            UploaderType::IndexUploader,
            MetastoreServiceClient::from_mock(mock_metastore),
            merge_policy,
            None,
            split_store,
            SplitsUpdateMailbox::Publisher(publisher_mailbox),
            4,
            event_broker,
        );
        let (uploader_mailbox, uploader_handle) = universe.spawn_builder().spawn(uploader);
        let split_scratch_directory = TempDirectory::for_test();
        let checkpoint_delta_opt: Option<IndexCheckpointDelta> = Some(IndexCheckpointDelta {
            source_id: "test-source".to_string(),
            source_delta: SourceCheckpointDelta::from_range(3..15),
        });
        uploader_mailbox
            .send_message(PackagedSplitBatch::new(
                vec![PackagedSplit {
                    split_attrs: SplitAttrs {
                        node_id,
                        index_uid,
                        source_id,
                        doc_mapping_uid: DocMappingUid::default(),
                        partition_id: 3u64,
                        time_range: Some(
                            DateTime::from_timestamp_secs(1_628_203_589)
                                ..=DateTime::from_timestamp_secs(1_628_203_640),
                        ),
                        uncompressed_docs_size_in_bytes: 1_000,
                        num_docs: 10,
                        replaced_split_ids: Vec::new(),
                        split_id: SPLIT_ULID_STR.to_string(),
                        delete_opstamp: 10,
                        num_merge_ops: 0,
                    },
                    serialized_split_fields: Vec::new(),
                    split_scratch_directory,
                    tags: Default::default(),
                    hotcache_bytes: Vec::new(),
                    split_files: Vec::new(),
                }],
                checkpoint_delta_opt,
                PublishLock::default(),
                None,
                None,
                Span::none(),
            ))
            .await?;
        assert_eq!(
            uploader_handle.process_pending_and_observe().await.obs_type,
            ObservationType::Alive
        );
        mem::drop(uploader_mailbox);
        let report_splits: ReportSplitsRequest = report_splits_rx
            .recv_timeout(Duration::from_secs(1))
            .unwrap();
        assert_eq!(report_splits.report_splits.len(), 1);
        let split = &report_splits.report_splits[0];
        assert_eq!(split.storage_uri, "ram:///");
        assert_eq!(split.split_id, SPLIT_ULID_STR);
        universe.assert_quit().await;
        Ok(())
    }
}


================================================
FILE: quickwit/quickwit-indexing/src/actors/vrl_processing.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::BTreeMap;

use quickwit_config::TransformConfig;
use tracing::warn;
use vrl::compiler::runtime::Runtime;
pub use vrl::compiler::runtime::Terminate as VrlTerminate;
use vrl::compiler::state::RuntimeState;
use vrl::compiler::{Program, TargetValueRef, TimeZone};
pub use vrl::value::{Secrets as VrlSecrets, Value as VrlValue};

use super::doc_processor::DocProcessorError;

pub(super) struct VrlDoc {
    pub vrl_value: VrlValue,
    pub num_bytes: usize,
}

impl VrlDoc {
    pub fn new(vrl_value: VrlValue, num_bytes: usize) -> Self {
        Self {
            vrl_value,
            num_bytes,
        }
    }
}

pub(super) struct VrlProgram {
    program: Program,
    timezone: TimeZone,
    runtime: Runtime,
    metadata: VrlValue,
    secrets: VrlSecrets,
}

impl VrlProgram {
    pub fn transform_doc(&mut self, vrl_doc: VrlDoc) -> Result<VrlDoc, DocProcessorError> {
        let VrlDoc {
            mut vrl_value,
            num_bytes,
        } = vrl_doc;

        let mut target = TargetValueRef {
            value: &mut vrl_value,
            metadata: &mut self.metadata,
            secrets: &mut self.secrets,
        };
        let runtime_res = self
            .runtime
            .resolve(&mut target, &self.program, &self.timezone)
            .map_err(|transform_error| {
                warn!(transform_error=?transform_error);
                DocProcessorError::Transform(transform_error)
            });

        if let VrlValue::Object(metadata) = target.metadata {
            metadata.clear();
        }
        self.runtime.clear();

        runtime_res.map(|vrl_value| VrlDoc::new(vrl_value, num_bytes))
    }

    pub fn try_from_transform_config(transform_config: TransformConfig) -> anyhow::Result<Self> {
        let (program, timezone) = transform_config.compile_vrl_script()?;
        let state = RuntimeState::default();
        let runtime = Runtime::new(state);

        Ok(VrlProgram {
            program,
            runtime,
            timezone,
            metadata: VrlValue::Object(BTreeMap::new()),
            secrets: VrlSecrets::default(),
        })
    }
}


================================================
FILE: quickwit/quickwit-indexing/src/controlled_directory.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::io::{BufWriter, IntoInnerError};
use std::ops::Deref;
use std::path::Path;
use std::sync::Arc;
use std::{fmt, io};

use arc_swap::ArcSwap;
use quickwit_common::ProtectedZoneGuard;
use quickwit_common::io::{ControlledWrite, IoControls, IoControlsAccess};
use tantivy::Directory;
use tantivy::directory::error::{DeleteError, OpenReadError, OpenWriteError};
use tantivy::directory::{
    AntiCallToken, FileHandle, TerminatingWrite, WatchCallback, WatchHandle, WritePtr,
};

/// Buffer capacity.
///
/// This is the current default for the BufWriter, but considering this constant
/// will have a direct impact on health check, we'd better fix it.
const BUFFER_NUM_BYTES: usize = 8_192;

/// The `ControlledDirectory` wraps another directory and enhances it
/// with functionalities such as
/// - records progress everytime a write (Note there is however a buffer writer above it)
/// - if the killswitch is activated, returns an error on the first write happening after it
/// - in the future, record a writing speed, possibly introduce some throttling, etc.
#[derive(Clone)]
pub struct ControlledDirectory {
    underlying: Arc<dyn Directory>,
    io_controls: HotswappableIoControls,
}

impl ControlledDirectory {
    pub fn new(directory: Box<dyn Directory>, io_controls: IoControls) -> ControlledDirectory {
        ControlledDirectory {
            underlying: directory.into(),
            io_controls: HotswappableIoControls::new(io_controls),
        }
    }

    pub fn check_if_alive(&self) -> io::Result<ProtectedZoneGuard> {
        self.io_controls.load().check_if_alive()
    }

    pub fn set_io_controls(&self, io_controls: IoControls) {
        self.io_controls.store(Arc::new(io_controls));
    }
}

impl fmt::Debug for ControlledDirectory {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        f.debug_struct("ControlledDirectory").finish()
    }
}

impl Directory for ControlledDirectory {
    fn get_file_handle(&self, path: &Path) -> Result<Arc<dyn FileHandle>, OpenReadError> {
        self.check_if_alive()
            .map_err(|io_err| OpenReadError::wrap_io_error(io_err, path.to_path_buf()))?;
        self.underlying.get_file_handle(path)
    }

    fn delete(&self, path: &Path) -> Result<(), DeleteError> {
        self.check_if_alive()
            .map_err(|io_error| DeleteError::IoError {
                io_error: Arc::new(io_error),
                filepath: path.to_path_buf(),
            })?;
        self.underlying.delete(path)
    }

    fn exists(&self, path: &Path) -> Result<bool, OpenReadError> {
        self.check_if_alive()
            .map_err(|io_err| OpenReadError::wrap_io_error(io_err, path.to_path_buf()))?;
        self.underlying.exists(path)
    }

    fn open_write(&self, path: &Path) -> Result<WritePtr, OpenWriteError> {
        self.check_if_alive()
            .map_err(|io_err| OpenWriteError::wrap_io_error(io_err, path.to_path_buf()))?;

        let underlying_wrt: Box<dyn TerminatingWrite> = self
            .underlying
            .open_write(path)?
            .into_inner()
            .map_err(IntoInnerError::into_error)
            .map_err(|io_err| OpenWriteError::wrap_io_error(io_err, path.to_path_buf()))?;
        let controlled_wrt = self.io_controls.clone().wrap_write(underlying_wrt);
        Ok(BufWriter::with_capacity(
            BUFFER_NUM_BYTES,
            Box::new(AdoptedControlledWrite(controlled_wrt)),
        ))
    }

    fn atomic_read(&self, path: &Path) -> Result<Vec<u8>, OpenReadError> {
        self.check_if_alive()
            .map_err(|io_err| OpenReadError::wrap_io_error(io_err, path.to_path_buf()))?;
        self.underlying.atomic_read(path)
    }

    fn atomic_write(&self, path: &Path, data: &[u8]) -> io::Result<()> {
        self.check_if_alive()?;
        self.underlying.atomic_write(path, data)
    }

    fn watch(&self, watch_callback: WatchCallback) -> tantivy::Result<WatchHandle> {
        self.check_if_alive()?;
        self.underlying.watch(watch_callback)
    }

    fn sync_directory(&self) -> io::Result<()> {
        self.check_if_alive()?;
        self.underlying.sync_directory()
    }
}

#[derive(Clone)]
struct HotswappableIoControls(Arc<ArcSwap<IoControls>>);

impl Deref for HotswappableIoControls {
    type Target = ArcSwap<IoControls>;

    fn deref(&self) -> &Self::Target {
        &self.0
    }
}

impl HotswappableIoControls {
    pub fn new(io_controls: IoControls) -> Self {
        Self(Arc::new(ArcSwap::new(Arc::new(io_controls))))
    }
}

impl IoControlsAccess for HotswappableIoControls {
    fn apply<F, R>(&self, f: F) -> R
    where F: Fn(&IoControls) -> R {
        let guard = self.0.load();
        f(&guard)
    }
}

// Wrapper to work around the orphan rule. (hence the word "Adopted").
struct AdoptedControlledWrite(ControlledWrite<HotswappableIoControls, Box<dyn TerminatingWrite>>);

impl io::Write for AdoptedControlledWrite {
    fn write(&mut self, buf: &[u8]) -> io::Result<usize> {
        self.0.write(buf)
    }

    fn flush(&mut self) -> io::Result<()> {
        self.0.flush()
    }
}

impl TerminatingWrite for AdoptedControlledWrite {
    #[inline]
    fn terminate_ref(&mut self, token: AntiCallToken) -> io::Result<()> {
        let underlying_wrt = self.0.underlying_wrt();
        underlying_wrt.flush()?;
        underlying_wrt.terminate_ref(token)
    }
}

#[cfg(test)]
mod tests {
    use std::io::Write;

    use tantivy::directory::RamDirectory;

    use super::*;

    #[test]
    fn test_records_progress_on_write() -> anyhow::Result<()> {
        let directory = RamDirectory::default();
        let io_controls = IoControls::default();
        let controlled_directory =
            ControlledDirectory::new(Box::new(directory), io_controls.clone());
        let progress = io_controls.progress().clone();
        assert!(progress.registered_activity_since_last_call());
        assert!(!progress.registered_activity_since_last_call());
        let mut wrt = controlled_directory.open_write(Path::new("test"))?;
        assert!(progress.registered_activity_since_last_call());
        // We use a large buffer to force the buf writer to flush at least once.
        let large_buffer = vec![0u8; wrt.capacity() + 1];
        assert_eq!(io_controls.num_bytes(), 0u64);
        wrt.write_all(&large_buffer)?;
        assert_eq!(io_controls.num_bytes(), 8_193u64);
        assert!(progress.registered_activity_since_last_call());
        wrt.write_all(b"small payload")?;
        // The buffering makes it so that this last write does not
        // get actually written right away.
        assert_eq!(io_controls.num_bytes(), 8_193u64);
        // Here we check that the progress only concerns is only
        // trigger when the BufWriter flushes.
        assert!(!progress.registered_activity_since_last_call());
        wrt.write_all(&large_buffer)?;
        assert_eq!(io_controls.num_bytes(), 16_399);
        assert!(progress.registered_activity_since_last_call());
        assert!(!progress.registered_activity_since_last_call());
        wrt.write_all(&b"aa"[..])?;
        assert_eq!(io_controls.num_bytes(), 16_399u64);
        wrt.terminate()?;
        // Flush works as expected and makes sure all data buffered goes through
        assert_eq!(io_controls.num_bytes(), 16_401u64);
        assert!(progress.registered_activity_since_last_call());
        Ok(())
    }

    #[test]
    fn test_records_kill_switch_triggers_io_error() -> anyhow::Result<()> {
        let directory = RamDirectory::default();
        let io_controls = IoControls::default();
        let controlled_directory =
            ControlledDirectory::new(Box::new(directory), io_controls.clone());
        let mut wrt = controlled_directory.open_write(Path::new("test"))?;
        // We use a large buffer to force the buf writer to flush at least once.
        let large_buffer = vec![0u8; wrt.capacity() + 1];
        wrt.write_all(&large_buffer)?;
        io_controls.kill();
        let err = wrt.write_all(&large_buffer).err().unwrap();
        assert_eq!(err.kind(), io::ErrorKind::Other);
        wrt.terminate()?;
        Ok(())
    }
}


================================================
FILE: quickwit/quickwit-indexing/src/lib.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#![deny(clippy::disallowed_methods)]

use quickwit_actors::{Mailbox, Universe};
use quickwit_cluster::Cluster;
use quickwit_common::pubsub::EventBroker;
use quickwit_config::NodeConfig;
use quickwit_ingest::{IngestApiService, IngesterPool};
use quickwit_proto::indexing::PipelineMetrics;
use quickwit_proto::metastore::MetastoreServiceClient;
use quickwit_storage::StorageResolver;
use tracing::info;

use crate::actors::MergeSchedulerService;
pub use crate::actors::{
    FinishPendingMergesAndShutdownPipeline, IndexingError, IndexingPipeline,
    IndexingPipelineParams, IndexingService, PublisherType, Sequencer, SplitsUpdateMailbox,
};
pub use crate::controlled_directory::ControlledDirectory;
use crate::models::IndexingStatistics;
pub use crate::split_store::{IndexingSplitStore, get_tantivy_directory_from_split_bundle};

pub mod actors;
mod controlled_directory;
pub mod merge_policy;
mod metrics;
pub mod models;
pub mod source;
mod split_store;
#[cfg(any(test, feature = "testsuite"))]
mod test_utils;

use quickwit_proto::indexing::CpuCapacity;
#[cfg(any(test, feature = "testsuite"))]
pub use test_utils::{MockSplitBuilder, TestSandbox, mock_split, mock_split_meta};

use self::merge_policy::MergePolicy;
pub use self::source::check_source_connectivity;

#[derive(utoipa::OpenApi)]
#[openapi(components(schemas(IndexingStatistics, PipelineMetrics, CpuCapacity)))]
/// Schema used for the OpenAPI generation which are apart of this crate.
pub struct IndexingApiSchemas;

pub fn new_split_id() -> String {
    ulid::Ulid::new().to_string()
}

#[allow(clippy::too_many_arguments)]
pub async fn start_indexing_service(
    universe: &Universe,
    config: &NodeConfig,
    num_blocking_threads: usize,
    cluster: Cluster,
    metastore: MetastoreServiceClient,
    ingester_pool: IngesterPool,
    storage_resolver: StorageResolver,
    event_broker: EventBroker,
) -> anyhow::Result<Mailbox<IndexingService>> {
    info!("starting indexer service");
    let ingest_api_service_mailbox = universe.get_one::<IngestApiService>();
    let (merge_scheduler_mailbox, _) = universe.spawn_builder().spawn(MergeSchedulerService::new(
        config.indexer_config.merge_concurrency.get(),
    ));
    // Spawn indexing service.
    let indexing_service = IndexingService::new(
        config.node_id.clone(),
        config.data_dir_path.to_path_buf(),
        config.indexer_config.clone(),
        num_blocking_threads,
        cluster,
        metastore.clone(),
        ingest_api_service_mailbox,
        merge_scheduler_mailbox,
        ingester_pool,
        storage_resolver,
        event_broker,
    )
    .await?;
    let (indexing_service, _) = universe.spawn_builder().spawn(indexing_service);
    Ok(indexing_service)
}


================================================
FILE: quickwit/quickwit-indexing/src/merge_policy/const_write_amplification.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::HashMap;
use std::ops::RangeInclusive;

use quickwit_config::IndexingSettings;
use quickwit_config::merge_policy_config::ConstWriteAmplificationMergePolicyConfig;
use quickwit_metastore::{SplitMaturity, SplitMetadata};
use time::OffsetDateTime;
use tracing::info;

use super::MergeOperation;
use crate::merge_policy::MergePolicy;

// Smallest number of splits in a finalize merge.
const FINALIZE_MIN_MERGE_FACTOR: usize = 3;

/// The `ConstWriteAmplificationMergePolicy` has been designed for a use
/// case where there are a several index partitions with different sizes,
/// and partitions tend to be searched separately. (e.g. partitioning by tenant.)
///
/// In that case, the StableLogMergePolicy would tend to target the same number
/// of docs for all tenants. Assuming a merge factor of 10 and a target num docs of 10 millions,
/// The write amplification observed for a small tenant, emitting splits of 1
/// document would be 7.
///
/// These extra merges have the benefit of making less splits, but really we are
/// over-trading write amplification for read amplification here.
///
/// The `ConstWriteAmplificationMergePolicy` is very simple. It targets a number
/// of merges instead, and stops once this number of merges is reached.
///
/// Only splits with the same number of merge operations are merged together,
/// and for a given merge operation, we build split in a greedy way.
/// After sorting the splits per creation date, we append splits one after the
/// other until we either reach `max_merge_factor` or we exceed the
/// targeted` split_num_docs`.
#[derive(Debug, Clone)]
pub struct ConstWriteAmplificationMergePolicy {
    config: ConstWriteAmplificationMergePolicyConfig,
    split_num_docs_target: usize,
}

impl Default for ConstWriteAmplificationMergePolicy {
    fn default() -> Self {
        ConstWriteAmplificationMergePolicy {
            config: Default::default(),
            split_num_docs_target: IndexingSettings::default_split_num_docs_target(),
        }
    }
}

impl ConstWriteAmplificationMergePolicy {
    pub fn new(
        config: ConstWriteAmplificationMergePolicyConfig,
        split_num_docs_target: usize,
    ) -> Self {
        ConstWriteAmplificationMergePolicy {
            config,
            split_num_docs_target,
        }
    }

    #[cfg(test)]
    fn for_test() -> ConstWriteAmplificationMergePolicy {
        use std::time::Duration;

        let config = ConstWriteAmplificationMergePolicyConfig {
            max_merge_ops: 3,
            merge_factor: 3,
            max_merge_factor: 5,
            maturation_period: Duration::from_secs(3600),
            max_finalize_merge_operations: 0,
            max_finalize_split_num_docs: None,
        };
        Self::new(config, 10_000_000)
    }

    /// Returns a merge operation within one `num_merge_ops` level if one can be built from the
    /// given splits. This method assumes that the splits are sorted by reverse creation date
    /// and have all the same `num_merge_ops`.
    fn single_merge_operation_within_num_merge_op_level(
        &self,
        splits: &mut Vec<SplitMetadata>,
        merge_factor_range: RangeInclusive<usize>,
    ) -> Option<MergeOperation> {
        let mut num_splits_in_merge = 0;
        let mut num_docs_in_merge = 0;
        for split in splits.iter().take(*merge_factor_range.end()) {
            num_docs_in_merge += split.num_docs;
            num_splits_in_merge += 1;
            if num_docs_in_merge >= self.split_num_docs_target {
                break;
            }
        }
        if (num_docs_in_merge < self.split_num_docs_target)
            && (num_splits_in_merge < *merge_factor_range.start())
        {
            return None;
        }
        assert!(num_splits_in_merge >= 2);
        let splits_in_merge = splits.drain(0..num_splits_in_merge).collect();
        let merge_operation = MergeOperation::new_merge_operation(splits_in_merge);
        Some(merge_operation)
    }

    fn merge_operations_within_num_merge_op_level(
        &self,
        splits: &mut Vec<SplitMetadata>,
    ) -> Vec<MergeOperation> {
        splits.sort_by(|left, right| {
            left.create_timestamp
                .cmp(&right.create_timestamp)
                .then_with(|| left.split_id().cmp(right.split_id()))
        });
        let mut merge_operations = Vec::new();
        while let Some(merge_op) =
            self.single_merge_operation_within_num_merge_op_level(splits, self.merge_factor_range())
        {
            merge_operations.push(merge_op);
        }
        merge_operations
    }

    fn merge_factor_range(&self) -> RangeInclusive<usize> {
        self.config.merge_factor..=self.config.max_merge_factor
    }
}

impl MergePolicy for ConstWriteAmplificationMergePolicy {
    fn operations(&self, splits: &mut Vec<SplitMetadata>) -> Vec<MergeOperation> {
        let mut group_by_num_merge_ops: HashMap<usize, Vec<SplitMetadata>> = HashMap::default();
        let mut mature_splits = Vec::new();
        let now = OffsetDateTime::now_utc();
        for split in splits.drain(..) {
            if split.is_mature(now) {
                mature_splits.push(split);
            } else {
                group_by_num_merge_ops
                    .entry(split.num_merge_ops)
                    .or_default()
                    .push(split);
            }
        }
        splits.extend(mature_splits);
        let mut merge_operations = Vec::new();
        for splits_in_group in group_by_num_merge_ops.values_mut() {
            let merge_ops = self.merge_operations_within_num_merge_op_level(splits_in_group);
            merge_operations.extend(merge_ops);
            // we readd the splits that are not used in a merge operation into the splits vector.
            splits.append(splits_in_group);
        }
        merge_operations
    }

    fn finalize_operations(&self, splits: &mut Vec<SplitMetadata>) -> Vec<MergeOperation> {
        if self.config.max_finalize_merge_operations == 0 {
            return Vec::new();
        }

        let now = OffsetDateTime::now_utc();

        // We first isolate mature splits. Let's not touch them.
        let (mature_splits, mut young_splits): (Vec<SplitMetadata>, Vec<SplitMetadata>) =
            splits.drain(..).partition(|split: &SplitMetadata| {
                if let Some(max_finalize_split_num_docs) = self.config.max_finalize_split_num_docs
                    && split.num_docs > max_finalize_split_num_docs
                {
                    return true;
                }
                split.is_mature(now)
            });
        splits.extend(mature_splits);

        // We then sort the split by reverse creation date and split id.
        // You may notice that reverse is the opposite of the rest of the policy.
        //
        // This is because these are the youngest splits. If we limit ourselves in the number of
        // merge we will operate, we might as well focus on the young == smaller ones for that
        // last merge.
        young_splits.sort_by(|left, right| {
            left.create_timestamp
                .cmp(&right.create_timestamp)
                .reverse()
                .then_with(|| left.split_id().cmp(right.split_id()))
        });
        let mut merge_operations = Vec::new();
        while merge_operations.len() < self.config.max_finalize_merge_operations {
            let min_merge_factor = FINALIZE_MIN_MERGE_FACTOR.min(self.config.max_merge_factor);
            let merge_factor_range = min_merge_factor..=self.config.max_merge_factor;
            if let Some(merge_op) = self.single_merge_operation_within_num_merge_op_level(
                &mut young_splits,
                merge_factor_range,
            ) {
                merge_operations.push(merge_op);
            } else {
                break;
            }
        }

        // We readd the young splits that are not used in any merge operation.
        splits.extend(young_splits);

        assert!(merge_operations.len() <= self.config.max_finalize_merge_operations);

        let num_splits_per_merge_op: Vec<usize> =
            merge_operations.iter().map(|op| op.splits.len()).collect();
        let num_docs_per_merge_op: Vec<usize> = merge_operations
            .iter()
            .map(|op| op.splits.iter().map(|split| split.num_docs).sum::<usize>())
            .collect();
        info!(
            num_splits_per_merge_op=?num_splits_per_merge_op,
            num_docs_per_merge_op=?num_docs_per_merge_op,
            "finalize merge operation");
        merge_operations
    }

    fn split_maturity(&self, split_num_docs: usize, split_num_merge_ops: usize) -> SplitMaturity {
        if split_num_merge_ops >= self.config.max_merge_ops {
            return SplitMaturity::Mature;
        }
        if split_num_docs >= self.split_num_docs_target {
            return SplitMaturity::Mature;
        }
        SplitMaturity::Immature {
            maturation_period: self.config.maturation_period,
        }
    }

    #[cfg(test)]
    fn check_is_valid(&self, merge_op: &MergeOperation, _remaining_splits: &[SplitMetadata]) {
        use std::collections::HashSet;
        assert!(merge_op.splits_as_slice().len() <= self.config.max_merge_factor);
        if merge_op.splits_as_slice().len() < self.config.merge_factor {
            let num_docs: usize = merge_op
                .splits_as_slice()
                .iter()
                .map(|split| split.num_docs)
                .sum();
            let last_split_num_docs = merge_op.splits_as_slice().last().unwrap().num_docs;
            assert!(num_docs >= self.split_num_docs_target);
            assert!(num_docs - last_split_num_docs < self.split_num_docs_target);
        }
        let num_merge_ops: HashSet<usize> = merge_op
            .splits_as_slice()
            .iter()
            .map(|merge_op| merge_op.num_merge_ops)
            .collect();
        assert_eq!(num_merge_ops.len(), 1);
        assert!(num_merge_ops.into_iter().next().unwrap() < self.config.max_merge_ops);
    }
}

#[cfg(test)]
mod tests {
    use std::collections::HashMap;
    use std::sync::Arc;
    use std::time::Duration;

    use quickwit_metastore::{SplitMaturity, SplitMetadata};
    use rand::seq::SliceRandom;
    use time::OffsetDateTime;

    use super::ConstWriteAmplificationMergePolicy;
    use crate::MergePolicy;
    use crate::merge_policy::MergeOperation;
    use crate::merge_policy::tests::create_splits;

    #[test]
    fn test_split_is_mature() {
        let merge_policy = ConstWriteAmplificationMergePolicy::for_test();
        let split = create_splits(&merge_policy, vec![9_000_000])
            .into_iter()
            .next()
            .unwrap();
        // Split under split_num_docs_target, num_merge_ops < max_merge_ops and created before now()
        // - maturation_period is not mature.
        assert_eq!(
            merge_policy.split_maturity(split.num_docs, split.num_merge_ops),
            SplitMaturity::Immature {
                maturation_period: Duration::from_secs(3600)
            }
        );
        // Split with docs > split_num_docs_target is mature.
        assert_eq!(
            merge_policy
                .split_maturity(merge_policy.split_num_docs_target + 1, split.num_merge_ops),
            SplitMaturity::Mature
        );

        // Split with num_merge_ops >= max_merge_ops is mature
        assert_eq!(
            merge_policy.split_maturity(split.num_docs, merge_policy.config.max_merge_ops),
            SplitMaturity::Mature
        );
    }

    #[test]
    fn test_const_write_amplification_merge_policy_empty() {
        let mut splits = Vec::new();
        let merge_policy = ConstWriteAmplificationMergePolicy::for_test();
        assert!(merge_policy.operations(&mut splits).is_empty());
    }

    #[test]
    fn test_const_write_merge_policy_single_split() {
        let merge_policy = ConstWriteAmplificationMergePolicy::for_test();
        let mut splits = vec![SplitMetadata {
            split_id: "01GE1R0KBFQHJ76030RYRAS8QA".to_string(),
            num_docs: 1,
            create_timestamp: 1665000000,
            maturity: merge_policy.split_maturity(1, 0),
            num_merge_ops: 4,
            ..Default::default()
        }];
        let operations: Vec<MergeOperation> = merge_policy.operations(&mut splits);
        assert!(operations.is_empty());
        assert_eq!(splits.len(), 1);
    }

    #[test]
    fn test_const_write_merge_policy_simple() {
        let merge_policy = ConstWriteAmplificationMergePolicy::for_test();
        let create_timestamp = OffsetDateTime::now_utc().unix_timestamp();
        let mut splits = (0..merge_policy.config.merge_factor)
            .map(|i| SplitMetadata {
                split_id: format!("split-{i}"),
                num_docs: 1_000,
                num_merge_ops: 1,
                create_timestamp,
                maturity: merge_policy.split_maturity(1_000, 1),
                ..Default::default()
            })
            .collect();
        let operations: Vec<MergeOperation> = merge_policy.operations(&mut splits);
        assert_eq!(operations.len(), 1);
        assert_eq!(
            operations[0].splits_as_slice().len(),
            merge_policy.config.merge_factor
        );
    }

    #[test]
    fn test_const_write_merge_policy_merge_factor_max() {
        let merge_policy = ConstWriteAmplificationMergePolicy::for_test();
        let time_to_maturity = merge_policy.split_maturity(1_000, 1);
        let create_timestamp = OffsetDateTime::now_utc().unix_timestamp();
        let mut splits =
            (0..merge_policy.config.max_merge_factor + merge_policy.config.merge_factor - 1)
                .map(|i| SplitMetadata {
                    split_id: format!("split-{i}"),
                    num_docs: 1_000,
                    num_merge_ops: 1,
                    create_timestamp,
                    maturity: time_to_maturity,
                    ..Default::default()
                })
                .collect();
        let operations: Vec<MergeOperation> = merge_policy.operations(&mut splits);
        assert_eq!(operations.len(), 1);
        assert_eq!(
            operations[0].splits_as_slice().len(),
            merge_policy.config.max_merge_factor
        );
    }

    #[test]
    fn test_const_write_merge_policy_older_first() {
        let merge_policy = ConstWriteAmplificationMergePolicy::for_test();
        let time_to_maturity = merge_policy.split_maturity(1_000, 1);
        let now_timestamp: i64 = OffsetDateTime::now_utc().unix_timestamp();
        let mut splits: Vec<SplitMetadata> = (0..merge_policy.config.max_merge_factor)
            .map(|i| SplitMetadata {
                split_id: format!("split-{i}"),
                num_docs: 1_000,
                num_merge_ops: 1,
                create_timestamp: now_timestamp + i as i64,
                maturity: time_to_maturity,
                ..Default::default()
            })
            .collect();
        splits.shuffle(&mut rand::rng());
        let operations: Vec<MergeOperation> = merge_policy.operations(&mut splits);
        assert_eq!(operations.len(), 1);
        assert_eq!(
            operations[0].splits_as_slice().len(),
            merge_policy.config.max_merge_factor
        );
        let split_ids: Vec<&str> = operations[0]
            .splits_as_slice()
            .iter()
            .map(|split| split.split_id())
            .collect();
        assert_eq!(
            &split_ids[..],
            &["split-0", "split-1", "split-2", "split-3", "split-4"]
        );
    }

    #[test]
    fn test_const_write_merge_policy_target_num_docs() {
        let merge_policy = ConstWriteAmplificationMergePolicy::for_test();
        let create_timestamp = OffsetDateTime::now_utc().unix_timestamp();
        let mut splits = (0..4)
            .map(|i| {
                let num_docs = merge_policy.split_num_docs_target.div_ceil(3);
                let time_to_maturity = merge_policy.split_maturity(num_docs, 1);
                SplitMetadata {
                    split_id: format!("split-{i}"),
                    num_docs,
                    num_merge_ops: 1,
                    create_timestamp,
                    maturity: time_to_maturity,
                    ..Default::default()
                }
            })
            .collect();
        let operations: Vec<MergeOperation> = merge_policy.operations(&mut splits);
        assert_eq!(operations.len(), 1);
        assert_eq!(operations[0].splits_as_slice().len(), 3);
    }

    #[test]
    fn test_const_write_amp_merge_policy_proptest() {
        let merge_policy = ConstWriteAmplificationMergePolicy::for_test();
        crate::merge_policy::tests::proptest_merge_policy(&merge_policy);
    }

    #[tokio::test]
    async fn test_simulate_const_write_amplification_merge_policy() -> anyhow::Result<()> {
        let merge_policy = ConstWriteAmplificationMergePolicy::for_test();
        let vals = vec![1; 1_211]; //< 1_211 splits with a single doc each.
        let final_splits = crate::merge_policy::tests::aux_test_simulate_merge_planner_num_docs(
            Arc::new(merge_policy.clone()),
            &vals[..],
            &|splits| {
                let mut num_merge_ops_counts: HashMap<usize, usize> = HashMap::default();
                for split in splits {
                    *num_merge_ops_counts.entry(split.num_merge_ops).or_default() += 1;
                }
                for split in splits {
                    assert!(split.num_merge_ops <= merge_policy.config.max_merge_ops);
                }
                for i in 0..merge_policy.config.max_merge_ops {
                    assert!(
                        num_merge_ops_counts.get(&i).copied().unwrap_or(0)
                            < merge_policy.config.merge_factor
                    );
                }
            },
        )
        .await?;
        assert_eq!(final_splits.len(), 49);
        Ok(())
    }

    #[tokio::test]
    async fn test_simulate_const_write_amplification_merge_policy_with_finalize() {
        let mut merge_policy = ConstWriteAmplificationMergePolicy::for_test();
        merge_policy.config.max_merge_factor = 10;
        merge_policy.config.merge_factor = 10;
        merge_policy.split_num_docs_target = 10_000_000;

        let vals: Vec<usize> = vec![1; 9 + 90 + 900]; //< 1_211 splits with a single doc each.

        let num_final_splits_given_max_finalize_merge_operations =
            |split_num_docs: Vec<usize>, max_finalize_merge_operations: usize| {
                let mut merge_policy_clone = merge_policy.clone();
                merge_policy_clone.config.max_finalize_merge_operations =
                    max_finalize_merge_operations;
                async move {
                    crate::merge_policy::tests::aux_test_simulate_merge_planner_num_docs(
                        Arc::new(merge_policy_clone),
                        &split_num_docs[..],
                        &|_splits| {},
                    )
                    .await
                    .unwrap()
                }
            };

        assert_eq!(
            num_final_splits_given_max_finalize_merge_operations(vals.clone(), 0)
                .await
                .len(),
            27
        );
        assert_eq!(
            num_final_splits_given_max_finalize_merge_operations(vals.clone(), 1)
                .await
                .len(),
            18
        );
        assert_eq!(
            num_final_splits_given_max_finalize_merge_operations(vals.clone(), 2)
                .await
                .len(),
            9
        );
        assert_eq!(
            num_final_splits_given_max_finalize_merge_operations(vals.clone(), 3)
                .await
                .len(),
            3
        );
        assert_eq!(
            num_final_splits_given_max_finalize_merge_operations(vec![1; 6], 1)
                .await
                .len(),
            1
        );
        assert_eq!(
            num_final_splits_given_max_finalize_merge_operations(vec![1; 3], 1)
                .await
                .len(),
            1
        );
        assert_eq!(
            num_final_splits_given_max_finalize_merge_operations(vec![1; 2], 1)
                .await
                .len(),
            2
        );

        // We check that the youngest splits are merged in priority.
        let final_splits = num_final_splits_given_max_finalize_merge_operations(
            vec![1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11],
            1,
        )
        .await;
        assert_eq!(final_splits.len(), 2);

        let mut split_num_docs: Vec<usize> = final_splits
            .iter()
            .map(|split| split.num_docs)
            .collect::<Vec<_>>();
        split_num_docs.sort();
        assert_eq!(split_num_docs[0], 11);
        assert_eq!(split_num_docs[1], 55);
    }

    #[tokio::test]
    async fn test_simulate_const_write_amplification_merge_policy_with_finalize_max_num_docs() {
        let mut merge_policy = ConstWriteAmplificationMergePolicy::for_test();
        merge_policy.config.max_merge_factor = 10;
        merge_policy.config.merge_factor = 10;
        merge_policy.split_num_docs_target = 10_000_000;
        merge_policy.config.max_finalize_split_num_docs = Some(999_999);
        merge_policy.config.max_finalize_merge_operations = 3;

        let split_num_docs: Vec<usize> = vec![999_999, 1_000_000, 999_999, 999_999];

        let final_splits = crate::merge_policy::tests::aux_test_simulate_merge_planner_num_docs(
            Arc::new(merge_policy),
            &split_num_docs[..],
            &|_splits| {},
        )
        .await
        .unwrap();

        assert_eq!(final_splits.len(), 2);
        let mut split_num_docs: Vec<usize> =
            final_splits.iter().map(|split| split.num_docs).collect();
        split_num_docs.sort();
        assert_eq!(split_num_docs[0], 1_000_000);
        assert_eq!(split_num_docs[1], 999_999 * 3);
    }
}


================================================
FILE: quickwit/quickwit-indexing/src/merge_policy/mod.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

mod const_write_amplification;
mod nop_merge_policy;
mod stable_log_merge_policy;

use std::fmt;
use std::ops::Deref;
use std::sync::Arc;

pub(crate) use const_write_amplification::ConstWriteAmplificationMergePolicy;
use itertools::Itertools;
pub use nop_merge_policy::NopMergePolicy;
use quickwit_config::IndexingSettings;
use quickwit_config::merge_policy_config::MergePolicyConfig;
use quickwit_metastore::{SplitMaturity, SplitMetadata};
use quickwit_proto::types::SplitId;
use serde::Serialize;
pub(crate) use stable_log_merge_policy::StableLogMergePolicy;
use tantivy::TrackedObject;
use tracing::{Span, info_span};

use crate::actors::MergePermit;
use crate::new_split_id;

#[derive(Clone, Debug, PartialEq, Eq, Serialize)]
pub enum MergeOperationType {
    Merge,
    DeleteAndMerge,
}

impl fmt::Display for MergeOperationType {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        write!(f, "{self:?}")
    }
}

pub struct MergeTask {
    pub merge_operation: TrackedObject<MergeOperation>,
    pub(crate) _merge_permit: MergePermit,
}

impl MergeTask {
    #[cfg(any(test, feature = "testsuite"))]
    pub fn from_merge_operation_for_test(merge_operation: MergeOperation) -> MergeTask {
        let inventory = tantivy::Inventory::default();
        let tracked_merge_operation = inventory.track(merge_operation);
        MergeTask {
            merge_operation: tracked_merge_operation,
            _merge_permit: MergePermit::for_test(),
        }
    }
}

impl fmt::Debug for MergeTask {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        self.merge_operation.as_ref().fmt(f)
    }
}

impl Deref for MergeTask {
    type Target = MergeOperation;

    fn deref(&self) -> &Self::Target {
        self.merge_operation.as_ref()
    }
}

#[derive(Clone, Serialize)]
pub struct MergeOperation {
    #[serde(skip_serializing)]
    pub merge_parent_span: Span,
    pub merge_split_id: SplitId,
    pub splits: Vec<SplitMetadata>,
    pub operation_type: MergeOperationType,
}

impl MergeOperation {
    pub fn new_merge_operation(splits: Vec<SplitMetadata>) -> Self {
        let merge_split_id = new_split_id();
        let split_ids = splits.iter().map(|split| split.split_id()).collect_vec();
        let merge_parent_span = info_span!("merge", merge_split_id=%merge_split_id, split_ids=?split_ids, typ=%MergeOperationType::Merge);
        Self {
            merge_parent_span,
            merge_split_id,
            splits,
            operation_type: MergeOperationType::Merge,
        }
    }

    pub fn total_num_bytes(&self) -> u64 {
        self.splits
            .iter()
            .map(|split: &SplitMetadata| split.footer_offsets.end)
            .sum()
    }

    pub fn new_delete_and_merge_operation(split: SplitMetadata) -> Self {
        let merge_split_id = new_split_id();
        let merge_parent_span = info_span!("delete", merge_split_id=%merge_split_id, split_ids=?split.split_id(), typ=%MergeOperationType::DeleteAndMerge);
        Self {
            merge_parent_span,
            merge_split_id,
            splits: vec![split],
            operation_type: MergeOperationType::DeleteAndMerge,
        }
    }

    pub fn splits_as_slice(&self) -> &[SplitMetadata] {
        self.splits.as_slice()
    }
}

impl fmt::Debug for MergeOperation {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        write!(
            f,
            "Merge(operation_type={}, merged_split_id={},splits=[",
            self.operation_type, self.merge_split_id
        )?;
        for split in &self.splits {
            write!(f, "{},", split.split_id())?;
        }
        write!(f, "])")?;
        Ok(())
    }
}

/// A merge policy wraps the logic that decides what should be merged.
/// The SplitMetadata must be extracted from the splits `Vec`.
///
/// It is called by the merge planner whenever a new split is added.
pub trait MergePolicy: Send + Sync + fmt::Debug {
    /// Returns the list of merge operations that should be performed.
    fn operations(&self, splits: &mut Vec<SplitMetadata>) -> Vec<MergeOperation>;

    /// After the last indexing pipeline has been shutdown, quickwit
    /// finishes the ongoing merge operations, and eventually needs to shut it down.
    ///
    /// This method makes it possible to offer a last list of merge operations before
    /// really shutting down the merge policy.
    ///
    /// This is especially useful for users relying on a one-index-per-day scheme.
    fn finalize_operations(&self, _splits: &mut Vec<SplitMetadata>) -> Vec<MergeOperation> {
        Vec::new()
    }

    /// Returns split maturity.
    /// A split is either:
    /// - `Mature` if it does not undergo new merge operations.
    /// - or `Immature` with a `maturation_period` after which it becomes mature.
    fn split_maturity(&self, split_num_docs: usize, split_num_merge_ops: usize) -> SplitMaturity;

    /// Checks a bunch of properties specific to the given merge policy.
    /// This method is used in proptesting.
    ///
    /// - `merge_op` is a merge operation emitted by this merge policy.
    /// - `remaining_splits` is the list of remaining splits.
    #[cfg(test)]
    fn check_is_valid(&self, _merge_op: &MergeOperation, _remaining_splits: &[SplitMetadata]) {}
}

pub fn merge_policy_from_settings(settings: &IndexingSettings) -> Arc<dyn MergePolicy> {
    match settings.merge_policy.clone() {
        MergePolicyConfig::Nop => Arc::new(NopMergePolicy),
        MergePolicyConfig::ConstWriteAmplification(config) => {
            let merge_policy =
                ConstWriteAmplificationMergePolicy::new(config, settings.split_num_docs_target);
            Arc::new(merge_policy)
        }
        MergePolicyConfig::StableLog(config) => {
            let merge_policy = StableLogMergePolicy::new(config, settings.split_num_docs_target);
            Arc::new(merge_policy)
        }
    }
}

pub fn default_merge_policy() -> Arc<dyn MergePolicy> {
    let indexing_settings = IndexingSettings::default();
    merge_policy_from_settings(&indexing_settings)
}

pub fn nop_merge_policy() -> Arc<dyn MergePolicy> {
    Arc::new(NopMergePolicy)
}

struct SplitShortDebug<'a>(&'a SplitMetadata);

impl fmt::Debug for SplitShortDebug<'_> {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        f.debug_struct("Split")
            .field("split_id", &self.0.split_id())
            .field("num_docs", &self.0.num_docs)
            .finish()
    }
}

fn splits_short_debug(splits: &[SplitMetadata]) -> Vec<SplitShortDebug<'_>> {
    splits.iter().map(SplitShortDebug).collect()
}

#[cfg(test)]
pub mod tests {

    use std::collections::hash_map::DefaultHasher;
    use std::collections::{BTreeSet, HashMap};
    use std::hash::Hasher;
    use std::ops::RangeInclusive;

    use proptest::prelude::*;
    use quickwit_actors::Universe;
    use quickwit_proto::indexing::{IndexingPipelineId, MergePipelineId};
    use quickwit_proto::types::{IndexUid, NodeId, PipelineUid};
    use rand::seq::SliceRandom;
    use time::OffsetDateTime;

    use super::*;
    use crate::actors::{
        MergePlanner, MergeSchedulerService, MergeSplitDownloader, RunFinalizeMergePolicyAndQuit,
        merge_split_attrs,
    };
    use crate::models::{NewSplits, create_split_metadata};

    fn pow_of_10(n: usize) -> usize {
        10usize.pow(n as u32)
    }

    prop_compose! {
        fn num_docs_around_power_of_ten()(
            pow_ten in 1usize..5usize,
            diff in -2isize..2isize
        ) -> usize {
            (pow_of_10(pow_ten) as isize + diff).max(1isize) as usize
        }
    }

    fn num_docs_strategy() -> impl Strategy<Value = usize> {
        prop_oneof![1usize..10_000_000usize, num_docs_around_power_of_ten()]
    }

    prop_compose! {
      fn split_strategy()
        (num_merge_ops in 0usize..5usize, start_timestamp in 1_664_000_000i64..1_665_000_000i64, average_time_delta in 100i64..120i64, delta_creation_date in 0u64..100_000u64, num_docs in num_docs_strategy()) -> SplitMetadata {
        let split_id = crate::new_split_id();
        let end_timestamp = start_timestamp + average_time_delta * pow_of_10(num_merge_ops) as i64;
        let create_timestamp: i64 = (end_timestamp as u64 + delta_creation_date) as i64;
        SplitMetadata {
            split_id,
            time_range: Some(start_timestamp..=end_timestamp),
            num_docs,
            create_timestamp,
            num_merge_ops,
            .. Default::default()
        }
      }
    }

    pub(crate) fn create_splits(
        merge_policy: &dyn MergePolicy,
        num_docs_vec: Vec<usize>,
    ) -> Vec<SplitMetadata> {
        let num_docs_with_timestamp = num_docs_vec
            .into_iter()
            // we give the same timestamp to all of them and rely on stable sort to keep the split
            // order.
            .map(|num_docs| (num_docs, (1630563067..=1630564067)))
            .collect();
        create_splits_with_timestamps(merge_policy, num_docs_with_timestamp)
    }

    fn create_splits_with_timestamps(
        merge_policy: &dyn MergePolicy,
        num_docs_vec: Vec<(usize, RangeInclusive<i64>)>,
    ) -> Vec<SplitMetadata> {
        num_docs_vec
            .into_iter()
            .enumerate()
            .map(|(split_ord, (num_docs, time_range))| {
                let create_timestamp = OffsetDateTime::now_utc().unix_timestamp();
                let time_to_maturity = merge_policy.split_maturity(num_docs, 0);
                SplitMetadata {
                    split_id: format!("split_{split_ord:02}"),
                    num_docs,
                    time_range: Some(time_range),
                    create_timestamp,
                    maturity: time_to_maturity,
                    ..Default::default()
                }
            })
            .collect()
    }

    // Creates a checksum for a given merge operation.
    // This does not take in account the merge split id,
    // and is split order independent.
    fn compute_checksum_op(op: &MergeOperation) -> u64 {
        let mut checksum = 0u64;
        for split in op.splits_as_slice() {
            let mut hasher = DefaultHasher::default();
            hasher.write(split.split_id.as_bytes());
            checksum ^= hasher.finish();
        }
        checksum
    }

    // Creates a checksum for a set of operations.
    // This checksum does not depend on the order of the merrge operations,
    // nor the merge split ids.
    fn compute_checksum_ops(ops: &[MergeOperation]) -> u64 {
        let mut checksum = 0u64;
        for op in ops {
            let op_checksum = compute_checksum_op(op);
            let mut hasher = DefaultHasher::default();
            hasher.write_u64(op_checksum);
            checksum ^= hasher.finish();
        }
        checksum
    }

    fn compare_merge_operations(left_ops: &[MergeOperation], right_ops: &[MergeOperation]) -> bool {
        compute_checksum_ops(left_ops) == compute_checksum_ops(right_ops)
    }

    pub(crate) fn proptest_merge_policy(merge_policy: &dyn MergePolicy) {
        proptest!(|(mut splits in prop::collection::vec(split_strategy(), 0..100))| {
            let mut cloned_splits = splits.clone();
            cloned_splits.shuffle(&mut rand::rng());

            let original_num_splits = splits.len();

            let mut operations: Vec<MergeOperation> = merge_policy.operations(&mut splits);
            let operations_after_shuffle = merge_policy.operations(&mut cloned_splits);
            assert!(compare_merge_operations(&operations[..],
                &operations_after_shuffle[..]),
                "Merge policy result should be independent from the original order.");

            let num_splits_in_merge: usize = operations.iter().map(|op| op.splits_as_slice().len()).sum();

            assert_eq!(
                num_splits_in_merge + splits.len(), original_num_splits,
                "Splits should not be lost."
            );

            // This property is not uninteresting but is currently not observed
            // in the stable log merge policy.
            // assert!(
            //     merge_policy.operations(&mut splits).is_empty(),
            //     "Merge policy are expected to return all available merge operations."
            // );
            let now_utc = OffsetDateTime::now_utc();
            for merge_op in &mut operations {
                assert_eq!(merge_op.operation_type, MergeOperationType::Merge,
                    "A merge policy should only emit Merge operations."
                );
                assert!(merge_op.splits_as_slice().len() >= 2,
            "Merge policies should not suggest merging a single split.");
                for split in merge_op.splits_as_slice() {
                    assert!(!split.is_mature(now_utc), "Merges should not contain mature splits.");
                }
                merge_policy.check_is_valid(merge_op, &splits[..]);
            }
        });
    }

    fn merge_tags(splits: &[SplitMetadata]) -> BTreeSet<String> {
        splits
            .iter()
            .flat_map(|split| split.tags.iter().cloned())
            .collect()
    }

    fn fake_merge(merge_policy: &Arc<dyn MergePolicy>, splits: &[SplitMetadata]) -> SplitMetadata {
        assert!(!splits.is_empty(), "Split list should not be empty.");
        let merged_split_id = new_split_id();
        let tags = merge_tags(splits);
        let pipeline_id = MergePipelineId {
            node_id: NodeId::from("test_node"),
            index_uid: IndexUid::new_with_random_ulid("test_index"),
            source_id: "test_source".to_string(),
        };
        let split_attrs = merge_split_attrs(pipeline_id, merged_split_id, splits).unwrap();
        create_split_metadata(merge_policy, None, &split_attrs, tags, 0..0)
    }

    fn apply_merge(
        merge_policy: &Arc<dyn MergePolicy>,
        split_index: &mut HashMap<String, SplitMetadata>,
        merge_op: &MergeOperation,
    ) -> SplitMetadata {
        for split in merge_op.splits_as_slice() {
            assert!(split_index.remove(split.split_id()).is_some());
        }
        let merged_split = fake_merge(merge_policy, merge_op.splits_as_slice());
        split_index.insert(merged_split.split_id().to_string(), merged_split.clone());
        merged_split
    }

    async fn aux_test_simulate_merge_planner(
        merge_policy: Arc<dyn MergePolicy>,
        incoming_splits: Vec<SplitMetadata>,
        check_final_configuration: &dyn Fn(&[SplitMetadata]),
    ) -> anyhow::Result<Vec<SplitMetadata>> {
        let universe = Universe::new();
        let (merge_task_mailbox, merge_task_inbox) =
            universe.create_test_mailbox::<MergeSplitDownloader>();
        let pipeline_id = IndexingPipelineId {
            index_uid: IndexUid::new_with_random_ulid("test-index"),
            source_id: "test-source".to_string(),
            node_id: NodeId::from("test-node"),
            pipeline_uid: PipelineUid::default(),
        };
        let merge_planner = MergePlanner::new(
            &pipeline_id.merge_pipeline_id(),
            Vec::new(),
            merge_policy.clone(),
            merge_task_mailbox,
            universe.get_or_spawn_one::<MergeSchedulerService>(),
        );
        let mut split_index: HashMap<String, SplitMetadata> = HashMap::default();
        let (merge_planner_mailbox, merge_planner_handler) =
            universe.spawn_builder().spawn(merge_planner);

        for split in incoming_splits {
            split_index.insert(split.split_id().to_string(), split.clone());
            merge_planner_mailbox
                .send_message(NewSplits {
                    new_splits: vec![split],
                })
                .await?;
            loop {
                let obs = merge_planner_handler.process_pending_and_observe().await;
                assert_eq!(obs.obs_type, quickwit_actors::ObservationType::Alive);
                let merge_tasks = merge_task_inbox.drain_for_test_typed::<MergeTask>();
                if merge_tasks.is_empty() {
                    break;
                }
                let new_splits: Vec<SplitMetadata> = merge_tasks
                    .into_iter()
                    .map(|merge_op| apply_merge(&merge_policy, &mut split_index, &merge_op))
                    .collect();
                merge_planner_mailbox
                    .send_message(NewSplits { new_splits })
                    .await?;
            }
            let split_metadatas: Vec<SplitMetadata> = split_index.values().cloned().collect();
            check_final_configuration(&split_metadatas);
        }

        merge_planner_mailbox
            .send_message(RunFinalizeMergePolicyAndQuit)
            .await
            .unwrap();

        let obs = merge_planner_handler.process_pending_and_observe().await;
        assert_eq!(obs.obs_type, quickwit_actors::ObservationType::PostMortem);

        let merge_tasks = merge_task_inbox.drain_for_test_typed::<MergeTask>();
        for merge_task in merge_tasks {
            apply_merge(&merge_policy, &mut split_index, &merge_task);
        }

        let split_metadatas: Vec<SplitMetadata> = split_index.values().cloned().collect();

        universe.assert_quit().await;
        Ok(split_metadatas)
    }

    /// Mock split meta helper.
    fn mock_split_meta_from_num_docs(
        time_range: RangeInclusive<i64>,
        num_docs: u64,
        maturity: SplitMaturity,
    ) -> SplitMetadata {
        SplitMetadata {
            split_id: crate::new_split_id(),
            partition_id: 3u64,
            num_docs: num_docs as usize,
            uncompressed_docs_size_in_bytes: 256u64 * num_docs,
            time_range: Some(time_range),
            create_timestamp: OffsetDateTime::now_utc().unix_timestamp(),
            maturity,
            tags: BTreeSet::from_iter(vec!["tenant_id:1".to_string(), "tenant_id:2".to_string()]),
            footer_offsets: 0..100,
            index_uid: IndexUid::new_with_random_ulid("test-index"),
            source_id: "test-source".to_string(),
            node_id: "test-node".to_string(),
            ..Default::default()
        }
    }

    pub async fn aux_test_simulate_merge_planner_num_docs(
        merge_policy: Arc<dyn MergePolicy>,
        batch_num_docs: &[usize],
        check_final_configuration: &dyn Fn(&[SplitMetadata]),
    ) -> anyhow::Result<Vec<SplitMetadata>> {
        let split_metadatas: Vec<SplitMetadata> = batch_num_docs
            .iter()
            .cloned()
            .enumerate()
            .map(|(split_ord, num_docs)| {
                let time_first = split_ord as i64 * 1_000;
                let time_last = time_first + 999;
                let time_range = time_first..=time_last;
                let time_to_maturity = merge_policy.split_maturity(num_docs, 0);
                mock_split_meta_from_num_docs(time_range, num_docs as u64, time_to_maturity)
            })
            .collect();
        aux_test_simulate_merge_planner(merge_policy, split_metadatas, check_final_configuration)
            .await
    }
}


================================================
FILE: quickwit/quickwit-indexing/src/merge_policy/nop_merge_policy.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::fmt;

use quickwit_metastore::SplitMaturity;

use crate::merge_policy::MergePolicy;

/// The NopMergePolicy, as the name suggests, is no-op and does not perform any merges.
/// <https://en.wikipedia.org/wiki/NOP_(code)>
#[derive(Debug)]
pub struct NopMergePolicy;

impl fmt::Display for NopMergePolicy {
    fn fmt(&self, f: &mut std::fmt::Formatter) -> std::fmt::Result {
        write!(f, "{self:?}")
    }
}

impl MergePolicy for NopMergePolicy {
    fn operations(
        &self,
        _splits: &mut Vec<quickwit_metastore::SplitMetadata>,
    ) -> Vec<super::MergeOperation> {
        Vec::new()
    }

    fn split_maturity(&self, _split_num_docs: usize, _split_num_merge_ops: usize) -> SplitMaturity {
        // With the no merge policy, all splits are mature immediately as they will never undergo
        // any merge.
        SplitMaturity::Mature
    }
}

#[cfg(test)]
mod tests {

    use quickwit_metastore::SplitMaturity;

    use crate::merge_policy::{MergePolicy, NopMergePolicy};

    #[test]
    pub fn test_no_merge_policy_maturity_timestamp() {
        // All splits are always mature for `NopMergePolicy`.
        assert_eq!(NopMergePolicy.split_maturity(10, 0), SplitMaturity::Mature);
    }

    #[test]
    pub fn test_no_merge_policy_operations() {
        let mut splits = super::super::tests::create_splits(&NopMergePolicy, vec![1; 100]);
        assert!(NopMergePolicy.operations(&mut splits).is_empty());
        assert_eq!(splits.len(), 100);
    }
}


================================================
FILE: quickwit/quickwit-indexing/src/merge_policy/stable_log_merge_policy.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::cmp::Ordering;
use std::ops::Range;

use quickwit_config::IndexingSettings;
use quickwit_config::merge_policy_config::StableLogMergePolicyConfig;
use quickwit_metastore::{SplitMaturity, SplitMetadata};
use time::OffsetDateTime;
use tracing::debug;

use crate::merge_policy::{MergeOperation, MergePolicy, splits_short_debug};

/// `StableLogMergePolicy` is a rather naive implementation optimized
/// for splits produced by a rather stable stream of splits,
/// with incoming documents ordered more or less as expected time, so that splits are
/// time pruning is efficient out of the box.
///
/// The logic goes as follows.
/// Each splits has
/// - a number of documents
/// - an end time
///
/// The policy first builds the merge operations
///
/// ### Build merge operations
/// We start by sorting the splits by reverse date so that the most recent splits are
/// coming first.
/// We iterate through the splits and assign them to increasing levels.
/// Level 0 will receive `{split_i}` for i within `[0..l_0)`
/// ...
/// Level k will receive `{split_i}` for i within `[l_{k-1}..l_k)`
///
/// The limit at which we change level is simply defined as
/// `l_0 = 3 x self.min_level_num_docs`.
///
/// Assuming level N-1 has been built, level N is given by
/// `l_N = min(num_docs(split_l_{N_1})` * 3, self.split_num_docs_target)`.
/// We stop once l_N = self.split_num_docs_target is reached.
///
/// As a result, each level interval is at least 3 times larger than the previous one,
/// forming a logscale over the number of documents.
///
/// Because we stop merging splits reaching a size larger than if it would result in a size larger
/// than `target_num_docs`.
#[derive(Debug, Clone)]
pub struct StableLogMergePolicy {
    config: StableLogMergePolicyConfig,
    split_num_docs_target: usize,
}

impl Default for StableLogMergePolicy {
    fn default() -> Self {
        StableLogMergePolicy {
            config: Default::default(),
            split_num_docs_target: IndexingSettings::default_split_num_docs_target(),
        }
    }
}

fn remove_matching_items<T, Pred: Fn(&T) -> bool>(items: &mut Vec<T>, predicate: Pred) -> Vec<T> {
    let mut matching_items = Vec::new();
    let mut i = 0;
    while i < items.len() {
        if predicate(&items[i]) {
            let matching_item = items.remove(i);
            matching_items.push(matching_item);
        } else {
            i += 1;
        }
    }
    matching_items
}

impl StableLogMergePolicy {
    pub fn new(
        config: StableLogMergePolicyConfig,
        split_num_docs_target: usize,
    ) -> StableLogMergePolicy {
        StableLogMergePolicy {
            config,
            split_num_docs_target,
        }
    }
}

impl MergePolicy for StableLogMergePolicy {
    fn operations(&self, splits: &mut Vec<SplitMetadata>) -> Vec<MergeOperation> {
        let original_num_splits = splits.len();
        let operations = self.merge_operations(splits);
        debug_assert_eq!(
            original_num_splits,
            operations
                .iter()
                .map(|op| op.splits_as_slice().len())
                .sum::<usize>()
                + splits.len(),
            "The merge policy is supposed to keep the number of splits."
        );
        operations
    }

    /// A mature split for merge is a split that won't undergo any merge operation in the future.
    fn split_maturity(&self, split_num_docs: usize, _split_num_merge_ops: usize) -> SplitMaturity {
        if split_num_docs >= self.split_num_docs_target {
            return SplitMaturity::Mature;
        }
        SplitMaturity::Immature {
            maturation_period: self.config.maturation_period,
        }
    }

    #[cfg(test)]
    fn check_is_valid(&self, merge_op: &MergeOperation, _remaining_splits: &[SplitMetadata]) {
        assert!(merge_op.splits_as_slice().len() <= self.config.max_merge_factor);
        if merge_op.splits_as_slice().len() < self.config.merge_factor {
            let num_docs: usize = merge_op
                .splits_as_slice()
                .iter()
                .map(|split| split.num_docs)
                .sum();
            let last_split_num_docs = merge_op
                .splits_as_slice()
                .iter()
                .min_by(|&left, &right| cmp_splits_by_reverse_time_end(left, right))
                .unwrap()
                .num_docs;
            assert!(num_docs >= self.split_num_docs_target);
            assert!(num_docs - last_split_num_docs < self.split_num_docs_target);
        }
    }
}

#[derive(Clone, Copy, Eq, PartialEq)]
enum MergeCandidateSize {
    /// The split candidate is too small to be considered for execution.
    TooSmall,
    /// The split candidate is good to go.
    ValidSplit,
    /// We should not add an extra split in this candidate.
    /// This can happen for any of the two following reasons:
    /// - the number of splits involved already reached `merge_factor_max`.
    /// - the overall number of docs that will end up in the merged segment already exceeds
    ///   `split_num_docs_target`.
    OneMoreSplitWouldBeTooBig,
}

fn extract_time_end(split: &SplitMetadata) -> Option<i64> {
    let end_timestamp = split.time_range.as_ref()?.end();
    Some(*end_timestamp)
}

// Total ordering by
// - reverse time end.
// - number of docs
// - split ids <- this one is just to make the result of the policy  invariant when shuffling the
//   input splits.
fn cmp_splits_by_reverse_time_end(left: &SplitMetadata, right: &SplitMetadata) -> Ordering {
    extract_time_end(left)
        .cmp(&extract_time_end(right))
        .reverse()
        .then_with(|| left.num_docs.cmp(&right.num_docs))
        .then_with(|| {
            left.split_id().cmp(right.split_id()) //< for determinism.
        })
}

impl StableLogMergePolicy {
    fn merge_operations(&self, splits: &mut Vec<SplitMetadata>) -> Vec<MergeOperation> {
        if splits.len() < 2 {
            return Vec::new();
        }
        // First we isolate splits that are mature.
        let splits_not_for_merge =
            remove_matching_items(splits, |split| split.is_mature(OffsetDateTime::now_utc()));

        let mut merge_operations: Vec<MergeOperation> = Vec::new();
        splits.sort_unstable_by(cmp_splits_by_reverse_time_end);
        debug!(splits=?splits_short_debug(&splits[..]), "merge-policy-run");

        // Splits should naturally have an increasing num_merge
        let split_levels = self.build_split_levels(splits);
        for split_range in split_levels.into_iter().rev() {
            debug!(splits=?splits_short_debug(&splits[split_range.clone()]));
            if let Some(merge_range) = self.merge_candidate_from_level(splits, split_range) {
                debug!(merge_range=?merge_range, "merge-candidate");
                let splits_in_merge: Vec<SplitMetadata> = splits.drain(merge_range).collect();
                let merge_operation = MergeOperation::new_merge_operation(splits_in_merge);
                merge_operations.push(merge_operation);
            } else {
                debug!("no-merge");
            }
        }
        splits.extend(splits_not_for_merge);
        merge_operations
    }

    /// This function groups splits in levels.
    ///
    /// It assumes that splits are almost sorted by their increasing size,
    /// but should behave decently (not create too many levels) if they are not.
    ///
    /// All splits are required to have a number of documents lower than
    /// `self.split_num_docs_target`
    pub(crate) fn build_split_levels(&self, splits: &[SplitMetadata]) -> Vec<Range<usize>> {
        assert!(
            splits
                .iter()
                .all(|split| split.num_docs < self.split_num_docs_target),
            "All splits are expected to be smaller than `split_num_docs_target`."
        );
        if splits.is_empty() {
            return Vec::new();
        }

        let mut split_levels: Vec<Range<usize>> = Vec::new();
        let mut current_level_start_ord = 0;
        let mut current_level_max_docs =
            (splits[0].num_docs * 3).max(self.config.min_level_num_docs);

        #[allow(clippy::single_range_in_vec_init)]
        let mut levels = vec![(0..current_level_max_docs)]; // for logging only
        for (split_ord, split) in splits.iter().enumerate() {
            if split.num_docs >= current_level_max_docs {
                split_levels.push(current_level_start_ord..split_ord);
                current_level_start_ord = split_ord;
                current_level_max_docs = 3 * split.num_docs;
                levels.push(split.num_docs..current_level_max_docs)
            }
        }
        debug!(levels=?levels);
        split_levels.push(current_level_start_ord..splits.len());
        split_levels
    }

    /// Given splits tries to select a subrange of level_range that would be a good merge candidate.
    fn merge_candidate_from_level(
        &self,
        splits: &[SplitMetadata],
        level_range: Range<usize>,
    ) -> Option<Range<usize>> {
        let merge_candidate_end = level_range.end;
        let mut merge_candidate_start = merge_candidate_end;
        for split_ord in level_range.rev() {
            if self.merge_candidate_size(&splits[merge_candidate_start..merge_candidate_end])
                == MergeCandidateSize::OneMoreSplitWouldBeTooBig
            {
                break;
            }
            merge_candidate_start = split_ord;
        }
        if self.merge_candidate_size(&splits[merge_candidate_start..merge_candidate_end])
            == MergeCandidateSize::TooSmall
        {
            return None;
        }
        Some(merge_candidate_start..merge_candidate_end)
    }

    /// Returns `MergeCandidateSize` iff we should stop adding extra split into this
    /// merge candidate.
    fn merge_candidate_size(&self, splits: &[SplitMetadata]) -> MergeCandidateSize {
        // We don't perform merge with a single segment. We
        // may relax this in the future in order to compact deletes.
        if splits.len() <= 1 {
            return MergeCandidateSize::TooSmall;
        }

        // There are already enough splits in this merge.
        if splits.len() >= self.config.max_merge_factor {
            return MergeCandidateSize::OneMoreSplitWouldBeTooBig;
        }
        let num_docs_in_merge: usize = splits.iter().map(|split| split.num_docs).sum();

        // The resulting split will exceed `split_num_docs_target`.
        if num_docs_in_merge >= self.split_num_docs_target {
            return MergeCandidateSize::OneMoreSplitWouldBeTooBig;
        }

        if splits.len() < self.config.merge_factor {
            return MergeCandidateSize::TooSmall;
        }

        MergeCandidateSize::ValidSplit
    }
}

// Helpers which expose some internal properties of
// the stable log merge policy to be tested in unit tests.
#[cfg(test)]
impl StableLogMergePolicy {
    fn case_levels_given_growth_factor(&self, growth_factor: usize) -> Vec<usize> {
        assert!(self.config.min_level_num_docs > 0);
        assert!(self.config.merge_factor > 1);
        assert!(self.config.max_merge_factor >= self.config.merge_factor);
        assert!(self.split_num_docs_target > self.config.min_level_num_docs);
        let mut levels_start_num_docs = vec![1];
        let mut level_end_doc = self.config.min_level_num_docs;
        while level_end_doc < self.split_num_docs_target {
            levels_start_num_docs.push(level_end_doc);
            level_end_doc *= growth_factor;
        }
        levels_start_num_docs.push(self.split_num_docs_target);
        levels_start_num_docs
    }

    pub fn max_num_splits_ideal_case(&self, num_docs: u64) -> usize {
        let levels = self.case_levels_given_growth_factor(self.config.merge_factor);
        self.max_num_splits_knowning_levels(num_docs, &levels, true)
    }

    pub fn max_num_splits_worst_case(&self, num_docs: u64) -> usize {
        let levels = self.case_levels_given_growth_factor(3);
        self.max_num_splits_knowning_levels(num_docs, &levels, false)
    }

    fn max_num_splits_knowning_levels(
        &self,
        mut num_docs: u64,
        levels: &[usize],
        sorted: bool,
    ) -> usize {
        assert!(levels.is_sorted());

        if num_docs == 0 {
            return 0;
        }
        let (&head, tail) = levels.split_first().unwrap();
        if num_docs < head as u64 {
            return 0;
        }
        let first_level_min_saturation_docs = if sorted {
            head * (self.config.merge_factor - 1)
        } else {
            head + (self.config.merge_factor - 2)
        };
        if tail.is_empty() || num_docs <= first_level_min_saturation_docs as u64 {
            return (num_docs as usize).div_ceil(head);
        }
        num_docs -= first_level_min_saturation_docs as u64;
        self.config.merge_factor - 1 + self.max_num_splits_knowning_levels(num_docs, tail, sorted)
    }
}

#[cfg(test)]
mod tests {

    use std::sync::Arc;
    use std::time::Duration;

    use super::*;
    use crate::merge_policy::tests::{aux_test_simulate_merge_planner_num_docs, create_splits};

    #[test]
    fn test_split_is_mature() {
        let merge_policy = StableLogMergePolicy::default();
        // Split under split_num_docs_target and created before now() - maturation_period is not
        // mature.
        assert_eq!(
            merge_policy.split_maturity(9_000_000, 0),
            SplitMaturity::Immature {
                maturation_period: Duration::from_secs(3600 * 48)
            }
        );
        assert_eq!(
            merge_policy.split_maturity(&merge_policy.split_num_docs_target + 1, 0),
            SplitMaturity::Mature
        );
        // Split under split_num_docs_target but with create_timestamp >= now + maturity duration is
        // mature.
        assert_eq!(
            merge_policy.split_maturity(9_000_000, 0),
            SplitMaturity::Immature {
                maturation_period: merge_policy.config.maturation_period
            }
        );
    }

    #[test]
    fn test_build_split_levels() {
        let merge_policy = StableLogMergePolicy::default();
        let splits = Vec::new();
        let split_groups = merge_policy.build_split_levels(&splits);
        assert!(split_groups.is_empty());
    }

    #[test]
    fn test_stable_log_merge_policy_build_split_simple() {
        let merge_policy: StableLogMergePolicy = StableLogMergePolicy::default();
        let splits = create_splits(
            &merge_policy,
            vec![100_000, 100_000, 100_000, 800_000, 900_000],
        );
        let split_groups = merge_policy.build_split_levels(&splits);
        assert_eq!(&split_groups, &[0..3, 3..5]);
    }

    #[test]
    fn test_stable_log_merge_policy_build_split_perfect_world() {
        let merge_policy = StableLogMergePolicy::default();
        let splits = create_splits(
            &merge_policy,
            vec![
                100_000, 100_000, 100_000, 100_000, 100_000, 100_000, 100_000, 100_000, 800_000,
                1_600_000,
            ],
        );
        let split_groups = merge_policy.build_split_levels(&splits);
        assert_eq!(&split_groups, &[0..8, 8..10]);
    }

    #[test]
    fn test_stable_log_merge_policy_build_split_decreasing() {
        let merge_policy = StableLogMergePolicy::default();
        let splits = create_splits(
            &merge_policy,
            vec![
                100_000, 100_000, 100_000, 100_000, 100_000, 100_000, 100_000, 100_000, 800_000,
                100_000, 1_600_000,
            ],
        );
        let split_groups = merge_policy.build_split_levels(&splits);
        assert_eq!(&split_groups, &[0..8, 8..11]);
    }

    #[test]
    #[should_panic(expected = "All splits are expected to be smaller than `split_num_docs_target`.")]
    fn test_stable_log_merge_policy_build_split_panics_if_exceeding_split_num_docs_target() {
        let merge_policy = StableLogMergePolicy::default();
        let splits = create_splits(&merge_policy, vec![11_000_000]);
        merge_policy.build_split_levels(&splits);
    }

    #[test]
    fn test_stable_log_merge_policy_not_enough_splits() {
        let merge_policy = StableLogMergePolicy::default();
        let mut splits = create_splits(&merge_policy, vec![100; 7]);
        assert_eq!(splits.len(), 7);
        assert!(merge_policy.operations(&mut splits).is_empty());
    }

    #[test]
    fn test_stable_log_merge_policy_just_enough_splits_for_a_merge() {
        let merge_policy = StableLogMergePolicy::default();
        let mut splits = create_splits(&merge_policy, vec![100; 10]);
        let mut merge_ops = merge_policy.operations(&mut splits);
        assert!(splits.is_empty());
        assert_eq!(merge_ops.len(), 1);
        let merge_op = merge_ops.pop().unwrap();
        let mut merge_segment_ids: Vec<String> = merge_op
            .splits_as_slice()
            .iter()
            .map(|split| split.split_id().to_string())
            .collect();
        merge_segment_ids.sort();
        assert_eq!(
            merge_segment_ids,
            &[
                "split_00", "split_01", "split_02", "split_03", "split_04", "split_05", "split_06",
                "split_07", "split_08", "split_09"
            ]
        );
    }

    #[test]
    fn test_stable_log_merge_policy_many_splits_on_same_level() {
        let merge_policy = StableLogMergePolicy::default();
        let mut splits = create_splits(&merge_policy, vec![100; 13]);
        let mut merge_ops = merge_policy.operations(&mut splits);
        assert_eq!(splits.len(), 1);
        assert_eq!(splits[0].split_id(), "split_00");
        assert_eq!(merge_ops.len(), 1);
        let merge_op = merge_ops.pop().unwrap();
        let mut merge_split_ids: Vec<String> = merge_op
            .splits_as_slice()
            .iter()
            .map(|split| split.split_id().to_string())
            .collect();
        merge_split_ids.sort();
        assert_eq!(
            merge_split_ids,
            &[
                "split_01", "split_02", "split_03", "split_04", "split_05", "split_06", "split_07",
                "split_08", "split_09", "split_10", "split_11", "split_12"
            ]
        );
    }

    #[test]
    fn test_stable_log_merge_policy_splits_below_min_level() {
        let merge_policy = StableLogMergePolicy::default();
        let mut splits = create_splits(
            &merge_policy,
            vec![
                100, 1000, 10_000, 10_000, 10_000, 10_000, 10_000, 40_000, 40_000, 40_000,
            ],
        );
        let mut merge_ops = merge_policy.operations(&mut splits);
        assert_eq!(splits.len(), 0);
        assert_eq!(merge_ops.len(), 1);
        let merge_op = merge_ops.pop().unwrap();
        let mut merge_split_ids: Vec<String> = merge_op
            .splits_as_slice()
            .iter()
            .map(|split| split.split_id().to_string())
            .collect();
        merge_split_ids.sort();
        assert_eq!(
            merge_split_ids,
            &[
                "split_00", "split_01", "split_02", "split_03", "split_04", "split_05", "split_06",
                "split_07", "split_08", "split_09"
            ]
        );
    }

    #[test]
    fn test_stable_log_merge_policy_splits_above_min_level() {
        let merge_policy = StableLogMergePolicy::default();
        let mut splits = create_splits(
            &merge_policy,
            vec![
                100_000, 1_000_000, 1_000_000, 1_000_000, 1_000_000, 1_000_000, 1_000_000,
                1_000_000,
            ],
        );
        let merge_ops = merge_policy.operations(&mut splits);
        assert_eq!(splits.len(), 8);
        assert_eq!(merge_ops.len(), 0);
    }

    #[test]
    fn test_stable_log_merge_policy_above_split_num_docs_target_is_ignored() {
        let merge_policy = StableLogMergePolicy::default();
        let mut splits = create_splits(
            &merge_policy,
            vec![
                100_000, 100_000, 100_000, 100_000, 100_000,
                10_000_000, // this split should not interfere with the merging of other splits
                100_000, 100_000, 100_000, 100_000, 100_000,
            ],
        );
        let merge_ops = merge_policy.operations(&mut splits);
        assert_eq!(splits.len(), 1);
        assert_eq!(splits[0].num_docs, 10_000_000);
        assert_eq!(merge_ops.len(), 1);
    }

    #[test]
    fn test_merge_policy_splits_too_large_are_ignored() {
        let merge_policy = StableLogMergePolicy::default();
        let mut splits = create_splits(&merge_policy, vec![9_999_999, 10_000_000]);
        for split in splits.iter_mut() {
            let time_to_maturity = merge_policy.split_maturity(split.num_docs, split.num_merge_ops);
            split.maturity = time_to_maturity;
        }
        let merge_ops = merge_policy.operations(&mut splits);
        assert_eq!(splits.len(), 2);
        assert_eq!(splits[0].num_docs, 9_999_999);
        assert_eq!(splits[1].num_docs, 10_000_000);
        assert!(merge_ops.is_empty());
    }

    #[test]
    fn test_merge_policy_splits_entire_level_reach_merge_max_doc() {
        let merge_policy = StableLogMergePolicy::default();
        let mut splits = create_splits(&merge_policy, vec![5_000_000, 5_000_000]);
        let merge_ops = merge_policy.operations(&mut splits);
        assert!(splits.is_empty());
        assert_eq!(merge_ops.len(), 1);
        assert_eq!(merge_ops[0].splits_as_slice().len(), 2);
    }

    #[test]
    fn test_merge_policy_last_merge_can_have_a_lower_merge_factor() {
        let merge_policy = StableLogMergePolicy::default();
        let mut splits = create_splits(&merge_policy, vec![9_999_997, 9_999_998, 9_999_999]);
        let merge_ops = merge_policy.operations(&mut splits);
        assert_eq!(splits.len(), 1);
        assert_eq!(splits[0].num_docs, 9_999_997);
        assert_eq!(merge_ops.len(), 1);
        assert_eq!(merge_ops[0].splits_as_slice().len(), 2);
    }

    #[test]
    fn test_merge_policy_no_merge_with_only_one_split() {
        let merge_policy = StableLogMergePolicy::default();
        let mut splits = create_splits(&merge_policy, vec![9_999_999]);
        let merge_ops = merge_policy.operations(&mut splits);
        assert_eq!(splits.len(), 1);
        assert_eq!(splits[0].num_docs, 9_999_999);
        assert!(merge_ops.is_empty());
    }

    #[test]
    fn test_stable_log_merge_policy_max_num_splits_worst_case() {
        let merge_policy = StableLogMergePolicy::default();
        assert_eq!(merge_policy.max_num_splits_worst_case(99), 9);
        assert_eq!(merge_policy.max_num_splits_worst_case(1_000_000), 27);
        assert_eq!(merge_policy.max_num_splits_worst_case(2_000_000), 36);
        assert_eq!(merge_policy.max_num_splits_worst_case(3_000_000), 36);
        assert_eq!(merge_policy.max_num_splits_worst_case(4_000_000), 36);
        assert_eq!(merge_policy.max_num_splits_worst_case(5_000_000), 45);
        assert_eq!(merge_policy.max_num_splits_worst_case(7_000_000), 45);
        assert_eq!(merge_policy.max_num_splits_worst_case(10_000_000), 45);
        assert_eq!(merge_policy.max_num_splits_worst_case(20_000_000), 54);
        assert_eq!(merge_policy.max_num_splits_worst_case(100_000_000), 63);
        assert_eq!(merge_policy.max_num_splits_worst_case(1_000_000_000), 153);
    }

    #[test]
    fn test_stable_log_merge_policy_max_num_splits_ideal_case() {
        let merge_policy = StableLogMergePolicy::default();
        assert_eq!(merge_policy.max_num_splits_ideal_case(1_000_000), 18);
        assert_eq!(merge_policy.max_num_splits_ideal_case(99), 9);
        assert_eq!(merge_policy.max_num_splits_ideal_case(2_000_000), 20);
        assert_eq!(merge_policy.max_num_splits_ideal_case(3_000_000), 21);
        assert_eq!(merge_policy.max_num_splits_ideal_case(4_000_000), 22);
        assert_eq!(merge_policy.max_num_splits_ideal_case(5_000_000), 23);
        assert_eq!(merge_policy.max_num_splits_ideal_case(7_000_000), 25);
        assert_eq!(merge_policy.max_num_splits_ideal_case(10_000_000), 27);
        assert_eq!(merge_policy.max_num_splits_ideal_case(100_000_000), 37);
        assert_eq!(merge_policy.max_num_splits_ideal_case(1_000_000_000), 127);
    }

    #[test]
    fn test_stable_log_merge_policy_proptest() {
        let config = StableLogMergePolicyConfig {
            min_level_num_docs: 100_000,
            merge_factor: 4,
            max_merge_factor: 6,
            maturation_period: Duration::from_secs(3600),
        };
        let merge_policy = StableLogMergePolicy::new(config, 10_000_000);
        crate::merge_policy::tests::proptest_merge_policy(&merge_policy);
    }

    #[tokio::test]
    #[cfg_attr(not(feature = "ci-test"), ignore)]
    async fn test_simulate_stable_log_merge_policy_constant_case() -> anyhow::Result<()> {
        let merge_policy = StableLogMergePolicy::default();
        aux_test_simulate_merge_planner_num_docs(
            Arc::new(merge_policy.clone()),
            &vec![10_000; 100_000],
            &|splits| {
                let num_docs = splits.iter().map(|split| split.num_docs as u64).sum();
                assert!(splits.len() <= merge_policy.max_num_splits_ideal_case(num_docs))
            },
        )
        .await?;
        Ok(())
    }

    use proptest::prelude::*;
    use proptest::sample::select;
    use tokio::runtime::Runtime;

    fn proptest_config() -> ProptestConfig {
        let mut proptest_config = ProptestConfig::with_cases(20);
        proptest_config.max_shrink_iters = 600;
        proptest_config
    }

    proptest! {
        #![proptest_config(proptest_config())]
        #[test]
        fn test_proptest_simulate_stable_log_merge_planner_adversarial(batch_num_docs in proptest::collection::vec(select(&[11, 1_990, 10_000, 50_000, 310_000][..]), 1..1_000)) {
            let merge_policy = StableLogMergePolicy::default();
            let rt = Runtime::new().unwrap();
            rt.block_on(
            aux_test_simulate_merge_planner_num_docs(
                Arc::new(merge_policy.clone()),
                &batch_num_docs,
                &|splits| {
                    let num_docs = splits.iter().map(|split| split.num_docs as u64).sum();
                    assert!(splits.len() <= merge_policy.max_num_splits_worst_case(num_docs));
                },
            )).unwrap();
        }
    }

    #[tokio::test]
    async fn test_simulate_stable_log_merge_planner_edge_case() {
        let merge_policy = StableLogMergePolicy::default();
        let batch_num_docs = vec![
            11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11,
        ];
        aux_test_simulate_merge_planner_num_docs(
            Arc::new(merge_policy.clone()),
            &batch_num_docs,
            &|splits| {
                let num_docs = splits.iter().map(|split| split.num_docs as u64).sum();
                assert!(splits.len() <= merge_policy.max_num_splits_worst_case(num_docs));
            },
        )
        .await
        .unwrap();
    }

    #[tokio::test]
    async fn test_simulate_stable_log_merge_planner_ideal_case() -> anyhow::Result<()> {
        let merge_policy = StableLogMergePolicy::default();
        aux_test_simulate_merge_planner_num_docs(
            Arc::new(merge_policy.clone()),
            &vec![10_000; 1_000],
            &|splits| {
                let num_docs = splits.iter().map(|split| split.num_docs as u64).sum();
                assert!(splits.len() <= merge_policy.max_num_splits_ideal_case(num_docs));
            },
        )
        .await?;
        Ok(())
    }

    #[tokio::test]
    async fn test_simulate_stable_log_merge_planner_bug() -> anyhow::Result<()> {
        let merge_policy = StableLogMergePolicy::default();
        let vals = &[11, 11, 11, 11, 11, 11, 310000, 11, 11, 11, 11, 11, 11, 11];
        aux_test_simulate_merge_planner_num_docs(
            Arc::new(merge_policy.clone()),
            &vals[..],
            &|splits| {
                let num_docs = splits.iter().map(|split| split.num_docs as u64).sum();
                assert!(splits.len() <= merge_policy.max_num_splits_worst_case(num_docs));
            },
        )
        .await?;
        Ok(())
    }
}


================================================
FILE: quickwit/quickwit-indexing/src/metrics.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use once_cell::sync::Lazy;
use quickwit_common::metrics::{
    IntCounter, IntCounterVec, IntGauge, IntGaugeVec, new_counter, new_counter_vec, new_gauge,
    new_gauge_vec,
};

pub struct IndexerMetrics {
    pub processed_docs_total: IntCounterVec<2>,
    pub processed_bytes: IntCounterVec<2>,
    pub indexing_pipelines: IntGaugeVec<1>,
    pub backpressure_micros: IntCounterVec<1>,
    pub available_concurrent_upload_permits: IntGaugeVec<1>,
    pub split_builders: IntGauge,
    pub ongoing_merge_operations: IntGauge,
    pub pending_merge_operations: IntGauge,
    pub pending_merge_bytes: IntGauge,
    // We use a lazy counter, as most users do not use Kafka.
    #[cfg_attr(not(feature = "kafka"), allow(dead_code))]
    pub kafka_rebalance_total: Lazy<IntCounter>,
}

impl Default for IndexerMetrics {
    fn default() -> Self {
        IndexerMetrics {
            processed_docs_total: new_counter_vec(
                "processed_docs_total",
                "Number of processed docs by index, source and processed status in [valid, \
                 schema_error, parse_error, transform_error]",
                "indexing",
                &[],
                ["index", "docs_processed_status"],
            ),
            processed_bytes: new_counter_vec(
                "processed_bytes",
                "Number of bytes of processed documents by index, source and processed status in \
                 [valid, schema_error, parse_error, transform_error]",
                "indexing",
                &[],
                ["index", "docs_processed_status"],
            ),
            indexing_pipelines: new_gauge_vec(
                "indexing_pipelines",
                "Number of running indexing pipelines",
                "indexing",
                &[],
                ["index"],
            ),
            backpressure_micros: new_counter_vec(
                "backpressure_micros",
                "Amount of time spent in backpressure (in micros). This time only includes the \
                 amount of time spent waiting for a place in the queue of another actor.",
                "indexing",
                &[],
                ["actor_name"],
            ),
            available_concurrent_upload_permits: new_gauge_vec(
                "concurrent_upload_available_permits_num",
                "Number of available concurrent upload permits by component in [merger, indexer]",
                "indexing",
                &[],
                ["component"],
            ),
            split_builders: new_gauge(
                "split_builders",
                "Number of existing index writer instances.",
                "indexing",
                &[],
            ),
            ongoing_merge_operations: new_gauge(
                "ongoing_merge_operations",
                "Number of ongoing merge operations",
                "indexing",
                &[],
            ),
            pending_merge_operations: new_gauge(
                "pending_merge_operations",
                "Number of pending merge operations",
                "indexing",
                &[],
            ),
            pending_merge_bytes: new_gauge(
                "pending_merge_bytes",
                "Number of pending merge bytes",
                "indexing",
                &[],
            ),
            kafka_rebalance_total: Lazy::new(|| {
                new_counter(
                    "kafka_rebalance_total",
                    "Number of kafka rebalances",
                    "indexing",
                    &[],
                )
            }),
        }
    }
}

/// `INDEXER_METRICS` exposes indexing related metrics through a prometheus
/// endpoint.
pub static INDEXER_METRICS: Lazy<IndexerMetrics> = Lazy::new(IndexerMetrics::default);


================================================
FILE: quickwit/quickwit-indexing/src/models/indexed_split.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::fmt;
use std::path::Path;

use quickwit_common::io::IoControls;
use quickwit_common::metrics::GaugeGuard;
use quickwit_common::temp_dir::TempDirectory;
use quickwit_metastore::checkpoint::IndexCheckpointDelta;
use quickwit_proto::indexing::IndexingPipelineId;
use quickwit_proto::types::{DocMappingUid, IndexUid, PublishToken};
use tantivy::IndexBuilder;
use tantivy::directory::MmapDirectory;
use tracing::{Span, instrument};

use crate::controlled_directory::ControlledDirectory;
use crate::merge_policy::MergeTask;
use crate::models::{PublishLock, SplitAttrs};
use crate::new_split_id;

pub struct IndexedSplitBuilder {
    pub split_attrs: SplitAttrs,
    pub index_writer: tantivy::SingleSegmentIndexWriter,
    pub split_scratch_directory: TempDirectory,
    pub controlled_directory_opt: Option<ControlledDirectory>,
}

pub struct IndexedSplit {
    pub split_attrs: SplitAttrs,
    pub index: tantivy::Index,
    pub split_scratch_directory: TempDirectory,
    pub controlled_directory_opt: Option<ControlledDirectory>,
}

impl IndexedSplit {
    pub fn split_id(&self) -> &str {
        &self.split_attrs.split_id
    }
}

impl fmt::Debug for IndexedSplit {
    fn fmt(&self, formatter: &mut fmt::Formatter) -> fmt::Result {
        formatter
            .debug_struct("IndexedSplit")
            .field("split_id", &self.split_attrs.split_id)
            .field("dir", &self.split_scratch_directory.path())
            .field("num_docs", &self.split_attrs.num_docs)
            .finish()
    }
}

impl fmt::Debug for IndexedSplitBuilder {
    fn fmt(&self, formatter: &mut fmt::Formatter) -> fmt::Result {
        formatter
            .debug_struct("IndexedSplitBuilder")
            .field("split_id", &self.split_attrs.split_id)
            .field("dir", &self.split_scratch_directory.path())
            .field("num_docs", &self.split_attrs.num_docs)
            .finish()
    }
}

impl IndexedSplitBuilder {
    pub fn new_in_dir(
        pipeline_id: IndexingPipelineId,
        partition_id: u64,
        last_delete_opstamp: u64,
        doc_mapping_uid: DocMappingUid,
        scratch_directory: TempDirectory,
        index_builder: IndexBuilder,
        io_controls: IoControls,
    ) -> anyhow::Result<Self> {
        // We avoid intermediary merge, and instead merge all segments in the packager.
        // The benefit is that we don't have to wait for potentially existing merges,
        // and avoid possible race conditions.
        let split_id = new_split_id();
        let split_scratch_directory_prefix = format!("split-{split_id}-");
        let split_scratch_directory =
            scratch_directory.named_temp_child(&split_scratch_directory_prefix)?;
        let mmap_directory = MmapDirectory::open(split_scratch_directory.path())?;
        let box_mmap_directory = Box::new(mmap_directory);

        let controlled_directory = ControlledDirectory::new(box_mmap_directory, io_controls);

        let index_writer =
            index_builder.single_segment_index_writer(controlled_directory.clone(), 15_000_000)?;
        Ok(Self {
            split_attrs: SplitAttrs {
                node_id: pipeline_id.node_id,
                index_uid: pipeline_id.index_uid,
                source_id: pipeline_id.source_id,
                doc_mapping_uid,
                partition_id,
                split_id,
                num_docs: 0,
                replaced_split_ids: Vec::new(),
                uncompressed_docs_size_in_bytes: 0,
                time_range: None,
                delete_opstamp: last_delete_opstamp,
                num_merge_ops: 0,
            },
            index_writer,
            split_scratch_directory,
            controlled_directory_opt: Some(controlled_directory),
        })
    }

    #[instrument(name="serialize_split",
        skip_all,
        fields(
            node_id=%self.split_attrs.node_id,
            index_uid=%self.split_attrs.index_uid,
            source_id=%self.split_attrs.source_id,
            split_id=%self.split_attrs.split_id,
            partition_id=%self.split_attrs.partition_id,
            num_docs=%self.split_attrs.num_docs,
            uncompressed_docs_size_in_bytes=%self.split_attrs.uncompressed_docs_size_in_bytes,
            delete_opstamp=%self.split_attrs.delete_opstamp,
            num_merge_ops=%self.split_attrs.num_merge_ops,
        )
    )]
    pub fn finalize(self) -> anyhow::Result<IndexedSplit> {
        let index = self.index_writer.finalize()?;
        Ok(IndexedSplit {
            split_attrs: self.split_attrs,
            index,
            split_scratch_directory: self.split_scratch_directory,
            controlled_directory_opt: self.controlled_directory_opt,
        })
    }

    pub fn path(&self) -> &Path {
        self.split_scratch_directory.path()
    }

    pub fn split_id(&self) -> &str {
        &self.split_attrs.split_id
    }
}

#[derive(Debug)]
pub struct IndexedSplitBatch {
    pub splits: Vec<IndexedSplit>,
    pub checkpoint_delta_opt: Option<IndexCheckpointDelta>,
    pub publish_lock: PublishLock,
    pub publish_token_opt: Option<PublishToken>,
    /// A [`MergeTask`] tracked by either the `MergePlanner` or the `DeleteTaskPlanner`
    /// in the `MergePipeline` or `DeleteTaskPipeline`.
    /// See planners docs to understand the usage.
    /// If `None`, the split batch was built in the `IndexingPipeline`.
    pub merge_task_opt: Option<MergeTask>,
    pub batch_parent_span: Span,
}

#[derive(Clone, Copy, Debug, Eq, PartialEq)]
pub enum CommitTrigger {
    Drained,
    ForceCommit,
    MemoryLimit,
    NoMoreDocs,
    NumDocsLimit,
    Timeout,
}

#[derive(Debug)]
pub struct IndexedSplitBatchBuilder {
    pub splits: Vec<IndexedSplitBuilder>,
    pub checkpoint_delta_opt: Option<IndexCheckpointDelta>,
    pub publish_lock: PublishLock,
    pub publish_token_opt: Option<PublishToken>,
    pub commit_trigger: CommitTrigger,
    pub batch_parent_span: Span,
    pub memory_usage: GaugeGuard<'static>,
    pub _split_builders_guard: GaugeGuard<'static>,
}

/// Sends notifications to the Publisher that the last batch of splits was empty.
#[derive(Debug)]
pub struct EmptySplit {
    pub index_uid: IndexUid,
    pub checkpoint_delta: IndexCheckpointDelta,
    pub publish_lock: PublishLock,
    pub publish_token_opt: Option<PublishToken>,
    pub batch_parent_span: Span,
}


================================================
FILE: quickwit/quickwit-indexing/src/models/indexing_service_message.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use quickwit_config::SourceConfig;
use quickwit_proto::indexing::{IndexingPipelineId, MergePipelineId};
use quickwit_proto::types::{IndexId, PipelineUid};

#[derive(Clone, Debug)]
pub struct SpawnPipeline {
    pub index_id: IndexId,
    pub source_config: SourceConfig,
    pub pipeline_uid: PipelineUid,
}

/// Detaches a pipeline from the indexing service. The pipeline is no longer managed by the
/// server. This is mostly useful for ad-hoc indexing pipelines launched with `quickwit index
/// ingest ..` and testing.
#[derive(Debug)]
pub struct DetachIndexingPipeline {
    pub pipeline_id: IndexingPipelineId,
}

/// Detaches a merge pipeline from the indexing service. The pipeline is no longer managed by the
/// server. This is mostly useful for preventing the server killing an existing merge pipeline
/// if a indexing pipeline is detached.
#[derive(Debug)]
pub struct DetachMergePipeline {
    pub pipeline_id: MergePipelineId,
}

#[derive(Debug)]
pub struct ObservePipeline {
    pub pipeline_id: IndexingPipelineId,
}


================================================
FILE: quickwit/quickwit-indexing/src/models/indexing_statistics.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::BTreeSet;
use std::sync::atomic::Ordering;

use quickwit_proto::indexing::PipelineMetrics;
use quickwit_proto::types::ShardId;
use serde::Serialize;

use crate::actors::{DocProcessorCounters, IndexerCounters, PublisherCounters, UploaderCounters};

/// A Struct that holds all statistical data about indexing
#[derive(Clone, Debug, Default, Serialize, utoipa::ToSchema)]
pub struct IndexingStatistics {
    /// Number of document processed (valid or not)
    pub num_docs: u64,
    /// Number of document parse error, or missing timestamps
    pub num_invalid_docs: u64,
    /// Number of created split
    pub num_local_splits: u64,
    /// Number of staged splits
    pub num_staged_splits: u64,
    /// Number of uploaded splits
    pub num_uploaded_splits: u64,
    /// Number of published splits
    pub num_published_splits: u64,
    /// Number of empty batches
    pub num_empty_splits: u64,
    /// Size in byte of document processed
    pub total_bytes_processed: u64,
    /// Size in bytes of resulting split
    pub total_size_splits: u64,
    /// Pipeline generation.
    pub generation: usize,
    /// Number of successive pipeline spawn attempts.
    pub num_spawn_attempts: usize,
    // Pipeline metrics.
    pub pipeline_metrics_opt: Option<PipelineMetrics>,
    // List of shard ids.
    #[schema(value_type = Vec<u64>)]
    pub shard_ids: BTreeSet<ShardId>,
    pub params_fingerprint: u64,
}

impl IndexingStatistics {
    pub fn add_actor_counters(
        mut self,
        doc_processor_counters: &DocProcessorCounters,
        indexer_counters: &IndexerCounters,
        uploader_counters: &UploaderCounters,
        publisher_counters: &PublisherCounters,
    ) -> Self {
        self.num_docs += doc_processor_counters.num_processed_docs();
        self.num_invalid_docs += doc_processor_counters.num_invalid_docs();
        self.num_local_splits += indexer_counters.num_splits_emitted;
        self.total_bytes_processed += doc_processor_counters
            .num_bytes_total
            .load(Ordering::Relaxed);
        self.num_staged_splits += uploader_counters.num_staged_splits.load(Ordering::Relaxed);
        self.num_uploaded_splits += uploader_counters
            .num_uploaded_splits
            .load(Ordering::Relaxed);
        self.num_published_splits += publisher_counters.num_published_splits;
        self.num_empty_splits += publisher_counters.num_empty_splits;
        self
    }

    pub fn set_num_spawn_attempts(mut self, num_spawn_attempts: usize) -> Self {
        self.num_spawn_attempts = num_spawn_attempts;
        self
    }

    pub fn set_generation(mut self, generation: usize) -> Self {
        self.generation = generation;
        self
    }
}


================================================
FILE: quickwit/quickwit-indexing/src/models/merge_planner_message.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use quickwit_metastore::SplitMetadata;

#[derive(Clone, Debug)]
pub struct NewSplits {
    pub new_splits: Vec<SplitMetadata>,
}


================================================
FILE: quickwit/quickwit-indexing/src/models/merge_scratch.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use quickwit_common::temp_dir::TempDirectory;
use tantivy::Directory;

use crate::merge_policy::MergeTask;

#[derive(Debug)]
pub struct MergeScratch {
    /// A [`MergeTask`] tracked by either the `MergePlanner` or the `DeleteTaskPlanner`
    /// See planners docs to understand the usage.
    pub merge_task: MergeTask,
    /// Scratch directory for computing the merge.
    pub merge_scratch_directory: TempDirectory,
    pub downloaded_splits_directory: TempDirectory,
    pub tantivy_dirs: Vec<Box<dyn Directory>>,
}


================================================
FILE: quickwit/quickwit-indexing/src/models/merge_statistics.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::sync::atomic::Ordering;

use serde::Serialize;

use crate::actors::{PublisherCounters, UploaderCounters};

/// A Struct to hold all merge statistical data.
#[derive(Clone, Debug, Default, Serialize)]
pub struct MergeStatistics {
    /// Number of uploaded splits
    pub num_uploaded_splits: u64,
    /// Number of published splits
    pub num_published_splits: u64,
    /// Pipeline generation.
    pub generation: usize,
    /// Number of successive pipeline spawn attempts.
    pub num_spawn_attempts: usize,
    /// Number of merges currently in progress.
    pub num_ongoing_merges: usize,
}

impl MergeStatistics {
    pub fn add_actor_counters(
        mut self,
        uploader_counters: &UploaderCounters,
        publisher_counters: &PublisherCounters,
    ) -> Self {
        self.num_uploaded_splits += uploader_counters.num_uploaded_splits.load(Ordering::SeqCst);
        self.num_published_splits += publisher_counters.num_published_splits;
        self
    }

    pub fn set_num_spawn_attempts(mut self, num_spawn_attempts: usize) -> Self {
        self.num_spawn_attempts = num_spawn_attempts;
        self
    }

    pub fn set_generation(mut self, generation: usize) -> Self {
        self.generation = generation;
        self
    }

    pub fn set_ongoing_merges(mut self, n: usize) -> Self {
        self.num_ongoing_merges = n;
        self
    }
}


================================================
FILE: quickwit/quickwit-indexing/src/models/mod.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#![allow(rustdoc::invalid_html_tags)]

mod indexed_split;
mod indexing_service_message;
mod indexing_statistics;
mod merge_planner_message;
mod merge_scratch;
mod merge_statistics;
mod packaged_split;
mod processed_doc;
mod publish_lock;
mod publisher_message;
mod raw_doc_batch;
mod shard_positions;
mod split_attrs;

pub use indexed_split::{
    CommitTrigger, EmptySplit, IndexedSplit, IndexedSplitBatch, IndexedSplitBatchBuilder,
    IndexedSplitBuilder,
};
pub use indexing_service_message::{
    DetachIndexingPipeline, DetachMergePipeline, ObservePipeline, SpawnPipeline,
};
pub use indexing_statistics::IndexingStatistics;
pub use merge_planner_message::NewSplits;
pub use merge_scratch::MergeScratch;
pub use merge_statistics::MergeStatistics;
pub use packaged_split::{PackagedSplit, PackagedSplitBatch};
pub use processed_doc::{ProcessedDoc, ProcessedDocBatch};
pub use publish_lock::{NewPublishLock, PublishLock};
pub use publisher_message::SplitsUpdate;
use quickwit_proto::types::PublishToken;
pub use raw_doc_batch::RawDocBatch;
pub(crate) use shard_positions::LocalShardPositionsUpdate;
pub use shard_positions::ShardPositionsService;
pub use split_attrs::{SplitAttrs, create_split_metadata};

#[derive(Debug)]
pub struct NewPublishToken(pub PublishToken);


================================================
FILE: quickwit/quickwit-indexing/src/models/packaged_split.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::BTreeSet;
use std::fmt;
use std::path::PathBuf;

use itertools::Itertools;
use quickwit_common::temp_dir::TempDirectory;
use quickwit_metastore::checkpoint::IndexCheckpointDelta;
use quickwit_proto::types::{IndexUid, PublishToken, SplitId};
use tracing::Span;

use crate::merge_policy::MergeTask;
use crate::models::{PublishLock, SplitAttrs};

pub struct PackagedSplit {
    pub serialized_split_fields: Vec<u8>,
    pub split_attrs: SplitAttrs,
    pub split_scratch_directory: TempDirectory,
    pub tags: BTreeSet<String>,
    pub split_files: Vec<PathBuf>,
    pub hotcache_bytes: Vec<u8>,
}

impl PackagedSplit {
    pub fn index_uid(&self) -> &IndexUid {
        &self.split_attrs.index_uid
    }

    pub fn split_id(&self) -> &str {
        &self.split_attrs.split_id
    }
}

impl fmt::Debug for PackagedSplit {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        f.debug_struct("PackagedSplit")
            .field("split_attrs", &self.split_attrs)
            .field("split_scratch_directory", &self.split_scratch_directory)
            .field("tags", &self.tags)
            .field("split_files", &self.split_files)
            .finish()
    }
}

#[derive(Debug)]
pub struct PackagedSplitBatch {
    pub splits: Vec<PackagedSplit>,
    pub checkpoint_delta_opt: Option<IndexCheckpointDelta>,
    pub publish_lock: PublishLock,
    pub publish_token_opt: Option<PublishToken>,
    /// A [`MergeTask`] tracked by either the `MergePlanner` or the `DeleteTaskPlanner`
    /// in the `MergePipeline` or `DeleteTaskPipeline`.
    /// See planners docs to understand the usage.
    /// If `None`, the split batch was built in the `IndexingPipeline`.
    pub merge_task_opt: Option<MergeTask>,
    pub batch_parent_span: Span,
}

impl PackagedSplitBatch {
    /// Instantiate a consistent [`PackagedSplitBatch`] that
    /// satisfies two constraints:
    /// - a batch must have at least one split
    /// - all splits must belong to the same `index_uid`.
    pub fn new(
        splits: Vec<PackagedSplit>,
        checkpoint_delta_opt: Option<IndexCheckpointDelta>,
        publish_lock: PublishLock,
        publish_token_opt: Option<PublishToken>,
        merge_task_opt: Option<MergeTask>,
        batch_parent_span: Span,
    ) -> Self {
        assert!(!splits.is_empty());
        assert!(
            splits
                .iter()
                .tuple_windows()
                .all(|(left_split, right_split)| left_split.index_uid() == right_split.index_uid()),
            "All splits must belong to the same `index_uid`."
        );
        Self {
            splits,
            checkpoint_delta_opt,
            publish_lock,
            publish_token_opt,
            merge_task_opt,
            batch_parent_span,
        }
    }

    pub fn index_uid(&self) -> IndexUid {
        self.splits[0].split_attrs.index_uid.clone()
    }

    pub fn split_ids(&self) -> Vec<SplitId> {
        self.splits
            .iter()
            .map(|split| split.split_attrs.split_id.clone())
            .collect::<Vec<_>>()
    }
}


================================================
FILE: quickwit/quickwit-indexing/src/models/processed_doc.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::fmt;

use quickwit_common::metrics::{GaugeGuard, MEMORY_METRICS};
use quickwit_metastore::checkpoint::SourceCheckpointDelta;
use tantivy::{DateTime, TantivyDocument};

pub struct ProcessedDoc {
    pub doc: TantivyDocument,
    pub timestamp_opt: Option<DateTime>,
    pub partition: u64,
    pub num_bytes: usize,
}

impl fmt::Debug for ProcessedDoc {
    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
        f.debug_struct("ProcessedDoc")
            .field("timestamp_opt", &self.timestamp_opt)
            .field("partition", &self.partition)
            .field("num_bytes", &self.num_bytes)
            .finish()
    }
}

pub struct ProcessedDocBatch {
    // Do not directly append documents to this vector; otherwise, in-flight metrics will be
    // incorrect.
    pub docs: Vec<ProcessedDoc>,
    pub checkpoint_delta: SourceCheckpointDelta,
    pub force_commit: bool,
    _gauge_guard: GaugeGuard<'static>,
}

impl ProcessedDocBatch {
    pub fn new(
        docs: Vec<ProcessedDoc>,
        checkpoint_delta: SourceCheckpointDelta,
        force_commit: bool,
    ) -> Self {
        let delta = docs.iter().map(|doc| doc.num_bytes as i64).sum::<i64>();
        let mut gauge_guard = GaugeGuard::from_gauge(&MEMORY_METRICS.in_flight.indexer_mailbox);
        gauge_guard.add(delta);
        Self {
            docs,
            checkpoint_delta,
            force_commit,
            _gauge_guard: gauge_guard,
        }
    }
}

impl fmt::Debug for ProcessedDocBatch {
    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
        f.debug_struct("ProcessedDocBatch")
            .field("num_docs", &self.docs.len())
            .field("checkpoint_delta", &self.checkpoint_delta)
            .field("force_commit", &self.force_commit)
            .finish()
    }
}


================================================
FILE: quickwit/quickwit-indexing/src/models/publish_lock.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::fmt::Debug;
use std::sync::Arc;
use std::sync::atomic::{AtomicBool, Ordering};

use tokio::sync::{Mutex, MutexGuard};

// Publisher locks have two clients: publishers and sources.
//
// Publishers must acquire the lock and ensure that the lock is alive before publishing.
//
// When a partition reassignment occurs, sources must (i) acquire, then (ii) kill, and finally (iii)
// release the lock before propagating a new lock via message passing to the downstream consumers.
#[derive(Clone, Default)]
pub struct PublishLock {
    inner: Arc<PublishLockInner>,
}

impl PartialEq for PublishLock {
    fn eq(&self, other: &Self) -> bool {
        std::ptr::eq(self.inner.as_ref(), other.inner.as_ref())
    }
}

impl Debug for PublishLock {
    fn fmt(&self, fmt: &mut std::fmt::Formatter) -> std::fmt::Result {
        fmt.debug_struct("PublishLock")
            .field("is_alive", &self.is_alive())
            .finish()
    }
}

struct PublishLockInner {
    alive: AtomicBool,
    mutex: Mutex<()>,
}

impl Default for PublishLockInner {
    fn default() -> Self {
        Self {
            alive: AtomicBool::new(true),
            mutex: Mutex::default(),
        }
    }
}

impl PublishLock {
    pub fn dead() -> Self {
        PublishLock {
            inner: Arc::new(PublishLockInner {
                alive: AtomicBool::new(false),
                mutex: Mutex::default(),
            }),
        }
    }
    pub async fn acquire(&self) -> Option<MutexGuard<'_, ()>> {
        let guard = self.inner.mutex.lock().await;
        if self.is_dead() {
            return None;
        }
        Some(guard)
    }

    pub fn is_alive(&self) -> bool {
        self.inner.alive.load(Ordering::Relaxed)
    }

    pub fn is_dead(&self) -> bool {
        !self.is_alive()
    }

    pub async fn kill(&self) {
        let _guard = self.inner.mutex.lock().await;
        self.inner.alive.store(false, Ordering::Relaxed);
    }
}

#[derive(Debug, PartialEq)]
pub struct NewPublishLock(pub PublishLock);

#[cfg(test)]
mod tests {

    use std::time::Duration;

    use tokio::time::timeout;

    use super::*;

    #[tokio::test]
    async fn test_publish_lock() {
        let lock = PublishLock::default();
        assert!(lock.is_alive());

        let guard = lock.acquire().await.unwrap();
        assert!(
            timeout(Duration::from_millis(50), lock.kill())
                .await
                .is_err()
        );
        drop(guard);

        lock.kill().await;
        assert!(lock.is_dead());
        assert!(lock.acquire().await.is_none());
    }

    #[test]
    fn test_publish_lock_dead() {
        let publish_lock = PublishLock::dead();
        assert!(publish_lock.is_dead());
    }
}


================================================
FILE: quickwit/quickwit-indexing/src/models/publisher_message.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::fmt;

use itertools::Itertools;
use quickwit_metastore::SplitMetadata;
use quickwit_metastore::checkpoint::IndexCheckpointDelta;
use quickwit_proto::types::{IndexUid, PublishToken};
use tracing::Span;

use crate::merge_policy::MergeTask;
use crate::models::PublishLock;

pub struct SplitsUpdate {
    pub index_uid: IndexUid,
    pub new_splits: Vec<SplitMetadata>,
    pub replaced_split_ids: Vec<String>,
    pub checkpoint_delta_opt: Option<IndexCheckpointDelta>,
    pub publish_lock: PublishLock,
    pub publish_token_opt: Option<PublishToken>,
    /// A [`MergeTask`] tracked by either the `MergePlanner` or the `DeleteTaskPlanner`
    /// in the `MergePipeline` or `DeleteTaskPipeline`.
    /// See planners docs to understand the usage.
    /// If `None`, the split batch was built in the `IndexingPipeline`.
    pub merge_task: Option<MergeTask>,
    pub parent_span: Span,
}

impl fmt::Debug for SplitsUpdate {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        let new_split_ids: String = self
            .new_splits
            .iter()
            .map(|split| split.split_id())
            .join(",");
        f.debug_struct("SplitsUpdate")
            .field("index_id", &self.index_uid.index_id)
            .field("new_splits", &new_split_ids)
            .field("checkpoint_delta", &self.checkpoint_delta_opt)
            .finish()
    }
}


================================================
FILE: quickwit/quickwit-indexing/src/models/raw_doc_batch.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::fmt;

use bytes::Bytes;
use quickwit_common::metrics::{GaugeGuard, MEMORY_METRICS};
use quickwit_metastore::checkpoint::SourceCheckpointDelta;

pub struct RawDocBatch {
    // Do not directly append documents to this vector; otherwise, in-flight metrics will be
    // incorrect.
    pub docs: Vec<Bytes>,
    pub checkpoint_delta: SourceCheckpointDelta,
    pub force_commit: bool,
    _gauge_guard: GaugeGuard<'static>,
}

impl RawDocBatch {
    pub fn new(
        docs: Vec<Bytes>,
        checkpoint_delta: SourceCheckpointDelta,
        force_commit: bool,
    ) -> Self {
        let delta = docs.iter().map(|doc| doc.len() as i64).sum::<i64>();
        let mut gauge_guard =
            GaugeGuard::from_gauge(&MEMORY_METRICS.in_flight.doc_processor_mailbox);
        gauge_guard.add(delta);

        Self {
            docs,
            checkpoint_delta,
            force_commit,
            _gauge_guard: gauge_guard,
        }
    }

    #[cfg(test)]
    pub fn for_test(docs: &[&[u8]], range: std::ops::Range<u64>) -> Self {
        let docs = docs.iter().map(|doc| Bytes::from(doc.to_vec())).collect();
        let checkpoint_delta = SourceCheckpointDelta::from_range(range);
        Self::new(docs, checkpoint_delta, false)
    }
}

impl fmt::Debug for RawDocBatch {
    fn fmt(&self, formatter: &mut fmt::Formatter) -> fmt::Result {
        formatter
            .debug_struct("RawDocBatch")
            .field("num_docs", &self.docs.len())
            .field("checkpoint_delta", &self.checkpoint_delta)
            .field("force_commit", &self.force_commit)
            .finish()
    }
}

impl Default for RawDocBatch {
    fn default() -> Self {
        let _gauge_guard = GaugeGuard::from_gauge(&MEMORY_METRICS.in_flight.doc_processor_mailbox);
        Self {
            docs: Vec::new(),
            checkpoint_delta: SourceCheckpointDelta::default(),
            force_commit: false,
            _gauge_guard,
        }
    }
}


================================================
FILE: quickwit/quickwit-indexing/src/models/shard_positions.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::BTreeMap;
use std::fmt::Debug;
use std::time::{Duration, Instant};

use anyhow::Context;
use async_trait::async_trait;
use fnv::FnvHashMap;
use quickwit_actors::{Actor, ActorContext, ActorExitStatus, Handler, Mailbox, SpawnContext};
use quickwit_cluster::{Cluster, ListenerHandle};
use quickwit_common::pretty::PrettyDisplay;
use quickwit_common::pubsub::{Event, EventBroker};
use quickwit_proto::indexing::ShardPositionsUpdate;
use quickwit_proto::types::{Position, ShardId, SourceUid};
use tracing::{debug, error, info, warn};

/// Prefix used in chitchat to publish the shard positions.
const SHARD_POSITIONS_PREFIX: &str = "indexer.shard_positions:";

/// This event means that a pipeline running in the current node (hence "local")
/// performed a publish on an ingest pipeline, and hence the position of a shard has been updated.
///
/// This event is meant to be built by the `IngestSource`, upon reception of suggest truncate
/// event. It should only be consumed by the `ShardPositionsService`.
///
/// (This is why its member are private).
///
/// The new position is to be exposed to the entire cluster via chitchat.
///
/// Consumers of such events should listen to the more `ShardPositionsUpdate` event instead.
/// That event is broadcasted via the cluster event broker, and will include both local
/// changes and changes from other nodes.
#[derive(Debug, Clone, PartialEq, Eq)]
pub(crate) struct LocalShardPositionsUpdate {
    source_uid: SourceUid,
    // This list can be partial: not all shards for the source need to be listed here.
    shard_positions: Vec<(ShardId, Position)>,
}

impl LocalShardPositionsUpdate {
    pub fn new(source_uid: SourceUid, shard_positions: Vec<(ShardId, Position)>) -> Self {
        LocalShardPositionsUpdate {
            source_uid,
            shard_positions,
        }
    }
}

/// This event is an internal detail of the `ShardPositionsService`.
///
/// When a shard position change in the cluster is detected, a `ClusterShardPositionUpdate`
/// message is queued into the `ShardPositionsService`
#[derive(Debug)]
struct ClusterShardPositionsUpdate {
    pub source_uid: SourceUid,
    pub shard_id: ShardId,
    pub position: Position,
}

impl Event for LocalShardPositionsUpdate {}

/// The published shard positions is a model unique to the indexer service instance that
/// keeps track of the latest (known) published position for the shards of all managed sources.
///
/// It receives updates through the event broker, and only keeps the maximum published position
/// for each shard.
pub struct ShardPositionsService {
    shard_positions_per_source: FnvHashMap<SourceUid, BTreeMap<ShardId, Position>>,
    cluster: Cluster,
    event_broker: EventBroker,
    cluster_listener_handle_opt: Option<ListenerHandle>,
}

fn parse_shard_positions_from_kv(
    key: &str,
    value: &str,
) -> anyhow::Result<ClusterShardPositionsUpdate> {
    let (source_uid_str, shard_id_str) = key.rsplit_once(':').context("invalid key")?;
    let shard_id = ShardId::from(shard_id_str);
    let (index_uid_str, source_id) = source_uid_str.rsplit_once(':').context("invalid key")?;
    let index_uid = index_uid_str.parse()?;
    let source_uid = SourceUid {
        index_uid,
        source_id: source_id.to_string(),
    };
    let position = Position::from(value.to_string());
    Ok(ClusterShardPositionsUpdate {
        source_uid,
        shard_id,
        position,
    })
}

fn push_position_update(
    shard_positions_service_mailbox: &Mailbox<ShardPositionsService>,
    key: &str,
    value: &str,
) {
    let shard_positions = match parse_shard_positions_from_kv(key, value) {
        Ok(shard_positions) => shard_positions,
        Err(error) => {
            error!(key=key, value=value, error=%error, "failed to parse shard positions from cluster kv");
            return;
        }
    };
    if shard_positions_service_mailbox
        .try_send_message(shard_positions)
        .is_err()
    {
        error!("failed to send shard positions to the shard positions service");
    }
}

#[async_trait]
impl Actor for ShardPositionsService {
    type ObservableState = ();
    fn observable_state(&self) {}

    async fn initialize(&mut self, ctx: &ActorContext<Self>) -> Result<(), ActorExitStatus> {
        let mailbox = ctx.mailbox().clone();

        self.cluster_listener_handle_opt = Some(
            self.cluster
                .subscribe(SHARD_POSITIONS_PREFIX, move |event| {
                    push_position_update(&mailbox, event.key, event.value);
                })
                .await,
        );

        // We are now listening to new updates. However, the cluster has been started earlier.
        // It might have already received shard updates from other nodes.
        //
        // Let's also sync our `ShardPositionsService` with the current state of the cluster.
        // Shard position updates are trivially idempotent, so we can replay all the events,
        // without worrying about duplicates.

        let now = Instant::now();
        let chitchat = self.cluster.chitchat().await;
        let chitchat_lock = chitchat.lock().await;
        let mut num_keys = 0;
        for node_state in chitchat_lock.node_states().values() {
            for (key, versioned_value) in node_state.iter_prefix(SHARD_POSITIONS_PREFIX) {
                let key_stripped = key.strip_prefix(SHARD_POSITIONS_PREFIX).unwrap();
                push_position_update(ctx.mailbox(), key_stripped, &versioned_value.value);
                num_keys += 1;
            }
            // It is tempting to yield here, but we are holding the chitchat lock.
            // Let's just log the amount of time it takes for the moment.
        }
        let elapsed = now.elapsed();
        if elapsed > Duration::from_millis(300) {
            warn!(
                "initializing shard positions took longer than expected: {} ({num_keys} keys)",
                elapsed.pretty_display(),
            );
        } else {
            info!(
                "initialized shard positions in {} ({num_keys} keys)",
                elapsed.pretty_display(),
            );
        }
        Ok(())
    }
}

impl ShardPositionsService {
    pub fn spawn(spawn_ctx: &SpawnContext, event_broker: EventBroker, cluster: Cluster) {
        let shard_positions_service = ShardPositionsService::new(event_broker.clone(), cluster);
        let (shard_positions_service_mailbox, _) =
            spawn_ctx.spawn_builder().spawn(shard_positions_service);
        // This subscription is in charge of updating the shard positions model.
        event_broker
            .subscribe_without_timeout::<LocalShardPositionsUpdate>(move |update| {
                if shard_positions_service_mailbox
                    .try_send_message(update)
                    .is_err()
                {
                    error!("failed to send update to shard positions service");
                }
            })
            .forever();
    }

    fn new(event_broker: EventBroker, cluster: Cluster) -> ShardPositionsService {
        ShardPositionsService {
            shard_positions_per_source: Default::default(),
            cluster,
            event_broker,
            cluster_listener_handle_opt: None,
        }
    }
}

#[async_trait]
impl Handler<ClusterShardPositionsUpdate> for ShardPositionsService {
    type Reply = ();

    async fn handle(
        &mut self,
        update: ClusterShardPositionsUpdate,
        _ctx: &ActorContext<Self>,
    ) -> Result<Self::Reply, ActorExitStatus> {
        let ClusterShardPositionsUpdate {
            source_uid,
            shard_id,
            position,
        } = update;
        let updated_shard_positions = self.apply_update(&source_uid, vec![(shard_id, position)]);
        debug!(updated_shard_positions=?updated_shard_positions, "cluster position update");
        if !updated_shard_positions.is_empty() {
            self.publish_shard_updates_to_event_broker(source_uid, updated_shard_positions);
        }
        Ok(())
    }
}

#[async_trait]
impl Handler<LocalShardPositionsUpdate> for ShardPositionsService {
    type Reply = ();

    async fn handle(
        &mut self,
        update: LocalShardPositionsUpdate,
        _ctx: &ActorContext<Self>,
    ) -> Result<(), ActorExitStatus> {
        let LocalShardPositionsUpdate {
            source_uid,
            shard_positions,
        } = update;
        let updated_shard_positions: Vec<(ShardId, Position)> =
            self.apply_update(&source_uid, shard_positions);
        if updated_shard_positions.is_empty() {
            return Ok(());
        }
        self.publish_positions_into_chitchat(&source_uid, &updated_shard_positions)
            .await;
        self.publish_shard_updates_to_event_broker(source_uid, updated_shard_positions);
        Ok(())
    }
}

impl ShardPositionsService {
    async fn publish_positions_into_chitchat(
        &self,
        source_uid: &SourceUid,
        shard_positions: &[(ShardId, Position)],
    ) {
        let SourceUid {
            index_uid,
            source_id,
        } = &source_uid;
        for (shard_id, position) in shard_positions {
            let key = format!("{SHARD_POSITIONS_PREFIX}{index_uid}:{source_id}:{shard_id}");
            self.cluster
                .set_self_key_value_delete_after_ttl(key, position)
                .await;
        }
    }

    fn publish_shard_updates_to_event_broker(
        &self,
        source_uid: SourceUid,
        shard_positions: Vec<(ShardId, Position)>,
    ) {
        debug!(shard_positions=?shard_positions, "shard positions updates");
        self.event_broker.publish(ShardPositionsUpdate {
            source_uid,
            updated_shard_positions: shard_positions,
        });
    }

    /// Updates the internal model holding the last position per shard, and
    /// returns the list of shards that were updated.
    fn apply_update(
        &mut self,
        source_uid: &SourceUid,
        published_positions_per_shard: Vec<(ShardId, Position)>,
    ) -> Vec<(ShardId, Position)> {
        if published_positions_per_shard.is_empty() {
            warn!("received an empty publish shard positions update");
            return Vec::new();
        }
        let current_shard_positions = self
            .shard_positions_per_source
            .entry(source_uid.clone())
            .or_default();

        let updated_positions_per_shard = published_positions_per_shard
            .into_iter()
            .filter(|(shard, new_position)| {
                let Some(position) = current_shard_positions.get(shard) else {
                    return true;
                };
                new_position > position
            })
            .collect::<Vec<_>>();

        for (shard, position) in updated_positions_per_shard.iter() {
            current_shard_positions.insert(shard.clone(), position.clone());
        }

        updated_positions_per_shard
    }
}

#[cfg(test)]
mod tests {
    use std::time::Duration;

    use quickwit_actors::Universe;
    use quickwit_cluster::{ChannelTransport, create_cluster_for_test};
    use quickwit_common::pubsub::EventBroker;
    use quickwit_proto::types::IndexUid;

    use super::*;

    #[tokio::test]
    async fn test_shard_positions_from_cluster() {
        quickwit_common::setup_logging_for_tests();

        let transport = ChannelTransport::default();

        let universe1 = Universe::with_accelerated_time();
        let universe2 = Universe::with_accelerated_time();

        let event_broker1 = EventBroker::default();
        let event_broker2 = EventBroker::default();

        let (tx1, mut rx1) = tokio::sync::mpsc::unbounded_channel::<ShardPositionsUpdate>();
        let (tx2, mut rx2) = tokio::sync::mpsc::unbounded_channel::<ShardPositionsUpdate>();

        event_broker1
            .subscribe(move |update: ShardPositionsUpdate| {
                tx1.send(update).unwrap();
            })
            .forever();

        event_broker2
            .subscribe(move |update: ShardPositionsUpdate| {
                tx2.send(update).unwrap();
            })
            .forever();

        let index_uid = IndexUid::new_with_random_ulid("index-test");
        let source_id = "test-source".to_string();
        let source_uid = SourceUid {
            index_uid,
            source_id,
        };

        let cluster1 =
            create_cluster_for_test(Vec::new(), &["indexer", "metastore"], &transport, true)
                .await
                .unwrap();
        ShardPositionsService::spawn(
            universe1.spawn_ctx(),
            event_broker1.clone(),
            cluster1.clone(),
        );

        // One of the event is published before cluster formation.
        event_broker1.publish(LocalShardPositionsUpdate::new(
            source_uid.clone(),
            vec![(ShardId::from(20), Position::offset(100u64))],
        ));

        let cluster2 = create_cluster_for_test(
            vec![cluster1.gossip_listen_addr.to_string()],
            &["indexer"],
            &transport,
            true,
        )
        .await
        .unwrap();

        cluster1
            .wait_for_ready_members(|members| members.len() == 2, Duration::from_secs(5))
            .await
            .unwrap();
        cluster2
            .wait_for_ready_members(|members| members.len() == 2, Duration::from_secs(5))
            .await
            .unwrap();

        ShardPositionsService::spawn(
            universe2.spawn_ctx(),
            event_broker2.clone(),
            cluster2.clone(),
        );

        // ----------------------
        // One of the node publishes a given shard position update.
        // This is done using a LocalPublishShardPositionUpdate

        event_broker1.publish(LocalShardPositionsUpdate::new(
            source_uid.clone(),
            vec![(ShardId::from(2), Position::offset(10u64))],
        ));
        event_broker1.publish(LocalShardPositionsUpdate::new(
            source_uid.clone(),
            vec![(ShardId::from(1), Position::offset(10u64))],
        ));
        event_broker2.publish(LocalShardPositionsUpdate::new(
            source_uid.clone(),
            vec![(ShardId::from(2), Position::offset(10u64))],
        ));
        event_broker2.publish(LocalShardPositionsUpdate::new(
            source_uid.clone(),
            vec![(ShardId::from(2), Position::offset(12u64))],
        ));
        event_broker2.publish(LocalShardPositionsUpdate::new(
            source_uid.clone(),
            vec![
                (ShardId::from(1), Position::Beginning),
                (ShardId::from(2), Position::offset(12u64)),
            ],
        ));

        let mut updates1: Vec<Vec<(ShardId, Position)>> = Vec::new();
        for _ in 0..4 {
            let update = rx1.recv().await.unwrap();
            assert_eq!(update.source_uid, source_uid);
            updates1.push(update.updated_shard_positions);
        }

        // The updates as seen from the first node.
        assert_eq!(
            updates1,
            vec![
                vec![(ShardId::from(20), Position::offset(100u64))],
                vec![(ShardId::from(2u64), Position::offset(10u64))],
                vec![(ShardId::from(1u64), Position::offset(10u64)),],
                vec![(ShardId::from(2u64), Position::offset(12u64)),],
            ]
        );

        // The updates as seen from the second.
        let mut updates2: Vec<Vec<(ShardId, Position)>> = Vec::new();
        for _ in 0..5 {
            let update = rx2.recv().await.unwrap();
            assert_eq!(update.source_uid, source_uid);
            updates2.push(update.updated_shard_positions);
        }
        assert_eq!(
            updates2,
            vec![
                vec![(ShardId::from(20u64), Position::offset(100u64))],
                vec![(ShardId::from(2u64), Position::offset(10u64))],
                vec![(ShardId::from(2u64), Position::offset(12u64))],
                vec![(ShardId::from(1u64), Position::Beginning)],
                vec![(ShardId::from(1u64), Position::offset(10u64))]
            ]
        );

        universe1.assert_quit().await;
        universe2.assert_quit().await;
    }

    #[tokio::test]
    async fn test_shard_positions_local_updates_publish_to_cluster() {
        quickwit_common::setup_logging_for_tests();
        let universe = Universe::with_accelerated_time();
        let transport = ChannelTransport::default();

        let cluster: Cluster = create_cluster_for_test(Vec::new(), &[], &transport, true)
            .await
            .unwrap();
        let event_broker = EventBroker::default();

        ShardPositionsService::spawn(universe.spawn_ctx(), event_broker.clone(), cluster.clone());

        let index_uid = IndexUid::new_with_random_ulid("index-test");
        let source_id = "test-source".to_string();
        let key_prefix = format!("{SHARD_POSITIONS_PREFIX}{index_uid}:{source_id}");
        let source_uid = SourceUid {
            index_uid,
            source_id,
        };

        let shard_id1 = ShardId::from(1);
        let shard_id2 = ShardId::from(2);
        let shard_id3 = ShardId::from(3);

        {
            event_broker.publish(LocalShardPositionsUpdate::new(
                source_uid.clone(),
                vec![(ShardId::from(1), Position::Beginning)],
            ));
            tokio::time::sleep(Duration::from_secs(1)).await;
            let key = format!("{key_prefix}:{shard_id1}");
            let value = cluster.get_self_key_value(&key).await.unwrap();
            assert_eq!(&value, "");
        }
        {
            event_broker.publish(LocalShardPositionsUpdate::new(
                source_uid.clone(),
                vec![
                    (shard_id1.clone(), Position::offset(1_000u64)),
                    (shard_id2.clone(), Position::offset(2_000u64)),
                ],
            ));
            tokio::time::sleep(Duration::from_secs(1)).await;
            let value1 = cluster
                .get_self_key_value(&format!("{key_prefix}:{shard_id1}"))
                .await
                .unwrap();
            assert_eq!(&value1, "00000000000000001000");
            let value2 = cluster
                .get_self_key_value(&format!("{key_prefix}:{shard_id2}"))
                .await
                .unwrap();
            assert_eq!(&value2, "00000000000000002000");
        }
        {
            event_broker.publish(LocalShardPositionsUpdate::new(
                source_uid.clone(),
                vec![
                    (shard_id1.clone(), Position::offset(999u64)),
                    (shard_id3.clone(), Position::offset(3_000u64)),
                ],
            ));
            tokio::time::sleep(Duration::from_secs(1)).await;
            let value1 = cluster
                .get_self_key_value(&format!("{key_prefix}:{shard_id1}"))
                .await
                .unwrap();
            // We do not update the position that got lower, nor the position that disappeared
            assert_eq!(&value1, "00000000000000001000");
            let value2 = cluster
                .get_self_key_value(&format!("{key_prefix}:{shard_id2}"))
                .await
                .unwrap();
            assert_eq!(&value2, "00000000000000002000");
            let value3 = cluster
                .get_self_key_value(&format!("{key_prefix}:{shard_id3}"))
                .await
                .unwrap();
            assert_eq!(&value3, "00000000000000003000");
        }
        universe.assert_quit().await;
    }
}


================================================
FILE: quickwit/quickwit-indexing/src/models/split_attrs.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::BTreeSet;
use std::fmt;
use std::ops::{Range, RangeInclusive};
use std::sync::Arc;
use std::time::Duration;

use quickwit_metastore::{SplitMaturity, SplitMetadata};
use quickwit_proto::types::{DocMappingUid, IndexUid, NodeId, SourceId, SplitId};
use tantivy::DateTime;
use time::OffsetDateTime;

use crate::merge_policy::MergePolicy;

pub struct SplitAttrs {
    /// ID of the node that produced the split.
    pub node_id: NodeId,
    // Index UID to which the split belongs.
    pub index_uid: IndexUid,
    /// Source ID to which the split belongs.
    pub source_id: SourceId,

    /// Doc mapping UID used to produce this split.
    pub doc_mapping_uid: DocMappingUid,

    /// Split ID. Joined with the index URI (<index URI>/<split ID>), this ID
    /// should be enough to uniquely identify a split.
    /// In reality, some information may be implicitly configured
    /// in the storage resolver: for instance, the Amazon S3 region.
    pub split_id: SplitId,

    /// Partition to which the split belongs.
    ///
    /// Partitions are usually meant to isolate documents based on some field like
    /// `tenant_id`. For this reason, ideally splits with a different `partition_id`
    /// should not be merged together. Merging two splits with different `partition_id`
    /// does not hurt correctness however.
    pub partition_id: u64,

    /// Number of valid documents in the split.
    pub num_docs: u64,

    // Sum of the size of the document that were sent to the indexed.
    // This includes both documents that are valid or documents that are
    // invalid.
    pub uncompressed_docs_size_in_bytes: u64,

    pub time_range: Option<RangeInclusive<DateTime>>,

    pub replaced_split_ids: Vec<String>,

    /// Delete opstamp.
    pub delete_opstamp: u64,

    // Number of merge operation the split has been through so far.
    pub num_merge_ops: usize,
}

impl fmt::Debug for SplitAttrs {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        f.debug_struct("SplitAttrs")
            .field("split_id", &self.split_id)
            .field("partition_id", &self.partition_id)
            .field("replaced_split_ids", &self.replaced_split_ids)
            .field("time_range", &self.time_range)
            .field(
                "uncompressed_docs_size_in_bytes",
                &self.uncompressed_docs_size_in_bytes,
            )
            .field("num_docs", &self.num_docs)
            .field("num_merge_ops", &self.num_merge_ops)
            .finish()
    }
}

pub fn create_split_metadata(
    merge_policy: &Arc<dyn MergePolicy>,
    retention_policy: Option<&quickwit_config::RetentionPolicy>,
    split_attrs: &SplitAttrs,
    tags: BTreeSet<String>,
    footer_offsets: Range<u64>,
) -> SplitMetadata {
    let create_timestamp = OffsetDateTime::now_utc().unix_timestamp();

    let time_range = split_attrs
        .time_range
        .as_ref()
        .map(|range| range.start().into_timestamp_secs()..=range.end().into_timestamp_secs());

    let mut maturity =
        merge_policy.split_maturity(split_attrs.num_docs as usize, split_attrs.num_merge_ops);
    if let Some(max_maturity) = max_maturity_before_end_of_retention(
        retention_policy,
        create_timestamp,
        time_range.as_ref().map(|time_range| *time_range.end()),
    ) {
        maturity = maturity.min(max_maturity);
    }
    SplitMetadata {
        node_id: split_attrs.node_id.to_string(),
        index_uid: split_attrs.index_uid.clone(),
        source_id: split_attrs.source_id.clone(),
        doc_mapping_uid: split_attrs.doc_mapping_uid,
        split_id: split_attrs.split_id.clone(),
        partition_id: split_attrs.partition_id,
        num_docs: split_attrs.num_docs as usize,
        time_range,
        uncompressed_docs_size_in_bytes: split_attrs.uncompressed_docs_size_in_bytes,
        create_timestamp,
        maturity,
        tags,
        footer_offsets,
        delete_opstamp: split_attrs.delete_opstamp,
        num_merge_ops: split_attrs.num_merge_ops,
    }
}

/// reduce the maturity period of a split based on retention policy, so that it doesn't get merged
/// after it expires.
fn max_maturity_before_end_of_retention(
    retention_policy: Option<&quickwit_config::RetentionPolicy>,
    create_timestamp: i64,
    time_range_end: Option<i64>,
) -> Option<SplitMaturity> {
    let time_range_end = time_range_end? as u64;
    let retention_period_s = retention_policy?.retention_period().ok()?.as_secs();

    let maturity = if let Some(maturation_period_s) =
        (time_range_end + retention_period_s).checked_sub(create_timestamp as u64)
    {
        SplitMaturity::Immature {
            maturation_period: Duration::from_secs(maturation_period_s),
        }
    } else {
        // this split could be deleted as soon as it is created. Ideally we would
        // handle that sooner.
        SplitMaturity::Mature
    };
    Some(maturity)
}

#[cfg(test)]
mod tests {
    use std::time::Duration;

    use quickwit_metastore::SplitMaturity;

    use super::max_maturity_before_end_of_retention;

    #[test]
    fn test_max_maturity_before_end_of_retention() {
        let retention_policy = quickwit_config::RetentionPolicy {
            evaluation_schedule: "daily".to_string(),
            retention_period: "300 sec".to_string(),
        };
        let create_timestamp = 1000;

        // this should be deleted asap, not subject to merge
        assert_eq!(
            max_maturity_before_end_of_retention(
                Some(&retention_policy),
                create_timestamp,
                Some(200),
            ),
            Some(SplitMaturity::Mature)
        );

        // retention ends at 750 + 300 = 1050, which is 50s from now
        assert_eq!(
            max_maturity_before_end_of_retention(
                Some(&retention_policy),
                create_timestamp,
                Some(750),
            ),
            Some(SplitMaturity::Immature {
                maturation_period: Duration::from_secs(50)
            })
        );

        // no retention policy
        assert_eq!(
            max_maturity_before_end_of_retention(None, create_timestamp, Some(850),),
            None,
        );

        // no timestamp_range.end but a retention policy, that's odd, don't change anything about
        // the maturity period
        assert_eq!(
            max_maturity_before_end_of_retention(Some(&retention_policy), create_timestamp, None,),
            None,
        );
    }
}


================================================
FILE: quickwit/quickwit-indexing/src/source/doc_file_reader.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::io;
use std::path::Path;

use anyhow::Context;
use async_compression::tokio::bufread::GzipDecoder;
use bytes::Bytes;
use quickwit_common::Progress;
use quickwit_common::uri::Uri;
use quickwit_metastore::checkpoint::PartitionId;
use quickwit_proto::metastore::SourceType;
use quickwit_proto::types::Position;
use quickwit_storage::StorageResolver;
use tokio::io::{AsyncBufReadExt, AsyncRead, AsyncReadExt, BufReader};

use super::{BATCH_NUM_BYTES_LIMIT, BatchBuilder};

pub struct FileRecord {
    pub next_offset: u64,
    pub doc: Bytes,
    pub is_last: bool,
}

/// A helper wrapper that lets you skip bytes in compressed files where you
/// cannot seek (e.g. gzip files).
struct SkipReader {
    reader: BufReader<Box<dyn AsyncRead + Send + Unpin>>,
    num_bytes_to_skip: usize,
}

impl SkipReader {
    fn new(reader: Box<dyn AsyncRead + Send + Unpin>, num_bytes_to_skip: usize) -> Self {
        Self {
            reader: BufReader::new(reader),
            num_bytes_to_skip,
        }
    }

    async fn skip(&mut self) -> io::Result<()> {
        // allocate on the heap to avoid stack overflows
        let mut buf = vec![0u8; 64_000];
        while self.num_bytes_to_skip > 0 {
            let num_bytes_to_read = self.num_bytes_to_skip.min(buf.len());
            let num_bytes_read = self
                .reader
                .read_exact(&mut buf[..num_bytes_to_read])
                .await?;
            self.num_bytes_to_skip -= num_bytes_read;
        }
        Ok(())
    }

    /// Reads a line and peeks into the readers buffer. Returns the number of
    /// bytes read and true the end of the file is reached.
    async fn read_line_and_peek(&mut self, buf: &mut String) -> io::Result<(usize, bool)> {
        if self.num_bytes_to_skip > 0 {
            self.skip().await?;
        }
        let line_size = self.reader.read_line(buf).await?;
        if line_size == 0 {
            return Ok((0, true));
        }
        let next_bytes = self.reader.fill_buf().await?;
        Ok((line_size, next_bytes.is_empty()))
    }
}

pub struct DocFileReader {
    reader: SkipReader,
    next_offset: u64,
}

impl DocFileReader {
    pub fn empty() -> Self {
        DocFileReader {
            reader: SkipReader::new(Box::new(tokio::io::empty()), 0),
            next_offset: 0,
        }
    }

    pub async fn from_uri(
        storage_resolver: &StorageResolver,
        uri: &Uri,
        offset: usize,
    ) -> anyhow::Result<Self> {
        let (dir_uri, file_name) = dir_and_filename(uri)?;
        let storage = storage_resolver.resolve(&dir_uri).await?;
        let file_size = storage.file_num_bytes(file_name).await?.try_into().unwrap();
        if file_size == 0 {
            return Ok(DocFileReader::empty());
        }
        // If it's a gzip file, we can't seek to a specific offset. `SkipReader`
        // starts from the beginning of the file, decompresses and skips the
        // first `offset` bytes.
        let reader = if uri.extension() == Some("gz") {
            let stream = storage.get_slice_stream(file_name, 0..file_size).await?;
            let decompressed_stream = Box::new(GzipDecoder::new(BufReader::new(stream)));
            DocFileReader {
                reader: SkipReader::new(decompressed_stream, offset),
                next_offset: offset as u64,
            }
        } else {
            let stream = storage
                .get_slice_stream(file_name, offset..file_size)
                .await?;
            DocFileReader {
                reader: SkipReader::new(stream, 0),
                next_offset: offset as u64,
            }
        };
        Ok(reader)
    }

    /// Reads the next record from the underlying file. Returns `None` when EOF
    /// is reached.
    pub async fn next_record(&mut self) -> anyhow::Result<Option<FileRecord>> {
        let mut buf = String::new();
        // TODO retry if stream is broken (#5243)
        let (bytes_read, is_last) = self.reader.read_line_and_peek(&mut buf).await?;
        if bytes_read == 0 {
            Ok(None)
        } else {
            self.next_offset += bytes_read as u64;
            Ok(Some(FileRecord {
                next_offset: self.next_offset,
                doc: Bytes::from(buf),
                is_last,
            }))
        }
    }
}

pub struct ObjectUriBatchReader {
    partition_id: PartitionId,
    reader: DocFileReader,
    current_offset: usize,
    is_eof: bool,
}

impl ObjectUriBatchReader {
    pub async fn try_new(
        storage_resolver: &StorageResolver,
        partition_id: PartitionId,
        uri: &Uri,
        position: Position,
    ) -> anyhow::Result<Self> {
        let current_offset = match position {
            Position::Beginning => 0,
            Position::Offset(offset) => offset
                .as_usize()
                .context("file offset should be stored as usize")?,
            Position::Eof(_) => {
                return Ok(ObjectUriBatchReader {
                    partition_id,
                    reader: DocFileReader::empty(),
                    current_offset: 0,
                    is_eof: true,
                });
            }
        };
        let reader = DocFileReader::from_uri(storage_resolver, uri, current_offset).await?;
        Ok(ObjectUriBatchReader {
            partition_id,
            reader,
            current_offset,
            is_eof: false,
        })
    }

    pub async fn read_batch(
        &mut self,
        source_progress: &Progress,
        source_type: SourceType,
    ) -> anyhow::Result<BatchBuilder> {
        let mut batch_builder = BatchBuilder::new(source_type);
        if self.is_eof {
            return Ok(batch_builder);
        }
        let limit_num_bytes = self.current_offset + BATCH_NUM_BYTES_LIMIT as usize;
        let mut new_offset = self.current_offset;
        while new_offset < limit_num_bytes {
            if let Some(record) = source_progress
                .protect_future(self.reader.next_record())
                .await?
            {
                new_offset = record.next_offset as usize;
                batch_builder.add_doc(record.doc);
                if record.is_last {
                    self.is_eof = true;
                    break;
                }
            } else {
                self.is_eof = true;
                break;
            }
        }
        let to_position = if self.is_eof {
            Position::eof(new_offset)
        } else {
            Position::offset(new_offset)
        };
        batch_builder.checkpoint_delta.record_partition_delta(
            self.partition_id.clone(),
            Position::offset(self.current_offset),
            to_position,
        )?;
        self.current_offset = new_offset;
        Ok(batch_builder)
    }

    pub fn is_eof(&self) -> bool {
        self.is_eof
    }
}

pub(crate) fn dir_and_filename(filepath: &Uri) -> anyhow::Result<(Uri, &Path)> {
    let dir_uri: Uri = filepath
        .parent()
        .context("Parent directory could not be resolved")?;
    let file_name = filepath
        .file_name()
        .context("Path does not appear to be a file")?;
    Ok((dir_uri, file_name))
}

#[cfg(test)]
pub mod file_test_helpers {
    use std::io::Write;

    use async_compression::tokio::write::GzipEncoder;
    use tempfile::NamedTempFile;

    pub const DUMMY_DOC: &[u8] = r#"{"body": "hello happy tax payer!"}"#.as_bytes();

    async fn gzip_bytes(bytes: &[u8]) -> Vec<u8> {
        let mut gzip_documents = Vec::new();
        let mut encoder = GzipEncoder::new(&mut gzip_documents);
        tokio::io::AsyncWriteExt::write_all(&mut encoder, bytes)
            .await
            .unwrap();
        // flush is not sufficient here and reading the file will raise a unexpected end of file
        // error.
        tokio::io::AsyncWriteExt::shutdown(&mut encoder)
            .await
            .unwrap();
        gzip_documents
    }

    async fn write_to_tmp(data: Vec<u8>, gzip: bool) -> NamedTempFile {
        let mut temp_file: tempfile::NamedTempFile = if gzip {
            tempfile::Builder::new().suffix(".gz").tempfile().unwrap()
        } else {
            tempfile::NamedTempFile::new().unwrap()
        };
        if gzip {
            let gzip_documents = gzip_bytes(&data).await;
            temp_file.write_all(&gzip_documents).unwrap();
        } else {
            temp_file.write_all(&data).unwrap();
        }
        temp_file.flush().unwrap();
        temp_file
    }

    pub async fn generate_dummy_doc_file(gzip: bool, lines: usize) -> (NamedTempFile, usize) {
        let mut documents_bytes = Vec::with_capacity(DUMMY_DOC.len() * lines);
        for _ in 0..lines {
            documents_bytes.write_all(DUMMY_DOC).unwrap();
            documents_bytes.write_all("\n".as_bytes()).unwrap();
        }
        let size = documents_bytes.len();
        let file = write_to_tmp(documents_bytes, gzip).await;
        (file, size)
    }

    /// Generates a file with increasing padded numbers. Each line is 8 bytes
    /// including the newline char.
    ///
    /// 0000000\n0000001\n0000002\n...
    pub async fn generate_index_doc_file(gzip: bool, lines: usize) -> NamedTempFile {
        assert!(lines < 9999999, "each line is 7 digits + newline");
        let mut documents_bytes = Vec::new();
        for i in 0..lines {
            documents_bytes
                .write_all(format!("{i:0>7}\n").as_bytes())
                .unwrap();
        }
        write_to_tmp(documents_bytes, gzip).await
    }
}

#[cfg(test)]
mod tests {
    use std::io::Cursor;
    use std::str::FromStr;

    use file_test_helpers::generate_index_doc_file;
    use quickwit_metastore::checkpoint::SourceCheckpointDelta;

    use super::*;

    #[tokio::test]
    async fn test_skip_reader() {
        {
            // Skip 0 bytes.
            let mut reader = SkipReader::new(Box::new("hello".as_bytes()), 0);
            let mut buf = String::new();
            let (bytes_read, eof) = reader.read_line_and_peek(&mut buf).await.unwrap();
            assert_eq!(buf, "hello");
            assert!(eof);
            assert_eq!(bytes_read, 5)
        }
        {
            // Skip 2 bytes.
            let mut reader = SkipReader::new(Box::new("hello".as_bytes()), 2);
            let mut buf = String::new();
            let (bytes_read, eof) = reader.read_line_and_peek(&mut buf).await.unwrap();
            assert_eq!(buf, "llo");
            assert!(eof);
            assert_eq!(bytes_read, 3)
        }
        {
            let input = "hello";
            let cursor = Cursor::new(input);
            let mut reader = SkipReader::new(Box::new(cursor), 5);
            let mut buf = String::new();
            let (bytes_read, eof) = reader.read_line_and_peek(&mut buf).await.unwrap();
            assert!(eof);
            assert_eq!(bytes_read, 0)
        }
        {
            let input = "hello";
            let cursor = Cursor::new(input);
            let mut reader = SkipReader::new(Box::new(cursor), 10);
            let mut buf = String::new();
            assert!(reader.read_line_and_peek(&mut buf).await.is_err());
        }
        {
            let input = "hello world".repeat(10000);
            let cursor = Cursor::new(input.clone());
            let mut reader = SkipReader::new(Box::new(cursor), 64000);
            let mut buf = String::new();
            reader.read_line_and_peek(&mut buf).await.unwrap();
            assert_eq!(buf, input[64000..]);
        }
        {
            let input = "hello world".repeat(10000);
            let cursor = Cursor::new(input.clone());
            let mut reader = SkipReader::new(Box::new(cursor), 64001);
            let mut buf = String::new();
            reader.read_line_and_peek(&mut buf).await.unwrap();
            assert_eq!(buf, input[64001..]);
        }
    }

    async fn aux_test_full_read_record(file: impl AsRef<str>, expected_lines: usize) {
        let storage_resolver = StorageResolver::for_test();
        let uri = Uri::from_str(file.as_ref()).unwrap();
        let mut doc_reader = DocFileReader::from_uri(&storage_resolver, &uri, 0)
            .await
            .unwrap();
        let mut parsed_lines = 0;
        while doc_reader.next_record().await.unwrap().is_some() {
            parsed_lines += 1;
        }
        assert_eq!(parsed_lines, expected_lines);
    }

    #[tokio::test]
    async fn test_full_read_record() {
        aux_test_full_read_record("data/test_corpus.json", 4).await;
    }

    #[tokio::test]
    async fn test_full_read_record_gz() {
        aux_test_full_read_record("data/test_corpus.json.gz", 4).await;
    }

    #[tokio::test]
    async fn test_empty_file() {
        let empty_file = tempfile::NamedTempFile::new().unwrap();
        let empty_file_uri = empty_file.path().to_str().unwrap();
        aux_test_full_read_record(empty_file_uri, 0).await;
    }

    async fn aux_test_resumed_read_record(
        file: impl AsRef<str>,
        expected_lines: usize,
        stop_at_line: usize,
    ) {
        let storage_resolver = StorageResolver::for_test();
        let uri = Uri::from_str(file.as_ref()).unwrap();
        // read the first part of the file
        let mut first_part_reader = DocFileReader::from_uri(&storage_resolver, &uri, 0)
            .await
            .unwrap();
        let mut resume_offset = 0;
        let mut parsed_lines = 0;
        for _ in 0..stop_at_line {
            let rec = first_part_reader
                .next_record()
                .await
                .unwrap()
                .expect("EOF happened before stop_at_line");
            resume_offset = rec.next_offset as usize;
            assert_eq!(Bytes::from(format!("{parsed_lines:0>7}\n")), rec.doc);
            parsed_lines += 1;
        }
        // read the second part of the file
        let mut second_part_reader =
            DocFileReader::from_uri(&storage_resolver, &uri, resume_offset)
                .await
                .unwrap();
        while let Some(rec) = second_part_reader.next_record().await.unwrap() {
            assert_eq!(Bytes::from(format!("{parsed_lines:0>7}\n")), rec.doc);
            parsed_lines += 1;
        }
        assert_eq!(parsed_lines, expected_lines);
    }

    #[tokio::test]
    async fn test_resumed_read_record() {
        let dummy_doc_file = generate_index_doc_file(false, 1000).await;
        let dummy_doc_file_uri = dummy_doc_file.path().to_str().unwrap();
        aux_test_resumed_read_record(dummy_doc_file_uri, 1000, 1).await;
        aux_test_resumed_read_record(dummy_doc_file_uri, 1000, 40).await;
        aux_test_resumed_read_record(dummy_doc_file_uri, 1000, 999).await;
        aux_test_resumed_read_record(dummy_doc_file_uri, 1000, 1000).await;
    }

    #[tokio::test]
    async fn test_resumed_read_record_gz() {
        let dummy_doc_file = generate_index_doc_file(true, 1000).await;
        let dummy_doc_file_uri = dummy_doc_file.path().to_str().unwrap();
        aux_test_resumed_read_record(dummy_doc_file_uri, 1000, 1).await;
        aux_test_resumed_read_record(dummy_doc_file_uri, 1000, 40).await;
        aux_test_resumed_read_record(dummy_doc_file_uri, 1000, 999).await;
        aux_test_resumed_read_record(dummy_doc_file_uri, 1000, 1000).await;
    }

    async fn aux_test_full_read_batch(
        file: impl AsRef<str>,
        expected_lines: usize,
        expected_batches: usize,
        file_size: usize,
        from: Position,
    ) {
        let progress = Progress::default();
        let storage_resolver = StorageResolver::for_test();
        let uri = Uri::from_str(file.as_ref()).unwrap();
        let partition = PartitionId::from("test");
        let mut batch_reader =
            ObjectUriBatchReader::try_new(&storage_resolver, partition.clone(), &uri, from)
                .await
                .unwrap();

        let mut parsed_lines = 0;
        let mut parsed_batches = 0;
        let mut checkpoint_delta = SourceCheckpointDelta::default();
        while !batch_reader.is_eof() {
            let batch = batch_reader
                .read_batch(&progress, SourceType::Unspecified)
                .await
                .unwrap();
            parsed_lines += batch.docs.len();
            parsed_batches += 1;
            checkpoint_delta.extend(batch.checkpoint_delta).unwrap();
        }
        assert_eq!(parsed_lines, expected_lines);
        assert_eq!(parsed_batches, expected_batches);
        let position = checkpoint_delta
            .get_source_checkpoint()
            .position_for_partition(&partition)
            .unwrap()
            .clone();
        assert_eq!(position, Position::eof(file_size))
    }

    #[tokio::test]
    async fn test_read_batch_empty_file() {
        let empty_file = tempfile::NamedTempFile::new().unwrap();
        let empty_file_uri = empty_file.path().to_str().unwrap();
        aux_test_full_read_batch(empty_file_uri, 0, 1, 0, Position::Beginning).await;
    }

    #[tokio::test]
    async fn test_full_read_single_batch() {
        let num_lines = 10;
        let dummy_doc_file = generate_index_doc_file(false, num_lines).await;
        let dummy_doc_file_uri = dummy_doc_file.path().to_str().unwrap();
        aux_test_full_read_batch(
            dummy_doc_file_uri,
            num_lines,
            1,
            num_lines * 8,
            Position::Beginning,
        )
        .await;
    }

    #[tokio::test]
    async fn test_full_read_single_batch_max_size() {
        let num_lines = BATCH_NUM_BYTES_LIMIT as usize / 8;
        let dummy_doc_file = generate_index_doc_file(false, num_lines).await;
        let dummy_doc_file_uri = dummy_doc_file.path().to_str().unwrap();
        aux_test_full_read_batch(
            dummy_doc_file_uri,
            num_lines,
            1,
            num_lines * 8,
            Position::Beginning,
        )
        .await;
    }

    #[tokio::test]
    async fn test_full_read_two_batches() {
        let num_lines = BATCH_NUM_BYTES_LIMIT as usize / 8 + 10;
        let dummy_doc_file = generate_index_doc_file(false, num_lines).await;
        let dummy_doc_file_uri = dummy_doc_file.path().to_str().unwrap();
        aux_test_full_read_batch(
            dummy_doc_file_uri,
            num_lines,
            2,
            num_lines * 8,
            Position::Beginning,
        )
        .await;
    }

    #[tokio::test]
    async fn test_resume_read_batches() {
        let total_num_lines = BATCH_NUM_BYTES_LIMIT as usize / 8 * 3;
        let resume_after_lines = total_num_lines / 2;
        let dummy_doc_file = generate_index_doc_file(false, total_num_lines).await;
        let dummy_doc_file_uri = dummy_doc_file.path().to_str().unwrap();
        aux_test_full_read_batch(
            dummy_doc_file_uri,
            total_num_lines - resume_after_lines,
            2,
            total_num_lines * 8,
            Position::offset(resume_after_lines * 8),
        )
        .await;
    }
}


================================================
FILE: quickwit/quickwit-indexing/src/source/file_source.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::fmt;
use std::time::Duration;

use async_trait::async_trait;
use quickwit_actors::{ActorExitStatus, Mailbox};
use quickwit_config::FileSourceParams;
use quickwit_metastore::checkpoint::{PartitionId, SourceCheckpoint};
use quickwit_proto::metastore::SourceType;
use quickwit_proto::types::SourceId;

use super::doc_file_reader::ObjectUriBatchReader;
#[cfg(feature = "queue-sources")]
use super::queue_sources::coordinator::QueueCoordinator;
use crate::actors::DocProcessor;
use crate::source::{Source, SourceContext, SourceRuntime, TypedSourceFactory};

enum FileSourceState {
    #[cfg(feature = "queue-sources")]
    Notification(Box<QueueCoordinator>),
    Filepath {
        batch_reader: ObjectUriBatchReader,
        num_bytes_processed: u64,
        num_lines_processed: u64,
    },
}

pub struct FileSource {
    source_id: SourceId,
    state: FileSourceState,
    source_type: SourceType,
}

impl fmt::Debug for FileSource {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        write!(f, "FileSource {{ source_id: {} }}", self.source_id)
    }
}

#[async_trait]
impl Source for FileSource {
    #[allow(unused_variables)]
    async fn initialize(
        &mut self,
        doc_processor_mailbox: &Mailbox<DocProcessor>,
        ctx: &SourceContext,
    ) -> Result<(), ActorExitStatus> {
        match &mut self.state {
            #[cfg(feature = "queue-sources")]
            FileSourceState::Notification(coordinator) => {
                coordinator.initialize(doc_processor_mailbox, ctx).await
            }
            FileSourceState::Filepath { .. } => Ok(()),
        }
    }

    #[allow(unused_variables)]
    async fn emit_batches(
        &mut self,
        doc_processor_mailbox: &Mailbox<DocProcessor>,
        ctx: &SourceContext,
    ) -> Result<Duration, ActorExitStatus> {
        match &mut self.state {
            #[cfg(feature = "queue-sources")]
            FileSourceState::Notification(coordinator) => {
                coordinator.emit_batches(doc_processor_mailbox, ctx).await?;
            }
            FileSourceState::Filepath {
                batch_reader,
                num_bytes_processed,
                num_lines_processed,
            } => {
                let batch_builder = batch_reader
                    .read_batch(ctx.progress(), self.source_type)
                    .await?;
                *num_bytes_processed += batch_builder.num_bytes;
                *num_lines_processed += batch_builder.docs.len() as u64;
                doc_processor_mailbox
                    .send_message(batch_builder.build())
                    .await?;
                if batch_reader.is_eof() {
                    ctx.send_exit_with_success(doc_processor_mailbox).await?;
                    return Err(ActorExitStatus::Success);
                }
            }
        }
        Ok(Duration::ZERO)
    }

    fn name(&self) -> String {
        format!("{self:?}")
    }

    #[allow(unused_variables)]
    async fn suggest_truncate(
        &mut self,
        checkpoint: SourceCheckpoint,
        ctx: &SourceContext,
    ) -> anyhow::Result<()> {
        match &mut self.state {
            #[cfg(feature = "queue-sources")]
            FileSourceState::Notification(coordinator) => {
                coordinator.suggest_truncate(checkpoint, ctx).await
            }
            FileSourceState::Filepath { .. } => Ok(()),
        }
    }

    fn observable_state(&self) -> serde_json::Value {
        match &self.state {
            #[cfg(feature = "queue-sources")]
            FileSourceState::Notification(coordinator) => {
                serde_json::to_value(coordinator.observable_state()).unwrap()
            }
            FileSourceState::Filepath {
                num_bytes_processed,
                num_lines_processed,
                ..
            } => {
                serde_json::json!({
                    "num_bytes_processed": num_bytes_processed,
                    "num_lines_processed": num_lines_processed,
                })
            }
        }
    }
}

pub struct FileSourceFactory;

#[async_trait]
impl TypedSourceFactory for FileSourceFactory {
    type Source = FileSource;
    type Params = FileSourceParams;

    async fn typed_create_source(
        source_runtime: SourceRuntime,
        params: FileSourceParams,
    ) -> anyhow::Result<FileSource> {
        let source_id = source_runtime.source_config.source_id.clone();
        let source_type = source_runtime.source_config.source_type();
        let state = match params {
            FileSourceParams::Filepath(file_uri) => {
                let partition_id = PartitionId::from(file_uri.as_str());
                let position = source_runtime
                    .fetch_checkpoint()
                    .await?
                    .position_for_partition(&partition_id)
                    .cloned()
                    .unwrap_or_default();
                let batch_reader = ObjectUriBatchReader::try_new(
                    &source_runtime.storage_resolver,
                    partition_id,
                    &file_uri,
                    position,
                )
                .await?;
                FileSourceState::Filepath {
                    batch_reader,
                    num_bytes_processed: 0,
                    num_lines_processed: 0,
                }
            }
            #[cfg(feature = "sqs")]
            FileSourceParams::Notifications(quickwit_config::FileSourceNotification::Sqs(
                sqs_config,
            )) => {
                let coordinator =
                    QueueCoordinator::try_from_sqs_config(sqs_config, source_runtime).await?;
                FileSourceState::Notification(Box::new(coordinator))
            }
            #[cfg(not(feature = "sqs"))]
            FileSourceParams::Notifications(quickwit_config::FileSourceNotification::Sqs(_)) => {
                anyhow::bail!("Quickwit was compiled without the `sqs` feature")
            }
        };

        Ok(FileSource {
            state,
            source_id,
            source_type,
        })
    }
}

#[cfg(test)]
mod tests {
    use std::num::NonZeroUsize;
    use std::str::FromStr;

    use bytes::Bytes;
    use quickwit_actors::{Command, Universe};
    use quickwit_common::uri::Uri;
    use quickwit_config::{SourceConfig, SourceInputFormat, SourceParams};
    use quickwit_metastore::checkpoint::{PartitionId, SourceCheckpointDelta};
    use quickwit_proto::types::{IndexUid, Position};

    use super::*;
    use crate::models::RawDocBatch;
    use crate::source::doc_file_reader::file_test_helpers::{
        DUMMY_DOC, generate_dummy_doc_file, generate_index_doc_file,
    };
    use crate::source::tests::SourceRuntimeBuilder;
    use crate::source::{BATCH_NUM_BYTES_LIMIT, SourceActor};

    #[tokio::test]
    async fn test_file_source() {
        aux_test_file_source(false).await;
        aux_test_file_source(true).await;
    }

    async fn aux_test_file_source(gzip: bool) {
        let universe = Universe::with_accelerated_time();
        let (doc_processor_mailbox, indexer_inbox) = universe.create_test_mailbox();
        let params = if gzip {
            FileSourceParams::from_filepath("data/test_corpus.json.gz").unwrap()
        } else {
            FileSourceParams::from_filepath("data/test_corpus.json").unwrap()
        };
        let source_config = SourceConfig {
            source_id: "test-file-source".to_string(),
            num_pipelines: NonZeroUsize::MIN,
            enabled: true,
            source_params: SourceParams::File(params.clone()),
            transform_config: None,
            input_format: SourceInputFormat::Json,
        };
        let index_uid = IndexUid::new_with_random_ulid("test-index");
        let source_runtime = SourceRuntimeBuilder::new(index_uid, source_config).build();
        let file_source = FileSourceFactory::typed_create_source(source_runtime, params)
            .await
            .unwrap();
        let file_source_actor = SourceActor {
            source: Box::new(file_source),
            doc_processor_mailbox,
        };
        let (_file_source_mailbox, file_source_handle) =
            universe.spawn_builder().spawn(file_source_actor);
        let (actor_termination, counters) = file_source_handle.join().await;
        assert!(actor_termination.is_success());
        assert_eq!(
            counters,
            serde_json::json!({
                "num_bytes_processed": 1030u64,
                "num_lines_processed": 4u32
            })
        );
        let batch = indexer_inbox.drain_for_test();
        assert_eq!(batch.len(), 2);
        batch[0].downcast_ref::<RawDocBatch>().unwrap();
        assert!(matches!(
            batch[1].downcast_ref::<Command>().unwrap(),
            Command::ExitWithSuccess
        ));
    }

    #[tokio::test]
    async fn test_file_source_several_batch() {
        aux_test_file_source_several_batch(false).await;
        aux_test_file_source_several_batch(true).await;
    }

    async fn aux_test_file_source_several_batch(gzip: bool) {
        quickwit_common::setup_logging_for_tests();
        let universe = Universe::with_accelerated_time();
        let (doc_processor_mailbox, doc_processor_inbox) = universe.create_test_mailbox();
        let lines = BATCH_NUM_BYTES_LIMIT as usize / DUMMY_DOC.len() + 1;
        let (temp_file, temp_file_size) = generate_dummy_doc_file(gzip, lines).await;
        let filepath = temp_file.path().to_str().unwrap();
        let uri = Uri::from_str(filepath).unwrap();
        let params = FileSourceParams::Filepath(uri.clone());
        let source_config = SourceConfig {
            source_id: "test-file-source".to_string(),
            num_pipelines: NonZeroUsize::MIN,
            enabled: true,
            source_params: SourceParams::File(params.clone()),
            transform_config: None,
            input_format: SourceInputFormat::Json,
        };
        let index_uid = IndexUid::new_with_random_ulid("test-index");
        let source_runtime = SourceRuntimeBuilder::new(index_uid, source_config).build();
        let file_source = FileSourceFactory::typed_create_source(source_runtime, params)
            .await
            .unwrap();
        let file_source_actor = SourceActor {
            source: Box::new(file_source),
            doc_processor_mailbox,
        };
        let (_file_source_mailbox, file_source_handle) =
            universe.spawn_builder().spawn(file_source_actor);
        let (actor_termination, counters) = file_source_handle.join().await;
        assert!(actor_termination.is_success());
        assert_eq!(
            counters,
            serde_json::json!({
                "num_lines_processed": lines,
                "num_bytes_processed": temp_file_size,
            })
        );
        let indexer_msgs = doc_processor_inbox.drain_for_test();
        assert_eq!(indexer_msgs.len(), 3);
        let batch1 = indexer_msgs[0].downcast_ref::<RawDocBatch>().unwrap();
        let batch2 = indexer_msgs[1].downcast_ref::<RawDocBatch>().unwrap();
        let command = indexer_msgs[2].downcast_ref::<Command>().unwrap();
        assert_eq!(
            format!("{:?}", &batch1.checkpoint_delta),
            format!(
                "∆({}:{})",
                uri, "(00000000000000000000..00000000000005242895]"
            )
        );
        assert_eq!(
            format!("{:?}", &batch2.checkpoint_delta),
            format!(
                "∆({}:{})",
                uri, "(00000000000005242895..~00000000000005397105]"
            )
        );
        assert!(matches!(command, &Command::ExitWithSuccess));
    }

    #[tokio::test]
    async fn test_file_source_resume_from_checkpoint() {
        aux_test_file_source_resume_from_checkpoint(false).await;
        aux_test_file_source_resume_from_checkpoint(true).await;
    }

    async fn aux_test_file_source_resume_from_checkpoint(gzip: bool) {
        quickwit_common::setup_logging_for_tests();
        let universe = Universe::with_accelerated_time();
        let (doc_processor_mailbox, doc_processor_inbox) = universe.create_test_mailbox();
        let temp_file = generate_index_doc_file(gzip, 100).await;
        let temp_file_path = temp_file.path().to_str().unwrap();
        let uri = Uri::from_str(temp_file_path).unwrap();
        let params = FileSourceParams::Filepath(uri.clone());
        let source_config = SourceConfig {
            source_id: "test-file-source".to_string(),
            num_pipelines: NonZeroUsize::MIN,
            enabled: true,
            source_params: SourceParams::File(params.clone()),
            transform_config: None,
            input_format: SourceInputFormat::Json,
        };
        let partition_id = PartitionId::from(uri.as_str());
        let source_checkpoint_delta = SourceCheckpointDelta::from_partition_delta(
            partition_id,
            Position::Beginning,
            Position::offset(16usize),
        )
        .unwrap();

        let index_uid = IndexUid::new_with_random_ulid("test-index");
        let source_runtime = SourceRuntimeBuilder::new(index_uid, source_config)
            .with_mock_metastore(Some(source_checkpoint_delta))
            .with_queues_dir(temp_file_path)
            .build();

        let file_source = FileSourceFactory::typed_create_source(source_runtime, params)
            .await
            .unwrap();
        let file_source_actor = SourceActor {
            source: Box::new(file_source),
            doc_processor_mailbox,
        };
        let (_file_source_mailbox, file_source_handle) =
            universe.spawn_builder().spawn(file_source_actor);
        let (actor_termination, counters) = file_source_handle.join().await;
        assert!(actor_termination.is_success());
        assert_eq!(
            counters,
            serde_json::json!({
                "num_bytes_processed": (800-16) as u64,
                "num_lines_processed": (100-2) as u64,
            })
        );
        let indexer_messages: Vec<RawDocBatch> = doc_processor_inbox.drain_for_test_typed();
        assert_eq!(
            indexer_messages[0].docs[0],
            Bytes::from_static(b"0000002\n")
        );
    }
}

#[cfg(all(test, feature = "sqs-localstack-tests"))]
mod localstack_tests {
    use std::str::FromStr;

    use quickwit_actors::Universe;
    use quickwit_common::rand::append_random_suffix;
    use quickwit_common::uri::Uri;
    use quickwit_config::{
        FileSourceMessageType, FileSourceNotification, FileSourceSqs, SourceConfig, SourceParams,
    };
    use quickwit_metastore::metastore_for_test;

    use super::*;
    use crate::models::RawDocBatch;
    use crate::source::SourceActor;
    use crate::source::doc_file_reader::file_test_helpers::generate_dummy_doc_file;
    use crate::source::queue_sources::sqs_queue::test_helpers::{
        create_queue, get_localstack_sqs_client, send_message,
    };
    use crate::source::test_setup_helper::setup_index;
    use crate::source::tests::SourceRuntimeBuilder;

    #[tokio::test]
    async fn test_file_source_sqs_notifications() {
        // queue setup
        let sqs_client = get_localstack_sqs_client().await.unwrap();
        let queue_url = create_queue(&sqs_client, "file-source-sqs-notifications").await;
        let (dummy_doc_file, _) = generate_dummy_doc_file(false, 10).await;
        let test_uri = Uri::from_str(dummy_doc_file.path().to_str().unwrap()).unwrap();
        send_message(&sqs_client, &queue_url, test_uri.as_str()).await;

        // source setup
        let source_params =
            FileSourceParams::Notifications(FileSourceNotification::Sqs(FileSourceSqs {
                queue_url,
                message_type: FileSourceMessageType::RawUri,
                deduplication_window_duration_secs: 100,
                deduplication_window_max_messages: 100,
                deduplication_cleanup_interval_secs: 60,
            }));
        let source_config = SourceConfig::for_test(
            "test-file-source-sqs-notifications",
            SourceParams::File(source_params.clone()),
        );
        let metastore = metastore_for_test();
        let index_id = append_random_suffix("test-sqs-index");
        let index_uid = setup_index(metastore.clone(), &index_id, &source_config, &[]).await;
        let source_runtime = SourceRuntimeBuilder::new(index_uid, source_config)
            .with_metastore(metastore)
            .build();
        let sqs_source = FileSourceFactory::typed_create_source(source_runtime, source_params)
            .await
            .unwrap();

        // actor setup
        let universe = Universe::with_accelerated_time();
        let (doc_processor_mailbox, doc_processor_inbox) = universe.create_test_mailbox();
        {
            let actor = SourceActor {
                source: Box::new(sqs_source),
                doc_processor_mailbox: doc_processor_mailbox.clone(),
            };
            let (_mailbox, handle) = universe.spawn_builder().spawn(actor);

            // run the source actor for a while
            tokio::time::timeout(Duration::from_millis(500), handle.join())
                .await
                .unwrap_err();

            let next_message = doc_processor_inbox
                .drain_for_test()
                .into_iter()
                .flat_map(|box_any| box_any.downcast::<RawDocBatch>().ok())
                .map(|box_raw_doc_batch| *box_raw_doc_batch)
                .next()
                .unwrap();
            assert_eq!(next_message.docs.len(), 10);
        }
        universe.assert_quit().await;
    }
}


================================================
FILE: quickwit/quickwit-indexing/src/source/gcp_pubsub_source.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::time::{Duration, Instant};
use std::{fmt, mem};

use anyhow::Context;
use async_trait::async_trait;
use bytes::Bytes;
use google_cloud_auth::credentials::CredentialsFile;
use google_cloud_gax::retry::RetrySetting;
use google_cloud_pubsub::client::{Client, ClientConfig};
use google_cloud_pubsub::subscription::Subscription;
use quickwit_actors::{ActorContext, ActorExitStatus, Mailbox};
use quickwit_common::rand::append_random_suffix;
use quickwit_config::PubSubSourceParams;
use quickwit_metastore::checkpoint::{PartitionId, SourceCheckpoint};
use quickwit_proto::metastore::SourceType;
use quickwit_proto::types::Position;
use serde_json::{Value as JsonValue, json};
use tokio::time;
use tracing::{debug, info, warn};

use super::{BATCH_NUM_BYTES_LIMIT, EMIT_BATCHES_TIMEOUT, SourceActor};
use crate::actors::DocProcessor;
use crate::source::{BatchBuilder, Source, SourceContext, SourceRuntime, TypedSourceFactory};

const DEFAULT_MAX_MESSAGES_PER_PULL: i32 = 1_000;

pub struct GcpPubSubSourceFactory;

#[async_trait]
impl TypedSourceFactory for GcpPubSubSourceFactory {
    type Source = GcpPubSubSource;
    type Params = PubSubSourceParams;

    async fn typed_create_source(
        source_runtime: SourceRuntime,
        source_params: PubSubSourceParams,
    ) -> anyhow::Result<Self::Source> {
        GcpPubSubSource::try_new(source_runtime, source_params).await
    }
}

#[derive(Default)]
pub struct GcpPubSubSourceState {
    /// Number of bytes processed by the source.
    num_bytes_processed: u64,
    /// Number of messages processed by the source.
    num_messages_processed: u64,
    /// Current position of the source, i.e. the position of the last message processed.
    current_position: Position,
    // Number of invalid messages, i.e., that were empty or could not be parsed.
    num_invalid_messages: u64,
    /// Number of time we looped without getting a single message
    num_consecutive_empty_batches: u64,
}

pub struct GcpPubSubSource {
    source_runtime: SourceRuntime,
    subscription_name: String,
    subscription: Subscription,
    state: GcpPubSubSourceState,
    backfill_mode_enabled: bool,
    partition_id: PartitionId,
    max_messages_per_pull: i32,
}

impl fmt::Debug for GcpPubSubSource {
    fn fmt(&self, formatter: &mut fmt::Formatter) -> fmt::Result {
        formatter
            .debug_struct("GcpPubSubSource")
            .field("index_id", &self.source_runtime.index_id())
            .field("source_id", &self.source_runtime.source_id())
            .field("subscription", &self.subscription)
            .finish()
    }
}

impl GcpPubSubSource {
    pub async fn try_new(
        source_runtime: SourceRuntime,
        source_params: PubSubSourceParams,
    ) -> anyhow::Result<Self> {
        let subscription_name = source_params.subscription;
        let backfill_mode_enabled = source_params.enable_backfill_mode;
        let max_messages_per_pull = source_params
            .max_messages_per_pull
            .unwrap_or(DEFAULT_MAX_MESSAGES_PER_PULL);

        let mut client_config: ClientConfig = match source_params.credentials_file {
            Some(credentials_file) => {
                let credentials = CredentialsFile::new_from_file(credentials_file.clone())
                    .await
                    .with_context(|| {
                        format!(
                            "failed to load GCP PubSub credentials file from `{credentials_file}`"
                        )
                    })?;
                ClientConfig::default().with_credentials(credentials).await
            }
            _ => ClientConfig::default().with_auth().await,
        }
        .context("failed to create GCP PubSub client config")?;

        if source_params.project_id.is_some() {
            client_config.project_id = source_params.project_id
        }

        let client = Client::new(client_config)
            .await
            .context("failed to create GCP PubSub client")?;
        let subscription = client.subscription(&subscription_name);
        // TODO: replace with "<node_id>/<index_id>/<source_id>/<pipeline_ord>"
        let partition_id = append_random_suffix(&format!("gpc-pubsub-{subscription_name}"));
        let partition_id = PartitionId::from(partition_id);

        info!(
            index_id=%source_runtime.index_id(),
            source_id=%source_runtime.source_id(),
            subscription=%subscription_name,
            max_messages_per_pull=%max_messages_per_pull,
            "starting GCP PubSub source"
        );
        if !subscription.exists(Some(RetrySetting::default())).await? {
            anyhow::bail!("GCP PubSub subscription `{subscription_name}` does not exist");
        }
        Ok(Self {
            source_runtime,
            subscription_name,
            subscription,
            state: GcpPubSubSourceState::default(),
            backfill_mode_enabled,
            partition_id,
            max_messages_per_pull,
        })
    }

    fn should_exit(&self) -> bool {
        self.backfill_mode_enabled && self.state.num_consecutive_empty_batches >= 10
    }
}

#[async_trait]
impl Source for GcpPubSubSource {
    async fn emit_batches(
        &mut self,
        doc_processor_mailbox: &Mailbox<DocProcessor>,
        ctx: &SourceContext,
    ) -> Result<Duration, ActorExitStatus> {
        let now = Instant::now();
        let mut batch_builder = BatchBuilder::new(SourceType::PubSub);
        let deadline = time::sleep(*EMIT_BATCHES_TIMEOUT);
        tokio::pin!(deadline);
        // TODO: ensure we ACK the message after being commit: at least once
        // TODO: ensure we increase_ack_deadline for the items
        loop {
            tokio::select! {
                resp = self.pull_message_batch(&mut batch_builder) => {
                    if let Err(err) = resp {
                        warn!("failed to pull messages from subscription `{}`: {:?}", self.subscription_name, err);
                    }
                    if batch_builder.num_bytes >= BATCH_NUM_BYTES_LIMIT {
                        break;
                    }
                }
                _ = &mut deadline => {
                    break;
                }
            }
            ctx.record_progress();
        }

        if batch_builder.num_bytes > 0 {
            self.state.num_consecutive_empty_batches = 0
        } else {
            self.state.num_consecutive_empty_batches += 1
        }

        // TODO: need to wait for all the id to be ack for at_least_once
        if self.should_exit() {
            info!(subscription=%self.subscription_name, "reached end of subscription");
            ctx.send_exit_with_success(doc_processor_mailbox).await?;
            return Err(ActorExitStatus::Success);
        }
        if !batch_builder.checkpoint_delta.is_empty() {
            debug!(
                num_bytes=%batch_builder.num_bytes,
                num_docs=%batch_builder.docs.len(),
                num_millis=%now.elapsed().as_millis(),
                "Sending doc batch to indexer.");
            let message = batch_builder.build();
            ctx.send_message(doc_processor_mailbox, message).await?;
        }
        Ok(Duration::default())
    }

    async fn suggest_truncate(
        &mut self,
        _checkpoint: SourceCheckpoint,
        _ctx: &ActorContext<SourceActor>,
    ) -> anyhow::Result<()> {
        // TODO: add ack of ids
        Ok(())
    }

    fn name(&self) -> String {
        format!("{self:?}")
    }

    fn observable_state(&self) -> JsonValue {
        json!({
            "index_id": self.source_runtime.index_id(),
            "source_id": self.source_runtime.source_id(),
            "subscription": self.subscription_name,
            "num_bytes_processed": self.state.num_bytes_processed,
            "num_messages_processed": self.state.num_messages_processed,
            "num_invalid_messages": self.state.num_invalid_messages,
            "num_consecutive_empty_batches": self.state.num_consecutive_empty_batches,
        })
    }
}

impl GcpPubSubSource {
    async fn pull_message_batch(&mut self, batch: &mut BatchBuilder) -> anyhow::Result<()> {
        let messages = self
            .subscription
            .pull(self.max_messages_per_pull, None)
            .await
            .context("failed to pull messages from subscription")?;

        let Some(last_message) = messages.last() else {
            return Ok(());
        };
        let message_id = last_message.message.message_id.clone();
        let publish_timestamp_millis = last_message
            .message
            .publish_time
            .as_ref()
            .map(|timestamp| timestamp.seconds * 1_000 + (timestamp.nanos as i64 / 1_000_000))
            .unwrap_or(0); // TODO: Replace with now UTC millis.

        for message in messages {
            message.ack().await?; // TODO: remove ACK here when doing at least once
            self.state.num_messages_processed += 1;
            self.state.num_bytes_processed += message.message.data.len() as u64;
            let doc: Bytes = Bytes::from(message.message.data);
            if doc.is_empty() {
                self.state.num_invalid_messages += 1;
            } else {
                batch.add_doc(doc);
            }
        }
        let to_position = Position::from(format!(
            "{}:{message_id}:{publish_timestamp_millis}",
            self.state.num_messages_processed
        ));
        let from_position = mem::replace(&mut self.state.current_position, to_position.clone());

        batch
            .checkpoint_delta
            .record_partition_delta(self.partition_id.clone(), from_position, to_position)
            .context("failed to record partition delta")?;
        Ok(())
    }
}

// TODO: first implementation of the test
// After we need to ensure at_least_once and concurrent pipeline
#[cfg(all(test, feature = "gcp-pubsub-emulator-tests"))]
mod gcp_pubsub_emulator_tests {
    use std::env::var;
    use std::num::NonZeroUsize;

    use google_cloud_googleapis::pubsub::v1::PubsubMessage;
    use google_cloud_pubsub::publisher::Publisher;
    use google_cloud_pubsub::subscription::SubscriptionConfig;
    use quickwit_actors::Universe;
    use quickwit_config::{SourceConfig, SourceInputFormat, SourceParams};
    use quickwit_proto::types::{IndexId, IndexUid};
    use serde_json::json;

    use super::*;
    use crate::models::RawDocBatch;
    use crate::source::quickwit_supported_sources;
    use crate::source::tests::SourceRuntimeBuilder;

    static GCP_TEST_PROJECT: &str = "quickwit-emulator";

    fn get_source_config(subscription: &str) -> SourceConfig {
        var("PUBSUB_EMULATOR_HOST").expect(
            "environment variable `PUBSUB_EMULATOR_HOST` should be set when running GCP PubSub \
             source tests",
        );
        let source_id = append_random_suffix("test-gcp-pubsub-source--source");
        SourceConfig {
            source_id,
            num_pipelines: NonZeroUsize::MIN,
            enabled: true,
            source_params: SourceParams::PubSub(PubSubSourceParams {
                project_id: Some(GCP_TEST_PROJECT.to_string()),
                enable_backfill_mode: true,
                subscription: subscription.to_string(),
                credentials_file: None,
                max_messages_per_pull: None,
            }),
            transform_config: None,
            input_format: SourceInputFormat::Json,
        }
    }

    async fn create_topic_and_subscription(topic: &str, subscription: &str) -> Publisher {
        let client_config = google_cloud_pubsub::client::ClientConfig {
            project_id: Some(GCP_TEST_PROJECT.to_string()),
            ..Default::default()
        };
        let client = Client::new(client_config.with_auth().await.unwrap())
            .await
            .unwrap();
        let subscription_config = SubscriptionConfig::default();

        let created_topic = client.create_topic(topic, None, None).await.unwrap();
        client
            .create_subscription(subscription, topic, subscription_config, None)
            .await
            .unwrap();
        created_topic.new_publisher(None)
    }

    #[tokio::test]
    async fn test_gcp_pubsub_source_invalid_subscription() {
        let subscription =
            append_random_suffix("test-gcp-pubsub-source--invalid-subscription--subscription");
        let source_config = get_source_config(&subscription);

        let index_id = append_random_suffix("test-gcp-pubsub-source--invalid-subscription--index");
        let index_uid = IndexUid::new_with_random_ulid(&index_id);
        let SourceParams::PubSub(params) = source_config.clone().source_params else {
            panic!(
                "Expected `SourceParams::GcpPubSub` source params, got {:?}",
                source_config.source_params
            );
        };
        let source_runtime = SourceRuntimeBuilder::new(index_uid, source_config).build();
        GcpPubSubSource::try_new(source_runtime, params)
            .await
            .unwrap_err();
    }

    #[tokio::test]
    async fn test_gcp_pubsub_source() {
        let universe = Universe::with_accelerated_time();

        let topic = append_random_suffix("test-gcp-pubsub-source--topic");
        let subscription = append_random_suffix("test-gcp-pubsub-source--subscription");
        let publisher = create_topic_and_subscription(&topic, &subscription).await;

        let source_config = get_source_config(&subscription);
        let source_id = source_config.source_id.clone();

        let source_loader = quickwit_supported_sources();
        let index_id: IndexId = append_random_suffix("test-gcp-pubsub-source--index");
        let index_uid = IndexUid::new_with_random_ulid(&index_id);

        let mut pubsub_messages = Vec::with_capacity(6);
        for i in 0..6 {
            let pubsub_message = PubsubMessage {
                data: format!("Message {i}").into(),
                ..Default::default()
            };
            pubsub_messages.push(pubsub_message);
        }
        let awaiters = publisher.publish_bulk(pubsub_messages).await;
        for awaiter in awaiters {
            awaiter.get().await.unwrap();
        }
        let source_runtime = SourceRuntimeBuilder::new(index_uid, source_config).build();
        let source = source_loader.load_source(source_runtime).await.unwrap();

        let (doc_processor_mailbox, doc_processor_inbox) = universe.create_test_mailbox();
        let source_actor = SourceActor {
            source,
            doc_processor_mailbox: doc_processor_mailbox.clone(),
        };
        let (_source_mailbox, source_handle) = universe.spawn_builder().spawn(source_actor);
        let (exit_status, exit_state) = source_handle.join().await;
        assert!(exit_status.is_success());

        let messages: Vec<RawDocBatch> = doc_processor_inbox.drain_for_test_typed();
        assert_eq!(messages.len(), 1);
        let expected_docs = vec![
            "Message 0",
            "Message 1",
            "Message 2",
            "Message 3",
            "Message 4",
            "Message 5",
        ];
        assert_eq!(messages[0].docs, expected_docs);
        let expected_exit_state = json!({
            "index_id": index_id,
            "source_id": source_id,
            "subscription": subscription,
            "num_bytes_processed": 54,
            "num_messages_processed": 6,
            "num_invalid_messages": 0,
            "num_consecutive_empty_batches": 10,
        });
        assert_eq!(exit_state, expected_exit_state);
    }
}


================================================
FILE: quickwit/quickwit-indexing/src/source/ingest/mod.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::BTreeSet;
use std::fmt;
use std::time::Duration;

use anyhow::Context;
use async_trait::async_trait;
use fnv::FnvHashMap;
use itertools::Itertools;
use quickwit_actors::{ActorExitStatus, Mailbox};
use quickwit_common::pubsub::EventBroker;
use quickwit_common::retry::RetryParams;
use quickwit_ingest::{
    FetchStreamError, IngesterPool, MRecord, MultiFetchStream, decoded_mrecords,
};
use quickwit_metastore::checkpoint::{PartitionId, SourceCheckpoint};
use quickwit_proto::ingest::IngestV2Error;
use quickwit_proto::ingest::ingester::{
    FetchEof, FetchPayload, IngesterService, TruncateShardsRequest, TruncateShardsSubrequest,
    fetch_message,
};
use quickwit_proto::metastore::{
    AcquireShardsRequest, AcquireShardsResponse, MetastoreService, MetastoreServiceClient,
    SourceType,
};
use quickwit_proto::types::{
    NodeId, PipelineUid, Position, PublishToken, ShardId, SourceId, SourceUid,
};
use serde::Serialize;
use serde_json::json;
use tokio::time;
use tracing::{debug, error, info, warn};
use ulid::Ulid;

use super::{
    BATCH_NUM_BYTES_LIMIT, BatchBuilder, EMIT_BATCHES_TIMEOUT, Source, SourceContext,
    SourceRuntime, TypedSourceFactory,
};
use crate::actors::DocProcessor;
use crate::models::{LocalShardPositionsUpdate, NewPublishLock, NewPublishToken, PublishLock};

pub struct IngestSourceFactory;

#[async_trait]
impl TypedSourceFactory for IngestSourceFactory {
    type Source = IngestSource;
    type Params = ();

    async fn typed_create_source(
        source_runtime: SourceRuntime,
        _params: Self::Params,
    ) -> anyhow::Result<Self::Source> {
        // Retry parameters for the fetch stream: retry indefinitely until the shard is complete or
        // unassigned.
        let retry_params = RetryParams {
            max_attempts: usize::MAX,
            base_delay: Duration::from_secs(5),
            max_delay: Duration::from_secs(10 * 60), // 10 minutes
        };
        IngestSource::try_new(source_runtime, retry_params).await
    }
}

/// The [`ClientId`] is a unique identifier for a client of the ingest service and allows to
/// distinguish which indexers are streaming documents from a shard. It is also used to form a
/// publish token.
#[derive(Debug, Clone)]
struct ClientId {
    node_id: NodeId,
    source_uid: SourceUid,
    pipeline_uid: PipelineUid,
}

impl fmt::Display for ClientId {
    fn fmt(&self, formatter: &mut fmt::Formatter) -> fmt::Result {
        write!(
            formatter,
            "indexer/{}/{}/{}/{}",
            self.node_id, self.source_uid.index_uid, self.source_uid.source_id, self.pipeline_uid
        )
    }
}

impl ClientId {
    fn new(node_id: NodeId, source_uid: SourceUid, pipeline_uid: PipelineUid) -> Self {
        ClientId {
            node_id,
            source_uid,
            pipeline_uid,
        }
    }

    fn new_publish_token(&self) -> String {
        let ulid = if cfg!(test) { Ulid::nil() } else { Ulid::new() };
        format!("{self}/{ulid}")
    }
}

#[derive(Debug, Clone, Copy, Default, Eq, PartialEq, Serialize)]
#[serde(rename_all = "snake_case")]
enum IndexingStatus {
    #[default]
    // Indexing is in progress.
    Active,
    // All documents have been indexed AND published.
    Complete,
    Error,
    // The shard no longer exists.
    NotFound,
    // We have received all documents from the stream. Note that they
    // are not necessarily published yet.
    ReachedEof,
}

#[derive(Debug, Eq, PartialEq)]
struct AssignedShard {
    leader_id: NodeId,
    follower_id_opt: Option<NodeId>,
    // This is just the shard id converted to a partition id object.
    partition_id: PartitionId,
    current_position_inclusive: Position,
    status: IndexingStatus,
}

/// Streams documents from a set of shards.
pub struct IngestSource {
    client_id: ClientId,
    metastore: MetastoreServiceClient,
    ingester_pool: IngesterPool,
    assigned_shards: FnvHashMap<ShardId, AssignedShard>,
    fetch_stream: MultiFetchStream,
    publish_lock: PublishLock,
    publish_token: PublishToken,
    event_broker: EventBroker,
}

impl fmt::Debug for IngestSource {
    fn fmt(&self, formatter: &mut fmt::Formatter) -> fmt::Result {
        formatter.debug_struct("IngestSource").finish()
    }
}

impl IngestSource {
    pub async fn try_new(
        source_runtime: SourceRuntime,
        retry_params: RetryParams,
    ) -> anyhow::Result<IngestSource> {
        let self_node_id: NodeId = source_runtime.node_id().into();
        let client_id = ClientId::new(
            self_node_id.clone(),
            SourceUid {
                index_uid: source_runtime.index_uid().clone(),
                source_id: source_runtime.source_id().to_string(),
            },
            source_runtime.pipeline_uid(),
        );
        let metastore = source_runtime.metastore.clone();
        let ingester_pool = source_runtime.ingester_pool.clone();
        let assigned_shards = FnvHashMap::default();
        let fetch_stream = MultiFetchStream::new(
            self_node_id,
            client_id.to_string(),
            ingester_pool.clone(),
            retry_params,
        );
        // We start as dead. The first reset with a non-empty list of shards will create an alive
        // publish lock.
        let publish_lock = PublishLock::dead();
        let publish_token = client_id.new_publish_token();

        Ok(IngestSource {
            client_id,
            metastore,
            ingester_pool,
            assigned_shards,
            fetch_stream,
            publish_lock,
            publish_token,
            event_broker: source_runtime.event_broker.clone(),
        })
    }

    fn process_fetch_payload(
        &mut self,
        batch_builder: &mut BatchBuilder,
        fetch_payload: FetchPayload,
    ) -> anyhow::Result<()> {
        let mrecord_batch = match &fetch_payload.mrecord_batch {
            Some(mrecord_batch) if !mrecord_batch.is_empty() => mrecord_batch,
            _ => {
                warn!("received empty mrecord batch");
                return Ok(());
            }
        };
        let assigned_shard = self
            .assigned_shards
            .get_mut(fetch_payload.shard_id())
            .expect("shard should be assigned");

        assigned_shard.status = IndexingStatus::Active;

        let partition_id = assigned_shard.partition_id.clone();
        let from_position_exclusive = fetch_payload.from_position_exclusive();
        let to_position_inclusive = fetch_payload.to_position_inclusive();

        for mrecord in decoded_mrecords(mrecord_batch) {
            match mrecord {
                MRecord::Doc(doc) => {
                    batch_builder.add_doc(doc);
                }
                MRecord::Commit => {
                    batch_builder.force_commit();
                }
            }
        }
        batch_builder
            .checkpoint_delta
            .record_partition_delta(
                partition_id,
                from_position_exclusive,
                to_position_inclusive.clone(),
            )
            .context("failed to record partition delta")?;
        assigned_shard.current_position_inclusive = to_position_inclusive;
        Ok(())
    }

    fn process_fetch_eof(
        &mut self,
        batch_builder: &mut BatchBuilder,
        fetch_eof: FetchEof,
    ) -> anyhow::Result<()> {
        let assigned_shard = self
            .assigned_shards
            .get_mut(fetch_eof.shard_id())
            .expect("shard should be assigned");

        assigned_shard.status = IndexingStatus::ReachedEof;

        let partition_id = assigned_shard.partition_id.clone();
        let from_position_exclusive = assigned_shard.current_position_inclusive.clone();
        let to_position_inclusive = fetch_eof.eof_position();

        batch_builder
            .checkpoint_delta
            .record_partition_delta(
                partition_id,
                from_position_exclusive,
                to_position_inclusive.clone(),
            )
            .context("failed to record partition delta")?;
        assigned_shard.current_position_inclusive = to_position_inclusive;
        Ok(())
    }

    fn process_fetch_stream_error(
        &mut self,
        batch_builder: &mut BatchBuilder,
        fetch_stream_error: FetchStreamError,
    ) -> anyhow::Result<()> {
        let Some(assigned_shard) = self.assigned_shards.get_mut(&fetch_stream_error.shard_id)
        else {
            return Ok(());
        };
        if assigned_shard.status == IndexingStatus::Complete {
            return Ok(());
        }
        if let IngestV2Error::ShardNotFound { .. } = fetch_stream_error.ingest_error {
            batch_builder.checkpoint_delta.record_partition_delta(
                assigned_shard.partition_id.clone(),
                assigned_shard.current_position_inclusive.clone(),
                assigned_shard.current_position_inclusive.as_eof(),
            )?;
            assigned_shard.current_position_inclusive.to_eof();
            assigned_shard.status = IndexingStatus::NotFound;
        } else if assigned_shard.status != IndexingStatus::ReachedEof {
            assigned_shard.status = IndexingStatus::Error;
        }
        Ok(())
    }

    async fn truncate(&mut self, truncate_up_to_positions: Vec<(ShardId, Position)>) {
        if truncate_up_to_positions.is_empty() {
            return;
        }
        let shard_positions_update = LocalShardPositionsUpdate::new(
            self.client_id.source_uid.clone(),
            truncate_up_to_positions.clone(),
        );
        // Let's record all shards that have reached Eof as complete.
        for (shard, truncate_up_to_position_inclusive) in &truncate_up_to_positions {
            if truncate_up_to_position_inclusive.is_eof()
                && let Some(assigned_shard) = self.assigned_shards.get_mut(shard)
            {
                assigned_shard.status = IndexingStatus::Complete;
            }
        }

        // We publish the event to the event broker.
        self.event_broker.publish(shard_positions_update);

        // Finally, we push the information to ingesters in a best effort manner.
        // If the request fails, we just log an error.
        let mut per_ingester_truncate_subrequests: FnvHashMap<
            &NodeId,
            Vec<TruncateShardsSubrequest>,
        > = FnvHashMap::default();

        for (shard_id, truncate_up_to_position_inclusive) in truncate_up_to_positions {
            if truncate_up_to_position_inclusive.is_beginning() {
                continue;
            }
            let Some(shard) = self.assigned_shards.get(&shard_id) else {
                warn!("failed to truncate shard `{shard_id}`: shard is no longer assigned");
                continue;
            };
            let truncate_shards_subrequest = TruncateShardsSubrequest {
                index_uid: self.client_id.source_uid.index_uid.clone().into(),
                source_id: self.client_id.source_uid.source_id.clone(),
                shard_id: Some(shard_id),
                truncate_up_to_position_inclusive: Some(truncate_up_to_position_inclusive),
            };
            if let Some(follower_id) = &shard.follower_id_opt {
                per_ingester_truncate_subrequests
                    .entry(follower_id)
                    .or_default()
                    .push(truncate_shards_subrequest.clone());
            }
            per_ingester_truncate_subrequests
                .entry(&shard.leader_id)
                .or_default()
                .push(truncate_shards_subrequest);
        }
        for (ingester_id, truncate_subrequests) in per_ingester_truncate_subrequests {
            let Some(ingester) = self.ingester_pool.get(ingester_id) else {
                warn!("failed to truncate shard(s): ingester `{ingester_id}` is unavailable");
                continue;
            };
            let truncate_shards_request = TruncateShardsRequest {
                ingester_id: ingester_id.clone().into(),
                subrequests: truncate_subrequests,
            };
            let truncate_future = async move {
                let retry_params = RetryParams {
                    base_delay: Duration::from_secs(1),
                    max_delay: Duration::from_secs(10),
                    max_attempts: 5,
                };
                for num_attempts in 1..=retry_params.max_attempts {
                    let Err(error) = ingester
                        .client
                        .truncate_shards(truncate_shards_request.clone())
                        .await
                    else {
                        return;
                    };
                    let delay = retry_params.compute_delay(num_attempts);
                    time::sleep(delay).await;

                    if num_attempts == retry_params.max_attempts {
                        warn!(
                            ingester_id=%truncate_shards_request.ingester_id,
                            "failed to truncate shard(s): {error}"
                        );
                    }
                }
            };
            // Truncation is best-effort, so fire and forget.
            tokio::spawn(truncate_future);
        }
    }

    /// If the new assignment removes a shard that we were in the middle of indexing (ie they have
    /// not reached `IndexingStatus::Complete` status yet), we need to reset the pipeline:
    ///
    /// Ongoing work and splits traveling through the pipeline will be dropped.
    ///
    /// After this method has returned we are guaranteed to have the following post condition:
    /// - a alive publish lock / non-empty publish token
    /// - all currently assigned shards included in the `new_assigned_shard_ids` set.
    async fn reset_if_needed(
        &mut self,
        new_assigned_shard_ids: &BTreeSet<ShardId>,
        doc_processor_mailbox: &Mailbox<DocProcessor>,
        ctx: &SourceContext,
    ) -> anyhow::Result<()> {
        // No need to do anything if the list of shards before and after are empty.
        if new_assigned_shard_ids.is_empty() && self.assigned_shards.is_empty() {
            return Ok(());
        }
        // There are two reasons why we might want to reset the pipeline.
        // 1) it has never been initialized in the first place. This happens typically on the first
        // call to `assign_shards` with a non-empty list of shards. We check that by looking at
        // whether the publish lock is dead or not.
        // 2) we are removing a shard that has not reached the complete status yet.
        let reset_needed: bool = self.publish_lock.is_dead()
            || self
                .assigned_shards
                .keys()
                .filter(|&shard_id| !new_assigned_shard_ids.contains(shard_id))
                .any(|removed_shard_id| {
                    let Some(assigned_shard) = self.assigned_shards.get(removed_shard_id) else {
                        return false;
                    };
                    assigned_shard.status != IndexingStatus::Complete
                });

        if !reset_needed {
            // Not need to reset the fetch streams, we can just remove the shard that have been
            // completely indexed.
            self.assigned_shards.retain(|shard_id, assignment| {
                if new_assigned_shard_ids.contains(shard_id) {
                    true
                } else {
                    assert_eq!(assignment.status, IndexingStatus::Complete);
                    false
                }
            });
            return Ok(());
        }
        info!(
            index_uid=%self.client_id.source_uid.index_uid,
            pipeline_uid=%self.client_id.pipeline_uid,
            "resetting indexing pipeline"
        );
        self.assigned_shards.clear();
        self.fetch_stream.reset();
        self.publish_lock.kill().await;
        self.publish_lock = PublishLock::default();
        self.publish_token = self.client_id.new_publish_token();
        ctx.send_message(
            doc_processor_mailbox,
            NewPublishLock(self.publish_lock.clone()),
        )
        .await?;
        ctx.send_message(
            doc_processor_mailbox,
            NewPublishToken(self.publish_token.clone()),
        )
        .await?;
        Ok(())
    }
}

#[async_trait]
impl Source for IngestSource {
    async fn emit_batches(
        &mut self,
        doc_processor_mailbox: &Mailbox<DocProcessor>,
        ctx: &SourceContext,
    ) -> Result<Duration, ActorExitStatus> {
        let mut batch_builder = BatchBuilder::new(SourceType::IngestV2);

        let now = time::Instant::now();
        let deadline = now + *EMIT_BATCHES_TIMEOUT;
        loop {
            match time::timeout_at(deadline, self.fetch_stream.next()).await {
                Ok(Ok(fetch_message)) => match fetch_message.message {
                    Some(fetch_message::Message::Payload(fetch_payload)) => {
                        self.process_fetch_payload(&mut batch_builder, fetch_payload)?;

                        if batch_builder.num_bytes >= BATCH_NUM_BYTES_LIMIT {
                            break;
                        }
                    }
                    Some(fetch_message::Message::Eof(fetch_eof)) => {
                        self.process_fetch_eof(&mut batch_builder, fetch_eof)?;
                    }
                    None => {
                        warn!("received empty fetch message");
                        continue;
                    }
                },
                Ok(Err(fetch_stream_error)) => {
                    self.process_fetch_stream_error(&mut batch_builder, fetch_stream_error)?;
                }
                Err(_) => {
                    // The deadline has elapsed.
                    break;
                }
            }
            ctx.record_progress();
        }
        if !batch_builder.checkpoint_delta.is_empty() {
            debug!(
                num_docs=%batch_builder.docs.len(),
                num_bytes=%batch_builder.num_bytes,
                num_millis=%now.elapsed().as_millis(),
                "Sending doc batch to indexer."
            );
            let message = batch_builder.build();
            ctx.send_message(doc_processor_mailbox, message).await?;
        }
        Ok(Duration::default())
    }

    async fn assign_shards(
        &mut self,
        new_assigned_shard_ids: BTreeSet<ShardId>,
        doc_processor_mailbox: &Mailbox<DocProcessor>,
        ctx: &SourceContext,
    ) -> anyhow::Result<()> {
        self.reset_if_needed(&new_assigned_shard_ids, doc_processor_mailbox, ctx)
            .await?;

        // As enforced by `reset_if_needed`, at this point, all currently assigned shards should be
        // in the new_assigned_shards.
        debug_assert!(
            self.assigned_shards
                .keys()
                .all(|shard_id| new_assigned_shard_ids.contains(shard_id))
        );

        if self.assigned_shards.len() == new_assigned_shard_ids.len() {
            // Nothing to do.
            // The set shards is unchanged.
            return Ok(());
        }

        let added_shard_ids: Vec<ShardId> = new_assigned_shard_ids
            .into_iter()
            .filter(|shard_id| !self.assigned_shards.contains_key(shard_id))
            .collect();

        assert!(!added_shard_ids.is_empty());
        info!(added_shards=?added_shard_ids, "adding shards assignment");

        let acquire_shards_request = AcquireShardsRequest {
            index_uid: Some(self.client_id.source_uid.index_uid.clone()),
            source_id: self.client_id.source_uid.source_id.clone(),
            shard_ids: added_shard_ids.clone(),
            publish_token: self.publish_token.clone(),
        };
        let acquire_shards_response: AcquireShardsResponse = ctx
            .protect_future(self.metastore.acquire_shards(acquire_shards_request))
            .await
            .context("failed to acquire shards")?;

        if acquire_shards_response.acquired_shards.len() != added_shard_ids.len() {
            let missing_shards = added_shard_ids
                .iter()
                .filter(|shard_id| {
                    !acquire_shards_response
                        .acquired_shards
                        .iter()
                        .any(|acquired_shard| acquired_shard.shard_id() == *shard_id)
                })
                .collect::<Vec<_>>();
            // This can happen if the shards have been deleted by the control plane, after building
            // the plan and before the apply terminated. See #4888.
            info!(missing_shards=?missing_shards, "failed to acquire all assigned shards");
        }

        let mut truncate_up_to_positions =
            Vec::with_capacity(acquire_shards_response.acquired_shards.len());

        for acquired_shard in acquire_shards_response.acquired_shards {
            let index_uid = acquired_shard.index_uid().clone();
            let shard_id = acquired_shard.shard_id().clone();
            let mut current_position_inclusive = acquired_shard.publish_position_inclusive();
            let leader_id: NodeId = acquired_shard.leader_id.into();
            let follower_id_opt: Option<NodeId> = acquired_shard.follower_id.map(Into::into);
            let source_id: SourceId = acquired_shard.source_id;
            let partition_id = PartitionId::from(shard_id.as_str());
            let from_position_exclusive = current_position_inclusive.clone();

            let status = if from_position_exclusive.is_eof() {
                IndexingStatus::Complete
            } else if let Err(error) = ctx
                .protect_future(self.fetch_stream.subscribe(
                    leader_id.clone(),
                    follower_id_opt.clone(),
                    index_uid,
                    source_id,
                    shard_id.clone(),
                    from_position_exclusive,
                ))
                .await
            {
                if let IngestV2Error::ShardNotFound { .. } = error {
                    error!("failed to subscribe to shard `{shard_id}`: shard not found");
                    current_position_inclusive.to_eof();
                    IndexingStatus::NotFound
                } else {
                    error!(%error, "failed to subscribe to shard `{shard_id}`");
                    IndexingStatus::Error
                }
            } else {
                IndexingStatus::Active
            };
            truncate_up_to_positions.push((shard_id.clone(), current_position_inclusive.clone()));

            let assigned_shard = AssignedShard {
                leader_id,
                follower_id_opt,
                partition_id,
                current_position_inclusive,
                status,
            };
            self.assigned_shards.insert(shard_id, assigned_shard);
        }

        self.truncate(truncate_up_to_positions).await;

        Ok(())
    }

    async fn suggest_truncate(
        &mut self,
        checkpoint: SourceCheckpoint,
        _ctx: &SourceContext,
    ) -> anyhow::Result<()> {
        let truncate_up_to_positions: Vec<(ShardId, Position)> = checkpoint
            .iter()
            .map(|(partition_id, position)| {
                let shard_id = ShardId::from(partition_id.as_str());
                (shard_id, position)
            })
            .collect();
        self.truncate(truncate_up_to_positions).await;
        Ok(())
    }

    fn name(&self) -> String {
        "IngestSource".to_string()
    }

    fn observable_state(&self) -> serde_json::Value {
        let assigned_shards: Vec<serde_json::Value> = self
            .assigned_shards
            .iter()
            .sorted_by(|(left_shard_id, _), (right_shard_id, _)| left_shard_id.cmp(right_shard_id))
            .map(|(shard_id, assigned_shard)| {
                json!({
                    "shard_id": *shard_id,
                    "current_position": assigned_shard.current_position_inclusive,
                    "status": assigned_shard.status,
                })
            })
            .collect();
        json!({
            "client_id": self.client_id.to_string(),
            "assigned_shards": assigned_shards,
            "publish_token": self.publish_token,
        })
    }
}

#[cfg(test)]
mod tests {
    use std::iter::once;
    use std::path::PathBuf;
    use std::sync::Arc;
    use std::sync::atomic::AtomicBool;

    use bytesize::ByteSize;
    use itertools::Itertools;
    use quickwit_actors::{ActorContext, Universe};
    use quickwit_common::ServiceStream;
    use quickwit_common::metrics::MEMORY_METRICS;
    use quickwit_common::stream_utils::InFlightValue;
    use quickwit_config::{IndexingSettings, SourceConfig, SourceParams};
    use quickwit_ingest::IngesterPoolEntry;
    use quickwit_proto::indexing::IndexingPipelineId;
    use quickwit_proto::ingest::ingester::{
        FetchMessage, IngesterServiceClient, MockIngesterService, TruncateShardsResponse,
    };
    use quickwit_proto::ingest::{IngestV2Error, MRecordBatch, Shard, ShardState};
    use quickwit_proto::metastore::{AcquireShardsResponse, MockMetastoreService};
    use quickwit_proto::types::{DocMappingUid, IndexUid, PipelineUid};
    use quickwit_storage::StorageResolver;
    use tokio::sync::mpsc::error::TryRecvError;
    use tokio::sync::watch;

    use super::*;
    use crate::models::RawDocBatch;
    use crate::source::SourceActor;

    // In this test, we simulate a source to which we sequentially assign the following set of
    // shards []
    // [1] (triggers a reset, and the creation of a publish lock)
    // [1,2]
    // [2,3] (which triggers a reset)
    #[tokio::test]
    async fn test_ingest_source_assign_shards() {
        let pipeline_id = IndexingPipelineId {
            node_id: NodeId::from("test-node"),
            index_uid: IndexUid::for_test("test-index", 0),
            source_id: "test-source".to_string(),
            pipeline_uid: PipelineUid::default(),
        };
        let source_config = SourceConfig::for_test("test-source", SourceParams::Ingest);
        let publish_token = "indexer/test-node/test-index:0/test-source/\
                             00000000000000000000000000/00000000000000000000000000";

        let mut mock_metastore = MockMetastoreService::new();
        mock_metastore
            .expect_acquire_shards()
            .withf(|request| request.shard_ids == [ShardId::from(0)])
            .once()
            .returning(|request| {
                assert_eq!(request.index_uid(), &("test-index", 0));
                assert_eq!(request.source_id, "test-source");
                let response = AcquireShardsResponse {
                    acquired_shards: vec![Shard {
                        index_uid: Some(IndexUid::for_test("test-index", 0)),
                        source_id: "test-source".to_string(),
                        leader_id: "test-ingester-0".to_string(),
                        follower_id: None,
                        shard_id: Some(ShardId::from(0)),
                        shard_state: ShardState::Open as i32,
                        doc_mapping_uid: Some(DocMappingUid::default()),
                        publish_position_inclusive: Some(Position::offset(10u64)),
                        publish_token: Some(publish_token.to_string()),
                        update_timestamp: 1724158996,
                    }],
                };
                Ok(response)
            });
        mock_metastore
            .expect_acquire_shards()
            .once()
            .withf(|request| request.shard_ids == [ShardId::from(1)])
            .returning(|request| {
                assert_eq!(request.index_uid(), &("test-index", 0));
                assert_eq!(request.source_id, "test-source");

                let response = AcquireShardsResponse {
                    acquired_shards: vec![Shard {
                        leader_id: "test-ingester-0".to_string(),
                        follower_id: None,
                        index_uid: Some(IndexUid::for_test("test-index", 0)),
                        source_id: "test-source".to_string(),
                        shard_id: Some(ShardId::from(1)),
                        shard_state: ShardState::Open as i32,
                        doc_mapping_uid: Some(DocMappingUid::default()),
                        publish_position_inclusive: Some(Position::offset(11u64)),
                        publish_token: Some(publish_token.to_string()),
                        update_timestamp: 1724158996,
                    }],
                };
                Ok(response)
            });
        mock_metastore
            .expect_acquire_shards()
            .withf(|request| request.shard_ids == [ShardId::from(1), ShardId::from(2)])
            .once()
            .returning(|request| {
                assert_eq!(request.index_uid(), &("test-index", 0));
                assert_eq!(request.source_id, "test-source");

                let response = AcquireShardsResponse {
                    acquired_shards: vec![
                        Shard {
                            leader_id: "test-ingester-0".to_string(),
                            follower_id: None,
                            index_uid: Some(IndexUid::for_test("test-index", 0)),
                            source_id: "test-source".to_string(),
                            shard_id: Some(ShardId::from(1)),
                            shard_state: ShardState::Open as i32,
                            doc_mapping_uid: Some(DocMappingUid::default()),
                            publish_position_inclusive: Some(Position::offset(11u64)),
                            publish_token: Some(publish_token.to_string()),
                            update_timestamp: 1724158996,
                        },
                        Shard {
                            leader_id: "test-ingester-0".to_string(),
                            follower_id: None,
                            index_uid: Some(IndexUid::for_test("test-index", 0)),
                            source_id: "test-source".to_string(),
                            shard_id: Some(ShardId::from(2)),
                            shard_state: ShardState::Open as i32,
                            doc_mapping_uid: Some(DocMappingUid::default()),
                            publish_position_inclusive: Some(Position::offset(12u64)),
                            publish_token: Some(publish_token.to_string()),
                            update_timestamp: 1724158996,
                        },
                    ],
                };
                Ok(response)
            });
        let ingester_pool = IngesterPool::default();

        // This sequence is used to remove the race condition by waiting for the fetch stream
        // request.
        let (sequence_tx, mut sequence_rx) = tokio::sync::mpsc::unbounded_channel::<usize>();

        let mut mock_ingester_0 = MockIngesterService::new();
        let sequence_tx_clone1 = sequence_tx.clone();
        mock_ingester_0
            .expect_open_fetch_stream()
            .withf(|request| {
                request.from_position_exclusive() == Position::offset(10u64)
                    && request.shard_id() == ShardId::from(0)
            })
            .once()
            .returning(move |request| {
                sequence_tx_clone1.send(1).unwrap();
                assert_eq!(
                    request.client_id,
                    "indexer/test-node/test-index:00000000000000000000000000/test-source/\
                     00000000000000000000000000"
                );
                assert_eq!(request.index_uid(), &("test-index", 0));
                assert_eq!(request.source_id, "test-source");

                let (_service_stream_tx, service_stream) = ServiceStream::new_bounded(1);
                Ok(service_stream)
            });
        let sequence_tx_clone2 = sequence_tx.clone();
        mock_ingester_0
            .expect_open_fetch_stream()
            .withf(|request| {
                request.from_position_exclusive() == Position::offset(11u64)
                    && request.shard_id() == ShardId::from(1)
            })
            .times(2)
            .returning(move |request| {
                sequence_tx_clone2.send(2).unwrap();
                assert_eq!(
                    request.client_id,
                    "indexer/test-node/test-index:00000000000000000000000000/test-source/\
                     00000000000000000000000000"
                );
                assert_eq!(request.index_uid(), &("test-index", 0));
                assert_eq!(request.source_id, "test-source");

                let (_service_stream_tx, service_stream) = ServiceStream::new_bounded(1);
                Ok(service_stream)
            });
        let sequence_tx_clone3 = sequence_tx.clone();
        mock_ingester_0
            .expect_open_fetch_stream()
            .withf(|request| {
                request.from_position_exclusive() == Position::offset(12u64)
                    && request.shard_id() == ShardId::from(2)
            })
            .once()
            .returning(move |request| {
                sequence_tx_clone3.send(3).unwrap();
                assert_eq!(
                    request.client_id,
                    "indexer/test-node/test-index:00000000000000000000000000/test-source/\
                     00000000000000000000000000"
                );
                assert_eq!(request.index_uid(), &("test-index", 0));
                assert_eq!(request.source_id, "test-source");

                let (_service_stream_tx, service_stream) = ServiceStream::new_bounded(1);
                Ok(service_stream)
            });
        mock_ingester_0
            .expect_truncate_shards()
            .withf(|truncate_req| truncate_req.subrequests[0].shard_id() == ShardId::from(0))
            .once()
            .returning(|request| {
                assert_eq!(request.ingester_id, "test-ingester-0");
                assert_eq!(request.subrequests.len(), 1);

                let subrequest = &request.subrequests[0];
                assert_eq!(subrequest.index_uid(), &("test-index", 0));
                assert_eq!(subrequest.source_id, "test-source");
                assert_eq!(
                    subrequest.truncate_up_to_position_inclusive(),
                    Position::offset(10u64)
                );

                let response = TruncateShardsResponse {};
                Ok(response)
            });

        mock_ingester_0
            .expect_truncate_shards()
            .withf(|truncate_req| truncate_req.subrequests[0].shard_id() == ShardId::from(1))
            .once()
            .returning(|request| {
                assert_eq!(request.ingester_id, "test-ingester-0");
                assert_eq!(request.subrequests.len(), 1);

                let subrequest = &request.subrequests[0];
                assert_eq!(subrequest.index_uid(), &("test-index", 0));
                assert_eq!(subrequest.source_id, "test-source");
                assert_eq!(
                    subrequest.truncate_up_to_position_inclusive(),
                    Position::offset(11u64)
                );

                Ok(TruncateShardsResponse {})
            });
        mock_ingester_0
            .expect_truncate_shards()
            .withf(|truncate_req| {
                truncate_req.subrequests.len() == 2
                    && truncate_req.subrequests[0].shard_id() == ShardId::from(1)
                    && truncate_req.subrequests[1].shard_id() == ShardId::from(2)
            })
            .once()
            .returning(|request| {
                assert_eq!(request.ingester_id, "test-ingester-0");

                let subrequest = &request.subrequests[0];
                assert_eq!(subrequest.index_uid(), &("test-index", 0));
                assert_eq!(subrequest.source_id, "test-source");
                assert_eq!(
                    subrequest.truncate_up_to_position_inclusive(),
                    Position::offset(11u64)
                );

                let subrequest = &request.subrequests[1];
                assert_eq!(subrequest.index_uid(), &("test-index", 0));
                assert_eq!(subrequest.source_id, "test-source");
                assert_eq!(
                    subrequest.truncate_up_to_position_inclusive(),
                    Position::offset(12u64)
                );

                let response = TruncateShardsResponse {};
                Ok(response)
            });

        let ingester_0 =
            IngesterPoolEntry::ready_with_client(IngesterServiceClient::from_mock(mock_ingester_0));
        ingester_pool.insert("test-ingester-0".into(), ingester_0.clone());

        let event_broker = EventBroker::default();

        let source_runtime = SourceRuntime {
            pipeline_id,
            source_config,
            metastore: MetastoreServiceClient::from_mock(mock_metastore),
            ingester_pool: ingester_pool.clone(),
            queues_dir_path: PathBuf::from("./queues"),
            storage_resolver: StorageResolver::for_test(),
            event_broker,
            indexing_setting: IndexingSettings::default(),
        };
        let retry_params = RetryParams::no_retries();
        let mut source = IngestSource::try_new(source_runtime, retry_params)
            .await
            .unwrap();

        let universe = Universe::with_accelerated_time();
        let (source_mailbox, _source_inbox) = universe.create_test_mailbox::<SourceActor>();
        let (doc_processor_mailbox, doc_processor_inbox) =
            universe.create_test_mailbox::<DocProcessor>();
        let (observable_state_tx, _observable_state_rx) = watch::channel(serde_json::Value::Null);
        let ctx: SourceContext =
            ActorContext::for_test(&universe, source_mailbox, observable_state_tx);

        // We assign [0] (previously []).
        // The stream does not need to be reset.
        let shard_ids: BTreeSet<ShardId> = once(0).map(ShardId::from).collect();
        let publish_lock = source.publish_lock.clone();
        source
            .assign_shards(shard_ids, &doc_processor_mailbox, &ctx)
            .await
            .unwrap();
        assert_eq!(sequence_rx.recv().await.unwrap(), 1);
        assert!(!publish_lock.is_alive());

        assert!(source.publish_lock.is_alive());
        assert!(!source.publish_token.is_empty());

        // We assign [0,1] (previously [0]). This should just add the shard 1.
        // The stream does not need to be reset.
        let shard_ids: BTreeSet<ShardId> = (0..2).map(ShardId::from).collect();
        let publish_lock = source.publish_lock.clone();
        source
            .assign_shards(shard_ids, &doc_processor_mailbox, &ctx)
            .await
            .unwrap();
        assert_eq!(sequence_rx.recv().await.unwrap(), 2);
        assert!(publish_lock.is_alive());
        assert_eq!(publish_lock, source.publish_lock);

        // We assign [1,2]. (previously [0,1]) This should reset the stream
        // because the shard 0 has to be removed.
        // The publish lock should be killed and a new one should be created.
        let shard_ids: BTreeSet<ShardId> = (1..3).map(ShardId::from).collect();
        let publish_lock = source.publish_lock.clone();
        source
            .assign_shards(shard_ids, &doc_processor_mailbox, &ctx)
            .await
            .unwrap();

        assert_eq!(sequence_rx.recv().await.unwrap(), 2);
        assert_eq!(sequence_rx.recv().await.unwrap(), 3);
        assert!(!publish_lock.is_alive());
        assert!(source.publish_lock.is_alive());
        assert_ne!(publish_lock, source.publish_lock);

        let NewPublishLock(publish_lock) = doc_processor_inbox
            .recv_typed_message::<NewPublishLock>()
            .await
            .unwrap();
        assert_ne!(&source.publish_lock, &publish_lock);

        // assert!(publish_token != source.publish_token);

        let NewPublishToken(publish_token) = doc_processor_inbox
            .recv_typed_message::<NewPublishToken>()
            .await
            .unwrap();
        assert_eq!(source.publish_token, publish_token);

        assert_eq!(source.assigned_shards.len(), 2);

        let assigned_shard = source.assigned_shards.get(&ShardId::from(1)).unwrap();
        let expected_assigned_shard = AssignedShard {
            leader_id: "test-ingester-0".into(),
            follower_id_opt: None,
            partition_id: 1u64.into(),
            current_position_inclusive: Position::offset(11u64),
            status: IndexingStatus::Active,
        };
        assert_eq!(assigned_shard, &expected_assigned_shard);

        let assigned_shard = source.assigned_shards.get(&ShardId::from(2)).unwrap();
        let expected_assigned_shard = AssignedShard {
            leader_id: "test-ingester-0".into(),
            follower_id_opt: None,
            partition_id: 2u64.into(),
            current_position_inclusive: Position::offset(12u64),
            status: IndexingStatus::Active,
        };
        assert_eq!(assigned_shard, &expected_assigned_shard);

        // Wait for the truncate future to complete.
        time::sleep(Duration::from_millis(1)).await;
    }

    #[tokio::test]
    async fn test_ingest_source_assign_shards_all_eof() {
        // In this test, we check that if all assigned shards are originally marked as EOF in the
        // metastore, we observe the following:
        // - emission of a suggest truncate
        // - no stream request is emitted
        let pipeline_id = IndexingPipelineId {
            node_id: NodeId::from("test-node"),
            index_uid: IndexUid::for_test("test-index", 0),
            source_id: "test-source".to_string(),
            pipeline_uid: PipelineUid::default(),
        };
        let source_config = SourceConfig::for_test("test-source", SourceParams::Ingest);
        let publish_token = "indexer/test-node/test-index:0/test-source/\
                             00000000000000000000000000/00000000000000000000000000";

        let mut mock_metastore = MockMetastoreService::new();
        mock_metastore
            .expect_acquire_shards()
            .once()
            .returning(|request| {
                assert_eq!(request.index_uid(), &("test-index", 0));
                assert_eq!(request.source_id, "test-source");
                assert_eq!(request.shard_ids, [ShardId::from(1), ShardId::from(2)]);

                let response = AcquireShardsResponse {
                    acquired_shards: vec![
                        Shard {
                            leader_id: "test-ingester-0".to_string(),
                            follower_id: None,
                            index_uid: Some(IndexUid::for_test("test-index", 0)),
                            source_id: "test-source".to_string(),
                            shard_id: Some(ShardId::from(1)),
                            shard_state: ShardState::Open as i32,
                            doc_mapping_uid: Some(DocMappingUid::default()),
                            publish_position_inclusive: Some(Position::eof(11u64)),
                            publish_token: Some(publish_token.to_string()),
                            update_timestamp: 1724158996,
                        },
                        Shard {
                            leader_id: "test-ingester-0".to_string(),
                            follower_id: None,
                            index_uid: Some(IndexUid::for_test("test-index", 0)),
                            source_id: "test-source".to_string(),
                            shard_id: Some(ShardId::from(2)),
                            shard_state: ShardState::Open as i32,
                            doc_mapping_uid: Some(DocMappingUid::default()),
                            publish_position_inclusive: Some(Position::Beginning.as_eof()),
                            publish_token: Some(publish_token.to_string()),
                            update_timestamp: 1724158996,
                        },
                    ],
                };
                Ok(response)
            });
        let ingester_pool = IngesterPool::default();

        let mut mock_ingester_0 = MockIngesterService::new();
        mock_ingester_0
            .expect_truncate_shards()
            .once()
            .returning(|request| {
                assert_eq!(request.ingester_id, "test-ingester-0");
                assert_eq!(request.subrequests.len(), 2);

                let subrequest_0 = &request.subrequests[0];
                assert_eq!(subrequest_0.index_uid(), &("test-index", 0));
                assert_eq!(subrequest_0.source_id, "test-source");
                assert_eq!(subrequest_0.shard_id(), ShardId::from(1));
                assert_eq!(
                    subrequest_0.truncate_up_to_position_inclusive(),
                    Position::eof(11u64)
                );

                let subrequest_1 = &request.subrequests[1];
                assert_eq!(subrequest_1.index_uid(), &("test-index", 0));
                assert_eq!(subrequest_1.source_id, "test-source");
                assert_eq!(subrequest_1.shard_id(), ShardId::from(2));
                assert_eq!(
                    subrequest_1.truncate_up_to_position_inclusive(),
                    Position::Beginning.as_eof()
                );

                let response = TruncateShardsResponse {};
                Ok(response)
            });

        let ingester_0 =
            IngesterPoolEntry::ready_with_client(IngesterServiceClient::from_mock(mock_ingester_0));
        ingester_pool.insert("test-ingester-0".into(), ingester_0.clone());

        let event_broker = EventBroker::default();
        let (shard_positions_update_tx, mut shard_positions_update_rx) =
            tokio::sync::mpsc::unbounded_channel::<LocalShardPositionsUpdate>();
        event_broker
            .subscribe::<LocalShardPositionsUpdate>(move |update| {
                shard_positions_update_tx.send(update).unwrap();
            })
            .forever();

        let source_runtime = SourceRuntime {
            pipeline_id,
            source_config,
            metastore: MetastoreServiceClient::from_mock(mock_metastore),
            ingester_pool: ingester_pool.clone(),
            queues_dir_path: PathBuf::from("./queues"),
            storage_resolver: StorageResolver::for_test(),
            event_broker,
            indexing_setting: IndexingSettings::default(),
        };
        let retry_params = RetryParams::for_test();
        let mut source = IngestSource::try_new(source_runtime, retry_params)
            .await
            .unwrap();

        let universe = Universe::with_accelerated_time();
        let (source_mailbox, _source_inbox) = universe.create_test_mailbox::<SourceActor>();
        let (doc_processor_mailbox, _doc_processor_inbox) =
            universe.create_test_mailbox::<DocProcessor>();
        let (observable_state_tx, _observable_state_rx) = watch::channel(serde_json::Value::Null);
        let ctx: SourceContext =
            ActorContext::for_test(&universe, source_mailbox, observable_state_tx);

        // In this scenario, the indexer will be able to acquire shard 1 and 2.
        let shard_ids: BTreeSet<ShardId> =
            BTreeSet::from_iter([ShardId::from(1), ShardId::from(2)]);

        source
            .assign_shards(shard_ids, &doc_processor_mailbox, &ctx)
            .await
            .unwrap();

        let expected_local_update = LocalShardPositionsUpdate::new(
            SourceUid {
                index_uid: IndexUid::for_test("test-index", 0),
                source_id: "test-source".to_string(),
            },
            vec![
                (ShardId::from(1), Position::eof(11u64)),
                (ShardId::from(2), Position::Beginning.as_eof()),
            ],
        );
        let local_update = shard_positions_update_rx.recv().await.unwrap();
        assert_eq!(local_update, expected_local_update);
    }

    #[tokio::test]
    async fn test_ingest_source_assign_shards_some_eof() {
        // In this test, we check that if some shards that are originally marked as EOF in the
        // metastore, we observe the following:
        // - emission of a suggest truncate
        // - the stream request emitted does not include the EOF shards
        let pipeline_id = IndexingPipelineId {
            node_id: NodeId::from("test-node"),
            index_uid: IndexUid::for_test("test-index", 0),
            source_id: "test-source".to_string(),
            pipeline_uid: PipelineUid::default(),
        };
        let source_config = SourceConfig::for_test("test-source", SourceParams::Ingest);
        let publish_token = "indexer/test-node/test-index:0/test-source/\
                             00000000000000000000000000/00000000000000000000000000";

        let mut mock_metastore = MockMetastoreService::new();
        mock_metastore
            .expect_acquire_shards()
            .once()
            .returning(|request| {
                assert_eq!(request.index_uid(), &("test-index", 0));
                assert_eq!(request.source_id, "test-source");
                assert_eq!(request.shard_ids, [ShardId::from(1), ShardId::from(2)]);

                let response = AcquireShardsResponse {
                    acquired_shards: vec![
                        Shard {
                            leader_id: "test-ingester-0".to_string(),
                            follower_id: None,
                            index_uid: Some(IndexUid::for_test("test-index", 0)),
                            source_id: "test-source".to_string(),
                            shard_id: Some(ShardId::from(1)),
                            shard_state: ShardState::Open as i32,
                            doc_mapping_uid: Some(DocMappingUid::default()),
                            publish_position_inclusive: Some(Position::offset(11u64)),
                            publish_token: Some(publish_token.to_string()),
                            update_timestamp: 1724158996,
                        },
                        Shard {
                            leader_id: "test-ingester-0".to_string(),
                            follower_id: None,
                            index_uid: Some(IndexUid::for_test("test-index", 0)),
                            source_id: "test-source".to_string(),
                            shard_id: Some(ShardId::from(2)),
                            shard_state: ShardState::Closed as i32,
                            doc_mapping_uid: Some(DocMappingUid::default()),
                            publish_position_inclusive: Some(Position::eof(22u64)),
                            publish_token: Some(publish_token.to_string()),
                            update_timestamp: 1724158996,
                        },
                    ],
                };
                Ok(response)
            });
        let ingester_pool = IngesterPool::default();

        let mut mock_ingester_0 = MockIngesterService::new();
        mock_ingester_0
            .expect_open_fetch_stream()
            .once()
            .returning(|request| {
                assert_eq!(
                    request.client_id,
                    "indexer/test-node/test-index:00000000000000000000000000/test-source/\
                     00000000000000000000000000"
                );
                assert_eq!(request.index_uid(), &("test-index", 0));
                assert_eq!(request.source_id, "test-source");
                assert_eq!(request.shard_id(), ShardId::from(1));
                assert_eq!(request.from_position_exclusive(), Position::offset(11u64));

                let (_service_stream_tx, service_stream) = ServiceStream::new_bounded(1);
                Ok(service_stream)
            });
        mock_ingester_0
            .expect_truncate_shards()
            .once()
            .returning(|mut request| {
                assert_eq!(request.ingester_id, "test-ingester-0");
                assert_eq!(request.subrequests.len(), 2);
                request
                    .subrequests
                    .sort_unstable_by(|left, right| left.shard_id.cmp(&right.shard_id));

                let subrequest = &request.subrequests[0];
                assert_eq!(subrequest.index_uid(), &("test-index", 0));
                assert_eq!(subrequest.source_id, "test-source");
                assert_eq!(subrequest.shard_id(), ShardId::from(1));
                assert_eq!(
                    subrequest.truncate_up_to_position_inclusive(),
                    Position::offset(11u64)
                );

                let subrequest = &request.subrequests[1];
                assert_eq!(subrequest.index_uid(), &("test-index", 0));
                assert_eq!(subrequest.source_id, "test-source");
                assert_eq!(subrequest.shard_id(), ShardId::from(2));
                assert_eq!(
                    subrequest.truncate_up_to_position_inclusive(),
                    Position::eof(22u64)
                );

                let response = TruncateShardsResponse {};
                Ok(response)
            });

        let ingester_0 =
            IngesterPoolEntry::ready_with_client(IngesterServiceClient::from_mock(mock_ingester_0));
        ingester_pool.insert("test-ingester-0".into(), ingester_0.clone());

        let event_broker = EventBroker::default();
        let (shard_positions_update_tx, mut shard_positions_update_rx) =
            tokio::sync::mpsc::unbounded_channel::<LocalShardPositionsUpdate>();
        event_broker
            .subscribe::<LocalShardPositionsUpdate>(move |update| {
                shard_positions_update_tx.send(update).unwrap();
            })
            .forever();

        let source_runtime = SourceRuntime {
            pipeline_id,
            source_config,
            metastore: MetastoreServiceClient::from_mock(mock_metastore),
            ingester_pool: ingester_pool.clone(),
            queues_dir_path: PathBuf::from("./queues"),
            storage_resolver: StorageResolver::for_test(),
            event_broker,
            indexing_setting: IndexingSettings::default(),
        };
        let retry_params = RetryParams::for_test();
        let mut source = IngestSource::try_new(source_runtime, retry_params)
            .await
            .unwrap();

        let universe = Universe::with_accelerated_time();
        let (source_mailbox, _source_inbox) = universe.create_test_mailbox::<SourceActor>();
        let (doc_processor_mailbox, _doc_processor_inbox) =
            universe.create_test_mailbox::<DocProcessor>();
        let (observable_state_tx, _observable_state_rx) = watch::channel(serde_json::Value::Null);
        let ctx: SourceContext =
            ActorContext::for_test(&universe, source_mailbox, observable_state_tx);

        // In this scenario, the indexer will only be able to acquire shard 1.
        let shard_ids: BTreeSet<ShardId> = (1..3).map(ShardId::from).collect();
        assert_eq!(
            shard_positions_update_rx.try_recv().unwrap_err(),
            TryRecvError::Empty
        );

        // In this scenario, the indexer will only be able to acquire shard 1.
        source
            .assign_shards(shard_ids, &doc_processor_mailbox, &ctx)
            .await
            .unwrap();

        let local_shard_positions_update = shard_positions_update_rx.recv().await.unwrap();
        let expected_local_shard_positions_update = LocalShardPositionsUpdate::new(
            SourceUid {
                index_uid: IndexUid::for_test("test-index", 0),
                source_id: "test-source".to_string(),
            },
            vec![
                (ShardId::from(1), Position::offset(11u64)),
                (ShardId::from(2), Position::eof(22u64)),
            ],
        );
        assert_eq!(
            local_shard_positions_update,
            expected_local_shard_positions_update,
        );
    }

    #[tokio::test]
    async fn test_ingest_source_emit_batches() {
        let pipeline_id = IndexingPipelineId {
            node_id: NodeId::from("test-node"),
            index_uid: IndexUid::for_test("test-index", 0),
            source_id: "test-source".to_string(),
            pipeline_uid: PipelineUid::default(),
        };
        let source_config = SourceConfig::for_test("test-source", SourceParams::Ingest);
        let mock_metastore = MockMetastoreService::new();
        let ingester_pool = IngesterPool::default();
        let event_broker = EventBroker::default();

        let source_runtime = SourceRuntime {
            pipeline_id,
            source_config,
            metastore: MetastoreServiceClient::from_mock(mock_metastore),
            ingester_pool: ingester_pool.clone(),
            queues_dir_path: PathBuf::from("./queues"),
            storage_resolver: StorageResolver::for_test(),
            event_broker,
            indexing_setting: IndexingSettings::default(),
        };
        let retry_params = RetryParams::for_test();
        let mut source = IngestSource::try_new(source_runtime, retry_params)
            .await
            .unwrap();

        let universe = Universe::with_accelerated_time();
        let (source_mailbox, _source_inbox) = universe.create_test_mailbox::<SourceActor>();
        let (doc_processor_mailbox, doc_processor_inbox) =
            universe.create_test_mailbox::<DocProcessor>();
        let (observable_state_tx, _observable_state_rx) = watch::channel(serde_json::Value::Null);
        let ctx: SourceContext =
            ActorContext::for_test(&universe, source_mailbox, observable_state_tx);

        // In this scenario, the ingester receives fetch responses from shard 1 and 2.
        source.assigned_shards.insert(
            ShardId::from(1),
            AssignedShard {
                leader_id: "test-ingester-0".into(),
                follower_id_opt: None,
                partition_id: 1u64.into(),
                current_position_inclusive: Position::offset(11u64),
                status: IndexingStatus::Active,
            },
        );
        source.assigned_shards.insert(
            ShardId::from(2),
            AssignedShard {
                leader_id: "test-ingester-1".into(),
                follower_id_opt: None,
                partition_id: 2u64.into(),
                current_position_inclusive: Position::offset(22u64),
                status: IndexingStatus::Active,
            },
        );
        let fetch_message_tx = source.fetch_stream.fetch_message_tx();

        let fetch_payload = FetchPayload {
            index_uid: Some(IndexUid::for_test("test-index", 0)),
            source_id: "test-source".into(),
            shard_id: Some(ShardId::from(1)),
            mrecord_batch: MRecordBatch::for_test([
                "\0\0test-doc-foo",
                "\0\0test-doc-bar",
                "\0\x01",
            ]),
            from_position_exclusive: Some(Position::offset(11u64)),
            to_position_inclusive: Some(Position::offset(14u64)),
        };
        let batch_size = fetch_payload.estimate_size();
        let fetch_message = FetchMessage::new_payload(fetch_payload);
        let in_flight_value = InFlightValue::new(
            fetch_message,
            batch_size,
            &MEMORY_METRICS.in_flight.fetch_stream,
        );
        fetch_message_tx.send(Ok(in_flight_value)).await.unwrap();

        let fetch_payload = FetchPayload {
            index_uid: Some(IndexUid::for_test("test-index", 0)),
            source_id: "test-source".into(),
            shard_id: Some(ShardId::from(2)),
            mrecord_batch: MRecordBatch::for_test(["\0\0test-doc-qux"]),
            from_position_exclusive: Some(Position::offset(22u64)),
            to_position_inclusive: Some(Position::offset(23u64)),
        };
        let batch_size = fetch_payload.estimate_size();
        let fetch_message = FetchMessage::new_payload(fetch_payload);
        let in_flight_value = InFlightValue::new(
            fetch_message,
            batch_size,
            &MEMORY_METRICS.in_flight.fetch_stream,
        );
        fetch_message_tx.send(Ok(in_flight_value)).await.unwrap();

        let fetch_eof = FetchEof {
            index_uid: Some(IndexUid::for_test("test-index", 0)),
            source_id: "test-source".into(),
            shard_id: Some(ShardId::from(2)),
            eof_position: Some(Position::eof(23u64)),
        };
        let fetch_message = FetchMessage::new_eof(fetch_eof);
        let in_flight_value = InFlightValue::new(
            fetch_message,
            ByteSize(0),
            &MEMORY_METRICS.in_flight.fetch_stream,
        );
        fetch_message_tx.send(Ok(in_flight_value)).await.unwrap();

        source
            .emit_batches(&doc_processor_mailbox, &ctx)
            .await
            .unwrap();
        let doc_batch = doc_processor_inbox
            .recv_typed_message::<RawDocBatch>()
            .await
            .unwrap();
        assert_eq!(doc_batch.docs.len(), 3);
        assert_eq!(doc_batch.docs[0], "test-doc-foo");
        assert_eq!(doc_batch.docs[1], "test-doc-bar");
        assert_eq!(doc_batch.docs[2], "test-doc-qux");
        assert!(doc_batch.force_commit);

        let partition_deltas = doc_batch
            .checkpoint_delta
            .iter()
            .sorted_by(|left, right| left.0.cmp(&right.0))
            .collect::<Vec<_>>();

        assert_eq!(partition_deltas.len(), 2);
        assert_eq!(partition_deltas[0].0, 1u64.into());
        assert_eq!(partition_deltas[0].1.from, Position::offset(11u64));
        assert_eq!(partition_deltas[0].1.to, Position::offset(14u64));

        assert_eq!(partition_deltas[1].0, 2u64.into());
        assert_eq!(partition_deltas[1].1.from, Position::offset(22u64));
        assert_eq!(partition_deltas[1].1.to, Position::eof(23u64));

        source
            .emit_batches(&doc_processor_mailbox, &ctx)
            .await
            .unwrap();
        let shard = source.assigned_shards.get(&ShardId::from(2)).unwrap();
        assert_eq!(shard.status, IndexingStatus::ReachedEof);

        fetch_message_tx
            .send(Err(FetchStreamError {
                index_uid: IndexUid::for_test("test-index", 0),
                source_id: "test-source".into(),
                shard_id: ShardId::from(1),
                ingest_error: IngestV2Error::Internal("test-error".to_string()),
            }))
            .await
            .unwrap();

        source
            .emit_batches(&doc_processor_mailbox, &ctx)
            .await
            .unwrap();
        let shard = source.assigned_shards.get(&ShardId::from(1)).unwrap();
        assert_eq!(shard.status, IndexingStatus::Error);

        let fetch_payload = FetchPayload {
            index_uid: Some(IndexUid::for_test("test-index", 0)),
            source_id: "test-source".into(),
            shard_id: Some(ShardId::from(1)),
            mrecord_batch: MRecordBatch::for_test(["\0\0test-doc-baz"]),
            from_position_exclusive: Some(Position::offset(14u64)),
            to_position_inclusive: Some(Position::offset(15u64)),
        };
        let batch_size = fetch_payload.estimate_size();
        let fetch_message = FetchMessage::new_payload(fetch_payload);
        let in_flight_value = InFlightValue::new(
            fetch_message,
            batch_size,
            &MEMORY_METRICS.in_flight.fetch_stream,
        );
        fetch_message_tx.send(Ok(in_flight_value)).await.unwrap();

        source
            .emit_batches(&doc_processor_mailbox, &ctx)
            .await
            .unwrap();
        let shard = source.assigned_shards.get(&ShardId::from(1)).unwrap();
        assert_eq!(shard.status, IndexingStatus::Active);
    }

    #[tokio::test]
    async fn test_ingest_source_emit_batches_shard_not_found() {
        let pipeline_id = IndexingPipelineId {
            node_id: NodeId::from("test-node"),
            index_uid: IndexUid::for_test("test-index", 0),
            source_id: "test-source".to_string(),
            pipeline_uid: PipelineUid::default(),
        };
        let source_config = SourceConfig::for_test("test-source", SourceParams::Ingest);
        let publish_token = "indexer/test-node/test-index:0/test-source/\
                             00000000000000000000000000/00000000000000000000000000";

        let mut mock_metastore = MockMetastoreService::new();
        mock_metastore
            .expect_acquire_shards()
            .once()
            .returning(|request: AcquireShardsRequest| {
                assert_eq!(request.index_uid(), &("test-index", 0));
                assert_eq!(request.source_id, "test-source");
                assert_eq!(request.shard_ids, [ShardId::from(1)]);

                let response = AcquireShardsResponse {
                    acquired_shards: vec![Shard {
                        leader_id: "test-ingester-0".to_string(),
                        follower_id: None,
                        index_uid: Some(IndexUid::for_test("test-index", 0)),
                        source_id: "test-source".to_string(),
                        shard_id: Some(ShardId::from(1)),
                        shard_state: ShardState::Open as i32,
                        doc_mapping_uid: Some(DocMappingUid::default()),
                        publish_position_inclusive: Some(Position::Beginning),
                        publish_token: Some(publish_token.to_string()),
                        update_timestamp: 1724158996,
                    }],
                };
                Ok(response)
            });
        let ingester_pool = IngesterPool::default();

        let mut mock_ingester_0 = MockIngesterService::new();
        mock_ingester_0
            .expect_open_fetch_stream()
            .once()
            .returning(|request| {
                assert_eq!(request.index_uid(), &("test-index", 0));
                assert_eq!(request.source_id, "test-source");
                assert_eq!(request.shard_id(), ShardId::from(1));
                assert_eq!(request.from_position_exclusive(), Position::Beginning);

                Err(IngestV2Error::ShardNotFound {
                    shard_id: ShardId::from(1),
                })
            });

        let ingester_0 =
            IngesterPoolEntry::ready_with_client(IngesterServiceClient::from_mock(mock_ingester_0));
        ingester_pool.insert("test-ingester-0".into(), ingester_0.clone());

        let event_broker = EventBroker::default();
        let source_runtime = SourceRuntime {
            pipeline_id,
            source_config,
            metastore: MetastoreServiceClient::from_mock(mock_metastore),
            ingester_pool,
            queues_dir_path: PathBuf::from("./queues"),
            storage_resolver: StorageResolver::for_test(),
            event_broker,
            indexing_setting: IndexingSettings::default(),
        };
        let retry_params = RetryParams::for_test();
        let mut source = IngestSource::try_new(source_runtime, retry_params)
            .await
            .unwrap();

        let universe = Universe::with_accelerated_time();
        let (source_mailbox, _source_inbox) = universe.create_test_mailbox::<SourceActor>();
        let (doc_processor_mailbox, doc_processor_inbox) =
            universe.create_test_mailbox::<DocProcessor>();
        let (observable_state_tx, _observable_state_rx) = watch::channel(serde_json::Value::Null);
        let ctx: SourceContext =
            ActorContext::for_test(&universe, source_mailbox, observable_state_tx);

        let shard_ids: BTreeSet<ShardId> = BTreeSet::from_iter([ShardId::from(1)]);

        source
            .assign_shards(shard_ids, &doc_processor_mailbox, &ctx)
            .await
            .unwrap();

        source
            .emit_batches(&doc_processor_mailbox, &ctx)
            .await
            .unwrap();

        let shard = source.assigned_shards.get(&ShardId::from(1)).unwrap();
        assert_eq!(shard.status, IndexingStatus::NotFound);
        assert_eq!(
            shard.current_position_inclusive,
            Position::Beginning.as_eof()
        );
        let raw_doc_batch = doc_processor_inbox
            .recv_typed_message::<RawDocBatch>()
            .await
            .unwrap();

        let (partition_id, position) = raw_doc_batch.checkpoint_delta.iter().next().unwrap();
        assert_eq!(partition_id, PartitionId::from(1u64));
        assert_eq!(position.from, Position::Beginning);
        assert_eq!(position.to, Position::Beginning.as_eof());
    }

    #[tokio::test]
    async fn test_ingest_source_suggest_truncate() {
        let pipeline_id = IndexingPipelineId {
            node_id: NodeId::from("test-node"),
            index_uid: IndexUid::for_test("test-index", 0),
            source_id: "test-source".to_string(),
            pipeline_uid: PipelineUid::default(),
        };
        let source_config = SourceConfig::for_test("test-source", SourceParams::Ingest);
        let mock_metastore = MockMetastoreService::new();

        let ingester_pool = IngesterPool::default();

        let mut mock_ingester_0 = MockIngesterService::new();
        mock_ingester_0
            .expect_truncate_shards()
            .once()
            .returning(|request| {
                assert_eq!(request.ingester_id, "test-ingester-0");
                assert_eq!(request.subrequests.len(), 3);

                let subrequest_0 = &request.subrequests[0];
                assert_eq!(subrequest_0.shard_id(), ShardId::from(1));
                assert_eq!(
                    subrequest_0.truncate_up_to_position_inclusive(),
                    Position::offset(11u64)
                );

                let subrequest_1 = &request.subrequests[1];
                assert_eq!(subrequest_1.shard_id(), ShardId::from(2));
                assert_eq!(
                    subrequest_1.truncate_up_to_position_inclusive(),
                    Position::offset(22u64)
                );

                let subrequest_2 = &request.subrequests[2];
                assert_eq!(subrequest_2.shard_id(), ShardId::from(3));
                assert_eq!(
                    subrequest_2.truncate_up_to_position_inclusive(),
                    Position::eof(33u64)
                );

                Ok(TruncateShardsResponse {})
            });
        let ingester_0 =
            IngesterPoolEntry::ready_with_client(IngesterServiceClient::from_mock(mock_ingester_0));
        ingester_pool.insert("test-ingester-0".into(), ingester_0.clone());

        let mut mock_ingester_1 = MockIngesterService::new();
        mock_ingester_1
            .expect_truncate_shards()
            .once()
            .returning(|request| {
                assert_eq!(request.ingester_id, "test-ingester-1");
                assert_eq!(request.subrequests.len(), 2);

                let subrequest_0 = &request.subrequests[0];
                assert_eq!(subrequest_0.shard_id(), ShardId::from(2));
                assert_eq!(
                    subrequest_0.truncate_up_to_position_inclusive(),
                    Position::offset(22u64)
                );

                let subrequest_1 = &request.subrequests[1];
                assert_eq!(subrequest_1.shard_id(), ShardId::from(3));
                assert_eq!(
                    subrequest_1.truncate_up_to_position_inclusive(),
                    Position::eof(33u64)
                );

                Ok(TruncateShardsResponse {})
            });
        let ingester_1 =
            IngesterPoolEntry::ready_with_client(IngesterServiceClient::from_mock(mock_ingester_1));
        ingester_pool.insert("test-ingester-1".into(), ingester_1.clone());

        let mut mock_ingester_3 = MockIngesterService::new();
        mock_ingester_3
            .expect_truncate_shards()
            .once()
            .returning(|request| {
                assert_eq!(request.ingester_id, "test-ingester-3");
                assert_eq!(request.subrequests.len(), 1);

                let subrequest_0 = &request.subrequests[0];
                assert_eq!(subrequest_0.shard_id(), ShardId::from(4));
                assert_eq!(
                    subrequest_0.truncate_up_to_position_inclusive(),
                    Position::offset(44u64)
                );

                Ok(TruncateShardsResponse {})
            });
        let ingester_3 =
            IngesterPoolEntry::ready_with_client(IngesterServiceClient::from_mock(mock_ingester_3));
        ingester_pool.insert("test-ingester-3".into(), ingester_3.clone());

        let event_broker = EventBroker::default();
        let (shard_positions_update_tx, mut shard_positions_update_rx) =
            tokio::sync::mpsc::unbounded_channel::<LocalShardPositionsUpdate>();
        event_broker
            .subscribe::<LocalShardPositionsUpdate>(move |update| {
                shard_positions_update_tx.send(update).unwrap();
            })
            .forever();

        let source_runtime = SourceRuntime {
            pipeline_id,
            source_config,
            metastore: MetastoreServiceClient::from_mock(mock_metastore),
            ingester_pool: ingester_pool.clone(),
            queues_dir_path: PathBuf::from("./queues"),
            storage_resolver: StorageResolver::for_test(),
            event_broker,
            indexing_setting: IndexingSettings::default(),
        };
        let retry_params = RetryParams::for_test();
        let mut source = IngestSource::try_new(source_runtime, retry_params)
            .await
            .unwrap();

        let universe = Universe::with_accelerated_time();
        let (source_mailbox, _source_inbox) = universe.create_test_mailbox::<SourceActor>();
        let (observable_state_tx, _observable_state_rx) = watch::channel(serde_json::Value::Null);
        let ctx: SourceContext =
            ActorContext::for_test(&universe, source_mailbox, observable_state_tx);

        // In this scenario, the ingester 2 is not available and the shard 6 is no longer assigned.
        source.assigned_shards.insert(
            ShardId::from(1),
            AssignedShard {
                leader_id: "test-ingester-0".into(),
                follower_id_opt: None,
                partition_id: 1u64.into(),
                current_position_inclusive: Position::offset(11u64),
                status: IndexingStatus::Active,
            },
        );
        source.assigned_shards.insert(
            ShardId::from(2),
            AssignedShard {
                leader_id: "test-ingester-0".into(),
                follower_id_opt: Some("test-ingester-1".into()),
                partition_id: 2u64.into(),
                current_position_inclusive: Position::offset(22u64),
                status: IndexingStatus::Active,
            },
        );
        source.assigned_shards.insert(
            ShardId::from(3),
            AssignedShard {
                leader_id: "test-ingester-1".into(),
                follower_id_opt: Some("test-ingester-0".into()),
                partition_id: 3u64.into(),
                current_position_inclusive: Position::offset(33u64),
                status: IndexingStatus::Active,
            },
        );
        source.assigned_shards.insert(
            ShardId::from(4),
            AssignedShard {
                leader_id: "test-ingester-2".into(),
                follower_id_opt: Some("test-ingester-3".into()),
                partition_id: 4u64.into(),
                current_position_inclusive: Position::offset(44u64),
                status: IndexingStatus::Active,
            },
        );
        source.assigned_shards.insert(
            ShardId::from(5),
            AssignedShard {
                leader_id: "test-ingester-2".into(),
                follower_id_opt: Some("test-ingester-3".into()),
                partition_id: 5u64.into(),
                current_position_inclusive: Position::Beginning,
                status: IndexingStatus::Active,
            },
        );

        let checkpoint = SourceCheckpoint::from_iter(vec![
            (1u64.into(), Position::offset(11u64)),
            (2u64.into(), Position::offset(22u64)),
            (3u64.into(), Position::eof(33u64)),
            (4u64.into(), Position::offset(44u64)),
            (5u64.into(), Position::Beginning),
            (6u64.into(), Position::offset(66u64)),
        ]);
        source.suggest_truncate(checkpoint, &ctx).await.unwrap();

        let local_shards_update = shard_positions_update_rx.recv().await.unwrap();
        let expected_local_shards_update = LocalShardPositionsUpdate::new(
            SourceUid {
                index_uid: IndexUid::for_test("test-index", 0),
                source_id: "test-source".to_string(),
            },
            vec![
                (ShardId::from(1u64), Position::offset(11u64)),
                (ShardId::from(2u64), Position::offset(22u64)),
                (ShardId::from(3u64), Position::eof(33u64)),
                (ShardId::from(4u64), Position::offset(44u64)),
                (ShardId::from(5u64), Position::Beginning),
                (ShardId::from(6u64), Position::offset(66u64)),
            ],
        );
        assert_eq!(local_shards_update, expected_local_shards_update);
    }

    // Motivated by #4888
    #[tokio::test]
    async fn test_assigned_deleted_shards() {
        // It is possible for the control plan to assign a shard to an indexer and delete it right
        // away. In that case, the ingester should just ignore the assigned shard, as
        // opposed to fail as the metastore does not let it `acquire` the shard.
        let pipeline_id = IndexingPipelineId {
            node_id: NodeId::from("test-node"),
            index_uid: IndexUid::for_test("test-index", 0),
            source_id: "test-source".to_string(),
            pipeline_uid: PipelineUid::default(),
        };
        let source_config = SourceConfig::for_test("test-source", SourceParams::Ingest);

        let mut mock_metastore = MockMetastoreService::new();
        mock_metastore
            .expect_acquire_shards()
            .once()
            .returning(|request: AcquireShardsRequest| {
                assert_eq!(request.index_uid(), &("test-index", 0));
                assert_eq!(request.source_id, "test-source");
                assert_eq!(request.shard_ids, [ShardId::from(1)]);

                let response = AcquireShardsResponse {
                    acquired_shards: Vec::new(),
                };
                Ok(response)
            });
        let ingester_pool = IngesterPool::default();

        let event_broker = EventBroker::default();
        let source_runtime = SourceRuntime {
            pipeline_id,
            source_config,
            metastore: MetastoreServiceClient::from_mock(mock_metastore),
            ingester_pool,
            queues_dir_path: PathBuf::from("./queues"),
            storage_resolver: StorageResolver::for_test(),
            event_broker: event_broker.clone(),
            indexing_setting: IndexingSettings::default(),
        };
        let retry_params = RetryParams::for_test();
        let mut source = IngestSource::try_new(source_runtime, retry_params)
            .await
            .unwrap();

        let universe = Universe::with_accelerated_time();
        let (source_mailbox, _source_inbox) = universe.create_test_mailbox::<SourceActor>();
        let (doc_processor_mailbox, _doc_processor_inbox) =
            universe.create_test_mailbox::<DocProcessor>();
        let (observable_state_tx, _observable_state_rx) = watch::channel(serde_json::Value::Null);
        let ctx: SourceContext =
            ActorContext::for_test(&universe, source_mailbox, observable_state_tx);

        let shard_ids: BTreeSet<ShardId> = BTreeSet::from_iter([ShardId::from(1)]);

        let truncation_happened = Arc::new(AtomicBool::new(false));
        let truncation_happened_clone = truncation_happened.clone();

        let _subscription_guard = event_broker.subscribe(move |_: LocalShardPositionsUpdate| {
            truncation_happened_clone.store(true, std::sync::atomic::Ordering::Relaxed);
        });

        source
            .assign_shards(shard_ids, &doc_processor_mailbox, &ctx)
            .await
            .unwrap();

        tokio::time::sleep(Duration::from_millis(100)).await;
        assert!(!truncation_happened.load(std::sync::atomic::Ordering::Relaxed));
    }
}


================================================
FILE: quickwit/quickwit-indexing/src/source/ingest_api_source.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::fmt;
use std::time::Duration;

use anyhow::bail;
use async_trait::async_trait;
use quickwit_actors::{ActorContext, ActorExitStatus, Mailbox};
use quickwit_ingest::{
    CreateQueueIfNotExistsRequest, DocCommand, FetchRequest, FetchResponse, GetPartitionId,
    IngestApiService, SuggestTruncateRequest, get_ingest_api_service,
};
use quickwit_metastore::checkpoint::{PartitionId, SourceCheckpoint};
use quickwit_proto::metastore::SourceType;
use quickwit_proto::types::{Position, SourceId};
use serde::Serialize;
use serde_json::Value as JsonValue;
use tracing::{error, info};

use super::{BatchBuilder, Source, SourceActor, SourceContext, TypedSourceFactory};
use crate::actors::DocProcessor;
use crate::source::SourceRuntime;

/// Wait time for SourceActor before pooling for new documents.
/// TODO: Think of better way, maybe increment this (i.e wait longer) as time
/// goes on without receiving docs.
const INGEST_API_POLLING_COOL_DOWN: Duration = Duration::from_secs(1);

#[derive(Default, Clone, Debug, Eq, PartialEq, Serialize)]
pub struct IngestApiSourceCounters {
    /// Maintains the value of where we stopped in queue from
    /// a previous call on `emit_batch` and allows
    /// setting the lower-bound of the checkpoint delta.
    /// It has the same value as `current_offset` at the end of emit_batch.
    pub previous_offset: Option<u64>,
    /// Maintains the value of where we are in queue and allows
    /// setting the upper-bound of the checkpoint delta.
    pub current_offset: Option<u64>,
    pub num_docs_processed: u64,
}

pub struct IngestApiSource {
    source_runtime: SourceRuntime,
    source_id: SourceId,
    partition_id: PartitionId,
    ingest_api_service: Mailbox<IngestApiService>,
    counters: IngestApiSourceCounters,
}

impl fmt::Debug for IngestApiSource {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        write!(f, "IngestApiSource {{ source_id: {} }}", self.source_id)
    }
}

impl IngestApiSource {
    pub async fn try_new(source_runtime: SourceRuntime) -> anyhow::Result<Self> {
        let source_id = source_runtime.source_id().to_string();
        let queues_dir_path = source_runtime.queues_dir_path.as_path();
        let ingest_api_service = get_ingest_api_service(queues_dir_path).await?;
        let partition_id: PartitionId = ingest_api_service.ask(GetPartitionId).await?.into();

        // Ensure a queue for this index exists.
        let create_queue_req = CreateQueueIfNotExistsRequest {
            queue_id: source_runtime.index_id().to_string(),
        };
        match ingest_api_service.ask_for_res(create_queue_req).await {
            Ok(response) if response.created => {
                info!(
                    index_id = source_runtime.index_id(),
                    %partition_id,
                    "created queue successfully"
                );
            }
            Ok(_) => {}
            Err(error) => {
                error!(
                    index_id = source_runtime.index_id(),
                    %partition_id,
                    %error,
                    "failed to create queue"
                );
                bail!(error);
            }
        }
        let checkpoint = source_runtime.fetch_checkpoint().await?;
        let previous_offset: Option<u64> = checkpoint
            .position_for_partition(&partition_id)
            .map(|position| position.as_u64().expect("offset should be stored as u64"));
        let current_offset = previous_offset;
        let ingest_api_source = IngestApiSource {
            source_runtime,
            source_id,
            partition_id,
            ingest_api_service,
            counters: IngestApiSourceCounters {
                previous_offset,
                current_offset,
                num_docs_processed: 0,
            },
        };
        Ok(ingest_api_source)
    }

    async fn send_suggest_truncate_to_ingest_service(
        &self,
        up_to_position_included: u64,
        ctx: &ActorContext<SourceActor>,
    ) -> anyhow::Result<()> {
        let suggest_truncate_req = SuggestTruncateRequest {
            index_id: self.source_runtime.index_id().to_string(),
            up_to_position_included,
        };
        ctx.ask_for_res(&self.ingest_api_service, suggest_truncate_req)
            .await?;
        Ok(())
    }

    fn update_counters(&mut self, current_offset: u64, num_docs: u64) {
        self.counters.num_docs_processed += num_docs;
        self.counters.current_offset = Some(current_offset);
        self.counters.previous_offset = Some(current_offset);
    }
}

#[async_trait]
impl Source for IngestApiSource {
    async fn initialize(
        &mut self,
        _: &Mailbox<DocProcessor>,
        ctx: &SourceContext,
    ) -> Result<(), ActorExitStatus> {
        if let Some(position) = self.counters.previous_offset {
            self.send_suggest_truncate_to_ingest_service(position, ctx)
                .await?;
        }
        Ok(())
    }

    async fn emit_batches(
        &mut self,
        batch_sink: &Mailbox<DocProcessor>,
        ctx: &SourceContext,
    ) -> Result<Duration, ActorExitStatus> {
        let fetch_req = FetchRequest {
            index_id: self.source_runtime.index_id().to_string(),
            start_after: self.counters.current_offset,
            num_bytes_limit: None,
        };
        let FetchResponse {
            first_position: first_position_opt,
            doc_batch: doc_batch_opt,
        } = ctx
            .ask_for_res(&self.ingest_api_service, fetch_req)
            .await
            .map_err(anyhow::Error::from)?;

        // The `first_position_opt` being none means the doc_batch is empty and there is
        // no more document available, at least for the time being.
        // That is, we have consumed all pending docs in the queue and need to
        // make the client wait a bit before pooling again.
        let (first_position, doc_batch) = if let Some(first_position) = first_position_opt {
            (first_position, doc_batch_opt.unwrap())
        } else {
            return Ok(INGEST_API_POLLING_COOL_DOWN);
        };

        let batch_num_docs = doc_batch.num_docs();
        // TODO use a timestamp (in the raw doc batch) given by at ingest time to be more accurate.
        let mut batch_builder =
            BatchBuilder::with_capacity(doc_batch.num_docs(), SourceType::IngestV1);
        for doc in doc_batch.into_iter() {
            match doc {
                DocCommand::Ingest { payload } => batch_builder.add_doc(payload),
                DocCommand::Commit => batch_builder.force_commit(),
            }
        }
        let current_offset = first_position + batch_num_docs as u64 - 1;
        let partition_id = self.partition_id.clone();
        batch_builder
            .checkpoint_delta
            .record_partition_delta(
                partition_id,
                self.counters
                    .previous_offset
                    .map(Position::offset)
                    .unwrap_or_default(),
                Position::offset(current_offset),
            )
            .map_err(anyhow::Error::from)?;

        self.update_counters(current_offset, batch_builder.docs.len() as u64);
        ctx.send_message(batch_sink, batch_builder.build()).await?;
        Ok(Duration::default())
    }

    async fn suggest_truncate(
        &mut self,
        checkpoint: SourceCheckpoint,
        ctx: &ActorContext<SourceActor>,
    ) -> anyhow::Result<()> {
        if let Some(Position::Offset(offset)) =
            checkpoint.position_for_partition(&self.partition_id)
        {
            let up_to_position_included = offset.as_u64().expect("offset should be stored as u64");
            self.send_suggest_truncate_to_ingest_service(up_to_position_included, ctx)
                .await?;
        }
        Ok(())
    }

    fn name(&self) -> String {
        "IngestApiSource".to_string()
    }

    fn observable_state(&self) -> JsonValue {
        serde_json::to_value(&self.counters).unwrap()
    }
}

pub struct IngestApiSourceFactory;

#[async_trait]
impl TypedSourceFactory for IngestApiSourceFactory {
    type Source = IngestApiSource;
    type Params = ();

    async fn typed_create_source(
        source_runtime: SourceRuntime,
        _: (),
    ) -> anyhow::Result<Self::Source> {
        IngestApiSource::try_new(source_runtime).await
    }
}

#[cfg(test)]
mod tests {
    use std::num::NonZeroUsize;
    use std::time::Duration;

    use quickwit_actors::Command::Nudge;
    use quickwit_actors::Universe;
    use quickwit_common::rand::append_random_suffix;
    use quickwit_config::{
        INGEST_API_SOURCE_ID, IngestApiConfig, SourceConfig, SourceInputFormat, SourceParams,
    };
    use quickwit_ingest::{CommitType, DocBatchBuilder, IngestRequest, init_ingest_api};
    use quickwit_metastore::checkpoint::SourceCheckpointDelta;
    use quickwit_proto::types::{IndexId, IndexUid};

    use super::*;
    use crate::models::RawDocBatch;
    use crate::source::SourceActor;
    use crate::source::tests::SourceRuntimeBuilder;

    fn make_ingest_request(
        index_id: IndexId,
        num_batch: u64,
        batch_size: usize,
        commit_type: CommitType,
    ) -> IngestRequest {
        let mut doc_batches = Vec::new();
        let mut doc_id = 0usize;
        for _ in 0..num_batch {
            let mut doc_batch_builder = DocBatchBuilder::new(index_id.clone());
            for _ in 0..batch_size {
                doc_batch_builder.ingest_doc(
                    format!("{doc_id:0>6} - The quick brown fox jumps over the lazy dog")
                        .as_bytes(),
                );
                doc_id += 1;
            }
            doc_batches.push(doc_batch_builder.build());
        }
        IngestRequest {
            doc_batches,
            commit: commit_type.into(),
        }
    }

    fn make_source_config() -> SourceConfig {
        SourceConfig {
            source_id: INGEST_API_SOURCE_ID.to_string(),
            num_pipelines: NonZeroUsize::MIN,
            enabled: true,
            source_params: SourceParams::IngestApi,
            transform_config: None,
            input_format: SourceInputFormat::Json,
        }
    }

    #[tokio::test]
    async fn test_ingest_api_source() -> anyhow::Result<()> {
        let universe = Universe::with_accelerated_time();
        let index_id = append_random_suffix("test-ingest-api-source");
        let index_uid = IndexUid::new_with_random_ulid(&index_id);
        let temp_dir = tempfile::tempdir()?;
        let queues_dir_path = temp_dir.path();

        let ingest_api_service =
            init_ingest_api(&universe, queues_dir_path, &IngestApiConfig::default()).await?;
        let (doc_processor_mailbox, doc_processor_inbox) = universe.create_test_mailbox();
        let source_config = make_source_config();
        let source_runtime = SourceRuntimeBuilder::new(index_uid, source_config)
            .with_queues_dir(queues_dir_path)
            .build();
        let ingest_api_source = IngestApiSource::try_new(source_runtime).await?;
        let ingest_api_source_actor = SourceActor {
            source: Box::new(ingest_api_source),
            doc_processor_mailbox,
        };
        let (_ingest_api_source_mailbox, ingest_api_source_handle) =
            universe.spawn_builder().spawn(ingest_api_source_actor);

        let ingest_req = make_ingest_request(index_id.clone(), 2, 20_000, CommitType::Auto);
        ingest_api_service
            .ask_for_res(ingest_req)
            .await
            .map_err(|err| anyhow::anyhow!(err.to_string()))?;
        universe.sleep(Duration::from_secs(2)).await;
        let counters = ingest_api_source_handle
            .process_pending_and_observe()
            .await
            .state;
        assert_eq!(
            counters,
            serde_json::json!({
                "previous_offset": 39999u64,
                "current_offset": 39999u64,
                "num_docs_processed": 40000u64
            })
        );
        let doc_batches: Vec<RawDocBatch> = doc_processor_inbox.drain_for_test_typed();
        assert_eq!(doc_batches.len(), 2);
        assert!(&doc_batches[1].docs[0].starts_with(b"037736"));
        // TODO: Source deadlocks and test hangs occasionally if we don't quit source first.
        ingest_api_source_handle.quit().await;
        universe.assert_quit().await;
        Ok(())
    }

    /// See #2310
    #[tokio::test]
    async fn test_ingest_api_source_partition_id_changes() -> anyhow::Result<()> {
        let universe = Universe::with_accelerated_time();
        let partition_id_before_lost_queue_dir = {
            let temp_dir = tempfile::tempdir()?;
            let queues_dir_path = temp_dir.path();
            let ingest_api_service =
                init_ingest_api(&universe, queues_dir_path, &IngestApiConfig::default()).await?;
            let partition_id: PartitionId = ingest_api_service.ask(GetPartitionId).await?.into();
            let partition_id2: PartitionId = ingest_api_service.ask(GetPartitionId).await?.into();
            assert_eq!(partition_id, partition_id2);
            drop(ingest_api_service);
            let ingest_api_service =
                init_ingest_api(&universe, queues_dir_path, &IngestApiConfig::default()).await?;
            let partition_id3: PartitionId = ingest_api_service.ask(GetPartitionId).await?.into();
            assert_eq!(partition_id, partition_id3);
            partition_id
        };
        let partition_id_after_lost_queue_dir = {
            let temp_dir = tempfile::tempdir()?;
            let queues_dir_path = temp_dir.path();
            let ingest_api_service =
                init_ingest_api(&universe, queues_dir_path, &IngestApiConfig::default()).await?;
            let partition_id: PartitionId = ingest_api_service.ask(GetPartitionId).await?.into();
            partition_id
        };
        assert_ne!(
            partition_id_before_lost_queue_dir,
            partition_id_after_lost_queue_dir
        );
        universe.assert_quit().await;
        Ok(())
    }

    #[tokio::test]
    async fn test_ingest_api_source_resume_from_checkpoint() -> anyhow::Result<()> {
        let universe = Universe::with_accelerated_time();
        let index_id = append_random_suffix("test-ingest-api-source");
        let index_uid = IndexUid::new_with_random_ulid(&index_id);
        let temp_dir = tempfile::tempdir()?;
        let queues_dir_path = temp_dir.path();

        let ingest_api_service =
            init_ingest_api(&universe, queues_dir_path, &IngestApiConfig::default()).await?;
        let create_queue_req = CreateQueueIfNotExistsRequest {
            queue_id: index_id.clone(),
        };
        ingest_api_service
            .ask_for_res(create_queue_req)
            .await
            .unwrap();

        let ingest_req = make_ingest_request(index_id.clone(), 4, 1000, CommitType::Auto);
        ingest_api_service
            .ask_for_res(ingest_req)
            .await
            .map_err(|err| anyhow::anyhow!(err.to_string()))?;

        let (doc_processor_mailbox, doc_processor_inbox) = universe.create_test_mailbox();
        let partition_id: PartitionId = ingest_api_service.ask(GetPartitionId).await?.into();
        let checkpoint_delta = SourceCheckpointDelta::from_partition_delta(
            partition_id.clone(),
            Position::Beginning,
            Position::offset(1200u64),
        )
        .unwrap();

        let source_config = make_source_config();
        let source_runtime = SourceRuntimeBuilder::new(index_uid, source_config)
            .with_mock_metastore(Some(checkpoint_delta))
            .with_queues_dir(queues_dir_path)
            .build();

        let ingest_api_source = IngestApiSource::try_new(source_runtime).await?;
        let ingest_api_source_actor = SourceActor {
            source: Box::new(ingest_api_source),
            doc_processor_mailbox,
        };
        let (_ingest_api_source_mailbox, ingest_api_source_handle) =
            universe.spawn_builder().spawn(ingest_api_source_actor);

        universe.sleep(Duration::from_secs(2)).await;
        let counters = ingest_api_source_handle
            .process_pending_and_observe()
            .await
            .state;
        assert_eq!(
            counters,
            serde_json::json!({
                "previous_offset": 3999u64,
                "current_offset": 3999u64,
                "num_docs_processed": 2799u64
            })
        );
        let doc_batches: Vec<RawDocBatch> = doc_processor_inbox.drain_for_test_typed();
        assert_eq!(doc_batches.len(), 1);
        assert!(&doc_batches[0].docs[0].starts_with(b"001201"));
        assert_eq!(doc_batches[0].checkpoint_delta.num_partitions(), 1);
        assert_eq!(
            doc_batches[0].checkpoint_delta.partitions().next().unwrap(),
            &partition_id
        );
        // TODO: Source deadlocks and test hangs occasionally if we don't quit source first.
        ingest_api_source_handle.quit().await;
        universe.assert_quit().await;

        Ok(())
    }

    #[tokio::test]
    async fn test_ingest_api_source_with_one_doc() -> anyhow::Result<()> {
        let universe = Universe::with_accelerated_time();
        let index_id = append_random_suffix("test-ingest-api-source");
        let index_uid = IndexUid::new_with_random_ulid(&index_id);
        let temp_dir = tempfile::tempdir()?;
        let queues_dir_path = temp_dir.path();
        let ingest_api_service =
            init_ingest_api(&universe, queues_dir_path, &IngestApiConfig::default()).await?;

        let (doc_processor_mailbox, doc_processor_inbox) = universe.create_test_mailbox();
        let source_config = make_source_config();
        let source_runtime = SourceRuntimeBuilder::new(index_uid, source_config)
            .with_queues_dir(queues_dir_path)
            .build();

        let ingest_api_source = IngestApiSource::try_new(source_runtime).await?;
        let ingest_api_source_actor = SourceActor {
            source: Box::new(ingest_api_source),
            doc_processor_mailbox,
        };
        let (_ingest_api_source_mailbox, ingest_api_source_handle) =
            universe.spawn_builder().spawn(ingest_api_source_actor);

        let ingest_req = make_ingest_request(index_id.clone(), 1, 1, CommitType::Auto);
        ingest_api_service
            .ask_for_res(ingest_req)
            .await
            .map_err(|err| anyhow::anyhow!(err.to_string()))?;
        universe.sleep(Duration::from_secs(2)).await;
        let counters = ingest_api_source_handle
            .process_pending_and_observe()
            .await
            .state;
        assert_eq!(
            counters,
            serde_json::json!({
                "previous_offset": 0u64,
                "current_offset": 0u64,
                "num_docs_processed": 1u64
            })
        );
        let doc_batches: Vec<RawDocBatch> = doc_processor_inbox.drain_for_test_typed();
        assert_eq!(doc_batches.len(), 1);
        assert!(&doc_batches[0].docs[0].starts_with(b"000000"));
        // TODO: Source deadlocks and test hangs occasionally if we don't quit source first.
        ingest_api_source_handle.quit().await;
        universe.assert_quit().await;
        Ok(())
    }

    #[tokio::test]
    async fn test_ingest_api_source_with_force_commit() -> anyhow::Result<()> {
        let universe = Universe::with_accelerated_time();
        let index_id = append_random_suffix("test-ingest-api-source");
        let index_uid = IndexUid::new_with_random_ulid(&index_id);
        let temp_dir = tempfile::tempdir()?;
        let queues_dir_path = temp_dir.path();

        let ingest_api_service =
            init_ingest_api(&universe, queues_dir_path, &IngestApiConfig::default()).await?;
        let (doc_processor_mailbox, doc_processor_inbox) = universe.create_test_mailbox();
        let source_config = make_source_config();
        let source_runtime = SourceRuntimeBuilder::new(index_uid, source_config)
            .with_queues_dir(queues_dir_path)
            .build();

        let ingest_api_source = IngestApiSource::try_new(source_runtime).await?;
        let ingest_api_source_actor = SourceActor {
            source: Box::new(ingest_api_source),
            doc_processor_mailbox,
        };
        let (_ingest_api_source_mailbox, ingest_api_source_handle) =
            universe.spawn_builder().spawn(ingest_api_source_actor);

        let ingest_req = make_ingest_request(index_id.clone(), 2, 20_000, CommitType::Force);
        let ingest_res = ingest_api_service
            .send_message(ingest_req)
            .await
            .map_err(|err| anyhow::anyhow!(err.to_string()))?;
        universe.sleep(Duration::from_secs(2)).await;
        let counters = ingest_api_source_handle
            .process_pending_and_observe()
            .await
            .state;
        assert_eq!(
            counters,
            serde_json::json!({
                "previous_offset": 40001u64,
                "current_offset": 40001u64,
                "num_docs_processed": 40000u64
            })
        );
        let doc_batches: Vec<RawDocBatch> = doc_processor_inbox.drain_for_test_typed();
        assert_eq!(doc_batches.len(), 2);
        assert!(doc_batches[1].docs[0].starts_with(b"037736"));
        assert!(doc_batches[0].force_commit);
        assert!(doc_batches[1].force_commit);
        ingest_api_service
            .ask_for_res(SuggestTruncateRequest {
                index_id: index_id.clone(),
                up_to_position_included: 40001,
            })
            .await
            .map_err(|err| anyhow::anyhow!(err.to_string()))?;
        let res = ingest_res
            .await
            .map_err(|err| anyhow::anyhow!(err.to_string()))?
            .map_err(|err| anyhow::anyhow!(err.to_string()))?;
        assert_eq!(res.num_docs_for_processing, 40_000);
        ingest_api_source_handle.quit().await;
        universe.assert_quit().await;
        Ok(())
    }

    #[tokio::test]
    async fn test_ingest_api_source_with_wait() -> anyhow::Result<()> {
        let universe = Universe::with_accelerated_time();
        let index_id = append_random_suffix("test-ingest-api-source");
        let index_uid = IndexUid::new_with_random_ulid(&index_id);
        let temp_dir = tempfile::tempdir()?;
        let queues_dir_path = temp_dir.path();

        let ingest_api_service =
            init_ingest_api(&universe, queues_dir_path, &IngestApiConfig::default()).await?;
        let (doc_processor_mailbox, doc_processor_inbox) = universe.create_test_mailbox();
        let source_config = make_source_config();
        let source_runtime = SourceRuntimeBuilder::new(index_uid, source_config)
            .with_queues_dir(queues_dir_path)
            .build();

        let ingest_api_source = IngestApiSource::try_new(source_runtime).await?;
        let ingest_api_source_actor = SourceActor {
            source: Box::new(ingest_api_source),
            doc_processor_mailbox,
        };
        let (_ingest_api_source_mailbox, ingest_api_source_handle) =
            universe.spawn_builder().spawn(ingest_api_source_actor);
        let ingest_req = make_ingest_request(index_id.clone(), 2, 20_000, CommitType::WaitFor);
        let ingest_res = ingest_api_service
            .send_message(ingest_req)
            .await
            .map_err(|err| anyhow::anyhow!(err.to_string()))?;
        universe.sleep(Duration::from_secs(2)).await;
        let counters = ingest_api_source_handle
            .process_pending_and_observe()
            .await
            .state;
        assert_eq!(
            counters,
            serde_json::json!({
                "previous_offset": 39999u64,
                "current_offset": 39999u64,
                "num_docs_processed": 40000u64
            })
        );
        let doc_batches: Vec<RawDocBatch> = doc_processor_inbox.drain_for_test_typed();
        assert_eq!(doc_batches.len(), 2);
        assert!(doc_batches[1].docs[0].starts_with(b"037736"));
        assert!(!doc_batches[0].force_commit);
        assert!(!doc_batches[1].force_commit);
        ingest_api_service
            .ask_for_res(SuggestTruncateRequest {
                index_id: index_id.clone(),
                up_to_position_included: 39999,
            })
            .await
            .unwrap();
        let res = ingest_res.await.unwrap().unwrap();
        assert_eq!(res.num_docs_for_processing, 40_000);
        ingest_api_source_handle.quit().await;
        universe.assert_quit().await;
        Ok(())
    }

    #[tokio::test]
    async fn test_ingest_api_source_truncate_on_initialize() -> anyhow::Result<()> {
        let universe = Universe::with_accelerated_time();
        let index_id = append_random_suffix("test-ingest-api-source");
        let index_uid = IndexUid::new_with_random_ulid(&index_id);
        let temp_dir = tempfile::tempdir()?;
        let queues_dir_path = temp_dir.path();

        let ingest_api_service =
            init_ingest_api(&universe, queues_dir_path, &IngestApiConfig::default()).await?;
        let (doc_processor_mailbox, _doc_processor_inbox) = universe.create_test_mailbox();
        let source_config = make_source_config();
        let _source_runtime = SourceRuntimeBuilder::new(index_uid.clone(), source_config.clone())
            .with_queues_dir(queues_dir_path)
            .build();

        let create_queue_req = CreateQueueIfNotExistsRequest {
            queue_id: index_id.clone(),
        };
        ingest_api_service
            .ask_for_res(create_queue_req)
            .await
            .unwrap();

        let ingest_req = make_ingest_request(index_id.clone(), 2, 20_000, CommitType::Auto);
        ingest_api_service.ask(ingest_req).await.unwrap().unwrap();

        let fetch_request = FetchRequest {
            index_id: index_id.clone(),
            start_after: None,
            num_bytes_limit: None,
        };
        let FetchResponse { first_position, .. } = ingest_api_service
            .ask(fetch_request.clone())
            .await
            .unwrap()
            .unwrap();
        assert_eq!(first_position, Some(0));

        let partition_id: PartitionId = ingest_api_service.ask(GetPartitionId).await?.into();
        let checkpoint_delta = SourceCheckpointDelta::from_partition_delta(
            partition_id.clone(),
            Position::Beginning,
            Position::offset(10u64),
        )
        .unwrap();

        let source_runtime = SourceRuntimeBuilder::new(index_uid, source_config)
            .with_mock_metastore(Some(checkpoint_delta))
            .with_queues_dir(queues_dir_path)
            .build();

        let ingest_api_source = IngestApiSource::try_new(source_runtime).await?;
        let ingest_api_source_actor = SourceActor {
            source: Box::new(ingest_api_source),
            doc_processor_mailbox,
        };
        let (ingest_api_source_mailbox, ingest_api_source_handle) =
            universe.spawn_builder().spawn(ingest_api_source_actor);

        ingest_api_source_mailbox.ask(Nudge).await.unwrap();
        let FetchResponse { first_position, .. } = ingest_api_service
            .ask(fetch_request.clone())
            .await
            .unwrap()
            .unwrap();
        // We should have truncated to keep only message strictly after the source checkpoint.
        assert_eq!(first_position, Some(11u64));

        ingest_api_source_handle.quit().await;
        universe.assert_quit().await;
        Ok(())
    }
}


================================================
FILE: quickwit/quickwit-indexing/src/source/kafka_source.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::HashMap;
use std::fmt;
use std::time::{Duration, Instant};

use anyhow::{Context, anyhow, bail};
use async_trait::async_trait;
use bytes::Bytes;
use itertools::Itertools;
use oneshot;
use quickwit_actors::{ActorExitStatus, Mailbox};
use quickwit_config::KafkaSourceParams;
use quickwit_metastore::checkpoint::{PartitionId, SourceCheckpoint};
use quickwit_proto::metastore::SourceType;
use quickwit_proto::types::{IndexUid, Position};
use rdkafka::config::{ClientConfig, RDKafkaLogLevel};
use rdkafka::consumer::{
    BaseConsumer, CommitMode, Consumer, ConsumerContext, DefaultConsumerContext, Rebalance,
};
use rdkafka::error::KafkaError;
use rdkafka::message::BorrowedMessage;
use rdkafka::util::Timeout;
use rdkafka::{ClientContext, Message, Offset, TopicPartitionList};
use serde_json::{Value as JsonValue, json};
use tokio::sync::{mpsc, watch};
use tokio::task::{JoinHandle, spawn_blocking};
use tokio::time;
use tracing::{debug, info, warn};

use crate::actors::DocProcessor;
use crate::models::{NewPublishLock, PublishLock};
use crate::source::{
    BATCH_NUM_BYTES_LIMIT, BatchBuilder, EMIT_BATCHES_TIMEOUT, Source, SourceContext,
    SourceRuntime, TypedSourceFactory,
};

type GroupId = String;

/// Factory for instantiating a `KafkaSource`.
pub struct KafkaSourceFactory;

#[async_trait]
impl TypedSourceFactory for KafkaSourceFactory {
    type Source = KafkaSource;
    type Params = KafkaSourceParams;

    async fn typed_create_source(
        source_runtime: SourceRuntime,
        params: KafkaSourceParams,
    ) -> anyhow::Result<Self::Source> {
        KafkaSource::try_new(source_runtime, params).await
    }
}

#[derive(Debug)]
enum KafkaEvent {
    Message(KafkaMessage),
    AssignPartitions {
        partitions: Vec<i32>,
        assignment_tx: oneshot::Sender<Vec<(i32, Offset)>>,
    },
    RevokePartitions {
        ack_tx: oneshot::Sender<()>,
    },
    PartitionEOF(i32),
    Error(anyhow::Error),
}

#[derive(Debug)]
struct KafkaMessage {
    doc_opt: Option<Bytes>,
    payload_len: u64,
    partition: i32,
    offset: i64,
}

impl From<BorrowedMessage<'_>> for KafkaMessage {
    fn from(message: BorrowedMessage<'_>) -> Self {
        Self {
            doc_opt: message_payload_to_doc(&message),
            payload_len: message.payload_len() as u64,
            partition: message.partition(),
            offset: message.offset(),
        }
    }
}

struct RdKafkaContext {
    topic: String,
    events_tx: mpsc::Sender<KafkaEvent>,
}

impl ClientContext for RdKafkaContext {}

macro_rules! return_if_err {
    ($expression:expr, $lit: literal) => {
        match $expression {
            Ok(v) => v,
            Err(_) => {
                debug!(concat!($lit, "the source was dropped"));
                return;
            }
        }
    };
}

/// The rebalance protocol at a very high level:
/// - A consumer joins or leaves a consumer group.
/// - Consumers receive a revoke partitions notification, which gives them the opportunity to commit
///   the work in progress.
/// - Broker waits for ALL the consumers to ack the revoke notification (synchronization barrier).
/// - Consumers receive new partition assignmennts.
///
/// The API of the rebalance callback is better explained in the docs of `librdkafka`:
/// <https://docs.confluent.io/2.0.0/clients/librdkafka/classRdKafka_1_1RebalanceCb.html>
impl ConsumerContext for RdKafkaContext {
    fn pre_rebalance(&self, _consumer: &BaseConsumer<Self>, rebalance: &Rebalance) {
        crate::metrics::INDEXER_METRICS.kafka_rebalance_total.inc();
        quickwit_common::rate_limited_info!(limit_per_min = 3, topic = self.topic, "rebalance");
        if let Rebalance::Revoke(tpl) = rebalance {
            let partitions = collect_partitions(tpl, &self.topic);
            debug!(partitions=?partitions, "revoke partitions");

            let (ack_tx, ack_rx) = oneshot::channel();
            return_if_err!(
                self.events_tx
                    .blocking_send(KafkaEvent::RevokePartitions { ack_tx }),
                "failed to send revoke message to source"
            );
            return_if_err!(ack_rx.recv(), "failed to receive revoke ack from source");
        }
        if let Rebalance::Assign(tpl) = rebalance {
            let partitions = collect_partitions(tpl, &self.topic);
            debug!(partitions=?partitions, "assign partitions");

            let (assignment_tx, assignment_rx) = oneshot::channel();
            return_if_err!(
                self.events_tx.blocking_send(KafkaEvent::AssignPartitions {
                    partitions,
                    assignment_tx,
                }),
                "failed to send assign message to source"
            );
            let assignment = return_if_err!(
                assignment_rx.recv(),
                "failed to receive assignment from source"
            );
            for (partition_id, offset) in assignment {
                let Some(mut partition) = tpl.find_partition(&self.topic, partition_id) else {
                    warn!("partition `{partition_id}` not found in assignment");
                    continue;
                };
                if let Err(error) = partition.set_offset(offset) {
                    warn!(
                        "failed to set offset to `{offset:?}` for partition `{partition_id}`: \
                         {error}"
                    );
                }
            }
        }
    }
}

fn collect_partitions(tpl: &TopicPartitionList, topic: &str) -> Vec<i32> {
    tpl.elements()
        .iter()
        .map(|tple| {
            assert_eq!(tple.topic(), topic);
            tple.partition()
        })
        .collect()
}

type RdKafkaConsumer = BaseConsumer<RdKafkaContext>;

#[derive(Default)]
pub struct KafkaSourceState {
    /// Partitions IDs assigned to the source.
    pub assigned_partitions: HashMap<i32, PartitionId>,
    /// Offset for each partition of the last message received.
    pub current_positions: HashMap<i32, Position>,
    /// Number of inactive partitions, i.e., that have reached EOF.
    pub num_inactive_partitions: usize,
    /// Number of bytes processed by the source.
    pub num_bytes_processed: u64,
    /// Number of messages processed by the source (including invalid messages).
    pub num_messages_processed: u64,
    // Number of invalid messages, i.e., that were empty or could not be parsed.
    pub num_invalid_messages: u64,
    /// Number of rebalances the consumer went through.
    pub num_rebalances: usize,
}

/// A `KafkaSource` consumes a topic and forwards its messages to an `Indexer`.
pub struct KafkaSource {
    source_runtime: SourceRuntime,
    topic: String,
    group_id: GroupId,
    state: KafkaSourceState,
    backfill_mode_enabled: bool,
    events_rx: mpsc::Receiver<KafkaEvent>,
    truncate_tx: watch::Sender<SourceCheckpoint>,
    poll_loop_jh: JoinHandle<()>,
    publish_lock: PublishLock,
}

impl fmt::Debug for KafkaSource {
    fn fmt(&self, formatter: &mut fmt::Formatter) -> fmt::Result {
        formatter
            .debug_struct("KafkaSource")
            .field("index_uid", self.source_runtime.index_uid())
            .field("source_id", &self.source_runtime.source_id())
            .field("topic", &self.topic)
            .finish()
    }
}

impl KafkaSource {
    /// Instantiates a new `KafkaSource`.
    pub async fn try_new(
        source_runtime: SourceRuntime,
        source_params: KafkaSourceParams,
    ) -> anyhow::Result<Self> {
        let topic = source_params.topic.clone();
        let backfill_mode_enabled = source_params.enable_backfill_mode;

        let (events_tx, events_rx) = mpsc::channel(100);
        let (truncate_tx, truncate_rx) = watch::channel(SourceCheckpoint::default());
        let (client_config, consumer, group_id) = create_consumer(
            source_runtime.index_uid(),
            source_runtime.source_id(),
            source_params,
            events_tx.clone(),
        )?;
        let native_client_config = client_config.create_native_config()?;
        let session_timeout_ms = native_client_config
            .get("session.timeout.ms")?
            .parse::<u64>()?;
        let max_poll_interval_ms = native_client_config
            .get("max.poll.interval.ms")?
            .parse::<u64>()?;

        let poll_loop_jh =
            spawn_consumer_poll_loop(consumer, topic.clone(), events_tx, truncate_rx);
        let publish_lock = PublishLock::default();

        info!(
            index_uid=%source_runtime.index_uid(),
            source_id=%source_runtime.source_id(),
            topic,
            group_id,
            max_poll_interval_ms,
            session_timeout_ms,
            "starting Kafka source"
        );
        if max_poll_interval_ms <= 60_000 {
            warn!(
                "`max.poll.interval.ms` is set to a short duration that may cause the source to \
                 crash when back pressure from the indexer occurs. The recommended value is \
                 `300000` (5 minutes)."
            );
        }
        Ok(KafkaSource {
            source_runtime,
            topic,
            group_id,
            state: KafkaSourceState::default(),
            backfill_mode_enabled,
            events_rx,
            truncate_tx,
            poll_loop_jh,
            publish_lock,
        })
    }

    async fn process_message(
        &mut self,
        message: KafkaMessage,
        batch: &mut BatchBuilder,
    ) -> anyhow::Result<()> {
        let KafkaMessage {
            doc_opt,
            payload_len,
            partition,
            offset,
            ..
        } = message;

        if let Some(doc) = doc_opt {
            batch.add_doc(doc);
        } else {
            self.state.num_invalid_messages += 1;
        }
        self.state.num_bytes_processed += payload_len;
        self.state.num_messages_processed += 1;

        let partition_id = self
            .state
            .assigned_partitions
            .get(&partition)
            .ok_or_else(|| {
                anyhow::anyhow!(
                    "received message from unassigned partition `{}`. Assigned partitions: \
                     `{{{}}}`",
                    partition,
                    self.state.assigned_partitions.keys().join(", "),
                )
            })?
            .clone();
        let current_position = Position::offset(offset);
        let previous_position = self
            .state
            .current_positions
            .insert(partition, current_position.clone())
            .unwrap_or_else(|| previous_position_for_offset(offset));
        batch
            .checkpoint_delta
            .record_partition_delta(partition_id, previous_position, current_position)
            .context("failed to record partition delta")?;
        Ok(())
    }

    async fn process_assign_partitions(
        &mut self,
        ctx: &SourceContext,
        partitions: &[i32],
        assignment_tx: oneshot::Sender<Vec<(i32, Offset)>>,
    ) -> anyhow::Result<()> {
        let checkpoint = ctx
            .protect_future(self.source_runtime.fetch_checkpoint())
            .await?;

        self.state.assigned_partitions.clear();
        self.state.current_positions.clear();
        self.state.num_inactive_partitions = 0;

        let mut next_offsets: Vec<(i32, Offset)> = Vec::with_capacity(partitions.len());

        for &partition in partitions {
            let partition_id = PartitionId::from(partition as i64);

            self.state
                .assigned_partitions
                .insert(partition, partition_id.clone());

            let Some(current_position) = checkpoint.position_for_partition(&partition_id).cloned()
            else {
                continue;
            };
            let next_offset = match &current_position {
                Position::Beginning => Offset::Beginning,
                Position::Offset(offset) => {
                    let offset = offset
                        .as_i64()
                        .expect("Kafka offset should be stored as i64");
                    Offset::Offset(offset + 1)
                }
                Position::Eof(_) => {
                    panic!("position of a Kafka partition should never be EOF")
                }
            };
            self.state
                .current_positions
                .insert(partition, current_position);
            next_offsets.push((partition, next_offset));
        }
        info!(
            index_id=%self.source_runtime.index_id(),
            source_id=%self.source_runtime.source_id(),
            topic=%self.topic,
            group_id=%self.group_id,
            partitions=?partitions,
            "new partition assignment after rebalance",
        );
        assignment_tx
            .send(next_offsets)
            .context("Kafka consumer context was dropped")?;
        Ok(())
    }

    async fn process_revoke_partitions(
        &mut self,
        ctx: &SourceContext,
        doc_processor_mailbox: &Mailbox<DocProcessor>,
        batch: &mut BatchBuilder,
        ack_tx: oneshot::Sender<()>,
    ) -> anyhow::Result<()> {
        ctx.protect_future(self.publish_lock.kill()).await;
        ack_tx
            .send(())
            .context("Kafka consumer context was dropped")?;

        batch.clear();
        self.publish_lock = PublishLock::default();
        self.state.num_rebalances += 1;
        ctx.send_message(
            doc_processor_mailbox,
            NewPublishLock(self.publish_lock.clone()),
        )
        .await?;
        Ok(())
    }

    fn process_partition_eof(&mut self, partition: i32) {
        self.state.num_inactive_partitions += 1;

        info!(
            topic=%self.topic,
            partition=%partition,
            num_inactive_partitions=?self.state.num_inactive_partitions,
            "reached end of partition"
        );
    }

    fn should_exit(&self) -> bool {
        self.backfill_mode_enabled
            // This check ensures that we don't shutdown the source before the first partition assignment.
            && self.state.num_inactive_partitions > 0
            && self.state.num_inactive_partitions == self.state.assigned_partitions.len()
    }

    fn truncate(&self, checkpoint: SourceCheckpoint) -> anyhow::Result<()> {
        self.truncate_tx
            .send(checkpoint)
            .context("Kafka consumer was dropped")?;
        Ok(())
    }
}

#[async_trait]
impl Source for KafkaSource {
    async fn initialize(
        &mut self,
        doc_processor_mailbox: &Mailbox<DocProcessor>,
        ctx: &SourceContext,
    ) -> Result<(), ActorExitStatus> {
        let publish_lock = self.publish_lock.clone();
        ctx.send_message(doc_processor_mailbox, NewPublishLock(publish_lock))
            .await?;
        Ok(())
    }

    async fn emit_batches(
        &mut self,
        doc_processor_mailbox: &Mailbox<DocProcessor>,
        ctx: &SourceContext,
    ) -> Result<Duration, ActorExitStatus> {
        let now = Instant::now();
        let mut batch_builder = BatchBuilder::new(SourceType::Kafka);
        let deadline = time::sleep(*EMIT_BATCHES_TIMEOUT);
        tokio::pin!(deadline);

        loop {
            tokio::select! {
                event_opt = self.events_rx.recv() => {
                    let event = event_opt.ok_or_else(|| ActorExitStatus::from(anyhow!("consumer was dropped")))?;
                    match event {
                        KafkaEvent::Message(message) => self.process_message(message, &mut batch_builder).await?,
                        KafkaEvent::AssignPartitions { partitions, assignment_tx} => self.process_assign_partitions(ctx, &partitions, assignment_tx).await?,
                        KafkaEvent::RevokePartitions { ack_tx } => self.process_revoke_partitions(ctx, doc_processor_mailbox, &mut batch_builder, ack_tx).await?,
                        KafkaEvent::PartitionEOF(partition) => self.process_partition_eof(partition),
                        KafkaEvent::Error(error) => Err(ActorExitStatus::from(error))?,
                    }
                    if batch_builder.num_bytes >= BATCH_NUM_BYTES_LIMIT {
                        break;
                    }
                }
                _ = &mut deadline => {
                    break;
                }
            }
            ctx.record_progress();
        }
        if !batch_builder.checkpoint_delta.is_empty() {
            debug!(
                num_docs=%batch_builder.docs.len(),
                num_bytes=%batch_builder.num_bytes,
                num_millis=%now.elapsed().as_millis(),
                "sending doc batch to indexer"
            );
            let message = batch_builder.build();
            ctx.send_message(doc_processor_mailbox, message).await?;
        }
        if self.should_exit() {
            info!(topic = %self.topic, "reached end of topic");
            ctx.send_exit_with_success(doc_processor_mailbox).await?;
            return Err(ActorExitStatus::Success);
        }
        Ok(Duration::default())
    }

    async fn suggest_truncate(
        &mut self,
        checkpoint: SourceCheckpoint,
        _ctx: &SourceContext,
    ) -> anyhow::Result<()> {
        self.truncate(checkpoint)?;
        Ok(())
    }

    async fn finalize(
        &mut self,
        _exit_status: &ActorExitStatus,
        _ctx: &SourceContext,
    ) -> anyhow::Result<()> {
        self.poll_loop_jh.abort();
        Ok(())
    }

    fn name(&self) -> String {
        format!("{self:?}")
    }

    fn observable_state(&self) -> JsonValue {
        let assigned_partitions: Vec<&i32> =
            self.state.assigned_partitions.keys().sorted().collect();
        let current_positions: Vec<(&i32, &Position)> =
            self.state.current_positions.iter().sorted().collect();
        json!({
            "index_id": self.source_runtime.index_id(),
            "source_id": self.source_runtime.source_id(),
            "topic": self.topic,
            "assigned_partitions": assigned_partitions,
            "current_positions": current_positions,
            "num_inactive_partitions": self.state.num_inactive_partitions,
            "num_bytes_processed": self.state.num_bytes_processed,
            "num_messages_processed": self.state.num_messages_processed,
            "num_invalid_messages": self.state.num_invalid_messages,
            "num_rebalances": self.state.num_rebalances,
        })
    }
}

// `rust-rdkafka` provides an async API via `StreamConsumer` for consuming topics asynchronously,
// BUT the async calls to `recev()` end up being sync when a rebalance occurs because the rebalance
// callback is sync. Until `rust-rdkafka` offers a fully asynchronous API, we poll the consumer in a
// blocking tokio task and handle the rebalance events via message passing between the rebalance
// callback and the source.
fn spawn_consumer_poll_loop(
    consumer: RdKafkaConsumer,
    topic: String,
    events_tx: mpsc::Sender<KafkaEvent>,
    mut truncate_rx: watch::Receiver<SourceCheckpoint>,
) -> JoinHandle<()> {
    spawn_blocking(move || {
        // `subscribe()` returns immediately but triggers the execution of synchronous code (e.g.
        // rebalance callback) so it must be called in a blocking task.
        //
        // From the librdkafka docs:
        // `subscribe()` is an asynchronous method which returns immediately: background threads
        // will (re)join the group, wait for group rebalance, issue any registered rebalance_cb,
        // assign() the assigned partitions, and then start fetching messages.
        if let Err(error) = consumer.subscribe(&[&topic]) {
            let _ = events_tx.blocking_send(KafkaEvent::Error(anyhow!(error)));
            return;
        }
        while !events_tx.is_closed() {
            if let Some(message_res) = consumer.poll(Some(Duration::from_secs(1))) {
                let event = match message_res {
                    Ok(message) => KafkaEvent::Message(message.into()),
                    Err(KafkaError::PartitionEOF(partition)) => KafkaEvent::PartitionEOF(partition),
                    Err(error) => KafkaEvent::Error(anyhow!(error)),
                };
                // When the source experiences backpressure, this channel becomes full and the
                // consumer might not call `poll()` for a duration that exceeds
                // `max.poll.interval.ms`. When that happens the consumer is kicked out of the group
                // and the source fails. This should not happen in practice with a
                // sufficiently large value for `max.poll.interval.ms`. The default value is 5
                // minutes.
                if events_tx.blocking_send(event).is_err() {
                    break;
                }
            }
            if let Ok(true) = truncate_rx.has_changed() {
                let checkpoint = truncate_rx.borrow_and_update();

                let mut tpl = TopicPartitionList::new();
                for (partition_id, position) in checkpoint.iter() {
                    let partition = partition_id
                        .as_i64()
                        .expect("Kafka partition should be stored as i64.")
                        as i32;
                    // Quickwit positions are inclusive whereas Kafka offsets are exclusive, hence
                    // the increment by 1.
                    let next_position = position
                        .as_i64()
                        .expect("Kafka offset should be stored as i64.")
                        + 1;
                    let offset = Offset::Offset(next_position);
                    tpl.add_partition_offset(&topic, partition, offset)
                        .expect("The offset should be valid.");
                }
                if let Err(error) = consumer.commit(&tpl, CommitMode::Async) {
                    warn!(error=?error, "failed to commit offsets");
                }
            }
        }
        debug!("exiting consumer poll loop");
        consumer.unsubscribe();
    })
}

/// Returns the preceding `Position` for the offset.
fn previous_position_for_offset(offset: i64) -> Position {
    if offset == 0 {
        Position::Beginning
    } else {
        Position::offset(offset - 1)
    }
}

/// Checks whether we can establish a connection to the Kafka broker.
pub(super) async fn check_connectivity(params: KafkaSourceParams) -> anyhow::Result<()> {
    let mut client_config = parse_client_params(params.client_params)?;

    let consumer: BaseConsumer<DefaultConsumerContext> = client_config
        .set("group.id", "quickwit-connectivity-check".to_string())
        .set_log_level(RDKafkaLogLevel::Error)
        .create()?;

    let topic = params.topic.clone();
    let timeout = Timeout::After(Duration::from_secs(5));
    let cluster_metadata = spawn_blocking(move || {
        consumer
            .fetch_metadata(Some(&topic), timeout)
            .with_context(|| format!("failed to fetch metadata for topic `{topic}`"))
    })
    .await??;

    if cluster_metadata.topics().is_empty() {
        bail!("topic `{}` does not exist", params.topic);
    }
    let topic_metadata = &cluster_metadata.topics()[0];
    assert_eq!(topic_metadata.name(), params.topic); // Belt and suspenders.

    if topic_metadata.partitions().is_empty() {
        bail!("topic `{}` has no partitions", params.topic);
    }
    Ok(())
}

/// Creates a new `KafkaSourceConsumer`.
fn create_consumer(
    index_uid: &IndexUid,
    source_id: &str,
    params: KafkaSourceParams,
    events_tx: mpsc::Sender<KafkaEvent>,
) -> anyhow::Result<(ClientConfig, RdKafkaConsumer, GroupId)> {
    // Group ID is limited to 255 characters.
    let mut group_id = match &params.client_params["group.id"] {
        JsonValue::String(group_id) => group_id.clone(),
        _ => format!("quickwit-{index_uid}-{source_id}"),
    };
    group_id.truncate(255);

    let mut client_config = parse_client_params(params.client_params)?;

    let log_level = parse_client_log_level(params.client_log_level)?;
    let consumer: RdKafkaConsumer = client_config
        .set("enable.auto.commit", "false") // We manage offsets ourselves: we always want to set this value to `false`.
        .set(
            "enable.partition.eof",
            params.enable_backfill_mode.to_string(),
        )
        .set("group.id", &group_id)
        .set_log_level(log_level)
        .create_with_context(RdKafkaContext {
            topic: params.topic,
            events_tx,
        })
        .context("failed to create Kafka consumer")?;

    Ok((client_config, consumer, group_id))
}

fn parse_client_log_level(client_log_level: Option<String>) -> anyhow::Result<RDKafkaLogLevel> {
    let log_level = match client_log_level
        .map(|log_level| log_level.to_lowercase())
        .as_deref()
    {
        Some("debug") => RDKafkaLogLevel::Debug,
        Some("info") | None => RDKafkaLogLevel::Info,
        Some("warn") | Some("warning") => RDKafkaLogLevel::Warning,
        Some("error") => RDKafkaLogLevel::Error,
        Some("critical") => RDKafkaLogLevel::Critical,
        Some("alert") => RDKafkaLogLevel::Alert,
        Some("emerg") => RDKafkaLogLevel::Emerg,
        Some(level) => bail!(
            "failed to parse Kafka client log level. value `{}` is not supported",
            level
        ),
    };
    Ok(log_level)
}

fn parse_client_params(client_params: JsonValue) -> anyhow::Result<ClientConfig> {
    let params = if let JsonValue::Object(params) = client_params {
        params
    } else {
        bail!("failed to parse Kafka client parameters. `client_params` must be a JSON object");
    };
    let mut client_config = ClientConfig::new();
    for (key, value_json) in params {
        let value = match value_json {
            JsonValue::Bool(value_bool) => value_bool.to_string(),
            JsonValue::Number(value_number) => value_number.to_string(),
            JsonValue::String(value_string) => value_string,
            JsonValue::Null => continue,
            JsonValue::Array(_) | JsonValue::Object(_) => bail!(
                "failed to parse Kafka client parameters. `client_params.{}` must be a boolean, \
                 number, or string",
                key
            ),
        };
        client_config.set(key, value);
    }
    Ok(client_config)
}

/// Returns the message payload as a `Bytes` object if it exists and is not empty.
fn message_payload_to_doc(message: &BorrowedMessage) -> Option<Bytes> {
    match message.payload() {
        Some(payload) if !payload.is_empty() => {
            let doc = Bytes::from(payload.to_vec());
            return Some(doc);
        }
        Some(_) => debug!(
            topic=%message.topic(),
            partition=%message.partition(),
            offset=%message.offset(),
            timestamp=?message.timestamp(),
            "Document is empty."
        ),
        None => debug!(
            topic=%message.topic(),
            partition=%message.partition(),
            offset=%message.offset(),
            timestamp=?message.timestamp(),
            "Message payload is empty."
        ),
    }
    None
}

#[cfg(all(test, feature = "kafka-broker-tests"))]
mod kafka_broker_tests {
    use std::num::NonZeroUsize;

    use quickwit_actors::{ActorContext, Universe};
    use quickwit_common::rand::append_random_suffix;
    use quickwit_config::{SourceConfig, SourceInputFormat, SourceParams};
    use quickwit_metastore::checkpoint::SourceCheckpointDelta;
    use quickwit_metastore::metastore_for_test;
    use quickwit_proto::types::IndexUid;
    use rdkafka::admin::{AdminClient, AdminOptions, NewTopic, TopicReplication};
    use rdkafka::client::DefaultClientContext;
    use rdkafka::message::ToBytes;
    use rdkafka::producer::{FutureProducer, FutureRecord};
    use tokio::sync::watch;

    use super::*;
    use crate::source::test_setup_helper::setup_index;
    use crate::source::tests::SourceRuntimeBuilder;
    use crate::source::{RawDocBatch, SourceActor, quickwit_supported_sources};

    fn create_base_consumer(group_id: &str) -> BaseConsumer {
        ClientConfig::new()
            .set("bootstrap.servers", "localhost:9092")
            .set("group.id", group_id)
            .create()
            .unwrap()
    }

    fn create_admin_client() -> AdminClient<DefaultClientContext> {
        ClientConfig::new()
            .set("bootstrap.servers", "localhost:9092")
            .create()
            .unwrap()
    }

    async fn create_topic(
        admin_client: &AdminClient<DefaultClientContext>,
        topic: &str,
        num_partitions: i32,
    ) -> anyhow::Result<()> {
        admin_client
            .create_topics(
                &[NewTopic::new(
                    topic,
                    num_partitions,
                    TopicReplication::Fixed(1),
                )],
                &AdminOptions::new().operation_timeout(Some(Duration::from_secs(5))),
            )
            .await?
            .into_iter()
            .collect::<Result<Vec<_>, _>>()
            .map_err(|(topic, err_code)| {
                anyhow::anyhow!(
                    "failed to create topic `{}`. error code: `{}`",
                    topic,
                    err_code
                )
            })?;
        Ok(())
    }

    async fn populate_topic<K, M, J, Q>(
        topic: &str,
        num_messages: i32,
        key_fn: &K,
        message_fn: &M,
        partition: Option<i32>,
        timestamp: Option<i64>,
    ) -> anyhow::Result<HashMap<(i32, i64), i32>>
    where
        K: Fn(i32) -> J,
        M: Fn(i32) -> Q,
        J: ToBytes,
        Q: ToBytes,
    {
        let producer: &FutureProducer = &ClientConfig::new()
            .set("bootstrap.servers", "localhost:9092")
            .set("statistics.interval.ms", "500")
            .set("api.version.request", "true")
            .set("debug", "all")
            .set("message.timeout.ms", "30000")
            .create()?;
        let tasks = (0..num_messages).map(|id| async move {
            producer
                .send(
                    FutureRecord {
                        topic,
                        partition,
                        timestamp,
                        key: Some(&key_fn(id)),
                        payload: Some(&message_fn(id)),
                        headers: None,
                    },
                    Duration::from_secs(1),
                )
                .await
                .map(|delivery| (id, delivery.partition, delivery.offset))
                .map_err(|(err, _)| err)
        });
        let message_map = futures::future::try_join_all(tasks)
            .await?
            .into_iter()
            .fold(HashMap::new(), |mut acc, (id, partition, offset)| {
                acc.insert((partition, offset), id);
                acc
            });
        Ok(message_map)
    }

    fn key_fn(id: i32) -> String {
        format!("Key {id}")
    }

    fn get_source_config(topic: &str, auto_offset_reset: &str) -> (String, SourceConfig) {
        let source_id = append_random_suffix("test-kafka-source--source");
        // Setting explicitly ip v4 with `broker.address.family` is required
        // because of https://github.com/fede1024/rust-rdkafka/issues/809
        let source_config = SourceConfig {
            source_id: source_id.clone(),
            num_pipelines: NonZeroUsize::MIN,
            enabled: true,
            source_params: SourceParams::Kafka(KafkaSourceParams {
                topic: topic.to_string(),
                client_log_level: None,
                client_params: json!({
                    "auto.offset.reset": auto_offset_reset,
                    "bootstrap.servers": "localhost:9092",
                    "broker.address.family": "v4",
                }),
                enable_backfill_mode: true,
            }),
            transform_config: None,
            input_format: SourceInputFormat::Json,
        };
        (source_id, source_config)
    }

    fn merge_doc_batches(batches: Vec<RawDocBatch>) -> anyhow::Result<RawDocBatch> {
        let mut merged_batch = RawDocBatch::default();
        for batch in batches {
            merged_batch.docs.extend(batch.docs);
            merged_batch
                .checkpoint_delta
                .extend(batch.checkpoint_delta)?;
        }
        merged_batch.docs.sort();
        Ok(merged_batch)
    }

    #[tokio::test]
    async fn test_kafka_source_process_message() {
        let admin_client = create_admin_client();
        let topic = append_random_suffix("test-kafka-source--process-message--topic");
        create_topic(&admin_client, &topic, 2).await.unwrap();

        let index_id = append_random_suffix("test-kafka-source--process-message--index");
        let index_uid = IndexUid::new_with_random_ulid(&index_id);
        let (_source_id, source_config) = get_source_config(&topic, "earliest");
        let SourceParams::Kafka(params) = source_config.clone().source_params else {
            panic!(
                "Expected Kafka source params, got {:?}.",
                source_config.source_params
            );
        };
        let source_runtime = SourceRuntimeBuilder::new(index_uid, source_config).build();
        let mut kafka_source = KafkaSource::try_new(source_runtime, params).await.unwrap();

        let partition_id_1 = PartitionId::from(1u64);
        let partition_id_2 = PartitionId::from(2u64);

        kafka_source.state.assigned_partitions =
            HashMap::from_iter([(1, partition_id_1.clone()), (2, partition_id_2.clone())]);

        assert_eq!(kafka_source.state.num_messages_processed, 0);
        assert_eq!(kafka_source.state.num_invalid_messages, 0);

        let mut batch_builder = BatchBuilder::new(SourceType::Kafka);

        let message = KafkaMessage {
            doc_opt: None,
            payload_len: 7,
            partition: 1,
            offset: 0,
        };
        kafka_source
            .process_message(message, &mut batch_builder)
            .await
            .unwrap();

        assert_eq!(batch_builder.docs.len(), 0);
        assert_eq!(batch_builder.num_bytes, 0);
        assert_eq!(
            kafka_source.state.current_positions.get(&1).unwrap(),
            &Position::offset(0u64)
        );
        assert_eq!(kafka_source.state.num_bytes_processed, 7);
        assert_eq!(kafka_source.state.num_messages_processed, 1);
        assert_eq!(kafka_source.state.num_invalid_messages, 1);

        let message = KafkaMessage {
            doc_opt: Some(Bytes::from_static(b"test-doc")),
            payload_len: 8,
            partition: 1,
            offset: 1,
        };
        kafka_source
            .process_message(message, &mut batch_builder)
            .await
            .unwrap();

        assert_eq!(batch_builder.docs.len(), 1);
        assert_eq!(batch_builder.docs[0], "test-doc");
        assert_eq!(batch_builder.num_bytes, 8);
        assert_eq!(
            kafka_source.state.current_positions.get(&1).unwrap(),
            &Position::offset(1u64)
        );
        assert_eq!(kafka_source.state.num_bytes_processed, 15);
        assert_eq!(kafka_source.state.num_messages_processed, 2);
        assert_eq!(kafka_source.state.num_invalid_messages, 1);

        let message = KafkaMessage {
            doc_opt: Some(Bytes::from_static(b"test-doc")),
            payload_len: 8,
            partition: 2,
            offset: 42,
        };
        kafka_source
            .process_message(message, &mut batch_builder)
            .await
            .unwrap();

        assert_eq!(batch_builder.docs.len(), 2);
        assert_eq!(batch_builder.docs[1], "test-doc");
        assert_eq!(batch_builder.num_bytes, 16);
        assert_eq!(
            kafka_source.state.current_positions.get(&2).unwrap(),
            &Position::offset(42u64)
        );
        assert_eq!(kafka_source.state.num_bytes_processed, 23);
        assert_eq!(kafka_source.state.num_messages_processed, 3);
        assert_eq!(kafka_source.state.num_invalid_messages, 1);

        let mut expected_checkpoint_delta = SourceCheckpointDelta::default();
        expected_checkpoint_delta
            .record_partition_delta(partition_id_1, Position::Beginning, Position::offset(1u64))
            .unwrap();
        expected_checkpoint_delta
            .record_partition_delta(
                partition_id_2,
                Position::offset(41u64),
                Position::offset(42u64),
            )
            .unwrap();
        assert_eq!(batch_builder.checkpoint_delta, expected_checkpoint_delta);

        // Message from unassigned partition
        let message = KafkaMessage {
            doc_opt: Some(Bytes::from_static(b"test-doc")),
            payload_len: 8,
            partition: 3,
            offset: 42,
        };
        kafka_source
            .process_message(message, &mut batch_builder)
            .await
            .unwrap_err();
    }

    #[tokio::test]
    async fn test_kafka_source_process_assign_partitions() {
        let admin_client = create_admin_client();
        let topic = append_random_suffix("test-kafka-source--process-assign-partitions--topic");
        create_topic(&admin_client, &topic, 2).await.unwrap();

        let metastore = metastore_for_test();
        let index_id = append_random_suffix("test-kafka-source--process-assign-partitions--index");
        let (_source_id, source_config) = get_source_config(&topic, "earliest");

        let index_uid = setup_index(
            metastore.clone(),
            &index_id,
            &source_config,
            &[(
                PartitionId::from(2u64),
                Position::Beginning,
                Position::offset(42u64),
            )],
        )
        .await;

        let SourceParams::Kafka(params) = source_config.clone().source_params else {
            panic!(
                "Expected Kafka source params, got {:?}.",
                source_config.source_params
            );
        };
        let source_runtime = SourceRuntimeBuilder::new(index_uid, source_config)
            .with_metastore(metastore)
            .build();
        let mut kafka_source = KafkaSource::try_new(source_runtime, params).await.unwrap();
        kafka_source.state.num_inactive_partitions = 1;

        let universe = Universe::with_accelerated_time();
        let (source_mailbox, _source_inbox) = universe.create_test_mailbox();
        let (observable_state_tx, _observable_state_rx) = watch::channel(json!({}));
        let ctx: ActorContext<SourceActor> =
            ActorContext::for_test(&universe, source_mailbox, observable_state_tx);
        let (assignment_tx, assignment_rx) = oneshot::channel();

        kafka_source
            .process_assign_partitions(&ctx, &[1, 2], assignment_tx)
            .await
            .unwrap();

        assert_eq!(kafka_source.state.num_inactive_partitions, 0);

        let expected_assigned_partitions =
            HashMap::from_iter([(1, PartitionId::from(1u64)), (2, PartitionId::from(2u64))]);
        assert_eq!(
            kafka_source.state.assigned_partitions,
            expected_assigned_partitions
        );
        let expected_current_positions = HashMap::from_iter([(2, Position::offset(42u64))]);
        assert_eq!(
            kafka_source.state.current_positions,
            expected_current_positions
        );

        let assignment = assignment_rx.await.unwrap();
        assert_eq!(assignment, &[(2, Offset::Offset(43))])
    }

    #[tokio::test]
    async fn test_kafka_source_process_revoke_partitions() {
        let admin_client = create_admin_client();
        let topic = append_random_suffix("test-kafka-source--process-revoke-partitions--topic");
        create_topic(&admin_client, &topic, 1).await.unwrap();

        let index_id = append_random_suffix("test-kafka-source--process-revoke--partitions--index");
        let index_uid = IndexUid::new_with_random_ulid(&index_id);
        let (_source_id, source_config) = get_source_config(&topic, "earliest");
        let SourceParams::Kafka(params) = source_config.clone().source_params else {
            panic!(
                "Expected Kafka source params, got {:?}.",
                source_config.source_params
            );
        };
        let source_runtime = SourceRuntimeBuilder::new(index_uid, source_config).build();
        let mut kafka_source = KafkaSource::try_new(source_runtime, params).await.unwrap();

        let universe = Universe::with_accelerated_time();
        let (source_mailbox, _source_inbox) = universe.create_test_mailbox();
        let (indexer_mailbox, indexer_inbox) = universe.create_test_mailbox();
        let (observable_state_tx, _observable_state_rx) = watch::channel(json!({}));
        let ctx: ActorContext<SourceActor> =
            ActorContext::for_test(&universe, source_mailbox, observable_state_tx);
        let (ack_tx, ack_rx) = oneshot::channel();

        let mut batch_builder = BatchBuilder::new(SourceType::Kafka);
        batch_builder.add_doc(Bytes::from_static(b"test-doc"));

        let publish_lock = kafka_source.publish_lock.clone();
        assert!(publish_lock.is_alive());
        assert_eq!(kafka_source.state.num_rebalances, 0);

        kafka_source
            .process_revoke_partitions(&ctx, &indexer_mailbox, &mut batch_builder, ack_tx)
            .await
            .unwrap();

        ack_rx.await.unwrap();
        assert!(batch_builder.docs.is_empty());
        assert!(publish_lock.is_dead());

        assert_eq!(kafka_source.state.num_rebalances, 1);

        let indexer_messages: Vec<NewPublishLock> = indexer_inbox.drain_for_test_typed();
        assert_eq!(indexer_messages.len(), 1);
        assert!(indexer_messages[0].0.is_alive());
    }

    #[tokio::test]
    async fn test_kafka_source_process_partition_eof() {
        let admin_client = create_admin_client();
        let topic = append_random_suffix("test-kafka-source--process-partition-eof--topic");
        create_topic(&admin_client, &topic, 1).await.unwrap();

        let index_id = append_random_suffix("test-kafka-source--process-partition-eof--index");
        let index_uid = IndexUid::new_with_random_ulid(&index_id);
        let (_source_id, source_config) = get_source_config(&topic, "earliest");
        let SourceParams::Kafka(params) = source_config.clone().source_params else {
            panic!(
                "Expected Kafka source params, got {:?}.",
                source_config.source_params
            );
        };
        let source_runtime = SourceRuntimeBuilder::new(index_uid, source_config).build();
        let mut kafka_source = KafkaSource::try_new(source_runtime, params).await.unwrap();
        let partition_id_1 = PartitionId::from(1u64);
        kafka_source.state.assigned_partitions = HashMap::from_iter([(1, partition_id_1)]);

        assert!(!kafka_source.should_exit());

        kafka_source.process_partition_eof(1);
        assert_eq!(kafka_source.state.num_inactive_partitions, 1);
        assert!(kafka_source.should_exit());

        kafka_source.backfill_mode_enabled = false;
        assert!(!kafka_source.should_exit());
    }

    #[tokio::test]
    async fn test_kafka_source_suggest_truncate() {
        let admin_client = create_admin_client();
        let topic = append_random_suffix("test-kafka-source--suggest-truncate--topic");
        create_topic(&admin_client, &topic, 2).await.unwrap();

        let metastore = metastore_for_test();
        let index_id = append_random_suffix("test-kafka-source--suggest-truncate--index");
        let (_source_id, source_config) = get_source_config(&topic, "earliest");
        let index_uid = setup_index(
            metastore.clone(),
            &index_id,
            &source_config,
            &[(
                PartitionId::from(2u64),
                Position::Beginning,
                Position::offset(42u64),
            )],
        )
        .await;

        let SourceParams::Kafka(params) = source_config.clone().source_params else {
            panic!(
                "Expected Kafka source params, got {:?}.",
                source_config.source_params
            );
        };
        let source_runtime = SourceRuntimeBuilder::new(index_uid, source_config)
            .with_metastore(metastore)
            .build();
        let mut kafka_source = KafkaSource::try_new(source_runtime, params).await.unwrap();

        let universe = Universe::with_accelerated_time();
        let (source_mailbox, _source_inbox) = universe.create_test_mailbox();
        let (observable_state_tx, _observable_state_rx) = watch::channel(json!({}));
        let ctx: ActorContext<SourceActor> =
            ActorContext::for_test(&universe, source_mailbox, observable_state_tx);

        let KafkaEvent::AssignPartitions {
            partitions,
            assignment_tx,
        } = kafka_source.events_rx.recv().await.unwrap()
        else {
            panic!("Expected `AssignPartitions` event.");
        };
        kafka_source
            .process_assign_partitions(&ctx, &partitions, assignment_tx)
            .await
            .unwrap();

        let checkpoint: SourceCheckpoint = [(0u64, 1u64), (1u64, 2u64)]
            .into_iter()
            .map(|(partition_id, offset)| {
                (PartitionId::from(partition_id), Position::offset(offset))
            })
            .collect();
        kafka_source.truncate(checkpoint).unwrap();

        tokio::time::sleep(Duration::from_secs(1)).await;

        let mut tpl = TopicPartitionList::new();
        tpl.add_partition(&topic, 0);
        tpl.add_partition(&topic, 1);

        let consumer = create_base_consumer(&kafka_source.group_id);
        let committed_offsets = consumer
            .committed_offsets(tpl.clone(), Duration::from_secs(10))
            .unwrap();

        assert_eq!(
            committed_offsets
                .find_partition(&topic, 0)
                .unwrap()
                .offset(),
            Offset::Offset(2)
        );
        assert_eq!(
            committed_offsets
                .find_partition(&topic, 1)
                .unwrap()
                .offset(),
            Offset::Offset(3)
        );
    }

    #[tokio::test]
    async fn test_kafka_source() -> anyhow::Result<()> {
        let universe = Universe::with_accelerated_time();
        let admin_client = create_admin_client();
        let topic = append_random_suffix("test-kafka-source--topic");
        create_topic(&admin_client, &topic, 3).await?;

        let source_loader = quickwit_supported_sources();
        {
            // Test Kafka source with empty topic.
            let metastore = metastore_for_test();
            let index_id = append_random_suffix("test-kafka-source--index");
            let (source_id, source_config) = get_source_config(&topic, "earliest");
            let index_uid = setup_index(metastore.clone(), &index_id, &source_config, &[]).await;
            let source_runtime = SourceRuntimeBuilder::new(index_uid, source_config)
                .with_metastore(metastore)
                .build();
            let source = source_loader.load_source(source_runtime).await?;
            let (doc_processor_mailbox, doc_processor_inbox) = universe.create_test_mailbox();
            let source_actor = SourceActor {
                source,
                doc_processor_mailbox: doc_processor_mailbox.clone(),
            };
            let (_source_mailbox, source_handle) = universe.spawn_builder().spawn(source_actor);
            let (exit_status, exit_state) = source_handle.join().await;
            assert!(exit_status.is_success());

            let messages: Vec<RawDocBatch> = doc_processor_inbox.drain_for_test_typed();
            assert!(messages.is_empty());

            let expected_state = json!({
                "index_id": index_id,
                "source_id": source_id,
                "topic":  topic,
                "assigned_partitions": vec![0, 1, 2],
                "current_positions": json!([]),
                "num_inactive_partitions": 3,
                "num_bytes_processed": 0,
                "num_messages_processed": 0,
                "num_invalid_messages": 0,
                "num_rebalances": 0,
            });
            assert_eq!(exit_state, expected_state);
        }
        for partition_id in 0..3 {
            populate_topic(
                &topic,
                3,
                &key_fn,
                &|message_id| {
                    if message_id == 1 {
                        "".to_string()
                    } else {
                        format!("Message #{:0>3}", partition_id * 100 + message_id)
                    }
                },
                Some(partition_id),
                None,
            )
            .await?;
        }
        {
            let metastore = metastore_for_test();
            let index_id = append_random_suffix("test-kafka-source--index");
            let (source_id, source_config) = get_source_config(&topic, "earliest");
            let index_uid = setup_index(metastore.clone(), &index_id, &source_config, &[]).await;
            let source_runtime = SourceRuntimeBuilder::new(index_uid, source_config)
                .with_metastore(metastore)
                .build();
            let (doc_processor_mailbox, doc_processor_inbox) = universe.create_test_mailbox();
            let source = source_loader.load_source(source_runtime).await?;
            let source_actor = SourceActor {
                source,
                doc_processor_mailbox: doc_processor_mailbox.clone(),
            };
            let (_source_mailbox, source_handle) = universe.spawn_builder().spawn(source_actor);
            let (exit_status, exit_state) = source_handle.join().await;
            assert!(exit_status.is_success());

            let messages: Vec<RawDocBatch> = doc_processor_inbox.drain_for_test_typed();
            assert!(!messages.is_empty());

            let batch = merge_doc_batches(messages)?;
            let expected_docs = vec![
                "Message #000",
                "Message #002",
                "Message #100",
                "Message #102",
                "Message #200",
                "Message #202",
            ];
            assert_eq!(batch.docs, expected_docs);

            let mut expected_checkpoint_delta = SourceCheckpointDelta::default();
            for partition in 0u64..3u64 {
                expected_checkpoint_delta.record_partition_delta(
                    PartitionId::from(partition),
                    Position::Beginning,
                    Position::offset(2u64),
                )?;
            }
            assert_eq!(batch.checkpoint_delta, expected_checkpoint_delta);

            let expected_state = json!({
                "index_id": index_id,
                "source_id": source_id,
                "topic":  topic,
                "assigned_partitions": vec![0, 1, 2],
                "current_positions":  vec![(0, "00000000000000000002"), (1, "00000000000000000002"), (2, "00000000000000000002")],
                "num_inactive_partitions": 3,
                "num_bytes_processed": 72,
                "num_messages_processed": 9,
                "num_invalid_messages": 3,
                "num_rebalances": 0,
            });
            assert_eq!(exit_state, expected_state);
        }
        {
            // Test Kafka source with `earliest` offset reset.
            let metastore = metastore_for_test();
            let index_id = append_random_suffix("test-kafka-source--index");
            let (source_id, source_config) = get_source_config(&topic, "earliest");
            let index_uid = setup_index(
                metastore.clone(),
                &index_id,
                &source_config,
                &[
                    (
                        PartitionId::from(0u64),
                        Position::Beginning,
                        Position::offset(0u64),
                    ),
                    (
                        PartitionId::from(1u64),
                        Position::Beginning,
                        Position::offset(2u64),
                    ),
                ],
            )
            .await;
            let source_runtime = SourceRuntimeBuilder::new(index_uid, source_config)
                .with_metastore(metastore)
                .build();
            let source = source_loader.load_source(source_runtime).await?;
            let (doc_processor_mailbox, doc_processor_inbox) = universe.create_test_mailbox();
            let source_actor = SourceActor {
                source,
                doc_processor_mailbox: doc_processor_mailbox.clone(),
            };
            let (_source_mailbox, source_handle) = universe.spawn_builder().spawn(source_actor);
            let (exit_status, exit_state) = source_handle.join().await;
            assert!(exit_status.is_success());

            let messages: Vec<RawDocBatch> = doc_processor_inbox.drain_for_test_typed();
            assert!(!messages.is_empty());

            let batch = merge_doc_batches(messages)?;
            let expected_docs = vec!["Message #002", "Message #200", "Message #202"];
            assert_eq!(batch.docs, expected_docs);

            let mut expected_checkpoint_delta = SourceCheckpointDelta::default();
            expected_checkpoint_delta.record_partition_delta(
                PartitionId::from(0u64),
                Position::offset(0u64),
                Position::offset(2u64),
            )?;
            expected_checkpoint_delta.record_partition_delta(
                PartitionId::from(2u64),
                Position::Beginning,
                Position::offset(2u64),
            )?;
            assert_eq!(batch.checkpoint_delta, expected_checkpoint_delta,);

            let expected_exit_state = json!({
                "index_id": index_id,
                "source_id": source_id,
                "topic":  topic,
                "assigned_partitions": vec![0, 1, 2],
                "current_positions":  vec![(0, "00000000000000000002"), (1, "00000000000000000002"), (2, "00000000000000000002")],
                "num_inactive_partitions": 3,
                "num_bytes_processed": 36,
                "num_messages_processed": 5,
                "num_invalid_messages": 2,
                "num_rebalances": 0,
            });
            assert_eq!(exit_state, expected_exit_state);
        }
        {
            // Test Kafka source with `latest` offset reset.
            let metastore = metastore_for_test();
            let index_id = append_random_suffix("test-kafka-source--index");
            let (source_id, source_config) = get_source_config(&topic, "latest");
            let index_uid = setup_index(metastore.clone(), &index_id, &source_config, &[]).await;
            let source_runtime = SourceRuntimeBuilder::new(index_uid, source_config)
                .with_metastore(metastore)
                .build();
            let source = source_loader.load_source(source_runtime).await?;
            let (doc_processor_mailbox, doc_processor_inbox) = universe.create_test_mailbox();
            let source_actor = SourceActor {
                source,
                doc_processor_mailbox: doc_processor_mailbox.clone(),
            };
            let (_source_mailbox, source_handle) = universe.spawn_builder().spawn(source_actor);
            let (exit_status, exit_state) = source_handle.join().await;
            assert!(exit_status.is_success());

            let messages: Vec<RawDocBatch> = doc_processor_inbox.drain_for_test_typed();
            assert!(messages.is_empty());

            let expected_state = json!({
                "index_id": index_id,
                "source_id": source_id,
                "topic":  topic,
                "assigned_partitions": vec![0, 1, 2],
                "current_positions": json!([]),
                "num_inactive_partitions": 3,
                "num_bytes_processed": 0,
                "num_messages_processed": 0,
                "num_invalid_messages": 0,
                "num_rebalances": 0,
            });
            assert_eq!(exit_state, expected_state);
        }
        Ok(())
    }

    #[tokio::test]
    async fn test_kafka_connectivity() {
        let bootstrap_servers = "localhost:9092".to_string();
        let topic = append_random_suffix("test-kafka-connectivity-topic");

        let admin_client = create_admin_client();
        create_topic(&admin_client, &topic, 1).await.unwrap();

        // Check valid connectivity
        check_connectivity(KafkaSourceParams {
            topic: topic.clone(),
            client_log_level: None,
            client_params: json!({ "bootstrap.servers": bootstrap_servers }),
            enable_backfill_mode: true,
        })
        .await
        .unwrap();

        // TODO: these tests should be checking the specific errors.
        // Non existent topic should throw an error.
        check_connectivity(KafkaSourceParams {
            topic: "non-existent-topic".to_string(),
            client_log_level: None,
            client_params: json!({ "bootstrap.servers": bootstrap_servers }),
            enable_backfill_mode: true,
        })
        .await
        .unwrap_err();

        // Invalid brokers should throw an error
        let _result = check_connectivity(KafkaSourceParams {
            topic: topic.clone(),
            client_log_level: None,
            client_params: json!({
                "bootstrap.servers": "192.0.2.10:9092"
            }),
            enable_backfill_mode: true,
        })
        .await
        .unwrap_err();
    }

    #[test]
    fn test_client_config_default_max_poll_interval() {
        // If the client config does not specify `max.poll.interval.ms`, then the default value
        // provided by the native config will be used.
        //
        // This unit test will warn us if the current default value of 5 minutes changes.
        let config = ClientConfig::new();
        let native_config = config.create_native_config().unwrap();
        let default_max_poll_interval_ms = native_config.get("max.poll.interval.ms").unwrap();
        assert_eq!(default_max_poll_interval_ms, "300000");
    }
}


================================================
FILE: quickwit/quickwit-indexing/src/source/kinesis/api.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use aws_sdk_kinesis::Client as KinesisClient;
use aws_sdk_kinesis::operation::get_records::GetRecordsOutput;
use aws_sdk_kinesis::types::{Shard, ShardIteratorType};
use quickwit_aws::retry::aws_retry;
use quickwit_common::retry::RetryParams;

/// Gets records from a Kinesis data stream's shard.
/// <https://docs.aws.amazon.com/kinesis/latest/APIReference/API_GetRecords.html>
pub(crate) async fn get_records(
    kinesis_client: &KinesisClient,
    retry_params: &RetryParams,
    shard_iterator: String,
) -> anyhow::Result<GetRecordsOutput> {
    // TODO: Return an error other than `anyhow::Error` so that expired shard iterators can be
    // handled properly.
    let response = aws_retry(retry_params, || async {
        kinesis_client
            .get_records()
            .shard_iterator(shard_iterator.clone())
            .send()
            .await
    })
    .await?;

    Ok(response)
}

/// Gets a Kinesis shard iterator. A shard iterator expires 5 minutes after it is returned
/// to the requester.
/// <https://docs.aws.amazon.com/kinesis/latest/APIReference/API_GetShardIterator.html>
///
/// The returned shard iterator points to the record positioned right after
/// `from_sequence_number_exclusive` if a value is provided. Otherwise, it points to the first
/// (oldest) record in the shard.
pub(crate) async fn get_shard_iterator(
    kinesis_client: &KinesisClient,
    retry_params: &RetryParams,
    stream_name: &str,
    shard_id: &str,
    from_sequence_number_exclusive: Option<String>,
) -> anyhow::Result<Option<String>> {
    let shard_iterator_type = if from_sequence_number_exclusive.is_some() {
        ShardIteratorType::AfterSequenceNumber
    } else {
        ShardIteratorType::TrimHorizon
    };

    let response = aws_retry(retry_params, || async {
        kinesis_client
            .get_shard_iterator()
            .stream_name(stream_name)
            .shard_id(shard_id.to_string())
            .shard_iterator_type(shard_iterator_type.clone())
            .set_starting_sequence_number(from_sequence_number_exclusive.clone())
            .send()
            .await
    })
    .await?;
    Ok(response.shard_iterator)
}

/// Lists the shards in a stream and provides information about each shard. This operation has a
/// limit of 1000 transactions per second per data stream.
/// <https://docs.aws.amazon.com/kinesis/latest/APIReference/API_ListShards.html>
pub(crate) async fn list_shards(
    kinesis_client: &KinesisClient,
    retry_params: &RetryParams,
    stream_name: &str,
    limit_per_request: Option<usize>,
) -> anyhow::Result<Vec<Shard>> {
    let mut shards = Vec::new();
    let mut next_token = None;

    loop {
        // `stream_name` and `next_token` cannot be set simultaneously.
        let stream_name = if next_token.is_none() {
            Some(stream_name.to_string())
        } else {
            None
        };
        let limit_per_request = limit_per_request.map(|limit| limit as i32);
        let response = aws_retry(retry_params, || async {
            kinesis_client
                .list_shards()
                .set_stream_name(stream_name.clone())
                .set_next_token(next_token.clone())
                .set_max_results(limit_per_request)
                .send()
                .await
        })
        .await?;

        if let Some(shrds) = response.shards {
            shards.extend_from_slice(&shrds);
        }
        if response.next_token.is_none() {
            return Ok(shards);
        }
        next_token = response.next_token;
    }
}

#[cfg(all(test, feature = "kinesis-localstack-tests"))]
pub(crate) mod tests {
    use std::collections::BTreeSet;
    use std::time::Duration;

    use anyhow::{Context, anyhow};
    use aws_sdk_kinesis::types::StreamDescription;

    use super::*;
    use crate::source::kinesis::helpers::tests::DEFAULT_RETRY_PARAMS;

    /// Creates a Kinesis data stream.
    /// https://docs.aws.amazon.com/kinesis/latest/APIReference/API_CreateStream.html
    pub(crate) async fn create_stream(
        kinesis_client: &KinesisClient,
        stream_name: &str,
        num_shards: usize,
    ) -> anyhow::Result<()> {
        aws_retry(&DEFAULT_RETRY_PARAMS, || async {
            kinesis_client
                .create_stream()
                .stream_name(stream_name)
                .shard_count(num_shards as i32)
                .send()
                .await
        })
        .await
        .with_context(|| format!("failed to create Kinesis data stream `{stream_name}`"))?;
        Ok(())
    }

    /// Deletes a Kinesis data stream. Only streams in `ACTIVE` state can be deleted.
    /// https://docs.aws.amazon.com/kinesis/latest/APIReference/API_DeleteStream.html
    pub(crate) async fn delete_stream(
        kinesis_client: &KinesisClient,
        stream_name: &str,
    ) -> anyhow::Result<()> {
        aws_retry(&DEFAULT_RETRY_PARAMS, || async {
            kinesis_client
                .delete_stream()
                .stream_name(stream_name.to_string())
                .send()
                .await
        })
        .await
        .with_context(|| format!("failed to delete Kinesis data stream `{stream_name}`"))?;
        Ok(())
    }

    /// Provides a summarized description of the specified Kinesis data stream without the shard
    /// list. https://docs.aws.amazon.com/kinesis/latest/APIReference/API_DescribeStreamSummary.html
    pub(crate) async fn describe_stream(
        kinesis_client: &KinesisClient,
        stream_name: &str,
    ) -> anyhow::Result<StreamDescription> {
        let response = aws_retry(&DEFAULT_RETRY_PARAMS, || async {
            kinesis_client
                .describe_stream()
                .stream_name(stream_name.to_string())
                .send()
                .await
        })
        .await?;

        response
            .stream_description
            .ok_or_else(|| anyhow!("no stream summary was returned from AWS"))
    }
    /// Lists the Kinesis data streams.
    /// https://docs.aws.amazon.com/kinesis/latest/APIReference/API_ListStreams.html
    pub(crate) async fn list_streams(
        kinesis_client: &KinesisClient,
        mut exclusive_start_stream_name: Option<String>,
        limit_per_request: Option<usize>,
    ) -> anyhow::Result<BTreeSet<String>> {
        let mut stream_names = BTreeSet::new();
        let mut has_more_streams = true;
        let limit_per_request = limit_per_request.map(|limit| limit as i32);
        while has_more_streams {
            let response = aws_retry(&DEFAULT_RETRY_PARAMS, || async {
                kinesis_client
                    .list_streams()
                    .set_exclusive_start_stream_name(exclusive_start_stream_name.clone())
                    .set_limit(limit_per_request)
                    .send()
                    .await
            })
            .await?;
            exclusive_start_stream_name = response.stream_names.last().cloned();
            has_more_streams = response.has_more_streams;
            stream_names.extend(response.stream_names);
        }
        Ok(stream_names)
    }

    /// Merges two adjacent shards in a Kinesis data stream and combines them into a single shard.
    /// https://docs.aws.amazon.com/kinesis/latest/APIReference/API_MergeShards.html
    #[cfg(test)]
    pub(crate) async fn merge_shards(
        kinesis_client: &KinesisClient,
        stream_name: &str,
        shard_id: &str,
        adjacent_shard_id: &str,
    ) -> anyhow::Result<()> {
        aws_retry(&DEFAULT_RETRY_PARAMS, || async {
            kinesis_client
                .merge_shards()
                .stream_name(stream_name)
                .shard_to_merge(shard_id)
                .adjacent_shard_to_merge(adjacent_shard_id)
                .send()
                .await
        })
        .await?;
        Ok(())
    }

    /// Splits a shard into two new shards in the Kinesis data stream.
    /// https://docs.aws.amazon.com/kinesis/latest/APIReference/API_SplitShard.html
    #[cfg(test)]
    pub(crate) async fn split_shard(
        kinesis_client: &KinesisClient,
        stream_name: &str,
        shard_id: &str,
        starting_hash_key: &str,
    ) -> anyhow::Result<()> {
        aws_retry(&DEFAULT_RETRY_PARAMS, || async {
            kinesis_client
                .split_shard()
                .stream_name(stream_name)
                .shard_to_split(shard_id)
                .new_starting_hash_key(starting_hash_key)
                .send()
                .await
        })
        .await?;
        Ok(())
    }

    /// Waits for a Kinesis data stream's status to satisfy the specified predicate. This is done
    /// through periodically polling the `[describe_stream]` API for the stream. Returns an error
    /// after the specified `timeout` duration has passed.
    #[cfg(test)]
    pub(crate) async fn wait_for_stream_status<P>(
        kinesis_client: &KinesisClient,
        stream_name: &str,
        stream_status_predicate: P,
        timeout: Duration,
    ) -> Result<anyhow::Result<()>, tokio::time::error::Elapsed>
    where
        P: Fn(aws_sdk_kinesis::types::StreamStatus) -> bool,
    {
        tokio::time::timeout(timeout, async {
            let period = Duration::from_millis(if cfg!(test) { 100 } else { 5000 });
            let mut interval = tokio::time::interval(period);
            loop {
                interval.tick().await;
                let stream_status = describe_stream(kinesis_client, stream_name)
                    .await?
                    .stream_status;

                if stream_status_predicate(stream_status) {
                    return Ok(());
                }
            }
        })
        .await
    }
}

#[cfg(all(test, feature = "kinesis-localstack-tests"))]
mod kinesis_localstack_tests {
    use std::time::Duration;

    use aws_sdk_kinesis::types::StreamStatus;
    use quickwit_common::rand::append_random_suffix;

    use super::*;
    use crate::source::kinesis::api::tests::{
        create_stream, delete_stream, describe_stream, list_streams, wait_for_stream_status,
    };
    use crate::source::kinesis::helpers::tests::{
        DEFAULT_RETRY_PARAMS, get_localstack_client, make_shard_id, put_records_into_shards, setup,
        teardown, wait_for_active_stream,
    };

    #[ignore]
    #[tokio::test]
    async fn test_create_stream() -> anyhow::Result<()> {
        let stream_name = append_random_suffix("test-create-stream");
        let kinesis_client = get_localstack_client().await?;
        create_stream(&kinesis_client, &stream_name, 1).await?;
        wait_for_active_stream(&kinesis_client, &stream_name).await??;
        let description_summary = describe_stream(&kinesis_client, &stream_name).await?;
        assert_eq!(description_summary.stream_name, stream_name);
        assert_eq!(description_summary.stream_status, StreamStatus::Active,);
        teardown(&kinesis_client, &stream_name).await;
        Ok(())
    }

    #[ignore]
    #[tokio::test]
    async fn test_delete_stream() -> anyhow::Result<()> {
        let (kinesis_client, stream_name) = setup("test-delete-stream", 1).await?;
        delete_stream(&kinesis_client, &stream_name).await?;
        let _ = wait_for_stream_status(
            &kinesis_client,
            &stream_name,
            |stream_status| stream_status != StreamStatus::Deleting,
            Duration::from_secs(1),
        )
        .await;
        assert!(
            !list_streams(&kinesis_client, None, None,)
                .await?
                .contains(&stream_name)
        );
        Ok(())
    }

    #[ignore]
    #[tokio::test]
    async fn test_get_records() -> anyhow::Result<()> {
        let (kinesis_client, stream_name) = setup("test-get-records", 2).await?;
        let _sequence_numbers = put_records_into_shards(
            &kinesis_client,
            &stream_name,
            [(0, "Record #00"), (0, "Record #01"), (1, "Record #10")],
        )
        .await?;
        let shard_id = make_shard_id(0);
        let shard_iterator = get_shard_iterator(
            &kinesis_client,
            &DEFAULT_RETRY_PARAMS,
            &stream_name,
            &shard_id,
            None,
        )
        .await?;

        let get_records_output = get_records(
            &kinesis_client,
            &DEFAULT_RETRY_PARAMS,
            shard_iterator.unwrap(),
        )
        .await?;

        let records = get_records_output.records;
        assert_eq!(records.len(), 2);
        assert_eq!(std::str::from_utf8(records[0].data.as_ref())?, "Record #00");
        assert_eq!(std::str::from_utf8(records[1].data.as_ref())?, "Record #01");
        teardown(&kinesis_client, &stream_name).await;
        Ok(())
    }

    // Ignoring this test because the localstack implementation of Kinesis is bogus.
    #[ignore]
    #[tokio::test]
    async fn test_get_shard_iterator() -> anyhow::Result<()> {
        let (kinesis_client, stream_name) = setup("test-get-shard-iterator", 2).await?;
        let sequence_numbers = put_records_into_shards(
            &kinesis_client,
            &stream_name,
            [(0, "Record #00"), (1, "Record #10")],
        )
        .await?;
        let shard_id = make_shard_id(0);
        {
            let shard_iterator = get_shard_iterator(
                &kinesis_client,
                &DEFAULT_RETRY_PARAMS,
                &stream_name,
                &shard_id,
                None,
            )
            .await?;
            assert!(shard_iterator.is_some());

            let get_records_output = get_records(
                &kinesis_client,
                &DEFAULT_RETRY_PARAMS,
                shard_iterator.unwrap(),
            )
            .await?;
            assert_eq!(get_records_output.records.len(), 1);
        }
        {
            let starting_sequence_number = sequence_numbers.get(&0).unwrap().first().cloned();
            let shard_iterator = get_shard_iterator(
                &kinesis_client,
                &DEFAULT_RETRY_PARAMS,
                &stream_name,
                &shard_id,
                starting_sequence_number,
            )
            .await?;
            assert!(shard_iterator.is_some());

            let get_records_output = get_records(
                &kinesis_client,
                &DEFAULT_RETRY_PARAMS,
                shard_iterator.unwrap(),
            )
            .await?;
            assert_eq!(get_records_output.records.len(), 0)
        }
        teardown(&kinesis_client, &stream_name).await;
        Ok(())
    }

    #[ignore]
    #[tokio::test]
    async fn test_list_shards() -> anyhow::Result<()> {
        let (kinesis_client, stream_name) = setup("test-list-shards", 2).await?;
        let shards = list_shards(
            &kinesis_client,
            &DEFAULT_RETRY_PARAMS,
            &stream_name,
            Some(1),
        )
        .await?;
        assert_eq!(shards.len(), 2);
        assert_eq!(shards[0].shard_id, make_shard_id(0));
        assert_eq!(shards[1].shard_id, make_shard_id(1));
        teardown(&kinesis_client, &stream_name).await;
        Ok(())
    }

    // Ignoring this test because the localstack implementation of Kinesis is bogus.
    #[ignore]
    #[tokio::test]
    async fn test_list_streams() -> anyhow::Result<()> {
        let kinesis_client = get_localstack_client().await?;
        let mut stream_names = Vec::new();

        for stream_name_suffix in ["foo", "bar"] {
            let (_kinesis_client, stream_name) =
                setup(format!("test-list-streams-{stream_name_suffix}"), 1).await?;
            stream_names.push(stream_name);
        }
        {
            let streams = list_streams(&kinesis_client, None, Some(1)).await?;
            assert!(streams.contains(&stream_names[0]));
            assert!(streams.contains(&stream_names[1]));
        }
        {
            let streams = list_streams(
                &kinesis_client,
                Some("test-list-streams-foo".to_string()),
                Some(1),
            )
            .await?;
            assert!(streams.contains(&stream_names[0]));
            assert!(!streams.contains(&stream_names[1]));
        }
        for stream_name in stream_names {
            teardown(&kinesis_client, &stream_name).await;
        }
        Ok(())
    }
}


================================================
FILE: quickwit/quickwit-indexing/src/source/kinesis/helpers.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use aws_sdk_kinesis::config::{Region, SharedAsyncSleep};
use aws_sdk_kinesis::{Client, Config};
use quickwit_aws::{DEFAULT_AWS_REGION, aws_behavior_version, get_aws_config};
use quickwit_config::RegionOrEndpoint;

pub async fn get_kinesis_client(region_or_endpoint: RegionOrEndpoint) -> anyhow::Result<Client> {
    let aws_config = get_aws_config().await;

    let mut kinesis_config = Config::builder().behavior_version(aws_behavior_version());
    kinesis_config.set_retry_config(aws_config.retry_config().cloned());
    kinesis_config.set_credentials_provider(aws_config.credentials_provider());
    kinesis_config.set_http_client(aws_config.http_client());
    kinesis_config.set_timeout_config(aws_config.timeout_config().cloned());
    if let Some(identity_cache) = aws_config.identity_cache() {
        kinesis_config.set_identity_cache(identity_cache);
    }
    kinesis_config.set_sleep_impl(Some(SharedAsyncSleep::new(
        quickwit_aws::TokioSleep::default(),
    )));

    match region_or_endpoint {
        RegionOrEndpoint::Region(region) => {
            kinesis_config = kinesis_config.region(Some(Region::new(region)));
        }
        RegionOrEndpoint::Endpoint(endpoint) => {
            kinesis_config = kinesis_config.endpoint_url(endpoint);
            kinesis_config = kinesis_config.region(Some(DEFAULT_AWS_REGION));
        }
    }

    Ok(Client::from_conf(kinesis_config.build()))
}

#[cfg(all(test, feature = "kinesis-localstack-tests"))]
pub(crate) mod tests {
    use std::collections::HashMap;
    use std::time::Duration;

    use anyhow::bail;
    use aws_sdk_kinesis::Client as KinesisClient;
    use aws_sdk_kinesis::primitives::Blob;
    use aws_sdk_kinesis::types::{PutRecordsRequestEntry, StreamStatus};
    use once_cell::sync::Lazy;
    use quickwit_common::rand::append_random_suffix;
    use quickwit_common::retry::RetryParams;
    use quickwit_config::RegionOrEndpoint;
    use tracing::error;

    use crate::source::kinesis::api::list_shards;
    use crate::source::kinesis::api::tests::{
        create_stream, delete_stream, wait_for_stream_status,
    };
    use crate::source::kinesis::helpers::get_kinesis_client;

    pub static DEFAULT_RETRY_PARAMS: Lazy<RetryParams> = Lazy::new(RetryParams::standard);

    pub async fn get_localstack_client() -> anyhow::Result<KinesisClient> {
        let endpoint = RegionOrEndpoint::Endpoint("http://localhost:4566".to_string());
        get_kinesis_client(endpoint).await
    }

    pub fn make_shard_id(id: usize) -> String {
        format!("shardId-{id:0>12}")
    }

    pub fn parse_shard_id<S: AsRef<str>>(shard_id: S) -> Option<usize> {
        shard_id
            .as_ref()
            .strip_prefix("shardId-")
            .and_then(|shard_id| shard_id.parse::<usize>().ok())
    }

    pub async fn put_records_into_shards<I>(
        kinesis_client: &aws_sdk_kinesis::Client,
        stream_name: &str,
        records: I,
    ) -> anyhow::Result<HashMap<usize, Vec<String>>>
    where
        I: IntoIterator<Item = (usize, &'static str)>,
    {
        let shard_hash_keys: HashMap<usize, String> =
            list_shards(kinesis_client, &DEFAULT_RETRY_PARAMS, stream_name, None)
                .await?
                .into_iter()
                .flat_map(|shard| {
                    let starting_hash_key = shard.hash_key_range?.starting_hash_key;
                    parse_shard_id(shard.shard_id).map(|shard_id| (shard_id, starting_hash_key))
                })
                .collect();

        let put_records_request_entries = records
            .into_iter()
            .map(|(shard_id, record)| {
                PutRecordsRequestEntry::builder()
                    .set_explicit_hash_key(shard_hash_keys.get(&shard_id).cloned())
                    .partition_key("Overridden by hash key".to_string())
                    .data(Blob::new(record.as_bytes()))
                    .build()
            })
            .collect::<Result<Vec<_>, _>>()?;

        let response = kinesis_client
            .put_records()
            .stream_name(stream_name.to_string())
            .set_records(Some(put_records_request_entries))
            .send()
            .await?;

        let mut sequence_numbers = HashMap::new();
        for record in response.records {
            if let Some(sequence_number) = record.sequence_number {
                sequence_numbers
                    .entry(record.shard_id.and_then(parse_shard_id).unwrap())
                    .or_insert_with(Vec::new)
                    .push(sequence_number);
            } else {
                bail!("sequence number is missing from record");
            }
        }
        Ok(sequence_numbers)
    }

    pub async fn setup<S: AsRef<str>>(
        test_name: S,
        num_shards: usize,
    ) -> anyhow::Result<(aws_sdk_kinesis::Client, String)> {
        let stream_name = append_random_suffix(test_name.as_ref());
        let kinesis_client = get_localstack_client().await?;
        create_stream(&kinesis_client, &stream_name, num_shards).await?;
        wait_for_active_stream(&kinesis_client, &stream_name).await??;
        Ok((kinesis_client, stream_name))
    }

    pub async fn teardown(kinesis_client: &aws_sdk_kinesis::Client, stream_name: &str) {
        if let Err(error) = delete_stream(kinesis_client, stream_name).await {
            error!(stream_name = %stream_name, error = ?error, "Failed to delete stream.")
        }
    }

    pub async fn wait_for_active_stream(
        kinesis_client: &aws_sdk_kinesis::Client,
        stream_name: &str,
    ) -> Result<anyhow::Result<()>, tokio::time::error::Elapsed> {
        wait_for_stream_status(
            kinesis_client,
            stream_name,
            |stream_status| stream_status == StreamStatus::Active,
            Duration::from_secs(30),
        )
        .await
    }
}


================================================
FILE: quickwit/quickwit-indexing/src/source/kinesis/kinesis_source.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::HashMap;
use std::fmt;
use std::time::Duration;

use anyhow::{Context, bail};
use async_trait::async_trait;
use aws_sdk_kinesis::Client as KinesisClient;
use bytes::Bytes;
use itertools::Itertools;
use quickwit_actors::{ActorExitStatus, Mailbox};
use quickwit_aws::get_aws_config;
use quickwit_common::retry::RetryParams;
use quickwit_config::{KinesisSourceParams, RegionOrEndpoint};
use quickwit_metastore::checkpoint::{PartitionId, SourceCheckpoint};
use quickwit_proto::metastore::SourceType;
use quickwit_proto::types::Position;
use serde_json::{Value as JsonValue, json};
use tokio::sync::mpsc;
use tokio::time;
use tracing::{info, warn};

use super::api::list_shards;
use super::shard_consumer::{ShardConsumer, ShardConsumerHandle, ShardConsumerMessage};
use crate::actors::DocProcessor;
use crate::source::kinesis::helpers::get_kinesis_client;
use crate::source::{
    BATCH_NUM_BYTES_LIMIT, BatchBuilder, EMIT_BATCHES_TIMEOUT, Source, SourceContext,
    SourceRuntime, TypedSourceFactory,
};

type ShardId = String;

/// Factory for instantiating a `KafkaSource`.
pub struct KinesisSourceFactory;

#[async_trait]
impl TypedSourceFactory for KinesisSourceFactory {
    type Source = KinesisSource;
    type Params = KinesisSourceParams;

    async fn typed_create_source(
        source_runtime: SourceRuntime,
        source_params: KinesisSourceParams,
    ) -> anyhow::Result<Self::Source> {
        KinesisSource::try_new(source_runtime, source_params).await
    }
}

struct ShardConsumerState {
    partition_id: PartitionId,
    current_position: Position,
    lag_millis: Option<i64>,
    _shard_consumer_handle: ShardConsumerHandle,
}

#[derive(Default)]
pub struct KinesisSourceState {
    /// Pool of [`ShardConsumer`] managed by the source.
    shard_consumers: HashMap<ShardId, ShardConsumerState>,
    /// Number of bytes processed by the source.
    pub num_bytes_processed: u64,
    /// Number of records processed by the source (including invalid messages).
    pub num_records_processed: u64,
    // Number of invalid records, i.e., that were empty or could not be parsed.
    pub num_invalid_records: u64,
}

pub struct KinesisSource {
    // Runtime arguments.
    source_runtime: SourceRuntime,
    // Target stream to consume.
    stream_name: String,
    kinesis_client: KinesisClient,
    // Retry parameters (max attempts, max delay, ...).
    retry_params: RetryParams,
    // Sender for the communication channel between the source and the shard consumers.
    shard_consumers_tx: mpsc::Sender<ShardConsumerMessage>,
    // Receiver for the communication channel between the source and the shard consumers.
    shard_consumers_rx: mpsc::Receiver<ShardConsumerMessage>,
    state: KinesisSourceState,
    backfill_mode_enabled: bool,
}

impl fmt::Debug for KinesisSource {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        f.debug_struct("KinesisSource")
            .field("index_uid", self.source_runtime.index_uid())
            .field("source_id", &self.source_runtime.source_id())
            .field("stream_Name", &self.stream_name)
            .finish()
    }
}

impl KinesisSource {
    /// Instantiates a new `KinesisSource`.
    pub async fn try_new(
        source_runtime: SourceRuntime,
        source_params: KinesisSourceParams,
    ) -> anyhow::Result<Self> {
        let stream_name = source_params.stream_name;
        let backfill_mode_enabled = source_params.enable_backfill_mode;
        let region = get_region(source_params.region_or_endpoint).await?;
        let kinesis_client = get_kinesis_client(region).await?;
        let (shard_consumers_tx, shard_consumers_rx) = mpsc::channel(1_000);
        let state = KinesisSourceState::default();
        let retry_params = RetryParams::aggressive();
        let kinesis_source = KinesisSource {
            source_runtime,
            stream_name,
            kinesis_client,
            shard_consumers_tx,
            shard_consumers_rx,
            state,
            backfill_mode_enabled,
            retry_params,
        };
        Ok(kinesis_source)
    }

    fn spawn_shard_consumer(
        &mut self,
        ctx: &SourceContext,
        shard_id: ShardId,
        checkpoint: &SourceCheckpoint,
    ) {
        if self.state.shard_consumers.contains_key(&shard_id) {
            info!(
                stream_name = %self.stream_name,
                shard_id = %shard_id,
                "Shard consumer already exists, skipping creation."
            );
            return;
        }

        let partition_id = PartitionId::from(shard_id.as_str());
        let from_position = checkpoint
            .position_for_partition(&partition_id)
            .cloned()
            .unwrap_or(Position::Beginning);
        let from_sequence_number_exclusive = match &from_position {
            Position::Beginning => None,
            Position::Offset(offset) => Some(offset.to_string()),
            Position::Eof(_) => panic!("position of a Kinesis shard should never be EOF"),
        };
        info!(
            stream_name = %self.stream_name,
            shard_id = %shard_id,
            start_position = ?from_position,
            "Spawning new shard consumer"
        );
        let shard_consumer = ShardConsumer::new(
            self.stream_name.clone(),
            shard_id.clone(),
            from_sequence_number_exclusive,
            self.backfill_mode_enabled,
            self.kinesis_client.clone(),
            self.shard_consumers_tx.clone(),
            self.retry_params,
        );
        let _shard_consumer_handle = shard_consumer.spawn(ctx);
        let shard_consumer_state = ShardConsumerState {
            partition_id,
            current_position: from_position,
            lag_millis: None,
            _shard_consumer_handle,
        };
        self.state
            .shard_consumers
            .insert(shard_id, shard_consumer_state);
    }
}

#[async_trait]
impl Source for KinesisSource {
    async fn initialize(
        &mut self,
        _doc_processor_mailbox: &Mailbox<DocProcessor>,
        ctx: &SourceContext,
    ) -> Result<(), ActorExitStatus> {
        let shards = ctx
            .protect_future(list_shards(
                &self.kinesis_client,
                &self.retry_params,
                &self.stream_name,
                None,
            ))
            .await?;
        let checkpoint = self
            .source_runtime
            .fetch_checkpoint()
            .await
            .context("failed to fetch checkpoint")?;

        for shard in shards {
            self.spawn_shard_consumer(ctx, shard.shard_id, &checkpoint);
        }
        info!(
            stream_name = %self.stream_name,
            assigned_shards = %self.state.shard_consumers.keys().sorted().join(", "),
            "Starting Kinesis source."
        );
        Ok(())
    }

    async fn emit_batches(
        &mut self,
        indexer_mailbox: &Mailbox<DocProcessor>,
        ctx: &SourceContext,
    ) -> Result<Duration, ActorExitStatus> {
        let mut batch_builder = BatchBuilder::new(SourceType::Kinesis);
        let deadline = time::sleep(*EMIT_BATCHES_TIMEOUT);
        tokio::pin!(deadline);

        loop {
            tokio::select! {
                message_opt = self.shard_consumers_rx.recv() => {
                    // The source always carries a sender for this channel.
                    match message_opt.expect("Channel unexpectedly closed.") {
                        ShardConsumerMessage::ChildShards(shard_ids) => {
                            let checkpoint = self.source_runtime.fetch_checkpoint().await.context("failed to fetch checkpoint")?;

                            for shard_id in shard_ids {
                                self.spawn_shard_consumer(ctx, shard_id, &checkpoint);
                            }
                        }
                        ShardConsumerMessage::Records { shard_id, records, lag_millis } => {
                            let num_records = records.len();

                            for (i, record) in records.into_iter().enumerate() {
                                let record_data = record.data.into_inner();

                                if record_data.is_empty() {
                                    warn!(
                                        stream_name=%self.stream_name,
                                        shard_id=%shard_id,
                                        sequence_number=%record.sequence_number,
                                        "record is empty"
                                    );
                                    self.state.num_invalid_records += 1;
                                    continue;
                                }
                                batch_builder.add_doc(Bytes::from(record_data));

                                if i == num_records - 1 {
                                    let shard_consumer_state = self
                                        .state
                                        .shard_consumers
                                        .get_mut(&shard_id)
                                        .ok_or_else(|| {
                                            anyhow::anyhow!(
                                                "received record from unassigned shard `{}`", shard_id,
                                            )
                                        })?;
                                    shard_consumer_state.lag_millis = lag_millis;

                                    let partition_id = shard_consumer_state.partition_id.clone();
                                    let current_position = Position::from(record.sequence_number);
                                    let previous_position = std::mem::replace(&mut shard_consumer_state.current_position, current_position.clone());

                                    batch_builder.checkpoint_delta.record_partition_delta(
                                        partition_id,
                                        previous_position,
                                        current_position,
                                    ).context("failed to record partition delta")?;
                                }
                            }
                            if batch_builder.num_bytes >= BATCH_NUM_BYTES_LIMIT {
                                break;
                            }
                        }
                        ShardConsumerMessage::ShardClosed(shard_id) => {
                            info!(
                                stream_name = %self.stream_name,
                                shard_id = %shard_id,
                                num_active_shards = %self.state.shard_consumers.len(),
                                "Shard is closed."
                            );
                            self.state.shard_consumers.remove(&shard_id);

                        }
                        ShardConsumerMessage::ShardEOF(shard_id) => {
                            info!(
                                stream_name = %self.stream_name,
                                shard_id = %shard_id,
                                num_active_shards = %self.state.shard_consumers.len(),
                                "Reached end of shard."
                            );
                            self.state.shard_consumers.remove(&shard_id);
                        }
                    }
                    ctx.record_progress();
                }
                _ = &mut deadline => {
                    break;
                }
            }
        }
        self.state.num_bytes_processed += batch_builder.num_bytes;
        self.state.num_records_processed += batch_builder.docs.len() as u64;

        if !batch_builder.checkpoint_delta.is_empty() {
            ctx.send_message(indexer_mailbox, batch_builder.build())
                .await?;
        }
        if self.state.shard_consumers.is_empty() {
            info!(stream_name = %self.stream_name, "reached end of stream");
            ctx.send_exit_with_success(indexer_mailbox).await?;
            return Err(ActorExitStatus::Success);
        }
        Ok(Duration::default())
    }

    fn name(&self) -> String {
        format!("{self:?}")
    }

    fn observable_state(&self) -> JsonValue {
        let shard_consumer_positions: Vec<(&ShardId, &Position)> = self
            .state
            .shard_consumers
            .iter()
            .map(|(shard_id, shard_consumer_state)| {
                (shard_id, &shard_consumer_state.current_position)
            })
            .sorted()
            .collect();
        json!({
            "stream_name": self.stream_name,
            "shard_consumer_positions": shard_consumer_positions,
            "num_bytes_processed": self.state.num_bytes_processed,
            "num_records_processed": self.state.num_records_processed,
            "num_invalid_records": self.state.num_invalid_records,
        })
    }
}

pub(super) async fn get_region(
    region_or_endpoint_opt: Option<RegionOrEndpoint>,
) -> anyhow::Result<RegionOrEndpoint> {
    if let Some(region_or_endpoint) = region_or_endpoint_opt {
        return Ok(region_or_endpoint);
    }
    //< We fallback to AWS region if `region_or_endpoint` is `None`
    let sdk_config = get_aws_config().await;

    if let Some(region) = sdk_config.region() {
        return Ok(RegionOrEndpoint::Region(region.to_string()));
    }
    if let Some(endpoint) = sdk_config.endpoint_url() {
        return Ok(RegionOrEndpoint::Endpoint(endpoint.to_string()));
    }
    bail!("unable to sniff region from environment")
}

#[cfg(all(test, feature = "kinesis-localstack-tests"))]
mod tests {

    use quickwit_actors::Universe;
    use quickwit_config::{SourceConfig, SourceParams};
    use quickwit_metastore::checkpoint::SourceCheckpointDelta;
    use quickwit_proto::types::IndexUid;

    use super::*;
    use crate::models::RawDocBatch;
    use crate::source::SourceActor;
    use crate::source::kinesis::helpers::tests::{
        make_shard_id, put_records_into_shards, setup, teardown,
    };
    use crate::source::tests::SourceRuntimeBuilder;

    // Sequence number
    type SeqNo = String;

    fn merge_doc_batches(batches: Vec<RawDocBatch>) -> anyhow::Result<RawDocBatch> {
        let mut merged_batch = RawDocBatch::default();
        for batch in batches {
            merged_batch.docs.extend(batch.docs);
            merged_batch
                .checkpoint_delta
                .extend(batch.checkpoint_delta)?;
        }
        merged_batch.docs.sort();
        Ok(merged_batch)
    }

    #[ignore]
    #[tokio::test]
    async fn test_kinesis_source_handles_resharding_with_split() {
        use crate::source::kinesis::api::tests::split_shard;
        use crate::source::kinesis::helpers::tests::wait_for_active_stream;

        let universe = Universe::with_accelerated_time();
        let (doc_processor_mailbox, _doc_processor_inbox) = universe.create_test_mailbox();
        let (kinesis_client, stream_name) = setup("test-resharding-split", 1).await.unwrap();
        let index_id = "test-kinesis-resharding-index";
        let index_uid = IndexUid::new_with_random_ulid(index_id);

        // Split the shard (1 -> 2 shards)
        let shard_id_0 = make_shard_id(0);
        split_shard(
            &kinesis_client,
            &stream_name,
            &shard_id_0,
            "85070591730234615865843651857942052864",
        )
        .await
        .unwrap();

        // Wait for stream to be active after split
        let _ = wait_for_active_stream(&kinesis_client, &stream_name)
            .await
            .unwrap();

        // Initialize source after split
        let kinesis_params = KinesisSourceParams {
            stream_name: stream_name.clone(),
            region_or_endpoint: Some(RegionOrEndpoint::Endpoint(
                "http://localhost:4566".to_string(),
            )),
            enable_backfill_mode: true,
        };
        let source_params = SourceParams::Kinesis(kinesis_params.clone());
        let source_config = SourceConfig::for_test("test-kinesis-resharding", source_params);
        let source_runtime = SourceRuntimeBuilder::new(index_uid, source_config).build();

        let kinesis_source = KinesisSource::try_new(source_runtime, kinesis_params)
            .await
            .unwrap();

        let actor = SourceActor {
            source: Box::new(kinesis_source),
            doc_processor_mailbox: doc_processor_mailbox.clone(),
        };
        let (_mailbox, handle) = universe.spawn_builder().spawn(actor);
        let (exit_status, _exit_state) = handle.join().await;
        assert!(exit_status.is_success());

        teardown(&kinesis_client, &stream_name).await;
    }

    #[ignore]
    #[tokio::test]
    async fn test_kinesis_source() {
        let universe = Universe::with_accelerated_time();
        let (doc_processor_mailbox, doc_processor_inbox) = universe.create_test_mailbox();
        let (kinesis_client, stream_name) = setup("test-kinesis-source", 3).await.unwrap();
        let index_id = "test-kinesis-index";
        let index_uid = IndexUid::new_with_random_ulid(index_id);
        let kinesis_params = KinesisSourceParams {
            stream_name: stream_name.clone(),
            region_or_endpoint: Some(RegionOrEndpoint::Endpoint(
                "http://localhost:4566".to_string(),
            )),
            enable_backfill_mode: true,
        };
        let source_params = SourceParams::Kinesis(kinesis_params.clone());
        let source_config = SourceConfig::for_test("test-kinesis-source", source_params);
        let source_runtime = SourceRuntimeBuilder::new(index_uid, source_config).build();
        {
            let kinesis_source =
                KinesisSource::try_new(source_runtime.clone(), kinesis_params.clone())
                    .await
                    .unwrap();
            let actor = SourceActor {
                source: Box::new(kinesis_source),
                doc_processor_mailbox: doc_processor_mailbox.clone(),
            };
            let (_mailbox, handle) = universe.spawn_builder().spawn(actor);
            let (exit_status, exit_state) = handle.join().await;
            assert!(exit_status.is_success());

            let next_message = doc_processor_inbox
                .drain_for_test()
                .into_iter()
                .flat_map(|box_any| box_any.downcast::<RawDocBatch>().ok())
                .map(|box_raw_doc_batch| *box_raw_doc_batch)
                .next();
            assert!(next_message.is_none());

            let expected_shard_consumer_positions: Vec<(ShardId, SeqNo)> = Vec::new();
            let expected_state = json!({
                "stream_name":  stream_name,
                "shard_consumer_positions": expected_shard_consumer_positions,
                "num_bytes_processed": 0,
                "num_records_processed": 0,
                "num_invalid_records": 0,
            });
            assert_eq!(exit_state, expected_state);
        }
        let sequence_numbers = put_records_into_shards(
            &kinesis_client,
            &stream_name,
            [
                (0, "Record #00"),
                (0, "Record #01"),
                (1, "Record #10"),
                (1, "Record #11"),
                (2, "Record #20"),
                (2, "Record #21"),
            ],
        )
        .await
        .unwrap();
        let shard_sequence_numbers: HashMap<usize, SeqNo> = sequence_numbers
            .iter()
            .map(|(shard_id, records)| (*shard_id, records.last().unwrap().clone()))
            .collect();
        let shard_positions: HashMap<usize, Position> = shard_sequence_numbers
            .iter()
            .map(|(shard_id, seqno)| (*shard_id, Position::from(seqno.clone())))
            .collect();
        {
            let kinesis_source =
                KinesisSource::try_new(source_runtime.clone(), kinesis_params.clone())
                    .await
                    .unwrap();
            let actor = SourceActor {
                source: Box::new(kinesis_source),
                doc_processor_mailbox: doc_processor_mailbox.clone(),
            };
            let (_mailbox, handle) = universe.spawn_builder().spawn(actor);
            let (exit_status, exit_state) = handle.join().await;
            assert!(exit_status.is_success());

            let messages: Vec<RawDocBatch> = doc_processor_inbox
                .drain_for_test()
                .into_iter()
                .flat_map(|box_any| box_any.downcast::<RawDocBatch>().ok())
                .map(|box_raw_doc_batch| *box_raw_doc_batch)
                .collect();
            assert!(!messages.is_empty());

            let batch = merge_doc_batches(messages).unwrap();
            let expected_docs = vec![
                "Record #00",
                "Record #01",
                "Record #10",
                "Record #11",
                "Record #20",
                "Record #21",
            ];
            assert_eq!(batch.docs, expected_docs);

            let mut expected_checkpoint_delta = SourceCheckpointDelta::default();
            for shard_id in 0..3 {
                expected_checkpoint_delta
                    .record_partition_delta(
                        PartitionId::from(make_shard_id(shard_id)),
                        Position::Beginning,
                        shard_positions.get(&shard_id).unwrap().clone(),
                    )
                    .unwrap();
            }
            assert_eq!(batch.checkpoint_delta, expected_checkpoint_delta);

            let expected_shard_consumer_positions: Vec<(ShardId, SeqNo)> = Vec::new();
            let expected_state = json!({
                "stream_name":  stream_name,
                "shard_consumer_positions": expected_shard_consumer_positions,
                "num_bytes_processed": 60,
                "num_records_processed": 6,
                "num_invalid_records": 0,
            });
            assert_eq!(exit_state, expected_state);
        }
        {
            let from_sequence_number_exclusive_shard_1 =
                sequence_numbers.get(&1).unwrap().first().unwrap().clone();
            let from_sequence_number_exclusive_shard_2 =
                sequence_numbers.get(&2).unwrap().last().unwrap().clone();
            let _checkpoint: SourceCheckpoint = vec![
                (
                    make_shard_id(1),
                    from_sequence_number_exclusive_shard_1.clone(),
                ),
                (
                    make_shard_id(2),
                    from_sequence_number_exclusive_shard_2.clone(),
                ),
            ]
            .into_iter()
            .map(|(partition_id, offset)| (PartitionId::from(partition_id), Position::from(offset)))
            .collect();
            let kinesis_source = KinesisSource::try_new(source_runtime, kinesis_params)
                .await
                .unwrap();
            let actor = SourceActor {
                source: Box::new(kinesis_source),
                doc_processor_mailbox: doc_processor_mailbox.clone(),
            };
            let (_mailbox, handle) = universe.spawn_builder().spawn(actor);
            let (exit_status, exit_state) = handle.join().await;
            assert!(exit_status.is_success());

            let messages: Vec<RawDocBatch> = doc_processor_inbox
                .drain_for_test()
                .into_iter()
                .flat_map(|box_any| box_any.downcast::<RawDocBatch>().ok())
                .map(|box_raw_doc_batch| *box_raw_doc_batch)
                .collect();
            assert!(!messages.is_empty());

            let batch = merge_doc_batches(messages).unwrap();
            let expected_docs = vec!["Record #00", "Record #01", "Record #11"];
            assert_eq!(batch.docs, expected_docs);

            let mut expected_checkpoint_delta = SourceCheckpointDelta::default();
            for (shard_id, from_position) in [
                Position::Beginning,
                Position::from(from_sequence_number_exclusive_shard_1),
            ]
            .into_iter()
            .enumerate()
            {
                expected_checkpoint_delta
                    .record_partition_delta(
                        PartitionId::from(make_shard_id(shard_id)),
                        from_position,
                        shard_positions.get(&shard_id).unwrap().clone(),
                    )
                    .unwrap();
            }
            assert_eq!(batch.checkpoint_delta, expected_checkpoint_delta);

            let expected_shard_consumer_positions: Vec<(ShardId, SeqNo)> = Vec::new();
            let expected_state = json!({
                "stream_name":  stream_name,
                "shard_consumer_positions": expected_shard_consumer_positions,
                "num_bytes_processed": 30,
                "num_records_processed": 3,
                "num_invalid_records": 0,
            });
            assert_eq!(exit_state, expected_state);
        }
        teardown(&kinesis_client, &stream_name).await;
    }
}


================================================
FILE: quickwit/quickwit-indexing/src/source/kinesis/mod.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

mod api;
mod helpers;
pub mod kinesis_source;
mod shard_consumer;

use quickwit_common::retry::RetryParams;
use quickwit_config::KinesisSourceParams;

use crate::source::kinesis::api::{get_records, get_shard_iterator, list_shards};
use crate::source::kinesis::helpers::get_kinesis_client;
use crate::source::kinesis::kinesis_source::get_region;

/// Checks whether we can establish a connection to the Kinesis service and read some records.
pub(super) async fn check_connectivity(params: KinesisSourceParams) -> anyhow::Result<()> {
    let region = get_region(params.region_or_endpoint).await?;
    let kinesis_client = get_kinesis_client(region).await?;
    let retry_params = RetryParams::standard();
    let shards = list_shards(&kinesis_client, &retry_params, &params.stream_name, Some(1)).await?;

    if let Some(shard_id) = shards.first().map(|s| s.shard_id()) {
        let shard_iterator_opt = get_shard_iterator(
            &kinesis_client,
            &retry_params,
            &params.stream_name,
            shard_id,
            None,
        )
        .await?;

        if let Some(shard_iterator) = shard_iterator_opt {
            get_records(&kinesis_client, &retry_params, shard_iterator).await?;
        }
    }
    Ok(())
}


================================================
FILE: quickwit/quickwit-indexing/src/source/kinesis/shard_consumer.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::fmt;
use std::time::Duration;

use async_trait::async_trait;
use aws_sdk_kinesis::types::Record;
use quickwit_actors::{Actor, ActorContext, ActorExitStatus, ActorHandle, Handler, Mailbox};
use quickwit_common::retry::RetryParams;
use serde_json::{Value as JsonValue, json};
use tokio::sync::mpsc;

use crate::source::SourceContext;
use crate::source::kinesis::api::{get_records, get_shard_iterator};

#[derive(Debug)]
pub(super) enum ShardConsumerMessage {
    /// The shard was the subject of a merge or a split and points to one (merge) or two (split)
    /// children.
    ChildShards(Vec<String>),
    Records {
        shard_id: String,
        records: Vec<Record>,
        lag_millis: Option<i64>,
    },
    /// The shard is closed after a merge or a split. There are no new records available.
    ShardClosed(String),
    /// The consumer has reached the latest record in the shard and stops if
    /// `shutdown_at_shard_eof` is set to true.
    ShardEOF(String),
}

#[derive(Default)]
pub(super) struct ShardConsumerState {
    /// The sequence number of the last record processed.
    current_sequence_number: Option<String>,
    /// The number of milliseconds the last `GetRecords` response is from the tip of the stream.
    lag_millis: Option<i64>,
    /// Number of bytes processed by the consumer.
    num_bytes_processed: u64,
    /// Number of records processed by the consumer.
    num_records_processed: u64,
    /// The shard iterator value that will be used for the next call to `GetRecords`.
    next_shard_iterator: Option<String>,
}

pub(super) struct ShardConsumer {
    stream_name: String,
    shard_id: String,
    /// Sequence number of the last record processed. Consumption of the shard is resumed right
    /// after this sequence number.
    from_sequence_number_exclusive: Option<String>,
    /// When this value is set to true, the consumer shuts down after reaching the last (most
    /// recent) record in the shard.
    shutdown_at_shard_eof: bool,
    state: ShardConsumerState,
    kinesis_client: aws_sdk_kinesis::Client,
    sink: mpsc::Sender<ShardConsumerMessage>,
    retry_params: RetryParams,
}

impl fmt::Debug for ShardConsumer {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        write!(
            f,
            "KinesisShardConsumer {{ stream_name: {}, shard_id: {} }}",
            self.stream_name, self.shard_id
        )
    }
}

impl ShardConsumer {
    pub fn new(
        stream_name: String,
        shard_id: String,
        from_sequence_number_exclusive: Option<String>,
        shutdown_at_shard_eof: bool,
        kinesis_client: aws_sdk_kinesis::Client,
        sink: mpsc::Sender<ShardConsumerMessage>,
        retry_params: RetryParams,
    ) -> Self {
        Self {
            stream_name,
            shard_id,
            from_sequence_number_exclusive,
            state: Default::default(),
            shutdown_at_shard_eof,
            kinesis_client,
            sink,
            retry_params,
        }
    }

    pub fn spawn(self, ctx: &SourceContext) -> ShardConsumerHandle {
        let (_mailbox, _actor_handle) = ctx.spawn_actor().spawn(self);
        ShardConsumerHandle {
            _mailbox,
            _actor_handle,
        }
    }

    async fn send_message(
        &self,
        ctx: &ActorContext<Self>,
        message: ShardConsumerMessage,
    ) -> anyhow::Result<()> {
        let _guard = ctx.protect_zone();
        self.sink.send(message).await?;
        Ok(())
    }
}

pub(super) struct ShardConsumerHandle {
    _mailbox: Mailbox<ShardConsumer>,
    _actor_handle: ActorHandle<ShardConsumer>,
}

#[derive(Debug)]
pub(super) struct Loop;

#[async_trait]
impl Actor for ShardConsumer {
    type ObservableState = JsonValue;

    fn name(&self) -> String {
        "KinesisShardConsumer".to_string()
    }

    async fn initialize(&mut self, ctx: &ActorContext<Self>) -> Result<(), ActorExitStatus> {
        self.state.next_shard_iterator = ctx
            .protect_future(get_shard_iterator(
                &self.kinesis_client,
                &self.retry_params,
                &self.stream_name,
                &self.shard_id,
                self.from_sequence_number_exclusive.clone(),
            ))
            .await?;
        ctx.send_self_message(Loop).await?;
        Ok(())
    }

    fn yield_after_each_message(&self) -> bool {
        false
    }

    fn observable_state(&self) -> Self::ObservableState {
        json!({
            "stream_name": self.stream_name,
            "shard_id": self.shard_id,
            "current_sequence_number": self.state.current_sequence_number,
            "lag_millis": self.state.lag_millis,
            "num_bytes_processed": self.state.num_bytes_processed,
            "num_records_processed": self.state.num_records_processed,
        })
    }
}

#[async_trait]
impl Handler<Loop> for ShardConsumer {
    type Reply = ();

    async fn handle(
        &mut self,
        _message: Loop,
        ctx: &ActorContext<Self>,
    ) -> Result<(), ActorExitStatus> {
        if let Some(shard_iterator) = self.state.next_shard_iterator.take() {
            let response = ctx
                .protect_future(get_records(
                    &self.kinesis_client,
                    &self.retry_params,
                    shard_iterator,
                ))
                .await?;
            self.state.lag_millis = response.millis_behind_latest;
            self.state.next_shard_iterator = response.next_shard_iterator;

            if !response.records.is_empty() {
                self.state.current_sequence_number = response
                    .records
                    .last()
                    .map(|record| record.sequence_number.clone());
                self.state.num_bytes_processed += response
                    .records
                    .iter()
                    .map(|record| record.data().as_ref().len() as u64)
                    .sum::<u64>();
                self.state.num_records_processed += response.records.len() as u64;

                let message = ShardConsumerMessage::Records {
                    shard_id: self.shard_id.clone(),
                    records: response.records,
                    lag_millis: response.millis_behind_latest,
                };
                self.send_message(ctx, message).await?;
            }
            if let Some(children) = response.child_shards {
                let shard_ids: Vec<String> = children
                    .into_iter()
                    // Filter out duplicate message when two shards are merged.
                    .filter(|child| child.parent_shards().first() == Some(&self.shard_id))
                    .map(|child| child.shard_id)
                    .collect();
                if !shard_ids.is_empty() {
                    let message = ShardConsumerMessage::ChildShards(shard_ids);
                    self.send_message(ctx, message).await?;
                }
            }
            if self.shutdown_at_shard_eof && response.millis_behind_latest == Some(0) {
                let message = ShardConsumerMessage::ShardEOF(self.shard_id.clone());
                self.send_message(ctx, message).await?;
                return Err(ActorExitStatus::Success);
            };
            // The `GetRecords` API has a limit of 5 transactions per second. 1s / 5 + ε = 210ms.
            let interval = Duration::from_millis(210);
            ctx.schedule_self_msg(interval, Loop);
            return Ok(());
        }
        let message = ShardConsumerMessage::ShardClosed(self.shard_id.clone());
        self.send_message(ctx, message).await?;
        Err(ActorExitStatus::Success)
    }
}

#[cfg(all(test, feature = "kinesis-localstack-tests"))]
mod tests {
    use quickwit_actors::Universe;
    use serde_json::Value as JsonValue;

    use super::*;
    use crate::source::kinesis::api::tests::{merge_shards, split_shard};
    use crate::source::kinesis::helpers::tests::{
        DEFAULT_RETRY_PARAMS, make_shard_id, put_records_into_shards, setup, teardown,
    };

    async fn drain_messages(
        sink_rx: &mut mpsc::Receiver<ShardConsumerMessage>,
    ) -> Vec<ShardConsumerMessage> {
        let mut messages = Vec::new();
        while let Ok(message) = sink_rx.try_recv() {
            messages.push(message);
        }
        messages
    }

    #[ignore]
    #[tokio::test]
    async fn test_shard_eof() -> anyhow::Result<()> {
        let universe = Universe::with_accelerated_time();
        let (sink_tx, mut sink_rx) = mpsc::channel(100);
        let (kinesis_client, stream_name) = setup("test-shard-eof", 1).await?;
        let shard_id_0 = make_shard_id(0);
        let shard_consumer = ShardConsumer::new(
            stream_name.clone(),
            shard_id_0.clone(),
            None,
            true,
            kinesis_client.clone(),
            sink_tx,
            *DEFAULT_RETRY_PARAMS,
        );
        let (_mailbox, handle) = universe.spawn_builder().spawn(shard_consumer);
        let (exit_status, exit_state) = handle.join().await;
        assert!(exit_status.is_success());

        let messages = drain_messages(&mut sink_rx).await;
        assert_eq!(messages.len(), 1);

        assert!(matches!(
            &messages[0],
            ShardConsumerMessage::ShardEOF(shard_id) if *shard_id == shard_id_0
        ));
        let expected_state = json!({
            "stream_name": stream_name,
            "shard_id": shard_id_0,
            "current_sequence_number": JsonValue::Null,
            "lag_millis": 0,
            "num_bytes_processed": 0,
            "num_records_processed": 0,
        });
        assert_eq!(exit_state, expected_state);

        teardown(&kinesis_client, &stream_name).await;
        Ok(())
    }

    #[ignore]
    #[tokio::test]
    async fn test_start_at_horizon() -> anyhow::Result<()> {
        let universe = Universe::with_accelerated_time();
        let (sink_tx, mut sink_rx) = mpsc::channel(100);
        let (kinesis_client, stream_name) = setup("test-start-at-horizon", 1).await?;
        let sequence_numbers = put_records_into_shards(
            &kinesis_client,
            &stream_name,
            [(0, "Record #00"), (0, "Record #01")],
        )
        .await?;
        let shard_id_0 = make_shard_id(0);
        let shard_consumer = ShardConsumer::new(
            stream_name.clone(),
            shard_id_0.clone(),
            None,
            true,
            kinesis_client.clone(),
            sink_tx,
            *DEFAULT_RETRY_PARAMS,
        );
        let (_mailbox, handle) = universe.spawn_builder().spawn(shard_consumer);
        let (exit_status, exit_state) = handle.join().await;
        assert!(exit_status.is_success());

        let messages = drain_messages(&mut sink_rx).await;
        assert_eq!(messages.len(), 2);

        assert!(matches!(
            &messages[0],
            ShardConsumerMessage::Records { shard_id, records, lag_millis: _ } if *shard_id == shard_id_0 && records.len() == 2
        ));
        assert!(matches!(
            &messages[1],
            ShardConsumerMessage::ShardEOF(shard_id) if *shard_id == shard_id_0
        ));
        let current_sequence_number = sequence_numbers
            .get(&0)
            .and_then(|per_shard_sequence_numbers| per_shard_sequence_numbers.last())
            .cloned();
        let expected_state = json!({
            "stream_name": stream_name,
            "shard_id": shard_id_0,
            "current_sequence_number": current_sequence_number,
            "lag_millis": 0,
            "num_bytes_processed": 20,
            "num_records_processed": 2,
        });
        assert_eq!(exit_state, expected_state);

        teardown(&kinesis_client, &stream_name).await;
        Ok(())
    }

    // Ignoring this test because the localstack implementation of Kinesis is bogus.
    #[ignore]
    #[tokio::test]
    async fn test_start_after_sequence_number() -> anyhow::Result<()> {
        let universe = Universe::with_accelerated_time();
        let (sink_tx, mut sink_rx) = mpsc::channel(100);
        let (kinesis_client, stream_name) = setup("test-start-after-sequence-number", 1).await?;
        let sequence_numbers = put_records_into_shards(
            &kinesis_client,
            &stream_name,
            [(0, "Record #00"), (0, "Record #01")],
        )
        .await?;
        let shard_id_0 = make_shard_id(0);
        let from_sequence_number_exclusive = sequence_numbers
            .get(&0)
            .and_then(|sequence_numbers| sequence_numbers.first())
            .cloned();
        let shard_consumer = ShardConsumer::new(
            stream_name.clone(),
            shard_id_0.clone(),
            from_sequence_number_exclusive,
            true,
            kinesis_client.clone(),
            sink_tx,
            *DEFAULT_RETRY_PARAMS,
        );
        let (_mailbox, handle) = universe.spawn_builder().spawn(shard_consumer);
        let (exit_status, exit_state) = handle.join().await;
        assert!(exit_status.is_success());

        let messages = drain_messages(&mut sink_rx).await;
        assert_eq!(messages.len(), 2);

        assert!(matches!(
            &messages[0],
            ShardConsumerMessage::Records { shard_id, records, lag_millis: _ } if *shard_id == shard_id_0 && records.len() == 1
        ));
        assert!(matches!(
            &messages[1],
            ShardConsumerMessage::ShardEOF(shard_id) if *shard_id == shard_id_0
        ));
        let current_sequence_number = sequence_numbers
            .get(&0)
            .and_then(|per_shard_sequence_numbers| per_shard_sequence_numbers.last())
            .cloned();
        let expected_state = json!({
            "stream_name": stream_name,
            "shard_id": shard_id_0,
            "current_sequence_number": current_sequence_number,
            "lag_millis": 0,
            "num_bytes_processed": 10,
            "num_records_processed": 1,
        });
        assert_eq!(exit_state, expected_state);

        teardown(&kinesis_client, &stream_name).await;
        Ok(())
    }

    // Ignoring this test because the localstack implementation of Kinesis is bogus.
    #[ignore]
    #[tokio::test]
    async fn test_merge_shards() -> anyhow::Result<()> {
        let universe = Universe::with_accelerated_time();
        let (sink_tx, mut sink_rx) = mpsc::channel(100);
        let (kinesis_client, stream_name) = setup("test-merge-shards", 2).await?;
        let shard_id_0 = make_shard_id(0);
        let shard_id_1 = make_shard_id(1);
        merge_shards(&kinesis_client, &stream_name, &shard_id_0, &shard_id_1).await?;
        {
            let shard_consumer_0 = ShardConsumer::new(
                stream_name.clone(),
                shard_id_0.clone(),
                None,
                false,
                kinesis_client.clone(),
                sink_tx.clone(),
                *DEFAULT_RETRY_PARAMS,
            );
            let (_mailbox, handle) = universe.spawn_builder().spawn(shard_consumer_0);
            let (exit_status, _exit_state) = handle.join().await;
            assert!(exit_status.is_success());

            let messages = drain_messages(&mut sink_rx).await;
            assert_eq!(messages.len(), 2);

            assert!(matches!(
                &messages[0],
                ShardConsumerMessage::ChildShards(shard_ids) if *shard_ids == vec![make_shard_id(2)]
            ));
            assert!(matches!(
                &messages[1],
                ShardConsumerMessage::ShardClosed(shard_id) if *shard_id == shard_id_0
            ));
        }
        {
            let shard_consumer_1 = ShardConsumer::new(
                stream_name.clone(),
                shard_id_1.clone(),
                None,
                false,
                kinesis_client.clone(),
                sink_tx,
                *DEFAULT_RETRY_PARAMS,
            );
            let (_mailbox, handle) = universe.spawn_builder().spawn(shard_consumer_1);
            let (exit_status, _exit_state) = handle.join().await;
            assert!(exit_status.is_success());

            let messages = drain_messages(&mut sink_rx).await;
            assert_eq!(messages.len(), 1);

            assert!(matches!(
                &messages[0],
                ShardConsumerMessage::ShardClosed(shard_id) if *shard_id == shard_id_1
            ));
        }
        teardown(&kinesis_client, &stream_name).await;
        Ok(())
    }

    // Ignoring this test because the localstack implementation of Kinesis is bogus.
    #[ignore]
    #[tokio::test]
    async fn test_split_shard() -> anyhow::Result<()> {
        let universe = Universe::with_accelerated_time();
        let (sink_tx, mut sink_rx) = mpsc::channel(100);
        let (kinesis_client, stream_name) = setup("test-split-shard", 1).await?;
        let shard_id_0 = make_shard_id(0);
        split_shard(&kinesis_client, &stream_name, &shard_id_0, "42").await?;

        let shard_consumer = ShardConsumer::new(
            stream_name.clone(),
            shard_id_0.clone(),
            None,
            false,
            kinesis_client.clone(),
            sink_tx,
            *DEFAULT_RETRY_PARAMS,
        );
        let (_mailbox, handle) = universe.spawn_builder().spawn(shard_consumer);
        let (exit_status, _exit_state) = handle.join().await;
        assert!(exit_status.is_success());

        let messages = drain_messages(&mut sink_rx).await;
        assert_eq!(messages.len(), 2);

        assert!(matches!(
            &messages[0],
            ShardConsumerMessage::ChildShards(shard_ids) if *shard_ids == vec![make_shard_id(1), make_shard_id(2)]
        ));
        assert!(matches!(
            &messages[1],
            ShardConsumerMessage::ShardClosed(shard_id) if *shard_id == shard_id_0
        ));
        teardown(&kinesis_client, &stream_name).await;
        Ok(())
    }
}


================================================
FILE: quickwit/quickwit-indexing/src/source/mod.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

//! # Sources
//!
//! Quickwit gets its data from so-called `Sources`.
//!
//! The role of a source is to push message to an indexer mailbox.
//! Implementers need to focus on the implementation of the [`Source`] trait
//! and in particular its emit_batches method.
//! In addition, they need to implement a source factory.
//!
//! The source trait will executed in an actor.
//!
//! # Checkpoints and exactly-once semantics
//!
//! Quickwit is designed to offer exactly-once semantics whenever possible using the following
//! strategy, using checkpoints.
//!
//! Messages are split into partitions, and within a partition messages are totally ordered: they
//! are marked by a unique position within this partition.
//!
//! Sources are required to emit messages in a way that respects this partial order.
//! If two message belong 2 different partitions, they can be emitted in any order.
//! If two message belong to the same partition, they  are required to be emitted in the order of
//! their position.
//!
//! The set of documents processed by a source can then be expressed entirely as Checkpoint, that is
//! simply a mapping `(PartitionId -> Position)`.
//!
//! This checkpoint is used in Quickwit to implement exactly-once semantics.
//! When a new split is published, it is atomically published with an update of the last indexed
//! checkpoint.
//!
//! If the indexing pipeline is restarted, the source will simply be recreated with that checkpoint.
//!
//! # Example sources
//!
//! Right now two sources are implemented in quickwit.
//! - the file source: there partition here is a filepath, and the position is a byte-offset within
//!   that file.
//! - the kafka source: the partition id is a kafka topic partition id, and the position is a kafka
//!   offset.
mod doc_file_reader;
mod file_source;
#[cfg(feature = "gcp-pubsub")]
mod gcp_pubsub_source;
mod ingest;
mod ingest_api_source;
#[cfg(feature = "kafka")]
mod kafka_source;
#[cfg(feature = "kinesis")]
mod kinesis;
#[cfg(feature = "pulsar")]
mod pulsar_source;
#[cfg(feature = "queue-sources")]
mod queue_sources;
mod source_factory;
mod stdin_source;
mod vec_source;
mod void_source;

use std::collections::BTreeSet;
use std::path::PathBuf;
use std::time::Duration;

use async_trait::async_trait;
use bytes::Bytes;
use bytesize::ByteSize;
pub use file_source::{FileSource, FileSourceFactory};
#[cfg(feature = "gcp-pubsub")]
pub use gcp_pubsub_source::{GcpPubSubSource, GcpPubSubSourceFactory};
#[cfg(feature = "kafka")]
pub use kafka_source::{KafkaSource, KafkaSourceFactory};
#[cfg(feature = "kinesis")]
pub use kinesis::kinesis_source::{KinesisSource, KinesisSourceFactory};
use once_cell::sync::{Lazy, OnceCell};
#[cfg(feature = "pulsar")]
pub use pulsar_source::{PulsarSource, PulsarSourceFactory};
#[cfg(feature = "sqs")]
pub use queue_sources::sqs_queue;
use quickwit_actors::{Actor, ActorContext, ActorExitStatus, Handler, Mailbox};
use quickwit_common::metrics::{GaugeGuard, MEMORY_METRICS};
use quickwit_common::pubsub::EventBroker;
use quickwit_common::runtimes::RuntimeType;
use quickwit_config::{
    FileSourceNotification, FileSourceParams, IndexingSettings, SourceConfig, SourceParams,
};
use quickwit_ingest::IngesterPool;
use quickwit_metastore::IndexMetadataResponseExt;
use quickwit_metastore::checkpoint::{SourceCheckpoint, SourceCheckpointDelta};
use quickwit_proto::indexing::IndexingPipelineId;
use quickwit_proto::metastore::{
    IndexMetadataRequest, MetastoreError, MetastoreResult, MetastoreService,
    MetastoreServiceClient, SourceType,
};
use quickwit_proto::types::{IndexUid, NodeIdRef, PipelineUid, ShardId};
use quickwit_storage::StorageResolver;
use serde_json::Value as JsonValue;
pub use source_factory::{SourceFactory, SourceLoader, TypedSourceFactory};
use tokio::runtime::Handle;
use tracing::error;
pub use vec_source::{VecSource, VecSourceFactory};
pub use void_source::{VoidSource, VoidSourceFactory};

use self::doc_file_reader::dir_and_filename;
use self::stdin_source::StdinSourceFactory;
use crate::actors::DocProcessor;
use crate::models::RawDocBatch;
use crate::source::ingest::IngestSourceFactory;
use crate::source::ingest_api_source::IngestApiSourceFactory;

/// Number of bytes after which we cut a new batch.
///
/// We try to emit chewable batches for the indexer.
/// One batch = one message to the indexer actor.
///
/// If batches are too large:
/// - we might not be able to observe the state of the indexer for 5 seconds.
/// - we will be needlessly occupying resident memory in the mailbox.
/// - we will not have a precise control of the timeout before commit.
///
/// 5MB seems like a good one size fits all value.
const BATCH_NUM_BYTES_LIMIT: u64 = ByteSize::mib(5).as_u64();

static EMIT_BATCHES_TIMEOUT: Lazy<Duration> = Lazy::new(|| {
    if cfg!(any(test, feature = "testsuite")) {
        let timeout = Duration::from_millis(100);
        assert!(timeout < *quickwit_actors::HEARTBEAT);
        timeout
    } else {
        let timeout = Duration::from_millis(1_000);
        if *quickwit_actors::HEARTBEAT < timeout {
            error!("QW_ACTOR_HEARTBEAT_SECS smaller than batch timeout");
        }
        timeout
    }
});

/// Runtime configuration used during execution of a source actor.
#[derive(Clone)]
pub struct SourceRuntime {
    pub pipeline_id: IndexingPipelineId,
    pub source_config: SourceConfig,
    pub metastore: MetastoreServiceClient,
    pub ingester_pool: IngesterPool,
    // Ingest API queues directory path.
    pub queues_dir_path: PathBuf,
    pub storage_resolver: StorageResolver,
    pub event_broker: EventBroker,
    pub indexing_setting: IndexingSettings,
}

impl SourceRuntime {
    pub fn node_id(&self) -> &NodeIdRef {
        &self.pipeline_id.node_id
    }

    pub fn index_uid(&self) -> &IndexUid {
        &self.pipeline_id.index_uid
    }

    pub fn index_id(&self) -> &str {
        &self.pipeline_id.index_uid.index_id
    }

    pub fn source_id(&self) -> &str {
        &self.pipeline_id.source_id
    }

    pub fn pipeline_uid(&self) -> PipelineUid {
        self.pipeline_id.pipeline_uid
    }

    pub async fn fetch_checkpoint(&self) -> MetastoreResult<SourceCheckpoint> {
        let index_uid = self.index_uid().clone();
        let request = IndexMetadataRequest::for_index_uid(index_uid);
        let response = self.metastore.clone().index_metadata(request).await?;
        let index_metadata = response.deserialize_index_metadata()?;

        if let Some(checkpoint) = index_metadata
            .checkpoint
            .source_checkpoint(self.source_id())
            .cloned()
        {
            return Ok(checkpoint);
        }
        Err(MetastoreError::Internal {
            message: format!(
                "could not find checkpoint for index `{}` and source `{}`",
                self.index_uid(),
                self.source_id()
            ),
            cause: "".to_string(),
        })
    }
}

pub type SourceContext = ActorContext<SourceActor>;

/// A Source is a trait that is mounted in a light wrapping Actor called `SourceActor`.
///
/// For this reason, its methods mimics those of Actor.
/// One key difference is the absence of messages.
///
/// The `SourceActor` implements a loop until emit_batches returns an
/// ActorExitStatus.
///
/// Conceptually, a source execution works as if it was a simple loop
/// as follow:
///
/// ```ignore
/// fn whatever() -> anyhow::Result<()> {
///     source.initialize(ctx)?;
///     let exit_status = loop {
///         if let Err(exit_status) = source.emit_batches()? {
///             break exit_status;
///         }
///     };
///     source.finalize(exit_status)?;
///     Ok(())
/// }
/// ```
#[async_trait]
pub trait Source: Send + 'static {
    /// This method will be called before any calls to `emit_batches`.
    async fn initialize(
        &mut self,
        _doc_processor_mailbox: &Mailbox<DocProcessor>,
        _ctx: &SourceContext,
    ) -> Result<(), ActorExitStatus> {
        Ok(())
    }

    /// Main part of the source implementation, `emit_batches` can emit 0..n batches.
    ///
    /// The `batch_sink` is a mailbox that has a bounded capacity.
    /// In that case, `batch_sink` will block.
    ///
    /// It returns an optional duration specifying how long the batch requester
    /// should wait before polling again.
    async fn emit_batches(
        &mut self,
        doc_processor_mailbox: &Mailbox<DocProcessor>,
        ctx: &SourceContext,
    ) -> Result<Duration, ActorExitStatus>;

    /// Assign shards is called when the source is assigned a new set of shards by the control
    /// plane.
    async fn assign_shards(
        &mut self,
        _shard_ids: BTreeSet<ShardId>,
        _doc_processor_mailbox: &Mailbox<DocProcessor>,
        _ctx: &SourceContext,
    ) -> anyhow::Result<()> {
        Ok(())
    }

    /// After publication of a split, `suggest_truncate` is called.
    /// This makes it possible for the implementation of a source to
    /// release some resources associated to the data that was just published.
    ///
    /// This method is for instance useful for the ingest API, as it is possible
    /// to delete all message anterior to the checkpoint in the ingest API queue.
    ///
    /// It is perfectly fine for implementation to ignore this function.
    /// For instance, message queue like kafka are meant to be shared by different
    /// client, and rely on a retention strategy to delete messages.
    ///
    /// Returning an error has no effect on the source actor itself or the
    /// indexing pipeline, as truncation is just "a suggestion".
    /// The error will however be logged.
    async fn suggest_truncate(
        &mut self,
        _checkpoint: SourceCheckpoint,
        _ctx: &SourceContext,
    ) -> anyhow::Result<()> {
        Ok(())
    }

    /// Finalize is called once after the actor terminates.
    async fn finalize(
        &mut self,
        _exit_status: &ActorExitStatus,
        _ctx: &SourceContext,
    ) -> anyhow::Result<()> {
        Ok(())
    }

    /// A name identifying the type of source.
    fn name(&self) -> String;

    /// Returns an observable_state for the actor.
    ///
    /// This object is simply a json object, and its content may vary depending on the
    /// source.
    fn observable_state(&self) -> JsonValue;
}

/// The SourceActor acts as a thin wrapper over a source trait object to execute.
///
/// It mostly takes care of running a loop calling `emit_batches(...)`.
pub struct SourceActor {
    pub source: Box<dyn Source>,
    pub doc_processor_mailbox: Mailbox<DocProcessor>,
}

#[derive(Debug)]
struct Loop;

#[derive(Debug)]
pub struct Assignment {
    pub shard_ids: BTreeSet<ShardId>,
}

#[derive(Debug)]
pub struct AssignShards(pub Assignment);

#[async_trait]
impl Actor for SourceActor {
    type ObservableState = JsonValue;

    fn name(&self) -> String {
        self.source.name()
    }

    fn observable_state(&self) -> Self::ObservableState {
        self.source.observable_state()
    }

    fn runtime_handle(&self) -> Handle {
        RuntimeType::NonBlocking.get_runtime_handle()
    }

    fn yield_after_each_message(&self) -> bool {
        false
    }

    async fn initialize(&mut self, ctx: &SourceContext) -> Result<(), ActorExitStatus> {
        self.source
            .initialize(&self.doc_processor_mailbox, ctx)
            .await?;
        self.handle(Loop, ctx).await?;
        Ok(())
    }

    async fn finalize(
        &mut self,
        exit_status: &ActorExitStatus,
        ctx: &SourceContext,
    ) -> anyhow::Result<()> {
        self.source.finalize(exit_status, ctx).await?;
        Ok(())
    }
}

#[async_trait]
impl Handler<Loop> for SourceActor {
    type Reply = ();

    async fn handle(&mut self, _message: Loop, ctx: &SourceContext) -> Result<(), ActorExitStatus> {
        let wait_for = self
            .source
            .emit_batches(&self.doc_processor_mailbox, ctx)
            .await?;
        if wait_for.is_zero() {
            ctx.send_self_message(Loop).await?;
            return Ok(());
        }
        ctx.schedule_self_msg(wait_for, Loop);
        Ok(())
    }
}

#[async_trait]
impl Handler<AssignShards> for SourceActor {
    type Reply = ();

    async fn handle(
        &mut self,
        assign_shards_message: AssignShards,
        ctx: &SourceContext,
    ) -> Result<(), ActorExitStatus> {
        let AssignShards(Assignment { shard_ids }) = assign_shards_message;
        self.source
            .assign_shards(shard_ids, &self.doc_processor_mailbox, ctx)
            .await?;
        Ok(())
    }
}

// TODO: Use `SourceType` instead of `&str``.
pub fn quickwit_supported_sources() -> &'static SourceLoader {
    static SOURCE_LOADER: OnceCell<SourceLoader> = OnceCell::new();
    SOURCE_LOADER.get_or_init(|| {
        let mut source_factory = SourceLoader::default();
        source_factory.add_source(SourceType::File, FileSourceFactory);
        #[cfg(feature = "gcp-pubsub")]
        source_factory.add_source(SourceType::PubSub, GcpPubSubSourceFactory);
        source_factory.add_source(SourceType::IngestV1, IngestApiSourceFactory);
        source_factory.add_source(SourceType::IngestV2, IngestSourceFactory);
        #[cfg(feature = "kafka")]
        source_factory.add_source(SourceType::Kafka, KafkaSourceFactory);
        #[cfg(feature = "kinesis")]
        source_factory.add_source(SourceType::Kinesis, KinesisSourceFactory);
        #[cfg(feature = "pulsar")]
        source_factory.add_source(SourceType::Pulsar, PulsarSourceFactory);
        source_factory.add_source(SourceType::Stdin, StdinSourceFactory);
        source_factory.add_source(SourceType::Vec, VecSourceFactory);
        source_factory.add_source(SourceType::Void, VoidSourceFactory);
        source_factory
    })
}

pub async fn check_source_connectivity(
    storage_resolver: &StorageResolver,
    source_config: &SourceConfig,
) -> anyhow::Result<()> {
    match &source_config.source_params {
        SourceParams::File(FileSourceParams::Filepath(file_uri)) => {
            let (dir_uri, file_name) = dir_and_filename(file_uri)?;
            let storage = storage_resolver.resolve(&dir_uri).await?;
            storage.file_num_bytes(file_name).await?;
            Ok(())
        }
        #[allow(unused_variables)]
        SourceParams::File(FileSourceParams::Notifications(FileSourceNotification::Sqs(
            sqs_config,
        ))) => {
            #[cfg(not(feature = "sqs"))]
            anyhow::bail!("Quickwit was compiled without the `sqs` feature");

            #[cfg(feature = "sqs")]
            {
                queue_sources::sqs_queue::check_connectivity(&sqs_config.queue_url).await?;
                Ok(())
            }
        }
        #[allow(unused_variables)]
        SourceParams::Kafka(params) => {
            #[cfg(not(feature = "kafka"))]
            anyhow::bail!("Quickwit was compiled without the `kafka` feature");

            #[cfg(feature = "kafka")]
            {
                kafka_source::check_connectivity(params.clone()).await?;
                Ok(())
            }
        }
        #[allow(unused_variables)]
        SourceParams::Kinesis(params) => {
            #[cfg(not(feature = "kinesis"))]
            anyhow::bail!("Quickwit was compiled without the `kinesis` feature");

            #[cfg(feature = "kinesis")]
            {
                kinesis::check_connectivity(params.clone()).await?;
                Ok(())
            }
        }
        #[allow(unused_variables)]
        SourceParams::Pulsar(params) => {
            #[cfg(not(feature = "pulsar"))]
            anyhow::bail!("Quickwit was compiled without the `pulsar` feature");

            #[cfg(feature = "pulsar")]
            {
                pulsar_source::check_connectivity(params).await?;
                Ok(())
            }
        }
        _ => Ok(()),
    }
}

#[derive(Debug)]
pub struct SuggestTruncate(pub SourceCheckpoint);

#[async_trait]
impl Handler<SuggestTruncate> for SourceActor {
    type Reply = ();

    async fn handle(
        &mut self,
        suggest_truncate: SuggestTruncate,
        ctx: &SourceContext,
    ) -> Result<(), ActorExitStatus> {
        let SuggestTruncate(checkpoint) = suggest_truncate;

        if let Err(error) = self.source.suggest_truncate(checkpoint, ctx).await {
            // Failing to process suggest truncate does not
            // kill the source nor the indexing pipeline, but we log the error.
            error!(%error, "failed to process suggest truncate");
        }
        Ok(())
    }
}

pub(super) struct BatchBuilder {
    // Do not directly append documents to this vector; otherwise, in-flight metrics will be
    // incorrect. Use `add_doc` instead.
    docs: Vec<Bytes>,
    num_bytes: u64,
    checkpoint_delta: SourceCheckpointDelta,
    force_commit: bool,
    gauge_guard: GaugeGuard<'static>,
}

impl BatchBuilder {
    pub fn new(source_type: SourceType) -> Self {
        Self::with_capacity(0, source_type)
    }

    pub fn with_capacity(capacity: usize, source_type: SourceType) -> Self {
        let gauge = match source_type {
            SourceType::File => MEMORY_METRICS.in_flight.file(),
            SourceType::IngestV2 => MEMORY_METRICS.in_flight.ingest(),
            SourceType::Kafka => MEMORY_METRICS.in_flight.kafka(),
            SourceType::Kinesis => MEMORY_METRICS.in_flight.kinesis(),
            SourceType::PubSub => MEMORY_METRICS.in_flight.pubsub(),
            SourceType::Pulsar => MEMORY_METRICS.in_flight.pulsar(),
            _ => MEMORY_METRICS.in_flight.other(),
        };
        let gauge_guard = GaugeGuard::from_gauge(gauge);

        Self {
            docs: Vec::with_capacity(capacity),
            num_bytes: 0,
            checkpoint_delta: SourceCheckpointDelta::default(),
            force_commit: false,
            gauge_guard,
        }
    }

    pub fn add_doc(&mut self, doc: Bytes) {
        let num_bytes = doc.len();
        self.docs.push(doc);
        self.gauge_guard.add(num_bytes as i64);
        self.num_bytes += num_bytes as u64;
    }

    pub fn force_commit(&mut self) {
        self.force_commit = true;
    }

    pub fn build(self) -> RawDocBatch {
        RawDocBatch::new(self.docs, self.checkpoint_delta, self.force_commit)
    }

    #[cfg(feature = "kafka")]
    pub fn clear(&mut self) {
        self.docs.clear();
        self.checkpoint_delta = SourceCheckpointDelta::default();
        self.gauge_guard.sub(self.num_bytes as i64);
        self.num_bytes = 0;
    }
}

#[cfg(test)]
mod tests {

    use std::num::NonZeroUsize;

    use quickwit_config::{SourceInputFormat, VecSourceParams};
    use quickwit_metastore::IndexMetadata;
    use quickwit_metastore::checkpoint::IndexCheckpointDelta;
    use quickwit_proto::metastore::{IndexMetadataResponse, MockMetastoreService};
    use quickwit_proto::types::NodeId;

    use super::*;

    pub struct SourceRuntimeBuilder {
        index_uid: IndexUid,
        source_config: SourceConfig,
        metastore_opt: Option<MetastoreServiceClient>,
        queues_dir_path_opt: Option<PathBuf>,
    }

    impl SourceRuntimeBuilder {
        pub fn new(index_uid: IndexUid, source_config: SourceConfig) -> Self {
            SourceRuntimeBuilder {
                index_uid,
                source_config,
                metastore_opt: None,
                queues_dir_path_opt: None,
            }
        }

        pub fn build(mut self) -> SourceRuntime {
            let metastore = self
                .metastore_opt
                .take()
                .unwrap_or_else(|| self.setup_mock_metastore(None));

            let queues_dir_path = self
                .queues_dir_path_opt
                .unwrap_or_else(|| PathBuf::from("./queues"));

            SourceRuntime {
                pipeline_id: IndexingPipelineId {
                    node_id: NodeId::from("test-node"),
                    index_uid: self.index_uid,
                    source_id: self.source_config.source_id.clone(),
                    pipeline_uid: PipelineUid::for_test(0u128),
                },
                metastore,
                ingester_pool: IngesterPool::default(),
                queues_dir_path,
                source_config: self.source_config,
                storage_resolver: StorageResolver::for_test(),
                event_broker: EventBroker::default(),
                indexing_setting: IndexingSettings::default(),
            }
        }

        #[cfg(all(
            test,
            any(feature = "kafka-broker-tests", feature = "sqs-localstack-tests")
        ))]
        pub fn with_metastore(mut self, metastore: MetastoreServiceClient) -> Self {
            self.metastore_opt = Some(metastore);
            self
        }

        pub fn with_mock_metastore(
            mut self,
            source_checkpoint_delta_opt: Option<SourceCheckpointDelta>,
        ) -> Self {
            self.metastore_opt = Some(self.setup_mock_metastore(source_checkpoint_delta_opt));
            self
        }

        pub fn with_queues_dir(mut self, queues_dir_path: impl Into<PathBuf>) -> Self {
            self.queues_dir_path_opt = Some(queues_dir_path.into());
            self
        }

        fn setup_mock_metastore(
            &self,
            source_checkpoint_delta_opt: Option<SourceCheckpointDelta>,
        ) -> MetastoreServiceClient {
            let index_uid = self.index_uid.clone();
            let source_config = self.source_config.clone();

            let mut mock_metastore = MockMetastoreService::new();
            mock_metastore
                .expect_index_metadata()
                .returning(move |_request| {
                    let index_uri = format!("ram:///indexes/{}", index_uid.index_id);
                    let mut index_metadata =
                        IndexMetadata::for_test(&index_uid.index_id, &index_uri);
                    index_metadata.index_uid = index_uid.clone();

                    let source_id = source_config.source_id.clone();
                    index_metadata.add_source(source_config.clone()).unwrap();

                    if let Some(source_delta) = source_checkpoint_delta_opt.clone() {
                        let delta = IndexCheckpointDelta {
                            source_id,
                            source_delta,
                        };
                        index_metadata.checkpoint.try_apply_delta(delta).unwrap();
                    }
                    let response =
                        IndexMetadataResponse::try_from_index_metadata(&index_metadata).unwrap();
                    Ok(response)
                });
            MetastoreServiceClient::from_mock(mock_metastore)
        }
    }

    #[tokio::test]
    async fn test_check_source_connectivity() -> anyhow::Result<()> {
        {
            let source_config = SourceConfig {
                source_id: "void".to_string(),
                num_pipelines: NonZeroUsize::MIN,
                enabled: true,
                source_params: SourceParams::void(),
                transform_config: None,
                input_format: SourceInputFormat::Json,
            };
            check_source_connectivity(&StorageResolver::for_test(), &source_config).await?;
        }
        {
            let source_config = SourceConfig {
                source_id: "vec".to_string(),
                num_pipelines: NonZeroUsize::MIN,
                enabled: true,
                source_params: SourceParams::Vec(VecSourceParams::default()),
                transform_config: None,
                input_format: SourceInputFormat::Json,
            };
            check_source_connectivity(&StorageResolver::for_test(), &source_config).await?;
        }
        {
            let source_config = SourceConfig {
                source_id: "file".to_string(),
                num_pipelines: NonZeroUsize::MIN,
                enabled: true,
                source_params: SourceParams::file_from_str("file-does-not-exist.json").unwrap(),
                transform_config: None,
                input_format: SourceInputFormat::Json,
            };
            assert!(
                check_source_connectivity(&StorageResolver::for_test(), &source_config)
                    .await
                    .is_err()
            );
        }
        {
            let source_config = SourceConfig {
                source_id: "file".to_string(),
                num_pipelines: NonZeroUsize::MIN,
                enabled: true,
                source_params: SourceParams::file_from_str("data/test_corpus.json").unwrap(),
                transform_config: None,
                input_format: SourceInputFormat::Json,
            };
            assert!(
                check_source_connectivity(&StorageResolver::for_test(), &source_config)
                    .await
                    .is_ok()
            );
        }
        Ok(())
    }
}

#[cfg(all(
    test,
    any(
        feature = "sqs-localstack-tests",
        feature = "kafka-broker-tests",
        feature = "pulsar-broker-tests"
    )
))]
mod test_setup_helper {

    use quickwit_config::IndexConfig;
    use quickwit_metastore::checkpoint::{IndexCheckpointDelta, PartitionId};
    use quickwit_metastore::{CreateIndexRequestExt, SplitMetadata, StageSplitsRequestExt};
    use quickwit_proto::metastore::{CreateIndexRequest, PublishSplitsRequest, StageSplitsRequest};
    use quickwit_proto::types::Position;

    use super::*;
    use crate::new_split_id;

    pub async fn setup_index(
        metastore: MetastoreServiceClient,
        index_id: &str,
        source_config: &SourceConfig,
        partition_deltas: &[(PartitionId, Position, Position)],
    ) -> IndexUid {
        let index_uri = format!("ram:///indexes/{index_id}");
        let index_config = IndexConfig::for_test(index_id, &index_uri);
        let create_index_request = CreateIndexRequest::try_from_index_and_source_configs(
            &index_config,
            std::slice::from_ref(source_config),
        )
        .unwrap();
        let index_uid: IndexUid = metastore
            .create_index(create_index_request)
            .await
            .unwrap()
            .index_uid()
            .clone();

        if partition_deltas.is_empty() {
            return index_uid;
        }
        let split_id = new_split_id();
        let split_metadata = SplitMetadata::for_test(split_id.clone());
        let stage_splits_request =
            StageSplitsRequest::try_from_split_metadata(index_uid.clone(), &split_metadata)
                .unwrap();
        metastore.stage_splits(stage_splits_request).await.unwrap();

        let mut source_delta = SourceCheckpointDelta::default();
        for (partition_id, from_position, to_position) in partition_deltas.iter().cloned() {
            source_delta
                .record_partition_delta(partition_id, from_position, to_position)
                .unwrap();
        }
        let checkpoint_delta = IndexCheckpointDelta {
            source_id: source_config.source_id.to_string(),
            source_delta,
        };
        let checkpoint_delta_json = serde_json::to_string(&checkpoint_delta).unwrap();
        let publish_splits_request = PublishSplitsRequest {
            index_uid: Some(index_uid.clone()),
            index_checkpoint_delta_json_opt: Some(checkpoint_delta_json),
            staged_split_ids: vec![split_id.clone()],
            replaced_split_ids: Vec::new(),
            publish_token_opt: None,
        };
        metastore
            .publish_splits(publish_splits_request)
            .await
            .unwrap();
        index_uid
    }
}


================================================
FILE: quickwit/quickwit-indexing/src/source/pulsar_source.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::BTreeMap;
use std::fmt;
use std::time::{Duration, Instant};

use anyhow::{Context, anyhow};
use async_trait::async_trait;
use bytes::Bytes;
use futures::StreamExt;
use pulsar::authentication::oauth2::{OAuth2Authentication, OAuth2Params};
use pulsar::consumer::Message;
use pulsar::message::proto::MessageIdData;
use pulsar::{
    Authentication, Consumer, DeserializeMessage, Payload, Pulsar, SubType, TokioExecutor,
};
use quickwit_actors::{ActorContext, ActorExitStatus, Mailbox};
use quickwit_config::{PulsarSourceAuth, PulsarSourceParams};
use quickwit_metastore::checkpoint::{PartitionId, SourceCheckpoint};
use quickwit_proto::metastore::SourceType;
use quickwit_proto::types::{IndexUid, Position};
use serde_json::{Value as JsonValue, json};
use tokio::time;
use tracing::{debug, info, warn};

use crate::actors::DocProcessor;
use crate::source::{
    BATCH_NUM_BYTES_LIMIT, BatchBuilder, EMIT_BATCHES_TIMEOUT, Source, SourceActor, SourceContext,
    SourceRuntime, TypedSourceFactory,
};

type PulsarConsumer = Consumer<PulsarMessage, TokioExecutor>;

pub struct PulsarSourceFactory;

#[async_trait]
impl TypedSourceFactory for PulsarSourceFactory {
    type Source = PulsarSource;
    type Params = PulsarSourceParams;

    async fn typed_create_source(
        source_runtime: SourceRuntime,
        source_params: PulsarSourceParams,
    ) -> anyhow::Result<Self::Source> {
        PulsarSource::try_new(source_runtime, source_params).await
    }
}

#[derive(Default, Debug)]
pub struct PulsarSourceState {
    /// Number of bytes processed by the source.
    pub num_bytes_processed: u64,
    /// Number of messages processed by the source (including invalid messages).
    pub num_messages_processed: u64,
    /// Number of invalid messages, i.e., that were empty or could not be parsed.
    pub num_invalid_messages: u64,
    /// The number of messages that were skipped due to the message being older
    /// than the current checkpoint position
    pub num_skipped_messages: u64,
}

pub struct PulsarSource {
    source_runtime: SourceRuntime,
    source_params: PulsarSourceParams,
    pulsar_consumer: PulsarConsumer,
    subscription_name: String,
    current_positions: BTreeMap<PartitionId, Position>,
    state: PulsarSourceState,
}

impl fmt::Debug for PulsarSource {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        f.debug_struct("PulsarSource")
            .field("index_uid", self.source_runtime.index_uid())
            .field("source_id", &self.source_runtime.source_id())
            .field("subscription_name", &self.subscription_name)
            .field("topics", &self.source_params.topics.join(", "))
            .finish()
    }
}

impl PulsarSource {
    pub async fn try_new(
        source_runtime: SourceRuntime,
        source_params: PulsarSourceParams,
    ) -> anyhow::Result<Self> {
        let subscription_name =
            subscription_name(source_runtime.index_uid(), source_runtime.source_id());
        info!(
            index_id=%source_runtime.index_id(),
            source_id=%source_runtime.source_id(),
            topics=?source_params.topics,
            subscription_name=%subscription_name,
            "Create Pulsar source."
        );
        let pulsar = connect_pulsar(&source_params).await?;
        let checkpoint = source_runtime.fetch_checkpoint().await?;

        // Current positions are built mapping the topic ID to the last-saved
        // message ID, pulsar ensures these topics (and topic partitions) are
        // unique so that we don't inadvertently clash.
        let mut current_positions = BTreeMap::new();
        for topic in source_params.topics.iter() {
            let partitions = pulsar.lookup_partitioned_topic(topic).await?;

            for (partition, _) in partitions {
                let partition_id = PartitionId::from(partition);
                let position_opt = checkpoint.position_for_partition(&partition_id).cloned();

                if let Some(position) = position_opt {
                    current_positions.insert(partition_id, position);
                }
            }
        }
        let pulsar_consumer = create_pulsar_consumer(
            subscription_name.clone(),
            source_params.clone(),
            pulsar,
            current_positions.clone(),
        )
        .await?;

        Ok(Self {
            source_runtime,
            source_params,
            pulsar_consumer,
            subscription_name,
            current_positions,
            state: PulsarSourceState::default(),
        })
    }

    fn process_message(
        &mut self,
        message: Message<PulsarMessage>,
        batch: &mut BatchBuilder,
    ) -> anyhow::Result<()> {
        let current_position = msg_id_to_position(message.message_id());
        let doc = message.deserialize();
        self.add_doc_to_batch(&message.topic, current_position, doc, batch)
    }

    fn add_doc_to_batch(
        &mut self,
        topic: &str,
        msg_position: Position,
        doc: Bytes,
        batch: &mut BatchBuilder,
    ) -> anyhow::Result<()> {
        if doc.is_empty() {
            warn!("message received from queue was empty");
            self.state.num_invalid_messages += 1;
            return Ok(());
        }

        let partition = PartitionId::from(topic);
        let num_bytes = doc.len() as u64;

        if let Some(current_position) = self.current_positions.get(&partition) {
            // We skip messages older or equal to the current recorded position.
            // This is because Pulsar may replay messages which have not yet been acknowledged but
            // are in the process of being published, this can occur in situations like pulsar
            // re-balancing topic partitions if a node leaves, node failure, etc...
            if &msg_position <= current_position {
                self.state.num_skipped_messages += 1;
                return Ok(());
            }
        }

        let current_position = self
            .current_positions
            .insert(partition.clone(), msg_position.clone())
            .unwrap_or(Position::Beginning);

        batch
            .checkpoint_delta
            .record_partition_delta(partition, current_position, msg_position)
            .context("failed to record partition delta")?;
        batch.add_doc(doc);

        self.state.num_bytes_processed += num_bytes;
        self.state.num_messages_processed += 1;

        Ok(())
    }

    async fn try_ack_messages(&mut self, checkpoint: SourceCheckpoint) -> anyhow::Result<()> {
        debug!(ckpt = ?checkpoint, "truncating message queue");
        for (partition, position) in checkpoint.iter() {
            if let Some(msg_id) = msg_id_from_position(&position) {
                self.pulsar_consumer
                    .cumulative_ack_with_id(partition.0.as_ref(), msg_id)
                    .await?;
            }
        }
        Ok(())
    }
}

#[async_trait]
impl Source for PulsarSource {
    async fn emit_batches(
        &mut self,
        doc_processor_mailbox: &Mailbox<DocProcessor>,
        ctx: &SourceContext,
    ) -> Result<Duration, ActorExitStatus> {
        let now = Instant::now();
        let mut batch_builder = BatchBuilder::new(SourceType::Pulsar);
        let deadline = time::sleep(*EMIT_BATCHES_TIMEOUT);
        tokio::pin!(deadline);

        loop {
            tokio::select! {
                // This does not actually acquire the lock of the mutex internally
                // we're using the mutex in order to convince the Rust compiler
                // that we can use the consumer within this Sync context.
                message = self.pulsar_consumer.next() => {
                    let message = message
                        .ok_or_else(|| ActorExitStatus::from(anyhow!("consumer was dropped")))?
                        .map_err(|e| ActorExitStatus::from(anyhow!("failed to get message from consumer: {:?}", e)))?;

                    self.process_message(message, &mut batch_builder).map_err(ActorExitStatus::from)?;

                    if batch_builder.num_bytes >= BATCH_NUM_BYTES_LIMIT {
                        break;
                    }
                }
                _ = &mut deadline => {
                    break;
                }
            }
            ctx.record_progress();
        }

        if !batch_builder.checkpoint_delta.is_empty() {
            debug!(
                num_docs=%batch_builder.docs.len(),
                num_bytes=%batch_builder.num_bytes,
                num_millis=%now.elapsed().as_millis(),
                "sending doc batch to indexer"
            );
            let message = batch_builder.build();
            ctx.send_message(doc_processor_mailbox, message).await?;
        }
        Ok(Duration::default())
    }

    async fn suggest_truncate(
        &mut self,
        checkpoint: SourceCheckpoint,
        _ctx: &ActorContext<SourceActor>,
    ) -> anyhow::Result<()> {
        self.try_ack_messages(checkpoint).await
    }

    fn name(&self) -> String {
        format!("{self:?}")
    }

    async fn finalize(
        &mut self,
        _exit_status: &ActorExitStatus,
        _ctx: &SourceContext,
    ) -> anyhow::Result<()> {
        self.pulsar_consumer.close().await?;
        Ok(())
    }

    fn observable_state(&self) -> JsonValue {
        json!({
            "index_id": self.source_runtime.index_id(),
            "source_id": self.source_runtime.source_id(),
            "topics": self.source_params.topics,
            "subscription_name": self.subscription_name,
            "consumer_name": self.source_params.consumer_name,
            "num_bytes_processed": self.state.num_bytes_processed,
            "num_messages_processed": self.state.num_messages_processed,
            "num_invalid_messages": self.state.num_invalid_messages,
        })
    }
}

#[derive(Debug)]
struct PulsarMessage;

impl DeserializeMessage for PulsarMessage {
    type Output = Bytes;

    fn deserialize_message(payload: &Payload) -> Self::Output {
        Bytes::from(payload.data.clone())
    }
}

#[tracing::instrument(name = "pulsar-consumer", skip(pulsar))]
/// Creates a new pulsar consumer
async fn create_pulsar_consumer(
    subscription_name: String,
    params: PulsarSourceParams,
    pulsar: Pulsar<TokioExecutor>,
    current_positions: BTreeMap<PartitionId, Position>,
) -> anyhow::Result<PulsarConsumer> {
    let mut consumer: Consumer<PulsarMessage, _> = pulsar
        .consumer()
        .with_topics(&params.topics)
        .with_consumer_name(&params.consumer_name)
        .with_subscription(subscription_name)
        .with_subscription_type(SubType::Failover)
        .build()
        .await?;

    let consumer_ids = consumer
        .consumer_id()
        .into_iter()
        .map(|id| id.to_string())
        .collect::<Vec<_>>();
    info!(positions = ?current_positions, "seeking to last checkpoint positions");
    for (_, position) in current_positions {
        let seek_to = msg_id_from_position(&position);

        if seek_to.is_some() {
            consumer
                .seek(Some(consumer_ids.clone()), seek_to, None, pulsar.clone())
                .await?;
        }
    }
    Ok(consumer)
}

fn msg_id_to_position(msg: &MessageIdData) -> Position {
    // The order of these fields are important as they affect the sorting
    // of the checkpoint positions.
    //
    // The key parts of the ID used for ordering are:
    // - The ledger ID which is a sequentially increasing ID.
    // - The entry ID the unique ID of the message within the ledger.
    // - The batch position for the current chunk of messages.
    //
    // The remaining keys are not required for sorting but are required
    // in order to re-construct the message ID in order to send back to pulsar.
    // The ledger_id, entry_id and the batch_index form a unique composite key which will
    // prevent the remaining parts of the ID from interfering with the sorting.
    let position_str = format!(
        "{:0>20},{:0>20},{},{},{}",
        msg.ledger_id,
        msg.entry_id,
        msg.batch_index
            .map(|v| format!("{v:010}"))
            .unwrap_or_default(),
        msg.partition
            .and_then(|v| if v < 0 {
                None
            } else {
                Some(format!("{v:010}"))
            })
            .unwrap_or_default(),
        msg.batch_size
            .map(|v| format!("{v:010}"))
            .unwrap_or_default(),
    );

    Position::from(position_str)
}

fn msg_id_from_position(position: &Position) -> Option<MessageIdData> {
    let Position::Offset(offset) = position else {
        return None;
    };
    let mut parts = offset.as_str().split(',');

    let ledger_id = parts.next()?.parse::<u64>().ok()?;
    let entry_id = parts.next()?.parse::<u64>().ok()?;
    let batch_index = parts.next()?.parse::<i32>().ok();
    let partition = parts.next()?.parse::<i32>().unwrap_or(-1);
    let batch_size = parts.next()?.parse::<i32>().ok();

    Some(MessageIdData {
        ledger_id,
        entry_id,
        batch_index,
        batch_size,
        partition: Some(partition),
        ack_set: Vec::new(),
        first_chunk_message_id: None,
    })
}

async fn connect_pulsar(params: &PulsarSourceParams) -> anyhow::Result<Pulsar<TokioExecutor>> {
    let mut builder = Pulsar::builder(&params.address, TokioExecutor);

    match params.authentication.clone() {
        None => {}
        Some(PulsarSourceAuth::Token(token)) => {
            let auth = Authentication {
                name: "token".to_string(),
                data: token.as_bytes().to_vec(),
            };

            builder = builder.with_auth(auth);
        }
        Some(PulsarSourceAuth::Oauth2 {
            issuer_url,
            credentials_url,
            audience,
            scope,
        }) => {
            let auth = OAuth2Params {
                issuer_url,
                credentials_url,
                audience,
                scope,
            };
            builder = builder.with_auth_provider(OAuth2Authentication::client_credentials(auth));
        }
    }
    let pulsar: Pulsar<_> = builder.build().await?;
    Ok(pulsar)
}

/// Checks whether we can establish a connection to the pulsar broker.
pub(crate) async fn check_connectivity(params: &PulsarSourceParams) -> anyhow::Result<()> {
    connect_pulsar(params).await?;
    Ok(())
}

fn subscription_name(index_uid: &IndexUid, source_id: &str) -> String {
    format!("quickwit-{index_uid}-{source_id}")
}

#[cfg(all(test, feature = "pulsar-broker-tests"))]
mod pulsar_broker_tests {
    use std::collections::HashSet;
    use std::num::NonZeroUsize;
    use std::ops::Range;

    use futures::future::join_all;
    use quickwit_actors::{ActorHandle, HEARTBEAT, Inbox, Universe};
    use quickwit_common::rand::append_random_suffix;
    use quickwit_config::{SourceConfig, SourceInputFormat, SourceParams};
    use quickwit_metastore::checkpoint::{PartitionId, SourceCheckpointDelta};
    use quickwit_metastore::metastore_for_test;
    use quickwit_proto::metastore::MetastoreServiceClient;
    use reqwest::StatusCode;

    use super::*;
    use crate::source::pulsar_source::{msg_id_from_position, msg_id_to_position};
    use crate::source::test_setup_helper::setup_index;
    use crate::source::tests::SourceRuntimeBuilder;
    use crate::source::{RawDocBatch, SuggestTruncate, quickwit_supported_sources};

    static PULSAR_URI: &str = "pulsar://localhost:6650";
    static PULSAR_ADMIN_URI: &str = "http://localhost:8081";
    static CLIENT_NAME: &str = "quickwit-tester";

    macro_rules! positions {
        ($($partition:expr => $position:expr $(,)?)*) => {{
            let mut positions = BTreeMap::new();
            $(
                positions.insert(PartitionId::from($partition), Position::offset($position));
            )*
            positions
        }};
    }

    macro_rules! checkpoints {
        ($($partition:expr => $position:expr $(,)?)*) => {{
            let mut checkpoint = SourceCheckpointDelta::default();
            $(
                checkpoint.record_partition_delta(
                    PartitionId::from($partition),
                    Position::Beginning,
                    $position,
                ).unwrap();
            )*
            checkpoint
        }};
    }

    fn get_source_config<S: AsRef<str>>(
        topics: impl IntoIterator<Item = S>,
    ) -> (String, SourceConfig) {
        let source_id = append_random_suffix("test-pulsar-source--source");
        let source_config = SourceConfig {
            source_id: source_id.clone(),
            num_pipelines: NonZeroUsize::MIN,
            enabled: true,
            source_params: SourceParams::Pulsar(PulsarSourceParams {
                topics: topics.into_iter().map(|v| v.as_ref().to_string()).collect(),
                address: PULSAR_URI.to_string(),
                consumer_name: CLIENT_NAME.to_string(),
                authentication: None,
            }),
            transform_config: None,
            input_format: SourceInputFormat::Json,
        };
        (source_id, source_config)
    }

    fn merge_doc_batches(batches: Vec<RawDocBatch>) -> RawDocBatch {
        let mut merged_batch = RawDocBatch::default();
        for batch in batches {
            merged_batch.docs.extend(batch.docs);
            merged_batch
                .checkpoint_delta
                .extend(batch.checkpoint_delta)
                .unwrap();
        }
        merged_batch.docs.sort();
        merged_batch
    }

    struct TopicData {
        messages: Vec<String>,
        expected_position: Position,
    }

    impl TopicData {
        fn num_bytes(&self) -> usize {
            self.messages.iter().map(|v| v.len()).sum::<usize>()
        }

        fn len(&self) -> usize {
            self.messages.len()
        }
    }

    /// Populates a given set of topics with messages produced by closure `M`
    ///
    /// A set of messages and it's expected last checkpoint position is returned
    /// for each topic provided.
    async fn populate_topic<'a, S: AsRef<str> + 'a, M>(
        topics: impl IntoIterator<Item = S>,
        range_message_ids: Range<usize>,
        message_fn: M,
    ) -> anyhow::Result<Vec<TopicData>>
    where
        M: Fn(&str, usize) -> JsonValue,
    {
        let client = Pulsar::builder(PULSAR_URI, TokioExecutor).build().await?;

        let mut pending_messages = Vec::new();
        for topic in topics {
            let mut topic_messages = Vec::with_capacity(range_message_ids.len());
            let mut producer = client
                .producer()
                .with_name(append_random_suffix(CLIENT_NAME))
                .with_topic(topic.as_ref())
                .build()
                .await?;

            for id in range_message_ids.clone() {
                let msg = (message_fn)(topic.as_ref(), id).to_string();
                topic_messages.push(msg);
            }

            let futures = producer.send_all(topic_messages.clone()).await?;
            let receipts = join_all(futures).await;

            let mut last_expected_position = Position::Beginning;
            for result in receipts {
                let msg_id = result?.message_id.unwrap();
                last_expected_position = msg_id_to_position(&msg_id);
            }

            topic_messages.sort();
            pending_messages.push(TopicData {
                messages: topic_messages,
                expected_position: last_expected_position,
            });
            producer.close().await.expect("Close connection.");
        }

        Ok(pending_messages)
    }

    async fn wait_for_completion(
        source_handle: ActorHandle<SourceActor>,
        num_expected: usize,
        partition: PartitionId,
        truncate_to: Position,
    ) -> JsonValue {
        loop {
            let observation = source_handle.observe().await;
            let value = observation.state;
            let num_messages_processed = value
                .get("num_messages_processed")
                .unwrap()
                .as_u64()
                .unwrap();
            if num_messages_processed >= num_expected as u64 {
                break;
            }
            tokio::time::sleep(Duration::from_secs(1)).await;
        }

        let mut checkpoint = SourceCheckpoint::default();
        checkpoint
            .try_apply_delta(checkpoints!(partition => truncate_to))
            .expect("Create checkpoint");
        let truncate = SuggestTruncate(checkpoint);
        source_handle
            .mailbox()
            .send_message(truncate)
            .await
            .expect("Truncate");

        let (_exit_status, exit_state) = source_handle.quit().await;
        exit_state
    }

    async fn create_partitioned_topic(topic: &str, num_partitions: usize) {
        let client = reqwest::Client::new();
        let res = client
            .put(format!(
                "{PULSAR_ADMIN_URI}/admin/v2/persistent/public/default/{topic}/partitions"
            ))
            .body(num_partitions.to_string())
            .header("content-type", b"application/json".as_ref())
            .send()
            .await
            .expect("Send admin request");

        assert_eq!(
            res.status(),
            StatusCode::NO_CONTENT,
            "Expect 204 status code."
        );
    }

    async fn create_source(
        universe: &Universe,
        _metastore: MetastoreServiceClient,
        index_uid: IndexUid,
        source_config: SourceConfig,
        _start_checkpoint: SourceCheckpoint,
    ) -> anyhow::Result<(ActorHandle<SourceActor>, Inbox<DocProcessor>)> {
        let source_loader = quickwit_supported_sources();
        let source_runtime = SourceRuntimeBuilder::new(index_uid, source_config).build();
        let source = source_loader.load_source(source_runtime).await?;
        let (doc_processor_mailbox, doc_processor_inbox) = universe.create_test_mailbox();
        let source_actor = SourceActor {
            source,
            doc_processor_mailbox,
        };
        let (_source_mailbox, source_handle) = universe.spawn_builder().spawn(source_actor);

        Ok((source_handle, doc_processor_inbox))
    }

    fn message_generator(topic: &str, id: usize) -> JsonValue {
        json!({
            "id": id.to_string(),
            "topic": topic,
            "timestamp": 1674515715,
            "body": "Hello, world! This is some test data.",
        })
    }

    fn count_unique_messages_in_batches(batches: &[RawDocBatch]) -> usize {
        let message_ids_topic: HashSet<String> = batches
            .iter()
            .flat_map(|batch| &batch.docs)
            .map(|doc| {
                let json_doc = serde_json::from_slice::<serde_json::Value>(doc).unwrap();
                let id: &str = json_doc.get("id").unwrap().as_str().unwrap();
                let topic: &str = json_doc.get("topic").unwrap().as_str().unwrap();
                format!("{id}-{topic}")
            })
            .collect();
        message_ids_topic.len()
    }

    #[test]
    fn test_position_serialization() {
        let populated_id = MessageIdData {
            ledger_id: 1,
            entry_id: 134,
            batch_index: Some(3),
            partition: Some(-1),
            batch_size: Some(6),

            // We never serialize these fields.
            ack_set: Vec::new(),
            first_chunk_message_id: None,
        };

        let position = msg_id_to_position(&populated_id);
        assert_eq!(
            position.to_string(),
            format!("{:0>20},{:0>20},{:010},,{:010}", 1, 134, 3, 6)
        );
        let retrieved_id = msg_id_from_position(&position)
            .expect("Successfully deserialize message ID from position.");
        assert_eq!(retrieved_id, populated_id);

        let partitioned_id = MessageIdData {
            ledger_id: 1,
            entry_id: 134,
            batch_index: Some(3),
            partition: Some(5),
            batch_size: Some(6),

            // We never serialize these fields.
            ack_set: Vec::new(),
            first_chunk_message_id: None,
        };

        let position = msg_id_to_position(&partitioned_id);
        assert_eq!(
            position.to_string(),
            format!("{:0>20},{:0>20},{:010},{:010},{:010}", 1, 134, 3, 5, 6)
        );
        let retrieved_id = msg_id_from_position(&position)
            .expect("Successfully deserialize message ID from position.");
        assert_eq!(retrieved_id, partitioned_id);

        let sparse_id = MessageIdData {
            ledger_id: 1,
            entry_id: 4,
            batch_index: None,
            partition: Some(-1),
            batch_size: Some(0),

            // We never serialize these fields.
            ack_set: Vec::new(),
            first_chunk_message_id: None,
        };

        let position = msg_id_to_position(&sparse_id);
        assert_eq!(
            position.to_string(),
            format!("{:0>20},{:0>20},,,{:010}", 1, 4, 0)
        );
        let retrieved_id = msg_id_from_position(&position)
            .expect("Successfully deserialize message ID from position.");
        assert_eq!(retrieved_id, sparse_id);
    }

    #[tokio::test]
    async fn test_doc_batching_logic() {
        let topic = append_random_suffix("test-pulsar-source-topic");

        let index_id = append_random_suffix("test-pulsar-source-index");
        let index_uid = IndexUid::new_with_random_ulid(&index_id);
        let (_source_id, source_config) = get_source_config([&topic]);
        let params = if let SourceParams::Pulsar(params) = source_config.clone().source_params {
            params
        } else {
            unreachable!()
        };

        let source_runtime = SourceRuntimeBuilder::new(index_uid, source_config).build();
        let mut pulsar_source = PulsarSource::try_new(source_runtime, params)
            .await
            .expect("Setup pulsar source");

        let position = Position::Beginning;
        let mut batch = BatchBuilder::new(SourceType::Pulsar);
        pulsar_source
            .add_doc_to_batch(&topic, position, Bytes::from_static(b""), &mut batch)
            .expect("Add batch should not error on empty doc.");
        assert_eq!(pulsar_source.state.num_invalid_messages, 1);
        assert_eq!(pulsar_source.state.num_messages_processed, 0);
        assert_eq!(pulsar_source.state.num_bytes_processed, 0);
        assert!(pulsar_source.current_positions.is_empty());
        assert_eq!(batch.num_bytes, 0);
        assert!(batch.docs.is_empty());

        let position = Position::offset(1u64); // Used for testing simplicity.
        let mut batch = BatchBuilder::new(SourceType::Pulsar);
        let doc = Bytes::from_static(b"some-demo-data");
        pulsar_source
            .add_doc_to_batch(&topic, position, doc, &mut batch)
            .expect("Add batch should not error on empty doc.");

        assert_eq!(pulsar_source.state.num_invalid_messages, 1);
        assert_eq!(pulsar_source.state.num_messages_processed, 1);
        assert_eq!(pulsar_source.state.num_bytes_processed, 14);
        assert_eq!(
            pulsar_source.current_positions,
            positions!(topic.as_str() => 1u64)
        );
        assert_eq!(batch.num_bytes, 14);
        assert_eq!(batch.docs.len(), 1);

        let position = Position::offset(4u64); // Used for testing simplicity.
        let mut batch = BatchBuilder::new(SourceType::Pulsar);
        let doc = Bytes::from_static(b"some-demo-data-2");
        pulsar_source
            .add_doc_to_batch(&topic, position, doc, &mut batch)
            .expect("Add batch should not error on empty doc.");
        assert_eq!(pulsar_source.state.num_invalid_messages, 1);
        assert_eq!(pulsar_source.state.num_messages_processed, 2);
        assert_eq!(pulsar_source.state.num_bytes_processed, 30);
        assert_eq!(
            pulsar_source.current_positions,
            positions!(topic.as_str() => 4u64)
        );
        assert_eq!(batch.num_bytes, 16);
        assert_eq!(batch.docs.len(), 1);

        let mut expected_checkpoint_delta = SourceCheckpointDelta::default();
        expected_checkpoint_delta
            .record_partition_delta(
                PartitionId::from(topic.as_str()),
                Position::offset(1u64),
                Position::offset(4u64),
            )
            .unwrap();
        assert_eq!(batch.checkpoint_delta, expected_checkpoint_delta);
    }

    #[tokio::test]
    async fn test_topic_ingestion() {
        let universe = Universe::with_accelerated_time();
        let metastore = metastore_for_test();
        let topic = append_random_suffix("test-pulsar-source--topic-ingestion--topic");

        let index_id = append_random_suffix("test-pulsar-source--topic-ingestion--index");
        let (source_id, source_config) = get_source_config([&topic]);

        let index_uid = setup_index(metastore.clone(), &index_id, &source_config, &[]).await;

        let (source_handle, doc_processor_inbox) = create_source(
            &universe,
            metastore,
            index_uid.clone(),
            source_config,
            SourceCheckpoint::default(),
        )
        .await
        .expect("Create source");

        let expected_docs = populate_topic([&topic], 0..10, message_generator)
            .await
            .unwrap();

        let exit_state = wait_for_completion(
            source_handle,
            expected_docs[0].len(),
            PartitionId::from(topic.clone()),
            expected_docs[0].expected_position.clone(),
        )
        .await;
        let messages: Vec<RawDocBatch> = doc_processor_inbox.drain_for_test_typed();
        assert!(!messages.is_empty());

        let batch = merge_doc_batches(messages);
        assert_eq!(batch.docs, expected_docs[0].messages);
        assert_eq!(
            batch.checkpoint_delta,
            checkpoints!(topic.as_str() => expected_docs[0].expected_position.clone())
        );

        let num_bytes = expected_docs[0].num_bytes();
        let expected_state = json!({
            "index_id": index_id,
            "source_id": source_id,
            "topics": vec![topic],
            "subscription_name": subscription_name(&index_uid, &source_id),
            "consumer_name": CLIENT_NAME,
            "num_bytes_processed": num_bytes,
            "num_messages_processed": 10,
            "num_invalid_messages": 0,
        });
        assert_eq!(exit_state, expected_state);
    }

    #[tokio::test]
    async fn test_multi_topic_ingestion() {
        let universe = Universe::with_accelerated_time();
        let metastore = metastore_for_test();
        let topic1 = append_random_suffix("test-pulsar-source--topic-ingestion--topic");
        let topic2 = append_random_suffix("test-pulsar-source--topic-ingestion--topic");

        let index_id = append_random_suffix("test-pulsar-source--topic-ingestion--index");
        let (source_id, source_config) = get_source_config([&topic1, &topic2]);

        let index_uid = setup_index(metastore.clone(), &index_id, &source_config, &[]).await;

        let (source_handle, doc_processor_inbox) = create_source(
            &universe,
            metastore,
            index_uid.clone(),
            source_config,
            SourceCheckpoint::default(),
        )
        .await
        .expect("Create source");

        let expected_docs = populate_topic([&topic1, &topic2], 0..10, message_generator)
            .await
            .unwrap();

        let mut combined_messages = expected_docs
            .iter()
            .flat_map(|v| &v.messages)
            .cloned()
            .collect::<Vec<_>>();
        combined_messages.sort();

        let exit_state = wait_for_completion(
            source_handle,
            combined_messages.len(),
            PartitionId::from(topic1.clone()),
            expected_docs[0].expected_position.clone(),
        )
        .await;
        let messages: Vec<RawDocBatch> = doc_processor_inbox.drain_for_test_typed();
        assert!(!messages.is_empty());

        let batch = merge_doc_batches(messages);
        assert_eq!(batch.docs, combined_messages);
        assert_eq!(
            batch.checkpoint_delta,
            checkpoints! {
                topic1.as_str() => expected_docs[0].expected_position.clone(),
                topic2.as_str() => expected_docs[1].expected_position.clone(),
            }
        );

        let num_bytes = expected_docs[0].num_bytes() + expected_docs[1].num_bytes();
        let expected_state = json!({
            "index_id": index_id,
            "source_id": source_id,
            "topics": vec![topic1, topic2],
            "subscription_name": subscription_name(&index_uid, &source_id),
            "consumer_name": CLIENT_NAME,
            "num_bytes_processed": num_bytes,
            "num_messages_processed": 20,
            "num_invalid_messages": 0,
        });
        assert_eq!(exit_state, expected_state);
    }

    #[tokio::test]
    async fn test_partitioned_topic_single_consumer_ingestion() {
        let universe = Universe::with_accelerated_time();
        let metastore = metastore_for_test();
        let topic = append_random_suffix("test-pulsar-source--partitioned-single-consumer--topic");

        let index_id =
            append_random_suffix("test-pulsar-source--partitioned-single-consumer--index");
        let (source_id, source_config) = get_source_config([&topic]);

        create_partitioned_topic(&topic, 2).await;
        let index_uid = setup_index(metastore.clone(), &index_id, &source_config, &[]).await;

        let (source_handle, doc_processor_inbox) = create_source(
            &universe,
            metastore,
            index_uid.clone(),
            source_config,
            SourceCheckpoint::default(),
        )
        .await
        .expect("Create source");

        let expected_docs = populate_topic([&topic], 0..10, message_generator)
            .await
            .unwrap();

        let exit_state = wait_for_completion(
            source_handle,
            expected_docs.len(),
            PartitionId::from(topic.clone()),
            expected_docs[0].expected_position.clone(),
        )
        .await;
        let messages: Vec<RawDocBatch> = doc_processor_inbox.drain_for_test_typed();
        assert!(!messages.is_empty());

        let batch = merge_doc_batches(messages);
        assert_eq!(batch.docs, expected_docs[0].messages);

        let num_bytes = expected_docs[0].num_bytes();
        let expected_state = json!({
            "index_id": index_id,
            "source_id": source_id,
            "topics": vec![topic],
            "subscription_name": subscription_name(&index_uid, &source_id),
            "consumer_name": CLIENT_NAME,
            "num_bytes_processed": num_bytes,
            "num_messages_processed": 10,
            "num_invalid_messages": 0,
        });
        assert_eq!(exit_state, expected_state);
    }

    #[tokio::test]
    async fn test_partitioned_topic_multi_consumer_ingestion() {
        let universe = Universe::with_accelerated_time();
        let metastore = metastore_for_test();
        let topic = append_random_suffix("test-pulsar-source--partitioned-multi-consumer--topic");

        let index_id =
            append_random_suffix("test-pulsar-source--partitioned-multi-consumer--index");
        let (source_id, source_config) = get_source_config([&topic]);

        create_partitioned_topic(&topic, 2).await;
        let index_uid = setup_index(metastore.clone(), &index_id, &source_config, &[]).await;

        let topic_partition_1 = format!("{topic}-partition-0");
        let topic_partition_2 = format!("{topic}-partition-1");

        let (source_handle1, doc_processor_inbox1) = create_source(
            &universe,
            metastore.clone(),
            index_uid.clone(),
            source_config.clone(),
            SourceCheckpoint::default(),
        )
        .await
        .expect("Create source");

        let (source_handle2, doc_processor_inbox2) = create_source(
            &universe,
            metastore,
            index_uid.clone(),
            source_config,
            SourceCheckpoint::default(),
        )
        .await
        .expect("Create source");

        let expected_docs = populate_topic(
            [&topic_partition_1, &topic_partition_2],
            0..10,
            message_generator,
        )
        .await
        .unwrap();

        let exit_state1 = wait_for_completion(
            source_handle1,
            10,
            PartitionId::from(topic_partition_1.clone()),
            expected_docs[0].expected_position.clone(),
        )
        .await;
        let exit_state2 = wait_for_completion(
            source_handle2,
            10,
            PartitionId::from(topic_partition_2.clone()),
            expected_docs[1].expected_position.clone(),
        )
        .await;
        let messages1: Vec<RawDocBatch> = doc_processor_inbox1.drain_for_test_typed();
        assert!(!messages1.is_empty());
        let messages2: Vec<RawDocBatch> = doc_processor_inbox2.drain_for_test_typed();
        assert!(!messages2.is_empty());

        let batch1 = merge_doc_batches(messages1);
        assert_eq!(batch1.docs, expected_docs[0].messages);

        let batch2 = merge_doc_batches(messages2);
        assert_eq!(batch2.docs, expected_docs[1].messages);

        let num_bytes = expected_docs[1].num_bytes();
        let expected_state = json!({
            "index_id": index_id,
            "source_id": source_id,
            "topics": vec![topic],
            "subscription_name": subscription_name(&index_uid, &source_id),
            "consumer_name": CLIENT_NAME,
            "num_bytes_processed": num_bytes,
            "num_messages_processed": 10,
            "num_invalid_messages": 0,
        });
        assert_eq!(exit_state1, expected_state);
        assert_eq!(exit_state2, expected_state);
    }

    #[tokio::test]
    async fn test_partitioned_topic_multi_consumer_ingestion_with_failover() {
        // We test successive failures of one source and observe pulsar failover mechanism.
        quickwit_common::setup_logging_for_tests();
        let universe = Universe::new();
        let metastore = metastore_for_test();
        let topic =
            append_random_suffix("test-pulsar-source--partitioned-multi-consumer-failure--topic");

        let index_id =
            append_random_suffix("test-pulsar-source--partitioned-multi-consumer-failure--index");
        let (_, source_config) = get_source_config([&topic]);

        create_partitioned_topic(&topic, 2).await;
        let index_uid = setup_index(metastore.clone(), &index_id, &source_config, &[]).await;

        let topic_partition_1 = format!("{topic}-partition-0");
        let topic_partition_2 = format!("{topic}-partition-1");

        let (_source_handle1, doc_processor_inbox1) = create_source(
            &universe,
            metastore.clone(),
            index_uid.clone(),
            source_config.clone(),
            SourceCheckpoint::default(),
        )
        .await
        .expect("Create source");

        // Send 10 messages on each topic and kill the source 5 times.
        for idx in 0..5 {
            let (source_handle2, _) = create_source(
                &universe,
                metastore.clone(),
                index_uid.clone(),
                source_config.clone(),
                SourceCheckpoint::default(),
            )
            .await
            .expect("Create source");
            populate_topic(
                [&topic_partition_1, &topic_partition_2],
                idx * 10..(idx + 1) * 10,
                message_generator,
            )
            .await
            .unwrap();
            tokio::time::sleep(*HEARTBEAT * 5).await;
            source_handle2.kill().await;
        }

        let messages1: Vec<RawDocBatch> = doc_processor_inbox1.drain_for_test_typed();
        assert!(!messages1.is_empty());
        let num_docs_sent_to_doc_processor: usize =
            messages1.iter().map(|batch| batch.docs.len()).sum();
        assert_eq!(100, num_docs_sent_to_doc_processor);
        // Check that we have received all the messages without duplicates.
        assert_eq!(100, count_unique_messages_in_batches(&messages1));
        universe.assert_quit().await;
    }
}


================================================
FILE: quickwit/quickwit-indexing/src/source/queue_sources/coordinator.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::fmt;
use std::sync::Arc;
use std::time::Duration;

use itertools::Itertools;
use quickwit_actors::{ActorExitStatus, Mailbox};
use quickwit_common::rate_limited_error;
use quickwit_config::{FileSourceMessageType, FileSourceSqs};
use quickwit_metastore::checkpoint::SourceCheckpoint;
use quickwit_proto::indexing::IndexingPipelineId;
use quickwit_proto::metastore::SourceType;
use quickwit_proto::types::SourceUid;
use quickwit_storage::StorageResolver;
use serde::Serialize;
use ulid::Ulid;

use super::Queue;
use super::helpers::QueueReceiver;
use super::local_state::QueueLocalState;
use super::message::{MessageType, PreProcessingError, ReadyMessage};
use super::shared_state::{QueueSharedState, checkpoint_messages};
use super::visibility::{VisibilitySettings, spawn_visibility_task};
use crate::actors::DocProcessor;
use crate::models::{NewPublishLock, NewPublishToken, PublishLock};
use crate::source::{SourceContext, SourceRuntime};

/// Maximum duration that the `emit_batches()` callback can wait for
/// `queue.receive()` calls. If too small, the actor loop will spin
/// un-necessarily. If too large, the actor loop will be slow to react to new
/// messages (or shutdown).
pub const RECEIVE_POLL_TIMEOUT: Duration = Duration::from_millis(500);

#[derive(Default, Serialize)]
pub struct QueueCoordinatorObservableState {
    /// Number of bytes processed by the source.
    pub num_bytes_processed: u64,
    /// Number of lines processed by the source.
    pub num_lines_processed: u64,
    /// Number of messages processed by the source.
    pub num_messages_processed: u64,
    /// Number of messages that could not be pre-processed.
    pub num_messages_failed_preprocessing: u64,
    /// Number of messages that could not be moved to in-progress.
    pub num_messages_failed_opening: u64,
}

/// The `QueueCoordinator` fetches messages from a queue, converts them into
/// record batches, and tracks the messages' state until their entire content is
/// published. Its API closely resembles the [`crate::source::Source`] trait,
/// making the implementation of queue sources straightforward.
pub struct QueueCoordinator {
    storage_resolver: StorageResolver,
    pipeline_id: IndexingPipelineId,
    source_type: SourceType,
    queue: Arc<dyn Queue>,
    queue_receiver: QueueReceiver,
    observable_state: QueueCoordinatorObservableState,
    message_type: MessageType,
    publish_lock: PublishLock,
    shared_state: QueueSharedState,
    local_state: QueueLocalState,
    publish_token: String,
    visibility_settings: VisibilitySettings,
}

impl fmt::Debug for QueueCoordinator {
    fn fmt(&self, formatter: &mut fmt::Formatter) -> fmt::Result {
        formatter
            .debug_struct("QueueTracker")
            .field("index_id", &self.pipeline_id.index_uid.index_id)
            .field("queue", &self.queue)
            .finish()
    }
}

impl QueueCoordinator {
    pub fn new(
        source_runtime: SourceRuntime,
        queue: Arc<dyn Queue>,
        message_type: MessageType,
        shard_max_age: Option<Duration>,
        shard_max_count: Option<u32>,
        shard_pruning_interval: Duration,
    ) -> Self {
        Self {
            shared_state: QueueSharedState::new(
                source_runtime.metastore,
                SourceUid {
                    index_uid: source_runtime.pipeline_id.index_uid.clone(),
                    source_id: source_runtime.pipeline_id.source_id.clone(),
                },
                Duration::from_secs(2 * source_runtime.indexing_setting.commit_timeout_secs as u64),
                shard_max_age,
                shard_max_count,
                shard_pruning_interval,
            ),
            local_state: QueueLocalState::default(),
            pipeline_id: source_runtime.pipeline_id,
            source_type: source_runtime.source_config.source_type(),
            storage_resolver: source_runtime.storage_resolver,
            queue_receiver: QueueReceiver::new(queue.clone(), RECEIVE_POLL_TIMEOUT),
            queue,
            observable_state: QueueCoordinatorObservableState::default(),
            message_type,
            publish_lock: PublishLock::default(),
            publish_token: Ulid::new().to_string(),
            visibility_settings: VisibilitySettings::from_commit_timeout(
                source_runtime.indexing_setting.commit_timeout_secs,
            ),
        }
    }

    #[cfg(feature = "sqs")]
    pub async fn try_from_sqs_config(
        config: FileSourceSqs,
        source_runtime: SourceRuntime,
    ) -> anyhow::Result<Self> {
        use super::sqs_queue::SqsQueue;
        let queue = SqsQueue::try_new(config.queue_url).await?;
        let message_type = match config.message_type {
            FileSourceMessageType::S3Notification => MessageType::S3Notification,
            FileSourceMessageType::RawUri => MessageType::RawUri,
        };
        let shard_max_age = Duration::from_secs(config.deduplication_window_duration_secs as u64);
        Ok(QueueCoordinator::new(
            source_runtime,
            Arc::new(queue),
            message_type,
            Some(shard_max_age),
            Some(config.deduplication_window_max_messages),
            Duration::from_secs(config.deduplication_cleanup_interval_secs as u64),
        ))
    }

    pub async fn initialize(
        &mut self,
        doc_processor_mailbox: &Mailbox<DocProcessor>,
        ctx: &SourceContext,
    ) -> Result<(), ActorExitStatus> {
        let publish_lock = self.publish_lock.clone();
        ctx.send_message(doc_processor_mailbox, NewPublishLock(publish_lock))
            .await?;
        ctx.send_message(
            doc_processor_mailbox,
            NewPublishToken(self.publish_token.clone()),
        )
        .await?;
        Ok(())
    }

    /// Polls messages from the queue and prepares them for processing
    async fn poll_messages(&mut self, ctx: &SourceContext) -> Result<(), ActorExitStatus> {
        let raw_messages = self
            .queue_receiver
            .receive(1, self.visibility_settings.deadline_for_receive)
            .await?;

        let mut format_errors = Vec::new();
        let mut discardable_ack_ids = Vec::new();
        let mut preprocessed_messages = Vec::new();
        for message in raw_messages {
            match message.pre_process(self.message_type) {
                Ok(preprocessed_message) => preprocessed_messages.push(preprocessed_message),
                Err(PreProcessingError::UnexpectedFormat(err)) => format_errors.push(err),
                Err(PreProcessingError::Discardable { ack_id }) => discardable_ack_ids.push(ack_id),
            }
        }
        if !format_errors.is_empty() {
            self.observable_state.num_messages_failed_preprocessing += format_errors.len() as u64;
            rate_limited_error!(
                limit_per_min = 10,
                count = format_errors.len(),
                last_err = ?format_errors.last().unwrap(),
                "invalid messages not processed, use a dead letter queue to limit retries"
            );
        }
        if preprocessed_messages.is_empty() {
            self.queue.acknowledge(&discardable_ack_ids).await?;
            return Ok(());
        }

        // in rare situations, there might be duplicates within a batch
        let deduplicated_messages = preprocessed_messages
            .into_iter()
            .unique_by(|x| x.partition_id());

        let mut untracked_locally = Vec::new();
        let mut already_completed = Vec::new();
        for message in deduplicated_messages {
            let partition_id = message.partition_id();
            if self.local_state.is_completed(&partition_id) {
                already_completed.push(message);
            } else if !self.local_state.is_tracked(&partition_id) {
                untracked_locally.push(message);
            }
        }

        let checkpointed_messages = checkpoint_messages(
            &mut self.shared_state,
            &self.publish_token,
            untracked_locally,
        )
        .await?;

        let mut ready_messages = Vec::new();
        for (message, position) in checkpointed_messages {
            if position.is_eof() {
                self.local_state.mark_completed(message.partition_id());
                already_completed.push(message);
            } else {
                ready_messages.push(ReadyMessage {
                    visibility_handle: spawn_visibility_task(
                        ctx,
                        self.queue.clone(),
                        message.metadata.ack_id.clone(),
                        message.metadata.initial_deadline,
                        self.visibility_settings.clone(),
                    ),
                    content: message,
                    position,
                })
            }
        }

        self.local_state.set_ready_for_read(ready_messages);

        // Acknowledge messages that already have been processed
        let mut ack_ids = already_completed
            .iter()
            .map(|msg| msg.metadata.ack_id.clone())
            .collect::<Vec<_>>();
        ack_ids.append(&mut discardable_ack_ids);
        self.queue.acknowledge(&ack_ids).await?;

        Ok(())
    }

    pub async fn emit_batches(
        &mut self,
        doc_processor_mailbox: &Mailbox<DocProcessor>,
        ctx: &SourceContext,
    ) -> Result<Duration, ActorExitStatus> {
        if let Some(in_progress_ref) = self.local_state.read_in_progress_mut() {
            // TODO: should we kill the publish lock if the message visibility extension failed?
            let batch_builder = in_progress_ref
                .batch_reader
                .read_batch(ctx.progress(), self.source_type)
                .await?;
            self.observable_state.num_lines_processed += batch_builder.docs.len() as u64;
            self.observable_state.num_bytes_processed += batch_builder.num_bytes;
            doc_processor_mailbox
                .send_message(batch_builder.build())
                .await?;
            if in_progress_ref.batch_reader.is_eof() {
                self.local_state.drop_currently_read().await?;
                self.observable_state.num_messages_processed += 1;
            }
        } else if let Some(ready_message) = self.local_state.get_ready_for_read() {
            match ready_message.start_processing(&self.storage_resolver).await {
                Ok(new_in_progress) => {
                    self.local_state.set_currently_read(new_in_progress)?;
                }
                Err(err) => {
                    self.observable_state.num_messages_failed_opening += 1;
                    rate_limited_error!(
                        limit_per_min = 5,
                        err = ?err,
                        "failed to start message processing"
                    );
                }
            }
        } else {
            self.poll_messages(ctx).await?;
        }

        Ok(Duration::ZERO)
    }

    pub async fn suggest_truncate(
        &mut self,
        checkpoint: SourceCheckpoint,
        _ctx: &SourceContext,
    ) -> anyhow::Result<()> {
        let committed_partition_ids = checkpoint
            .iter()
            .filter(|(_, pos)| pos.is_eof())
            .map(|(pid, _)| pid)
            .collect::<Vec<_>>();
        let mut completed = Vec::new();
        for partition_id in committed_partition_ids {
            let ack_id_opt = self.local_state.mark_completed(partition_id);
            if let Some(ack_id) = ack_id_opt {
                completed.push(ack_id);
            }
        }
        self.queue.acknowledge(&completed).await
    }

    pub fn observable_state(&self) -> &QueueCoordinatorObservableState {
        &self.observable_state
    }
}

#[cfg(test)]
mod tests {
    use std::str::FromStr;

    use quickwit_actors::{ActorContext, Universe};
    use quickwit_common::uri::Uri;
    use quickwit_proto::types::{NodeId, PipelineUid, Position};
    use tokio::sync::watch;
    use ulid::Ulid;

    use super::*;
    use crate::models::RawDocBatch;
    use crate::source::doc_file_reader::file_test_helpers::{DUMMY_DOC, generate_dummy_doc_file};
    use crate::source::queue_sources::memory_queue::MemoryQueueForTests;
    use crate::source::queue_sources::message::PreProcessedPayload;
    use crate::source::queue_sources::shared_state::shared_state_for_tests::init_state;
    use crate::source::{BATCH_NUM_BYTES_LIMIT, SourceActor};

    fn setup_coordinator(
        queue: Arc<MemoryQueueForTests>,
        shared_state: QueueSharedState,
    ) -> QueueCoordinator {
        let pipeline_id = IndexingPipelineId {
            node_id: NodeId::from_str("test-node").unwrap(),
            index_uid: shared_state.source_uid.index_uid.clone(),
            source_id: shared_state.source_uid.source_id.clone(),
            pipeline_uid: PipelineUid::random(),
        };

        QueueCoordinator {
            local_state: QueueLocalState::default(),
            shared_state,
            pipeline_id,
            observable_state: QueueCoordinatorObservableState::default(),
            publish_lock: PublishLock::default(),
            // set a very high chunking timeout to make it possible to count the
            // number of iterations required to process messages
            queue_receiver: QueueReceiver::new(queue.clone(), Duration::from_secs(10)),
            queue,
            message_type: MessageType::RawUri,
            source_type: SourceType::Unspecified,
            storage_resolver: StorageResolver::for_test(),
            publish_token: Ulid::new().to_string(),
            visibility_settings: VisibilitySettings::from_commit_timeout(5),
        }
    }

    async fn process_messages(
        coordinator: &mut QueueCoordinator,
        queue: Arc<MemoryQueueForTests>,
        messages: &[(&Uri, &str)],
    ) -> Vec<RawDocBatch> {
        let universe = Universe::with_accelerated_time();
        let (source_mailbox, _source_inbox) = universe.create_test_mailbox::<SourceActor>();
        let (doc_processor_mailbox, doc_processor_inbox) =
            universe.create_test_mailbox::<DocProcessor>();
        let (observable_state_tx, _observable_state_rx) = watch::channel(serde_json::Value::Null);
        let ctx: SourceContext =
            ActorContext::for_test(&universe, source_mailbox, observable_state_tx);

        coordinator
            .initialize(&doc_processor_mailbox, &ctx)
            .await
            .unwrap();

        coordinator
            .emit_batches(&doc_processor_mailbox, &ctx)
            .await
            .unwrap();

        for (uri, ack_id) in messages {
            queue.send_message(uri.to_string(), ack_id);
        }

        // Need 3 iterations for each msg to emit the first batch (receive,
        // start, emit), assuming the `QueueReceiver` doesn't chunk the receive
        // future.
        for _ in 0..(messages.len() * 4) {
            coordinator
                .emit_batches(&doc_processor_mailbox, &ctx)
                .await
                .unwrap();
        }

        let batches = doc_processor_inbox
            .drain_for_test()
            .into_iter()
            .flat_map(|box_any| box_any.downcast::<RawDocBatch>().ok())
            .map(|box_raw_doc_batch| *box_raw_doc_batch)
            .collect::<Vec<_>>();
        universe.assert_quit().await;
        batches
    }

    #[tokio::test]
    async fn test_process_empty_queue() {
        let queue = Arc::new(MemoryQueueForTests::new());
        let shared_state = init_state("test-index", Default::default());
        let mut coordinator = setup_coordinator(queue.clone(), shared_state);
        let batches = process_messages(&mut coordinator, queue, &[]).await;
        assert_eq!(batches.len(), 0);
    }

    #[tokio::test]
    async fn test_process_one_small_message() {
        let queue = Arc::new(MemoryQueueForTests::new());
        let shared_state = init_state("test-index", Default::default());
        let mut coordinator = setup_coordinator(queue.clone(), shared_state.clone());
        let (dummy_doc_file, _) = generate_dummy_doc_file(false, 10).await;
        let test_uri = Uri::from_str(dummy_doc_file.path().to_str().unwrap()).unwrap();
        let partition_id = PreProcessedPayload::ObjectUri(test_uri.clone()).partition_id();
        let batches = process_messages(&mut coordinator, queue, &[(&test_uri, "ack-id")]).await;
        assert_eq!(batches.len(), 1);
        assert_eq!(batches[0].docs.len(), 10);
        assert!(coordinator.local_state.is_awaiting_commit(&partition_id));
    }

    #[tokio::test]
    async fn test_process_one_big_message() {
        let queue = Arc::new(MemoryQueueForTests::new());
        let shared_state = init_state("test-index", Default::default());
        let mut coordinator = setup_coordinator(queue.clone(), shared_state);
        let lines = BATCH_NUM_BYTES_LIMIT as usize / DUMMY_DOC.len() + 1;
        let (dummy_doc_file, _) = generate_dummy_doc_file(true, lines).await;
        let test_uri = Uri::from_str(dummy_doc_file.path().to_str().unwrap()).unwrap();
        let batches = process_messages(&mut coordinator, queue, &[(&test_uri, "ack-id")]).await;
        assert_eq!(batches.len(), 2);
        assert_eq!(batches.iter().map(|b| b.docs.len()).sum::<usize>(), lines);
    }

    #[tokio::test]
    async fn test_process_two_messages_different_compression() {
        let queue = Arc::new(MemoryQueueForTests::new());
        let shared_state = init_state("test-index", Default::default());
        let mut coordinator = setup_coordinator(queue.clone(), shared_state);
        let (dummy_doc_file_1, _) = generate_dummy_doc_file(false, 10).await;
        let test_uri_1 = Uri::from_str(dummy_doc_file_1.path().to_str().unwrap()).unwrap();
        let (dummy_doc_file_2, _) = generate_dummy_doc_file(true, 10).await;
        let test_uri_2 = Uri::from_str(dummy_doc_file_2.path().to_str().unwrap()).unwrap();
        let batches = process_messages(
            &mut coordinator,
            queue,
            &[(&test_uri_1, "ack-id-1"), (&test_uri_2, "ack-id-2")],
        )
        .await;
        // could be generated in 1 or 2 batches, it doesn't matter
        assert_eq!(batches.iter().map(|b| b.docs.len()).sum::<usize>(), 20);
    }

    #[tokio::test]
    async fn test_process_local_duplicate_message() {
        let queue = Arc::new(MemoryQueueForTests::new());
        let shared_state = init_state("test-index", Default::default());
        let mut coordinator = setup_coordinator(queue.clone(), shared_state);
        let (dummy_doc_file, _) = generate_dummy_doc_file(false, 10).await;
        let test_uri = Uri::from_str(dummy_doc_file.path().to_str().unwrap()).unwrap();
        let batches = process_messages(
            &mut coordinator,
            queue,
            &[(&test_uri, "ack-id-1"), (&test_uri, "ack-id-2")],
        )
        .await;
        assert_eq!(batches.len(), 1);
        assert_eq!(batches.iter().map(|b| b.docs.len()).sum::<usize>(), 10);
    }

    #[tokio::test]
    async fn test_process_shared_complete_message() {
        let (dummy_doc_file, file_size) = generate_dummy_doc_file(false, 10).await;
        let test_uri = Uri::from_str(dummy_doc_file.path().to_str().unwrap()).unwrap();
        let partition_id = PreProcessedPayload::ObjectUri(test_uri.clone()).partition_id();

        let queue = Arc::new(MemoryQueueForTests::new());
        let shared_state = init_state(
            "test-index",
            &[(
                partition_id.clone(),
                (
                    "existing_token".to_string(),
                    Position::eof(file_size),
                    false,
                ),
            )],
        );
        let mut coordinator = setup_coordinator(queue.clone(), shared_state.clone());

        assert!(!coordinator.local_state.is_tracked(&partition_id));
        let batches = process_messages(&mut coordinator, queue, &[(&test_uri, "ack-id-1")]).await;
        assert_eq!(batches.len(), 0);
        assert!(coordinator.local_state.is_completed(&partition_id));
    }

    #[tokio::test]
    async fn test_process_existing_messages() {
        let (dummy_doc_file_1, _) = generate_dummy_doc_file(false, 10).await;
        let test_uri_1 = Uri::from_str(dummy_doc_file_1.path().to_str().unwrap()).unwrap();
        let partition_id_1 = PreProcessedPayload::ObjectUri(test_uri_1.clone()).partition_id();

        let (dummy_doc_file_2, _) = generate_dummy_doc_file(false, 10).await;
        let test_uri_2 = Uri::from_str(dummy_doc_file_2.path().to_str().unwrap()).unwrap();
        let partition_id_2 = PreProcessedPayload::ObjectUri(test_uri_2.clone()).partition_id();

        let (dummy_doc_file_3, _) = generate_dummy_doc_file(false, 10).await;
        let test_uri_3 = Uri::from_str(dummy_doc_file_3.path().to_str().unwrap()).unwrap();
        let partition_id_3 = PreProcessedPayload::ObjectUri(test_uri_3.clone()).partition_id();

        let queue = Arc::new(MemoryQueueForTests::new());
        let shared_state = init_state(
            "test-index",
            &[
                (
                    partition_id_1.clone(),
                    ("existing_token_1".to_string(), Position::Beginning, true),
                ),
                (
                    partition_id_2.clone(),
                    (
                        "existing_token_2".to_string(),
                        Position::offset((DUMMY_DOC.len() + 1) * 2),
                        true,
                    ),
                ),
                (
                    partition_id_3.clone(),
                    (
                        "existing_token_3".to_string(),
                        Position::offset((DUMMY_DOC.len() + 1) * 6),
                        false, // should not be processed because not stale yet
                    ),
                ),
            ],
        );
        let mut coordinator = setup_coordinator(queue.clone(), shared_state.clone());
        let batches = process_messages(
            &mut coordinator,
            queue,
            &[
                (&test_uri_1, "ack-id-1"),
                (&test_uri_2, "ack-id-2"),
                (&test_uri_3, "ack-id-3"),
            ],
        )
        .await;
        assert_eq!(batches.len(), 2);
        assert_eq!(batches.iter().map(|b| b.docs.len()).sum::<usize>(), 18);
        assert!(coordinator.local_state.is_awaiting_commit(&partition_id_1));
        assert!(coordinator.local_state.is_awaiting_commit(&partition_id_2));
    }

    #[tokio::test]
    async fn test_process_multiple_coordinator() {
        let queue = Arc::new(MemoryQueueForTests::new());
        let shared_state = init_state("test-index", Default::default());
        let mut coord_1 = setup_coordinator(queue.clone(), shared_state.clone());
        let mut coord_2 = setup_coordinator(queue.clone(), shared_state.clone());
        let (dummy_doc_file, _) = generate_dummy_doc_file(false, 10).await;
        let test_uri = Uri::from_str(dummy_doc_file.path().to_str().unwrap()).unwrap();
        let partition_id = PreProcessedPayload::ObjectUri(test_uri.clone()).partition_id();

        let batches_1 = process_messages(&mut coord_1, queue.clone(), &[(&test_uri, "ack1")]).await;
        let batches_2 = process_messages(&mut coord_2, queue, &[(&test_uri, "ack2")]).await;

        assert_eq!(batches_1.len(), 1);
        assert_eq!(batches_1[0].docs.len(), 10);
        assert!(coord_1.local_state.is_awaiting_commit(&partition_id));
        // proc_2 learns from shared state that the message is likely still
        // being processed and skips it
        assert_eq!(batches_2.len(), 0);
        assert!(!coord_2.local_state.is_tracked(&partition_id));
    }
}


================================================
FILE: quickwit/quickwit-indexing/src/source/queue_sources/design.md
================================================
# Queue source design

## Exactly once

Besides the usual failures that can happen during indexing, most queues are also subject to duplicates. To ensure that all object files are indexed exactly once, we track the progress of their indexing using the shard table:
- each file object is tracked as a shard, the file URI is the shard ID
- progress made on the indexing of a given shard is committed in the shard table in a common transaction with the split publishing
- after some time (called deduplication window) shards are garbage collected to keep the size of the shard table small

## Visibility extension task

To keep messages invisible to other pipelines while they are being processed, each received message spawns a visibility extension task. This task is responsible of extending the visibility timeout each time the visibility deadlines approaches. When the last batch is read for the message and sent to the indexing pipeline:
- a last visibility extension is requested to give time for the indexing to complete (typically twice the commit timeout) 
- the visibility extension task stopped

## Cleanup of old shards

Garbage collection is owned by the queue based sources. Each pipeline with a queue source will spawn a garbage collection task. To avoid having an increased load on the metastore as the number of pipeline scales, garbage collection calls are debounced by the control plane.

## Onboarding new queues

This module is meant to be generic enough to:
- use other queue implementations, such as GCP Pub/Sub
- source the data from other sources than object storage, e.g directly from the message

Note that because every single messages is tracked by the metastore, this design will not behave well with high message rates. For instance it is not meant to be efficient with a data stream where every message contains a single event. As a rule of thumb, to protect the metastore, it is discouraged to try processing more than 50 messages per second with this design. This means that high throughput can only be achieved with larger contents for each message (e.g larger files when the using the file source with queue notifications).

## Implementation

The `QueueCoordinator` is a concrete implementation of the machinery necessary to consume data from a queue, from the message reception to its acknowledgment after indexing. The `QueueCoordinator` interacts with 3 main components.

### The `Queue`

The `Queue` is an abstract interface that can represent any queue implementation (AWS SQS, Google Pub/Sub...). It is sufficient that the queue guaranties at least one delivery of its messages. The abstraction reduces the actual queue's API surface to 3 main functions:
- receive messages that are ready to be processed
- extend their visibility timeout, i.e delay the time at which a message is visible again to other consumers
- acknowledge messages, i.e delete them definitively from the queue after successful indexing

### The `QueueLocalState`

The local state is an in memory data structure that keeps track of the knowledge that the current source has of recently received messages. It manages the transitions of messages between 4 states:
- ready for read
- read in progress
- awaiting commit
- completed


### The `QueueSharedState`

The shared state is a client of the Shard API, a metastore API that was mainly designed to serve ingest V2. The Shard API improves on the previous checkpoint API which was stored as a blob in one of the fields of the index model. The flow is the following one:

The queue source opens a shard, using an ID that uniquely identifies the content of the message as shard ID. For the file source, the shard ID is the file URI. Each source has a unique publish token that is provided in the `OpenShards` metastore request. The response of the `OpenShards` requests returns the token of the caller that called the API first. Either:
- The returned token matches the current pipeline's token. This means that we have the ownership of this message content and can proceed with its indexing
- The returned token does not match the current pipeline's token. This means that another pipeline has the ownership. In that case, we look at the content of the shard:
  - if it's already completely processed (EOF), we acknowledge the message drop it
  - if its last update timestamp is old (e.g twice the commit timeout), we assume the processing of the content to be stale (e.g the owning pipeline failed). We perform an `AcquireShards` call to update the shard's token in the metastore with the local one. This indicates subsequent attempts to process the shard that this pipeline now has its ownership. Note though that this is subject to a race conditions: 2 pipelines might acquire the shard concurrently. In that case both pipelines will assume that it owns the shard, and one of them will fail at commit time.
  - if its last update timestamp is recent, we assume that the processing of the content is still in progress in another pipeline. We just drop the message (without any acknowledgment) and let it be re-processed once its visibility timeout expires.

The `QueueSharedState` also owns the background task that will periodically initiate a call to `PruneShards` to garbage collect old shards.


================================================
FILE: quickwit/quickwit-indexing/src/source/queue_sources/helpers.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::sync::Arc;
use std::time::Duration;

use futures::future::BoxFuture;

use super::Queue;
use super::message::RawMessage;

type ReceiveResult = anyhow::Result<Vec<RawMessage>>;

/// A statefull wrapper around a `Queue` that chunks the slow `receive()` call
/// into shorter iterations. This enables yielding back to the actor system
/// without compromising on queue poll durations. Without this, an actor that
/// tries to receive messages from a `Queue` will be blocked for multiple seconds
/// before being able to process new mailbox messages (or shutting down).
pub struct QueueReceiver {
    queue: Arc<dyn Queue>,
    receive: Option<BoxFuture<'static, ReceiveResult>>,
    iteration: Duration,
}

impl QueueReceiver {
    pub fn new(queue: Arc<dyn Queue>, iteration: Duration) -> Self {
        Self {
            queue,
            receive: None,
            iteration,
        }
    }

    pub async fn receive(
        &mut self,
        max_messages: usize,
        suggested_deadline: Duration,
    ) -> anyhow::Result<Vec<RawMessage>> {
        if self.receive.is_none() {
            self.receive = Some(self.queue.clone().receive(max_messages, suggested_deadline));
        }
        tokio::select! {
            res = self.receive.as_mut().unwrap() => {
                self.receive = None;
                res
            }
            _ = tokio::time::sleep(self.iteration) => {
                Ok(Vec::new())
            }

        }
    }
}

#[cfg(test)]
mod tests {
    use std::time::{Duration, Instant};

    use anyhow::bail;
    use async_trait::async_trait;

    use super::*;

    #[derive(Clone, Debug)]
    struct SleepyQueue {
        receive_sleep: Duration,
    }

    #[async_trait]
    impl Queue for SleepyQueue {
        async fn receive(
            self: Arc<Self>,
            _max_messages: usize,
            _suggested_deadline: Duration,
        ) -> anyhow::Result<Vec<RawMessage>> {
            tokio::time::sleep(self.receive_sleep).await;
            bail!("Waking up from my nap")
        }

        async fn acknowledge(&self, _ack_ids: &[String]) -> anyhow::Result<()> {
            unimplemented!()
        }

        async fn modify_deadlines(
            &self,
            _ack_id: &str,
            _suggested_deadline: Duration,
        ) -> anyhow::Result<Instant> {
            unimplemented!()
        }
    }

    #[tokio::test]
    async fn test_queue_receiver_slow_receive() {
        let queue = Arc::new(SleepyQueue {
            receive_sleep: Duration::from_millis(100),
        });
        let mut receiver = QueueReceiver::new(queue, Duration::from_millis(20));
        let mut iterations = 0;
        while receiver.receive(1, Duration::from_secs(1)).await.is_ok() {
            iterations += 1;
        }
        assert!(iterations >= 4);
    }

    #[tokio::test]
    async fn test_queue_receiver_fast_receive() {
        let queue = Arc::new(SleepyQueue {
            receive_sleep: Duration::from_millis(10),
        });
        let mut receiver = QueueReceiver::new(queue, Duration::from_millis(50));
        assert!(receiver.receive(1, Duration::from_secs(1)).await.is_err());
    }
}


================================================
FILE: quickwit/quickwit-indexing/src/source/queue_sources/local_state.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::{BTreeMap, BTreeSet, VecDeque};

use anyhow::bail;
use quickwit_metastore::checkpoint::PartitionId;

use super::message::{InProgressMessage, ReadyMessage};

/// Tracks the state of the queue messages that are known to the owning indexing
/// pipeline.
///
/// Messages first land in the `ready_for_read` queue. They are then moved to
/// `read_in_progress` to track the reader's progress. Once the reader reaches
/// EOF, the message is transitioned as `awaiting_commit`. Once the message is
/// known to be fully indexed and committed (e.g after receiving the
/// `suggest_truncate` call), it is moved to `completed`.
#[derive(Default)]
pub struct QueueLocalState {
    /// Messages that were received from the queue and are ready to be read
    ready_for_read: VecDeque<ReadyMessage>,
    /// Message that is currently being read and sent to the `DocProcessor`
    read_in_progress: Option<InProgressMessage>,
    /// Partitions that were read and are still being indexed, with their
    /// associated ack_id
    awaiting_commit: BTreeMap<PartitionId, String>,
    /// Partitions that were fully indexed and committed
    completed: BTreeSet<PartitionId>,
}

impl QueueLocalState {
    pub fn is_ready_for_read(&self, partition_id: &PartitionId) -> bool {
        self.ready_for_read
            .iter()
            .any(|msg| &msg.partition_id() == partition_id)
    }

    pub fn is_read_in_progress(&self, partition_id: &PartitionId) -> bool {
        self.read_in_progress
            .as_ref()
            .map(|msg| &msg.partition_id == partition_id)
            .unwrap_or(false)
    }

    pub fn is_awaiting_commit(&self, partition_id: &PartitionId) -> bool {
        self.awaiting_commit.contains_key(partition_id)
    }

    pub fn is_completed(&self, partition_id: &PartitionId) -> bool {
        self.completed.contains(partition_id)
    }

    pub fn is_tracked(&self, partition_id: &PartitionId) -> bool {
        self.is_ready_for_read(partition_id)
            || self.is_read_in_progress(partition_id)
            || self.is_awaiting_commit(partition_id)
            || self.is_completed(partition_id)
    }

    pub fn set_ready_for_read(&mut self, ready_messages: Vec<ReadyMessage>) {
        for message in ready_messages {
            self.ready_for_read.push_back(message)
        }
    }

    pub fn get_ready_for_read(&mut self) -> Option<ReadyMessage> {
        while let Some(msg) = self.ready_for_read.pop_front() {
            // don't return messages for which we didn't manage to extend the
            // visibility, they will pop up in the queue again anyway
            if !msg.visibility_handle.extension_failed() {
                return Some(msg);
            }
        }
        None
    }

    pub fn read_in_progress_mut(&mut self) -> Option<&mut InProgressMessage> {
        self.read_in_progress.as_mut()
    }

    pub async fn drop_currently_read(&mut self) -> anyhow::Result<()> {
        if let Some(in_progress) = self.read_in_progress.take() {
            self.awaiting_commit.insert(
                in_progress.partition_id.clone(),
                in_progress.visibility_handle.ack_id().to_string(),
            );
            in_progress
                .visibility_handle
                .request_last_extension()
                .await?;
        }
        Ok(())
    }

    /// Tries to set the message that is currently being read. Returns an error
    /// if there is already a message being read.
    pub fn set_currently_read(
        &mut self,
        in_progress: Option<InProgressMessage>,
    ) -> anyhow::Result<()> {
        if self.read_in_progress.is_some() {
            bail!("trying to replace in progress message");
        }
        self.read_in_progress = in_progress;
        Ok(())
    }

    /// Returns the ack_id if that message was awaiting_commit
    pub fn mark_completed(&mut self, partition_id: PartitionId) -> Option<String> {
        let ack_id_opt = self.awaiting_commit.remove(&partition_id);
        self.completed.insert(partition_id);
        ack_id_opt
    }
}


================================================
FILE: quickwit/quickwit-indexing/src/source/queue_sources/memory_queue.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::{BTreeMap, VecDeque};
use std::fmt;
use std::sync::{Arc, Mutex};
use std::time::{Duration, Instant};

use anyhow::bail;
use async_trait::async_trait;
use quickwit_storage::OwnedBytes;
use ulid::Ulid;

use super::Queue;
use super::message::{MessageMetadata, RawMessage};

#[derive(Default)]
struct InnerState {
    in_queue: VecDeque<RawMessage>,
    in_flight: BTreeMap<String, RawMessage>,
    acked: Vec<RawMessage>,
}

impl fmt::Debug for InnerState {
    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
        f.debug_struct("Queue")
            .field("in_queue_count", &self.in_queue.len())
            .field("in_flight_count", &self.in_flight.len())
            .field("acked_count", &self.acked.len())
            .finish()
    }
}

/// A simple in-memory queue
#[derive(Clone, Debug)]
pub struct MemoryQueueForTests {
    inner_state: Arc<Mutex<InnerState>>,
    receive_sleep: Duration,
}

impl MemoryQueueForTests {
    pub fn new() -> Self {
        let inner_state = Arc::new(Mutex::new(InnerState::default()));
        let inner_weak = Arc::downgrade(&inner_state);
        tokio::spawn(async move {
            loop {
                if let Some(inner_state) = inner_weak.upgrade() {
                    let mut inner_state = inner_state.lock().unwrap();
                    let mut expired = Vec::new();
                    for (ack_id, msg) in inner_state.in_flight.iter() {
                        if msg.metadata.initial_deadline < Instant::now() {
                            expired.push(ack_id.clone());
                        }
                    }
                    for ack_id in expired {
                        let msg = inner_state.in_flight.remove(&ack_id).unwrap();
                        inner_state.in_queue.push_back(msg);
                    }
                } else {
                    break;
                }
                tokio::time::sleep(Duration::from_millis(50)).await;
            }
        });
        MemoryQueueForTests {
            inner_state: Arc::new(Mutex::new(InnerState::default())),
            receive_sleep: Duration::from_millis(50),
        }
    }

    pub fn send_message(&self, payload: String, ack_id: &str) {
        let message = RawMessage {
            payload: OwnedBytes::new(payload.into_bytes()),
            metadata: MessageMetadata {
                ack_id: ack_id.to_string(),
                delivery_attempts: 0,
                initial_deadline: Instant::now(),
                message_id: Ulid::new().to_string(),
            },
        };
        self.inner_state.lock().unwrap().in_queue.push_back(message);
    }

    /// Returns the next visibility deadline for the message if it is in flight
    pub fn next_visibility_deadline(&self, ack_id: &str) -> Option<Instant> {
        let inner_state = self.inner_state.lock().unwrap();
        inner_state
            .in_flight
            .get(ack_id)
            .map(|msg| msg.metadata.initial_deadline)
    }
}

#[async_trait]
impl Queue for MemoryQueueForTests {
    async fn receive(
        self: Arc<Self>,
        max_messages: usize,
        suggested_deadline: Duration,
    ) -> anyhow::Result<Vec<RawMessage>> {
        {
            let mut inner_state = self.inner_state.lock().unwrap();
            let mut response = Vec::new();
            while let Some(mut msg) = inner_state.in_queue.pop_front() {
                msg.metadata.delivery_attempts += 1;
                msg.metadata.initial_deadline = Instant::now() + suggested_deadline;
                let msg_cloned = RawMessage {
                    payload: msg.payload.clone(),
                    metadata: msg.metadata.clone(),
                };
                inner_state
                    .in_flight
                    .insert(msg.metadata.ack_id.clone(), msg_cloned);
                response.push(msg);
                if response.len() >= max_messages {
                    break;
                }
            }
            if !response.is_empty() {
                return Ok(response);
            }
        }
        // `sleep` to avoid using all the CPU when called in a loop
        tokio::time::sleep(self.receive_sleep).await;

        Ok(vec![])
    }

    async fn acknowledge(&self, ack_ids: &[String]) -> anyhow::Result<()> {
        let mut inner_state = self.inner_state.lock().unwrap();
        for ack_id in ack_ids {
            if let Some(msg) = inner_state.in_flight.remove(ack_id) {
                inner_state.acked.push(msg);
            }
        }
        Ok(())
    }

    async fn modify_deadlines(
        &self,
        ack_id: &str,
        suggested_deadline: Duration,
    ) -> anyhow::Result<Instant> {
        let mut inner_state = self.inner_state.lock().unwrap();
        let in_flight = inner_state.in_flight.get_mut(ack_id);
        if let Some(msg) = in_flight {
            msg.metadata.initial_deadline = Instant::now() + suggested_deadline;
        } else {
            bail!("ack_id {} not found in in-flight", ack_id);
        }
        return Ok(Instant::now() + suggested_deadline);
    }
}

#[cfg(test)]
mod tests {
    use super::*;

    fn prefilled_queue(nb_message: usize) -> Arc<MemoryQueueForTests> {
        let memory_queue = MemoryQueueForTests::new();
        for i in 0..nb_message {
            let payload = format!("Test message {i}");
            let ack_id = i.to_string();
            memory_queue.send_message(payload.clone(), &ack_id);
        }
        Arc::new(memory_queue)
    }

    #[tokio::test]
    async fn test_receive_1_by_1() {
        let memory_queue = prefilled_queue(2);
        for i in 0..2 {
            let messages = memory_queue
                .clone()
                .receive(1, Duration::from_secs(5))
                .await
                .unwrap();
            assert_eq!(messages.len(), 1);
            let message = &messages[0];
            let exp_payload = format!("Test message {i}");
            let exp_ack_id = i.to_string();
            assert_eq!(message.payload.as_ref(), exp_payload.as_bytes());
            assert_eq!(message.metadata.ack_id, exp_ack_id);
        }
    }

    #[tokio::test]
    async fn test_receive_2_by_2() {
        let memory_queue = prefilled_queue(2);
        let messages = memory_queue
            .receive(2, Duration::from_secs(5))
            .await
            .unwrap();
        assert_eq!(messages.len(), 2);
        for (i, message) in messages.iter().enumerate() {
            let exp_payload = format!("Test message {i}");
            let exp_ack_id = i.to_string();
            assert_eq!(message.payload.as_ref(), exp_payload.as_bytes());
            assert_eq!(message.metadata.ack_id, exp_ack_id);
        }
    }

    #[tokio::test]
    async fn test_receive_early_if_only_1() {
        let memory_queue = prefilled_queue(1);
        let messages = memory_queue
            .receive(2, Duration::from_secs(5))
            .await
            .unwrap();
        assert_eq!(messages.len(), 1);
        let message = &messages[0];
        let exp_payload = "Test message 0".to_string();
        let exp_ack_id = "0";
        assert_eq!(message.payload.as_ref(), exp_payload.as_bytes());
        assert_eq!(message.metadata.ack_id, exp_ack_id);
    }
}


================================================
FILE: quickwit/quickwit-indexing/src/source/queue_sources/message.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use core::fmt;
use std::io::read_to_string;
use std::str::FromStr;
use std::time::Instant;

use anyhow::Context;
use quickwit_common::rate_limited_warn;
use quickwit_common::uri::Uri;
use quickwit_metastore::checkpoint::PartitionId;
use quickwit_proto::types::Position;
use quickwit_storage::{OwnedBytes, StorageResolver};
use serde_json::Value;
use thiserror::Error;
use tracing::info;

use super::visibility::VisibilityTaskHandle;
use crate::source::doc_file_reader::ObjectUriBatchReader;

#[derive(Debug, Clone, Copy)]
pub enum MessageType {
    S3Notification,
    // GcsNotification,
    RawUri,
    // RawData,
}

#[derive(Debug, Clone, PartialEq, Eq)]
pub struct MessageMetadata {
    /// The handle that should be used to acknowledge the message or change its visibility deadline
    pub ack_id: String,

    /// The unique message id assigned by the queue
    pub message_id: String,

    /// The approximate number of times the message was delivered. 1 means it is
    /// the first time this message is being delivered.
    pub delivery_attempts: usize,

    /// The first deadline when the message is received. It can be extended later using the ack_id.
    pub initial_deadline: Instant,
}

/// The raw messages as received from the queue abstraction
pub struct RawMessage {
    pub metadata: MessageMetadata,
    pub payload: OwnedBytes,
}

impl fmt::Debug for RawMessage {
    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
        f.debug_struct("RawMessage")
            .field("metadata", &self.metadata)
            .field("payload", &"<bytes>")
            .finish()
    }
}

#[derive(Error, Debug)]
pub enum PreProcessingError {
    #[error("message can be acknowledged without processing")]
    Discardable { ack_id: String },
    #[error("unexpected message format: {0}")]
    UnexpectedFormat(#[from] anyhow::Error),
}

impl RawMessage {
    pub fn pre_process(
        self,
        message_type: MessageType,
    ) -> Result<PreProcessedMessage, PreProcessingError> {
        let payload = match message_type {
            MessageType::S3Notification => PreProcessedPayload::ObjectUri(
                uri_from_s3_notification(&self.payload, &self.metadata.ack_id)?,
            ),
            MessageType::RawUri => {
                let payload_str = read_to_string(self.payload).context("failed to read payload")?;
                PreProcessedPayload::ObjectUri(Uri::from_str(&payload_str)?)
            }
        };
        Ok(PreProcessedMessage {
            metadata: self.metadata,
            payload,
        })
    }
}

#[derive(Debug, PartialEq, Eq)]
pub enum PreProcessedPayload {
    /// The message contains an object URI
    ObjectUri(Uri),
    // /// The message contains the raw JSON data
    // RawData(OwnedBytes),
}

impl PreProcessedPayload {
    pub fn partition_id(&self) -> PartitionId {
        match &self {
            Self::ObjectUri(uri) => PartitionId::from(uri.as_str()),
        }
    }
}

/// A message that went through the minimal transformation to discover its
/// partition id. Indeed, the message might be discarded if the partition was
/// already processed, so it's better to avoid doing unnecessary work at this
/// stage.
#[derive(Debug, PartialEq, Eq)]
pub struct PreProcessedMessage {
    pub metadata: MessageMetadata,
    pub payload: PreProcessedPayload,
}

impl PreProcessedMessage {
    pub fn partition_id(&self) -> PartitionId {
        self.payload.partition_id()
    }
}

fn uri_from_s3_notification(message: &[u8], ack_id: &str) -> Result<Uri, PreProcessingError> {
    let value: Value = serde_json::from_slice(message).context("invalid JSON message")?;
    if matches!(value["Event"].as_str(), Some("s3:TestEvent")) {
        info!("discarding S3 test event");
        return Err(PreProcessingError::Discardable {
            ack_id: ack_id.to_string(),
        });
    }
    let event_name = value["Records"][0]["eventName"]
        .as_str()
        .context("invalid S3 notification: Records[0].eventName not found")?;
    if !event_name.starts_with("ObjectCreated:") {
        rate_limited_warn!(
            limit_per_min = 5,
            event = event_name,
            "only s3:ObjectCreated:* events are supported"
        );
        return Err(PreProcessingError::Discardable {
            ack_id: ack_id.to_string(),
        });
    }
    let key = value["Records"][0]["s3"]["object"]["key"]
        .as_str()
        .context("invalid S3 notification: Records[0].s3.object.key not found")?;
    let bucket = value["Records"][0]["s3"]["bucket"]["name"]
        .as_str()
        .context("invalid S3 notification: Records[0].s3.bucket.name not found")?;
    let encoded_key = percent_encoding::percent_decode(key.as_bytes())
        .decode_utf8()
        .context("invalid S3 notification: Records[0].s3.object.key could not be url decoded")?;
    Uri::from_str(&format!("s3://{bucket}/{encoded_key}")).map_err(|e| e.into())
}

/// A message for which we know as much of the global processing status as
/// possible and that is now ready to be processed.
pub struct ReadyMessage {
    pub position: Position,
    pub content: PreProcessedMessage,
    pub visibility_handle: VisibilityTaskHandle,
}

impl ReadyMessage {
    pub async fn start_processing(
        self,
        storage_resolver: &StorageResolver,
    ) -> anyhow::Result<Option<InProgressMessage>> {
        let partition_id = self.partition_id();
        match self.content.payload {
            PreProcessedPayload::ObjectUri(uri) => {
                let batch_reader = ObjectUriBatchReader::try_new(
                    storage_resolver,
                    partition_id.clone(),
                    &uri,
                    self.position,
                )
                .await?;
                if batch_reader.is_eof() {
                    Ok(None)
                } else {
                    Ok(Some(InProgressMessage {
                        batch_reader,
                        partition_id,
                        visibility_handle: self.visibility_handle,
                    }))
                }
            }
        }
    }

    pub fn partition_id(&self) -> PartitionId {
        self.content.partition_id()
    }
}

/// A message that is actively being read
pub struct InProgressMessage {
    pub partition_id: PartitionId,
    pub visibility_handle: VisibilityTaskHandle,
    pub batch_reader: ObjectUriBatchReader,
}

#[cfg(test)]
mod tests {
    use super::*;

    #[test]
    fn test_uri_from_s3_notification_valid() {
        let test_message = r#"
        {
            "Records": [
                {
                "eventVersion": "2.1",
                "eventSource": "aws:s3",
                "awsRegion": "us-west-2",
                "eventTime": "2021-05-22T09:22:41.789Z",
                "eventName": "ObjectCreated:Put",
                "userIdentity": {
                    "principalId": "AWS:AIDAJDPLRKLG7UEXAMPLE"
                },
                "requestParameters": {
                    "sourceIPAddress": "127.0.0.1"
                },
                "responseElements": {
                    "x-amz-request-id": "C3D13FE58DE4C810",
                    "x-amz-id-2": "FMyUVURIx7Zv2cPi/IZb9Fk1/U4QfTaVK5fahHPj/"
                },
                "s3": {
                    "s3SchemaVersion": "1.0",
                    "configurationId": "testConfigRule",
                    "bucket": {
                        "name": "mybucket",
                        "ownerIdentity": {
                            "principalId": "A3NL1KOZZKExample"
                        },
                        "arn": "arn:aws:s3:::mybucket"
                    },
                    "object": {
                        "key": "logs.json",
                        "size": 1024,
                        "eTag": "d41d8cd98f00b204e9800998ecf8427e",
                        "versionId": "096fKKXTRTtl3on89fVO.nfljtsv6qko",
                        "sequencer": "0055AED6DCD90281E5"
                    }
                }
                }
            ]
        }"#;
        let actual_uri = uri_from_s3_notification(test_message.as_bytes(), "myackid").unwrap();
        let expected_uri = Uri::from_str("s3://mybucket/logs.json").unwrap();
        assert_eq!(actual_uri, expected_uri);
    }

    #[test]
    fn test_uri_from_s3_notification_invalid() {
        let invalid_message = r#"{
            "Records": [
                {
                    "s3": {
                        "object": {
                            "key": "test_key"
                        }
                    }
                }
            ]
        }"#;
        let result =
            uri_from_s3_notification(&OwnedBytes::new(invalid_message.as_bytes()), "myackid");
        assert!(matches!(
            result,
            Err(PreProcessingError::UnexpectedFormat(_))
        ));
    }

    #[test]
    fn test_uri_from_s3_bad_event_type() {
        let invalid_message = r#"{
            "Records": [
                {
                    "eventVersion": "2.1",
                    "eventSource": "aws:s3",
                    "awsRegion": "us-east-1",
                    "eventTime": "2024-07-29T12:47:14.577Z",
                    "eventName": "ObjectRemoved:Delete",
                    "userIdentity": {
                        "principalId": "AWS:ARGHGOHSDGOKGHOGHMCC4:user"
                    },
                    "requestParameters": {
                        "sourceIPAddress": "1.1.1.1"
                    },
                    "responseElements": {
                        "x-amz-request-id": "GHGSH",
                        "x-amz-id-2": "gndflghndflhmnrflsh+gLLKU6X0PvD6ANdVY1+/hspflhjladgfkelagfkndl"
                    },
                    "s3": {
                        "s3SchemaVersion": "1.0",
                        "configurationId": "hello",
                        "bucket": {
                            "name": "mybucket",
                            "ownerIdentity": {
                                "principalId": "KMGP12GHKKH"
                            },
                            "arn": "arn:aws:s3:::mybucket"
                        },
                        "object": {
                            "key": "my_deleted_file",
                            "sequencer": "GKHOFLGKHSALFK0"
                        }
                    }
                }
            ]
        }"#;
        let result =
            uri_from_s3_notification(&OwnedBytes::new(invalid_message.as_bytes()), "myackid");
        assert!(matches!(
            result,
            Err(PreProcessingError::Discardable { .. })
        ));
    }

    #[test]
    fn test_uri_from_s3_notification_discardable() {
        let invalid_message = r#"{
            "Service":"Amazon S3",
            "Event":"s3:TestEvent",
            "Time":"2014-10-13T15:57:02.089Z",
            "Bucket":"bucketname",
            "RequestId":"5582815E1AEA5ADF",
            "HostId":"8cLeGAmw098X5cv4Zkwcmo8vvZa3eH3eKxsPzbB9wrR+YstdA6Knx4Ip8EXAMPLE"
        }"#;
        let result =
            uri_from_s3_notification(&OwnedBytes::new(invalid_message.as_bytes()), "myackid");
        if let Err(PreProcessingError::Discardable { ack_id }) = result {
            assert_eq!(ack_id, "myackid");
        } else {
            panic!("Expected skippable error");
        }
    }

    #[test]
    fn test_uri_from_s3_notification_url_decode() {
        let test_message = r#"
        {
            "Records": [
                {
                "eventVersion": "2.1",
                "eventSource": "aws:s3",
                "awsRegion": "us-west-2",
                "eventTime": "2021-05-22T09:22:41.789Z",
                "eventName": "ObjectCreated:Put",
                "userIdentity": {
                    "principalId": "AWS:AIDAJDPLRKLG7UEXAMPLE"
                },
                "requestParameters": {
                    "sourceIPAddress": "127.0.0.1"
                },
                "responseElements": {
                    "x-amz-request-id": "C3D13FE58DE4C810",
                    "x-amz-id-2": "FMyUVURIx7Zv2cPi/IZb9Fk1/U4QfTaVK5fahHPj/"
                },
                "s3": {
                    "s3SchemaVersion": "1.0",
                    "configurationId": "testConfigRule",
                    "bucket": {
                        "name": "mybucket",
                        "ownerIdentity": {
                            "principalId": "A3NL1KOZZKExample"
                        },
                        "arn": "arn:aws:s3:::mybucket"
                    },
                    "object": {
                        "key": "hello%3A%3Aworld%3A%3Alogs.json",
                        "size": 1024,
                        "eTag": "d41d8cd98f00b204e9800998ecf8427e",
                        "versionId": "096fKKXTRTtl3on89fVO.nfljtsv6qko",
                        "sequencer": "0055AED6DCD90281E5"
                    }
                }
                }
            ]
        }"#;
        let actual_uri = uri_from_s3_notification(test_message.as_bytes(), "myackid").unwrap();
        let expected_uri = Uri::from_str("s3://mybucket/hello::world::logs.json").unwrap();
        assert_eq!(actual_uri, expected_uri);
    }
}


================================================
FILE: quickwit/quickwit-indexing/src/source/queue_sources/mod.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

pub mod coordinator;
mod helpers;
mod local_state;
#[cfg(test)]
mod memory_queue;
mod message;
mod shared_state;
#[cfg(feature = "sqs")]
pub mod sqs_queue;
mod visibility;

use std::fmt;
use std::sync::Arc;
use std::time::{Duration, Instant};

use async_trait::async_trait;
use message::RawMessage;

/// The queue abstraction is based on the AWS SQS and Google Pubsub APIs. The
/// only requirement of the underlying implementation is that messages exposed
/// to a given consumer are hidden to other consumers for a configurable period
/// of time. Retries are handled by the implementation because queues might
/// behave differently (throttling, deduplication...).
#[async_trait]
pub trait Queue: fmt::Debug + Send + Sync + 'static {
    /// Polls the queue to receive messages.
    ///
    /// The implementation is in charge of choosing the wait strategy when there
    /// are no messages in the queue. It will typically use long polling to do
    /// this efficiently. On the other hand, when there is a message available
    /// in the queue, it should be returned as quickly as possible, regardless
    /// of the `max_messages` parameter. The `max_messages` paramater should
    /// always be clamped by the implementation to not violate the maximum value
    /// supported by the backing queue (e.g 10 messages for AWS SQS).
    ///
    /// As soon as the message is received, the caller is responsible for
    /// maintaining the message visibility in a timely fashion. Failing to do so
    /// implies that duplicates will be received by other indexing pipelines,
    /// thus increasing competition for the commit lock.
    async fn receive(
        // `Arc` to make the resulting future `'static` and thus easily
        // wrappable by the `QueueReceiver`
        self: Arc<Self>,
        max_messages: usize,
        suggested_deadline: Duration,
    ) -> anyhow::Result<Vec<RawMessage>>;

    /// Tries to acknowledge (delete) the messages.
    ///
    /// The call returns `Ok(())` if at the message level:
    /// - the acknowledgement failed due to a transient failure
    /// - the message was already acknowledged
    /// - the message was not acknowledged in time and is back to the queue
    ///
    /// If an empty list of ack_ids is provided, the call should be a no-op.
    async fn acknowledge(&self, ack_ids: &[String]) -> anyhow::Result<()>;

    /// Modifies the visibility deadline of the messages.
    ///
    /// We try to set the initial visibility large enough to avoid having to
    /// call this too often. The implementation can retry as long as desired,
    /// it's the caller's responsibility to cancel the future if the deadline is
    /// getting to close to the expiration. The returned `Instant` is a
    /// conservative estimate of the new deadline expiration time.
    async fn modify_deadlines(
        &self,
        ack_id: &str,
        suggested_deadline: Duration,
    ) -> anyhow::Result<Instant>;
}


================================================
FILE: quickwit/quickwit-indexing/src/source/queue_sources/shared_state.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::BTreeMap;
use std::sync::{Arc, Weak};
use std::time::Duration;

use anyhow::{Context, bail};
use quickwit_metastore::checkpoint::PartitionId;
use quickwit_proto::metastore::{
    AcquireShardsRequest, MetastoreService, MetastoreServiceClient, OpenShardSubrequest,
    OpenShardsRequest, PruneShardsRequest,
};
use quickwit_proto::types::{DocMappingUid, Position, ShardId, SourceUid};
use time::OffsetDateTime;
use tracing::{error, info};

use super::message::PreProcessedMessage;

#[derive(Clone)]
pub struct QueueSharedState {
    metastore: MetastoreServiceClient,
    pub source_uid: SourceUid,
    /// Duration after which the processing of a shard is considered stale and
    /// should be reacquired
    reacquire_grace_period: Duration,
    _cleanup_handle: Arc<()>,
}

impl QueueSharedState {
    /// Create a shared state service and runs a cleanup task that prunes shards
    /// in the background
    pub fn new(
        metastore: MetastoreServiceClient,
        source_uid: SourceUid,
        reacquire_grace_period: Duration,
        max_age: Option<Duration>,
        max_count: Option<u32>,
        pruning_interval: Duration,
    ) -> Self {
        let cleanup_handle = Arc::new(());
        tokio::spawn(Self::run_cleanup_task(
            metastore.clone(),
            source_uid.clone(),
            max_age,
            max_count,
            pruning_interval,
            Arc::downgrade(&cleanup_handle),
        ));
        Self {
            metastore,
            source_uid,
            reacquire_grace_period,
            _cleanup_handle: cleanup_handle,
        }
    }

    async fn run_cleanup_task(
        metastore: MetastoreServiceClient,
        source_uid: SourceUid,
        max_age: Option<Duration>,
        max_count: Option<u32>,
        pruning_interval: Duration,
        owner_handle: Weak<()>,
    ) {
        if max_count.is_none() && max_age.is_none() {
            return;
        }
        let max_age_secs = max_age.map(|duration| duration.as_secs() as u32);
        let SourceUid {
            index_uid,
            source_id,
        } = source_uid;
        tokio::spawn(async move {
            let mut interval = tokio::time::interval(pruning_interval);
            loop {
                interval.tick().await;
                if owner_handle.upgrade().is_none() {
                    break;
                }
                let result: Result<_, _> = metastore
                    .prune_shards(PruneShardsRequest {
                        index_uid: Some(index_uid.clone()),
                        source_id: source_id.clone(),
                        max_age_secs,
                        max_count,
                        interval_secs: Some(pruning_interval.as_secs() as u32),
                    })
                    .await;
                if let Err(err) = result {
                    error!(error = ?err, "failed to prune shards");
                }
            }
        });
    }

    /// Tries to acquire the ownership for the provided messages from the global
    /// shared context. For each partition id, if the ownership was successfully
    /// acquired or the partition was already successfully indexed, the position
    /// is returned along with the partition id, otherwise the partition id is
    /// dropped.
    async fn acquire_partitions(
        &mut self,
        publish_token: &str,
        partitions: Vec<PartitionId>,
    ) -> anyhow::Result<Vec<(PartitionId, Position)>> {
        let open_shard_subrequests = partitions
            .iter()
            .enumerate()
            .map(|(idx, partition_id)| OpenShardSubrequest {
                subrequest_id: idx as u32,
                index_uid: Some(self.source_uid.index_uid.clone()),
                source_id: self.source_uid.source_id.clone(),
                leader_id: String::new(),
                follower_id: None,
                shard_id: Some(ShardId::from(partition_id.as_str())),
                doc_mapping_uid: Some(DocMappingUid::default()),
                publish_token: Some(publish_token.to_string()),
            })
            .collect();

        let open_shard_resp = self
            .metastore
            .open_shards(OpenShardsRequest {
                subrequests: open_shard_subrequests,
            })
            .await?;

        let mut shards = Vec::new();
        let mut re_acquired_shards = Vec::new();
        for sub in open_shard_resp.subresponses {
            // we could also just cast the shard_id back to a partition_id
            let partition_id = partitions[sub.subrequest_id as usize].clone();
            let shard = sub.open_shard();
            let position = shard.publish_position_inclusive.clone().unwrap_or_default();
            let is_owned = sub.open_shard().publish_token.as_deref() == Some(publish_token);
            let update_datetime = OffsetDateTime::from_unix_timestamp(shard.update_timestamp)
                .context("Invalid shard update timestamp")?;
            let is_stale =
                OffsetDateTime::now_utc() - update_datetime > self.reacquire_grace_period;
            if position.is_eof() || (is_owned && position.is_beginning()) {
                shards.push((partition_id, position));
            } else if !is_owned && is_stale {
                info!(previous_token = shard.publish_token, "shard re-acquired");
                re_acquired_shards.push(shard.shard_id().clone());
            } else if is_owned && !position.is_beginning() {
                bail!("Partition is owned by this indexing pipeline but is not at the beginning. This should never happen! Please, report on https://github.com/quickwit-oss/quickwit/issues.")
            }
        }

        if re_acquired_shards.is_empty() {
            return Ok(shards);
        }

        // re-acquire shards that have a token that is not the local token
        let acquire_shard_resp = self
            .metastore
            .acquire_shards(AcquireShardsRequest {
                index_uid: Some(self.source_uid.index_uid.clone()),
                source_id: self.source_uid.source_id.clone(),
                shard_ids: re_acquired_shards,
                publish_token: publish_token.to_string(),
            })
            .await?;
        for shard in acquire_shard_resp.acquired_shards {
            let partition_id = PartitionId::from(shard.shard_id().as_str());
            let position = shard.publish_position_inclusive.unwrap_or_default();
            shards.push((partition_id, position));
        }

        Ok(shards)
    }
}

/// Acquires shards from the shared state for the provided list of messages
/// using [`QueueSharedState::acquire_partitions`], then maps resulting
/// positions back to that original list. Messages that don't require any
/// further processing are dropped.
pub async fn checkpoint_messages(
    shared_state: &mut QueueSharedState,
    publish_token: &str,
    messages: Vec<PreProcessedMessage>,
) -> anyhow::Result<Vec<(PreProcessedMessage, Position)>> {
    let mut message_map: BTreeMap<PartitionId, PreProcessedMessage> = messages
        .into_iter()
        .map(|msg| (msg.partition_id(), msg))
        .collect();
    let partition_ids = message_map.keys().cloned().collect();

    let partition_positions = shared_state
        .acquire_partitions(publish_token, partition_ids)
        .await?;

    let mut result = Vec::with_capacity(partition_positions.len());
    for (partition_id, position) in partition_positions {
        let content = message_map.remove(&partition_id).context("Unexpected partition ID. This should never happen! Please, report on https://github.com/quickwit-oss/quickwit/issues.")?;
        result.push((content, position));
    }

    Ok(result)
}

#[cfg(test)]
pub mod shared_state_for_tests {
    use std::sync::{Arc, Mutex};

    use itertools::Itertools;
    use quickwit_proto::ingest::{Shard, ShardState};
    use quickwit_proto::metastore::{
        AcquireShardsResponse, MockMetastoreService, OpenShardSubresponse, OpenShardsResponse,
    };
    use quickwit_proto::types::IndexUid;

    use super::*;

    /// Creates a metastore that mocks the behavior of the Shard API on the open
    /// and acquire methods using a simplified in-memory state.
    pub(super) fn mock_metastore(
        // Shards (token, position, update_timestamp) in the initial state
        initial_state: &[(PartitionId, (String, Position, i64))],
        // Times open_shards is expected to be called (None <=> no expectation)
        open_shard_times: Option<usize>,
        // Times acquire_shards is expected to be called (None <=> no expectation)
        acquire_times: Option<usize>,
    ) -> MetastoreServiceClient {
        let mut mock_metastore = MockMetastoreService::new();
        let inner_state = Arc::new(Mutex::new(BTreeMap::from_iter(
            initial_state.iter().cloned(),
        )));
        let inner_state_ref = Arc::clone(&inner_state);
        let open_shards_expectation =
            mock_metastore
                .expect_open_shards()
                .returning(move |request| {
                    let mut subresponses = Vec::with_capacity(request.subrequests.len());
                    for sub_req in request.subrequests {
                        let partition_id: PartitionId = sub_req.shard_id().to_string().into();
                        let req_token = sub_req.publish_token();
                        let (token, position, update_timestamp) = inner_state_ref
                            .lock()
                            .unwrap()
                            .get(&partition_id)
                            .cloned()
                            .unwrap_or((
                                req_token.to_string(),
                                Position::Beginning,
                                OffsetDateTime::now_utc().unix_timestamp(),
                            ));

                        inner_state_ref.lock().unwrap().insert(
                            partition_id,
                            (token.clone(), position.clone(), update_timestamp),
                        );
                        subresponses.push(OpenShardSubresponse {
                            subrequest_id: sub_req.subrequest_id,
                            open_shard: Some(Shard {
                                shard_id: sub_req.shard_id,
                                source_id: sub_req.source_id,
                                publish_token: Some(token),
                                index_uid: sub_req.index_uid,
                                follower_id: sub_req.follower_id,
                                leader_id: sub_req.leader_id,
                                doc_mapping_uid: sub_req.doc_mapping_uid,
                                publish_position_inclusive: Some(position),
                                shard_state: ShardState::Open as i32,
                                update_timestamp,
                            }),
                        });
                    }
                    Ok(OpenShardsResponse { subresponses })
                });
        if let Some(times) = open_shard_times {
            open_shards_expectation.times(times);
        }
        let acquire_shards_expectation =
            mock_metastore
                .expect_acquire_shards()
                .returning(move |request| {
                    let mut acquired_shards = Vec::with_capacity(request.shard_ids.len());
                    for shard_id in request.shard_ids {
                        let partition_id: PartitionId = shard_id.to_string().into();
                        let (existing_token, position, update_timestamp) = inner_state
                            .lock()
                            .unwrap()
                            .get(&partition_id)
                            .cloned()
                            .expect("we should never try to acquire a shard that doesn't exist");
                        inner_state.lock().unwrap().insert(
                            partition_id,
                            (
                                request.publish_token.clone(),
                                position.clone(),
                                update_timestamp,
                            ),
                        );
                        assert_ne!(existing_token, request.publish_token);
                        acquired_shards.push(Shard {
                            shard_id: Some(shard_id),
                            source_id: "dummy".to_string(),
                            publish_token: Some(request.publish_token.clone()),
                            index_uid: None,
                            follower_id: None,
                            leader_id: "dummy".to_string(),
                            doc_mapping_uid: None,
                            publish_position_inclusive: Some(position),
                            shard_state: ShardState::Open as i32,
                            update_timestamp,
                        });
                    }
                    Ok(AcquireShardsResponse { acquired_shards })
                });
        if let Some(times) = acquire_times {
            acquire_shards_expectation.times(times);
        }
        MetastoreServiceClient::from_mock(mock_metastore)
    }

    pub fn init_state(
        index_id: &str,
        // Shards (token, position, is_stale) in the initial state
        initial_state: &[(PartitionId, (String, Position, bool))],
    ) -> QueueSharedState {
        let index_uid = IndexUid::new_with_random_ulid(index_id);
        let metastore_state = initial_state
            .iter()
            .map(|(pid, (token, pos, is_stale))| {
                let update_timestamp = if *is_stale {
                    OffsetDateTime::now_utc().unix_timestamp() - 100
                } else {
                    OffsetDateTime::now_utc().unix_timestamp()
                };
                (pid.clone(), (token.clone(), pos.clone(), update_timestamp))
            })
            .collect_vec();
        let metastore = mock_metastore(&metastore_state, None, None);
        QueueSharedState {
            metastore,
            source_uid: SourceUid {
                index_uid,
                source_id: "test-queue-src".to_string(),
            },
            reacquire_grace_period: Duration::from_secs(10),
            _cleanup_handle: Arc::new(()),
        }
    }
}

#[cfg(test)]
mod tests {
    use std::str::FromStr;
    use std::time::Instant;
    use std::vec;

    use quickwit_common::uri::Uri;
    use quickwit_proto::types::IndexUid;
    use shared_state_for_tests::mock_metastore;

    use super::*;
    use crate::source::queue_sources::message::{MessageMetadata, PreProcessedPayload};

    fn test_messages(message_number: usize) -> Vec<PreProcessedMessage> {
        (0..message_number)
            .map(|i| PreProcessedMessage {
                metadata: MessageMetadata {
                    ack_id: format!("ackid{i}"),
                    delivery_attempts: 0,
                    initial_deadline: Instant::now(),
                    message_id: format!("mid{i}"),
                },
                payload: PreProcessedPayload::ObjectUri(
                    Uri::from_str(&format!("s3://bucket/key{i}")).unwrap(),
                ),
            })
            .collect()
    }

    #[tokio::test]
    async fn test_acquire_shards_with_completed() {
        let index_id = "test-sqs-index";
        let index_uid = IndexUid::new_with_random_ulid(index_id);
        let init_state = &[(
            "p1".into(),
            (
                "token2".to_string(),
                Position::eof(100usize),
                OffsetDateTime::now_utc().unix_timestamp(),
            ),
        )];
        let metastore = mock_metastore(init_state, Some(1), Some(0));

        let mut shared_state = QueueSharedState {
            metastore,
            source_uid: SourceUid {
                index_uid,
                source_id: "test-sqs-source".to_string(),
            },
            reacquire_grace_period: Duration::from_secs(10),
            _cleanup_handle: Arc::new(()),
        };

        let aquired = shared_state
            .acquire_partitions("token1", vec!["p1".into(), "p2".into()])
            .await
            .unwrap();
        assert!(aquired.contains(&("p1".into(), Position::eof(100usize))));
        assert!(aquired.contains(&("p2".into(), Position::Beginning)));
    }

    #[tokio::test]
    async fn test_re_acquire_shards_within_grace_period() {
        let index_id = "test-sqs-index";
        let index_uid = IndexUid::new_with_random_ulid(index_id);
        let init_state = &[(
            "p1".into(),
            (
                "token2".to_string(),
                Position::offset(100usize),
                OffsetDateTime::now_utc().unix_timestamp(),
            ),
        )];
        let metastore = mock_metastore(init_state, Some(1), Some(0));

        let mut shared_state = QueueSharedState {
            metastore,
            source_uid: SourceUid {
                index_uid,
                source_id: "test-sqs-source".to_string(),
            },
            reacquire_grace_period: Duration::from_secs(10),
            _cleanup_handle: Arc::new(()),
        };

        let acquired = shared_state
            .acquire_partitions("token1", vec!["p1".into(), "p2".into()])
            .await
            .unwrap();
        assert_eq!(acquired.len(), 1);
        assert!(acquired.contains(&("p2".into(), Position::Beginning)));
    }

    #[tokio::test]
    async fn test_re_acquire_shards_after_grace_period() {
        let index_id = "test-sqs-index";
        let index_uid = IndexUid::new_with_random_ulid(index_id);
        let init_state = &[(
            "p1".into(),
            (
                "token2".to_string(),
                Position::offset(100usize),
                OffsetDateTime::now_utc().unix_timestamp() - 100,
            ),
        )];
        let metastore = mock_metastore(init_state, Some(1), Some(1));

        let mut shared_state = QueueSharedState {
            metastore,
            source_uid: SourceUid {
                index_uid,
                source_id: "test-sqs-source".to_string(),
            },
            reacquire_grace_period: Duration::from_secs(10),
            _cleanup_handle: Arc::new(()),
        };

        let aquired = shared_state
            .acquire_partitions("token1", vec!["p1".into(), "p2".into()])
            .await
            .unwrap();
        assert!(aquired.contains(&("p1".into(), Position::offset(100usize))));
        assert!(aquired.contains(&("p2".into(), Position::Beginning)));
    }

    #[tokio::test]
    async fn test_checkpoint_with_completed() {
        let index_id = "test-sqs-index";
        let index_uid = IndexUid::new_with_random_ulid(index_id);

        let source_messages = test_messages(2);
        let completed_partition_id = source_messages[0].partition_id();
        let new_partition_id = source_messages[1].partition_id();

        let init_state = &[(
            completed_partition_id.clone(),
            (
                "token2".to_string(),
                Position::eof(100usize),
                OffsetDateTime::now_utc().unix_timestamp(),
            ),
        )];
        let metastore = mock_metastore(init_state, Some(1), Some(0));
        let mut shared_state = QueueSharedState {
            metastore,
            source_uid: SourceUid {
                index_uid,
                source_id: "test-sqs-source".to_string(),
            },
            reacquire_grace_period: Duration::from_secs(10),
            _cleanup_handle: Arc::new(()),
        };

        let checkpointed_msg = checkpoint_messages(&mut shared_state, "token1", source_messages)
            .await
            .unwrap();
        assert_eq!(checkpointed_msg.len(), 2);
        let completed_msg = checkpointed_msg
            .iter()
            .find(|(msg, _)| msg.partition_id() == completed_partition_id)
            .unwrap();
        assert_eq!(completed_msg.1, Position::eof(100usize));
        let new_msg = checkpointed_msg
            .iter()
            .find(|(msg, _)| msg.partition_id() == new_partition_id)
            .unwrap();
        assert_eq!(new_msg.1, Position::Beginning);
    }
}


================================================
FILE: quickwit/quickwit-indexing/src/source/queue_sources/sqs_queue.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::sync::Arc;
use std::time::{Duration, Instant};

use anyhow::{Context, bail};
use async_trait::async_trait;
use aws_sdk_sqs::config::{Builder, Region, SharedAsyncSleep};
use aws_sdk_sqs::types::{DeleteMessageBatchRequestEntry, MessageSystemAttributeName};
use aws_sdk_sqs::{Client, Config};
use itertools::Itertools;
use quickwit_aws::retry::{AwsRetryable, aws_retry};
use quickwit_aws::{DEFAULT_AWS_REGION, aws_behavior_version, get_aws_config};
use quickwit_common::rate_limited_error;
use quickwit_common::retry::RetryParams;
use quickwit_storage::OwnedBytes;
use regex::Regex;

use super::message::MessageMetadata;
use super::{Queue, RawMessage};

#[derive(Debug)]
pub struct SqsQueue {
    sqs_client: Client,
    queue_url: String,
    receive_retries: RetryParams,
    acknowledge_retries: RetryParams,
    modify_deadline_retries: RetryParams,
}

impl SqsQueue {
    pub async fn try_new(queue_url: String) -> anyhow::Result<Self> {
        let sqs_client = get_sqs_client(&queue_url).await?;
        Ok(SqsQueue {
            sqs_client,
            queue_url,
            receive_retries: RetryParams::standard(),
            // Acknowledgment is retried when the message is received again
            acknowledge_retries: RetryParams::no_retries(),
            // Retry aggressively to avoid loosing the ownership of the message
            modify_deadline_retries: RetryParams::aggressive(),
        })
    }
}

#[async_trait]
impl Queue for SqsQueue {
    async fn receive(
        self: Arc<Self>,
        max_messages: usize,
        suggested_deadline: Duration,
    ) -> anyhow::Result<Vec<RawMessage>> {
        // TODO: We estimate the message deadline using the start of the
        // ReceiveMessage request. This might be overly pessimistic: the docs
        // state that it starts when the message is returned.
        let initial_deadline = Instant::now() + suggested_deadline;
        let clamped_max_messages = std::cmp::min(max_messages, 10) as i32;
        let receive_output = aws_retry(&self.receive_retries, || async {
            self.sqs_client
                .receive_message()
                .queue_url(&self.queue_url)
                .message_system_attribute_names(MessageSystemAttributeName::ApproximateReceiveCount)
                .wait_time_seconds(20)
                .set_max_number_of_messages(Some(clamped_max_messages))
                .visibility_timeout(suggested_deadline.as_secs() as i32)
                .send()
                .await
        })
        .await?;

        let received_messages = receive_output.messages.unwrap_or_default();
        let mut resulting_raw_messages = Vec::with_capacity(received_messages.len());
        for received_message in received_messages {
            let delivery_attempts: usize = received_message
                .attributes
                .as_ref()
                .and_then(|attrs| attrs.get(&MessageSystemAttributeName::ApproximateReceiveCount))
                .and_then(|s| s.parse().ok())
                .unwrap_or(0);
            let ack_id = received_message
                .receipt_handle
                .context("missing receipt_handle in received message")?;
            let message_id = received_message
                .message_id
                .context("missing message_id in received message")?;
            let raw_message = RawMessage {
                metadata: MessageMetadata {
                    ack_id,
                    message_id,
                    initial_deadline,
                    delivery_attempts,
                },
                payload: OwnedBytes::new(received_message.body.unwrap_or_default().into_bytes()),
            };
            resulting_raw_messages.push(raw_message);
        }
        Ok(resulting_raw_messages)
    }

    async fn acknowledge(&self, ack_ids: &[String]) -> anyhow::Result<()> {
        if ack_ids.is_empty() {
            return Ok(());
        }
        let entry_batches: Vec<Vec<_>> = ack_ids
            .iter()
            .dedup()
            .enumerate()
            .map(|(i, id)| {
                DeleteMessageBatchRequestEntry::builder()
                    .id(i.to_string())
                    .receipt_handle(id.to_string())
                    .build()
                    .unwrap()
            })
            .chunks(10)
            .into_iter()
            .map(|chunk| chunk.collect())
            .collect();

        // TODO: parallelization
        let mut batch_errors = Vec::new();
        let mut message_errors = Vec::new();
        for batch in entry_batches {
            let res = aws_retry(&self.acknowledge_retries, || {
                self.sqs_client
                    .delete_message_batch()
                    .queue_url(&self.queue_url)
                    .set_entries(Some(batch.clone()))
                    .send()
            })
            .await;
            match res {
                Ok(res) => {
                    message_errors.extend(res.failed.into_iter());
                }
                Err(err) => {
                    batch_errors.push(err);
                }
            }
        }
        if batch_errors.iter().any(|err| !err.is_retryable()) {
            let fatal_error = batch_errors
                .into_iter()
                .find(|err| !err.is_retryable())
                .unwrap();
            bail!(fatal_error);
        } else if !batch_errors.is_empty() {
            rate_limited_error!(
                limit_per_min = 10,
                count = batch_errors.len(),
                first_err = ?batch_errors.into_iter().next().unwrap(),
                "failed to acknowledge some message batches",
            );
        }
        // The documentation is unclear about these partial failures. We assume
        // it is either:
        // - a transient failure
        // - the message is already acknowledged
        // - the message is expired
        if !message_errors.is_empty() {
            rate_limited_error!(
                limit_per_min = 10,
                count = message_errors.len(),
                first_err = ?message_errors.into_iter().next().unwrap(),
                "failed to acknowledge individual messages",
            );
        }
        Ok(())
    }

    async fn modify_deadlines(
        &self,
        ack_id: &str,
        suggested_deadline: Duration,
    ) -> anyhow::Result<Instant> {
        let visibility_timeout = std::cmp::min(suggested_deadline.as_secs() as i32, 43200);
        let new_deadline = Instant::now() + suggested_deadline;
        aws_retry(&self.modify_deadline_retries, || {
            self.sqs_client
                .change_message_visibility()
                .queue_url(&self.queue_url)
                .visibility_timeout(visibility_timeout)
                .receipt_handle(ack_id)
                .send()
        })
        .await?;
        Ok(new_deadline)
    }
}

async fn preconfigured_builder() -> anyhow::Result<Builder> {
    let aws_config = get_aws_config().await;

    let mut sqs_config = Config::builder().behavior_version(aws_behavior_version());
    sqs_config.set_retry_config(aws_config.retry_config().cloned());
    sqs_config.set_credentials_provider(aws_config.credentials_provider());
    sqs_config.set_http_client(aws_config.http_client());
    sqs_config.set_timeout_config(aws_config.timeout_config().cloned());

    if let Some(identity_cache) = aws_config.identity_cache() {
        sqs_config.set_identity_cache(identity_cache);
    }
    sqs_config.set_sleep_impl(Some(SharedAsyncSleep::new(
        quickwit_aws::TokioSleep::default(),
    )));

    Ok(sqs_config)
}

fn queue_url_region(queue_url: &str) -> Option<Region> {
    let re = Regex::new(r"^https?://sqs\.(.*?)\.amazonaws\.com").unwrap();
    let caps = re.captures(queue_url)?;
    let region_str = caps.get(1)?.as_str();
    Some(Region::new(region_str.to_string()))
}

fn queue_url_endpoint(queue_url: &str) -> anyhow::Result<String> {
    let re = Regex::new(r"(^https?://[^/]+)").unwrap();
    let caps = re.captures(queue_url).context("Invalid queue URL")?;
    let endpoint_str = caps.get(1).context("Invalid queue URL")?.as_str();
    Ok(endpoint_str.to_string())
}

pub async fn get_sqs_client(queue_url: &str) -> anyhow::Result<Client> {
    let mut sqs_config = preconfigured_builder().await?;
    // region is required by the SDK to work
    let inferred_region = queue_url_region(queue_url).unwrap_or(DEFAULT_AWS_REGION);
    let inferred_endpoint = queue_url_endpoint(queue_url)?;
    sqs_config.set_region(Some(inferred_region));
    sqs_config.set_endpoint_url(Some(inferred_endpoint));
    Ok(Client::from_conf(sqs_config.build()))
}

/// Checks whether we can establish a connection to the SQS service and we can
/// access the provided queue_url
pub(crate) async fn check_connectivity(queue_url: &str) -> anyhow::Result<()> {
    let client = get_sqs_client(queue_url).await?;
    client
        .get_queue_attributes()
        .queue_url(queue_url)
        .send()
        .await?;

    Ok(())
}

#[cfg(feature = "sqs-test-helpers")]
pub mod test_helpers {
    use aws_sdk_sqs::types::QueueAttributeName;
    use ulid::Ulid;
    use warp::Filter;

    use super::*;

    pub async fn get_localstack_sqs_client() -> anyhow::Result<Client> {
        let mut sqs_config = preconfigured_builder().await?;
        sqs_config.set_endpoint_url(Some("http://localhost:4566".to_string()));
        sqs_config.set_region(Some(DEFAULT_AWS_REGION));
        Ok(Client::from_conf(sqs_config.build()))
    }

    pub async fn create_queue(sqs_client: &Client, queue_name_prefix: &str) -> String {
        let queue_name = format!("{}-{}", queue_name_prefix, Ulid::new());
        sqs_client
            .create_queue()
            .queue_name(queue_name)
            .send()
            .await
            .unwrap()
            .queue_url
            .unwrap()
    }

    pub async fn send_message(sqs_client: &Client, queue_url: &str, payload: &str) {
        sqs_client
            .send_message()
            .queue_url(queue_url)
            .message_body(payload.to_string())
            .send()
            .await
            .unwrap();
    }

    pub async fn get_queue_attribute(
        sqs_client: &Client,
        queue_url: &str,
        attribute: QueueAttributeName,
    ) -> String {
        let queue_attributes = sqs_client
            .get_queue_attributes()
            .queue_url(queue_url)
            .attribute_names(attribute.clone())
            .send()
            .await
            .unwrap();
        queue_attributes
            .attributes
            .unwrap()
            .get(&attribute)
            .unwrap()
            .to_string()
    }

    /// Runs a mock SQS GetQueueAttributes endpoint to enable creating SQS
    /// sources that pass the connectivity check
    ///
    /// Returns the queue URL to use for the source and a guard for the
    /// temporary mock server
    pub async fn start_mock_sqs_get_queue_attributes_endpoint() -> (String, oneshot::Sender<()>) {
        let hello = warp::path!().map(|| "{}");
        let (tx, rx) = oneshot::channel();
        let listener = tokio::net::TcpListener::bind("127.0.0.1:0")
            .await
            .expect("listener should bind");
        let addr = listener.local_addr().unwrap();

        let server = warp::serve(hello).incoming(listener).graceful(async {
            rx.await.ok();
        });
        tokio::spawn(server.run());

        let queue_url = format!("http://{}:{}/", addr.ip(), addr.port());
        (queue_url, tx)
    }

    #[tokio::test]
    async fn test_mock_sqs_get_queue_attributes_endpoint() {
        let (queue_url, _shutdown) = start_mock_sqs_get_queue_attributes_endpoint().await;
        check_connectivity(&queue_url).await.unwrap();
        drop(_shutdown);
        check_connectivity(&queue_url).await.unwrap_err();
    }
}

#[cfg(test)]
mod tests {
    use super::*;

    #[test]
    fn test_queue_url_region() {
        let url = "https://sqs.eu-west-2.amazonaws.com/12345678910/test";
        let region = queue_url_region(url);
        assert_eq!(region, Some(Region::from_static("eu-west-2")));

        let url = "https://sqs.ap-south-1.amazonaws.com/12345678910/test";
        let region = queue_url_region(url);
        assert_eq!(region, Some(Region::from_static("ap-south-1")));

        let url = "http://localhost:4566/000000000000/test-queue";
        let region = queue_url_region(url);
        assert_eq!(region, None);
    }

    #[test]
    fn test_queue_url_endpoint() {
        let url = "https://sqs.eu-west-2.amazonaws.com/12345678910/test";
        let endpoint = queue_url_endpoint(url).unwrap();
        assert_eq!(endpoint, "https://sqs.eu-west-2.amazonaws.com");

        let url = "https://sqs.ap-south-1.amazonaws.com/12345678910/test";
        let endpoint = queue_url_endpoint(url).unwrap();
        assert_eq!(endpoint, "https://sqs.ap-south-1.amazonaws.com");

        let url = "http://localhost:4566/000000000000/test-queue";
        let endpoint = queue_url_endpoint(url).unwrap();
        assert_eq!(endpoint, "http://localhost:4566");

        let url = "http://localhost:4566/000000000000/test-queue";
        let endpoint = queue_url_endpoint(url).unwrap();
        assert_eq!(endpoint, "http://localhost:4566");
    }
}

#[cfg(all(test, feature = "sqs-localstack-tests"))]
mod localstack_tests {
    use aws_sdk_sqs::types::QueueAttributeName;

    use super::*;
    use crate::source::queue_sources::helpers::QueueReceiver;
    use crate::source::queue_sources::sqs_queue::test_helpers::{
        create_queue, get_localstack_sqs_client,
    };

    #[tokio::test]
    async fn test_check_connectivity() {
        let sqs_client = get_localstack_sqs_client().await.unwrap();
        let queue_url = create_queue(&sqs_client, "check-connectivity").await;
        check_connectivity(&queue_url).await.unwrap();
    }

    #[tokio::test]
    async fn test_receive_existing_msg_quickly() {
        let client = test_helpers::get_localstack_sqs_client().await.unwrap();
        let queue_url = test_helpers::create_queue(&client, "test-receive-existing-msg").await;
        let message = "hello world";
        test_helpers::send_message(&client, &queue_url, message).await;

        let queue = Arc::new(SqsQueue::try_new(queue_url).await.unwrap());
        let messages = tokio::time::timeout(
            Duration::from_millis(500),
            queue.clone().receive(5, Duration::from_secs(60)),
        )
        .await
        .unwrap()
        .unwrap();
        assert_eq!(messages.len(), 1);
        assert_eq!(messages[0].payload.as_slice(), message.as_bytes());

        // just assess that there are no errors for now
        queue
            .modify_deadlines(&messages[0].metadata.ack_id, Duration::from_secs(10))
            .await
            .unwrap();
        queue
            .acknowledge(&[messages[0].metadata.ack_id.clone()])
            .await
            .unwrap();
    }

    #[tokio::test]
    async fn test_acknowledge_larger_batch() {
        let client = test_helpers::get_localstack_sqs_client().await.unwrap();
        let queue_url = test_helpers::create_queue(&client, "test-ack-large").await;
        let message = "hello world";
        for _ in 0..20 {
            test_helpers::send_message(&client, &queue_url, message).await;
        }

        let queue: Arc<SqsQueue> = Arc::new(SqsQueue::try_new(queue_url.clone()).await.unwrap());
        let mut queue_receiver = QueueReceiver::new(queue.clone(), Duration::from_millis(200));
        let mut messages = Vec::new();
        for _ in 0..5 {
            let new_messages = queue_receiver
                .receive(20, Duration::from_secs(60))
                .await
                .unwrap();
            messages.extend(new_messages.into_iter());
        }
        assert_eq!(messages.len(), 20);
        let in_flight_count: usize = test_helpers::get_queue_attribute(
            &client,
            &queue_url,
            QueueAttributeName::ApproximateNumberOfMessagesNotVisible,
        )
        .await
        .parse()
        .unwrap();
        assert_eq!(in_flight_count, 20);

        let ack_ids = messages
            .iter()
            .map(|msg| msg.metadata.ack_id.clone())
            .collect::<Vec<_>>();

        queue.acknowledge(&ack_ids).await.unwrap();

        let in_flight_count: usize = test_helpers::get_queue_attribute(
            &client,
            &queue_url,
            QueueAttributeName::ApproximateNumberOfMessagesNotVisible,
        )
        .await
        .parse()
        .unwrap();
        assert_eq!(in_flight_count, 0);
    }

    #[tokio::test]
    async fn test_receive_wrong_queue() {
        let client = test_helpers::get_localstack_sqs_client().await.unwrap();
        let queue_url = test_helpers::create_queue(&client, "test-receive-existing-msg").await;
        let bad_queue_url = format!("{queue_url}wrong");
        let queue = Arc::new(SqsQueue::try_new(bad_queue_url).await.unwrap());
        tokio::time::timeout(
            Duration::from_millis(500),
            queue.clone().receive(5, Duration::from_secs(60)),
        )
        .await
        .unwrap()
        .unwrap_err();
    }
}


================================================
FILE: quickwit/quickwit-indexing/src/source/queue_sources/visibility.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::sync::{Arc, Weak};
use std::time::{Duration, Instant};

use anyhow::{Context, anyhow};
use async_trait::async_trait;
use quickwit_actors::{
    Actor, ActorContext, ActorExitStatus, ActorHandle, ActorState, Handler, Mailbox,
};
use serde_json::{Value as JsonValue, json};

use super::Queue;
use crate::source::SourceContext;

#[derive(Debug, Clone)]
pub(super) struct VisibilitySettings {
    /// The original deadline asked from the queue when polling the messages
    pub deadline_for_receive: Duration,
    /// The last deadline extension when the message reading is completed
    pub deadline_for_last_extension: Duration,
    /// The extension applied why the VisibilityTask to maintain the message visibility
    pub deadline_for_default_extension: Duration,
    /// Rhe timeout for the visibility extension request
    pub request_timeout: Duration,
    /// an extra margin that is subtracted from the expected deadline when
    /// asserting whether we are still in time to extend the visibility
    pub request_margin: Duration,
}

impl VisibilitySettings {
    /// The commit timeout gives us a first estimate on how long the processing
    /// will take for the messages. We could include other factors such as the
    /// message size.
    pub(super) fn from_commit_timeout(commit_timeout_secs: usize) -> Self {
        let commit_timeout = Duration::from_secs(commit_timeout_secs as u64);
        Self {
            deadline_for_receive: Duration::from_secs(120) + commit_timeout,
            deadline_for_last_extension: 2 * commit_timeout,
            deadline_for_default_extension: Duration::from_secs(60),
            request_timeout: Duration::from_secs(3),
            request_margin: Duration::from_secs(1),
        }
    }
}

#[derive(Debug)]
struct VisibilityTask {
    queue: Arc<dyn Queue>,
    ack_id: String,
    extension_count: u64,
    current_deadline: Instant,
    last_extension_requested: bool,
    visibility_settings: VisibilitySettings,
    ref_count: Weak<()>,
}

// A handle to the visibility actor. When dropped, the actor exits and the
// visibility isn't maintained anymore.
pub(super) struct VisibilityTaskHandle {
    mailbox: Mailbox<VisibilityTask>,
    actor_handle: ActorHandle<VisibilityTask>,
    ack_id: String,
    _ref_count: Arc<()>,
}

/// Spawns actor that ensures that the visibility of a given message
/// (represented by its ack_id) is extended when required. We prefer applying
/// ample margins in the extension process to avoid missing deadlines while also
/// keeping the number of extension requests (and associated cost) small.
pub(super) fn spawn_visibility_task(
    ctx: &SourceContext,
    queue: Arc<dyn Queue>,
    ack_id: String,
    current_deadline: Instant,
    visibility_settings: VisibilitySettings,
) -> VisibilityTaskHandle {
    let ref_count = Arc::new(());
    let weak_ref = Arc::downgrade(&ref_count);
    let task = VisibilityTask {
        queue,
        ack_id: ack_id.clone(),
        extension_count: 0,
        current_deadline,
        last_extension_requested: false,
        visibility_settings,
        ref_count: weak_ref,
    };
    let (mailbox, actor_handle) = ctx.spawn_actor().spawn(task);
    VisibilityTaskHandle {
        mailbox,
        actor_handle,
        ack_id,
        _ref_count: ref_count,
    }
}

impl VisibilityTask {
    async fn extend_visibility(
        &mut self,
        ctx: &ActorContext<Self>,
        extension: Duration,
    ) -> anyhow::Result<()> {
        let _zone = ctx.protect_zone();
        self.current_deadline = tokio::time::timeout(
            self.visibility_settings.request_timeout,
            self.queue.modify_deadlines(&self.ack_id, extension),
        )
        .await
        .context("deadline extension timed out")??;
        self.extension_count += 1;
        Ok(())
    }

    fn next_extension(&self) -> Duration {
        (self.current_deadline - Instant::now())
            - self.visibility_settings.request_timeout
            - self.visibility_settings.request_margin
    }
}

impl VisibilityTaskHandle {
    pub fn extension_failed(&self) -> bool {
        self.actor_handle.state() == ActorState::Failure
    }

    pub fn ack_id(&self) -> &str {
        &self.ack_id
    }

    pub async fn request_last_extension(self) -> anyhow::Result<()> {
        self.mailbox
            .ask_for_res(RequestLastExtension)
            .await
            .map_err(|e| anyhow!(e))?;
        Ok(())
    }
}

#[async_trait]
impl Actor for VisibilityTask {
    type ObservableState = JsonValue;

    fn name(&self) -> String {
        "QueueVisibilityTask".to_string()
    }

    async fn initialize(&mut self, ctx: &ActorContext<Self>) -> Result<(), ActorExitStatus> {
        let first_extension = self.next_extension();
        if first_extension.is_zero() {
            return Err(anyhow!("initial visibility deadline insufficient").into());
        }
        ctx.schedule_self_msg(first_extension, Loop);
        Ok(())
    }

    fn yield_after_each_message(&self) -> bool {
        false
    }

    fn observable_state(&self) -> Self::ObservableState {
        json!({
            "ack_id": self.ack_id,
            "extension_count": self.extension_count,
        })
    }
}

#[derive(Debug)]
struct Loop;

#[async_trait]
impl Handler<Loop> for VisibilityTask {
    type Reply = ();

    async fn handle(
        &mut self,
        _message: Loop,
        ctx: &ActorContext<Self>,
    ) -> Result<(), ActorExitStatus> {
        if self.ref_count.strong_count() == 0 {
            return Ok(());
        }
        if self.last_extension_requested {
            return Ok(());
        }
        self.extend_visibility(ctx, self.visibility_settings.deadline_for_default_extension)
            .await?;
        ctx.schedule_self_msg(self.next_extension(), Loop);
        Ok(())
    }
}

/// Ensures that the visibility of the message is extended using
/// deadline_for_last_extension and then stops the extension loop.
#[derive(Debug)]
struct RequestLastExtension;

#[async_trait]
impl Handler<RequestLastExtension> for VisibilityTask {
    type Reply = anyhow::Result<()>;

    async fn handle(
        &mut self,
        _message: RequestLastExtension,
        ctx: &ActorContext<Self>,
    ) -> Result<Self::Reply, ActorExitStatus> {
        let deadline_for_last_extension = self.visibility_settings.deadline_for_last_extension;
        let last_deadline = Instant::now() + deadline_for_last_extension;
        self.last_extension_requested = true;
        if last_deadline > self.current_deadline {
            Ok(self
                .extend_visibility(ctx, deadline_for_last_extension)
                .await)
        } else {
            Ok(Ok(()))
        }
    }
}

#[cfg(test)]
mod tests {
    use quickwit_actors::Universe;
    use tokio::sync::watch;

    use super::*;
    use crate::source::queue_sources::memory_queue::MemoryQueueForTests;

    #[tokio::test]
    async fn test_visibility_task_request_last_extension() {
        // actor context
        let universe = Universe::with_accelerated_time();
        let (source_mailbox, _source_inbox) = universe.create_test_mailbox();
        let (observable_state_tx, _observable_state_rx) = watch::channel(serde_json::Value::Null);
        let ctx: SourceContext =
            ActorContext::for_test(&universe, source_mailbox, observable_state_tx);
        // queue with test message
        let ack_id = "ack_id".to_string();
        let queue = Arc::new(MemoryQueueForTests::new());
        queue.send_message("test message".to_string(), &ack_id);
        let initial_deadline = queue
            .clone()
            .receive(1, Duration::from_secs(1))
            .await
            .unwrap()[0]
            .metadata
            .initial_deadline;
        // spawn task
        let visibility_settings = VisibilitySettings {
            deadline_for_default_extension: Duration::from_secs(1),
            deadline_for_last_extension: Duration::from_secs(5),
            deadline_for_receive: Duration::from_secs(1),
            request_timeout: Duration::from_millis(100),
            request_margin: Duration::from_millis(100),
        };
        let handle = spawn_visibility_task(
            &ctx,
            queue.clone(),
            ack_id.clone(),
            initial_deadline,
            visibility_settings.clone(),
        );
        // assert that the background task performs extensions
        assert!(!handle.extension_failed());
        tokio::time::sleep_until(initial_deadline.into()).await;
        let next_deadline = queue.next_visibility_deadline(&ack_id).unwrap();
        assert!(initial_deadline < next_deadline);
        assert!(!handle.extension_failed());
        handle.request_last_extension().await.unwrap();
        assert!(
            Instant::now() + Duration::from_secs(4)
                < queue.next_visibility_deadline(&ack_id).unwrap()
        );
        universe.assert_quit().await;
    }

    #[tokio::test]
    async fn test_visibility_task_stop_on_drop() {
        // actor context
        let universe = Universe::with_accelerated_time();
        let (source_mailbox, _source_inbox) = universe.create_test_mailbox();
        let (observable_state_tx, _observable_state_rx) = watch::channel(serde_json::Value::Null);
        let ctx: SourceContext =
            ActorContext::for_test(&universe, source_mailbox, observable_state_tx);
        // queue with test message
        let ack_id = "ack_id".to_string();
        let queue = Arc::new(MemoryQueueForTests::new());
        queue.send_message("test message".to_string(), &ack_id);
        let initial_deadline = queue
            .clone()
            .receive(1, Duration::from_secs(1))
            .await
            .unwrap()[0]
            .metadata
            .initial_deadline;
        // spawn task
        let visibility_settings = VisibilitySettings {
            deadline_for_default_extension: Duration::from_secs(1),
            deadline_for_last_extension: Duration::from_secs(20),
            deadline_for_receive: Duration::from_secs(1),
            request_timeout: Duration::from_millis(100),
            request_margin: Duration::from_millis(100),
        };
        let handle = spawn_visibility_task(
            &ctx,
            queue.clone(),
            ack_id.clone(),
            initial_deadline,
            visibility_settings.clone(),
        );
        // assert that visibility is not extended after drop
        drop(handle);
        tokio::time::sleep_until(initial_deadline.into()).await;
        // the message is either already expired or about to expire
        if let Some(next_deadline) = queue.next_visibility_deadline(&ack_id) {
            assert_eq!(next_deadline, initial_deadline);
        }
        // assert_eq!(q, None);
        universe.assert_quit().await;
    }
}


================================================
FILE: quickwit/quickwit-indexing/src/source/source_factory.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::HashMap;

use async_trait::async_trait;
use itertools::Itertools;
use quickwit_proto::metastore::SourceType;
use quickwit_proto::types::SourceId;
use thiserror::Error;

use super::Source;
use crate::source::SourceRuntime;

#[async_trait]
pub trait SourceFactory: Send + Sync + 'static {
    async fn create_source(&self, source_runtime: SourceRuntime)
    -> anyhow::Result<Box<dyn Source>>;
}

#[async_trait]
pub trait TypedSourceFactory: Send + Sync + 'static {
    type Source: Source;
    type Params: serde::de::DeserializeOwned + Send + Sync + 'static;

    async fn typed_create_source(
        source_runtime: SourceRuntime,
        source_params: Self::Params,
    ) -> anyhow::Result<Self::Source>;
}

#[async_trait]
impl<T: TypedSourceFactory> SourceFactory for T {
    async fn create_source(
        &self,
        source_runtime: SourceRuntime,
    ) -> anyhow::Result<Box<dyn Source>> {
        let typed_params: T::Params =
            serde_json::from_value(source_runtime.source_config.params())?;
        let source = Self::typed_create_source(source_runtime, typed_params).await?;
        Ok(Box::new(source))
    }
}

#[derive(Default)]
pub struct SourceLoader {
    type_to_factory: HashMap<SourceType, Box<dyn SourceFactory>>,
}

#[derive(Error, Debug)]
pub enum SourceLoaderError {
    #[error(
        "unknown source type `{requested_source_type}` (available source types are \
         {available_source_types})"
    )]
    UnknownSourceType {
        requested_source_type: SourceType,
        available_source_types: String, //< a comma separated list with the available source_type.
    },
    #[error("failed to create source `{source_id}` of type `{source_type}`. Cause: {error:?}")]
    FailedToCreateSource {
        source_id: SourceId,
        source_type: SourceType,
        #[source]
        error: anyhow::Error,
    },
}

impl SourceLoader {
    pub fn add_source<F: SourceFactory>(&mut self, source_type: SourceType, source_factory: F) {
        self.type_to_factory
            .insert(source_type, Box::new(source_factory));
    }

    pub async fn load_source(
        &self,
        source_runtime: SourceRuntime,
    ) -> Result<Box<dyn Source>, SourceLoaderError> {
        let source_type = source_runtime.source_config.source_type();
        let source_id = source_runtime.source_id().to_string();
        let source_factory = self.type_to_factory.get(&source_type).ok_or_else(|| {
            SourceLoaderError::UnknownSourceType {
                requested_source_type: source_type,
                available_source_types: self.type_to_factory.keys().join(", "),
            }
        })?;
        source_factory
            .create_source(source_runtime)
            .await
            .map_err(|error| SourceLoaderError::FailedToCreateSource {
                source_type,
                source_id,
                error,
            })
    }
}

#[cfg(test)]
mod tests {

    use std::num::NonZeroUsize;

    use quickwit_config::{SourceConfig, SourceInputFormat, SourceParams};
    use quickwit_proto::types::IndexUid;

    use crate::source::quickwit_supported_sources;
    use crate::source::tests::SourceRuntimeBuilder;

    #[tokio::test]
    async fn test_source_loader_success() -> anyhow::Result<()> {
        let source_loader = quickwit_supported_sources();
        let index_uid = IndexUid::new_with_random_ulid("test-index");
        let source_config = SourceConfig {
            source_id: "test-source".to_string(),
            num_pipelines: NonZeroUsize::MIN,
            enabled: true,
            source_params: SourceParams::void(),
            transform_config: None,
            input_format: SourceInputFormat::Json,
        };
        let source_runtime = SourceRuntimeBuilder::new(index_uid, source_config).build();
        source_loader.load_source(source_runtime).await?;
        Ok(())
    }
}


================================================
FILE: quickwit/quickwit-indexing/src/source/stdin_source.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::fmt;
use std::time::Duration;

use async_trait::async_trait;
use quickwit_actors::{ActorExitStatus, Mailbox};
use quickwit_common::Progress;
use quickwit_proto::metastore::SourceType;
use tokio::io::{AsyncBufReadExt, BufReader};

use super::{BATCH_NUM_BYTES_LIMIT, BatchBuilder};
use crate::actors::DocProcessor;
use crate::source::{Source, SourceContext, SourceRuntime, TypedSourceFactory};

pub struct StdinBatchReader {
    reader: BufReader<tokio::io::Stdin>,
    is_eof: bool,
}

impl StdinBatchReader {
    pub fn new() -> Self {
        Self {
            reader: BufReader::new(tokio::io::stdin()),
            is_eof: false,
        }
    }

    async fn read_batch(&mut self, source_progress: &Progress) -> anyhow::Result<BatchBuilder> {
        let mut batch_builder = BatchBuilder::new(SourceType::Stdin);
        while batch_builder.num_bytes < BATCH_NUM_BYTES_LIMIT {
            let mut buf = String::new();
            // stdin might be slow because it's depending on external
            // input (e.g. user typing on a keyboard)
            let bytes_read = source_progress
                .protect_future(self.reader.read_line(&mut buf))
                .await?;
            if bytes_read > 0 {
                batch_builder.add_doc(buf.into());
            } else {
                self.is_eof = true;
                break;
            }
        }

        Ok(batch_builder)
    }

    fn is_eof(&self) -> bool {
        self.is_eof
    }
}

pub struct StdinSource {
    reader: StdinBatchReader,
    num_bytes_processed: u64,
    num_lines_processed: u64,
}

impl fmt::Debug for StdinSource {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        write!(f, "StdinSource")
    }
}

#[async_trait]
impl Source for StdinSource {
    async fn emit_batches(
        &mut self,
        doc_processor_mailbox: &Mailbox<DocProcessor>,
        ctx: &SourceContext,
    ) -> Result<Duration, ActorExitStatus> {
        let batch_builder = self.reader.read_batch(ctx.progress()).await?;
        self.num_bytes_processed += batch_builder.num_bytes;
        self.num_lines_processed += batch_builder.docs.len() as u64;
        doc_processor_mailbox
            .send_message(batch_builder.build())
            .await?;
        if self.reader.is_eof() {
            ctx.send_exit_with_success(doc_processor_mailbox).await?;
            return Err(ActorExitStatus::Success);
        }

        Ok(Duration::ZERO)
    }

    fn name(&self) -> String {
        format!("{self:?}")
    }

    fn observable_state(&self) -> serde_json::Value {
        serde_json::json!({
            "num_bytes_processed": self.num_bytes_processed,
            "num_lines_processed": self.num_lines_processed,
        })
    }
}

pub struct StdinSourceFactory;

#[async_trait]
impl TypedSourceFactory for StdinSourceFactory {
    type Source = StdinSource;
    type Params = ();

    async fn typed_create_source(
        _source_runtime: SourceRuntime,
        _params: (),
    ) -> anyhow::Result<StdinSource> {
        Ok(StdinSource {
            reader: StdinBatchReader::new(),
            num_bytes_processed: 0,
            num_lines_processed: 0,
        })
    }
}


================================================
FILE: quickwit/quickwit-indexing/src/source/vec_source.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::fmt;
use std::time::Duration;

use async_trait::async_trait;
use quickwit_actors::{ActorExitStatus, Mailbox};
use quickwit_config::VecSourceParams;
use quickwit_metastore::checkpoint::{PartitionId, SourceCheckpointDelta};
use quickwit_proto::metastore::SourceType;
use quickwit_proto::types::{Position, SourceId};
use serde_json::Value as JsonValue;
use tracing::info;

use super::BatchBuilder;
use crate::actors::DocProcessor;
use crate::source::{Source, SourceContext, SourceRuntime, TypedSourceFactory};

pub struct VecSource {
    source_id: SourceId,
    source_params: VecSourceParams,
    next_item_idx: usize,
    partition: PartitionId,
}

impl fmt::Debug for VecSource {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        f.debug_struct("VecSource")
            .field("source_id", &self.source_id)
            .finish()
    }
}

pub struct VecSourceFactory;

#[async_trait]
impl TypedSourceFactory for VecSourceFactory {
    type Source = VecSource;
    type Params = VecSourceParams;
    async fn typed_create_source(
        source_runtime: SourceRuntime,
        source_params: VecSourceParams,
    ) -> anyhow::Result<Self::Source> {
        let checkpoint = source_runtime.fetch_checkpoint().await?;
        let partition = PartitionId::from(source_params.partition.as_str());
        let next_item_idx = checkpoint
            .position_for_partition(&partition)
            .map(|position| {
                position
                    .as_usize()
                    .expect("offset should be stored as usize")
                    + 1
            })
            .unwrap_or(0);
        Ok(VecSource {
            source_id: source_runtime.pipeline_id.source_id,
            source_params,
            partition,
            next_item_idx,
        })
    }
}

fn position_from_offset(offset: usize) -> Position {
    if offset == 0 {
        return Position::Beginning;
    }
    Position::offset(offset - 1)
}

#[async_trait]
impl Source for VecSource {
    async fn emit_batches(
        &mut self,
        batch_sink: &Mailbox<DocProcessor>,
        ctx: &SourceContext,
    ) -> Result<Duration, ActorExitStatus> {
        let mut batch_builder = BatchBuilder::new(SourceType::Vec);

        for doc in self.source_params.docs[self.next_item_idx..]
            .iter()
            .take(self.source_params.batch_num_docs)
            .cloned()
        {
            batch_builder.add_doc(doc);
        }
        if batch_builder.docs.is_empty() {
            info!("reached end of source");
            ctx.send_exit_with_success(batch_sink).await?;
            return Err(ActorExitStatus::Success);
        }
        let from_item_idx = self.next_item_idx;
        self.next_item_idx += batch_builder.docs.len();
        let to_item_idx = self.next_item_idx;

        batch_builder.checkpoint_delta = SourceCheckpointDelta::from_partition_delta(
            self.partition.clone(),
            position_from_offset(from_item_idx),
            position_from_offset(to_item_idx),
        )
        .unwrap();
        ctx.send_message(batch_sink, batch_builder.build()).await?;

        Ok(Duration::default())
    }

    fn name(&self) -> String {
        format!("{self:?}")
    }

    fn observable_state(&self) -> JsonValue {
        serde_json::json!({
            "next_item_idx": self.next_item_idx,
        })
    }
}

#[cfg(test)]
mod tests {
    use std::num::NonZeroUsize;

    use bytes::Bytes;
    use quickwit_actors::{Actor, Command, Universe};
    use quickwit_config::{SourceConfig, SourceInputFormat, SourceParams};
    use quickwit_proto::types::IndexUid;
    use serde_json::json;

    use super::*;
    use crate::models::RawDocBatch;
    use crate::source::SourceActor;
    use crate::source::tests::SourceRuntimeBuilder;

    #[tokio::test]
    async fn test_vec_source() -> anyhow::Result<()> {
        let universe = Universe::with_accelerated_time();
        let (doc_processor_mailbox, doc_processor_inbox) = universe.create_test_mailbox();
        let docs = std::iter::repeat_with(|| Bytes::from_static(b"{}"))
            .take(100)
            .collect();
        let params = VecSourceParams {
            docs,
            batch_num_docs: 3,
            partition: "partition".to_string(),
        };
        let index_uid = IndexUid::new_with_random_ulid("test-index");
        let source_config = SourceConfig {
            source_id: "test-vec-source".to_string(),
            num_pipelines: NonZeroUsize::MIN,
            enabled: true,
            source_params: SourceParams::Vec(params.clone()),
            transform_config: None,
            input_format: SourceInputFormat::Json,
        };
        let source_runtime = SourceRuntimeBuilder::new(index_uid, source_config).build();
        let vec_source = VecSourceFactory::typed_create_source(source_runtime, params).await?;
        let vec_source_actor = SourceActor {
            source: Box::new(vec_source),
            doc_processor_mailbox,
        };
        assert_eq!(
            vec_source_actor.name(),
            r#"VecSource { source_id: "test-vec-source" }"#
        );
        let (_vec_source_mailbox, vec_source_handle) =
            universe.spawn_builder().spawn(vec_source_actor);
        let (actor_termination, last_observation) = vec_source_handle.join().await;
        assert!(actor_termination.is_success());
        assert_eq!(last_observation, json!({"next_item_idx": 100u64}));
        let batches = doc_processor_inbox.drain_for_test();
        assert_eq!(batches.len(), 35);
        let raw_batch = batches[1].downcast_ref::<RawDocBatch>().unwrap();
        assert_eq!(
            format!("{:?}", raw_batch.checkpoint_delta),
            "∆(partition:(00000000000000000002..00000000000000000005])"
        );
        assert!(matches!(
            &batches[34].downcast_ref::<Command>().unwrap(),
            &Command::ExitWithSuccess
        ));
        Ok(())
    }

    #[tokio::test]
    async fn test_vec_source_from_checkpoint() -> anyhow::Result<()> {
        let universe = Universe::with_accelerated_time();
        let (doc_processor_mailbox, doc_processor_inbox) = universe.create_test_mailbox();
        let docs = (0..10).map(|i| Bytes::from(format!("{i}"))).collect();
        let params = VecSourceParams {
            docs,
            batch_num_docs: 3,
            partition: "".to_string(),
        };
        let index_uid = IndexUid::new_with_random_ulid("test-index");
        let source_config = SourceConfig {
            source_id: "test-vec-source".to_string(),
            num_pipelines: NonZeroUsize::MIN,
            enabled: true,
            source_params: SourceParams::Vec(params.clone()),
            transform_config: None,
            input_format: SourceInputFormat::Json,
        };
        let source_delta = SourceCheckpointDelta::from_range(0u64..2u64);
        let source_runtime = SourceRuntimeBuilder::new(index_uid, source_config)
            .with_mock_metastore(Some(source_delta))
            .build();
        let vec_source = VecSourceFactory::typed_create_source(source_runtime, params).await?;
        let vec_source_actor = SourceActor {
            source: Box::new(vec_source),
            doc_processor_mailbox,
        };
        let (_vec_source_mailbox, vec_source_handle) =
            universe.spawn_builder().spawn(vec_source_actor);
        let (actor_termination, last_observation) = vec_source_handle.join().await;
        assert!(actor_termination.is_success());
        assert_eq!(last_observation, json!({"next_item_idx": 10}));
        let messages = doc_processor_inbox.drain_for_test();
        let batch = messages[0].downcast_ref::<RawDocBatch>().unwrap();
        assert_eq!(&batch.docs[0], "2");
        Ok(())
    }
}


================================================
FILE: quickwit/quickwit-indexing/src/source/void_source.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::time::Duration;

use async_trait::async_trait;
use quickwit_actors::{ActorExitStatus, HEARTBEAT, Mailbox};
use quickwit_config::VoidSourceParams;
use serde_json::Value as JsonValue;

use crate::actors::DocProcessor;
use crate::source::{Source, SourceContext, SourceRuntime, TypedSourceFactory};

pub struct VoidSource;

#[async_trait]
impl Source for VoidSource {
    async fn emit_batches(
        &mut self,
        _: &Mailbox<DocProcessor>,
        _: &SourceContext,
    ) -> Result<Duration, ActorExitStatus> {
        tokio::time::sleep(*HEARTBEAT / 2).await;
        Ok(Duration::default())
    }

    fn name(&self) -> String {
        "VoidSource".to_string()
    }

    fn observable_state(&self) -> JsonValue {
        JsonValue::Object(Default::default())
    }
}

pub struct VoidSourceFactory;

#[async_trait]
impl TypedSourceFactory for VoidSourceFactory {
    type Source = VoidSource;

    type Params = VoidSourceParams;

    async fn typed_create_source(
        _source_runtime: SourceRuntime,
        _params: VoidSourceParams,
    ) -> anyhow::Result<VoidSource> {
        Ok(VoidSource)
    }
}

#[cfg(test)]
mod tests {

    use std::num::NonZeroUsize;

    use quickwit_actors::{Health, Supervisable, Universe};
    use quickwit_config::{SourceInputFormat, SourceParams};
    use quickwit_proto::types::IndexUid;
    use serde_json::json;

    use super::*;
    use crate::source::tests::SourceRuntimeBuilder;
    use crate::source::{SourceActor, SourceConfig, quickwit_supported_sources};

    #[tokio::test]
    async fn test_void_source_loading() {
        let index_uid = IndexUid::new_with_random_ulid("test-index");
        let source_config = SourceConfig {
            source_id: "test-void-source".to_string(),
            num_pipelines: NonZeroUsize::MIN,
            enabled: true,
            source_params: SourceParams::void(),
            transform_config: None,
            input_format: SourceInputFormat::Json,
        };
        let source_runtime = SourceRuntimeBuilder::new(index_uid, source_config).build();
        let source = quickwit_supported_sources()
            .load_source(source_runtime)
            .await
            .unwrap();
        assert_eq!(source.name(), "VoidSource");
    }

    #[tokio::test]
    async fn test_void_source_running() -> anyhow::Result<()> {
        let universe = Universe::with_accelerated_time();
        let index_uid = IndexUid::new_with_random_ulid("test-index");
        let source_config = SourceConfig {
            source_id: "test-void-source".to_string(),
            num_pipelines: NonZeroUsize::MIN,
            enabled: true,
            source_params: SourceParams::void(),
            transform_config: None,
            input_format: SourceInputFormat::Json,
        };
        let source_runtime = SourceRuntimeBuilder::new(index_uid, source_config).build();
        let void_source =
            VoidSourceFactory::typed_create_source(source_runtime, VoidSourceParams).await?;
        let (doc_processor_mailbox, _) = universe.create_test_mailbox();
        let void_source_actor = SourceActor {
            source: Box::new(void_source),
            doc_processor_mailbox,
        };
        let (_, void_source_handle) = universe.spawn_builder().spawn(void_source_actor);
        matches!(void_source_handle.check_health(true), Health::Healthy);
        let (actor_termination, observed_state) = void_source_handle.quit().await;
        assert_eq!(observed_state, json!({}));
        matches!(actor_termination, ActorExitStatus::Quit);
        Ok(())
    }
}


================================================
FILE: quickwit/quickwit-indexing/src/split_store/indexing_split_cache.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::BTreeMap;
use std::collections::btree_map::Entry;
use std::io;
use std::path::{Path, PathBuf};
use std::str::FromStr;
use std::time::{Duration, SystemTime};

use anyhow::Context;
use bytesize::ByteSize;
use quickwit_common::split_file;
use quickwit_directories::BundleDirectory;
use quickwit_storage::StorageResult;
use tantivy::Directory;
use tantivy::directory::MmapDirectory;
use tokio::sync::Mutex;
use tracing::{debug, error, warn};
use ulid::Ulid;

use super::SplitStoreQuota;

// TODO Make this configurable.
const SPLIT_MAX_AGE: Duration = Duration::from_secs(2 * 24 * 3_600); // 2 days

pub fn get_tantivy_directory_from_split_bundle(
    split_file: &Path,
) -> StorageResult<Box<dyn Directory>> {
    let mmap_directory = MmapDirectory::open(split_file.parent().ok_or_else(|| {
        io::Error::new(
            io::ErrorKind::NotFound,
            format!("couldn't find parent for {}", split_file.display()),
        )
    })?)?;
    let split_fileslice = mmap_directory.open_read(Path::new(&split_file))?;
    Ok(Box::new(BundleDirectory::open_split(split_fileslice)?))
}

/// Returns the number of bytes held in a given directory.
async fn num_bytes_in_folder(directory_path: &Path) -> io::Result<ByteSize> {
    let mut total_bytes = 0;
    let mut read_dir = tokio::fs::read_dir(directory_path).await?;
    while let Some(dir_entry) = read_dir.next_entry().await? {
        let metadata = dir_entry.metadata().await?;
        if metadata.is_file() {
            total_bytes += metadata.len();
        } else {
            warn!(
                "Unexpected directory found in split cache. {:?}",
                dir_entry.path()
            );
        }
    }
    Ok(ByteSize(total_bytes))
}

/// The local split store is a cache for freshly indexed splits.
///
/// In order to save the cost of an extra write, we store splits in the form
/// of a directory and the split bundles are built upon upload.
#[derive(Debug, Copy, Clone)]
struct SplitFolder {
    split_id: Ulid,
    num_bytes: ByteSize,
}

impl SplitFolder {
    /// Creates a new `SplitFolder`.
    ///
    /// There are no specific constraints on `path`.
    pub async fn create(split_id: &str, path: &Path) -> io::Result<Self> {
        let split_id = Ulid::from_str(split_id).map_err(|_err| {
            let error_msg = format!("split Id should be an ulid: got `{split_id}`");
            io::Error::new(io::ErrorKind::InvalidInput, error_msg)
        })?;
        let num_bytes = num_bytes_in_folder(path).await?;
        Ok(SplitFolder {
            split_id,
            num_bytes,
        })
    }

    /// Returns the creation time as encoded in the split id ULID.
    fn creation_time(&self) -> SystemTime {
        self.split_id.datetime()
    }
}

fn split_id_from_split_folder(dir_path: &Path) -> Option<&str> {
    dir_path.file_name()?.to_str()?.strip_suffix(".split")
}

/// The [`IndexingSplitCache`] is a local cache used to improve the performance of indexing nodes.
/// Its purpose is simple: when a new split is freshly created, it is usually merged
/// very rapidly after.
///
/// In order to prevent this merge from forcing its download, we store it in the
/// [`IndexingSplitCache`]. This store is just a cache: a cache miss is acceptable and
/// just means that the split will be downloaded again.
///
/// The indexing split cache eviction policy however, is rather uncommon.
/// On our happy path, a split is stored into the cache, and is then used only once
/// to undergo a merge.
///
/// For this reason, we simply offer a way to `move splits into the cache`,
/// and `move splits out of the cache`. A split is removed from the split cache
/// after its first access.
///
/// Of course a failed merge could require accessing a given split more than once. In that
/// case the split will be downloaded again.
///
/// The cache size is limited by 3 things:
/// - a maximum number of splits as defined in the `SplitStoreQuota`.
/// - a maximum number of bytes as defined in the `SplitStoreQuota`.
/// - finally, we evict older splits to make sure that the newest split and the oldest split only
///   differ by at most `SPLIT_MAX_AGE`.
///
/// The point of this final rule invariant is to make sure that the disk space will be
/// released if the cache is NOT under pressure but some splits are actually useless.
///
/// When adding a new split into the cache, if adding the split would break one of the following
/// limit, we simply remove split one by one starting by the oldest first, until the split
/// can be added.
pub struct IndexingSplitCache {
    inner: Mutex<InnerSplitCache>,
}

struct InnerSplitCache {
    split_registry: SplitFolderRegistry,
    split_store_folder: PathBuf,
}

struct SplitFolderRegistry {
    /// Splits owned by the local split store, which reside in the split_store_folder.
    ///
    /// Splits ids are generated using ULID, so that they are sorted
    /// according to their creation date.
    ///
    /// We evict the oldest split first. Note this is not an LRU strategy
    /// because we do not care about the last access time, but we only
    /// consider the creation time.
    split_folders: BTreeMap<Ulid, ByteSize>,
    /// The split store quota shared among all indexing split stores.
    split_store_quota: SplitStoreQuota,
}

impl SplitFolderRegistry {
    pub fn with_quota(split_store_quota: SplitStoreQuota) -> SplitFolderRegistry {
        SplitFolderRegistry {
            split_folders: BTreeMap::default(),
            split_store_quota,
        }
    }

    /// Returns an iterator over the split folders sorted by ULID.
    #[cfg(any(test, feature = "testsuite"))]
    fn iter(&self) -> impl Iterator<Item = SplitFolder> + '_ {
        self.split_folders
            .iter()
            .map(|(&split_id, &num_bytes)| SplitFolder {
                split_id,
                num_bytes,
            })
    }

    /// Returns whether the element was inserted or was already present
    fn insert(&mut self, split_folder: SplitFolder) -> bool {
        if let Entry::Vacant(entry) = self.split_folders.entry(split_folder.split_id) {
            entry.insert(split_folder.num_bytes);
            self.split_store_quota.add_split(split_folder.num_bytes);
            true
        } else {
            false
        }
    }

    /// Returns true if the split was indeed present in the registry
    fn remove(&mut self, split_id: Ulid) -> Option<SplitFolder> {
        let num_bytes = self.split_folders.remove(&split_id)?;
        self.split_store_quota.remove_split(num_bytes);
        Some(SplitFolder {
            num_bytes,
            split_id,
        })
    }

    /// Returns the oldest split (oldest in the sense of the ULID = creation time).
    fn oldest_split(&self) -> Option<Ulid> {
        let (split_id, _) = self.split_folders.first_key_value()?;
        Some(*split_id)
    }

    /// Removes the oldest split.
    fn pop_oldest(&mut self) -> Option<SplitFolder> {
        let oldest_split_id = self.oldest_split()?;
        self.remove(oldest_split_id)
    }

    fn quota(&self) -> &SplitStoreQuota {
        &self.split_store_quota
    }
}

impl InnerSplitCache {
    /// Moves a split within the store to an external folder.
    ///
    /// Returns `None` if the split is not available in the cache.
    async fn move_out(
        &mut self,
        split_id: Ulid,
        to_folder: &Path,
    ) -> StorageResult<Option<PathBuf>> {
        let Some(split_folder) = self.split_registry.remove(split_id) else {
            // The split is simply not in cache.
            return Ok(None);
        };
        let from_path = self.split_path(split_id);
        let to_full_path = to_folder.join(from_path.file_name().unwrap());

        // We voluntarily use a non async operation: A rename is supposed to be
        // quick, and we want to keep this operation as transactional as
        // possible. In particular, we don't want our task to be cancelled in the
        // middle of an inconsistent state.
        if let Err(io_err) = std::fs::rename(&from_path, &to_full_path) {
            // We do not simply rely on the `io::ErrorKind::NotFound` here
            // because it could be about the destination and not the origin.
            return match from_path.try_exists() {
                Ok(false) => {
                    // This could happen if some files have been manually
                    // deleted from the FS for instance.
                    warn!(from_path=%from_path.display(), to_full_path=%to_full_path.display(), error=%io_err, "cached split missing from local split directory");
                    Ok(None)
                }
                Ok(true) => {
                    // The file couldn't be copied out but is still in the
                    // cache, we put it back to the registry to keep the
                    // statistics accurate
                    warn!(from_path=%from_path.display(), to_full_path=%to_full_path.display(), error=%io_err, "split stuck in local split cache");
                    self.split_registry.insert(split_folder);
                    Ok(None)
                }
                Err(_) => {
                    // At this point, we are probably in an inconsistent state.
                    // The split has been removed from our registry but we don't
                    // know whether the files are still in the cache directory.
                    error!(from_path=%from_path.display(), to_full_path=%to_full_path.display(), error=%io_err, "failed to move split directory out of cache");
                    Err(From::from(io_err))
                }
            };
        }
        Ok(Some(to_full_path))
    }

    /// Returns the directory filepath of a split in cache.
    fn split_path(&self, split_id: Ulid) -> PathBuf {
        let split_file = split_file(split_id);
        self.split_store_folder.join(split_file)
    }

    /// Remove one split from the cache to make some room.
    ///
    /// # Panics
    /// Panics if there are no remaining splits.
    async fn evict_one_split(&mut self) -> io::Result<()> {
        let evicted_split = self
            .split_registry
            .pop_oldest()
            .expect("split cache should not be empty");
        let result = tokio::fs::remove_dir_all(&self.split_path(evicted_split.split_id)).await;
        if let Err(io_err) = result {
            if io_err.kind() == io::ErrorKind::NotFound {
                // This could happen if some files have been manually deleted
                // from the FS for instance.
                warn!(split_id=%evicted_split.split_id, "cached split missing from local split directory");
                return Ok(());
            } else {
                return Err(io_err);
            }
        }
        Ok(())
    }

    /// Tries to move a `split_folder` file into the cache.
    ///
    /// Move is not an image here. We are literally moving the directory.
    ///
    /// If the cache capacity does not allow it returns Ok(false).
    ///
    /// Ok(true) means the file was effectively accepted.
    async fn move_into_cache(&mut self, split_id_str: &str, split_path: &Path) -> io::Result<bool> {
        let split_folder = SplitFolder::create(split_id_str, split_path).await?;
        let split_id = split_folder.split_id;
        let should_move_split = self.make_room_and_record_split(split_folder).await?;
        if !should_move_split {
            return Ok(false);
        }
        let to_full_path = self.split_path(split_id);
        if let Err(io_err) = tokio::fs::rename(split_path, &to_full_path).await {
            // keep the registry stats accurate
            self.split_registry.remove(split_id);
            return Err(io_err);
        }
        Ok(true)
    }

    /// Removes all splits that have a creation date older than `limit`.
    async fn remove_splits_older_than_limit(&mut self, limit: SystemTime) -> io::Result<()> {
        while let Some(split_id) = self.split_registry.oldest_split() {
            if split_id.datetime() >= limit {
                break;
            }
            self.evict_one_split().await?;
        }
        Ok(())
    }

    /// Ensures that there is room to store the split:
    /// - return false if the split should not be added to the cache.
    /// - return true and record the split if the split should be moved into the cache.
    async fn make_room_and_record_split(&mut self, split_folder: SplitFolder) -> io::Result<bool> {
        // We don't accept splits that are too large.
        if split_folder.num_bytes > self.split_registry.quota().max_num_bytes() {
            return Ok(false);
        }

        while !self
            .split_registry
            .quota()
            .can_fit_split(split_folder.num_bytes)
        {
            self.evict_one_split().await?;
        }

        if let Some(creation_time_limit) = split_folder.creation_time().checked_sub(SPLIT_MAX_AGE) {
            self.remove_splits_older_than_limit(creation_time_limit)
                .await?;
        };
        Ok(self.split_registry.insert(split_folder))
    }
}

impl IndexingSplitCache {
    pub fn no_caching() -> IndexingSplitCache {
        let split_store_space_quota = SplitStoreQuota::no_caching();
        let inner = Mutex::new(InnerSplitCache {
            split_registry: SplitFolderRegistry::with_quota(split_store_space_quota),
            split_store_folder: PathBuf::from("no_caching"),
        });
        IndexingSplitCache { inner }
    }

    /// Try to open an existing local split store directory.
    ///
    /// If the directory does not exists, it will be created.
    ///
    /// The directory is expected to only contain directory
    /// with a name following the pattern `<ULID.split>`.
    ///
    /// The different pre-existing splits are recorded into
    /// the split store in their creation order. If the split store
    /// quota have been modified, the store will undergo the same
    /// eviction logic.
    pub async fn open(
        split_store_folder: PathBuf,
        space_quota: SplitStoreQuota,
    ) -> anyhow::Result<IndexingSplitCache> {
        tokio::fs::create_dir_all(&split_store_folder)
            .await
            .context("failed to create the split cache directory")?;

        let mut split_folders: Vec<SplitFolder> = Vec::new();

        let mut read_dir = tokio::fs::read_dir(&split_store_folder).await?;
        while let Some(dir_entry) = read_dir.next_entry().await? {
            let metadata = dir_entry.metadata().await?;
            let dir_path: PathBuf = dir_entry.path();

            if metadata.is_file() {
                warn!(
                    "unexpected file found in split cache directory: `{}`",
                    dir_path.display()
                );
                continue;
            }

            let split_id = split_id_from_split_folder(&dir_path).ok_or_else(|| {
                let error_msg = format!(
                    "split folder name should match the format `<split_id>.split`: got `{}`",
                    dir_path.display()
                );
                io::Error::new(io::ErrorKind::InvalidInput, error_msg)
            })?;

            let split_folder = SplitFolder::create(split_id, &dir_entry.path()).await?;
            split_folders.push(split_folder);
        }

        let mut inner_local_split_store = InnerSplitCache {
            split_store_folder: split_store_folder.clone(),
            split_registry: SplitFolderRegistry::with_quota(space_quota),
        };

        split_folders.sort_by_key(SplitFolder::creation_time);

        // We record all `split_folder`, sorted by `creation_time`.
        for split_folder in split_folders {
            let split_id = split_folder.split_id;
            if !inner_local_split_store
                .make_room_and_record_split(split_folder)
                .await?
            {
                let split_dir = inner_local_split_store.split_path(split_id);
                tokio::fs::remove_dir_all(&split_dir).await?;
            }
        }

        Ok(IndexingSplitCache {
            inner: Mutex::new(inner_local_split_store),
        })
    }

    #[cfg(any(test, feature = "testsuite"))]
    pub async fn inspect_registry(&self) -> std::collections::HashMap<String, ByteSize> {
        self.inner
            .lock()
            .await
            .split_registry
            .iter()
            .map(|split_folder| (split_folder.split_id.to_string(), split_folder.num_bytes))
            .collect()
    }

    #[cfg(any(test, feature = "testsuite"))]
    pub async fn inspect_quota(&self) -> SplitStoreQuota {
        self.inner
            .lock()
            .await
            .split_registry
            .split_store_quota
            .clone()
    }

    /// Returns a cached split to performs a merge operation.
    ///
    /// For simplicity, this method optimistically assumes that the merge operation will be
    /// successful and removes the split from the cache.
    ///
    /// If the merge operation is a failure and needs to be re-executed, we will
    /// experience a cache miss, and the split will be downloaded from the
    /// storage.
    pub(super) async fn get_cached_split(
        &self,
        split_id: &str,
        output_dir_path: &Path,
    ) -> StorageResult<Option<PathBuf>> {
        let mut split_store_lock = self.inner.lock().await;
        let split_ulid = if let Ok(split_ulid) = Ulid::from_str(split_id) {
            split_ulid
        } else {
            return Ok(None);
        };
        let split_file_opt: Option<PathBuf> = split_store_lock
            .move_out(split_ulid, output_dir_path)
            .await?;
        if split_file_opt.is_none() {
            debug!(split_id, "split folder not in cache");
        }
        Ok(split_file_opt)
    }

    /// Tries to move a `split_folder` file into the cache.
    ///
    /// Move is not an image here. We are literally moving the directory.
    ///
    /// If the cache capacity does not allow it, this function
    /// just logs a warning and returns Ok(false).
    ///
    /// Ok(true) means the file was effectively accepted.
    pub(super) async fn move_into_cache(
        &self,
        split_id: &str,
        split_path: &Path,
    ) -> io::Result<bool> {
        assert!(split_path.is_dir());
        let mut inner = self.inner.lock().await;
        inner.move_into_cache(split_id, split_path).await
    }
}

#[cfg(test)]
mod tests {
    use std::fs::File;
    use std::io;
    use std::io::Write;
    use std::path::Path;
    use std::time::Duration;

    use bytesize::ByteSize;
    use quickwit_directories::BundleDirectory;
    use quickwit_storage::{PutPayload, SplitPayloadBuilder};
    use tantivy::Directory;
    use tantivy::directory::FileSlice;
    use tempfile::tempdir;
    use tokio::fs;
    use ulid::Ulid;

    use super::SPLIT_MAX_AGE;
    use crate::split_store::{IndexingSplitCache, SplitStoreQuota};

    async fn create_fake_split(
        split_cache_path: &Path,
        split_id: &str,
        len: usize,
    ) -> io::Result<()> {
        let split_path = split_cache_path.join(format!("{split_id}.split"));
        fs::create_dir(&split_path).await?;
        fs::write(split_path.join("splitdata"), &vec![0u8; len]).await?;
        Ok(())
    }

    #[tokio::test]
    async fn test_local_split_store_load_existing_splits() -> anyhow::Result<()> {
        let temp_dir = tempfile::tempdir()?;
        let split_id1 = "01GF5449X7DA53TK9F9W2ZJST2";
        let split_id2 = "01GF545472A06WY07SEHGCJF9P";
        create_fake_split(temp_dir.path(), split_id1, 15).await?;
        create_fake_split(temp_dir.path(), split_id2, 13).await?;
        let split_store_space_quota = SplitStoreQuota::default();
        let split_store =
            IndexingSplitCache::open(temp_dir.path().to_path_buf(), split_store_space_quota)
                .await?;
        let cache_content = split_store.inspect_registry().await;
        assert_eq!(cache_content.len(), 2);
        assert_eq!(cache_content.get(split_id1).cloned(), Some(ByteSize(15)));
        assert_eq!(cache_content.get(split_id2).cloned(), Some(ByteSize(13)));
        Ok(())
    }

    #[tokio::test]
    async fn test_create_with_too_many_files() {
        let dir = tempdir().unwrap();
        create_fake_split(dir.path(), "01GF5215TMV48JT7GZ543BV193", 12)
            .await
            .unwrap(); // 1
        create_fake_split(dir.path(), "01GF520MTTRNCCTQZE264BBYWM", 23)
            .await
            .unwrap(); // 0
        create_fake_split(dir.path(), "01GF521M316V9AEHZWTHN76F2V", 5)
            .await
            .unwrap(); // 3
        create_fake_split(dir.path(), "01GF521CZC1260V8QPA81T46X7", 45)
            .await
            .unwrap(); // 2
        let split_store_space_quota = SplitStoreQuota::try_new(2, ByteSize::kb(1)).unwrap();
        let local_split_store =
            IndexingSplitCache::open(dir.path().to_path_buf(), split_store_space_quota)
                .await
                .unwrap();
        assert_eq!(local_split_store.inspect_registry().await.len(), 2);
        let quota = local_split_store.inspect_quota().await;
        assert_eq!(quota.used_num_bytes(), ByteSize(50));
    }

    #[tokio::test]
    async fn test_create_with_exceeds_num_bytes() {
        let dir = tempdir().unwrap();
        create_fake_split(dir.path(), "01GF5215TMV48JT7GZ543BV193", 12)
            .await
            .unwrap(); // 1
        create_fake_split(dir.path(), "01GF520MTTRNCCTQZE264BBYWM", 23)
            .await
            .unwrap(); // 0
        create_fake_split(dir.path(), "01GF521M316V9AEHZWTHN76F2V", 5)
            .await
            .unwrap(); // 3
        create_fake_split(dir.path(), "01GF521CZC1260V8QPA81T46X7", 45)
            .await
            .unwrap(); // 2
        let split_store_space_quota = SplitStoreQuota::try_new(6, ByteSize(61)).unwrap();
        let local_split_store =
            IndexingSplitCache::open(dir.path().to_path_buf(), split_store_space_quota)
                .await
                .unwrap();
        let cache_content = local_split_store.inspect_registry().await;
        assert_eq!(cache_content.len(), 2);
        assert_eq!(cache_content.values().map(|v| v.as_u64()).sum::<u64>(), 50);
        let quota = local_split_store.inspect_quota().await;
        assert_eq!(quota.used_num_bytes(), ByteSize(50));
    }

    #[tokio::test]
    async fn test_big_split_evicts_all() {
        let dir = tempdir().unwrap();
        create_fake_split(dir.path(), "01GF5215TMV48JT7GZ543BV193", 100)
            .await
            .unwrap(); // 1
        create_fake_split(dir.path(), "01GF520MTTRNCCTQZE264BBYWM", 100)
            .await
            .unwrap(); // 0
        create_fake_split(dir.path(), "01GF521M316V9AEHZWTHN76F2V", 100)
            .await
            .unwrap(); // 3
        create_fake_split(dir.path(), "01GF521CZC1260V8QPA81T46X7", 100)
            .await
            .unwrap(); // 2
        let split_store_space_quota = SplitStoreQuota::try_new(6, ByteSize::b(401)).unwrap();
        let local_split_store =
            IndexingSplitCache::open(dir.path().to_path_buf(), split_store_space_quota)
                .await
                .unwrap();
        assert_eq!(local_split_store.inspect_registry().await.len(), 4);

        let extra_split = tempdir().unwrap();
        fs::write(extra_split.path().join("splitdata"), &vec![0u8; 400])
            .await
            .unwrap();
        local_split_store
            .move_into_cache("01GFCZJBMBMEPMAQSFD09VTST2", extra_split.path())
            .await
            .unwrap();
        assert_eq!(local_split_store.inspect_registry().await.len(), 1);
        let quota = local_split_store.inspect_quota().await;
        assert_eq!(quota.used_num_bytes(), ByteSize(400));
    }

    #[tokio::test]
    async fn test_remove_splits_out_of_age() {
        let dir = tempdir().unwrap();
        // 2022-10-13T06:12:37.643Z
        create_fake_split(dir.path(), "01GF7ZJBMBMEPMAQSFD09VTST2", 1)
            .await
            .unwrap();
        // 2022-10-12T20:53:23.211Z
        create_fake_split(dir.path(), "01GF6ZJBMBMEPMAQSFD09VTST2", 1)
            .await
            .unwrap();
        // 2022-10-12T02:14:54.347Z
        create_fake_split(dir.path(), "01GF4ZJBMBMEPMAQSFD09VTST2", 1)
            .await
            .unwrap();
        // 2022-10-10T22:17:11.051Z
        create_fake_split(dir.path(), "01GF1ZJBMBMEPMAQSFD09VTST2", 1)
            .await
            .unwrap();
        let split_store_space_quota = SplitStoreQuota::try_new(6, ByteSize(100)).unwrap();
        let local_split_store =
            IndexingSplitCache::open(dir.path().to_path_buf(), split_store_space_quota)
                .await
                .unwrap();
        let cache_content = local_split_store.inspect_registry().await;
        assert_eq!(cache_content.len(), 3);

        // adding a split with a large time gap only keeps splits younger than SPLIT_MAX_AGE
        assert_eq!(
            SPLIT_MAX_AGE,
            Duration::from_secs(2 * 24 * 3_600),
            "update this test if SPLIT_MAX_AGE changes"
        );
        {
            let extra_split = tempdir().unwrap();
            local_split_store
                // 2022-10-15T4:48:49.803Z
                .move_into_cache("01GFCZJBMBMEPMAQSFD09VTST2", extra_split.path())
                .await
                .unwrap();
            let cache_content = local_split_store.inspect_registry().await;
            assert_eq!(cache_content.len(), 2);
            let quota = local_split_store.inspect_quota().await;
            assert_eq!(quota.used_num_bytes(), ByteSize(1));
        }
        {
            // adding a split with a huge time gap should empty the cache entirely first
            let extra_split = tempdir().unwrap();
            let was_accepted = local_split_store
                // 2025-01-13T14:28:17.364Z
                .move_into_cache("01JHG11FAM8F2XPWHY24R3HF6M", extra_split.path())
                .await
                .unwrap();
            assert!(was_accepted);
            let cache_content = local_split_store.inspect_registry().await;
            assert_eq!(cache_content.len(), 1);
            let quota = local_split_store.inspect_quota().await;
            assert_eq!(quota.used_num_bytes(), ByteSize(0));
        }
    }

    #[tokio::test]
    async fn test_stream_split_to_bundle_and_open() {
        let temp_dir = tempfile::tempdir().unwrap();
        let test_filepath1 = temp_dir.path().join("f1");
        let test_filepath2 = temp_dir.path().join("f2");
        let mut file1 = File::create(&test_filepath1).unwrap();
        file1.write_all(b"ab").unwrap();
        let mut file2 = File::create(&test_filepath2).unwrap();
        file2.write_all(b"def").unwrap();
        let split_streamer = SplitPayloadBuilder::get_split_payload(
            &[test_filepath1, test_filepath2],
            &[],
            b"hotcache",
        )
        .unwrap();
        let data = split_streamer.read_all().await.unwrap();
        let bundle_dir = BundleDirectory::open_split(FileSlice::from(data.to_vec())).unwrap();
        let f1_data = bundle_dir.atomic_read(Path::new("f1")).unwrap();
        assert_eq!(&*f1_data, b"ab");
        let f2_data = bundle_dir.atomic_read(Path::new("f2")).unwrap();
        assert_eq!(&f2_data[..], b"def");
    }

    #[tokio::test]
    async fn test_store_and_fetch() {
        let temp_dir_in = tempfile::tempdir().unwrap();
        let split_id = Ulid::default().to_string();
        let cache_dir = tempfile::tempdir().unwrap();
        let quota = SplitStoreQuota::default();
        let local_store = IndexingSplitCache::open(cache_dir.path().to_path_buf(), quota)
            .await
            .unwrap();
        {
            let split_dir = temp_dir_in.path().join(format!("scratch_{split_id}"));
            tokio::fs::create_dir(&split_dir).await.unwrap();
            assert!(
                local_store
                    .move_into_cache(&split_id, &split_dir)
                    .await
                    .unwrap()
            );
            assert!(!split_dir.try_exists().unwrap());
        }
        {
            let split_path = local_store
                .get_cached_split(&split_id, temp_dir_in.path())
                .await
                .unwrap()
                .unwrap();
            assert!(split_path.try_exists().unwrap());
            assert_eq!(split_path.parent().unwrap(), temp_dir_in.path());
        }
        {
            // cache miss because the previous get_cached_split removed the split from the cache
            let split_path_opt = local_store
                .get_cached_split(&split_id, temp_dir_in.path())
                .await
                .unwrap();
            assert_eq!(split_path_opt, None);
        }
    }

    async fn clear_dir_manually(dir: &Path) {
        let mut entries = fs::read_dir(dir).await.unwrap();
        while let Some(entry) = entries.next_entry().await.unwrap() {
            let path = entry.path();
            if path.is_dir() {
                fs::remove_dir_all(&path).await.unwrap();
            } else {
                fs::remove_file(&path).await.unwrap();
            }
        }
    }

    #[tokio::test]
    async fn test_fetch_manually_deleted_split() {
        let dir = tempdir().unwrap();
        create_fake_split(dir.path(), "01GF5215TMV48JT7GZ543BV193", 100)
            .await
            .unwrap();
        let split_store_space_quota = SplitStoreQuota::try_new(6, ByteSize::b(401)).unwrap();
        let local_split_store =
            IndexingSplitCache::open(dir.path().to_path_buf(), split_store_space_quota)
                .await
                .unwrap();
        assert_eq!(local_split_store.inspect_registry().await.len(), 1);

        clear_dir_manually(dir.path()).await;

        let target_dir = tempdir().unwrap();
        let path_opt = local_split_store
            .get_cached_split("01GF5215TMV48JT7GZ543BV193", target_dir.path())
            .await
            .unwrap();
        assert_eq!(path_opt, None);
        assert_eq!(local_split_store.inspect_registry().await.len(), 0);
        let quota = local_split_store.inspect_quota().await;
        assert_eq!(quota.used_num_bytes(), ByteSize(0));
    }

    #[tokio::test]
    async fn test_evict_manually_deleted_split() {
        let dir = tempdir().unwrap();
        // // 2022-10-12T20:53:23.211Z
        create_fake_split(dir.path(), "01GF6ZJBMBMEPMAQSFD09VTST2", 100)
            .await
            .unwrap();
        let split_store_space_quota = SplitStoreQuota::try_new(1, ByteSize::b(401)).unwrap();
        let local_split_store =
            IndexingSplitCache::open(dir.path().to_path_buf(), split_store_space_quota)
                .await
                .unwrap();
        assert_eq!(local_split_store.inspect_registry().await.len(), 1);

        clear_dir_manually(dir.path()).await;

        let extra_split = tempdir().unwrap();
        let was_accepted = local_split_store
            // 2022-10-12T02:14:54.347Z
            .move_into_cache("01GF4ZJBMBMEPMAQSFD09VTST2", extra_split.path())
            .await
            .unwrap();
        assert!(was_accepted);
        assert_eq!(local_split_store.inspect_registry().await.len(), 1);
        let quota = local_split_store.inspect_quota().await;
        assert_eq!(quota.used_num_bytes(), ByteSize(0));
    }

    #[tokio::test]
    async fn test_load_same_split_twice() {
        let temp_dir = tempfile::tempdir().unwrap();
        let split_id = "01GF5449X7DA53TK9F9W2ZJST2";
        create_fake_split(temp_dir.path(), split_id, 15)
            .await
            .unwrap();
        let split_store_space_quota = SplitStoreQuota::default();
        let split_store =
            IndexingSplitCache::open(temp_dir.path().to_path_buf(), split_store_space_quota)
                .await
                .unwrap();

        let extra_split = tempdir().unwrap();
        let extra_split_filepath = temp_dir.path().join("splitfile");
        let mut extra_split_file = File::create(&extra_split_filepath).unwrap();
        extra_split_file.write_all(&[0u8; 15]).unwrap();

        let was_accepted = split_store
            .move_into_cache(split_id, extra_split.path())
            .await
            .unwrap();
        assert!(!was_accepted);
        let quota = split_store.inspect_quota().await;
        assert_eq!(quota.used_num_bytes(), ByteSize(15));
    }
}


================================================
FILE: quickwit/quickwit-indexing/src/split_store/indexing_split_store.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#[cfg(any(test, feature = "testsuite"))]
use std::collections::HashMap;
use std::path::{Path, PathBuf};
use std::sync::Arc;
use std::time::Instant;

use anyhow::Context;
#[cfg(any(test, feature = "testsuite"))]
use bytesize::ByteSize;
use quickwit_common::io::{IoControls, IoControlsAccess};
use quickwit_common::uri::Uri;
use quickwit_metastore::SplitMetadata;
use quickwit_storage::{PutPayload, Storage, StorageResult};
use tantivy::Directory;
use tantivy::directory::{Advice, MmapDirectory};
use time::OffsetDateTime;
use tracing::{Instrument, debug, info_span, instrument};

use super::IndexingSplitCache;
use crate::get_tantivy_directory_from_split_bundle;

/// IndexingSplitStore is a wrapper around a regular `Storage` to upload and
/// download splits while allowing for efficient caching.
///
/// We typically index with a limited amount of RAM or some constraints on the
/// expected time-to-search.
/// Because of these constraints, the indexer produces splits that are smaller
/// than optimal and need to be merged.
///
/// A split therefore typically undergoes a few merges relatively shortly after
/// its creation.
///
/// In order to alleviate the disk IO as well as the network bandwidth,
/// we save new splits into a split store.
///
/// The role of the `IndexingSplitStore` is to combine a cache and a storage
/// to avoid unnecessary download of fresh splits. Its behavior are however very different
/// from a usual cache as we have a strong knowledge of the split lifecycle.
///
/// The splits are stored on the local filesystem in the `IndexingSplitCache`.
#[derive(Clone)]
pub struct IndexingSplitStore {
    inner: Arc<InnerIndexingSplitStore>,
}

struct InnerIndexingSplitStore {
    /// The remote storage.
    remote_storage: Arc<dyn Storage>,
    split_cache: Arc<IndexingSplitCache>,
}

impl IndexingSplitStore {
    /// Creates an instance of [`IndexingSplitStore`]
    ///
    /// It needs the remote storage to work with.
    pub fn new(remote_storage: Arc<dyn Storage>, split_cache: Arc<IndexingSplitCache>) -> Self {
        let inner = InnerIndexingSplitStore {
            remote_storage,
            split_cache,
        };
        Self {
            inner: Arc::new(inner),
        }
    }

    /// Helper function to create a indexing split store for tests.
    /// The resulting store does not have any local cache.
    pub fn create_without_local_store_for_test(remote_storage: Arc<dyn Storage>) -> Self {
        let inner = InnerIndexingSplitStore {
            remote_storage,
            split_cache: Arc::new(IndexingSplitCache::no_caching()),
        };
        IndexingSplitStore {
            inner: Arc::new(inner),
        }
    }

    pub fn remote_uri(&self) -> &Uri {
        self.inner.remote_storage.uri()
    }

    fn split_path(&self, split_id: &str) -> PathBuf {
        PathBuf::from(quickwit_common::split_file(split_id))
    }

    /// Stores a split.
    ///
    /// If a split is identified as mature by the merge policy,
    /// it will not be cached into the local storage.
    ///
    /// In order to limit the write IO, the file might be moved (and not copied into
    /// the store).
    /// In other words, after calling this function the file will not be available
    /// at `split_folder` anymore.
    #[instrument("store_split", skip_all)]
    pub async fn store_split(
        &self,
        split: &SplitMetadata,
        split_folder_path: &Path,
        put_payload: Box<dyn PutPayload>,
    ) -> anyhow::Result<()> {
        let start = Instant::now();
        let split_num_bytes = put_payload.len();

        let key = self.split_path(split.split_id());
        let is_mature = split.is_mature(OffsetDateTime::now_utc());
        self.inner
            .remote_storage
            .put(&key, put_payload)
            .instrument(info_span!("store_split_in_remote_storage", split=?split.split_id(), is_mature=is_mature, num_bytes=split_num_bytes))
            .await
            .with_context(|| {
                format!(
                    "failed uploading key {} in bucket {}",
                    key.display(),
                    self.inner.remote_storage.uri()
                )
            })?;

        let elapsed_secs = start.elapsed().as_secs_f32();
        let split_size_in_megabytes = split_num_bytes as f32 / 1_000_000f32;
        let throughput_mb_s = split_size_in_megabytes / elapsed_secs;

        debug!(
            split_size_in_megabytes = %split_size_in_megabytes,
            num_docs = %split.num_docs,
            elapsed_secs = %elapsed_secs,
            throughput_mb_s = %throughput_mb_s,
            is_mature = is_mature,
            "store-split-remote-success"
        );

        if !is_mature {
            debug!("store-in-cache");
            if self
                .inner
                .split_cache
                .move_into_cache(split.split_id(), split_folder_path)
                .await?
            {
                return Ok(());
            }
        }
        tokio::fs::remove_dir_all(split_folder_path).await?;
        Ok(())
    }

    /// Gets a split from the split store, and makes it available to the given `output_path`.
    /// If the split is available in the local disk cache, then it will be moved
    /// from the cache to the `output_dir_path`.
    ///
    /// The output_path is expected to be a directory path.
    ///
    /// If not, it will be fetched from the remote `Storage`.
    ///
    /// # Implementation detail:
    ///
    /// Depending on whether the split was obtained from the `Storage`
    /// or the cache, it could consist in a directly or a proper split file.
    /// This method takes care of the dealing with opening the split correctly.
    ///
    /// As we fetch the split, we optimistically assume that this is for a merge
    /// operation that will be successful and we remove the split from the cache.
    #[instrument(skip(self, output_dir_path, io_controls), fields(cache_hit))]
    pub async fn fetch_and_open_split(
        &self,
        split_id: &str,
        output_dir_path: &Path,
        io_controls: &IoControls,
    ) -> StorageResult<Box<dyn Directory>> {
        let path = PathBuf::from(quickwit_common::split_file(split_id));
        if let Some(split_path) = self
            .inner
            .split_cache
            .get_cached_split(split_id, output_dir_path)
            .await?
        {
            tracing::Span::current().record("cache_hit", true);
            let mmap_directory: Box<dyn Directory> = Box::new(MmapDirectory::open_with_madvice(
                split_path,
                Advice::Sequential,
            )?);
            return Ok(mmap_directory);
        } else {
            tracing::Span::current().record("cache_hit", false);
        }
        let dest_filepath = output_dir_path.join(&path);
        let dest_file = tokio::fs::File::create(&dest_filepath).await?;
        let mut dest_file_with_write_limit = io_controls.clone().wrap_write(dest_file);
        self.inner
            .remote_storage
            .copy_to(&path, &mut dest_file_with_write_limit)
            .instrument(info_span!("fetch_split_from_remote_storage", path=?path))
            .await?;
        get_tantivy_directory_from_split_bundle(&dest_filepath)
    }

    /// Takes a snapshot of the cache view (only used for testing).
    #[cfg(any(test, feature = "testsuite"))]
    pub async fn inspect_split_cache(&self) -> HashMap<String, ByteSize> {
        self.inner.split_cache.inspect_registry().await
    }
}

#[cfg(test)]
mod tests {
    use std::sync::Arc;
    use std::time::Duration;

    use bytesize::ByteSize;
    use quickwit_common::io::IoControls;
    use quickwit_metastore::{SplitMaturity, SplitMetadata};
    use quickwit_storage::{PutPayload, RamStorage, SplitPayloadBuilder};
    use tempfile::tempdir;
    use time::OffsetDateTime;
    use tokio::fs;
    use ulid::Ulid;

    use super::IndexingSplitStore;
    use crate::split_store::{IndexingSplitCache, SplitStoreQuota};

    fn create_test_split_metadata(split_id: &str) -> SplitMetadata {
        SplitMetadata {
            split_id: split_id.to_string(),
            create_timestamp: OffsetDateTime::now_utc().unix_timestamp(),
            maturity: SplitMaturity::Immature {
                maturation_period: Duration::from_secs(3600),
            },
            ..Default::default()
        }
    }

    #[tokio::test]
    async fn test_local_store_cache_in_and_out() -> anyhow::Result<()> {
        let temp_dir = tempfile::tempdir()?;
        let split_cache_dir = tempdir()?;

        let split_cache = IndexingSplitCache::open(
            split_cache_dir.path().to_path_buf(),
            SplitStoreQuota::default(),
        )
        .await?;
        let remote_storage = Arc::new(RamStorage::default());
        let split_store = IndexingSplitStore::new(remote_storage, Arc::new(split_cache));

        let split_id1 = Ulid::new().to_string();
        let split_id2 = Ulid::new().to_string();

        {
            let split1_dir = temp_dir.path().join(&split_id1);
            fs::create_dir_all(&split1_dir).await?;
            let split_metadata1 = create_test_split_metadata(&split_id1);
            fs::write(split1_dir.join("splitfile"), b"1234").await?;
            split_store
                .store_split(&split_metadata1, &split1_dir, Box::new(b"1234".to_vec()))
                .await?;
            assert!(!split1_dir.try_exists()?);
            assert!(
                split_cache_dir
                    .path()
                    .join(format!("{split_id1}.split"))
                    .try_exists()?
            );
            let local_store_stats = split_store.inspect_split_cache().await;
            assert_eq!(local_store_stats.len(), 1);
            assert_eq!(
                local_store_stats.get(&split_id1).cloned(),
                Some(ByteSize(4))
            );
        }
        {
            let split2_dir = temp_dir.path().join(&split_id2);
            fs::create_dir_all(&split2_dir).await?;
            fs::write(split2_dir.join("splitfile"), b"567").await?;
            let split_metadata2 = create_test_split_metadata(&split_id2);
            split_store
                .store_split(&split_metadata2, &split2_dir, Box::new(b"567".to_vec()))
                .await?;
            assert!(!split2_dir.try_exists()?);
            assert!(
                split_cache_dir
                    .path()
                    .join(format!("{split_id2}.split"))
                    .try_exists()?
            );
        }

        let local_store_stats = split_store.inspect_split_cache().await;
        assert_eq!(local_store_stats.len(), 2);
        assert_eq!(
            local_store_stats.get(&split_id1).cloned(),
            Some(ByteSize(4))
        );
        assert_eq!(
            local_store_stats.get(&split_id2).cloned(),
            Some(ByteSize(3))
        );

        let io_controls = IoControls::default();
        {
            let output = tempfile::tempdir()?;
            let split1 = split_store
                .fetch_and_open_split(&split_id1, output.path(), &io_controls)
                .await?;
            let local_store_stats = split_store.inspect_split_cache().await;
            assert_eq!(local_store_stats.len(), 1);
            assert!(split1.exists(std::path::Path::new("splitfile")).unwrap());
        }
        {
            let output = tempfile::tempdir()?;
            let split2 = split_store
                .fetch_and_open_split(&split_id2, output.path(), &io_controls)
                .await?;
            let local_store_stats = split_store.inspect_split_cache().await;
            assert_eq!(local_store_stats.len(), 0);
            assert!(split2.exists(std::path::Path::new("splitfile")).unwrap());
        }

        Ok(())
    }

    #[tokio::test]
    async fn test_eviction_and_fallback_to_remote() -> anyhow::Result<()> {
        let temp_dir = tempfile::tempdir()?;

        let split_cache_dir = tempdir()?;
        let split_cache = IndexingSplitCache::open(
            split_cache_dir.path().to_path_buf(),
            SplitStoreQuota::try_new(1, ByteSize::mb(1)).unwrap(),
        )
        .await?;

        let remote_storage = Arc::new(RamStorage::default());
        let split_store = IndexingSplitStore::new(remote_storage, Arc::new(split_cache));

        let split_id1 = Ulid::new().to_string();
        let split_payload1 = SplitPayloadBuilder::get_split_payload(&[], &[], &[5, 5, 5])?;
        let split_id2 = Ulid::new().to_string();
        let split_payload2 = SplitPayloadBuilder::get_split_payload(&[], &[], &[5, 5, 5, 5])?;

        {
            let split_path = temp_dir.path().join(&split_id1);
            fs::create_dir_all(&split_path).await?;
            fs::write(split_path.join("splitdatafile"), b"hello-world").await?;
            let split_metadata1 = create_test_split_metadata(&split_id1);
            split_store
                .store_split(
                    &split_metadata1,
                    &split_path,
                    Box::new(split_payload1.clone()),
                )
                .await?;
            assert!(!split_path.try_exists()?);
            assert!(
                split_cache_dir
                    .path()
                    .join(format!("{split_id1}.split"))
                    .try_exists()?
            );
            let split_cache_stats = split_store.inspect_split_cache().await;
            assert_eq!(split_cache_stats.len(), 1);
            assert_eq!(
                split_cache_stats.get(&split_id1).cloned(),
                Some(ByteSize(11))
            );
        }
        {
            let split_path = temp_dir.path().join(&split_id2);
            fs::create_dir_all(&split_path).await?;
            fs::write(split_path.join("splitdatafile2"), b"hello-world2").await?;
            let split_metadata2 = create_test_split_metadata(&split_id2);

            split_store
                .store_split(
                    &split_metadata2,
                    &split_path,
                    Box::new(split_payload2.clone()),
                )
                .await?;
            assert!(!split_path.try_exists()?);
            assert!(
                split_cache_dir
                    .path()
                    .join(format!("{split_id2}.split"))
                    .try_exists()?
            );
            let split_cache_stats = split_store.inspect_split_cache().await;
            assert_eq!(split_cache_stats.len(), 1);
            assert_eq!(
                split_cache_stats.get(&split_id2).cloned(),
                Some(ByteSize(12))
            );
        }
        let io_controls = IoControls::default();
        {
            // get from remote storage because split_id1 was evicted by split_id2
            let output = tempfile::tempdir()?;
            let _split1 = split_store
                .fetch_and_open_split(&split_id1, output.path(), &io_controls)
                .await?;
            assert_eq!(io_controls.num_bytes(), split_payload1.len());
        }
        {
            // get from cache
            let output = tempfile::tempdir()?;
            let _split2 = split_store
                .fetch_and_open_split(&split_id2, output.path(), &io_controls)
                .await?;
            // the number of downloaded by didn't change (still the size of split_payload1)
            assert_eq!(io_controls.num_bytes(), split_payload1.len());
        }
        {
            // get from remote because getting from cache removes the split from the cache
            let output = tempfile::tempdir()?;
            let _split2 = split_store
                .fetch_and_open_split(&split_id2, output.path(), &io_controls)
                .await?;
            assert_eq!(
                io_controls.num_bytes(),
                split_payload1.len() + split_payload2.len()
            );
        }

        Ok(())
    }
}


================================================
FILE: quickwit/quickwit-indexing/src/split_store/mod.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

mod indexing_split_cache;
mod indexing_split_store;
mod split_store_quota;

pub use indexing_split_cache::{IndexingSplitCache, get_tantivy_directory_from_split_bundle};
pub use indexing_split_store::IndexingSplitStore;
pub use split_store_quota::SplitStoreQuota;


================================================
FILE: quickwit/quickwit-indexing/src/split_store/split_store_quota.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use bytesize::ByteSize;
use quickwit_config::IndexerConfig;

/// A struct for keeping in check multiple SplitStore.
#[derive(Debug, Clone)]
pub struct SplitStoreQuota {
    /// Current number of splits in the cache.
    num_splits_in_cache: usize,
    /// Current size in bytes of splits in the cache.
    size_in_bytes_in_cache: ByteSize,
    /// Maximum number of files allowed in the cache.
    max_num_splits: usize,
    /// Maximum size in bytes allowed in the cache. 0 if max_num_splits=0.
    max_num_bytes: ByteSize,
}

impl Default for SplitStoreQuota {
    fn default() -> Self {
        Self {
            num_splits_in_cache: 0,
            size_in_bytes_in_cache: ByteSize::default(),
            max_num_bytes: IndexerConfig::default_split_store_max_num_bytes(),
            max_num_splits: IndexerConfig::default_split_store_max_num_splits(),
        }
    }
}

impl SplitStoreQuota {
    pub fn try_new(max_num_splits: usize, max_num_bytes: ByteSize) -> anyhow::Result<Self> {
        if max_num_splits == 0 && max_num_bytes.as_u64() > 0 {
            anyhow::bail!("max_num_bytes cannot be > 0 if max_num_splits is 0");
        }
        Ok(Self {
            max_num_splits,
            max_num_bytes,
            ..Default::default()
        })
    }

    /// Space quota that prevents any caching.
    pub fn no_caching() -> Self {
        Self::try_new(0, ByteSize::default()).unwrap()
    }

    pub fn can_fit_split(&self, split_size_in_bytes: ByteSize) -> bool {
        if self.num_splits_in_cache >= self.max_num_splits {
            return false;
        }
        if self.size_in_bytes_in_cache.as_u64() + split_size_in_bytes.as_u64()
            > self.max_num_bytes.as_u64()
        {
            return false;
        }
        true
    }

    pub fn add_split(&mut self, split_size_in_bytes: ByteSize) {
        self.num_splits_in_cache += 1;
        self.size_in_bytes_in_cache =
            ByteSize(self.size_in_bytes_in_cache.as_u64() + split_size_in_bytes.as_u64());
    }

    pub fn remove_split(&mut self, split_size_in_bytes: ByteSize) {
        self.size_in_bytes_in_cache =
            ByteSize(self.size_in_bytes_in_cache.as_u64() - split_size_in_bytes.as_u64());
        self.num_splits_in_cache -= 1;
    }

    pub fn max_num_bytes(&self) -> ByteSize {
        self.max_num_bytes
    }

    pub fn used_num_bytes(&self) -> ByteSize {
        self.size_in_bytes_in_cache
    }
}

#[cfg(test)]
mod tests {
    use bytesize::ByteSize;

    use crate::split_store::SplitStoreQuota;

    #[test]
    fn test_invalid_quota() {
        SplitStoreQuota::try_new(0, ByteSize(100)).unwrap_err();
    }

    #[test]
    fn test_split_store_quota_max_bytes_accepted() {
        let split_store_quota = SplitStoreQuota::try_new(3, ByteSize(100)).unwrap();
        assert!(split_store_quota.can_fit_split(ByteSize(100)));
    }

    #[test]
    fn test_split_store_quota_exceeding_bytes() {
        let split_store_quota = SplitStoreQuota::try_new(3, ByteSize(100)).unwrap();
        assert!(!split_store_quota.can_fit_split(ByteSize(101)));
    }

    #[test]
    fn test_split_store_quota_max_num_files_accepted() {
        let mut split_store_quota = SplitStoreQuota::try_new(2, ByteSize(100)).unwrap();
        split_store_quota.add_split(ByteSize(1));
        assert!(split_store_quota.can_fit_split(ByteSize(1)));
    }

    #[test]
    fn test_split_store_quota_exceeding_max_num_files() {
        let mut split_store_quota = SplitStoreQuota::try_new(2, ByteSize(100)).unwrap();
        split_store_quota.add_split(ByteSize(1));
        split_store_quota.add_split(ByteSize(1));
        assert!(!split_store_quota.can_fit_split(ByteSize(1)));
    }
}


================================================
FILE: quickwit/quickwit-indexing/src/test_utils.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::num::NonZeroUsize;
use std::str::FromStr;
use std::sync::Arc;
use std::sync::atomic::{AtomicUsize, Ordering};

use bytes::Bytes;
use quickwit_actors::{Mailbox, Universe};
use quickwit_cluster::{ChannelTransport, create_cluster_for_test};
use quickwit_common::pubsub::EventBroker;
use quickwit_common::rand::append_random_suffix;
use quickwit_common::uri::Uri;
use quickwit_config::{
    ConfigFormat, INGEST_API_SOURCE_ID, IndexConfig, IndexerConfig, IngestApiConfig,
    MetastoreConfigs, SourceConfig, SourceInputFormat, SourceParams, VecSourceParams,
    build_doc_mapper,
};
use quickwit_doc_mapper::DocMapper;
use quickwit_ingest::{IngesterPool, QUEUES_DIR_NAME, init_ingest_api};
use quickwit_metastore::{
    CreateIndexRequestExt, MetastoreResolver, Split, SplitMetadata, SplitState,
};
use quickwit_proto::metastore::{CreateIndexRequest, MetastoreService, MetastoreServiceClient};
use quickwit_proto::types::{IndexUid, NodeId, PipelineUid, SourceId};
use quickwit_storage::{Storage, StorageResolver};
use serde_json::Value as JsonValue;

use crate::actors::IndexingService;
use crate::models::{DetachIndexingPipeline, IndexingStatistics, SpawnPipeline};

/// Creates a Test environment.
///
/// It makes it easy to create a test index, perfect for unit testing.
/// The test index content is entirely in RAM and isolated,
/// but the construction of the index involves temporary file directory.
pub struct TestSandbox {
    node_id: NodeId,
    index_uid: IndexUid,
    source_id: SourceId,
    indexing_service: Mailbox<IndexingService>,
    doc_mapper: Arc<DocMapper>,
    metastore: MetastoreServiceClient,
    storage_resolver: StorageResolver,
    storage: Arc<dyn Storage>,
    add_docs_id: AtomicUsize,
    universe: Universe,
    _temp_dir: tempfile::TempDir,
}

const METASTORE_URI: &str = "ram://quickwit-test-indexes";

fn index_uri(index_id: &str) -> Uri {
    Uri::from_str(&format!("{METASTORE_URI}/{index_id}")).unwrap()
}

impl TestSandbox {
    /// Creates a new test environment.
    pub async fn create(
        index_id: &str,
        doc_mapping_yaml: &str,
        indexing_settings_yaml: &str,
        search_fields: &[&str],
    ) -> anyhow::Result<TestSandbox> {
        let node_id = NodeId::new(append_random_suffix("test-node"));
        let transport = ChannelTransport::default();
        let cluster = create_cluster_for_test(Vec::new(), &["indexer"], &transport, true)
            .await
            .unwrap();
        let index_uri = index_uri(index_id);
        let mut index_config = IndexConfig::for_test(index_id, index_uri.as_str());
        index_config.doc_mapping = ConfigFormat::Yaml.parse(doc_mapping_yaml.as_bytes())?;
        index_config.indexing_settings =
            ConfigFormat::Yaml.parse(indexing_settings_yaml.as_bytes())?;
        index_config.search_settings.default_search_fields = search_fields
            .iter()
            .map(|search_field| search_field.to_string())
            .collect();
        let source_config = SourceConfig::ingest_api_default();
        let storage_resolver = StorageResolver::for_test();
        let metastore_resolver =
            MetastoreResolver::configured(storage_resolver.clone(), &MetastoreConfigs::default());
        let metastore = metastore_resolver
            .resolve(&Uri::for_test(METASTORE_URI))
            .await?;
        let create_index_request = CreateIndexRequest::try_from_index_and_source_configs(
            &index_config,
            std::slice::from_ref(&source_config),
        )?;
        let index_uid: IndexUid = metastore
            .create_index(create_index_request)
            .await?
            .index_uid()
            .clone();
        let doc_mapper =
            build_doc_mapper(&index_config.doc_mapping, &index_config.search_settings)?;
        let temp_dir = tempfile::tempdir()?;
        let indexer_config = IndexerConfig::for_test()?;
        let num_blocking_threads = 1;
        let storage = storage_resolver.resolve(&index_uri).await?;
        let universe = Universe::with_accelerated_time();
        let merge_scheduler_mailbox = universe.get_or_spawn_one();
        let queues_dir_path = temp_dir.path().join(QUEUES_DIR_NAME);
        let ingest_api_service =
            init_ingest_api(&universe, &queues_dir_path, &IngestApiConfig::default()).await?;
        let indexing_service_actor = IndexingService::new(
            node_id.clone(),
            temp_dir.path().to_path_buf(),
            indexer_config,
            num_blocking_threads,
            cluster,
            metastore.clone(),
            Some(ingest_api_service),
            merge_scheduler_mailbox,
            IngesterPool::default(),
            storage_resolver.clone(),
            EventBroker::default(),
        )
        .await?;
        let (indexing_service, _indexing_service_handle) =
            universe.spawn_builder().spawn(indexing_service_actor);
        Ok(TestSandbox {
            node_id,
            index_uid,
            source_id: INGEST_API_SOURCE_ID.to_string(),
            indexing_service,
            doc_mapper,
            metastore,
            storage_resolver,
            storage,
            add_docs_id: AtomicUsize::default(),
            universe,
            _temp_dir: temp_dir,
        })
    }

    /// Adds documents and waits for them to be indexed (creating a separate split).
    ///
    /// The documents are expected to be `JsonValue`.
    /// They can be created using the `serde_json::json!` macro.
    pub async fn add_documents<I>(&self, json_docs: I) -> anyhow::Result<IndexingStatistics>
    where
        I: IntoIterator<Item = JsonValue> + 'static,
        I::IntoIter: Send,
    {
        let docs: Vec<Bytes> = json_docs
            .into_iter()
            .map(|json_doc| Bytes::from(json_doc.to_string()))
            .collect();
        let add_docs_id = self.add_docs_id.fetch_add(1, Ordering::SeqCst);
        let source_config = SourceConfig {
            source_id: INGEST_API_SOURCE_ID.to_string(),
            num_pipelines: NonZeroUsize::MIN,
            enabled: true,
            source_params: SourceParams::Vec(VecSourceParams {
                docs,
                batch_num_docs: 10,
                partition: format!("add-docs-{add_docs_id}"),
            }),
            transform_config: None,
            input_format: SourceInputFormat::Json,
        };
        let pipeline_id = self
            .indexing_service
            .ask_for_res(SpawnPipeline {
                index_id: self.index_uid.index_id.to_string(),
                source_config,
                pipeline_uid: PipelineUid::for_test(0u128),
            })
            .await?;
        let pipeline_handle = self
            .indexing_service
            .ask_for_res(DetachIndexingPipeline {
                pipeline_id: pipeline_id.clone(),
            })
            .await?;
        let (_pipeline_exit_status, pipeline_statistics) = pipeline_handle.join().await;
        Ok(pipeline_statistics)
    }

    /// Returns the metastore of the TestSandbox.
    ///
    /// The metastore is a file-backed metastore.
    /// Its data can be found via the `storage` in
    /// the `ram://quickwit-test-indexes` directory.
    pub fn metastore(&self) -> MetastoreServiceClient {
        self.metastore.clone()
    }

    /// Returns the storage of the TestSandbox.
    pub fn storage(&self) -> Arc<dyn Storage> {
        self.storage.clone()
    }

    /// Returns the storage resolver of the TestSandbox.
    pub fn storage_resolver(&self) -> StorageResolver {
        self.storage_resolver.clone()
    }

    /// Returns the doc mapper of the TestSandbox.
    pub fn doc_mapper(&self) -> Arc<DocMapper> {
        self.doc_mapper.clone()
    }

    /// Returns the node ID.
    pub fn node_id(&self) -> NodeId {
        self.node_id.clone()
    }

    /// Returns the index UID.
    pub fn index_uid(&self) -> IndexUid {
        self.index_uid.clone()
    }

    /// Returns the source ID.
    pub fn source_id(&self) -> SourceId {
        self.source_id.clone()
    }

    /// Returns the underlying universe.
    pub fn universe(&self) -> &Universe {
        &self.universe
    }

    /// Gracefully quits all registered actors in the underlying universe and asserts that none of
    /// them panicked.
    ///
    /// This is useful for testing purposes to detect failed asserts in actors
    #[cfg(any(test, feature = "testsuite"))]
    pub async fn assert_quit(self) {
        self.universe.assert_quit().await
    }
}

/// Mock split builder.
pub struct MockSplitBuilder {
    split_metadata: SplitMetadata,
}

impl MockSplitBuilder {
    pub fn new(split_id: &str) -> Self {
        Self {
            split_metadata: mock_split_meta(split_id, &IndexUid::for_test("test-index", 0)),
        }
    }

    pub fn with_index_uid(mut self, index_uid: &IndexUid) -> Self {
        self.split_metadata.index_uid = index_uid.clone();
        self
    }

    pub fn build(self) -> Split {
        Split {
            split_state: SplitState::Published,
            split_metadata: self.split_metadata,
            update_timestamp: 0,
            publish_timestamp: None,
        }
    }
}

/// Mock split helper.
pub fn mock_split(split_id: &str) -> Split {
    MockSplitBuilder::new(split_id).build()
}

/// Mock split meta helper.
pub fn mock_split_meta(split_id: &str, index_uid: &IndexUid) -> SplitMetadata {
    SplitMetadata {
        index_uid: index_uid.clone(),
        split_id: split_id.to_string(),
        partition_id: 13u64,
        num_docs: if split_id == "split1" { 1_000_000 } else { 10 },
        uncompressed_docs_size_in_bytes: 256,
        time_range: Some(121000..=130198),
        create_timestamp: 0,
        footer_offsets: 700..800,
        ..Default::default()
    }
}

#[cfg(test)]
mod tests {
    use quickwit_metastore::{ListSplitsRequestExt, MetastoreServiceStreamSplitsExt};
    use quickwit_proto::metastore::{ListSplitsRequest, MetastoreService};

    use super::TestSandbox;

    #[tokio::test]
    async fn test_test_sandbox() -> anyhow::Result<()> {
        quickwit_common::setup_logging_for_tests();
        let doc_mapping_yaml = r#"
            field_mappings:
              - name: title
                type: text
              - name: body
                type: text
              - name: url
                type: text
        "#;
        let test_sandbox =
            TestSandbox::create("test_index", doc_mapping_yaml, "{}", &["body"]).await?;
        let statistics = test_sandbox.add_documents(vec![
            serde_json::json!({"title": "Hurricane Fay", "body": "...", "url": "http://hurricane-fay"}),
            serde_json::json!({"title": "Ganimede", "body": "...", "url": "http://ganimede"}),
        ]).await?;
        assert_eq!(statistics.num_uploaded_splits, 1);
        let metastore = test_sandbox.metastore();
        {
            let splits = metastore
                .list_splits(
                    ListSplitsRequest::try_from_index_uid(test_sandbox.index_uid()).unwrap(),
                )
                .await?
                .collect_splits()
                .await?;
            assert_eq!(splits.len(), 1);
            test_sandbox.add_documents(vec![
            serde_json::json!({"title": "Byzantine-Ottoman wars", "body": "...", "url": "http://biz-ottoman"}),
        ]).await?;
        }
        {
            let splits = metastore
                .list_splits(
                    ListSplitsRequest::try_from_index_uid(test_sandbox.index_uid()).unwrap(),
                )
                .await?
                .collect_splits()
                .await?;
            assert_eq!(splits.len(), 2);
        }
        test_sandbox.assert_quit().await;
        Ok(())
    }
}


================================================
FILE: quickwit/quickwit-ingest/Cargo.toml
================================================
[package]
name = "quickwit-ingest"
description = "Native distributed and replicated ingestion engine"

version.workspace = true
edition.workspace = true
homepage.workspace = true
documentation.workspace = true
repository.workspace = true
authors.workspace = true
license.workspace = true

[dependencies]
anyhow = { workspace = true }
async-trait = { workspace = true }
bytes = { workspace = true }
bytesize = { workspace = true }
fail = { workspace = true, optional = true }
futures = { workspace = true }
http = { workspace = true }
itertools = { workspace = true }
mockall = { workspace = true, optional = true }
mrecordlog = { workspace = true }
once_cell = { workspace = true }
prost = { workspace = true }
rand = { workspace = true }
serde = { workspace = true }
serde_json = { workspace = true }
serde_json_borrow = { workspace = true }
thiserror = { workspace = true }
tokio = { workspace = true }
tonic = { workspace = true }
tonic-prost = { workspace = true }
tower = { workspace = true }
tracing = { workspace = true }
ulid = { workspace = true }
utoipa = { workspace = true }

quickwit-actors = { workspace = true }
quickwit-cluster = { workspace = true }
quickwit-common = { workspace = true, features = ["testsuite"] }
quickwit-config = { workspace = true }
quickwit-doc-mapper = { workspace = true, features = ["testsuite"] }
quickwit-proto = { workspace = true }

[dev-dependencies]
mockall = { workspace = true }
rand = { workspace = true }
rand_distr = { workspace = true }
tempfile = { workspace = true }
tokio = { workspace = true, features = ["test-util"]}

quickwit-actors = { workspace = true, features = ["testsuite"] }
quickwit-cluster = { workspace = true, features = ["testsuite"] }
quickwit-common = { workspace = true, features = ["testsuite"] }
quickwit-proto = { workspace = true, features = ["testsuite"] }

[build-dependencies]
quickwit-codegen = { workspace = true }

[features]
failpoints = ["fail/failpoints"]
no-failpoints = []
testsuite = ["mockall"]


================================================
FILE: quickwit/quickwit-ingest/build.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use quickwit_codegen::{Codegen, ProstConfig};

fn main() {
    // Legacy ingest codegen
    let mut prost_config = ProstConfig::default();
    prost_config.bytes(["DocBatch.doc_buffer"]);

    Codegen::builder()
        .with_protos(&["src/ingest_service.proto"])
        .with_output_dir("src/codegen/")
        .with_result_type_path("crate::Result")
        .with_error_type_path("crate::IngestServiceError")
        .with_prost_config(prost_config)
        .generate_rpc_name_impls()
        .run()
        .unwrap();
}


================================================
FILE: quickwit/quickwit-ingest/src/codegen/ingest_service.rs
================================================
// This file is @generated by prost-build.
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct QueueExistsRequest {
    #[prost(string, tag = "1")]
    pub queue_id: ::prost::alloc::string::String,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct CreateQueueRequest {
    #[prost(string, tag = "1")]
    pub queue_id: ::prost::alloc::string::String,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct CreateQueueIfNotExistsRequest {
    #[prost(string, tag = "1")]
    pub queue_id: ::prost::alloc::string::String,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct CreateQueueIfNotExistsResponse {
    #[prost(string, tag = "1")]
    pub queue_id: ::prost::alloc::string::String,
    #[prost(bool, tag = "2")]
    pub created: bool,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct DropQueueRequest {
    #[prost(string, tag = "1")]
    pub queue_id: ::prost::alloc::string::String,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct IngestRequest {
    #[prost(message, repeated, tag = "1")]
    pub doc_batches: ::prost::alloc::vec::Vec<DocBatch>,
    #[prost(enumeration = "CommitType", tag = "2")]
    pub commit: i32,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, Copy, PartialEq, Eq, Hash, ::prost::Message)]
pub struct IngestResponse {
    #[prost(uint64, tag = "1")]
    pub num_docs_for_processing: u64,
}
/// Fetch messages with position strictly after `start_after`.
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct FetchRequest {
    #[prost(string, tag = "1")]
    pub index_id: ::prost::alloc::string::String,
    #[prost(uint64, optional, tag = "2")]
    pub start_after: ::core::option::Option<u64>,
    #[prost(uint64, optional, tag = "3")]
    pub num_bytes_limit: ::core::option::Option<u64>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct FetchResponse {
    #[prost(uint64, optional, tag = "1")]
    pub first_position: ::core::option::Option<u64>,
    #[prost(message, optional, tag = "2")]
    pub doc_batch: ::core::option::Option<DocBatch>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct DocBatch {
    #[prost(string, tag = "1")]
    pub index_id: ::prost::alloc::string::String,
    #[prost(bytes = "bytes", tag = "2")]
    #[schema(value_type = String, format = Binary)]
    pub doc_buffer: ::prost::bytes::Bytes,
    #[prost(uint32, repeated, tag = "3")]
    pub doc_lengths: ::prost::alloc::vec::Vec<u32>,
}
/// Suggest to truncate the queue.
///
/// This function allows the queue to remove all records up to and
/// including `up_to_offset_included`.
///
/// The role of this truncation is to release memory and disk space.
///
/// There are no guarantees that the record will effectively be removed.
/// Nothing might happen, or the truncation might be partial.
///
/// In other words, truncating from a position, and fetching records starting
/// earlier than this position can yield undefined result:
/// the truncated records may or may not be returned.
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct SuggestTruncateRequest {
    #[prost(string, tag = "1")]
    pub index_id: ::prost::alloc::string::String,
    #[prost(uint64, tag = "2")]
    pub up_to_position_included: u64,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct TailRequest {
    #[prost(string, tag = "1")]
    pub index_id: ::prost::alloc::string::String,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, Copy, PartialEq, Eq, Hash, ::prost::Message)]
pub struct ListQueuesRequest {}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct ListQueuesResponse {
    #[prost(string, repeated, tag = "1")]
    pub queues: ::prost::alloc::vec::Vec<::prost::alloc::string::String>,
}
/// Specifies if the ingest request should block waiting for the records to be committed.
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[serde(rename_all = "snake_case")]
#[derive(Clone, Copy, Debug, PartialEq, Eq, Hash, PartialOrd, Ord, ::prost::Enumeration)]
#[repr(i32)]
pub enum CommitType {
    /// The request doesn't wait for commit
    Auto = 0,
    /// The request waits for the next scheduled commit to finish.
    WaitFor = 1,
    /// The request forces an immediate commit after the last document in the batch and waits for
    /// it to finish.
    Force = 2,
}
impl CommitType {
    /// String value of the enum field names used in the ProtoBuf definition.
    ///
    /// The values are not transformed in any way and thus are considered stable
    /// (if the ProtoBuf definition does not change) and safe for programmatic use.
    pub fn as_str_name(&self) -> &'static str {
        match self {
            Self::Auto => "Auto",
            Self::WaitFor => "WaitFor",
            Self::Force => "Force",
        }
    }
    /// Creates an enum from field names used in the ProtoBuf definition.
    pub fn from_str_name(value: &str) -> ::core::option::Option<Self> {
        match value {
            "Auto" => Some(Self::Auto),
            "WaitFor" => Some(Self::WaitFor),
            "Force" => Some(Self::Force),
            _ => None,
        }
    }
}
/// BEGIN quickwit-codegen
#[allow(unused_imports)]
use std::str::FromStr;
use tower::{Layer, Service, ServiceExt};
use quickwit_common::tower::RpcName;
impl RpcName for IngestRequest {
    fn rpc_name() -> &'static str {
        "ingest"
    }
}
impl RpcName for FetchRequest {
    fn rpc_name() -> &'static str {
        "fetch"
    }
}
impl RpcName for TailRequest {
    fn rpc_name() -> &'static str {
        "tail"
    }
}
#[cfg_attr(any(test, feature = "testsuite"), mockall::automock)]
#[async_trait::async_trait]
pub trait IngestService: std::fmt::Debug + Send + Sync + 'static {
    ///Ingests document in a given queue.
    ///
    ///Upon any kind of error, the client should
    ///
    ///* retry to get at least once delivery.
    ///* not retry to get at most once delivery.
    ///
    ///Exactly once delivery is not supported yet.
    async fn ingest(&self, request: IngestRequest) -> crate::Result<IngestResponse>;
    ///Fetches record from a given queue.
    ///
    ///Records are returned in order.
    ///
    ///The returned `FetchResponse` object is meant to be read with the
    ///`crate::iter_records` function.
    ///
    ///Fetching does not necessarily return all of the available records.
    ///If returning all records would exceed `FETCH_PAYLOAD_LIMIT` (2MB),
    ///the response will be partial.
    async fn fetch(&self, request: FetchRequest) -> crate::Result<FetchResponse>;
    ///Returns a batch containing the last records.
    ///
    ///It returns the last documents, from the newest
    ///to the oldest, and stops as soon as `FETCH_PAYLOAD_LIMIT` (2MB)
    ///is exceeded.
    async fn tail(&self, request: TailRequest) -> crate::Result<FetchResponse>;
}
#[derive(Debug, Clone)]
pub struct IngestServiceClient {
    inner: InnerIngestServiceClient,
}
#[derive(Debug, Clone)]
struct InnerIngestServiceClient(std::sync::Arc<dyn IngestService>);
impl IngestServiceClient {
    pub fn new<T>(instance: T) -> Self
    where
        T: IngestService,
    {
        #[cfg(any(test, feature = "testsuite"))]
        assert!(
            std::any::TypeId::of:: < T > () != std::any::TypeId::of:: < MockIngestService
            > (),
            "`MockIngestService` must be wrapped in a `MockIngestServiceWrapper`: use `IngestServiceClient::from_mock(mock)` to instantiate the client"
        );
        Self {
            inner: InnerIngestServiceClient(std::sync::Arc::new(instance)),
        }
    }
    pub fn as_grpc_service(
        &self,
        max_message_size: bytesize::ByteSize,
    ) -> ingest_service_grpc_server::IngestServiceGrpcServer<
        IngestServiceGrpcServerAdapter,
    > {
        let adapter = IngestServiceGrpcServerAdapter::new(self.clone());
        ingest_service_grpc_server::IngestServiceGrpcServer::new(adapter)
            .accept_compressed(tonic::codec::CompressionEncoding::Gzip)
            .accept_compressed(tonic::codec::CompressionEncoding::Zstd)
            .send_compressed(tonic::codec::CompressionEncoding::Gzip)
            .send_compressed(tonic::codec::CompressionEncoding::Zstd)
            .max_decoding_message_size(max_message_size.0 as usize)
            .max_encoding_message_size(max_message_size.0 as usize)
    }
    pub fn from_channel(
        addr: std::net::SocketAddr,
        channel: tonic::transport::Channel,
        max_message_size: bytesize::ByteSize,
        compression_encoding_opt: Option<tonic::codec::CompressionEncoding>,
    ) -> Self {
        let (_, connection_keys_watcher) = tokio::sync::watch::channel(
            std::collections::HashSet::from_iter([addr]),
        );
        let mut client = ingest_service_grpc_client::IngestServiceGrpcClient::new(
                channel,
            )
            .max_decoding_message_size(max_message_size.0 as usize)
            .max_encoding_message_size(max_message_size.0 as usize);
        if let Some(compression_encoding) = compression_encoding_opt {
            client = client
                .accept_compressed(compression_encoding)
                .send_compressed(compression_encoding);
        }
        let adapter = IngestServiceGrpcClientAdapter::new(
            client,
            connection_keys_watcher,
        );
        Self::new(adapter)
    }
    pub fn from_balance_channel(
        balance_channel: quickwit_common::tower::BalanceChannel<std::net::SocketAddr>,
        max_message_size: bytesize::ByteSize,
        compression_encoding_opt: Option<tonic::codec::CompressionEncoding>,
    ) -> IngestServiceClient {
        let connection_keys_watcher = balance_channel.connection_keys_watcher();
        let mut client = ingest_service_grpc_client::IngestServiceGrpcClient::new(
                balance_channel,
            )
            .max_decoding_message_size(max_message_size.0 as usize)
            .max_encoding_message_size(max_message_size.0 as usize);
        if let Some(compression_encoding) = compression_encoding_opt {
            client = client
                .accept_compressed(compression_encoding)
                .send_compressed(compression_encoding);
        }
        let adapter = IngestServiceGrpcClientAdapter::new(
            client,
            connection_keys_watcher,
        );
        Self::new(adapter)
    }
    pub fn from_mailbox<A>(mailbox: quickwit_actors::Mailbox<A>) -> Self
    where
        A: quickwit_actors::Actor + std::fmt::Debug + Send + 'static,
        IngestServiceMailbox<A>: IngestService,
    {
        IngestServiceClient::new(IngestServiceMailbox::new(mailbox))
    }
    pub fn tower() -> IngestServiceTowerLayerStack {
        IngestServiceTowerLayerStack::default()
    }
    #[cfg(any(test, feature = "testsuite"))]
    pub fn from_mock(mock: MockIngestService) -> Self {
        let mock_wrapper = mock_ingest_service::MockIngestServiceWrapper {
            inner: tokio::sync::Mutex::new(mock),
        };
        Self::new(mock_wrapper)
    }
    #[cfg(any(test, feature = "testsuite"))]
    pub fn mocked() -> Self {
        Self::from_mock(MockIngestService::new())
    }
}
#[async_trait::async_trait]
impl IngestService for IngestServiceClient {
    async fn ingest(&self, request: IngestRequest) -> crate::Result<IngestResponse> {
        self.inner.0.ingest(request).await
    }
    async fn fetch(&self, request: FetchRequest) -> crate::Result<FetchResponse> {
        self.inner.0.fetch(request).await
    }
    async fn tail(&self, request: TailRequest) -> crate::Result<FetchResponse> {
        self.inner.0.tail(request).await
    }
}
#[cfg(any(test, feature = "testsuite"))]
pub mod mock_ingest_service {
    use super::*;
    #[derive(Debug)]
    pub struct MockIngestServiceWrapper {
        pub(super) inner: tokio::sync::Mutex<MockIngestService>,
    }
    #[async_trait::async_trait]
    impl IngestService for MockIngestServiceWrapper {
        async fn ingest(
            &self,
            request: super::IngestRequest,
        ) -> crate::Result<super::IngestResponse> {
            self.inner.lock().await.ingest(request).await
        }
        async fn fetch(
            &self,
            request: super::FetchRequest,
        ) -> crate::Result<super::FetchResponse> {
            self.inner.lock().await.fetch(request).await
        }
        async fn tail(
            &self,
            request: super::TailRequest,
        ) -> crate::Result<super::FetchResponse> {
            self.inner.lock().await.tail(request).await
        }
    }
}
pub type BoxFuture<T, E> = std::pin::Pin<
    Box<dyn std::future::Future<Output = Result<T, E>> + Send + 'static>,
>;
impl tower::Service<IngestRequest> for InnerIngestServiceClient {
    type Response = IngestResponse;
    type Error = crate::IngestServiceError;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, request: IngestRequest) -> Self::Future {
        let svc = self.clone();
        let fut = async move { svc.0.ingest(request).await };
        Box::pin(fut)
    }
}
impl tower::Service<FetchRequest> for InnerIngestServiceClient {
    type Response = FetchResponse;
    type Error = crate::IngestServiceError;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, request: FetchRequest) -> Self::Future {
        let svc = self.clone();
        let fut = async move { svc.0.fetch(request).await };
        Box::pin(fut)
    }
}
impl tower::Service<TailRequest> for InnerIngestServiceClient {
    type Response = FetchResponse;
    type Error = crate::IngestServiceError;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, request: TailRequest) -> Self::Future {
        let svc = self.clone();
        let fut = async move { svc.0.tail(request).await };
        Box::pin(fut)
    }
}
/// A tower service stack is a set of tower services.
#[derive(Debug)]
struct IngestServiceTowerServiceStack {
    #[allow(dead_code)]
    inner: InnerIngestServiceClient,
    ingest_svc: quickwit_common::tower::BoxService<
        IngestRequest,
        IngestResponse,
        crate::IngestServiceError,
    >,
    fetch_svc: quickwit_common::tower::BoxService<
        FetchRequest,
        FetchResponse,
        crate::IngestServiceError,
    >,
    tail_svc: quickwit_common::tower::BoxService<
        TailRequest,
        FetchResponse,
        crate::IngestServiceError,
    >,
}
#[async_trait::async_trait]
impl IngestService for IngestServiceTowerServiceStack {
    async fn ingest(&self, request: IngestRequest) -> crate::Result<IngestResponse> {
        self.ingest_svc.clone().ready().await?.call(request).await
    }
    async fn fetch(&self, request: FetchRequest) -> crate::Result<FetchResponse> {
        self.fetch_svc.clone().ready().await?.call(request).await
    }
    async fn tail(&self, request: TailRequest) -> crate::Result<FetchResponse> {
        self.tail_svc.clone().ready().await?.call(request).await
    }
}
type IngestLayer = quickwit_common::tower::BoxLayer<
    quickwit_common::tower::BoxService<
        IngestRequest,
        IngestResponse,
        crate::IngestServiceError,
    >,
    IngestRequest,
    IngestResponse,
    crate::IngestServiceError,
>;
type FetchLayer = quickwit_common::tower::BoxLayer<
    quickwit_common::tower::BoxService<
        FetchRequest,
        FetchResponse,
        crate::IngestServiceError,
    >,
    FetchRequest,
    FetchResponse,
    crate::IngestServiceError,
>;
type TailLayer = quickwit_common::tower::BoxLayer<
    quickwit_common::tower::BoxService<
        TailRequest,
        FetchResponse,
        crate::IngestServiceError,
    >,
    TailRequest,
    FetchResponse,
    crate::IngestServiceError,
>;
#[derive(Debug, Default)]
pub struct IngestServiceTowerLayerStack {
    ingest_layers: Vec<IngestLayer>,
    fetch_layers: Vec<FetchLayer>,
    tail_layers: Vec<TailLayer>,
}
impl IngestServiceTowerLayerStack {
    pub fn stack_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    IngestRequest,
                    IngestResponse,
                    crate::IngestServiceError,
                >,
            > + Clone + Send + Sync + 'static,
        <L as tower::Layer<
            quickwit_common::tower::BoxService<
                IngestRequest,
                IngestResponse,
                crate::IngestServiceError,
            >,
        >>::Service: tower::Service<
                IngestRequest,
                Response = IngestResponse,
                Error = crate::IngestServiceError,
            > + Clone + Send + Sync + 'static,
        <<L as tower::Layer<
            quickwit_common::tower::BoxService<
                IngestRequest,
                IngestResponse,
                crate::IngestServiceError,
            >,
        >>::Service as tower::Service<IngestRequest>>::Future: Send + 'static,
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    FetchRequest,
                    FetchResponse,
                    crate::IngestServiceError,
                >,
            > + Clone + Send + Sync + 'static,
        <L as tower::Layer<
            quickwit_common::tower::BoxService<
                FetchRequest,
                FetchResponse,
                crate::IngestServiceError,
            >,
        >>::Service: tower::Service<
                FetchRequest,
                Response = FetchResponse,
                Error = crate::IngestServiceError,
            > + Clone + Send + Sync + 'static,
        <<L as tower::Layer<
            quickwit_common::tower::BoxService<
                FetchRequest,
                FetchResponse,
                crate::IngestServiceError,
            >,
        >>::Service as tower::Service<FetchRequest>>::Future: Send + 'static,
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    TailRequest,
                    FetchResponse,
                    crate::IngestServiceError,
                >,
            > + Clone + Send + Sync + 'static,
        <L as tower::Layer<
            quickwit_common::tower::BoxService<
                TailRequest,
                FetchResponse,
                crate::IngestServiceError,
            >,
        >>::Service: tower::Service<
                TailRequest,
                Response = FetchResponse,
                Error = crate::IngestServiceError,
            > + Clone + Send + Sync + 'static,
        <<L as tower::Layer<
            quickwit_common::tower::BoxService<
                TailRequest,
                FetchResponse,
                crate::IngestServiceError,
            >,
        >>::Service as tower::Service<TailRequest>>::Future: Send + 'static,
    {
        self.ingest_layers.push(quickwit_common::tower::BoxLayer::new(layer.clone()));
        self.fetch_layers.push(quickwit_common::tower::BoxLayer::new(layer.clone()));
        self.tail_layers.push(quickwit_common::tower::BoxLayer::new(layer.clone()));
        self
    }
    pub fn stack_ingest_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    IngestRequest,
                    IngestResponse,
                    crate::IngestServiceError,
                >,
            > + Send + Sync + 'static,
        L::Service: tower::Service<
                IngestRequest,
                Response = IngestResponse,
                Error = crate::IngestServiceError,
            > + Clone + Send + Sync + 'static,
        <L::Service as tower::Service<IngestRequest>>::Future: Send + 'static,
    {
        self.ingest_layers.push(quickwit_common::tower::BoxLayer::new(layer));
        self
    }
    pub fn stack_fetch_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    FetchRequest,
                    FetchResponse,
                    crate::IngestServiceError,
                >,
            > + Send + Sync + 'static,
        L::Service: tower::Service<
                FetchRequest,
                Response = FetchResponse,
                Error = crate::IngestServiceError,
            > + Clone + Send + Sync + 'static,
        <L::Service as tower::Service<FetchRequest>>::Future: Send + 'static,
    {
        self.fetch_layers.push(quickwit_common::tower::BoxLayer::new(layer));
        self
    }
    pub fn stack_tail_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    TailRequest,
                    FetchResponse,
                    crate::IngestServiceError,
                >,
            > + Send + Sync + 'static,
        L::Service: tower::Service<
                TailRequest,
                Response = FetchResponse,
                Error = crate::IngestServiceError,
            > + Clone + Send + Sync + 'static,
        <L::Service as tower::Service<TailRequest>>::Future: Send + 'static,
    {
        self.tail_layers.push(quickwit_common::tower::BoxLayer::new(layer));
        self
    }
    pub fn build<T>(self, instance: T) -> IngestServiceClient
    where
        T: IngestService,
    {
        let inner_client = InnerIngestServiceClient(std::sync::Arc::new(instance));
        self.build_from_inner_client(inner_client)
    }
    pub fn build_from_channel(
        self,
        addr: std::net::SocketAddr,
        channel: tonic::transport::Channel,
        max_message_size: bytesize::ByteSize,
        compression_encoding_opt: Option<tonic::codec::CompressionEncoding>,
    ) -> IngestServiceClient {
        let client = IngestServiceClient::from_channel(
            addr,
            channel,
            max_message_size,
            compression_encoding_opt,
        );
        let inner_client = client.inner;
        self.build_from_inner_client(inner_client)
    }
    pub fn build_from_balance_channel(
        self,
        balance_channel: quickwit_common::tower::BalanceChannel<std::net::SocketAddr>,
        max_message_size: bytesize::ByteSize,
        compression_encoding_opt: Option<tonic::codec::CompressionEncoding>,
    ) -> IngestServiceClient {
        let client = IngestServiceClient::from_balance_channel(
            balance_channel,
            max_message_size,
            compression_encoding_opt,
        );
        let inner_client = client.inner;
        self.build_from_inner_client(inner_client)
    }
    pub fn build_from_mailbox<A>(
        self,
        mailbox: quickwit_actors::Mailbox<A>,
    ) -> IngestServiceClient
    where
        A: quickwit_actors::Actor + std::fmt::Debug + Send + 'static,
        IngestServiceMailbox<A>: IngestService,
    {
        let inner_client = InnerIngestServiceClient(
            std::sync::Arc::new(IngestServiceMailbox::new(mailbox)),
        );
        self.build_from_inner_client(inner_client)
    }
    #[cfg(any(test, feature = "testsuite"))]
    pub fn build_from_mock(self, mock: MockIngestService) -> IngestServiceClient {
        let client = IngestServiceClient::from_mock(mock);
        let inner_client = client.inner;
        self.build_from_inner_client(inner_client)
    }
    fn build_from_inner_client(
        self,
        inner_client: InnerIngestServiceClient,
    ) -> IngestServiceClient {
        let ingest_svc = self
            .ingest_layers
            .into_iter()
            .rev()
            .fold(
                quickwit_common::tower::BoxService::new(inner_client.clone()),
                |svc, layer| layer.layer(svc),
            );
        let fetch_svc = self
            .fetch_layers
            .into_iter()
            .rev()
            .fold(
                quickwit_common::tower::BoxService::new(inner_client.clone()),
                |svc, layer| layer.layer(svc),
            );
        let tail_svc = self
            .tail_layers
            .into_iter()
            .rev()
            .fold(
                quickwit_common::tower::BoxService::new(inner_client.clone()),
                |svc, layer| layer.layer(svc),
            );
        let tower_svc_stack = IngestServiceTowerServiceStack {
            inner: inner_client,
            ingest_svc,
            fetch_svc,
            tail_svc,
        };
        IngestServiceClient::new(tower_svc_stack)
    }
}
#[derive(Debug, Clone)]
struct MailboxAdapter<A: quickwit_actors::Actor, E> {
    inner: quickwit_actors::Mailbox<A>,
    phantom: std::marker::PhantomData<E>,
}
impl<A, E> std::ops::Deref for MailboxAdapter<A, E>
where
    A: quickwit_actors::Actor,
{
    type Target = quickwit_actors::Mailbox<A>;
    fn deref(&self) -> &Self::Target {
        &self.inner
    }
}
#[derive(Debug)]
pub struct IngestServiceMailbox<A: quickwit_actors::Actor> {
    inner: MailboxAdapter<A, crate::IngestServiceError>,
}
impl<A: quickwit_actors::Actor> IngestServiceMailbox<A> {
    pub fn new(instance: quickwit_actors::Mailbox<A>) -> Self {
        let inner = MailboxAdapter {
            inner: instance,
            phantom: std::marker::PhantomData,
        };
        Self { inner }
    }
}
impl<A: quickwit_actors::Actor> Clone for IngestServiceMailbox<A> {
    fn clone(&self) -> Self {
        let inner = MailboxAdapter {
            inner: self.inner.clone(),
            phantom: std::marker::PhantomData,
        };
        Self { inner }
    }
}
impl<A, M, T, E> tower::Service<M> for IngestServiceMailbox<A>
where
    A: quickwit_actors::Actor
        + quickwit_actors::DeferableReplyHandler<M, Reply = Result<T, E>> + Send
        + 'static,
    M: std::fmt::Debug + Send + 'static,
    T: Send + 'static,
    E: std::fmt::Debug + Send + 'static,
    crate::IngestServiceError: From<quickwit_actors::AskError<E>>,
{
    type Response = T;
    type Error = crate::IngestServiceError;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        //! This does not work with balance middlewares such as `tower::balance::pool::Pool` because
        //! this always returns `Poll::Ready`. The fix is to acquire a permit from the
        //! mailbox in `poll_ready` and consume it in `call`.
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, message: M) -> Self::Future {
        let mailbox = self.inner.clone();
        let fut = async move {
            mailbox.ask_for_res(message).await.map_err(|error| error.into())
        };
        Box::pin(fut)
    }
}
#[async_trait::async_trait]
impl<A> IngestService for IngestServiceMailbox<A>
where
    A: quickwit_actors::Actor + std::fmt::Debug,
    IngestServiceMailbox<
        A,
    >: tower::Service<
            IngestRequest,
            Response = IngestResponse,
            Error = crate::IngestServiceError,
            Future = BoxFuture<IngestResponse, crate::IngestServiceError>,
        >
        + tower::Service<
            FetchRequest,
            Response = FetchResponse,
            Error = crate::IngestServiceError,
            Future = BoxFuture<FetchResponse, crate::IngestServiceError>,
        >
        + tower::Service<
            TailRequest,
            Response = FetchResponse,
            Error = crate::IngestServiceError,
            Future = BoxFuture<FetchResponse, crate::IngestServiceError>,
        >,
{
    async fn ingest(&self, request: IngestRequest) -> crate::Result<IngestResponse> {
        self.clone().call(request).await
    }
    async fn fetch(&self, request: FetchRequest) -> crate::Result<FetchResponse> {
        self.clone().call(request).await
    }
    async fn tail(&self, request: TailRequest) -> crate::Result<FetchResponse> {
        self.clone().call(request).await
    }
}
#[derive(Debug, Clone)]
pub struct IngestServiceGrpcClientAdapter<T> {
    inner: T,
    #[allow(dead_code)]
    connection_addrs_rx: tokio::sync::watch::Receiver<
        std::collections::HashSet<std::net::SocketAddr>,
    >,
}
impl<T> IngestServiceGrpcClientAdapter<T> {
    pub fn new(
        instance: T,
        connection_addrs_rx: tokio::sync::watch::Receiver<
            std::collections::HashSet<std::net::SocketAddr>,
        >,
    ) -> Self {
        Self {
            inner: instance,
            connection_addrs_rx,
        }
    }
}
#[async_trait::async_trait]
impl<T> IngestService
for IngestServiceGrpcClientAdapter<
    ingest_service_grpc_client::IngestServiceGrpcClient<T>,
>
where
    T: tonic::client::GrpcService<tonic::body::Body> + std::fmt::Debug + Clone + Send
        + Sync + 'static,
    T::ResponseBody: tonic::codegen::Body<Data = tonic::codegen::Bytes> + Send + 'static,
    <T::ResponseBody as tonic::codegen::Body>::Error: Into<tonic::codegen::StdError>
        + Send,
    T::Future: Send,
{
    async fn ingest(&self, request: IngestRequest) -> crate::Result<IngestResponse> {
        self.inner
            .clone()
            .ingest(request)
            .await
            .map(|response| response.into_inner())
            .map_err(|status| crate::error::grpc_status_to_service_error(
                status,
                IngestRequest::rpc_name(),
            ))
    }
    async fn fetch(&self, request: FetchRequest) -> crate::Result<FetchResponse> {
        self.inner
            .clone()
            .fetch(request)
            .await
            .map(|response| response.into_inner())
            .map_err(|status| crate::error::grpc_status_to_service_error(
                status,
                FetchRequest::rpc_name(),
            ))
    }
    async fn tail(&self, request: TailRequest) -> crate::Result<FetchResponse> {
        self.inner
            .clone()
            .tail(request)
            .await
            .map(|response| response.into_inner())
            .map_err(|status| crate::error::grpc_status_to_service_error(
                status,
                TailRequest::rpc_name(),
            ))
    }
}
#[derive(Debug)]
pub struct IngestServiceGrpcServerAdapter {
    inner: InnerIngestServiceClient,
}
impl IngestServiceGrpcServerAdapter {
    pub fn new<T>(instance: T) -> Self
    where
        T: IngestService,
    {
        Self {
            inner: InnerIngestServiceClient(std::sync::Arc::new(instance)),
        }
    }
}
#[async_trait::async_trait]
impl ingest_service_grpc_server::IngestServiceGrpc for IngestServiceGrpcServerAdapter {
    async fn ingest(
        &self,
        request: tonic::Request<IngestRequest>,
    ) -> Result<tonic::Response<IngestResponse>, tonic::Status> {
        self.inner
            .0
            .ingest(request.into_inner())
            .await
            .map(tonic::Response::new)
            .map_err(crate::error::grpc_error_to_grpc_status)
    }
    async fn fetch(
        &self,
        request: tonic::Request<FetchRequest>,
    ) -> Result<tonic::Response<FetchResponse>, tonic::Status> {
        self.inner
            .0
            .fetch(request.into_inner())
            .await
            .map(tonic::Response::new)
            .map_err(crate::error::grpc_error_to_grpc_status)
    }
    async fn tail(
        &self,
        request: tonic::Request<TailRequest>,
    ) -> Result<tonic::Response<FetchResponse>, tonic::Status> {
        self.inner
            .0
            .tail(request.into_inner())
            .await
            .map(tonic::Response::new)
            .map_err(crate::error::grpc_error_to_grpc_status)
    }
}
/// Generated client implementations.
pub mod ingest_service_grpc_client {
    #![allow(
        unused_variables,
        dead_code,
        missing_docs,
        clippy::wildcard_imports,
        clippy::let_unit_value,
    )]
    use tonic::codegen::*;
    use tonic::codegen::http::Uri;
    #[derive(Debug, Clone)]
    pub struct IngestServiceGrpcClient<T> {
        inner: tonic::client::Grpc<T>,
    }
    impl IngestServiceGrpcClient<tonic::transport::Channel> {
        /// Attempt to create a new client by connecting to a given endpoint.
        pub async fn connect<D>(dst: D) -> Result<Self, tonic::transport::Error>
        where
            D: TryInto<tonic::transport::Endpoint>,
            D::Error: Into<StdError>,
        {
            let conn = tonic::transport::Endpoint::new(dst)?.connect().await?;
            Ok(Self::new(conn))
        }
    }
    impl<T> IngestServiceGrpcClient<T>
    where
        T: tonic::client::GrpcService<tonic::body::Body>,
        T::Error: Into<StdError>,
        T::ResponseBody: Body<Data = Bytes> + std::marker::Send + 'static,
        <T::ResponseBody as Body>::Error: Into<StdError> + std::marker::Send,
    {
        pub fn new(inner: T) -> Self {
            let inner = tonic::client::Grpc::new(inner);
            Self { inner }
        }
        pub fn with_origin(inner: T, origin: Uri) -> Self {
            let inner = tonic::client::Grpc::with_origin(inner, origin);
            Self { inner }
        }
        pub fn with_interceptor<F>(
            inner: T,
            interceptor: F,
        ) -> IngestServiceGrpcClient<InterceptedService<T, F>>
        where
            F: tonic::service::Interceptor,
            T::ResponseBody: Default,
            T: tonic::codegen::Service<
                http::Request<tonic::body::Body>,
                Response = http::Response<
                    <T as tonic::client::GrpcService<tonic::body::Body>>::ResponseBody,
                >,
            >,
            <T as tonic::codegen::Service<
                http::Request<tonic::body::Body>,
            >>::Error: Into<StdError> + std::marker::Send + std::marker::Sync,
        {
            IngestServiceGrpcClient::new(InterceptedService::new(inner, interceptor))
        }
        /// Compress requests with the given encoding.
        ///
        /// This requires the server to support it otherwise it might respond with an
        /// error.
        #[must_use]
        pub fn send_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.inner = self.inner.send_compressed(encoding);
            self
        }
        /// Enable decompressing responses.
        #[must_use]
        pub fn accept_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.inner = self.inner.accept_compressed(encoding);
            self
        }
        /// Limits the maximum size of a decoded message.
        ///
        /// Default: `4MB`
        #[must_use]
        pub fn max_decoding_message_size(mut self, limit: usize) -> Self {
            self.inner = self.inner.max_decoding_message_size(limit);
            self
        }
        /// Limits the maximum size of an encoded message.
        ///
        /// Default: `usize::MAX`
        #[must_use]
        pub fn max_encoding_message_size(mut self, limit: usize) -> Self {
            self.inner = self.inner.max_encoding_message_size(limit);
            self
        }
        /// Ingests document in a given queue.
        ///
        /// Upon any kind of error, the client should
        ///
        /// * retry to get at least once delivery.
        /// * not retry to get at most once delivery.
        ///
        /// Exactly once delivery is not supported yet.
        pub async fn ingest(
            &mut self,
            request: impl tonic::IntoRequest<super::IngestRequest>,
        ) -> std::result::Result<tonic::Response<super::IngestResponse>, tonic::Status> {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/ingest_service.IngestService/Ingest",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(GrpcMethod::new("ingest_service.IngestService", "Ingest"));
            self.inner.unary(req, path, codec).await
        }
        /// Fetches record from a given queue.
        ///
        /// Records are returned in order.
        ///
        /// The returned `FetchResponse` object is meant to be read with the
        /// `crate::iter_records` function.
        ///
        /// Fetching does not necessarily return all of the available records.
        /// If returning all records would exceed `FETCH_PAYLOAD_LIMIT` (2MB),
        /// the response will be partial.
        pub async fn fetch(
            &mut self,
            request: impl tonic::IntoRequest<super::FetchRequest>,
        ) -> std::result::Result<tonic::Response<super::FetchResponse>, tonic::Status> {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/ingest_service.IngestService/Fetch",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(GrpcMethod::new("ingest_service.IngestService", "Fetch"));
            self.inner.unary(req, path, codec).await
        }
        /// Returns a batch containing the last records.
        ///
        /// It returns the last documents, from the newest
        /// to the oldest, and stops as soon as `FETCH_PAYLOAD_LIMIT` (2MB)
        /// is exceeded.
        pub async fn tail(
            &mut self,
            request: impl tonic::IntoRequest<super::TailRequest>,
        ) -> std::result::Result<tonic::Response<super::FetchResponse>, tonic::Status> {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/ingest_service.IngestService/Tail",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(GrpcMethod::new("ingest_service.IngestService", "Tail"));
            self.inner.unary(req, path, codec).await
        }
    }
}
/// Generated server implementations.
pub mod ingest_service_grpc_server {
    #![allow(
        unused_variables,
        dead_code,
        missing_docs,
        clippy::wildcard_imports,
        clippy::let_unit_value,
    )]
    use tonic::codegen::*;
    /// Generated trait containing gRPC methods that should be implemented for use with IngestServiceGrpcServer.
    #[async_trait]
    pub trait IngestServiceGrpc: std::marker::Send + std::marker::Sync + 'static {
        /// Ingests document in a given queue.
        ///
        /// Upon any kind of error, the client should
        ///
        /// * retry to get at least once delivery.
        /// * not retry to get at most once delivery.
        ///
        /// Exactly once delivery is not supported yet.
        async fn ingest(
            &self,
            request: tonic::Request<super::IngestRequest>,
        ) -> std::result::Result<tonic::Response<super::IngestResponse>, tonic::Status>;
        /// Fetches record from a given queue.
        ///
        /// Records are returned in order.
        ///
        /// The returned `FetchResponse` object is meant to be read with the
        /// `crate::iter_records` function.
        ///
        /// Fetching does not necessarily return all of the available records.
        /// If returning all records would exceed `FETCH_PAYLOAD_LIMIT` (2MB),
        /// the response will be partial.
        async fn fetch(
            &self,
            request: tonic::Request<super::FetchRequest>,
        ) -> std::result::Result<tonic::Response<super::FetchResponse>, tonic::Status>;
        /// Returns a batch containing the last records.
        ///
        /// It returns the last documents, from the newest
        /// to the oldest, and stops as soon as `FETCH_PAYLOAD_LIMIT` (2MB)
        /// is exceeded.
        async fn tail(
            &self,
            request: tonic::Request<super::TailRequest>,
        ) -> std::result::Result<tonic::Response<super::FetchResponse>, tonic::Status>;
    }
    #[derive(Debug)]
    pub struct IngestServiceGrpcServer<T> {
        inner: Arc<T>,
        accept_compression_encodings: EnabledCompressionEncodings,
        send_compression_encodings: EnabledCompressionEncodings,
        max_decoding_message_size: Option<usize>,
        max_encoding_message_size: Option<usize>,
    }
    impl<T> IngestServiceGrpcServer<T> {
        pub fn new(inner: T) -> Self {
            Self::from_arc(Arc::new(inner))
        }
        pub fn from_arc(inner: Arc<T>) -> Self {
            Self {
                inner,
                accept_compression_encodings: Default::default(),
                send_compression_encodings: Default::default(),
                max_decoding_message_size: None,
                max_encoding_message_size: None,
            }
        }
        pub fn with_interceptor<F>(
            inner: T,
            interceptor: F,
        ) -> InterceptedService<Self, F>
        where
            F: tonic::service::Interceptor,
        {
            InterceptedService::new(Self::new(inner), interceptor)
        }
        /// Enable decompressing requests with the given encoding.
        #[must_use]
        pub fn accept_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.accept_compression_encodings.enable(encoding);
            self
        }
        /// Compress responses with the given encoding, if the client supports it.
        #[must_use]
        pub fn send_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.send_compression_encodings.enable(encoding);
            self
        }
        /// Limits the maximum size of a decoded message.
        ///
        /// Default: `4MB`
        #[must_use]
        pub fn max_decoding_message_size(mut self, limit: usize) -> Self {
            self.max_decoding_message_size = Some(limit);
            self
        }
        /// Limits the maximum size of an encoded message.
        ///
        /// Default: `usize::MAX`
        #[must_use]
        pub fn max_encoding_message_size(mut self, limit: usize) -> Self {
            self.max_encoding_message_size = Some(limit);
            self
        }
    }
    impl<T, B> tonic::codegen::Service<http::Request<B>> for IngestServiceGrpcServer<T>
    where
        T: IngestServiceGrpc,
        B: Body + std::marker::Send + 'static,
        B::Error: Into<StdError> + std::marker::Send + 'static,
    {
        type Response = http::Response<tonic::body::Body>;
        type Error = std::convert::Infallible;
        type Future = BoxFuture<Self::Response, Self::Error>;
        fn poll_ready(
            &mut self,
            _cx: &mut Context<'_>,
        ) -> Poll<std::result::Result<(), Self::Error>> {
            Poll::Ready(Ok(()))
        }
        fn call(&mut self, req: http::Request<B>) -> Self::Future {
            match req.uri().path() {
                "/ingest_service.IngestService/Ingest" => {
                    #[allow(non_camel_case_types)]
                    struct IngestSvc<T: IngestServiceGrpc>(pub Arc<T>);
                    impl<
                        T: IngestServiceGrpc,
                    > tonic::server::UnaryService<super::IngestRequest>
                    for IngestSvc<T> {
                        type Response = super::IngestResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::IngestRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as IngestServiceGrpc>::ingest(&inner, request).await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = IngestSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/ingest_service.IngestService/Fetch" => {
                    #[allow(non_camel_case_types)]
                    struct FetchSvc<T: IngestServiceGrpc>(pub Arc<T>);
                    impl<
                        T: IngestServiceGrpc,
                    > tonic::server::UnaryService<super::FetchRequest> for FetchSvc<T> {
                        type Response = super::FetchResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::FetchRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as IngestServiceGrpc>::fetch(&inner, request).await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = FetchSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/ingest_service.IngestService/Tail" => {
                    #[allow(non_camel_case_types)]
                    struct TailSvc<T: IngestServiceGrpc>(pub Arc<T>);
                    impl<
                        T: IngestServiceGrpc,
                    > tonic::server::UnaryService<super::TailRequest> for TailSvc<T> {
                        type Response = super::FetchResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::TailRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as IngestServiceGrpc>::tail(&inner, request).await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = TailSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                _ => {
                    Box::pin(async move {
                        let mut response = http::Response::new(
                            tonic::body::Body::default(),
                        );
                        let headers = response.headers_mut();
                        headers
                            .insert(
                                tonic::Status::GRPC_STATUS,
                                (tonic::Code::Unimplemented as i32).into(),
                            );
                        headers
                            .insert(
                                http::header::CONTENT_TYPE,
                                tonic::metadata::GRPC_CONTENT_TYPE,
                            );
                        Ok(response)
                    })
                }
            }
        }
    }
    impl<T> Clone for IngestServiceGrpcServer<T> {
        fn clone(&self) -> Self {
            let inner = self.inner.clone();
            Self {
                inner,
                accept_compression_encodings: self.accept_compression_encodings,
                send_compression_encodings: self.send_compression_encodings,
                max_decoding_message_size: self.max_decoding_message_size,
                max_encoding_message_size: self.max_encoding_message_size,
            }
        }
    }
    /// Generated gRPC service name
    pub const SERVICE_NAME: &str = "ingest_service.IngestService";
    impl<T> tonic::server::NamedService for IngestServiceGrpcServer<T> {
        const NAME: &'static str = SERVICE_NAME;
    }
}


================================================
FILE: quickwit/quickwit-ingest/src/doc_batch.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use bytes::buf::Writer;
use bytes::{Buf, BufMut, Bytes, BytesMut};
use quickwit_proto::types::IndexId;
use serde::Serialize;

use crate::DocBatch;

#[derive(Debug)]
/// Represents a command that can be stored in a [`DocBatch`].
pub enum DocCommand<T>
where T: Buf
{
    Ingest { payload: T },
    Commit,
    // ... more to come?
}

/// We can use this byte to track both commands and their version changes
/// If serialization protocol changes, we can just use the next number
#[derive(Debug)]
#[repr(u8)]
pub enum DocCommandCode {
    IngestV1 = 0,
    CommitV1 = 1,
}

impl From<u8> for DocCommandCode {
    fn from(value: u8) -> Self {
        match value {
            0 => DocCommandCode::IngestV1,
            1 => DocCommandCode::CommitV1,
            other => panic!("Encountered unknown command: code {other}"),
        }
    }
}

impl<T> DocCommand<T>
where T: Buf + Default
{
    /// Returns the binary serialization code for the current version of this command.
    pub fn code(&self) -> DocCommandCode {
        match self {
            DocCommand::Ingest { payload: _ } => DocCommandCode::IngestV1,
            DocCommand::Commit => DocCommandCode::CommitV1,
        }
    }

    /// Builds a command for bytes::Buf
    pub fn read(mut buf: T) -> Self {
        match buf.get_u8().into() {
            DocCommandCode::IngestV1 => DocCommand::Ingest { payload: buf },
            DocCommandCode::CommitV1 => DocCommand::Commit,
        }
    }

    /// Copies the command to the end of bytes::BufMut while returning the number of bytes copied
    pub fn write(self, mut buf: impl BufMut) -> usize {
        let self_buf = self.into_buf();
        let len = self_buf.remaining();
        buf.put(self_buf);
        len
    }

    pub fn into_buf(self) -> impl Buf {
        self.code_chunk().chain(match self {
            DocCommand::Ingest { payload } => payload,
            DocCommand::Commit => T::default(),
        })
    }

    fn code_chunk(&self) -> &'static [u8; 1] {
        match self {
            DocCommand::Ingest { payload: _ } => &[DocCommandCode::IngestV1 as u8],
            DocCommand::Commit => &[DocCommandCode::CommitV1 as u8],
        }
    }
}

/// Builds DocBatch from individual commands
pub struct DocBatchBuilder {
    index_id: IndexId,
    doc_buffer: BytesMut,
    doc_lengths: Vec<u32>,
}

impl DocBatchBuilder {
    /// Creates a new batch builder for the given index name.
    pub fn new(index_id: IndexId) -> Self {
        Self {
            index_id,
            doc_buffer: BytesMut::new(),
            doc_lengths: Vec::new(),
        }
    }

    /// Creates a new batch builder for the given index name with some pre-allocated capacity for
    /// the internal doc buffer.
    pub fn with_capacity(index_id: IndexId, capacity: usize) -> Self {
        Self {
            index_id,
            doc_buffer: BytesMut::with_capacity(capacity),
            doc_lengths: Vec::new(),
        }
    }

    /// Adds an ingest command to the batch
    pub fn ingest_doc(&mut self, payload: impl Buf + Default) -> usize {
        let command = DocCommand::Ingest { payload };
        self.command(command)
    }

    /// Adds a commit command to the batch
    pub fn commit(&mut self) -> usize {
        let command: DocCommand<Bytes> = DocCommand::Commit;
        self.command(command)
    }

    /// Adds a parsed command to the batch
    pub fn command<T>(&mut self, command: DocCommand<T>) -> usize
    where T: Buf + Default {
        let len = command.write(&mut self.doc_buffer);
        self.doc_lengths.push(len as u32);
        len
    }

    /// Adds a list of bytes representing a command to the batch
    pub fn command_from_buf(&mut self, raw: impl Buf) -> usize {
        let len = raw.remaining();
        self.doc_buffer.put(raw);
        self.doc_lengths.push(len as u32);
        len
    }

    /// Creates another batch builder capable of processing a Serialize structs instead of commands
    pub fn json_writer(self) -> JsonDocBatchBuilder {
        JsonDocBatchBuilder {
            index_id: self.index_id,
            doc_buffer: self.doc_buffer.writer(),
            doc_lengths: self.doc_lengths,
        }
    }

    /// Builds the batch
    pub fn build(self) -> DocBatch {
        DocBatch {
            index_id: self.index_id,
            doc_buffer: self.doc_buffer.freeze(),
            doc_lengths: self.doc_lengths,
        }
    }
}

/// A wrapper around batch builder that can add a Serialize structs
pub struct JsonDocBatchBuilder {
    index_id: IndexId,
    doc_buffer: Writer<BytesMut>,
    doc_lengths: Vec<u32>,
}

impl JsonDocBatchBuilder {
    /// Adds an ingest command to the batch for a Serialize struct
    pub fn ingest_doc(&mut self, payload: impl Serialize) -> serde_json::Result<usize> {
        let old_len = self.doc_buffer.get_ref().len();
        self.doc_buffer
            .get_mut()
            .put_u8(DocCommandCode::IngestV1 as u8);
        let res = serde_json::to_writer(&mut self.doc_buffer, &payload);
        let new_len = self.doc_buffer.get_ref().len();
        if let Err(err) = res {
            Err(err)
        } else {
            let len = new_len - old_len;
            self.doc_lengths.push(len as u32);
            Ok(len)
        }
    }

    /// Returns the underlying batch builder
    pub fn into_inner(self) -> DocBatchBuilder {
        DocBatchBuilder {
            index_id: self.index_id,
            doc_buffer: self.doc_buffer.into_inner(),
            doc_lengths: self.doc_lengths,
        }
    }

    /// Builds the batch
    pub fn build(self) -> DocBatch {
        self.into_inner().build()
    }
}

impl DocBatch {
    /// Returns an iterator over the document payloads within a doc_batch.
    #[allow(clippy::should_implement_trait)]
    pub fn into_iter(self) -> impl Iterator<Item = DocCommand<Bytes>> {
        self.into_iter_raw().map(DocCommand::read)
    }

    /// Returns an iterator over the document payloads within a doc_batch.
    pub fn into_iter_raw(self) -> impl Iterator<Item = Bytes> {
        let DocBatch {
            doc_buffer,
            doc_lengths,
            ..
        } = self;
        doc_lengths
            .into_iter()
            .scan(0, move |current_offset, doc_num_bytes| {
                let start = *current_offset;
                let end = start + doc_num_bytes as usize;
                *current_offset = end;
                Some(doc_buffer.slice(start..end))
            })
    }

    /// Returns true if the batch is empty.
    pub fn is_empty(&self) -> bool {
        self.doc_lengths.is_empty()
    }

    /// Returns the total number of bytes in the batch.
    pub fn num_bytes(&self) -> usize {
        self.doc_buffer.len()
    }

    /// Returns the number of documents in the batch.
    pub fn num_docs(&self) -> usize {
        self.doc_lengths.len()
    }
}

#[cfg(test)]
mod tests {
    use serde_json::json;

    use super::*;

    fn commands_eq<L, R>(l: DocCommand<L>, r: DocCommand<R>) -> bool
    where
        L: Buf,
        R: Buf,
    {
        match (l, r) {
            (
                DocCommand::Ingest {
                    payload: mut l_payload,
                },
                DocCommand::Ingest {
                    payload: mut r_payload,
                },
            ) => {
                l_payload.copy_to_bytes(l_payload.remaining())
                    == r_payload.copy_to_bytes(r_payload.remaining())
            }
            (DocCommand::Commit, DocCommand::Commit) => true,
            _ => false,
        }
    }

    macro_rules! test_command_roundtrip {
        ($command:expr) => {
            let original = $command;
            let expected = $command;
            let mut buf = BytesMut::new();
            let size = original.write(&mut buf);
            assert!(size > 0);
            let copy = DocCommand::read(buf);
            assert!(commands_eq(expected, copy));
        };
    }

    #[test]
    fn test_commands_eq() {
        assert!(commands_eq(
            DocCommand::Ingest {
                payload: &b"hello"[..]
            },
            DocCommand::Ingest {
                payload: Bytes::from("hello")
            }
        ));
        assert!(commands_eq(
            DocCommand::Commit::<Bytes>,
            DocCommand::Commit::<&[u8]>
        ));
        assert!(!commands_eq(
            DocCommand::Ingest {
                payload: Bytes::from("hello")
            },
            DocCommand::Ingest {
                payload: Bytes::from("world")
            }
        ));
        assert!(!commands_eq(
            DocCommand::Ingest {
                payload: Bytes::from("hello")
            },
            DocCommand::Commit::<Bytes>
        ));
    }

    #[test]
    fn test_commands_roundtrip() {
        test_command_roundtrip!(DocCommand::Ingest {
            payload: &b"hello"[..]
        });
        test_command_roundtrip!(DocCommand::Ingest {
            payload: Bytes::from("hello")
        });
        test_command_roundtrip!(DocCommand::Commit::<Bytes>);
        test_command_roundtrip!(DocCommand::Commit::<&[u8]>);
    }

    #[test]
    fn test_batch_builder() {
        let mut batch = DocBatchBuilder::new("test".to_string());
        batch.ingest_doc(&b"hello"[..]);
        batch.ingest_doc(&b" "[..]);
        batch.command(DocCommand::Ingest {
            payload: Bytes::from("world"),
        });
        batch.commit();

        let batch = batch.build();
        assert_eq!(batch.index_id, "test");
        assert_eq!(batch.num_docs(), 4);
        assert_eq!(batch.num_bytes(), 5 + 1 + 5 + 4);

        let mut iter = batch.clone().into_iter();
        assert!(commands_eq(
            iter.next().unwrap(),
            DocCommand::Ingest {
                payload: Bytes::from("hello")
            }
        ));
        assert!(commands_eq(
            iter.next().unwrap(),
            DocCommand::Ingest {
                payload: Bytes::from(" ")
            }
        ));
        assert!(commands_eq(
            iter.next().unwrap(),
            DocCommand::Ingest {
                payload: Bytes::from("world")
            }
        ));
        assert!(commands_eq(
            iter.next().unwrap(),
            DocCommand::Commit::<Bytes>
        ));
        assert!(iter.next().is_none());

        let mut copied_batch = DocBatchBuilder::new("test".to_string());
        for raw_buf in batch.clone().into_iter_raw() {
            copied_batch.command_from_buf(raw_buf);
        }
        let copied_batch = copied_batch.build();

        assert_eq!(batch, copied_batch);
    }

    #[test]
    fn test_json_batch_builder() {
        let mut batch = DocBatchBuilder::new("test".to_string()).json_writer();
        batch.ingest_doc(json!({"test":"a"})).unwrap();
        batch.ingest_doc(json!({"test":"b"})).unwrap();

        let mut batch = batch.into_inner();
        batch.commit();

        let batch = batch.build();
        assert_eq!(batch.index_id, "test");
        assert_eq!(batch.num_docs(), 3);
        assert_eq!(batch.num_bytes(), 12 + 12 + 3);

        let mut iter = batch.into_iter();
        assert!(commands_eq(
            iter.next().unwrap(),
            DocCommand::Ingest {
                payload: Bytes::from(json!({"test": "a"}).to_string())
            }
        ));
        assert!(commands_eq(
            iter.next().unwrap(),
            DocCommand::Ingest {
                payload: Bytes::from(json!({"test": "b"}).to_string())
            }
        ));
        assert!(commands_eq(
            iter.next().unwrap(),
            DocCommand::Commit::<Bytes>
        ));
    }
}


================================================
FILE: quickwit/quickwit-ingest/src/error.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::io;

use mrecordlog::error::*;
use quickwit_actors::AskError;
use quickwit_common::rate_limited_error;
pub(crate) use quickwit_proto::error::{grpc_error_to_grpc_status, grpc_status_to_service_error};
use quickwit_proto::ingest::router::{IngestFailure, IngestFailureReason};
use quickwit_proto::ingest::{IngestV2Error, RateLimitingCause};
use quickwit_proto::types::IndexId;
use quickwit_proto::{GrpcServiceError, ServiceError, ServiceErrorCode, tonic};
use serde::{Deserialize, Serialize};

#[derive(Debug, Clone, thiserror::Error, Serialize, Deserialize)]
pub enum IngestServiceError {
    #[error("data corruption: {0}")]
    Corruption(String),
    #[error("index `{index_id}` already exists")]
    IndexAlreadyExists { index_id: IndexId },
    #[error("index `{index_id}` not found")]
    IndexNotFound { index_id: IndexId },
    #[error("an internal error occurred: {0}")]
    Internal(String),
    #[error("invalid position: {0}")]
    InvalidPosition(String),
    #[error("io error {0}")]
    IoError(String),
    #[error("rate limited {0}")]
    RateLimited(RateLimitingCause),
    #[error("ingest service is unavailable ({0})")]
    Unavailable(String),
    #[error("bad request ({0})")]
    BadRequest(String),
}

impl From<AskError<IngestServiceError>> for IngestServiceError {
    fn from(error: AskError<IngestServiceError>) -> Self {
        match error {
            AskError::ErrorReply(error) => error,
            AskError::MessageNotDelivered => {
                IngestServiceError::Unavailable("actor not running".to_string())
            }
            AskError::ProcessMessageError => IngestServiceError::Internal(error.to_string()),
        }
    }
}

impl From<quickwit_common::tower::BufferError> for IngestServiceError {
    fn from(error: quickwit_common::tower::BufferError) -> Self {
        use quickwit_common::tower::BufferError;
        match error {
            BufferError::Closed => IngestServiceError::Unavailable(error.to_string()),
            BufferError::Unknown => IngestServiceError::Internal(error.to_string()),
        }
    }
}

impl From<io::Error> for IngestServiceError {
    fn from(io_error: io::Error) -> Self {
        IngestServiceError::IoError(io_error.to_string())
    }
}

impl From<IngestV2Error> for IngestServiceError {
    fn from(error: IngestV2Error) -> Self {
        match error {
            IngestV2Error::Timeout(error_msg) => {
                IngestServiceError::Unavailable(format!("timeout {error_msg}"))
            }
            IngestV2Error::Unavailable(error_msg) => {
                IngestServiceError::Unavailable(format!("unavailable: {error_msg}"))
            }
            IngestV2Error::Internal(message) => IngestServiceError::Internal(message),
            IngestV2Error::ShardNotFound { .. } => {
                IngestServiceError::Internal("shard not found".to_string())
            }
            IngestV2Error::TooManyRequests(rate_limiting_cause) => {
                IngestServiceError::RateLimited(rate_limiting_cause)
            }
        }
    }
}

impl From<IngestFailure> for IngestServiceError {
    fn from(ingest_failure: IngestFailure) -> Self {
        match ingest_failure.reason() {
            IngestFailureReason::Unspecified => {
                IngestServiceError::Internal("unknown error".to_string())
            }
            IngestFailureReason::IndexNotFound => IngestServiceError::IndexNotFound {
                index_id: ingest_failure.index_id,
            },
            IngestFailureReason::SourceNotFound => IngestServiceError::Internal(format!(
                "Ingest v2 source not found for index {}",
                ingest_failure.index_id
            )),
            IngestFailureReason::Internal => {
                IngestServiceError::Internal("internal error".to_string())
            }
            IngestFailureReason::NoShardsAvailable => {
                IngestServiceError::Unavailable("no shards available".to_string())
            }
            IngestFailureReason::ShardRateLimited => {
                IngestServiceError::RateLimited(RateLimitingCause::ShardRateLimiting)
            }
            IngestFailureReason::WalFull => {
                IngestServiceError::RateLimited(RateLimitingCause::WalFull)
            }
            IngestFailureReason::Timeout => {
                IngestServiceError::Internal("request timed out".to_string())
            }
            IngestFailureReason::RouterLoadShedding => {
                IngestServiceError::RateLimited(RateLimitingCause::RouterLoadShedding)
            }
            IngestFailureReason::LoadShedding => {
                IngestServiceError::RateLimited(RateLimitingCause::LoadShedding)
            }
            IngestFailureReason::CircuitBreaker => {
                IngestServiceError::RateLimited(RateLimitingCause::CircuitBreaker)
            }
        }
    }
}

impl ServiceError for IngestServiceError {
    fn error_code(&self) -> ServiceErrorCode {
        match self {
            Self::Corruption(err_msg) => {
                rate_limited_error!(
                    limit_per_min = 6,
                    "ingest/corruption internal error: {err_msg}"
                );
                ServiceErrorCode::Internal
            }
            Self::IndexAlreadyExists { .. } => ServiceErrorCode::AlreadyExists,
            Self::IndexNotFound { .. } => ServiceErrorCode::NotFound,
            Self::Internal(err_msg) => {
                rate_limited_error!(limit_per_min = 6, "ingest internal error: {err_msg}");
                ServiceErrorCode::Internal
            }
            Self::InvalidPosition(_) => ServiceErrorCode::BadRequest,
            Self::IoError(io_err) => {
                rate_limited_error!(limit_per_min = 6, "ingest/io internal error: {io_err}");
                ServiceErrorCode::Internal
            }
            Self::RateLimited(_) => ServiceErrorCode::TooManyRequests,
            Self::Unavailable(_) => ServiceErrorCode::Unavailable,
            Self::BadRequest(_) => ServiceErrorCode::BadRequest,
        }
    }
}

impl GrpcServiceError for IngestServiceError {
    fn new_internal(message: String) -> Self {
        Self::Internal(message)
    }

    fn new_timeout(message: String) -> Self {
        Self::Internal(message)
    }

    fn new_too_many_requests() -> Self {
        Self::RateLimited(RateLimitingCause::Unknown)
    }

    fn new_unavailable(error_msg: String) -> Self {
        Self::Unavailable(error_msg)
    }
}

#[derive(Debug, thiserror::Error)]
#[error("key should contain 16 bytes, got {0}")]
pub struct CorruptedKey(pub usize);

impl From<CorruptedKey> for IngestServiceError {
    fn from(error: CorruptedKey) -> Self {
        IngestServiceError::Corruption(format!("corrupted key: {error:?}"))
    }
}

impl From<IngestServiceError> for tonic::Status {
    fn from(error: IngestServiceError) -> tonic::Status {
        let code = match &error {
            IngestServiceError::Corruption { .. } => tonic::Code::DataLoss,
            IngestServiceError::IndexAlreadyExists { .. } => tonic::Code::AlreadyExists,
            IngestServiceError::IndexNotFound { .. } => tonic::Code::NotFound,
            IngestServiceError::Internal(_) => tonic::Code::Internal,
            IngestServiceError::InvalidPosition(_) => tonic::Code::InvalidArgument,
            IngestServiceError::IoError { .. } => tonic::Code::Internal,
            IngestServiceError::RateLimited(_) => tonic::Code::ResourceExhausted,
            IngestServiceError::Unavailable(_) => tonic::Code::Unavailable,
            IngestServiceError::BadRequest(_) => tonic::Code::InvalidArgument,
        };
        let message = error.to_string();
        tonic::Status::new(code, message)
    }
}

impl From<ReadRecordError> for IngestServiceError {
    fn from(error: ReadRecordError) -> IngestServiceError {
        match error {
            ReadRecordError::IoError(io_error) => io_error.into(),
            ReadRecordError::Corruption => {
                IngestServiceError::Corruption("failed to read record".to_string())
            }
        }
    }
}

impl From<AppendError> for IngestServiceError {
    fn from(err: AppendError) -> IngestServiceError {
        match err {
            AppendError::IoError(io_error) => io_error.into(),
            AppendError::MissingQueue(index_id) => IngestServiceError::IndexNotFound { index_id },
            // these errors can't be reached right now
            AppendError::Past => IngestServiceError::InvalidPosition(
                "attempted to append a record in the past".to_string(),
            ),
        }
    }
}

impl From<DeleteQueueError> for IngestServiceError {
    fn from(err: DeleteQueueError) -> IngestServiceError {
        match err {
            DeleteQueueError::IoError(io_error) => io_error.into(),
            DeleteQueueError::MissingQueue(index_id) => {
                IngestServiceError::IndexNotFound { index_id }
            }
        }
    }
}

impl From<TruncateError> for IngestServiceError {
    fn from(err: TruncateError) -> IngestServiceError {
        match err {
            TruncateError::IoError(io_error) => io_error.into(),
            TruncateError::MissingQueue(index_id) => IngestServiceError::IndexNotFound { index_id },
        }
    }
}


================================================
FILE: quickwit/quickwit-ingest/src/ingest_api_service.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::path::Path;
use std::{fmt, iter};

use async_trait::async_trait;
use bytes::Bytes;
use quickwit_actors::{
    Actor, ActorContext, ActorExitStatus, DeferableReplyHandler, Handler, QueueCapacity,
};
use quickwit_common::runtimes::RuntimeType;
use quickwit_common::tower::Cost;
use quickwit_proto::ingest::RateLimitingCause;
use tracing::{error, info};
use ulid::Ulid;

use crate::metrics::INGEST_METRICS;
use crate::notifications::Notifications;
use crate::{
    CommitType, CreateQueueIfNotExistsRequest, CreateQueueIfNotExistsResponse, CreateQueueRequest,
    DocCommand, DropQueueRequest, FetchRequest, FetchResponse, IngestRequest, IngestResponse,
    IngestServiceError, ListQueuesRequest, ListQueuesResponse, MemoryCapacity, Queues,
    SuggestTruncateRequest, TailRequest,
};

impl Cost for IngestRequest {
    fn cost(&self) -> u64 {
        self.doc_batches
            .iter()
            .map(|doc_batch| doc_batch.num_bytes())
            .sum::<usize>() as u64
    }
}

pub struct IngestApiService {
    partition_id: String,
    queues: Queues,
    memory_limit: usize,
    disk_limit: usize,
    memory_capacity: MemoryCapacity,
    notifications: Notifications,
}

impl fmt::Debug for IngestApiService {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        f.debug_struct("IngestApiService")
            .field("partition_id", &self.partition_id)
            .field("memory_limit", &self.memory_limit)
            .field("disk_limit", &self.disk_limit)
            .finish()
    }
}

/// When we create our queue storage, we also generate and store
/// a random partition id associated to it.
///
/// That partition_id is used in the source checkpoint.
///
/// The idea is to make sure that if the entire queue storage is lost,
/// the old source checkpoint (stored in the metastore) do not apply.
/// (See #2310)
const PARTITION_ID_PATH: &str = "partition_id";

async fn get_or_initialize_partition_id(dir_path: &Path) -> crate::Result<String> {
    let partition_id_path = dir_path.join(PARTITION_ID_PATH);
    if let Ok(partition_id_bytes) = tokio::fs::read(&partition_id_path).await {
        let partition_id: &str = std::str::from_utf8(&partition_id_bytes).map_err(|_| {
            let msg = format!("partition key ({partition_id_bytes:?}) is not utf8");
            IngestServiceError::Corruption(msg)
        })?;
        return Ok(partition_id.to_string());
    }
    // We add a prefix here to make sure we don't mistake it for a split id when reading logs.
    let partition_id = format!("ingest_partition_{}", Ulid::new());
    tokio::fs::write(partition_id_path, partition_id.as_bytes()).await?;
    Ok(partition_id)
}

impl IngestApiService {
    pub async fn with_queues_dir(
        queues_dir_path: &Path,
        memory_limit: usize,
        disk_limit: usize,
    ) -> crate::Result<Self> {
        let queues = Queues::open(queues_dir_path).await?;
        let partition_id = get_or_initialize_partition_id(queues_dir_path).await?;
        let memory_capacity = MemoryCapacity::new(memory_limit);
        let notifications = Notifications::new();
        info!(ingest_partition_id=%partition_id, "Ingest API partition id");
        Ok(Self {
            partition_id,
            queues,
            memory_limit,
            disk_limit,
            memory_capacity,
            notifications,
        })
    }

    async fn ingest(
        &mut self,
        request: IngestRequest,
        reply: impl FnOnce(crate::Result<IngestResponse>) + Send + Sync + 'static,
        ctx: &ActorContext<Self>,
    ) -> Result<(), ActorExitStatus> {
        let notification = self.ingest_inner(request, ctx).await;
        match notification {
            Ok((response, index_positions)) => {
                if index_positions.is_empty() {
                    reply(Ok(response));
                } else {
                    self.notifications
                        .register(index_positions, move || {
                            reply(Ok(response));
                        })
                        .await;
                }
                Ok(())
            }
            Err(err) => {
                reply(Err(err));
                Ok(())
            }
        }
    }

    async fn ingest_inner(
        &mut self,
        request: IngestRequest,
        ctx: &ActorContext<Self>,
    ) -> crate::Result<(IngestResponse, Vec<(String, u64)>)> {
        // Check all indexes exist assuming existing queues always have a corresponding index.
        let first_non_existing_queue_opt = request
            .doc_batches
            .iter()
            .map(|batch| batch.index_id.as_str())
            .find(|index_id| !self.queues.queue_exists(index_id));

        if let Some(index_id) = first_non_existing_queue_opt {
            error!(
                index_id,
                partition_id = self.partition_id,
                "could not find index"
            );
            return Err(IngestServiceError::IndexNotFound {
                index_id: index_id.to_string(),
            });
        }
        let disk_used = self.queues.resource_usage().disk_used_bytes;

        if disk_used > self.disk_limit {
            info!("ingestion rejected due to disk limit");
            return Err(IngestServiceError::RateLimited(RateLimitingCause::WalFull));
        }

        if self
            .memory_capacity
            .reserve_capacity(request.cost() as usize)
            .is_err()
        {
            info!("ingest request rejected due to memory limit");
            return Err(IngestServiceError::RateLimited(RateLimitingCause::WalFull));
        }
        let mut num_docs = 0usize;
        let mut notifications = Vec::new();
        let commit = request.commit();
        for doc_batch in request.doc_batches {
            // TODO better error handling.
            // If there is an error, we probably want a transactional behavior.

            let batch_num_docs = doc_batch.num_docs();
            let batch_num_bytes = doc_batch.num_bytes();
            let index_id = doc_batch.index_id.clone();
            let records_it = doc_batch.into_iter_raw();
            let max_position = self.queues.append_batch(&index_id, records_it, ctx).await?;
            if let Some(max_position) = max_position
                && commit != CommitType::Auto
            {
                if commit == CommitType::Force {
                    self.queues
                        .append_batch(
                            &index_id,
                            iter::once(DocCommand::Commit::<Bytes>.into_buf()),
                            ctx,
                        )
                        .await?;
                }
                notifications.push((index_id.clone(), max_position));
            }

            num_docs += batch_num_docs;
            INGEST_METRICS
                .ingested_docs_bytes_valid
                .inc_by(batch_num_bytes as u64);
            INGEST_METRICS
                .ingested_docs_valid
                .inc_by(batch_num_docs as u64);
        }
        // TODO we could fsync here and disable autosync to have better i/o perfs.
        Ok((
            IngestResponse {
                num_docs_for_processing: num_docs as u64,
            },
            notifications,
        ))
    }

    fn fetch(&mut self, fetch_req: FetchRequest) -> crate::Result<FetchResponse> {
        let num_bytes_limit_opt: Option<usize> = fetch_req
            .num_bytes_limit
            .map(|num_bytes_limit| num_bytes_limit as usize);
        self.queues.fetch(
            &fetch_req.index_id,
            fetch_req.start_after,
            num_bytes_limit_opt,
        )
    }

    async fn suggest_truncate(
        &mut self,
        request: SuggestTruncateRequest,
        ctx: &ActorContext<Self>,
    ) -> crate::Result<()> {
        self.notifications
            .notify(&request.index_id, request.up_to_position_included)
            .await;
        self.queues
            .suggest_truncate(&request.index_id, request.up_to_position_included, ctx)
            .await?;

        let memory_used = self.queues.resource_usage().memory_used_bytes;
        let new_capacity = self.memory_limit - memory_used;
        self.memory_capacity.reset_capacity(new_capacity);

        Ok(())
    }
}

#[async_trait]
impl Actor for IngestApiService {
    type ObservableState = ();

    fn observable_state(&self) -> Self::ObservableState {}

    fn runtime_handle(&self) -> tokio::runtime::Handle {
        RuntimeType::NonBlocking.get_runtime_handle()
    }

    /// The Actor's incoming mailbox queue capacity. It is set when the actor is spawned.
    fn queue_capacity(&self) -> QueueCapacity {
        QueueCapacity::Bounded(3)
    }
}

#[derive(Debug)]
pub struct GetPartitionId;

#[async_trait]
impl Handler<GetPartitionId> for IngestApiService {
    type Reply = String;

    async fn handle(
        &mut self,
        _request: GetPartitionId,
        _ctx: &ActorContext<Self>,
    ) -> Result<Self::Reply, ActorExitStatus> {
        Ok(self.partition_id.clone())
    }
}

#[derive(Debug)]
pub struct GetMemoryCapacity;

#[async_trait]
impl Handler<GetMemoryCapacity> for IngestApiService {
    type Reply = MemoryCapacity;

    async fn handle(
        &mut self,
        _request: GetMemoryCapacity,
        _ctx: &ActorContext<Self>,
    ) -> Result<Self::Reply, ActorExitStatus> {
        Ok(self.memory_capacity.clone())
    }
}

#[async_trait]
impl Handler<CreateQueueRequest> for IngestApiService {
    type Reply = crate::Result<()>;
    async fn handle(
        &mut self,
        create_queue_req: CreateQueueRequest,
        ctx: &ActorContext<Self>,
    ) -> Result<Self::Reply, ActorExitStatus> {
        Ok(self
            .queues
            .create_queue(&create_queue_req.queue_id, ctx)
            .await)
    }
}

#[async_trait]
impl Handler<CreateQueueIfNotExistsRequest> for IngestApiService {
    type Reply = crate::Result<CreateQueueIfNotExistsResponse>;
    async fn handle(
        &mut self,
        create_queue_inf_req: CreateQueueIfNotExistsRequest,
        ctx: &ActorContext<Self>,
    ) -> Result<Self::Reply, ActorExitStatus> {
        if self.queues.queue_exists(&create_queue_inf_req.queue_id) {
            let response = CreateQueueIfNotExistsResponse {
                queue_id: create_queue_inf_req.queue_id,
                created: false,
            };
            return Ok(Ok(response));
        }
        Ok(self
            .queues
            .create_queue(&create_queue_inf_req.queue_id, ctx)
            .await
            .map(|_| CreateQueueIfNotExistsResponse {
                queue_id: create_queue_inf_req.queue_id,
                created: true,
            }))
    }
}

#[async_trait]
impl Handler<DropQueueRequest> for IngestApiService {
    type Reply = crate::Result<()>;
    async fn handle(
        &mut self,
        drop_queue_req: DropQueueRequest,
        ctx: &ActorContext<Self>,
    ) -> Result<Self::Reply, ActorExitStatus> {
        Ok(self.queues.drop_queue(&drop_queue_req.queue_id, ctx).await)
    }
}

#[async_trait]
impl DeferableReplyHandler<IngestRequest> for IngestApiService {
    type Reply = crate::Result<IngestResponse>;
    async fn handle_message(
        &mut self,
        ingest_req: IngestRequest,
        reply: impl FnOnce(Self::Reply) + Send + Sync + 'static,
        ctx: &ActorContext<Self>,
    ) -> Result<(), ActorExitStatus> {
        self.ingest(ingest_req, reply, ctx).await?;
        Ok(())
    }
}

#[async_trait]
impl Handler<FetchRequest> for IngestApiService {
    type Reply = crate::Result<FetchResponse>;
    async fn handle(
        &mut self,
        request: FetchRequest,
        _ctx: &ActorContext<Self>,
    ) -> Result<Self::Reply, ActorExitStatus> {
        Ok(self.fetch(request))
    }
}

#[async_trait]
impl Handler<TailRequest> for IngestApiService {
    type Reply = crate::Result<FetchResponse>;
    async fn handle(
        &mut self,
        request: TailRequest,
        _ctx: &ActorContext<Self>,
    ) -> Result<Self::Reply, ActorExitStatus> {
        Ok(self.queues.tail(&request.index_id))
    }
}

#[async_trait]
impl Handler<SuggestTruncateRequest> for IngestApiService {
    type Reply = crate::Result<()>;
    async fn handle(
        &mut self,
        request: SuggestTruncateRequest,
        ctx: &ActorContext<Self>,
    ) -> Result<Self::Reply, ActorExitStatus> {
        Ok(self.suggest_truncate(request, ctx).await)
    }
}

#[async_trait]
impl Handler<ListQueuesRequest> for IngestApiService {
    type Reply = crate::Result<ListQueuesResponse>;
    async fn handle(
        &mut self,
        _list_queue_req: ListQueuesRequest,
        _ctx: &ActorContext<Self>,
    ) -> Result<Self::Reply, ActorExitStatus> {
        Ok(self.queues.list_queues())
    }
}

#[cfg(test)]
mod tests {
    use std::time::Duration;

    use bytes::Bytes;
    use quickwit_actors::Universe;
    use quickwit_config::IngestApiConfig;

    use super::*;
    use crate::{DocBatch, DocBatchBuilder, init_ingest_api};

    #[test]
    fn test_ingest_request_cost() {
        let ingest_request = IngestRequest {
            doc_batches: vec![
                DocBatch {
                    index_id: "index-1".to_string(),
                    doc_buffer: Bytes::from_static(&[0, 1, 2]),
                    doc_lengths: vec![1, 2],
                },
                DocBatch {
                    index_id: "index-2".to_string(),
                    doc_buffer: Bytes::from_static(&[3, 4, 5, 6, 7, 8]),
                    doc_lengths: vec![1, 3, 2],
                },
            ],
            commit: CommitType::Auto.into(),
        };
        assert_eq!(ingest_request.cost(), 9);
    }

    #[tokio::test]
    async fn test_ingest_api_service_with_commit() -> anyhow::Result<()> {
        let universe = Universe::with_accelerated_time();
        let temp_dir = tempfile::tempdir()?;
        let queues_dir_path = temp_dir.path();

        let ingest_api_service =
            init_ingest_api(&universe, queues_dir_path, &IngestApiConfig::default()).await?;

        // Ensure a queue for this index exists.
        let create_queue_req = CreateQueueIfNotExistsRequest {
            queue_id: "index-1".to_string(),
        };

        ingest_api_service.ask_for_res(create_queue_req).await?;

        let mut batch = DocBatchBuilder::new("index-1".to_string());
        batch.ingest_doc(Bytes::from_static(b"Test1"));
        batch.ingest_doc(Bytes::from_static(b"Test2"));
        batch.ingest_doc(Bytes::from_static(b"Test3"));
        batch.ingest_doc(Bytes::from_static(b"Test4"));

        let ingest_request = IngestRequest {
            doc_batches: vec![batch.build()],
            commit: CommitType::Force.into(),
        };
        let ingest_response = ingest_api_service
            .send_message(ingest_request)
            .await
            .unwrap();
        universe.sleep(Duration::from_secs(2)).await;
        let fetch_request = FetchRequest {
            index_id: "index-1".to_string(),
            start_after: None,
            num_bytes_limit: None,
        };
        let fetch_response = ingest_api_service.ask_for_res(fetch_request).await.unwrap();
        let doc_batch = fetch_response.doc_batch.unwrap();
        let position = doc_batch.num_docs() as u64;
        assert_eq!(doc_batch.num_docs(), 5);
        assert!(matches!(
            doc_batch.into_iter().nth(4),
            Some(DocCommand::Commit::<Bytes>)
        ));
        ingest_api_service
            .send_message(SuggestTruncateRequest {
                index_id: "index-1".to_string(),
                up_to_position_included: position,
            })
            .await
            .unwrap();

        let ingest_response = ingest_response.await.unwrap().unwrap();
        assert_eq!(ingest_response.num_docs_for_processing, 4);

        universe.assert_quit().await;
        Ok(())
    }

    #[tokio::test]
    async fn test_ingest_api_service_with_wait() -> anyhow::Result<()> {
        let universe = Universe::with_accelerated_time();
        let temp_dir = tempfile::tempdir()?;
        let queues_dir_path = temp_dir.path();

        let ingest_api_service =
            init_ingest_api(&universe, queues_dir_path, &IngestApiConfig::default()).await?;

        // Ensure a queue for this index exists.
        let create_queue_req = CreateQueueIfNotExistsRequest {
            queue_id: "index-1".to_string(),
        };

        ingest_api_service.ask_for_res(create_queue_req).await?;

        let mut batch = DocBatchBuilder::new("index-1".to_string());
        batch.ingest_doc(Bytes::from_static(b"Test1"));
        batch.ingest_doc(Bytes::from_static(b"Test2"));
        batch.ingest_doc(Bytes::from_static(b"Test3"));
        batch.ingest_doc(Bytes::from_static(b"Test4"));

        let ingest_request = IngestRequest {
            doc_batches: vec![batch.build()],
            commit: CommitType::WaitFor.into(),
        };
        let ingest_response = ingest_api_service
            .send_message(ingest_request)
            .await
            .unwrap();
        universe.sleep(Duration::from_secs(2)).await;
        let fetch_request = FetchRequest {
            index_id: "index-1".to_string(),
            start_after: None,
            num_bytes_limit: None,
        };
        let fetch_response = ingest_api_service.ask_for_res(fetch_request).await.unwrap();
        let doc_batch = fetch_response.doc_batch.unwrap();
        let position = doc_batch.num_docs() as u64;
        assert_eq!(doc_batch.num_docs(), 4);
        ingest_api_service
            .send_message(SuggestTruncateRequest {
                index_id: "index-1".to_string(),
                up_to_position_included: position,
            })
            .await
            .unwrap();

        let ingest_response = ingest_response.await.unwrap().unwrap();
        assert_eq!(ingest_response.num_docs_for_processing, 4);

        universe.assert_quit().await;
        Ok(())
    }
}


================================================
FILE: quickwit/quickwit-ingest/src/ingest_service.proto
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.


syntax = "proto3";

package ingest_service;

service IngestService {
  // Ingests document in a given queue.
  //
  // Upon any kind of error, the client should
  // - retry to get at least once delivery.
  // - not retry to get at most once delivery.
  //
  // Exactly once delivery is not supported yet.
  rpc Ingest(IngestRequest) returns (IngestResponse);

  // Fetches record from a given queue.
  //
  // Records are returned in order.
  //
  // The returned `FetchResponse` object is meant to be read with the
  // `crate::iter_records` function.
  //
  // Fetching does not necessarily return all of the available records.
  // If returning all records would exceed `FETCH_PAYLOAD_LIMIT` (2MB),
  // the response will be partial.
  rpc Fetch(FetchRequest) returns (FetchResponse);

  // Returns a batch containing the last records.
  //
  // It returns the last documents, from the newest
  // to the oldest, and stops as soon as `FETCH_PAYLOAD_LIMIT` (2MB)
  // is exceeded.
  rpc Tail(TailRequest) returns (FetchResponse);
}

message QueueExistsRequest {
    string queue_id = 1;
}

message CreateQueueRequest {
    string queue_id = 1;
}

message CreateQueueIfNotExistsRequest {
    string queue_id = 1;
}

message CreateQueueIfNotExistsResponse {
    string queue_id = 1;
    bool created = 2;
}

message DropQueueRequest {
    string queue_id = 1;
}

// Specifies if the ingest request should block waiting for the records to be committed.
enum CommitType {
    // The request doesn't wait for commit
    Auto = 0;
    // The request waits for the next scheduled commit to finish.
    WaitFor = 1;
    // The request forces an immediate commit after the last document in the batch and waits for
    // it to finish.
    Force = 2;
}

message IngestRequest {
    repeated DocBatch doc_batches = 1;
    CommitType commit = 2;
}

message IngestResponse {
    uint64 num_docs_for_processing = 1;
}

// Fetch messages with position strictly after `start_after`.
message FetchRequest {
    string index_id = 1;
    optional uint64 start_after = 2;
    optional uint64 num_bytes_limit = 3;
}

message FetchResponse {
    optional uint64 first_position = 1;
    DocBatch doc_batch = 2;
}

message DocBatch {
    string index_id = 1;
    bytes doc_buffer = 2;
    repeated uint32 doc_lengths = 3;
}

// Suggest to truncate the queue.
//
// This function allows the queue to remove all records up to and
// including `up_to_offset_included`.
//
// The role of this truncation is to release memory and disk space.
//
// There are no guarantees that the record will effectively be removed.
// Nothing might happen, or the truncation might be partial.
//
// In other words, truncating from a position, and fetching records starting
// earlier than this position can yield undefined result:
// the truncated records may or may not be returned.
message SuggestTruncateRequest {
    string index_id = 1;
    uint64 up_to_position_included = 2;
}

message TailRequest {
    string index_id = 1;
}

message ListQueuesRequest {
}

message ListQueuesResponse {
    repeated string queues = 1;
}


================================================
FILE: quickwit/quickwit-ingest/src/ingest_v2/broadcast/capacity_score.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::BTreeSet;

use anyhow::{Context, Result};
use bytesize::ByteSize;
use quickwit_cluster::{Cluster, ListenerHandle};
use quickwit_common::pubsub::{Event, EventBroker};
use quickwit_common::shared_consts::INGESTER_CAPACITY_SCORE_PREFIX;
use quickwit_proto::ingest::ingester::IngesterStatus;
use quickwit_proto::types::{NodeId, SourceUid};
use serde::{Deserialize, Serialize};
use tokio::task::JoinHandle;
use tracing::{info, warn};

use super::{BROADCAST_INTERVAL_PERIOD, make_key, parse_key};
use crate::OpenShardCounts;
use crate::ingest_v2::state::WeakIngesterState;

#[derive(Debug, Clone, Default, Serialize, Deserialize)]
pub struct IngesterCapacityScore {
    pub capacity_score: usize,
    pub open_shard_count: usize,
}

/// Periodically snapshots the ingester's WAL memory usage and open shard counts, computes
/// a capacity score, and broadcasts it to other nodes via Chitchat.
pub struct BroadcastIngesterCapacityScoreTask {
    cluster: Cluster,
    weak_state: WeakIngesterState,
}

impl BroadcastIngesterCapacityScoreTask {
    pub fn spawn(cluster: Cluster, weak_state: WeakIngesterState) -> JoinHandle<()> {
        let mut broadcaster = Self {
            cluster,
            weak_state,
        };
        tokio::spawn(async move { broadcaster.run().await })
    }

    async fn snapshot(&self) -> Result<Option<(usize, OpenShardCounts)>> {
        let state = self
            .weak_state
            .upgrade()
            .context("ingester state has been dropped")?;

        // lock fully asserts that the ingester is ready. There's a likelihood that this task runs
        // before the WAL is loaded, so we make sure that the ingester is ready just in case.
        if *state.status_rx.borrow() != IngesterStatus::Ready {
            return Ok(None);
        }

        let mut guard = state
            .lock_fully()
            .await
            .context("failed to acquire ingester state lock")?;

        let usage = guard.mrecordlog.resource_usage();
        let disk_used = ByteSize::b(usage.disk_used_bytes as u64);
        let memory_used = ByteSize::b(usage.memory_used_bytes as u64);
        let capacity_score = guard
            .wal_capacity_tracker
            .record_and_score(disk_used, memory_used);
        let (open_shard_counts, _) = guard.get_shard_snapshot();

        Ok(Some((capacity_score, open_shard_counts)))
    }

    async fn run(&mut self) {
        let mut interval = tokio::time::interval(BROADCAST_INTERVAL_PERIOD);
        let mut previous_sources: BTreeSet<SourceUid> = BTreeSet::new();

        loop {
            interval.tick().await;

            let (capacity_score, open_shard_counts) = match self.snapshot().await {
                Ok(Some(snapshot)) => snapshot,
                Ok(None) => continue,
                Err(error) => {
                    info!("stopping ingester capacity broadcast: {error}");
                    return;
                }
            };

            previous_sources = self
                .broadcast_capacity(capacity_score, &open_shard_counts, &previous_sources)
                .await;
        }
    }

    async fn broadcast_capacity(
        &self,
        capacity_score: usize,
        open_shard_counts: &OpenShardCounts,
        previous_sources: &BTreeSet<SourceUid>,
    ) -> BTreeSet<SourceUid> {
        let mut current_sources = BTreeSet::new();

        for (index_uid, source_id, open_shard_count) in open_shard_counts {
            let source_uid = SourceUid {
                index_uid: index_uid.clone(),
                source_id: source_id.clone(),
            };
            let key = make_key(INGESTER_CAPACITY_SCORE_PREFIX, &source_uid);
            let capacity = IngesterCapacityScore {
                capacity_score,
                open_shard_count: *open_shard_count,
            };
            let value = serde_json::to_string(&capacity)
                .expect("`IngesterCapacityScore` should be JSON serializable");
            self.cluster.set_self_key_value(key, value).await;
            current_sources.insert(source_uid);
        }

        for removed_source in previous_sources.difference(&current_sources) {
            let key = make_key(INGESTER_CAPACITY_SCORE_PREFIX, removed_source);
            self.cluster.remove_self_key(&key).await;
        }

        current_sources
    }
}

#[derive(Debug, Clone)]
pub struct IngesterCapacityScoreUpdate {
    pub node_id: NodeId,
    pub source_uid: SourceUid,
    pub capacity_score: usize,
    pub open_shard_count: usize,
}

impl Event for IngesterCapacityScoreUpdate {}

pub async fn setup_ingester_capacity_update_listener(
    cluster: Cluster,
    event_broker: EventBroker,
) -> ListenerHandle {
    cluster
        .subscribe(INGESTER_CAPACITY_SCORE_PREFIX, move |event| {
            let Some(source_uid) = parse_key(event.key) else {
                warn!("failed to parse source UID from key `{}`", event.key);
                return;
            };
            let Ok(ingester_capacity) = serde_json::from_str::<IngesterCapacityScore>(event.value)
            else {
                warn!("failed to parse ingester capacity `{}`", event.value);
                return;
            };
            let node_id: NodeId = event.node.node_id.clone().into();
            event_broker.publish(IngesterCapacityScoreUpdate {
                node_id,
                source_uid,
                capacity_score: ingester_capacity.capacity_score,
                open_shard_count: ingester_capacity.open_shard_count,
            });
        })
        .await
}

#[cfg(test)]
mod tests {
    use std::sync::Arc;
    use std::sync::atomic::{AtomicUsize, Ordering};

    use quickwit_cluster::{ChannelTransport, create_cluster_for_test};
    use quickwit_proto::types::{IndexUid, ShardId, SourceId};

    use super::*;
    use crate::ingest_v2::models::IngesterShard;
    use crate::ingest_v2::state::IngesterState;

    #[tokio::test]
    async fn test_snapshot_state_dropped() {
        let transport = ChannelTransport::default();
        let cluster = create_cluster_for_test(Vec::new(), &["indexer"], &transport, true)
            .await
            .unwrap();
        let (_temp_dir, state) = IngesterState::for_test(cluster.clone()).await;
        let weak_state = state.weak();
        drop(state);

        let task = BroadcastIngesterCapacityScoreTask {
            cluster,
            weak_state,
        };
        assert!(task.snapshot().await.is_err());
    }

    #[tokio::test]
    async fn test_broadcast_ingester_capacity() {
        let transport = ChannelTransport::default();
        let cluster = create_cluster_for_test(Vec::new(), &["indexer"], &transport, true)
            .await
            .unwrap();
        let event_broker = EventBroker::default();

        // Use 1000 bytes disk capacity so 500 used => 50% remaining, 0 delta => score = 6
        let (_temp_dir, state) =
            IngesterState::for_test_with_disk_capacity(cluster.clone(), ByteSize::b(1000)).await;
        let index_uid = IndexUid::for_test("test-index", 0);
        let mut state_guard = state.lock_partially().await.unwrap();
        let shard = IngesterShard::new_solo(
            index_uid.clone(),
            SourceId::from("test-source"),
            ShardId::from(0),
        )
        .advertisable()
        .build();
        state_guard.shards.insert(shard.queue_id(), shard);
        let (open_shard_counts, _) = state_guard.get_shard_snapshot();
        let capacity_score = state_guard
            .wal_capacity_tracker
            .record_and_score(ByteSize::b(500), ByteSize::b(0));
        drop(state_guard);

        assert_eq!(capacity_score, 6);

        let task = BroadcastIngesterCapacityScoreTask {
            cluster: cluster.clone(),
            weak_state: state.weak(),
        };

        let update_counter = Arc::new(AtomicUsize::new(0));
        let update_counter_clone = update_counter.clone();
        let index_uid_clone = index_uid.clone();
        let _sub = event_broker.subscribe(move |event: IngesterCapacityScoreUpdate| {
            update_counter_clone.fetch_add(1, Ordering::Release);
            assert_eq!(event.source_uid.index_uid, index_uid_clone);
            assert_eq!(event.source_uid.source_id, "test-source");
            assert_eq!(event.capacity_score, 6);
            assert_eq!(event.open_shard_count, 1);
        });

        let _listener =
            setup_ingester_capacity_update_listener(cluster.clone(), event_broker).await;

        let previous_sources = BTreeSet::new();
        task.broadcast_capacity(capacity_score, &open_shard_counts, &previous_sources)
            .await;
        tokio::time::sleep(BROADCAST_INTERVAL_PERIOD * 2).await;

        assert_eq!(update_counter.load(Ordering::Acquire), 1);

        let source_uid = SourceUid {
            index_uid: index_uid.clone(),
            source_id: SourceId::from("test-source"),
        };
        let key = make_key(INGESTER_CAPACITY_SCORE_PREFIX, &source_uid);
        let value = cluster.get_self_key_value(&key).await.unwrap();
        let deserialized: IngesterCapacityScore = serde_json::from_str(&value).unwrap();
        assert_eq!(deserialized.capacity_score, 6);
        assert_eq!(deserialized.open_shard_count, 1);
    }
}


================================================
FILE: quickwit/quickwit-ingest/src/ingest_v2/broadcast/local_shards.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::{BTreeMap, BTreeSet, HashMap};
use std::time::Duration;

use bytesize::ByteSize;
use quickwit_cluster::{Cluster, ListenerHandle};
use quickwit_common::pubsub::{Event, EventBroker};
use quickwit_common::ring_buffer::RingBuffer;
use quickwit_common::shared_consts::INGESTER_PRIMARY_SHARDS_PREFIX;
use quickwit_common::sorted_iter::{KeyDiff, SortedByKeyIterator};
use quickwit_common::tower::{ConstantRate, Rate};
use quickwit_proto::ingest::ShardState;
use quickwit_proto::types::{NodeId, ShardId, SourceUid};
use serde::{Deserialize, Serialize, Serializer};
use tokio::task::JoinHandle;
use tracing::{debug, warn};

use super::{BROADCAST_INTERVAL_PERIOD, make_key, parse_key};
use crate::RateMibPerSec;
use crate::ingest_v2::metrics::INGEST_V2_METRICS;
use crate::ingest_v2::state::WeakIngesterState;

const ONE_MIB: ByteSize = ByteSize::mib(1);

/// Broadcasted information about a primary shard.
#[derive(Debug, Clone, Eq, PartialEq, Ord, PartialOrd)]
pub struct ShardInfo {
    pub shard_id: ShardId,
    pub shard_state: ShardState,
    /// Shard ingestion rate in MiB/s.
    /// Short term ingestion rate. It is measured over a short period of time.
    pub short_term_ingestion_rate: RateMibPerSec,
    /// Long term ingestion rate. It is measured over a larger period of time.
    pub long_term_ingestion_rate: RateMibPerSec,
}

impl Serialize for ShardInfo {
    fn serialize<S: Serializer>(&self, serializer: S) -> Result<S::Ok, S::Error> {
        serializer.serialize_str(&format!(
            "{}:{}:{}:{}",
            self.shard_id,
            self.shard_state.as_json_str_name(),
            self.short_term_ingestion_rate.0,
            self.long_term_ingestion_rate.0,
        ))
    }
}

impl<'de> Deserialize<'de> for ShardInfo {
    fn deserialize<D>(deserializer: D) -> Result<Self, D::Error>
    where D: serde::Deserializer<'de> {
        let value = String::deserialize(deserializer)?;
        let mut parts = value.split(':');

        let shard_id: ShardId = parts
            .next()
            .ok_or_else(|| serde::de::Error::custom("invalid shard info"))?
            .into();

        let shard_state_str = parts
            .next()
            .ok_or_else(|| serde::de::Error::custom("invalid shard info"))?;
        let shard_state = ShardState::from_json_str_name(shard_state_str)
            .ok_or_else(|| serde::de::Error::custom("invalid shard state"))?;

        let short_term_ingestion_rate = parts
            .next()
            .ok_or_else(|| serde::de::Error::custom("invalid shard info"))?
            .parse::<u16>()
            .map(RateMibPerSec)
            .map_err(|_| serde::de::Error::custom("invalid shard ingestion rate"))?;

        let long_term_ingestion_rate = parts
            .next()
            .ok_or_else(|| serde::de::Error::custom("invalid shard info"))?
            .parse::<u16>()
            .map(RateMibPerSec)
            .map_err(|_| serde::de::Error::custom("invalid shard ingestion rate"))?;

        Ok(Self {
            shard_id,
            shard_state,
            short_term_ingestion_rate,
            long_term_ingestion_rate,
        })
    }
}

/// A set of primary shards belonging to the same source.
pub type ShardInfos = BTreeSet<ShardInfo>;

/// Lists ALL the primary shards hosted by a SINGLE ingester, grouped by source.
#[derive(Debug, Default, Eq, PartialEq)]
struct LocalShardsSnapshot {
    per_source_shard_infos: BTreeMap<SourceUid, ShardInfos>,
}

#[derive(Debug)]
enum ShardInfosChange<'a> {
    Updated {
        source_uid: &'a SourceUid,
        shard_infos: &'a ShardInfos,
    },
    Removed {
        source_uid: &'a SourceUid,
    },
}

impl LocalShardsSnapshot {
    pub fn diff<'a>(&'a self, other: &'a Self) -> impl Iterator<Item = ShardInfosChange<'a>> + 'a {
        self.per_source_shard_infos
            .iter()
            .diff_by_key(other.per_source_shard_infos.iter())
            .filter_map(|key_diff| match key_diff {
                KeyDiff::Added(source_uid, shard_infos) => Some(ShardInfosChange::Updated {
                    source_uid,
                    shard_infos,
                }),
                KeyDiff::Unchanged(source_uid, previous_shard_infos, new_shard_infos) => {
                    if previous_shard_infos != new_shard_infos {
                        Some(ShardInfosChange::Updated {
                            source_uid,
                            shard_infos: new_shard_infos,
                        })
                    } else {
                        None
                    }
                }
                KeyDiff::Removed(source_uid, _shard_infos) => {
                    Some(ShardInfosChange::Removed { source_uid })
                }
            })
    }
}

/// Takes a snapshot of the primary shards hosted by the ingester at regular intervals and
/// broadcasts it to other nodes via Chitchat.
pub struct BroadcastLocalShardsTask {
    cluster: Cluster,
    weak_state: WeakIngesterState,
    shard_throughput_time_series_map: ShardThroughputTimeSeriesMap,
}

const SHARD_THROUGHPUT_LONG_TERM_WINDOW_LEN: usize = 12;

#[derive(Default)]
struct ShardThroughputTimeSeriesMap {
    shard_time_series: HashMap<(SourceUid, ShardId), ShardThroughputTimeSeries>,
}

impl ShardThroughputTimeSeriesMap {
    // Records a list of shard throughputs.
    //
    // A new time series is created for each new shard_ids.
    // If a shard_id had a time series, and it is not present in the
    // `shard_throughput`, the time series will be removed.
    #[allow(clippy::mutable_key_type)]
    pub fn record_shard_throughputs(
        &mut self,
        shard_throughputs: HashMap<(SourceUid, ShardId), (ShardState, ConstantRate)>,
    ) {
        self.shard_time_series
            .retain(|key, _| shard_throughputs.contains_key(key));
        for ((source_uid, shard_id), (shard_state, throughput)) in shard_throughputs {
            let throughput_measurement = throughput.rescale(Duration::from_secs(1)).work_bytes();
            let shard_time_series = self
                .shard_time_series
                .entry((source_uid.clone(), shard_id.clone()))
                .or_default();
            shard_time_series.shard_state = shard_state;
            shard_time_series.record(throughput_measurement);
        }
    }

    pub fn get_per_source_shard_infos(&self) -> BTreeMap<SourceUid, ShardInfos> {
        let mut per_source_shard_infos: BTreeMap<SourceUid, ShardInfos> = BTreeMap::new();
        for ((source_uid, shard_id), shard_time_series) in self.shard_time_series.iter() {
            let shard_state = shard_time_series.shard_state;
            let short_term_ingestion_rate_mib_per_sec_u64: u64 =
                shard_time_series.last().as_u64().div_ceil(ONE_MIB.as_u64());
            let long_term_ingestion_rate_mib_per_sec_u64: u64 = shard_time_series
                .average()
                .as_u64()
                .div_ceil(ONE_MIB.as_u64());
            INGEST_V2_METRICS
                .shard_st_throughput_mib
                .observe(short_term_ingestion_rate_mib_per_sec_u64 as f64);
            INGEST_V2_METRICS
                .shard_lt_throughput_mib
                .observe(long_term_ingestion_rate_mib_per_sec_u64 as f64);

            let short_term_ingestion_rate =
                RateMibPerSec(short_term_ingestion_rate_mib_per_sec_u64 as u16);
            let long_term_ingestion_rate =
                RateMibPerSec(long_term_ingestion_rate_mib_per_sec_u64 as u16);
            let shard_info = ShardInfo {
                shard_id: shard_id.clone(),
                shard_state,
                short_term_ingestion_rate,
                long_term_ingestion_rate,
            };

            per_source_shard_infos
                .entry(source_uid.clone())
                .or_default()
                .insert(shard_info);
        }
        per_source_shard_infos
    }
}

#[derive(Default)]
struct ShardThroughputTimeSeries {
    shard_state: ShardState,
    throughput: RingBuffer<ByteSize, SHARD_THROUGHPUT_LONG_TERM_WINDOW_LEN>,
}

impl ShardThroughputTimeSeries {
    fn last(&self) -> ByteSize {
        self.throughput.last().unwrap_or_default()
    }

    fn average(&self) -> ByteSize {
        if self.throughput.is_empty() {
            return ByteSize::default();
        }
        let sum = self.throughput.iter().map(ByteSize::as_u64).sum::<u64>();
        ByteSize::b(sum / self.throughput.len() as u64)
    }

    fn record(&mut self, new_throughput_measurement: ByteSize) {
        self.throughput.push_back(new_throughput_measurement);
    }
}

impl BroadcastLocalShardsTask {
    pub fn spawn(cluster: Cluster, weak_state: WeakIngesterState) -> JoinHandle<()> {
        let mut broadcaster = Self {
            cluster,
            weak_state,
            shard_throughput_time_series_map: Default::default(),
        };
        tokio::spawn(async move { broadcaster.run().await })
    }

    async fn snapshot_local_shards(&mut self) -> Option<LocalShardsSnapshot> {
        let state = self.weak_state.upgrade()?;

        let Ok(mut state_guard) = state.lock_partially().await else {
            return Some(LocalShardsSnapshot::default());
        };
        #[allow(clippy::mutable_key_type)]
        let ingestion_rates: HashMap<(SourceUid, ShardId), (ShardState, ConstantRate)> =
            state_guard
                .shards
                .values_mut()
                .filter(|shard| shard.is_advertisable && !shard.is_replica())
                .map(|shard| {
                    let source_uid = SourceUid {
                        index_uid: shard.index_uid.clone(),
                        source_id: shard.source_id.clone(),
                    };
                    let shard_id = shard.shard_id.clone();
                    let shard_state = shard.shard_state;
                    let rate_meter = &mut shard.rate_meter;

                    ((source_uid, shard_id), (shard_state, rate_meter.harvest()))
                })
                .collect();

        self.shard_throughput_time_series_map
            .record_shard_throughputs(ingestion_rates);

        let per_source_shard_infos = self
            .shard_throughput_time_series_map
            .get_per_source_shard_infos();

        let mut num_open_shards = 0;
        let mut num_closed_shards = 0;

        for shard_infos in per_source_shard_infos.values() {
            for shard_info in shard_infos {
                match shard_info.shard_state {
                    ShardState::Open => num_open_shards += 1,
                    ShardState::Closed => num_closed_shards += 1,
                    ShardState::Unavailable | ShardState::Unspecified => {}
                }
            }
        }
        INGEST_V2_METRICS.open_shards.set(num_open_shards as i64);
        INGEST_V2_METRICS
            .closed_shards
            .set(num_closed_shards as i64);

        let snapshot = LocalShardsSnapshot {
            per_source_shard_infos,
        };
        Some(snapshot)
    }

    async fn broadcast_local_shards(
        &self,
        previous_snapshot: &LocalShardsSnapshot,
        new_snapshot: &LocalShardsSnapshot,
    ) {
        for change in previous_snapshot.diff(new_snapshot) {
            match change {
                ShardInfosChange::Updated {
                    source_uid,
                    shard_infos,
                } => {
                    let key = make_key(INGESTER_PRIMARY_SHARDS_PREFIX, source_uid);
                    let value = serde_json::to_string(&shard_infos)
                        .expect("`ShardInfos` should be JSON serializable");
                    self.cluster.set_self_key_value(key, value).await;
                }
                ShardInfosChange::Removed { source_uid } => {
                    let key = make_key(INGESTER_PRIMARY_SHARDS_PREFIX, source_uid);
                    self.cluster.remove_self_key(&key).await;
                }
            }
        }
    }

    async fn run(&mut self) {
        let mut interval = tokio::time::interval(BROADCAST_INTERVAL_PERIOD);
        let mut previous_snapshot = LocalShardsSnapshot::default();

        loop {
            interval.tick().await;

            let Some(new_snapshot) = self.snapshot_local_shards().await else {
                // The state has been dropped, we can stop the task.
                debug!("stopping local shards broadcast task");
                return;
            };
            self.broadcast_local_shards(&previous_snapshot, &new_snapshot)
                .await;

            previous_snapshot = new_snapshot;
        }
    }
}

#[derive(Debug, Clone)]
pub struct LocalShardsUpdate {
    pub leader_id: NodeId,
    pub source_uid: SourceUid,
    pub shard_infos: ShardInfos,
}

impl Event for LocalShardsUpdate {}

pub async fn setup_local_shards_update_listener(
    cluster: Cluster,
    event_broker: EventBroker,
) -> ListenerHandle {
    cluster
        .subscribe(INGESTER_PRIMARY_SHARDS_PREFIX, move |event| {
            let Some(source_uid) = parse_key(event.key) else {
                warn!("failed to parse source UID `{}`", event.key);
                return;
            };
            let Ok(shard_infos) = serde_json::from_str::<ShardInfos>(event.value) else {
                warn!("failed to parse shard infos `{}`", event.value);
                return;
            };
            let leader_id: NodeId = event.node.node_id.clone().into();

            let local_shards_update = LocalShardsUpdate {
                leader_id,
                source_uid,
                shard_infos,
            };
            event_broker.publish(local_shards_update);
        })
        .await
}

#[cfg(test)]
mod tests {

    use std::sync::Arc;
    use std::sync::atomic::{AtomicUsize, Ordering};

    use quickwit_cluster::{ChannelTransport, create_cluster_for_test};
    use quickwit_common::shared_consts::INGESTER_PRIMARY_SHARDS_PREFIX;
    use quickwit_proto::ingest::ShardState;
    use quickwit_proto::types::{IndexUid, NodeId, ShardId, SourceId, SourceUid};

    use super::*;
    use crate::RateMibPerSec;
    use crate::ingest_v2::models::IngesterShard;
    use crate::ingest_v2::state::IngesterState;

    #[test]
    fn test_shard_info_serde() {
        let shard_info = ShardInfo {
            shard_id: ShardId::from(1),
            shard_state: ShardState::Open,
            short_term_ingestion_rate: RateMibPerSec(42),
            long_term_ingestion_rate: RateMibPerSec(40),
        };
        let serialized = serde_json::to_string(&shard_info).unwrap();
        assert_eq!(serialized, r#""00000000000000000001:open:42:40""#);

        let deserialized = serde_json::from_str::<ShardInfo>(&serialized).unwrap();
        assert_eq!(deserialized, shard_info);
    }

    #[test]
    fn test_local_shards_snapshot_diff() {
        let previous_snapshot = LocalShardsSnapshot::default();
        let current_snapshot = LocalShardsSnapshot::default();
        let num_changes = previous_snapshot.diff(&current_snapshot).count();
        assert_eq!(num_changes, 0);

        let previous_snapshot = LocalShardsSnapshot::default();
        let index_uid = IndexUid::for_test("test-index", 0);
        let current_snapshot = LocalShardsSnapshot {
            per_source_shard_infos: vec![(
                SourceUid {
                    index_uid: index_uid.clone(),
                    source_id: SourceId::from("test-source"),
                },
                vec![ShardInfo {
                    shard_id: ShardId::from(1),
                    shard_state: ShardState::Open,
                    short_term_ingestion_rate: RateMibPerSec(42),
                    long_term_ingestion_rate: RateMibPerSec(42),
                }]
                .into_iter()
                .collect(),
            )]
            .into_iter()
            .collect(),
        };
        let changes = previous_snapshot
            .diff(&current_snapshot)
            .collect::<Vec<_>>();
        assert_eq!(changes.len(), 1);

        let ShardInfosChange::Updated {
            source_uid,
            shard_infos,
        } = &changes[0]
        else {
            panic!(
                "expected `ShardInfosChange::Updated` variant, got {:?}",
                changes[0]
            );
        };
        assert_eq!(source_uid.index_uid, index_uid);
        assert_eq!(source_uid.source_id, "test-source");
        assert_eq!(shard_infos.len(), 1);

        let num_changes = current_snapshot.diff(&current_snapshot).count();
        assert_eq!(num_changes, 0);

        let previous_snapshot = current_snapshot;
        let current_snapshot = LocalShardsSnapshot {
            per_source_shard_infos: vec![(
                SourceUid {
                    index_uid: index_uid.clone(),
                    source_id: SourceId::from("test-source"),
                },
                vec![ShardInfo {
                    shard_id: ShardId::from(1),
                    shard_state: ShardState::Closed,
                    short_term_ingestion_rate: RateMibPerSec(42),
                    long_term_ingestion_rate: RateMibPerSec(42),
                }]
                .into_iter()
                .collect(),
            )]
            .into_iter()
            .collect(),
        };
        let changes = previous_snapshot
            .diff(&current_snapshot)
            .collect::<Vec<_>>();
        assert_eq!(changes.len(), 1);

        let ShardInfosChange::Updated {
            source_uid,
            shard_infos,
        } = &changes[0]
        else {
            panic!(
                "expected `ShardInfosChange::Updated` variant, got {:?}",
                changes[0]
            );
        };
        assert_eq!(source_uid.index_uid, index_uid);
        assert_eq!(source_uid.source_id, "test-source");
        assert_eq!(shard_infos.len(), 1);

        let previous_snapshot = current_snapshot;
        let current_snapshot = LocalShardsSnapshot::default();

        let changes = previous_snapshot
            .diff(&current_snapshot)
            .collect::<Vec<_>>();
        assert_eq!(changes.len(), 1);

        let ShardInfosChange::Removed { source_uid } = &changes[0] else {
            panic!(
                "expected `ShardInfosChange::Removed` variant, got {:?}",
                changes[0]
            );
        };
        assert_eq!(source_uid.index_uid, index_uid);
        assert_eq!(source_uid.source_id, "test-source");
    }

    #[tokio::test]
    async fn test_broadcast_local_shards_task() {
        let transport = ChannelTransport::default();
        let cluster = create_cluster_for_test(Vec::new(), &["indexer"], &transport, true)
            .await
            .unwrap();
        let (_temp_dir, state) = IngesterState::for_test(cluster.clone()).await;
        let weak_state = state.weak();
        let mut task = BroadcastLocalShardsTask {
            cluster,
            weak_state,
            shard_throughput_time_series_map: Default::default(),
        };
        let previous_snapshot = task.snapshot_local_shards().await.unwrap();
        assert!(previous_snapshot.per_source_shard_infos.is_empty());

        let mut state_guard = state.lock_partially().await.unwrap();

        let index_uid = IndexUid::for_test("test-index", 0);
        let shard_00 = IngesterShard::new_solo(
            index_uid.clone(),
            SourceId::from("test-source"),
            ShardId::from(0),
        )
        .build();
        state_guard.shards.insert(shard_00.queue_id(), shard_00);

        let shard_01 = IngesterShard::new_solo(
            index_uid.clone(),
            SourceId::from("test-source"),
            ShardId::from(1),
        )
        .advertisable()
        .build();
        state_guard.shards.insert(shard_01.queue_id(), shard_01);

        let shard_02 = IngesterShard::new_replica(
            index_uid.clone(),
            SourceId::from("test-source"),
            ShardId::from(2),
            NodeId::from("test-leader"),
        )
        .advertisable()
        .build();
        state_guard.shards.insert(shard_02.queue_id(), shard_02);
        drop(state_guard);

        let new_snapshot = task.snapshot_local_shards().await.unwrap();
        assert_eq!(new_snapshot.per_source_shard_infos.len(), 1);

        task.broadcast_local_shards(&previous_snapshot, &new_snapshot)
            .await;

        tokio::time::sleep(Duration::from_millis(100)).await;

        let key = format!(
            "{INGESTER_PRIMARY_SHARDS_PREFIX}{}:{}",
            index_uid, "test-source"
        );
        task.cluster.get_self_key_value(&key).await.unwrap();

        task.broadcast_local_shards(&new_snapshot, &previous_snapshot)
            .await;

        tokio::time::sleep(Duration::from_millis(100)).await;

        let value_opt = task.cluster.get_self_key_value(&key).await;
        assert!(value_opt.is_none());
    }

    #[tokio::test]
    async fn test_local_shards_update_listener() {
        let transport = ChannelTransport::default();
        let cluster = create_cluster_for_test(Vec::new(), &["indexer"], &transport, true)
            .await
            .unwrap();
        let event_broker = EventBroker::default();

        let local_shards_update_counter = Arc::new(AtomicUsize::new(0));
        let local_shards_update_counter_clone = local_shards_update_counter.clone();
        let index_uid = IndexUid::for_test("test-index", 0);

        let index_uid_clone = index_uid.clone();
        event_broker
            .subscribe(move |event: LocalShardsUpdate| {
                local_shards_update_counter_clone.fetch_add(1, Ordering::Release);

                assert_eq!(event.source_uid.index_uid, index_uid_clone);
                assert_eq!(event.source_uid.source_id, "test-source");
                assert_eq!(event.shard_infos.len(), 1);

                let shard_info = event.shard_infos.iter().next().unwrap();
                assert_eq!(shard_info.shard_id, ShardId::from(1));
                assert_eq!(shard_info.shard_state, ShardState::Open);
                assert_eq!(shard_info.short_term_ingestion_rate, 42u16);
            })
            .forever();

        setup_local_shards_update_listener(cluster.clone(), event_broker.clone())
            .await
            .forever();

        let source_uid = SourceUid {
            index_uid: index_uid.clone(),
            source_id: SourceId::from("test-source"),
        };
        let key = make_key(INGESTER_PRIMARY_SHARDS_PREFIX, &source_uid);
        let value = serde_json::to_string(&vec![ShardInfo {
            shard_id: ShardId::from(1),
            shard_state: ShardState::Open,
            short_term_ingestion_rate: RateMibPerSec(42),
            long_term_ingestion_rate: RateMibPerSec(42),
        }])
        .unwrap();

        cluster.set_self_key_value(key, value).await;
        tokio::time::sleep(Duration::from_millis(50)).await;

        assert_eq!(local_shards_update_counter.load(Ordering::Acquire), 1);
    }

    #[test]
    fn test_shard_throughput_time_series() {
        let mut time_series = ShardThroughputTimeSeries::default();
        assert_eq!(time_series.last(), ByteSize::mb(0));
        assert_eq!(time_series.average(), ByteSize::mb(0));

        time_series.record(ByteSize::mb(2));
        assert_eq!(time_series.last(), ByteSize::mb(2));
        assert_eq!(time_series.average(), ByteSize::mb(2));

        time_series.record(ByteSize::mb(1));
        assert_eq!(time_series.last(), ByteSize::mb(1));
        assert_eq!(time_series.average(), ByteSize::kb(1500));

        time_series.record(ByteSize::mb(3));
        assert_eq!(time_series.last(), ByteSize::mb(3));
        assert_eq!(time_series.average(), ByteSize::mb(2));

        for _ in 0..SHARD_THROUGHPUT_LONG_TERM_WINDOW_LEN {
            time_series.record(ByteSize::mb(4));
            assert_eq!(time_series.last(), ByteSize::mb(4));
        }
        assert_eq!(time_series.last(), ByteSize::mb(4));
    }
}


================================================
FILE: quickwit/quickwit-ingest/src/ingest_v2/broadcast/mod.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#[allow(dead_code)]
mod capacity_score;
mod local_shards;

use std::time::Duration;

use quickwit_proto::types::SourceUid;

pub(in crate::ingest_v2) const BROADCAST_INTERVAL_PERIOD: Duration = if cfg!(test) {
    Duration::from_millis(50)
} else {
    Duration::from_secs(5)
};

pub use capacity_score::{
    BroadcastIngesterCapacityScoreTask, IngesterCapacityScoreUpdate,
    setup_ingester_capacity_update_listener,
};
pub use local_shards::{
    BroadcastLocalShardsTask, LocalShardsUpdate, ShardInfo, ShardInfos,
    setup_local_shards_update_listener,
};

fn make_key(prefix: &str, source_uid: &SourceUid) -> String {
    format!("{prefix}{}:{}", source_uid.index_uid, source_uid.source_id)
}

fn parse_key(key: &str) -> Option<SourceUid> {
    let (index_uid_str, source_id_str) = key.rsplit_once(':')?;
    Some(SourceUid {
        index_uid: index_uid_str.parse().ok()?,
        source_id: source_id_str.to_string(),
    })
}

#[cfg(test)]
mod tests {
    use quickwit_common::shared_consts::INGESTER_PRIMARY_SHARDS_PREFIX;
    use quickwit_proto::types::{IndexUid, SourceId, SourceUid};

    use super::*;

    #[test]
    fn test_make_key() {
        let source_uid = SourceUid {
            index_uid: IndexUid::for_test("test-index", 0),
            source_id: SourceId::from("test-source"),
        };
        let key = make_key(INGESTER_PRIMARY_SHARDS_PREFIX, &source_uid);
        assert_eq!(
            key,
            "ingester.primary_shards:test-index:00000000000000000000000000:test-source"
        );
    }

    #[test]
    fn test_parse_key() {
        let key = "test-index:00000000000000000000000000:test-source";
        let source_uid = parse_key(key).unwrap();
        assert_eq!(
            &source_uid.index_uid.to_string(),
            "test-index:00000000000000000000000000"
        );
        assert_eq!(source_uid.source_id, "test-source".to_string());
    }
}


================================================
FILE: quickwit/quickwit-ingest/src/ingest_v2/debouncing.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::HashMap;
use std::sync::Arc;

use quickwit_proto::control_plane::{
    GetOrCreateOpenShardsRequest, GetOrCreateOpenShardsSubrequest,
};
use quickwit_proto::ingest::ShardIds;
use quickwit_proto::types::{IndexId, SourceId};
use tokio::sync::{OwnedRwLockWriteGuard, RwLock};

#[derive(Default)]
struct Debouncer(Arc<RwLock<()>>);

impl Debouncer {
    fn acquire(&self) -> Result<PermitGuard, BarrierGuard> {
        if let Ok(permit) = self.0.clone().try_write_owned() {
            Ok(PermitGuard(permit))
        } else {
            let barrier = self.0.clone();
            Err(BarrierGuard(barrier))
        }
    }
}

#[derive(Debug)]
pub(super) struct PermitGuard(#[allow(dead_code)] OwnedRwLockWriteGuard<()>);

#[derive(Debug)]
pub(super) struct BarrierGuard(Arc<RwLock<()>>);

impl BarrierGuard {
    pub async fn wait(self) {
        let _ = self.0.read().await;
    }
}

/// Debounces [`GetOrCreateOpenShardsRequest`] requests by index and source IDs. It gives away a
/// permit to the first request and a barrier to subsequent requests.
#[derive(Default)]
pub(super) struct GetOrCreateOpenShardsRequestDebouncer {
    debouncers: HashMap<(IndexId, SourceId), Debouncer>,
}

impl GetOrCreateOpenShardsRequestDebouncer {
    pub fn acquire(
        &mut self,
        index_id: &str,
        source_id: &str,
    ) -> Result<PermitGuard, BarrierGuard> {
        let key = (index_id.to_string(), source_id.to_string());
        self.debouncers.entry(key).or_default().acquire()
    }
}

#[derive(Default)]
pub(super) struct DebouncedGetOrCreateOpenShardsRequest {
    subrequests: Vec<GetOrCreateOpenShardsSubrequest>,
    pub closed_shards: Vec<ShardIds>,
    pub unavailable_leaders: Vec<String>,
    rendezvous: Rendezvous,
}

impl DebouncedGetOrCreateOpenShardsRequest {
    pub fn is_empty(&self) -> bool {
        self.subrequests.is_empty()
    }

    pub fn take(self) -> (Option<GetOrCreateOpenShardsRequest>, Rendezvous) {
        if self.is_empty() {
            return (None, self.rendezvous);
        }
        let request = GetOrCreateOpenShardsRequest {
            subrequests: self.subrequests,
            closed_shards: self.closed_shards,
            unavailable_leaders: self.unavailable_leaders,
        };
        (Some(request), self.rendezvous)
    }

    pub fn push_subrequest(
        &mut self,
        subrequest: GetOrCreateOpenShardsSubrequest,
        permit: PermitGuard,
    ) {
        self.subrequests.push(subrequest);
        self.rendezvous.permits.push(permit);
    }

    pub fn push_barrier(&mut self, barrier: BarrierGuard) {
        self.rendezvous.barriers.push(barrier);
    }
}

#[derive(Default)]
pub(super) struct Rendezvous {
    permits: Vec<PermitGuard>,
    barriers: Vec<BarrierGuard>,
}

impl Rendezvous {
    /// Releases the permits and waits for the barriers to be lifted.
    pub async fn wait(mut self) {
        // Releasing the permits before waiting for the barriers is necessary to avoid
        // dead locks.
        self.permits.clear();

        for barrier in self.barriers {
            barrier.wait().await;
        }
    }
}

#[cfg(test)]
mod tests {
    use std::sync::atomic::{AtomicUsize, Ordering};
    use std::time::Duration;

    use super::*;

    impl Rendezvous {
        pub fn is_empty(&self) -> bool {
            self.permits.is_empty() && self.barriers.is_empty()
        }

        pub fn num_permits(&self) -> usize {
            self.permits.len()
        }

        pub fn num_barriers(&self) -> usize {
            self.barriers.len()
        }
    }

    #[tokio::test]
    async fn test_debouncer() {
        let debouncer = Debouncer::default();

        let permit = debouncer.acquire().unwrap();
        let barrier = debouncer.acquire().unwrap_err();
        drop(permit);
        barrier.wait().await;

        let permit = debouncer.acquire().unwrap();
        let barrier = debouncer.acquire().unwrap_err();
        let flag = Arc::new(AtomicUsize::new(0));

        let flag_clone = flag.clone();
        tokio::spawn(async move {
            tokio::time::sleep(Duration::from_millis(100)).await;
            flag_clone.store(1, Ordering::Release);
            drop(permit);
        });
        let flag_clone = flag.clone();
        tokio::spawn(async move {
            let _ = barrier.wait().await;
            flag_clone.store(2, Ordering::Release);
        });
        tokio::time::sleep(Duration::from_millis(200)).await;
        assert_eq!(flag.load(Ordering::Acquire), 2);
    }

    #[test]
    fn test_get_or_create_open_shards_request_debouncer() {
        let mut debouncer = GetOrCreateOpenShardsRequestDebouncer::default();

        let _permit_foo: PermitGuard = debouncer.acquire("test-index", "test-source-foo").unwrap();

        let _barrier = debouncer
            .acquire("test-index", "test-source-foo")
            .unwrap_err();

        let _permit_bar: PermitGuard = debouncer.acquire("test-index", "test-source-bar").unwrap();
    }

    #[tokio::test]
    async fn test_debounced_get_or_create_open_shards_request() {
        let debounced_request = DebouncedGetOrCreateOpenShardsRequest::default();
        assert!(debounced_request.is_empty());

        let (request_opt, rendezvous) = debounced_request.take();
        assert!(request_opt.is_none());
        assert!(rendezvous.is_empty());

        let mut debouncer = GetOrCreateOpenShardsRequestDebouncer::default();
        let mut debounced_request = DebouncedGetOrCreateOpenShardsRequest::default();

        let permit = debouncer.acquire("test-index", "test-source-foo").unwrap();
        debounced_request.push_subrequest(
            GetOrCreateOpenShardsSubrequest {
                index_id: "test-index".to_string(),
                source_id: "test-source-foo".to_string(),
                ..Default::default()
            },
            permit,
        );

        let barrier = debouncer
            .acquire("test-index", "test-source-foo")
            .unwrap_err();
        debounced_request.push_barrier(barrier);

        let (request_opt, rendezvous) = debounced_request.take();
        let request = request_opt.unwrap();

        assert_eq!(request.subrequests.len(), 1);
        assert_eq!(rendezvous.num_permits(), 1);
        assert_eq!(rendezvous.num_barriers(), 1);
    }
}


================================================
FILE: quickwit/quickwit-ingest/src/ingest_v2/doc_mapper.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::hash_map::Entry;
use std::collections::{HashMap, HashSet};
use std::sync::{Arc, Weak};

use once_cell::sync::OnceCell;
use quickwit_common::rate_limited_error;
use quickwit_common::thread_pool::run_cpu_intensive;
use quickwit_config::{DocMapping, SearchSettings, build_doc_mapper};
use quickwit_doc_mapper::DocMapper;
use quickwit_proto::ingest::{
    DocBatchV2, IngestV2Error, IngestV2Result, ParseFailure, ParseFailureReason,
};
use quickwit_proto::types::{DocMappingUid, DocUid};
use serde_json_borrow::Value as JsonValue;
use tracing::info;

use crate::DocBatchV2Builder;

/// Attempts to get the doc mapper identified by the given doc mapping UID `doc_mapping_uid` from
/// the `doc_mappers` cache. If it is not found, it is built from the specified JSON doc mapping
/// `doc_mapping_json` and inserted into the cache before being returned.
pub(super) fn get_or_try_build_doc_mapper(
    doc_mappers: &mut HashMap<DocMappingUid, Weak<DocMapper>>,
    doc_mapping_uid: DocMappingUid,
    doc_mapping_json: &str,
) -> IngestV2Result<Arc<DocMapper>> {
    if let Entry::Occupied(occupied) = doc_mappers.entry(doc_mapping_uid) {
        if let Some(doc_mapper) = occupied.get().upgrade() {
            return Ok(doc_mapper);
        }
        occupied.remove();
    }
    let doc_mapper = try_build_doc_mapper(doc_mapping_json)?;

    if doc_mapper.doc_mapping_uid() != doc_mapping_uid {
        let message = format!(
            "doc mapping UID mismatch: expected `{doc_mapping_uid}`, got `{}`",
            doc_mapper.doc_mapping_uid()
        );
        return Err(IngestV2Error::Internal(message));
    }
    doc_mappers.insert(doc_mapping_uid, Arc::downgrade(&doc_mapper));
    info!("inserted doc mapper `{doc_mapping_uid}` into cache`");

    Ok(doc_mapper)
}

/// Attempts to build a doc mapper from the specified JSON doc mapping `doc_mapping_json`.
pub(super) fn try_build_doc_mapper(doc_mapping_json: &str) -> IngestV2Result<Arc<DocMapper>> {
    let doc_mapping: DocMapping = serde_json::from_str(doc_mapping_json).map_err(|error| {
        IngestV2Error::Internal(format!("failed to parse doc mapping: {error}"))
    })?;
    let search_settings = SearchSettings::default();
    let doc_mapper = build_doc_mapper(&doc_mapping, &search_settings)
        .map_err(|error| IngestV2Error::Internal(format!("failed to build doc mapper: {error}")))?;
    Ok(doc_mapper)
}

fn validate_document(
    doc_mapper: &DocMapper,
    doc_bytes: &[u8],
) -> Result<(), (ParseFailureReason, String)> {
    let Ok(json_doc) = serde_json::from_slice::<serde_json_borrow::Value>(doc_bytes) else {
        return Err((
            ParseFailureReason::InvalidJson,
            "failed to parse JSON document".to_string(),
        ));
    };
    let JsonValue::Object(json_obj) = json_doc else {
        return Err((
            ParseFailureReason::InvalidJson,
            "JSON document is not an object".to_string(),
        ));
    };
    if let Err(error) = doc_mapper.validate_json_obj(&json_obj) {
        rate_limited_error!(
            limit_per_min = 6,
            "failed to validate JSON document: {}",
            error
        );
        return Err((ParseFailureReason::InvalidSchema, error.to_string()));
    }
    Ok(())
}

/// Validates a batch of docs.
///
/// Returns a batch of valid docs and the list of errors.
fn validate_doc_batch_impl(
    doc_batch: DocBatchV2,
    doc_mapper: &DocMapper,
) -> (DocBatchV2, Vec<ParseFailure>) {
    let mut parse_failures: Vec<ParseFailure> = Vec::new();
    let mut invalid_doc_ids: HashSet<DocUid> = HashSet::default();
    for (doc_uid, doc_bytes) in doc_batch.docs() {
        if let Err((reason, message)) = validate_document(doc_mapper, &doc_bytes) {
            let parse_failure = ParseFailure {
                doc_uid: Some(doc_uid),
                reason: reason as i32,
                message,
            };
            invalid_doc_ids.insert(doc_uid);
            parse_failures.push(parse_failure);
        }
    }
    if invalid_doc_ids.is_empty() {
        // All docs are valid! We don't need to build a valid doc batch.
        return (doc_batch, parse_failures);
    }
    let mut valid_doc_batch_builder = DocBatchV2Builder::default();
    for (doc_uid, doc_bytes) in doc_batch.docs() {
        if !invalid_doc_ids.contains(&doc_uid) {
            valid_doc_batch_builder.add_doc(doc_uid, &doc_bytes);
        }
    }
    let valid_doc_batch: DocBatchV2 = valid_doc_batch_builder.build().unwrap_or_default();
    assert_eq!(
        valid_doc_batch.num_docs() + parse_failures.len(),
        doc_batch.num_docs()
    );
    (valid_doc_batch, parse_failures)
}

fn is_document_validation_enabled() -> bool {
    static IS_DOCUMENT_VALIDATION_ENABLED: OnceCell<bool> = OnceCell::new();
    *IS_DOCUMENT_VALIDATION_ENABLED.get_or_init(|| {
        !quickwit_common::get_bool_from_env("QW_DISABLE_DOCUMENT_VALIDATION", false)
    })
}

/// Parses the JSON documents contained in the batch and applies the doc mapper. Returns the
/// original batch and a list of parse failures.
pub(super) async fn validate_doc_batch(
    doc_batch: DocBatchV2,
    doc_mapper: Arc<DocMapper>,
) -> IngestV2Result<(DocBatchV2, Vec<ParseFailure>)> {
    if is_document_validation_enabled() {
        run_cpu_intensive(move || validate_doc_batch_impl(doc_batch, &doc_mapper))
            .await
            .map_err(|error| {
                let message = format!("failed to validate documents: {error}");
                IngestV2Error::Internal(message)
            })
    } else {
        Ok((doc_batch, Vec::new()))
    }
}

#[cfg(test)]
mod tests {
    use quickwit_proto::types::DocUid;

    use super::*;

    #[test]
    fn test_get_or_try_build_doc_mapper() {
        let mut doc_mappers: HashMap<DocMappingUid, Weak<DocMapper>> = HashMap::new();

        let doc_mapping_uid = DocMappingUid::random();
        let doc_mapping_json = r#"{
            "field_mappings": [{
                "name": "message",
                "type": "text"
            }]
        }"#;
        let error =
            get_or_try_build_doc_mapper(&mut doc_mappers, doc_mapping_uid, doc_mapping_json)
                .unwrap_err();
        assert!(
            matches!(error, IngestV2Error::Internal(message) if message.contains("doc mapping UID mismatch"))
        );

        let doc_mapping_json = format!(
            r#"{{
                "doc_mapping_uid": "{doc_mapping_uid}",
                "field_mappings": [{{
                        "name": "message",
                        "type": "text"
                }}]
            }}"#
        );
        let doc_mapper =
            get_or_try_build_doc_mapper(&mut doc_mappers, doc_mapping_uid, &doc_mapping_json)
                .unwrap();
        assert_eq!(doc_mappers.len(), 1);
        assert_eq!(doc_mapper.doc_mapping_uid(), doc_mapping_uid);
        assert_eq!(Arc::strong_count(&doc_mapper), 1);

        drop(doc_mapper);
        assert!(
            doc_mappers
                .get(&doc_mapping_uid)
                .unwrap()
                .upgrade()
                .is_none()
        );

        let error = get_or_try_build_doc_mapper(&mut doc_mappers, doc_mapping_uid, "").unwrap_err();
        assert!(
            matches!(error, IngestV2Error::Internal(message) if message.contains("parse doc mapping"))
        );
        assert_eq!(doc_mappers.len(), 0);
    }

    #[test]
    fn test_try_build_doc_mapper() {
        let error = try_build_doc_mapper("").unwrap_err();
        assert!(
            matches!(error, IngestV2Error::Internal(message) if message.contains("parse doc mapping"))
        );

        let error = try_build_doc_mapper(r#"{"timestamp_field": ".timestamp"}"#).unwrap_err();
        assert!(
            matches!(error, IngestV2Error::Internal(message) if message.contains("build doc mapper"))
        );

        let doc_mapping_json = r#"{
            "mode": "strict",
            "field_mappings": [{
                "name": "message",
                "type": "text"
        }]}"#;
        let doc_mapper = try_build_doc_mapper(doc_mapping_json).unwrap();
        let schema = doc_mapper.schema();
        assert_eq!(schema.num_fields(), 2);

        let contains_message_field = schema
            .fields()
            .map(|(_field, entry)| entry.name())
            .any(|field_name| field_name == "message");
        assert!(contains_message_field);
    }

    #[test]
    fn test_validate_doc_batch() {
        let doc_mapping_json = r#"{
            "mode": "strict",
            "field_mappings": [
                {
                    "name": "doc",
                    "type": "text"
                }
            ]
        }"#;
        let doc_mapper = try_build_doc_mapper(doc_mapping_json).unwrap();
        let doc_batch = DocBatchV2::default();

        let (_, parse_failures) = validate_doc_batch_impl(doc_batch, &doc_mapper);
        assert_eq!(parse_failures.len(), 0);

        let doc_batch =
            DocBatchV2::for_test(["", "[]", r#"{"foo": "bar"}"#, r#"{"doc": "test-doc-000"}"#]);
        let (doc_batch, parse_failures) = validate_doc_batch_impl(doc_batch, &doc_mapper);
        assert_eq!(parse_failures.len(), 3);

        let parse_failure_0 = &parse_failures[0];
        assert_eq!(parse_failure_0.doc_uid(), DocUid::for_test(0));
        assert_eq!(parse_failure_0.reason(), ParseFailureReason::InvalidJson);
        assert!(parse_failure_0.message.contains("parse JSON document"));

        let parse_failure_1 = &parse_failures[1];
        assert_eq!(parse_failure_1.doc_uid(), DocUid::for_test(1));
        assert_eq!(parse_failure_1.reason(), ParseFailureReason::InvalidJson);
        assert!(parse_failure_1.message.contains("not an object"));

        let parse_failure_2 = &parse_failures[2];
        assert_eq!(parse_failure_2.doc_uid(), DocUid::for_test(2));
        assert_eq!(parse_failure_2.reason(), ParseFailureReason::InvalidSchema);
        assert!(parse_failure_2.message.contains("not declared"));

        assert_eq!(doc_batch.num_docs(), 1);
        assert_eq!(doc_batch.doc_uids[0], DocUid::for_test(3));
        let (valid_doc_uid, valid_doc_bytes) = doc_batch.docs().next().unwrap();
        assert_eq!(valid_doc_uid, DocUid::for_test(3));
        assert_eq!(&valid_doc_bytes, r#"{"doc": "test-doc-000"}"#.as_bytes());
    }
}


================================================
FILE: quickwit/quickwit-ingest/src/ingest_v2/fetch.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::borrow::Borrow;
use std::collections::HashMap;
use std::collections::hash_map::Entry;
use std::fmt;
use std::sync::Arc;

use bytes::{BufMut, BytesMut};
use bytesize::ByteSize;
use futures::StreamExt;
use mrecordlog::Record;
use quickwit_common::metrics::MEMORY_METRICS;
use quickwit_common::retry::RetryParams;
use quickwit_common::stream_utils::{InFlightValue, TrackedSender};
use quickwit_common::{ServiceStream, spawn_named_task};
use quickwit_proto::ingest::ingester::{
    FetchEof, FetchMessage, FetchPayload, IngesterService, OpenFetchStreamRequest, fetch_message,
};
use quickwit_proto::ingest::{IngestV2Error, IngestV2Result, MRecordBatch};
use quickwit_proto::types::{IndexUid, NodeId, Position, QueueId, ShardId, SourceId, queue_id};
use tokio::sync::{RwLock, mpsc, watch};
use tokio::task::JoinHandle;
use tracing::{debug, error, warn};

use super::models::ShardStatus;
use crate::mrecordlog_async::MultiRecordLogAsync;
use crate::{ClientId, IngesterPool, with_lock_metrics};

/// A fetch stream task is responsible for waiting and pushing new records written to a shard's
/// record log into a channel named `fetch_message_tx`.
pub(super) struct FetchStreamTask {
    /// Uniquely identifies the consumer of the fetch task for logging and debugging purposes.
    client_id: ClientId,
    index_uid: IndexUid,
    source_id: SourceId,
    shard_id: ShardId,
    queue_id: QueueId,
    /// The position of the next record fetched.
    from_position_inclusive: u64,
    mrecordlog: Arc<RwLock<Option<MultiRecordLogAsync>>>,
    fetch_message_tx: TrackedSender<IngestV2Result<FetchMessage>>,
    /// This channel notifies the fetch task when new records are available. This way the fetch
    /// task does not need to grab the lock and poll the mrecordlog queue unnecessarily.
    shard_status_rx: watch::Receiver<ShardStatus>,
    batch_num_bytes: usize,
}

impl fmt::Debug for FetchStreamTask {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        f.debug_struct("FetchStreamTask")
            .field("client_id", &self.client_id)
            .field("index_uid", &self.index_uid)
            .field("source_id", &self.source_id)
            .field("shard_id", &self.shard_id)
            .finish()
    }
}

impl FetchStreamTask {
    pub fn spawn(
        open_fetch_stream_request: OpenFetchStreamRequest,
        mrecordlog: Arc<RwLock<Option<MultiRecordLogAsync>>>,
        shard_status_rx: watch::Receiver<ShardStatus>,
        batch_num_bytes: usize,
    ) -> (ServiceStream<IngestV2Result<FetchMessage>>, JoinHandle<()>) {
        let from_position_inclusive = open_fetch_stream_request
            .from_position_exclusive()
            .as_u64()
            .map(|offset| offset + 1)
            .unwrap_or_default();
        let (fetch_message_tx, fetch_stream) =
            ServiceStream::new_bounded_with_gauge(3, &MEMORY_METRICS.in_flight.fetch_stream);
        let mut fetch_task = Self {
            shard_id: open_fetch_stream_request.shard_id().clone(),
            queue_id: open_fetch_stream_request.queue_id(),
            index_uid: open_fetch_stream_request.index_uid().clone(),
            client_id: open_fetch_stream_request.client_id,
            source_id: open_fetch_stream_request.source_id,
            from_position_inclusive,
            mrecordlog,
            fetch_message_tx,
            shard_status_rx,
            batch_num_bytes,
        };
        let future = async move { fetch_task.run().await };
        let fetch_task_handle: JoinHandle<()> = spawn_named_task(future, "fetch_task");
        (fetch_stream, fetch_task_handle)
    }

    /// Runs the fetch task. It waits for new records in the log and pushes them into the fetch
    /// response channel until it reaches the end of the shard marked by an EOF record.
    async fn run(&mut self) {
        debug!(
            client_id=%self.client_id,
            index_uid=%self.index_uid,
            source_id=%self.source_id,
            shard_id=%self.shard_id,
            from_position_inclusive=%self.from_position_inclusive,
            "spawning fetch task"
        );
        let mut has_drained_queue = false;
        let mut to_position_inclusive = if self.from_position_inclusive == 0 {
            Position::Beginning
        } else {
            Position::offset(self.from_position_inclusive - 1)
        };

        loop {
            if has_drained_queue && self.shard_status_rx.changed().await.is_err() {
                // The shard was dropped.
                break;
            }
            has_drained_queue = true;

            let mut mrecord_buffer = BytesMut::with_capacity(self.batch_num_bytes);
            let mut mrecord_lengths = Vec::new();

            let mrecordlog_guard =
                with_lock_metrics!(self.mrecordlog.read().await, "fetch", "read");

            let Ok(mrecords) = mrecordlog_guard
                .as_ref()
                .expect("mrecordlog should be initialized")
                .range(&self.queue_id, self.from_position_inclusive..)
            else {
                // The queue was dropped.
                break;
            };
            for Record { payload, .. } in mrecords {
                // Accept at least one message
                if !mrecord_buffer.is_empty()
                    && (mrecord_buffer.len() + payload.len() > mrecord_buffer.capacity())
                {
                    has_drained_queue = false;
                    break;
                }
                mrecord_buffer.put(payload.borrow());
                mrecord_lengths.push(payload.len() as u32);
            }
            // Drop the lock while we send the message.
            drop(mrecordlog_guard);

            if !mrecord_lengths.is_empty() {
                let from_position_exclusive = if self.from_position_inclusive == 0 {
                    Position::Beginning
                } else {
                    Position::offset(self.from_position_inclusive - 1)
                };
                self.from_position_inclusive += mrecord_lengths.len() as u64;

                to_position_inclusive = Position::offset(self.from_position_inclusive - 1);

                let mrecord_batch = MRecordBatch {
                    mrecord_buffer: mrecord_buffer.freeze(),
                    mrecord_lengths,
                };
                let batch_size = mrecord_batch.estimate_size();
                let fetch_payload = FetchPayload {
                    index_uid: Some(self.index_uid.clone()),
                    source_id: self.source_id.clone(),
                    shard_id: Some(self.shard_id.clone()),
                    mrecord_batch: Some(mrecord_batch),
                    from_position_exclusive: Some(from_position_exclusive),
                    to_position_inclusive: Some(to_position_inclusive.clone()),
                };
                let fetch_message = FetchMessage::new_payload(fetch_payload);

                if self
                    .fetch_message_tx
                    .send(Ok(fetch_message), batch_size)
                    .await
                    .is_err()
                {
                    // The consumer was dropped.
                    return;
                }
            }
            if has_drained_queue {
                let has_reached_eof = {
                    let shard_status = self.shard_status_rx.borrow();
                    let shard_state = &shard_status.0;
                    let replication_position = &shard_status.1;
                    shard_state.is_closed() && to_position_inclusive >= *replication_position
                };
                if has_reached_eof {
                    debug!(
                        client_id=%self.client_id,
                        index_uid=%self.index_uid,
                        source_id=%self.source_id,
                        shard_id=%self.shard_id,
                        to_position_inclusive=%self.from_position_inclusive - 1,
                        "fetch stream reached end of shard"
                    );
                    let eof_position = to_position_inclusive.as_eof();

                    let fetch_eof = FetchEof {
                        index_uid: Some(self.index_uid.clone()),
                        source_id: self.source_id.clone(),
                        shard_id: Some(self.shard_id.clone()),
                        eof_position: Some(eof_position),
                    };
                    let fetch_message = FetchMessage::new_eof(fetch_eof);
                    let _ = self
                        .fetch_message_tx
                        .send(Ok(fetch_message), ByteSize(0))
                        .await;
                    return;
                }
            }
        }
        if !to_position_inclusive.is_eof() {
            // This can happen if we delete the associated source or index.
            warn!(
                client_id=%self.client_id,
                index_uid=%self.index_uid,
                source_id=%self.source_id,
                shard_id=%self.shard_id,
                "fetch stream ended before reaching end of shard"
            );
            let _ = self
                .fetch_message_tx
                .send(
                    Err(IngestV2Error::Internal(
                        "fetch stream ended before reaching end of shard".to_string(),
                    )),
                    ByteSize(0),
                )
                .await;
        }
    }
}

#[derive(Debug)]
pub struct FetchStreamError {
    pub index_uid: IndexUid,
    pub source_id: SourceId,
    pub shard_id: ShardId,
    pub ingest_error: IngestV2Error,
}

/// Combines multiple fetch streams originating from different ingesters into a single stream. It
/// tolerates the failure of ingesters and automatically fails over to replica shards.
pub struct MultiFetchStream {
    self_node_id: NodeId,
    client_id: ClientId,
    ingester_pool: IngesterPool,
    retry_params: RetryParams,
    fetch_task_handles: HashMap<QueueId, JoinHandle<()>>,
    fetch_message_rx: mpsc::Receiver<Result<InFlightValue<FetchMessage>, FetchStreamError>>,
    fetch_message_tx: mpsc::Sender<Result<InFlightValue<FetchMessage>, FetchStreamError>>,
}

impl MultiFetchStream {
    pub fn new(
        self_node_id: NodeId,
        client_id: ClientId,
        ingester_pool: IngesterPool,
        retry_params: RetryParams,
    ) -> Self {
        let (fetch_message_tx, fetch_message_rx) = mpsc::channel(3);
        Self {
            self_node_id,
            client_id,
            ingester_pool,
            retry_params,
            fetch_task_handles: HashMap::new(),
            fetch_message_rx,
            fetch_message_tx,
        }
    }

    #[cfg(any(test, feature = "testsuite"))]
    pub fn fetch_message_tx(
        &self,
    ) -> mpsc::Sender<Result<InFlightValue<FetchMessage>, FetchStreamError>> {
        self.fetch_message_tx.clone()
    }

    /// Subscribes to a shard and fails over to the replica if an error occurs.
    #[allow(clippy::too_many_arguments)]
    pub async fn subscribe(
        &mut self,
        leader_id: NodeId,
        follower_id_opt: Option<NodeId>,
        index_uid: IndexUid,
        source_id: SourceId,
        shard_id: ShardId,
        from_position_exclusive: Position,
    ) -> IngestV2Result<()> {
        let queue_id = queue_id(&index_uid, &source_id, &shard_id);
        let entry = self.fetch_task_handles.entry(queue_id.clone());

        if let Entry::Occupied(_) = entry {
            return Err(IngestV2Error::Internal(format!(
                "stream has already subscribed to shard `{queue_id}`"
            )));
        }
        let (preferred_ingester_id, failover_ingester_id_opt) =
            select_preferred_and_failover_ingesters(&self.self_node_id, leader_id, follower_id_opt);

        let mut ingester_ids = Vec::with_capacity(1 + failover_ingester_id_opt.is_some() as usize);
        ingester_ids.push(preferred_ingester_id);

        if let Some(failover_ingester_id) = failover_ingester_id_opt {
            ingester_ids.push(failover_ingester_id);
        }
        let fetch_stream_future = retrying_fetch_stream(
            self.client_id.clone(),
            index_uid,
            source_id,
            shard_id,
            from_position_exclusive,
            ingester_ids,
            self.ingester_pool.clone(),
            self.retry_params,
            self.fetch_message_tx.clone(),
        );
        let fetch_task_handle = spawn_named_task(fetch_stream_future, "fetch_stream");
        self.fetch_task_handles.insert(queue_id, fetch_task_handle);
        Ok(())
    }

    pub fn unsubscribe(
        &mut self,
        index_uid: &IndexUid,
        source_id: &str,
        shard_id: ShardId,
    ) -> IngestV2Result<()> {
        let queue_id = queue_id(index_uid, source_id, &shard_id);

        if let Some(fetch_stream_handle) = self.fetch_task_handles.remove(&queue_id) {
            fetch_stream_handle.abort();
        }
        Ok(())
    }

    /// Returns the next fetch response. This method blocks until a response is available.
    ///
    /// # Cancel safety
    ///
    /// This method is cancel safe.
    pub async fn next(&mut self) -> Result<FetchMessage, FetchStreamError> {
        // Because we always hold a sender and never call `close()` on the receiver, the channel is
        // always open.
        self.fetch_message_rx
            .recv()
            .await
            .expect("channel should be open")
            .map(|value: InFlightValue<FetchMessage>| value.into_inner())
    }

    /// Resets the stream by aborting all the active fetch tasks and dropping all queued responses.
    ///
    /// The borrow checker guarantees that both `next()` and `reset()` cannot be called
    /// simultaneously because they are both `&mut self` methods.
    pub fn reset(&mut self) {
        for (_queue_id, fetch_stream_handle) in self.fetch_task_handles.drain() {
            fetch_stream_handle.abort();
        }
        let (fetch_message_tx, fetch_message_rx) = mpsc::channel(3);
        self.fetch_message_tx = fetch_message_tx;
        self.fetch_message_rx = fetch_message_rx;
    }
}

impl Drop for MultiFetchStream {
    fn drop(&mut self) {
        self.reset();
    }
}

/// Chooses the ingester to stream records from, preferring "local" ingesters.
fn select_preferred_and_failover_ingesters(
    self_node_id: &NodeId,
    leader_id: NodeId,
    follower_id_opt: Option<NodeId>,
) -> (NodeId, Option<NodeId>) {
    // The replication factor is 1 and there is no follower.
    let Some(follower_id) = follower_id_opt else {
        return (leader_id, None);
    };
    if &leader_id == self_node_id {
        (leader_id, Some(follower_id))
    } else if &follower_id == self_node_id {
        (follower_id, Some(leader_id))
    } else if rand::random::<bool>() {
        (leader_id, Some(follower_id))
    } else {
        (follower_id, Some(leader_id))
    }
}

/// Performs multiple fault-tolerant fetch stream attempts until the stream reaches
/// the end of the shard.
#[allow(clippy::too_many_arguments)]
async fn retrying_fetch_stream(
    client_id: String,
    index_uid: IndexUid,
    source_id: SourceId,
    shard_id: ShardId,
    mut from_position_exclusive: Position,
    ingester_ids: Vec<NodeId>,
    ingester_pool: IngesterPool,
    retry_params: RetryParams,
    fetch_message_tx: mpsc::Sender<Result<InFlightValue<FetchMessage>, FetchStreamError>>,
) {
    for num_attempts in 1..=retry_params.max_attempts {
        fault_tolerant_fetch_stream(
            client_id.clone(),
            index_uid.clone(),
            source_id.clone(),
            shard_id.clone(),
            &mut from_position_exclusive,
            &ingester_ids,
            ingester_pool.clone(),
            fetch_message_tx.clone(),
        )
        .await;

        if from_position_exclusive.is_eof() {
            break;
        }
        let delay = retry_params.compute_delay(num_attempts);
        tokio::time::sleep(delay).await;
    }
}

/// Streams records from the preferred ingester and fails over to the other ingester if an error
/// occurs.
#[allow(clippy::too_many_arguments)]
async fn fault_tolerant_fetch_stream(
    client_id: String,
    index_uid: IndexUid,
    source_id: SourceId,
    shard_id: ShardId,
    from_position_exclusive: &mut Position,
    ingester_ids: &[NodeId],
    ingester_pool: IngesterPool,
    fetch_message_tx: mpsc::Sender<Result<InFlightValue<FetchMessage>, FetchStreamError>>,
) {
    // TODO: We can probably simplify this code by breaking it into smaller functions.
    'outer: for (ingester_idx, ingester_id) in ingester_ids.iter().enumerate() {
        let failover_ingester_id_opt = ingester_ids.get(ingester_idx + 1);

        let Some(ingester) = ingester_pool.get(ingester_id) else {
            if let Some(failover_ingester_id) = failover_ingester_id_opt {
                warn!(
                    client_id=%client_id,
                    index_uid=%index_uid,
                    source_id=%source_id,
                    shard_id=%shard_id,
                    "ingester `{ingester_id}` is unavailable: failing over to ingester `{failover_ingester_id}`"
                );
            } else {
                error!(
                    client_id=%client_id,
                    index_uid=%index_uid,
                    source_id=%source_id,
                    shard_id=%shard_id,
                    "ingester `{ingester_id}` is unavailable: closing fetch stream"
                );
                let message =
                    format!("ingester `{ingester_id}` is unavailable: closing fetch stream");
                let ingest_error = IngestV2Error::Unavailable(message);
                // Attempt to send the error to the consumer in a best-effort manner before
                // returning.
                let fetch_stream_error = FetchStreamError {
                    index_uid,
                    source_id,
                    shard_id,
                    ingest_error,
                };
                let _ = fetch_message_tx.send(Err(fetch_stream_error)).await;
                return;
            }
            continue;
        };
        let open_fetch_stream_request = OpenFetchStreamRequest {
            client_id: client_id.clone(),
            index_uid: index_uid.clone().into(),
            source_id: source_id.clone(),
            shard_id: Some(shard_id.clone()),
            from_position_exclusive: Some(from_position_exclusive.clone()),
        };
        let mut fetch_stream = match ingester
            .client
            .open_fetch_stream(open_fetch_stream_request)
            .await
        {
            Ok(fetch_stream) => fetch_stream,
            Err(not_found_error @ IngestV2Error::ShardNotFound { .. }) => {
                error!(
                    client_id=%client_id,
                    index_uid=%index_uid,
                    source_id=%source_id,
                    shard_id=%shard_id,
                    "failed to open fetch stream from ingester `{ingester_id}`: shard not found"
                );
                let fetch_stream_error = FetchStreamError {
                    index_uid,
                    source_id,
                    shard_id,
                    ingest_error: not_found_error,
                };
                let _ = fetch_message_tx.send(Err(fetch_stream_error)).await;
                from_position_exclusive.to_eof();
                return;
            }
            Err(other_ingest_error) => {
                if let Some(failover_ingester_id) = failover_ingester_id_opt {
                    warn!(
                        client_id=%client_id,
                        index_uid=%index_uid,
                        source_id=%source_id,
                        shard_id=%shard_id,
                        error=%other_ingest_error,
                        "failed to open fetch stream from ingester `{ingester_id}`: failing over to ingester `{failover_ingester_id}`"
                    );
                } else {
                    error!(
                        client_id=%client_id,
                        index_uid=%index_uid,
                        source_id=%source_id,
                        shard_id=%shard_id,
                        error=%other_ingest_error,
                        "failed to open fetch stream from ingester `{ingester_id}`: closing fetch stream"
                    );
                    let fetch_stream_error = FetchStreamError {
                        index_uid,
                        source_id,
                        shard_id,
                        ingest_error: other_ingest_error,
                    };
                    let _ = fetch_message_tx.send(Err(fetch_stream_error)).await;
                    return;
                }
                continue;
            }
        };
        while let Some(fetch_message_result) = fetch_stream.next().await {
            match fetch_message_result {
                Ok(fetch_message) => match &fetch_message.message {
                    Some(fetch_message::Message::Payload(fetch_payload)) => {
                        let batch_size = fetch_payload.estimate_size();
                        let to_position_inclusive = fetch_payload.to_position_inclusive();
                        let in_flight_value = InFlightValue::new(
                            fetch_message,
                            batch_size,
                            &MEMORY_METRICS.in_flight.multi_fetch_stream,
                        );
                        if fetch_message_tx.send(Ok(in_flight_value)).await.is_err() {
                            // The consumer was dropped.
                            return;
                        }
                        *from_position_exclusive = to_position_inclusive;
                    }
                    Some(fetch_message::Message::Eof(fetch_eof)) => {
                        let eof_position = fetch_eof.eof_position();
                        let in_flight_value = InFlightValue::new(
                            fetch_message,
                            ByteSize(0),
                            &MEMORY_METRICS.in_flight.multi_fetch_stream,
                        );
                        // We ignore the send error if the consumer was dropped because we're going
                        // to return anyway.
                        let _ = fetch_message_tx.send(Ok(in_flight_value)).await;

                        *from_position_exclusive = eof_position;
                        return;
                    }
                    None => {
                        warn!("received empty fetch message");
                        continue;
                    }
                },
                Err(ingest_error) => {
                    if let Some(failover_ingester_id) = failover_ingester_id_opt {
                        warn!(
                            client_id=%client_id,
                            index_uid=%index_uid,
                            source_id=%source_id,
                            shard_id=%shard_id,
                            error=%ingest_error,
                            "failed to fetch records from ingester `{ingester_id}`: failing over to ingester `{failover_ingester_id}`"
                        );
                    } else {
                        error!(
                            client_id=%client_id,
                            index_uid=%index_uid,
                            source_id=%source_id,
                            shard_id=%shard_id,
                            error=%ingest_error,
                            "failed to fetch records from ingester `{ingester_id}`: closing fetch stream"
                        );
                        let fetch_stream_error = FetchStreamError {
                            index_uid,
                            source_id,
                            shard_id,
                            ingest_error,
                        };
                        let _ = fetch_message_tx.send(Err(fetch_stream_error)).await;
                        return;
                    }
                    continue 'outer;
                }
            }
        }
    }
}

#[cfg(test)]
pub(super) mod tests {
    use std::time::Duration;

    use bytes::Bytes;
    use quickwit_proto::ingest::ShardState;
    use quickwit_proto::ingest::ingester::{IngesterServiceClient, MockIngesterService};
    use quickwit_proto::types::queue_id;
    use tokio::time::timeout;

    use super::*;
    use crate::{IngesterPoolEntry, MRecord};

    pub fn into_fetch_payload(fetch_message: FetchMessage) -> FetchPayload {
        match fetch_message.message.unwrap() {
            fetch_message::Message::Payload(fetch_payload) => fetch_payload,
            other => panic!("expected fetch payload, got `{other:?}`"),
        }
    }

    pub fn into_fetch_eof(fetch_message: FetchMessage) -> FetchEof {
        match fetch_message.message.unwrap() {
            fetch_message::Message::Eof(fetch_eof) => fetch_eof,
            other => panic!("expected fetch EOF, got `{other:?}`"),
        }
    }

    #[tokio::test]
    async fn test_fetch_task_happy_path() {
        let tempdir = tempfile::tempdir().unwrap();
        let mrecordlog = Arc::new(RwLock::new(Some(
            MultiRecordLogAsync::open(tempdir.path()).await.unwrap(),
        )));
        let client_id = "test-client".to_string();
        let index_uid: IndexUid = IndexUid::for_test("test-index", 0);
        let source_id = "test-source".to_string();
        let shard_id = ShardId::from(1);
        let queue_id = queue_id(&index_uid, &source_id, &shard_id);

        let open_fetch_stream_request = OpenFetchStreamRequest {
            client_id: client_id.clone(),
            index_uid: Some(index_uid.clone()),
            source_id: source_id.clone(),
            shard_id: Some(shard_id.clone()),
            from_position_exclusive: Some(Position::Beginning),
        };
        let (shard_status_tx, shard_status_rx) = watch::channel(ShardStatus::default());
        let (mut fetch_stream, fetch_task_handle) = FetchStreamTask::spawn(
            open_fetch_stream_request,
            mrecordlog.clone(),
            shard_status_rx,
            1024,
        );
        let mut mrecordlog_guard = mrecordlog.write().await;

        mrecordlog_guard
            .as_mut()
            .unwrap()
            .create_queue(&queue_id)
            .await
            .unwrap();
        mrecordlog_guard
            .as_mut()
            .unwrap()
            .append_records(
                &queue_id,
                None,
                std::iter::once(MRecord::new_doc("test-doc-foo").encode()),
            )
            .await
            .unwrap();
        drop(mrecordlog_guard);

        let fetch_message = timeout(Duration::from_millis(100), fetch_stream.next())
            .await
            .unwrap()
            .unwrap()
            .unwrap();
        let fetch_payload = into_fetch_payload(fetch_message);

        assert_eq!(fetch_payload.index_uid(), &index_uid);
        assert_eq!(fetch_payload.source_id, source_id);
        assert_eq!(fetch_payload.shard_id(), shard_id);
        assert_eq!(fetch_payload.from_position_exclusive(), Position::Beginning);
        assert_eq!(
            fetch_payload.to_position_inclusive(),
            Position::offset(0u64)
        );
        assert_eq!(
            fetch_payload
                .mrecord_batch
                .as_ref()
                .unwrap()
                .mrecord_lengths,
            [14]
        );
        assert_eq!(
            fetch_payload.mrecord_batch.as_ref().unwrap().mrecord_buffer,
            "\0\0test-doc-foo"
        );

        timeout(Duration::from_millis(100), fetch_stream.next())
            .await
            .unwrap_err();

        // Trigger a spurious notification.
        let shard_status = (ShardState::Open, Position::offset(0u64));
        shard_status_tx.send(shard_status).unwrap();

        timeout(Duration::from_millis(100), fetch_stream.next())
            .await
            .unwrap_err();

        let mut mrecordlog_guard = mrecordlog.write().await;

        mrecordlog_guard
            .as_mut()
            .unwrap()
            .append_records(
                &queue_id,
                None,
                std::iter::once(MRecord::new_doc("test-doc-bar").encode()),
            )
            .await
            .unwrap();
        drop(mrecordlog_guard);

        let shard_status = (ShardState::Open, Position::offset(1u64));
        shard_status_tx.send(shard_status.clone()).unwrap();

        let fetch_message = timeout(Duration::from_millis(100), fetch_stream.next())
            .await
            .unwrap()
            .unwrap()
            .unwrap();
        let fetch_payload = into_fetch_payload(fetch_message);

        assert_eq!(
            fetch_payload.from_position_exclusive(),
            Position::offset(0u64)
        );
        assert_eq!(
            fetch_payload.to_position_inclusive(),
            Position::offset(1u64)
        );
        assert_eq!(
            fetch_payload
                .mrecord_batch
                .as_ref()
                .unwrap()
                .mrecord_lengths,
            [14]
        );
        assert_eq!(
            fetch_payload.mrecord_batch.as_ref().unwrap().mrecord_buffer,
            "\0\0test-doc-bar"
        );

        let mut mrecordlog_guard = mrecordlog.write().await;

        let mrecords = [
            MRecord::new_doc("test-doc-baz").encode(),
            MRecord::new_doc("test-doc-qux").encode(),
        ]
        .into_iter();

        mrecordlog_guard
            .as_mut()
            .unwrap()
            .append_records(&queue_id, None, mrecords)
            .await
            .unwrap();
        drop(mrecordlog_guard);

        let shard_status = (ShardState::Open, Position::offset(3u64));
        shard_status_tx.send(shard_status).unwrap();

        let fetch_message = timeout(Duration::from_millis(100), fetch_stream.next())
            .await
            .unwrap()
            .unwrap()
            .unwrap();
        let fetch_payload = into_fetch_payload(fetch_message);

        assert_eq!(
            fetch_payload.from_position_exclusive(),
            Position::offset(1u64)
        );
        assert_eq!(
            fetch_payload.to_position_inclusive(),
            Position::offset(3u64)
        );
        assert_eq!(
            fetch_payload
                .mrecord_batch
                .as_ref()
                .unwrap()
                .mrecord_lengths,
            [14, 14]
        );
        assert_eq!(
            fetch_payload.mrecord_batch.as_ref().unwrap().mrecord_buffer,
            "\0\0test-doc-baz\0\0test-doc-qux"
        );

        let shard_status = (ShardState::Closed, Position::offset(3u64));
        shard_status_tx.send(shard_status).unwrap();

        let fetch_message = timeout(Duration::from_millis(100), fetch_stream.next())
            .await
            .unwrap()
            .unwrap()
            .unwrap();
        let fetch_eof = into_fetch_eof(fetch_message);

        assert_eq!(fetch_eof.index_uid(), &index_uid);
        assert_eq!(fetch_eof.source_id, source_id);
        assert_eq!(fetch_eof.shard_id(), shard_id);
        assert_eq!(fetch_eof.eof_position, Some(Position::eof(3u64)));

        fetch_task_handle.await.unwrap();
    }

    #[tokio::test]
    async fn test_fetch_task_signals_eof() {
        let tempdir = tempfile::tempdir().unwrap();
        let mrecordlog = Arc::new(RwLock::new(Some(
            MultiRecordLogAsync::open(tempdir.path()).await.unwrap(),
        )));
        let client_id = "test-client".to_string();
        let index_uid: IndexUid = IndexUid::for_test("test-index", 0);
        let source_id = "test-source".to_string();
        let shard_id = ShardId::from(1);
        let queue_id = queue_id(&index_uid, &source_id, &shard_id);

        let mut mrecordlog_guard = mrecordlog.write().await;

        mrecordlog_guard
            .as_mut()
            .unwrap()
            .create_queue(&queue_id)
            .await
            .unwrap();

        mrecordlog_guard
            .as_mut()
            .unwrap()
            .append_records(
                &queue_id,
                None,
                std::iter::once(MRecord::new_doc("test-doc-foo").encode()),
            )
            .await
            .unwrap();
        drop(mrecordlog_guard);

        let open_fetch_stream_request = OpenFetchStreamRequest {
            client_id: client_id.clone(),
            index_uid: Some(index_uid.clone()),
            source_id: source_id.clone(),
            shard_id: Some(shard_id.clone()),
            from_position_exclusive: Some(Position::offset(0u64)),
        };
        let shard_status = (ShardState::Closed, Position::offset(0u64));
        let (_shard_status_tx, shard_status_rx) = watch::channel(shard_status);

        let (mut fetch_stream, fetch_task_handle) = FetchStreamTask::spawn(
            open_fetch_stream_request,
            mrecordlog.clone(),
            shard_status_rx,
            1024,
        );
        let fetch_message = timeout(Duration::from_millis(100), fetch_stream.next())
            .await
            .unwrap()
            .unwrap()
            .unwrap();
        let fetch_eof = into_fetch_eof(fetch_message);

        assert_eq!(fetch_eof.index_uid(), &index_uid);
        assert_eq!(fetch_eof.source_id, source_id);
        assert_eq!(fetch_eof.shard_id(), shard_id);
        assert_eq!(fetch_eof.eof_position, Some(Position::eof(0u64).as_eof()));

        fetch_task_handle.await.unwrap();
    }

    #[tokio::test]
    async fn test_fetch_task_signals_eof_at_beginning() {
        let tempdir = tempfile::tempdir().unwrap();
        let mrecordlog = Arc::new(RwLock::new(Some(
            MultiRecordLogAsync::open(tempdir.path()).await.unwrap(),
        )));
        let client_id = "test-client".to_string();
        let index_uid: IndexUid = IndexUid::for_test("test-index", 0);
        let source_id = "test-source".to_string();
        let shard_id = ShardId::from(1);
        let queue_id = queue_id(&index_uid, &source_id, &shard_id);

        let open_fetch_stream_request = OpenFetchStreamRequest {
            client_id: client_id.clone(),
            index_uid: Some(index_uid.clone()),
            source_id: source_id.clone(),
            shard_id: Some(shard_id.clone()),
            from_position_exclusive: Some(Position::Beginning),
        };
        let (shard_status_tx, shard_status_rx) = watch::channel(ShardStatus::default());
        let (mut fetch_stream, fetch_task_handle) = FetchStreamTask::spawn(
            open_fetch_stream_request,
            mrecordlog.clone(),
            shard_status_rx,
            1024,
        );
        let mut mrecordlog_guard = mrecordlog.write().await;

        mrecordlog_guard
            .as_mut()
            .unwrap()
            .create_queue(&queue_id)
            .await
            .unwrap();
        drop(mrecordlog_guard);

        let shard_status = (ShardState::Closed, Position::Beginning);
        shard_status_tx.send(shard_status).unwrap();

        let fetch_message = timeout(Duration::from_millis(100), fetch_stream.next())
            .await
            .unwrap()
            .unwrap()
            .unwrap();
        let fetch_eof = into_fetch_eof(fetch_message);

        assert_eq!(fetch_eof.index_uid(), &index_uid);
        assert_eq!(fetch_eof.source_id, source_id);
        assert_eq!(fetch_eof.shard_id(), shard_id);
        assert_eq!(fetch_eof.eof_position, Some(Position::Beginning.as_eof()));

        fetch_task_handle.await.unwrap();
    }

    #[tokio::test]
    async fn test_fetch_task_from_position_exclusive() {
        let tempdir = tempfile::tempdir().unwrap();
        let mrecordlog = Arc::new(RwLock::new(Some(
            MultiRecordLogAsync::open(tempdir.path()).await.unwrap(),
        )));
        let client_id = "test-client".to_string();
        let index_uid: IndexUid = IndexUid::for_test("test-index", 0);
        let source_id = "test-source".to_string();
        let shard_id = ShardId::from(1);
        let queue_id = queue_id(&index_uid, &source_id, &shard_id);

        let open_fetch_stream_request = OpenFetchStreamRequest {
            client_id: client_id.clone(),
            index_uid: Some(index_uid.clone()),
            source_id: source_id.clone(),
            shard_id: Some(shard_id.clone()),
            from_position_exclusive: Some(Position::offset(0u64)),
        };
        let (shard_status_tx, shard_status_rx) = watch::channel(ShardStatus::default());
        let (mut fetch_stream, _fetch_task_handle) = FetchStreamTask::spawn(
            open_fetch_stream_request,
            mrecordlog.clone(),
            shard_status_rx,
            1024,
        );
        let mut mrecordlog_guard = mrecordlog.write().await;

        mrecordlog_guard
            .as_mut()
            .unwrap()
            .create_queue(&queue_id)
            .await
            .unwrap();
        drop(mrecordlog_guard);

        timeout(Duration::from_millis(100), fetch_stream.next())
            .await
            .unwrap_err();

        let mut mrecordlog_guard = mrecordlog.write().await;

        mrecordlog_guard
            .as_mut()
            .unwrap()
            .append_records(
                &queue_id,
                None,
                std::iter::once(MRecord::new_doc("test-doc-foo").encode()),
            )
            .await
            .unwrap();
        drop(mrecordlog_guard);

        let shard_status = (ShardState::Open, Position::offset(0u64));
        shard_status_tx.send(shard_status).unwrap();

        timeout(Duration::from_millis(100), fetch_stream.next())
            .await
            .unwrap_err();

        let mut mrecordlog_guard = mrecordlog.write().await;

        mrecordlog_guard
            .as_mut()
            .unwrap()
            .append_records(
                &queue_id,
                None,
                std::iter::once(MRecord::new_doc("test-doc-bar").encode()),
            )
            .await
            .unwrap();
        drop(mrecordlog_guard);

        let shard_status = (ShardState::Open, Position::offset(1u64));
        shard_status_tx.send(shard_status).unwrap();

        let fetch_message = timeout(Duration::from_millis(100), fetch_stream.next())
            .await
            .unwrap()
            .unwrap()
            .unwrap();
        let fetch_payload = into_fetch_payload(fetch_message);

        assert_eq!(fetch_payload.index_uid(), &index_uid);
        assert_eq!(fetch_payload.source_id, source_id);
        assert_eq!(fetch_payload.shard_id(), shard_id);
        assert_eq!(
            fetch_payload.from_position_exclusive(),
            Position::offset(0u64)
        );
        assert_eq!(
            fetch_payload.to_position_inclusive(),
            Position::offset(1u64)
        );
        assert_eq!(
            fetch_payload
                .mrecord_batch
                .as_ref()
                .unwrap()
                .mrecord_lengths,
            [14]
        );
        assert_eq!(
            fetch_payload.mrecord_batch.as_ref().unwrap().mrecord_buffer,
            "\0\0test-doc-bar"
        );
    }

    #[tokio::test]
    async fn test_fetch_task_error() {
        let tempdir = tempfile::tempdir().unwrap();
        let mrecordlog = Arc::new(RwLock::new(Some(
            MultiRecordLogAsync::open(tempdir.path()).await.unwrap(),
        )));
        let client_id = "test-client".to_string();
        let index_uid: IndexUid = IndexUid::for_test("test-index", 0);
        let source_id = "test-source".to_string();
        let shard_id = ShardId::from(1);

        let open_fetch_stream_request = OpenFetchStreamRequest {
            client_id: client_id.clone(),
            index_uid: Some(index_uid.clone()),
            source_id: source_id.clone(),
            shard_id: Some(shard_id.clone()),
            from_position_exclusive: Some(Position::Beginning),
        };
        let (_shard_status_tx, shard_status_rx) = watch::channel(ShardStatus::default());
        let (mut fetch_stream, fetch_task_handle) = FetchStreamTask::spawn(
            open_fetch_stream_request,
            mrecordlog.clone(),
            shard_status_rx,
            1024,
        );
        let ingest_error = timeout(Duration::from_millis(100), fetch_stream.next())
            .await
            .unwrap()
            .unwrap()
            .unwrap_err();
        assert!(matches!(ingest_error, IngestV2Error::Internal(_)));

        fetch_task_handle.await.unwrap();
    }

    #[tokio::test]
    async fn test_fetch_task_batch_num_bytes() {
        let tempdir = tempfile::tempdir().unwrap();
        let mrecordlog = Arc::new(RwLock::new(Some(
            MultiRecordLogAsync::open(tempdir.path()).await.unwrap(),
        )));
        let client_id = "test-client".to_string();
        let index_uid: IndexUid = IndexUid::for_test("test-index", 0);
        let source_id = "test-source".to_string();
        let shard_id = ShardId::from(1);
        let queue_id = queue_id(&index_uid, &source_id, &shard_id);

        let open_fetch_stream_request = OpenFetchStreamRequest {
            client_id: client_id.clone(),
            index_uid: Some(index_uid.clone()),
            source_id: source_id.clone(),
            shard_id: Some(shard_id.clone()),
            from_position_exclusive: Some(Position::Beginning),
        };
        let (shard_status_tx, shard_status_rx) = watch::channel(ShardStatus::default());
        let (mut fetch_stream, _fetch_task_handle) = FetchStreamTask::spawn(
            open_fetch_stream_request,
            mrecordlog.clone(),
            shard_status_rx,
            30,
        );
        let mut mrecordlog_guard = mrecordlog.write().await;

        mrecordlog_guard
            .as_mut()
            .unwrap()
            .create_queue(&queue_id)
            .await
            .unwrap();

        let records = [
            Bytes::from_static(b"test-doc-foo"),
            Bytes::from_static(b"test-doc-bar"),
            Bytes::from_static(b"test-doc-baz"),
        ]
        .into_iter();

        mrecordlog_guard
            .as_mut()
            .unwrap()
            .append_records(&queue_id, None, records)
            .await
            .unwrap();
        drop(mrecordlog_guard);

        let shard_status = (ShardState::Open, Position::offset(2u64));
        shard_status_tx.send(shard_status).unwrap();

        let fetch_message = timeout(Duration::from_millis(100), fetch_stream.next())
            .await
            .unwrap()
            .unwrap()
            .unwrap();
        let fetch_payload = into_fetch_payload(fetch_message);

        assert_eq!(
            fetch_payload
                .mrecord_batch
                .as_ref()
                .unwrap()
                .mrecord_lengths,
            [12, 12]
        );
        assert_eq!(
            fetch_payload.mrecord_batch.as_ref().unwrap().mrecord_buffer,
            "test-doc-footest-doc-bar"
        );

        let fetch_message = timeout(Duration::from_millis(100), fetch_stream.next())
            .await
            .unwrap()
            .unwrap()
            .unwrap();
        let fetch_payload = into_fetch_payload(fetch_message);

        assert_eq!(
            fetch_payload
                .mrecord_batch
                .as_ref()
                .unwrap()
                .mrecord_lengths,
            [12]
        );
        assert_eq!(
            fetch_payload.mrecord_batch.as_ref().unwrap().mrecord_buffer,
            "test-doc-baz"
        );
    }

    #[tokio::test]
    async fn test_fetch_task_batch_num_bytes_less_than_record_payload() {
        let tempdir = tempfile::tempdir().unwrap();
        let mrecordlog = Arc::new(RwLock::new(Some(
            MultiRecordLogAsync::open(tempdir.path()).await.unwrap(),
        )));
        let client_id = "test-client".to_string();
        let index_uid: IndexUid = IndexUid::for_test("test-index", 0);
        let source_id = "test-source".to_string();
        let shard_id = ShardId::from(1);
        let queue_id = queue_id(&index_uid, &source_id, &shard_id);

        let open_fetch_stream_request = OpenFetchStreamRequest {
            client_id: client_id.clone(),
            index_uid: Some(index_uid.clone()),
            source_id: source_id.clone(),
            shard_id: Some(shard_id.clone()),
            from_position_exclusive: Some(Position::Beginning),
        };
        let (shard_status_tx, shard_status_rx) = watch::channel(ShardStatus::default());
        let (mut fetch_stream, _fetch_task_handle) = FetchStreamTask::spawn(
            open_fetch_stream_request,
            mrecordlog.clone(),
            shard_status_rx,
            10, //< we request batch larger than 10 bytes.
        );

        let mut mrecordlog_guard = mrecordlog.write().await;

        mrecordlog_guard
            .as_mut()
            .unwrap()
            .create_queue(&queue_id)
            .await
            .unwrap();

        mrecordlog_guard
            .as_mut()
            .unwrap()
            .append_records(
                &queue_id,
                None,
                // This doc is longer than 10 bytes.
                std::iter::once(MRecord::new_doc("test-doc-foo").encode()),
            )
            .await
            .unwrap();

        drop(mrecordlog_guard);

        let shard_status = (ShardState::Open, Position::offset(1u64));
        shard_status_tx.send(shard_status).unwrap();

        let fetch_message = timeout(Duration::from_millis(100), fetch_stream.next())
            .await
            .unwrap()
            .unwrap()
            .unwrap();

        let fetch_payload = into_fetch_payload(fetch_message);

        assert_eq!(
            fetch_payload
                .mrecord_batch
                .as_ref()
                .unwrap()
                .mrecord_lengths,
            [14]
        );
        assert_eq!(
            fetch_payload.mrecord_batch.as_ref().unwrap().mrecord_buffer,
            "\0\0test-doc-foo"
        );
    }

    #[test]
    fn test_select_preferred_and_failover_ingesters() {
        let self_node_id: NodeId = "test-ingester-0".into();

        let (preferred, failover) =
            select_preferred_and_failover_ingesters(&self_node_id, "test-ingester-0".into(), None);
        assert_eq!(preferred, "test-ingester-0");
        assert!(failover.is_none());

        let (preferred, failover) = select_preferred_and_failover_ingesters(
            &self_node_id,
            "test-ingester-0".into(),
            Some("test-ingester-1".into()),
        );
        assert_eq!(preferred, "test-ingester-0");
        assert_eq!(failover.unwrap(), "test-ingester-1");

        let (preferred, failover) = select_preferred_and_failover_ingesters(
            &self_node_id,
            "test-ingester-1".into(),
            Some("test-ingester-0".into()),
        );
        assert_eq!(preferred, "test-ingester-0");
        assert_eq!(failover.unwrap(), "test-ingester-1");
    }

    #[tokio::test]
    async fn test_fault_tolerant_fetch_stream_ingester_unavailable_failover() {
        let client_id = "test-client".to_string();
        let index_uid: IndexUid = IndexUid::for_test("test-index", 0);
        let source_id: SourceId = "test-source".into();
        let shard_id = ShardId::from(1);
        let mut from_position_exclusive = Position::offset(0u64);

        let ingester_ids: Vec<NodeId> = vec!["test-ingester-0".into(), "test-ingester-1".into()];
        let ingester_pool = IngesterPool::default();

        let (fetch_message_tx, mut fetch_stream) = ServiceStream::new_bounded(5);
        let (service_stream_tx_1, service_stream_1) = ServiceStream::new_unbounded();

        let mut mock_ingester_1 = MockIngesterService::new();
        let index_uid_clone = index_uid.clone();
        mock_ingester_1
            .expect_open_fetch_stream()
            .return_once(move |request| {
                assert_eq!(request.client_id, "test-client");
                assert_eq!(request.index_uid(), &index_uid_clone);
                assert_eq!(request.source_id, "test-source");
                assert_eq!(request.shard_id(), ShardId::from(1));
                assert_eq!(request.from_position_exclusive(), Position::offset(0u64));

                Ok(service_stream_1)
            });
        let ingester_1 =
            IngesterPoolEntry::ready_with_client(IngesterServiceClient::from_mock(mock_ingester_1));
        ingester_pool.insert("test-ingester-1".into(), ingester_1);

        let fetch_payload = FetchPayload {
            index_uid: Some(index_uid.clone()),
            source_id: source_id.clone(),
            shard_id: Some(shard_id.clone()),
            mrecord_batch: MRecordBatch::for_test(["\0\0test-doc-foo"]),
            from_position_exclusive: Some(Position::offset(0u64)),
            to_position_inclusive: Some(Position::offset(1u64)),
        };
        let fetch_message = FetchMessage::new_payload(fetch_payload);
        service_stream_tx_1.send(Ok(fetch_message)).unwrap();

        let fetch_eof = FetchEof {
            index_uid: Some(index_uid.clone()),
            source_id: source_id.clone(),
            shard_id: Some(shard_id.clone()),
            eof_position: Some(Position::eof(1u64)),
        };
        let fetch_message = FetchMessage::new_eof(fetch_eof);
        service_stream_tx_1.send(Ok(fetch_message)).unwrap();

        fault_tolerant_fetch_stream(
            client_id,
            index_uid,
            source_id,
            shard_id,
            &mut from_position_exclusive,
            &ingester_ids,
            ingester_pool,
            fetch_message_tx,
        )
        .await;

        let fetch_message = timeout(Duration::from_millis(100), fetch_stream.next())
            .await
            .unwrap()
            .unwrap()
            .unwrap()
            .into_inner();
        let fetch_payload = into_fetch_payload(fetch_message);

        assert_eq!(
            fetch_payload.from_position_exclusive(),
            Position::offset(0u64)
        );
        assert_eq!(
            fetch_payload.to_position_inclusive(),
            Position::offset(1u64)
        );

        let fetch_message = timeout(Duration::from_millis(100), fetch_stream.next())
            .await
            .unwrap()
            .unwrap()
            .unwrap()
            .into_inner();
        let fetch_eof = into_fetch_eof(fetch_message);

        assert_eq!(fetch_eof.eof_position(), Position::eof(1u64));

        assert!(
            timeout(Duration::from_millis(100), fetch_stream.next())
                .await
                .unwrap()
                .is_none()
        );
    }

    #[tokio::test]
    async fn test_fault_tolerant_fetch_stream_open_fetch_stream_error_failover() {
        let client_id = "test-client".to_string();
        let index_uid: IndexUid = IndexUid::for_test("test-index", 0);
        let source_id: SourceId = "test-source".into();
        let shard_id = ShardId::from(1);
        let mut from_position_exclusive = Position::offset(0u64);

        let ingester_ids: Vec<NodeId> = vec!["test-ingester-0".into(), "test-ingester-1".into()];
        let ingester_pool = IngesterPool::default();

        let (fetch_message_tx, mut fetch_stream) = ServiceStream::new_bounded(5);
        let (service_stream_tx_1, service_stream_1) = ServiceStream::new_unbounded();

        let mut mock_ingester_0 = MockIngesterService::new();
        let index_uid_clone = index_uid.clone();
        mock_ingester_0
            .expect_open_fetch_stream()
            .return_once(move |request| {
                assert_eq!(request.client_id, "test-client");
                assert_eq!(request.index_uid(), &index_uid_clone);
                assert_eq!(request.source_id, "test-source");
                assert_eq!(request.shard_id(), ShardId::from(1));
                assert_eq!(request.from_position_exclusive(), Position::offset(0u64));

                Err(IngestV2Error::Internal(
                    "open fetch stream error".to_string(),
                ))
            });
        let ingester_0 =
            IngesterPoolEntry::ready_with_client(IngesterServiceClient::from_mock(mock_ingester_0));

        let mut mock_ingester_1 = MockIngesterService::new();
        let index_uid_clone = index_uid.clone();
        mock_ingester_1
            .expect_open_fetch_stream()
            .return_once(move |request| {
                assert_eq!(request.client_id, "test-client");
                assert_eq!(request.index_uid(), &index_uid_clone);
                assert_eq!(request.source_id, "test-source");
                assert_eq!(request.shard_id(), ShardId::from(1));
                assert_eq!(request.from_position_exclusive(), Position::offset(0u64));

                Ok(service_stream_1)
            });
        let ingester_1 =
            IngesterPoolEntry::ready_with_client(IngesterServiceClient::from_mock(mock_ingester_1));

        ingester_pool.insert("test-ingester-0".into(), ingester_0);
        ingester_pool.insert("test-ingester-1".into(), ingester_1);

        let fetch_payload = FetchPayload {
            index_uid: Some(index_uid.clone()),
            source_id: source_id.clone(),
            shard_id: Some(shard_id.clone()),
            mrecord_batch: MRecordBatch::for_test(["\0\0test-doc-foo"]),
            from_position_exclusive: Some(Position::offset(0u64)),
            to_position_inclusive: Some(Position::offset(1u64)),
        };
        let fetch_message = FetchMessage::new_payload(fetch_payload);
        service_stream_tx_1.send(Ok(fetch_message)).unwrap();

        let fetch_eof = FetchEof {
            index_uid: Some(index_uid.clone()),
            source_id: source_id.clone(),
            shard_id: Some(shard_id.clone()),
            eof_position: Some(Position::eof(1u64)),
        };
        let fetch_message = FetchMessage::new_eof(fetch_eof);
        service_stream_tx_1.send(Ok(fetch_message)).unwrap();

        fault_tolerant_fetch_stream(
            client_id,
            index_uid,
            source_id,
            shard_id,
            &mut from_position_exclusive,
            &ingester_ids,
            ingester_pool,
            fetch_message_tx,
        )
        .await;

        let fetch_message = timeout(Duration::from_millis(100), fetch_stream.next())
            .await
            .unwrap()
            .unwrap()
            .unwrap()
            .into_inner();
        let fetch_payload = into_fetch_payload(fetch_message);

        assert_eq!(
            fetch_payload.from_position_exclusive(),
            Position::offset(0u64)
        );
        assert_eq!(
            fetch_payload.to_position_inclusive(),
            Position::offset(1u64)
        );

        let fetch_message = timeout(Duration::from_millis(100), fetch_stream.next())
            .await
            .unwrap()
            .unwrap()
            .unwrap()
            .into_inner();
        let fetch_eof = into_fetch_eof(fetch_message);

        assert_eq!(fetch_eof.eof_position(), Position::eof(1u64));

        assert!(
            timeout(Duration::from_millis(100), fetch_stream.next())
                .await
                .unwrap()
                .is_none()
        );
    }

    #[tokio::test]
    async fn test_fault_tolerant_fetch_stream_error_failover() {
        let client_id = "test-client".to_string();
        let index_uid: IndexUid = IndexUid::for_test("test-index", 0);
        let source_id: SourceId = "test-source".into();
        let shard_id = ShardId::from(1);
        let mut from_position_exclusive = Position::offset(0u64);

        let ingester_ids: Vec<NodeId> = vec!["test-ingester-0".into(), "test-ingester-1".into()];
        let ingester_pool = IngesterPool::default();

        let (fetch_message_tx, mut fetch_stream) = ServiceStream::new_bounded(5);
        let (service_stream_tx_0, service_stream_0) = ServiceStream::new_unbounded();
        let (service_stream_tx_1, service_stream_1) = ServiceStream::new_unbounded();

        let mut mock_ingester_0 = MockIngesterService::new();
        let index_uid_clone = index_uid.clone();
        mock_ingester_0
            .expect_open_fetch_stream()
            .return_once(move |request| {
                assert_eq!(request.client_id, "test-client");
                assert_eq!(request.index_uid(), &index_uid_clone);
                assert_eq!(request.source_id, "test-source");
                assert_eq!(request.shard_id(), ShardId::from(1));
                assert_eq!(request.from_position_exclusive(), Position::offset(0u64));

                Ok(service_stream_0)
            });
        let ingester_0 =
            IngesterPoolEntry::ready_with_client(IngesterServiceClient::from_mock(mock_ingester_0));

        let mut mock_ingester_1 = MockIngesterService::new();
        let index_uid_clone = index_uid.clone();
        mock_ingester_1
            .expect_open_fetch_stream()
            .return_once(move |request| {
                assert_eq!(request.client_id, "test-client");
                assert_eq!(request.index_uid(), &index_uid_clone);
                assert_eq!(request.source_id, "test-source");
                assert_eq!(request.shard_id(), ShardId::from(1));
                assert_eq!(request.from_position_exclusive(), Position::offset(1u64));

                Ok(service_stream_1)
            });
        let ingester_1 =
            IngesterPoolEntry::ready_with_client(IngesterServiceClient::from_mock(mock_ingester_1));

        ingester_pool.insert("test-ingester-0".into(), ingester_0);
        ingester_pool.insert("test-ingester-1".into(), ingester_1);

        let fetch_payload = FetchPayload {
            index_uid: Some(index_uid.clone()),
            source_id: source_id.clone(),
            shard_id: Some(shard_id.clone()),
            mrecord_batch: MRecordBatch::for_test(["\0\0test-doc-foo"]),
            from_position_exclusive: Some(Position::offset(0u64)),
            to_position_inclusive: Some(Position::offset(1u64)),
        };
        let fetch_message = FetchMessage::new_payload(fetch_payload);
        service_stream_tx_0.send(Ok(fetch_message)).unwrap();

        let ingest_error = IngestV2Error::Internal("fetch stream error".into());
        service_stream_tx_0.send(Err(ingest_error)).unwrap();

        let fetch_eof = FetchEof {
            index_uid: Some(index_uid.clone()),
            source_id: source_id.clone(),
            shard_id: Some(shard_id.clone()),
            eof_position: Some(Position::eof(1u64)),
        };
        let fetch_message = FetchMessage::new_eof(fetch_eof);
        service_stream_tx_1.send(Ok(fetch_message)).unwrap();

        fault_tolerant_fetch_stream(
            client_id,
            index_uid,
            source_id,
            shard_id,
            &mut from_position_exclusive,
            &ingester_ids,
            ingester_pool,
            fetch_message_tx,
        )
        .await;

        let fetch_message = timeout(Duration::from_millis(100), fetch_stream.next())
            .await
            .unwrap()
            .unwrap()
            .unwrap()
            .into_inner();
        let fetch_payload = into_fetch_payload(fetch_message);

        assert_eq!(
            fetch_payload.from_position_exclusive(),
            Position::offset(0u64)
        );
        assert_eq!(
            fetch_payload.to_position_inclusive(),
            Position::offset(1u64)
        );

        let fetch_message = timeout(Duration::from_millis(100), fetch_stream.next())
            .await
            .unwrap()
            .unwrap()
            .unwrap()
            .into_inner();
        let fetch_eof = into_fetch_eof(fetch_message);

        assert_eq!(fetch_eof.eof_position(), Position::eof(1u64));

        assert!(
            timeout(Duration::from_millis(100), fetch_stream.next())
                .await
                .unwrap()
                .is_none()
        );
    }

    #[tokio::test]
    async fn test_fault_tolerant_fetch_stream_shard_not_found() {
        let client_id = "test-client".to_string();
        let index_uid: IndexUid = IndexUid::for_test("test-index", 0);
        let source_id: SourceId = "test-source".into();
        let shard_id = ShardId::from(1);
        let mut from_position_exclusive = Position::offset(0u64);

        let ingester_ids: Vec<NodeId> = vec!["test-ingester-0".into(), "test-ingester-1".into()];
        let ingester_pool = IngesterPool::default();

        let (fetch_message_tx, mut fetch_stream) = ServiceStream::new_bounded(5);

        let mut mock_ingester_0 = MockIngesterService::new();
        let index_uid_clone = index_uid.clone();
        mock_ingester_0
            .expect_open_fetch_stream()
            .return_once(move |request| {
                assert_eq!(request.client_id, "test-client");
                assert_eq!(request.index_uid(), &index_uid_clone);
                assert_eq!(request.source_id, "test-source");
                assert_eq!(request.shard_id(), ShardId::from(1));
                assert_eq!(request.from_position_exclusive(), Position::offset(0u64));

                Err(IngestV2Error::ShardNotFound {
                    shard_id: ShardId::from(1),
                })
            });
        let ingester_0 =
            IngesterPoolEntry::ready_with_client(IngesterServiceClient::from_mock(mock_ingester_0));
        ingester_pool.insert("test-ingester-0".into(), ingester_0);

        fault_tolerant_fetch_stream(
            client_id,
            index_uid,
            source_id,
            shard_id,
            &mut from_position_exclusive,
            &ingester_ids,
            ingester_pool,
            fetch_message_tx,
        )
        .await;

        let fetch_stream_error = timeout(Duration::from_millis(100), fetch_stream.next())
            .await
            .unwrap()
            .unwrap()
            .unwrap_err();

        assert!(matches!(
            fetch_stream_error.ingest_error,
            IngestV2Error::ShardNotFound { shard_id } if shard_id == ShardId::from(1)
        ));
        assert!(from_position_exclusive.is_eof());
    }

    #[tokio::test]
    async fn test_retrying_fetch_stream() {
        let client_id = "test-client".to_string();
        let index_uid: IndexUid = IndexUid::for_test("test-index", 0);
        let source_id: SourceId = "test-source".into();
        let shard_id = ShardId::from(1);
        let from_position_exclusive = Position::offset(0u64);

        let ingester_ids: Vec<NodeId> = vec!["test-ingester".into()];
        let ingester_pool = IngesterPool::default();

        let (fetch_message_tx, mut fetch_stream) = ServiceStream::new_bounded(5);
        let (service_stream_tx_1, service_stream_1) = ServiceStream::new_unbounded();
        let (service_stream_tx_2, service_stream_2) = ServiceStream::new_unbounded();

        let mut retry_params = RetryParams::for_test();
        retry_params.max_attempts = 3;

        let mut mock_ingester = MockIngesterService::new();
        let index_uid_clone = index_uid.clone();
        mock_ingester
            .expect_open_fetch_stream()
            .once()
            .returning(move |request| {
                assert_eq!(request.client_id, "test-client");
                assert_eq!(request.index_uid(), &index_uid_clone);
                assert_eq!(request.source_id, "test-source");
                assert_eq!(request.shard_id(), ShardId::from(1));
                assert_eq!(request.from_position_exclusive(), Position::offset(0u64));

                Err(IngestV2Error::Internal(
                    "open fetch stream error".to_string(),
                ))
            });
        let index_uid_clone = index_uid.clone();
        mock_ingester
            .expect_open_fetch_stream()
            .once()
            .return_once(move |request| {
                assert_eq!(request.client_id, "test-client");
                assert_eq!(request.index_uid(), &index_uid_clone);
                assert_eq!(request.source_id, "test-source");
                assert_eq!(request.shard_id(), ShardId::from(1));
                assert_eq!(request.from_position_exclusive(), Position::offset(0u64));

                Ok(service_stream_1)
            });
        let index_uid_clone = index_uid.clone();
        mock_ingester
            .expect_open_fetch_stream()
            .once()
            .return_once(move |request| {
                assert_eq!(request.client_id, "test-client");
                assert_eq!(request.index_uid(), &index_uid_clone);
                assert_eq!(request.source_id, "test-source");
                assert_eq!(request.shard_id(), ShardId::from(1));
                assert_eq!(request.from_position_exclusive(), Position::offset(1u64));

                Ok(service_stream_2)
            });
        let ingester =
            IngesterPoolEntry::ready_with_client(IngesterServiceClient::from_mock(mock_ingester));

        ingester_pool.insert("test-ingester".into(), ingester);

        let fetch_payload = FetchPayload {
            index_uid: Some(index_uid.clone()),
            source_id: source_id.clone(),
            shard_id: Some(shard_id.clone()),
            mrecord_batch: MRecordBatch::for_test(["\0\0test-doc-foo"]),
            from_position_exclusive: Some(Position::offset(0u64)),
            to_position_inclusive: Some(Position::offset(1u64)),
        };
        let fetch_message = FetchMessage::new_payload(fetch_payload);
        service_stream_tx_1.send(Ok(fetch_message)).unwrap();

        let ingest_error = IngestV2Error::Internal("fetch stream error #1".into());
        service_stream_tx_1.send(Err(ingest_error)).unwrap();

        let fetch_payload = FetchPayload {
            index_uid: Some(index_uid.clone()),
            source_id: source_id.clone(),
            shard_id: Some(shard_id.clone()),
            mrecord_batch: MRecordBatch::for_test(["\0\0test-doc-bar"]),
            from_position_exclusive: Some(Position::offset(1u64)),
            to_position_inclusive: Some(Position::offset(2u64)),
        };
        let fetch_message = FetchMessage::new_payload(fetch_payload);
        service_stream_tx_2.send(Ok(fetch_message)).unwrap();

        let ingest_error = IngestV2Error::Internal("fetch stream error #2".into());
        service_stream_tx_2.send(Err(ingest_error)).unwrap();

        retrying_fetch_stream(
            client_id,
            index_uid,
            source_id,
            shard_id,
            from_position_exclusive,
            ingester_ids,
            ingester_pool,
            retry_params,
            fetch_message_tx,
        )
        .await;

        let ingest_error = timeout(Duration::from_millis(100), fetch_stream.next())
            .await
            .unwrap()
            .unwrap()
            .unwrap_err()
            .ingest_error;
        assert!(
            matches!(ingest_error, IngestV2Error::Internal(message) if message == "open fetch stream error")
        );

        let fetch_message = timeout(Duration::from_millis(100), fetch_stream.next())
            .await
            .unwrap()
            .unwrap()
            .unwrap()
            .into_inner();
        let fetch_payload = into_fetch_payload(fetch_message);

        assert_eq!(
            fetch_payload.from_position_exclusive(),
            Position::offset(0u64)
        );
        assert_eq!(
            fetch_payload.to_position_inclusive(),
            Position::offset(1u64)
        );

        let fetch_stream_error = timeout(Duration::from_millis(100), fetch_stream.next())
            .await
            .unwrap()
            .unwrap()
            .unwrap_err();
        assert!(
            matches!(fetch_stream_error.ingest_error, IngestV2Error::Internal(message) if message == "fetch stream error #1")
        );

        let fetch_message = timeout(Duration::from_millis(100), fetch_stream.next())
            .await
            .unwrap()
            .unwrap()
            .unwrap()
            .into_inner();
        let fetch_payload = into_fetch_payload(fetch_message);

        assert_eq!(
            fetch_payload.from_position_exclusive(),
            Position::offset(1u64)
        );
        assert_eq!(
            fetch_payload.to_position_inclusive(),
            Position::offset(2u64)
        );

        let fetch_stream_error = timeout(Duration::from_millis(100), fetch_stream.next())
            .await
            .unwrap()
            .unwrap()
            .unwrap_err();
        assert!(
            matches!(fetch_stream_error.ingest_error, IngestV2Error::Internal(message) if message == "fetch stream error #2")
        );

        assert!(
            timeout(Duration::from_millis(100), fetch_stream.next())
                .await
                .unwrap()
                .is_none()
        );
    }

    #[tokio::test]
    async fn test_multi_fetch_stream() {
        let self_node_id: NodeId = "test-node".into();
        let client_id = "test-client".to_string();
        let ingester_pool = IngesterPool::default();
        let retry_params = RetryParams::for_test();
        let _multi_fetch_stream =
            MultiFetchStream::new(self_node_id, client_id, ingester_pool, retry_params);
        // TODO: Backport from original branch.
    }
}


================================================
FILE: quickwit/quickwit-ingest/src/ingest_v2/helpers.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::time::{Duration, Instant};

use anyhow::{Context, anyhow, bail};
use futures::StreamExt;
use quickwit_common::pretty::PrettyDisplay;
use quickwit_proto::ingest::ingester::{
    DecommissionRequest, IngesterService, IngesterStatus, OpenObservationStreamRequest,
};
use tracing::info;

/// Tries to get the current status of an ingester by opening an observation stream
/// and reading the first message.
///
/// # Errors
///
/// Returns an error if:
/// - The observation stream fails to open
/// - The stream ends without producing a message
/// - The stream ends after returning an error
pub async fn try_get_ingester_status(
    ingester: &impl IngesterService,
) -> anyhow::Result<IngesterStatus> {
    let mut observation_stream = ingester
        .open_observation_stream(OpenObservationStreamRequest {})
        .await
        .context("failed to open observation stream")?;

    let next_observation_message = observation_stream
        .next()
        .await
        .context("observation stream ended")?
        .context("observation stream failed")?;

    Ok(next_observation_message.status())
}

/// Waits for an ingester to reach a specific status by monitoring its observation stream.
///
/// This function continuously polls the observation stream until the ingester reaches
/// the desired status.
///
/// # Errors
///
/// Returns an error if:
/// - The observation stream fails to open
/// - The stream ends without producing a message
/// - The stream ends after returning an error
/// - The timeout is exceeded
pub async fn wait_for_ingester_status(
    ingester: &impl IngesterService,
    status: IngesterStatus,
    timeout_after: Duration,
) -> anyhow::Result<()> {
    debug_assert!(
        timeout_after > Duration::ZERO,
        "timeout_after should be greater than zero"
    );
    tokio::time::timeout(
        timeout_after,
        wait_for_ingester_status_inner(ingester, status),
    )
    .await
    .with_context(|| {
        format!(
            "timed out waiting for ingester to transition to status {status} after {} seconds",
            timeout_after.as_secs(),
        )
    })?
}

async fn wait_for_ingester_status_inner(
    ingester: &impl IngesterService,
    status: IngesterStatus,
) -> anyhow::Result<()> {
    let mut observation_stream = ingester
        .open_observation_stream(OpenObservationStreamRequest {})
        .await
        .context("failed to open observation stream")?;

    loop {
        match observation_stream.next().await {
            Some(Ok(observation_message)) => {
                if observation_message.status() == status {
                    return Ok(());
                }
            }
            Some(Err(error)) => {
                return Err(anyhow!(error).context("observation stream failed"));
            }
            None => {
                bail!("observation stream ended");
            }
        }
    }
}

/// Initiates decommission of an ingester and waits for it to complete.
///
/// This function sends a decommission request to the ingester and then waits
/// for it to reach the `Decommissioned` status.
///
/// # Errors
///
/// Returns an error if:
/// - The decommission request fails
/// - The observation stream fails to open
/// - The stream ends without producing a message
/// - The stream ends after returning an error
/// - The timeout is exceeded
pub async fn wait_for_ingester_decommission(
    ingester: &impl IngesterService,
    timeout_after: Duration,
) -> anyhow::Result<()> {
    let now = Instant::now();

    ingester
        .decommission(DecommissionRequest {})
        .await
        .context("failed to initiate ingester decommission")?;

    wait_for_ingester_status(
        ingester,
        IngesterStatus::Decommissioned,
        timeout_after.saturating_sub(now.elapsed()),
    )
    .await?;

    info!(
        "successfully decommissioned ingester in {}",
        now.elapsed().pretty_display()
    );
    Ok(())
}

#[cfg(test)]
mod tests {

    use std::time::Duration;

    use quickwit_common::ServiceStream;
    use quickwit_proto::ingest::ingester::{
        DecommissionResponse, IngesterServiceClient, MockIngesterService, ObservationMessage,
    };

    use super::*;

    #[tokio::test]
    async fn test_try_get_ingester_status() {
        let mut mock_ingester = MockIngesterService::new();
        mock_ingester
            .expect_open_observation_stream()
            .once()
            .returning(|_| {
                let (service_stream_tx, service_stream) = ServiceStream::new_bounded(1);
                let message = ObservationMessage {
                    node_id: "test-ingester".to_string(),
                    status: IngesterStatus::Initializing as i32,
                };
                service_stream_tx.try_send(Ok(message)).unwrap();
                Ok(service_stream)
            });
        let ingester = IngesterServiceClient::from_mock(mock_ingester);
        let status = try_get_ingester_status(&ingester).await.unwrap();
        assert_eq!(status, IngesterStatus::Initializing);
    }

    #[tokio::test]
    async fn test_wait_for_ingester_status() {
        let mut mock_ingester = MockIngesterService::new();
        mock_ingester
            .expect_open_observation_stream()
            .once()
            .returning(|_| {
                let (service_stream_tx, service_stream) = ServiceStream::new_bounded(2);
                let message = ObservationMessage {
                    node_id: "test-ingester".to_string(),
                    status: IngesterStatus::Initializing as i32,
                };
                service_stream_tx.try_send(Ok(message)).unwrap();

                let message = ObservationMessage {
                    node_id: "test-ingester".to_string(),
                    status: IngesterStatus::Ready as i32,
                };
                service_stream_tx.try_send(Ok(message)).unwrap();
                Ok(service_stream)
            });
        let ingester = IngesterServiceClient::from_mock(mock_ingester);
        wait_for_ingester_status(&ingester, IngesterStatus::Ready, Duration::from_secs(1))
            .await
            .unwrap();
    }

    #[tokio::test]
    async fn test_wait_for_ingester_decommission_elapsed_timeout_not_zero() {
        let mut mock_ingester = MockIngesterService::new();
        mock_ingester
            .expect_open_observation_stream()
            .once()
            .returning(|_| {
                let (service_stream_tx, service_stream) = ServiceStream::new_bounded(1);
                // Simulate the ingester transitioning to Decommissioned after 50ms.
                tokio::spawn(async move {
                    tokio::time::sleep(Duration::from_millis(50)).await;
                    let message = ObservationMessage {
                        node_id: "test-ingester".to_string(),
                        status: IngesterStatus::Decommissioned as i32,
                    };
                    service_stream_tx.try_send(Ok(message)).unwrap();
                });
                Ok(service_stream)
            });
        mock_ingester
            .expect_decommission()
            .once()
            .returning(|_| Ok(DecommissionResponse {}));
        let ingester = IngesterServiceClient::from_mock(mock_ingester);
        wait_for_ingester_decommission(&ingester, Duration::from_secs(1))
            .await
            .unwrap();
    }

    #[tokio::test]
    async fn test_wait_for_ingester_decommission() {
        let mut mock_ingester = MockIngesterService::new();
        mock_ingester
            .expect_open_observation_stream()
            .once()
            .returning(|_| {
                let (service_stream_tx, service_stream) = ServiceStream::new_bounded(3);
                let message = ObservationMessage {
                    node_id: "test-ingester".to_string(),
                    status: IngesterStatus::Ready as i32,
                };
                service_stream_tx.try_send(Ok(message)).unwrap();

                let message = ObservationMessage {
                    node_id: "test-ingester".to_string(),
                    status: IngesterStatus::Decommissioning as i32,
                };
                service_stream_tx.try_send(Ok(message)).unwrap();

                let message = ObservationMessage {
                    node_id: "test-ingester".to_string(),
                    status: IngesterStatus::Decommissioned as i32,
                };
                service_stream_tx.try_send(Ok(message)).unwrap();
                Ok(service_stream)
            });
        mock_ingester
            .expect_decommission()
            .once()
            .returning(|_| Ok(DecommissionResponse {}));
        let ingester = IngesterServiceClient::from_mock(mock_ingester);
        wait_for_ingester_decommission(&ingester, Duration::from_secs(1))
            .await
            .unwrap();
    }
}


================================================
FILE: quickwit/quickwit-ingest/src/ingest_v2/idle.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::time::{Duration, Instant};

use tokio::task::JoinHandle;
use tracing::info;

use super::state::WeakIngesterState;
use crate::with_lock_metrics;

const RUN_INTERVAL_PERIOD: Duration = if cfg!(test) {
    Duration::from_millis(50)
} else {
    Duration::from_secs(60)
};

/// Periodically closes idle shards.
pub(super) struct CloseIdleShardsTask {
    weak_state: WeakIngesterState,
    idle_shard_timeout: Duration,
}

impl CloseIdleShardsTask {
    pub fn spawn(weak_state: WeakIngesterState, idle_shard_timeout: Duration) -> JoinHandle<()> {
        let task = Self {
            weak_state,
            idle_shard_timeout,
        };
        tokio::spawn(async move {
            let Some(mut state) = task.weak_state.upgrade() else {
                return;
            };
            state.wait_for_ready().await;
            drop(state);

            task.run().await
        })
    }

    async fn run(&self) {
        let mut interval = tokio::time::interval(RUN_INTERVAL_PERIOD);

        loop {
            interval.tick().await;

            let Some(state) = self.weak_state.upgrade() else {
                return;
            };
            let Ok(mut state_guard) =
                with_lock_metrics!(state.lock_partially(), "close_idle_shards", "write").await
            else {
                return;
            };

            let now = Instant::now();

            for (queue_id, shard) in &mut state_guard.shards {
                if shard.is_open() && shard.is_idle(now, self.idle_shard_timeout) {
                    shard.close();
                    info!("closed idle shard `{queue_id}`");
                }
            }
        }
    }
}

#[cfg(test)]
mod tests {
    use quickwit_cluster::{ChannelTransport, create_cluster_for_test};
    use quickwit_config::service::QuickwitService;
    use quickwit_proto::types::{IndexUid, ShardId};

    use super::*;
    use crate::ingest_v2::models::IngesterShard;
    use crate::ingest_v2::state::IngesterState;

    #[tokio::test]
    async fn test_close_idle_shards_run() {
        let cluster = create_cluster_for_test(
            Vec::new(),
            &[QuickwitService::Indexer.as_str()],
            &ChannelTransport::default(),
            true,
        )
        .await
        .unwrap();
        let (_temp_dir, state) = IngesterState::for_test(cluster).await;
        let weak_state = state.weak();
        let idle_shard_timeout = RUN_INTERVAL_PERIOD * 4;
        let join_handle = CloseIdleShardsTask::spawn(weak_state, idle_shard_timeout);

        let mut state_guard = state.lock_partially().await.unwrap();
        let now = Instant::now();

        let index_uid = IndexUid::for_test("test-index", 0);
        let shard_01 = IngesterShard::new_solo(
            index_uid.clone(),
            "test-source".to_string(),
            ShardId::from(1),
        )
        .with_last_write(now - idle_shard_timeout)
        .build();
        let queue_id_01 = shard_01.queue_id();
        state_guard.shards.insert(queue_id_01.clone(), shard_01);

        let shard_02 = IngesterShard::new_solo(
            index_uid.clone(),
            "test-source".to_string(),
            ShardId::from(2),
        )
        .build();
        let queue_id_02 = shard_02.queue_id();
        state_guard.shards.insert(queue_id_02.clone(), shard_02);
        drop(state_guard);

        tokio::time::sleep(RUN_INTERVAL_PERIOD * 2).await;

        let state_guard = state.lock_partially().await.unwrap();
        state_guard
            .shards
            .get(&queue_id_01)
            .unwrap()
            .assert_is_closed();
        state_guard
            .shards
            .get(&queue_id_02)
            .unwrap()
            .assert_is_open();
        drop(state_guard);

        tokio::time::sleep(idle_shard_timeout).await;

        let state_guard = state.lock_partially().await.unwrap();
        state_guard
            .shards
            .get(&queue_id_02)
            .unwrap()
            .assert_is_closed();
        drop(state_guard);
        drop(state);

        tokio::time::timeout(Duration::from_secs(1), join_handle)
            .await
            .unwrap()
            .unwrap();
    }
}


================================================
FILE: quickwit/quickwit-ingest/src/ingest_v2/ingest.md
================================================
## Replication

### Settings

- ingest request timeout (35s), `Itimeout`
- persist request timeout (6s), `Ptimeout`
- replicate request timeout (3s), `Rtimeout`
- number of persist attempts (5), `k`

Knowing that persist requests issue replicate requests, and ingest requests issue persist requests, we must have approximately:
- `Ptimeout` >= 2 * `Rtimeout`
- `Itimeout` >= `k` * `Ptimeout`


================================================
FILE: quickwit/quickwit-ingest/src/ingest_v2/ingester.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::hash_map::Entry;
use std::collections::{BTreeMap, HashMap, HashSet};
use std::fmt;
use std::path::Path;
use std::sync::Arc;
use std::time::{Duration, Instant};

use async_trait::async_trait;
use bytesize::ByteSize;
use futures::StreamExt;
use futures::stream::FuturesUnordered;
use mrecordlog::error::CreateQueueError;
use once_cell::sync::OnceCell;
use quickwit_cluster::Cluster;
use quickwit_common::metrics::{GaugeGuard, MEMORY_METRICS};
use quickwit_common::pretty::PrettyDisplay;
use quickwit_common::pubsub::{EventBroker, EventSubscriber};
use quickwit_common::rate_limiter::{RateLimiter, RateLimiterSettings};
use quickwit_common::{ServiceStream, rate_limited_error, rate_limited_warn};
use quickwit_proto::control_plane::{
    AdviseResetShardsRequest, ControlPlaneService, ControlPlaneServiceClient,
};
use quickwit_proto::indexing::ShardPositionsUpdate;
use quickwit_proto::ingest::ingester::*;
use quickwit_proto::ingest::{
    CommitTypeV2, DocBatchV2, IngestV2Error, IngestV2Result, ParseFailure, Shard, ShardIds,
};
use quickwit_proto::types::{
    IndexUid, NodeId, Position, QueueId, ShardId, SourceId, SubrequestId, queue_id, split_queue_id,
};
use serde_json::{Value as JsonValue, json};
use tokio::sync::Semaphore;
use tokio::time::{sleep, timeout};
use tracing::{debug, error, info, warn};

use super::IngesterPool;
use super::broadcast::{BroadcastIngesterCapacityScoreTask, BroadcastLocalShardsTask};
use super::doc_mapper::validate_doc_batch;
use super::fetch::FetchStreamTask;
use super::idle::CloseIdleShardsTask;
use super::metrics::INGEST_V2_METRICS;
use super::models::IngesterShard;
use super::mrecordlog_utils::{
    AppendDocBatchError, append_non_empty_doc_batch, check_enough_capacity,
};
use super::rate_meter::RateMeter;
use super::replication::{
    ReplicationClient, ReplicationStreamTask, ReplicationStreamTaskHandle, ReplicationTask,
    SYN_REPLICATION_STREAM_CAPACITY,
};
use super::state::{IngesterState, InnerIngesterState, WeakIngesterState};
use crate::ingest_v2::doc_mapper::get_or_try_build_doc_mapper;
use crate::ingest_v2::metrics::report_wal_usage;
use crate::ingest_v2::models::IngesterShardType;
use crate::mrecordlog_async::MultiRecordLogAsync;
use crate::{FollowerId, estimate_size, with_lock_metrics};

/// Minimum interval between two reset shards operations.
const MIN_RESET_SHARDS_INTERVAL: Duration = if cfg!(any(test, feature = "testsuite")) {
    Duration::ZERO
} else {
    Duration::from_secs(60)
};

/// Duration after which persist requests time out with
/// [`quickwit_proto::ingest::IngestV2Error::Timeout`].
pub(super) const PERSIST_REQUEST_TIMEOUT: Duration = if cfg!(any(test, feature = "testsuite")) {
    Duration::from_millis(500)
} else {
    Duration::from_secs(6)
};

const DEFAULT_BATCH_NUM_BYTES: usize = 1024 * 1024; // 1 MiB

fn get_batch_num_bytes() -> usize {
    static BATCH_NUM_BYTES_CELL: OnceCell<usize> = OnceCell::new();
    *BATCH_NUM_BYTES_CELL.get_or_init(|| {
        quickwit_common::get_from_env("QW_INGEST_BATCH_NUM_BYTES", DEFAULT_BATCH_NUM_BYTES, false)
    })
}

#[derive(Clone)]
pub struct Ingester {
    self_node_id: NodeId,
    control_plane: ControlPlaneServiceClient,
    ingester_pool: IngesterPool,
    state: IngesterState,
    disk_capacity: ByteSize,
    memory_capacity: ByteSize,
    rate_limiter_settings: RateLimiterSettings,
    replication_factor: usize,
    // This semaphore ensures that the ingester that not run two reset shards operations
    // concurrently.
    reset_shards_permits: Arc<Semaphore>,
}

impl fmt::Debug for Ingester {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        f.debug_struct("Ingester")
            .field("replication_factor", &self.replication_factor)
            .finish()
    }
}

impl Ingester {
    #[allow(clippy::too_many_arguments)]
    pub async fn try_new(
        cluster: Cluster,
        control_plane: ControlPlaneServiceClient,
        ingester_pool: IngesterPool,
        wal_dir_path: &Path,
        disk_capacity: ByteSize,
        memory_capacity: ByteSize,
        rate_limiter_settings: RateLimiterSettings,
        replication_factor: usize,
        idle_shard_timeout: Duration,
    ) -> IngestV2Result<Self> {
        let self_node_id: NodeId = cluster.self_node_id().into();
        let state = IngesterState::load(
            cluster.clone(),
            wal_dir_path,
            disk_capacity,
            memory_capacity,
            rate_limiter_settings,
        )
        .await;

        let weak_state = state.weak();
        BroadcastLocalShardsTask::spawn(cluster.clone(), weak_state.clone());
        BroadcastIngesterCapacityScoreTask::spawn(cluster, weak_state.clone());
        CloseIdleShardsTask::spawn(weak_state, idle_shard_timeout);

        let ingester = Self {
            self_node_id,
            control_plane,
            ingester_pool,
            state,
            disk_capacity,
            memory_capacity,
            rate_limiter_settings,
            replication_factor,
            reset_shards_permits: Arc::new(Semaphore::new(1)),
        };
        ingester.background_reset_shards();

        Ok(ingester)
    }

    /// Checks whether the ingester is fully decommissioned and updates its status accordingly.
    async fn check_decommissioning_status(&self, state: &mut InnerIngesterState) {
        if state.status() != IngesterStatus::Decommissioning {
            return;
        }
        if state.shards.values().all(|shard| shard.is_indexed()) {
            state.set_status(IngesterStatus::Decommissioned).await;
        }
    }

    /// Initializes a primary shard by creating a queue in the write-ahead log and inserting a new
    /// [`IngesterShard`] into the ingester state. If replication is enabled, this method will
    /// also:
    /// - open a replication stream between the leader and the follower if one does not already
    ///   exist.
    /// - initialize the replica shard.
    async fn init_primary_shard(
        &self,
        state: &mut InnerIngesterState,
        mrecordlog: &mut MultiRecordLogAsync,
        shard: Shard,
        doc_mapping_json: &str,
        now: Instant,
        validate_docs: bool,
    ) -> IngestV2Result<()> {
        let queue_id = shard.queue_id();
        info!(
            index_uid=%shard.index_uid(),
            source_id=shard.source_id,
            shard_id=%shard.shard_id(),
            "init primary shard"
        );
        let Entry::Vacant(entry) = state.shards.entry(queue_id.clone()) else {
            return Ok(());
        };
        let doc_mapper = get_or_try_build_doc_mapper(
            &mut state.doc_mappers,
            shard.doc_mapping_uid(),
            doc_mapping_json,
        )?;
        match mrecordlog.create_queue(&queue_id).await {
            Ok(_) => {}
            Err(CreateQueueError::AlreadyExists) => {
                error!("WAL queue `{queue_id}` already exists");
                let message = format!("WAL queue `{queue_id}` already exists");
                return Err(IngestV2Error::Internal(message));
            }
            Err(CreateQueueError::IoError(io_error)) => {
                error!("failed to create WAL queue `{queue_id}`: {io_error}",);
                let message = format!("failed to create WAL queue `{queue_id}`: {io_error}");
                return Err(IngestV2Error::Internal(message));
            }
        };
        let index_uid = shard.index_uid().clone();
        let source_id = shard.source_id.clone();
        let shard_id = shard.shard_id().clone();
        let rate_limiter = RateLimiter::from_settings(self.rate_limiter_settings);
        let rate_meter = RateMeter::default();

        let primary_shard = if let Some(follower_id) = &shard.follower_id {
            let leader_id: NodeId = shard.leader_id.clone().into();
            let follower_id: NodeId = follower_id.clone().into();

            let replication_client = self
                .init_replication_stream(
                    &mut state.replication_streams,
                    leader_id,
                    follower_id.clone(),
                )
                .await?;

            if let Err(error) = replication_client.init_replica(shard).await {
                // TODO: Remove dangling queue from the WAL.
                error!("failed to initialize replica shard: {error}");
                let message = format!("failed to initialize replica shard: {error}");
                return Err(IngestV2Error::Internal(message));
            }
            IngesterShard::new_primary(index_uid, source_id, shard_id, follower_id)
                .with_rate_limiter(rate_limiter)
                .with_rate_meter(rate_meter)
                .with_doc_mapper(doc_mapper)
                .with_validate_docs(validate_docs)
                .with_last_write(now)
                .build()
        } else {
            IngesterShard::new_solo(index_uid, source_id, shard_id)
                .with_rate_limiter(rate_limiter)
                .with_rate_meter(rate_meter)
                .with_doc_mapper(doc_mapper)
                .with_validate_docs(validate_docs)
                .with_last_write(now)
                .build()
        };
        entry.insert(primary_shard);
        Ok(())
    }

    /// Resets the local shards in a separate background task.
    fn background_reset_shards(&self) {
        let mut ingester = self.clone();

        let future = async move {
            ingester.reset_shards().await;
        };
        tokio::spawn(future);
    }

    /// Resets the local shards at most once by minute by querying the control plane for the shards
    /// that should be deleted or truncated and then performing the requested operations.
    ///
    /// This operation should be triggered very rarely when the ingester has not been able to delete
    /// or truncate its shards by other means (RPCs from indexers, gossip, etc.).
    async fn reset_shards(&mut self) {
        let Ok(_permit) = self.reset_shards_permits.try_acquire() else {
            return;
        };
        self.state.wait_for_ready().await;

        info!("resetting shards");
        let now = Instant::now();

        let mut per_source_shard_ids: HashMap<(IndexUid, SourceId), Vec<ShardId>> = HashMap::new();

        let state_guard = with_lock_metrics!(self.state.lock_fully().await, "reset_shards", "read")
            .expect("ingester should be ready");

        for queue_id in state_guard.mrecordlog.list_queues() {
            let Some((index_uid, source_id, shard_id)) = split_queue_id(queue_id) else {
                // `split_queue_id` already logs an error.
                continue;
            };
            per_source_shard_ids
                .entry((index_uid, source_id))
                .or_default()
                .push(shard_id);
        }
        drop(state_guard);

        let shard_ids = per_source_shard_ids
            .into_iter()
            .map(|((index_uid, source_id), shard_ids)| ShardIds {
                index_uid: Some(index_uid),
                source_id,
                shard_ids,
            })
            .collect();

        let advise_reset_shards_request = AdviseResetShardsRequest {
            ingester_id: self.self_node_id.to_string(),
            shard_ids,
        };
        let advise_reset_shards_future = self
            .control_plane
            .advise_reset_shards(advise_reset_shards_request);
        let advise_reset_shards_result =
            timeout(Duration::from_secs(30), advise_reset_shards_future).await;

        match advise_reset_shards_result {
            Ok(Ok(advise_reset_shards_response)) => {
                let mut state_guard =
                    with_lock_metrics!(self.state.lock_fully().await, "reset_shards", "write")
                        .expect("ingester should be ready");

                state_guard
                    .reset_shards(&advise_reset_shards_response)
                    .await;

                info!(
                    "deleted {} and truncated {} shard(s) in {}",
                    advise_reset_shards_response.shards_to_delete.len(),
                    advise_reset_shards_response.shards_to_truncate.len(),
                    now.elapsed().pretty_display()
                );
                INGEST_V2_METRICS
                    .reset_shards_operations_total
                    .with_label_values(["success"])
                    .inc();

                let wal_usage = state_guard.mrecordlog.resource_usage();
                report_wal_usage(wal_usage);
            }
            Ok(Err(error)) => {
                warn!("advise reset shards request failed: {error}");

                INGEST_V2_METRICS
                    .reset_shards_operations_total
                    .with_label_values(["error"])
                    .inc();
            }
            Err(_) => {
                warn!("advise reset shards request timed out");

                INGEST_V2_METRICS
                    .reset_shards_operations_total
                    .with_label_values(["timeout"])
                    .inc();
            }
        };
        // We still hold the permit while sleeping so we effectively rate limit the reset shards
        // operation to once per [`MIN_RESET_SHARDS_INTERVAL`].
        if let Some(sleep_for) = MIN_RESET_SHARDS_INTERVAL.checked_sub(now.elapsed()) {
            sleep(sleep_for).await;
        }
    }

    async fn init_replication_stream(
        &self,
        replication_streams: &mut HashMap<FollowerId, ReplicationStreamTaskHandle>,
        leader_id: NodeId,
        follower_id: NodeId,
    ) -> IngestV2Result<ReplicationClient> {
        let entry = match replication_streams.entry(follower_id.clone()) {
            Entry::Occupied(entry) => {
                // A replication stream with this follower is already opened.
                return Ok(entry.get().replication_client());
            }
            Entry::Vacant(entry) => entry,
        };
        let open_request = OpenReplicationStreamRequest {
            leader_id: leader_id.clone().into(),
            follower_id: follower_id.clone().into(),
            replication_seqno: 0,
        };
        let open_message = SynReplicationMessage::new_open_request(open_request);
        let (syn_replication_stream_tx, syn_replication_stream) =
            ServiceStream::new_bounded(SYN_REPLICATION_STREAM_CAPACITY);
        syn_replication_stream_tx
            .try_send(open_message)
            .expect("channel should be open and have capacity");

        let ingester = self.ingester_pool.get(&follower_id).ok_or_else(|| {
            let message = format!("ingester `{follower_id}` is unavailable");
            IngestV2Error::Unavailable(message)
        })?;
        let mut ack_replication_stream = ingester
            .client
            .open_replication_stream(syn_replication_stream)
            .await?;
        ack_replication_stream
            .next()
            .await
            .expect("TODO")
            .expect("TODO")
            .into_open_response()
            .expect("first message should be an open response");

        let replication_stream_task_handle = ReplicationStreamTask::spawn(
            leader_id.clone(),
            follower_id.clone(),
            syn_replication_stream_tx,
            ack_replication_stream,
        );
        let replication_client = replication_stream_task_handle.replication_client();
        entry.insert(replication_stream_task_handle);
        Ok(replication_client)
    }

    pub fn subscribe(&self, event_broker: &EventBroker) {
        let weak_ingester_state = self.state.weak();
        // This subscription is the one in charge of truncating the mrecordlog.
        info!("subscribing ingester to shard positions updates");
        event_broker
            .subscribe_without_timeout::<ShardPositionsUpdate>(weak_ingester_state)
            .forever();
    }

    async fn persist_inner(
        &self,
        persist_request: PersistRequest,
    ) -> IngestV2Result<PersistResponse> {
        if persist_request.leader_id != self.self_node_id {
            return Err(IngestV2Error::Internal(format!(
                "routing error: expected leader ID `{}`, got `{}`",
                self.self_node_id, persist_request.leader_id,
            )));
        }
        let mut persist_successes = Vec::with_capacity(persist_request.subrequests.len());
        let mut persist_failures = Vec::new();
        let mut per_follower_replicate_subrequests: HashMap<NodeId, Vec<ReplicateSubrequest>> =
            HashMap::new();
        let mut pending_persist_subrequests: HashMap<SubrequestId, PendingPersistSubrequest> =
            HashMap::with_capacity(persist_request.subrequests.len());

        // Keep track of the shards that need to be closed following an IO error.
        let mut shards_to_close: HashSet<QueueId> = HashSet::new();

        // Keep track of dangling shards, i.e., shards for which there is no longer a corresponding
        // queue in the WAL and should be deleted.
        let mut shards_to_delete: HashSet<QueueId> = HashSet::new();

        let commit_type = persist_request.commit_type();
        let force_commit = commit_type == CommitTypeV2::Force;

        let mut state_guard =
            with_lock_metrics!(self.state.lock_fully().await, "persist", "write")?;
        let status = state_guard.status();

        if !status.accepts_write_requests() {
            persist_failures.reserve_exact(persist_request.subrequests.len());

            for subrequest in persist_request.subrequests {
                let persist_failure = PersistFailure {
                    subrequest_id: subrequest.subrequest_id,
                    index_uid: subrequest.index_uid,
                    source_id: subrequest.source_id,
                    reason: PersistFailureReason::NodeUnavailable as i32,
                };
                persist_failures.push(persist_failure);
            }
            let persist_response = PersistResponse {
                leader_id: persist_request.leader_id,
                successes: Vec::new(),
                failures: persist_failures,
                routing_update: None,
            };
            return Ok(persist_response);
        }
        // first verify if we would locally accept each subrequest
        {
            let mut total_requested_capacity = ByteSize::b(0);

            for subrequest in persist_request.subrequests {
                let Some(shard) = state_guard
                    .inner
                    .find_most_capacity_shard_mut(subrequest.index_uid(), &subrequest.source_id)
                else {
                    warn!(
                        index_uid=%subrequest.index_uid(),
                        source_id=%subrequest.source_id,
                        "no open shard found on ingester"
                    );
                    let persist_failure = PersistFailure {
                        subrequest_id: subrequest.subrequest_id,
                        index_uid: subrequest.index_uid,
                        source_id: subrequest.source_id,
                        reason: PersistFailureReason::NoShardsAvailable as i32,
                    };
                    persist_failures.push(persist_failure);
                    continue;
                };
                let shard_id = shard.shard_id.clone();

                // A router can only know about a newly opened shard if it has been informed by the
                // control plane, which confirms that the shard was correctly opened in the
                // metastore.
                shard.is_advertisable = true;
                let doc_mapper = shard.doc_mapper_opt.clone().expect("shard should be open");
                let validate_docs = shard.validate_docs;
                let follower_id_opt = shard.follower_id_opt().cloned();
                let from_position_exclusive = shard.replication_position_inclusive.clone();

                let doc_batch = match subrequest.doc_batch {
                    Some(doc_batch) if !doc_batch.is_empty() => doc_batch,
                    _ => {
                        warn!("received empty persist request");
                        DocBatchV2::default()
                    }
                };
                let requested_capacity = estimate_size(&doc_batch);

                if let Err(error) = check_enough_capacity(
                    &state_guard.mrecordlog,
                    self.disk_capacity,
                    self.memory_capacity,
                    requested_capacity + total_requested_capacity,
                ) {
                    rate_limited_warn!(
                        limit_per_min = 10,
                        "failed to persist records to ingester `{}`: {error}",
                        self.self_node_id
                    );
                    let persist_failure = PersistFailure {
                        subrequest_id: subrequest.subrequest_id,
                        index_uid: subrequest.index_uid,
                        source_id: subrequest.source_id,
                        reason: PersistFailureReason::WalFull as i32,
                    };
                    persist_failures.push(persist_failure);
                    continue;
                };
                // Because we return the shard with the most available capacity, if this hits, it
                // means that no shard can receive this request, and it should be retried.
                if !shard.rate_limiter.acquire_bytes(requested_capacity) {
                    debug!(
                        "failed to persist records to shard `{}`: rate limited",
                        shard.queue_id()
                    );

                    let persist_failure = PersistFailure {
                        subrequest_id: subrequest.subrequest_id,
                        index_uid: subrequest.index_uid,
                        source_id: subrequest.source_id,
                        reason: PersistFailureReason::NoShardsAvailable as i32,
                    };
                    persist_failures.push(persist_failure);
                    continue;
                }

                // Total number of bytes (valid and invalid documents)
                let original_batch_num_bytes = doc_batch.num_bytes() as u64;

                let (valid_doc_batch, parse_failures) = if validate_docs {
                    validate_doc_batch(doc_batch, doc_mapper).await?
                } else {
                    (doc_batch, Vec::new())
                };

                if valid_doc_batch.is_empty() {
                    crate::metrics::INGEST_METRICS
                        .ingested_docs_invalid
                        .inc_by(parse_failures.len() as u64);
                    crate::metrics::INGEST_METRICS
                        .ingested_docs_bytes_invalid
                        .inc_by(original_batch_num_bytes);
                    let persist_success = PersistSuccess {
                        subrequest_id: subrequest.subrequest_id,
                        index_uid: subrequest.index_uid,
                        source_id: subrequest.source_id,
                        shard_id: Some(shard_id),
                        replication_position_inclusive: Some(from_position_exclusive),
                        num_persisted_docs: 0,
                        parse_failures,
                    };
                    persist_successes.push(persist_success);
                    continue;
                };

                crate::metrics::INGEST_METRICS
                    .ingested_docs_valid
                    .inc_by(valid_doc_batch.num_docs() as u64);
                crate::metrics::INGEST_METRICS
                    .ingested_docs_bytes_valid
                    .inc_by(valid_doc_batch.num_bytes() as u64);
                if !parse_failures.is_empty() {
                    crate::metrics::INGEST_METRICS
                        .ingested_docs_invalid
                        .inc_by(parse_failures.len() as u64);
                    crate::metrics::INGEST_METRICS
                        .ingested_docs_bytes_invalid
                        .inc_by(original_batch_num_bytes - valid_doc_batch.num_bytes() as u64);
                }
                let valid_batch_num_bytes = valid_doc_batch.num_bytes() as u64;
                shard.rate_meter.update(valid_batch_num_bytes);
                total_requested_capacity += requested_capacity;

                let mut successfully_replicated = true;

                if let Some(follower_id) = follower_id_opt {
                    successfully_replicated = false;

                    let replicate_subrequest = ReplicateSubrequest {
                        subrequest_id: subrequest.subrequest_id,
                        index_uid: subrequest.index_uid.clone(),
                        source_id: subrequest.source_id.clone(),
                        shard_id: Some(shard_id.clone()),
                        from_position_exclusive: Some(from_position_exclusive),
                        doc_batch: Some(valid_doc_batch.clone()),
                    };
                    per_follower_replicate_subrequests
                        .entry(follower_id)
                        .or_default()
                        .push(replicate_subrequest);
                }
                let pending_persist_subrequest = PendingPersistSubrequest {
                    queue_id: shard.queue_id(),
                    subrequest_id: subrequest.subrequest_id,
                    index_uid: subrequest.index_uid,
                    source_id: subrequest.source_id,
                    shard_id: Some(shard_id),
                    doc_batch: valid_doc_batch,
                    parse_failures,
                    expected_position_inclusive: None,
                    successfully_replicated,
                };
                pending_persist_subrequests.insert(
                    pending_persist_subrequest.subrequest_id,
                    pending_persist_subrequest,
                );
            }
        }
        // replicate to the follower
        {
            let mut replicate_futures = FuturesUnordered::new();

            for (follower_id, replicate_subrequests) in per_follower_replicate_subrequests {
                let replication_client = state_guard
                    .replication_streams
                    .get(&follower_id)
                    .expect("replication stream should be initialized")
                    .replication_client();
                let leader_id = self.self_node_id.clone();

                let replicate_future = replication_client.replicate(
                    leader_id,
                    follower_id,
                    replicate_subrequests,
                    commit_type,
                );
                replicate_futures.push(replicate_future);
            }
            while let Some(replication_result) = replicate_futures.next().await {
                let replicate_response = match replication_result {
                    Ok(replicate_response) => replicate_response,
                    Err(_) => {
                        // TODO: Handle replication error:
                        // 1. Close and evict all the shards hosted by the follower.
                        // 2. Close and evict the replication client.
                        // 3. Return `PersistFailureReason::NodeUnavailable` to router.
                        continue;
                    }
                };
                for replicate_success in replicate_response.successes {
                    let pending_persist_subrequest = pending_persist_subrequests
                        .get_mut(&replicate_success.subrequest_id)
                        .expect("persist subrequest should exist");

                    pending_persist_subrequest.successfully_replicated = true;
                    pending_persist_subrequest.expected_position_inclusive =
                        replicate_success.replication_position_inclusive;
                }
                for replicate_failure in replicate_response.failures {
                    // TODO: If the replica shard is closed, close the primary shard if it is not
                    // already.
                    let persist_failure_reason: PersistFailureReason =
                        replicate_failure.reason().into();
                    let persist_failure = PersistFailure {
                        subrequest_id: replicate_failure.subrequest_id,
                        index_uid: replicate_failure.index_uid,
                        source_id: replicate_failure.source_id,
                        reason: persist_failure_reason as i32,
                    };
                    persist_failures.push(persist_failure);
                }
            }
        }
        // finally write locally
        {
            let now = Instant::now();
            for subrequest in pending_persist_subrequests.into_values() {
                if !subrequest.successfully_replicated {
                    continue;
                }
                let queue_id = subrequest.queue_id;

                let batch_num_docs = subrequest.doc_batch.num_docs() as u64;

                let append_result = append_non_empty_doc_batch(
                    &mut state_guard.mrecordlog,
                    &queue_id,
                    subrequest.doc_batch,
                    force_commit,
                )
                .await;

                let current_position_inclusive = match append_result {
                    Ok(current_position_inclusive) => current_position_inclusive,
                    Err(append_error) => {
                        let reason = match &append_error {
                            AppendDocBatchError::Io(io_error) => {
                                error!(
                                    "failed to persist records to shard `{queue_id}`: {io_error}"
                                );
                                shards_to_close.insert(queue_id);
                                PersistFailureReason::NodeUnavailable
                            }
                            AppendDocBatchError::QueueNotFound(_) => {
                                error!(
                                    "failed to persist records to shard `{queue_id}`: WAL queue \
                                     not found"
                                );
                                shards_to_delete.insert(queue_id);
                                PersistFailureReason::NodeUnavailable
                            }
                        };
                        let persist_failure = PersistFailure {
                            subrequest_id: subrequest.subrequest_id,
                            index_uid: subrequest.index_uid,
                            source_id: subrequest.source_id,
                            reason: reason as i32,
                        };
                        persist_failures.push(persist_failure);
                        continue;
                    }
                };

                if let Some(expected_position_inclusive) = subrequest.expected_position_inclusive
                    && expected_position_inclusive != current_position_inclusive
                {
                    return Err(IngestV2Error::Internal(format!(
                        "bad replica position: expected {expected_position_inclusive:?}, got \
                         {current_position_inclusive:?}"
                    )));
                }
                state_guard
                    .shards
                    .get_mut(&queue_id)
                    .expect("primary shard should exist")
                    .set_replication_position_inclusive(current_position_inclusive.clone(), now);

                let persist_success = PersistSuccess {
                    subrequest_id: subrequest.subrequest_id,
                    index_uid: subrequest.index_uid,
                    source_id: subrequest.source_id,
                    shard_id: subrequest.shard_id,
                    replication_position_inclusive: Some(current_position_inclusive),
                    num_persisted_docs: batch_num_docs as u32,
                    parse_failures: subrequest.parse_failures,
                };
                persist_successes.push(persist_success);
            }
        }
        if !shards_to_close.is_empty() {
            for queue_id in &shards_to_close {
                let shard = state_guard
                    .shards
                    .get_mut(queue_id)
                    .expect("shard should exist");

                shard.close();
                warn!("closed shard `{queue_id}` following IO error");
            }
        }
        if !shards_to_delete.is_empty() {
            for queue_id in &shards_to_delete {
                state_guard.shards.remove(queue_id);
                warn!("deleted dangling shard `{queue_id}`");
            }
        }
        let wal_usage = state_guard.mrecordlog.resource_usage();
        let disk_used = wal_usage.disk_used_bytes as u64;
        let memory_used = wal_usage.memory_used_bytes as u64;
        let (open_shard_counts, closed_shards) = state_guard.get_shard_snapshot();
        let capacity_score = state_guard
            .wal_capacity_tracker
            .score(ByteSize::b(disk_used), ByteSize::b(memory_used))
            as u32;
        drop(state_guard);

        if disk_used >= self.disk_capacity.as_u64() * 90 / 100 {
            self.background_reset_shards();
        }
        report_wal_usage(wal_usage);

        let source_shard_updates = open_shard_counts
            .into_iter()
            .map(|(index_uid, source_id, count)| SourceShardUpdate {
                index_uid: Some(index_uid),
                source_id,
                open_shard_count: count as u32,
            })
            .collect();

        let routing_update = RoutingUpdate {
            capacity_score,
            source_shard_updates,
            closed_shards,
        };

        #[cfg(test)]
        {
            persist_successes.sort_by_key(|success| success.subrequest_id);
            persist_failures.sort_by_key(|failure| failure.subrequest_id);
        }
        let leader_id = self.self_node_id.to_string();
        let persist_response = PersistResponse {
            leader_id,
            successes: persist_successes,
            failures: persist_failures,
            routing_update: Some(routing_update),
        };
        Ok(persist_response)
    }

    /// Opens a replication stream, which is a bi-directional gRPC stream. The client-side stream
    async fn open_replication_stream_inner(
        &self,
        mut syn_replication_stream: quickwit_common::ServiceStream<SynReplicationMessage>,
    ) -> IngestV2Result<IngesterServiceStream<AckReplicationMessage>> {
        let open_replication_stream_request = syn_replication_stream
            .next()
            .await
            .ok_or_else(|| IngestV2Error::Internal("syn replication stream aborted".to_string()))?
            .into_open_request()
            .expect("first message should be an open replication stream request");

        if open_replication_stream_request.follower_id != self.self_node_id {
            return Err(IngestV2Error::Internal("routing error".to_string()));
        }
        let leader_id: NodeId = open_replication_stream_request.leader_id.into();
        let follower_id: NodeId = open_replication_stream_request.follower_id.into();

        let mut state_guard = self.state.lock_partially().await?;
        let status = state_guard.status();

        if !status.accepts_write_requests() {
            let error = IngestV2Error::Unavailable(format!(
                "ingester {follower_id} is not ready: {status}",
            ));
            return Err(error);
        }
        let Entry::Vacant(entry) = state_guard.replication_tasks.entry(leader_id.clone()) else {
            return Err(IngestV2Error::Internal(format!(
                "a replication stream between {leader_id} and {follower_id} is already opened"
            )));
        };
        // Channel capacity: there is no need to bound the capacity of the channel here because it
        // is already virtually bounded by the capacity of the SYN replication stream.
        let (ack_replication_stream_tx, ack_replication_stream) = ServiceStream::new_unbounded();
        let open_response = OpenReplicationStreamResponse {
            replication_seqno: 0,
        };
        let ack_replication_message = AckReplicationMessage::new_open_response(open_response);
        ack_replication_stream_tx
            .send(Ok(ack_replication_message))
            .expect("channel should be open");

        let replication_task_handle = ReplicationTask::spawn(
            leader_id,
            follower_id,
            self.state.clone(),
            syn_replication_stream,
            ack_replication_stream_tx,
            self.disk_capacity,
            self.memory_capacity,
        );
        entry.insert(replication_task_handle);
        Ok(ack_replication_stream)
    }

    async fn open_fetch_stream_inner(
        &self,
        open_fetch_stream_request: OpenFetchStreamRequest,
    ) -> IngestV2Result<ServiceStream<IngestV2Result<FetchMessage>>> {
        let queue_id = open_fetch_stream_request.queue_id();

        let mut state_guard = self.state.lock_partially().await?;

        let shard = state_guard.shards.get_mut(&queue_id).ok_or_else(|| {
            rate_limited_error!(limit_per_min=6, queue_id=%queue_id, "shard not found");
            IngestV2Error::ShardNotFound {
                shard_id: open_fetch_stream_request.shard_id().clone(),
            }
        })?;
        // An indexer can only know about a newly opened shard if it has been scheduled by the
        // control plane, which confirms that the shard was correctly opened in the
        // metastore.
        shard.is_advertisable = true;

        let shard_status_rx = shard.shard_status_rx.clone();
        let mrecordlog = self.state.mrecordlog();
        let (service_stream, _fetch_task_handle) = FetchStreamTask::spawn(
            open_fetch_stream_request,
            mrecordlog,
            shard_status_rx,
            get_batch_num_bytes(),
        );
        Ok(service_stream)
    }

    async fn open_observation_stream_inner(
        &self,
        _open_observation_stream_request: OpenObservationStreamRequest,
    ) -> IngestV2Result<IngesterServiceStream<ObservationMessage>> {
        let status_stream = ServiceStream::from(self.state.status_rx.clone());
        let self_node_id = self.self_node_id.clone();
        let observation_stream = status_stream.map(move |status| {
            let observation_message = ObservationMessage {
                node_id: self_node_id.clone().into(),
                status: status as i32,
            };
            Ok(observation_message)
        });
        Ok(observation_stream)
    }

    async fn init_shards_inner(
        &self,
        init_shards_request: InitShardsRequest,
    ) -> IngestV2Result<InitShardsResponse> {
        let mut state_guard =
            with_lock_metrics!(self.state.lock_fully().await, "init_shards", "write")?;
        let status = state_guard.status();

        if !status.accepts_write_requests() {
            let error = IngestV2Error::Unavailable(format!(
                "ingester {} is not ready: {status}",
                self.self_node_id
            ));
            return Err(error);
        }
        let mut successes = Vec::with_capacity(init_shards_request.subrequests.len());
        let mut failures = Vec::new();
        let now = Instant::now();

        for subrequest in init_shards_request.subrequests {
            let init_primary_shard_result = self
                .init_primary_shard(
                    &mut state_guard.inner,
                    &mut state_guard.mrecordlog,
                    subrequest.shard().clone(),
                    &subrequest.doc_mapping_json,
                    now,
                    subrequest.validate_docs,
                )
                .await;
            if init_primary_shard_result.is_ok() {
                let success = InitShardSuccess {
                    subrequest_id: subrequest.subrequest_id,
                    shard: subrequest.shard,
                };
                successes.push(success);
            } else {
                let shard = subrequest.shard();
                let failure = InitShardFailure {
                    subrequest_id: subrequest.subrequest_id,
                    index_uid: shard.index_uid.clone(),
                    source_id: shard.source_id.clone(),
                    shard_id: shard.shard_id.clone(),
                };
                failures.push(failure);
            }
        }
        let response = InitShardsResponse {
            successes,
            failures,
        };
        Ok(response)
    }

    async fn truncate_shards_inner(
        &self,
        truncate_shards_request: TruncateShardsRequest,
    ) -> IngestV2Result<TruncateShardsResponse> {
        if truncate_shards_request.ingester_id != self.self_node_id {
            return Err(IngestV2Error::Internal(format!(
                "routing error: expected ingester `{}`, got `{}`",
                self.self_node_id, truncate_shards_request.ingester_id,
            )));
        }
        let mut state_guard =
            with_lock_metrics!(self.state.lock_fully().await, "truncate_shards", "write")?;

        for subrequest in truncate_shards_request.subrequests {
            let queue_id = subrequest.queue_id();
            let truncate_up_to_position_inclusive = subrequest.truncate_up_to_position_inclusive();

            if truncate_up_to_position_inclusive.is_eof() {
                state_guard.delete_shard(&queue_id, "indexer-rpc").await;
            } else {
                state_guard
                    .truncate_shard(&queue_id, truncate_up_to_position_inclusive, "indexer-rpc")
                    .await;
            }
        }
        let wal_usage = state_guard.mrecordlog.resource_usage();
        report_wal_usage(wal_usage);

        self.check_decommissioning_status(&mut state_guard).await;
        let truncate_response = TruncateShardsResponse {};
        Ok(truncate_response)
    }

    async fn close_shards_inner(
        &self,
        close_shards_request: CloseShardsRequest,
    ) -> IngestV2Result<CloseShardsResponse> {
        let mut state_guard =
            with_lock_metrics!(self.state.lock_partially().await, "close_shards", "write")?;

        let mut successes = Vec::with_capacity(close_shards_request.shard_pkeys.len());

        for shard_pkey in close_shards_request.shard_pkeys {
            let queue_id = shard_pkey.queue_id();

            if let Some(shard) = state_guard.shards.get_mut(&queue_id) {
                shard.close();
                successes.push(shard_pkey);
            }
        }
        info!("closed {} shards", successes.len());
        let response = CloseShardsResponse { successes };
        Ok(response)
    }

    pub async fn debug_info(&self) -> JsonValue {
        let state_guard = match self.state.lock_fully().await {
            Ok(state_guard) => state_guard,
            Err(_) => {
                return json!({
                    "status": "initializing",
                    "shards": {},
                    "mrecordlog": {},
                });
            }
        };
        let mut per_index_shards_json: BTreeMap<IndexUid, Vec<JsonValue>> = BTreeMap::new();

        for (queue_id, shard) in &state_guard.shards {
            let Some((index_uid, source_id, shard_id)) = split_queue_id(queue_id) else {
                // `split_queue_id` already logs an error.
                continue;
            };
            let mut shard_json = json!({
                "index_uid": index_uid,
                "source_id": source_id,
                "shard_id": shard_id,
                "state": shard.shard_state.as_json_str_name(),
                "replication_position_inclusive": shard.replication_position_inclusive,
                "truncation_position_inclusive": shard.truncation_position_inclusive,
            });
            match &shard.shard_type {
                IngesterShardType::Primary { follower_id, .. } => {
                    shard_json["type"] = json!("primary");
                    shard_json["leader_id"] = json!(self.self_node_id.to_string());
                    shard_json["follower_id"] = json!(follower_id.to_string());
                }
                IngesterShardType::Replica { leader_id } => {
                    shard_json["type"] = json!("replica");
                    shard_json["leader_id"] = json!(leader_id.to_string());
                    shard_json["follower_id"] = json!(self.self_node_id.to_string());
                }
                IngesterShardType::Solo => {
                    shard_json["type"] = json!("solo");
                    shard_json["leader_id"] = json!(self.self_node_id.to_string());
                }
            };
            per_index_shards_json
                .entry(index_uid.clone())
                .or_default()
                .push(shard_json);
        }
        json!({
            "status": state_guard.status().as_json_str_name(),
            "shards": per_index_shards_json,
            "mrecordlog":  state_guard.mrecordlog.summary(),
        })
    }
}

#[async_trait]
impl IngesterService for Ingester {
    async fn persist(&self, persist_request: PersistRequest) -> IngestV2Result<PersistResponse> {
        // If the request is local, the amount of memory it occupies is already
        // accounted for in the router.
        let request_size_bytes = persist_request
            .subrequests
            .iter()
            .flat_map(|subrequest| match &subrequest.doc_batch {
                Some(doc_batch) if doc_batch.doc_buffer.is_unique() => Some(doc_batch.num_bytes()),
                _ => None,
            })
            .sum::<usize>();
        let mut gauge_guard = GaugeGuard::from_gauge(&MEMORY_METRICS.in_flight.ingester_persist);
        gauge_guard.add(request_size_bytes as i64);

        self.persist_inner(persist_request).await
    }

    async fn open_replication_stream(
        &self,
        syn_replication_stream: quickwit_common::ServiceStream<SynReplicationMessage>,
    ) -> IngestV2Result<IngesterServiceStream<AckReplicationMessage>> {
        self.open_replication_stream_inner(syn_replication_stream)
            .await
    }

    async fn open_fetch_stream(
        &self,
        open_fetch_stream_request: OpenFetchStreamRequest,
    ) -> IngestV2Result<ServiceStream<IngestV2Result<FetchMessage>>> {
        self.open_fetch_stream_inner(open_fetch_stream_request)
            .await
    }

    async fn open_observation_stream(
        &self,
        open_observation_stream_request: OpenObservationStreamRequest,
    ) -> IngestV2Result<IngesterServiceStream<ObservationMessage>> {
        self.open_observation_stream_inner(open_observation_stream_request)
            .await
    }

    async fn init_shards(
        &self,
        init_shards_request: InitShardsRequest,
    ) -> IngestV2Result<InitShardsResponse> {
        self.init_shards_inner(init_shards_request).await
    }

    async fn retain_shards(
        &self,
        request: RetainShardsRequest,
    ) -> IngestV2Result<RetainShardsResponse> {
        let retain_queue_ids: HashSet<QueueId> = request
            .retain_shards_for_sources
            .into_iter()
            .flat_map(|retain_shards_for_source: RetainShardsForSource| {
                let index_uid = retain_shards_for_source.index_uid().clone();
                retain_shards_for_source
                    .shard_ids
                    .into_iter()
                    .map(move |shard_id| {
                        queue_id(&index_uid, &retain_shards_for_source.source_id, &shard_id)
                    })
            })
            .collect();
        let mut state_guard =
            with_lock_metrics!(self.state.lock_fully(), "retain_shards", "write").await?;
        let remove_queue_ids: HashSet<QueueId> = state_guard
            .shards
            .keys()
            .filter(move |shard_id| !retain_queue_ids.contains(*shard_id))
            .map(ToString::to_string)
            .collect();
        info!(queues=?remove_queue_ids, "removing queues");
        for queue_id in remove_queue_ids {
            state_guard
                .delete_shard(&queue_id, "control-plane-retain-shards-rpc")
                .await;
        }
        self.check_decommissioning_status(&mut state_guard).await;
        Ok(RetainShardsResponse {})
    }

    async fn truncate_shards(
        &self,
        truncate_shards_request: TruncateShardsRequest,
    ) -> IngestV2Result<TruncateShardsResponse> {
        self.truncate_shards_inner(truncate_shards_request).await
    }

    async fn close_shards(
        &self,
        close_shards_request: CloseShardsRequest,
    ) -> IngestV2Result<CloseShardsResponse> {
        self.close_shards_inner(close_shards_request).await
    }

    async fn decommission(
        &self,
        _decommission_request: DecommissionRequest,
    ) -> IngestV2Result<DecommissionResponse> {
        // Retire the ingester immediately by setting its status to `Retiring`.
        info!("retiring ingester");
        let mut state_guard = self.state.lock_partially().await?;
        state_guard.set_status(IngesterStatus::Retiring).await;
        drop(state_guard); // Dropping explicitly for readability.

        // Drain write requests by scheduling the decommissioning of the ingester after a delay
        // allowing the propagation of the `Retiring` status to other nodes.
        let self_clone = self.clone();
        tokio::spawn(async move {
            const DECOMMISSION_DELAY: Duration = if cfg!(any(test, feature = "testsuite")) {
                Duration::from_millis(100)
            } else {
                // Having to wait for 10s is not great but we can live with it. During this time, we
                // still make progress towards decommissioning because we gradually receive less
                // write requests and indexing is still ongoing. However, it sets a floor on the
                // amount of time with which we can fully decommission an ingester. This will be
                // most noticeable when using Quickwit locally.
                Duration::from_secs(10)
            };
            tokio::time::sleep(DECOMMISSION_DELAY).await;

            info!("decommissioning ingester");
            let mut state_guard = match self_clone.state.lock_partially().await {
                Ok(state_guard) => state_guard,
                Err(error) => {
                    error!(%error, "failed to decommission ingester");
                    return;
                }
            };
            state_guard
                .set_status(IngesterStatus::Decommissioning)
                .await;

            for shard in state_guard.shards.values_mut() {
                shard.close();
            }
            self_clone
                .check_decommissioning_status(&mut state_guard)
                .await;
        });
        Ok(DecommissionResponse {})
    }
}

#[async_trait]
impl EventSubscriber<ShardPositionsUpdate> for WeakIngesterState {
    async fn handle_event(&mut self, shard_positions_update: ShardPositionsUpdate) {
        let Some(state) = self.upgrade() else {
            warn!("ingester state update failed");
            return;
        };
        let Ok(mut state_guard) =
            with_lock_metrics!(state.lock_fully().await, "gc_shards", "write")
        else {
            error!("failed to lock the ingester state");
            return;
        };
        let index_uid = shard_positions_update.source_uid.index_uid;
        let source_id = shard_positions_update.source_uid.source_id;

        for (shard_id, shard_position) in shard_positions_update.updated_shard_positions {
            let queue_id = queue_id(&index_uid, &source_id, &shard_id);
            if shard_position.is_eof() {
                state_guard.delete_shard(&queue_id, "indexer-gossip").await;
            } else if !shard_position.is_beginning() {
                state_guard
                    .truncate_shard(&queue_id, shard_position, "indexer-gossip")
                    .await;
            }
        }
    }
}

struct PendingPersistSubrequest {
    queue_id: QueueId,
    subrequest_id: u32,
    index_uid: Option<IndexUid>,
    source_id: SourceId,
    shard_id: Option<ShardId>,
    doc_batch: DocBatchV2,
    parse_failures: Vec<ParseFailure>,
    expected_position_inclusive: Option<Position>,
    successfully_replicated: bool,
}

#[cfg(test)]
mod tests {
    #![allow(clippy::mutable_key_type)]

    use std::collections::HashSet;
    use std::net::SocketAddr;
    use std::sync::atomic::{AtomicU16, Ordering};

    use bytes::Bytes;
    use quickwit_cluster::{ChannelTransport, create_cluster_for_test_with_id};
    use quickwit_common::shared_consts::INGESTER_PRIMARY_SHARDS_PREFIX;
    use quickwit_common::tower::ConstantRate;
    use quickwit_config::service::QuickwitService;
    use quickwit_proto::control_plane::{AdviseResetShardsResponse, MockControlPlaneService};
    use quickwit_proto::ingest::ingester::{
        IngesterServiceClient, IngesterServiceGrpcServer, IngesterServiceGrpcServerAdapter,
        IngesterStatus, InitShardSubrequest, PersistSubrequest, TruncateShardsSubrequest,
    };
    use quickwit_proto::ingest::{
        DocBatchV2, ParseFailureReason, ShardIdPosition, ShardIdPositions, ShardIds, ShardPKey,
        ShardState,
    };
    use quickwit_proto::types::{DocMappingUid, DocUid, ShardId, SourceUid, queue_id};
    use tokio::task::yield_now;
    use tokio::time::timeout;
    use tonic::transport::{Endpoint, Server};

    use super::*;
    use crate::ingest_v2::DEFAULT_IDLE_SHARD_TIMEOUT;
    use crate::ingest_v2::broadcast::ShardInfos;
    use crate::ingest_v2::doc_mapper::try_build_doc_mapper;
    use crate::ingest_v2::fetch::tests::{into_fetch_eof, into_fetch_payload};
    use crate::ingest_v2::helpers::wait_for_ingester_status;
    use crate::{IngesterPoolEntry, MRecord};

    const MAX_GRPC_MESSAGE_SIZE: ByteSize = ByteSize::mib(1);

    pub(super) struct IngesterForTest {
        node_id: NodeId,
        control_plane: ControlPlaneServiceClient,
        ingester_pool: IngesterPool,
        disk_capacity: ByteSize,
        memory_capacity: ByteSize,
        rate_limiter_settings: RateLimiterSettings,
        replication_factor: usize,
        idle_shard_timeout: Duration,
    }

    impl Default for IngesterForTest {
        fn default() -> Self {
            let mut mock_control_plane = MockControlPlaneService::new();
            mock_control_plane
                .expect_advise_reset_shards()
                .returning(|_| Ok(AdviseResetShardsResponse::default()));
            let control_plane = ControlPlaneServiceClient::from_mock(mock_control_plane);

            Self {
                node_id: "test-ingester".into(),
                control_plane,
                ingester_pool: IngesterPool::default(),
                disk_capacity: ByteSize::mb(256),
                memory_capacity: ByteSize::mb(1),
                rate_limiter_settings: RateLimiterSettings::default(),
                replication_factor: 1,
                idle_shard_timeout: DEFAULT_IDLE_SHARD_TIMEOUT,
            }
        }
    }

    impl IngesterForTest {
        pub fn with_node_id(mut self, node_id: &str) -> Self {
            self.node_id = node_id.into();
            self
        }

        pub fn with_control_plane(mut self, control_plane: ControlPlaneServiceClient) -> Self {
            self.control_plane = control_plane;
            self
        }

        pub fn with_ingester_pool(mut self, ingester_pool: &IngesterPool) -> Self {
            self.ingester_pool = ingester_pool.clone();
            self
        }

        pub fn with_disk_capacity(mut self, disk_capacity: ByteSize) -> Self {
            self.disk_capacity = disk_capacity;
            self
        }

        pub fn with_memory_capacity(mut self, memory_capacity: ByteSize) -> Self {
            self.memory_capacity = memory_capacity;
            self
        }

        pub fn with_rate_limiter_settings(
            mut self,
            rate_limiter_settings: RateLimiterSettings,
        ) -> Self {
            self.rate_limiter_settings = rate_limiter_settings;
            self
        }

        pub fn with_replication(mut self) -> Self {
            self.replication_factor = 2;
            self
        }

        pub fn with_idle_shard_timeout(mut self, idle_shard_timeout: Duration) -> Self {
            self.idle_shard_timeout = idle_shard_timeout;
            self
        }

        pub async fn build(self) -> (IngesterContext, Ingester) {
            static GOSSIP_ADVERTISE_PORT_SEQUENCE: AtomicU16 = AtomicU16::new(1u16);

            let tempdir = tempfile::tempdir().unwrap();
            let wal_dir_path = tempdir.path();
            let transport = ChannelTransport::default();

            let gossip_advertise_port =
                GOSSIP_ADVERTISE_PORT_SEQUENCE.fetch_add(1, Ordering::Relaxed);

            let cluster = create_cluster_for_test_with_id(
                self.node_id.clone(),
                gossip_advertise_port,
                "test-cluster".to_string(),
                Vec::new(),
                &HashSet::from_iter([QuickwitService::Indexer]),
                &transport,
                true,
            )
            .await
            .unwrap();

            let ingester = Ingester::try_new(
                cluster.clone(),
                self.control_plane.clone(),
                self.ingester_pool.clone(),
                wal_dir_path,
                self.disk_capacity,
                self.memory_capacity,
                self.rate_limiter_settings,
                self.replication_factor,
                self.idle_shard_timeout,
            )
            .await
            .unwrap();

            wait_for_ingester_status(&ingester, IngesterStatus::Ready, Duration::from_secs(1))
                .await
                .unwrap();

            let ingester_env = IngesterContext {
                tempdir,
                _transport: transport,
                node_id: self.node_id,
                cluster,
                ingester_pool: self.ingester_pool,
            };
            (ingester_env, ingester)
        }
    }

    pub struct IngesterContext {
        tempdir: tempfile::TempDir,
        _transport: ChannelTransport,
        node_id: NodeId,
        cluster: Cluster,
        ingester_pool: IngesterPool,
    }

    #[tokio::test]
    async fn test_ingester_init() {
        let (ingester_ctx, ingester) = IngesterForTest::default().build().await;
        let mut state_guard = ingester.state.lock_fully().await.unwrap();

        let index_uid = IndexUid::for_test("test-index", 0);
        let source_id = SourceId::from("test-source");
        let queue_id_01 = queue_id(&index_uid, &source_id, &ShardId::from(1));
        let queue_id_02 = queue_id(&index_uid, &source_id, &ShardId::from(2));
        let queue_id_03 = queue_id(&index_uid, &source_id, &ShardId::from(3));

        state_guard
            .mrecordlog
            .create_queue(&queue_id_01)
            .await
            .unwrap();

        let records = [MRecord::new_doc("test-doc-foo").encode()].into_iter();

        state_guard
            .mrecordlog
            .append_records(&queue_id_01, None, records)
            .await
            .unwrap();

        state_guard
            .mrecordlog
            .truncate(&queue_id_01, 0)
            .await
            .unwrap();

        state_guard
            .mrecordlog
            .create_queue(&queue_id_02)
            .await
            .unwrap();

        let records = [
            MRecord::new_doc("test-doc-foo").encode(),
            MRecord::new_doc("test-doc-bar").encode(),
        ]
        .into_iter();

        state_guard
            .mrecordlog
            .append_records(&queue_id_02, None, records)
            .await
            .unwrap();

        state_guard
            .mrecordlog
            .truncate(&queue_id_02, 0)
            .await
            .unwrap();

        state_guard
            .mrecordlog
            .create_queue(&queue_id_03)
            .await
            .unwrap();

        state_guard.set_status(IngesterStatus::Initializing).await;

        drop(state_guard);

        ingester
            .state
            .init(ingester_ctx.tempdir.path(), RateLimiterSettings::default())
            .await;

        let state_guard = ingester.state.lock_fully().await.unwrap();
        assert_eq!(state_guard.shards.len(), 1);

        let solo_shard_02 = state_guard.shards.get(&queue_id_02).unwrap();
        solo_shard_02.assert_is_solo();
        solo_shard_02.assert_is_closed();
        solo_shard_02.assert_replication_position(Position::offset(1u64));
        solo_shard_02.assert_truncation_position(Position::offset(0u64));
        assert!(solo_shard_02.is_advertisable);

        state_guard
            .mrecordlog
            .assert_records_eq(&queue_id_02, .., &[(1, [0, 0], "test-doc-bar")]);

        assert_eq!(state_guard.status(), IngesterStatus::Ready);
    }

    #[tokio::test]
    async fn test_ingester_broadcasts_local_shards() {
        let (ingester_ctx, ingester) = IngesterForTest::default().build().await;

        let mut state_guard = ingester.state.lock_fully().await.unwrap();
        let index_uid = IndexUid::for_test("test-index", 0);
        let source_id = SourceId::from("test-source");

        let shard_00 =
            IngesterShard::new_solo(index_uid.clone(), source_id.clone(), ShardId::from(0)).build();
        state_guard.shards.insert(shard_00.queue_id(), shard_00);

        let shard_01 = IngesterShard::new_solo(index_uid.clone(), source_id, ShardId::from(1))
            .advertisable()
            .build();
        let queue_id_01 = shard_01.queue_id();
        state_guard.shards.insert(queue_id_01.clone(), shard_01);
        drop(state_guard);

        tokio::time::sleep(Duration::from_millis(100)).await;

        let key = format!(
            "{INGESTER_PRIMARY_SHARDS_PREFIX}{}:{}",
            index_uid, "test-source"
        );
        let value = ingester_ctx.cluster.get_self_key_value(&key).await.unwrap();

        let shard_infos: ShardInfos = serde_json::from_str(&value).unwrap();
        assert_eq!(shard_infos.len(), 1);

        let shard_info = shard_infos.iter().next().unwrap();
        assert_eq!(shard_info.shard_id, ShardId::from(1));
        assert_eq!(shard_info.shard_state, ShardState::Open);
        assert_eq!(shard_info.short_term_ingestion_rate, 0);

        let mut state_guard = ingester.state.lock_fully().await.unwrap();
        state_guard
            .shards
            .get_mut(&queue_id_01)
            .unwrap()
            .shard_state = ShardState::Closed;
        drop(state_guard);

        tokio::time::sleep(Duration::from_millis(100)).await;

        let value = ingester_ctx.cluster.get_self_key_value(&key).await.unwrap();

        let shard_infos: ShardInfos = serde_json::from_str(&value).unwrap();
        assert_eq!(shard_infos.len(), 1);

        let shard_info = shard_infos.iter().next().unwrap();
        assert_eq!(shard_info.shard_state, ShardState::Closed);

        let mut state_guard = ingester.state.lock_fully().await.unwrap();
        state_guard.shards.remove(&queue_id_01).unwrap();
        drop(state_guard);

        tokio::time::sleep(Duration::from_millis(100)).await;

        let value_opt = ingester_ctx.cluster.get_self_key_value(&key).await;
        assert!(value_opt.is_none());
    }

    #[tokio::test]
    async fn test_ingester_init_primary_shard() {
        let (ingester_ctx, ingester) = IngesterForTest::default().build().await;

        let index_uid = IndexUid::for_test("test-index", 0);
        let source_id = SourceId::from("test-source");

        let doc_mapping_uid = DocMappingUid::random();
        let doc_mapping_json = format!(
            r#"{{
                "doc_mapping_uid": "{doc_mapping_uid}",
                "field_mappings": [{{
                        "name": "message",
                        "type": "text"
                }}]
            }}"#
        );
        let primary_shard = Shard {
            index_uid: Some(index_uid.clone()),
            source_id: source_id.clone(),
            shard_id: Some(ShardId::from(1)),
            shard_state: ShardState::Open as i32,
            leader_id: ingester_ctx.node_id.to_string(),
            doc_mapping_uid: Some(doc_mapping_uid),
            ..Default::default()
        };
        let mut state_guard = ingester.state.lock_fully().await.unwrap();

        ingester
            .init_primary_shard(
                &mut state_guard.inner,
                &mut state_guard.mrecordlog,
                primary_shard,
                &doc_mapping_json,
                Instant::now(),
                true,
            )
            .await
            .unwrap();

        let queue_id = queue_id(&index_uid, &source_id, &ShardId::from(1));
        let shard = state_guard.shards.get(&queue_id).unwrap();
        shard.assert_is_solo();
        shard.assert_is_open();
        shard.assert_replication_position(Position::Beginning);
        shard.assert_truncation_position(Position::Beginning);
        assert!(shard.doc_mapper_opt.is_some());
    }

    #[tokio::test]
    async fn test_ingester_init_shards() {
        let (ingester_ctx, ingester) = IngesterForTest::default().build().await;

        let index_uid = IndexUid::for_test("test-index", 0);
        let source_id = SourceId::from("test-source");

        let doc_mapping_uid = DocMappingUid::random();
        let doc_mapping_json = format!(
            r#"{{
                "doc_mapping_uid": "{doc_mapping_uid}"
            }}"#
        );
        let shard = Shard {
            index_uid: Some(index_uid.clone()),
            source_id: source_id.clone(),
            shard_id: Some(ShardId::from(1)),
            shard_state: ShardState::Open as i32,
            leader_id: ingester_ctx.node_id.to_string(),
            follower_id: None,
            doc_mapping_uid: Some(doc_mapping_uid),
            publish_position_inclusive: None,
            publish_token: None,
            update_timestamp: 1724158996,
        };
        let init_shards_request = InitShardsRequest {
            subrequests: vec![InitShardSubrequest {
                subrequest_id: 0,
                shard: Some(shard.clone()),
                doc_mapping_json,
                validate_docs: true,
            }],
        };
        let response = ingester.init_shards(init_shards_request).await.unwrap();
        assert_eq!(response.successes.len(), 1);
        assert_eq!(response.failures.len(), 0);

        let init_shard_success = &response.successes[0];
        assert_eq!(init_shard_success.subrequest_id, 0);
        assert_eq!(init_shard_success.shard, Some(shard));

        let state_guard = ingester.state.lock_fully().await.unwrap();

        let queue_id = queue_id(&index_uid, &source_id, &ShardId::from(1));
        let shard = state_guard.shards.get(&queue_id).unwrap();
        shard.assert_is_solo();
        shard.assert_is_open();
        shard.assert_replication_position(Position::Beginning);
        shard.assert_truncation_position(Position::Beginning);

        assert!(state_guard.mrecordlog.queue_exists(&queue_id));
    }

    #[tokio::test]
    async fn test_ingester_persist() {
        let (ingester_ctx, ingester) = IngesterForTest::default().build().await;

        let index_uid_0 = IndexUid::for_test("test-index", 0);
        let index_uid_1 = IndexUid::for_test("test-index", 1);
        let source_id = SourceId::from("test-source");

        let doc_mapping_uid = DocMappingUid::random();
        let doc_mapping_json = format!(
            r#"{{
                "doc_mapping_uid": "{doc_mapping_uid}"
            }}"#
        );
        let init_shards_request = InitShardsRequest {
            subrequests: vec![
                InitShardSubrequest {
                    subrequest_id: 0,
                    shard: Some(Shard {
                        index_uid: Some(index_uid_0.clone()),
                        source_id: source_id.clone(),
                        shard_id: Some(ShardId::from(1)),
                        shard_state: ShardState::Open as i32,
                        leader_id: ingester_ctx.node_id.to_string(),
                        doc_mapping_uid: Some(doc_mapping_uid),
                        ..Default::default()
                    }),
                    doc_mapping_json: doc_mapping_json.clone(),
                    validate_docs: true,
                },
                InitShardSubrequest {
                    subrequest_id: 1,
                    shard: Some(Shard {
                        index_uid: Some(index_uid_1.clone()),
                        source_id: source_id.clone(),
                        shard_id: Some(ShardId::from(1)),
                        shard_state: ShardState::Open as i32,
                        leader_id: ingester_ctx.node_id.to_string(),
                        doc_mapping_uid: Some(doc_mapping_uid),
                        ..Default::default()
                    }),
                    doc_mapping_json,
                    validate_docs: true,
                },
            ],
        };
        ingester.init_shards(init_shards_request).await.unwrap();

        let persist_request = PersistRequest {
            leader_id: ingester_ctx.node_id.to_string(),
            commit_type: CommitTypeV2::Force as i32,
            subrequests: vec![
                PersistSubrequest {
                    subrequest_id: 0,
                    index_uid: Some(index_uid_0.clone()),
                    source_id: source_id.clone(),
                    doc_batch: Some(DocBatchV2::for_test([r#"{"doc": "test-doc-010"}"#])),
                },
                PersistSubrequest {
                    subrequest_id: 1,
                    index_uid: Some(index_uid_1.clone()),
                    source_id: source_id.clone(),
                    doc_batch: Some(DocBatchV2::for_test([
                        r#"{"doc": "test-doc-110"}"#,
                        r#"{"doc": "test-doc-111"}"#,
                    ])),
                },
            ],
        };
        let persist_response = ingester.persist(persist_request).await.unwrap();
        assert_eq!(persist_response.leader_id, "test-ingester");
        assert_eq!(persist_response.successes.len(), 2);
        assert_eq!(persist_response.failures.len(), 0);

        let persist_success_0 = &persist_response.successes[0];
        assert_eq!(persist_success_0.subrequest_id, 0);
        assert_eq!(persist_success_0.index_uid(), &index_uid_0);
        assert_eq!(persist_success_0.source_id, "test-source");
        assert_eq!(
            persist_success_0.replication_position_inclusive,
            Some(Position::offset(1u64))
        );

        let persist_success_1 = &persist_response.successes[1];
        assert_eq!(persist_success_1.subrequest_id, 1);
        assert_eq!(persist_success_1.index_uid(), &index_uid_1);
        assert_eq!(persist_success_1.source_id, "test-source");
        assert_eq!(
            persist_success_1.replication_position_inclusive,
            Some(Position::offset(2u64))
        );

        let state_guard = ingester.state.lock_fully().await.unwrap();
        assert_eq!(state_guard.shards.len(), 2);

        let queue_id_01 = queue_id(&index_uid_0, &source_id, &ShardId::from(1));
        let solo_shard_01 = state_guard.shards.get(&queue_id_01).unwrap();
        solo_shard_01.assert_is_solo();
        solo_shard_01.assert_is_open();
        solo_shard_01.assert_replication_position(Position::offset(1u64));

        state_guard.mrecordlog.assert_records_eq(
            &queue_id_01,
            ..,
            &[(0, [0, 0], r#"{"doc": "test-doc-010"}"#), (1, [0, 1], "")],
        );

        let queue_id_11 = queue_id(&index_uid_1, &source_id, &ShardId::from(1));
        let solo_shard_11 = state_guard.shards.get(&queue_id_11).unwrap();
        solo_shard_11.assert_is_solo();
        solo_shard_11.assert_is_open();
        solo_shard_11.assert_replication_position(Position::offset(2u64));

        state_guard.mrecordlog.assert_records_eq(
            &queue_id_11,
            ..,
            &[
                (0, [0, 0], r#"{"doc": "test-doc-110"}"#),
                (1, [0, 0], r#"{"doc": "test-doc-111"}"#),
                (2, [0, 1], ""),
            ],
        );
    }

    #[tokio::test]
    async fn test_ingester_persist_empty() {
        let (ingester_ctx, ingester) = IngesterForTest::default().build().await;

        let index_uid = IndexUid::for_test("test-index", 0);
        let source_id = SourceId::from("test-source");

        let doc_mapping_uid = DocMappingUid::random();
        let doc_mapping_json = format!(
            r#"{{
                "doc_mapping_uid": "{doc_mapping_uid}"
            }}"#
        );
        let init_shards_request = InitShardsRequest {
            subrequests: vec![InitShardSubrequest {
                subrequest_id: 0,
                shard: Some(Shard {
                    index_uid: Some(index_uid.clone()),
                    source_id: source_id.clone(),
                    shard_id: Some(ShardId::from(0)),
                    shard_state: ShardState::Open as i32,
                    leader_id: ingester_ctx.node_id.to_string(),
                    doc_mapping_uid: Some(doc_mapping_uid),
                    ..Default::default()
                }),
                doc_mapping_json,
                validate_docs: true,
            }],
        };
        let response = ingester.init_shards(init_shards_request).await.unwrap();
        assert_eq!(response.successes.len(), 1);
        assert_eq!(response.failures.len(), 0);

        let persist_request = PersistRequest {
            leader_id: ingester_ctx.node_id.to_string(),
            commit_type: CommitTypeV2::Force as i32,
            subrequests: Vec::new(),
        };
        let persist_response = ingester.persist(persist_request).await.unwrap();
        assert_eq!(persist_response.leader_id, "test-ingester");
        assert_eq!(persist_response.successes.len(), 0);
        assert_eq!(persist_response.failures.len(), 0);

        let persist_request = PersistRequest {
            leader_id: "test-ingester".to_string(),
            commit_type: CommitTypeV2::Force as i32,
            subrequests: vec![PersistSubrequest {
                subrequest_id: 0,
                index_uid: Some(index_uid.clone()),
                source_id: "test-source".to_string(),
                doc_batch: None,
            }],
        };
        let persist_response = ingester.persist(persist_request).await.unwrap();
        assert_eq!(persist_response.leader_id, "test-ingester");
        assert_eq!(persist_response.successes.len(), 1);
        assert_eq!(persist_response.failures.len(), 0);

        let persist_success = &persist_response.successes[0];
        assert_eq!(persist_success.subrequest_id, 0);
        assert_eq!(persist_success.index_uid(), &index_uid);
        assert_eq!(persist_success.source_id, "test-source");
        assert_eq!(
            persist_success.replication_position_inclusive,
            Some(Position::Beginning)
        );
    }

    #[tokio::test]
    async fn test_ingester_persist_validates_docs() {
        let (ingester_ctx, ingester) = IngesterForTest::default().build().await;

        let index_uid = IndexUid::for_test("test-index", 0);
        let source_id = SourceId::from("test-source");

        let doc_mapping_uid = DocMappingUid::random();
        let doc_mapping_json = format!(
            r#"{{
                "doc_mapping_uid": "{doc_mapping_uid}",
                "mode": "strict",
                "field_mappings": [{{"name": "doc", "type": "text"}}]
            }}"#
        );
        let init_shards_request = InitShardsRequest {
            subrequests: vec![InitShardSubrequest {
                subrequest_id: 0,
                shard: Some(Shard {
                    index_uid: Some(index_uid.clone()),
                    source_id: source_id.clone(),
                    shard_id: Some(ShardId::from(0)),
                    shard_state: ShardState::Open as i32,
                    leader_id: ingester_ctx.node_id.to_string(),
                    doc_mapping_uid: Some(doc_mapping_uid),
                    ..Default::default()
                }),
                doc_mapping_json,
                validate_docs: true,
            }],
        };
        let response = ingester.init_shards(init_shards_request).await.unwrap();
        assert_eq!(response.successes.len(), 1);
        assert_eq!(response.failures.len(), 0);

        let persist_request = PersistRequest {
            leader_id: ingester_ctx.node_id.to_string(),
            commit_type: CommitTypeV2::Force as i32,
            subrequests: vec![PersistSubrequest {
                subrequest_id: 0,
                index_uid: Some(index_uid.clone()),
                source_id: "test-source".to_string(),
                doc_batch: Some(DocBatchV2::for_test([
                    "",                           // invalid
                    "[]",                         // invalid
                    r#"{"foo": "bar"}"#,          // invalid
                    r#"{"doc": "test-doc-000"}"#, // valid
                ])),
            }],
        };
        let persist_response = ingester.persist(persist_request).await.unwrap();
        assert_eq!(persist_response.leader_id, "test-ingester");
        assert_eq!(persist_response.successes.len(), 1);
        assert_eq!(persist_response.failures.len(), 0);

        let persist_success = &persist_response.successes[0];
        assert_eq!(persist_success.num_persisted_docs, 1);
        assert_eq!(persist_success.parse_failures.len(), 3);

        let parse_failure_0 = &persist_success.parse_failures[0];
        assert_eq!(parse_failure_0.doc_uid(), DocUid::for_test(0));
        assert_eq!(parse_failure_0.reason(), ParseFailureReason::InvalidJson);
        assert!(parse_failure_0.message.contains("parse JSON document"));

        let parse_failure_1 = &persist_success.parse_failures[1];
        assert_eq!(parse_failure_1.doc_uid(), DocUid::for_test(1));
        assert_eq!(parse_failure_1.reason(), ParseFailureReason::InvalidJson);
        assert!(parse_failure_1.message.contains("not an object"));

        let parse_failure_2 = &persist_success.parse_failures[2];
        assert_eq!(parse_failure_2.doc_uid(), DocUid::for_test(2));
        assert_eq!(parse_failure_2.reason(), ParseFailureReason::InvalidSchema);
        assert!(parse_failure_2.message.contains("not declared"));
    }

    #[tokio::test]
    async fn test_ingester_persist_doesnt_validates_docs_when_requested() {
        let (ingester_ctx, ingester) = IngesterForTest::default().build().await;

        let index_uid = IndexUid::for_test("test-index", 0);
        let source_id = SourceId::from("test-source");

        let doc_mapping_uid = DocMappingUid::random();
        let doc_mapping_json = format!(
            r#"{{
                "doc_mapping_uid": "{doc_mapping_uid}",
                "mode": "strict",
                "field_mappings": [{{"name": "doc", "type": "text"}}]
            }}"#
        );
        let init_shards_request = InitShardsRequest {
            subrequests: vec![InitShardSubrequest {
                subrequest_id: 0,
                shard: Some(Shard {
                    index_uid: Some(index_uid.clone()),
                    source_id: source_id.clone(),
                    shard_id: Some(ShardId::from(0)),
                    shard_state: ShardState::Open as i32,
                    leader_id: ingester_ctx.node_id.to_string(),
                    doc_mapping_uid: Some(doc_mapping_uid),
                    ..Default::default()
                }),
                doc_mapping_json,
                validate_docs: false,
            }],
        };
        let response = ingester.init_shards(init_shards_request).await.unwrap();
        assert_eq!(response.successes.len(), 1);
        assert_eq!(response.failures.len(), 0);

        let persist_request = PersistRequest {
            leader_id: ingester_ctx.node_id.to_string(),
            commit_type: CommitTypeV2::Force as i32,
            subrequests: vec![PersistSubrequest {
                subrequest_id: 0,
                index_uid: Some(index_uid.clone()),
                source_id: "test-source".to_string(),
                doc_batch: Some(DocBatchV2::for_test([
                    "",                           // invalid
                    "[]",                         // invalid
                    r#"{"foo": "bar"}"#,          // invalid
                    r#"{"doc": "test-doc-000"}"#, // valid
                ])),
            }],
        };
        let persist_response = ingester.persist(persist_request).await.unwrap();
        assert_eq!(persist_response.leader_id, "test-ingester");
        assert_eq!(persist_response.successes.len(), 1);
        assert_eq!(persist_response.failures.len(), 0);

        let persist_success = &persist_response.successes[0];
        assert_eq!(persist_success.num_persisted_docs, 4);
        assert_eq!(persist_success.parse_failures.len(), 0);
    }

    #[tokio::test]
    async fn test_ingester_persist_checks_capacity_before_validating_docs() {
        let (ingester_ctx, ingester) = IngesterForTest::default()
            .with_memory_capacity(ByteSize(0))
            .build()
            .await;

        let index_uid = IndexUid::for_test("test-index", 0);
        let source_id = SourceId::from("test-source");

        let doc_mapping_uid = DocMappingUid::random();
        let doc_mapping_json = format!(
            r#"{{
                "doc_mapping_uid": "{doc_mapping_uid}",
                "mode": "strict",
                "field_mappings": [{{"name": "doc", "type": "text"}}]
            }}"#
        );
        let init_shards_request = InitShardsRequest {
            subrequests: vec![InitShardSubrequest {
                subrequest_id: 0,
                shard: Some(Shard {
                    index_uid: Some(index_uid.clone()),
                    source_id: source_id.clone(),
                    shard_id: Some(ShardId::from(0)),
                    shard_state: ShardState::Open as i32,
                    leader_id: ingester_ctx.node_id.to_string(),
                    doc_mapping_uid: Some(doc_mapping_uid),
                    ..Default::default()
                }),
                doc_mapping_json,
                validate_docs: true,
            }],
        };
        let response = ingester.init_shards(init_shards_request).await.unwrap();
        assert_eq!(response.successes.len(), 1);
        assert_eq!(response.failures.len(), 0);

        let persist_request = PersistRequest {
            leader_id: ingester_ctx.node_id.to_string(),
            commit_type: CommitTypeV2::Force as i32,
            subrequests: vec![PersistSubrequest {
                subrequest_id: 0,
                index_uid: Some(index_uid.clone()),
                source_id: "test-source".to_string(),
                doc_batch: Some(DocBatchV2::for_test(["", "[]", r#"{"foo": "bar"}"#])),
            }],
        };
        let persist_response = ingester.persist(persist_request).await.unwrap();
        assert_eq!(persist_response.leader_id, "test-ingester");
        assert_eq!(persist_response.successes.len(), 0);
        assert_eq!(persist_response.failures.len(), 1);

        let persist_failure = &persist_response.failures[0];
        assert_eq!(persist_failure.reason(), PersistFailureReason::WalFull);
    }

    #[tokio::test]
    async fn test_ingester_persist_applies_rate_limiting_before_validating_docs() {
        let (ingester_ctx, ingester) = IngesterForTest::default()
            .with_rate_limiter_settings(RateLimiterSettings {
                burst_limit: 0,
                rate_limit: ConstantRate::bytes_per_sec(ByteSize(0)),
                refill_period: Duration::from_secs(1),
            })
            .build()
            .await;

        let index_uid = IndexUid::for_test("test-index", 0);
        let source_id = SourceId::from("test-source");

        let doc_mapping_uid = DocMappingUid::random();
        let doc_mapping_json = format!(
            r#"{{
                "doc_mapping_uid": "{doc_mapping_uid}",
                "mode": "strict",
                "field_mappings": [{{"name": "doc", "type": "text"}}]
            }}"#
        );
        let init_shards_request = InitShardsRequest {
            subrequests: vec![InitShardSubrequest {
                subrequest_id: 0,
                shard: Some(Shard {
                    index_uid: Some(index_uid.clone()),
                    source_id: source_id.clone(),
                    shard_id: Some(ShardId::from(0)),
                    shard_state: ShardState::Open as i32,
                    leader_id: ingester_ctx.node_id.to_string(),
                    doc_mapping_uid: Some(doc_mapping_uid),
                    ..Default::default()
                }),
                doc_mapping_json,
                validate_docs: true,
            }],
        };
        let response = ingester.init_shards(init_shards_request).await.unwrap();
        assert_eq!(response.successes.len(), 1);
        assert_eq!(response.failures.len(), 0);

        let persist_request = PersistRequest {
            leader_id: ingester_ctx.node_id.to_string(),
            commit_type: CommitTypeV2::Force as i32,
            subrequests: vec![PersistSubrequest {
                subrequest_id: 0,
                index_uid: Some(index_uid.clone()),
                source_id: "test-source".to_string(),
                doc_batch: Some(DocBatchV2::for_test(["", "[]", r#"{"foo": "bar"}"#])),
            }],
        };
        let persist_response = ingester.persist(persist_request).await.unwrap();
        assert_eq!(persist_response.leader_id, "test-ingester");
        assert_eq!(persist_response.successes.len(), 0);
        assert_eq!(persist_response.failures.len(), 1);

        let persist_failure = &persist_response.failures[0];
        assert_eq!(
            persist_failure.reason(),
            PersistFailureReason::NoShardsAvailable
        );
    }

    // This test should be run manually and independently of other tests with the `failpoints`
    // feature enabled:
    // ```sh
    // cargo test --manifest-path quickwit/Cargo.toml -p quickwit-ingest --features failpoints -- test_ingester_persist_closes_shard_on_io_error
    // ```
    #[cfg(all(feature = "failpoints", not(feature = "no-failpoints")))]
    #[tokio::test]
    async fn test_ingester_persist_closes_shard_on_io_error() {
        let scenario = fail::FailScenario::setup();
        fail::cfg("ingester:append_records", "return").unwrap();

        let (_ingester_ctx, ingester) = IngesterForTest::default().build().await;

        let mut state_guard = ingester.state.lock_fully().await.unwrap();
        let index_uid = IndexUid::for_test("test-index", 0);
        let source_id = SourceId::from("test-source");
        let solo_shard =
            IngesterShard::new_solo(index_uid.clone(), source_id, ShardId::from(1)).build();
        let queue_id = solo_shard.queue_id();
        state_guard.shards.insert(queue_id.clone(), solo_shard);

        state_guard
            .mrecordlog
            .create_queue(&queue_id)
            .await
            .unwrap();

        let rate_limiter = RateLimiter::from_settings(RateLimiterSettings::default());
        let rate_meter = RateMeter::default();
        state_guard
            .rate_trackers
            .insert(queue_id.clone(), (rate_limiter, rate_meter));

        drop(state_guard);

        let persist_request = PersistRequest {
            leader_id: "test-ingester".to_string(),
            commit_type: CommitTypeV2::Force as i32,
            subrequests: vec![PersistSubrequest {
                subrequest_id: 0,
                index_uid: Some(index_uid.clone()),
                source_id: "test-source".to_string(),
                doc_batch: Some(DocBatchV2::for_test([r#"test-doc-foo"#])),
            }],
        };
        let persist_response = ingester.persist(persist_request).await.unwrap();
        assert_eq!(persist_response.leader_id, "test-ingester");
        assert_eq!(persist_response.successes.len(), 0);
        assert_eq!(persist_response.failures.len(), 1);

        let persist_failure = &persist_response.failures[0];
        assert_eq!(persist_failure.subrequest_id, 0);
        assert_eq!(persist_failure.index_uid(), &index_uid);
        assert_eq!(persist_failure.source_id, "test-source");
        assert_eq!(
            persist_failure.reason(),
            PersistFailureReason::NodeUnavailable,
        );

        let state_guard = ingester.state.lock_fully().await.unwrap();
        let shard = state_guard.shards.get(&queue_id).unwrap();
        shard.assert_is_closed();

        scenario.teardown();
    }

    #[tokio::test]
    async fn test_ingester_persist_deletes_dangling_shard() {
        let (_ingester_ctx, ingester) = IngesterForTest::default().build().await;

        let mut state_guard = ingester.state.lock_fully().await.unwrap();
        let index_uid = IndexUid::for_test("test-index", 0);
        let source_id = SourceId::from("test-source");

        let doc_mapper = try_build_doc_mapper("{}").unwrap();

        // Insert a dangling shard, i.e. a shard without a corresponding queue.
        let solo_shard =
            IngesterShard::new_solo(index_uid.clone(), source_id.clone(), ShardId::from(1))
                .with_doc_mapper(doc_mapper)
                .build();
        state_guard.shards.insert(solo_shard.queue_id(), solo_shard);
        drop(state_guard);

        let persist_request = PersistRequest {
            leader_id: "test-ingester".to_string(),
            commit_type: CommitTypeV2::Force as i32,
            subrequests: vec![PersistSubrequest {
                subrequest_id: 0,
                index_uid: Some(index_uid.clone()),
                source_id: "test-source".to_string(),
                doc_batch: Some(DocBatchV2::for_test([r#"{"doc": "test-doc-foo"}"#])),
            }],
        };
        let persist_response = ingester.persist(persist_request).await.unwrap();
        assert_eq!(persist_response.leader_id, "test-ingester");
        assert_eq!(persist_response.successes.len(), 0);
        assert_eq!(persist_response.failures.len(), 1);

        let persist_failure = &persist_response.failures[0];
        assert_eq!(persist_failure.subrequest_id, 0);
        assert_eq!(persist_failure.index_uid(), &index_uid);
        assert_eq!(persist_failure.source_id, "test-source");
        assert_eq!(
            persist_failure.reason(),
            PersistFailureReason::NodeUnavailable
        );

        let state_guard = ingester.state.lock_fully().await.unwrap();
        assert_eq!(state_guard.shards.len(), 0);
    }

    #[tokio::test]
    async fn test_ingester_persist_replicate() {
        let (leader_ctx, leader) = IngesterForTest::default()
            .with_node_id("test-leader")
            .with_replication()
            .build()
            .await;

        let (follower_ctx, follower) = IngesterForTest::default()
            .with_node_id("test-follower")
            .with_ingester_pool(&leader_ctx.ingester_pool)
            .with_replication()
            .build()
            .await;

        let ingester_pool_entry = IngesterPoolEntry {
            client: IngesterServiceClient::new(follower.clone()),
            status: IngesterStatus::Ready,
            availability_zone: None,
        };

        leader_ctx
            .ingester_pool
            .insert(follower_ctx.node_id.clone(), ingester_pool_entry);

        let index_uid = IndexUid::for_test("test-index", 0);
        let index_uid2 = IndexUid::for_test("test-index", 1);
        let source_id = SourceId::from("test-source");

        let doc_mapping_uid = DocMappingUid::random();
        let doc_mapping_json = format!(
            r#"{{
                "doc_mapping_uid": "{doc_mapping_uid}"
            }}"#
        );
        let init_shards_request = InitShardsRequest {
            subrequests: vec![
                InitShardSubrequest {
                    subrequest_id: 0,
                    shard: Some(Shard {
                        index_uid: Some(index_uid.clone()),
                        source_id: source_id.clone(),
                        shard_id: Some(ShardId::from(1)),
                        shard_state: ShardState::Open as i32,
                        leader_id: leader_ctx.node_id.to_string(),
                        follower_id: Some(follower_ctx.node_id.to_string()),
                        doc_mapping_uid: Some(doc_mapping_uid),
                        ..Default::default()
                    }),
                    doc_mapping_json: doc_mapping_json.clone(),
                    validate_docs: true,
                },
                InitShardSubrequest {
                    subrequest_id: 1,
                    shard: Some(Shard {
                        index_uid: Some(index_uid2.clone()),
                        source_id: source_id.clone(),
                        shard_id: Some(ShardId::from(1)),
                        shard_state: ShardState::Open as i32,
                        leader_id: leader_ctx.node_id.to_string(),
                        follower_id: Some(follower_ctx.node_id.to_string()),
                        doc_mapping_uid: Some(doc_mapping_uid),
                        ..Default::default()
                    }),
                    doc_mapping_json,
                    validate_docs: true,
                },
            ],
        };
        leader.init_shards(init_shards_request).await.unwrap();

        let persist_request = PersistRequest {
            leader_id: "test-leader".to_string(),
            commit_type: CommitTypeV2::Force as i32,
            subrequests: vec![
                PersistSubrequest {
                    subrequest_id: 0,
                    index_uid: Some(index_uid.clone()),
                    source_id: "test-source".to_string(),
                    doc_batch: Some(DocBatchV2::for_test([r#"{"doc": "test-doc-010"}"#])),
                },
                PersistSubrequest {
                    subrequest_id: 1,
                    index_uid: Some(index_uid2.clone()),
                    source_id: "test-source".to_string(),
                    doc_batch: Some(DocBatchV2::for_test([
                        r#"{"doc": "test-doc-110"}"#,
                        r#"{"doc": "test-doc-111"}"#,
                    ])),
                },
            ],
        };
        let persist_response = leader.persist(persist_request).await.unwrap();
        assert_eq!(persist_response.leader_id, "test-leader");
        assert_eq!(persist_response.successes.len(), 2);
        assert_eq!(persist_response.failures.len(), 0);

        let persist_success_0 = &persist_response.successes[0];
        assert_eq!(persist_success_0.subrequest_id, 0);
        assert_eq!(persist_success_0.index_uid(), &index_uid);
        assert_eq!(persist_success_0.source_id, "test-source");
        assert_eq!(persist_success_0.shard_id(), ShardId::from(1));
        assert_eq!(
            persist_success_0.replication_position_inclusive,
            Some(Position::offset(1u64))
        );

        let persist_success_1 = &persist_response.successes[1];
        assert_eq!(persist_success_1.subrequest_id, 1);
        assert_eq!(persist_success_1.index_uid(), &index_uid2);
        assert_eq!(persist_success_1.source_id, "test-source");
        assert_eq!(persist_success_1.shard_id(), ShardId::from(1));
        assert_eq!(
            persist_success_1.replication_position_inclusive,
            Some(Position::offset(2u64))
        );

        let leader_state_guard = leader.state.lock_fully().await.unwrap();
        assert_eq!(leader_state_guard.shards.len(), 2);

        let queue_id_01 = queue_id(&index_uid, &source_id, &ShardId::from(1));
        let primary_shard_01 = leader_state_guard.shards.get(&queue_id_01).unwrap();
        primary_shard_01.assert_is_primary();
        primary_shard_01.assert_is_open();
        primary_shard_01.assert_replication_position(Position::offset(1u64));

        leader_state_guard.mrecordlog.assert_records_eq(
            &queue_id_01,
            ..,
            &[(0, [0, 0], r#"{"doc": "test-doc-010"}"#), (1, [0, 1], "")],
        );

        let queue_id_11 = queue_id(&index_uid2, &source_id, &ShardId::from(1));
        let primary_shard_11 = leader_state_guard.shards.get(&queue_id_11).unwrap();
        primary_shard_11.assert_is_primary();
        primary_shard_11.assert_is_open();
        primary_shard_11.assert_replication_position(Position::offset(2u64));

        leader_state_guard.mrecordlog.assert_records_eq(
            &queue_id_11,
            ..,
            &[
                (0, [0, 0], r#"{"doc": "test-doc-110"}"#),
                (1, [0, 0], r#"{"doc": "test-doc-111"}"#),
                (2, [0, 1], ""),
            ],
        );

        let follower_state_guard = follower.state.lock_fully().await.unwrap();
        assert_eq!(follower_state_guard.shards.len(), 2);

        let replica_shard_01 = follower_state_guard.shards.get(&queue_id_01).unwrap();
        replica_shard_01.assert_is_replica();
        replica_shard_01.assert_is_open();
        replica_shard_01.assert_replication_position(Position::offset(1u64));

        follower_state_guard.mrecordlog.assert_records_eq(
            &queue_id_01,
            ..,
            &[(0, [0, 0], r#"{"doc": "test-doc-010"}"#), (1, [0, 1], "")],
        );

        let replica_shard_11 = follower_state_guard.shards.get(&queue_id_11).unwrap();
        replica_shard_11.assert_is_replica();
        replica_shard_11.assert_is_open();
        replica_shard_11.assert_replication_position(Position::offset(2u64));

        follower_state_guard.mrecordlog.assert_records_eq(
            &queue_id_11,
            ..,
            &[
                (0, [0, 0], r#"{"doc": "test-doc-110"}"#),
                (1, [0, 0], r#"{"doc": "test-doc-111"}"#),
                (2, [0, 1], ""),
            ],
        );
    }

    #[tokio::test]
    async fn test_ingester_persist_replicate_grpc() {
        let (leader_ctx, leader) = IngesterForTest::default()
            .with_node_id("test-leader")
            .with_replication()
            .build()
            .await;

        let leader_grpc_server_adapter = IngesterServiceGrpcServerAdapter::new(leader.clone());
        let leader_grpc_server = IngesterServiceGrpcServer::new(leader_grpc_server_adapter);
        let leader_socket_addr: SocketAddr = "127.0.0.1:6666".parse().unwrap();

        tokio::spawn({
            async move {
                Server::builder()
                    .add_service(leader_grpc_server)
                    .serve(leader_socket_addr)
                    .await
                    .unwrap();
            }
        });

        let (follower_ctx, follower) = IngesterForTest::default()
            .with_node_id("test-follower")
            .with_ingester_pool(&leader_ctx.ingester_pool)
            .with_replication()
            .build()
            .await;

        let follower_grpc_server_adapter = IngesterServiceGrpcServerAdapter::new(follower.clone());
        let follower_grpc_server = IngesterServiceGrpcServer::new(follower_grpc_server_adapter);
        let follower_socket_addr: SocketAddr = "127.0.0.1:7777".parse().unwrap();

        tokio::spawn({
            async move {
                Server::builder()
                    .add_service(follower_grpc_server)
                    .serve(follower_socket_addr)
                    .await
                    .unwrap();
            }
        });
        let follower_channel = Endpoint::from_static("http://127.0.0.1:7777").connect_lazy();
        let follower_client = IngesterServiceClient::from_channel(
            "127.0.0.1:7777".parse().unwrap(),
            follower_channel,
            MAX_GRPC_MESSAGE_SIZE,
            None,
        );

        let ingester_pool_entry = IngesterPoolEntry {
            client: follower_client,
            status: IngesterStatus::Ready,
            availability_zone: None,
        };

        leader_ctx
            .ingester_pool
            .insert(follower_ctx.node_id.clone(), ingester_pool_entry);

        let index_uid = IndexUid::for_test("test-index", 0);
        let index_uid2 = IndexUid::for_test("test-index", 1);
        let source_id = SourceId::from("test-source");

        let doc_mapping_uid = DocMappingUid::random();
        let doc_mapping_json = format!(
            r#"{{
                "doc_mapping_uid": "{doc_mapping_uid}"
            }}"#
        );
        let init_shards_request = InitShardsRequest {
            subrequests: vec![
                InitShardSubrequest {
                    subrequest_id: 0,
                    shard: Some(Shard {
                        index_uid: Some(index_uid.clone()),
                        source_id: source_id.clone(),
                        shard_id: Some(ShardId::from(1)),
                        shard_state: ShardState::Open as i32,
                        leader_id: leader_ctx.node_id.to_string(),
                        follower_id: Some(follower_ctx.node_id.to_string()),
                        doc_mapping_uid: Some(doc_mapping_uid),
                        ..Default::default()
                    }),
                    doc_mapping_json: doc_mapping_json.clone(),
                    validate_docs: true,
                },
                InitShardSubrequest {
                    subrequest_id: 1,
                    shard: Some(Shard {
                        index_uid: Some(index_uid2.clone()),
                        source_id: source_id.clone(),
                        shard_id: Some(ShardId::from(1)),
                        shard_state: ShardState::Open as i32,
                        leader_id: leader_ctx.node_id.to_string(),
                        follower_id: Some(follower_ctx.node_id.to_string()),
                        doc_mapping_uid: Some(doc_mapping_uid),
                        ..Default::default()
                    }),
                    doc_mapping_json,
                    validate_docs: true,
                },
            ],
        };
        leader.init_shards(init_shards_request).await.unwrap();

        let persist_request = PersistRequest {
            leader_id: "test-leader".to_string(),
            commit_type: CommitTypeV2::Auto as i32,
            subrequests: vec![
                PersistSubrequest {
                    subrequest_id: 0,
                    index_uid: Some(index_uid.clone()),
                    source_id: "test-source".to_string(),
                    doc_batch: Some(DocBatchV2::for_test([r#"{"doc": "test-doc-010"}"#])),
                },
                PersistSubrequest {
                    subrequest_id: 1,
                    index_uid: Some(index_uid2.clone()),
                    source_id: "test-source".to_string(),
                    doc_batch: Some(DocBatchV2::for_test([
                        r#"{"doc": "test-doc-110"}"#,
                        r#"{"doc": "test-doc-111"}"#,
                    ])),
                },
            ],
        };
        let persist_response = leader.persist(persist_request).await.unwrap();
        assert_eq!(persist_response.leader_id, "test-leader");
        assert_eq!(persist_response.successes.len(), 2);
        assert_eq!(persist_response.failures.len(), 0);

        let persist_success_0 = &persist_response.successes[0];
        assert_eq!(persist_success_0.subrequest_id, 0);
        assert_eq!(persist_success_0.index_uid(), &index_uid);
        assert_eq!(persist_success_0.source_id, "test-source");
        assert_eq!(persist_success_0.shard_id(), ShardId::from(1));
        assert_eq!(
            persist_success_0.replication_position_inclusive,
            Some(Position::offset(0u64))
        );

        let persist_success_1 = &persist_response.successes[1];
        assert_eq!(persist_success_1.subrequest_id, 1);
        assert_eq!(persist_success_1.index_uid(), &index_uid2);
        assert_eq!(persist_success_1.source_id, "test-source");
        assert_eq!(persist_success_1.shard_id(), ShardId::from(1));
        assert_eq!(
            persist_success_1.replication_position_inclusive,
            Some(Position::offset(1u64))
        );

        let leader_state_guard = leader.state.lock_fully().await.unwrap();
        assert_eq!(leader_state_guard.shards.len(), 2);

        let queue_id_01 = queue_id(&index_uid, &source_id, &ShardId::from(1));
        let primary_shard_01 = leader_state_guard.shards.get(&queue_id_01).unwrap();
        primary_shard_01.assert_is_primary();
        primary_shard_01.assert_is_open();
        primary_shard_01.assert_replication_position(Position::offset(0u64));

        leader_state_guard.mrecordlog.assert_records_eq(
            &queue_id_01,
            ..,
            &[(0, [0, 0], r#"{"doc": "test-doc-010"}"#)],
        );

        let queue_id_11 = queue_id(&index_uid2, &source_id, &ShardId::from(1));
        let primary_shard_11 = leader_state_guard.shards.get(&queue_id_11).unwrap();
        primary_shard_11.assert_is_primary();
        primary_shard_11.assert_is_open();
        primary_shard_11.assert_replication_position(Position::offset(1u64));

        leader_state_guard.mrecordlog.assert_records_eq(
            &queue_id_11,
            ..,
            &[
                (0, [0, 0], r#"{"doc": "test-doc-110"}"#),
                (1, [0, 0], r#"{"doc": "test-doc-111"}"#),
            ],
        );

        let follower_state_guard = follower.state.lock_fully().await.unwrap();
        assert_eq!(follower_state_guard.shards.len(), 2);

        let replica_shard_01 = follower_state_guard.shards.get(&queue_id_01).unwrap();
        replica_shard_01.assert_is_replica();
        replica_shard_01.assert_is_open();
        replica_shard_01.assert_replication_position(Position::offset(0u64));

        follower_state_guard.mrecordlog.assert_records_eq(
            &queue_id_01,
            ..,
            &[(0, [0, 0], r#"{"doc": "test-doc-010"}"#)],
        );

        let replica_shard_11 = follower_state_guard.shards.get(&queue_id_11).unwrap();
        replica_shard_11.assert_is_replica();
        replica_shard_11.assert_is_open();
        replica_shard_11.assert_replication_position(Position::offset(1u64));

        follower_state_guard.mrecordlog.assert_records_eq(
            &queue_id_11,
            ..,
            &[
                (0, [0, 0], r#"{"doc": "test-doc-110"}"#),
                (1, [0, 0], r#"{"doc": "test-doc-111"}"#),
            ],
        );
    }

    #[tokio::test]
    async fn test_ingester_persist_no_available_shards() {
        let (ingester_ctx, ingester) = IngesterForTest::default().build().await;
        let index_uid = IndexUid::for_test("test-index", 0);
        let source_id = SourceId::from("test-source");
        let solo_shard =
            IngesterShard::new_solo(index_uid.clone(), source_id.clone(), ShardId::from(1))
                .with_state(ShardState::Closed)
                .build();
        let queue_id = solo_shard.queue_id();
        ingester
            .state
            .lock_fully()
            .await
            .unwrap()
            .shards
            .insert(queue_id.clone(), solo_shard);

        let persist_request = PersistRequest {
            leader_id: ingester_ctx.node_id.to_string(),
            commit_type: CommitTypeV2::Auto as i32,
            subrequests: vec![PersistSubrequest {
                subrequest_id: 0,
                index_uid: Some(index_uid.clone()),
                source_id: "test-source".to_string(),
                doc_batch: Some(DocBatchV2::for_test([r#"{"doc": "test-doc-010"}"#])),
            }],
        };
        let persist_response = ingester.persist(persist_request).await.unwrap();
        assert_eq!(persist_response.leader_id, "test-ingester");
        assert_eq!(persist_response.successes.len(), 0);
        assert_eq!(persist_response.failures.len(), 1);

        let persist_failure = &persist_response.failures[0];
        assert_eq!(persist_failure.subrequest_id, 0);
        assert_eq!(persist_failure.index_uid(), &index_uid);
        assert_eq!(persist_failure.source_id, "test-source");
        assert_eq!(
            persist_failure.reason(),
            PersistFailureReason::NoShardsAvailable
        );

        let state_guard = ingester.state.lock_fully().await.unwrap();
        assert_eq!(state_guard.shards.len(), 1);

        let solo_shard = state_guard.shards.get(&queue_id).unwrap();
        solo_shard.assert_is_solo();
        solo_shard.assert_is_closed();
        solo_shard.assert_replication_position(Position::Beginning);
    }

    #[tokio::test]
    async fn test_ingester_persist_rate_limited() {
        let (ingester_ctx, ingester) = IngesterForTest::default()
            .with_rate_limiter_settings(RateLimiterSettings {
                burst_limit: 0,
                rate_limit: ConstantRate::bytes_per_sec(ByteSize(0)),
                refill_period: Duration::from_millis(100),
            })
            .build()
            .await;

        let index_uid = IndexUid::for_test("test-index", 0);
        let source_id = SourceId::from("test-source");

        let doc_mapping_uid = DocMappingUid::random();
        let doc_mapping_json = format!(
            r#"{{
                "doc_mapping_uid": "{doc_mapping_uid}"
            }}"#
        );
        let primary_shard = Shard {
            index_uid: Some(index_uid.clone()),
            source_id: source_id.clone(),
            shard_id: Some(ShardId::from(1)),
            shard_state: ShardState::Open as i32,
            leader_id: ingester_ctx.node_id.to_string(),
            doc_mapping_uid: Some(doc_mapping_uid),
            ..Default::default()
        };
        let mut state_guard = ingester.state.lock_fully().await.unwrap();

        ingester
            .init_primary_shard(
                &mut state_guard.inner,
                &mut state_guard.mrecordlog,
                primary_shard,
                &doc_mapping_json,
                Instant::now(),
                true,
            )
            .await
            .unwrap();

        drop(state_guard);

        let persist_request = PersistRequest {
            leader_id: ingester_ctx.node_id.to_string(),
            commit_type: CommitTypeV2::Auto as i32,
            subrequests: vec![PersistSubrequest {
                subrequest_id: 0,
                index_uid: Some(index_uid.clone()),
                source_id: "test-source".to_string(),
                doc_batch: Some(DocBatchV2::for_test([r#"{"doc": "test-doc-010"}"#])),
            }],
        };
        let persist_response = ingester.persist(persist_request).await.unwrap();
        assert_eq!(persist_response.leader_id, "test-ingester");
        assert_eq!(persist_response.successes.len(), 0);
        assert_eq!(persist_response.failures.len(), 1);

        let persist_failure = &persist_response.failures[0];
        assert_eq!(persist_failure.subrequest_id, 0);
        assert_eq!(persist_failure.index_uid(), &index_uid);
        assert_eq!(persist_failure.source_id, "test-source");
        assert_eq!(
            persist_failure.reason(),
            PersistFailureReason::NoShardsAvailable
        );

        let state_guard = ingester.state.lock_fully().await.unwrap();
        assert_eq!(state_guard.shards.len(), 1);

        let queue_id_01 = queue_id(&index_uid, &source_id, &ShardId::from(1));

        let solo_shard_01 = state_guard.shards.get(&queue_id_01).unwrap();
        solo_shard_01.assert_is_solo();
        solo_shard_01.assert_is_open();
        solo_shard_01.assert_replication_position(Position::Beginning);

        state_guard
            .mrecordlog
            .assert_records_eq(&queue_id_01, .., &[]);
    }

    #[tokio::test]
    async fn test_ingester_persist_resource_exhausted() {
        let (ingester_ctx, ingester) = IngesterForTest::default()
            .with_disk_capacity(ByteSize(0))
            .build()
            .await;

        let index_uid = IndexUid::for_test("test-index", 0);
        let source_id = SourceId::from("test-source");

        let doc_mapping_uid = DocMappingUid::random();
        let doc_mapping_json = format!(
            r#"{{
                "doc_mapping_uid": "{doc_mapping_uid}"
            }}"#
        );
        let primary_shard = Shard {
            index_uid: Some(index_uid.clone()),
            source_id: source_id.clone(),
            shard_id: Some(ShardId::from(1)),
            shard_state: ShardState::Open as i32,
            leader_id: ingester_ctx.node_id.to_string(),
            doc_mapping_uid: Some(doc_mapping_uid),
            ..Default::default()
        };
        let mut state_guard = ingester.state.lock_fully().await.unwrap();

        ingester
            .init_primary_shard(
                &mut state_guard.inner,
                &mut state_guard.mrecordlog,
                primary_shard,
                &doc_mapping_json,
                Instant::now(),
                true,
            )
            .await
            .unwrap();

        drop(state_guard);

        let persist_request = PersistRequest {
            leader_id: ingester_ctx.node_id.to_string(),
            commit_type: CommitTypeV2::Auto as i32,
            subrequests: vec![PersistSubrequest {
                subrequest_id: 0,
                index_uid: Some(index_uid.clone()),
                source_id: "test-source".to_string(),
                doc_batch: Some(DocBatchV2::for_test([r#"{"doc": "test-doc-010"}"#])),
            }],
        };
        let persist_response = ingester.persist(persist_request).await.unwrap();
        assert_eq!(persist_response.leader_id, "test-ingester");
        assert_eq!(persist_response.successes.len(), 0);
        assert_eq!(persist_response.failures.len(), 1);

        let persist_failure = &persist_response.failures[0];
        assert_eq!(persist_failure.subrequest_id, 0);
        assert_eq!(persist_failure.index_uid(), &index_uid);
        assert_eq!(persist_failure.source_id, "test-source");
        assert_eq!(persist_failure.reason(), PersistFailureReason::WalFull);

        let state_guard = ingester.state.lock_fully().await.unwrap();
        assert_eq!(state_guard.shards.len(), 1);

        let queue_id_01 = queue_id(&index_uid, &source_id, &ShardId::from(1));
        let solo_shard_01 = state_guard.shards.get(&queue_id_01).unwrap();
        solo_shard_01.assert_is_solo();
        solo_shard_01.assert_is_open();
        solo_shard_01.assert_replication_position(Position::Beginning);

        state_guard
            .mrecordlog
            .assert_records_eq(&queue_id_01, .., &[]);
    }

    #[tokio::test]
    async fn test_ingester_persist_returns_routing_update() {
        let (ingester_ctx, ingester) = IngesterForTest::default().build().await;

        let index_uid_0 = IndexUid::for_test("test-index-0", 0);
        let index_uid_1 = IndexUid::for_test("test-index-1", 0);
        let source_id = SourceId::from("test-source");

        let doc_mapping_uid = DocMappingUid::random();
        let doc_mapping_json = format!(
            r#"{{
                "doc_mapping_uid": "{doc_mapping_uid}"
            }}"#
        );
        let init_shards_request = InitShardsRequest {
            subrequests: vec![
                InitShardSubrequest {
                    subrequest_id: 0,
                    shard: Some(Shard {
                        index_uid: Some(index_uid_0.clone()),
                        source_id: source_id.clone(),
                        shard_id: Some(ShardId::from(1)),
                        shard_state: ShardState::Open as i32,
                        leader_id: ingester_ctx.node_id.to_string(),
                        doc_mapping_uid: Some(doc_mapping_uid),
                        ..Default::default()
                    }),
                    doc_mapping_json: doc_mapping_json.clone(),
                    validate_docs: false,
                },
                InitShardSubrequest {
                    subrequest_id: 1,
                    shard: Some(Shard {
                        index_uid: Some(index_uid_1.clone()),
                        source_id: source_id.clone(),
                        shard_id: Some(ShardId::from(1)),
                        shard_state: ShardState::Open as i32,
                        leader_id: ingester_ctx.node_id.to_string(),
                        doc_mapping_uid: Some(doc_mapping_uid),
                        ..Default::default()
                    }),
                    doc_mapping_json,
                    validate_docs: false,
                },
            ],
        };
        ingester.init_shards(init_shards_request).await.unwrap();

        let persist_request = PersistRequest {
            leader_id: ingester_ctx.node_id.to_string(),
            commit_type: CommitTypeV2::Force as i32,
            subrequests: vec![
                PersistSubrequest {
                    subrequest_id: 0,
                    index_uid: Some(index_uid_0.clone()),
                    source_id: source_id.clone(),
                    doc_batch: Some(DocBatchV2::for_test([r#"{"doc": "test-doc-010"}"#])),
                },
                PersistSubrequest {
                    subrequest_id: 1,
                    index_uid: Some(index_uid_1.clone()),
                    source_id: source_id.clone(),
                    doc_batch: Some(DocBatchV2::for_test([r#"{"doc": "test-doc-110"}"#])),
                },
            ],
        };
        let persist_response = ingester.persist(persist_request).await.unwrap();
        assert_eq!(persist_response.successes.len(), 2);

        let routing_update = persist_response
            .routing_update
            .expect("routing update should be present");

        assert!(
            routing_update.capacity_score > 0,
            "capacity score should be non-zero after a small persist"
        );

        let mut source_shard_updates = routing_update.source_shard_updates;
        source_shard_updates.sort_by(|a, b| a.index_uid().cmp(b.index_uid()));

        assert_eq!(source_shard_updates.len(), 2);
        assert_eq!(source_shard_updates[0].index_uid(), &index_uid_0);
        assert_eq!(source_shard_updates[0].source_id, source_id.as_str());
        assert_eq!(source_shard_updates[0].open_shard_count, 1);
        assert_eq!(source_shard_updates[1].index_uid(), &index_uid_1);
        assert_eq!(source_shard_updates[1].source_id, source_id.as_str());
        assert_eq!(source_shard_updates[1].open_shard_count, 1);

        assert!(routing_update.closed_shards.is_empty());
    }

    #[tokio::test]
    async fn test_ingester_open_replication_stream() {
        let (_ingester_ctx, ingester) = IngesterForTest::default()
            .with_node_id("test-follower")
            .build()
            .await;

        let (syn_replication_stream_tx, syn_replication_stream) = ServiceStream::new_bounded(5);
        let open_stream_request = OpenReplicationStreamRequest {
            leader_id: "test-leader".to_string(),
            follower_id: "test-follower".to_string(),
            replication_seqno: 0,
        };
        let syn_replication_message = SynReplicationMessage::new_open_request(open_stream_request);
        syn_replication_stream_tx
            .send(syn_replication_message)
            .await
            .unwrap();
        let mut ack_replication_stream = ingester
            .open_replication_stream(syn_replication_stream)
            .await
            .unwrap();
        ack_replication_stream
            .next()
            .await
            .unwrap()
            .unwrap()
            .into_open_response()
            .unwrap();

        let state_guard = ingester.state.lock_fully().await.unwrap();
        assert!(state_guard.replication_tasks.contains_key("test-leader"));
    }

    #[tokio::test]
    async fn test_ingester_open_fetch_stream() {
        let (_ingester_ctx, ingester) = IngesterForTest::default().build().await;

        let index_uid = IndexUid::for_test("test-index", 0);
        let source_id = SourceId::from("test-source");
        let open_fetch_stream_request = OpenFetchStreamRequest {
            client_id: "test-client".to_string(),
            index_uid: Some(index_uid.clone()),
            source_id: source_id.clone(),
            shard_id: Some(ShardId::from(1337)),
            from_position_exclusive: Some(Position::Beginning),
        };
        let error = ingester
            .open_fetch_stream(open_fetch_stream_request)
            .await
            .unwrap_err();
        assert!(
            matches!(error, IngestV2Error::ShardNotFound { shard_id } if shard_id == ShardId::from(1337))
        );

        let doc_mapping_uid = DocMappingUid::random();
        let doc_mapping_json = format!(
            r#"{{
                "doc_mapping_uid": "{doc_mapping_uid}"
            }}"#
        );
        let shard = Shard {
            index_uid: Some(index_uid.clone()),
            source_id: source_id.clone(),
            shard_id: Some(ShardId::from(1)),
            shard_state: ShardState::Open as i32,
            doc_mapping_uid: Some(doc_mapping_uid),
            ..Default::default()
        };
        let queue_id = queue_id(&index_uid, &source_id, &ShardId::from(1));

        let mut state_guard = ingester.state.lock_fully().await.unwrap();

        ingester
            .init_primary_shard(
                &mut state_guard.inner,
                &mut state_guard.mrecordlog,
                shard,
                &doc_mapping_json,
                Instant::now(),
                true,
            )
            .await
            .unwrap();

        let records = [MRecord::new_doc("test-doc-foo").encode()].into_iter();

        state_guard
            .mrecordlog
            .append_records(&queue_id, None, records)
            .await
            .unwrap();

        drop(state_guard);

        let open_fetch_stream_request = OpenFetchStreamRequest {
            client_id: "test-client".to_string(),
            index_uid: Some(index_uid.clone()),
            source_id,
            shard_id: Some(ShardId::from(1)),
            from_position_exclusive: Some(Position::Beginning),
        };
        let mut fetch_stream = ingester
            .open_fetch_stream(open_fetch_stream_request)
            .await
            .unwrap();

        let fetch_response = fetch_stream.next().await.unwrap().unwrap();
        let fetch_payload = into_fetch_payload(fetch_response);

        assert_eq!(fetch_payload.from_position_exclusive(), Position::Beginning);
        assert_eq!(
            fetch_payload.to_position_inclusive(),
            Position::offset(0u64)
        );

        let mrecord_batch = fetch_payload.mrecord_batch.unwrap();
        assert_eq!(
            mrecord_batch.mrecord_buffer,
            Bytes::from_static(b"\0\0test-doc-foo")
        );
        assert_eq!(mrecord_batch.mrecord_lengths, [14]);

        let mut state_guard = ingester.state.lock_fully().await.unwrap();

        let records = [MRecord::new_doc("test-doc-bar").encode()].into_iter();

        state_guard
            .mrecordlog
            .append_records(&queue_id, None, records)
            .await
            .unwrap();

        let shard = state_guard.shards.get(&queue_id).unwrap();
        assert!(shard.is_advertisable);
        shard.notify_shard_status();
        drop(state_guard);

        let fetch_response = fetch_stream.next().await.unwrap().unwrap();
        let fetch_payload = into_fetch_payload(fetch_response);

        assert_eq!(
            fetch_payload.from_position_exclusive(),
            Position::offset(0u64)
        );
        assert_eq!(
            fetch_payload.to_position_inclusive(),
            Position::offset(1u64)
        );

        let mrecord_batch = fetch_payload.mrecord_batch.unwrap();
        assert_eq!(
            mrecord_batch.mrecord_buffer,
            Bytes::from_static(b"\0\0test-doc-bar")
        );
        assert_eq!(mrecord_batch.mrecord_lengths, [14]);
    }

    #[tokio::test]
    async fn test_ingester_truncate_shards() {
        let (ingester_ctx, ingester) = IngesterForTest::default().build().await;

        let index_uid = IndexUid::for_test("test-index", 0);
        let source_id = SourceId::from("test-source");
        let queue_id_01 = queue_id(&index_uid, &source_id, &ShardId::from(1));
        let queue_id_02 = queue_id(&index_uid, &source_id, &ShardId::from(2));

        let doc_mapping_uid_01 = DocMappingUid::random();
        let doc_mapping_json_01 = format!(
            r#"{{
                "doc_mapping_uid": "{doc_mapping_uid_01}"
            }}"#
        );
        let shard_01 = Shard {
            index_uid: Some(index_uid.clone()),
            source_id: source_id.clone(),
            shard_id: Some(ShardId::from(1)),
            shard_state: ShardState::Open as i32,
            doc_mapping_uid: Some(doc_mapping_uid_01),
            ..Default::default()
        };

        let doc_mapping_uid_02 = DocMappingUid::random();
        let doc_mapping_json_02 = format!(
            r#"{{
                "doc_mapping_uid": "{doc_mapping_uid_02}"
            }}"#
        );
        let shard_02 = Shard {
            index_uid: Some(index_uid.clone()),
            source_id: source_id.clone(),
            shard_id: Some(ShardId::from(2)),
            shard_state: ShardState::Closed as i32,
            doc_mapping_uid: Some(doc_mapping_uid_02),
            ..Default::default()
        };
        let mut state_guard = ingester.state.lock_fully().await.unwrap();
        let now = Instant::now();

        ingester
            .init_primary_shard(
                &mut state_guard.inner,
                &mut state_guard.mrecordlog,
                shard_01,
                &doc_mapping_json_01,
                now,
                true,
            )
            .await
            .unwrap();
        ingester
            .init_primary_shard(
                &mut state_guard.inner,
                &mut state_guard.mrecordlog,
                shard_02,
                &doc_mapping_json_02,
                now,
                true,
            )
            .await
            .unwrap();

        assert_eq!(state_guard.shards.len(), 2);
        assert_eq!(state_guard.doc_mappers.len(), 2);

        let records = [
            MRecord::new_doc("test-doc-foo").encode(),
            MRecord::new_doc("test-doc-bar").encode(),
        ]
        .into_iter();

        state_guard
            .mrecordlog
            .append_records(&queue_id_01, None, records)
            .await
            .unwrap();

        let records = [MRecord::new_doc("test-doc-baz").encode()].into_iter();

        state_guard
            .mrecordlog
            .append_records(&queue_id_02, None, records)
            .await
            .unwrap();

        drop(state_guard);

        let truncate_shards_request = TruncateShardsRequest {
            ingester_id: ingester_ctx.node_id.to_string(),
            subrequests: vec![
                TruncateShardsSubrequest {
                    index_uid: Some(index_uid.clone()),
                    source_id: source_id.clone(),
                    shard_id: Some(ShardId::from(1)),
                    truncate_up_to_position_inclusive: Some(Position::offset(0u64)),
                },
                TruncateShardsSubrequest {
                    index_uid: Some(index_uid.clone()),
                    source_id: source_id.clone(),
                    shard_id: Some(ShardId::from(2)),
                    truncate_up_to_position_inclusive: Some(Position::eof(0u64)),
                },
                TruncateShardsSubrequest {
                    index_uid: Some(IndexUid::for_test("test-index", 1337)),
                    source_id,
                    shard_id: Some(ShardId::from(1337)),
                    truncate_up_to_position_inclusive: Some(Position::offset(1337u64)),
                },
            ],
        };
        ingester
            .truncate_shards(truncate_shards_request.clone())
            .await
            .unwrap();

        // Verify idempotency.
        ingester
            .truncate_shards(truncate_shards_request)
            .await
            .unwrap();

        let state_guard = ingester.state.lock_fully().await.unwrap();

        assert_eq!(state_guard.shards.len(), 1);
        assert_eq!(state_guard.doc_mappers.len(), 1);

        assert!(state_guard.shards.contains_key(&queue_id_01));
        assert!(state_guard.doc_mappers.contains_key(&doc_mapping_uid_01));

        state_guard
            .mrecordlog
            .assert_records_eq(&queue_id_01, .., &[(1, [0, 0], "test-doc-bar")]);
    }

    #[tokio::test]
    async fn test_ingester_truncate_shards_deletes_dangling_shards() {
        let (ingester_ctx, ingester) = IngesterForTest::default().build().await;

        let index_uid = IndexUid::for_test("test-index", 0);
        let source_id = SourceId::from("test-source");

        let mut state_guard = ingester.state.lock_fully().await.unwrap();
        let solo_shard =
            IngesterShard::new_solo(index_uid.clone(), source_id.clone(), ShardId::from(1)).build();
        state_guard.shards.insert(solo_shard.queue_id(), solo_shard);
        drop(state_guard);

        let truncate_shards_request = TruncateShardsRequest {
            ingester_id: ingester_ctx.node_id.to_string(),
            subrequests: vec![TruncateShardsSubrequest {
                index_uid: Some(index_uid.clone()),
                source_id,
                shard_id: Some(ShardId::from(1)),
                truncate_up_to_position_inclusive: Some(Position::offset(0u64)),
            }],
        };
        ingester
            .truncate_shards(truncate_shards_request.clone())
            .await
            .unwrap();

        let state_guard = ingester.state.lock_fully().await.unwrap();
        assert_eq!(state_guard.shards.len(), 0);
    }

    #[tokio::test]
    async fn test_ingester_reset_shards() {
        let mut mock_control_plane = MockControlPlaneService::new();
        mock_control_plane
            .expect_advise_reset_shards()
            .once()
            .returning(|_| Ok(AdviseResetShardsResponse::default()));

        mock_control_plane
            .expect_advise_reset_shards()
            .once()
            .returning(|mut request| {
                assert_eq!(request.ingester_id, "test-ingester");
                assert_eq!(request.shard_ids.len(), 1);
                assert_eq!(request.shard_ids[0].index_uid(), &("test-index", 0));
                assert_eq!(request.shard_ids[0].source_id, "test-source");
                request.shard_ids[0].shard_ids.sort_unstable();
                assert_eq!(
                    request.shard_ids[0].shard_ids,
                    [ShardId::from(1), ShardId::from(2)]
                );
                let response = AdviseResetShardsResponse {
                    shards_to_delete: vec![ShardIds {
                        index_uid: Some(IndexUid::for_test("test-index", 0)),
                        source_id: "test-source".to_string(),
                        shard_ids: vec![ShardId::from(1)],
                    }],
                    shards_to_truncate: vec![ShardIdPositions {
                        index_uid: Some(IndexUid::for_test("test-index", 0)),
                        source_id: "test-source".to_string(),
                        shard_positions: vec![ShardIdPosition {
                            shard_id: Some(ShardId::from(2)),
                            publish_position_inclusive: Some(Position::offset(1u64)),
                        }],
                    }],
                };
                Ok(response)
            });
        let control_plane = ControlPlaneServiceClient::from_mock(mock_control_plane);

        let (_ingester_ctx, mut ingester) = IngesterForTest::default()
            .with_control_plane(control_plane)
            .build()
            .await;

        let index_uid = IndexUid::for_test("test-index", 0);
        let source_id = SourceId::from("test-source");

        let doc_mapping_uid = DocMappingUid::random();
        let doc_mapping_json = format!(
            r#"{{
                "doc_mapping_uid": "{doc_mapping_uid}"
            }}"#
        );
        let shard_01 = Shard {
            index_uid: Some(index_uid.clone()),
            source_id: source_id.clone(),
            shard_id: Some(ShardId::from(1)),
            shard_state: ShardState::Open as i32,
            doc_mapping_uid: Some(doc_mapping_uid),
            ..Default::default()
        };
        let shard_02 = Shard {
            index_uid: Some(index_uid.clone()),
            source_id: source_id.clone(),
            shard_id: Some(ShardId::from(2)),
            shard_state: ShardState::Open as i32,
            doc_mapping_uid: Some(doc_mapping_uid),
            ..Default::default()
        };
        let queue_id_02 = queue_id(&index_uid, &source_id, &ShardId::from(2));

        let mut state_guard = ingester.state.lock_fully().await.unwrap();
        let now = Instant::now();

        ingester
            .init_primary_shard(
                &mut state_guard.inner,
                &mut state_guard.mrecordlog,
                shard_01,
                &doc_mapping_json,
                now,
                true,
            )
            .await
            .unwrap();
        ingester
            .init_primary_shard(
                &mut state_guard.inner,
                &mut state_guard.mrecordlog,
                shard_02,
                &doc_mapping_json,
                now,
                true,
            )
            .await
            .unwrap();

        let records = [
            MRecord::new_doc("test-doc-foo").encode(),
            MRecord::new_doc("test-doc-bar").encode(),
        ]
        .into_iter();

        state_guard
            .mrecordlog
            .append_records(&queue_id_02, None, records)
            .await
            .unwrap();

        drop(state_guard);

        ingester.reset_shards().await;

        let state_guard = ingester.state.lock_partially().await.unwrap();
        assert_eq!(state_guard.shards.len(), 1);

        let shard_02 = state_guard.shards.get(&queue_id_02).unwrap();
        shard_02.assert_truncation_position(Position::offset(1u64));
    }

    #[tokio::test]
    async fn test_ingester_retain_shards() {
        let (_ingester_ctx, ingester) = IngesterForTest::default().build().await;

        let index_uid = IndexUid::for_test("test-index", 0);
        let source_id = SourceId::from("test-source");

        let doc_mapping_uid = DocMappingUid::random();
        let doc_mapping_json = format!(
            r#"{{
                "doc_mapping_uid": "{doc_mapping_uid}"
            }}"#
        );
        let shard_17 = Shard {
            index_uid: Some(index_uid.clone()),
            source_id: source_id.clone(),
            shard_id: Some(ShardId::from(17)),
            shard_state: ShardState::Open as i32,
            doc_mapping_uid: Some(doc_mapping_uid),
            ..Default::default()
        };

        let shard_18 = Shard {
            index_uid: Some(index_uid.clone()),
            source_id: source_id.clone(),
            shard_id: Some(ShardId::from(18)),
            shard_state: ShardState::Closed as i32,
            doc_mapping_uid: Some(doc_mapping_uid),
            ..Default::default()
        };
        let queue_id_17 = queue_id(
            shard_17.index_uid(),
            &shard_17.source_id,
            shard_17.shard_id(),
        );

        let mut state_guard = ingester.state.lock_fully().await.unwrap();
        let now = Instant::now();

        ingester
            .init_primary_shard(
                &mut state_guard.inner,
                &mut state_guard.mrecordlog,
                shard_17,
                &doc_mapping_json,
                now,
                true,
            )
            .await
            .unwrap();

        ingester
            .init_primary_shard(
                &mut state_guard.inner,
                &mut state_guard.mrecordlog,
                shard_18,
                &doc_mapping_json,
                now,
                true,
            )
            .await
            .unwrap();

        drop(state_guard);

        {
            let state_guard = ingester.state.lock_fully().await.unwrap();
            assert_eq!(state_guard.shards.len(), 2);
        }

        let retain_shards_request = RetainShardsRequest {
            retain_shards_for_sources: vec![RetainShardsForSource {
                index_uid: Some(index_uid.clone()),
                source_id,
                shard_ids: vec![ShardId::from(17u64)],
            }],
        };
        ingester.retain_shards(retain_shards_request).await.unwrap();

        {
            let state_guard = ingester.state.lock_fully().await.unwrap();
            assert_eq!(state_guard.shards.len(), 1);
            assert!(state_guard.shards.contains_key(&queue_id_17));
        }
    }

    #[tokio::test]
    async fn test_ingester_close_shards() {
        let (_ingester_ctx, ingester) = IngesterForTest::default().build().await;

        let index_uid = IndexUid::for_test("test-index", 0);
        let source_id = SourceId::from("test-source");
        let queue_id = queue_id(&index_uid, &source_id, &ShardId::from(1));

        let doc_mapping_uid = DocMappingUid::random();
        let doc_mapping_json = format!(
            r#"{{
                "doc_mapping_uid": "{doc_mapping_uid}"
            }}"#
        );
        let shard = Shard {
            index_uid: Some(index_uid.clone()),
            source_id: source_id.clone(),
            shard_id: Some(ShardId::from(1)),
            shard_state: ShardState::Open as i32,
            doc_mapping_uid: Some(doc_mapping_uid),
            publish_position_inclusive: Some(Position::Beginning),
            ..Default::default()
        };
        let mut state_guard = ingester.state.lock_fully().await.unwrap();
        ingester
            .init_primary_shard(
                &mut state_guard.inner,
                &mut state_guard.mrecordlog,
                shard,
                &doc_mapping_json,
                Instant::now(),
                true,
            )
            .await
            .unwrap();
        drop(state_guard);

        let open_fetch_stream_request = OpenFetchStreamRequest {
            client_id: "test-client".to_string(),
            index_uid: Some(index_uid.clone()),
            source_id: source_id.clone(),
            shard_id: Some(ShardId::from(1)),
            from_position_exclusive: Some(Position::Beginning),
        };
        let mut fetch_stream = ingester
            .open_fetch_stream(open_fetch_stream_request)
            .await
            .unwrap();

        let close_shards_request = CloseShardsRequest {
            shard_pkeys: vec![
                ShardPKey {
                    index_uid: Some(index_uid.clone()),
                    source_id: source_id.clone(),
                    shard_id: Some(ShardId::from(1)),
                },
                ShardPKey {
                    index_uid: Some(index_uid.clone()),
                    source_id,
                    shard_id: Some(ShardId::from(1337)),
                },
            ],
        };
        let closed_shards_response = ingester
            .close_shards(close_shards_request.clone())
            .await
            .unwrap();
        assert_eq!(closed_shards_response.successes.len(), 1);

        let close_shard_success = &closed_shards_response.successes[0];
        assert_eq!(close_shard_success.index_uid(), &index_uid);
        assert_eq!(close_shard_success.source_id, "test-source");
        assert_eq!(close_shard_success.shard_id(), ShardId::from(1));

        // Verify idempotency.
        ingester
            .close_shards(close_shards_request.clone())
            .await
            .unwrap();

        let state_guard = ingester.state.lock_partially().await.unwrap();
        let shard = state_guard.shards.get(&queue_id).unwrap();
        shard.assert_is_closed();

        let fetch_response = timeout(Duration::from_millis(100), fetch_stream.next())
            .await
            .unwrap()
            .unwrap()
            .unwrap();
        let fetch_eof = into_fetch_eof(fetch_response);

        assert_eq!(fetch_eof.eof_position(), Position::Beginning.as_eof());
    }

    #[tokio::test]
    async fn test_ingester_open_observation_stream() {
        let (ingester_ctx, ingester) = IngesterForTest::default().build().await;

        let mut observation_stream = ingester
            .open_observation_stream(OpenObservationStreamRequest {})
            .await
            .unwrap();
        let observation = observation_stream.next().await.unwrap().unwrap();
        assert_eq!(observation.node_id, ingester_ctx.node_id);
        assert_eq!(observation.status(), IngesterStatus::Ready);

        let mut state_guard = ingester.state.lock_fully().await.unwrap();
        state_guard
            .set_status(IngesterStatus::Decommissioning)
            .await;
        drop(state_guard);

        let observation = observation_stream.next().await.unwrap().unwrap();
        assert_eq!(observation.node_id, ingester_ctx.node_id);
        assert_eq!(observation.status(), IngesterStatus::Decommissioning);

        drop(ingester);

        let observation_opt = observation_stream.next().await;
        assert!(observation_opt.is_none());
    }

    #[tokio::test]
    async fn test_ingester_decommission() {
        let (_ingester_ctx, ingester) = IngesterForTest::default().build().await;

        let mut state_guard = ingester.state.lock_fully().await.unwrap();
        let index_uid = IndexUid::for_test("test-index", 0);
        let source_id = SourceId::from("test-source");

        let shard = IngesterShard::new_solo(index_uid, source_id, ShardId::from(1)).build();
        let queue_id = shard.queue_id();

        state_guard.shards.insert(queue_id.clone(), shard);
        drop(state_guard);

        let mut observation_stream = ingester
            .open_observation_stream(OpenObservationStreamRequest {})
            .await
            .unwrap();

        ingester.decommission(DecommissionRequest {}).await.unwrap();

        let next_observation = observation_stream.next().await.unwrap().unwrap();
        let next_status = next_observation.status();
        assert_eq!(next_status, IngesterStatus::Retiring);

        wait_for_ingester_status(
            &ingester,
            IngesterStatus::Decommissioning,
            Duration::from_secs(1),
        )
        .await
        .unwrap();

        let state_guard = ingester.state.lock_fully().await.unwrap();
        let shard = state_guard.shards.get(&queue_id).unwrap();
        shard.assert_is_closed();
    }

    #[tokio::test]
    async fn test_check_decommissioning_status() {
        let (_ingester_ctx, ingester) = IngesterForTest::default().build().await;
        let mut state_guard = ingester.state.lock_fully().await.unwrap();

        ingester
            .check_decommissioning_status(&mut state_guard)
            .await;
        assert_eq!(state_guard.status(), IngesterStatus::Ready);

        state_guard
            .set_status(IngesterStatus::Decommissioning)
            .await;
        ingester
            .check_decommissioning_status(&mut state_guard)
            .await;
        assert_eq!(state_guard.status(), IngesterStatus::Decommissioned);

        state_guard
            .set_status(IngesterStatus::Decommissioning)
            .await;

        let index_uid = IndexUid::for_test("test-index", 0);
        let source_id = SourceId::from("test-source");

        let solo_shard = IngesterShard::new_solo(index_uid.clone(), source_id, ShardId::from(1))
            .with_state(ShardState::Closed)
            .with_replication_position_inclusive(Position::offset(12u64))
            .build();
        let queue_id = solo_shard.queue_id();

        state_guard.shards.insert(queue_id.clone(), solo_shard);
        ingester
            .check_decommissioning_status(&mut state_guard)
            .await;
        assert_eq!(state_guard.status(), IngesterStatus::Decommissioning);

        let shard = state_guard.shards.get_mut(&queue_id).unwrap();
        shard.truncation_position_inclusive = Position::Beginning.as_eof();

        ingester
            .check_decommissioning_status(&mut state_guard)
            .await;
        assert_eq!(state_guard.status(), IngesterStatus::Decommissioned);
    }

    #[tokio::test]
    async fn test_ingester_truncate_on_shard_positions_update() {
        let (_ingester_ctx, ingester) = IngesterForTest::default().build().await;
        let event_broker = EventBroker::default();
        ingester.subscribe(&event_broker);

        let index_uid = IndexUid::for_test("test-index", 0);
        let source_id = SourceId::from("test-source");

        let doc_mapping_uid = DocMappingUid::random();
        let doc_mapping_json = format!(
            r#"{{
                "doc_mapping_uid": "{doc_mapping_uid}"
            }}"#
        );
        let shard_01 = Shard {
            index_uid: Some(index_uid.clone()),
            source_id: source_id.clone(),
            shard_id: Some(ShardId::from(1)),
            shard_state: ShardState::Open as i32,
            doc_mapping_uid: Some(doc_mapping_uid),
            ..Default::default()
        };
        let queue_id_01 = queue_id(&index_uid, &source_id, &ShardId::from(1));

        let shard_02 = Shard {
            index_uid: Some(index_uid.clone()),
            source_id: source_id.clone(),
            shard_id: Some(ShardId::from(2)),
            shard_state: ShardState::Closed as i32,
            doc_mapping_uid: Some(doc_mapping_uid),
            ..Default::default()
        };
        let queue_id_02 = queue_id(&index_uid, &source_id, &ShardId::from(2));

        let mut state_guard = ingester.state.lock_fully().await.unwrap();
        let now = Instant::now();

        ingester
            .init_primary_shard(
                &mut state_guard.inner,
                &mut state_guard.mrecordlog,
                shard_01,
                &doc_mapping_json,
                now,
                true,
            )
            .await
            .unwrap();
        ingester
            .init_primary_shard(
                &mut state_guard.inner,
                &mut state_guard.mrecordlog,
                shard_02,
                &doc_mapping_json,
                now,
                true,
            )
            .await
            .unwrap();

        let records = [
            MRecord::new_doc("test-doc-foo").encode(),
            MRecord::new_doc("test-doc-bar").encode(),
        ]
        .into_iter();

        state_guard
            .mrecordlog
            .append_records(&queue_id_01, None, records)
            .await
            .unwrap();

        let records = [MRecord::new_doc("test-doc-baz").encode()].into_iter();

        state_guard
            .mrecordlog
            .append_records(&queue_id_02, None, records)
            .await
            .unwrap();

        drop(state_guard);

        let shard_position_update = ShardPositionsUpdate {
            source_uid: SourceUid {
                index_uid: index_uid.clone(),
                source_id,
            },
            updated_shard_positions: vec![
                (ShardId::from(1), Position::offset(0u64)),
                (ShardId::from(2), Position::eof(0u64)),
                (ShardId::from(1337), Position::offset(1337u64)),
            ],
        };
        event_broker.publish(shard_position_update.clone());

        // Verify idempotency.
        event_broker.publish(shard_position_update);

        // Yield so that the event is processed.
        yield_now().await;

        let state_guard = ingester.state.lock_fully().await.unwrap();
        assert_eq!(state_guard.shards.len(), 1);

        assert!(state_guard.shards.contains_key(&queue_id_01));

        state_guard
            .mrecordlog
            .assert_records_eq(&queue_id_01, .., &[(1, [0, 0], "test-doc-bar")]);

        assert!(!state_guard.shards.contains_key(&queue_id_02));
        assert!(!state_guard.mrecordlog.queue_exists(&queue_id_02));
    }

    #[tokio::test]
    async fn test_ingester_closes_idle_shards() {
        // The `CloseIdleShardsTask` task is already unit tested, so this test ensures the task is
        // correctly spawned upon starting an ingester.
        let idle_shard_timeout = Duration::from_millis(200);
        let (_ingester_ctx, ingester) = IngesterForTest::default()
            .with_idle_shard_timeout(idle_shard_timeout)
            .build()
            .await;

        let index_uid = IndexUid::for_test("test-index", 0);
        let source_id = SourceId::from("test-source");
        let queue_id_01 = queue_id(&index_uid, &source_id, &ShardId::from(1));

        let doc_mapping_uid = DocMappingUid::random();
        let doc_mapping_json = format!(
            r#"{{
                "doc_mapping_uid": "{doc_mapping_uid}"
            }}"#
        );
        let shard_01 = Shard {
            index_uid: Some(index_uid.clone()),
            source_id,
            shard_id: Some(ShardId::from(1)),
            shard_state: ShardState::Open as i32,
            doc_mapping_uid: Some(doc_mapping_uid),
            ..Default::default()
        };
        let mut state_guard = ingester.state.lock_fully().await.unwrap();
        let now = Instant::now();

        ingester
            .init_primary_shard(
                &mut state_guard.inner,
                &mut state_guard.mrecordlog,
                shard_01,
                &doc_mapping_json,
                now - idle_shard_timeout,
                true,
            )
            .await
            .unwrap();

        drop(state_guard);

        for _ in 0..10 {
            tokio::time::sleep(Duration::from_millis(100)).await;

            let state_guard = ingester.state.lock_partially().await.unwrap();
            let shard = state_guard.shards.get(&queue_id_01).unwrap();

            if shard.is_closed() {
                return;
            }
            drop(state_guard);
        }
        panic!("idle shard was not closed");
    }

    #[tokio::test]
    async fn test_ingester_debug_info() {
        let (_ingester_ctx, ingester) = IngesterForTest::default().build().await;

        let index_uid_0: IndexUid = IndexUid::for_test("test-index-0", 0);
        let index_uid_1: IndexUid = IndexUid::for_test("test-index-1", 0);
        let source_id = SourceId::from("test-source");

        let doc_mapping_uid = DocMappingUid::random();
        let doc_mapping_json = format!(
            r#"{{
                "doc_mapping_uid": "{doc_mapping_uid}"
            }}"#
        );
        let shard_01 = Shard {
            index_uid: Some(index_uid_0.clone()),
            source_id: source_id.clone(),
            shard_id: Some(ShardId::from(1)),
            shard_state: ShardState::Open as i32,
            doc_mapping_uid: Some(doc_mapping_uid),
            ..Default::default()
        };
        let shard_02 = Shard {
            index_uid: Some(index_uid_0.clone()),
            source_id: source_id.clone(),
            shard_id: Some(ShardId::from(2)),
            shard_state: ShardState::Closed as i32,
            doc_mapping_uid: Some(doc_mapping_uid),
            ..Default::default()
        };
        let shard_03 = Shard {
            index_uid: Some(index_uid_1.clone()),
            source_id,
            shard_id: Some(ShardId::from(3)),
            shard_state: ShardState::Closed as i32,
            doc_mapping_uid: Some(doc_mapping_uid),
            ..Default::default()
        };
        let mut state_guard = ingester.state.lock_fully().await.unwrap();
        let now = Instant::now();

        ingester
            .init_primary_shard(
                &mut state_guard.inner,
                &mut state_guard.mrecordlog,
                shard_01,
                &doc_mapping_json,
                now,
                true,
            )
            .await
            .unwrap();
        ingester
            .init_primary_shard(
                &mut state_guard.inner,
                &mut state_guard.mrecordlog,
                shard_02,
                &doc_mapping_json,
                now,
                true,
            )
            .await
            .unwrap();
        ingester
            .init_primary_shard(
                &mut state_guard.inner,
                &mut state_guard.mrecordlog,
                shard_03,
                &doc_mapping_json,
                now,
                true,
            )
            .await
            .unwrap();
        drop(state_guard);

        let debug_info = ingester.debug_info().await;
        assert_eq!(debug_info["status"], "ready");

        let shards = &debug_info["shards"];
        assert_eq!(shards.as_object().unwrap().len(), 2);

        assert_eq!(
            shards["test-index-0:00000000000000000000000000"]
                .as_array()
                .unwrap()
                .len(),
            2
        );
        assert_eq!(
            shards["test-index-1:00000000000000000000000000"]
                .as_array()
                .unwrap()
                .len(),
            1
        );
    }
}


================================================
FILE: quickwit/quickwit-ingest/src/ingest_v2/metrics.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use mrecordlog::ResourceUsage;
use once_cell::sync::Lazy;
use quickwit_common::metrics::{
    Histogram, HistogramVec, IntCounter, IntCounterVec, IntGauge, IntGaugeVec, exponential_buckets,
    linear_buckets, new_counter_vec, new_gauge, new_gauge_vec, new_histogram, new_histogram_vec,
};

// Counter vec counting the different outcomes of ingest requests as
// measure at the end of the router work.
//
// The counter are counting persist subrequests.
pub(crate) struct IngestResultMetrics {
    pub success: IntCounter,
    pub circuit_breaker: IntCounter,
    pub unspecified: IntCounter,
    pub index_not_found: IntCounter,
    pub source_not_found: IntCounter,
    pub internal: IntCounter,
    pub no_shards_available: IntCounter,
    pub shard_rate_limited: IntCounter,
    pub wal_full: IntCounter,
    pub timeout: IntCounter,
    pub router_timeout: IntCounter,
    pub router_load_shedding: IntCounter,
    pub load_shedding: IntCounter,
    pub shard_not_found: IntCounter,
    pub unavailable: IntCounter,
}

impl Default for IngestResultMetrics {
    fn default() -> Self {
        let ingest_result_total_vec = new_counter_vec::<1>(
            "ingest_result_total",
            "Number of ingest requests by result",
            "ingest",
            &[],
            ["result"],
        );
        Self {
            success: ingest_result_total_vec.with_label_values(["success"]),
            circuit_breaker: ingest_result_total_vec.with_label_values(["circuit_breaker"]),
            unspecified: ingest_result_total_vec.with_label_values(["unspecified"]),
            index_not_found: ingest_result_total_vec.with_label_values(["index_not_found"]),
            source_not_found: ingest_result_total_vec.with_label_values(["source_not_found"]),
            internal: ingest_result_total_vec.with_label_values(["internal"]),
            no_shards_available: ingest_result_total_vec.with_label_values(["no_shards_available"]),
            shard_rate_limited: ingest_result_total_vec.with_label_values(["shard_rate_limited"]),
            wal_full: ingest_result_total_vec.with_label_values(["wal_full"]),
            timeout: ingest_result_total_vec.with_label_values(["timeout"]),
            router_timeout: ingest_result_total_vec.with_label_values(["router_timeout"]),
            router_load_shedding: ingest_result_total_vec
                .with_label_values(["router_load_shedding"]),
            load_shedding: ingest_result_total_vec.with_label_values(["load_shedding"]),
            unavailable: ingest_result_total_vec.with_label_values(["unavailable"]),
            shard_not_found: ingest_result_total_vec.with_label_values(["shard_not_found"]),
        }
    }
}

pub(super) struct IngestV2Metrics {
    pub reset_shards_operations_total: IntCounterVec<1>,
    pub open_shards: IntGauge,
    pub closed_shards: IntGauge,
    pub shard_lt_throughput_mib: Histogram,
    pub shard_st_throughput_mib: Histogram,
    pub wal_acquire_lock_requests_in_flight: IntGaugeVec<2>,
    pub wal_acquire_lock_request_duration_secs: HistogramVec<2>,
    pub wal_disk_used_bytes: IntGauge,
    pub wal_memory_used_bytes: IntGauge,
    pub ingest_results: IngestResultMetrics,
    pub ingest_attempts: IntCounterVec<1>,
}

impl Default for IngestV2Metrics {
    fn default() -> Self {
        Self {
            ingest_results: IngestResultMetrics::default(),
            ingest_attempts: new_counter_vec::<1>(
                "ingest_attempts",
                "Number of routing attempts by AZ locality",
                "ingest",
                &[],
                ["az_routing"],
            ),
            reset_shards_operations_total: new_counter_vec(
                "reset_shards_operations_total",
                "Total number of reset shards operations performed.",
                "ingest",
                &[],
                ["status"],
            ),
            open_shards: new_gauge(
                "shards",
                "Number of shards hosted by the ingester.",
                "ingest",
                &[("state", "open")],
            ),
            closed_shards: new_gauge(
                "shards",
                "Number of shards hosted by the ingester.",
                "ingest",
                &[("state", "closed")],
            ),
            shard_lt_throughput_mib: new_histogram(
                "shard_lt_throughput_mib",
                "Shard long term throughput as reported through chitchat",
                "ingest",
                linear_buckets(0.0f64, 1.0f64, 15).unwrap(),
            ),
            shard_st_throughput_mib: new_histogram(
                "shard_st_throughput_mib",
                "Shard short term throughput as reported through chitchat",
                "ingest",
                linear_buckets(0.0f64, 1.0f64, 15).unwrap(),
            ),
            wal_acquire_lock_requests_in_flight: new_gauge_vec(
                "wal_acquire_lock_requests_in_flight",
                "Number of acquire lock requests in-flight.",
                "ingest",
                &[],
                ["operation", "type"],
            ),
            wal_acquire_lock_request_duration_secs: new_histogram_vec(
                "wal_acquire_lock_request_duration_secs",
                "Duration of acquire lock requests in seconds.",
                "ingest",
                &[],
                ["operation", "type"],
                exponential_buckets(0.001, 2.0, 12).unwrap(),
            ),
            wal_disk_used_bytes: new_gauge(
                "wal_disk_used_bytes",
                "WAL disk space used in bytes.",
                "ingest",
                &[],
            ),
            wal_memory_used_bytes: new_gauge(
                "wal_memory_used_bytes",
                "WAL memory used in bytes.",
                "ingest",
                &[],
            ),
        }
    }
}

pub(super) fn report_wal_usage(wal_usage: ResourceUsage) {
    INGEST_V2_METRICS
        .wal_disk_used_bytes
        .set(wal_usage.disk_used_bytes as i64);
    quickwit_common::metrics::MEMORY_METRICS
        .in_flight
        .wal
        .set(wal_usage.memory_allocated_bytes as i64);
    INGEST_V2_METRICS
        .wal_memory_used_bytes
        .set(wal_usage.memory_used_bytes as i64);
}

pub(super) static INGEST_V2_METRICS: Lazy<IngestV2Metrics> = Lazy::new(IngestV2Metrics::default);


================================================
FILE: quickwit/quickwit-ingest/src/ingest_v2/mod.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

mod broadcast;
mod debouncing;
mod doc_mapper;
mod fetch;
mod helpers;
mod idle;
mod ingester;
mod metrics;
mod models;
mod mrecord;
mod mrecordlog_utils;
mod publish_tracker;
mod rate_meter;
mod replication;
mod router;
mod routing_table;
mod state;
mod wal_capacity_tracker;
mod workbench;

use std::collections::HashMap;
use std::collections::hash_map::Entry;
use std::ops::{Add, AddAssign};
use std::time::Duration;
use std::{env, fmt};

pub use broadcast::{
    LocalShardsUpdate, ShardInfo, ShardInfos, setup_ingester_capacity_update_listener,
    setup_local_shards_update_listener,
};
use bytes::buf::Writer;
use bytes::{BufMut, BytesMut};
use bytesize::ByteSize;
use quickwit_common::tower::Pool;
use quickwit_proto::ingest::ingester::{IngesterServiceClient, IngesterStatus};
use quickwit_proto::ingest::router::{IngestRequestV2, IngestSubrequest};
use quickwit_proto::ingest::{CommitTypeV2, DocBatchV2};
use quickwit_proto::types::{
    DocUid, DocUidGenerator, IndexId, IndexUid, NodeId, SourceId, SubrequestId,
};
use serde::Serialize;
use tracing::{error, info};
use workbench::pending_subrequests;

pub use self::fetch::{FetchStreamError, MultiFetchStream};
pub use self::helpers::{
    try_get_ingester_status, wait_for_ingester_decommission, wait_for_ingester_status,
};
pub use self::ingester::Ingester;
use self::mrecord::MRECORD_HEADER_LEN;
pub use self::mrecord::{MRecord, decoded_mrecords};
pub use self::router::IngestRouter;

/// An ingester as represented in the pool, bundling the gRPC client with node metadata.
#[derive(Debug, Clone)]
pub struct IngesterPoolEntry {
    pub client: IngesterServiceClient,
    pub status: IngesterStatus,
    pub availability_zone: Option<String>,
}

impl IngesterPoolEntry {
    #[cfg(any(test, feature = "testsuite"))]
    pub fn ready_with_client(client: IngesterServiceClient) -> Self {
        IngesterPoolEntry {
            client,
            status: IngesterStatus::Ready,
            availability_zone: None,
        }
    }

    #[cfg(any(test, feature = "testsuite"))]
    pub fn mocked_ingester() -> Self {
        IngesterPoolEntry {
            client: IngesterServiceClient::mocked(),
            status: IngesterStatus::Ready,
            availability_zone: None,
        }
    }
}

pub type IngesterPool = Pool<NodeId, IngesterPoolEntry>;

/// Identifies an ingester client, typically a source, for logging and debugging purposes.
pub type ClientId = String;

pub type LeaderId = NodeId;

pub type FollowerId = NodeId;

pub type OpenShardCounts = Vec<(IndexUid, SourceId, usize)>;

const IDLE_SHARD_TIMEOUT_ENV_KEY: &str = "QW_IDLE_SHARD_TIMEOUT_SECS";

const DEFAULT_IDLE_SHARD_TIMEOUT: Duration = Duration::from_secs(15 * 60); // 15 minutes

pub fn get_idle_shard_timeout() -> Duration {
    env::var(IDLE_SHARD_TIMEOUT_ENV_KEY)
        .ok()
        .and_then(|idle_shard_timeout_str| {
            if let Ok(idle_shard_timeout_secs) = idle_shard_timeout_str.parse::<u64>() {
                info!("overriding idle shard timeout to {idle_shard_timeout_secs} seconds");
                Some(idle_shard_timeout_secs)
            } else {
                error!(
                    "failed to parse environment variable \
                     `{IDLE_SHARD_TIMEOUT_ENV_KEY}={idle_shard_timeout_str}`"
                );
                None
            }
        })
        .map(Duration::from_secs)
        .unwrap_or(DEFAULT_IDLE_SHARD_TIMEOUT)
}

const INGEST_ROUTER_BUFFER_SIZE_ENV_KEY: &str = "QW_INGEST_ROUTER_BUFFER_SIZE_BYTES";

const DEFAULT_INGEST_ROUTER_BUFFER_SIZE: ByteSize = ByteSize::mib(if cfg!(test) { 8 } else { 256 }); // 256 MiB

pub(crate) fn get_ingest_router_buffer_size() -> ByteSize {
    env::var(INGEST_ROUTER_BUFFER_SIZE_ENV_KEY)
        .ok()
        .and_then(|buffer_size_bytes_str| {
            if let Ok(buffer_size) = buffer_size_bytes_str.parse::<ByteSize>() {
                info!("overriding ingest router buffer size to {buffer_size}");
                Some(buffer_size)
            } else {
                error!(
                    "failed to parse environment variable \
                     `{INGEST_ROUTER_BUFFER_SIZE_ENV_KEY}={buffer_size_bytes_str}`"
                );
                None
            }
        })
        .unwrap_or(DEFAULT_INGEST_ROUTER_BUFFER_SIZE)
}

/// Helper struct to build a [`DocBatchV2`]`.
#[derive(Debug, Default)]
pub struct DocBatchV2Builder {
    doc_uids: Vec<DocUid>,
    doc_buffer: BytesMut,
    doc_lengths: Vec<u32>,
}

impl DocBatchV2Builder {
    /// Adds a document to the batch.
    pub fn add_doc(&mut self, doc_uid: DocUid, doc: &[u8]) {
        self.doc_uids.push(doc_uid);
        self.doc_buffer.put(doc);
        self.doc_lengths.push(doc.len() as u32);
    }

    /// Builds the [`DocBatchV2`], returning `None` if the batch is empty.
    pub fn build(self) -> Option<DocBatchV2> {
        if self.doc_uids.is_empty() {
            return None;
        }
        let doc_batch = DocBatchV2 {
            doc_uids: self.doc_uids,
            doc_buffer: self.doc_buffer.freeze(),
            doc_lengths: self.doc_lengths,
        };
        Some(doc_batch)
    }
}

/// Batch builder that can append [`Serialize`] structs without an extra copy
pub struct JsonDocBatchV2Builder {
    doc_uids: Vec<DocUid>,
    doc_buffer: Writer<BytesMut>,
    doc_lengths: Vec<u32>,
}

impl Default for JsonDocBatchV2Builder {
    fn default() -> Self {
        Self {
            doc_uids: Vec::new(),
            doc_buffer: BytesMut::new().writer(),
            doc_lengths: Vec::new(),
        }
    }
}

impl JsonDocBatchV2Builder {
    pub fn add_doc(&mut self, doc_uid: DocUid, payload: impl Serialize) -> serde_json::Result<()> {
        let old_len = self.doc_buffer.get_ref().len();
        serde_json::to_writer(&mut self.doc_buffer, &payload)?;
        let new_len = self.doc_buffer.get_ref().len();
        let written_len = new_len - old_len;
        self.doc_uids.push(doc_uid);
        self.doc_lengths.push(written_len as u32);
        Ok(())
    }

    pub fn build(self) -> DocBatchV2 {
        DocBatchV2 {
            doc_uids: self.doc_uids,
            doc_buffer: self.doc_buffer.into_inner().freeze(),
            doc_lengths: self.doc_lengths,
        }
    }

    pub fn with_num_docs(num_docs: usize) -> Self {
        Self {
            doc_uids: Vec::with_capacity(num_docs),
            doc_lengths: Vec::with_capacity(num_docs),
            ..Default::default()
        }
    }
}

/// Helper struct to build an [`IngestRequestV2`].
#[derive(Debug, Default)]
pub struct IngestRequestV2Builder {
    per_index_id_doc_batch_builders: HashMap<IndexId, (SubrequestId, DocBatchV2Builder)>,
    subrequest_id_sequence: SubrequestId,
    doc_uid_generator: DocUidGenerator,
}

impl IngestRequestV2Builder {
    /// Adds a document to the request, returning the ID of the subrequest to which it was added and
    /// its newly assigned [`DocUid`].
    pub fn add_doc(&mut self, index_id: IndexId, doc: &[u8]) -> (SubrequestId, DocUid) {
        match self.per_index_id_doc_batch_builders.entry(index_id) {
            Entry::Occupied(mut entry) => {
                let (subrequest_id, doc_batch_builder) = entry.get_mut();
                let doc_uid = self.doc_uid_generator.next_doc_uid();
                doc_batch_builder.add_doc(doc_uid, doc);
                (*subrequest_id, doc_uid)
            }
            Entry::Vacant(entry) => {
                let subrequest_id = self.subrequest_id_sequence;
                self.subrequest_id_sequence += 1;
                let mut doc_batch_builder = DocBatchV2Builder::default();
                let doc_uid = self.doc_uid_generator.next_doc_uid();
                doc_batch_builder.add_doc(doc_uid, doc);
                entry.insert((subrequest_id, doc_batch_builder));
                (subrequest_id, doc_uid)
            }
        }
    }

    /// Builds the [`IngestRequestV2`], returning `None` if the request is empty.
    pub fn build(self, source_id: &str, commit_type: CommitTypeV2) -> Option<IngestRequestV2> {
        let subrequests: Vec<IngestSubrequest> = self
            .per_index_id_doc_batch_builders
            .into_iter()
            .flat_map(|(index_id, (subrequest_id, doc_batch_builder))| {
                let doc_batch = doc_batch_builder.build()?;
                let ingest_subrequest = IngestSubrequest {
                    subrequest_id,
                    index_id,
                    source_id: source_id.to_string(),
                    doc_batch: Some(doc_batch),
                };
                Some(ingest_subrequest)
            })
            .collect();

        if subrequests.is_empty() {
            return None;
        }
        let ingest_request = IngestRequestV2 {
            subrequests,
            commit_type: commit_type as i32,
        };
        Some(ingest_request)
    }
}

pub(super) fn estimate_size(doc_batch: &DocBatchV2) -> ByteSize {
    let estimate = doc_batch.num_bytes() + doc_batch.num_docs() * MRECORD_HEADER_LEN;
    ByteSize(estimate as u64)
}

#[derive(Debug, Clone, Copy, Default, Eq, PartialEq, Ord, PartialOrd)]
pub struct RateMibPerSec(pub u16);

impl fmt::Display for RateMibPerSec {
    fn fmt(&self, f: &mut fmt::Formatter) -> std::fmt::Result {
        write!(f, "{}MiB/s", self.0)
    }
}

impl PartialEq<u16> for RateMibPerSec {
    fn eq(&self, other: &u16) -> bool {
        self.0 == *other
    }
}

impl Add<RateMibPerSec> for RateMibPerSec {
    type Output = RateMibPerSec;

    #[inline(always)]
    fn add(self, rhs: RateMibPerSec) -> Self::Output {
        RateMibPerSec(self.0 + rhs.0)
    }
}

impl AddAssign<RateMibPerSec> for RateMibPerSec {
    #[inline(always)]
    fn add_assign(&mut self, rhs: RateMibPerSec) {
        self.0 += rhs.0;
    }
}

#[cfg(test)]
mod tests {
    use bytes::Bytes;

    use super::*;

    #[test]
    fn test_doc_batch_builder() {
        let doc_batch_builder = DocBatchV2Builder::default();
        let doc_batch_opt = doc_batch_builder.build();
        assert!(doc_batch_opt.is_none());

        let mut doc_batch_builder = DocBatchV2Builder::default();
        let mut doc_uid_generator = DocUidGenerator::default();
        doc_batch_builder.add_doc(doc_uid_generator.next_doc_uid(), b"Hello, ");
        doc_batch_builder.add_doc(doc_uid_generator.next_doc_uid(), b"World!");
        let doc_batch = doc_batch_builder.build().unwrap();

        assert_eq!(doc_batch.num_docs(), 2);
        assert_eq!(doc_batch.num_bytes(), 21);
        assert_eq!(doc_batch.doc_lengths, [7, 6]);
        assert_eq!(doc_batch.doc_buffer, Bytes::from(&b"Hello, World!"[..]));
    }

    #[test]
    fn test_ingest_request_builder() {
        let ingest_request_builder = IngestRequestV2Builder::default();
        let ingest_request_opt = ingest_request_builder.build("test-source", CommitTypeV2::Auto);
        assert!(ingest_request_opt.is_none());

        let mut ingest_request_builder = IngestRequestV2Builder::default();

        let (subrequest_id, hello_doc_uid) =
            ingest_request_builder.add_doc("test-index-foo".to_string(), b"Hello, ");
        assert_eq!(subrequest_id, 0);

        let (subrequest_id, world_doc_uid) =
            ingest_request_builder.add_doc("test-index-foo".to_string(), b"World!");
        assert_eq!(subrequest_id, 0);
        assert!(hello_doc_uid < world_doc_uid);

        let (subrequest_id, hola_doc_uid) =
            ingest_request_builder.add_doc("test-index-bar".to_string(), b"Hola, ");
        assert_eq!(subrequest_id, 1);
        assert!(world_doc_uid < hola_doc_uid);

        let (subrequest_id, mundo_doc_uid) =
            ingest_request_builder.add_doc("test-index-bar".to_string(), b"Mundo!");
        assert_eq!(subrequest_id, 1);
        assert!(hola_doc_uid < mundo_doc_uid);

        let mut ingest_request = ingest_request_builder
            .build("test-source", CommitTypeV2::Auto)
            .unwrap();

        ingest_request
            .subrequests
            .sort_by(|left, right| left.index_id.cmp(&right.index_id).reverse());

        assert_eq!(ingest_request.subrequests.len(), 2);
        assert_eq!(ingest_request.subrequests[0].index_id, "test-index-foo");
        assert_eq!(ingest_request.subrequests[0].source_id, "test-source");
        assert_eq!(
            ingest_request.subrequests[0]
                .doc_batch
                .as_ref()
                .unwrap()
                .num_docs(),
            2
        );
        assert_eq!(
            ingest_request.subrequests[0]
                .doc_batch
                .as_ref()
                .unwrap()
                .num_bytes(),
            21
        );
        assert_eq!(
            ingest_request.subrequests[0]
                .doc_batch
                .as_ref()
                .unwrap()
                .doc_lengths,
            [7, 6]
        );
        assert_eq!(
            ingest_request.subrequests[0]
                .doc_batch
                .as_ref()
                .unwrap()
                .doc_buffer,
            Bytes::from(&b"Hello, World!"[..])
        );
        assert_eq!(
            ingest_request.subrequests[0]
                .doc_batch
                .as_ref()
                .unwrap()
                .doc_uids,
            [hello_doc_uid, world_doc_uid]
        );

        assert_eq!(ingest_request.subrequests[1].index_id, "test-index-bar");
        assert_eq!(ingest_request.subrequests[1].source_id, "test-source");
        assert_eq!(
            ingest_request.subrequests[1]
                .doc_batch
                .as_ref()
                .unwrap()
                .num_docs(),
            2
        );
        assert_eq!(
            ingest_request.subrequests[1]
                .doc_batch
                .as_ref()
                .unwrap()
                .num_bytes(),
            20
        );
        assert_eq!(
            ingest_request.subrequests[1]
                .doc_batch
                .as_ref()
                .unwrap()
                .doc_lengths,
            [6, 6]
        );
        assert_eq!(
            ingest_request.subrequests[1]
                .doc_batch
                .as_ref()
                .unwrap()
                .doc_buffer,
            Bytes::from(&b"Hola, Mundo!"[..])
        );
        assert_eq!(
            ingest_request.subrequests[1]
                .doc_batch
                .as_ref()
                .unwrap()
                .doc_uids,
            [hola_doc_uid, mundo_doc_uid]
        );
    }

    #[test]
    fn test_estimate_size() {
        let doc_batch = DocBatchV2 {
            doc_buffer: Vec::new().into(),
            doc_lengths: Vec::new(),
            doc_uids: Vec::new(),
        };
        assert_eq!(estimate_size(&doc_batch), ByteSize(0));

        let doc_batch = DocBatchV2 {
            doc_buffer: vec![0u8; 100].into(),
            doc_lengths: vec![10, 20, 30],
            doc_uids: Vec::new(),
        };
        assert_eq!(estimate_size(&doc_batch), ByteSize(118));
    }
}


================================================
FILE: quickwit/quickwit-ingest/src/ingest_v2/models.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::sync::Arc;
use std::time::{Duration, Instant};

use quickwit_common::rate_limiter::RateLimiter;
use quickwit_doc_mapper::DocMapper;
use quickwit_proto::ingest::ShardState;
use quickwit_proto::types::{IndexUid, NodeId, Position, QueueId, ShardId, SourceId, queue_id};
use tokio::sync::watch;

use crate::ingest_v2::rate_meter::RateMeter;

#[derive(Debug, Clone)]
pub(super) enum IngesterShardType {
    /// A primary shard hosted on a leader and replicated on a follower.
    Primary { follower_id: NodeId },
    /// A replica shard hosted on a follower.
    Replica { leader_id: NodeId },
    /// A shard hosted on a single node when the replication factor is set to 1.
    Solo,
}

/// Status of a shard: state + position of the last record written.
pub(super) type ShardStatus = (ShardState, Position);

#[derive(Debug)]
pub(super) struct IngesterShard {
    pub index_uid: IndexUid,
    pub source_id: SourceId,
    pub shard_id: ShardId,
    pub shard_type: IngesterShardType,
    pub shard_state: ShardState,
    /// Position of the last record written in the shard's mrecordlog queue.
    pub replication_position_inclusive: Position,
    /// Position up to which the shard has been truncated.
    pub truncation_position_inclusive: Position,
    // Rate limiter for the shard. Unused for replica shards.
    pub rate_limiter: RateLimiter,
    // Rate meter for the shard. Unused for replica shards.
    pub rate_meter: RateMeter,
    /// Whether the shard should be advertised to other nodes (routers) via gossip.
    ///
    /// Because shards  are created in multiple steps, (e.g., init shard on leader, create shard in
    /// metastore), we must receive a "signal" from the control plane confirming that a shard
    /// was successfully opened before advertising it. Currently, this confirmation comes in the
    /// form of `PersistRequest` or `FetchRequest`.
    pub is_advertisable: bool,
    /// Document mapper for the shard. Replica shards and closed solo shards do not have one.
    pub doc_mapper_opt: Option<Arc<DocMapper>>,
    /// Whether to validate documents in this shard. True if no preprocessing (VRL) will happen
    /// before indexing.
    pub validate_docs: bool,
    pub shard_status_tx: watch::Sender<ShardStatus>,
    pub shard_status_rx: watch::Receiver<ShardStatus>,
    /// Instant at which the shard was last written to.
    pub last_write_instant: Instant,
}

/// Builder for `IngesterShard`. By default, the shard is open, is empty (i.e. the replication and
/// truncation positions are at the beginning), uses the default rate limiter and rate meter, has no
/// doc mapper, does not validate documents, and is not advertisable.
pub(super) struct IngesterShardBuilder {
    index_uid: IndexUid,
    source_id: SourceId,
    shard_id: ShardId,
    shard_type: IngesterShardType,
    shard_state: ShardState,
    replication_position_inclusive: Position,
    truncation_position_inclusive: Position,
    rate_limiter: RateLimiter,
    rate_meter: RateMeter,
    doc_mapper_opt: Option<Arc<DocMapper>>,
    validate_docs: bool,
    is_advertisable: bool,
    last_write_instant: Option<Instant>,
}

impl IngesterShardBuilder {
    /// Sets the shard state. Defaults to `ShardState::Open`.
    pub fn with_state(mut self, shard_state: ShardState) -> Self {
        self.shard_state = shard_state;
        self
    }

    /// Sets the rate limiter. Defaults to `RateLimiter::default()`.
    pub fn with_rate_limiter(mut self, rate_limiter: RateLimiter) -> Self {
        self.rate_limiter = rate_limiter;
        self
    }

    /// Sets the rate meter. Defaults to `RateMeter::default()`.
    pub fn with_rate_meter(mut self, rate_meter: RateMeter) -> Self {
        self.rate_meter = rate_meter;
        self
    }

    /// Sets the doc mapper.
    pub fn with_doc_mapper(mut self, doc_mapper: Arc<DocMapper>) -> Self {
        self.doc_mapper_opt = Some(doc_mapper);
        self
    }

    /// Sets the replication position. Defaults to `Position::Beginning`.
    pub fn with_replication_position_inclusive(mut self, position: Position) -> Self {
        self.replication_position_inclusive = position;
        self
    }

    /// Sets the truncation position. Defaults to `Position::Beginning`.
    pub fn with_truncation_position_inclusive(mut self, position: Position) -> Self {
        self.truncation_position_inclusive = position;
        self
    }

    /// Sets whether to validate documents. Defaults to `false`.
    pub fn with_validate_docs(mut self, validate_docs: bool) -> Self {
        self.validate_docs = validate_docs;
        self
    }

    /// Sets whether the shard should be advertised to other nodes via gossip. Defaults to `false`.
    pub fn advertisable(mut self) -> Self {
        self.is_advertisable = true;
        self
    }

    /// Sets the last write instant. Defaults to `Instant::now()`.
    pub fn with_last_write(mut self, last_write_instant: Instant) -> Self {
        self.last_write_instant = Some(last_write_instant);
        self
    }

    /// Builds the `IngesterShard`. Uses `Instant::now()` for last write time if not specified.
    pub fn build(self) -> IngesterShard {
        let shard_status = (
            self.shard_state,
            self.replication_position_inclusive.clone(),
        );
        let (shard_status_tx, shard_status_rx) = watch::channel(shard_status);
        IngesterShard {
            index_uid: self.index_uid,
            source_id: self.source_id,
            shard_id: self.shard_id,
            shard_type: self.shard_type,
            shard_state: self.shard_state,
            replication_position_inclusive: self.replication_position_inclusive,
            truncation_position_inclusive: self.truncation_position_inclusive,
            rate_limiter: self.rate_limiter,
            rate_meter: self.rate_meter,
            is_advertisable: self.is_advertisable,
            doc_mapper_opt: self.doc_mapper_opt,
            validate_docs: self.validate_docs,
            shard_status_tx,
            shard_status_rx,
            last_write_instant: self.last_write_instant.unwrap_or_else(Instant::now),
        }
    }
}

impl IngesterShard {
    /// Creates a builder for a primary shard hosted on a leader and replicated on a follower.
    pub fn new_primary(
        index_uid: IndexUid,
        source_id: SourceId,
        shard_id: ShardId,
        follower_id: NodeId,
    ) -> IngesterShardBuilder {
        IngesterShardBuilder {
            index_uid,
            source_id,
            shard_id,
            shard_type: IngesterShardType::Primary { follower_id },
            shard_state: ShardState::Open,
            replication_position_inclusive: Position::Beginning,
            truncation_position_inclusive: Position::Beginning,
            rate_limiter: RateLimiter::default(),
            rate_meter: RateMeter::default(),
            doc_mapper_opt: None,
            validate_docs: false,
            is_advertisable: false,
            last_write_instant: None,
        }
    }

    /// Creates a builder for a replica shard hosted on a follower.
    pub fn new_replica(
        index_uid: IndexUid,
        source_id: SourceId,
        shard_id: ShardId,
        leader_id: NodeId,
    ) -> IngesterShardBuilder {
        IngesterShardBuilder {
            index_uid,
            source_id,
            shard_id,
            shard_type: IngesterShardType::Replica { leader_id },
            shard_state: ShardState::Open,
            replication_position_inclusive: Position::Beginning,
            truncation_position_inclusive: Position::Beginning,
            rate_limiter: RateLimiter::default(),
            rate_meter: RateMeter::default(),
            doc_mapper_opt: None,
            validate_docs: false,
            is_advertisable: false,
            last_write_instant: None,
        }
    }

    /// Creates a builder for a solo shard hosted on a single node (i.e. replication factor = 1).
    pub fn new_solo(
        index_uid: IndexUid,
        source_id: SourceId,
        shard_id: ShardId,
    ) -> IngesterShardBuilder {
        IngesterShardBuilder {
            index_uid,
            source_id,
            shard_id,
            shard_type: IngesterShardType::Solo,
            shard_state: ShardState::Open,
            replication_position_inclusive: Position::Beginning,
            truncation_position_inclusive: Position::Beginning,
            rate_limiter: RateLimiter::default(),
            rate_meter: RateMeter::default(),
            doc_mapper_opt: None,
            validate_docs: false,
            is_advertisable: false,
            last_write_instant: None,
        }
    }

    pub fn follower_id_opt(&self) -> Option<&NodeId> {
        match &self.shard_type {
            IngesterShardType::Primary { follower_id, .. } => Some(follower_id),
            IngesterShardType::Replica { .. } => None,
            IngesterShardType::Solo => None,
        }
    }

    pub fn close(&mut self) {
        self.shard_state = ShardState::Closed;
        self.notify_shard_status();
    }

    pub fn is_closed(&self) -> bool {
        self.shard_state.is_closed()
    }

    pub fn is_open(&self) -> bool {
        self.shard_state.is_open()
    }

    pub fn is_idle(&self, now: Instant, idle_timeout: Duration) -> bool {
        now.duration_since(self.last_write_instant) >= idle_timeout
    }

    pub fn is_indexed(&self) -> bool {
        self.shard_state.is_closed() && self.truncation_position_inclusive.is_eof()
    }

    pub fn is_replica(&self) -> bool {
        matches!(self.shard_type, IngesterShardType::Replica { .. })
    }

    pub fn notify_shard_status(&self) {
        let shard_status = (
            self.shard_state,
            self.replication_position_inclusive.clone(),
        );
        // `shard_status_tx` is guaranteed to be open because `self` also holds a receiver.
        self.shard_status_tx
            .send(shard_status)
            .expect("channel should be open");
    }

    pub fn queue_id(&self) -> QueueId {
        queue_id(&self.index_uid, &self.source_id, &self.shard_id)
    }

    pub fn set_replication_position_inclusive(
        &mut self,
        replication_position_inclusive: Position,
        now: Instant,
    ) {
        if self.replication_position_inclusive == replication_position_inclusive {
            return;
        }
        self.replication_position_inclusive = replication_position_inclusive;
        self.last_write_instant = now;
        self.notify_shard_status();
    }
}

#[cfg(test)]
mod tests {
    use quickwit_config::{DocMapping, SearchSettings, build_doc_mapper};

    use super::*;

    impl IngesterShard {
        #[track_caller]
        pub fn assert_is_solo(&self) {
            assert!(matches!(self.shard_type, IngesterShardType::Solo))
        }

        #[track_caller]
        pub fn assert_is_primary(&self) {
            assert!(matches!(self.shard_type, IngesterShardType::Primary { .. }))
        }

        #[track_caller]
        pub fn assert_is_replica(&self) {
            assert!(matches!(self.shard_type, IngesterShardType::Replica { .. }))
        }

        #[track_caller]
        pub fn assert_is_open(&self) {
            assert!(self.shard_state.is_open())
        }

        #[track_caller]
        pub fn assert_is_closed(&self) {
            assert!(self.shard_state.is_closed())
        }

        #[track_caller]
        pub fn assert_replication_position(&self, expected_replication_position: Position) {
            assert_eq!(
                self.replication_position_inclusive, expected_replication_position,
                "expected replication position at `{:?}`, got `{:?}`",
                expected_replication_position, self.replication_position_inclusive
            );
        }

        #[track_caller]
        pub fn assert_truncation_position(&self, expected_truncation_position: Position) {
            assert_eq!(
                self.truncation_position_inclusive, expected_truncation_position,
                "expected truncation position at `{:?}`, got `{:?}`",
                expected_truncation_position, self.truncation_position_inclusive
            );
        }
    }

    #[test]
    fn test_new_primary_shard() {
        let doc_mapping: DocMapping = serde_json::from_str("{}").unwrap();
        let search_settings = SearchSettings::default();
        let doc_mapper = build_doc_mapper(&doc_mapping, &search_settings).unwrap();

        let primary_shard = IngesterShard::new_primary(
            IndexUid::for_test("test-index", 0),
            SourceId::from("test-source"),
            ShardId::from(1),
            NodeId::from("test-follower"),
        )
        .with_state(ShardState::Closed)
        .with_replication_position_inclusive(Position::offset(42u64))
        .with_doc_mapper(doc_mapper)
        .with_validate_docs(true)
        .build();

        assert!(matches!(
            &primary_shard.shard_type,
            IngesterShardType::Primary { follower_id, .. } if *follower_id == "test-follower"
        ));
        assert!(!primary_shard.is_replica());
        assert_eq!(primary_shard.shard_state, ShardState::Closed);
        assert_eq!(
            primary_shard.replication_position_inclusive,
            Position::offset(42u64)
        );
        assert_eq!(
            primary_shard.truncation_position_inclusive,
            Position::Beginning
        );
        assert!(!primary_shard.is_advertisable);
    }

    #[test]
    fn test_new_replica_shard() {
        let replica_shard = IngesterShard::new_replica(
            IndexUid::for_test("test-index", 0),
            SourceId::from("test-source"),
            ShardId::from(1),
            NodeId::from("test-leader"),
        )
        .with_state(ShardState::Closed)
        .with_replication_position_inclusive(Position::offset(42u64))
        .build();

        assert!(matches!(
            &replica_shard.shard_type,
            IngesterShardType::Replica { leader_id } if *leader_id == "test-leader"
        ));
        assert!(replica_shard.is_replica());
        assert_eq!(replica_shard.shard_state, ShardState::Closed);
        assert_eq!(
            replica_shard.replication_position_inclusive,
            Position::offset(42u64)
        );
        assert_eq!(
            replica_shard.truncation_position_inclusive,
            Position::Beginning
        );
        assert!(!replica_shard.is_advertisable);
    }

    #[test]
    fn test_new_solo_shard() {
        let solo_shard = IngesterShard::new_solo(
            IndexUid::for_test("test-index", 0),
            SourceId::from("test-source"),
            ShardId::from(1),
        )
        .with_state(ShardState::Closed)
        .with_replication_position_inclusive(Position::offset(42u64))
        .build();

        solo_shard.assert_is_solo();
        assert!(!solo_shard.is_replica());
        assert_eq!(solo_shard.shard_state, ShardState::Closed);
        assert_eq!(
            solo_shard.replication_position_inclusive,
            Position::offset(42u64)
        );
        assert_eq!(
            solo_shard.truncation_position_inclusive,
            Position::Beginning
        );
        assert!(!solo_shard.is_advertisable);
    }
}


================================================
FILE: quickwit/quickwit-ingest/src/ingest_v2/mrecord.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use bytes::{Buf, Bytes};
use quickwit_proto::ingest::MRecordBatch;
use tracing::warn;

/// The first byte of a [`MRecord`] is the version of the record header.
#[derive(Debug)]
#[repr(u8)]
pub enum HeaderVersion {
    /// Version 0, introduced in Quickwit 0.7.0, it uses one byte to encode the record type.
    V0 = 0,
}

/// Length of the header of a [`MRecord`] in bytes.
pub(super) const MRECORD_HEADER_LEN: usize = 2;

/// `Doc` header v0 composed of the header version and the `Doc = 0` record type.
const DOC_HEADER_V0: &[u8; MRECORD_HEADER_LEN] = &[HeaderVersion::V0 as u8, 0];

/// `Commit` header v0 composed of the header version and the `Commit = 1` record type.
const COMMIT_HEADER_V0: &[u8; MRECORD_HEADER_LEN] = &[HeaderVersion::V0 as u8, 1];

#[derive(Debug, Clone, Eq, PartialEq)]
pub enum MRecord {
    Doc(Bytes),
    Commit,
}

impl MRecord {
    pub fn encode(&self) -> impl Buf + use<> {
        match &self {
            Self::Doc(doc) => DOC_HEADER_V0.chain(doc.clone()),
            Self::Commit => COMMIT_HEADER_V0.chain(Bytes::new()),
        }
    }

    pub fn decode(mut buf: impl Buf) -> Option<Self> {
        if buf.remaining() < 2 {
            return None;
        }

        let header_version = buf.get_u8();

        if header_version != HeaderVersion::V0 as u8 {
            warn!("unknown mrecord header version `{header_version}`");
            return None;
        }

        let mrecord = match buf.get_u8() {
            0 => {
                let doc = buf.copy_to_bytes(buf.remaining());
                Self::Doc(doc)
            }
            1 => Self::Commit,
            other => {
                warn!("unknown mrecord type `{other}`");
                return None;
            }
        };
        Some(mrecord)
    }

    #[cfg(any(test, feature = "testsuite"))]
    pub fn new_doc(doc: impl Into<Bytes>) -> Self {
        Self::Doc(doc.into())
    }
}

pub fn decoded_mrecords(mrecord_batch: &MRecordBatch) -> impl Iterator<Item = MRecord> + '_ {
    mrecord_batch.encoded_mrecords().flat_map(MRecord::decode)
}

#[cfg(test)]
mod tests {
    use super::*;

    #[test]
    fn test_parse_invalid_mrecord() {
        assert!(MRecord::decode(&b""[..]).is_none());
        assert!(MRecord::decode(&b"a"[..]).is_none());
        assert!(MRecord::decode(&[HeaderVersion::V0 as u8][..]).is_none());
        assert!(MRecord::decode(&[HeaderVersion::V0 as u8, 19u8][..]).is_none());
    }

    #[test]
    fn test_mrecord_doc_roundtrip() {
        let record = MRecord::new_doc("hello");
        let encoded_record = record.encode();
        let decoded_record = MRecord::decode(encoded_record).unwrap();
        assert_eq!(record, decoded_record);
    }

    #[test]
    fn test_mrecord_commit_roundtrip() {
        let record = MRecord::Commit;
        let encoded_record = record.encode();
        let decoded_record = MRecord::decode(encoded_record).unwrap();
        assert_eq!(record, decoded_record);
    }
}


================================================
FILE: quickwit/quickwit-ingest/src/ingest_v2/mrecordlog_utils.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::io;
use std::iter::once;
use std::ops::RangeInclusive;

use bytesize::ByteSize;
#[cfg(feature = "failpoints")]
use fail::fail_point;
use mrecordlog::error::{AppendError, DeleteQueueError};
use quickwit_proto::ingest::DocBatchV2;
use quickwit_proto::types::{Position, QueueId};

use crate::MRecord;
use crate::mrecordlog_async::MultiRecordLogAsync;

#[derive(Debug, thiserror::Error)]
pub(super) enum AppendDocBatchError {
    #[error("IO error: {0}")]
    Io(#[from] io::Error),
    #[error("WAL queue `{0}` not found")]
    QueueNotFound(QueueId),
}

/// Appends a non-empty document batch to the WAL queue `queue_id`.
///
/// # Panics
///
/// Panics if `doc_batch` is empty.
pub(super) async fn append_non_empty_doc_batch(
    mrecordlog: &mut MultiRecordLogAsync,
    queue_id: &QueueId,
    doc_batch: DocBatchV2,
    force_commit: bool,
) -> Result<Position, AppendDocBatchError> {
    let append_result = if force_commit {
        let encoded_mrecords = doc_batch
            .into_docs()
            .map(|(_doc_uid, doc)| MRecord::Doc(doc).encode())
            .chain(once(MRecord::Commit.encode()));

        #[cfg(feature = "failpoints")]
        fail_point!("ingester:append_records", |_| {
            let io_error = io::Error::from(io::ErrorKind::PermissionDenied);
            Err(AppendDocBatchError::Io(io_error))
        });

        mrecordlog
            .append_records(queue_id, None, encoded_mrecords)
            .await
    } else {
        let encoded_mrecords = doc_batch
            .into_docs()
            .map(|(_doc_uid, doc)| MRecord::Doc(doc).encode());

        #[cfg(feature = "failpoints")]
        fail_point!("ingester:append_records", |_| {
            let io_error = io::Error::from(io::ErrorKind::PermissionDenied);
            Err(AppendDocBatchError::Io(io_error))
        });

        mrecordlog
            .append_records(queue_id, None, encoded_mrecords)
            .await
    };
    match append_result {
        Ok(Some(offset)) => Ok(Position::offset(offset)),
        Ok(None) => panic!("`doc_batch` should not be empty"),
        Err(AppendError::IoError(io_error)) => Err(AppendDocBatchError::Io(io_error)),
        Err(AppendError::MissingQueue(queue_id)) => {
            Err(AppendDocBatchError::QueueNotFound(queue_id))
        }
        Err(AppendError::Past) => {
            panic!("`append_records` should be called with `position_opt: None`")
        }
    }
}

/// Error returned when the mrecordlog does not have enough capacity to store some records.
#[derive(Debug, Clone, Copy, thiserror::Error)]
pub(super) enum NotEnoughCapacityError {
    #[error(
        "write-ahead log is full, capacity: {capacity}, usage: {usage}, requested: {requested}"
    )]
    Disk {
        usage: ByteSize,
        capacity: ByteSize,
        requested: ByteSize,
    },
    #[error(
        "write-ahead log memory buffer is full: capacity: {capacity}, usage: {usage}, requested: \
         {requested}"
    )]
    Memory {
        usage: ByteSize,
        capacity: ByteSize,
        requested: ByteSize,
    },
}

/// Checks whether the log has enough capacity to store some records.
pub(super) fn check_enough_capacity(
    mrecordlog: &MultiRecordLogAsync,
    disk_capacity: ByteSize,
    memory_capacity: ByteSize,
    requested_capacity: ByteSize,
) -> Result<(), NotEnoughCapacityError> {
    let wal_usage = mrecordlog.resource_usage();
    let disk_used = ByteSize(wal_usage.disk_used_bytes as u64);

    if disk_used + requested_capacity > disk_capacity {
        return Err(NotEnoughCapacityError::Disk {
            usage: disk_used,
            capacity: disk_capacity,
            requested: requested_capacity,
        });
    }
    let memory_used = ByteSize(wal_usage.memory_used_bytes as u64);

    if memory_used + requested_capacity > memory_capacity {
        return Err(NotEnoughCapacityError::Memory {
            usage: memory_used,
            capacity: memory_capacity,
            requested: requested_capacity,
        });
    }
    Ok(())
}

/// Deletes a queue from the WAL. Returns without error if the queue does not exist.
pub async fn force_delete_queue(
    mrecordlog: &mut MultiRecordLogAsync,
    queue_id: &QueueId,
) -> io::Result<()> {
    match mrecordlog.delete_queue(queue_id).await {
        Ok(_) | Err(DeleteQueueError::MissingQueue(_)) => Ok(()),
        Err(DeleteQueueError::IoError(error)) => Err(error),
    }
}

/// Returns the first and last position of the records currently stored in the queue. Returns `None`
/// if the queue does not exist or is empty.
pub(super) fn queue_position_range(
    mrecordlog: &MultiRecordLogAsync,
    queue_id: &QueueId,
) -> Option<RangeInclusive<u64>> {
    let first_position = mrecordlog
        .range(queue_id, ..)
        .ok()?
        .next()
        .map(|record| record.position)?;

    let last_position = mrecordlog
        .last_record(queue_id)
        .ok()?
        .map(|record| record.position)?;

    Some(first_position..=last_position)
}

#[cfg(test)]
mod tests {
    use super::*;

    #[cfg(not(feature = "failpoints"))]
    #[tokio::test]
    async fn test_append_non_empty_doc_batch() {
        let tempdir = tempfile::tempdir().unwrap();
        let mut mrecordlog = MultiRecordLogAsync::open(tempdir.path()).await.unwrap();

        let queue_id = "test-queue".to_string();
        let doc_batch = DocBatchV2::for_test(["test-doc-foo"]);

        let append_error =
            append_non_empty_doc_batch(&mut mrecordlog, &queue_id, doc_batch.clone(), false)
                .await
                .unwrap_err();

        assert!(matches!(
            append_error,
            AppendDocBatchError::QueueNotFound(..)
        ));

        mrecordlog.create_queue(&queue_id).await.unwrap();

        let position =
            append_non_empty_doc_batch(&mut mrecordlog, &queue_id, doc_batch.clone(), false)
                .await
                .unwrap();
        assert_eq!(position, Position::offset(0u64));

        let position =
            append_non_empty_doc_batch(&mut mrecordlog, &queue_id, doc_batch.clone(), true)
                .await
                .unwrap();
        assert_eq!(position, Position::offset(2u64));
    }

    // This test should be run manually and independently of other tests with the `failpoints`
    // feature enabled:
    // ```sh
    // cargo test --manifest-path quickwit/Cargo.toml -p quickwit-ingest --features failpoints -- test_append_non_empty_doc_batch_io_error
    // ```
    #[cfg(feature = "failpoints")]
    #[tokio::test]
    async fn test_append_non_empty_doc_batch_io_error() {
        let scenario = fail::FailScenario::setup();
        fail::cfg("ingester:append_records", "return").unwrap();

        let tempdir = tempfile::tempdir().unwrap();
        let mut mrecordlog = MultiRecordLogAsync::open(tempdir.path()).await.unwrap();

        let queue_id = "test-queue".to_string();
        mrecordlog.create_queue(&queue_id).await.unwrap();

        let doc_batch = DocBatchV2::for_test(["test-doc-foo"]);
        let append_error = append_non_empty_doc_batch(&mut mrecordlog, &queue_id, doc_batch, false)
            .await
            .unwrap_err();

        assert!(matches!(append_error, AppendDocBatchError::Io(..)));

        scenario.teardown();
    }

    #[tokio::test]
    async fn test_check_enough_capacity() {
        let tempdir = tempfile::tempdir().unwrap();
        let mrecordlog = MultiRecordLogAsync::open(tempdir.path()).await.unwrap();

        let disk_error =
            check_enough_capacity(&mrecordlog, ByteSize(0), ByteSize(0), ByteSize(12)).unwrap_err();

        assert!(matches!(disk_error, NotEnoughCapacityError::Disk { .. }));

        let memory_error =
            check_enough_capacity(&mrecordlog, ByteSize::mb(256), ByteSize(11), ByteSize(12))
                .unwrap_err();

        assert!(matches!(
            memory_error,
            NotEnoughCapacityError::Memory { .. }
        ));

        check_enough_capacity(&mrecordlog, ByteSize::mb(256), ByteSize(12), ByteSize(12)).unwrap();
    }

    #[tokio::test]
    async fn test_append_queue_position_range() {
        let tempdir = tempfile::tempdir().unwrap();
        let mut mrecordlog = MultiRecordLogAsync::open(tempdir.path()).await.unwrap();

        assert!(queue_position_range(&mrecordlog, &"queue-not-found".to_string()).is_none());

        mrecordlog.create_queue("test-queue").await.unwrap();
        assert!(queue_position_range(&mrecordlog, &"test-queue".to_string()).is_none());

        mrecordlog
            .append_records("test-queue", None, std::iter::once(&b"test-doc-foo"[..]))
            .await
            .unwrap();
        let position_range = queue_position_range(&mrecordlog, &"test-queue".to_string()).unwrap();
        assert_eq!(position_range, 0..=0);

        mrecordlog
            .append_records("test-queue", None, std::iter::once(&b"test-doc-bar"[..]))
            .await
            .unwrap();
        let position_range = queue_position_range(&mrecordlog, &"test-queue".to_string()).unwrap();
        assert_eq!(position_range, 0..=1);

        mrecordlog.truncate("test-queue", 0).await.unwrap();
        let position_range = queue_position_range(&mrecordlog, &"test-queue".to_string()).unwrap();
        assert_eq!(position_range, 1..=1);
    }
}


================================================
FILE: quickwit/quickwit-ingest/src/ingest_v2/publish_tracker.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::HashMap;
use std::sync::{Arc, Mutex};

use quickwit_common::pubsub::{EventBroker, EventSubscriptionHandle};
use quickwit_proto::indexing::ShardPositionsUpdate;
use quickwit_proto::types::{Position, ShardId};
use tokio::sync::Notify;
use tracing::error;

/// A helper for awaiting shard publish events when running in `wait_for` and
/// `force` commit mode.
///
/// Registers a set of shard positions and listens to [`ShardPositionsUpdate`]
/// events to assert when all the persisted events have been published. To
/// ensure that no events are missed:
/// - create the tracker before any persist requests is sent
/// - call `register_requested_shards` before each persist request to ensure that the associated
///   publish events are recorded
/// - call `track_persisted_shard_position` after each successful persist subrequests
pub struct PublishTracker {
    state: Arc<Mutex<ShardPublishStates>>,
    // sync::notify instead of sync::oneshot because we don't want to store the permit
    publish_complete: Arc<Notify>,
    _publish_listen_handle: EventSubscriptionHandle,
}

impl PublishTracker {
    pub fn new(event_tracker: EventBroker) -> Self {
        let state = Arc::new(Mutex::new(ShardPublishStates::default()));
        let state_clone = state.clone();
        let publish_complete = Arc::new(Notify::new());
        let publish_complete_notifier = publish_complete.clone();
        let _publish_listen_handle =
            event_tracker.subscribe(move |update: ShardPositionsUpdate| {
                let mut publish_states = state_clone.lock().unwrap();
                for (updated_shard_id, updated_position) in &update.updated_shard_positions {
                    publish_states.position_published(
                        updated_shard_id,
                        updated_position,
                        &publish_complete_notifier,
                    );
                }
            });
        Self {
            state,
            _publish_listen_handle,
            publish_complete,
        }
    }

    pub fn track_persisted_shard_position(&self, shard_id: ShardId, new_position: Position) {
        let mut publish_states = self.state.lock().unwrap();
        publish_states.position_persisted(&shard_id, &new_position)
    }

    pub async fn wait_publish_complete(self) {
        // correctness: `awaiting_count` cannot be increased after this point
        // because `self` is consumed. By subscribing to `publish_complete`
        // before checking `awaiting_count`, we make sure we don't miss the
        // moment when it becomes 0.
        let notified = self.publish_complete.notified();
        if self.state.lock().unwrap().awaiting_count == 0 {
            return;
        }
        notified.await;
    }
}

enum PublishState {
    /// The persist request for this shard success response has been received
    /// but the position has not yet been published
    AwaitingPublish(Position),
    ///  The shard has been published up to this position (might happen before
    ///  the persist success is received)
    Published(Position),
}

#[derive(Default)]
struct ShardPublishStates {
    states: HashMap<ShardId, PublishState>,
    awaiting_count: usize,
}

impl ShardPublishStates {
    fn position_published(
        &mut self,
        shard_id: &ShardId,
        new_position: &Position,
        publish_complete_notifier: &Notify,
    ) {
        let Some(publish_state) = self.states.get_mut(shard_id) else {
            return;
        };

        match publish_state {
            PublishState::AwaitingPublish(shard_position) if new_position >= shard_position => {
                *publish_state = PublishState::Published(new_position.clone());
                self.awaiting_count -= 1;
                if self.awaiting_count == 0 {
                    publish_complete_notifier.notify_waiters();
                }
            }
            PublishState::Published(current_position) if new_position > current_position => {
                *current_position = new_position.clone();
            }
            PublishState::Published(_) | PublishState::AwaitingPublish(_) => {
                // duplicate/out-of-order or not enough progress yet
            }
        }
    }

    fn position_persisted(&mut self, shard_id: &ShardId, new_position: &Position) {
        if self.states.contains_key(shard_id) {
            error!(%shard_id, "shard persisted positions should not be tracked multiple times");
            return;
        }

        self.states.insert(
            shard_id.clone(),
            PublishState::AwaitingPublish(new_position.clone()),
        );
        self.awaiting_count += 1;
    }
}

#[cfg(test)]
mod tests {
    use std::time::Duration;

    use quickwit_proto::types::{IndexUid, ShardId, SourceUid};

    use super::*;

    #[tokio::test]
    async fn test_shard_publish_states() {
        let mut shard_publish_states = ShardPublishStates::default();
        let notifier = Arc::new(Notify::new());

        let shard_id_1 = ShardId::from("test-shard-1");
        let shard_id_2 = ShardId::from("test-shard-2");
        let shard_id_3 = ShardId::from("test-shard-3"); // not tracked

        let notifier_receiver = notifier.clone();
        let notified_subscription = notifier_receiver.notified();

        shard_publish_states.position_persisted(&shard_id_1, &Position::offset(10usize));
        assert_eq!(shard_publish_states.awaiting_count, 1);
        shard_publish_states.position_persisted(&shard_id_2, &Position::offset(20usize));
        assert_eq!(shard_publish_states.awaiting_count, 2);
        shard_publish_states.position_published(&shard_id_1, &Position::offset(15usize), &notifier);
        assert_eq!(shard_publish_states.awaiting_count, 1);
        shard_publish_states.position_published(&shard_id_2, &Position::offset(20usize), &notifier);
        assert_eq!(shard_publish_states.awaiting_count, 0);

        // check that only the notification that was subscribed before holds a permit
        tokio::time::timeout(Duration::from_millis(100), notifier.notified())
            .await
            .unwrap_err();
        tokio::time::timeout(Duration::from_millis(100), notified_subscription)
            .await
            .unwrap();

        // shard 3 is not tracked
        shard_publish_states.position_published(&shard_id_3, &Position::offset(10usize), &notifier);
        assert_eq!(shard_publish_states.awaiting_count, 0);
        assert!(!shard_publish_states.states.contains_key(&shard_id_3));
    }

    #[tokio::test]
    async fn test_publish_tracker() {
        let index_uid: IndexUid = IndexUid::for_test("test-index-0", 0);
        let event_broker = EventBroker::default();
        let tracker = PublishTracker::new(event_broker.clone());
        let shard_id_1 = ShardId::from("test-shard-1");
        let shard_id_2 = ShardId::from("test-shard-2");
        let shard_id_3 = ShardId::from("test-shard-3");
        let shard_id_4 = ShardId::from("test-shard-4");
        let shard_id_5 = ShardId::from("test-shard-5"); // not tracked

        tracker.track_persisted_shard_position(shard_id_1.clone(), Position::offset(42usize));
        tracker.track_persisted_shard_position(shard_id_2.clone(), Position::offset(42usize));
        tracker.track_persisted_shard_position(shard_id_3.clone(), Position::offset(42usize));

        event_broker.publish(ShardPositionsUpdate {
            source_uid: SourceUid {
                index_uid: index_uid.clone(),
                source_id: "test-source".to_string(),
            },
            updated_shard_positions: vec![
                (shard_id_1.clone(), Position::offset(42usize)),
                (shard_id_2.clone(), Position::offset(666usize)),
                (shard_id_5.clone(), Position::offset(888usize)),
            ]
            .into_iter()
            .collect(),
        });

        event_broker.publish(ShardPositionsUpdate {
            source_uid: SourceUid {
                index_uid: index_uid.clone(),
                source_id: "test-source".to_string(),
            },
            updated_shard_positions: vec![
                (shard_id_3.clone(), Position::eof(42usize)),
                (shard_id_4.clone(), Position::offset(42usize)),
            ]
            .into_iter()
            .collect(),
        });

        // persist response received after the publish event
        tracker.track_persisted_shard_position(shard_id_4.clone(), Position::offset(42usize));

        tokio::time::timeout(Duration::from_millis(200), tracker.wait_publish_complete())
            .await
            .unwrap();
    }

    #[tokio::test]
    async fn test_publish_tracker_waits() {
        let index_uid: IndexUid = IndexUid::for_test("test-index-0", 0);
        let shard_id_1 = ShardId::from("test-shard-1");
        let shard_id_2 = ShardId::from("test-shard-2");
        let position = Position::offset(42usize);

        {
            let event_broker = EventBroker::default();
            let tracker = PublishTracker::new(event_broker.clone());
            tracker.track_persisted_shard_position(shard_id_1.clone(), position.clone());
            tracker.track_persisted_shard_position(shard_id_2.clone(), position.clone());

            event_broker.publish(ShardPositionsUpdate {
                source_uid: SourceUid {
                    index_uid: index_uid.clone(),
                    source_id: "test-source".to_string(),
                },
                updated_shard_positions: vec![(shard_id_1.clone(), position.clone())]
                    .into_iter()
                    .collect(),
            });

            tokio::time::timeout(Duration::from_millis(200), tracker.wait_publish_complete())
                .await
                .unwrap_err();
        }
        {
            let event_broker = EventBroker::default();
            let tracker = PublishTracker::new(event_broker.clone());
            tracker.track_persisted_shard_position(shard_id_1.clone(), position.clone());
            event_broker.publish(ShardPositionsUpdate {
                source_uid: SourceUid {
                    index_uid: index_uid.clone(),
                    source_id: "test-source".to_string(),
                },
                updated_shard_positions: vec![(shard_id_1.clone(), position.clone())]
                    .into_iter()
                    .collect(),
            });
            // sleep to make sure the event is processed
            tokio::time::sleep(Duration::from_millis(50)).await;
            tracker.track_persisted_shard_position(shard_id_2.clone(), position.clone());

            tokio::time::timeout(Duration::from_millis(200), tracker.wait_publish_complete())
                .await
                .unwrap_err();
        }
    }
}


================================================
FILE: quickwit/quickwit-ingest/src/ingest_v2/rate_meter.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use quickwit_common::tower::ConstantRate;
use tokio::time::Instant;

/// A naive rate meter that tracks how much work was performed during a period of time defined by
/// two successive calls to `harvest`.
#[derive(Debug, Clone)]
pub(super) struct RateMeter {
    total_work: u64,
    harvested_at: Instant,
}

impl Default for RateMeter {
    fn default() -> Self {
        Self {
            total_work: 0,
            harvested_at: Instant::now(),
        }
    }
}

impl RateMeter {
    /// Increments the amount of work performed since the last call to `harvest`.
    pub fn update(&mut self, work: u64) {
        self.total_work += work;
    }

    /// Returns the average work rate since the last call to this method and resets the internal
    /// state.
    pub fn harvest(&mut self) -> ConstantRate {
        let now = Instant::now();
        let elapsed = now.duration_since(self.harvested_at);
        let rate = ConstantRate::new(self.total_work, elapsed);
        self.total_work = 0;
        self.harvested_at = now;
        rate
    }
}

#[cfg(test)]
mod tests {
    use std::time::Duration;

    use quickwit_common::tower::Rate;

    use super::*;

    #[tokio::test]
    async fn test_rate_meter() {
        tokio::time::pause();
        let mut rate_meter = RateMeter::default();

        let rate = rate_meter.harvest();
        assert_eq!(rate.work(), 0);
        assert!(rate.period().is_zero());

        tokio::time::advance(Duration::from_millis(100)).await;

        let rate = rate_meter.harvest();
        assert_eq!(rate.work(), 0);
        assert_eq!(rate.period(), Duration::from_millis(100));

        rate_meter.update(1);
        tokio::time::advance(Duration::from_millis(100)).await;

        let rate = rate_meter.harvest();
        assert_eq!(rate.work(), 1);
        assert_eq!(rate.period(), Duration::from_millis(100));
    }
}


================================================
FILE: quickwit/quickwit-ingest/src/ingest_v2/replication.md
================================================
## Replication

### Sync replication
For each shard, leaders replicate the state of their local mrecordlog queues and associated metadata (positions) by sending replication requests to their followers. Then, they wait for followers to acknowledge the replication requests before returning success or failure responses to routers.

### Replication stream
Two gRPC streams back the independent streams of requests and responses between leader-follower pairs called the SYN replication stream and the ACK replication stream. gRPC streams guarantee that the streamed messages are delivered in the order they are sent. However, gRPC bidirectional streaming does not guarantee that requests and responses match. Most of the logic implemented in `replication.rs` aims to "zip" the two streams together to fix this issue.

### Life of a happy persist request
1. Leader receives a persist request pre-assigned to a shard from a router.

1. Leader forwards replicate request to follower of the shard via the SYN replication stream.

1. Follower receives the replicate request, writes the data to its replica queue, and records the new position of the queue called `replica_position`.

1. Follower returns replicate response to leader via the ACK replication stream.

1. Leader records the new position of the replica queue.

1. Leader writes the data to its local mrecordlog queue and records the new position of the queue called `primary_position`.  It should match the `replica_position`.

1. Leader return success persist response to router.

### Replication stream errors

- When a replication request fails, the leader and follower close the shard(s) targeted by the request.

- When a replication stream fails (transport error, timeout), the leader and follower close the shard(s) targeted by the stream. Then, the leader reopens a new stream if necessary.


================================================
FILE: quickwit/quickwit-ingest/src/ingest_v2/replication.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::HashSet;
use std::time::{Duration, Instant};

use bytesize::ByteSize;
use futures::{Future, StreamExt};
use mrecordlog::error::CreateQueueError;
use quickwit_common::metrics::{GaugeGuard, MEMORY_METRICS};
use quickwit_common::{ServiceStream, rate_limited_warn};
use quickwit_proto::ingest::ingester::{
    AckReplicationMessage, IngesterStatus, InitReplicaRequest, InitReplicaResponse,
    ReplicateFailure, ReplicateFailureReason, ReplicateRequest, ReplicateResponse,
    ReplicateSubrequest, ReplicateSuccess, SynReplicationMessage, ack_replication_message,
    syn_replication_message,
};
use quickwit_proto::ingest::{CommitTypeV2, IngestV2Error, IngestV2Result, Shard, ShardState};
use quickwit_proto::types::{NodeId, QueueId};
use tokio::sync::mpsc::error::TryRecvError;
use tokio::sync::{mpsc, oneshot};
use tokio::task::JoinHandle;
use tracing::{error, warn};

use super::metrics::report_wal_usage;
use super::models::IngesterShard;
use super::mrecordlog_utils::check_enough_capacity;
use super::state::IngesterState;
use crate::ingest_v2::mrecordlog_utils::{AppendDocBatchError, append_non_empty_doc_batch};
use crate::metrics::INGEST_METRICS;
use crate::{estimate_size, with_lock_metrics};

pub(super) const SYN_REPLICATION_STREAM_CAPACITY: usize = 5;

/// Duration after which replication requests time out with [`ReplicationError::Timeout`].
const REPLICATION_REQUEST_TIMEOUT: Duration = if cfg!(any(test, feature = "testsuite")) {
    Duration::from_millis(250)
} else {
    Duration::from_secs(3)
};

/// A replication request is sent by the leader to its follower to update the state of a replica
/// shard.
#[derive(Debug)]
pub(super) enum ReplicationRequest {
    Init(InitReplicaRequest),
    Replicate(ReplicateRequest),
}

impl ReplicationRequest {
    fn replication_seqno(&self) -> ReplicationSeqNo {
        match self {
            ReplicationRequest::Init(init_replica_request) => {
                init_replica_request.replication_seqno
            }
            ReplicationRequest::Replicate(replicate_request) => replicate_request.replication_seqno,
        }
    }

    fn set_replication_seqno(&mut self, replication_seqno: ReplicationSeqNo) {
        match self {
            ReplicationRequest::Init(init_replica_request) => {
                init_replica_request.replication_seqno = replication_seqno
            }
            ReplicationRequest::Replicate(replicate_request) => {
                replicate_request.replication_seqno = replication_seqno
            }
        }
    }

    fn into_syn_replication_message(self) -> SynReplicationMessage {
        match self {
            ReplicationRequest::Init(init_replica_request) => {
                SynReplicationMessage::new_init_replica_request(init_replica_request)
            }
            ReplicationRequest::Replicate(replicate_request) => {
                SynReplicationMessage::new_replicate_request(replicate_request)
            }
        }
    }
}

#[derive(Debug)]
pub(super) enum ReplicationResponse {
    Init(InitReplicaResponse),
    Replicate(ReplicateResponse),
}

impl ReplicationResponse {
    fn replication_seqno(&self) -> ReplicationSeqNo {
        match self {
            ReplicationResponse::Init(init_replica_response) => {
                init_replica_response.replication_seqno
            }
            ReplicationResponse::Replicate(replicate_response) => {
                replicate_response.replication_seqno
            }
        }
    }
}

type OneShotReplicationRequest = (ReplicationRequest, oneshot::Sender<ReplicationResponse>);

/// Replication sequence number.
type ReplicationSeqNo = u64;

/// Task that "powers" the replication stream between a leader and a follower.
pub(super) struct ReplicationStreamTask {
    leader_id: NodeId,
    follower_id: NodeId,
    replication_request_rx: mpsc::Receiver<OneShotReplicationRequest>,
    syn_replication_stream_tx: mpsc::Sender<SynReplicationMessage>,
    ack_replication_stream: ServiceStream<IngestV2Result<AckReplicationMessage>>,
}

impl ReplicationStreamTask {
    /// Spawns a [`ReplicationStreamTask`].
    pub fn spawn(
        leader_id: NodeId,
        follower_id: NodeId,
        syn_replication_stream_tx: mpsc::Sender<SynReplicationMessage>,
        ack_replication_stream: ServiceStream<IngestV2Result<AckReplicationMessage>>,
    ) -> ReplicationStreamTaskHandle {
        let (replication_request_tx, replication_request_rx) =
            mpsc::channel::<OneShotReplicationRequest>(3);

        let replication_stream_task = Self {
            leader_id,
            follower_id,
            replication_request_rx,
            syn_replication_stream_tx,
            ack_replication_stream,
        };
        let (enqueue_syn_requests_join_handle, dequeue_ack_responses_join_handle) =
            replication_stream_task.run();

        ReplicationStreamTaskHandle {
            replication_request_tx,
            enqueue_syn_requests_join_handle,
            dequeue_ack_responses_join_handle,
        }
    }

    /// Executes the request processing loop. It enqueues requests into the SYN replication stream
    /// going to the follower then dequeues the responses returned from the ACK replication
    /// stream. Additionally (and crucially), it ensures that requests and responses are
    /// processed and returned in the same order. Conceptually, it is akin to "zipping" the SYN and
    /// ACK replication streams together.
    fn run(mut self) -> (JoinHandle<()>, JoinHandle<()>) {
        // Response sequencer channel. It ensures that requests and responses are processed and
        // returned in the same order.
        //
        // Channel capacity: there is no need to bound the capacity of the channel here
        // because it is already virtually bounded by the capacity of the SYN replication
        // stream.
        let (response_sequencer_tx, mut response_sequencer_rx) = mpsc::unbounded_channel();

        // This loop enqueues SYN replication requests into the SYN replication stream and passes
        // the one-shot response sender to the "dequeue" loop via the sequencer channel.
        let enqueue_syn_requests_fut = async move {
            let mut replication_seqno = ReplicationSeqNo::default();
            while let Some((mut replication_request, oneshot_replication_response_tx)) =
                self.replication_request_rx.recv().await
            {
                replication_request.set_replication_seqno(replication_seqno);
                replication_seqno += 1;

                if response_sequencer_tx
                    .send((
                        replication_request.replication_seqno(),
                        oneshot_replication_response_tx,
                    ))
                    .is_err()
                {
                    // The response sequencer receiver was dropped.
                    return;
                }
                let syn_replication_message = replication_request.into_syn_replication_message();

                if self
                    .syn_replication_stream_tx
                    .send(syn_replication_message)
                    .await
                    .is_err()
                {
                    // The SYN replication stream was closed.
                    return;
                }
            }
            // The replication client was dropped.
        };
        // This loop dequeues ACK replication responses from the ACK replication stream and forwards
        // them to their respective clients using associated one-shot associated with each response.
        let dequeue_ack_responses_fut = async move {
            while let Some(ack_replication_message_res) = self.ack_replication_stream.next().await {
                let ack_replication_message = match ack_replication_message_res {
                    Ok(ack_replication_message) => ack_replication_message,
                    Err(_) => {
                        return;
                    }
                };
                let replication_response = match ack_replication_message.message {
                    Some(ack_replication_message::Message::InitResponse(init_replica_response)) => {
                        ReplicationResponse::Init(init_replica_response)
                    }
                    Some(ack_replication_message::Message::ReplicateResponse(
                        replicate_response,
                    )) => ReplicationResponse::Replicate(replicate_response),
                    Some(ack_replication_message::Message::OpenResponse(_)) => {
                        warn!("received unexpected ACK replication message");
                        continue;
                    }
                    None => {
                        warn!("received empty ACK replication message");
                        continue;
                    }
                };
                let oneshot_replication_response_tx = match response_sequencer_rx.try_recv() {
                    Ok((replication_seqno, oneshot_replication_response_tx)) => {
                        if replication_response.replication_seqno() != replication_seqno {
                            error!(
                                "received out-of-order replication response: expected replication \
                                 seqno `{}`, got `{}`; closing replication stream from leader \
                                 `{}` to follower `{}`",
                                replication_seqno,
                                replication_response.replication_seqno(),
                                self.leader_id,
                                self.follower_id,
                            );
                            return;
                        }
                        oneshot_replication_response_tx
                    }
                    Err(TryRecvError::Empty) => {
                        panic!("response sequencer should not be empty");
                    }
                    Err(TryRecvError::Disconnected) => {
                        // The response sequencer sender was dropped.
                        return;
                    }
                };
                // We intentionally ignore the error here. It is the responsibility of the
                // `replicate` method to surface it.
                let _ = oneshot_replication_response_tx.send(replication_response);
            }
            // The ACK replication stream was closed.
        };
        (
            tokio::spawn(enqueue_syn_requests_fut),
            tokio::spawn(dequeue_ack_responses_fut),
        )
    }
}

pub(super) struct ReplicationStreamTaskHandle {
    replication_request_tx: mpsc::Sender<OneShotReplicationRequest>,
    enqueue_syn_requests_join_handle: JoinHandle<()>,
    dequeue_ack_responses_join_handle: JoinHandle<()>,
}

impl ReplicationStreamTaskHandle {
    /// Returns a [`ReplicationClient`] that can be used to enqueue replication requests
    /// into the replication stream.
    pub fn replication_client(&self) -> ReplicationClient {
        ReplicationClient {
            replication_request_tx: self.replication_request_tx.clone(),
        }
    }
}

impl Drop for ReplicationStreamTaskHandle {
    fn drop(&mut self) {
        self.enqueue_syn_requests_join_handle.abort();
        self.dequeue_ack_responses_join_handle.abort();
    }
}

/// Error returned by the [`ReplicationClient`].
#[derive(Debug, Clone, Copy, thiserror::Error)]
#[error("failed to replicate records from leader to follower")]
pub(super) enum ReplicationError {
    /// The replication stream was closed.
    #[error("replication stream was closed")]
    Closed,
    /// The replication request timed out.
    #[error("replication request timed out")]
    Timeout,
}

// DO NOT derive or implement `Clone` for this object.
#[derive(Debug)]
pub(super) struct ReplicationClient {
    replication_request_tx: mpsc::Sender<OneShotReplicationRequest>,
}

/// Single-use client that enqueues replication requests into the replication stream.
///
/// The `init_replica`, `replicate`, and `submit` methods take `self` instead of `&self`
/// to produce 'static futures and enforce single-use semantics.
impl ReplicationClient {
    /// Enqueues an init replica request into the replication stream and waits for the response.
    /// Times out after [`REPLICATION_REQUEST_TIMEOUT`] seconds.
    pub fn init_replica(
        self,
        replica_shard: Shard,
    ) -> impl Future<Output = Result<InitReplicaResponse, ReplicationError>> + Send + 'static {
        let init_replica_request = InitReplicaRequest {
            replica_shard: Some(replica_shard),
            replication_seqno: 0, // replication number are generated further down
        };
        let replication_request = ReplicationRequest::Init(init_replica_request);

        async {
            self.submit(replication_request)
                .await
                .map(|replication_response| {
                    if let ReplicationResponse::Init(init_replica_response) = replication_response {
                        init_replica_response
                    } else {
                        panic!("response should be an init replica response")
                    }
                })
        }
    }

    /// Enqueues a replicate request into the replication stream and waits for the response. Times
    /// out after [`REPLICATION_REQUEST_TIMEOUT`] seconds.
    pub fn replicate(
        self,
        leader_id: NodeId,
        follower_id: NodeId,
        subrequests: Vec<ReplicateSubrequest>,
        commit_type: CommitTypeV2,
    ) -> impl Future<Output = Result<ReplicateResponse, ReplicationError>> + Send + 'static {
        let replicate_request = ReplicateRequest {
            leader_id: leader_id.into(),
            follower_id: follower_id.into(),
            subrequests,
            commit_type: commit_type as i32,
            replication_seqno: 0, // replication number are generated further down
        };
        let replication_request = ReplicationRequest::Replicate(replicate_request);

        async {
            self.submit(replication_request)
                .await
                .map(|replication_response| {
                    if let ReplicationResponse::Replicate(replicate_response) = replication_response
                    {
                        replicate_response
                    } else {
                        panic!("response should be a replicate response")
                    }
                })
        }
    }

    /// Submits a replication request to the replication stream and waits for the response.
    fn submit(
        self,
        replication_request: ReplicationRequest,
    ) -> impl Future<Output = Result<ReplicationResponse, ReplicationError>> + Send + 'static {
        let (oneshot_replication_response_tx, oneshot_replication_response_rx) = oneshot::channel();

        let send_recv_fut = async move {
            self.replication_request_tx
                .send((replication_request, oneshot_replication_response_tx))
                .await
                .map_err(|_| ReplicationError::Closed)?;
            let replicate_response = oneshot_replication_response_rx
                .await
                .map_err(|_| ReplicationError::Closed)?;
            Ok(replicate_response)
        };
        async {
            tokio::time::timeout(REPLICATION_REQUEST_TIMEOUT, send_recv_fut)
                .await
                .map_err(|_| ReplicationError::Timeout)?
        }
    }
}

/// Replication task executed for each replication stream.
pub(super) struct ReplicationTask {
    leader_id: NodeId,
    follower_id: NodeId,
    state: IngesterState,
    syn_replication_stream: ServiceStream<SynReplicationMessage>,
    ack_replication_stream_tx: mpsc::UnboundedSender<IngestV2Result<AckReplicationMessage>>,
    current_replication_seqno: ReplicationSeqNo,
    disk_capacity: ByteSize,
    memory_capacity: ByteSize,
}

impl ReplicationTask {
    pub fn spawn(
        leader_id: NodeId,
        follower_id: NodeId,
        state: IngesterState,
        syn_replication_stream: ServiceStream<SynReplicationMessage>,
        ack_replication_stream_tx: mpsc::UnboundedSender<IngestV2Result<AckReplicationMessage>>,
        disk_capacity: ByteSize,
        memory_capacity: ByteSize,
    ) -> ReplicationTaskHandle {
        let mut replication_task = Self {
            leader_id,
            follower_id,
            state,
            syn_replication_stream,
            ack_replication_stream_tx,
            current_replication_seqno: 0,
            disk_capacity,
            memory_capacity,
        };
        let join_handle = tokio::spawn(async move { replication_task.run().await });
        ReplicationTaskHandle { join_handle }
    }

    async fn init_replica(
        &mut self,
        init_replica_request: InitReplicaRequest,
    ) -> IngestV2Result<InitReplicaResponse> {
        if init_replica_request.replication_seqno != self.current_replication_seqno {
            return Err(IngestV2Error::Internal(format!(
                "received out-of-order replication request: expected replication seqno `{}`, got \
                 `{}`",
                self.current_replication_seqno, init_replica_request.replication_seqno
            )));
        }
        self.current_replication_seqno += 1;

        let Some(replica_shard) = init_replica_request.replica_shard else {
            warn!("received empty init replica request");

            return Err(IngestV2Error::Internal(
                "init replica request is empty".to_string(),
            ));
        };
        let queue_id = replica_shard.queue_id();

        let mut state_guard =
            with_lock_metrics!(self.state.lock_fully(), "init_replica", "write").await?;

        match state_guard.mrecordlog.create_queue(&queue_id).await {
            Ok(_) => {}
            Err(CreateQueueError::AlreadyExists) => {
                error!("WAL queue `{queue_id}` already exists");
                let message = format!("WAL queue `{queue_id}` already exists");
                return Err(IngestV2Error::Internal(message));
            }
            Err(CreateQueueError::IoError(io_error)) => {
                error!("failed to create WAL queue `{queue_id}`: {io_error}",);
                let message = format!("failed to create WAL queue `{queue_id}`: {io_error}");
                return Err(IngestV2Error::Internal(message));
            }
        };
        let index_uid = replica_shard.index_uid().clone();
        let shard_id = replica_shard.shard_id().clone();
        let source_id = replica_shard.source_id;
        let leader_id = NodeId::from(replica_shard.leader_id);

        let replica_shard =
            IngesterShard::new_replica(index_uid, source_id, shard_id, leader_id).build();
        state_guard.shards.insert(queue_id, replica_shard);

        let init_replica_response = InitReplicaResponse {
            replication_seqno: init_replica_request.replication_seqno,
        };
        Ok(init_replica_response)
    }

    async fn replicate(
        &mut self,
        replicate_request: ReplicateRequest,
    ) -> IngestV2Result<ReplicateResponse> {
        if replicate_request.leader_id != self.leader_id {
            return Err(IngestV2Error::Internal(format!(
                "routing error: expected leader ID `{}`, got `{}`",
                self.leader_id, replicate_request.leader_id
            )));
        }
        if replicate_request.follower_id != self.follower_id {
            return Err(IngestV2Error::Internal(format!(
                "routing error: expected follower ID `{}`, got `{}`",
                self.follower_id, replicate_request.follower_id
            )));
        }
        if replicate_request.replication_seqno != self.current_replication_seqno {
            return Err(IngestV2Error::Internal(format!(
                "received out-of-order replication request: expected replication seqno `{}`, got \
                 `{}`",
                self.current_replication_seqno, replicate_request.replication_seqno
            )));
        }
        let request_size_bytes = replicate_request.num_bytes();
        let mut gauge_guard = GaugeGuard::from_gauge(&MEMORY_METRICS.in_flight.ingester_replicate);
        gauge_guard.add(request_size_bytes as i64);

        self.current_replication_seqno += 1;

        let commit_type = replicate_request.commit_type();
        let force_commit = commit_type == CommitTypeV2::Force;

        let mut replicate_successes = Vec::with_capacity(replicate_request.subrequests.len());
        let mut replicate_failures = Vec::new();

        // Keep track of the shards that need to be closed following an IO error.
        let mut shards_to_close: HashSet<QueueId> = HashSet::new();

        // Keep track of dangling shards, i.e., shards for which there is no longer a corresponding
        // queue in the WAL and should be deleted.
        let mut shards_to_delete: HashSet<QueueId> = HashSet::new();

        let mut state_guard =
            with_lock_metrics!(self.state.lock_fully(), "replicate", "write").await?;

        if state_guard.status() != IngesterStatus::Ready {
            replicate_failures.reserve_exact(replicate_request.subrequests.len());

            for subrequest in replicate_request.subrequests {
                let replicate_failure = ReplicateFailure {
                    subrequest_id: subrequest.subrequest_id,
                    index_uid: subrequest.index_uid,
                    source_id: subrequest.source_id,
                    shard_id: subrequest.shard_id,
                    reason: ReplicateFailureReason::ShardClosed as i32,
                };
                replicate_failures.push(replicate_failure);
            }
            let replicate_response = ReplicateResponse {
                follower_id: replicate_request.follower_id,
                successes: Vec::new(),
                failures: replicate_failures,
                replication_seqno: replicate_request.replication_seqno,
            };
            return Ok(replicate_response);
        }
        let now = Instant::now();

        for subrequest in replicate_request.subrequests {
            let queue_id = subrequest.queue_id();
            let from_position_exclusive = subrequest.from_position_exclusive();

            let Some(shard) = state_guard.shards.get(&queue_id) else {
                let replicate_failure = ReplicateFailure {
                    subrequest_id: subrequest.subrequest_id,
                    index_uid: subrequest.index_uid,
                    source_id: subrequest.source_id,
                    shard_id: subrequest.shard_id,
                    reason: ReplicateFailureReason::ShardNotFound as i32,
                };
                replicate_failures.push(replicate_failure);
                continue;
            };
            assert!(shard.is_replica());

            if shard.is_closed() {
                let replicate_failure = ReplicateFailure {
                    subrequest_id: subrequest.subrequest_id,
                    index_uid: subrequest.index_uid,
                    source_id: subrequest.source_id,
                    shard_id: subrequest.shard_id,
                    reason: ReplicateFailureReason::ShardClosed as i32,
                };
                replicate_failures.push(replicate_failure);
                continue;
            }
            if shard.replication_position_inclusive != from_position_exclusive {
                // TODO
            }
            let doc_batch = match subrequest.doc_batch {
                Some(doc_batch) if !doc_batch.is_empty() => doc_batch,
                _ => {
                    warn!("received empty replicate request");

                    let replicate_success = ReplicateSuccess {
                        subrequest_id: subrequest.subrequest_id,
                        index_uid: subrequest.index_uid,
                        source_id: subrequest.source_id,
                        shard_id: subrequest.shard_id,
                        replication_position_inclusive: Some(
                            shard.replication_position_inclusive.clone(),
                        ),
                    };
                    replicate_successes.push(replicate_success);
                    continue;
                }
            };

            let batch_num_bytes = doc_batch.num_bytes() as u64;
            let batch_num_docs = doc_batch.num_docs() as u64;

            let requested_capacity = estimate_size(&doc_batch);

            if let Err(error) = check_enough_capacity(
                &state_guard.mrecordlog,
                self.disk_capacity,
                self.memory_capacity,
                requested_capacity,
            ) {
                rate_limited_warn!(
                    limit_per_min = 10,
                    "failed to replicate records to ingester `{}`: {error}",
                    self.follower_id,
                );
                let replicate_failure = ReplicateFailure {
                    subrequest_id: subrequest.subrequest_id,
                    index_uid: subrequest.index_uid,
                    source_id: subrequest.source_id,
                    shard_id: subrequest.shard_id,
                    reason: ReplicateFailureReason::WalFull as i32,
                };
                replicate_failures.push(replicate_failure);
                continue;
            };
            let append_result = append_non_empty_doc_batch(
                &mut state_guard.mrecordlog,
                &queue_id,
                doc_batch,
                force_commit,
            )
            .await;

            let current_position_inclusive = match append_result {
                Ok(current_position_inclusive) => current_position_inclusive,
                Err(append_error) => {
                    let reason = match &append_error {
                        AppendDocBatchError::Io(io_error) => {
                            error!("failed to replicate records to shard `{queue_id}`: {io_error}");
                            shards_to_close.insert(queue_id);
                            ReplicateFailureReason::ShardClosed
                        }
                        AppendDocBatchError::QueueNotFound(_) => {
                            error!(
                                "failed to replicate records to shard `{queue_id}`: WAL queue not \
                                 found"
                            );
                            shards_to_delete.insert(queue_id);
                            ReplicateFailureReason::ShardNotFound
                        }
                    };
                    let replicate_failure = ReplicateFailure {
                        subrequest_id: subrequest.subrequest_id,
                        index_uid: subrequest.index_uid,
                        source_id: subrequest.source_id,
                        shard_id: subrequest.shard_id,
                        reason: reason as i32,
                    };
                    replicate_failures.push(replicate_failure);
                    continue;
                }
            };
            state_guard
                .shards
                .get_mut(&queue_id)
                .expect("replica shard should be initialized")
                .set_replication_position_inclusive(current_position_inclusive.clone(), now);

            INGEST_METRICS
                .replicated_num_bytes_total
                .inc_by(batch_num_bytes);
            INGEST_METRICS
                .replicated_num_docs_total
                .inc_by(batch_num_docs);

            let replicate_success = ReplicateSuccess {
                subrequest_id: subrequest.subrequest_id,
                index_uid: subrequest.index_uid,
                source_id: subrequest.source_id,
                shard_id: subrequest.shard_id,
                replication_position_inclusive: Some(current_position_inclusive),
            };
            replicate_successes.push(replicate_success);
        }
        if !shards_to_close.is_empty() {
            for queue_id in &shards_to_close {
                let shard = state_guard
                    .shards
                    .get_mut(queue_id)
                    .expect("shard should exist");

                shard.shard_state = ShardState::Closed;
                shard.notify_shard_status();
                warn!("closed shard `{queue_id}` following IO error");
            }
        }
        if !shards_to_delete.is_empty() {
            for queue_id in &shards_to_delete {
                state_guard.shards.remove(queue_id);
                warn!("deleted dangling shard `{queue_id}`");
            }
        }
        let wal_usage = state_guard.mrecordlog.resource_usage();
        drop(state_guard);

        report_wal_usage(wal_usage);

        let follower_id = self.follower_id.clone().into();

        let replicate_response = ReplicateResponse {
            follower_id,
            successes: replicate_successes,
            failures: replicate_failures,
            replication_seqno: replicate_request.replication_seqno,
        };
        Ok(replicate_response)
    }

    async fn run(&mut self) -> IngestV2Result<()> {
        while let Some(syn_replication_message) = self.syn_replication_stream.next().await {
            let ack_replication_message = match syn_replication_message.message {
                Some(syn_replication_message::Message::OpenRequest(_)) => {
                    panic!("TODO: this should not happen, internal error");
                }
                Some(syn_replication_message::Message::InitRequest(init_replica_request)) => self
                    .init_replica(init_replica_request)
                    .await
                    .map(AckReplicationMessage::new_init_replica_response),
                Some(syn_replication_message::Message::ReplicateRequest(replicate_request)) => self
                    .replicate(replicate_request)
                    .await
                    .map(AckReplicationMessage::new_replicate_response),
                None => {
                    warn!("received empty SYN replication message");
                    continue;
                }
            };
            if self
                .ack_replication_stream_tx
                .send(ack_replication_message)
                .is_err()
            {
                break;
            }
        }
        Ok(())
    }
}

pub(super) struct ReplicationTaskHandle {
    join_handle: JoinHandle<IngestV2Result<()>>,
}

impl Drop for ReplicationTaskHandle {
    fn drop(&mut self) {
        self.join_handle.abort();
    }
}

#[cfg(test)]
mod tests {

    use quickwit_cluster::{ChannelTransport, create_cluster_for_test};
    use quickwit_config::service::QuickwitService;
    use quickwit_proto::ingest::ingester::{ReplicateSubrequest, ReplicateSuccess};
    use quickwit_proto::ingest::{DocBatchV2, Shard};
    use quickwit_proto::types::{IndexUid, Position, ShardId, queue_id};

    use super::*;

    fn into_init_replica_request(
        syn_replication_message: SynReplicationMessage,
    ) -> InitReplicaRequest {
        let Some(syn_replication_message::Message::InitRequest(init_replica_request)) =
            syn_replication_message.message
        else {
            panic!(
                "expected init replica SYN message, got `{:?}`",
                syn_replication_message.message
            );
        };
        init_replica_request
    }

    fn into_replicate_request(syn_replication_message: SynReplicationMessage) -> ReplicateRequest {
        let Some(syn_replication_message::Message::ReplicateRequest(replicate_request)) =
            syn_replication_message.message
        else {
            panic!(
                "expected replicate SYN message, got `{:?}`",
                syn_replication_message.message
            );
        };
        replicate_request
    }

    fn into_init_replica_response(
        ack_replication_message: AckReplicationMessage,
    ) -> InitReplicaResponse {
        let Some(ack_replication_message::Message::InitResponse(init_replica_response)) =
            ack_replication_message.message
        else {
            panic!(
                "expected init replica ACK message, got `{:?}`",
                ack_replication_message.message
            );
        };
        init_replica_response
    }

    fn into_replicate_response(
        ack_replication_message: AckReplicationMessage,
    ) -> ReplicateResponse {
        let Some(ack_replication_message::Message::ReplicateResponse(replicate_response)) =
            ack_replication_message.message
        else {
            panic!(
                "expected replicate ACK message, got `{:?}`",
                ack_replication_message.message
            );
        };
        replicate_response
    }

    #[tokio::test]
    async fn test_replication_stream_task_init() {
        let leader_id: NodeId = "test-leader".into();
        let follower_id: NodeId = "test-follower".into();
        let (syn_replication_stream_tx, mut syn_replication_stream_rx) = mpsc::channel(5);
        let (ack_replication_stream_tx, ack_replication_stream) =
            ServiceStream::new_bounded(SYN_REPLICATION_STREAM_CAPACITY);
        let replication_stream_task_handle = ReplicationStreamTask::spawn(
            leader_id,
            follower_id,
            syn_replication_stream_tx,
            ack_replication_stream,
        );
        let dummy_replication_task_future = async move {
            while let Some(syn_replication_message) = syn_replication_stream_rx.recv().await {
                let init_replica_request = into_init_replica_request(syn_replication_message);
                let init_replica_response = InitReplicaResponse {
                    replication_seqno: init_replica_request.replication_seqno,
                };
                let ack_replication_message =
                    AckReplicationMessage::new_init_replica_response(init_replica_response);
                ack_replication_stream_tx
                    .send(Ok(ack_replication_message))
                    .await
                    .unwrap();
            }
        };
        tokio::spawn(dummy_replication_task_future);

        let index_uid = IndexUid::for_test("test-index", 0);
        let replica_shard = Shard {
            index_uid: Some(index_uid.clone()),
            source_id: "test-source".to_string(),
            shard_id: Some(ShardId::from(1)),
            shard_state: ShardState::Open as i32,
            leader_id: "test-leader".to_string(),
            follower_id: Some("test-follower".to_string()),
            ..Default::default()
        };
        let init_replica_response = replication_stream_task_handle
            .replication_client()
            .init_replica(replica_shard)
            .await
            .unwrap();
        assert_eq!(init_replica_response.replication_seqno, 0);
    }

    #[tokio::test]
    async fn test_replication_stream_task_replicate() {
        let leader_id: NodeId = "test-leader".into();
        let follower_id: NodeId = "test-follower".into();
        let (syn_replication_stream_tx, mut syn_replication_stream_rx) = mpsc::channel(5);
        let (ack_replication_stream_tx, ack_replication_stream) =
            ServiceStream::new_bounded(SYN_REPLICATION_STREAM_CAPACITY);
        let replication_stream_task_handle = ReplicationStreamTask::spawn(
            leader_id.clone(),
            follower_id.clone(),
            syn_replication_stream_tx,
            ack_replication_stream,
        );
        let dummy_replication_task_future = async move {
            while let Some(syn_replication_message) = syn_replication_stream_rx.recv().await {
                let replicate_request = into_replicate_request(syn_replication_message);
                let replicate_successes = replicate_request
                    .subrequests
                    .iter()
                    .map(|subrequest| {
                        let batch_len = subrequest.doc_batch.as_ref().unwrap().num_docs();
                        let replication_position_inclusive = subrequest
                            .from_position_exclusive()
                            .as_usize()
                            .map(|pos| pos + batch_len)
                            .unwrap_or(batch_len - 1);
                        ReplicateSuccess {
                            subrequest_id: subrequest.subrequest_id,
                            index_uid: subrequest.index_uid.clone(),
                            source_id: subrequest.source_id.clone(),
                            shard_id: subrequest.shard_id.clone(),
                            replication_position_inclusive: Some(Position::offset(
                                replication_position_inclusive,
                            )),
                        }
                    })
                    .collect::<Vec<_>>();

                let replicate_response = ReplicateResponse {
                    follower_id: replicate_request.follower_id,
                    successes: replicate_successes,
                    failures: Vec::new(),
                    replication_seqno: replicate_request.replication_seqno,
                };
                let ack_replication_message =
                    AckReplicationMessage::new_replicate_response(replicate_response);
                ack_replication_stream_tx
                    .send(Ok(ack_replication_message))
                    .await
                    .unwrap();
            }
        };
        tokio::spawn(dummy_replication_task_future);

        let index_uid = IndexUid::for_test("test-index", 0);
        let index_uid2: IndexUid = IndexUid::for_test("test-index", 1);

        let subrequests = vec![
            ReplicateSubrequest {
                subrequest_id: 0,
                index_uid: Some(index_uid.clone()),
                source_id: "test-source".to_string(),
                shard_id: Some(ShardId::from(1)),
                doc_batch: Some(DocBatchV2::for_test(["test-doc-foo"])),
                from_position_exclusive: Some(Position::Beginning),
            },
            ReplicateSubrequest {
                subrequest_id: 1,
                index_uid: Some(index_uid.clone()),
                source_id: "test-source".to_string(),
                shard_id: Some(ShardId::from(2)),
                doc_batch: Some(DocBatchV2::for_test(["test-doc-bar", "test-doc-baz"])),
                from_position_exclusive: Some(Position::Beginning),
            },
            ReplicateSubrequest {
                subrequest_id: 2,
                index_uid: Some(index_uid2.clone()),
                source_id: "test-source".to_string(),
                shard_id: Some(ShardId::from(1)),
                doc_batch: Some(DocBatchV2::for_test(["test-qux", "test-doc-tux"])),
                from_position_exclusive: Some(Position::offset(0u64)),
            },
        ];
        let replicate_response = replication_stream_task_handle
            .replication_client()
            .replicate(
                leader_id.clone(),
                follower_id.clone(),
                subrequests,
                CommitTypeV2::Auto,
            )
            .await
            .unwrap();
        assert_eq!(replicate_response.follower_id, "test-follower");
        assert_eq!(replicate_response.successes.len(), 3);
        assert_eq!(replicate_response.failures.len(), 0);
        assert_eq!(replicate_response.replication_seqno, 0);

        let replicate_success_0 = &replicate_response.successes[0];
        assert_eq!(replicate_success_0.index_uid(), &index_uid);
        assert_eq!(replicate_success_0.source_id, "test-source");
        assert_eq!(replicate_success_0.shard_id(), ShardId::from(1));
        assert_eq!(
            replicate_success_0.replication_position_inclusive(),
            Position::offset(0u64)
        );

        let replicate_success_1 = &replicate_response.successes[1];
        assert_eq!(replicate_success_1.index_uid(), &index_uid);
        assert_eq!(replicate_success_1.source_id, "test-source");
        assert_eq!(replicate_success_1.shard_id(), ShardId::from(2));
        assert_eq!(
            replicate_success_1.replication_position_inclusive(),
            Position::offset(1u64)
        );

        let replicate_success_2 = &replicate_response.successes[2];
        assert_eq!(replicate_success_2.index_uid(), &index_uid2);
        assert_eq!(replicate_success_2.source_id, "test-source");
        assert_eq!(replicate_success_2.shard_id(), ShardId::from(1));
        assert_eq!(
            replicate_success_2.replication_position_inclusive(),
            Position::offset(2u64)
        );
    }

    #[tokio::test]
    async fn test_replication_stream_replicate_errors() {
        let leader_id: NodeId = "test-leader".into();
        let follower_id: NodeId = "test-follower".into();
        let (syn_replication_stream_tx, _syn_replication_stream_rx) = mpsc::channel(5);
        let (_ack_replication_stream_tx, ack_replication_stream) =
            ServiceStream::new_bounded(SYN_REPLICATION_STREAM_CAPACITY);
        let replication_stream_task_handle = ReplicationStreamTask::spawn(
            leader_id.clone(),
            follower_id.clone(),
            syn_replication_stream_tx,
            ack_replication_stream,
        );
        let timeout_error = replication_stream_task_handle
            .replication_client()
            .replicate(
                leader_id.clone(),
                follower_id.clone(),
                Vec::new(),
                CommitTypeV2::Auto,
            )
            .await
            .unwrap_err();
        assert!(matches!(timeout_error, ReplicationError::Timeout));

        replication_stream_task_handle
            .enqueue_syn_requests_join_handle
            .abort();

        let closed_error = replication_stream_task_handle
            .replication_client()
            .replicate(leader_id, follower_id, Vec::new(), CommitTypeV2::Auto)
            .await
            .unwrap_err();

        assert!(matches!(closed_error, ReplicationError::Closed));
    }

    #[tokio::test]
    async fn test_replication_task_happy_path() {
        let leader_id: NodeId = "test-leader".into();
        let follower_id: NodeId = "test-follower".into();
        let cluster = create_cluster_for_test(
            Vec::new(),
            &[QuickwitService::Indexer.as_str()],
            &ChannelTransport::default(),
            true,
        )
        .await
        .unwrap();
        let (_temp_dir, state) = IngesterState::for_test(cluster).await;
        let (syn_replication_stream_tx, syn_replication_stream) =
            ServiceStream::new_bounded(SYN_REPLICATION_STREAM_CAPACITY);
        let (ack_replication_stream_tx, mut ack_replication_stream) =
            ServiceStream::new_unbounded();

        let disk_capacity = ByteSize::mb(256);
        let memory_capacity = ByteSize::mb(1);

        let _replication_task_handle = ReplicationTask::spawn(
            leader_id,
            follower_id,
            state.clone(),
            syn_replication_stream,
            ack_replication_stream_tx,
            disk_capacity,
            memory_capacity,
        );

        let index_uid = IndexUid::for_test("test-index", 0);
        let index_uid2: IndexUid = IndexUid::for_test("test-index", 1);

        // Init shard 01.
        let init_replica_request = InitReplicaRequest {
            replica_shard: Some(Shard {
                index_uid: Some(index_uid.clone()),
                source_id: "test-source".to_string(),
                shard_id: Some(ShardId::from(1)),
                shard_state: ShardState::Open as i32,
                leader_id: "test-leader".to_string(),
                follower_id: Some("test-follower".to_string()),
                ..Default::default()
            }),
            replication_seqno: 0,
        };
        let syn_replication_message =
            SynReplicationMessage::new_init_replica_request(init_replica_request);
        syn_replication_stream_tx
            .send(syn_replication_message)
            .await
            .unwrap();
        let ack_replication_message = ack_replication_stream.next().await.unwrap().unwrap();
        let init_replica_response = into_init_replica_response(ack_replication_message);
        assert_eq!(init_replica_response.replication_seqno, 0);

        // Init shard 02.
        let init_replica_request = InitReplicaRequest {
            replica_shard: Some(Shard {
                index_uid: Some(index_uid.clone()),
                source_id: "test-source".to_string(),
                shard_id: Some(ShardId::from(2)),
                shard_state: ShardState::Open as i32,
                leader_id: "test-leader".to_string(),
                follower_id: Some("test-follower".to_string()),
                ..Default::default()
            }),
            replication_seqno: 1,
        };
        let syn_replication_message =
            SynReplicationMessage::new_init_replica_request(init_replica_request);
        syn_replication_stream_tx
            .send(syn_replication_message)
            .await
            .unwrap();
        let ack_replication_message = ack_replication_stream.next().await.unwrap().unwrap();
        let init_replica_response = into_init_replica_response(ack_replication_message);
        assert_eq!(init_replica_response.replication_seqno, 1);

        // Init shard 11.
        let init_replica_request = InitReplicaRequest {
            replica_shard: Some(Shard {
                index_uid: Some(index_uid2.clone()),
                source_id: "test-source".to_string(),
                shard_id: Some(ShardId::from(1)),
                shard_state: ShardState::Open as i32,
                leader_id: "test-leader".to_string(),
                follower_id: Some("test-follower".to_string()),
                ..Default::default()
            }),
            replication_seqno: 2,
        };
        let syn_replication_message =
            SynReplicationMessage::new_init_replica_request(init_replica_request);
        syn_replication_stream_tx
            .send(syn_replication_message)
            .await
            .unwrap();
        let ack_replication_message = ack_replication_stream.next().await.unwrap().unwrap();
        let init_replica_response = into_init_replica_response(ack_replication_message);
        assert_eq!(init_replica_response.replication_seqno, 2);

        let state_guard = state.lock_fully().await.unwrap();

        let queue_id_01 = queue_id(&index_uid, "test-source", &ShardId::from(1));

        let replica_shard_01 = state_guard.shards.get(&queue_id_01).unwrap();
        replica_shard_01.assert_is_replica();
        replica_shard_01.assert_is_open();
        replica_shard_01.assert_replication_position(Position::Beginning);
        replica_shard_01.assert_truncation_position(Position::Beginning);

        assert!(state_guard.mrecordlog.queue_exists(&queue_id_01));

        let queue_id_02 = queue_id(&index_uid, "test-source", &ShardId::from(2));

        let replica_shard_02 = state_guard.shards.get(&queue_id_02).unwrap();
        replica_shard_02.assert_is_replica();
        replica_shard_02.assert_is_open();
        replica_shard_02.assert_replication_position(Position::Beginning);
        replica_shard_02.assert_truncation_position(Position::Beginning);

        let queue_id_11 = queue_id(&index_uid2, "test-source", &ShardId::from(1));

        let replica_shard_11 = state_guard.shards.get(&queue_id_11).unwrap();
        replica_shard_11.assert_is_replica();
        replica_shard_11.assert_is_open();
        replica_shard_11.assert_replication_position(Position::Beginning);
        replica_shard_11.assert_truncation_position(Position::Beginning);

        drop(state_guard);

        let replicate_request = ReplicateRequest {
            leader_id: "test-leader".to_string(),
            follower_id: "test-follower".to_string(),
            commit_type: CommitTypeV2::Auto as i32,
            subrequests: vec![
                ReplicateSubrequest {
                    subrequest_id: 0,
                    index_uid: Some(index_uid.clone()),
                    source_id: "test-source".to_string(),
                    shard_id: Some(ShardId::from(1)),
                    doc_batch: Some(DocBatchV2::for_test(["test-doc-foo"])),
                    from_position_exclusive: Some(Position::Beginning),
                },
                ReplicateSubrequest {
                    subrequest_id: 1,
                    index_uid: Some(index_uid.clone()),
                    source_id: "test-source".to_string(),
                    shard_id: Some(ShardId::from(2)),
                    doc_batch: Some(DocBatchV2::for_test(["test-doc-bar", "test-doc-baz"])),
                    from_position_exclusive: Some(Position::Beginning),
                },
                ReplicateSubrequest {
                    subrequest_id: 2,
                    index_uid: Some(index_uid2.clone()),
                    source_id: "test-source".to_string(),
                    shard_id: Some(ShardId::from(1)),
                    doc_batch: Some(DocBatchV2::for_test(["test-doc-qux", "test-doc-tux"])),
                    from_position_exclusive: Some(Position::Beginning),
                },
            ],
            replication_seqno: 3,
        };
        let syn_replication_message =
            SynReplicationMessage::new_replicate_request(replicate_request);
        syn_replication_stream_tx
            .send(syn_replication_message)
            .await
            .unwrap();
        let ack_replication_message = ack_replication_stream.next().await.unwrap().unwrap();
        let replicate_response = into_replicate_response(ack_replication_message);

        assert_eq!(replicate_response.follower_id, "test-follower");
        assert_eq!(replicate_response.successes.len(), 3);
        assert_eq!(replicate_response.failures.len(), 0);
        assert_eq!(replicate_response.replication_seqno, 3);

        let replicate_success_0 = &replicate_response.successes[0];
        assert_eq!(replicate_success_0.index_uid(), &index_uid);
        assert_eq!(replicate_success_0.source_id, "test-source");
        assert_eq!(replicate_success_0.shard_id(), ShardId::from(1));
        assert_eq!(
            replicate_success_0.replication_position_inclusive(),
            Position::offset(0u64)
        );

        let replicate_success_1 = &replicate_response.successes[1];
        assert_eq!(replicate_success_1.index_uid(), &index_uid);
        assert_eq!(replicate_success_1.source_id, "test-source");
        assert_eq!(replicate_success_1.shard_id(), ShardId::from(2));
        assert_eq!(
            replicate_success_1.replication_position_inclusive(),
            Position::offset(1u64)
        );

        let replicate_success_2 = &replicate_response.successes[2];
        assert_eq!(replicate_success_2.index_uid(), &index_uid2);
        assert_eq!(replicate_success_2.source_id, "test-source");
        assert_eq!(replicate_success_2.shard_id(), ShardId::from(1));
        assert_eq!(
            replicate_success_2.replication_position_inclusive(),
            Position::offset(1u64)
        );

        let state_guard = state.lock_fully().await.unwrap();

        state_guard
            .mrecordlog
            .assert_records_eq(&queue_id_01, .., &[(0, [0, 0], "test-doc-foo")]);

        state_guard.mrecordlog.assert_records_eq(
            &queue_id_02,
            ..,
            &[(0, [0, 0], "test-doc-bar"), (1, [0, 0], "test-doc-baz")],
        );

        state_guard.mrecordlog.assert_records_eq(
            &queue_id_11,
            ..,
            &[(0, [0, 0], "test-doc-qux"), (1, [0, 0], "test-doc-tux")],
        );
        drop(state_guard);

        let replicate_request = ReplicateRequest {
            leader_id: "test-leader".to_string(),
            follower_id: "test-follower".to_string(),
            commit_type: CommitTypeV2::Auto as i32,
            subrequests: vec![ReplicateSubrequest {
                subrequest_id: 0,
                index_uid: Some(index_uid.clone()),
                source_id: "test-source".to_string(),
                shard_id: Some(ShardId::from(1)),
                doc_batch: Some(DocBatchV2::for_test(["test-doc-moo"])),
                from_position_exclusive: Some(Position::offset(0u64)),
            }],
            replication_seqno: 4,
        };
        let syn_replication_message =
            SynReplicationMessage::new_replicate_request(replicate_request);
        syn_replication_stream_tx
            .send(syn_replication_message)
            .await
            .unwrap();
        let ack_replication_message = ack_replication_stream.next().await.unwrap().unwrap();
        let replicate_response = into_replicate_response(ack_replication_message);

        assert_eq!(replicate_response.follower_id, "test-follower");
        assert_eq!(replicate_response.successes.len(), 1);
        assert_eq!(replicate_response.failures.len(), 0);
        assert_eq!(replicate_response.replication_seqno, 4);

        let replicate_success_0 = &replicate_response.successes[0];
        assert_eq!(replicate_success_0.index_uid(), &index_uid);
        assert_eq!(replicate_success_0.source_id, "test-source");
        assert_eq!(replicate_success_0.shard_id(), ShardId::from(1));
        assert_eq!(
            replicate_success_0.replication_position_inclusive(),
            Position::offset(1u64)
        );

        let state_guard = state.lock_fully().await.unwrap();

        state_guard.mrecordlog.assert_records_eq(
            &queue_id_01,
            ..,
            &[(0, [0, 0], "test-doc-foo"), (1, [0, 0], "test-doc-moo")],
        );
    }

    #[tokio::test]
    async fn test_replication_task_shard_closed() {
        let leader_id: NodeId = "test-leader".into();
        let follower_id: NodeId = "test-follower".into();
        let cluster = create_cluster_for_test(
            Vec::new(),
            &[QuickwitService::Indexer.as_str()],
            &ChannelTransport::default(),
            true,
        )
        .await
        .unwrap();
        let (_temp_dir, state) = IngesterState::for_test(cluster).await;
        let (syn_replication_stream_tx, syn_replication_stream) =
            ServiceStream::new_bounded(SYN_REPLICATION_STREAM_CAPACITY);
        let (ack_replication_stream_tx, mut ack_replication_stream) =
            ServiceStream::new_unbounded();

        let disk_capacity = ByteSize::mb(256);
        let memory_capacity = ByteSize::mb(1);

        let _replication_task_handle = ReplicationTask::spawn(
            leader_id.clone(),
            follower_id,
            state.clone(),
            syn_replication_stream,
            ack_replication_stream_tx,
            disk_capacity,
            memory_capacity,
        );

        let index_uid = IndexUid::for_test("test-index", 0);
        let replica_shard = IngesterShard::new_replica(
            index_uid.clone(),
            "test-source".to_string(),
            ShardId::from(1),
            leader_id,
        )
        .with_state(ShardState::Closed)
        .build();
        state
            .lock_fully()
            .await
            .unwrap()
            .shards
            .insert(replica_shard.queue_id(), replica_shard);

        let replicate_request = ReplicateRequest {
            leader_id: "test-leader".to_string(),
            follower_id: "test-follower".to_string(),
            commit_type: CommitTypeV2::Auto as i32,
            subrequests: vec![ReplicateSubrequest {
                subrequest_id: 0,
                index_uid: Some(index_uid.clone()),
                source_id: "test-source".to_string(),
                shard_id: Some(ShardId::from(1)),
                doc_batch: Some(DocBatchV2::for_test(["test-doc-foo"])),
                from_position_exclusive: Position::offset(0u64).into(),
            }],
            replication_seqno: 0,
        };
        let syn_replication_message =
            SynReplicationMessage::new_replicate_request(replicate_request);
        syn_replication_stream_tx
            .send(syn_replication_message)
            .await
            .unwrap();
        let ack_replication_message = ack_replication_stream.next().await.unwrap().unwrap();
        let replicate_response = into_replicate_response(ack_replication_message);

        assert_eq!(replicate_response.follower_id, "test-follower");
        assert_eq!(replicate_response.successes.len(), 0);
        assert_eq!(replicate_response.failures.len(), 1);

        let replicate_failure = &replicate_response.failures[0];
        assert_eq!(replicate_failure.index_uid(), &index_uid);
        assert_eq!(replicate_failure.source_id, "test-source");
        assert_eq!(replicate_failure.shard_id(), ShardId::from(1));
        assert_eq!(
            replicate_failure.reason(),
            ReplicateFailureReason::ShardClosed
        );
    }

    #[cfg(not(feature = "failpoints"))]
    #[tokio::test]
    async fn test_replication_task_deletes_dangling_shard() {
        let leader_id: NodeId = "test-leader".into();
        let follower_id: NodeId = "test-follower".into();
        let cluster = create_cluster_for_test(
            Vec::new(),
            &[QuickwitService::Indexer.as_str()],
            &ChannelTransport::default(),
            true,
        )
        .await
        .unwrap();
        let (_temp_dir, state) = IngesterState::for_test(cluster).await;
        let (syn_replication_stream_tx, syn_replication_stream) =
            ServiceStream::new_bounded(SYN_REPLICATION_STREAM_CAPACITY);
        let (ack_replication_stream_tx, mut ack_replication_stream) =
            ServiceStream::new_unbounded();

        let disk_capacity = ByteSize::mb(256);
        let memory_capacity = ByteSize::mb(1);

        let _replication_task_handle = ReplicationTask::spawn(
            leader_id.clone(),
            follower_id,
            state.clone(),
            syn_replication_stream,
            ack_replication_stream_tx,
            disk_capacity,
            memory_capacity,
        );

        let index_uid = IndexUid::for_test("test-index", 0);
        let replica_shard = IngesterShard::new_replica(
            index_uid.clone(),
            "test-source".to_string(),
            ShardId::from(1),
            leader_id,
        )
        .build();
        let queue_id_01 = replica_shard.queue_id();
        state
            .lock_fully()
            .await
            .unwrap()
            .shards
            .insert(queue_id_01.clone(), replica_shard);

        let replicate_request = ReplicateRequest {
            leader_id: "test-leader".to_string(),
            follower_id: "test-follower".to_string(),
            commit_type: CommitTypeV2::Auto as i32,
            subrequests: vec![ReplicateSubrequest {
                subrequest_id: 0,
                index_uid: Some(index_uid.clone()),
                source_id: "test-source".to_string(),
                shard_id: Some(ShardId::from(1)),
                doc_batch: Some(DocBatchV2::for_test(["test-doc-foo"])),
                from_position_exclusive: Position::offset(0u64).into(),
            }],
            replication_seqno: 0,
        };
        let syn_replication_message =
            SynReplicationMessage::new_replicate_request(replicate_request);
        syn_replication_stream_tx
            .send(syn_replication_message)
            .await
            .unwrap();
        let ack_replication_message = ack_replication_stream.next().await.unwrap().unwrap();
        let replicate_response = into_replicate_response(ack_replication_message);

        assert_eq!(replicate_response.follower_id, "test-follower");
        assert_eq!(replicate_response.successes.len(), 0);
        assert_eq!(replicate_response.failures.len(), 1);

        let replicate_failure = &replicate_response.failures[0];
        assert_eq!(replicate_failure.index_uid(), &index_uid);
        assert_eq!(replicate_failure.source_id, "test-source");
        assert_eq!(replicate_failure.shard_id(), ShardId::from(1));
        assert_eq!(
            replicate_failure.reason(),
            ReplicateFailureReason::ShardNotFound
        );

        let state_guard = state.lock_partially().await.unwrap();
        assert!(!state_guard.shards.contains_key(&queue_id_01));
    }

    // This test should be run manually and independently of other tests with the `failpoints`
    // feature enabled:
    // ```sh
    // cargo test --manifest-path quickwit/Cargo.toml -p quickwit-ingest --features failpoints -- test_replication_task_closes_shard_on_io_error
    // ```
    #[cfg(feature = "failpoints")]
    #[tokio::test]
    async fn test_replication_task_closes_shard_on_io_error() {
        let scenario = fail::FailScenario::setup();
        fail::cfg("ingester:append_records", "return").unwrap();

        let leader_id: NodeId = "test-leader".into();
        let follower_id: NodeId = "test-follower".into();
        let cluster = create_cluster_for_test(
            Vec::new(),
            &[QuickwitService::Indexer.as_str()],
            &ChannelTransport::default(),
            true,
        )
        .await
        .unwrap();
        let (_temp_dir, state) = IngesterState::for_test(cluster).await;
        let (syn_replication_stream_tx, syn_replication_stream) =
            ServiceStream::new_bounded(SYN_REPLICATION_STREAM_CAPACITY);
        let (ack_replication_stream_tx, mut ack_replication_stream) =
            ServiceStream::new_unbounded();

        let disk_capacity = ByteSize::mb(256);
        let memory_capacity = ByteSize::mb(1);

        let _replication_task_handle = ReplicationTask::spawn(
            leader_id.clone(),
            follower_id,
            state.clone(),
            syn_replication_stream,
            ack_replication_stream_tx,
            disk_capacity,
            memory_capacity,
        );

        let index_uid = IndexUid::for_test("test-index", 0);
        let queue_id_01 = queue_id(&index_uid, "test-source", &ShardId::from(1));
        let replica_shard = IngesterShard::new_replica(
            index_uid.clone(),
            "test-source".to_string(),
            ShardId::from(1),
            leader_id,
        )
        .build();
        let mut state_guard = state.lock_fully().await.unwrap();

        state_guard
            .shards
            .insert(queue_id_01.clone(), replica_shard);

        state_guard
            .mrecordlog
            .create_queue(&queue_id_01)
            .await
            .unwrap();

        drop(state_guard);

        let replicate_request = ReplicateRequest {
            leader_id: "test-leader".to_string(),
            follower_id: "test-follower".to_string(),
            commit_type: CommitTypeV2::Auto as i32,
            subrequests: vec![ReplicateSubrequest {
                subrequest_id: 0,
                index_uid: Some(index_uid.clone()),
                source_id: "test-source".to_string(),
                shard_id: Some(ShardId::from(1)),
                doc_batch: Some(DocBatchV2::for_test(["test-doc-foo"])),
                from_position_exclusive: Position::offset(0u64).into(),
            }],
            replication_seqno: 0,
        };
        let syn_replication_message =
            SynReplicationMessage::new_replicate_request(replicate_request);
        syn_replication_stream_tx
            .send(syn_replication_message)
            .await
            .unwrap();
        let ack_replication_message = ack_replication_stream.next().await.unwrap().unwrap();
        let replicate_response = into_replicate_response(ack_replication_message);

        assert_eq!(replicate_response.follower_id, "test-follower");
        assert_eq!(replicate_response.successes.len(), 0);
        assert_eq!(replicate_response.failures.len(), 1);

        let replicate_failure = &replicate_response.failures[0];
        assert_eq!(replicate_failure.index_uid(), &index_uid);
        assert_eq!(replicate_failure.source_id, "test-source");
        assert_eq!(replicate_failure.shard_id(), ShardId::from(1));
        assert_eq!(
            replicate_failure.reason(),
            ReplicateFailureReason::ShardClosed
        );

        let state_guard = state.lock_partially().await.unwrap();
        let replica_shard = state_guard.shards.get(&queue_id_01).unwrap();
        replica_shard.assert_is_closed();

        scenario.teardown();
    }

    #[tokio::test]
    async fn test_replication_task_resource_exhausted() {
        let leader_id: NodeId = "test-leader".into();
        let follower_id: NodeId = "test-follower".into();
        let cluster = create_cluster_for_test(
            Vec::new(),
            &[QuickwitService::Indexer.as_str()],
            &ChannelTransport::default(),
            true,
        )
        .await
        .unwrap();
        let (_temp_dir, state) = IngesterState::for_test(cluster).await;
        let (syn_replication_stream_tx, syn_replication_stream) =
            ServiceStream::new_bounded(SYN_REPLICATION_STREAM_CAPACITY);
        let (ack_replication_stream_tx, mut ack_replication_stream) =
            ServiceStream::new_unbounded();

        let disk_capacity = ByteSize(0);
        let memory_capacity = ByteSize(0);

        let _replication_task_handle = ReplicationTask::spawn(
            leader_id.clone(),
            follower_id,
            state.clone(),
            syn_replication_stream,
            ack_replication_stream_tx,
            disk_capacity,
            memory_capacity,
        );

        let index_uid = IndexUid::for_test("test-index", 0);
        let replica_shard = IngesterShard::new_replica(
            index_uid.clone(),
            "test-source".to_string(),
            ShardId::from(1),
            leader_id,
        )
        .build();
        let queue_id_01 = replica_shard.queue_id();
        state
            .lock_fully()
            .await
            .unwrap()
            .shards
            .insert(queue_id_01.clone(), replica_shard);

        let replicate_request = ReplicateRequest {
            leader_id: "test-leader".to_string(),
            follower_id: "test-follower".to_string(),
            commit_type: CommitTypeV2::Auto as i32,
            subrequests: vec![ReplicateSubrequest {
                subrequest_id: 0,
                index_uid: Some(index_uid.clone()),
                source_id: "test-source".to_string(),
                shard_id: Some(ShardId::from(1)),
                doc_batch: Some(DocBatchV2::for_test(["test-doc-foo"])),
                from_position_exclusive: Some(Position::Beginning),
            }],
            replication_seqno: 0,
        };
        let syn_replication_message =
            SynReplicationMessage::new_replicate_request(replicate_request);
        syn_replication_stream_tx
            .send(syn_replication_message)
            .await
            .unwrap();
        let ack_replication_message = ack_replication_stream.next().await.unwrap().unwrap();
        let replicate_response = into_replicate_response(ack_replication_message);

        assert_eq!(replicate_response.follower_id, "test-follower");
        assert_eq!(replicate_response.successes.len(), 0);
        assert_eq!(replicate_response.failures.len(), 1);

        let replicate_failure_0 = &replicate_response.failures[0];
        assert_eq!(replicate_failure_0.index_uid(), &index_uid);
        assert_eq!(replicate_failure_0.source_id, "test-source");
        assert_eq!(replicate_failure_0.shard_id(), ShardId::from(1));
        assert_eq!(
            replicate_failure_0.reason(),
            ReplicateFailureReason::WalFull
        );
    }
}


================================================
FILE: quickwit/quickwit-ingest/src/ingest_v2/router.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::{HashMap, HashSet};
use std::fmt;
use std::sync::{Arc, OnceLock, Weak};
use std::time::Duration;

use async_trait::async_trait;
use futures::stream::FuturesUnordered;
use futures::{Future, StreamExt};
use quickwit_common::metrics::{GaugeGuard, MEMORY_METRICS};
use quickwit_common::pubsub::{EventBroker, EventSubscriber};
use quickwit_common::{rate_limited_error, rate_limited_warn};
use quickwit_proto::control_plane::{
    ControlPlaneService, ControlPlaneServiceClient, GetOrCreateOpenShardsRequest,
    GetOrCreateOpenShardsSubrequest,
};
use quickwit_proto::ingest::ingester::{
    IngesterService, PersistFailureReason, PersistRequest, PersistResponse, PersistSubrequest,
};
use quickwit_proto::ingest::router::{
    IngestFailureReason, IngestRequestV2, IngestResponseV2, IngestRouterService,
};
use quickwit_proto::ingest::{CommitTypeV2, IngestV2Error, IngestV2Result, RateLimitingCause};
use quickwit_proto::types::{NodeId, SubrequestId};
use serde_json::{Value as JsonValue, json};
use tokio::sync::{Mutex, Semaphore};
use tokio::time::error::Elapsed;
use tracing::{error, info};

use super::broadcast::IngesterCapacityScoreUpdate;
use super::debouncing::{
    DebouncedGetOrCreateOpenShardsRequest, GetOrCreateOpenShardsRequestDebouncer,
};
use super::ingester::PERSIST_REQUEST_TIMEOUT;
use super::metrics::IngestResultMetrics;
use super::routing_table::RoutingTable;
use super::workbench::IngestWorkbench;
use super::{IngesterPool, pending_subrequests};
use crate::get_ingest_router_buffer_size;
use crate::ingest_v2::metrics::INGEST_V2_METRICS;

/// Duration after which ingest requests time out with [`IngestV2Error::Timeout`].
fn ingest_request_timeout() -> Duration {
    const DEFAULT_INGEST_REQUEST_TIMEOUT: Duration = if cfg!(any(test, feature = "testsuite")) {
        Duration::from_millis(10)
    } else {
        Duration::from_secs(35)
    };
    static TIMEOUT: OnceLock<Duration> = OnceLock::new();
    *TIMEOUT.get_or_init(|| {
        let duration_ms = quickwit_common::get_from_env(
            "QW_INGEST_REQUEST_TIMEOUT_MS",
            DEFAULT_INGEST_REQUEST_TIMEOUT.as_millis() as u64,
            false,
        );
        let minimum_ingest_request_timeout: Duration =
            PERSIST_REQUEST_TIMEOUT * (MAX_PERSIST_ATTEMPTS as u32) + Duration::from_secs(5);
        let requested_ingest_request_timeout = Duration::from_millis(duration_ms);
        if requested_ingest_request_timeout < minimum_ingest_request_timeout {
            error!(
                "ingest request timeout too short {}ms, setting to {}ms",
                requested_ingest_request_timeout.as_millis(),
                minimum_ingest_request_timeout.as_millis()
            );
            minimum_ingest_request_timeout
        } else {
            requested_ingest_request_timeout
        }
    })
}

const MAX_PERSIST_ATTEMPTS: usize = 5;

type PersistResult = (PersistRequestSummary, IngestV2Result<PersistResponse>);

#[derive(Clone)]
pub struct IngestRouter {
    self_node_id: NodeId,
    control_plane: ControlPlaneServiceClient,
    ingester_pool: IngesterPool,
    state: Arc<Mutex<RouterState>>,
    replication_factor: usize,
    // Limits the number of ingest requests in-flight to some capacity in bytes.
    ingest_semaphore: Arc<Semaphore>,
    event_broker: EventBroker,
}

struct RouterState {
    // Debounces `GetOrCreateOpenShardsRequest` requests to the control plane.
    debouncer: GetOrCreateOpenShardsRequestDebouncer,
    // Routing table of nodes, their WAL capacity, and the number of open shards per source.
    routing_table: RoutingTable,
}

impl fmt::Debug for IngestRouter {
    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
        f.debug_struct("IngestRouter")
            .field("self_node_id", &self.self_node_id)
            .field("replication_factor", &self.replication_factor)
            .finish()
    }
}

impl IngestRouter {
    pub fn new(
        self_node_id: NodeId,
        control_plane: ControlPlaneServiceClient,
        ingester_pool: IngesterPool,
        replication_factor: usize,
        event_broker: EventBroker,
        self_availability_zone: Option<String>,
    ) -> Self {
        let state = Arc::new(Mutex::new(RouterState {
            debouncer: GetOrCreateOpenShardsRequestDebouncer::default(),
            routing_table: RoutingTable::new(self_availability_zone),
        }));
        let ingest_semaphore_permits = get_ingest_router_buffer_size().as_u64() as usize;
        let ingest_semaphore = Arc::new(Semaphore::new(ingest_semaphore_permits));

        Self {
            self_node_id,
            control_plane,
            ingester_pool,
            state,
            replication_factor,
            ingest_semaphore,
            event_broker,
        }
    }

    pub fn subscribe(&self) {
        let weak_router_state = WeakRouterState(Arc::downgrade(&self.state));
        self.event_broker
            .subscribe::<IngesterCapacityScoreUpdate>(weak_router_state)
            .forever();
    }

    /// Inspects the shard table for each subrequest and returns the appropriate
    /// [`GetOrCreateOpenShardsRequest`] request if open shards do not exist for all of them.
    async fn make_get_or_create_open_shard_request(
        &self,
        workbench: &mut IngestWorkbench,
        ingester_pool: &IngesterPool,
    ) -> DebouncedGetOrCreateOpenShardsRequest {
        let mut debounced_request = DebouncedGetOrCreateOpenShardsRequest::default();
        let unavailable_leaders: &HashSet<NodeId> = &workbench.unavailable_leaders;

        let mut state_guard = self.state.lock().await;

        for subrequest in pending_subrequests(&workbench.subworkbenches) {
            if !state_guard.routing_table.has_open_nodes(
                &subrequest.index_id,
                &subrequest.source_id,
                ingester_pool,
                unavailable_leaders,
            ) {
                // No known nodes with open shards for this source. Ask the control
                // plane to create shards so we have somewhere to route to.
                let acquire_result = state_guard
                    .debouncer
                    .acquire(&subrequest.index_id, &subrequest.source_id);

                match acquire_result {
                    Ok(permit) => {
                        let subrequest = GetOrCreateOpenShardsSubrequest {
                            subrequest_id: subrequest.subrequest_id,
                            index_id: subrequest.index_id.clone(),
                            source_id: subrequest.source_id.clone(),
                        };
                        debounced_request.push_subrequest(subrequest, permit);
                    }
                    Err(barrier) => {
                        debounced_request.push_barrier(barrier);
                    }
                }
            }
        }
        drop(state_guard);

        if !debounced_request.is_empty() && !workbench.closed_shards.is_empty() {
            info!(closed_shards=?workbench.closed_shards, "reporting closed shard(s) to control plane");
            debounced_request
                .closed_shards
                .append(&mut workbench.closed_shards);
        }
        if !debounced_request.is_empty() && !unavailable_leaders.is_empty() {
            info!(unavailable_leaders=?unavailable_leaders, "reporting unavailable leader(s) to control plane");

            for unavailable_leader in unavailable_leaders.iter() {
                debounced_request
                    .unavailable_leaders
                    .push(unavailable_leader.to_string());
            }
        }
        debounced_request
    }

    async fn populate_routing_table_debounced(
        &self,
        workbench: &mut IngestWorkbench,
        debounced_request: DebouncedGetOrCreateOpenShardsRequest,
    ) {
        let (request_opt, rendezvous) = debounced_request.take();

        if let Some(request) = request_opt {
            self.populate_routing_table(workbench, request).await;
        }
        rendezvous.wait().await;
    }

    /// Issues a [`GetOrCreateOpenShardsRequest`] request to the control plane and populates the
    /// shard table according to the response received.
    async fn populate_routing_table(
        &self,
        workbench: &mut IngestWorkbench,
        request: GetOrCreateOpenShardsRequest,
    ) {
        if request.subrequests.is_empty() {
            return;
        }
        let response_result = self.control_plane.get_or_create_open_shards(request).await;
        let response = match response_result {
            Ok(response) => response,
            Err(control_plane_error) => {
                if workbench.is_last_attempt() {
                    rate_limited_error!(
                        limit_per_min = 10,
                        "failed to get open shards from control plane: {control_plane_error}"
                    );
                } else {
                    rate_limited_warn!(
                        limit_per_min = 10,
                        "failed to get open shards from control plane: {control_plane_error}"
                    );
                };
                return;
            }
        };
        let mut state_guard = self.state.lock().await;

        for success in response.successes {
            state_guard.routing_table.merge_from_shards(
                success.index_uid().clone(),
                success.source_id,
                success.open_shards,
            );
        }
        drop(state_guard);

        for failure in response.failures {
            workbench.record_get_or_create_open_shards_failure(failure);
        }
    }

    async fn process_persist_results(
        &self,
        workbench: &mut IngestWorkbench,
        mut persist_futures: FuturesUnordered<impl Future<Output = PersistResult>>,
    ) {
        let mut unavailable_leaders: HashSet<NodeId> = HashSet::new();

        while let Some((persist_summary, persist_result)) = persist_futures.next().await {
            match persist_result {
                Ok(persist_response) => {
                    let leader_id = NodeId::from(persist_response.leader_id.clone());

                    for persist_success in persist_response.successes {
                        workbench.record_persist_success(persist_success);
                    }
                    for persist_failure in persist_response.failures {
                        workbench.record_persist_failure(&persist_failure);

                        match persist_failure.reason() {
                            PersistFailureReason::NoShardsAvailable => {
                                // For non-critical failures, we don't mark the nodes unavailable;
                                // a routing update is piggybacked on PersistResponses, so shard
                                // counts and capacity scores will be fresh on the next try.
                            }
                            PersistFailureReason::NodeUnavailable
                            | PersistFailureReason::WalFull
                            | PersistFailureReason::Timeout => {
                                unavailable_leaders.insert(leader_id.clone());
                            }
                            _ => {}
                        }
                    }

                    if let Some(routing_update) = persist_response.routing_update {
                        // Since we just talked to the node, we take advantage and use the
                        // opportunity to get a fresh routing update.
                        let mut state_guard = self.state.lock().await;
                        for shard_update in routing_update.source_shard_updates {
                            state_guard.routing_table.apply_capacity_update(
                                leader_id.clone(),
                                shard_update.index_uid().clone(),
                                shard_update.source_id,
                                routing_update.capacity_score as usize,
                                shard_update.open_shard_count as usize,
                            );
                        }
                        drop(state_guard);

                        workbench.closed_shards.extend(routing_update.closed_shards);
                    }
                }
                Err(persist_error) => {
                    if workbench.is_last_attempt() {
                        rate_limited_error!(
                            limit_per_min = 10,
                            "failed to persist records on ingester `{}`: {persist_error}",
                            persist_summary.leader_id
                        );
                    } else {
                        rate_limited_warn!(
                            limit_per_min = 10,
                            "failed to persist records on ingester `{}`: {persist_error}",
                            persist_summary.leader_id
                        );
                    }
                    workbench.record_persist_error(persist_error, persist_summary);
                }
            };
        }
        workbench.unavailable_leaders.extend(unavailable_leaders);
    }

    async fn batch_persist(&self, workbench: &mut IngestWorkbench, commit_type: CommitTypeV2) {
        // Let's first create the shards that might be missing.
        let debounced_request = self
            .make_get_or_create_open_shard_request(workbench, &self.ingester_pool)
            .await;

        self.populate_routing_table_debounced(workbench, debounced_request)
            .await;

        let unavailable_leaders = &workbench.unavailable_leaders;
        let mut no_shards_available_subrequest_ids: Vec<SubrequestId> = Vec::new();
        let mut per_leader_persist_subrequests: HashMap<&NodeId, Vec<PersistSubrequest>> =
            HashMap::new();

        let state_guard = self.state.lock().await;

        for subrequest in pending_subrequests(&workbench.subworkbenches) {
            let ingester_node = state_guard.routing_table.pick_node(
                &subrequest.index_id,
                &subrequest.source_id,
                &self.ingester_pool,
                unavailable_leaders,
            );

            let ingester_node = match ingester_node {
                Some(node) => node,
                None => {
                    no_shards_available_subrequest_ids.push(subrequest.subrequest_id);
                    continue;
                }
            };
            let az_locality = state_guard
                .routing_table
                .classify_az_locality(&ingester_node.node_id, &self.ingester_pool);
            INGEST_V2_METRICS
                .ingest_attempts
                .with_label_values([az_locality])
                .inc();
            let persist_subrequest = PersistSubrequest {
                subrequest_id: subrequest.subrequest_id,
                index_uid: Some(ingester_node.index_uid.clone()),
                source_id: subrequest.source_id.clone(),
                doc_batch: subrequest.doc_batch.clone(),
            };
            per_leader_persist_subrequests
                .entry(&ingester_node.node_id)
                .or_default()
                .push(persist_subrequest);
        }
        let persist_futures = FuturesUnordered::new();

        for (leader_id, subrequests) in per_leader_persist_subrequests {
            let leader_id: NodeId = leader_id.clone();
            let subrequest_ids: Vec<SubrequestId> = subrequests
                .iter()
                .map(|subrequest| subrequest.subrequest_id)
                .collect();
            let Some(ingester) = self.ingester_pool.get(&leader_id).map(|h| h.client) else {
                no_shards_available_subrequest_ids.extend(subrequest_ids);
                continue;
            };
            let persist_summary = PersistRequestSummary {
                leader_id: leader_id.clone(),
                subrequest_ids,
            };
            let persist_request = PersistRequest {
                leader_id: leader_id.into(),
                subrequests,
                commit_type: commit_type as i32,
            };

            let persist_future = async move {
                let persist_result = tokio::time::timeout(
                    PERSIST_REQUEST_TIMEOUT,
                    ingester.persist(persist_request),
                )
                .await
                .unwrap_or_else(|_| {
                    let message = format!(
                        "persist request timed out after {} seconds",
                        PERSIST_REQUEST_TIMEOUT.as_secs()
                    );
                    Err(IngestV2Error::Timeout(message))
                });
                (persist_summary, persist_result)
            };
            persist_futures.push(persist_future);
        }
        drop(state_guard);

        for subrequest_id in no_shards_available_subrequest_ids {
            workbench.record_no_shards_available(subrequest_id);
        }
        self.process_persist_results(workbench, persist_futures)
            .await;
    }

    async fn retry_batch_persist(
        &self,
        ingest_request: IngestRequestV2,
        max_num_attempts: usize,
    ) -> IngestResponseV2 {
        let commit_type = ingest_request.commit_type();
        let mut workbench = if matches!(commit_type, CommitTypeV2::Force | CommitTypeV2::WaitFor) {
            IngestWorkbench::new_with_publish_tracking(
                ingest_request.subrequests,
                max_num_attempts,
                self.event_broker.clone(),
            )
        } else {
            IngestWorkbench::new(ingest_request.subrequests, max_num_attempts)
        };
        while !workbench.is_complete() {
            workbench.new_attempt();
            self.batch_persist(&mut workbench, commit_type).await;
        }
        workbench.into_ingest_result().await
    }

    async fn ingest_timeout(
        &self,
        ingest_request: IngestRequestV2,
        timeout_duration: Duration,
    ) -> IngestV2Result<IngestResponseV2> {
        tokio::time::timeout(
            timeout_duration,
            self.retry_batch_persist(ingest_request, MAX_PERSIST_ATTEMPTS),
        )
        .await
        .map_err(|_elapsed: Elapsed| {
            let message = format!(
                "ingest request timed out after {} millis",
                timeout_duration.as_millis()
            );
            error!(
                "ingest request should not timeout as there is a timeout on independent ingest \
                 requests too. timeout after {}",
                timeout_duration.as_millis()
            );
            IngestV2Error::Timeout(message)
        })
    }

    pub async fn debug_info(&self) -> JsonValue {
        let state_guard = self.state.lock().await;
        let routing_table_json = state_guard.routing_table.debug_info(&self.ingester_pool);

        json!({
            "routing_table": routing_table_json,
        })
    }
}

fn update_ingest_metrics(ingest_result: &IngestV2Result<IngestResponseV2>, num_subrequests: usize) {
    let num_subrequests = num_subrequests as u64;
    let ingest_results_metrics: &IngestResultMetrics = &INGEST_V2_METRICS.ingest_results;
    match ingest_result {
        Ok(ingest_response) => {
            ingest_results_metrics
                .success
                .inc_by(ingest_response.successes.len() as u64);
            for ingest_failure in &ingest_response.failures {
                match ingest_failure.reason() {
                    IngestFailureReason::CircuitBreaker => {
                        ingest_results_metrics.circuit_breaker.inc();
                    }
                    IngestFailureReason::Unspecified => ingest_results_metrics.unspecified.inc(),
                    IngestFailureReason::IndexNotFound => {
                        ingest_results_metrics.index_not_found.inc()
                    }
                    IngestFailureReason::SourceNotFound => {
                        ingest_results_metrics.source_not_found.inc()
                    }
                    IngestFailureReason::Internal => ingest_results_metrics.internal.inc(),
                    IngestFailureReason::NoShardsAvailable => {
                        ingest_results_metrics.no_shards_available.inc()
                    }
                    IngestFailureReason::ShardRateLimited => {
                        ingest_results_metrics.shard_rate_limited.inc()
                    }
                    IngestFailureReason::WalFull => ingest_results_metrics.wal_full.inc(),
                    IngestFailureReason::Timeout => ingest_results_metrics.timeout.inc(),
                    IngestFailureReason::RouterLoadShedding => {
                        ingest_results_metrics.router_load_shedding.inc()
                    }
                    IngestFailureReason::LoadShedding => ingest_results_metrics.load_shedding.inc(),
                }
            }
        }
        Err(ingest_error) => match ingest_error {
            IngestV2Error::TooManyRequests(rate_limiting_cause) => match rate_limiting_cause {
                RateLimitingCause::RouterLoadShedding => {
                    ingest_results_metrics
                        .router_load_shedding
                        .inc_by(num_subrequests);
                }
                RateLimitingCause::LoadShedding => {
                    ingest_results_metrics.load_shedding.inc_by(num_subrequests)
                }
                RateLimitingCause::WalFull => {
                    ingest_results_metrics.wal_full.inc_by(num_subrequests);
                }
                RateLimitingCause::CircuitBreaker => {
                    ingest_results_metrics
                        .circuit_breaker
                        .inc_by(num_subrequests);
                }
                RateLimitingCause::ShardRateLimiting => {
                    ingest_results_metrics
                        .shard_rate_limited
                        .inc_by(num_subrequests);
                }
                RateLimitingCause::Unknown => {
                    ingest_results_metrics.unspecified.inc_by(num_subrequests);
                }
            },
            IngestV2Error::Timeout(_) => {
                ingest_results_metrics
                    .router_timeout
                    .inc_by(num_subrequests);
            }
            IngestV2Error::ShardNotFound { .. } => {
                ingest_results_metrics
                    .shard_not_found
                    .inc_by(num_subrequests);
            }
            IngestV2Error::Unavailable(_) => {
                ingest_results_metrics.unavailable.inc_by(num_subrequests);
            }
            IngestV2Error::Internal(_) => {
                ingest_results_metrics.internal.inc_by(num_subrequests);
            }
        },
    }
}

#[async_trait]
impl IngestRouterService for IngestRouter {
    async fn ingest(&self, ingest_request: IngestRequestV2) -> IngestV2Result<IngestResponseV2> {
        let request_size_bytes = ingest_request.num_bytes();

        let mut gauge_guard = GaugeGuard::from_gauge(&MEMORY_METRICS.in_flight.ingest_router);
        gauge_guard.add(request_size_bytes as i64);
        let num_subrequests = ingest_request.subrequests.len();

        let _permit = self
            .ingest_semaphore
            .clone()
            .try_acquire_many_owned(request_size_bytes as u32)
            .map_err(|_| IngestV2Error::TooManyRequests(RateLimitingCause::RouterLoadShedding))?;

        let ingest_res = if ingest_request.commit_type() == CommitTypeV2::Auto {
            self.ingest_timeout(ingest_request, ingest_request_timeout())
                .await
        } else {
            Ok(self
                .retry_batch_persist(ingest_request, MAX_PERSIST_ATTEMPTS)
                .await)
        };
        update_ingest_metrics(&ingest_res, num_subrequests);

        ingest_res
    }
}

#[derive(Clone)]
struct WeakRouterState(Weak<Mutex<RouterState>>);

#[async_trait]
impl EventSubscriber<IngesterCapacityScoreUpdate> for WeakRouterState {
    async fn handle_event(&mut self, update: IngesterCapacityScoreUpdate) {
        let Some(state) = self.0.upgrade() else {
            return;
        };
        let mut state_guard = state.lock().await;
        state_guard.routing_table.apply_capacity_update(
            update.node_id,
            update.source_uid.index_uid,
            update.source_uid.source_id,
            update.capacity_score,
            update.open_shard_count,
        );
    }
}

pub(super) struct PersistRequestSummary {
    pub leader_id: NodeId,
    pub subrequest_ids: Vec<SubrequestId>,
}

#[cfg(test)]
mod tests {
    use quickwit_proto::control_plane::{
        GetOrCreateOpenShardsFailure, GetOrCreateOpenShardsFailureReason,
        GetOrCreateOpenShardsResponse, GetOrCreateOpenShardsSuccess, MockControlPlaneService,
    };
    use quickwit_proto::ingest::ingester::{
        IngesterServiceClient, IngesterStatus, MockIngesterService, PersistFailure,
        PersistResponse, PersistSuccess, RoutingUpdate, SourceShardUpdate,
    };
    use quickwit_proto::ingest::router::IngestSubrequest;
    use quickwit_proto::ingest::{
        CommitTypeV2, DocBatchV2, ParseFailure, ParseFailureReason, Shard, ShardState,
    };
    use quickwit_proto::types::{DocUid, IndexUid, Position, ShardId, SourceUid};

    use super::*;
    use crate::IngesterPoolEntry;
    use crate::ingest_v2::workbench::SubworkbenchFailure;

    #[tokio::test]
    async fn test_router_make_get_or_create_open_shard_request() {
        let self_node_id = "test-router".into();
        let control_plane: ControlPlaneServiceClient =
            ControlPlaneServiceClient::from_mock(MockControlPlaneService::new());
        let ingester_pool = IngesterPool::default();
        let replication_factor = 1;
        let router = IngestRouter::new(
            self_node_id,
            control_plane,
            ingester_pool.clone(),
            replication_factor,
            EventBroker::default(),
            Some("test-az".to_string()),
        );
        let mut workbench = IngestWorkbench::default();
        let (get_or_create_open_shard_request_opt, rendezvous) = router
            .make_get_or_create_open_shard_request(&mut workbench, &ingester_pool)
            .await
            .take();
        assert!(get_or_create_open_shard_request_opt.is_none());
        assert!(rendezvous.is_empty());

        {
            let mut state_guard = router.state.lock().await;
            state_guard.routing_table.apply_capacity_update(
                "test-ingester-0".into(),
                IndexUid::for_test("test-index-0", 0),
                "test-source".to_string(),
                8,
                1,
            );
        }

        let ingest_subrequests: Vec<IngestSubrequest> = vec![
            IngestSubrequest {
                subrequest_id: 0,
                index_id: "test-index-0".to_string(),
                source_id: "test-source".to_string(),
                ..Default::default()
            },
            IngestSubrequest {
                subrequest_id: 1,
                index_id: "test-index-1".to_string(),
                source_id: "test-source".to_string(),
                ..Default::default()
            },
        ];
        let mut workbench = IngestWorkbench::new(ingest_subrequests.clone(), 3);
        let (get_or_create_open_shard_request_opt, rendezvous_1) = router
            .make_get_or_create_open_shard_request(&mut workbench, &ingester_pool)
            .await
            .take();

        let get_or_create_open_shard_request = get_or_create_open_shard_request_opt.unwrap();
        assert_eq!(get_or_create_open_shard_request.subrequests.len(), 2);

        assert_eq!(rendezvous_1.num_permits(), 2);
        assert_eq!(rendezvous_1.num_barriers(), 0);

        let subrequest = &get_or_create_open_shard_request.subrequests[0];
        assert_eq!(subrequest.index_id, "test-index-0");
        assert_eq!(subrequest.source_id, "test-source");

        let subrequest = &get_or_create_open_shard_request.subrequests[1];
        assert_eq!(subrequest.index_id, "test-index-1");
        assert_eq!(subrequest.source_id, "test-source");

        assert!(
            get_or_create_open_shard_request
                .unavailable_leaders
                .is_empty()
        );
        assert!(workbench.unavailable_leaders.is_empty());

        let (get_or_create_open_shard_request_opt, rendezvous_2) = router
            .make_get_or_create_open_shard_request(&mut workbench, &ingester_pool)
            .await
            .take();

        assert!(get_or_create_open_shard_request_opt.is_none());

        assert_eq!(rendezvous_2.num_permits(), 0);
        assert_eq!(rendezvous_2.num_barriers(), 2);

        drop(rendezvous_1);
        drop(rendezvous_2);

        ingester_pool.insert(
            "test-ingester-0".into(),
            IngesterPoolEntry::mocked_ingester(),
        );
        {
            // Ingester-0 is in pool and in table, but marked unavailable on the workbench
            // (simulating a prior transport error). has_open_nodes returns false → both
            // subrequests trigger CP request.
            workbench
                .unavailable_leaders
                .insert("test-ingester-0".into());
            let (get_or_create_open_shard_request_opt, _rendezvous) = router
                .make_get_or_create_open_shard_request(&mut workbench, &ingester_pool)
                .await
                .take();
            let get_or_create_open_shard_request = get_or_create_open_shard_request_opt.unwrap();
            assert_eq!(get_or_create_open_shard_request.subrequests.len(), 2);
            assert_eq!(
                get_or_create_open_shard_request.unavailable_leaders.len(),
                1
            );
        }
        {
            // Fresh workbench: ingester-0 is in pool, in table, and NOT unavailable.
            // has_open_nodes returns true for index-0 → only index-1 triggers request.
            let mut workbench = IngestWorkbench::new(ingest_subrequests, 3);
            let (get_or_create_open_shard_request_opt, _rendezvous) = router
                .make_get_or_create_open_shard_request(&mut workbench, &ingester_pool)
                .await
                .take();
            let get_or_create_open_shard_request = get_or_create_open_shard_request_opt.unwrap();
            assert_eq!(get_or_create_open_shard_request.subrequests.len(), 1);

            let subrequest = &get_or_create_open_shard_request.subrequests[0];
            assert_eq!(subrequest.index_id, "test-index-1");
            assert_eq!(subrequest.source_id, "test-source");

            assert!(
                get_or_create_open_shard_request
                    .unavailable_leaders
                    .is_empty()
            );
        }
    }

    #[tokio::test]
    async fn test_router_populate_routing_table() {
        let self_node_id = "test-router".into();

        let index_uid: IndexUid = IndexUid::for_test("test-index-0", 0);
        let index_uid2: IndexUid = IndexUid::for_test("test-index-1", 0);
        let mut mock_control_plane = MockControlPlaneService::new();
        mock_control_plane
            .expect_get_or_create_open_shards()
            .once()
            .returning(move |request| {
                assert_eq!(request.subrequests.len(), 4);

                let subrequest_0 = &request.subrequests[0];
                assert_eq!(subrequest_0.index_id, "test-index-0");
                assert_eq!(subrequest_0.source_id, "test-source");

                let subrequest_1 = &request.subrequests[1];
                assert_eq!(subrequest_1.index_id, "test-index-1");
                assert_eq!(subrequest_1.source_id, "test-source");

                let subrequest_2 = &request.subrequests[2];
                assert_eq!(subrequest_2.index_id, "index-not-found");
                assert_eq!(subrequest_2.source_id, "test-source");

                let subrequest_3 = &request.subrequests[3];
                assert_eq!(subrequest_3.index_id, "test-index-0");
                assert_eq!(subrequest_3.source_id, "source-not-found");

                let response = GetOrCreateOpenShardsResponse {
                    successes: vec![
                        GetOrCreateOpenShardsSuccess {
                            subrequest_id: 0,
                            index_uid: Some(index_uid.clone()),
                            source_id: "test-source".to_string(),
                            open_shards: vec![Shard {
                                index_uid: Some(index_uid.clone()),
                                source_id: "test-source".to_string(),
                                shard_id: Some(ShardId::from(1)),
                                shard_state: ShardState::Open as i32,
                                leader_id: "test-ingester-0".to_string(),
                                ..Default::default()
                            }],
                        },
                        GetOrCreateOpenShardsSuccess {
                            subrequest_id: 1,
                            index_uid: Some(index_uid2.clone()),
                            source_id: "test-source".to_string(),
                            open_shards: vec![
                                Shard {
                                    index_uid: Some(index_uid2.clone()),
                                    source_id: "test-source".to_string(),
                                    shard_id: Some(ShardId::from(1)),
                                    shard_state: ShardState::Open as i32,
                                    leader_id: "test-ingester-1".to_string(),
                                    ..Default::default()
                                },
                                Shard {
                                    index_uid: Some(index_uid2.clone()),
                                    source_id: "test-source".to_string(),
                                    shard_id: Some(ShardId::from(2)),
                                    shard_state: ShardState::Open as i32,
                                    leader_id: "test-ingester-1".to_string(),
                                    ..Default::default()
                                },
                            ],
                        },
                    ],
                    failures: vec![
                        GetOrCreateOpenShardsFailure {
                            subrequest_id: 2,
                            index_id: "index-not-found".to_string(),
                            source_id: "test-source".to_string(),
                            reason: GetOrCreateOpenShardsFailureReason::IndexNotFound as i32,
                        },
                        GetOrCreateOpenShardsFailure {
                            subrequest_id: 3,
                            index_id: "test-index-0".to_string(),
                            source_id: "source-not-found".to_string(),
                            reason: GetOrCreateOpenShardsFailureReason::SourceNotFound as i32,
                        },
                    ],
                };
                Ok(response)
            });
        let control_plane = ControlPlaneServiceClient::from_mock(mock_control_plane);
        let ingester_pool = IngesterPool::default();
        let replication_factor = 1;
        let router = IngestRouter::new(
            self_node_id,
            control_plane,
            ingester_pool.clone(),
            replication_factor,
            EventBroker::default(),
            Some("test-az".to_string()),
        );
        let ingest_subrequests = vec![
            IngestSubrequest {
                subrequest_id: 0,
                index_id: "test-index-0".to_string(),
                source_id: "test-source".to_string(),
                ..Default::default()
            },
            IngestSubrequest {
                subrequest_id: 1,
                index_id: "test-index-1".to_string(),
                source_id: "test-source".to_string(),
                ..Default::default()
            },
            IngestSubrequest {
                subrequest_id: 2,
                index_id: "index-not-found".to_string(),
                source_id: "test-source".to_string(),
                ..Default::default()
            },
            IngestSubrequest {
                subrequest_id: 3,
                index_id: "source-not-found".to_string(),
                source_id: "test-source".to_string(),
                ..Default::default()
            },
        ];
        let mut workbench = IngestWorkbench::new(ingest_subrequests, 2);

        let get_or_create_open_shards_request = GetOrCreateOpenShardsRequest {
            subrequests: vec![
                GetOrCreateOpenShardsSubrequest {
                    subrequest_id: 0,
                    index_id: "test-index-0".to_string(),
                    source_id: "test-source".to_string(),
                },
                GetOrCreateOpenShardsSubrequest {
                    subrequest_id: 1,
                    index_id: "test-index-1".to_string(),
                    source_id: "test-source".to_string(),
                },
                GetOrCreateOpenShardsSubrequest {
                    subrequest_id: 2,
                    index_id: "index-not-found".to_string(),
                    source_id: "test-source".to_string(),
                },
                GetOrCreateOpenShardsSubrequest {
                    subrequest_id: 3,
                    index_id: "test-index-0".to_string(),
                    source_id: "source-not-found".to_string(),
                },
            ],
            closed_shards: Vec::new(),
            unavailable_leaders: Vec::new(),
        };
        router
            .populate_routing_table(&mut workbench, get_or_create_open_shards_request)
            .await;

        let subworkbench = workbench.subworkbenches.get(&2).unwrap();
        assert!(matches!(
            subworkbench.last_failure_opt,
            Some(SubworkbenchFailure::IndexNotFound)
        ));

        let subworkbench = workbench.subworkbenches.get(&3).unwrap();
        assert!(matches!(
            subworkbench.last_failure_opt,
            Some(SubworkbenchFailure::SourceNotFound)
        ));
    }

    #[tokio::test]
    async fn test_router_batch_persist_records_no_shards_available_empty_routing_table() {
        let self_node_id = "test-router".into();
        let mut mock_control_plane = MockControlPlaneService::new();
        mock_control_plane
            .expect_get_or_create_open_shards()
            .once()
            .returning(move |request| {
                assert_eq!(request.subrequests.len(), 1);

                let subrequest = &request.subrequests[0];
                assert_eq!(subrequest.index_id, "test-index");
                assert_eq!(subrequest.source_id, "test-source");

                let response = GetOrCreateOpenShardsResponse::default();
                Ok(response)
            });
        let control_plane = ControlPlaneServiceClient::from_mock(mock_control_plane);
        let ingester_pool = IngesterPool::default();
        let replication_factor = 1;
        let router = IngestRouter::new(
            self_node_id,
            control_plane,
            ingester_pool.clone(),
            replication_factor,
            EventBroker::default(),
            Some("test-az".to_string()),
        );
        let ingest_subrequests = vec![IngestSubrequest {
            subrequest_id: 0,
            index_id: "test-index".to_string(),
            source_id: "test-source".to_string(),
            ..Default::default()
        }];
        let mut workbench = IngestWorkbench::new(ingest_subrequests, 2);
        let commit_type = CommitTypeV2::Auto;
        router.batch_persist(&mut workbench, commit_type).await;

        let subworkbench = workbench.subworkbenches.get(&0).unwrap();
        assert!(matches!(
            subworkbench.last_failure_opt,
            Some(SubworkbenchFailure::NoShardsAvailable)
        ));
    }

    #[tokio::test]
    async fn test_router_batch_persist_records_no_shards_available_unavailable_ingester() {
        let self_node_id = "test-router".into();
        let mut mock_control_plane = MockControlPlaneService::new();
        mock_control_plane
            .expect_get_or_create_open_shards()
            .once()
            .returning(move |request| {
                assert_eq!(request.subrequests.len(), 1);

                let subrequest = &request.subrequests[0];
                assert_eq!(subrequest.index_id, "test-index");
                assert_eq!(subrequest.source_id, "test-source");

                let response = GetOrCreateOpenShardsResponse {
                    successes: vec![GetOrCreateOpenShardsSuccess {
                        subrequest_id: 0,
                        index_uid: Some(IndexUid::for_test("test-index", 0)),
                        source_id: "test-source".to_string(),
                        open_shards: vec![Shard {
                            index_uid: Some(IndexUid::for_test("test-index", 0)),
                            source_id: "test-source".to_string(),
                            shard_id: Some(ShardId::from(1)),
                            shard_state: ShardState::Open as i32,
                            leader_id: "test-ingester".into(),
                            ..Default::default()
                        }],
                    }],
                    ..Default::default()
                };
                Ok(response)
            });
        let control_plane = ControlPlaneServiceClient::from_mock(mock_control_plane);
        let ingester_pool = IngesterPool::default();
        let replication_factor = 1;
        let router = IngestRouter::new(
            self_node_id,
            control_plane,
            ingester_pool.clone(),
            replication_factor,
            EventBroker::default(),
            Some("test-az".to_string()),
        );
        let ingest_subrequests = vec![IngestSubrequest {
            subrequest_id: 0,
            index_id: "test-index".to_string(),
            source_id: "test-source".to_string(),
            ..Default::default()
        }];
        let mut workbench = IngestWorkbench::new(ingest_subrequests, 2);
        let commit_type = CommitTypeV2::Auto;
        router.batch_persist(&mut workbench, commit_type).await;

        let subworkbench = workbench.subworkbenches.get(&0).unwrap();
        assert!(matches!(
            subworkbench.last_failure_opt,
            Some(SubworkbenchFailure::NoShardsAvailable)
        ));
    }

    #[tokio::test]
    async fn test_router_process_persist_results_record_persist_successes() {
        let self_node_id = "test-router".into();
        let control_plane = ControlPlaneServiceClient::from_mock(MockControlPlaneService::new());
        let ingester_pool = IngesterPool::default();
        let replication_factor = 1;
        let router = IngestRouter::new(
            self_node_id,
            control_plane,
            ingester_pool.clone(),
            replication_factor,
            EventBroker::default(),
            Some("test-az".to_string()),
        );
        let ingest_subrequests = vec![IngestSubrequest {
            subrequest_id: 0,
            index_id: "test-index-0".to_string(),
            source_id: "test-source".to_string(),
            ..Default::default()
        }];
        let mut workbench = IngestWorkbench::new(ingest_subrequests, 2);
        let persist_futures = FuturesUnordered::new();
        let index_uid: IndexUid = IndexUid::for_test("test-index-0", 0);

        persist_futures.push(async move {
            let persist_summary = PersistRequestSummary {
                leader_id: "test-ingester-0".into(),
                subrequest_ids: vec![0],
            };
            let persist_result = Ok::<_, IngestV2Error>(PersistResponse {
                leader_id: "test-ingester-0".to_string(),
                successes: vec![PersistSuccess {
                    subrequest_id: 0,
                    index_uid: Some(index_uid.clone()),
                    source_id: "test-source".to_string(),
                    shard_id: Some(ShardId::from(1)),
                    ..Default::default()
                }],
                failures: Vec::new(),
                routing_update: Some(RoutingUpdate {
                    capacity_score: 6,
                    source_shard_updates: Vec::new(),
                    ..Default::default()
                }),
            });
            (persist_summary, persist_result)
        });
        router
            .process_persist_results(&mut workbench, persist_futures)
            .await;

        let subworkbench = workbench.subworkbenches.get(&0).unwrap();
        assert!(matches!(
            subworkbench.persist_success_opt,
            Some(PersistSuccess { .. })
        ));
    }

    #[tokio::test]
    async fn test_router_process_persist_results_record_persist_failures() {
        let self_node_id = "test-router".into();
        let control_plane = ControlPlaneServiceClient::from_mock(MockControlPlaneService::new());
        let ingester_pool = IngesterPool::default();
        let replication_factor = 1;
        let router = IngestRouter::new(
            self_node_id,
            control_plane,
            ingester_pool.clone(),
            replication_factor,
            EventBroker::default(),
            Some("test-az".to_string()),
        );
        let ingest_subrequests = vec![IngestSubrequest {
            subrequest_id: 0,
            index_id: "test-index-0".to_string(),
            source_id: "test-source".to_string(),
            ..Default::default()
        }];
        let mut workbench = IngestWorkbench::new(ingest_subrequests, 2);
        let persist_futures = FuturesUnordered::new();
        let index_uid: IndexUid = IndexUid::for_test("test-index-0", 0);

        persist_futures.push(async move {
            let persist_summary = PersistRequestSummary {
                leader_id: "test-ingester-0".into(),
                subrequest_ids: vec![0],
            };
            let persist_result = Ok::<_, IngestV2Error>(PersistResponse {
                leader_id: "test-ingester-0".to_string(),
                successes: Vec::new(),
                failures: vec![PersistFailure {
                    subrequest_id: 0,
                    index_uid: Some(index_uid.clone()),
                    source_id: "test-source".to_string(),
                    reason: PersistFailureReason::NoShardsAvailable as i32,
                }],
                routing_update: Some(RoutingUpdate {
                    capacity_score: 6,
                    source_shard_updates: Vec::new(),
                    ..Default::default()
                }),
            });
            (persist_summary, persist_result)
        });
        router
            .process_persist_results(&mut workbench, persist_futures)
            .await;

        let subworkbench = workbench.subworkbenches.get(&0).unwrap();
        assert!(matches!(
            subworkbench.last_failure_opt,
            Some(SubworkbenchFailure::Persist { .. })
        ));
    }

    #[tokio::test]
    async fn test_router_process_persist_results_does_not_remove_unavailable_leaders() {
        let self_node_id = "test-router".into();
        let control_plane = ControlPlaneServiceClient::from_mock(MockControlPlaneService::new());

        let ingester_pool = IngesterPool::default();
        ingester_pool.insert(
            "test-ingester-0".into(),
            IngesterPoolEntry::mocked_ingester(),
        );
        ingester_pool.insert(
            "test-ingester-1".into(),
            IngesterPoolEntry::mocked_ingester(),
        );

        let replication_factor = 1;
        let router = IngestRouter::new(
            self_node_id,
            control_plane,
            ingester_pool.clone(),
            replication_factor,
            EventBroker::default(),
            Some("test-az".to_string()),
        );
        let ingest_subrequests = vec![
            IngestSubrequest {
                subrequest_id: 0,
                index_id: "test-index-0".to_string(),
                source_id: "test-source".to_string(),
                ..Default::default()
            },
            IngestSubrequest {
                subrequest_id: 1,
                index_id: "test-index-1".to_string(),
                source_id: "test-source".to_string(),
                ..Default::default()
            },
        ];
        let mut workbench = IngestWorkbench::new(ingest_subrequests, 2);
        let persist_futures = FuturesUnordered::new();

        persist_futures.push(async {
            let persist_summary = PersistRequestSummary {
                leader_id: "test-ingester-0".into(),
                subrequest_ids: vec![0],
            };
            let persist_result =
                Err::<_, IngestV2Error>(IngestV2Error::Internal("internal error".to_string()));
            (persist_summary, persist_result)
        });
        router
            .process_persist_results(&mut workbench, persist_futures)
            .await;

        let subworkbench = workbench.subworkbenches.get(&0).unwrap();
        assert!(matches!(
            &subworkbench.last_failure_opt,
            Some(SubworkbenchFailure::Internal)
        ));

        assert!(
            !workbench
                .unavailable_leaders
                .contains(&NodeId::from("test-ingester-1"))
        );
        let persist_futures = FuturesUnordered::new();
        persist_futures.push(async {
            let persist_summary = PersistRequestSummary {
                leader_id: "test-ingester-1".into(),
                subrequest_ids: vec![1],
            };
            let persist_result =
                Err::<_, IngestV2Error>(IngestV2Error::Unavailable("connection error".to_string()));
            (persist_summary, persist_result)
        });
        router
            .process_persist_results(&mut workbench, persist_futures)
            .await;

        // We do not remove the leader from the pool.
        assert!(!ingester_pool.is_empty());
        // ... but we mark it as unavailable.
        assert!(
            workbench
                .unavailable_leaders
                .contains(&NodeId::from("test-ingester-1"))
        );

        let subworkbench = workbench.subworkbenches.get(&1).unwrap();
        assert!(matches!(
            subworkbench.last_failure_opt,
            Some(SubworkbenchFailure::Unavailable)
        ));
    }

    #[tokio::test]
    async fn test_router_ingest() {
        let self_node_id = "test-router".into();
        let control_plane = ControlPlaneServiceClient::from_mock(MockControlPlaneService::new());
        let ingester_pool = IngesterPool::default();
        let router = IngestRouter::new(
            self_node_id,
            control_plane,
            ingester_pool.clone(),
            1,
            EventBroker::default(),
            Some("test-az".to_string()),
        );

        let index_uid_0: IndexUid = IndexUid::for_test("test-index-0", 0);
        let index_uid_1: IndexUid = IndexUid::for_test("test-index-1", 0);
        {
            let mut state_guard = router.state.lock().await;
            state_guard.routing_table.merge_from_shards(
                index_uid_0.clone(),
                "test-source".to_string(),
                vec![Shard {
                    index_uid: Some(index_uid_0.clone()),
                    source_id: "test-source".to_string(),
                    shard_id: Some(ShardId::from(1)),
                    shard_state: ShardState::Open as i32,
                    leader_id: "test-ingester-0".to_string(),
                    ..Default::default()
                }],
            );
            state_guard.routing_table.merge_from_shards(
                index_uid_1.clone(),
                "test-source".to_string(),
                vec![Shard {
                    index_uid: Some(index_uid_1.clone()),
                    source_id: "test-source".to_string(),
                    shard_id: Some(ShardId::from(1)),
                    shard_state: ShardState::Open as i32,
                    leader_id: "test-ingester-1".to_string(),
                    ..Default::default()
                }],
            );
        }

        let index_uid_0_clone = index_uid_0.clone();
        let mut mock_ingester_0 = MockIngesterService::new();
        mock_ingester_0
            .expect_persist()
            .once()
            .returning(move |request| {
                assert_eq!(request.leader_id, "test-ingester-0");
                assert_eq!(request.subrequests.len(), 1);

                Ok(PersistResponse {
                    leader_id: request.leader_id,
                    successes: vec![PersistSuccess {
                        subrequest_id: 0,
                        index_uid: Some(index_uid_0_clone.clone()),
                        source_id: "test-source".to_string(),
                        shard_id: Some(ShardId::from(1)),
                        replication_position_inclusive: Some(Position::offset(1u64)),
                        num_persisted_docs: 2,
                        parse_failures: vec![ParseFailure {
                            doc_uid: Some(DocUid::for_test(0)),
                            reason: ParseFailureReason::InvalidJson as i32,
                            message: "invalid JSON".to_string(),
                        }],
                    }],
                    failures: Vec::new(),
                    routing_update: Some(RoutingUpdate {
                        capacity_score: 6,
                        source_shard_updates: Vec::new(),
                        ..Default::default()
                    }),
                })
            });
        ingester_pool.insert(
            "test-ingester-0".into(),
            IngesterPoolEntry {
                client: IngesterServiceClient::from_mock(mock_ingester_0),
                status: IngesterStatus::Ready,
                availability_zone: None,
            },
        );

        let mut mock_ingester_1 = MockIngesterService::new();
        mock_ingester_1
            .expect_persist()
            .once()
            .returning(move |request| {
                assert_eq!(request.leader_id, "test-ingester-1");
                assert_eq!(request.subrequests.len(), 1);

                Ok(PersistResponse {
                    leader_id: request.leader_id,
                    successes: vec![PersistSuccess {
                        subrequest_id: 1,
                        index_uid: Some(index_uid_1.clone()),
                        source_id: "test-source".to_string(),
                        shard_id: Some(ShardId::from(1)),
                        replication_position_inclusive: Some(Position::offset(0u64)),
                        num_persisted_docs: 1,
                        parse_failures: Vec::new(),
                    }],
                    failures: Vec::new(),
                    routing_update: Some(RoutingUpdate {
                        capacity_score: 6,
                        source_shard_updates: Vec::new(),
                        ..Default::default()
                    }),
                })
            });
        ingester_pool.insert(
            "test-ingester-1".into(),
            IngesterPoolEntry {
                client: IngesterServiceClient::from_mock(mock_ingester_1),
                availability_zone: None,
                status: IngesterStatus::Ready,
            },
        );

        let response = router
            .ingest(IngestRequestV2 {
                subrequests: vec![
                    IngestSubrequest {
                        subrequest_id: 0,
                        index_id: "test-index-0".to_string(),
                        source_id: "test-source".to_string(),
                        doc_batch: Some(DocBatchV2::for_test(["", "test-doc-foo", "test-doc-bar"])),
                    },
                    IngestSubrequest {
                        subrequest_id: 1,
                        index_id: "test-index-1".to_string(),
                        source_id: "test-source".to_string(),
                        doc_batch: Some(DocBatchV2::for_test(["test-doc-qux"])),
                    },
                ],
                commit_type: CommitTypeV2::Auto as i32,
            })
            .await
            .unwrap();

        assert_eq!(response.successes.len(), 2);
        assert_eq!(response.failures.len(), 0);

        let parse_failures = &response.successes[0].parse_failures;
        assert_eq!(parse_failures.len(), 1);
        assert_eq!(parse_failures[0].doc_uid(), DocUid::for_test(0));
        assert_eq!(parse_failures[0].reason(), ParseFailureReason::InvalidJson);
    }

    #[tokio::test]
    async fn test_router_ingest_retry() {
        let self_node_id = "test-router".into();
        let control_plane = ControlPlaneServiceClient::from_mock(MockControlPlaneService::new());
        let ingester_pool = IngesterPool::default();
        let router = IngestRouter::new(
            self_node_id,
            control_plane,
            ingester_pool.clone(),
            1,
            EventBroker::default(),
            Some("test-az".to_string()),
        );
        let index_uid: IndexUid = IndexUid::for_test("test-index-0", 0);
        {
            let mut state_guard = router.state.lock().await;
            state_guard.routing_table.merge_from_shards(
                index_uid.clone(),
                "test-source".to_string(),
                vec![Shard {
                    index_uid: Some(index_uid.clone()),
                    source_id: "test-source".to_string(),
                    shard_id: Some(ShardId::from(1)),
                    shard_state: ShardState::Open as i32,
                    leader_id: "test-ingester-0".to_string(),
                    ..Default::default()
                }],
            );
        }

        let mut mock_ingester_0 = MockIngesterService::new();
        // First attempt: returns NoShardsAvailable (transient, doesn't mark leader unavailable).
        // The response still reports capacity_score=6 and 1 open shard so the node stays routable.
        let index_uid_clone = index_uid.clone();
        mock_ingester_0
            .expect_persist()
            .once()
            .returning(move |request| {
                Ok(PersistResponse {
                    leader_id: request.leader_id,
                    successes: Vec::new(),
                    failures: vec![PersistFailure {
                        subrequest_id: 0,
                        index_uid: Some(index_uid_clone.clone()),
                        source_id: "test-source".to_string(),
                        reason: PersistFailureReason::NoShardsAvailable as i32,
                    }],
                    routing_update: Some(RoutingUpdate {
                        capacity_score: 6,
                        source_shard_updates: vec![SourceShardUpdate {
                            index_uid: Some(index_uid_clone.clone()),
                            source_id: "test-source".to_string(),
                            open_shard_count: 1,
                        }],
                        ..Default::default()
                    }),
                })
            });
        // Second attempt: succeeds.
        mock_ingester_0
            .expect_persist()
            .once()
            .returning(move |request| {
                Ok(PersistResponse {
                    leader_id: request.leader_id,
                    successes: vec![PersistSuccess {
                        subrequest_id: 0,
                        index_uid: Some(index_uid.clone()),
                        source_id: "test-source".to_string(),
                        shard_id: Some(ShardId::from(1)),
                        replication_position_inclusive: Some(Position::offset(0u64)),
                        num_persisted_docs: 1,
                        parse_failures: Vec::new(),
                    }],
                    failures: Vec::new(),
                    routing_update: Some(RoutingUpdate {
                        capacity_score: 6,
                        source_shard_updates: Vec::new(),
                        ..Default::default()
                    }),
                })
            });
        ingester_pool.insert(
            "test-ingester-0".into(),
            IngesterPoolEntry {
                client: IngesterServiceClient::from_mock(mock_ingester_0),
                status: IngesterStatus::Ready,
                availability_zone: None,
            },
        );

        let response = router
            .ingest(IngestRequestV2 {
                subrequests: vec![IngestSubrequest {
                    subrequest_id: 0,
                    index_id: "test-index-0".to_string(),
                    source_id: "test-source".to_string(),
                    doc_batch: Some(DocBatchV2::for_test(["test-doc-foo"])),
                }],
                commit_type: CommitTypeV2::Auto as i32,
            })
            .await
            .unwrap();
        assert_eq!(response.successes.len(), 1);
        assert_eq!(response.failures.len(), 0);
    }

    #[tokio::test]
    async fn test_router_debug_info() {
        let self_node_id = "test-router".into();
        let control_plane = ControlPlaneServiceClient::from_mock(MockControlPlaneService::new());
        let ingester_pool = IngesterPool::default();
        let replication_factor = 1;
        let router = IngestRouter::new(
            self_node_id,
            control_plane,
            ingester_pool.clone(),
            replication_factor,
            EventBroker::default(),
            Some("test-az".to_string()),
        );
        let index_uid_0: IndexUid = IndexUid::for_test("test-index-0", 0);
        let index_uid_1: IndexUid = IndexUid::for_test("test-index-1", 0);

        {
            let mut state_guard = router.state.lock().await;
            state_guard.routing_table.merge_from_shards(
                index_uid_0.clone(),
                "test-source".to_string(),
                vec![Shard {
                    index_uid: Some(index_uid_0.clone()),
                    shard_id: Some(ShardId::from(1)),
                    shard_state: ShardState::Open as i32,
                    leader_id: "test-ingester-0".to_string(),
                    ..Default::default()
                }],
            );
            state_guard.routing_table.merge_from_shards(
                index_uid_1.clone(),
                "test-source".to_string(),
                vec![Shard {
                    index_uid: Some(index_uid_1.clone()),
                    shard_id: Some(ShardId::from(2)),
                    shard_state: ShardState::Open as i32,
                    leader_id: "test-ingester-1".to_string(),
                    ..Default::default()
                }],
            );
        }

        let debug_info = router.debug_info().await;
        let routing_table = &debug_info["routing_table"];
        assert_eq!(routing_table.as_object().unwrap().len(), 2);

        let index_0_entries = routing_table["test-index-0"].as_array().unwrap();
        assert_eq!(index_0_entries.len(), 1);
        assert_eq!(index_0_entries[0]["node_id"], "test-ingester-0");
        assert_eq!(index_0_entries[0]["capacity_score"], 5);

        let index_1_entries = routing_table["test-index-1"].as_array().unwrap();
        assert_eq!(index_1_entries.len(), 1);
        assert_eq!(index_1_entries[0]["node_id"], "test-ingester-1");
    }

    #[tokio::test]
    async fn test_router_returns_rate_limited_failure() {
        let self_node_id = "test-router".into();
        let control_plane = ControlPlaneServiceClient::from_mock(MockControlPlaneService::new());
        let ingester_pool = IngesterPool::default();
        let replication_factor = 1;
        let router = IngestRouter::new(
            self_node_id,
            control_plane,
            ingester_pool.clone(),
            replication_factor,
            EventBroker::default(),
            Some("test-az".to_string()),
        );
        let index_uid: IndexUid = IndexUid::for_test("test-index-0", 0);
        {
            let mut state_guard = router.state.lock().await;
            state_guard.routing_table.merge_from_shards(
                index_uid.clone(),
                "test-source".to_string(),
                vec![Shard {
                    index_uid: Some(index_uid.clone()),
                    source_id: "test-source".to_string(),
                    shard_id: Some(ShardId::from(1)),
                    shard_state: ShardState::Open as i32,
                    leader_id: "test-ingester-0".to_string(),
                    ..Default::default()
                }],
            );
        }

        let mut mock_ingester_0 = MockIngesterService::new();
        mock_ingester_0.expect_persist().returning(move |request| {
            assert_eq!(request.leader_id, "test-ingester-0");
            assert_eq!(request.commit_type(), CommitTypeV2::Auto);
            assert_eq!(request.subrequests.len(), 1);
            let subrequest = &request.subrequests[0];
            assert_eq!(subrequest.subrequest_id, 0);
            let index_uid = subrequest.index_uid().clone();
            assert_eq!(subrequest.source_id, "test-source");
            assert_eq!(
                subrequest.doc_batch,
                Some(DocBatchV2::for_test(["test-doc-foo"]))
            );

            let response = PersistResponse {
                leader_id: request.leader_id,
                successes: Vec::new(),
                failures: vec![PersistFailure {
                    subrequest_id: 0,
                    index_uid: Some(index_uid.clone()),
                    source_id: "test-source".to_string(),
                    reason: PersistFailureReason::NoShardsAvailable as i32,
                }],
                routing_update: Some(RoutingUpdate {
                    capacity_score: 6,
                    source_shard_updates: vec![SourceShardUpdate {
                        index_uid: Some(index_uid),
                        source_id: "test-source".to_string(),
                        open_shard_count: 1,
                    }],
                    ..Default::default()
                }),
            };
            Ok(response)
        });
        let ingester_0 = IngesterServiceClient::from_mock(mock_ingester_0);
        ingester_pool.insert(
            "test-ingester-0".into(),
            IngesterPoolEntry {
                client: ingester_0.clone(),
                availability_zone: None,
                status: IngesterStatus::Ready,
            },
        );

        let ingest_request = IngestRequestV2 {
            subrequests: vec![IngestSubrequest {
                subrequest_id: 0,
                index_id: "test-index-0".to_string(),
                source_id: "test-source".to_string(),
                doc_batch: Some(DocBatchV2::for_test(["test-doc-foo"])),
            }],
            commit_type: CommitTypeV2::Auto as i32,
        };
        let ingest_response = router.ingest(ingest_request).await.unwrap();
        assert_eq!(ingest_response.successes.len(), 0);
        assert_eq!(ingest_response.failures.len(), 1);
        assert_eq!(
            ingest_response.failures[0].reason(),
            IngestFailureReason::NoShardsAvailable
        );
    }

    #[tokio::test]
    async fn test_router_updates_node_routing_table_on_capacity_update() {
        let event_broker = EventBroker::default();
        let ingester_pool = IngesterPool::default();
        let router = IngestRouter::new(
            "test-router".into(),
            ControlPlaneServiceClient::from_mock(MockControlPlaneService::new()),
            ingester_pool.clone(),
            1,
            event_broker.clone(),
            Some("test-az".to_string()),
        );
        router.subscribe();

        event_broker.publish(IngesterCapacityScoreUpdate {
            node_id: "test-ingester-0".into(),
            source_uid: SourceUid {
                index_uid: IndexUid::for_test("test-index", 0),
                source_id: "test-source".to_string(),
            },
            capacity_score: 7,
            open_shard_count: 3,
        });
        // Give the async subscriber a moment to process.
        tokio::time::sleep(Duration::from_millis(10)).await;

        ingester_pool.insert(
            "test-ingester-0".into(),
            IngesterPoolEntry::mocked_ingester(),
        );
        let state_guard = router.state.lock().await;
        let node = state_guard
            .routing_table
            .pick_node("test-index", "test-source", &ingester_pool, &HashSet::new())
            .unwrap();
        assert_eq!(node.node_id, NodeId::from("test-ingester-0"));
    }

    #[tokio::test]
    async fn test_router_process_persist_results_marks_unavailable_on_persist_failure() {
        let router = IngestRouter::new(
            "test-router".into(),
            ControlPlaneServiceClient::from_mock(MockControlPlaneService::new()),
            IngesterPool::default(),
            1,
            EventBroker::default(),
            Some("test-az".to_string()),
        );
        let ingest_subrequests = vec![
            IngestSubrequest {
                subrequest_id: 0,
                index_id: "test-index-0".to_string(),
                source_id: "test-source".to_string(),
                ..Default::default()
            },
            IngestSubrequest {
                subrequest_id: 1,
                index_id: "test-index-1".to_string(),
                source_id: "test-source".to_string(),
                ..Default::default()
            },
        ];
        let mut workbench = IngestWorkbench::new(ingest_subrequests, 2);

        // NoShardsAvailable does NOT mark the leader as unavailable.
        let persist_futures = FuturesUnordered::new();
        persist_futures.push(async {
            let summary = PersistRequestSummary {
                leader_id: "test-ingester-0".into(),
                subrequest_ids: vec![0],
            };
            let result = Ok::<_, IngestV2Error>(PersistResponse {
                leader_id: "test-ingester-0".to_string(),
                successes: Vec::new(),
                failures: vec![PersistFailure {
                    subrequest_id: 0,
                    index_uid: Some(IndexUid::for_test("test-index-0", 0)),
                    source_id: "test-source".to_string(),
                    reason: PersistFailureReason::NoShardsAvailable as i32,
                }],
                routing_update: Some(RoutingUpdate {
                    capacity_score: 6,
                    source_shard_updates: Vec::new(),
                    ..Default::default()
                }),
            });
            (summary, result)
        });
        router
            .process_persist_results(&mut workbench, persist_futures)
            .await;
        assert!(
            !workbench
                .unavailable_leaders
                .contains(&NodeId::from("test-ingester-0"))
        );

        // NodeUnavailable DOES mark the leader as unavailable.
        let persist_futures = FuturesUnordered::new();
        persist_futures.push(async {
            let summary = PersistRequestSummary {
                leader_id: "test-ingester-1".into(),
                subrequest_ids: vec![1],
            };
            let result = Ok::<_, IngestV2Error>(PersistResponse {
                leader_id: "test-ingester-1".to_string(),
                successes: Vec::new(),
                failures: vec![PersistFailure {
                    subrequest_id: 1,
                    index_uid: Some(IndexUid::for_test("test-index-1", 0)),
                    source_id: "test-source".to_string(),
                    reason: PersistFailureReason::NodeUnavailable as i32,
                }],
                routing_update: Some(RoutingUpdate {
                    capacity_score: 6,
                    source_shard_updates: Vec::new(),
                    ..Default::default()
                }),
            });
            (summary, result)
        });
        router
            .process_persist_results(&mut workbench, persist_futures)
            .await;
        assert!(
            workbench
                .unavailable_leaders
                .contains(&NodeId::from("test-ingester-1"))
        );
    }

    #[tokio::test]
    async fn test_router_process_persist_results_applies_piggybacked_routing_updates() {
        let ingester_pool = IngesterPool::default();
        let router = IngestRouter::new(
            "test-router".into(),
            ControlPlaneServiceClient::from_mock(MockControlPlaneService::new()),
            ingester_pool.clone(),
            1,
            EventBroker::default(),
            Some("test-az".to_string()),
        );
        let ingest_subrequests = vec![IngestSubrequest {
            subrequest_id: 0,
            index_id: "test-index".to_string(),
            source_id: "test-source".to_string(),
            ..Default::default()
        }];
        let mut workbench = IngestWorkbench::new(ingest_subrequests, 2);

        let persist_futures = FuturesUnordered::new();
        persist_futures.push(async {
            let summary = PersistRequestSummary {
                leader_id: "test-ingester-0".into(),
                subrequest_ids: vec![0],
            };
            let result = Ok::<_, IngestV2Error>(PersistResponse {
                leader_id: "test-ingester-0".to_string(),
                successes: Vec::new(),
                failures: Vec::new(),
                routing_update: Some(RoutingUpdate {
                    capacity_score: 3,
                    source_shard_updates: vec![SourceShardUpdate {
                        index_uid: Some(IndexUid::for_test("test-index", 0)),
                        source_id: "test-source".to_string(),
                        open_shard_count: 2,
                    }],
                    ..Default::default()
                }),
            });
            (summary, result)
        });
        router
            .process_persist_results(&mut workbench, persist_futures)
            .await;

        ingester_pool.insert(
            "test-ingester-0".into(),
            IngesterPoolEntry::mocked_ingester(),
        );
        let state_guard = router.state.lock().await;
        let node = state_guard
            .routing_table
            .pick_node("test-index", "test-source", &ingester_pool, &HashSet::new())
            .unwrap();
        assert_eq!(node.node_id, NodeId::from("test-ingester-0"));
    }
}


================================================
FILE: quickwit/quickwit-ingest/src/ingest_v2/routing_table.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::{HashMap, HashSet};

use itertools::Itertools;
use quickwit_proto::ingest::Shard;
use quickwit_proto::types::{IndexId, IndexUid, NodeId, SourceId};
use rand::rng;
use rand::seq::IndexedRandom;

use crate::IngesterPool;

/// A single ingester node's routing-relevant data for a specific (index, source) pair.
/// Each entry is self-describing: it carries its own node_id, index_uid, and source_id
/// so it can always be attributed back to a specific source on a specific node.
#[derive(Debug, Clone)]
pub(super) struct IngesterNode {
    pub node_id: NodeId,
    pub index_uid: IndexUid,
    #[allow(unused)]
    pub source_id: SourceId,
    /// Score from 0-10. Higher means more available capacity.
    pub capacity_score: usize,
    /// Number of open shards on this node for this (index, source) pair. Tiebreaker for power of
    /// two choices comparison - we favor a node with more open shards.
    pub open_shard_count: usize,
}

#[derive(Debug, Default)]
pub(super) struct RoutingEntry {
    pub nodes: HashMap<NodeId, IngesterNode>,
}

/// Given a slice of candidates, picks the better of two random choices.
/// Higher capacity_score wins; tiebreak on more open_shard_count (more landing spots).
fn power_of_two_choices<'a>(candidates: &[&'a IngesterNode]) -> &'a IngesterNode {
    debug_assert!(candidates.len() >= 2);
    let mut iter = candidates.choose_multiple(&mut rng(), 2);
    let (&a, &b) = (iter.next().unwrap(), iter.next().unwrap());

    if (a.capacity_score, a.open_shard_count) >= (b.capacity_score, b.open_shard_count) {
        a
    } else {
        b
    }
}

fn pick_from(candidates: Vec<&IngesterNode>) -> Option<&IngesterNode> {
    match candidates.len() {
        0 => None,
        1 => Some(candidates[0]),
        _ => Some(power_of_two_choices(&candidates)),
    }
}

impl RoutingEntry {
    /// Pick an ingester node to persist the request to. Uses power of two choices based on reported
    /// ingester capacity, if more than one eligible node exists. Prefers nodes in the same
    /// availability zone, falling back to remote nodes.
    fn pick_node(
        &self,
        ingester_pool: &IngesterPool,
        unavailable_leaders: &HashSet<NodeId>,
        self_availability_zone: &Option<String>,
    ) -> Option<&IngesterNode> {
        let (local_ingesters, remote_ingesters): (Vec<&IngesterNode>, Vec<&IngesterNode>) = self
            .nodes
            .values()
            .filter(|node| {
                node.capacity_score > 0
                    && node.open_shard_count > 0
                    && ingester_pool
                        .get(&node.node_id)
                        .map(|entry| entry.status.is_ready())
                        .unwrap_or(false)
                    && !unavailable_leaders.contains(&node.node_id)
            })
            .partition(|node| {
                let node_az = ingester_pool
                    .get(&node.node_id)
                    .and_then(|h| h.availability_zone);
                node_az == *self_availability_zone
            });

        pick_from(local_ingesters).or_else(|| pick_from(remote_ingesters))
    }
}

#[derive(Debug, Default)]
pub(super) struct RoutingTable {
    table: HashMap<(IndexId, SourceId), RoutingEntry>,
    self_availability_zone: Option<String>,
}

impl RoutingTable {
    pub fn new(self_availability_zone: Option<String>) -> Self {
        Self {
            self_availability_zone,
            ..Default::default()
        }
    }

    pub fn pick_node(
        &self,
        index_id: &str,
        source_id: &str,
        ingester_pool: &IngesterPool,
        unavailable_leaders: &HashSet<NodeId>,
    ) -> Option<&IngesterNode> {
        let key = (index_id.to_string(), source_id.to_string());
        let entry = self.table.get(&key)?;
        entry.pick_node(
            ingester_pool,
            unavailable_leaders,
            &self.self_availability_zone,
        )
    }

    pub fn classify_az_locality(
        &self,
        target_node_id: &NodeId,
        ingester_pool: &IngesterPool,
    ) -> &'static str {
        let Some(self_az) = &self.self_availability_zone else {
            return "az_unaware";
        };
        let target_az = ingester_pool
            .get(target_node_id)
            .and_then(|entry| entry.availability_zone);
        match target_az {
            Some(ref az) if az == self_az => "same_az",
            Some(_) => "cross_az",
            None => "az_unaware",
        }
    }

    pub fn debug_info(
        &self,
        ingester_pool: &IngesterPool,
    ) -> HashMap<IndexId, Vec<serde_json::Value>> {
        let mut per_index: HashMap<IndexId, Vec<serde_json::Value>> = HashMap::new();
        for ((index_id, source_id), entry) in &self.table {
            for (node_id, node) in &entry.nodes {
                let az = ingester_pool.get(node_id).and_then(|h| h.availability_zone);
                per_index
                    .entry(index_id.clone())
                    .or_default()
                    .push(serde_json::json!({
                        "source_id": source_id,
                        "node_id": node_id,
                        "capacity_score": node.capacity_score,
                        "open_shard_count": node.open_shard_count,
                        "availability_zone": az,
                    }));
            }
        }
        per_index
    }

    pub fn has_open_nodes(
        &self,
        index_id: &str,
        source_id: &str,
        ingester_pool: &IngesterPool,
        unavailable_leaders: &HashSet<NodeId>,
    ) -> bool {
        let key = (index_id.to_string(), source_id.to_string());
        let Some(entry) = self.table.get(&key) else {
            return false;
        };
        entry.nodes.values().any(|node| {
            node.capacity_score > 0
                && node.open_shard_count > 0
                && ingester_pool
                    .get(&node.node_id)
                    .map(|entry| entry.status.is_ready())
                    .unwrap_or(false)
                && !unavailable_leaders.contains(&node.node_id)
        })
    }

    /// Applies a capacity update from the IngesterCapacityScoreUpdate broadcast. This is the
    /// primary way the table learns about node availability and capacity.
    pub fn apply_capacity_update(
        &mut self,
        node_id: NodeId,
        index_uid: IndexUid,
        source_id: SourceId,
        capacity_score: usize,
        open_shard_count: usize,
    ) {
        let key = (index_uid.index_id.to_string(), source_id.clone());

        let entry = self.table.entry(key).or_default();
        let ingester_node = IngesterNode {
            node_id: node_id.clone(),
            index_uid,
            source_id,
            capacity_score,
            open_shard_count,
        };
        entry.nodes.insert(node_id, ingester_node);
    }

    /// Merges routing updates from a GetOrCreateOpenShards control plane response into the
    /// table. For existing nodes, updates their open shard count, including if the count is 0, from
    /// the CP response while preserving capacity scores if they already exist.
    /// New nodes get a default capacity_score of 5.
    pub fn merge_from_shards(
        &mut self,
        index_uid: IndexUid,
        source_id: SourceId,
        shards: Vec<Shard>,
    ) {
        let per_leader_count: HashMap<NodeId, usize> = shards
            .iter()
            .map(|shard| {
                let num_open_shards = shard.is_open() as usize;
                let leader_id = NodeId::from(shard.leader_id.clone());
                (leader_id, num_open_shards)
            })
            .into_grouping_map()
            .sum();

        let key = (index_uid.index_id.to_string(), source_id.clone());
        let entry = self.table.entry(key).or_default();

        for (node_id, open_shard_count) in per_leader_count {
            entry
                .nodes
                .entry(node_id.clone())
                .and_modify(|node| node.open_shard_count = open_shard_count)
                .or_insert_with(|| IngesterNode {
                    node_id,
                    index_uid: index_uid.clone(),
                    source_id: source_id.clone(),
                    capacity_score: 5,
                    open_shard_count,
                });
        }
    }
}

#[cfg(test)]
mod tests {
    use quickwit_proto::ingest::ShardState;
    use quickwit_proto::ingest::ingester::{IngesterServiceClient, IngesterStatus};
    use quickwit_proto::types::ShardId;

    use super::*;
    use crate::IngesterPoolEntry;

    fn mocked_ingester(availability_zone: Option<&str>) -> IngesterPoolEntry {
        IngesterPoolEntry {
            client: IngesterServiceClient::mocked(),
            status: IngesterStatus::Ready,
            availability_zone: availability_zone.map(|s| s.to_string()),
        }
    }

    #[test]
    fn test_apply_capacity_update() {
        let mut table = RoutingTable::default();
        let key = ("test-index".to_string(), "test-source".into());

        // Insert first node.
        table.apply_capacity_update(
            "node-1".into(),
            IndexUid::for_test("test-index", 0),
            "test-source".into(),
            8,
            3,
        );
        let entry = table.table.get(&key).unwrap();
        assert_eq!(entry.nodes.len(), 1);
        assert_eq!(entry.nodes.get("node-1").unwrap().capacity_score, 8);

        // Update existing node.
        table.apply_capacity_update(
            "node-1".into(),
            IndexUid::for_test("test-index", 0),
            "test-source".into(),
            4,
            5,
        );
        let node = table.table.get(&key).unwrap().nodes.get("node-1").unwrap();
        assert_eq!(node.capacity_score, 4);
        assert_eq!(node.open_shard_count, 5);

        // Add second node.
        table.apply_capacity_update(
            "node-2".into(),
            IndexUid::for_test("test-index", 0),
            "test-source".into(),
            6,
            2,
        );
        assert_eq!(table.table.get(&key).unwrap().nodes.len(), 2);

        // Zero shards: node stays in table but becomes ineligible for routing.
        table.apply_capacity_update(
            "node-1".into(),
            IndexUid::for_test("test-index", 0),
            "test-source".into(),
            0,
            0,
        );
        let entry = table.table.get(&key).unwrap();
        assert_eq!(entry.nodes.len(), 2);
        assert_eq!(entry.nodes.get("node-1").unwrap().open_shard_count, 0);
        assert_eq!(entry.nodes.get("node-1").unwrap().capacity_score, 0);
    }

    #[test]
    fn test_has_open_nodes() {
        let mut table = RoutingTable::default();
        let pool = IngesterPool::default();

        // Empty table.
        assert!(!table.has_open_nodes("test-index", "test-source", &pool, &HashSet::new()));

        // Node exists but is not in pool.
        table.apply_capacity_update(
            "node-1".into(),
            IndexUid::for_test("test-index", 0),
            "test-source".into(),
            8,
            3,
        );
        assert!(!table.has_open_nodes("test-index", "test-source", &pool, &HashSet::new()));

        // Node is in pool → true.
        pool.insert("node-1".into(), mocked_ingester(None));
        assert!(table.has_open_nodes("test-index", "test-source", &pool, &HashSet::new()));

        // Node is unavailable → false.
        let unavailable: HashSet<NodeId> = HashSet::from(["node-1".into()]);
        assert!(!table.has_open_nodes("test-index", "test-source", &pool, &unavailable));

        // Second node available → true despite first being unavailable.
        table.apply_capacity_update(
            "node-2".into(),
            IndexUid::for_test("test-index", 0),
            "test-source".into(),
            6,
            2,
        );
        pool.insert("node-2".into(), mocked_ingester(None));
        assert!(table.has_open_nodes("test-index", "test-source", &pool, &unavailable));

        // Node with capacity_score=0 is not eligible.
        table.apply_capacity_update(
            "node-2".into(),
            IndexUid::for_test("test-index", 0),
            "test-source".into(),
            0,
            2,
        );
        assert!(!table.has_open_nodes("test-index", "test-source", &pool, &unavailable));
    }

    #[test]
    fn test_pick_node_prefers_same_az() {
        let mut table = RoutingTable::new(Some("az-1".to_string()));
        let pool = IngesterPool::default();

        table.apply_capacity_update(
            "node-1".into(),
            IndexUid::for_test("test-index", 0),
            "test-source".into(),
            5,
            1,
        );
        table.apply_capacity_update(
            "node-2".into(),
            IndexUid::for_test("test-index", 0),
            "test-source".into(),
            5,
            1,
        );
        pool.insert("node-1".into(), mocked_ingester(Some("az-1")));
        pool.insert("node-2".into(), mocked_ingester(Some("az-2")));

        let picked = table
            .pick_node("test-index", "test-source", &pool, &HashSet::new())
            .unwrap();
        assert_eq!(picked.node_id, NodeId::from("node-1"));
    }

    #[test]
    fn test_pick_node_falls_back_to_cross_az() {
        let mut table = RoutingTable::new(Some("az-1".to_string()));
        let pool = IngesterPool::default();

        table.apply_capacity_update(
            "node-2".into(),
            IndexUid::for_test("test-index", 0),
            "test-source".into(),
            5,
            1,
        );
        pool.insert("node-2".into(), mocked_ingester(Some("az-2")));

        let picked = table
            .pick_node("test-index", "test-source", &pool, &HashSet::new())
            .unwrap();
        assert_eq!(picked.node_id, NodeId::from("node-2"));
    }

    #[test]
    fn test_pick_node_no_az_awareness() {
        let mut table = RoutingTable::default();
        let pool = IngesterPool::default();

        table.apply_capacity_update(
            "node-1".into(),
            IndexUid::for_test("test-index", 0),
            "test-source".into(),
            5,
            1,
        );
        pool.insert("node-1".into(), mocked_ingester(Some("az-1")));

        let picked = table
            .pick_node("test-index", "test-source", &pool, &HashSet::new())
            .unwrap();
        assert_eq!(picked.node_id, NodeId::from("node-1"));
    }

    #[test]
    fn test_pick_node_missing_entry() {
        let table = RoutingTable::new(Some("az-1".to_string()));
        let pool = IngesterPool::default();

        assert!(
            table
                .pick_node("nonexistent", "source", &pool, &HashSet::new())
                .is_none()
        );
    }

    #[test]
    fn test_power_of_two_choices() {
        // 3 candidates: best appears in the random pair 2/3 of the time and always
        // wins when it does, so it should win ~67% of 1000 runs. Asserting > 550
        // is ~7.5 standard deviations from the mean — effectively impossible to flake.
        let high = IngesterNode {
            node_id: "high".into(),
            index_uid: IndexUid::for_test("idx", 0),
            source_id: "src".into(),
            capacity_score: 9,
            open_shard_count: 2,
        };
        let mid = IngesterNode {
            node_id: "mid".into(),
            index_uid: IndexUid::for_test("idx", 0),
            source_id: "src".into(),
            capacity_score: 5,
            open_shard_count: 2,
        };
        let low = IngesterNode {
            node_id: "low".into(),
            index_uid: IndexUid::for_test("idx", 0),
            source_id: "src".into(),
            capacity_score: 1,
            open_shard_count: 2,
        };
        let candidates: Vec<&IngesterNode> = vec![&high, &mid, &low];

        let mut high_wins = 0;
        for _ in 0..1000 {
            if power_of_two_choices(&candidates).node_id == "high" {
                high_wins += 1;
            }
        }
        assert!(high_wins > 550, "high won only {high_wins}/1000 times");
    }

    #[test]
    fn test_merge_from_shards() {
        let mut table = RoutingTable::default();
        let index_uid = IndexUid::for_test("test-index", 0);
        let key = ("test-index".to_string(), "test-source".to_string());

        let make_shard = |id: u64, leader: &str, open: bool| Shard {
            index_uid: Some(index_uid.clone()),
            source_id: "test-source".to_string(),
            shard_id: Some(ShardId::from(id)),
            shard_state: if open {
                ShardState::Open as i32
            } else {
                ShardState::Closed as i32
            },
            leader_id: leader.to_string(),
            ..Default::default()
        };

        // Two open shards on node-1, one open + one closed on node-2, only closed on node-3.
        let shards = vec![
            make_shard(1, "node-1", true),
            make_shard(2, "node-1", true),
            make_shard(3, "node-2", true),
            make_shard(4, "node-2", false),
            make_shard(5, "node-3", false),
        ];
        table.merge_from_shards(index_uid.clone(), "test-source".into(), shards);

        let entry = table.table.get(&key).unwrap();
        assert_eq!(entry.nodes.len(), 3);

        let n1 = entry.nodes.get("node-1").unwrap();
        assert_eq!(n1.open_shard_count, 2);
        assert_eq!(n1.capacity_score, 5);

        let n2 = entry.nodes.get("node-2").unwrap();
        assert_eq!(n2.open_shard_count, 1);

        let n3 = entry.nodes.get("node-3").unwrap();
        assert_eq!(n3.open_shard_count, 0);

        // Merging again adds new nodes but preserves existing ones.
        let shards = vec![make_shard(10, "node-4", true)];
        table.merge_from_shards(index_uid, "test-source".into(), shards);

        let entry = table.table.get(&key).unwrap();
        assert_eq!(entry.nodes.len(), 4);
        assert!(entry.nodes.contains_key("node-1"));
        assert!(entry.nodes.contains_key("node-2"));
        assert!(entry.nodes.contains_key("node-3"));
        assert!(entry.nodes.contains_key("node-4"));
    }

    #[test]
    fn test_classify_az_locality() {
        let table = RoutingTable::new(Some("az-1".to_string()));
        let pool = IngesterPool::default();
        pool.insert("node-local".into(), mocked_ingester(Some("az-1")));
        pool.insert("node-remote".into(), mocked_ingester(Some("az-2")));
        pool.insert("node-no-az".into(), mocked_ingester(None));

        assert_eq!(
            table.classify_az_locality(&"node-local".into(), &pool),
            "same_az"
        );
        assert_eq!(
            table.classify_az_locality(&"node-remote".into(), &pool),
            "cross_az"
        );
        assert_eq!(
            table.classify_az_locality(&"node-no-az".into(), &pool),
            "az_unaware"
        );

        let table_no_az = RoutingTable::default();
        assert_eq!(
            table_no_az.classify_az_locality(&"node-local".into(), &pool),
            "az_unaware"
        );
    }
}


================================================
FILE: quickwit/quickwit-ingest/src/ingest_v2/state.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::HashMap;
use std::fmt;
use std::ops::{Deref, DerefMut};
use std::path::Path;
use std::sync::{Arc, Weak};
use std::time::{Duration, Instant};

use bytesize::ByteSize;
use itertools::Itertools;
use mrecordlog::error::{DeleteQueueError, TruncateError};
use quickwit_cluster::Cluster;
use quickwit_common::pretty::PrettyDisplay;
use quickwit_common::rate_limiter::{RateLimiter, RateLimiterSettings};
use quickwit_common::shared_consts::INGESTER_STATUS_KEY;
use quickwit_doc_mapper::DocMapper;
use quickwit_proto::control_plane::AdviseResetShardsResponse;
use quickwit_proto::ingest::ingester::IngesterStatus;
use quickwit_proto::ingest::{IngestV2Error, IngestV2Result, ShardIds, ShardState};
use quickwit_proto::types::{DocMappingUid, IndexUid, Position, QueueId, SourceId, split_queue_id};
use tokio::sync::{Mutex, MutexGuard, RwLock, RwLockMappedWriteGuard, RwLockWriteGuard, watch};
use tracing::{error, info};

use super::models::IngesterShard;
use super::rate_meter::RateMeter;
use super::replication::{ReplicationStreamTaskHandle, ReplicationTaskHandle};
use super::wal_capacity_tracker::WalCapacityTracker;
use crate::ingest_v2::mrecordlog_utils::{force_delete_queue, queue_position_range};
use crate::mrecordlog_async::MultiRecordLogAsync;
use crate::{FollowerId, LeaderId, OpenShardCounts};

/// Stores the state of the ingester and attempts to prevent deadlocks by exposing an API that
/// guarantees that the internal data structures are always locked in the same order.
///
/// `lock_partially` locks `inner` only, while `lock_fully` locks both `inner` and `mrecordlog`. Use
/// the former when you only need to access the in-memory state of the ingester and the latter when
/// you need to access both the in-memory state AND the WAL.
#[derive(Clone)]
pub(super) struct IngesterState {
    // `inner` is a mutex because it's almost always accessed mutably.
    inner: Arc<Mutex<InnerIngesterState>>,
    mrecordlog: Arc<RwLock<Option<MultiRecordLogAsync>>>,
    pub status_rx: watch::Receiver<IngesterStatus>,
}

pub(super) struct InnerIngesterState {
    pub shards: HashMap<QueueId, IngesterShard>,
    pub doc_mappers: HashMap<DocMappingUid, Weak<DocMapper>>,
    // Replication stream opened with followers.
    pub replication_streams: HashMap<FollowerId, ReplicationStreamTaskHandle>,
    // Replication tasks running for each replication stream opened with leaders.
    pub replication_tasks: HashMap<LeaderId, ReplicationTaskHandle>,
    cluster: Cluster,
    pub wal_capacity_tracker: WalCapacityTracker,
    status: IngesterStatus,
    status_tx: watch::Sender<IngesterStatus>,
}

impl InnerIngesterState {
    pub fn status(&self) -> IngesterStatus {
        self.status
    }

    pub async fn set_status(&mut self, status: IngesterStatus) {
        self.status = status;
        self.status_tx.send(status).expect("channel should be open");
        self.cluster
            .set_self_key_value(INGESTER_STATUS_KEY, status.as_json_str_name())
            .await;
    }

    /// Returns the shard with the most available permits for this index and source.
    pub fn find_most_capacity_shard_mut(
        &mut self,
        index_uid: &IndexUid,
        source_id: &SourceId,
    ) -> Option<&mut IngesterShard> {
        self.shards
            .values_mut()
            .filter(|shard| {
                shard.is_open() && shard.index_uid == *index_uid && shard.source_id == *source_id
            })
            .map(|shard| (shard.rate_limiter.available_permits(), shard))
            .max_by_key(|(available_permits, _)| *available_permits)
            .map(|(_, shard)| shard)
    }

    /// Returns per-source open shard counts and closed shard IDs for all advertisable,
    /// non-replica shards.
    pub fn get_shard_snapshot(&self) -> (OpenShardCounts, Vec<ShardIds>) {
        let grouped = self
            .shards
            .values()
            .filter(|shard| shard.is_advertisable && !shard.is_replica())
            .map(|shard| ((shard.index_uid.clone(), shard.source_id.clone()), shard))
            .into_group_map();

        let mut open_counts = Vec::new();
        let mut closed_shards = Vec::new();

        for ((index_uid, source_id), shards) in grouped {
            let mut open_count = 0;
            let mut closed_ids = Vec::new();

            for shard in shards {
                if shard.is_open() {
                    open_count += 1;
                } else if shard.is_closed() {
                    closed_ids.push(shard.shard_id.clone());
                }
            }
            open_counts.push((index_uid.clone(), source_id.clone(), open_count));
            if !closed_ids.is_empty() {
                closed_shards.push(ShardIds {
                    index_uid: Some(index_uid),
                    source_id,
                    shard_ids: closed_ids,
                });
            }
        }
        (open_counts, closed_shards)
    }
}

impl IngesterState {
    async fn create(cluster: Cluster, disk_capacity: ByteSize, memory_capacity: ByteSize) -> Self {
        let status = IngesterStatus::Initializing;
        let (status_tx, status_rx) = watch::channel(status);
        let mut inner = InnerIngesterState {
            shards: Default::default(),
            doc_mappers: Default::default(),
            replication_streams: Default::default(),
            replication_tasks: Default::default(),
            cluster,
            wal_capacity_tracker: WalCapacityTracker::new(disk_capacity, memory_capacity),
            status,
            status_tx,
        };
        // We call `set_status` here instead of setting it directly because it also updates the
        // ingester status in chitchat.
        inner.set_status(IngesterStatus::Initializing).await;

        let inner = Arc::new(Mutex::new(inner));
        let mrecordlog = Arc::new(RwLock::new(None));

        Self {
            inner,
            mrecordlog,
            status_rx,
        }
    }

    pub async fn load(
        cluster: Cluster,
        wal_dir_path: &Path,
        disk_capacity: ByteSize,
        memory_capacity: ByteSize,
        rate_limiter_settings: RateLimiterSettings,
    ) -> Self {
        let state = Self::create(cluster, disk_capacity, memory_capacity).await;
        let state_clone = state.clone();
        let wal_dir_path = wal_dir_path.to_path_buf();

        let init_future = async move {
            state_clone.init(&wal_dir_path, rate_limiter_settings).await;
        };
        tokio::spawn(init_future);

        state
    }

    #[cfg(test)]
    pub async fn for_test(cluster: Cluster) -> (tempfile::TempDir, Self) {
        Self::for_test_with_disk_capacity(cluster, ByteSize::mb(256)).await
    }

    #[cfg(test)]
    pub async fn for_test_with_disk_capacity(
        cluster: Cluster,
        disk_capacity: ByteSize,
    ) -> (tempfile::TempDir, Self) {
        let temp_dir = tempfile::tempdir().unwrap();
        let mut state = IngesterState::load(
            cluster,
            temp_dir.path(),
            disk_capacity,
            ByteSize::mb(256),
            RateLimiterSettings::default(),
        )
        .await;

        state.wait_for_ready().await;

        (temp_dir, state)
    }

    /// Initializes the internal state of the ingester. It loads the local WAL, then lists all its
    /// queues. Empty queues are deleted, while non-empty queues are recovered. However, the
    /// corresponding shards are closed and become read-only.
    pub async fn init(&self, wal_dir_path: &Path, rate_limiter_settings: RateLimiterSettings) {
        // Acquire locks in the same order as `lock_fully` (mrecordlog first, then inner) to
        // prevent ABBA deadlocks with the broadcast capacity task.
        let mut mrecordlog_guard = self.mrecordlog.write().await;
        let mut inner_guard = self.inner.lock().await;

        let now = Instant::now();

        info!("opening WAL located at `{}`", wal_dir_path.display());
        let open_result = MultiRecordLogAsync::open_with_prefs(
            wal_dir_path,
            mrecordlog::PersistPolicy::OnDelay {
                interval: Duration::from_secs(5),
                // TODO maybe we want to fsync too?
                action: mrecordlog::PersistAction::Flush,
            },
        )
        .await;

        let mut mrecordlog = match open_result {
            Ok(mrecordlog) => {
                info!(
                    "opened WAL successfully in {}",
                    now.elapsed().pretty_display()
                );
                mrecordlog
            }
            Err(error) => {
                error!("failed to open WAL: {error}");
                inner_guard.set_status(IngesterStatus::Failed).await;
                return;
            }
        };
        let queue_ids: Vec<QueueId> = mrecordlog
            .list_queues()
            .map(|queue_id| queue_id.to_string())
            .collect();

        if !queue_ids.is_empty() {
            info!("recovering {} shard(s)", queue_ids.len());
        }
        let now = Instant::now();
        let mut num_closed_shards = 0;
        let mut num_deleted_shards = 0;

        for queue_id in queue_ids {
            if let Some(position_range) = queue_position_range(&mrecordlog, &queue_id) {
                let Some((index_uid, source_id, shard_id)) = split_queue_id(&queue_id) else {
                    // `split_queue_id` already logs an error.
                    continue;
                };
                // The queue is not empty: recover it.
                let replication_position_inclusive = Position::offset(*position_range.end());
                let truncation_position_inclusive = if *position_range.start() == 0 {
                    Position::Beginning
                } else {
                    Position::offset(*position_range.start() - 1)
                };
                let rate_limiter = RateLimiter::from_settings(rate_limiter_settings);
                let rate_meter = RateMeter::default();
                // We want to advertise the shard as read-only right away.
                let solo_shard =
                    IngesterShard::new_solo(index_uid.clone(), source_id.clone(), shard_id.clone())
                        .with_state(ShardState::Closed)
                        .with_replication_position_inclusive(replication_position_inclusive)
                        .with_truncation_position_inclusive(truncation_position_inclusive)
                        .with_rate_limiter(rate_limiter)
                        .with_rate_meter(rate_meter)
                        .with_last_write(now)
                        .advertisable() // We want to advertise the shard as read-only right away.
                        .build();
                inner_guard.shards.insert(queue_id.clone(), solo_shard);

                num_closed_shards += 1;
            } else {
                // The queue is empty: delete it.
                if let Err(io_error) = force_delete_queue(&mut mrecordlog, &queue_id).await {
                    error!("failed to delete shard `{queue_id}`: {io_error}");
                    continue;
                }
                num_deleted_shards += 1;
            }
        }
        if num_closed_shards > 0 {
            info!("recovered and closed {num_closed_shards} shard(s)");
        }
        if num_deleted_shards > 0 {
            info!("deleted {num_deleted_shards} empty shard(s)");
        }
        mrecordlog_guard.replace(mrecordlog);
        inner_guard.set_status(IngesterStatus::Ready).await;
    }

    pub async fn wait_for_ready(&mut self) {
        self.status_rx
            .wait_for(|status| *status == IngesterStatus::Ready)
            .await
            .expect("channel should be open");
    }

    pub async fn lock_partially(&self) -> IngestV2Result<PartiallyLockedIngesterState<'_>> {
        if *self.status_rx.borrow() == IngesterStatus::Initializing {
            return Err(IngestV2Error::Internal(
                "ingester is initializing".to_string(),
            ));
        }
        let inner_guard = self.inner.lock().await;

        if inner_guard.status() == IngesterStatus::Failed {
            return Err(IngestV2Error::Internal(
                "failed to initialize ingester".to_string(),
            ));
        }
        let partial_lock = PartiallyLockedIngesterState { inner: inner_guard };
        Ok(partial_lock)
    }

    pub async fn lock_fully(&self) -> IngestV2Result<FullyLockedIngesterState<'_>> {
        if *self.status_rx.borrow() == IngesterStatus::Initializing {
            return Err(IngestV2Error::Internal(
                "ingester is initializing".to_string(),
            ));
        }
        // We assume that the mrecordlog lock is the most "expensive" one to acquire, so we acquire
        // it first.
        let mrecordlog_opt_guard = self.mrecordlog.write().await;
        let inner_guard = self.inner.lock().await;

        if inner_guard.status() == IngesterStatus::Failed {
            return Err(IngestV2Error::Internal(
                "failed to initialize ingester".to_string(),
            ));
        }
        let mrecordlog_guard = RwLockWriteGuard::map(mrecordlog_opt_guard, |mrecordlog_opt| {
            mrecordlog_opt
                .as_mut()
                .expect("mrecordlog should be initialized")
        });
        let full_lock = FullyLockedIngesterState {
            inner: inner_guard,
            mrecordlog: mrecordlog_guard,
        };
        Ok(full_lock)
    }

    // Leaks the mrecordlog lock for use in fetch tasks. It's safe to do so because fetch tasks
    // never attempt to lock the inner state.
    pub fn mrecordlog(&self) -> Arc<RwLock<Option<MultiRecordLogAsync>>> {
        self.mrecordlog.clone()
    }

    pub fn weak(&self) -> WeakIngesterState {
        WeakIngesterState {
            inner: Arc::downgrade(&self.inner),
            mrecordlog: Arc::downgrade(&self.mrecordlog),
            status_rx: self.status_rx.clone(),
        }
    }
}

pub(super) struct PartiallyLockedIngesterState<'a> {
    pub inner: MutexGuard<'a, InnerIngesterState>,
}

impl fmt::Debug for PartiallyLockedIngesterState<'_> {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        f.debug_struct("PartiallyLockedIngesterState").finish()
    }
}

impl Deref for PartiallyLockedIngesterState<'_> {
    type Target = InnerIngesterState;

    fn deref(&self) -> &Self::Target {
        &self.inner
    }
}

impl DerefMut for PartiallyLockedIngesterState<'_> {
    fn deref_mut(&mut self) -> &mut Self::Target {
        &mut self.inner
    }
}

pub(super) struct FullyLockedIngesterState<'a> {
    pub inner: MutexGuard<'a, InnerIngesterState>,
    pub mrecordlog: RwLockMappedWriteGuard<'a, MultiRecordLogAsync>,
}

impl fmt::Debug for FullyLockedIngesterState<'_> {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        f.debug_struct("FullyLockedIngesterState").finish()
    }
}

impl Deref for FullyLockedIngesterState<'_> {
    type Target = InnerIngesterState;

    fn deref(&self) -> &Self::Target {
        &self.inner
    }
}

impl DerefMut for FullyLockedIngesterState<'_> {
    fn deref_mut(&mut self) -> &mut Self::Target {
        &mut self.inner
    }
}

impl FullyLockedIngesterState<'_> {
    /// Deletes the shard identified by `queue_id` from the ingester state. It removes the
    /// mrecordlog queue first and then removes the associated in-memory shard and rate trackers.
    pub async fn delete_shard(&mut self, queue_id: &QueueId, initiator: &'static str) {
        match self.mrecordlog.delete_queue(queue_id).await {
            Ok(_) | Err(DeleteQueueError::MissingQueue(_)) => {
                // Log only if the shard was actually removed.
                if let Some(shard) = self.shards.remove(queue_id) {
                    info!("deleted shard `{queue_id}` initiated via `{initiator}`");

                    if let Some(doc_mapper) = shard.doc_mapper_opt {
                        // At this point, we hold the lock so we can safely check the strong count.
                        // The other locations where the doc mapper is cloned also require holding
                        // the lock.
                        if Arc::strong_count(&doc_mapper) == 1 {
                            let doc_mapping_uid = doc_mapper.doc_mapping_uid();

                            if self.doc_mappers.remove(&doc_mapping_uid).is_some() {
                                info!("evicted doc mapper `{doc_mapping_uid}` from cache`");
                            }
                        }
                    }
                }
            }
            Err(DeleteQueueError::IoError(io_error)) => {
                error!("failed to delete shard `{queue_id}`: {io_error}");
            }
        };
    }

    /// Truncates the shard identified by `queue_id` up to `truncate_up_to_position_inclusive` only
    /// if the current truncation position of the shard is smaller.
    pub async fn truncate_shard(
        &mut self,
        queue_id: &QueueId,
        truncate_up_to_position_inclusive: Position,
        initiator: &'static str,
    ) {
        if let Some(truncate_up_to_offset_inclusive) = truncate_up_to_position_inclusive.as_u64()
            && let Some(shard) = self.inner.shards.get_mut(queue_id)
            && shard.truncation_position_inclusive < truncate_up_to_position_inclusive
        {
            match self
                .mrecordlog
                .truncate(queue_id, truncate_up_to_offset_inclusive)
                .await
            {
                Ok(_) => {
                    info!(
                        "truncated shard `{queue_id}` at {truncate_up_to_position_inclusive} \
                         initiated via `{initiator}`"
                    );
                    shard.truncation_position_inclusive = truncate_up_to_position_inclusive;
                }
                Err(TruncateError::MissingQueue(_)) => {
                    error!("failed to truncate shard `{queue_id}`: WAL queue not found");
                    self.shards.remove(queue_id);
                    info!("deleted dangling shard `{queue_id}`");
                }
                Err(TruncateError::IoError(io_error)) => {
                    error!("failed to truncate shard `{queue_id}`: {io_error}");
                }
            };
        }
    }

    /// Deletes and truncates the shards as directed by the `advise_reset_shards_response` returned
    /// by the control plane.
    pub async fn reset_shards(&mut self, advise_reset_shards_response: &AdviseResetShardsResponse) {
        info!("resetting shards");
        for shard_ids in &advise_reset_shards_response.shards_to_delete {
            for queue_id in shard_ids.queue_ids() {
                self.delete_shard(&queue_id, "control-plane-reset-shards-rpc")
                    .await;
            }
        }
        for shard_id_positions in &advise_reset_shards_response.shards_to_truncate {
            for (queue_id, publish_position) in shard_id_positions.queue_id_positions() {
                self.truncate_shard(
                    &queue_id,
                    publish_position,
                    "control-plane-reset-shards-rpc",
                )
                .await;
            }
        }
    }
}

#[derive(Clone)]
pub(super) struct WeakIngesterState {
    inner: Weak<Mutex<InnerIngesterState>>,
    mrecordlog: Weak<RwLock<Option<MultiRecordLogAsync>>>,
    status_rx: watch::Receiver<IngesterStatus>,
}

impl WeakIngesterState {
    pub fn upgrade(&self) -> Option<IngesterState> {
        let inner = self.inner.upgrade()?;
        let mrecordlog = self.mrecordlog.upgrade()?;
        let status_rx = self.status_rx.clone();
        let state = IngesterState {
            inner,
            mrecordlog,
            status_rx,
        };
        Some(state)
    }
}

#[cfg(test)]
mod tests {
    use bytesize::ByteSize;
    use quickwit_cluster::{ChannelTransport, create_cluster_for_test};
    use quickwit_config::service::QuickwitService;
    use quickwit_proto::types::{NodeId, ShardId, SourceId};
    use tokio::time::timeout;

    use super::*;

    async fn test_cluster() -> Cluster {
        create_cluster_for_test(
            Vec::new(),
            &[QuickwitService::Indexer.as_str()],
            &ChannelTransport::default(),
            true,
        )
        .await
        .unwrap()
    }

    #[tokio::test]
    async fn test_ingester_state_does_not_lock_while_initializing() {
        let cluster = test_cluster().await;
        let state = IngesterState::create(cluster, ByteSize::mb(256), ByteSize::mb(256)).await;
        let inner_guard = state.inner.lock().await;

        assert_eq!(inner_guard.status(), IngesterStatus::Initializing);
        assert_eq!(*state.status_rx.borrow(), IngesterStatus::Initializing);

        let error = state.lock_partially().await.unwrap_err().to_string();
        assert!(error.contains("ingester is initializing"));

        let error = state.lock_fully().await.unwrap_err().to_string();
        assert!(error.contains("ingester is initializing"));
    }

    #[tokio::test]
    async fn test_ingester_state_failed() {
        let cluster = test_cluster().await;
        let state = IngesterState::create(cluster, ByteSize::mb(256), ByteSize::mb(256)).await;

        state
            .inner
            .lock()
            .await
            .set_status(IngesterStatus::Failed)
            .await;

        let error = state.lock_partially().await.unwrap_err().to_string();
        assert!(error.to_string().ends_with("failed to initialize ingester"));

        let error = state.lock_fully().await.unwrap_err().to_string();
        assert!(error.contains("failed to initialize ingester"));
    }

    #[tokio::test]
    async fn test_ingester_state_init() {
        let cluster = test_cluster().await;
        let mut state = IngesterState::create(cluster, ByteSize::mb(256), ByteSize::mb(256)).await;
        let temp_dir = tempfile::tempdir().unwrap();

        state
            .init(temp_dir.path(), RateLimiterSettings::default())
            .await;

        timeout(Duration::from_millis(100), state.wait_for_ready())
            .await
            .unwrap();

        state.lock_partially().await.unwrap();

        let locked_state = state.lock_fully().await.unwrap();
        assert_eq!(locked_state.status(), IngesterStatus::Ready);
        assert_eq!(*locked_state.status_tx.borrow(), IngesterStatus::Ready);
    }

    fn insert_shard_with_used_capacity(
        state: &mut InnerIngesterState,
        index_uid: IndexUid,
        source_id: SourceId,
        shard_id: ShardId,
        shard_state: ShardState,
        used_capacity: ByteSize,
    ) {
        let mut shard = IngesterShard::new_solo(index_uid, source_id, shard_id)
            .with_state(shard_state)
            .build();
        shard.rate_limiter.acquire_bytes(used_capacity);

        let queue_id = shard.queue_id();
        state.shards.insert(queue_id, shard);
    }

    #[tokio::test]
    async fn test_find_most_capacity_shard_returns_shard_with_least_used_capacity() {
        let cluster = create_cluster_for_test(
            Vec::new(),
            &[QuickwitService::Indexer.as_str()],
            &ChannelTransport::default(),
            true,
        )
        .await
        .unwrap();
        let (_temp_dir, state) = IngesterState::for_test(cluster).await;
        let mut state_guard = state.lock_partially().await.unwrap();

        let index_uid = IndexUid::for_test("test-index", 0);
        let source_id = SourceId::from("test-source");

        // Shard 1: 1KB used (most available capacity)
        // Shard 2: 2KB used
        // ...
        // Shard 5: 5KB used (least available capacity)
        for i in 1..=5u64 {
            insert_shard_with_used_capacity(
                &mut state_guard,
                index_uid.clone(),
                source_id.clone(),
                ShardId::from(i),
                ShardState::Open,
                ByteSize::kb(i),
            );
        }

        let shard = state_guard
            .find_most_capacity_shard_mut(&index_uid, &source_id)
            .unwrap();

        assert_eq!(shard.shard_id, ShardId::from(1));
        assert_eq!(shard.shard_state, ShardState::Open);

        let expected_available_permits =
            RateLimiterSettings::default().burst_limit - ByteSize::kb(1).as_u64();
        assert_eq!(
            shard.rate_limiter.available_permits(),
            expected_available_permits
        );
    }

    #[tokio::test]
    async fn test_find_most_capacity_shard_skips_closed_shards() {
        let cluster = create_cluster_for_test(
            Vec::new(),
            &[QuickwitService::Indexer.as_str()],
            &ChannelTransport::default(),
            true,
        )
        .await
        .unwrap();
        let (_temp_dir, state) = IngesterState::for_test(cluster).await;
        let mut locked_state = state.lock_partially().await.unwrap();

        let index_uid = IndexUid::for_test("test-index", 0);
        let source_id = SourceId::from("test-source");

        insert_shard_with_used_capacity(
            &mut locked_state,
            index_uid.clone(),
            source_id.clone(),
            ShardId::from(1),
            ShardState::Open,
            ByteSize::kb(1),
        );
        insert_shard_with_used_capacity(
            &mut locked_state,
            index_uid.clone(),
            source_id.clone(),
            ShardId::from(2),
            ShardState::Open,
            ByteSize::kb(2),
        );

        insert_shard_with_used_capacity(
            &mut locked_state,
            index_uid.clone(),
            source_id.clone(),
            ShardId::from(3),
            ShardState::Closed,
            ByteSize::kb(0),
        );

        let shard = locked_state
            .find_most_capacity_shard_mut(&index_uid, &source_id)
            .unwrap();

        // Should pick shard 1 (most capacity among open shards), not shard 3 (closed)
        assert_eq!(shard.shard_id, ShardId::from(1));
    }

    #[tokio::test]
    async fn test_find_most_capacity_shard_returns_none_for_unknown_index_or_source() {
        let cluster = create_cluster_for_test(
            Vec::new(),
            &[QuickwitService::Indexer.as_str()],
            &ChannelTransport::default(),
            true,
        )
        .await
        .unwrap();
        let (_temp_dir, state) = IngesterState::for_test(cluster).await;
        let mut locked_state = state.lock_partially().await.unwrap();

        let index_uid = IndexUid::for_test("test-index", 0);
        let source_id = SourceId::from("test-source");

        insert_shard_with_used_capacity(
            &mut locked_state,
            index_uid.clone(),
            source_id.clone(),
            ShardId::from(1),
            ShardState::Open,
            ByteSize::kb(0),
        );

        let shard_opt = locked_state
            .find_most_capacity_shard_mut(&IndexUid::for_test("other-index", 0), &source_id);
        assert!(shard_opt.is_none());

        let shard_opt =
            locked_state.find_most_capacity_shard_mut(&index_uid, &SourceId::from("other-source"));
        assert!(shard_opt.is_none());
    }

    #[tokio::test]
    async fn test_ingester_state_set_status() {
        let cluster = test_cluster().await;
        let state =
            IngesterState::create(cluster.clone(), ByteSize::mb(256), ByteSize::mb(256)).await;
        let temp_dir = tempfile::tempdir().unwrap();

        state
            .init(temp_dir.path(), RateLimiterSettings::default())
            .await;

        let mut state_guard = state.lock_fully().await.unwrap();
        state_guard.set_status(IngesterStatus::Failed).await;
        assert_eq!(state_guard.status(), IngesterStatus::Failed);
        assert_eq!(*state.status_rx.borrow(), IngesterStatus::Failed);

        let status_json_str = cluster
            .get_self_key_value(INGESTER_STATUS_KEY)
            .await
            .unwrap();
        let status = IngesterStatus::from_json_str_name(&status_json_str).unwrap();
        assert_eq!(status, IngesterStatus::Failed);
    }

    fn open_shard(
        index_uid: IndexUid,
        source_id: SourceId,
        shard_id: ShardId,
        is_replica: bool,
    ) -> IngesterShard {
        let builder = if is_replica {
            IngesterShard::new_replica(index_uid, source_id, shard_id, NodeId::from("test-leader"))
        } else {
            IngesterShard::new_solo(index_uid, source_id, shard_id)
        };
        builder.advertisable().build()
    }

    #[tokio::test]
    async fn test_get_shard_snapshot() {
        let cluster = test_cluster().await;
        let (_temp_dir, state) = IngesterState::for_test(cluster).await;
        let mut state_guard = state.lock_partially().await.unwrap();

        let index_uid = IndexUid::for_test("test-index", 0);

        // source-a: 2 open shards + 1 closed shard + 1 replica (ignored).
        let s = open_shard(
            index_uid.clone(),
            "source-a".into(),
            ShardId::from(1),
            false,
        );
        state_guard.shards.insert(s.queue_id(), s);
        let s = open_shard(
            index_uid.clone(),
            "source-a".into(),
            ShardId::from(2),
            false,
        );
        state_guard.shards.insert(s.queue_id(), s);
        let s = IngesterShard::new_solo(index_uid.clone(), "source-a".into(), ShardId::from(3))
            .with_state(ShardState::Closed)
            .advertisable()
            .build();
        state_guard.shards.insert(s.queue_id(), s);
        let s = open_shard(index_uid.clone(), "source-a".into(), ShardId::from(4), true);
        state_guard.shards.insert(s.queue_id(), s);

        // source-b: 2 closed shards, no open shards.
        let s = IngesterShard::new_solo(index_uid.clone(), "source-b".into(), ShardId::from(5))
            .with_state(ShardState::Closed)
            .advertisable()
            .build();
        state_guard.shards.insert(s.queue_id(), s);
        let s = IngesterShard::new_solo(index_uid.clone(), "source-b".into(), ShardId::from(6))
            .with_state(ShardState::Closed)
            .advertisable()
            .build();
        state_guard.shards.insert(s.queue_id(), s);

        let (mut open_counts, mut closed_shards) = state_guard.get_shard_snapshot();

        // Open counts: source-a has 2, source-b has 0.
        open_counts.sort_by(|a, b| a.1.cmp(&b.1));
        assert_eq!(open_counts.len(), 2);
        assert_eq!(
            open_counts[0],
            (index_uid.clone(), SourceId::from("source-a"), 2)
        );
        assert_eq!(
            open_counts[1],
            (index_uid.clone(), SourceId::from("source-b"), 0)
        );

        // Closed shards: source-a has shard 3, source-b has shards 5 and 6.
        closed_shards.sort_by(|a, b| a.source_id.cmp(&b.source_id));
        assert_eq!(closed_shards.len(), 2);

        assert_eq!(closed_shards[0].source_id, "source-a");
        assert_eq!(closed_shards[0].shard_ids, vec![ShardId::from(3)]);

        assert_eq!(closed_shards[1].source_id, "source-b");
        let mut source_b_ids = closed_shards[1].shard_ids.clone();
        source_b_ids.sort();
        assert_eq!(source_b_ids, vec![ShardId::from(5), ShardId::from(6)]);
    }
}


================================================
FILE: quickwit/quickwit-ingest/src/ingest_v2/wal_capacity_tracker.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use bytesize::ByteSize;
use quickwit_common::ring_buffer::RingBuffer;

/// The lookback window length is meant to capture readings far enough back in time to give
/// a rough rate of change estimate. At size 6, with broadcast interval of 5 seconds, this would be
/// 30 seconds of readings.
const WAL_CAPACITY_LOOKBACK_WINDOW_LEN: usize = 6;

/// The ring buffer stores one extra element so that `delta()` can compare the newest reading
/// with the one that is exactly `WAL_CAPACITY_LOOKBACK_WINDOW_LEN` steps ago. Otherwise, that
/// reading would be discarded when the next reading is inserted.
const WAL_CAPACITY_READINGS_LEN: usize = WAL_CAPACITY_LOOKBACK_WINDOW_LEN + 1;

struct WalCapacityTimeSeries {
    capacity: ByteSize,
    readings: RingBuffer<f64, WAL_CAPACITY_READINGS_LEN>,
}

impl WalCapacityTimeSeries {
    fn new(capacity: ByteSize) -> Self {
        #[cfg(not(test))]
        assert!(capacity.as_u64() > 0);
        Self {
            capacity,
            readings: RingBuffer::default(),
        }
    }

    fn record_and_score(&mut self, used: ByteSize) -> usize {
        self.record(used);
        let remaining = self.current().unwrap_or(1.0);
        let delta = self.delta().unwrap_or(0.0);
        compute_capacity_score(remaining, delta)
    }

    fn score(&self, used: ByteSize) -> usize {
        let remaining = 1.0 - (used.as_u64() as f64 / self.capacity.as_u64() as f64);
        let delta = self.delta().unwrap_or(0.0);
        compute_capacity_score(remaining, delta)
    }

    fn record(&mut self, used: ByteSize) {
        let remaining = 1.0 - (used.as_u64() as f64 / self.capacity.as_u64() as f64);
        self.readings.push_back(remaining.clamp(0.0, 1.0));
    }

    fn current(&self) -> Option<f64> {
        self.readings.last()
    }

    fn delta(&self) -> Option<f64> {
        let current = self.readings.last()?;
        let oldest = self.readings.front()?;
        Some(current - oldest)
    }
}

pub struct WalCapacityTracker {
    disk: WalCapacityTimeSeries,
    memory: WalCapacityTimeSeries,
}

impl WalCapacityTracker {
    pub fn new(disk_capacity: ByteSize, memory_capacity: ByteSize) -> Self {
        Self {
            disk: WalCapacityTimeSeries::new(disk_capacity),
            memory: WalCapacityTimeSeries::new(memory_capacity),
        }
    }

    /// Records disk and memory usage readings and returns the resulting capacity score.
    /// The score is the minimum of the individual disk and memory scores.
    pub fn record_and_score(&mut self, disk_used: ByteSize, memory_used: ByteSize) -> usize {
        let disk_score = self.disk.record_and_score(disk_used);
        let memory_score = self.memory.record_and_score(memory_used);
        disk_score.min(memory_score)
    }

    /// Computes a capacity score for the given usage without recording it.
    pub fn score(&self, disk_used: ByteSize, memory_used: ByteSize) -> usize {
        let disk_score = self.disk.score(disk_used);
        let memory_score = self.memory.score(memory_used);
        disk_score.min(memory_score)
    }
}

/// Computes a capacity score from 0 to 10 using a PD controller.
///
/// The score has two components:
///
/// - **P (proportional):** How much WAL capacity remains right now. An ingester with 100% free
///   capacity gets `PROPORTIONAL_WEIGHT` points; 50% gets half; and so on. If remaining capacity
///   drops to `MIN_PERMISSIBLE_CAPACITY` or below, the score is immediately 0.
///
/// - **D (derivative):** Up to `DERIVATIVE_WEIGHT` bonus points based on how fast remaining
///   capacity is changing over the lookback window. A higher drain rate is worse, so we invert it:
///   `drain / MAX_DRAIN_RATE` normalizes the drain to a 0–1 penalty, and subtracting from 1
///   converts it into a 0–1 bonus. Multiplied by `DERIVATIVE_WEIGHT`, a stable node gets the full
///   bonus and a node draining at `MAX_DRAIN_RATE` or faster gets nothing.
///
/// Putting it together: a completely idle ingester scores 10 (8 + 2).
/// One that is full but stable scores ~2. One that is draining rapidly scores less.
/// A score of 0 means the ingester is at or below minimum permissible capacity.
///
/// Below this remaining capacity fraction, the score is immediately 0.
const MIN_PERMISSIBLE_CAPACITY: f64 = 0.05;
/// Weight of the proportional term (max points from P).
const PROPORTIONAL_WEIGHT: f64 = 8.0;
/// Weight of the derivative term (max points from D).
const DERIVATIVE_WEIGHT: f64 = 2.0;
/// The drain rate (as a fraction of total capacity over the lookback window) at which the
/// derivative penalty is fully applied. Drain rates beyond this are clamped.
const MAX_DRAIN_RATE: f64 = 0.10;

fn compute_capacity_score(remaining_capacity: f64, capacity_delta: f64) -> usize {
    if remaining_capacity <= MIN_PERMISSIBLE_CAPACITY {
        return 0;
    }
    let p = PROPORTIONAL_WEIGHT * remaining_capacity;
    let drain = (-capacity_delta).clamp(0.0, MAX_DRAIN_RATE);
    let d = DERIVATIVE_WEIGHT * (1.0 - drain / MAX_DRAIN_RATE);
    (p + d).clamp(0.0, 10.0) as usize
}

#[cfg(test)]
mod tests {
    use super::*;

    fn ts() -> WalCapacityTimeSeries {
        WalCapacityTimeSeries::new(ByteSize::b(100))
    }

    /// Helper: record a reading with `used` bytes against the series' fixed capacity.
    fn record(series: &mut WalCapacityTimeSeries, used: u64) {
        series.record(ByteSize::b(used));
    }

    #[test]
    fn test_wal_disk_capacity_current_after_record() {
        let mut series = WalCapacityTimeSeries::new(ByteSize::b(256));
        // 192 of 256 used => 25% remaining
        series.record(ByteSize::b(192));
        assert_eq!(series.current(), Some(0.25));

        // 16 of 256 used => 93.75% remaining
        series.record(ByteSize::b(16));
        assert_eq!(series.current(), Some(0.9375));
    }

    #[test]
    fn test_wal_disk_capacity_record_saturates_at_zero() {
        let mut series = ts();
        // 200 used out of 100 capacity => clamped to 0.0
        record(&mut series, 200);
        assert_eq!(series.current(), Some(0.0));
    }

    #[test]
    fn test_wal_disk_capacity_delta_growing() {
        let mut series = ts();
        // oldest: 60 of 100 used => 40% remaining
        record(&mut series, 60);
        // current: 20 of 100 used => 80% remaining
        record(&mut series, 20);
        // delta = 0.80 - 0.40 = 0.40
        assert_eq!(series.delta(), Some(0.40));
    }

    #[test]
    fn test_wal_disk_capacity_delta_shrinking() {
        let mut series = ts();
        // oldest: 20 of 100 used => 80% remaining
        record(&mut series, 20);
        // current: 60 of 100 used => 40% remaining
        record(&mut series, 60);
        // delta = 0.40 - 0.80 = -0.40
        assert_eq!(series.delta(), Some(-0.40));
    }

    #[test]
    fn test_capacity_score_draining_vs_stable() {
        // Node A: capacity draining — usage increases 10, 20, ..., 70 over 7 ticks.
        let mut node_a = ts();
        for used in (10..=70).step_by(10) {
            record(&mut node_a, used);
        }
        let a_remaining = node_a.current().unwrap();
        let a_delta = node_a.delta().unwrap();
        let a_score = compute_capacity_score(a_remaining, a_delta);

        // Node B: steady at 50% usage over 7 ticks.
        let mut node_b = ts();
        for _ in 0..7 {
            record(&mut node_b, 50);
        }
        let b_remaining = node_b.current().unwrap();
        let b_delta = node_b.delta().unwrap();
        let b_score = compute_capacity_score(b_remaining, b_delta);

        // p=2.4, d=0 (max drain) => 2
        assert_eq!(a_score, 2);
        // p=4, d=2 (stable) => 6
        assert_eq!(b_score, 6);
        assert!(b_score > a_score);
    }

    #[test]
    fn test_wal_disk_capacity_delta_spans_lookback_window() {
        let mut series = ts();

        // Fill to exactly the lookback window length (6 readings), all same value.
        for _ in 0..WAL_CAPACITY_LOOKBACK_WINDOW_LEN {
            record(&mut series, 50);
        }
        assert_eq!(series.delta(), Some(0.0));

        // 7th reading fills the ring buffer. Delta spans 6 intervals.
        record(&mut series, 0);
        assert_eq!(series.delta(), Some(0.50));

        // 8th reading evicts the oldest 50-remaining. Delta still spans 6 intervals.
        record(&mut series, 0);
        assert_eq!(series.delta(), Some(0.50));
    }

    #[test]
    fn test_wal_capacity_tracker_returns_min() {
        let mut tracker = WalCapacityTracker::new(ByteSize::b(100), ByteSize::b(100));
        // Disk 10% used (score 9), memory 90% used (score 2) → returns 2.
        assert_eq!(
            tracker.record_and_score(ByteSize::b(10), ByteSize::b(90)),
            2
        );
    }
}


================================================
FILE: quickwit/quickwit-ingest/src/ingest_v2/workbench.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::{BTreeMap, HashSet};

use quickwit_common::pubsub::EventBroker;
use quickwit_common::rate_limited_error;
use quickwit_proto::control_plane::{
    GetOrCreateOpenShardsFailure, GetOrCreateOpenShardsFailureReason,
};
use quickwit_proto::ingest::ingester::{PersistFailure, PersistFailureReason, PersistSuccess};
use quickwit_proto::ingest::router::{
    IngestFailure, IngestFailureReason, IngestResponseV2, IngestSubrequest, IngestSuccess,
};
use quickwit_proto::ingest::{IngestV2Error, RateLimitingCause, ShardIds};
use quickwit_proto::types::{NodeId, SubrequestId};
use tracing::warn;

use super::publish_tracker::PublishTracker;
use super::router::PersistRequestSummary;

/// A helper struct for managing the state of the subrequests of an ingest request during multiple
/// persist attempts.
#[derive(Default)]
pub(super) struct IngestWorkbench {
    pub subworkbenches: BTreeMap<SubrequestId, IngestSubworkbench>,
    pub num_successes: usize,
    /// The number of batch persist attempts. This is not sum of the number of attempts for each
    /// subrequest.
    pub num_attempts: usize,
    pub max_num_attempts: usize,
    /// List of leaders that have been marked as temporarily unavailable.
    /// These leaders have encountered a transport error during an attempt and will be treated as
    /// if they were out of the pool for subsequent attempts.
    ///
    /// (The point here is to make sure we do not wait for the failure detection to kick the node
    /// out of the ingest node.)
    pub unavailable_leaders: HashSet<NodeId>,
    pub closed_shards: Vec<ShardIds>,
    publish_tracker: Option<PublishTracker>,
}

/// Returns an iterator of pending of subrequests, sorted by sub request id.
pub(super) fn pending_subrequests(
    subworkbenches: &BTreeMap<SubrequestId, IngestSubworkbench>,
) -> impl Iterator<Item = &IngestSubrequest> {
    subworkbenches.values().filter_map(|subworbench| {
        if subworbench.is_pending() {
            Some(&subworbench.subrequest)
        } else {
            None
        }
    })
}

impl IngestWorkbench {
    fn new_inner(
        ingest_subrequests: Vec<IngestSubrequest>,
        max_num_attempts: usize,
        publish_tracker: Option<PublishTracker>,
    ) -> Self {
        let subworkbenches: BTreeMap<SubrequestId, IngestSubworkbench> = ingest_subrequests
            .into_iter()
            .map(|subrequest| {
                (
                    subrequest.subrequest_id,
                    IngestSubworkbench::new(subrequest),
                )
            })
            .collect();

        Self {
            subworkbenches,
            max_num_attempts,
            publish_tracker,
            ..Default::default()
        }
    }

    pub fn new(ingest_subrequests: Vec<IngestSubrequest>, max_num_attempts: usize) -> Self {
        Self::new_inner(ingest_subrequests, max_num_attempts, None)
    }

    pub fn new_with_publish_tracking(
        ingest_subrequests: Vec<IngestSubrequest>,
        max_num_attempts: usize,
        event_broker: EventBroker,
    ) -> Self {
        Self::new_inner(
            ingest_subrequests,
            max_num_attempts,
            Some(PublishTracker::new(event_broker)),
        )
    }

    pub fn new_attempt(&mut self) {
        self.num_attempts += 1;
    }

    /// Returns true if all subrequests were successfully persisted or if the
    /// number of attempts has been exhausted.
    pub fn is_complete(&self) -> bool {
        self.num_successes >= self.subworkbenches.len()
            || self.num_attempts >= self.max_num_attempts
            || self.has_no_pending_subrequests()
    }

    pub fn is_last_attempt(&self) -> bool {
        self.num_attempts >= self.max_num_attempts
    }

    fn has_no_pending_subrequests(&self) -> bool {
        self.subworkbenches
            .values()
            .all(|subworbench| !subworbench.is_pending())
    }

    pub fn record_get_or_create_open_shards_failure(
        &mut self,
        open_shards_failure: GetOrCreateOpenShardsFailure,
    ) {
        let last_failure = match open_shards_failure.reason() {
            GetOrCreateOpenShardsFailureReason::IndexNotFound => SubworkbenchFailure::IndexNotFound,
            GetOrCreateOpenShardsFailureReason::SourceNotFound => {
                SubworkbenchFailure::SourceNotFound
            }
            GetOrCreateOpenShardsFailureReason::NoIngestersAvailable => {
                SubworkbenchFailure::NoShardsAvailable
            }
            GetOrCreateOpenShardsFailureReason::Unspecified => {
                warn!(
                    "failure reason for subrequest `{}` is unspecified",
                    open_shards_failure.subrequest_id
                );
                SubworkbenchFailure::Internal
            }
        };
        self.record_failure(open_shards_failure.subrequest_id, last_failure);
    }

    pub fn record_persist_success(&mut self, persist_success: PersistSuccess) {
        let Some(subworkbench) = self.subworkbenches.get_mut(&persist_success.subrequest_id) else {
            warn!(
                "could not find subrequest `{}` in workbench",
                persist_success.subrequest_id
            );
            return;
        };
        if let Some(publish_tracker) = &mut self.publish_tracker
            && let Some(position) = &persist_success.replication_position_inclusive
        {
            publish_tracker.track_persisted_shard_position(
                persist_success.shard_id().clone(),
                position.clone(),
            );
        }
        self.num_successes += 1;
        subworkbench.num_attempts += 1;
        subworkbench.persist_success_opt = Some(persist_success);
    }

    pub fn record_persist_error(
        &mut self,
        persist_error: IngestV2Error,
        persist_summary: PersistRequestSummary,
    ) {
        // Persist responses use dedicated failure reasons for `ShardNotFound` and
        // `TooManyRequests`: in reality, we should never have to handle these cases here.
        match persist_error {
            IngestV2Error::Timeout(_) => {
                for subrequest_id in persist_summary.subrequest_ids {
                    let failure = SubworkbenchFailure::Persist(PersistFailureReason::Timeout);
                    self.record_failure(subrequest_id, failure);
                }
            }
            IngestV2Error::Unavailable(_) => {
                self.unavailable_leaders.insert(persist_summary.leader_id);
                for subrequest_id in persist_summary.subrequest_ids {
                    self.record_ingester_unavailable(subrequest_id);
                }
            }
            IngestV2Error::Internal(internal_err_msg) => {
                rate_limited_error!(limit_per_min=6, err_msg=%internal_err_msg, "persist error: internal error during persist");
                for subrequest_id in persist_summary.subrequest_ids {
                    self.record_internal_error(subrequest_id);
                }
            }
            IngestV2Error::ShardNotFound { shard_id } => {
                rate_limited_error!(limit_per_min=6, shard_id=%shard_id, "persist error: shard not found");
                for subrequest_id in persist_summary.subrequest_ids {
                    self.record_internal_error(subrequest_id);
                }
            }
            IngestV2Error::TooManyRequests(rate_limiting_cause) => {
                for subrequest_id in persist_summary.subrequest_ids {
                    self.record_too_many_requests(subrequest_id, rate_limiting_cause);
                }
            }
        }
    }

    pub fn record_persist_failure(&mut self, persist_failure: &PersistFailure) {
        let failure = SubworkbenchFailure::Persist(persist_failure.reason());
        self.record_failure(persist_failure.subrequest_id, failure);
    }

    fn record_failure(&mut self, subrequest_id: SubrequestId, failure: SubworkbenchFailure) {
        let Some(subworkbench) = self.subworkbenches.get_mut(&subrequest_id) else {
            warn!("could not find subrequest `{}` in workbench", subrequest_id);
            return;
        };
        subworkbench.num_attempts += 1;
        subworkbench.last_failure_opt = Some(failure);
    }

    pub fn record_no_shards_available(&mut self, subrequest_id: SubrequestId) {
        self.record_failure(subrequest_id, SubworkbenchFailure::NoShardsAvailable);
    }

    /// Marks a node as unavailable for the span of the workbench.
    ///
    /// Remaining attempts will treat the node as if it was not in the ingester pool.
    pub fn record_ingester_unavailable(&mut self, subrequest_id: SubrequestId) {
        self.record_failure(subrequest_id, SubworkbenchFailure::Unavailable);
    }

    fn record_internal_error(&mut self, subrequest_id: SubrequestId) {
        self.record_failure(subrequest_id, SubworkbenchFailure::Internal);
    }

    fn record_too_many_requests(
        &mut self,
        subrequest_id: SubrequestId,
        rate_limiting_cause: RateLimitingCause,
    ) {
        self.record_failure(
            subrequest_id,
            SubworkbenchFailure::RateLimited(rate_limiting_cause),
        );
    }

    pub async fn into_ingest_result(self) -> IngestResponseV2 {
        let num_subworkbenches = self.subworkbenches.len();
        let mut successes = Vec::with_capacity(self.num_successes);
        let mut failures = Vec::with_capacity(num_subworkbenches - self.num_successes);

        // We consider the last retry outcome as the actual outcome.
        for subworkbench in self.subworkbenches.into_values() {
            if let Some(persist_success) = subworkbench.persist_success_opt {
                let success = IngestSuccess {
                    subrequest_id: persist_success.subrequest_id,
                    index_uid: persist_success.index_uid,
                    source_id: persist_success.source_id,
                    shard_id: persist_success.shard_id,
                    replication_position_inclusive: persist_success.replication_position_inclusive,
                    num_ingested_docs: persist_success.num_persisted_docs,
                    parse_failures: persist_success.parse_failures,
                };
                successes.push(success);
            } else if let Some(failure) = subworkbench.last_failure_opt {
                let failure = IngestFailure {
                    subrequest_id: subworkbench.subrequest.subrequest_id,
                    index_id: subworkbench.subrequest.index_id,
                    source_id: subworkbench.subrequest.source_id,
                    reason: failure.reason() as i32,
                };
                failures.push(failure);
            }
        }
        let num_successes = successes.len();
        let num_failures = failures.len();
        assert_eq!(num_successes + num_failures, num_subworkbenches);

        if let Some(publish_tracker) = self.publish_tracker {
            publish_tracker.wait_publish_complete().await;
        }

        // For tests, we sort the successes and failures by subrequest_id
        #[cfg(test)]
        {
            for success in &mut successes {
                success
                    .parse_failures
                    .sort_by_key(|parse_failure| parse_failure.doc_uid());
            }
            successes.sort_by_key(|success| success.subrequest_id);
            failures.sort_by_key(|failure| failure.subrequest_id);
        }

        IngestResponseV2 {
            successes,
            failures,
        }
    }
}

#[derive(Debug)]
pub(super) enum SubworkbenchFailure {
    // There is no entry in the routing table for this index.
    IndexNotFound,
    // There is no entry in the routing table for this source.
    SourceNotFound,
    // The routing table entry for this source is empty, shards are all closed, or their leaders
    // are unavailable.
    NoShardsAvailable,
    // This is an error returned by the ingester: e.g. shard not found, shard closed, rate
    // limited, resource exhausted, etc.
    Persist(PersistFailureReason),
    Internal,
    // The ingester is no longer in the pool or a transport error occurred.
    Unavailable,
    // The ingester is rate limited.
    RateLimited(RateLimitingCause),
}

impl SubworkbenchFailure {
    /// Returns the final `IngestFailureReason` returned to the client.
    fn reason(&self) -> IngestFailureReason {
        match self {
            Self::IndexNotFound => IngestFailureReason::IndexNotFound,
            Self::SourceNotFound => IngestFailureReason::SourceNotFound,
            Self::Internal => IngestFailureReason::Internal,
            Self::NoShardsAvailable => IngestFailureReason::NoShardsAvailable,
            // In our last attempt, we did not manage to reach the ingester.
            // We can consider that as a no shards available.
            Self::Unavailable => IngestFailureReason::NoShardsAvailable,
            Self::RateLimited(rate_limiting_cause) => match rate_limiting_cause {
                RateLimitingCause::RouterLoadShedding => IngestFailureReason::RouterLoadShedding,
                RateLimitingCause::LoadShedding => IngestFailureReason::RouterLoadShedding,
                RateLimitingCause::WalFull => IngestFailureReason::WalFull,
                RateLimitingCause::CircuitBreaker => IngestFailureReason::CircuitBreaker,
                RateLimitingCause::ShardRateLimiting => IngestFailureReason::ShardRateLimited,
                RateLimitingCause::Unknown => IngestFailureReason::Unspecified,
            },
            Self::Persist(persist_failure_reason) => (*persist_failure_reason).into(),
        }
    }
}

#[derive(Debug, Default)]
pub(super) struct IngestSubworkbench {
    pub subrequest: IngestSubrequest,
    pub persist_success_opt: Option<PersistSuccess>,
    pub last_failure_opt: Option<SubworkbenchFailure>,
    /// The number of persist attempts for this subrequest.
    pub num_attempts: usize,
}

impl IngestSubworkbench {
    pub fn new(subrequest: IngestSubrequest) -> Self {
        Self {
            subrequest,
            ..Default::default()
        }
    }

    pub fn is_pending(&self) -> bool {
        self.persist_success_opt.is_none() && self.last_failure_is_transient()
    }

    /// Returns `false` if and only if the last attempt suggests retrying (on any node) will fail.
    /// e.g.:
    /// - the index does not exist
    /// - the source does not exist.
    fn last_failure_is_transient(&self) -> bool {
        match self.last_failure_opt {
            Some(SubworkbenchFailure::IndexNotFound) => false,
            Some(SubworkbenchFailure::SourceNotFound) => false,
            Some(SubworkbenchFailure::Internal) => true,
            Some(SubworkbenchFailure::NoShardsAvailable) => true,
            Some(SubworkbenchFailure::Persist(_)) => true,
            Some(SubworkbenchFailure::Unavailable) => true,
            Some(SubworkbenchFailure::RateLimited(_)) => true,
            None => true,
        }
    }
}

#[cfg(test)]
mod tests {
    use std::time::Duration;

    use quickwit_proto::indexing::ShardPositionsUpdate;
    use quickwit_proto::ingest::ingester::PersistFailureReason;
    use quickwit_proto::types::{IndexUid, Position, ShardId, SourceUid};

    use super::*;

    #[test]
    fn test_ingest_subworkbench() {
        let subrequest = IngestSubrequest {
            ..Default::default()
        };
        let mut subworkbench = IngestSubworkbench::new(subrequest);
        assert!(subworkbench.is_pending());
        assert!(subworkbench.last_failure_is_transient());

        subworkbench.last_failure_opt = Some(SubworkbenchFailure::Unavailable);
        assert!(subworkbench.is_pending());
        assert!(subworkbench.last_failure_is_transient());

        subworkbench.last_failure_opt = Some(SubworkbenchFailure::Internal);
        assert!(subworkbench.is_pending());
        assert!(subworkbench.last_failure_is_transient());

        subworkbench.last_failure_opt = Some(SubworkbenchFailure::NoShardsAvailable);
        assert!(subworkbench.is_pending());
        assert!(subworkbench.last_failure_is_transient());

        subworkbench.last_failure_opt = Some(SubworkbenchFailure::IndexNotFound);
        assert!(!subworkbench.is_pending());
        assert!(!subworkbench.last_failure_is_transient());
        subworkbench.last_failure_opt = Some(SubworkbenchFailure::SourceNotFound);
        assert!(!subworkbench.is_pending());
        assert!(!subworkbench.last_failure_is_transient());

        subworkbench.last_failure_opt = Some(SubworkbenchFailure::Persist(
            PersistFailureReason::NoShardsAvailable,
        ));
        assert!(subworkbench.is_pending());
        assert!(subworkbench.last_failure_is_transient());

        let persist_success = PersistSuccess {
            ..Default::default()
        };
        subworkbench.persist_success_opt = Some(persist_success);
        assert!(!subworkbench.is_pending());
    }

    #[test]
    fn test_ingest_workbench() {
        let workbench = IngestWorkbench::new(Vec::new(), 1);
        assert!(workbench.is_complete());

        let ingest_subrequests = vec![IngestSubrequest {
            ..Default::default()
        }];
        let mut workbench = IngestWorkbench::new(ingest_subrequests, 1);
        assert!(!workbench.is_last_attempt());
        assert!(!workbench.is_complete());

        workbench.new_attempt();
        assert!(workbench.is_last_attempt());
        assert!(workbench.is_complete());

        let ingest_subrequests = vec![
            IngestSubrequest {
                subrequest_id: 0,
                ..Default::default()
            },
            IngestSubrequest {
                subrequest_id: 1,
                ..Default::default()
            },
        ];
        let mut workbench = IngestWorkbench::new(ingest_subrequests, 1);
        assert_eq!(pending_subrequests(&workbench.subworkbenches).count(), 2);
        assert!(!workbench.is_complete());

        let persist_success = PersistSuccess {
            subrequest_id: 0,
            ..Default::default()
        };
        workbench.record_persist_success(persist_success);

        assert_eq!(workbench.num_successes, 1);
        assert_eq!(pending_subrequests(&workbench.subworkbenches).count(), 1);
        assert_eq!(
            pending_subrequests(&workbench.subworkbenches)
                .next()
                .unwrap()
                .subrequest_id,
            1
        );

        let subworkbench = workbench.subworkbenches.get(&0).unwrap();
        assert_eq!(subworkbench.num_attempts, 1);
        assert!(!subworkbench.is_pending());

        let persist_failure = PersistFailure {
            subrequest_id: 1,
            ..Default::default()
        };
        workbench.record_persist_failure(&persist_failure);

        assert_eq!(workbench.num_successes, 1);
        assert_eq!(pending_subrequests(&workbench.subworkbenches).count(), 1);
        assert_eq!(
            pending_subrequests(&workbench.subworkbenches)
                .next()
                .unwrap()
                .subrequest_id,
            1
        );

        let subworkbench = workbench.subworkbenches.get(&1).unwrap();
        assert_eq!(subworkbench.num_attempts, 1);
        assert!(subworkbench.last_failure_opt.is_some());

        let persist_success = PersistSuccess {
            subrequest_id: 1,
            ..Default::default()
        };
        workbench.record_persist_success(persist_success);

        assert!(workbench.is_complete());
        assert_eq!(workbench.num_successes, 2);
        assert_eq!(pending_subrequests(&workbench.subworkbenches).count(), 0);
    }

    #[tokio::test]
    async fn test_workbench_publish_tracking_empty() {
        let workbench =
            IngestWorkbench::new_with_publish_tracking(Vec::new(), 1, EventBroker::default());
        assert!(workbench.is_complete());
        assert_eq!(
            workbench.into_ingest_result().await,
            IngestResponseV2::default()
        );
    }

    #[tokio::test]
    async fn test_workbench_publish_tracking_happy_path() {
        let event_broker = EventBroker::default();
        let shard_id_1 = ShardId::from("test-shard-1");
        let shard_id_2 = ShardId::from("test-shard-2");
        let ingest_subrequests = vec![
            IngestSubrequest {
                subrequest_id: 0,
                ..Default::default()
            },
            IngestSubrequest {
                subrequest_id: 1,
                ..Default::default()
            },
        ];
        let mut workbench =
            IngestWorkbench::new_with_publish_tracking(ingest_subrequests, 1, event_broker.clone());
        assert_eq!(pending_subrequests(&workbench.subworkbenches).count(), 2);
        assert!(!workbench.is_complete());

        let persist_success = PersistSuccess {
            subrequest_id: 0,
            shard_id: Some(shard_id_1.clone()),
            replication_position_inclusive: Some(Position::offset(42usize)),
            ..Default::default()
        };
        workbench.record_persist_success(persist_success);

        let persist_failure = PersistFailure {
            subrequest_id: 1,
            ..Default::default()
        };
        workbench.record_persist_failure(&persist_failure);

        let persist_success = PersistSuccess {
            subrequest_id: 1,
            shard_id: Some(shard_id_2.clone()),
            replication_position_inclusive: Some(Position::offset(66usize)),
            ..Default::default()
        };

        workbench.record_persist_success(persist_success);

        assert!(workbench.is_complete());
        assert_eq!(workbench.num_successes, 2);
        assert_eq!(pending_subrequests(&workbench.subworkbenches).count(), 0);

        event_broker.publish(ShardPositionsUpdate {
            source_uid: SourceUid {
                index_uid: IndexUid::for_test("test-index", 0),
                source_id: "test-source".to_string(),
            },
            updated_shard_positions: vec![
                (shard_id_1, Position::offset(42usize)),
                (shard_id_2, Position::offset(66usize)),
            ]
            .into_iter()
            .collect(),
        });

        let ingest_response = workbench.into_ingest_result().await;
        assert_eq!(ingest_response.successes.len(), 2);
        assert_eq!(ingest_response.failures.len(), 0);
    }

    #[tokio::test]
    async fn test_workbench_publish_tracking_waits() {
        let event_broker = EventBroker::default();
        let shard_id_1 = ShardId::from("test-shard-1");
        let shard_id_2 = ShardId::from("test-shard-2");
        let ingest_subrequests = vec![
            IngestSubrequest {
                subrequest_id: 0,
                ..Default::default()
            },
            IngestSubrequest {
                subrequest_id: 1,
                ..Default::default()
            },
        ];
        let mut workbench =
            IngestWorkbench::new_with_publish_tracking(ingest_subrequests, 1, event_broker.clone());

        let persist_success = PersistSuccess {
            subrequest_id: 0,
            shard_id: Some(shard_id_1.clone()),
            replication_position_inclusive: Some(Position::offset(42usize)),
            ..Default::default()
        };
        workbench.record_persist_success(persist_success);

        let persist_success = PersistSuccess {
            subrequest_id: 1,
            shard_id: Some(shard_id_2.clone()),
            replication_position_inclusive: Some(Position::offset(66usize)),
            ..Default::default()
        };
        workbench.record_persist_success(persist_success);

        assert!(workbench.is_complete());
        assert_eq!(workbench.num_successes, 2);
        assert_eq!(pending_subrequests(&workbench.subworkbenches).count(), 0);

        event_broker.publish(ShardPositionsUpdate {
            source_uid: SourceUid {
                index_uid: IndexUid::for_test("test-index", 0),
                source_id: "test-source".to_string(),
            },
            updated_shard_positions: vec![(shard_id_2, Position::offset(66usize))]
                .into_iter()
                .collect(),
        });
        // still waits for shard 1 to be published
        tokio::time::timeout(Duration::from_millis(200), workbench.into_ingest_result())
            .await
            .unwrap_err();
    }

    #[test]
    fn test_ingest_workbench_record_get_or_create_open_shards_failure() {
        let ingest_subrequests = vec![IngestSubrequest {
            subrequest_id: 0,
            ..Default::default()
        }];
        let mut workbench = IngestWorkbench::new(ingest_subrequests, 1);

        let get_or_create_open_shards_failure = GetOrCreateOpenShardsFailure {
            subrequest_id: 42,
            reason: GetOrCreateOpenShardsFailureReason::IndexNotFound as i32,
            ..Default::default()
        };
        workbench.record_get_or_create_open_shards_failure(get_or_create_open_shards_failure);

        let get_or_create_open_shards_failure = GetOrCreateOpenShardsFailure {
            subrequest_id: 0,
            reason: GetOrCreateOpenShardsFailureReason::SourceNotFound as i32,
            ..Default::default()
        };
        workbench.record_get_or_create_open_shards_failure(get_or_create_open_shards_failure);

        assert_eq!(workbench.num_successes, 0);

        let subworkbench = workbench.subworkbenches.get(&0).unwrap();
        assert!(matches!(
            subworkbench.last_failure_opt,
            Some(SubworkbenchFailure::SourceNotFound)
        ));
        assert_eq!(subworkbench.num_attempts, 1);
    }

    #[test]
    fn test_ingest_workbench_record_persist_success() {
        let ingest_subrequests = vec![IngestSubrequest {
            subrequest_id: 0,
            ..Default::default()
        }];
        let mut workbench = IngestWorkbench::new(ingest_subrequests, 1);

        let persist_success = PersistSuccess {
            subrequest_id: 42,
            ..Default::default()
        };
        workbench.record_persist_success(persist_success);

        let persist_success = PersistSuccess {
            subrequest_id: 0,
            ..Default::default()
        };
        workbench.record_persist_success(persist_success);

        assert_eq!(workbench.num_successes, 1);

        let subworkbench = workbench.subworkbenches.get(&0).unwrap();
        assert!(matches!(
            subworkbench.persist_success_opt,
            Some(PersistSuccess { .. })
        ));
        assert_eq!(subworkbench.num_attempts, 1);
    }

    #[test]
    fn test_ingest_workbench_record_persist_error_timeout() {
        let ingest_subrequests = vec![IngestSubrequest {
            subrequest_id: 0,
            ..Default::default()
        }];
        let mut workbench = IngestWorkbench::new(ingest_subrequests, 1);

        let persist_error = IngestV2Error::Timeout("request timed out".to_string());
        let leader_id = NodeId::from("test-leader");
        let persist_summary = PersistRequestSummary {
            leader_id: leader_id.clone(),
            subrequest_ids: vec![0],
        };
        workbench.record_persist_error(persist_error, persist_summary);

        let subworkbench = workbench.subworkbenches.get(&0).unwrap();
        assert_eq!(subworkbench.num_attempts, 1);

        assert!(matches!(
            subworkbench.last_failure_opt,
            Some(SubworkbenchFailure::Persist(PersistFailureReason::Timeout))
        ));
        assert!(subworkbench.persist_success_opt.is_none());
    }

    #[test]
    fn test_ingest_workbench_record_persist_error_unavailable() {
        let ingest_subrequests = vec![IngestSubrequest {
            subrequest_id: 0,
            ..Default::default()
        }];
        let mut workbench = IngestWorkbench::new(ingest_subrequests, 1);

        let persist_error = IngestV2Error::Unavailable("connection error".to_string());
        let leader_id = NodeId::from("test-leader");
        let persist_summary = PersistRequestSummary {
            leader_id: leader_id.clone(),
            subrequest_ids: vec![0],
        };
        workbench.record_persist_error(persist_error, persist_summary);

        assert!(workbench.unavailable_leaders.contains(&leader_id));

        let subworkbench = workbench.subworkbenches.get(&0).unwrap();
        assert_eq!(subworkbench.num_attempts, 1);

        assert!(matches!(
            subworkbench.last_failure_opt,
            Some(SubworkbenchFailure::Unavailable)
        ));
        assert!(subworkbench.persist_success_opt.is_none());
    }

    #[test]
    fn test_ingest_workbench_record_persist_error_internal() {
        let ingest_subrequests = vec![IngestSubrequest {
            subrequest_id: 0,
            ..Default::default()
        }];
        let mut workbench = IngestWorkbench::new(ingest_subrequests, 1);

        let persist_error = IngestV2Error::Internal("IO error".to_string());
        let persist_summary = PersistRequestSummary {
            leader_id: NodeId::from("test-leader"),
            subrequest_ids: vec![0],
        };
        workbench.record_persist_error(persist_error, persist_summary);

        let subworkbench = workbench.subworkbenches.get(&0).unwrap();
        assert_eq!(subworkbench.num_attempts, 1);

        assert!(matches!(
            &subworkbench.last_failure_opt,
            Some(SubworkbenchFailure::Internal)
        ));
        assert!(subworkbench.persist_success_opt.is_none());
    }

    #[test]
    fn test_ingest_workbench_record_persist_failure() {
        let ingest_subrequests = vec![IngestSubrequest {
            subrequest_id: 0,
            ..Default::default()
        }];
        let mut workbench = IngestWorkbench::new(ingest_subrequests, 1);

        let persist_failure = PersistFailure {
            subrequest_id: 42,
            reason: PersistFailureReason::NoShardsAvailable as i32,
            ..Default::default()
        };
        workbench.record_persist_failure(&persist_failure);

        let persist_failure = PersistFailure {
            subrequest_id: 0,
            reason: PersistFailureReason::WalFull as i32,
            ..Default::default()
        };
        workbench.record_persist_failure(&persist_failure);

        assert_eq!(workbench.num_successes, 0);

        let subworkbench = workbench.subworkbenches.get(&0).unwrap();
        assert!(matches!(
            subworkbench.last_failure_opt,
            Some(SubworkbenchFailure::Persist(reason)) if reason == PersistFailureReason::WalFull
        ));
        assert_eq!(subworkbench.num_attempts, 1);
    }

    #[test]
    fn test_ingest_workbench_record_no_shards_available() {
        let ingest_subrequests = vec![IngestSubrequest {
            subrequest_id: 0,
            ..Default::default()
        }];
        let mut workbench = IngestWorkbench::new(ingest_subrequests, 1);

        workbench.record_no_shards_available(42);
        workbench.record_no_shards_available(0);

        assert_eq!(workbench.num_successes, 0);

        let subworkbench = workbench.subworkbenches.get(&0).unwrap();
        assert!(matches!(
            subworkbench.last_failure_opt,
            Some(SubworkbenchFailure::NoShardsAvailable)
        ));
        assert_eq!(subworkbench.num_attempts, 1);
    }

    #[tokio::test]
    async fn test_ingest_workbench_into_ingest_result() {
        let workbench = IngestWorkbench::new(Vec::new(), 0);
        let response = workbench.into_ingest_result().await;
        assert!(response.successes.is_empty());
        assert!(response.failures.is_empty());

        let ingest_subrequests = vec![
            IngestSubrequest {
                subrequest_id: 0,
                ..Default::default()
            },
            IngestSubrequest {
                subrequest_id: 1,
                ..Default::default()
            },
        ];
        let mut workbench = IngestWorkbench::new(ingest_subrequests, 1);
        let persist_success = PersistSuccess {
            ..Default::default()
        };
        let subworkbench = workbench.subworkbenches.get_mut(&0).unwrap();
        subworkbench.persist_success_opt = Some(persist_success);

        workbench.record_no_shards_available(1);

        let response = workbench.into_ingest_result().await;
        assert_eq!(response.successes.len(), 1);
        assert_eq!(response.successes[0].subrequest_id, 0);

        assert_eq!(response.failures.len(), 1);
        assert_eq!(response.failures[0].subrequest_id, 1);
        assert_eq!(
            response.failures[0].reason(),
            IngestFailureReason::NoShardsAvailable
        );

        let ingest_subrequests = vec![IngestSubrequest {
            subrequest_id: 0,
            ..Default::default()
        }];
        let mut workbench = IngestWorkbench::new(ingest_subrequests, 1);
        let failure = SubworkbenchFailure::Persist(PersistFailureReason::Timeout);
        workbench.record_failure(0, failure);

        let ingest_response = workbench.into_ingest_result().await;
        assert_eq!(ingest_response.successes.len(), 0);
        assert_eq!(
            ingest_response.failures[0].reason(),
            IngestFailureReason::Timeout
        );
    }
}


================================================
FILE: quickwit/quickwit-ingest/src/lib.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#![deny(clippy::disallowed_methods)]

mod doc_batch;
pub mod error;
mod ingest_api_service;
#[path = "codegen/ingest_service.rs"]
#[allow(clippy::disallowed_methods)]
mod ingest_service;
mod ingest_v2;
mod memory_capacity;
mod metrics;
mod mrecordlog_async;
mod notifications;
mod position;
mod queue;

use std::collections::HashMap;
use std::path::{Path, PathBuf};

use anyhow::{Context, bail};
pub use doc_batch::*;
pub use error::IngestServiceError;
pub use ingest_api_service::{GetMemoryCapacity, GetPartitionId, IngestApiService};
pub use ingest_service::*;
pub use ingest_v2::*;
pub use memory_capacity::MemoryCapacity;
use once_cell::sync::OnceCell;
pub use position::Position;
pub use queue::Queues;
use quickwit_actors::{Mailbox, Universe};
use quickwit_config::IngestApiConfig;
use tokio::sync::Mutex;

pub const QUEUES_DIR_NAME: &str = "queues";

pub type Result<T> = std::result::Result<T, IngestServiceError>;

type IngestApiServiceMailboxes = HashMap<PathBuf, Mailbox<IngestApiService>>;

pub static INGEST_API_SERVICE_MAILBOXES: OnceCell<Mutex<IngestApiServiceMailboxes>> =
    OnceCell::new();

/// Initializes an [`IngestApiService`] consuming the queue located at `queue_path`.
pub async fn init_ingest_api(
    universe: &Universe,
    queues_dir_path: &Path,
    config: &IngestApiConfig,
) -> anyhow::Result<Mailbox<IngestApiService>> {
    let mut guard = INGEST_API_SERVICE_MAILBOXES
        .get_or_init(|| Mutex::new(HashMap::new()))
        .lock()
        .await;
    if let Some(mailbox) = guard.get(queues_dir_path) {
        return Ok(mailbox.clone());
    }
    let ingest_api_actor = IngestApiService::with_queues_dir(
        queues_dir_path,
        config.max_queue_memory_usage.as_u64() as usize,
        config.max_queue_disk_usage.as_u64() as usize,
    )
    .await
    .with_context(|| {
        format!(
            "failed to open the ingest API record log located at `{}`",
            queues_dir_path.display()
        )
    })?;
    let (ingest_api_service, _ingest_api_handle) = universe.spawn_builder().spawn(ingest_api_actor);
    guard.insert(queues_dir_path.to_path_buf(), ingest_api_service.clone());
    Ok(ingest_api_service)
}

/// Returns the instance of the single IngestApiService via a copy of its Mailbox.
pub async fn get_ingest_api_service(
    queues_dir_path: &Path,
) -> anyhow::Result<Mailbox<IngestApiService>> {
    let guard = INGEST_API_SERVICE_MAILBOXES
        .get_or_init(|| Mutex::new(HashMap::new()))
        .lock()
        .await;
    if let Some(mailbox) = guard.get(queues_dir_path) {
        return Ok(mailbox.clone());
    }
    bail!(
        "ingest API service with queues directory located at `{}` is not initialized",
        queues_dir_path.display()
    )
}

/// Starts an [`IngestApiService`] instance at `<data_dir_path>/queues`.
pub async fn start_ingest_api_service(
    universe: &Universe,
    data_dir_path: &Path,
    config: &IngestApiConfig,
) -> anyhow::Result<Mailbox<IngestApiService>> {
    let queues_dir_path = data_dir_path.join(QUEUES_DIR_NAME);
    init_ingest_api(universe, &queues_dir_path, config).await
}

#[macro_export]
macro_rules! with_lock_metrics {
    ($future:expr, $($label:tt),*) => {
        {
            $crate::ingest_v2::metrics::INGEST_V2_METRICS
                .wal_acquire_lock_requests_in_flight
                .with_label_values([$($label),*])
                .inc();

            let now = std::time::Instant::now();
            let guard = $future;

            let elapsed = now.elapsed();
            if elapsed > std::time::Duration::from_secs(1) {
                quickwit_common::rate_limited_warn!(
                    limit_per_min=6,
                    "lock acquisition took {}ms", elapsed.as_millis()
                );
            }
            $crate::ingest_v2::metrics::INGEST_V2_METRICS
                .wal_acquire_lock_requests_in_flight
                .with_label_values([$($label),*])
                .dec();
            $crate::ingest_v2::metrics::INGEST_V2_METRICS
                .wal_acquire_lock_request_duration_secs
                .with_label_values([$($label),*])
                .observe(elapsed.as_secs_f64());

            guard
        }
    }
}

#[cfg(test)]
mod tests {

    use quickwit_actors::AskError;
    use quickwit_proto::ingest::RateLimitingCause;

    use super::*;
    use crate::{CreateQueueRequest, IngestRequest, SuggestTruncateRequest};

    #[tokio::test]
    async fn test_get_ingest_api_service() {
        let universe = Universe::with_accelerated_time();
        let temp_dir = tempfile::tempdir().unwrap();

        let queues_0_dir_path = temp_dir.path().join("queues-0");
        get_ingest_api_service(&queues_0_dir_path)
            .await
            .unwrap_err();
        init_ingest_api(&universe, &queues_0_dir_path, &IngestApiConfig::default())
            .await
            .unwrap();
        let ingest_api_service_0 = get_ingest_api_service(&queues_0_dir_path).await.unwrap();
        ingest_api_service_0
            .ask_for_res(CreateQueueRequest {
                queue_id: "test-queue".to_string(),
            })
            .await
            .unwrap();

        let queues_1_dir_path = temp_dir.path().join("queues-1");
        init_ingest_api(&universe, &queues_1_dir_path, &IngestApiConfig::default())
            .await
            .unwrap();
        let ingest_api_service_1 = get_ingest_api_service(&queues_1_dir_path).await.unwrap();
        ingest_api_service_1
            .ask_for_res(CreateQueueRequest {
                queue_id: "test-queue".to_string(),
            })
            .await
            .unwrap();
        universe.assert_quit().await;
    }

    #[tokio::test]
    async fn test_get_ingest_multiple_index_api_service() {
        let universe = Universe::with_accelerated_time();
        let temp_dir = tempfile::tempdir().unwrap();

        let queues_0_dir_path = temp_dir.path().join("queues-0");
        let ingest_api_service =
            init_ingest_api(&universe, &queues_0_dir_path, &IngestApiConfig::default())
                .await
                .unwrap();
        ingest_api_service
            .ask_for_res(CreateQueueRequest {
                queue_id: "index-1".to_string(),
            })
            .await
            .unwrap();
        let ingest_request = IngestRequest {
            doc_batches: vec![
                DocBatch {
                    index_id: "index-1".to_string(),
                    doc_buffer: vec![10, 11, 12].into(),
                    doc_lengths: vec![2],
                },
                DocBatch {
                    index_id: "index-2".to_string(),
                    doc_buffer: vec![10, 11, 12].into(),
                    doc_lengths: vec![2],
                },
            ],
            commit: CommitType::Auto.into(),
        };
        let ingest_result = ingest_api_service.ask_for_res(ingest_request).await;
        assert!(ingest_result.is_err());
        match ingest_result.unwrap_err() {
            AskError::ErrorReply(ingest_error) => {
                assert!(ingest_error.to_string().contains("index-2"));
            }
            _ => panic!("wrong error type"),
        }
        universe.assert_quit().await;
    }

    #[tokio::test]
    async fn test_queue_limit() {
        let universe = Universe::with_accelerated_time();
        let temp_dir = tempfile::tempdir().unwrap();

        let queues_dir_path = temp_dir.path().join("queues-0");
        get_ingest_api_service(&queues_dir_path).await.unwrap_err();

        let ingest_api_config = serde_json::from_str(
            r#"{
            "max_queue_memory_usage": "1200b",
            "max_queue_disk_usage": "256mb"
        }"#,
        )
        .unwrap();
        init_ingest_api(&universe, &queues_dir_path, &ingest_api_config)
            .await
            .unwrap();
        let ingest_api_service = get_ingest_api_service(&queues_dir_path).await.unwrap();

        ingest_api_service
            .ask_for_res(CreateQueueRequest {
                queue_id: "test-queue".to_string(),
            })
            .await
            .unwrap();

        let ingest_request = IngestRequest {
            doc_batches: vec![DocBatch {
                index_id: "test-queue".to_string(),
                doc_buffer: vec![1; 600].into(),
                doc_lengths: vec![30; 20],
            }],
            commit: CommitType::Auto.into(),
        };

        ingest_api_service
            .ask_for_res(ingest_request.clone())
            .await
            .unwrap();

        ingest_api_service
            .ask_for_res(ingest_request.clone())
            .await
            .unwrap();

        // we have to much in memory
        assert!(matches!(
            ingest_api_service
                .ask_for_res(ingest_request.clone())
                .await
                .unwrap_err(),
            AskError::ErrorReply(IngestServiceError::RateLimited(RateLimitingCause::WalFull))
        ));

        // delete the first batch
        ingest_api_service
            .ask_for_res(SuggestTruncateRequest {
                index_id: "test-queue".to_string(),
                up_to_position_included: 29,
            })
            .await
            .unwrap();

        // now we should be okay
        ingest_api_service
            .ask_for_res(ingest_request)
            .await
            .unwrap();
        universe.assert_quit().await;
    }
}


================================================
FILE: quickwit/quickwit-ingest/src/memory_capacity.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::fmt;
use std::sync::Arc;
use std::sync::atomic::{AtomicUsize, Ordering};

#[derive(Debug, Clone, Copy, thiserror::Error)]
#[error("failed to reserve requested memory capacity. current capacity: {0}")]
pub struct ReserveCapacityError(usize);

#[derive(Clone)]
pub struct MemoryCapacity {
    inner: Arc<InnerMemoryCapacity>,
}

impl fmt::Debug for MemoryCapacity {
    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
        f.debug_struct("MemoryCapacity")
            .field("capacity", &self.capacity())
            .field("max_capacity", &self.max_capacity())
            .finish()
    }
}

impl MemoryCapacity {
    /// Creates a new [`MemoryCapacity`] object with a capacity of `max_capacity` bytes.
    ///
    /// # Panics
    ///
    /// This constructor panics if `max_capacity` is 0.
    pub fn new(max_capacity: usize) -> Self {
        assert!(
            max_capacity > 0,
            "The memory capacity is required to be > 0."
        );

        Self {
            inner: Arc::new(InnerMemoryCapacity {
                max_capacity,
                capacity: AtomicUsize::new(max_capacity),
            }),
        }
    }

    /// Attempts to reserve `num_bytes` of capacity. Returns an error if there is not enough
    /// capacity available.
    pub fn reserve_capacity(&self, num_bytes: usize) -> Result<(), ReserveCapacityError> {
        loop {
            let current_capacity = self.inner.capacity.load(Ordering::Acquire);

            if current_capacity < num_bytes {
                return Err(ReserveCapacityError(current_capacity));
            }
            let new_capacity = current_capacity - num_bytes;

            if self
                .inner
                .capacity
                .compare_exchange(
                    current_capacity,
                    new_capacity,
                    Ordering::AcqRel,
                    Ordering::Acquire,
                )
                .is_ok()
            {
                return Ok(());
            }
        }
    }

    /// Resets the capacity to `new_capacity`.
    pub fn reset_capacity(&self, new_capacity: usize) {
        self.inner.capacity.store(new_capacity, Ordering::Release);
    }

    pub fn max_capacity(&self) -> usize {
        self.inner.max_capacity
    }

    /// Returns the current capacity.
    pub fn capacity(&self) -> usize {
        self.inner
            .capacity
            .load(std::sync::atomic::Ordering::Relaxed)
    }

    /// Returns the ratio of used capacity to maximum capacity.
    pub fn usage_ratio(&self) -> f64 {
        1.0 - (self.capacity() as f64 / self.max_capacity() as f64)
    }
}

struct InnerMemoryCapacity {
    /// The maximum number of bytes that can be stored in memory.
    max_capacity: usize,
    /// The current number of bytes stored in memory.
    capacity: AtomicUsize,
}

#[cfg(test)]
mod tests {
    use std::sync::Barrier;
    use std::thread;

    use super::*;

    #[tokio::test]
    async fn test_memory_capacity() {
        let memory_capacity = MemoryCapacity::new(10);
        assert_eq!(memory_capacity.max_capacity(), 10);
        assert_eq!(memory_capacity.capacity(), 10);
        assert_eq!(memory_capacity.usage_ratio(), 0.0);

        memory_capacity.reserve_capacity(6).unwrap();
        assert_eq!(memory_capacity.max_capacity(), 10);
        assert_eq!(memory_capacity.capacity(), 4);
        assert_eq!(memory_capacity.usage_ratio(), 0.6);

        memory_capacity.reserve_capacity(3).unwrap();
        assert_eq!(memory_capacity.max_capacity(), 10);
        assert_eq!(memory_capacity.capacity(), 1);
        assert_eq!(memory_capacity.usage_ratio(), 0.9);

        memory_capacity.reserve_capacity(1).unwrap();
        assert_eq!(memory_capacity.max_capacity(), 10);
        assert_eq!(memory_capacity.capacity(), 0);
        assert_eq!(memory_capacity.usage_ratio(), 1.0);

        memory_capacity.reserve_capacity(1).unwrap_err();

        let mut handles = Vec::with_capacity(100);
        let barrier = Arc::new(Barrier::new(100));
        let memory_capacity = MemoryCapacity::new(100);

        for _ in 0..100 {
            let barrier = barrier.clone();
            let memory_capacity = memory_capacity.clone();

            handles.push(thread::spawn(move || {
                barrier.wait();
                memory_capacity.reserve_capacity(1).unwrap();
            }));
        }
        for handle in handles {
            handle.join().unwrap();
        }
        assert_eq!(memory_capacity.capacity(), 0)
    }
}


================================================
FILE: quickwit/quickwit-ingest/src/metrics.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use once_cell::sync::Lazy;
use quickwit_common::metrics::{IntCounter, IntGauge, new_counter, new_counter_vec, new_gauge};

pub struct IngestMetrics {
    pub ingested_docs_bytes_valid: IntCounter,
    pub ingested_docs_bytes_invalid: IntCounter,
    pub ingested_docs_invalid: IntCounter,
    pub ingested_docs_valid: IntCounter,

    pub replicated_num_bytes_total: IntCounter,
    pub replicated_num_docs_total: IntCounter,
    #[allow(dead_code)] // this really shouldn't be dead, it needs to be used somewhere
    pub queue_count: IntGauge,
}

impl Default for IngestMetrics {
    fn default() -> Self {
        let ingest_docs_bytes_total = new_counter_vec(
            "docs_bytes_total",
            "Total size of the docs ingested, measured in ingester's leader, after validation and \
             before persistence/replication",
            "ingest",
            &[],
            ["validity"],
        );
        let ingested_docs_bytes_valid = ingest_docs_bytes_total.with_label_values(["valid"]);
        let ingested_docs_bytes_invalid = ingest_docs_bytes_total.with_label_values(["invalid"]);

        let ingest_docs_total = new_counter_vec(
            "docs_total",
            "Total number of the docs ingested, measured in ingester's leader, after validation \
             and before persistence/replication",
            "ingest",
            &[],
            ["validity"],
        );
        let ingested_docs_valid = ingest_docs_total.with_label_values(["valid"]);
        let ingested_docs_invalid = ingest_docs_total.with_label_values(["invalid"]);

        IngestMetrics {
            ingested_docs_bytes_valid,
            ingested_docs_bytes_invalid,
            ingested_docs_valid,
            ingested_docs_invalid,
            replicated_num_bytes_total: new_counter(
                "replicated_num_bytes_total",
                "Total size in bytes of the replicated docs.",
                "ingest",
                &[],
            ),
            replicated_num_docs_total: new_counter(
                "replicated_num_docs_total",
                "Total number of docs replicated.",
                "ingest",
                &[],
            ),
            queue_count: new_gauge(
                "queue_count",
                "Number of queues currently active",
                "ingest",
                &[],
            ),
        }
    }
}

pub static INGEST_METRICS: Lazy<IngestMetrics> = Lazy::new(IngestMetrics::default);


================================================
FILE: quickwit/quickwit-ingest/src/mrecordlog_async.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::io;
use std::ops::RangeBounds;
use std::path::Path;

use bytes::Buf;
use mrecordlog::error::*;
use mrecordlog::{MultiRecordLog, PersistAction, PersistPolicy, Record, ResourceUsage};
use tokio::task::JoinError;
use tracing::error;

/// A light wrapper to allow async operation in mrecordlog.
pub struct MultiRecordLogAsync {
    mrecordlog_opt: Option<MultiRecordLog>,
}

impl MultiRecordLogAsync {
    fn take(&mut self) -> MultiRecordLog {
        let Some(mrecordlog) = self.mrecordlog_opt.take() else {
            error!("wal is poisoned (on write), aborting process");
            std::process::abort();
        };
        mrecordlog
    }

    fn mrecordlog_ref(&self) -> &MultiRecordLog {
        let Some(mrecordlog) = &self.mrecordlog_opt else {
            error!("wal is poisoned (on read), aborting process");
            std::process::abort();
        };
        mrecordlog
    }

    pub async fn open(directory_path: &Path) -> Result<Self, ReadRecordError> {
        Self::open_with_prefs(directory_path, PersistPolicy::Always(PersistAction::Flush)).await
    }

    pub async fn open_with_prefs(
        directory_path: &Path,
        persist_policy: PersistPolicy,
    ) -> Result<Self, ReadRecordError> {
        let directory_path = directory_path.to_path_buf();
        let mrecordlog = tokio::task::spawn(async move {
            MultiRecordLog::open_with_prefs(&directory_path, persist_policy)
        })
        .await
        .map_err(|join_err| {
            error!(error=?join_err, "failed to load WAL");
            ReadRecordError::IoError(io::Error::other("loading wal from directory failed"))
        })??;
        Ok(Self {
            mrecordlog_opt: Some(mrecordlog),
        })
    }

    async fn run_operation<F, T>(&mut self, operation: F) -> T
    where
        F: FnOnce(&mut MultiRecordLog) -> T + Send + 'static,
        T: Send + 'static,
    {
        let mut mrecordlog = self.take();
        let join_res: Result<(T, MultiRecordLog), JoinError> =
            tokio::task::spawn_blocking(move || {
                let res = operation(&mut mrecordlog);
                (res, mrecordlog)
            })
            .await;
        match join_res {
            Ok((operation_result, mrecordlog)) => {
                self.mrecordlog_opt = Some(mrecordlog);
                operation_result
            }
            Err(join_error) => {
                // This could be caused by a panic
                error!(error=?join_error, "failed to run mrecordlog operation");
                panic!("failed to run mrecordlog operation");
            }
        }
    }

    pub async fn create_queue(&mut self, queue: &str) -> Result<(), CreateQueueError> {
        let queue = queue.to_string();
        self.run_operation(move |mrecordlog| mrecordlog.create_queue(&queue))
            .await
    }

    pub async fn delete_queue(&mut self, queue: &str) -> Result<(), DeleteQueueError> {
        let queue = queue.to_string();
        self.run_operation(move |mrecordlog| mrecordlog.delete_queue(&queue))
            .await
    }

    pub async fn append_records<T: Iterator<Item = impl Buf> + Send + 'static>(
        &mut self,
        queue: &str,
        position_opt: Option<u64>,
        payloads: T,
    ) -> Result<Option<u64>, AppendError> {
        let queue = queue.to_string();
        self.run_operation(move |mrecordlog| {
            mrecordlog.append_records(&queue, position_opt, payloads)
        })
        .await
    }

    #[track_caller]
    #[cfg(test)]
    pub fn assert_records_eq<R>(
        &self,
        queue_id: &str,
        range: R,
        expected_records: &[(u64, [u8; 2], &str)],
    ) where
        R: RangeBounds<u64> + 'static,
    {
        let records = self
            .range(queue_id, range)
            .unwrap()
            .map(|Record { position, payload }| {
                let header: [u8; 2] = payload[..2].try_into().unwrap();
                let payload = String::from_utf8(payload[2..].to_vec()).unwrap();
                (position, header, payload)
            })
            .collect::<Vec<_>>();
        assert_eq!(
            records.len(),
            expected_records.len(),
            "expected {} records, got {}",
            expected_records.len(),
            records.len()
        );
        for ((position, header, payload), (expected_position, expected_header, expected_payload)) in
            records.iter().zip(expected_records.iter())
        {
            assert_eq!(
                position, expected_position,
                "expected record at position `{expected_position}`, got `{position}`",
            );
            assert_eq!(
                header, expected_header,
                "expected record header, `{expected_header:?}`, got `{header:?}`",
            );
            assert_eq!(
                payload, expected_payload,
                "expected record payload, `{expected_payload}`, got `{payload}`",
            );
        }
    }

    pub async fn truncate(&mut self, queue: &str, position: u64) -> Result<usize, TruncateError> {
        let queue = queue.to_string();
        self.run_operation(move |mrecordlog| mrecordlog.truncate(&queue, position))
            .await
    }

    pub fn range<R>(
        &self,
        queue: &str,
        range: R,
    ) -> Result<impl Iterator<Item = Record<'_>> + '_, MissingQueue>
    where
        R: RangeBounds<u64> + 'static,
    {
        self.mrecordlog_ref().range(queue, range)
    }

    pub fn queue_exists(&self, queue: &str) -> bool {
        self.mrecordlog_ref().queue_exists(queue)
    }

    pub fn list_queues(&self) -> impl Iterator<Item = &str> {
        self.mrecordlog_ref().list_queues()
    }

    pub fn last_record(&self, queue: &str) -> Result<Option<Record<'_>>, MissingQueue> {
        self.mrecordlog_ref().last_record(queue)
    }

    pub fn resource_usage(&self) -> ResourceUsage {
        self.mrecordlog_ref().resource_usage()
    }

    pub fn summary(&self) -> mrecordlog::QueuesSummary {
        self.mrecordlog_ref().summary()
    }
}


================================================
FILE: quickwit/quickwit-ingest/src/notifications.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::{HashMap, VecDeque};
use std::sync::Arc;

use tokio::sync::Mutex;

/// Registry for the index positions that are waiting to be notified when index commit occurs.
#[derive(Clone, Default)]
pub struct Notifications {
    notifications: Arc<Mutex<HashMap<String, VecDeque<Position>>>>,
}

impl Notifications {
    /// Create a new notification registry
    pub fn new() -> Self {
        Self {
            notifications: Arc::new(Mutex::new(HashMap::new())),
        }
    }

    /// Register index positions
    pub async fn register(
        &self,
        index_positions: Vec<(String, u64)>,
        notify: impl FnOnce() + Send + Sync + 'static,
    ) {
        let mut guard = self.notifications.lock().await;
        let notification = Arc::new(Notification::new(notify));
        for index_position in index_positions {
            let positions = guard
                .entry(index_position.0.clone())
                .or_insert_with(VecDeque::new);
            positions.push_back(Position {
                position: index_position.1,
                notification: notification.clone(),
            });
        }
    }

    /// Notify positions
    pub async fn notify(&self, index: &String, max_position: u64) {
        let mut map = self.notifications.lock().await;
        if let Some(positions) = map.get_mut(index) {
            while let Some(position) = positions.front() {
                if position.position <= max_position {
                    positions
                        .pop_front()
                        .unwrap()
                        .decrement_count_and_notify_if_last();
                } else {
                    break;
                }
            }
            if positions.is_empty() {
                map.remove(index);
            }
        }
    }
}

impl Notification {
    fn new(notify: impl FnOnce() + Send + Sync + 'static) -> Self {
        Self {
            notify: Box::new(notify),
        }
    }
}

struct Position {
    position: u64,
    notification: Arc<Notification>,
}

impl Position {
    /// Reduces the notification's Arc count and notifies when if self has the only pointer.
    fn decrement_count_and_notify_if_last(self) {
        // Errors are allowed here, it simply means theare are still some positions that
        // were not notified
        let _ = Arc::try_unwrap(self.notification).map(|notification| notification.notify());
    }
}

struct Notification {
    notify: Box<dyn FnOnce() + Send + Sync + 'static>,
}

impl Notification {
    fn notify(self) {
        (self.notify)();
    }
}

#[cfg(test)]
mod tests {
    use std::sync::Arc;
    use std::sync::atomic::AtomicUsize;

    use crate::notifications::Notifications;

    #[tokio::test]
    async fn test_notifications() {
        let notifications = Notifications::new();
        let cleared = Arc::new(AtomicUsize::default());
        let cleared_clone = cleared.clone();
        notifications
            .register(vec![("index1".to_string(), 10)], move || {
                assert_eq!(
                    cleared_clone.fetch_add(1, std::sync::atomic::Ordering::Relaxed),
                    0
                );
            })
            .await;
        let cleared_clone = cleared.clone();
        notifications
            .register(vec![("index2".to_string(), 10)], move || {
                assert_eq!(
                    cleared_clone.fetch_add(1, std::sync::atomic::Ordering::Relaxed),
                    1
                );
            })
            .await;
        let cleared_clone = cleared.clone();
        notifications
            .register(
                vec![("index1".to_string(), 20), ("index1".to_string(), 30)],
                move || {
                    assert_eq!(
                        cleared_clone.fetch_add(1, std::sync::atomic::Ordering::Relaxed),
                        2
                    );
                },
            )
            .await;
        assert_eq!(cleared.load(std::sync::atomic::Ordering::Relaxed), 0);
        notifications.notify(&"index1".to_string(), 20).await;
        assert_eq!(cleared.load(std::sync::atomic::Ordering::Relaxed), 1);
        notifications.notify(&"index2".to_string(), 100).await;
        assert_eq!(cleared.load(std::sync::atomic::Ordering::Relaxed), 2);
        notifications.notify(&"index1".to_string(), 100).await;
        assert_eq!(cleared.load(std::sync::atomic::Ordering::Relaxed), 3);
    }
}


================================================
FILE: quickwit/quickwit-ingest/src/position.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::fmt;

use crate::error::CorruptedKey;

#[derive(Clone, Copy, Default, Ord, PartialOrd, Eq, PartialEq)]
pub struct Position([u8; 8]);

impl TryFrom<&[u8]> for Position {
    type Error = CorruptedKey;

    fn try_from(bytes: &[u8]) -> Result<Self, CorruptedKey> {
        let bytes: [u8; 8] = bytes.try_into().map_err(|_| CorruptedKey(bytes.len()))?;
        Ok(Position(bytes))
    }
}

impl From<u64> for Position {
    fn from(num: u64) -> Self {
        Position(num.to_be_bytes())
    }
}

impl From<Position> for u64 {
    fn from(pos: Position) -> u64 {
        pos.pos_val()
    }
}

impl Position {
    fn pos_val(self) -> u64 {
        u64::from_be_bytes(self.0)
    }

    pub fn inc(&self) -> Position {
        let new_val: u64 = self.pos_val() + 1u64;
        Position::from(new_val)
    }
}

impl fmt::Debug for Position {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        f.debug_tuple("Position").field(&self.pos_val()).finish()
    }
}

impl fmt::Display for Position {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        write!(f, "#{:_>20}", self.pos_val())
    }
}

impl AsRef<[u8]> for Position {
    fn as_ref(&self) -> &[u8] {
        &self.0
    }
}

#[cfg(test)]
mod tests {
    use std::cmp::Ordering;

    use crate::Position;

    #[test]
    fn test_position_ordering_is_matching_natural_order() {
        for (lesser, greater) in (0..1_000).zip(1..1_001) {
            let lesser_pos = Position::from(lesser);
            let greater_pos = Position::from(greater);
            assert_eq!(lesser_pos.cmp(&greater_pos), Ordering::Less);
        }
    }

    #[test]
    fn test_from_to_u128() {
        let test_n = 20_220_303u64;
        let position = Position::from(test_n);
        let position_val: u64 = position.into();
        assert_eq!(test_n, position_val);
    }

    #[test]
    fn test_position_debug() {
        let test_n = 20_220_303u64;
        let position = Position::from(test_n);
        let position_str = format!("{position:?}");
        assert_eq!(position_str, "Position(20220303)");
    }

    #[test]
    fn test_position_display() {
        let test_n = 20_220_303u64;
        let position_str = Position::from(test_n).to_string();
        assert_eq!(position_str, "#____________20220303");
    }
}


================================================
FILE: quickwit/quickwit-ingest/src/queue.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::ops::Bound;
use std::path::Path;

use bytes::Buf;
use mrecordlog::error::CreateQueueError;
use mrecordlog::{Record, ResourceUsage};
use quickwit_actors::ActorContext;

use crate::mrecordlog_async::MultiRecordLogAsync;
use crate::{
    DocBatchBuilder, FetchResponse, IngestApiService, IngestServiceError, ListQueuesResponse,
};

const FETCH_PAYLOAD_LIMIT: usize = 2_000_000; // 2MB

// TODO do we need to keep this?
const QUICKWIT_CF_PREFIX: &str = ".queue_";

pub struct Queues {
    record_log: MultiRecordLogAsync,
}

impl Queues {
    pub async fn open(queues_dir_path: &Path) -> crate::Result<Queues> {
        tokio::fs::create_dir_all(queues_dir_path)
            .await
            .map_err(|error| {
                IngestServiceError::IoError(format!(
                    "failed to create WAL directory `{}`: {}",
                    queues_dir_path.display(),
                    error
                ))
            })?;
        let record_log = MultiRecordLogAsync::open(queues_dir_path).await?;
        Ok(Queues { record_log })
    }

    pub fn queue_exists(&self, queue_id: &str) -> bool {
        let real_queue_id = format!("{QUICKWIT_CF_PREFIX}{queue_id}");
        self.record_log.queue_exists(&real_queue_id)
    }

    pub async fn create_queue(
        &mut self,
        queue_id: &str,
        ctx: &ActorContext<IngestApiService>,
    ) -> crate::Result<()> {
        if self.queue_exists(queue_id) {
            return Err(crate::IngestServiceError::IndexAlreadyExists {
                index_id: queue_id.to_string(),
            });
        }
        let real_queue_id = format!("{QUICKWIT_CF_PREFIX}{queue_id}");
        ctx.protect_future(self.record_log.create_queue(&real_queue_id))
            .await
            .map_err(|e| match e {
                CreateQueueError::AlreadyExists => IngestServiceError::IndexAlreadyExists {
                    index_id: queue_id.to_owned(),
                },
                CreateQueueError::IoError(ioe) => ioe.into(),
            })?;
        Ok(())
    }

    pub async fn drop_queue(
        &mut self,
        queue_id: &str,
        ctx: &ActorContext<IngestApiService>,
    ) -> crate::Result<()> {
        let real_queue_id = format!("{QUICKWIT_CF_PREFIX}{queue_id}");
        ctx.protect_future(self.record_log.delete_queue(&real_queue_id))
            .await?;
        Ok(())
    }

    /// Suggest to truncate the queue.
    ///
    /// This function allows the queue to remove all records up to and
    /// including `up_to_offset_included`.
    ///
    /// The role of this truncation is to release memory and disk space.
    ///
    /// There are no guarantees that the record will effectively be removed.
    /// Nothing might happen, or the truncation might be partial.
    ///
    /// In other words, truncating from a position, and fetching records starting
    /// earlier than this position can yield undefined result:
    /// the truncated records may or may not be returned.
    pub async fn suggest_truncate(
        &mut self,
        queue_id: &str,
        up_to_offset_included: u64,
        ctx: &ActorContext<IngestApiService>,
    ) -> crate::Result<()> {
        let real_queue_id = format!("{QUICKWIT_CF_PREFIX}{queue_id}");

        ctx.protect_future(
            self.record_log
                .truncate(&real_queue_id, up_to_offset_included),
        )
        .await?;

        Ok(())
    }

    // Append a single record to a target queue.
    #[cfg(test)]
    async fn append(
        &mut self,
        queue_id: &str,
        record: &[u8],
        ctx: &ActorContext<IngestApiService>,
    ) -> crate::Result<Option<u64>> {
        use bytes::Bytes;

        self.append_batch(queue_id, std::iter::once(Bytes::from(record.to_vec())), ctx)
            .await
    }

    // Append a batch of records to a target queue.
    //
    // This operation is atomic: the batch of records is either entirely added or not.
    pub async fn append_batch(
        &mut self,
        queue_id: &str,
        records_it: impl Iterator<Item = impl Buf> + Send + 'static,
        ctx: &ActorContext<IngestApiService>,
    ) -> crate::Result<Option<u64>> {
        let real_queue_id = format!("{QUICKWIT_CF_PREFIX}{queue_id}");

        // TODO None means we don't have itempotent inserts
        let max_position = ctx
            .protect_future(
                self.record_log
                    .append_records(&real_queue_id, None, records_it),
            )
            .await?;

        Ok(max_position)
    }

    // Streams messages from in `]after_position, +∞[`.
    //
    // If after_position is set to None, then fetch from the start of the Stream.
    pub fn fetch(
        &self,
        queue_id: &str,
        start_after: Option<u64>,
        num_bytes_limit: Option<usize>,
    ) -> crate::Result<FetchResponse> {
        let real_queue_id = format!("{QUICKWIT_CF_PREFIX}{queue_id}");

        let starting_bound = match start_after {
            Some(pos) => Bound::Excluded(pos),
            None => Bound::Unbounded,
        };
        let records = self
            .record_log
            .range(&real_queue_id, (starting_bound, Bound::Unbounded))
            .map_err(|_| crate::IngestServiceError::IndexNotFound {
                // we want to return the queue_id, not the real_queue_id, so we can't just
                // implement From<MissingQueue>
                index_id: queue_id.to_string(),
            })?;

        let size_limit = num_bytes_limit.unwrap_or(FETCH_PAYLOAD_LIMIT);
        let mut doc_batch = DocBatchBuilder::new(queue_id.to_string());
        let mut num_bytes = 0;
        let mut first_key_opt = None;

        for Record { position, payload } in records {
            if first_key_opt.is_none() {
                first_key_opt = Some(position);
            }
            num_bytes += doc_batch.command_from_buf(payload.as_ref());
            if num_bytes > size_limit {
                break;
            }
        }

        Ok(FetchResponse {
            first_position: first_key_opt,
            doc_batch: Some(doc_batch.build()),
        })
    }

    // Streams messages from the start of the Stream.
    pub fn tail(&self, queue_id: &str) -> crate::Result<FetchResponse> {
        self.fetch(queue_id, None, None)
    }

    pub fn list_queues(&self) -> crate::Result<ListQueuesResponse> {
        Ok(ListQueuesResponse {
            queues: self
                .record_log
                .list_queues()
                .flat_map(|real_queue_id| real_queue_id.strip_prefix(QUICKWIT_CF_PREFIX))
                .map(|queue| queue.to_string())
                .collect(),
        })
    }

    pub(crate) fn resource_usage(&self) -> ResourceUsage {
        self.record_log.resource_usage()
    }
}

#[cfg(test)]
mod tests {
    use std::collections::HashSet;
    use std::ops::{Deref, DerefMut};

    use bytes::Bytes;
    use quickwit_actors::{ActorContext, Universe};
    use tokio::sync::watch;

    use super::Queues;
    use crate::IngestApiService;
    use crate::error::IngestServiceError;

    const TEST_QUEUE_ID: &str = "my-queue";
    const TEST_QUEUE_ID2: &str = "my-queue2";

    struct QueuesForTest {
        queues: Option<Queues>,
        temp_dir: tempfile::TempDir,
    }

    impl QueuesForTest {
        async fn new() -> (Self, ActorContext<IngestApiService>) {
            let temp_dir = tempfile::tempdir().unwrap();
            let mut queues_for_test = QueuesForTest {
                temp_dir,
                queues: None,
            };
            queues_for_test.reload().await;

            let universe = Universe::with_accelerated_time();
            let (source_mailbox, _source_inbox) = universe.create_test_mailbox();
            let (observable_state_tx, _observable_state_rx) = watch::channel(());
            let ctx = ActorContext::for_test(&universe, source_mailbox, observable_state_tx);
            (queues_for_test, ctx)
        }
    }

    impl QueuesForTest {
        async fn reload(&mut self) {
            std::mem::drop(self.queues.take());
            self.queues = Some(Queues::open(self.temp_dir.path()).await.unwrap());
        }

        #[track_caller]
        fn fetch_test(
            &mut self,
            queue_id: &str,
            start_after: Option<u64>,
            expected_first_pos_opt: Option<u64>,
            expected: &[&[u8]],
        ) {
            let fetch_resp = self.fetch(queue_id, start_after, None).unwrap();
            assert_eq!(fetch_resp.first_position, expected_first_pos_opt);
            let doc_batch = fetch_resp.doc_batch.unwrap();
            let records: Vec<Bytes> = doc_batch.clone().into_iter_raw().collect();
            assert_eq!(&records, expected);
        }
    }

    impl Deref for QueuesForTest {
        type Target = Queues;

        fn deref(&self) -> &Self::Target {
            self.queues.as_ref().unwrap()
        }
    }

    impl DerefMut for QueuesForTest {
        fn deref_mut(&mut self) -> &mut Self::Target {
            self.queues.as_mut().unwrap()
        }
    }

    impl Drop for QueuesForTest {
        fn drop(&mut self) {
            std::mem::drop(self.queues.take().unwrap());
        }
    }

    #[tokio::test]
    async fn test_access_queue_twice() {
        let (mut queues, ctx) = QueuesForTest::new().await;
        queues.create_queue(TEST_QUEUE_ID, &ctx).await.unwrap();
        let queue_err = queues
            .create_queue(TEST_QUEUE_ID, &ctx)
            .await
            .err()
            .unwrap();
        assert!(matches!(
            queue_err,
            IngestServiceError::IndexAlreadyExists { .. }
        ));
    }

    #[tokio::test]
    async fn test_list_queues() {
        let queue_ids = vec!["foo".to_string(), "bar".to_string(), "baz".to_string()];
        let (mut queues, ctx) = QueuesForTest::new().await;
        for queue_id in queue_ids.iter() {
            queues.create_queue(queue_id, &ctx).await.unwrap();
        }
        assert_eq!(
            HashSet::<String>::from_iter(queue_ids),
            HashSet::from_iter(queues.list_queues().unwrap().queues)
        );

        queues.drop_queue("foo", &ctx).await.unwrap();
        assert_eq!(
            HashSet::<String>::from_iter(vec!["bar".to_string(), "baz".to_string()]),
            HashSet::from_iter(queues.list_queues().unwrap().queues)
        );
    }

    #[tokio::test]
    async fn test_simple() {
        let (mut queues, ctx) = QueuesForTest::new().await;

        queues.create_queue(TEST_QUEUE_ID, &ctx).await.unwrap();
        queues
            .append_batch(
                TEST_QUEUE_ID,
                [b"hello", b"happy"].iter().map(|bytes| bytes.as_slice()),
                &ctx,
            )
            .await
            .unwrap();

        queues.reload().await;
        queues.fetch_test(
            TEST_QUEUE_ID,
            None,
            Some(0),
            &[&b"hello"[..], &b"happy"[..]],
        );

        queues.reload().await;
        queues.fetch_test(
            TEST_QUEUE_ID,
            None,
            Some(0),
            &[&b"hello"[..], &b"happy"[..]],
        );
    }

    #[tokio::test]
    async fn test_distinct_queues() {
        let (mut queues, ctx) = QueuesForTest::new().await;

        queues.create_queue(TEST_QUEUE_ID, &ctx).await.unwrap();
        queues.create_queue(TEST_QUEUE_ID2, &ctx).await.unwrap();
        queues.append(TEST_QUEUE_ID, b"hello", &ctx).await.unwrap();
        queues
            .append(TEST_QUEUE_ID2, b"hello2", &ctx)
            .await
            .unwrap();

        queues.fetch_test(TEST_QUEUE_ID, None, Some(0), &[&b"hello"[..]]);
        queues.fetch_test(TEST_QUEUE_ID2, None, Some(0), &[&b"hello2"[..]]);
    }

    #[tokio::test]
    async fn test_create_reopen() {
        let (mut queues, ctx) = QueuesForTest::new().await;
        queues.create_queue(TEST_QUEUE_ID, &ctx).await.unwrap();

        queues.reload().await;
        queues.append(TEST_QUEUE_ID, b"hello", &ctx).await.unwrap();

        queues.reload().await;
        queues.append(TEST_QUEUE_ID, b"happy", &ctx).await.unwrap();

        queues.fetch_test(
            TEST_QUEUE_ID,
            None,
            Some(0),
            &[&b"hello"[..], &b"happy"[..]],
        );
    }

    // Note this test is specific to the current implementation of truncate.
    //
    // The truncate contract is actually not as accurate as what we are testing here.
    #[tokio::test]
    async fn test_truncation() {
        let (mut queues, ctx) = QueuesForTest::new().await;
        queues.create_queue(TEST_QUEUE_ID, &ctx).await.unwrap();
        queues.append(TEST_QUEUE_ID, b"hello", &ctx).await.unwrap();
        queues.append(TEST_QUEUE_ID, b"happy", &ctx).await.unwrap();
        queues
            .suggest_truncate(TEST_QUEUE_ID, 0, &ctx)
            .await
            .unwrap();
        queues.fetch_test(TEST_QUEUE_ID, None, Some(1), &[&b"happy"[..]]);
    }

    #[tokio::test]
    async fn test_truncation_and_reload() {
        // This test makes sure that we don't reset the position counter when we truncate an entire
        // queue.
        let (mut queues, ctx) = QueuesForTest::new().await;
        queues.create_queue(TEST_QUEUE_ID, &ctx).await.unwrap();
        queues.append(TEST_QUEUE_ID, b"hello", &ctx).await.unwrap();
        queues.append(TEST_QUEUE_ID, b"happy", &ctx).await.unwrap();
        queues.reload().await;
        queues
            .suggest_truncate(TEST_QUEUE_ID, 1, &ctx)
            .await
            .unwrap();
        queues.reload().await;
        queues.append(TEST_QUEUE_ID, b"tax", &ctx).await.unwrap();
        queues.fetch_test(TEST_QUEUE_ID, Some(1), Some(2), &[&b"tax"[..]]);
    }

    struct Record {
        queue_id: String,
        payload: Vec<u8>,
    }

    #[ignore]
    #[tokio::test]
    async fn test_create_multiple_queue() {
        use std::iter::repeat_with;

        use rand::rngs::StdRng;
        use rand::{Rng, SeedableRng};
        use rand_distr::weighted::WeightedIndex;
        use rand_distr::{Distribution, LogNormal};

        const NUM_QUEUES: usize = 100;
        const NUM_RECORDS: usize = 1_000_000;

        let (_, ctx) = QueuesForTest::new().await;

        // mean 2, standard deviation 3
        let log_normal = LogNormal::new(10.0f32, 3.0f32).unwrap();
        let mut rng = StdRng::seed_from_u64(4u64);
        let queue_weights: Vec<f32> = repeat_with(|| log_normal.sample(&mut rng))
            .take(NUM_QUEUES)
            .collect();

        let dist = WeightedIndex::new(&queue_weights).unwrap();
        let record_queue_ids: Vec<usize> = repeat_with(|| dist.sample(&mut rng))
            .take(NUM_RECORDS)
            .collect();

        let records: Vec<Record> = record_queue_ids
            .into_iter()
            .map(|queue_id| {
                let num_bytes: usize = rng.random_range(80..800);
                let payload: Vec<u8> = repeat_with(rand::random::<u8>).take(num_bytes).collect();
                Record {
                    queue_id: queue_id.to_string(),
                    payload,
                }
            })
            .collect();

        let tmpdir = tempfile::tempdir_in(".").unwrap();
        let mut queues = Queues::open(tmpdir.path()).await.unwrap();
        for queue_id in 0..NUM_QUEUES {
            queues
                .create_queue(&queue_id.to_string(), &ctx)
                .await
                .unwrap();
        }
        let start = std::time::Instant::now();
        let mut num_bytes = 0;
        for record in records.iter() {
            queues
                .append(&record.queue_id, &record.payload, &ctx)
                .await
                .unwrap();
            num_bytes += record.payload.len();
        }
        let elapsed = start.elapsed();
        println!("{elapsed:?}");
        println!("{num_bytes}");
        let throughput = num_bytes as f64 / (elapsed.as_micros() as f64);
        println!("Throughput: {throughput}");
    }
}


================================================
FILE: quickwit/quickwit-integration-tests/Cargo.toml
================================================
[package]
name = "quickwit-integration-tests"
description = "Integration tests runner and repository"

version.workspace = true
edition.workspace = true
homepage.workspace = true
documentation.workspace = true
repository.workspace = true
authors.workspace = true
license.workspace = true

[features]
sqs-localstack-tests = [
    "quickwit-indexing/sqs",
    "quickwit-indexing/sqs-localstack-tests",
]

[dependencies]

[dev-dependencies]
anyhow = { workspace = true }
aws-sdk-sqs = { workspace = true }
futures-util = { workspace = true }
hyper = { workspace = true }
hyper-util = { workspace = true }
itertools = { workspace = true }
rand = { workspace = true }
reqwest = { workspace = true }
rustls = { workspace = true }
serde_json = { workspace = true }
tempfile = { workspace = true }
tokio = { workspace = true }
tonic = { workspace = true }
tracing = { workspace = true }
tracing-subscriber = { workspace = true }

quickwit-actors = { workspace = true, features = ["testsuite"] }
quickwit-cli = { workspace = true }
quickwit-common = { workspace = true, features = ["testsuite"] }
quickwit-config = { workspace = true, features = ["testsuite"] }
quickwit-indexing = { workspace = true, features = ["testsuite"] }
quickwit-metastore = { workspace = true, features = ["testsuite"] }
quickwit-opentelemetry = { workspace = true, features = ["testsuite"] }
quickwit-proto = { workspace = true, features = ["testsuite"] }
quickwit-rest-client = { workspace = true }
quickwit-serve = { workspace = true, features = ["testsuite"] }
quickwit-storage = { workspace = true, features = ["testsuite"] }


================================================
FILE: quickwit/quickwit-integration-tests/src/lib.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#![recursion_limit = "256"]

#[cfg(test)]
mod test_utils;
#[cfg(test)]
mod tests;


================================================
FILE: quickwit/quickwit-integration-tests/src/test_utils/cluster_sandbox.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::{HashMap, HashSet};
use std::io::Write;
use std::net::SocketAddr;
use std::str::FromStr;
use std::time::Duration;

use anyhow::Context;
use futures_util::future;
use itertools::Itertools;
use quickwit_actors::ActorExitStatus;
use quickwit_cli::tool::{LocalIngestDocsArgs, local_ingest_docs_cli};
use quickwit_common::new_coolid;
use quickwit_common::runtimes::RuntimesConfig;
use quickwit_common::test_utils::wait_until_predicate;
use quickwit_common::uri::Uri as QuickwitUri;
use quickwit_config::NodeConfig;
use quickwit_config::service::QuickwitService;
use quickwit_metastore::{MetastoreResolver, SplitState};
use quickwit_proto::jaeger::storage::v1::span_reader_plugin_client::SpanReaderPluginClient;
use quickwit_proto::opentelemetry::proto::collector::logs::v1::logs_service_client::LogsServiceClient;
use quickwit_proto::opentelemetry::proto::collector::trace::v1::trace_service_client::TraceServiceClient;
use quickwit_proto::types::NodeId;
use quickwit_rest_client::models::IngestSource;
use quickwit_rest_client::rest_client::{
    CommitType, DEFAULT_BASE_URL, QuickwitClient, QuickwitClientBuilder,
};
use quickwit_serve::tcp_listener::for_tests::TestTcpListenerResolver;
use quickwit_serve::{
    ListSplitsQueryParams, RestIngestResponse, SearchRequestQueryString, serve_quickwit,
};
use quickwit_storage::StorageResolver;
use reqwest::Url;
use serde_json::Value;
use tempfile::TempDir;
use tokio::net::TcpListener;
use tracing::debug;

use super::shutdown::NodeShutdownHandle;

pub struct TestNodeConfig {
    pub services: HashSet<QuickwitService>,
    pub enable_otlp: bool,
}

impl TestNodeConfig {
    async fn build_node_config(
        &self,
        node_idx: usize,
        cluster_id: String,
        temp_dir: &TempDir,
        unique_dir_name: String,
        tcp_listener_resolver: &TestTcpListenerResolver,
    ) -> NodeConfig {
        let socket: SocketAddr = ([127, 0, 0, 1], 0u16).into();
        let rest_tcp_listener = TcpListener::bind(socket).await.unwrap();
        let grpc_tcp_listener = TcpListener::bind(socket).await.unwrap();
        let mut config = NodeConfig::for_test_from_ports(
            rest_tcp_listener.local_addr().unwrap().port(),
            grpc_tcp_listener.local_addr().unwrap().port(),
        );
        tcp_listener_resolver.add_listener(rest_tcp_listener).await;
        tcp_listener_resolver.add_listener(grpc_tcp_listener).await;
        config.indexer_config.enable_otlp_endpoint = self.enable_otlp;
        config.enabled_services.clone_from(&self.services);
        config.jaeger_config.enable_endpoint = true;
        config.cluster_id.clone_from(&cluster_id);
        config.node_id = NodeId::new(format!("test-node-{node_idx}"));
        let root_data_dir = temp_dir.path().to_path_buf();
        config.data_dir_path = root_data_dir.join(config.node_id.as_str());
        config.metastore_uri =
            QuickwitUri::from_str(&format!("ram:///{unique_dir_name}/metastore")).unwrap();
        config.default_index_root_uri =
            QuickwitUri::from_str(&format!("ram:///{unique_dir_name}/indexes")).unwrap();
        config
    }
}

pub struct ClusterSandboxBuilder {
    temp_dir: TempDir,
    node_configs: Vec<TestNodeConfig>,
    use_legacy_ingest: bool,
}

impl Default for ClusterSandboxBuilder {
    fn default() -> Self {
        Self {
            temp_dir: tempfile::tempdir().unwrap(),
            node_configs: Vec::new(),
            use_legacy_ingest: false,
        }
    }
}

impl ClusterSandboxBuilder {
    pub fn add_node(mut self, services: impl IntoIterator<Item = QuickwitService>) -> Self {
        self.node_configs.push(TestNodeConfig {
            services: HashSet::from_iter(services),
            enable_otlp: false,
        });
        self
    }

    pub fn add_node_with_otlp(
        mut self,
        services: impl IntoIterator<Item = QuickwitService>,
    ) -> Self {
        self.node_configs.push(TestNodeConfig {
            services: HashSet::from_iter(services),
            enable_otlp: true,
        });
        self
    }

    pub fn use_legacy_ingest(mut self) -> Self {
        self.use_legacy_ingest = true;
        self
    }

    /// Builds a list of of [`NodeConfig`] from the node definitions added to
    /// builder. For each node, a [`NodeConfig`] is built with the right
    /// parameters such that we will be able to run `quickwit_serve` on them and
    /// form a Quickwit cluster. For each node, we set:
    /// - `data_dir_path` defined by `root_data_dir/node_id`.
    /// - `metastore_uri` defined by `root_data_dir/metastore`.
    /// - `default_index_root_uri` defined by `root_data_dir/indexes`.
    /// - `peers` defined by others nodes `gossip_advertise_addr`.
    pub async fn build_config(self) -> ResolvedClusterConfig {
        let cluster_id = new_coolid("test-cluster");
        let mut resolved_node_configs = Vec::new();
        let mut peers: Vec<String> = Vec::new();
        let unique_dir_name = new_coolid("test-dir");
        let tcp_listener_resolver = TestTcpListenerResolver::default();
        for (node_idx, node_builder) in self.node_configs.iter().enumerate() {
            let config = node_builder
                .build_node_config(
                    node_idx,
                    cluster_id.clone(),
                    &self.temp_dir,
                    unique_dir_name.clone(),
                    &tcp_listener_resolver,
                )
                .await;
            peers.push(config.gossip_advertise_addr.to_string());
            resolved_node_configs.push((config, node_builder.services.clone()));
        }
        for node_config in resolved_node_configs.iter_mut() {
            node_config.0.peer_seeds = peers
                .clone()
                .into_iter()
                .filter(|seed| *seed != node_config.0.gossip_advertise_addr.to_string())
                .collect_vec();
        }
        ResolvedClusterConfig {
            cluster_id,
            temp_dir: self.temp_dir,
            unique_dir_name,
            node_configs: resolved_node_configs,
            tcp_listener_resolver,
        }
    }

    /// Builds the cluster config, starts the nodes and waits for them to be ready
    pub async fn build_and_start(self) -> ClusterSandbox {
        self.build_config().await.start().await
    }

    pub async fn build_and_start_standalone() -> ClusterSandbox {
        ClusterSandboxBuilder::default()
            .add_node(QuickwitService::supported_services())
            .build_config()
            .await
            .start()
            .await
    }
}

/// Intermediate state where the ports of all the test cluster nodes have
/// been reserved and the configurations have been generated.
pub struct ResolvedClusterConfig {
    cluster_id: String,
    temp_dir: TempDir,
    unique_dir_name: String,
    pub node_configs: Vec<(NodeConfig, HashSet<QuickwitService>)>,
    tcp_listener_resolver: TestTcpListenerResolver,
}

impl ResolvedClusterConfig {
    /// Start a cluster using this config and waits for the nodes to be ready
    pub async fn start(self) -> ClusterSandbox {
        quickwit_cli::install_default_crypto_ring_provider();

        let mut sandbox = ClusterSandbox {
            cluster_id: self.cluster_id,
            node_configs: Vec::new(),
            temp_dir: self.temp_dir,
            unique_dir_name: self.unique_dir_name,
            node_shutdown_handles: Vec::new(),
            tcp_listener_resolver: self.tcp_listener_resolver,
            storage_resolver: StorageResolver::unconfigured(),
            metastore_resolver: MetastoreResolver::unconfigured(),
        };
        for (config, services) in &self.node_configs {
            sandbox.spawn_node(config.clone(), services.clone());
        }
        sandbox.node_configs = self.node_configs;
        sandbox
            .wait_for_cluster_num_ready_nodes(sandbox.node_configs.len())
            .await
            .unwrap();
        sandbox
    }
}

fn transport_url(addr: SocketAddr, tls: bool) -> Url {
    let mut url = Url::parse(DEFAULT_BASE_URL).unwrap();
    url.set_ip_host(addr.ip()).unwrap();
    url.set_port(Some(addr.port())).unwrap();
    if tls {
        url.set_scheme("https").unwrap();
    }
    url
}

#[macro_export]
macro_rules! ingest_json {
    ($($json:tt)+) => {
        quickwit_rest_client::models::IngestSource::Str(json!($($json)+).to_string())
    };
}

pub(crate) async fn ingest(
    client: &QuickwitClient,
    index_id: &str,
    ingest_source: IngestSource,
    commit_type: CommitType,
) -> anyhow::Result<RestIngestResponse> {
    let resp = client
        .ingest(index_id, ingest_source, None, None, commit_type)
        .await?;
    Ok(resp)
}

/// A test environment where you can start a Quickwit cluster and use the gRPC
/// or REST clients to test it.
pub struct ClusterSandbox {
    cluster_id: String,
    pub node_configs: Vec<(NodeConfig, HashSet<QuickwitService>)>,
    unique_dir_name: String,
    temp_dir: TempDir,
    node_shutdown_handles: Vec<NodeShutdownHandle>,
    tcp_listener_resolver: TestTcpListenerResolver,
    storage_resolver: StorageResolver,
    metastore_resolver: MetastoreResolver,
}

impl ClusterSandbox {
    fn spawn_node(&mut self, config: NodeConfig, services: HashSet<QuickwitService>) {
        let mut shutdown_handle = NodeShutdownHandle::new(config.node_id.clone(), services.clone());
        let shutdown_signal = shutdown_handle.shutdown_signal();
        let runtimes_config = RuntimesConfig::light_for_tests();
        let join_handle = tokio::spawn({
            let node_id = config.node_id.clone();
            let metastore_resolver = self.metastore_resolver.clone();
            let storage_resolver = self.storage_resolver.clone();
            let tcp_listener_resolver = self.tcp_listener_resolver.clone();
            async move {
                let result = serve_quickwit(
                    config,
                    runtimes_config,
                    metastore_resolver,
                    storage_resolver,
                    tcp_listener_resolver,
                    shutdown_signal,
                    quickwit_serve::do_nothing_env_filter_reload_fn(),
                )
                .await?;
                debug!("{node_id} stopped successfully ({services:?})");
                Result::<_, anyhow::Error>::Ok(result)
            }
        });
        shutdown_handle.set_node_join_handle(join_handle);
        self.node_shutdown_handles.push(shutdown_handle);
    }

    /// Dynamically adds a node to the cluster. Does not wait for readiness.
    pub async fn add_node(&mut self, services: impl IntoIterator<Item = QuickwitService>) {
        self.add_node_inner(TestNodeConfig {
            services: HashSet::from_iter(services),
            enable_otlp: false,
        })
        .await;
    }

    async fn add_node_inner(&mut self, config_builder: TestNodeConfig) {
        let mut config = config_builder
            .build_node_config(
                self.node_configs.len() + 1,
                self.cluster_id.clone(),
                &self.temp_dir,
                self.unique_dir_name.clone(),
                &self.tcp_listener_resolver,
            )
            .await;
        config.peer_seeds = self
            .node_configs
            .iter()
            .map(|config| config.0.gossip_advertise_addr.to_string())
            .collect_vec();
        self.spawn_node(config.clone(), config_builder.services.clone());
        self.node_configs
            .push((config, config_builder.services.clone()));
    }

    fn find_node_for_service(&self, service: QuickwitService) -> NodeConfig {
        self.node_configs
            .iter()
            .find(|config| config.1.contains(&service))
            .unwrap_or_else(|| panic!("No {service:?} node"))
            .0
            .clone()
    }

    fn channel(&self, service: QuickwitService) -> tonic::transport::Channel {
        let node_config = self.find_node_for_service(service);
        let endpoint = format!("http://{}", node_config.grpc_listen_addr);
        tonic::transport::Channel::from_shared(endpoint)
            .unwrap()
            .connect_lazy()
    }

    /// Returns a client to one of the nodes that runs the specified service
    pub fn rest_client(&self, service: QuickwitService) -> QuickwitClient {
        let node_config = self.find_node_for_service(service);

        let certificate = if let Some(tls_conf) = &node_config.rest_config.tls {
            let cert_bytes = std::fs::read(&tls_conf.ca_path).unwrap();
            Some(reqwest::tls::Certificate::from_pem(&cert_bytes).unwrap())
        } else {
            None
        };

        QuickwitClientBuilder::new(transport_url(
            node_config.rest_config.listen_addr,
            certificate.is_some(),
        ))
        .set_tls_ca(certificate)
        .build()
    }

    /// A client configured to ingest documents and return detailed parse failures.
    pub fn detailed_ingest_client(&self) -> QuickwitClient {
        let node_config = self.find_node_for_service(QuickwitService::Indexer);

        let certificate = if let Some(tls_conf) = &node_config.rest_config.tls {
            let cert_bytes = std::fs::read(&tls_conf.ca_path).unwrap();
            Some(reqwest::tls::Certificate::from_pem(&cert_bytes).unwrap())
        } else {
            None
        };

        QuickwitClientBuilder::new(transport_url(
            node_config.rest_config.listen_addr,
            certificate.is_some(),
        ))
        .set_tls_ca(certificate)
        .detailed_response(true)
        .build()
    }

    // TODO(#5604)
    pub fn rest_client_legacy_indexer(&self) -> QuickwitClient {
        let node_config = self.find_node_for_service(QuickwitService::Indexer);

        let certificate = if let Some(tls_conf) = &node_config.rest_config.tls {
            let cert_bytes = std::fs::read(&tls_conf.ca_path).unwrap();
            Some(reqwest::tls::Certificate::from_pem(&cert_bytes).unwrap())
        } else {
            None
        };

        QuickwitClientBuilder::new(transport_url(
            node_config.rest_config.listen_addr,
            certificate.is_some(),
        ))
        .set_tls_ca(certificate)
        .use_legacy_ingest(true)
        .build()
    }

    pub fn jaeger_client(&self) -> SpanReaderPluginClient<tonic::transport::Channel> {
        SpanReaderPluginClient::new(self.channel(QuickwitService::Searcher))
    }

    pub fn logs_client(&self) -> LogsServiceClient<tonic::transport::Channel> {
        LogsServiceClient::new(self.channel(QuickwitService::Indexer))
    }

    pub fn trace_client(&self) -> TraceServiceClient<tonic::transport::Channel> {
        TraceServiceClient::new(self.channel(QuickwitService::Indexer))
    }

    pub async fn wait_for_cluster_num_ready_nodes(
        &self,
        expected_num_ready_nodes: usize,
    ) -> anyhow::Result<()> {
        wait_until_predicate(
            || async move {
                match self
                    .rest_client(QuickwitService::Metastore)
                    .cluster()
                    .snapshot()
                    .await
                {
                    Ok(result) => {
                        if result.ready_nodes.len() != expected_num_ready_nodes {
                            debug!(
                                "wait_for_cluster_num_ready_nodes expected {} ready nodes, got {}",
                                expected_num_ready_nodes,
                                result.live_nodes.len()
                            );
                            false
                        } else {
                            true
                        }
                    }
                    Err(err) => {
                        debug!("wait_for_cluster_num_ready_nodes error {err}");
                        false
                    }
                }
            },
            Duration::from_secs(10),
            Duration::from_millis(100),
        )
        .await?;
        Ok(())
    }

    /// Waits for the needed number of indexing pipeline to start.
    ///
    /// WARNING! does not work if multiple indexers are running
    pub async fn wait_for_indexing_pipelines(
        &self,
        required_pipeline_num: usize,
    ) -> anyhow::Result<()> {
        wait_until_predicate(
            || async move {
                match self
                    .rest_client(QuickwitService::Indexer)
                    .node_stats()
                    .indexing()
                    .await
                {
                    Ok(result) => {
                        if result.num_running_pipelines != required_pipeline_num {
                            debug!(
                                "wait_for_indexing_pipelines expected {} pipelines, got {}",
                                required_pipeline_num, result.num_running_pipelines
                            );
                            false
                        } else {
                            true
                        }
                    }
                    Err(err) => {
                        debug!("wait_for_cluster_num_ready_nodes error {err}");
                        false
                    }
                }
            },
            Duration::from_secs(10),
            Duration::from_millis(100),
        )
        .await?;
        Ok(())
    }

    // Waits for the needed number of indexing pipeline to start.
    pub async fn wait_for_splits(
        &self,
        index_id: &str,
        split_states_filter: Option<Vec<SplitState>>,
        required_splits_num: usize,
    ) -> anyhow::Result<()> {
        wait_until_predicate(
            || {
                let splits_query_params = ListSplitsQueryParams {
                    split_states: split_states_filter.clone(),
                    ..Default::default()
                };
                async move {
                    match self
                        .rest_client(QuickwitService::Metastore)
                        .splits(index_id)
                        .list(splits_query_params)
                        .await
                    {
                        Ok(result) => {
                            if result.len() != required_splits_num {
                                debug!(
                                    "wait_for_splits expected {} splits, got {}",
                                    required_splits_num,
                                    result.len()
                                );
                                false
                            } else {
                                true
                            }
                        }
                        Err(err) => {
                            debug!("wait_for_splits error {err}");
                            false
                        }
                    }
                }
            },
            Duration::from_secs(15),
            Duration::from_millis(500),
        )
        .await?;
        Ok(())
    }

    pub async fn local_ingest(&self, index_id: &str, json_data: &[Value]) -> anyhow::Result<()> {
        let test_conf = self
            .node_configs
            .iter()
            .find(|config| config.1.contains(&QuickwitService::Indexer))
            .ok_or(anyhow::anyhow!("No indexer node found"))?;
        // NodeConfig cannot be serialized, we write our own simplified config
        let mut tmp_config_file = tempfile::Builder::new().suffix(".yaml").tempfile().unwrap();
        // we suffix data_dir with a random slug to save us from multiple local ingestion trying to
        // concurrently do something, and cleanup the directory to start a new ingestion.
        let data_dir = test_conf
            .0
            .data_dir_path
            .join(rand::random::<u64>().to_string());
        tokio::fs::create_dir(&data_dir).await?;
        let node_config = format!(
            r#"
                version: 0.8
                metastore_uri: {}
                data_dir: {:?}
                "#,
            test_conf.0.metastore_uri, data_dir
        );
        tmp_config_file.write_all(node_config.as_bytes())?;
        tmp_config_file.flush()?;

        let mut tmp_data_file = tempfile::NamedTempFile::new().unwrap();
        for line in json_data {
            serde_json::to_writer(&mut tmp_data_file, line)?;
            tmp_data_file.write_all(b"\n")?;
        }
        tmp_data_file.flush()?;

        local_ingest_docs_cli(LocalIngestDocsArgs {
            clear_cache: false,
            config_uri: QuickwitUri::from_str(tmp_config_file.path().to_str().unwrap())?,
            index_id: index_id.to_string(),
            input_format: quickwit_config::SourceInputFormat::Json,
            overwrite: false,
            vrl_script: None,
            input_path_opt: Some(QuickwitUri::from_str(
                tmp_data_file
                    .path()
                    .to_str()
                    .context("temp path could not be converted to URI")?,
            )?),
        })
        .await?;
        Ok(())
    }

    pub async fn assert_hit_count(&self, index_id: &str, query: &str, expected_num_hits: u64) {
        let search_response = self
            .rest_client(QuickwitService::Searcher)
            .search(
                index_id,
                SearchRequestQueryString {
                    query: query.to_string(),
                    max_hits: 10,
                    ..Default::default()
                },
            )
            .await
            .unwrap();
        debug!(
            "search response for query {} on index {index_id}: {:?}",
            query, search_response
        );
        assert_eq!(
            search_response.num_hits, expected_num_hits,
            "unexpected num_hits for query {query}"
        );
    }

    /// Shutdown nodes that only provide the specified services
    pub async fn shutdown_services(
        &mut self,
        shutdown_services: impl IntoIterator<Item = QuickwitService>,
    ) -> Result<Vec<HashMap<String, ActorExitStatus>>, anyhow::Error> {
        // We need to drop rest clients first because reqwest can hold connections open
        // preventing rest server's graceful shutdown.
        let mut indexer_shutdown_futures = Vec::new();
        let mut other_shutdown_futures = Vec::new();
        let mut shutdown_nodes = HashMap::new();
        let mut i = 0;
        let shutdown_services_map = HashSet::from_iter(shutdown_services);
        while i < self.node_shutdown_handles.len() {
            let handler_services = &self.node_shutdown_handles[i].node_services;
            if !handler_services.is_subset(&shutdown_services_map) {
                i += 1;
                continue;
            }
            let handler_to_shutdown = self.node_shutdown_handles.remove(i);
            shutdown_nodes.insert(
                handler_to_shutdown.node_id.clone(),
                handler_to_shutdown.node_services.clone(),
            );
            if handler_to_shutdown
                .node_services
                .contains(&QuickwitService::Indexer)
            {
                indexer_shutdown_futures.push(handler_to_shutdown.shutdown());
            } else {
                other_shutdown_futures.push(handler_to_shutdown.shutdown());
            }
        }
        debug!("shutting down {:?}", shutdown_nodes);
        // We must decommision the indexer nodes first and independently from the other nodes.
        let indexer_shutdown_results = future::join_all(indexer_shutdown_futures).await;
        let other_shutdown_results = future::join_all(other_shutdown_futures).await;
        let exit_statuses = indexer_shutdown_results
            .into_iter()
            .chain(other_shutdown_results)
            .collect::<Result<Vec<_>, _>>()?;
        Ok(exit_statuses)
    }

    pub async fn shutdown(
        mut self,
    ) -> Result<Vec<HashMap<String, ActorExitStatus>>, anyhow::Error> {
        self.shutdown_services(QuickwitService::supported_services())
            .await
    }

    /// Remove a node from the sandbox and return its shutdown handle.
    /// After this call, `rest_client` and other lookup methods skip the removed
    /// node, so callers can trigger shutdown concurrently with other sandbox
    /// operations.
    pub fn remove_node_with_service(&mut self, service: QuickwitService) -> NodeShutdownHandle {
        let idx = self
            .node_shutdown_handles
            .iter()
            .position(|h| h.node_services.contains(&service))
            .unwrap_or_else(|| panic!("no node with service {service:?}"));
        self.node_configs.remove(idx);
        self.node_shutdown_handles.remove(idx)
    }
}

/// We don't usually test the tests, but the complexity of the sandbox setup code justifies it here.
#[tokio::test]
async fn test_sandbox_happy_path() {
    let sandbox = ClusterSandboxBuilder::default()
        .add_node([QuickwitService::ControlPlane, QuickwitService::Metastore])
        .add_node([QuickwitService::Searcher])
        .add_node([QuickwitService::Indexer])
        .build_and_start()
        .await;

    sandbox.wait_for_cluster_num_ready_nodes(3).await.unwrap();
    sandbox.shutdown().await.unwrap();
}

#[tokio::test]
async fn test_sandbox_add_node_dynamically() {
    let mut sandbox = ClusterSandboxBuilder::default()
        .add_node([QuickwitService::ControlPlane, QuickwitService::Metastore])
        .add_node([QuickwitService::Searcher])
        .build_and_start()
        .await;
    sandbox.wait_for_cluster_num_ready_nodes(2).await.unwrap();

    // Later, add an indexer node to the running cluster
    sandbox.add_node([QuickwitService::Indexer]).await;

    sandbox.wait_for_cluster_num_ready_nodes(3).await.unwrap();
    sandbox.shutdown().await.unwrap();
}


================================================
FILE: quickwit/quickwit-integration-tests/src/test_utils/mod.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

mod cluster_sandbox;
mod shutdown;

pub(crate) use cluster_sandbox::{ClusterSandbox, ClusterSandboxBuilder, ingest};


================================================
FILE: quickwit/quickwit-integration-tests/src/test_utils/shutdown.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::{HashMap, HashSet};

use quickwit_actors::ActorExitStatus;
use quickwit_common::tower::BoxFutureInfaillible;
use quickwit_config::service::QuickwitService;
use quickwit_proto::types::NodeId;
use tokio::sync::watch::{self, Receiver, Sender};
use tokio::task::JoinHandle;

type NodeJoinHandle = JoinHandle<Result<HashMap<String, ActorExitStatus>, anyhow::Error>>;

pub(crate) struct NodeShutdownHandle {
    sender: Sender<()>,
    receiver: Receiver<()>,
    pub node_services: HashSet<QuickwitService>,
    pub node_id: NodeId,
    join_handle_opt: Option<NodeJoinHandle>,
}

impl NodeShutdownHandle {
    pub(crate) fn new(node_id: NodeId, node_services: HashSet<QuickwitService>) -> Self {
        let (sender, receiver) = watch::channel(());
        Self {
            sender,
            receiver,
            node_id,
            node_services,
            join_handle_opt: None,
        }
    }

    pub(crate) fn shutdown_signal(&self) -> BoxFutureInfaillible<()> {
        let receiver = self.receiver.clone();
        Box::pin(async move {
            receiver.clone().changed().await.unwrap();
        })
    }

    pub(crate) fn set_node_join_handle(&mut self, join_handle: NodeJoinHandle) {
        self.join_handle_opt = Some(join_handle);
    }

    /// Initiate node shutdown and wait for it to complete
    pub(crate) async fn shutdown(
        self,
    ) -> anyhow::Result<HashMap<std::string::String, ActorExitStatus>> {
        self.sender.send(()).unwrap();
        self.join_handle_opt
            .expect("node join handle was not set before shutdown")
            .await
            .unwrap()
    }
}


================================================
FILE: quickwit/quickwit-integration-tests/src/tests/basic_tests.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::time::Duration;

use hyper::{Method, Request, StatusCode};
use hyper_util::rt::TokioExecutor;
use quickwit_config::service::QuickwitService;
use quickwit_serve::SearchRequestQueryString;

use crate::test_utils::ClusterSandboxBuilder;

#[tokio::test]
async fn test_ui_redirect_on_get() {
    quickwit_common::setup_logging_for_tests();
    let sandbox = ClusterSandboxBuilder::build_and_start_standalone().await;
    let node_config = sandbox.node_configs.first().unwrap();
    let client = hyper_util::client::legacy::Client::builder(TokioExecutor::new())
        .pool_idle_timeout(Duration::from_secs(30))
        .http2_only(true)
        .build_http();
    let root_uri = format!("http://{}/", node_config.0.rest_config.listen_addr)
        .parse::<hyper::Uri>()
        .unwrap();
    let response = client.get(root_uri.clone()).await.unwrap();
    assert_eq!(response.status(), StatusCode::MOVED_PERMANENTLY);
    let post_request = Request::builder()
        .uri(root_uri)
        .method(Method::POST)
        .body("{}".to_string())
        .unwrap();
    let response = client.request(post_request).await.unwrap();
    assert_eq!(response.status(), StatusCode::METHOD_NOT_ALLOWED);
    sandbox.shutdown().await.unwrap();
}

#[tokio::test]
async fn test_standalone_server() {
    quickwit_common::setup_logging_for_tests();
    let sandbox = ClusterSandboxBuilder::build_and_start_standalone().await;
    {
        // The indexing service should be running.
        let counters = sandbox
            .rest_client(QuickwitService::Indexer)
            .node_stats()
            .indexing()
            .await
            .unwrap();
        assert_eq!(counters.num_running_pipelines, 0);
    }

    {
        // Create an dynamic index.
        sandbox
            .rest_client(QuickwitService::Indexer)
            .indexes()
            .create(
                r#"
                version: 0.8
                index_id: my-new-index
                doc_mapping:
                  field_mappings:
                  - name: body
                    type: text
                "#,
                quickwit_config::ConfigFormat::Yaml,
                false,
            )
            .await
            .unwrap();

        // Index should be searchable
        assert_eq!(
            sandbox
                .rest_client(QuickwitService::Indexer)
                .search(
                    "my-new-index",
                    SearchRequestQueryString {
                        query: "body:test".to_string(),
                        max_hits: 10,
                        ..Default::default()
                    },
                )
                .await
                .unwrap()
                .num_hits,
            0
        );
        sandbox.wait_for_indexing_pipelines(1).await.unwrap();
    }
    sandbox.shutdown().await.unwrap();
}

#[tokio::test]
async fn test_multi_nodes_cluster() {
    quickwit_common::setup_logging_for_tests();
    let sandbox = ClusterSandboxBuilder::default()
        .add_node([QuickwitService::Searcher])
        .add_node([QuickwitService::Metastore])
        .add_node([QuickwitService::Indexer])
        .add_node([QuickwitService::ControlPlane])
        .add_node([QuickwitService::Janitor])
        .build_and_start()
        .await;

    sandbox
        .rest_client(QuickwitService::Indexer)
        .indexes()
        .create(
            r#"
            version: 0.8
            index_id: my-new-multi-node-index
            doc_mapping:
              field_mappings:
              - name: body
                type: text
            indexing_settings:
              commit_timeout_secs: 1
            "#,
            quickwit_config::ConfigFormat::Yaml,
            false,
        )
        .await
        .unwrap();

    assert!(
        sandbox
            .rest_client(QuickwitService::Indexer)
            .node_health()
            .is_live()
            .await
            .unwrap()
    );

    // Assert that at least 1 indexing pipelines is successfully started
    sandbox.wait_for_indexing_pipelines(1).await.unwrap();

    // Check that search is working
    let search_response_empty = sandbox
        .rest_client(QuickwitService::Searcher)
        .search(
            "my-new-multi-node-index",
            SearchRequestQueryString {
                query: "body:bar".to_string(),
                ..Default::default()
            },
        )
        .await
        .unwrap();
    assert_eq!(search_response_empty.num_hits, 0);

    sandbox.shutdown().await.unwrap();
}


================================================
FILE: quickwit/quickwit-integration-tests/src/tests/ingest_v1_tests.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use quickwit_config::ConfigFormat;
use quickwit_config::service::QuickwitService;
use quickwit_metastore::SplitState;
use quickwit_rest_client::rest_client::CommitType;
use serde_json::json;

use crate::ingest_json;
use crate::test_utils::{ClusterSandboxBuilder, ingest};

// TODO(#5604)

/// This tests checks our happy path for ingesting one doc.
#[tokio::test]
async fn test_ingest_v1_happy_path() {
    let sandbox = ClusterSandboxBuilder::default()
        .use_legacy_ingest()
        .add_node([QuickwitService::Indexer])
        .add_node([QuickwitService::Searcher])
        .add_node([
            QuickwitService::ControlPlane,
            QuickwitService::Janitor,
            QuickwitService::Metastore,
        ])
        .build_and_start()
        .await;

    let index_id = "test-ingest-v1-happy-path";
    let index_config = format!(
        r#"
        version: 0.8
        index_id: {index_id}
        doc_mapping:
            field_mappings:
            - name: body
              type: text
        indexing_settings:
            commit_timeout_secs: 1
        "#
    );
    let indexer_client = sandbox.rest_client_legacy_indexer();
    indexer_client
        .indexes()
        .create(index_config, ConfigFormat::Yaml, false)
        .await
        .unwrap();

    ingest(
        &indexer_client,
        index_id,
        ingest_json!({"body": "my-doc"}),
        CommitType::Auto,
    )
    .await
    .unwrap();

    sandbox
        .wait_for_splits(index_id, Some(vec![SplitState::Published]), 1)
        .await
        .unwrap();

    sandbox.assert_hit_count(index_id, "*", 1).await;

    // Delete the index to avoid potential hanging on shutdown #5068
    indexer_client
        .indexes()
        .delete(index_id, false)
        .await
        .unwrap();

    sandbox.shutdown().await.unwrap();
}


================================================
FILE: quickwit/quickwit-integration-tests/src/tests/ingest_v2_tests.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::time::Duration;

use futures_util::FutureExt;
use itertools::Itertools;
use quickwit_common::test_utils::wait_until_predicate;
use quickwit_config::ConfigFormat;
use quickwit_config::service::QuickwitService;
use quickwit_indexing::actors::INDEXING_DIR_NAME;
use quickwit_metastore::SplitState;
use quickwit_proto::ingest::ParseFailureReason;
use quickwit_rest_client::error::{ApiError, Error};
use quickwit_rest_client::models::IngestSource;
use quickwit_rest_client::rest_client::CommitType;
use quickwit_serve::{ListSplitsQueryParams, RestIngestResponse, RestParseFailure};
use serde_json::json;

use crate::ingest_json;
use crate::test_utils::{ClusterSandboxBuilder, ingest};

/// Ingesting on a freshly re-created index sometimes fails, see #5430
#[tokio::test]
#[ignore]
async fn test_ingest_recreated_index() {
    let sandbox = ClusterSandboxBuilder::build_and_start_standalone().await;
    let index_id = "test-ingest-recreated-index";
    let index_config = format!(
        r#"
            version: 0.8
            index_id: {index_id}
            doc_mapping:
                field_mappings:
                - name: body
                  type: text
            indexing_settings:
                commit_timeout_secs: 1
                merge_policy:
                    type: stable_log
                    merge_factor: 3
                    max_merge_factor: 3
            "#
    );
    let current_index_metadata = sandbox
        .rest_client(QuickwitService::Indexer)
        .indexes()
        .create(index_config.clone(), ConfigFormat::Yaml, false)
        .await
        .unwrap();

    ingest(
        &sandbox.rest_client(QuickwitService::Indexer),
        index_id,
        ingest_json!({"body": "first record"}),
        CommitType::Force,
    )
    .await
    .unwrap();

    sandbox
        .wait_for_splits(index_id, Some(vec![SplitState::Published]), 1)
        .await
        .unwrap();

    sandbox
        .rest_client(QuickwitService::Indexer)
        .indexes()
        .delete(index_id, false)
        .await
        .unwrap();

    // Recreate the index and start ingesting into it again

    let new_index_metadata = sandbox
        .rest_client(QuickwitService::Indexer)
        .indexes()
        .create(index_config, ConfigFormat::Yaml, false)
        .await
        .unwrap();

    assert_ne!(
        current_index_metadata.index_uid.incarnation_id,
        new_index_metadata.index_uid.incarnation_id
    );

    ingest(
        &sandbox.rest_client(QuickwitService::Indexer),
        index_id,
        ingest_json!({"body": "second record"}),
        CommitType::Force,
    )
    .await
    .unwrap();

    sandbox
        .wait_for_splits(index_id, Some(vec![SplitState::Published]), 1)
        .await
        .unwrap();

    ingest(
        &sandbox.rest_client(QuickwitService::Indexer),
        index_id,
        ingest_json!({"body": "third record"}),
        CommitType::Force,
    )
    .await
    .unwrap();

    sandbox
        .wait_for_splits(index_id, Some(vec![SplitState::Published]), 2)
        .await
        .unwrap();

    ingest(
        &sandbox.rest_client(QuickwitService::Indexer),
        index_id,
        ingest_json!({"body": "fourth record"}),
        CommitType::Force,
    )
    .await
    .unwrap();

    sandbox
        .wait_for_splits(index_id, Some(vec![SplitState::Published]), 3)
        .await
        .unwrap();

    sandbox.assert_hit_count(index_id, "body:record", 3).await;

    // Wait for splits to merge, since we created 3 splits and merge factor is 3,
    // we should get 1 published split with no staged splits eventually.
    sandbox
        .wait_for_splits(
            index_id,
            Some(vec![SplitState::Published, SplitState::Staged]),
            1,
        )
        .await
        .unwrap();

    // Delete the index to avoid potential hanging on shutdown #5068
    sandbox
        .rest_client(QuickwitService::Indexer)
        .indexes()
        .delete(index_id, false)
        .await
        .unwrap();

    sandbox.shutdown().await.unwrap();
}

/// Indexing directory is not cleaned up after deleting an index, see #5436
#[tokio::test]
#[ignore]
async fn test_indexing_directory_cleanup() {
    let sandbox = ClusterSandboxBuilder::build_and_start_standalone().await;
    let index_id = "test-ingest-directory-cleanup";
    let index_config = format!(
        r#"
            version: 0.8
            index_id: {index_id}
            doc_mapping:
                field_mappings:
                - name: body
                  type: text
            indexing_settings:
                commit_timeout_secs: 1
                merge_policy:
                    type: stable_log
                    merge_factor: 3
                    max_merge_factor: 3
            "#
    );
    sandbox
        .rest_client(QuickwitService::Indexer)
        .indexes()
        .create(index_config.clone(), ConfigFormat::Yaml, false)
        .await
        .unwrap();

    ingest(
        &sandbox.rest_client(QuickwitService::Indexer),
        index_id,
        ingest_json!({"body": "first record"}),
        CommitType::Force,
    )
    .await
    .unwrap();

    sandbox
        .wait_for_splits(index_id, Some(vec![SplitState::Published]), 1)
        .await
        .unwrap();

    sandbox
        .rest_client(QuickwitService::Indexer)
        .indexes()
        .delete(index_id, false)
        .await
        .unwrap();

    // The index is deleted so the `indexing` directory should be cleaned up
    let data_dir_path = &sandbox.node_configs.first().unwrap().0.data_dir_path;
    let indexing_dir_path = data_dir_path.join(INDEXING_DIR_NAME);
    wait_until_predicate(
        || async {
            let indexing_dir_entries = indexing_dir_path.read_dir().unwrap().collect_vec();
            indexing_dir_entries.is_empty()
        },
        Duration::from_secs(100),
        Duration::from_millis(500),
    )
    .await
    .unwrap();

    sandbox.shutdown().await.unwrap();
}

/// This tests checks what happens when we try to ingest into a non-existing index.
#[tokio::test]
async fn test_ingest_v2_index_not_found() {
    let sandbox = ClusterSandboxBuilder::default()
        .add_node([QuickwitService::Indexer, QuickwitService::Janitor])
        .add_node([QuickwitService::Indexer, QuickwitService::Janitor])
        .add_node([
            QuickwitService::ControlPlane,
            QuickwitService::Metastore,
            QuickwitService::Searcher,
        ])
        .build_and_start()
        .await;
    let missing_index_err: Error = sandbox
        .rest_client(QuickwitService::Indexer)
        .ingest(
            "missing_index",
            ingest_json!({"body": "doc1"}),
            None,
            None,
            CommitType::Auto,
        )
        .await
        .unwrap_err();
    let Error::Api(ApiError { message, code }) = missing_index_err else {
        panic!("Expected an API error.");
    };
    assert_eq!(code, 404u16);
    let error_message = message.unwrap();
    assert_eq!(error_message, "index `missing_index` not found");
    sandbox.shutdown().await.unwrap();
}

/// This tests checks our happy path for ingesting one doc.
#[tokio::test]
async fn test_ingest_v2_happy_path() {
    let sandbox = ClusterSandboxBuilder::default()
        .add_node([QuickwitService::Indexer, QuickwitService::Janitor])
        .add_node([QuickwitService::Indexer, QuickwitService::Janitor])
        .add_node([
            QuickwitService::ControlPlane,
            QuickwitService::Metastore,
            QuickwitService::Searcher,
        ])
        .build_and_start()
        .await;
    let index_id = "test_happy_path";
    let index_config = format!(
        r#"
        version: 0.8
        index_id: {index_id}
        doc_mapping:
            field_mappings:
            - name: body
              type: text
        indexing_settings:
            commit_timeout_secs: 1
        "#
    );
    sandbox
        .rest_client(QuickwitService::Indexer)
        .indexes()
        .create(index_config, ConfigFormat::Yaml, false)
        .await
        .unwrap();

    let ingest_resp = ingest(
        &sandbox.rest_client(QuickwitService::Indexer),
        index_id,
        ingest_json!({"body": "doc1"}),
        CommitType::Auto,
    )
    .await
    .unwrap();
    assert_eq!(
        ingest_resp,
        RestIngestResponse {
            num_docs_for_processing: 1,
            num_ingested_docs: Some(1),
            num_rejected_docs: Some(0),
            parse_failures: None,
        },
    );

    sandbox
        .wait_for_splits(index_id, Some(vec![SplitState::Published]), 1)
        .await
        .unwrap();

    sandbox.assert_hit_count(index_id, "*", 1).await;

    // Delete the index to avoid potential hanging on shutdown #5068
    sandbox
        .rest_client(QuickwitService::Indexer)
        .indexes()
        .delete(index_id, false)
        .await
        .unwrap();

    sandbox.shutdown().await.unwrap();
}

#[tokio::test]
async fn test_commit_force() {
    let sandbox = ClusterSandboxBuilder::build_and_start_standalone().await;
    let index_id = "test_commit_force";
    let index_config = format!(
        r#"
        version: 0.8
        index_id: {index_id}
        doc_mapping:
            field_mappings:
            - name: body
              type: text
        indexing_settings:
            commit_timeout_secs: 60
        "#
    );

    sandbox
        .rest_client(QuickwitService::Indexer)
        .indexes()
        .create(index_config, ConfigFormat::Yaml, false)
        .await
        .unwrap();

    // commit_timeout_secs is set to a large value, so this would timeout if
    // the commit isn't forced
    let ingest_resp = tokio::time::timeout(
        Duration::from_secs(20),
        ingest(
            &sandbox.rest_client(QuickwitService::Indexer),
            index_id,
            ingest_json!({"body": "force"}),
            CommitType::Force,
        ),
    )
    .await
    .unwrap()
    .unwrap();
    assert_eq!(
        ingest_resp,
        RestIngestResponse {
            num_docs_for_processing: 1,
            num_ingested_docs: Some(1),
            num_rejected_docs: Some(0),
            parse_failures: None,
        },
    );

    sandbox.assert_hit_count(index_id, "body:force", 1).await;

    // Delete the index to avoid waiting for the commit timeout on shutdown #5068
    sandbox
        .rest_client(QuickwitService::Indexer)
        .indexes()
        .delete(index_id, false)
        .await
        .unwrap();

    sandbox.shutdown().await.unwrap();
}

#[tokio::test]
async fn test_commit_wait_for() {
    let sandbox = ClusterSandboxBuilder::build_and_start_standalone().await;
    let index_id = "test_commit_wait_for";
    let index_config = format!(
        r#"
        version: 0.8
        index_id: {index_id}
        doc_mapping:
            field_mappings:
            - name: body 
              type: text
        indexing_settings:
            commit_timeout_secs: 3
        "#
    );

    // Create index
    sandbox
        .rest_client(QuickwitService::Indexer)
        .indexes()
        .create(index_config, ConfigFormat::Yaml, false)
        .await
        .unwrap();

    // run 2 ingest requests at the same time on the same index
    // wait_for shouldn't force the commit so expect only 1 published split
    let client = sandbox.rest_client(QuickwitService::Indexer);
    let ingest_1_fut = client
        .ingest(
            index_id,
            ingest_json!({"body": "wait for"}),
            None,
            None,
            CommitType::WaitFor,
        )
        .then(|res| async {
            let ingest_resp = res.unwrap();
            sandbox.assert_hit_count(index_id, "body:for", 1).await;
            ingest_resp
        });

    let ingest_2_fut = client
        .ingest(
            index_id,
            ingest_json!({"body": "wait again"}),
            None,
            None,
            CommitType::WaitFor,
        )
        .then(|res| async {
            let ingest_resp = res.unwrap();
            sandbox.assert_hit_count(index_id, "body:again", 1).await;
            ingest_resp
        });

    let (ingest_resp_1, ingest_resp_2) = tokio::join!(ingest_1_fut, ingest_2_fut);
    assert_eq!(
        ingest_resp_1,
        RestIngestResponse {
            num_docs_for_processing: 1,
            num_ingested_docs: Some(1),
            num_rejected_docs: Some(0),
            parse_failures: None,
        },
    );
    assert_eq!(
        ingest_resp_2,
        RestIngestResponse {
            num_docs_for_processing: 1,
            num_ingested_docs: Some(1),
            num_rejected_docs: Some(0),
            parse_failures: None,
        },
    );

    sandbox.assert_hit_count(index_id, "body:wait", 2).await;

    let splits_query_params = ListSplitsQueryParams {
        split_states: Some(vec![SplitState::Published]),
        ..Default::default()
    };
    let published_splits = sandbox
        .rest_client(QuickwitService::Indexer)
        .splits(index_id)
        .list(splits_query_params)
        .await
        .unwrap();
    assert_eq!(published_splits.len(), 1);

    sandbox.shutdown().await.unwrap();
}

#[tokio::test]
async fn test_commit_auto() {
    let sandbox = ClusterSandboxBuilder::build_and_start_standalone().await;
    let index_id = "test_commit_auto";
    let index_config = format!(
        r#"
        version: 0.8
        index_id: {index_id}
        doc_mapping:
            field_mappings:
            - name: body
              type: text
        indexing_settings:
            commit_timeout_secs: 2
        "#
    );

    sandbox
        .rest_client(QuickwitService::Indexer)
        .indexes()
        .create(index_config, ConfigFormat::Yaml, false)
        .await
        .unwrap();

    let ingest_resp = sandbox
        .rest_client(QuickwitService::Indexer)
        .ingest(
            index_id,
            ingest_json!({"body": "auto"}),
            None,
            None,
            CommitType::Auto,
        )
        .await
        .unwrap();
    assert_eq!(
        ingest_resp,
        RestIngestResponse {
            num_docs_for_processing: 1,
            num_ingested_docs: Some(1),
            num_rejected_docs: Some(0),
            parse_failures: None,
        },
    );

    sandbox.assert_hit_count(index_id, "body:auto", 0).await;

    sandbox
        .wait_for_splits(index_id, Some(vec![SplitState::Published]), 1)
        .await
        .unwrap();

    sandbox.assert_hit_count(index_id, "body:auto", 1).await;

    sandbox.shutdown().await.unwrap();
}

#[tokio::test]
async fn test_detailed_ingest_response() {
    let sandbox = ClusterSandboxBuilder::build_and_start_standalone().await;
    let index_id = "test_detailed_ingest_response";
    let index_config = format!(
        r#"
        version: 0.8
        index_id: {index_id}
        doc_mapping:
            field_mappings:
            - name: body
              type: text
        indexing_settings:
            commit_timeout_secs: 1
        "#
    );
    sandbox
        .rest_client(QuickwitService::Indexer)
        .indexes()
        .create(index_config, ConfigFormat::Yaml, false)
        .await
        .unwrap();

    let ingest_resp = ingest(
        &sandbox.detailed_ingest_client(),
        index_id,
        IngestSource::Str("{\"body\":\"hello\"}\naouch!".to_string()),
        CommitType::Auto,
    )
    .await
    .unwrap();

    assert_eq!(
        ingest_resp,
        RestIngestResponse {
            num_docs_for_processing: 2,
            num_ingested_docs: Some(1),
            num_rejected_docs: Some(1),
            parse_failures: Some(vec![RestParseFailure {
                document: "aouch!".to_string(),
                message: "failed to parse JSON document".to_string(),
                reason: ParseFailureReason::InvalidJson,
            }]),
        },
    );
    sandbox.shutdown().await.unwrap();
}

#[tokio::test]
async fn test_very_large_index_name() {
    let sandbox = ClusterSandboxBuilder::default()
        .add_node([QuickwitService::Searcher])
        .add_node([QuickwitService::Metastore])
        .add_node([QuickwitService::Indexer])
        .add_node([QuickwitService::ControlPlane])
        .add_node([QuickwitService::Janitor])
        .build_and_start()
        .await;

    let acceptable_index_id = "its_very_very_very_very_very_very_very_very_very_very_very_\
    very_very_very_very_very_very_very_very_very_very_very_very_very_very_very_\
    very_very_very_very_very_very_very_very_very_very_very_very_very_very_very_\
    very_very_very_very_very_very_index_large_name";
    assert_eq!(acceptable_index_id.len(), 255);
    let oversized_index_id = format!("{acceptable_index_id}1");

    sandbox
        .rest_client(QuickwitService::Indexer)
        .indexes()
        .create(
            format!(
                r#"
                version: 0.8
                index_id: {acceptable_index_id}
                doc_mapping:
                  field_mappings:
                    - name: body
                      type: text
                indexing_settings:
                    commit_timeout_secs: 1
                "#,
            ),
            ConfigFormat::Yaml,
            false,
        )
        .await
        .unwrap();

    ingest(
        &sandbox.rest_client(QuickwitService::Indexer),
        acceptable_index_id,
        ingest_json!({"body": "not too long"}),
        CommitType::Auto,
    )
    .await
    .unwrap();

    sandbox
        .wait_for_splits(acceptable_index_id, Some(vec![SplitState::Published]), 1)
        .await
        .unwrap();

    sandbox
        .assert_hit_count(acceptable_index_id, "body:long", 1)
        .await;

    // Delete the index to avoid potential hanging on shutdown #5068
    sandbox
        .rest_client(QuickwitService::Indexer)
        .indexes()
        .delete(acceptable_index_id, false)
        .await
        .unwrap();

    let error = sandbox
        .rest_client(QuickwitService::Indexer)
        .indexes()
        .create(
            format!(
                r#"
                version: 0.8
                index_id: {oversized_index_id}
                doc_mapping:
                    field_mappings:
                    - name: body
                      type: text
                indexing_settings:
                    commit_timeout_secs: 1
                "#,
            ),
            ConfigFormat::Yaml,
            false,
        )
        .await
        .unwrap_err();

    assert!(error.to_string().ends_with(
        "is invalid: identifiers must match the following regular expression: \
         `^[a-zA-Z][a-zA-Z0-9-_\\.]{2,254}$`)"
    ));

    sandbox.shutdown().await.unwrap();
}

#[tokio::test]
async fn test_shutdown_single_node() {
    let sandbox = ClusterSandboxBuilder::build_and_start_standalone().await;
    let index_id = "test_shutdown_single_node";

    sandbox
        .rest_client(QuickwitService::Indexer)
        .indexes()
        .create(
            format!(
                r#"
            version: 0.8
            index_id: {index_id}
            doc_mapping:
              field_mappings:
              - name: body
                type: text
            indexing_settings:
              commit_timeout_secs: 1
            "#
            ),
            ConfigFormat::Yaml,
            false,
        )
        .await
        .unwrap();

    ingest(
        &sandbox.rest_client(QuickwitService::Indexer),
        index_id,
        ingest_json!({"body": "one"}),
        CommitType::Force,
    )
    .await
    .unwrap();

    sandbox
        .rest_client(QuickwitService::Indexer)
        .ingest(
            index_id,
            ingest_json!({"body": "two"}),
            None,
            None,
            CommitType::Force,
        )
        .await
        .unwrap();

    tokio::time::timeout(Duration::from_secs(10), sandbox.shutdown())
        .await
        .unwrap()
        .unwrap();
}

#[tokio::test]
async fn test_shutdown_control_plane_first() {
    let mut sandbox = ClusterSandboxBuilder::default()
        .add_node([QuickwitService::Indexer])
        .add_node([
            QuickwitService::ControlPlane,
            QuickwitService::Searcher,
            QuickwitService::Metastore,
            QuickwitService::Janitor,
        ])
        .build_and_start()
        .await;
    let index_id = "test_shutdown_control_plane_first";

    // Create index
    sandbox
        .rest_client(QuickwitService::Indexer)
        .indexes()
        .create(
            format!(
                r#"
            version: 0.8
            index_id: {index_id}
            doc_mapping:
              field_mappings:
              - name: body
                type: text
            indexing_settings:
              commit_timeout_secs: 1
            "#
            ),
            ConfigFormat::Yaml,
            false,
        )
        .await
        .unwrap();

    ingest(
        &sandbox.rest_client(QuickwitService::Indexer),
        index_id,
        ingest_json!({"body": "one"}),
        CommitType::Force,
    )
    .await
    .unwrap();

    sandbox
        .shutdown_services([
            QuickwitService::ControlPlane,
            QuickwitService::Searcher,
            QuickwitService::Metastore,
            QuickwitService::Janitor,
        ])
        .await
        .unwrap();

    // The indexer hangs on shutdown because it cannot commit the shard EOF
    tokio::time::timeout(Duration::from_secs(5), sandbox.shutdown())
        .await
        .unwrap_err();
}

#[tokio::test]
async fn test_shutdown_indexer_first() {
    let mut sandbox = ClusterSandboxBuilder::default()
        .add_node([QuickwitService::Indexer])
        .add_node([
            QuickwitService::ControlPlane,
            QuickwitService::Searcher,
            QuickwitService::Metastore,
            QuickwitService::Janitor,
        ])
        .build_and_start()
        .await;
    let index_id = "test_shutdown_indexer_first";

    sandbox
        .rest_client(QuickwitService::Indexer)
        .indexes()
        .create(
            format!(
                r#"
            version: 0.8
            index_id: {index_id}
            doc_mapping:
              field_mappings:
              - name: body
                type: text
            indexing_settings:
              commit_timeout_secs: 1
            "#
            ),
            ConfigFormat::Yaml,
            false,
        )
        .await
        .unwrap();

    ingest(
        &sandbox.rest_client(QuickwitService::Indexer),
        index_id,
        ingest_json!({"body": "one"}),
        CommitType::Force,
    )
    .await
    .unwrap();

    sandbox
        .shutdown_services([QuickwitService::Indexer])
        .await
        .unwrap();

    tokio::time::timeout(Duration::from_secs(5), sandbox.shutdown())
        .await
        .unwrap()
        .unwrap();
}

/// Tests that the graceful shutdown sequence works correctly in a multi-indexer
/// cluster: shutting down one indexer does NOT cause 500 errors or data loss,
/// and the cluster eventually rebalances. see #6158
///
/// We start with a single indexer so the shard for this index is guaranteed to
/// live on it. After ingesting, we dynamically add a second indexer, then shut
/// down the first one. This proves the decommission sequence correctly drains
/// in-flight data even when the shard owner is the node being removed.
#[tokio::test]
async fn test_graceful_shutdown_no_data_loss() {
    let mut sandbox = ClusterSandboxBuilder::default()
        .add_node([QuickwitService::Indexer])
        .add_node([
            QuickwitService::ControlPlane,
            QuickwitService::Searcher,
            QuickwitService::Metastore,
            QuickwitService::Janitor,
        ])
        .build_and_start()
        .await;
    let index_id = "test_graceful_shutdown_no_data_loss";

    // Create index with a long commit timeout so documents stay uncommitted
    // in the ingesters' WAL. The decommission sequence should commit
    // them before the indexer quits.
    sandbox
        .rest_client(QuickwitService::Indexer)
        .indexes()
        .create(
            format!(
                r#"
            version: 0.8
            index_id: {index_id}
            doc_mapping:
              field_mappings:
              - name: body
                type: text
            indexing_settings:
              commit_timeout_secs: 5
            "#
            ),
            ConfigFormat::Yaml,
            false,
        )
        .await
        .unwrap();

    // Ingest docs with auto-commit. With a 5s commit timeout, these documents
    // sit uncommitted in the ingesters' WAL - exactly the in-flight state we
    // want to exercise during draining.
    ingest(
        &sandbox.rest_client(QuickwitService::Indexer),
        index_id,
        ingest_json!({"body": "before-shutdown-1"}),
        CommitType::Auto,
    )
    .await
    .unwrap();

    ingest(
        &sandbox.rest_client(QuickwitService::Indexer),
        index_id,
        ingest_json!({"body": "before-shutdown-2"}),
        CommitType::Auto,
    )
    .await
    .unwrap();

    // Add a second indexer after the shard has been created on the first one.
    sandbox.add_node([QuickwitService::Indexer]).await;
    sandbox.wait_for_cluster_num_ready_nodes(3).await.unwrap();

    // Remove the first indexer (the shard owner) from the sandbox and get its
    // shutdown handle. After this call, rest_client(Indexer) returns the
    // second (surviving) indexer.
    let shutdown_handle = sandbox.remove_node_with_service(QuickwitService::Indexer);

    // Concurrently: shut down the removed indexer AND ingest more data via the
    // surviving indexer. This verifies the cluster stays operational and the
    // router on the surviving node does not return 500 errors while one indexer
    // is decommissioning. The control plane excludes the decommissioning
    // ingester from shard allocation, so new shards go to the surviving one.
    let ingest_client = sandbox.rest_client(QuickwitService::Indexer);
    let (shutdown_result, ingest_result) = tokio::join!(
        async {
            tokio::time::timeout(Duration::from_secs(30), shutdown_handle.shutdown())
                .await
                .expect("indexer shutdown timed out — decommission may be stuck")
        },
        async {
            // Small delay so the decommission sequence has started before we ingest.
            tokio::time::sleep(Duration::from_millis(200)).await;
            ingest(
                &ingest_client,
                index_id,
                ingest_json!({"body": "during-shutdown"}),
                CommitType::Auto,
            )
            .await
        },
    );
    shutdown_result.expect("indexer shutdown failed");
    ingest_result.expect("ingest during shutdown should succeed (no 500 errors)");

    // All 3 documents should eventually be searchable. Documents 1 & 2 were
    // in-flight on the decommissioning indexer and should have been committed during
    // the decommission step. Document 3 was ingested to the surviving indexer.
    wait_until_predicate(
        || async {
            match sandbox
                .rest_client(QuickwitService::Searcher)
                .search(
                    index_id,
                    quickwit_serve::SearchRequestQueryString {
                        query: "*".to_string(),
                        max_hits: 10,
                        ..Default::default()
                    },
                )
                .await
            {
                Ok(resp) => resp.num_hits == 3,
                Err(_) => false,
            }
        },
        Duration::from_secs(30),
        Duration::from_millis(500),
    )
    .await
    .expect("expected 3 documents after decommission shutdown, some data may have been lost");

    // Verify the cluster sees 2 ready nodes (the surviving indexer + the
    // control-plane/searcher/metastore/janitor node).
    sandbox
        .wait_for_cluster_num_ready_nodes(2)
        .await
        .expect("cluster should see 2 ready nodes after indexer shutdown");

    // Clean shutdown of the remaining nodes.
    tokio::time::timeout(Duration::from_secs(30), sandbox.shutdown())
        .await
        .unwrap()
        .unwrap();
}


================================================
FILE: quickwit/quickwit-integration-tests/src/tests/mod.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

mod basic_tests;
mod ingest_v1_tests;
mod ingest_v2_tests;
mod no_cp_tests;
mod otlp_tests;
#[cfg(feature = "sqs-localstack-tests")]
mod sqs_tests;
mod tls_tests;
mod update_tests;


================================================
FILE: quickwit/quickwit-integration-tests/src/tests/no_cp_tests.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

//! Tests for cluster configurations without a control plane.

use quickwit_config::ConfigFormat;
use quickwit_config::service::QuickwitService;
use quickwit_rest_client::error::{ApiError, Error as RestClientError};
use quickwit_serve::SearchRequestQueryString;

use crate::test_utils::ClusterSandboxBuilder;

fn initialize_tests() {
    // SAFETY: this test may not be entirely sound if not run with nextest or --test-threads=1
    // as this is only a test, and it would be extremly inconvenient to run it in a different way,
    // we are keeping it that way

    quickwit_common::setup_logging_for_tests();
    unsafe { std::env::set_var("QW_ENABLE_INGEST_V2", "true") };
}

#[tokio::test]
async fn test_search_after_control_plane_shutdown() {
    initialize_tests();
    let mut sandbox = ClusterSandboxBuilder::default()
        .add_node([QuickwitService::ControlPlane])
        .add_node([QuickwitService::Metastore])
        .add_node([QuickwitService::Searcher])
        .build_and_start()
        .await;
    let index_id = "test-search-after-control-plane-shutdown";
    let index_config = format!(
        r#"
            version: 0.8
            index_id: {index_id}
            doc_mapping:
                field_mappings:
                - name: body
                  type: text
            indexing_settings:
                commit_timeout_secs: 1
            "#
    );

    sandbox
        .rest_client(QuickwitService::Metastore)
        .indexes()
        .create(index_config.clone(), ConfigFormat::Yaml, false)
        .await
        .unwrap();

    sandbox
        .shutdown_services([QuickwitService::ControlPlane])
        .await
        .unwrap();

    sandbox.assert_hit_count(index_id, "", 0).await;

    sandbox.shutdown().await.unwrap();
}

#[tokio::test]
async fn test_searcher_and_metastore_without_control_plane() {
    initialize_tests();
    let sandbox = ClusterSandboxBuilder::default()
        .add_node([QuickwitService::Metastore])
        .add_node([QuickwitService::Searcher])
        .build_and_start()
        .await;

    // we cannot create an actual index without control plane

    let search_error = sandbox
        .rest_client(QuickwitService::Searcher)
        .search(
            "does-not-exist",
            SearchRequestQueryString {
                query: String::new(),
                max_hits: 10,
                ..Default::default()
            },
        )
        .await
        .unwrap_err();

    if let RestClientError::Api(ApiError { message, code }) = search_error {
        assert_eq!(
            message.unwrap(),
            "could not find indexes matching the IDs `[\"does-not-exist\"]`"
        );
        assert_eq!(code.as_u16(), 404);
    } else {
        panic!("unexpected error: {search_error:?}");
    }

    sandbox.shutdown().await.unwrap();
}

#[tokio::test]
#[should_panic]
async fn test_indexer_fails_without_control_plane() {
    initialize_tests();
    let sandbox = ClusterSandboxBuilder::default()
        .add_node([QuickwitService::Metastore])
        .add_node([QuickwitService::Indexer, QuickwitService::Searcher])
        .build_and_start()
        .await;

    let _ = sandbox.shutdown().await;
}


================================================
FILE: quickwit/quickwit-integration-tests/src/tests/otlp_tests.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::HashMap;

use futures_util::StreamExt;
use quickwit_config::service::QuickwitService;
use quickwit_metastore::SplitState;
use quickwit_opentelemetry::otlp::{
    OTEL_LOGS_INDEX_ID, OTEL_TRACES_INDEX_ID, make_resource_spans_for_test,
};
use quickwit_proto::jaeger::storage::v1::{
    FindTraceIDsRequest, GetOperationsRequest, GetServicesRequest, GetTraceRequest, Operation,
    SpansResponseChunk, TraceQueryParameters,
};
use quickwit_proto::opentelemetry::proto::collector::logs::v1::ExportLogsServiceRequest;
use quickwit_proto::opentelemetry::proto::collector::trace::v1::ExportTraceServiceRequest;
use quickwit_proto::opentelemetry::proto::common::v1::AnyValue;
use quickwit_proto::opentelemetry::proto::common::v1::any_value::Value;
use quickwit_proto::opentelemetry::proto::logs::v1::{LogRecord, ResourceLogs, ScopeLogs};
use quickwit_proto::opentelemetry::proto::trace::v1::{ResourceSpans, ScopeSpans, Span};
use tonic::codec::CompressionEncoding;

use crate::test_utils::ClusterSandboxBuilder;

fn initialize_tests() {
    // SAFETY: this test may not be entirely sound if not run with nextest or --test-threads=1
    // as this is only a test, and it would be extremly inconvenient to run it in a different way,
    // we are keeping it that way

    quickwit_common::setup_logging_for_tests();
    unsafe { std::env::set_var("QW_ENABLE_INGEST_V2", "true") };
}

#[tokio::test]
async fn test_ingest_traces_with_otlp_grpc_api() {
    initialize_tests();
    let mut sandbox = ClusterSandboxBuilder::default()
        .add_node([QuickwitService::Searcher])
        .add_node([QuickwitService::Metastore])
        .add_node_with_otlp([QuickwitService::Indexer])
        .add_node([QuickwitService::ControlPlane])
        .add_node([QuickwitService::Janitor])
        .build_and_start()
        .await;
    // Wait for the pipelines to start (one for logs and one for traces)
    sandbox.wait_for_indexing_pipelines(2).await.unwrap();

    fn build_span(span_name: String) -> Vec<ResourceSpans> {
        let scope_spans = vec![ScopeSpans {
            spans: vec![Span {
                name: span_name,
                trace_id: vec![1; 16],
                span_id: vec![2; 8],
                start_time_unix_nano: 1724060143000000001,
                end_time_unix_nano: 1724060144000000000,
                ..Default::default()
            }],
            ..Default::default()
        }];
        vec![ResourceSpans {
            scope_spans,
            ..Default::default()
        }]
    }

    // Send the spans on the default index
    let tested_clients = vec![
        sandbox.trace_client().clone(),
        sandbox
            .trace_client()
            .clone()
            .send_compressed(CompressionEncoding::Gzip),
    ];
    for (idx, mut tested_client) in tested_clients.into_iter().enumerate() {
        let body = format!("hello{idx}");
        let request = ExportTraceServiceRequest {
            resource_spans: build_span(body.clone()),
        };
        let response = tested_client.export(request).await.unwrap();
        assert_eq!(
            response
                .into_inner()
                .partial_success
                .unwrap()
                .rejected_spans,
            0
        );
        sandbox
            .wait_for_splits(
                OTEL_TRACES_INDEX_ID,
                Some(vec![SplitState::Published]),
                idx + 1,
            )
            .await
            .unwrap();
        sandbox
            .assert_hit_count(OTEL_TRACES_INDEX_ID, &format!("span_name:{body}"), 1)
            .await;
    }

    // Send the spans on a non existing index, should return an error.
    {
        let request = ExportTraceServiceRequest {
            resource_spans: build_span("hello".to_string()),
        };
        let mut tonic_request = tonic::Request::new(request);
        tonic_request.metadata_mut().insert(
            "qw-otel-traces-index",
            tonic::metadata::MetadataValue::try_from("non-existing-index").unwrap(),
        );
        let status = sandbox
            .trace_client()
            .clone()
            .export(tonic_request)
            .await
            .unwrap_err();
        assert_eq!(status.code(), tonic::Code::NotFound);
    }

    sandbox
        .shutdown_services([QuickwitService::Indexer])
        .await
        .unwrap();
    sandbox.shutdown().await.unwrap();
}

#[tokio::test]
async fn test_ingest_logs_with_otlp_grpc_api() {
    initialize_tests();
    let mut sandbox = ClusterSandboxBuilder::default()
        .add_node([QuickwitService::Searcher])
        .add_node([QuickwitService::Metastore])
        .add_node_with_otlp([QuickwitService::Indexer])
        .add_node([QuickwitService::ControlPlane])
        .add_node([QuickwitService::Janitor])
        .build_and_start()
        .await;
    // Wait fo the pipelines to start (one for logs and one for traces)
    sandbox.wait_for_indexing_pipelines(2).await.unwrap();

    fn build_log(body: String) -> Vec<ResourceLogs> {
        let log_record = LogRecord {
            time_unix_nano: 1724060143000000001,
            body: Some(AnyValue {
                value: Some(Value::StringValue(body)),
            }),
            ..Default::default()
        };
        let scope_logs = ScopeLogs {
            log_records: vec![log_record],
            ..Default::default()
        };
        vec![ResourceLogs {
            scope_logs: vec![scope_logs],
            ..Default::default()
        }]
    }

    // Send the logs on the default index
    let tested_clients = vec![
        sandbox.logs_client().clone(),
        sandbox
            .logs_client()
            .clone()
            .send_compressed(CompressionEncoding::Gzip),
    ];
    for (idx, mut tested_client) in tested_clients.into_iter().enumerate() {
        let body: String = format!("hello{idx}");
        let request = ExportLogsServiceRequest {
            resource_logs: build_log(body.clone()),
        };
        let response = tested_client.export(request).await.unwrap();
        assert_eq!(
            response
                .into_inner()
                .partial_success
                .unwrap()
                .rejected_log_records,
            0
        );
        sandbox
            .wait_for_splits(
                OTEL_LOGS_INDEX_ID,
                Some(vec![SplitState::Published]),
                idx + 1,
            )
            .await
            .unwrap();
        sandbox
            .assert_hit_count(OTEL_LOGS_INDEX_ID, &format!("body.message:{body}"), 1)
            .await;
    }

    sandbox
        .shutdown_services([QuickwitService::Indexer])
        .await
        .unwrap();
    sandbox.shutdown().await.unwrap();
}

#[tokio::test]
async fn test_jaeger_api() {
    initialize_tests();
    let mut sandbox = ClusterSandboxBuilder::default()
        .add_node([QuickwitService::Searcher])
        .add_node([QuickwitService::Metastore])
        .add_node_with_otlp([QuickwitService::Indexer])
        .add_node([QuickwitService::ControlPlane])
        .add_node([QuickwitService::Janitor])
        .build_and_start()
        .await;
    // Wait fo the pipelines to start (one for logs and one for traces)
    sandbox.wait_for_indexing_pipelines(2).await.unwrap();

    let export_trace_request = ExportTraceServiceRequest {
        resource_spans: make_resource_spans_for_test(),
    };
    sandbox
        .trace_client()
        .export(export_trace_request)
        .await
        .unwrap();

    sandbox
        .wait_for_splits(OTEL_TRACES_INDEX_ID, Some(vec![SplitState::Published]), 1)
        .await
        .unwrap();

    sandbox
        .shutdown_services([QuickwitService::Indexer])
        .await
        .unwrap();

    {
        // Test `GetServices`
        let get_services_request = GetServicesRequest {};
        let get_services_response = sandbox
            .jaeger_client()
            .get_services(tonic::Request::new(get_services_request))
            .await
            .unwrap()
            .into_inner();
        assert_eq!(get_services_response.services, &["quickwit"]);
    }
    {
        // Test `GetOperations`
        let get_operations_request = GetOperationsRequest {
            service: "quickwit".to_string(),
            span_kind: "".to_string(),
        };
        let get_operations_response = sandbox
            .jaeger_client()
            .get_operations(tonic::Request::new(get_operations_request))
            .await
            .unwrap()
            .into_inner();
        assert_eq!(get_operations_response.operations.len(), 4);
        assert_eq!(
            get_operations_response.operations,
            vec![
                Operation {
                    name: "delete_splits".to_string(),
                    span_kind: "client".to_string(),
                },
                Operation {
                    name: "list_splits".to_string(),
                    span_kind: "client".to_string(),
                },
                Operation {
                    name: "publish_splits".to_string(),
                    span_kind: "server".to_string(),
                },
                Operation {
                    name: "stage_splits".to_string(),
                    span_kind: "internal".to_string(),
                }
            ]
        );

        let get_operations_request = GetOperationsRequest {
            service: "quickwit".to_string(),
            span_kind: "server".to_string(),
        };
        let get_operations_response = sandbox
            .jaeger_client()
            .get_operations(tonic::Request::new(get_operations_request))
            .await
            .unwrap()
            .into_inner();
        assert_eq!(get_operations_response.operations.len(), 1);
        assert_eq!(
            get_operations_response.operations,
            vec![Operation {
                name: "publish_splits".to_string(),
                span_kind: "server".to_string(),
            },]
        );
    }
    {
        // Test `FindTraceIds`
        // TODO: Increase comprehensiveness of this test.
        // Search by service and operation name.
        let query = TraceQueryParameters {
            service_name: "quickwit".to_string(),
            operation_name: "stage_splits".to_string(),
            tags: HashMap::new(),
            start_time_min: None,
            start_time_max: None,
            duration_min: None,
            duration_max: None,
            num_traces: 10,
        };
        let find_trace_ids_request = FindTraceIDsRequest { query: Some(query) };
        let find_trace_ids_response = sandbox
            .jaeger_client()
            .find_trace_i_ds(tonic::Request::new(find_trace_ids_request))
            .await
            .unwrap()
            .into_inner();
        assert_eq!(find_trace_ids_response.trace_ids.len(), 1);
        assert_eq!(find_trace_ids_response.trace_ids[0], [1; 16]);

        // Search by service name, operation name, and span attribute.
        let query = TraceQueryParameters {
            service_name: "quickwit".to_string(),
            operation_name: "list_splits".to_string(),
            tags: HashMap::from([("span_key".to_string(), "span_value".to_string())]),
            start_time_min: None,
            start_time_max: None,
            duration_min: None,
            duration_max: None,
            num_traces: 10,
        };
        let find_trace_ids_request = FindTraceIDsRequest { query: Some(query) };
        let find_trace_ids_response = sandbox
            .jaeger_client()
            .find_trace_i_ds(tonic::Request::new(find_trace_ids_request))
            .await
            .unwrap()
            .into_inner();
        assert_eq!(find_trace_ids_response.trace_ids.len(), 1);
        assert_eq!(find_trace_ids_response.trace_ids[0], [3; 16]);

        // Search by service name, operation name, and event attribute.
        let query = TraceQueryParameters {
            service_name: "quickwit".to_string(),
            operation_name: "delete_splits".to_string(),
            tags: HashMap::from([("event_key".to_string(), "event_value".to_string())]),
            start_time_min: None,
            start_time_max: None,
            duration_min: None,
            duration_max: None,
            num_traces: 10,
        };
        let find_trace_ids_request = FindTraceIDsRequest { query: Some(query) };
        let find_trace_ids_response = sandbox
            .jaeger_client()
            .find_trace_i_ds(tonic::Request::new(find_trace_ids_request))
            .await
            .unwrap()
            .into_inner();
        assert_eq!(find_trace_ids_response.trace_ids.len(), 1);
        assert_eq!(find_trace_ids_response.trace_ids[0], [5; 16]);

        // Search traces with an error.
        let query = TraceQueryParameters {
            service_name: "quickwit".to_string(),
            operation_name: "list_splits".to_string(),
            tags: HashMap::from([("error".to_string(), "true".to_string())]),
            start_time_min: None,
            start_time_max: None,
            duration_min: None,
            duration_max: None,
            num_traces: 10,
        };
        let find_trace_ids_request = FindTraceIDsRequest { query: Some(query) };
        let find_trace_ids_response = sandbox
            .jaeger_client()
            .find_trace_i_ds(tonic::Request::new(find_trace_ids_request))
            .await
            .unwrap()
            .into_inner();
        assert_eq!(find_trace_ids_response.trace_ids.len(), 1);
        assert_eq!(find_trace_ids_response.trace_ids[0], [4; 16]);

        // Search traces without an error.
        let query = TraceQueryParameters {
            service_name: "quickwit".to_string(),
            operation_name: "list_splits".to_string(),
            tags: HashMap::from([("error".to_string(), "false".to_string())]),
            start_time_min: None,
            start_time_max: None,
            duration_min: None,
            duration_max: None,
            num_traces: 10,
        };
        let find_trace_ids_request = FindTraceIDsRequest { query: Some(query) };
        let find_trace_ids_response = sandbox
            .jaeger_client()
            .find_trace_i_ds(tonic::Request::new(find_trace_ids_request))
            .await
            .unwrap()
            .into_inner();
        assert_eq!(find_trace_ids_response.trace_ids.len(), 1);
        assert_eq!(find_trace_ids_response.trace_ids[0], [3; 16]);
    }
    {
        // Test `GetTrace`
        let get_trace_request = GetTraceRequest {
            trace_id: [1; 16].to_vec(),
        };
        let mut span_stream = sandbox
            .jaeger_client()
            .get_trace(tonic::Request::new(get_trace_request))
            .await
            .unwrap()
            .into_inner();
        let SpansResponseChunk { spans } = span_stream.next().await.unwrap().unwrap();
        assert_eq!(spans.len(), 1);

        let span: &quickwit_proto::jaeger::api_v2::Span = &spans[0];
        assert_eq!(span.operation_name, "stage_splits");

        let process = span.process.as_ref().unwrap();
        assert_eq!(process.tags.len(), 1);
        assert_eq!(process.tags[0].key, "tags");
        assert_eq!(process.tags[0].v_str, r#"["foo"]"#);
    }
    sandbox.shutdown().await.unwrap();
}


================================================
FILE: quickwit/quickwit-integration-tests/src/tests/sqs_tests.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::io::Write;
use std::iter;
use std::str::FromStr;
use std::time::Duration;

use aws_sdk_sqs::types::QueueAttributeName;
use quickwit_common::test_utils::wait_until_predicate;
use quickwit_common::uri::Uri;
use quickwit_config::ConfigFormat;
use quickwit_config::service::QuickwitService;
use quickwit_indexing::source::sqs_queue::test_helpers as sqs_test_helpers;
use quickwit_metastore::SplitState;
use tempfile::NamedTempFile;

use crate::test_utils::ClusterSandboxBuilder;

fn create_mock_data_file(num_lines: usize) -> (NamedTempFile, Uri) {
    let mut temp_file = tempfile::NamedTempFile::new().unwrap();
    for i in 0..num_lines {
        writeln!(temp_file, "{{\"body\": \"hello {i}\"}}").unwrap()
    }
    temp_file.flush().unwrap();
    let path = temp_file.path().to_str().unwrap();
    let uri = Uri::from_str(path).unwrap();
    (temp_file, uri)
}

#[tokio::test]
async fn test_sqs_with_duplicates() {
    quickwit_common::setup_logging_for_tests();
    let sandbox = ClusterSandboxBuilder::build_and_start_standalone().await;
    let index_id = "test-sqs-source-duplicates";
    let index_config = format!(
        r#"
            version: 0.8
            index_id: {index_id}
            doc_mapping:
                field_mappings:
                - name: body
                  type: text
            indexing_settings:
                commit_timeout_secs: 3
            "#
    );

    let sqs_client = sqs_test_helpers::get_localstack_sqs_client().await.unwrap();
    let queue_url = sqs_test_helpers::create_queue(&sqs_client, "test-single-node-cluster").await;

    sandbox
        .rest_client(QuickwitService::Indexer)
        .indexes()
        .create(index_config.clone(), ConfigFormat::Yaml, false)
        .await
        .unwrap();

    let source_id: &str = "test-sqs-single-node-cluster";
    let source_config_input = format!(
        r#"
            version: 0.7
            source_id: {source_id}
            desired_num_pipelines: 1
            max_num_pipelines_per_indexer: 1
            source_type: file
            params:
                notifications:
                  - type: sqs
                    queue_url: {queue_url}
                    message_type: raw_uri
            input_format: plain_text
        "#
    );

    sandbox
        .rest_client(QuickwitService::Indexer)
        .sources(index_id)
        .create(source_config_input, ConfigFormat::Yaml)
        .await
        .unwrap();

    // Send messages with duplicates
    let tmp_mock_data_files: Vec<_> = iter::repeat_with(|| create_mock_data_file(1000))
        .take(10)
        .collect();
    for (_, uri) in &tmp_mock_data_files {
        sqs_test_helpers::send_message(&sqs_client, &queue_url, uri.as_str()).await;
    }
    sqs_test_helpers::send_message(&sqs_client, &queue_url, tmp_mock_data_files[0].1.as_str())
        .await;
    sqs_test_helpers::send_message(&sqs_client, &queue_url, tmp_mock_data_files[5].1.as_str())
        .await;

    sandbox
        .wait_for_splits(index_id, Some(vec![SplitState::Published]), 1)
        .await
        .unwrap();

    sandbox.assert_hit_count(index_id, "", 10 * 1000).await;

    // The two duplicates could not be acknowledged when the were received
    // because at that point the relevant data was not yet committed. Now it is
    // committed, but their visibility timeout will still take a while to be
    // reached.
    wait_until_predicate(
        || async {
            let in_flight_count: usize = sqs_test_helpers::get_queue_attribute(
                &sqs_client,
                &queue_url,
                QueueAttributeName::ApproximateNumberOfMessagesNotVisible,
            )
            .await
            .parse()
            .unwrap();
            in_flight_count == 2
        },
        Duration::from_secs(5),
        Duration::from_millis(100),
    )
    .await
    .expect("number of in-flight messages didn't reach 2 within the timeout");

    sandbox
        .rest_client(QuickwitService::Indexer)
        .indexes()
        .delete(index_id, false)
        .await
        .unwrap();

    sandbox.shutdown().await.unwrap();
}

#[tokio::test]
async fn test_sqs_garbage_collect() {
    quickwit_common::setup_logging_for_tests();
    let sandbox = ClusterSandboxBuilder::build_and_start_standalone().await;
    let index_id = "test-sqs-source-garbage-collect";
    let index_config = format!(
        r#"
            version: 0.8
            index_id: {index_id}
            doc_mapping:
                field_mappings:
                - name: body
                  type: text
            indexing_settings:
                commit_timeout_secs: 1
            "#
    );

    let sqs_client = sqs_test_helpers::get_localstack_sqs_client().await.unwrap();
    let queue_url = sqs_test_helpers::create_queue(&sqs_client, "test-single-node-cluster").await;

    sandbox
        .rest_client(QuickwitService::Indexer)
        .indexes()
        .create(index_config.clone(), ConfigFormat::Yaml, false)
        .await
        .unwrap();

    let source_id: &str = "test-sqs-single-node-cluster";
    let source_config_input = format!(
        r#"
            version: 0.7
            source_id: {source_id}
            desired_num_pipelines: 1
            max_num_pipelines_per_indexer: 1
            source_type: file
            params:
                notifications:
                  - type: sqs
                    queue_url: {queue_url}
                    message_type: raw_uri
                    deduplication_window_max_messages: 5
                    deduplication_cleanup_interval_secs: 3
            input_format: plain_text
        "#
    );

    sandbox
        .rest_client(QuickwitService::Indexer)
        .sources(index_id)
        .create(source_config_input, ConfigFormat::Yaml)
        .await
        .unwrap();

    let tmp_mock_data_files: Vec<_> = iter::repeat_with(|| create_mock_data_file(1000))
        .take(10)
        .collect();
    for (_, uri) in &tmp_mock_data_files {
        sqs_test_helpers::send_message(&sqs_client, &queue_url, uri.as_str()).await;
    }

    sandbox
        .wait_for_splits(index_id, Some(vec![SplitState::Published]), 1)
        .await
        .unwrap();

    sandbox.assert_hit_count(index_id, "", 10 * 1000).await;

    wait_until_predicate(
        || async {
            let shard_count = sandbox
                .rest_client(QuickwitService::Indexer)
                .sources(index_id)
                .get_shards(source_id)
                .await
                .unwrap()
                .len();
            tracing::info!("shard_count: {}", shard_count);
            shard_count == 5
        },
        Duration::from_secs(6),
        Duration::from_millis(200),
    )
    .await
    .expect("shards where not pruned within the timeout");

    sandbox
        .rest_client(QuickwitService::Indexer)
        .indexes()
        .delete(index_id, false)
        .await
        .unwrap();

    sandbox.shutdown().await.unwrap();
}

// this source update test is done here because SQS is the only long running
// configurable source for which we have integration tests set up.
#[tokio::test]
async fn test_update_source_multi_node_cluster() {
    quickwit_common::setup_logging_for_tests();
    let index_id = "test-update-source-cluster";
    let sqs_client = sqs_test_helpers::get_localstack_sqs_client().await.unwrap();
    let queue_url = sqs_test_helpers::create_queue(&sqs_client, "test-update-source-cluster").await;

    let sandbox = ClusterSandboxBuilder::default()
        .add_node([QuickwitService::Searcher])
        .add_node([QuickwitService::Metastore])
        .add_node([QuickwitService::Indexer])
        .add_node([QuickwitService::ControlPlane])
        .add_node([QuickwitService::Janitor])
        .build_and_start()
        .await;

    {
        // Wait for indexer to fully start.
        // The starting time is a bit long for a cluster.
        tokio::time::sleep(Duration::from_secs(3)).await;
        let indexing_service_counters = sandbox
            .rest_client(QuickwitService::Indexer)
            .node_stats()
            .indexing()
            .await
            .unwrap();
        assert_eq!(indexing_service_counters.num_running_pipelines, 0);
    }

    // Create an index
    let index_config = format!(
        r#"
        version: 0.8
        index_id: {index_id}
        doc_mapping:
            field_mappings:
            - name: body
              type: text
        indexing_settings:
            commit_timeout_secs: 1
        "#
    );
    sandbox
        .rest_client(QuickwitService::Indexer)
        .indexes()
        .create(index_config, ConfigFormat::Yaml, false)
        .await
        .unwrap();

    // Wait until indexing pipelines are started
    sandbox.wait_for_indexing_pipelines(1).await.unwrap();

    // create an SQS source with 1 pipeline
    let source_id: &str = "test-update-source-cluster";
    let source_config_input = format!(
        r#"
            version: 0.7
            source_id: {source_id}
            desired_num_pipelines: 1
            max_num_pipelines_per_indexer: 1
            source_type: file
            params:
                notifications:
                  - type: sqs
                    queue_url: {queue_url}
                    message_type: raw_uri
                    deduplication_window_max_messages: 5
                    deduplication_cleanup_interval_secs: 3
            input_format: plain_text
        "#
    );
    sandbox
        .rest_client(QuickwitService::Indexer)
        .sources(index_id)
        .create(source_config_input, ConfigFormat::Yaml)
        .await
        .unwrap();

    // Wait until the SQS indexing pipeline is also started
    sandbox.wait_for_indexing_pipelines(2).await.unwrap();

    // increase the number of pipelines to 3
    let source_config_input = format!(
        r#"
            version: 0.7
            source_id: {source_id}
            desired_num_pipelines: 3
            max_num_pipelines_per_indexer: 3
            source_type: file
            params:
                notifications:
                  - type: sqs
                    queue_url: {queue_url}
                    message_type: raw_uri
                    deduplication_window_max_messages: 5
                    deduplication_cleanup_interval_secs: 3
            input_format: plain_text
        "#
    );
    sandbox
        .rest_client(QuickwitService::Metastore)
        .sources(index_id)
        .update(source_id, source_config_input, ConfigFormat::Yaml, false)
        .await
        .unwrap();

    // Wait until the SQS indexing pipeline is also started
    sandbox.wait_for_indexing_pipelines(4).await.unwrap();

    sandbox.shutdown().await.unwrap();
}


================================================
FILE: quickwit/quickwit-integration-tests/src/tests/tls_tests.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::time::Duration;

use hyper_util::rt::TokioExecutor;
use quickwit_config::service::QuickwitService;
use quickwit_serve::SearchRequestQueryString;

use crate::test_utils::ClusterSandboxBuilder;

#[tokio::test]
async fn test_tls_rest() {
    quickwit_common::setup_logging_for_tests();
    let mut sandbox_config = ClusterSandboxBuilder::default()
        .add_node(QuickwitService::supported_services())
        .build_config()
        .await;
    sandbox_config.node_configs[0].0.rest_config.tls = Some(quickwit_config::TlsConfig {
        cert_path: concat!(env!("CARGO_MANIFEST_DIR"), "/test_data/server.crt").to_string(),
        key_path: concat!(env!("CARGO_MANIFEST_DIR"), "/test_data/server.key").to_string(),
        ca_path: concat!(env!("CARGO_MANIFEST_DIR"), "/test_data/ca.crt").to_string(),
        expected_name: None,
        validate_client: false,
    });
    let sandbox = sandbox_config.start().await;
    let node_config = sandbox.node_configs.first().unwrap();
    let client = hyper_util::client::legacy::Client::builder(TokioExecutor::new())
        .pool_idle_timeout(Duration::from_secs(30))
        .http2_only(true)
        .build_http::<String>();
    let root_uri = format!("http://{}/", node_config.0.rest_config.listen_addr)
        .parse::<hyper::Uri>()
        .unwrap();
    client
        .get(root_uri.clone())
        .await
        .expect_err("non tls connection should fail");

    assert_eq!(
        sandbox
            .rest_client(QuickwitService::Indexer)
            .indexes()
            .list()
            .await
            .unwrap()
            .len(),
        0
    );

    sandbox.shutdown().await.unwrap();
}

#[tokio::test]
async fn test_tls_grpc() {
    quickwit_common::setup_logging_for_tests();
    let mut sandbox_config = ClusterSandboxBuilder::default()
        .add_node([QuickwitService::Searcher])
        .add_node([QuickwitService::Metastore])
        .add_node([QuickwitService::Indexer])
        .add_node([QuickwitService::ControlPlane])
        .add_node([QuickwitService::Janitor])
        .build_config()
        .await;

    for node in &mut sandbox_config.node_configs {
        node.0.rest_config.tls = Some(quickwit_config::TlsConfig {
            cert_path: concat!(env!("CARGO_MANIFEST_DIR"), "/test_data/server.crt").to_string(),
            key_path: concat!(env!("CARGO_MANIFEST_DIR"), "/test_data/server.key").to_string(),
            ca_path: concat!(env!("CARGO_MANIFEST_DIR"), "/test_data/ca.crt").to_string(),
            expected_name: Some("quickwit.local".to_string()),
            validate_client: false,
        });
    }

    let sandbox = sandbox_config.start().await;

    // TODO connect to grpc port and verify it refuses non-tls connection

    sandbox
        .rest_client(QuickwitService::Indexer)
        .indexes()
        .create(
            r#"
            version: 0.8
            index_id: my-new-multi-node-index
            doc_mapping:
              field_mappings:
              - name: body
                type: text
            indexing_settings:
              commit_timeout_secs: 1
            "#,
            quickwit_config::ConfigFormat::Yaml,
            false,
        )
        .await
        .unwrap();

    assert!(
        sandbox
            .rest_client(QuickwitService::Indexer)
            .node_health()
            .is_live()
            .await
            .unwrap()
    );

    // Assert that at least 1 indexing pipelines is successfully started
    sandbox.wait_for_indexing_pipelines(1).await.unwrap();

    // Check that search is working
    let search_response_empty = sandbox
        .rest_client(QuickwitService::Searcher)
        .search(
            "my-new-multi-node-index",
            SearchRequestQueryString {
                query: "body:bar".to_string(),
                ..Default::default()
            },
        )
        .await
        .unwrap();
    assert_eq!(search_response_empty.num_hits, 0);

    sandbox.shutdown().await.unwrap();
}


================================================
FILE: quickwit/quickwit-integration-tests/src/tests/update_tests/create_on_update.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::time::Duration;

use quickwit_config::service::QuickwitService;
use quickwit_rest_client::rest_client::CommitType;
use serde_json::json;

use super::assert_hits_unordered;
use crate::ingest_json;
use crate::test_utils::{ClusterSandboxBuilder, ingest};

#[tokio::test]
async fn test_update_missing_no_create() {
    quickwit_common::setup_logging_for_tests();
    let sandbox = ClusterSandboxBuilder::default()
        .add_node([QuickwitService::Searcher])
        .add_node([QuickwitService::Metastore])
        .add_node([QuickwitService::Indexer])
        .add_node([QuickwitService::ControlPlane])
        .add_node([QuickwitService::Janitor])
        .build_and_start()
        .await;

    {
        // Wait for indexer to fully start.
        // The starting time is a bit long for a cluster.
        tokio::time::sleep(Duration::from_secs(3)).await;
        let indexing_service_counters = sandbox
            .rest_client(QuickwitService::Indexer)
            .node_stats()
            .indexing()
            .await
            .unwrap();
        assert_eq!(indexing_service_counters.num_running_pipelines, 0);
    }

    assert!(
        sandbox
            .rest_client(QuickwitService::Indexer)
            .node_health()
            .is_live()
            .await
            .unwrap()
    );

    let status_code = sandbox
        .rest_client(QuickwitService::Indexer)
        .indexes()
        .update(
            "my-updatable-index",
            r#"
            version: 0.8
            index_id: my-updatable-index
            doc_mapping:
              field_mappings:
              - name: title
                type: text
              - name: body
                type: text
            indexing_settings:
              commit_timeout_secs: 1
            search_settings:
              default_search_fields: [title, body]
            "#,
            quickwit_config::ConfigFormat::Yaml,
            false,
        )
        .await
        .unwrap_err()
        .status_code()
        .unwrap();
    assert_eq!(status_code, 404);

    sandbox.shutdown().await.unwrap();
}

#[tokio::test]
async fn test_update_missing_create() {
    quickwit_common::setup_logging_for_tests();
    let sandbox = ClusterSandboxBuilder::default()
        .add_node([QuickwitService::Searcher])
        .add_node([QuickwitService::Metastore])
        .add_node([QuickwitService::Indexer])
        .add_node([QuickwitService::ControlPlane])
        .add_node([QuickwitService::Janitor])
        .build_and_start()
        .await;

    {
        // Wait for indexer to fully start.
        // The starting time is a bit long for a cluster.
        tokio::time::sleep(Duration::from_secs(3)).await;
        let indexing_service_counters = sandbox
            .rest_client(QuickwitService::Indexer)
            .node_stats()
            .indexing()
            .await
            .unwrap();
        assert_eq!(indexing_service_counters.num_running_pipelines, 0);
    }

    assert!(
        sandbox
            .rest_client(QuickwitService::Indexer)
            .node_health()
            .is_live()
            .await
            .unwrap()
    );

    sandbox
        .rest_client(QuickwitService::Indexer)
        .indexes()
        .update(
            "my-updatable-index",
            r#"
            version: 0.8
            index_id: my-updatable-index
            doc_mapping:
              field_mappings:
              - name: title
                type: text
              - name: body
                type: text
            indexing_settings:
              commit_timeout_secs: 1
            search_settings:
              default_search_fields: [title, body]
            "#,
            quickwit_config::ConfigFormat::Yaml,
            true,
        )
        .await
        .unwrap();

    sandbox.shutdown().await.unwrap();
}

#[tokio::test]
async fn test_update_create_existing_doesnt_clear() {
    quickwit_common::setup_logging_for_tests();
    let sandbox = ClusterSandboxBuilder::default()
        .add_node([QuickwitService::Searcher])
        .add_node([QuickwitService::Metastore])
        .add_node([QuickwitService::Indexer])
        .add_node([QuickwitService::ControlPlane])
        .add_node([QuickwitService::Janitor])
        .build_and_start()
        .await;

    {
        // Wait for indexer to fully start.
        // The starting time is a bit long for a cluster.
        tokio::time::sleep(Duration::from_secs(3)).await;
        let indexing_service_counters = sandbox
            .rest_client(QuickwitService::Indexer)
            .node_stats()
            .indexing()
            .await
            .unwrap();
        assert_eq!(indexing_service_counters.num_running_pipelines, 0);
    }

    // Create an index
    sandbox
        .rest_client(QuickwitService::Indexer)
        .indexes()
        .create(
            r#"
            version: 0.8
            index_id: my-updatable-index
            doc_mapping:
              field_mappings:
              - name: title
                type: text
              - name: body
                type: text
            indexing_settings:
              commit_timeout_secs: 1
            search_settings:
              default_search_fields: [title]
            "#,
            quickwit_config::ConfigFormat::Yaml,
            false,
        )
        .await
        .unwrap();
    assert!(
        sandbox
            .rest_client(QuickwitService::Indexer)
            .node_health()
            .is_live()
            .await
            .unwrap()
    );

    // Wait until indexing pipelines are started
    sandbox.wait_for_indexing_pipelines(1).await.unwrap();

    ingest(
        &sandbox.rest_client(QuickwitService::Indexer),
        "my-updatable-index",
        ingest_json!({"title": "first", "body": "first record"}),
        CommitType::Auto,
    )
    .await
    .unwrap();

    // Wait until split is committed
    tokio::time::sleep(Duration::from_secs(4)).await;

    // No hit because `default_search_fields` only covers the `title` field
    assert_hits_unordered(&sandbox, "my-updatable-index", "record", Ok(&[])).await;

    // Update the index to also search `body` by default, the same search should
    // now have 1 hit
    sandbox
        .rest_client(QuickwitService::Indexer)
        .indexes()
        .update(
            "my-updatable-index",
            r#"
            version: 0.8
            index_id: my-updatable-index
            doc_mapping:
              field_mappings:
              - name: title
                type: text
              - name: body
                type: text
            indexing_settings:
              commit_timeout_secs: 1
            search_settings:
              default_search_fields: [title, body]
            "#,
            quickwit_config::ConfigFormat::Yaml,
            true,
        )
        .await
        .unwrap();

    assert_hits_unordered(
        &sandbox,
        "my-updatable-index",
        "record",
        Ok(&[json!({"title": "first", "body": "first record"})]),
    )
    .await;

    sandbox.shutdown().await.unwrap();
}


================================================
FILE: quickwit/quickwit-integration-tests/src/tests/update_tests/doc_mapping_tests.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::fmt::Write;
use std::time::Duration;

use quickwit_config::service::QuickwitService;
use quickwit_rest_client::models::IngestSource;
use quickwit_rest_client::rest_client::CommitType;
use serde_json::{Value, json};

use super::assert_hits_unordered;
use crate::test_utils::ClusterSandboxBuilder;

/// Update the doc mapping between 2 calls to local-ingest (forces separate indexing pipelines) and
/// assert the number of hits for the given query
async fn validate_search_across_doc_mapping_updates(
    index_id: &str,
    original_doc_mapping: Value,
    ingest_before_update: &[Value],
    updated_doc_mapping: Value,
    ingest_after_update: &[Value],
    query_and_expect: &[(&str, Result<&[Value], ()>)],
) {
    let sandbox = ClusterSandboxBuilder::build_and_start_standalone().await;

    {
        // Wait for indexer to fully start.
        // The starting time is a bit long for a cluster.
        tokio::time::sleep(Duration::from_secs(3)).await;
        let indexing_service_counters = sandbox
            .rest_client(QuickwitService::Indexer)
            .node_stats()
            .indexing()
            .await
            .unwrap();
        assert_eq!(indexing_service_counters.num_running_pipelines, 0);
    }

    // Create index
    sandbox
        .rest_client(QuickwitService::Indexer)
        .indexes()
        .create(
            json!({
                "version": "0.8",
                "index_id": index_id,
                "doc_mapping": original_doc_mapping,
                "indexing_settings": {
                    "commit_timeout_secs": 1
                },
            })
            .to_string(),
            quickwit_config::ConfigFormat::Json,
            false,
        )
        .await
        .unwrap();

    assert!(
        sandbox
            .rest_client(QuickwitService::Indexer)
            .node_health()
            .is_live()
            .await
            .unwrap()
    );

    // Wait until indexing pipelines are started.
    sandbox.wait_for_indexing_pipelines(1).await.unwrap();

    // We use local ingest to always pick up the latest doc mapping
    sandbox
        .local_ingest(index_id, ingest_before_update)
        .await
        .unwrap();

    // Update index to also search "body" by default, search should now have 1 hit
    sandbox
        .rest_client(QuickwitService::Searcher)
        .indexes()
        .update(
            index_id,
            json!({
                "version": "0.8",
                "index_id": index_id,
                "doc_mapping": updated_doc_mapping,
                "indexing_settings": {
                    "commit_timeout_secs": 1,
                },
            })
            .to_string(),
            quickwit_config::ConfigFormat::Json,
            false,
        )
        .await
        .unwrap();

    sandbox
        .local_ingest(index_id, ingest_after_update)
        .await
        .unwrap();

    for (query, expected_hits) in query_and_expect.iter().copied() {
        assert_hits_unordered(&sandbox, index_id, query, expected_hits).await;
    }

    sandbox.shutdown().await.unwrap();
}

#[tokio::test]
async fn test_update_doc_mapping_text_to_u64() {
    let index_id = "update-text-to-u64";
    let original_doc_mappings = json!({
        "field_mappings": [
            {"name": "body", "type": "text"}
        ]
    });
    let ingest_before_update = &[json!({"body": "14"}), json!({"body": "15"})];
    let updated_doc_mappings = json!({
        "field_mappings": [
            {"name": "body", "type": "u64"}
        ]
    });
    let ingest_after_update = &[json!({"body": 16}), json!({"body": 17})];
    validate_search_across_doc_mapping_updates(
        index_id,
        original_doc_mappings,
        ingest_before_update,
        updated_doc_mappings,
        ingest_after_update,
        &[
            ("body:14", Ok(&[json!({"body": 14})])),
            ("body:16", Ok(&[json!({"body": 16})])),
            // error expected because the validation is performed
            // by latest doc mapping
            ("body:hello", Err(())),
        ],
    )
    .await;
}

#[tokio::test]
async fn test_update_doc_mapping_u64_to_text() {
    let index_id = "update-u64-to-text";
    let original_doc_mappings = json!({
        "field_mappings": [
            {"name": "body", "type": "u64"}
        ],
        "mode": "strict",
    });
    let ingest_before_update = &[json!({"body": 14}), json!({"body": 15})];
    let updated_doc_mappings = json!({
        "field_mappings": [
            {"name": "body", "type": "text"},
        ],
        "mode": "strict",
    });
    let ingest_after_update = &[json!({"body": "16"}), json!({"body": "hello world"})];
    validate_search_across_doc_mapping_updates(
        index_id,
        original_doc_mappings,
        ingest_before_update,
        updated_doc_mappings,
        ingest_after_update,
        &[
            ("body:14", Ok(&[json!({"body": "14"})])),
            ("body:16", Ok(&[json!({"body": "16"})])),
            ("body:hello", Ok(&[json!({"body": "hello world"})])),
        ],
    )
    .await;
}

#[tokio::test]
async fn test_update_doc_mapping_json_to_text() {
    let index_id = "update-json-to-text";
    let original_doc_mappings = json!({
        "field_mappings": [
            {"name": "body", "type": "json"}
        ]
    });
    let ingest_before_update = &[
        json!({"body": {"field1": "hello"}}),
        json!({"body": {"field2": "world"}}),
    ];
    let updated_doc_mappings = json!({
        "field_mappings": [
            {"name": "body", "type": "text"}
        ]
    });
    let ingest_after_update = &[json!({"body": "hello world"})];
    validate_search_across_doc_mapping_updates(
        index_id,
        original_doc_mappings,
        ingest_before_update,
        updated_doc_mappings,
        ingest_after_update,
        &[
            ("body:hello", Ok(&[json!({"body": "hello world"})])),
            // error expected because the validation is performed
            // by latest doc mapping
            ("body.field1:hello", Err(())),
        ],
    )
    .await;
}

#[tokio::test]
async fn test_update_doc_mapping_json_to_object() {
    let index_id = "update-json-to-object";
    let original_doc_mappings = json!({
        "field_mappings": [
            {"name": "body", "type": "json"}
        ]
    });
    let ingest_before_update = &[
        json!({"body": {"field1": "hello"}}),
        json!({"body": {"field2": "world"}}),
    ];
    let updated_doc_mappings = json!({
        "field_mappings": [
            {
                "name": "body",
                "type": "object",
                "field_mappings": [
                    {"name": "field1", "type": "text"},
                    {"name": "field2", "type": "text"},
                ]
            }
        ]
    });
    let ingest_after_update = &[
        json!({"body": {"field1": "hola"}}),
        json!({"body": {"field2": "mundo"}}),
    ];
    validate_search_across_doc_mapping_updates(
        index_id,
        original_doc_mappings,
        ingest_before_update,
        updated_doc_mappings,
        ingest_after_update,
        &[
            (
                "body.field1:hello",
                Ok(&[json!({"body": {"field1": "hello"}})]),
            ),
            (
                "body.field1:hola",
                Ok(&[json!({"body": {"field1": "hola"}})]),
            ),
        ],
    )
    .await;
}

#[tokio::test]
async fn test_update_doc_mapping_object_to_json() {
    let index_id = "update-object-to-json";
    let original_doc_mappings = json!({
        "field_mappings": [
            {
                "name": "body",
                "type": "object",
                "field_mappings": [
                    {"name": "field1", "type": "text"},
                    {"name": "field2", "type": "text"},
                ]
            }
        ]
    });
    let ingest_before_update = &[
        json!({"body": {"field1": "hello"}}),
        json!({"body": {"field2": "world"}}),
    ];
    let updated_doc_mappings = json!({
        "field_mappings": [
            {"name": "body", "type": "json"}
        ]
    });
    let ingest_after_update = &[
        json!({"body": {"field1": "hola"}}),
        json!({"body": {"field2": "mundo"}}),
    ];
    validate_search_across_doc_mapping_updates(
        index_id,
        original_doc_mappings,
        ingest_before_update,
        updated_doc_mappings,
        ingest_after_update,
        &[
            (
                "body.field1:hello",
                Ok(&[json!({"body": {"field1": "hello"}})]),
            ),
            (
                "body.field1:hola",
                Ok(&[json!({"body": {"field1": "hola"}})]),
            ),
        ],
    )
    .await;
}

#[tokio::test]
async fn test_update_doc_mapping_tokenizer_default_to_raw() {
    let index_id = "update-tokenizer-default-to-raw";
    let original_doc_mappings = json!({
        "field_mappings": [
            {"name": "body", "type": "text", "tokenizer": "default"}
        ]
    });
    let ingest_before_update = &[json!({"body": "hello-world"})];
    let updated_doc_mappings = json!({
        "field_mappings": [
            {"name": "body", "type": "text", "tokenizer": "raw"}
        ]
    });
    let ingest_after_update = &[json!({"body": "bonjour-monde"})];
    validate_search_across_doc_mapping_updates(
        index_id,
        original_doc_mappings,
        ingest_before_update,
        updated_doc_mappings,
        ingest_after_update,
        &[
            ("body:hello", Ok(&[json!({"body": "hello-world"})])),
            ("body:world", Ok(&[json!({"body": "hello-world"})])),
            // phrases queries won't apply to older splits that didn't support them
            ("body:\"hello world\"", Ok(&[])),
            ("body:\"hello-world\"", Ok(&[])),
            ("body:\"hello-worl\"*", Ok(&[])),
            ("body:bonjour", Ok(&[])),
            ("body:monde", Ok(&[])),
            // the raw tokenizer only returns exact matches
            ("body:\"bonjour monde\"", Ok(&[])),
            (
                "body:\"bonjour-monde\"",
                Ok(&[json!({"body": "bonjour-monde"})]),
            ),
            (
                "body:\"bonjour-mond\"*",
                Ok(&[json!({"body": "bonjour-monde"})]),
            ),
        ],
    )
    .await;
}

#[tokio::test]
async fn test_update_doc_mapping_tokenizer_add_position() {
    let index_id = "update-tokenizer-add-position";
    let original_doc_mappings = json!({
        "field_mappings": [
            {"name": "body", "type": "text", "tokenizer": "default"}
        ]
    });
    let ingest_before_update = &[json!({"body": "hello-world"})];
    let updated_doc_mappings = json!({
        "field_mappings": [
            {"name": "body", "type": "text", "tokenizer": "default", "record": "position"}
        ]
    });
    let ingest_after_update = &[json!({"body": "bonjour-monde"})];
    validate_search_across_doc_mapping_updates(
        index_id,
        original_doc_mappings,
        ingest_before_update,
        updated_doc_mappings,
        ingest_after_update,
        &[
            ("body:hello", Ok(&[json!({"body": "hello-world"})])),
            ("body:world", Ok(&[json!({"body": "hello-world"})])),
            // phrases queries don't apply to older splits that didn't support them
            ("body:\"hello-world\"", Ok(&[])),
            ("body:\"hello world\"", Ok(&[])),
            ("body:\"hello-worl\"*", Ok(&[])),
            ("body:bonjour", Ok(&[json!({"body": "bonjour-monde"})])),
            ("body:monde", Ok(&[json!({"body": "bonjour-monde"})])),
            (
                "body:\"bonjour-monde\"",
                Ok(&[json!({"body": "bonjour-monde"})]),
            ),
            (
                "body:\"bonjour monde\"",
                Ok(&[json!({"body": "bonjour-monde"})]),
            ),
            (
                "body:\"bonjour-mond\"*",
                Ok(&[json!({"body": "bonjour-monde"})]),
            ),
        ],
    )
    .await;
}

#[tokio::test]
async fn test_update_doc_mapping_tokenizer_raw_to_phrase() {
    let index_id = "update-tokenizer-raw-to-phrase";
    let original_doc_mappings = json!({
        "field_mappings": [
            {"name": "body", "type": "text", "tokenizer": "raw"}
        ]
    });
    let ingest_before_update = &[json!({"body": "hello-world"})];
    let updated_doc_mappings = json!({
        "field_mappings": [
            {"name": "body", "type": "text", "tokenizer": "default", "record": "position"}
        ]
    });
    let ingest_after_update = &[json!({"body": "bonjour-monde"})];
    validate_search_across_doc_mapping_updates(
        index_id,
        original_doc_mappings,
        ingest_before_update,
        updated_doc_mappings,
        ingest_after_update,
        &[
            ("body:hello", Ok(&[])),
            ("body:world", Ok(&[])),
            // raw tokenizer used here, only exact matches returned
            (
                "body:\"hello-world\"",
                Ok(&[json!({"body": "hello-world"})]),
            ),
            ("body:\"hello world\"", Ok(&[])),
            ("body:bonjour", Ok(&[json!({"body": "bonjour-monde"})])),
            ("body:monde", Ok(&[json!({"body": "bonjour-monde"})])),
            (
                "body:\"bonjour-monde\"",
                Ok(&[json!({"body": "bonjour-monde"})]),
            ),
            (
                "body:\"bonjour monde\"",
                Ok(&[json!({"body": "bonjour-monde"})]),
            ),
        ],
    )
    .await;
}

#[tokio::test]
async fn test_update_doc_mapping_unindexed_to_indexed() {
    let index_id = "update-not-indexed-to-indexed";
    let original_doc_mappings = json!({
        "field_mappings": [
            {"name": "body", "type": "text", "indexed": false}
        ]
    });
    let ingest_before_update = &[json!({"body": "hello"})];
    let updated_doc_mappings = json!({
        "field_mappings": [
            {"name": "body", "type": "text", "tokenizer": "raw"}
        ]
    });
    let ingest_after_update = &[json!({"body": "bonjour"})];
    validate_search_across_doc_mapping_updates(
        index_id,
        original_doc_mappings,
        ingest_before_update,
        updated_doc_mappings,
        ingest_after_update,
        &[
            // term query won't apply to older splits that weren't indexed
            ("body:hello", Ok(&[])),
            ("body:IN [hello]", Ok(&[])),
            // works on newer data
            ("body:bonjour", Ok(&[json!({"body": "bonjour"})])),
            ("body:IN [bonjour]", Ok(&[json!({"body": "bonjour"})])),
        ],
    )
    .await;
}

#[tokio::test]
async fn test_update_doc_mapping_strict_to_dynamic() {
    let index_id = "update-strict-to-dynamic";
    let original_doc_mappings = json!({
        "field_mappings": [
            {"name": "body", "type": "text"}
        ],
        "mode": "strict",
    });
    let ingest_before_update = &[json!({"body": "hello"})];
    let updated_doc_mappings = json!({
        "mode": "dynamic",
    });
    let ingest_after_update = &[json!({"body": "world", "title": "salutations"})];
    validate_search_across_doc_mapping_updates(
        index_id,
        original_doc_mappings,
        ingest_before_update,
        updated_doc_mappings,
        ingest_after_update,
        &[
            ("body:hello", Ok(&[json!({"body": "hello"})])),
            (
                "body:world",
                Ok(&[json!({"body": "world", "title": "salutations"})]),
            ),
            (
                "title:salutations",
                Ok(&[json!({"body": "world", "title": "salutations"})]),
            ),
        ],
    )
    .await;
}

#[tokio::test]
async fn test_update_doc_mapping_dynamic_to_strict() {
    let index_id = "update-dynamic-to-strict";
    let original_doc_mappings = json!({
        "mode": "dynamic",
    });
    let ingest_before_update = &[json!({"body": "hello"})];
    let updated_doc_mappings = json!({
        "field_mappings": [
            {"name": "body", "type": "text"}
        ],
        "mode": "strict",
    });
    let ingest_after_update = &[json!({"body": "world"})];
    validate_search_across_doc_mapping_updates(
        index_id,
        original_doc_mappings,
        ingest_before_update,
        updated_doc_mappings,
        ingest_after_update,
        &[
            ("body:hello", Ok(&[json!({"body": "hello"})])),
            ("body:world", Ok(&[json!({"body": "world"})])),
        ],
    )
    .await;
}

#[tokio::test]
async fn test_update_doc_mapping_add_field_on_strict() {
    let index_id = "update-add-field-on-strict";
    let original_doc_mappings = json!({
        "field_mappings": [
            {"name": "body", "type": "text"},
        ],
        "mode": "strict",
    });
    let ingest_before_update = &[json!({"body": "hello"})];
    let updated_doc_mappings = json!({
        "field_mappings": [
            {"name": "body", "type": "text"},
            {"name": "title", "type": "text"},
        ],
        "mode": "strict",
    });
    let ingest_after_update = &[json!({"body": "world", "title": "salutations"})];
    validate_search_across_doc_mapping_updates(
        index_id,
        original_doc_mappings,
        ingest_before_update,
        updated_doc_mappings,
        ingest_after_update,
        &[
            ("body:hello", Ok(&[json!({"body": "hello"})])),
            (
                "body:world",
                Ok(&[json!({"body": "world", "title": "salutations"})]),
            ),
            (
                "title:salutations",
                Ok(&[json!({"body": "world", "title": "salutations"})]),
            ),
        ],
    )
    .await;
}

#[tokio::test]
#[ignore]
// TODO(#5738)
async fn test_update_doc_validation() {
    quickwit_common::setup_logging_for_tests();
    let index_id = "update-doc-validation";
    let sandbox = ClusterSandboxBuilder::default()
        .add_node([
            QuickwitService::Searcher,
            QuickwitService::Metastore,
            QuickwitService::Indexer,
            QuickwitService::ControlPlane,
            QuickwitService::Janitor,
        ])
        .build_and_start()
        .await;

    {
        // Wait for indexer to fully start.
        // The starting time is a bit long for a cluster.
        tokio::time::sleep(Duration::from_secs(3)).await;
        let indexing_service_counters = sandbox
            .rest_client(QuickwitService::Indexer)
            .node_stats()
            .indexing()
            .await
            .unwrap();
        assert_eq!(indexing_service_counters.num_running_pipelines, 0);
    }

    // Create index
    sandbox
        .rest_client(QuickwitService::Indexer)
        .indexes()
        .create(
            json!({
                "version": "0.8",
                "index_id": index_id,
                "doc_mapping": {
                    "field_mappings": [
                        {"name": "body", "type": "u64"}
                    ]
                },
                "indexing_settings": {
                    "commit_timeout_secs": 1
                },
            })
            .to_string(),
            quickwit_config::ConfigFormat::Json,
            false,
        )
        .await
        .unwrap();

    assert!(
        sandbox
            .rest_client(QuickwitService::Indexer)
            .node_health()
            .is_live()
            .await
            .unwrap()
    );

    // Wait until indexing pipelines are started.
    sandbox.wait_for_indexing_pipelines(1).await.unwrap();

    let unsigned_payload = (0..20).fold(String::new(), |mut buffer, id| {
        writeln!(&mut buffer, "{{\"body\": {id}}}").unwrap();
        buffer
    });

    let unsigned_response = sandbox
        .rest_client(QuickwitService::Indexer)
        .ingest(
            index_id,
            IngestSource::Str(unsigned_payload.clone()),
            None,
            None,
            CommitType::Auto,
        )
        .await
        .unwrap();

    assert_eq!(unsigned_response.num_rejected_docs.unwrap(), 0);

    sandbox
        .rest_client(QuickwitService::Searcher)
        .indexes()
        .update(
            index_id,
            json!({
                "version": "0.8",
                "index_id": index_id,
                "doc_mapping": {
                    "field_mappings": [
                        {"name": "body", "type": "i64"}
                    ]
                },
                "indexing_settings": {
                    "commit_timeout_secs": 1,
                },
            })
            .to_string(),
            quickwit_config::ConfigFormat::Json,
            false,
        )
        .await
        .unwrap();

    let signed_payload = (-20..0).fold(String::new(), |mut buffer, id| {
        writeln!(&mut buffer, "{{\"body\": {id}}}").unwrap();
        buffer
    });

    let signed_response = sandbox
        .rest_client(QuickwitService::Indexer)
        .ingest(
            index_id,
            IngestSource::Str(signed_payload.clone()),
            None,
            None,
            CommitType::Auto,
        )
        .await
        .unwrap();

    assert_eq!(signed_response.num_rejected_docs.unwrap(), 0);

    sandbox.shutdown().await.unwrap();
}


================================================
FILE: quickwit/quickwit-integration-tests/src/tests/update_tests/mod.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use quickwit_config::service::QuickwitService;
use quickwit_serve::SearchRequestQueryString;
use serde_json::Value;

use crate::test_utils::ClusterSandbox;

/// Checks that the result of the given query matches the expected values
async fn assert_hits_unordered(
    sandbox: &ClusterSandbox,
    index_id: &str,
    query: &str,
    expected_result: Result<&[Value], ()>,
) {
    let search_res = sandbox
        .rest_client(QuickwitService::Searcher)
        .search(
            index_id,
            SearchRequestQueryString {
                query: query.to_string(),
                max_hits: expected_result.map(|hits| hits.len() as u64).unwrap_or(1),
                ..Default::default()
            },
        )
        .await;
    if let Ok(expected_hits) = expected_result {
        let resp = search_res.unwrap_or_else(|err| panic!("query: {query}, error: {err}"));
        assert_eq!(resp.errors.len(), 0, "query: {query}");
        assert_eq!(resp.num_hits, expected_hits.len() as u64, "query: {query}");
        for expected_hit in expected_hits {
            assert!(
                resp.hits.contains(expected_hit),
                "query: {} -> expected hits: {:?}, got: {:?}",
                query,
                expected_hits,
                resp.hits
            );
        }
    } else if let Ok(search_response) = search_res {
        assert!(!search_response.errors.is_empty(), "query: {query}");
    }
}

mod create_on_update;
mod doc_mapping_tests;
mod restart_indexer_tests;
mod search_settings_tests;


================================================
FILE: quickwit/quickwit-integration-tests/src/tests/update_tests/restart_indexer_tests.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::fmt::Write;
use std::time::Duration;

use quickwit_config::service::QuickwitService;
use quickwit_metastore::SplitState;
use quickwit_proto::types::DocMappingUid;
use quickwit_rest_client::models::IngestSource;
use quickwit_rest_client::rest_client::CommitType;
use quickwit_serve::ListSplitsQueryParams;
use serde_json::json;

use crate::test_utils::ClusterSandboxBuilder;

#[tokio::test]
async fn test_update_doc_mapping_restart_indexing_pipeline() {
    let index_id = "update-restart-ingest";
    quickwit_common::setup_logging_for_tests();
    let sandbox = ClusterSandboxBuilder::default()
        .add_node([
            QuickwitService::Searcher,
            QuickwitService::Metastore,
            QuickwitService::Indexer,
            QuickwitService::ControlPlane,
            QuickwitService::Janitor,
        ])
        .build_and_start()
        .await;

    {
        // Wait for indexer to fully start.
        // The starting time is a bit long for a cluster.
        tokio::time::sleep(Duration::from_secs(3)).await;
        let indexing_service_counters = sandbox
            .rest_client(QuickwitService::Indexer)
            .node_stats()
            .indexing()
            .await
            .unwrap();
        assert_eq!(indexing_service_counters.num_running_pipelines, 0);
    }

    // usually these are choosen by quickwit, but actually the client can specify them
    // and we do here to simplify the test
    let initial_mapping_uid = DocMappingUid::for_test(1);
    let final_mapping_uid = DocMappingUid::for_test(2);

    // Create index
    sandbox
        .rest_client(QuickwitService::Indexer)
        .indexes()
        .create(
            json!({
                "version": "0.8",
                "index_id": index_id,
                "doc_mapping": {
                    "doc_mapping_uid": initial_mapping_uid,
                    "field_mappings": [
                        {"name": "body", "type": "u64"}
                    ]
                },
                "indexing_settings": {
                    "commit_timeout_secs": 1
                },
            })
            .to_string(),
            quickwit_config::ConfigFormat::Json,
            false,
        )
        .await
        .unwrap();

    assert!(
        sandbox
            .rest_client(QuickwitService::Indexer)
            .node_health()
            .is_live()
            .await
            .unwrap()
    );

    // Wait until indexing pipelines are started.
    sandbox.wait_for_indexing_pipelines(1).await.unwrap();

    let payload = (0..1000).fold(String::new(), |mut buffer, id| {
        writeln!(&mut buffer, "{{\"body\": {id}}}").unwrap();
        buffer
    });

    // ingest some documents with old doc mapping.
    // we *don't* use local ingest to use a normal indexing pipeline
    sandbox
        .rest_client(QuickwitService::Indexer)
        .ingest(
            index_id,
            IngestSource::Str(payload.clone()),
            None,
            None,
            CommitType::Auto,
        )
        .await
        .unwrap();

    // we wait for a new split. We don't want to force commits to let the pipeline behave as if in
    // a steady state.
    sandbox
        .wait_for_splits(index_id, Some(vec![SplitState::Published]), 1)
        .await
        .unwrap();

    // we ingest again, this might end up with the new or old doc mapping depending on how quickly
    // the pipeline gets killed and restarted (in practice as this cluster is very lightly loaded,
    // it will almost always kill the pipeline before these documents are committed)
    sandbox
        .rest_client(QuickwitService::Indexer)
        .ingest(
            index_id,
            IngestSource::Str(payload.clone()),
            None,
            None,
            CommitType::Auto,
        )
        .await
        .unwrap();

    // Update index
    sandbox
        .rest_client(QuickwitService::Searcher)
        .indexes()
        .update(
            index_id,
            json!({
                "version": "0.8",
                "index_id": index_id,
                "doc_mapping": {
                    "doc_mapping_uid": final_mapping_uid,
                    "field_mappings": [
                        {"name": "body", "type": "i64"}
                    ]
                },
                "indexing_settings": {
                    "commit_timeout_secs": 1,
                },
            })
            .to_string(),
            quickwit_config::ConfigFormat::Json,
            false,
        )
        .await
        .unwrap();

    // we ingest again, this might end up with the new or old doc mapping depending on how quickly
    // the pipeline gets killed and restarted. In practice this will almost always use the new
    // mapping on a lightly loaded cluster.
    sandbox
        .rest_client(QuickwitService::Indexer)
        .ingest(
            index_id,
            IngestSource::Str(payload.clone()),
            None,
            None,
            CommitType::Auto,
        )
        .await
        .unwrap();

    // we wait for a 2nd split, though it might still be there if it contains only batch 2 and not
    // batch 3.
    sandbox
        .wait_for_splits(index_id, Some(vec![SplitState::Published]), 2)
        .await
        .unwrap();

    // we ingest again, definitely with the up to date doc mapper this time
    sandbox
        .rest_client(QuickwitService::Indexer)
        .ingest(
            index_id,
            IngestSource::Str(payload.clone()),
            None,
            None,
            CommitType::Auto,
        )
        .await
        .unwrap();

    // wait for a last commit
    sandbox
        .wait_for_splits(index_id, Some(vec![SplitState::Published]), 3)
        .await
        .unwrap();

    let splits = sandbox
        .rest_client(QuickwitService::Indexer)
        .splits(index_id)
        .list(ListSplitsQueryParams::default())
        .await
        .unwrap();

    // we expect 3 splits, with all docs, and at least one split under old mapping and one under
    // new mapping
    assert_eq!(splits.len(), 3);
    assert!(
        splits
            .iter()
            .filter(|split| split.split_metadata.doc_mapping_uid == initial_mapping_uid)
            .count()
            > 0
    );
    assert!(
        splits
            .iter()
            .filter(|split| split.split_metadata.doc_mapping_uid == final_mapping_uid)
            .count()
            > 0
    );
    assert_eq!(
        splits
            .iter()
            .map(|split| split.split_metadata.num_docs)
            .sum::<usize>(),
        4000
    );

    sandbox.shutdown().await.unwrap();
}


================================================
FILE: quickwit/quickwit-integration-tests/src/tests/update_tests/search_settings_tests.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::time::Duration;

use quickwit_config::service::QuickwitService;
use quickwit_rest_client::rest_client::CommitType;
use serde_json::json;

use super::assert_hits_unordered;
use crate::ingest_json;
use crate::test_utils::{ClusterSandboxBuilder, ingest};

#[tokio::test]
async fn test_update_search_settings_on_multi_nodes_cluster() {
    quickwit_common::setup_logging_for_tests();
    let sandbox = ClusterSandboxBuilder::default()
        .add_node([QuickwitService::Searcher])
        .add_node([QuickwitService::Metastore])
        .add_node([QuickwitService::Indexer])
        .add_node([QuickwitService::ControlPlane])
        .add_node([QuickwitService::Janitor])
        .build_and_start()
        .await;

    {
        // Wait for indexer to fully start.
        // The starting time is a bit long for a cluster.
        tokio::time::sleep(Duration::from_secs(3)).await;
        let indexing_service_counters = sandbox
            .rest_client(QuickwitService::Indexer)
            .node_stats()
            .indexing()
            .await
            .unwrap();
        assert_eq!(indexing_service_counters.num_running_pipelines, 0);
    }

    // Create an index
    sandbox
        .rest_client(QuickwitService::Indexer)
        .indexes()
        .create(
            r#"
            version: 0.8
            index_id: my-updatable-index
            doc_mapping:
              field_mappings:
              - name: title
                type: text
              - name: body
                type: text
            indexing_settings:
              commit_timeout_secs: 1
            search_settings:
              default_search_fields: [title]
            "#,
            quickwit_config::ConfigFormat::Yaml,
            false,
        )
        .await
        .unwrap();
    assert!(
        sandbox
            .rest_client(QuickwitService::Indexer)
            .node_health()
            .is_live()
            .await
            .unwrap()
    );

    // Wait until indexing pipelines are started
    sandbox.wait_for_indexing_pipelines(1).await.unwrap();

    ingest(
        &sandbox.rest_client(QuickwitService::Indexer),
        "my-updatable-index",
        ingest_json!({"title": "first", "body": "first record"}),
        CommitType::Auto,
    )
    .await
    .unwrap();

    // Wait until split is committed
    tokio::time::sleep(Duration::from_secs(4)).await;

    // No hit because `default_search_fields`` only covers the `title` field
    assert_hits_unordered(&sandbox, "my-updatable-index", "record", Ok(&[])).await;

    // Update the index to also search `body` by default, the same search should
    // now have 1 hit
    sandbox
        .rest_client(QuickwitService::Indexer)
        .indexes()
        .update(
            "my-updatable-index",
            r#"
            version: 0.8
            index_id: my-updatable-index
            doc_mapping:
              field_mappings:
              - name: title
                type: text
              - name: body
                type: text
            indexing_settings:
              commit_timeout_secs: 1
            search_settings:
              default_search_fields: [title, body]
            "#,
            quickwit_config::ConfigFormat::Yaml,
            false,
        )
        .await
        .unwrap();

    assert_hits_unordered(
        &sandbox,
        "my-updatable-index",
        "record",
        Ok(&[json!({"title": "first", "body": "first record"})]),
    )
    .await;

    sandbox.shutdown().await.unwrap();
}


================================================
FILE: quickwit/quickwit-integration-tests/test_data/README.md
================================================
some of the assets containing in this directory are test certificates and corresponding private key.
It's not unusual for automatic scanners to pick them up and warn about leaked private keys. These
keys are not meant to be private, so if that happen, feel free to ignore the messages.


================================================
FILE: quickwit/quickwit-integration-tests/test_data/ca.crt
================================================
-----BEGIN CERTIFICATE-----
MIIFCzCCAvOgAwIBAgIUI70aP6K+1YrhuCysdEmmY9LcdXEwDQYJKoZIhvcNAQEL
BQAwFTETMBEGA1UEAwwKcXcgdGVzdCBDQTAeFw0yNDEyMDkxMTM4MDVaFw0zNDEy
MTAxMTM4MDVaMBUxEzARBgNVBAMMCnF3IHRlc3QgQ0EwggIiMA0GCSqGSIb3DQEB
AQUAA4ICDwAwggIKAoICAQDWZLa7Tzkm+hs9itOG4dGsGAOP6FmY7zQtpq2cvi62
GfzQZMrNyhNB49zRPKPmwZ7dTrqP65OHZt6JPn/Pw12reWRGIFHFnw87ybdqCi3W
M9bz6UYdvn5r3g+VrIVDJ0NlBKjv2ZGvv/lpzP3GbbT8hX1UThee8k8SdMMuEQzg
repZnOlby5sfIAZ+40pZagjln+w+wUvzupQpgHGRRPokWVrA6ej4Gx/6mRVFTT4S
dQABfAI6mAeQfkiK0AoN2DuujvDM6noqelePtQCD7X4XCj8QTw+qM8meDLNY92BK
2Y3zMnbBpnLfX1zA6hVWhBeBAfjFuCTxgh54RWGZm7vSFefwtA0c9xV4OXIMlZ95
3OB2W7pB+xGPIaJfH4YOFnAPWrDMBf1HXX4HWPgxahpntgJLwhOpR5FfeKaq8liK
PmFu2nr7PYcQ4yWDyFOy5hWSdsYejwo5IJiQryC+sitPaBIZrXl0Q29vGPqLUn5s
emP0XTsWPrZsm+RYz25Ux+DHEHzWCnRq16Qlye7cBrjJECCuD4dYCR/t8pfWeX4+
vICqaq46QZk5C5hFjPPjrP5ZtmjfScp//TuxyBYuY5D6ZzfUnsm/RfEiWicjOp4/
gWkqsDE1SwOzw0YZFVeZ+c3TBG8A/XxbZ7csFrzzmoGMnF/1bjSpGOAB4M/CubaN
dwIDAQABo1MwUTAdBgNVHQ4EFgQUKihfkQ1qc1VhyRkgnQfvHksi5iswHwYDVR0j
BBgwFoAUKihfkQ1qc1VhyRkgnQfvHksi5iswDwYDVR0TAQH/BAUwAwEB/zANBgkq
hkiG9w0BAQsFAAOCAgEA0jJTDB7hgwJnvWPvc4kKBQGnsIYt4dQFn377GLqPIB8Y
SLdBVVCRQCyssvqEMZe/+38SX8u3UVnBnnVlxuGqBTZJo7KN4geRkruXFVdnSOHF
lHslvPVp2KsYcpjqRspt8NRIkgvx5YGd02q2NUIIyY8JeEkt1B3QurPaUIpTlzWS
6dxVgo1Byyoxoe9BJ/M9bH+73mMTJvSjVKWGIJFvCdNV6twjyoWJeXkL696zquhu
0YdHYxS65AU0NAflBCxgxREr5dql0TruxwLG/6THAJcqmMLUwxyDYIP4P+1k4xtV
KEGKqESdZTUp61AhAOAdsUuK5Iz4HUTb0uB1fzZMVjxA+03VC0/pcum6qP15M+xg
chnQ8fNo0iZCDr3LD4kwsAqoWOQ4oV+ZLBthh6gVmHtuTS3ehMTH99r6T2II+8R1
5rPtE14uelgZJVcxD7z+xWDfODJIhxlWjwxJkBcCkvaGMQU3+kTUe5U6EJL52Z5q
G/Mh4uNceLx1uSuh0/R68AXj5LLmShjSYO7rV7KlFGS0B7iglsgwgs74GUQzt0nq
1Qe7QGsVoSVIabq0Es2gUjiEeRJYg6X7Gy9tAESY//zYW3Qh26/sqGgkYypa9Hy9
w0T+IrQAj2K+LkOEoFwBOdx5qyRlRdd1l7xioJjhjHA+u+e3HBf6fk/VVuFXgBc=
-----END CERTIFICATE-----


================================================
FILE: quickwit/quickwit-integration-tests/test_data/ca.key
================================================
-----BEGIN PRIVATE KEY-----
MIIJRAIBADANBgkqhkiG9w0BAQEFAASCCS4wggkqAgEAAoICAQDWZLa7Tzkm+hs9
itOG4dGsGAOP6FmY7zQtpq2cvi62GfzQZMrNyhNB49zRPKPmwZ7dTrqP65OHZt6J
Pn/Pw12reWRGIFHFnw87ybdqCi3WM9bz6UYdvn5r3g+VrIVDJ0NlBKjv2ZGvv/lp
zP3GbbT8hX1UThee8k8SdMMuEQzgrepZnOlby5sfIAZ+40pZagjln+w+wUvzupQp
gHGRRPokWVrA6ej4Gx/6mRVFTT4SdQABfAI6mAeQfkiK0AoN2DuujvDM6noqeleP
tQCD7X4XCj8QTw+qM8meDLNY92BK2Y3zMnbBpnLfX1zA6hVWhBeBAfjFuCTxgh54
RWGZm7vSFefwtA0c9xV4OXIMlZ953OB2W7pB+xGPIaJfH4YOFnAPWrDMBf1HXX4H
WPgxahpntgJLwhOpR5FfeKaq8liKPmFu2nr7PYcQ4yWDyFOy5hWSdsYejwo5IJiQ
ryC+sitPaBIZrXl0Q29vGPqLUn5semP0XTsWPrZsm+RYz25Ux+DHEHzWCnRq16Ql
ye7cBrjJECCuD4dYCR/t8pfWeX4+vICqaq46QZk5C5hFjPPjrP5ZtmjfScp//Tux
yBYuY5D6ZzfUnsm/RfEiWicjOp4/gWkqsDE1SwOzw0YZFVeZ+c3TBG8A/XxbZ7cs
FrzzmoGMnF/1bjSpGOAB4M/CubaNdwIDAQABAoICAAdp94ZmCJ7tb+W37aAGInRm
EYbMzSm5vpSEOrq8j5b33RiZHl5GylWxUIs3zUnckObW+Hf4+I1qeZrwu1tu8R1N
7FwfH/91LwICnsIe/1N0pXlNLCyOetwLaNSPNmiKbLfglQr+UMhtcMLqNi3CJiEZ
aKpyrORv6AYbsugz6hMW+zoFcBh0OQq21ngAL4EEvAayJL74JkKTxYM4kDTVgs+g
+2odF1OvycemZZLo8eg80uGPl/Ajc8Iua8nJGfU9RgsU9wTPEvxxu0zFQJ2kp9ia
H8YrmxS9XQ/cdpNGsrYZQeG9cVfkWVKaKfX4jQEEk7TVYZ9MwpJLd/bxcfJC7W1t
KjHStiIFuvp5pqfKYgGZPnVdEe8T43naQopvB/IJ8TYp3Jy7Pxl+FP7sHN2F4sgn
tHDdvuWTSQT9DvInvuEzMkFxI0SN1kt/GEA7xg4bd/TUCZgkIS92xxxKG8c/3a2O
BbXc5RpaGreDZn9cYtZ4nihJj7lsqouHAGcVz2oljZaWlJIkOzE/rDHDl2hQtvUg
oTQvsbsFZjm3tf3ZPoDjM5GCM8Z+BG61KAyIuUlZ9QgYANgUMd+XoM+NMpGOmbhZ
pLaCUzSKpVKt58rqepW3uFh+cQFi0kDkT5c9sNHrZtv9xZy0MzuzcErda/fJhASQ
m9xX9dbqsgIoJWsv5NnJAoIBAQD//JOQsTsZSGGPptaV6ctieat2jkemdVGdtGuO
9XjmC26htA0Unv+NBzeBfQ2Lf3nsap9ksw2/abnLAi8Bq6S/utQCVjoh5Kwg3m2d
j/rBDSd+GSPNH31yPki7tLsiLgWZGEo5sYu5bdaHGTXXD6SwY9xAZUT2CN9U83nR
+2OvOvd+oZvKok4DCstPKIYI5oDYgDrmII/4kKjaBfXU3qxWJ7jr4aKOCpUM1Xtd
dTCaDwKWOV4DyNGzn4VjNhLh/QHL1v+EbtZHJp2vqj8X+cLJDCMLJMqTPa/+2FvX
zj4orbh5Yo5APGs0QjT/67CeWbjHoczcZwTaJLY67zdoLGBLAoIBAQDWZ5TC+SZL
71REYW68rGIqa8T2Md9kLHD6h0UOPnReYFLPpE7nmQKp4+25wmuDTQVg2db3Zzxc
+be+JEpi8nJreMjsnyj6x9ufLST/2Hq2Ns9amZsdCXdFPK2zeuvrTh5ahieQ9ywQ
flg1VDOIXN+46Q+/dJmgfLtz5/AFyf/cGDiZ+KpmrZxWYAjV1kYDU1XbQ+IFwP3b
BweULbIw1ugEeXhkj5ecoqCnIhX33VmCMVbu+wuuFW9QOqIFEtpsYs1qf4CH6zW/
gyrgWmJHTBgnPj5XIGRpa+gkUB6dqCCQdpW/F3bdVj1jY6+ef6UXNlCKe0FT2BXR
9jNrfP2iVoQFAoIBAQCsAwcNpWo29QJJyyxKlE2MoIFtKvJOkmsDc+cKqzxQKMJw
elKH1seV9pF/u45MfJ5rFMKCoibMxriIB7Gah8Iu69XmtBZgDA72D0DNLaCr9LDi
9PWvskdTazLonutYbmBonX/TANEJCxuqsHATUXmy5Yds5h/Oy+t2ZB0p0qkLaK5C
M0pCgYm2VZyEVpCqjmlqEdCCLsNPnbU4u+SS5AYd5pdGOdpHZCj/9Lvu8v5zpz5v
v6DDHkB7WOgC4KUTojWAybntPaVTLkmrbtTywWv4OOWbaV+OTVdkAfLFMttl7kYV
mvpHg9HtzcdbaP7HiTa3PqwwNjF2fFDPjUtH/vm9AoIBAQCeGh2ptN4XqrFCB3MI
MDnnPDcusNIhZWAebfdvLIDVQ0Rtl6UTxVIgg1I+4+4yEW7A34JUR81MZlynGs27
rzrOo2/OhQNMAmqiM0EQZMsAaOR408J9JAjOhpM0QZWMm7toV3r/vDTDKNfU43Vo
vcu/6CTTsqDCppf4PXVSX4WMAFRkveix9J3PV9vMC8jvFNm/6YvXYFwR0lo1W4kF
2MOY4RX1WamcOJQtCsaWU6R4i/emHHudcHL3/3SQNznYKPd+6+yUzc6BnbDVZfEI
0EUTUyPXTaydzJOPi4E4Es2ImdmM4zmkt75m9xB+2XOc7VFw/LjMohBdFqcOQUor
Fo8dAoIBAQCsBBs7zNwOhVLBiq1BKMCSQF22snz/0jGgA+pNjNkbZspbVNrRQh3X
ZeBW1akN3z1uueAydMJvkhJjVp2Ub1e3xlQZK71NjT1HscttuZ7FhuGm04r7rWcZ
YtKtakOAuHmrTAaDR0akgPJvdblyhDrB9xjJHZAWyky/WqOwtrVQHE9VOWp5JOBd
Ma++rCEV0CSs/c+Mi5i0EMw3gJrE+x1veWIEbcDT4O6z4oN89GvswvMZxjEIUPlZ
Ignt0ylL665EKdoNfSDBt83XmixaHpNSkIRL/QePMUrSfMVeGwbuqb7v3BBbrGxq
7wK4WKdoN0S5t/D1Sv5mBCaf1RGPP8XQ
-----END PRIVATE KEY-----


================================================
FILE: quickwit/quickwit-integration-tests/test_data/ca.srl
================================================
083453D85C20FF26BD4F878E64C2F3C62316E7A5


================================================
FILE: quickwit/quickwit-integration-tests/test_data/regenerate-certs.sh
================================================
#!/usr/bin/env bash

# this script regenerate cryptographic material used in tests. These are valid for 10y, but better
# keep how to regenerate them than get stuck with failing tests eventually

rm ca.{crt,key,srl} server.{csr,key,v3.ext,crt}
openssl genrsa -out ca.key 4096
openssl req -x509 -new -nodes -key ca.key -sha256 -days 3653 -out ca.crt -subj '/CN=qw test CA'
openssl req -new -nodes -out server.csr -newkey rsa:4096 -keyout server.key -subj '/CN=qw test certificate'

cat > server.v3.ext << EOF
authorityKeyIdentifier=keyid,issuer
basicConstraints=CA:FALSE
keyUsage = digitalSignature, nonRepudiation, keyEncipherment, dataEncipherment
subjectAltName = @alt_names
[alt_names]
DNS.1 = quickwit.local
IP.1 = 127.0.0.1
EOF

openssl x509 -req -in server.csr -CA ca.crt -CAkey ca.key -CAcreateserial -out server.crt -days 3653 -sha256 -extfile server.v3.ext


================================================
FILE: quickwit/quickwit-integration-tests/test_data/server.crt
================================================
-----BEGIN CERTIFICATE-----
MIIFPDCCAySgAwIBAgIUCDRT2Fwg/ya9T4eOZMLzxiMW56UwDQYJKoZIhvcNAQEL
BQAwFTETMBEGA1UEAwwKcXcgdGVzdCBDQTAeFw0yNDEyMDkxMTM4MDVaFw0zNDEy
MTAxMTM4MDVaMB4xHDAaBgNVBAMME3F3IHRlc3QgY2VydGlmaWNhdGUwggIiMA0G
CSqGSIb3DQEBAQUAA4ICDwAwggIKAoICAQCJTizLx2PE0AyHhBBtctCwNw+3JR1Z
jTYmcgcdg4QEN/QE5VvUr3Cf8GZWZLjkzO2zQHExsmofcjGhnfayYnKTecWUryD8
WfC1fGwUGw+X7oef16f/hi2iQokk56WNBfB/rsi5tOH4cLZRszPiuPTP1hLJPpAN
PhmAXqjors2HptMCjwvoD+J6Rjd+H8tflyztSV8GbIRj2Xlkbj9kDclP6Ou9/Ie8
+omaSDXYPefv5jYIDF+w914wfqVn5bCrNSOtVQUOqazBZIKfqmmQxY7uggfdsk8p
u5eCGvA5Ql6PGOCrjSsmw3wuKpxJHS9j+Sg8n65fyB5v4DQxc98RQi9ryGynVF1+
YyuSnQN8A7CGPT8n+dwtApZMishrh8PMCJb9HYHrp1fnzmYcq8hLr0D3BxYPF7vl
wjhq4D5LiZgHLtKtWc30CY2+wjhqQC+FiPq35+XiSvjnNPWD/8oq0sIGJaTnBxVF
aGDhXH+i/HkIlbgDTaPAr9Kt8ZsUmc76LujuBcEyqQKFrQt9kce8xiJHcEz6F5sD
+VGiNrbsme1FE+W16M5CggkT5bjPtiXbcxBPTcByl2qbt2/Hh1fGjiihoC3Gl/0x
UjWJ4QvrG1fshW7Ylzf146genDg987QD9bw6ulCNJ/aT6yGZiBNh3zYIar8DX7sn
nTg2405jfIqiWQIDAQABo3sweTAfBgNVHSMEGDAWgBQqKF+RDWpzVWHJGSCdB+8e
SyLmKzAJBgNVHRMEAjAAMAsGA1UdDwQEAwIE8DAfBgNVHREEGDAWgg5xdWlja3dp
dC5sb2NhbIcEfwAAATAdBgNVHQ4EFgQULWzIQbbWgJ3ZgAx2wNy9Bl5LROIwDQYJ
KoZIhvcNAQELBQADggIBAJgIrxW3tEKsK/gaiSi5Lpng/LvSv2I9/Q7bnDGTKiLN
S6qcdyoiByu/88T1mK+kXyFzY2JSFSaLQgXxDip5kaPY+J8ySRkCii2NuMfMhfTP
/E2t+UEoXW8X87FRvAzGy2jbIPcFkkJE784TYsQhD6bjcKKTXvnAB7pCgu3zz1Xv
zmpN7vmcYwpkWbM2mYlzDYvhNs6XRGTKc0u4ho7VMyqYYBdXyT8KknWxzDLCXkhA
FahUPtm+63WyYDumm4dCuLIk3QjC/kYTcexhZTTlpHv6cnL2YOxcqUEpjCQHCisu
76f8mw9nA4Hm9SAHll2P9lT2cMs8edwhPfAKEk1xlLNvIz2QaG65YbifBPQAOO7S
Dhn32Vm7TIUPbgiP+TrTNjhHICcIALfsz32UuTM5r4VwvkODX64+1hN7GAHlBQPf
IQXogRlP2Dv6Gecrnr4HzP4kftgdDvGq+ULGPYzMszI1mVgrJLgO/1KTqVfN0eLu
Byqq14OodZKd+9RPEMrom+iSNmfgBffmL1zrBmGnUiHgMuzHrc2Eo3bOCguWIwRO
GrJZXmC+ldpy4XXzzulnzX40sgp7LXg7oVgQojWPZ4fEXEdszfb3yAdPqSjg8D73
8T/Z6edpFuVq86y4EM99xpd1I+THLryto6ebSYHOXlj+1fbMbam1kGZo8HE5+oHa
-----END CERTIFICATE-----


================================================
FILE: quickwit/quickwit-integration-tests/test_data/server.csr
================================================
-----BEGIN CERTIFICATE REQUEST-----
MIIEYzCCAksCAQAwHjEcMBoGA1UEAwwTcXcgdGVzdCBjZXJ0aWZpY2F0ZTCCAiIw
DQYJKoZIhvcNAQEBBQADggIPADCCAgoCggIBAIlOLMvHY8TQDIeEEG1y0LA3D7cl
HVmNNiZyBx2DhAQ39ATlW9SvcJ/wZlZkuOTM7bNAcTGyah9yMaGd9rJicpN5xZSv
IPxZ8LV8bBQbD5fuh5/Xp/+GLaJCiSTnpY0F8H+uyLm04fhwtlGzM+K49M/WEsk+
kA0+GYBeqOiuzYem0wKPC+gP4npGN34fy1+XLO1JXwZshGPZeWRuP2QNyU/o6738
h7z6iZpINdg95+/mNggMX7D3XjB+pWflsKs1I61VBQ6prMFkgp+qaZDFju6CB92y
Tym7l4Ia8DlCXo8Y4KuNKybDfC4qnEkdL2P5KDyfrl/IHm/gNDFz3xFCL2vIbKdU
XX5jK5KdA3wDsIY9Pyf53C0ClkyKyGuHw8wIlv0dgeunV+fOZhyryEuvQPcHFg8X
u+XCOGrgPkuJmAcu0q1ZzfQJjb7COGpAL4WI+rfn5eJK+Oc09YP/yirSwgYlpOcH
FUVoYOFcf6L8eQiVuANNo8Cv0q3xmxSZzvou6O4FwTKpAoWtC32Rx7zGIkdwTPoX
mwP5UaI2tuyZ7UUT5bXozkKCCRPluM+2JdtzEE9NwHKXapu3b8eHV8aOKKGgLcaX
/TFSNYnhC+sbV+yFbtiXN/XjqB6cOD3ztAP1vDq6UI0n9pPrIZmIE2HfNghqvwNf
uyedODbjTmN8iqJZAgMBAAGgADANBgkqhkiG9w0BAQsFAAOCAgEAfHtBglg3NED4
1MqoZmS8Q2DEAMgiIiq+CwpPW6yHV2BNBzfxfDezkrzH5b2oNg//IZ2ftCKV86jh
f9cszzhcbW3hre2tIg9CIC61qhp2MoPXeijneNYpGfXAvdXxs8VQB064ZdBj6ZbM
ZfIUdi+C9eb+kcgHBJ6fv4TSuik72f9bY0K7Kem0YoP4aXQ4aeZUkZFKZe2kw3hR
6jhSejHOrkNslXQhQIjjP8t3bx0vU7BdRniz/J0Dq+L/96v/KkGXNk39z5VDF6Ce
wl11KgeezZVNgczk2Xed7tQ/Uf05ptE9re+hYc3tRLW61VIpk93sZAOikm+69su3
IfLPo4Vq6gT1bxIErgwP5kjTb1gQWb+r1g5Yqyrvpiue3ReJ5OpZU6JQic61cOBH
lY50X34DeTzCMeGXbVYMpGybRGRQrMeK4RvULHM5s/FjN56HqpdDqDxH0UoVCF8w
vjJDqqvKHOFlBCUCu5CXBFHDjb6pev6kLP9G9JqnavmDzKdH4+pqp2kH4aOVrYl5
olXiz7l5JWEpwIXvkZa3ve6/cyXwDafbDzcVoq+dgLk8cMqT5uIqJdPjJXO2BCa3
0VzdC8CN8XR9hc3XKbD59zfZJRtw7qD57/EbV3kOTpE+ywCxRRMcjIBgz1ueOwfg
pHiu1g/7+yuiUEmZLOJLeODe6y5Ij3Q=
-----END CERTIFICATE REQUEST-----


================================================
FILE: quickwit/quickwit-integration-tests/test_data/server.key
================================================
-----BEGIN PRIVATE KEY-----
MIIJQQIBADANBgkqhkiG9w0BAQEFAASCCSswggknAgEAAoICAQCJTizLx2PE0AyH
hBBtctCwNw+3JR1ZjTYmcgcdg4QEN/QE5VvUr3Cf8GZWZLjkzO2zQHExsmofcjGh
nfayYnKTecWUryD8WfC1fGwUGw+X7oef16f/hi2iQokk56WNBfB/rsi5tOH4cLZR
szPiuPTP1hLJPpANPhmAXqjors2HptMCjwvoD+J6Rjd+H8tflyztSV8GbIRj2Xlk
bj9kDclP6Ou9/Ie8+omaSDXYPefv5jYIDF+w914wfqVn5bCrNSOtVQUOqazBZIKf
qmmQxY7uggfdsk8pu5eCGvA5Ql6PGOCrjSsmw3wuKpxJHS9j+Sg8n65fyB5v4DQx
c98RQi9ryGynVF1+YyuSnQN8A7CGPT8n+dwtApZMishrh8PMCJb9HYHrp1fnzmYc
q8hLr0D3BxYPF7vlwjhq4D5LiZgHLtKtWc30CY2+wjhqQC+FiPq35+XiSvjnNPWD
/8oq0sIGJaTnBxVFaGDhXH+i/HkIlbgDTaPAr9Kt8ZsUmc76LujuBcEyqQKFrQt9
kce8xiJHcEz6F5sD+VGiNrbsme1FE+W16M5CggkT5bjPtiXbcxBPTcByl2qbt2/H
h1fGjiihoC3Gl/0xUjWJ4QvrG1fshW7Ylzf146genDg987QD9bw6ulCNJ/aT6yGZ
iBNh3zYIar8DX7snnTg2405jfIqiWQIDAQABAoICAAuOuYWTrIm6C3vyuWFFG1zh
3aBIbv6FPOwiiAfLdLbYMOGinsa518yWsz6NbuTPfSisAXsx7e3kslnMzqG4WLWi
N+fqj+e9+F2GciCFIJxk1yS0xe7jz/6LBDlHiG9k8xgEUeAT4juD3UzmPTVV5UGD
XwRykDSVKBdeoHApmqJTAAsEmHd5stIhC/XBXmCW/JCiru1+/+vZt/aksxBMesgP
rpxI3/If0qpabrHbkCTo515pEDr4r4R8fJbQxjy7Fdw2vly8Go8S0032TbmCb6QS
7O+T3UcBg+DPPK5NMGFyMiMumFXEebT3ID2lR8JuDB2CQW7NjQZUxH/vJXUx8YTN
A2Ui7bYulT7g8z0P2UJeJCVXaOYoLgSQxnBJWMi3r/fuZmhC5fGYoBUF4/dwtaVd
ryMqDtaF9O9PilOQ4DsANSWqdBNkCkUObuWab9NDNksXLSDK+1nIeagLnG6U3qgy
DjSZ+LWHIGgTXpbP8KtxxlGeYznFcCH5Jdm/ubK/QyruLmhvrhdm6wXeFJwxt3M/
5CSy8WmM1B3kAZ3a/+RmJGAQwJkGN7gyPdTmLw9yhAiFTrZd/bhMFT08cGTJoGa9
d0yveZ5lFIxFeq12/u0gySx8Xqk2miIKq8OV8xh4M/9kOwUpNl9qMVFaK4G+nSjr
F1Git/7wE384CVMdb90BAoIBAQC8bzFIvkxCRh7ATl9faDcI/vPkwPos3w5fA7hC
HUELI5zdnBlYbd0X0HfUVRi5Lt2KY5AmeCIPLSMDfGMH7IE7LiAn2Jyp7pzVvoIk
EFAdeZ90o3ggj20IRuWNVNCQ0IOSdhSHCeAPsFtQst4lGzp8tFj8VAJl7nzY4moa
JD5sgOaB8WqXNKqWcdmxRGGK5VmXLKSW4ELRq3YNH+AGNquJgqu10hEkhvlpn3Qn
xVJ9KLPAhRHc81+Q8aVA0w73R3wrTmWaFmtDOKDeefB5zVbUYMDXrkEIHys9NXma
0I4ZhXvYjW6lL/ZNgHK3IP/kC0msycFl5H5l6+USJ+vIM96ZAoIBAQC6ib1++LtE
uauKYJsGaq+14s/LxfJ9KiIgxReE/eZRn3rG4LWXgdwwEVsmV1EYCTuCwMvIN+F0
j10YJqyoAtGwiFG4jGac0vDLFs3xx4+tp13aJ7WYCkM25O+9CMa32b89wOzN5lct
TYGrzQn2RhjKh3bGH4sGfaNb4R0kS6X5N1ErKPgGvCXlCrIYgNZyr88uVUeB4m6i
J2FobHpShjPoyaJn24KPwT4+GVnig3MZhbw0s4P25+VbTSMmHvAQmCHdv7MYSuDB
j9DmlvJ0mhoUKi3b1sKa1B9B4HAKVmmSaABfqpk4qdxyXjtUDQwN62YqAQLcmLOP
roxDm/YOdfnBAoIBABfAmGDIBArSleu9tU3scAuFP68VGDPxxfj6Gg7TazCBQ7O3
ioZYCueGkqREOcKWAr0AAdqnh/uLv/8ffcgw6rVQAiOjrVPKTSCwS+1J1R9yBkSI
morYKXFCporjJwsqDXu3wKyo9QJlQ41vjor03LF9dj4QROEeZ8Ra/e7fpLK+qM+2
Y649qEcggMVUjksYz+s7aF/QUvvk9hN/chi2aXcC7qwTl6+YB/ZlcBnXSKeYKthY
rcDBOMmnfCIouJk4/JDk5++9ZbXqfHSuwD5KQOiybXyCbZYdf7DOfc6i/VaAOfU5
FrphylVInK0yzq6rMZVDNUqnu7sTOiPIvnLU/vkCggEARSx1ABPe5jJwIYWHl46S
kEGGy0shjDbGpx5PhXreISCh2ARWctOuQoj9Iy+4G9C4p9k0+I94ZNARNraIylkZ
R3yVyXkPSFKVBsrzHhjh+ASbsh2Nos8Tc9Tb7l7FykHOQGk9p3EmnN8kGgCUFCaU
ZO5tJjVmScbngFfvhZkj+FICIJ41s9Grv88CkkGcxLTbgJQRS2Iborg10BKCHf40
W7wCJL9rIEIKAd9GzM/wK+PDEkwLwNDn5b6qLSXF4nF4BZJkKLsDs+PQFOKfEIxg
5V9q2B5A1keZO8Wt5rd6uNcmZFOQNEoRPLwjBh08fiDwJt1vITzjQYH588xvJ5eq
QQKCAQBX59K+aTukXUBC5clWMspLYUH4Ok8K35cKGbWtuy31EhNUlI+1Bc0ClV2l
uh3+XVv1Uicg+jymYEO229CIZz1XODyYfBSXP9QqJgE5T/W7dy+LOioZe2CDvZPp
2+ftXBaHlCk65EXt+a5LxtuIpc56Djo4yP8yFJRdG0QOSvOqYXK7dODvbTcdwEMa
cR6PUy8hXDsBbqylwqC/ZGK9YDN1J+RCwMWrqR1kDRfVaQolamLk2u+sVTySgSWk
8xyad6Vtj31jVCHhgA3WJgpied1QlRc4S1NXllIN47zHo5iUodj57FR9Ic1FSxT6
tyXdXUmgzPrm/d9zKsxJjionOhie
-----END PRIVATE KEY-----


================================================
FILE: quickwit/quickwit-integration-tests/test_data/server.v3.ext
================================================
authorityKeyIdentifier=keyid,issuer
basicConstraints=CA:FALSE
keyUsage = digitalSignature, nonRepudiation, keyEncipherment, dataEncipherment
subjectAltName = @alt_names
[alt_names]
DNS.1 = quickwit.local
IP.1 = 127.0.0.1


================================================
FILE: quickwit/quickwit-jaeger/Cargo.toml
================================================
[package]
name = "quickwit-jaeger"
description = "Jaeger storage backend"

version.workspace = true
edition.workspace = true
homepage.workspace = true
documentation.workspace = true
repository.workspace = true
authors.workspace = true
license.workspace = true

[dependencies]
async-trait = { workspace = true }
itertools = { workspace = true }
once_cell = { workspace = true }
postcard = { workspace = true }
prost = { workspace = true }
prost-types = { workspace = true }
serde = { workspace = true }
serde_json = { workspace = true }
tantivy = { workspace = true }
time = { workspace = true }
tokio = { workspace = true }
tokio-stream = { workspace = true }
tonic = { workspace = true }
tracing = { workspace = true }

quickwit-common = { workspace = true }
quickwit-config = { workspace = true }
quickwit-opentelemetry = { workspace = true }
quickwit-proto = { workspace = true }
quickwit-query = { workspace = true }
quickwit-search = { workspace = true }

[dev-dependencies]
tempfile = { workspace = true }
time = { workspace = true }

quickwit-actors = { workspace = true }
quickwit-cluster = { workspace = true }
quickwit-common = { workspace = true, features = ["testsuite"] }
quickwit-indexing = { workspace = true, features = ["testsuite"] }
quickwit-ingest = { workspace = true }
quickwit-metastore = { workspace = true, features = ["testsuite"] }
quickwit-opentelemetry = { workspace = true, features = ["testsuite"] }
quickwit-proto = { workspace = true, features = ["testsuite"] }
quickwit-search = { workspace = true, features = ["testsuite"] }
quickwit-storage = { workspace = true, features = ["testsuite"] }

[features]
testsuite = []


================================================
FILE: quickwit/quickwit-jaeger/src/lib.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::HashMap;
use std::mem;
use std::ops::{Bound, RangeInclusive};
use std::sync::Arc;
use std::time::Instant;

use itertools::{Either, Itertools};
use prost::Message;
use prost_types::{Duration as WellKnownDuration, Timestamp as WellKnownTimestamp};
use quickwit_config::JaegerConfig;
use quickwit_opentelemetry::otlp::{
    Event as QwEvent, Link as QwLink, OTEL_TRACES_INDEX_ID, Span as QwSpan, SpanFingerprint,
    SpanId, SpanKind as QwSpanKind, SpanStatus as QwSpanStatus, TraceId,
};
use quickwit_proto::jaeger::api_v2::{
    KeyValue as JaegerKeyValue, Log as JaegerLog, Process as JaegerProcess, Span as JaegerSpan,
    SpanRef as JaegerSpanRef, SpanRefType as JaegerSpanRefType, ValueType,
};
use quickwit_proto::jaeger::storage::v1::{
    FindTraceIDsRequest, FindTraceIDsResponse, FindTracesRequest, GetOperationsRequest,
    GetOperationsResponse, GetServicesRequest, GetServicesResponse, GetTraceRequest, Operation,
    SpansResponseChunk, TraceQueryParameters,
};
use quickwit_proto::opentelemetry::proto::trace::v1::status::StatusCode as OtlpStatusCode;
use quickwit_proto::search::{CountHits, ListTermsRequest, SearchRequest};
use quickwit_query::BooleanOperand;
use quickwit_query::query_ast::{BoolQuery, QueryAst, RangeQuery, TermQuery, UserInputQuery};
use quickwit_search::{FindTraceIdsCollector, SearchService};
use serde::Deserialize;
use serde_json::Value as JsonValue;
use tantivy::collector::Collector;
use time::OffsetDateTime;
use time::format_description::well_known::Rfc3339;
use tokio::sync::mpsc;
use tokio_stream::wrappers::ReceiverStream;
use tonic::Status;
use tracing::field::Empty;
use tracing::{Span as RuntimeSpan, debug, error, instrument, warn};

pub(crate) use crate::metrics::JAEGER_SERVICE_METRICS;

mod metrics;
mod v1;
mod v2;

// OpenTelemetry to Jaeger Transformation
// <https://opentelemetry.io/docs/reference/specification/trace/sdk_exporters/jaeger/>

type TimeIntervalSecs = RangeInclusive<i64>;

pub(crate) type JaegerResult<T> = Result<T, Status>;

pub(crate) type SpanStream = ReceiverStream<Result<SpansResponseChunk, Status>>;

pub(crate) type TracesDataStream =
    ReceiverStream<Result<quickwit_proto::opentelemetry::proto::trace::v1::TracesData, Status>>;

#[derive(Clone)]
pub struct JaegerService {
    search_service: Arc<dyn SearchService>,
    lookback_period_secs: i64,
    max_trace_duration_secs: i64,
    max_fetch_spans: u64,
}

impl JaegerService {
    pub fn new(config: JaegerConfig, search_service: Arc<dyn SearchService>) -> Self {
        Self {
            search_service,
            lookback_period_secs: config.lookback_period().as_secs() as i64,
            max_trace_duration_secs: config.max_trace_duration().as_secs() as i64,
            max_fetch_spans: config.max_fetch_spans.get(),
        }
    }

    #[instrument("get_services", skip_all)]
    pub async fn get_services_for_indexes(
        &self,
        _request: GetServicesRequest,
        index_id_patterns: Vec<String>,
    ) -> JaegerResult<GetServicesResponse> {
        let services = get_services_impl(
            self.search_service.clone(),
            self.lookback_period_secs,
            index_id_patterns,
        )
        .await?;
        Ok(GetServicesResponse { services })
    }

    #[instrument("get_operations", skip_all, fields(service=%request.service, span_kind=%request.span_kind))]
    pub async fn get_operations_for_indexes(
        &self,
        request: GetOperationsRequest,
        index_id_patterns: Vec<String>,
    ) -> JaegerResult<GetOperationsResponse> {
        let operations = get_operations_impl(
            self.search_service.clone(),
            self.lookback_period_secs,
            request.service,
            request.span_kind,
            index_id_patterns,
        )
        .await?;
        Ok(GetOperationsResponse {
            operations,
            operation_names: Vec::new(), // `operation_names` is deprecated.
        })
    }

    // Instrumentation happens in `find_trace_ids`.
    pub async fn find_trace_ids_for_indexes(
        &self,
        request: FindTraceIDsRequest,
        index_id_patterns: Vec<String>,
    ) -> JaegerResult<FindTraceIDsResponse> {
        debug!(request=?request, index_ids=?index_id_patterns, "`find_trace_ids` request");

        let trace_query = request
            .query
            .ok_or_else(|| Status::invalid_argument("Query is empty."))?;

        let (trace_ids, _) = self.find_trace_ids(trace_query, index_id_patterns).await?;
        let trace_ids = trace_ids
            .into_iter()
            .map(|trace_id| trace_id.to_vec())
            .collect();
        debug!(trace_ids=?trace_ids, "`find_trace_ids` response");
        let response = FindTraceIDsResponse { trace_ids };
        Ok(response)
    }

    #[instrument("find_traces", skip_all)]
    pub async fn find_traces_for_indexes(
        &self,
        request: FindTracesRequest,
        operation_name: &'static str,
        request_start: Instant,
        index_id_patterns: Vec<String>,
        root_only: bool,
    ) -> JaegerResult<SpanStream> {
        debug!(request=?request, "`find_traces` request");

        let trace_query = request
            .query
            .ok_or_else(|| Status::invalid_argument("Trace query is empty."))?;
        let (trace_ids, span_timestamps_range) = self
            .find_trace_ids(trace_query, index_id_patterns.clone())
            .await?;
        let start = span_timestamps_range.start() - self.max_trace_duration_secs;
        let end = span_timestamps_range.end() + self.max_trace_duration_secs;
        let search_window = start..=end;
        let response = self
            .stream_spans(
                &trace_ids,
                search_window,
                operation_name,
                request_start,
                index_id_patterns,
                root_only,
            )
            .await?;
        Ok(response)
    }

    #[instrument("get_trace", skip_all)]
    pub async fn get_trace_for_indexes(
        &self,
        request: GetTraceRequest,
        operation_name: &'static str,
        request_start: Instant,
        index_id_patterns: Vec<String>,
    ) -> JaegerResult<SpanStream> {
        debug!(request=?request, "`get_trace` request");
        debug_assert_eq!(request.trace_id.len(), 16);
        let trace_id = TraceId::try_from(request.trace_id)
            .map_err(|error| Status::invalid_argument(error.to_string()))?;
        let end = OffsetDateTime::now_utc().unix_timestamp();
        let start = end - self.lookback_period_secs;
        let search_window = start..=end;
        let response = self
            .stream_spans(
                &[trace_id],
                search_window,
                operation_name,
                request_start,
                index_id_patterns,
                false,
            )
            .await?;
        Ok(response)
    }

    #[instrument("find_trace_ids", skip_all fields(service_name=%trace_query.service_name, operation_name=%trace_query.operation_name))]
    async fn find_trace_ids(
        &self,
        trace_query: TraceQueryParameters,
        index_id_patterns: Vec<String>,
    ) -> Result<(Vec<TraceId>, TimeIntervalSecs), Status> {
        let min_start_secs = trace_query.start_time_min.map(|ts| ts.seconds);
        let max_start_secs = trace_query.start_time_max.map(|ts| ts.seconds);
        let min_duration_millis = trace_query
            .duration_min
            .and_then(|d| to_duration_millis(&d));
        let max_duration_millis = trace_query
            .duration_max
            .and_then(|d| to_duration_millis(&d));

        find_trace_ids_common(
            self.search_service.clone(),
            &trace_query.service_name,
            &trace_query.operation_name,
            trace_query.tags,
            min_start_secs,
            max_start_secs,
            min_duration_millis,
            max_duration_millis,
            trace_query.num_traces as usize,
            index_id_patterns,
        )
        .await
    }
}

#[instrument("find_trace_ids_common", skip_all)]
#[allow(clippy::too_many_arguments)]
pub(crate) async fn find_trace_ids_common(
    search_service: Arc<dyn SearchService>,
    service_name: &str,
    operation_name: &str,
    tags: HashMap<String, String>,
    min_start_secs: Option<i64>,
    max_start_secs: Option<i64>,
    min_duration_millis: Option<i64>,
    max_duration_millis: Option<i64>,
    num_traces: usize,
    index_id_patterns: Vec<String>,
) -> Result<(Vec<TraceId>, TimeIntervalSecs), Status> {
    let query_ast = build_search_query(
        service_name,
        None,
        operation_name,
        tags,
        min_start_secs,
        max_start_secs,
        min_duration_millis,
        max_duration_millis,
    );

    let search_request = SearchRequest {
        index_id_patterns,
        query_ast: serde_json::to_string(&query_ast)
            .map_err(|err| Status::internal(err.to_string()))?,
        aggregation_request: Some(build_aggregations_query(num_traces)),
        max_hits: 0,
        start_timestamp: min_start_secs,
        end_timestamp: max_start_secs,
        count_hits: CountHits::Underestimate.into(),
        ..Default::default()
    };

    let search_response = search_service.root_search(search_request).await?;

    let Some(agg_result_postcard) = search_response.aggregation_postcard else {
        debug!("the query matched no traces");
        return Ok((Vec::new(), 0..=0));
    };

    let trace_ids = collect_trace_ids(&agg_result_postcard)?;
    debug!("the query matched {} traces.", trace_ids.0.len());
    Ok(trace_ids)
}

impl JaegerService {
    #[instrument("stream_spans", skip_all, fields(num_traces=%trace_ids.len(), num_spans=Empty, num_bytes=Empty))]
    async fn stream_spans(
        &self,
        trace_ids: &[TraceId],
        search_window: TimeIntervalSecs,
        operation_name: &'static str,
        request_start: Instant,
        index_id_patterns: Vec<String>,
        root_only: bool,
    ) -> Result<SpanStream, Status> {
        if trace_ids.is_empty() {
            let (_tx, rx) = mpsc::channel(1);
            return Ok(ReceiverStream::new(rx));
        }
        let num_traces = trace_ids.len() as u64;
        let mut query = BoolQuery::default();

        for trace_id in trace_ids {
            let value = trace_id.hex_display();
            let term_query = TermQuery {
                field: "trace_id".to_string(),
                value,
            };
            query.should.push(term_query.into());
        }
        if root_only {
            // we do this so we don't error on old indexes, and instead return both root and non
            // root spans
            let is_root = UserInputQuery {
                user_text: "NOT is_root:false".to_string(),
                default_fields: None,
                default_operator: BooleanOperand::And,
                lenient: true,
            };
            let mut new_query = BoolQuery::default();
            new_query.must.push(query.into());
            new_query.must.push(is_root.into());
            query = new_query;
        }

        let query_ast: QueryAst = query.into();
        let query_ast =
            serde_json::to_string(&query_ast).map_err(|err| Status::internal(err.to_string()))?;

        let search_request = SearchRequest {
            index_id_patterns,
            query_ast,
            start_timestamp: Some(*search_window.start()),
            end_timestamp: Some(*search_window.end()),
            max_hits: self.max_fetch_spans,
            count_hits: CountHits::Underestimate.into(),
            ..Default::default()
        };
        let search_response = match self.search_service.root_search(search_request).await {
            Ok(search_response) => search_response,
            Err(search_error) => {
                error!(search_error=?search_error, "failed to fetch spans");
                record_error(operation_name, request_start);
                return Err(Status::internal("Failed to fetch spans."));
            }
        };
        let mut spans: Vec<JaegerSpan> = Vec::with_capacity(search_response.hits.len());

        for hit in search_response.hits {
            match qw_span_to_jaeger_span(&hit.json) {
                Ok(span) => {
                    spans.push(span);
                }
                Err(status) => {
                    record_error(operation_name, request_start);
                    return Err(status);
                }
            };
        }
        if trace_ids.len() > 1 {
            spans.sort_unstable_by(|left, right| left.trace_id.cmp(&right.trace_id));
        }
        let (tx, rx) = mpsc::channel(2);
        let current_span = RuntimeSpan::current();

        tokio::task::spawn(async move {
            const MAX_CHUNK_LEN: usize = 1_000;
            const MAX_CHUNK_NUM_BYTES: usize = 4 * 1024 * 1024 - 10 * 1024; // 4 MiB, the default max size of gRPC messages, minus some headroom.

            let chunk_len = MAX_CHUNK_LEN.min(spans.len());
            let mut chunk = Vec::with_capacity(chunk_len);
            let mut chunk_num_bytes = 0;
            let mut num_spans_total = 0;
            let mut num_bytes_total = 0;

            while let Some(span) = spans.pop() {
                let span_num_bytes = span.encoded_len();

                if chunk.len() == MAX_CHUNK_LEN
                    || chunk_num_bytes + span_num_bytes > MAX_CHUNK_NUM_BYTES
                {
                    let num_spans = chunk.len();
                    num_spans_total += num_spans;
                    num_bytes_total += chunk_num_bytes;

                    // + 1 to account for the span we just popped from `spans` but haven't yet
                    // appended to `chunk`.
                    let chunk_len = MAX_CHUNK_LEN.min(spans.len() + 1);
                    let chunk = mem::replace(&mut chunk, Vec::with_capacity(chunk_len));
                    if let Err(send_error) = tx.send(Ok(SpansResponseChunk { spans: chunk })).await
                    {
                        debug!(send_error=?send_error, "client disconnected");
                        return;
                    }
                    record_send(operation_name, num_spans, chunk_num_bytes);
                    chunk_num_bytes = 0;
                }
                chunk_num_bytes += span_num_bytes;
                chunk.push(span);
            }
            if !chunk.is_empty() {
                let num_spans = chunk.len();
                num_spans_total += num_spans;
                num_bytes_total += chunk_num_bytes;

                if let Err(send_error) = tx.send(Ok(SpansResponseChunk { spans: chunk })).await {
                    debug!(error=?send_error, "client disconnected");
                    return;
                }
                record_send(operation_name, num_spans, chunk_num_bytes);
            }
            current_span.record("num_spans", num_spans_total);
            current_span.record("num_bytes", num_bytes_total);

            JAEGER_SERVICE_METRICS
                .fetched_traces_total
                .with_label_values([operation_name, OTEL_TRACES_INDEX_ID])
                .inc_by(num_traces);

            let elapsed = request_start.elapsed().as_secs_f64();
            JAEGER_SERVICE_METRICS
                .request_duration_seconds
                .with_label_values([operation_name, OTEL_TRACES_INDEX_ID, "false"])
                .observe(elapsed);
        });
        Ok(ReceiverStream::new(rx))
    }
}

pub(crate) fn record_error(operation_name: &'static str, request_start: Instant) {
    JAEGER_SERVICE_METRICS
        .request_errors_total
        .with_label_values([operation_name, OTEL_TRACES_INDEX_ID])
        .inc();

    let elapsed = request_start.elapsed().as_secs_f64();
    JAEGER_SERVICE_METRICS
        .request_duration_seconds
        .with_label_values([operation_name, OTEL_TRACES_INDEX_ID, "true"])
        .observe(elapsed);
}

pub(crate) fn record_send(operation_name: &'static str, num_spans: usize, num_bytes: usize) {
    JAEGER_SERVICE_METRICS
        .fetched_spans_total
        .with_label_values([operation_name, OTEL_TRACES_INDEX_ID])
        .inc_by(num_spans as u64);
    JAEGER_SERVICE_METRICS
        .transferred_bytes_total
        .with_label_values([operation_name, OTEL_TRACES_INDEX_ID])
        .inc_by(num_bytes as u64);
}

#[allow(deprecated)]
fn extract_term(term_bytes: &[u8]) -> String {
    tantivy::Term::wrap(term_bytes)
        .value()
        .as_str()
        .expect("Term should be a valid UTF-8 string.")
        .to_string()
}

fn extract_operation(term_bytes: &[u8]) -> Operation {
    let term = extract_term(term_bytes);
    let fingerprint = SpanFingerprint::from_string(term);
    let span_name = fingerprint
        .span_name()
        .expect("The span fingerprint should be properly formed.")
        .to_string();
    let span_kind = fingerprint
        .span_kind()
        .map(|span_kind| span_kind.as_jaeger())
        .expect("The span fingerprint should be properly formed.")
        .to_string();
    Operation {
        name: span_name,
        span_kind,
    }
}

#[instrument("get_services", skip_all)]
pub(crate) async fn get_services_impl(
    search_service: Arc<dyn SearchService>,
    lookback_period_secs: i64,
    index_id_patterns: Vec<String>,
) -> Result<Vec<String>, Status> {
    debug!(index_ids=?index_id_patterns, "`get_services` request");

    let max_hits = Some(1_000);
    let start_timestamp = Some(OffsetDateTime::now_utc().unix_timestamp() - lookback_period_secs);

    let search_request = ListTermsRequest {
        index_id_patterns,
        field: "service_name".to_string(),
        max_hits,
        start_timestamp,
        end_timestamp: None,
        start_key: None,
        end_key: None,
    };
    let search_response = search_service.root_list_terms(search_request).await?;
    let services: Vec<String> = search_response
        .terms
        .into_iter()
        .map(|term_bytes| extract_term(&term_bytes))
        .sorted()
        .collect();
    debug!(services=?services, "`get_services` response");
    Ok(services)
}

#[instrument("get_operations", skip_all, fields(service=%service, span_kind=%span_kind))]
pub(crate) async fn get_operations_impl(
    search_service: Arc<dyn SearchService>,
    lookback_period_secs: i64,
    service: String,
    span_kind: String,
    index_id_patterns: Vec<String>,
) -> Result<Vec<Operation>, Status> {
    debug!(service=%service, span_kind=%span_kind, index_ids=?index_id_patterns, "`get_operations` request");

    let max_hits = Some(1_000);
    let start_timestamp = Some(OffsetDateTime::now_utc().unix_timestamp() - lookback_period_secs);

    let span_kind_opt = span_kind.parse().ok();
    let start_key = SpanFingerprint::start_key(&service, span_kind_opt.clone());
    let end_key = SpanFingerprint::end_key(&service, span_kind_opt);

    let search_request = ListTermsRequest {
        index_id_patterns,
        field: "span_fingerprint".to_string(),
        max_hits,
        start_timestamp,
        end_timestamp: None,
        start_key,
        end_key,
    };
    let search_response = search_service.root_list_terms(search_request).await?;
    let operations: Vec<Operation> = search_response
        .terms
        .into_iter()
        .map(|term_json| extract_operation(&term_json))
        .sorted()
        .collect();
    debug!(operations=?operations, "`get_operations` response");
    Ok(operations)
}

// TODO: builder pattern
#[allow(clippy::too_many_arguments)]
pub(crate) fn build_search_query(
    service_name: &str,
    span_kind_opt: Option<QwSpanKind>,
    span_name: &str,
    mut tags: HashMap<String, String>,
    min_span_start_timestamp_secs_opt: Option<i64>,
    max_span_start_timestamp_secs_opt: Option<i64>,
    min_span_duration_millis_opt: Option<i64>,
    max_span_duration_millis_opt: Option<i64>,
) -> QueryAst {
    // TODO disable based on some feature?
    if let Some(qw_query) = tags.remove("_qw_query") {
        return quickwit_query::query_ast::query_ast_from_user_text(&qw_query, None);
    }
    // TODO should we use filter instead of must? Does it changes anything? Less scoring?
    let mut query_ast = BoolQuery::default();

    if !service_name.is_empty() {
        query_ast.must.push(
            TermQuery {
                field: "service_name".to_string(),
                value: service_name.to_string(),
            }
            .into(),
        );
    }
    if let Some(span_kind) = span_kind_opt {
        query_ast.must.push(
            TermQuery {
                field: "span_kind".to_string(),
                value: span_kind.as_char().to_string(),
            }
            .into(),
        )
    }
    if !span_name.is_empty() {
        query_ast.must.push(
            TermQuery {
                field: "span_name".to_string(),
                value: span_name.to_string(),
            }
            .into(),
        )
    }
    if !tags.is_empty() {
        // Sort the tags for deterministic tests.
        for (key, value) in tags.into_iter().sorted() {
            // In Jaeger land, `event` is a regular event attribute whereas in OpenTelemetry land,
            // it is an event top-level field named `name`. In Quickwit, it is stored as
            // `event_name` to distinguish it from the span top-level field `name`.
            if key == "event" {
                query_ast.must.push(
                    TermQuery {
                        field: "events.event_name".to_string(),
                        value,
                    }
                    .into(),
                )
            } else if key == "error" && value == "true" {
                query_ast.must.push(
                    TermQuery {
                        field: "span_status.code".to_string(),
                        value: "error".to_string(),
                    }
                    .into(),
                )
            } else if key == "error" && value == "false" {
                query_ast.must_not.push(
                    TermQuery {
                        field: "span_status.code".to_string(),
                        value: "error".to_string(),
                    }
                    .into(),
                )
            } else {
                let mut sub_query = BoolQuery::default();

                sub_query.should.push(
                    TermQuery {
                        field: format!("resource_attributes.{key}"),
                        value: value.clone(),
                    }
                    .into(),
                );
                sub_query.should.push(
                    TermQuery {
                        field: format!("span_attributes.{key}"),
                        value: value.clone(),
                    }
                    .into(),
                );
                sub_query.should.push(
                    TermQuery {
                        field: format!("events.event_attributes.{key}"),
                        value,
                    }
                    .into(),
                );
                query_ast.must.push(sub_query.into())
            }
        }
    }
    if min_span_start_timestamp_secs_opt.is_some() || max_span_start_timestamp_secs_opt.is_some() {
        let mut start_range = RangeQuery {
            field: "span_start_timestamp_nanos".to_string(),
            lower_bound: Bound::Unbounded,
            upper_bound: Bound::Unbounded,
        };

        if let Some(min_span_start_timestamp_secs) = min_span_start_timestamp_secs_opt {
            let min_span_start_datetime =
                OffsetDateTime::from_unix_timestamp(min_span_start_timestamp_secs)
                    .expect("Timestamp should fall within the [Date::MIN, Date::MAX] interval.");
            let min_span_start_datetime_rfc3339 = min_span_start_datetime
                .format(&Rfc3339)
                .expect("Datetime should be formattable to RFC 3339.");
            start_range.lower_bound = Bound::Included(min_span_start_datetime_rfc3339.into());
        }

        if let Some(max_span_start_timestamp_secs) = max_span_start_timestamp_secs_opt {
            let max_span_start_datetime =
                OffsetDateTime::from_unix_timestamp(max_span_start_timestamp_secs)
                    .expect("Timestamp should fall within the [Date::MIN, Date::MAX] interval.");
            let max_span_start_datetime_rfc3339 = max_span_start_datetime
                .format(&Rfc3339)
                .expect("Datetime should be formattable to RFC 3339.");
            start_range.upper_bound = Bound::Included(max_span_start_datetime_rfc3339.into());
        }

        query_ast.must.push(start_range.into());
    }
    if min_span_duration_millis_opt.is_some() || max_span_duration_millis_opt.is_some() {
        let mut duration_range = RangeQuery {
            field: "span_duration_millis".to_string(),
            lower_bound: Bound::Unbounded,
            upper_bound: Bound::Unbounded,
        };

        if let Some(min_span_duration_millis) = min_span_duration_millis_opt {
            duration_range.lower_bound = Bound::Included(min_span_duration_millis.into());
        }

        if let Some(max_span_duration_millis) = max_span_duration_millis_opt {
            duration_range.upper_bound = Bound::Included(max_span_duration_millis.into());
        }

        query_ast.must.push(duration_range.into());
    }
    if !query_ast.must.is_empty() || !query_ast.must_not.is_empty() {
        query_ast.into()
    } else {
        QueryAst::MatchAll
    }
}

pub(crate) fn build_aggregations_query(num_traces: usize) -> String {
    let query = serde_json::to_string(&FindTraceIdsCollector {
        num_traces,
        trace_id_field_name: "trace_id".to_string(),
        span_timestamp_field_name: "span_start_timestamp_nanos".to_string(),
    })
    .expect("The collector should be JSON serializable.");
    debug!(query=%query, "Aggregations query");
    query
}

#[allow(clippy::result_large_err)]
fn qw_span_to_jaeger_span(qw_span_json: &str) -> Result<JaegerSpan, Status> {
    let mut qw_span: QwSpan = json_deserialize(qw_span_json, "span")?;

    let start_time = Some(to_well_known_timestamp(qw_span.span_start_timestamp_nanos));
    let duration = Some(to_well_known_duration(
        qw_span.span_start_timestamp_nanos,
        qw_span.span_end_timestamp_nanos,
    ));
    qw_span.resource_attributes.remove("service.name");
    let process = Some(JaegerProcess {
        service_name: qw_span.service_name,
        tags: otlp_attributes_to_jaeger_tags(qw_span.resource_attributes),
    });
    let logs: Vec<JaegerLog> = qw_span
        .events
        .into_iter()
        .map(qw_event_to_jaeger_log)
        .collect::<Result<_, _>>()?;

    let mut tags = otlp_attributes_to_jaeger_tags(qw_span.span_attributes);
    inject_dropped_count_tags(
        &mut tags,
        qw_span.span_dropped_attributes_count,
        qw_span.span_dropped_events_count,
        qw_span.span_dropped_links_count,
    );
    inject_span_kind_tag(&mut tags, qw_span.span_kind);
    inject_span_status_tags(&mut tags, qw_span.span_status);

    let references =
        otlp_links_to_jaeger_references(&qw_span.trace_id, qw_span.parent_span_id, qw_span.links)?;

    let span = JaegerSpan {
        trace_id: qw_span.trace_id.to_vec(),
        span_id: qw_span.span_id.to_vec(),
        operation_name: qw_span.span_name,
        references,
        flags: 0, // TODO
        start_time,
        duration,
        tags,
        logs,
        process,
        process_id: "".to_string(), // TODO
        warnings: Vec::new(),       // TODO
    };
    Ok(span)
}

pub(crate) fn to_duration_millis(duration: &WellKnownDuration) -> Option<i64> {
    let duration_millis = duration.seconds * 1_000 + (duration.nanos as i64) / 1_000_000;
    if duration_millis == 0 {
        None
    } else {
        Some(duration_millis)
    }
}

fn to_well_known_timestamp(timestamp_nanos: u64) -> WellKnownTimestamp {
    let seconds = (timestamp_nanos / 1_000_000_000) as i64;
    let nanos = (timestamp_nanos % 1_000_000_000) as i32;
    WellKnownTimestamp { seconds, nanos }
}

fn to_well_known_duration(
    start_timestamp_nanos: u64,
    end_timestamp_nanos: u64,
) -> WellKnownDuration {
    let duration_nanos = end_timestamp_nanos - start_timestamp_nanos;
    let seconds = (duration_nanos / 1_000_000_000) as i64;
    let nanos = (duration_nanos % 1_000_000_000) as i32;
    WellKnownDuration { seconds, nanos }
}

fn inject_dropped_count_tags(
    tags: &mut Vec<JaegerKeyValue>,
    dropped_attributes_count: u32,
    dropped_events_count: u32,
    dropped_links_count: u32,
) {
    for (dropped_count, key) in [
        (dropped_attributes_count, "otel.dropped_attributes_count"),
        (dropped_events_count, "otel.dropped_events_count"),
        (dropped_links_count, "otel.dropped_links_count"),
    ] {
        if dropped_count > 0 {
            tags.push(JaegerKeyValue {
                key: key.to_string(),
                v_type: ValueType::Int64 as i32,
                v_str: String::new(),
                v_bool: false,
                v_int64: dropped_count as i64,
                v_float64: 0.0,
                v_binary: Vec::new(),
            });
        }
    }
}

/// Injects span kind tag.
/// <https://opentelemetry.io/docs/specs/otel/trace/sdk_exporters/jaeger/#spankind>
fn inject_span_kind_tag(tags: &mut Vec<JaegerKeyValue>, span_kind_id: u32) {
    // OpenTelemetry SpanKind field MUST be encoded as span.kind tag in Jaeger span, except for
    // SpanKind.INTERNAL, which SHOULD NOT be translated to a tag.
    let span_kind = match span_kind_id {
        0 | 1 => return,
        2 => "server",
        3 => "client",
        4 => "producer",
        5 => "consumer",
        _ => {
            warn!(span_kind_id=%span_kind_id, "unknown span kind ID");
            return;
        }
    };
    tags.push(JaegerKeyValue {
        key: "span.kind".to_string(),
        v_type: ValueType::String as i32,
        v_str: span_kind.to_string(),
        v_bool: false,
        v_int64: 0,
        v_float64: 0.0,
        v_binary: Vec::new(),
    });
}

/// Injects span status tags.
/// <https://opentelemetry.io/docs/specs/otel/common/mapping-to-non-otlp/#span-status>
fn inject_span_status_tags(tags: &mut Vec<JaegerKeyValue>, span_status: QwSpanStatus) {
    // "Span Status MUST be reported as key-value pairs associated with the Span, unless the Status
    // is UNSET. In the latter case it MUST NOT be reported."
    match span_status.code {
        OtlpStatusCode::Unset => {}
        OtlpStatusCode::Ok => {
            // "Name of the code, either OK or ERROR. MUST NOT be set if the code is UNSET."
            tags.push(JaegerKeyValue {
                key: "otel.status_code".to_string(),
                v_type: ValueType::String as i32,
                v_str: "OK".to_string(),
                v_bool: false,
                v_int64: 0,
                v_float64: 0.0,
                v_binary: Vec::new(),
            });
        }
        OtlpStatusCode::Error => {
            // "Name of the code, either OK or ERROR. MUST NOT be set if the code is UNSET."
            tags.push(JaegerKeyValue {
                key: "otel.status_code".to_string(),
                v_type: ValueType::String as i32,
                v_str: "ERROR".to_string(),
                v_bool: false,
                v_int64: 0,
                v_float64: 0.0,
                v_binary: Vec::new(),
            });
            // "Description of the Status if it has a value otherwise not set."
            if let Some(message) = span_status.message {
                tags.push(JaegerKeyValue {
                    key: "otel.status_description".to_string(),
                    v_type: ValueType::String as i32,
                    v_str: message,
                    v_bool: false,
                    v_int64: 0,
                    v_float64: 0.0,
                    v_binary: Vec::new(),
                });
            }
            // "When Span Status is set to ERROR, an error span tag MUST be added with the Boolean
            // value of true. The added error tag MAY override any previous value."
            tags.push(JaegerKeyValue {
                key: "error".to_string(),
                v_type: ValueType::Bool as i32,
                v_str: String::new(),
                v_bool: true,
                v_int64: 0,
                v_float64: 0.0,
                v_binary: Vec::new(),
            });
        }
    };
}

/// Converts OpenTelemetry attributes to Jaeger tags. Objects are flattened with
/// their keys prefixed with the parent keys delimited by a dot.
///
/// <https://opentelemetry.io/docs/specs/otel/trace/sdk_exporters/jaeger/#attributes>
fn otlp_attributes_to_jaeger_tags(
    attributes: impl IntoIterator<Item = (String, JsonValue)>,
) -> Vec<JaegerKeyValue> {
    otlp_attributes_to_jaeger_tags_inner(attributes, None)
}

/// Inner helper for `otpl_attributes_to_jaeger_tags` recursive call
///
/// PERF: as long as `attributes` IntoIterator implementation correctly sets the
/// lower bound then collect should allocate efficiently. Note that the flat map
/// may cause more allocations as we cannot predict the number of elements in the
/// iterator.
fn otlp_attributes_to_jaeger_tags_inner(
    attributes: impl IntoIterator<Item = (String, JsonValue)>,
    parent_key: Option<&str>,
) -> Vec<JaegerKeyValue> {
    attributes
        .into_iter()
        .map(|(key, value)| {
            let key = parent_key
                .map(|parent_key| format!("{parent_key}.{key}"))
                .unwrap_or(key);
            match value {
                JsonValue::Array(values) => {
                    Either::Left(Some(JaegerKeyValue {
                        key,
                        v_type: ValueType::String as i32,
                        // Array values MUST be serialized to string like a JSON list.
                        v_str: serde_json::to_string(&values).expect(
                            "A vec of `serde_json::Value` values should be JSON serializable.",
                        ),
                        ..Default::default()
                    }))
                }
                JsonValue::Bool(v_bool) => Either::Left(Some(JaegerKeyValue {
                    key,
                    v_type: ValueType::Bool as i32,
                    v_bool,
                    ..Default::default()
                })),
                JsonValue::Number(number) => {
                    let value = if let Some(v_int64) = number.as_i64() {
                        Some(JaegerKeyValue {
                            key,
                            v_type: ValueType::Int64 as i32,
                            v_int64,
                            ..Default::default()
                        })
                    } else if let Some(v_float64) = number.as_f64() {
                        Some(JaegerKeyValue {
                            key,
                            v_type: ValueType::Float64 as i32,
                            v_float64,
                            ..Default::default()
                        })
                    } else {
                        // Print some error rather than silently ignoring the value.
                        warn!("ignoring unrepresentable number value: {number:?}");
                        None
                    };

                    Either::Left(value)
                }
                JsonValue::String(v_str) => Either::Left(Some(JaegerKeyValue {
                    key,
                    v_type: ValueType::String as i32,
                    v_str,
                    ..Default::default()
                })),
                JsonValue::Null => {
                    // No use including null values in the tags, so ignore
                    Either::Left(None)
                }
                JsonValue::Object(value) => {
                    Either::Right(otlp_attributes_to_jaeger_tags_inner(value, Some(&key)))
                }
            }
        })
        .flat_map(|e| e.into_iter())
        .collect()
}

/// Converts OpenTelemetry links to Jaeger span references.
/// <https://opentelemetry.io/docs/specs/otel/trace/sdk_exporters/jaeger/#links>
#[allow(clippy::result_large_err)]
fn otlp_links_to_jaeger_references(
    trace_id: &TraceId,
    parent_span_id_opt: Option<SpanId>,
    links: Vec<QwLink>,
) -> Result<Vec<JaegerSpanRef>, Status> {
    let mut references = Vec::with_capacity(parent_span_id_opt.is_some() as usize + links.len());

    // <https://opentelemetry.io/docs/specs/otel/trace/sdk_exporters/jaeger/#parent-id>
    if let Some(parent_span_id) = parent_span_id_opt {
        let reference = JaegerSpanRef {
            trace_id: trace_id.to_vec(),
            span_id: parent_span_id.to_vec(),
            ref_type: JaegerSpanRefType::ChildOf as i32,
        };
        references.push(reference);
    }
    // "Span references generated from Link(s) MUST be added after the span reference generated from
    // Parent ID, if any."
    for link in links {
        let trace_id = link.link_trace_id.to_vec();
        let span_id = link.link_span_id.to_vec();
        let reference = JaegerSpanRef {
            trace_id,
            span_id,
            ref_type: JaegerSpanRefType::FollowsFrom as i32,
        };
        references.push(reference);
    }
    Ok(references)
}

#[allow(clippy::result_large_err)]
fn qw_event_to_jaeger_log(event: QwEvent) -> Result<JaegerLog, Status> {
    let timestamp = to_well_known_timestamp(event.event_timestamp_nanos);
    // "OpenTelemetry Event’s name field should be added to Jaeger Log’s fields map as follows: name
    // -> event. If OpenTelemetry Event contains an attribute with the key event, it should take
    // precedence over Event’s name field."
    let insert_event_name =
        !event.event_name.is_empty() && !event.event_attributes.contains_key("event");

    let mut fields = otlp_attributes_to_jaeger_tags(event.event_attributes);

    if insert_event_name {
        fields.push(JaegerKeyValue {
            key: "event".to_string(),
            v_type: ValueType::String as i32,
            v_str: event.event_name,
            v_bool: false,
            v_int64: 0,
            v_float64: 0.0,
            v_binary: Vec::new(),
        });
    }
    inject_dropped_count_tags(&mut fields, event.event_dropped_attributes_count, 0, 0);
    let log = JaegerLog {
        timestamp: Some(timestamp),
        fields,
    };
    Ok(log)
}

#[allow(clippy::result_large_err)]
fn collect_trace_ids(
    trace_ids_postcard: &[u8],
) -> Result<(Vec<TraceId>, TimeIntervalSecs), Status> {
    let collector_fruit: <FindTraceIdsCollector as Collector>::Fruit =
        postcard_deserialize(trace_ids_postcard, "trace IDs aggregation")?;
    if collector_fruit.is_empty() {
        return Ok((Vec::new(), 0..=0));
    }
    let mut trace_ids = Vec::with_capacity(collector_fruit.len());
    let mut start = i64::MAX;
    let mut end = i64::MIN;

    for trace_id in collector_fruit {
        trace_ids.push(trace_id.trace_id);
        start = start.min(trace_id.span_timestamp.into_timestamp_secs());
        end = end.max(trace_id.span_timestamp.into_timestamp_secs());
    }
    Ok((trace_ids, start..=end))
}

#[allow(clippy::result_large_err)]
fn json_deserialize<'a, T>(json: &'a str, label: &'static str) -> Result<T, Status>
where T: Deserialize<'a> {
    match serde_json::from_str(json) {
        Ok(deserialized) => Ok(deserialized),
        Err(error) => {
            error!("failed to deserialize {label}: {error:?}");
            Err(Status::internal(format!(
                "Failed to deserialize {label}: {error:?}."
            )))
        }
    }
}

#[allow(clippy::result_large_err)]
fn postcard_deserialize<'a, T>(json: &'a [u8], label: &'static str) -> Result<T, Status>
where T: Deserialize<'a> {
    match postcard::from_bytes(json) {
        Ok(deserialized) => Ok(deserialized),
        Err(error) => {
            error!("failed to deserialize {label}: {error:?}");
            Err(Status::internal(format!(
                "Failed to deserialize {label}: {error:?}."
            )))
        }
    }
}

#[cfg(test)]
mod tests {
    use quickwit_opentelemetry::otlp::{OTEL_TRACES_INDEX_ID_PATTERN, OtelSignal};
    use quickwit_proto::jaeger::api_v2::ValueType;
    use quickwit_proto::jaeger::storage::v1::span_reader_plugin_server::SpanReaderPlugin;
    use quickwit_search::{MockSearchService, QuickwitAggregations, encode_term_for_test};
    use serde_json::json;

    use super::*;

    #[track_caller]
    fn get_must(ast: QueryAst) -> Vec<QueryAst> {
        match ast {
            QueryAst::Bool(boolean_query) => boolean_query.must,
            _ => panic!("expected `QueryAst::Bool`, got `{ast:?}`"),
        }
    }

    #[track_caller]
    fn get_must_not(ast: QueryAst) -> Vec<QueryAst> {
        match ast {
            QueryAst::Bool(boolean_query) => boolean_query.must_not,
            _ => panic!("expected `QueryAst::Bool`, got `{ast:?}`"),
        }
    }

    #[test]
    fn test_build_query() {
        {
            let service_name = "";
            let span_kind = None;
            let span_name = "";
            let tags = HashMap::new();
            let min_span_start_timestamp_secs = None;
            let max_span_start_timestamp_secs = None;
            let min_span_duration_secs = None;
            let max_span_duration_secs = None;
            assert_eq!(
                build_search_query(
                    service_name,
                    span_kind,
                    span_name,
                    tags,
                    min_span_start_timestamp_secs,
                    max_span_start_timestamp_secs,
                    min_span_duration_secs,
                    max_span_duration_secs
                ),
                QueryAst::MatchAll,
            );
        }
        {
            let service_name = "quickwit search";
            let span_kind = None;
            let span_name = "";
            let tags = HashMap::new();
            let min_span_start_timestamp_secs = None;
            let max_span_start_timestamp_secs = None;
            let min_span_duration_secs = None;
            let max_span_duration_secs = None;
            assert_eq!(
                get_must(build_search_query(
                    service_name,
                    span_kind,
                    span_name,
                    tags,
                    min_span_start_timestamp_secs,
                    max_span_start_timestamp_secs,
                    min_span_duration_secs,
                    max_span_duration_secs
                )),
                vec![
                    TermQuery {
                        field: "service_name".to_string(),
                        value: service_name.to_string(),
                    }
                    .into()
                ]
            );
        }
        {
            let service_name = "quickwit";
            let span_kind = None;
            let span_name = "";
            let tags = HashMap::from_iter([("_qw_query".to_string(), "query".to_string())]);
            let min_span_start_timestamp_secs = None;
            let max_span_start_timestamp_secs = None;
            let min_span_duration_secs = None;
            let max_span_duration_secs = None;
            assert_eq!(
                build_search_query(
                    service_name,
                    span_kind,
                    span_name,
                    tags,
                    min_span_start_timestamp_secs,
                    max_span_start_timestamp_secs,
                    min_span_duration_secs,
                    max_span_duration_secs
                ),
                quickwit_query::query_ast::UserInputQuery {
                    user_text: "query".to_string(),
                    default_fields: None,
                    default_operator: quickwit_query::BooleanOperand::And,
                    lenient: false,
                }
                .into()
            );
        }
        {
            let service_name = "";
            let span_kind = "client".parse().ok();
            let span_name = "";
            let tags = HashMap::new();
            let min_span_start_timestamp_secs = None;
            let max_span_start_timestamp_secs = None;
            let min_span_duration_secs = None;
            let max_span_duration_secs = None;
            assert_eq!(
                get_must(build_search_query(
                    service_name,
                    span_kind,
                    span_name,
                    tags,
                    min_span_start_timestamp_secs,
                    max_span_start_timestamp_secs,
                    min_span_duration_secs,
                    max_span_duration_secs
                )),
                vec![
                    TermQuery {
                        field: "span_kind".to_string(),
                        value: "3".to_string(),
                    }
                    .into()
                ]
            );
        }
        {
            let service_name = "";
            let span_kind = None;
            let span_name = "GET /config";
            let tags = HashMap::new();
            let min_span_start_timestamp_secs = None;
            let max_span_start_timestamp_secs = None;
            let min_span_duration_secs = None;
            let max_span_duration_secs = None;
            assert_eq!(
                get_must(build_search_query(
                    service_name,
                    span_kind,
                    span_name,
                    tags,
                    min_span_start_timestamp_secs,
                    max_span_start_timestamp_secs,
                    min_span_duration_secs,
                    max_span_duration_secs
                )),
                vec![
                    TermQuery {
                        field: "span_name".to_string(),
                        value: span_name.to_string(),
                    }
                    .into()
                ]
            );
        }
        {
            let service_name = "";
            let span_kind = None;
            let span_name = "";
            let tags = HashMap::from_iter([("error".to_string(), "true".to_string())]);
            let min_span_start_timestamp_secs = None;
            let max_span_start_timestamp_secs = None;
            let min_span_duration_secs = None;
            let max_span_duration_secs = None;
            assert_eq!(
                get_must(build_search_query(
                    service_name,
                    span_kind,
                    span_name,
                    tags,
                    min_span_start_timestamp_secs,
                    max_span_start_timestamp_secs,
                    min_span_duration_secs,
                    max_span_duration_secs
                )),
                vec![
                    TermQuery {
                        field: "span_status.code".to_string(),
                        value: "error".to_string(),
                    }
                    .into(),
                ],
            );
        }
        {
            let service_name = "";
            let span_kind = None;
            let span_name = "";
            let tags = HashMap::from_iter([("error".to_string(), "false".to_string())]);
            let min_span_start_timestamp_secs = None;
            let max_span_start_timestamp_secs = None;
            let min_span_duration_secs = None;
            let max_span_duration_secs = None;
            assert_eq!(
                get_must_not(build_search_query(
                    service_name,
                    span_kind,
                    span_name,
                    tags,
                    min_span_start_timestamp_secs,
                    max_span_start_timestamp_secs,
                    min_span_duration_secs,
                    max_span_duration_secs
                )),
                vec![
                    TermQuery {
                        field: "span_status.code".to_string(),
                        value: "error".to_string(),
                    }
                    .into(),
                ],
            );
        }
        {
            let service_name = "";
            let span_kind = None;
            let span_name = "";
            let tag_value = "bar baz";
            let tags = HashMap::from_iter([("foo".to_string(), tag_value.to_string())]);
            let min_span_start_timestamp_secs = None;
            let max_span_start_timestamp_secs = None;
            let min_span_duration_secs = None;
            let max_span_duration_secs = None;
            assert_eq!(
                get_must(build_search_query(
                    service_name,
                    span_kind,
                    span_name,
                    tags,
                    min_span_start_timestamp_secs,
                    max_span_start_timestamp_secs,
                    min_span_duration_secs,
                    max_span_duration_secs
                )),
                vec![
                    BoolQuery {
                        should: vec![
                            TermQuery {
                                field: "resource_attributes.foo".to_string(),
                                value: tag_value.to_string(),
                            }
                            .into(),
                            TermQuery {
                                field: "span_attributes.foo".to_string(),
                                value: tag_value.to_string(),
                            }
                            .into(),
                            TermQuery {
                                field: "events.event_attributes.foo".to_string(),
                                value: tag_value.to_string(),
                            }
                            .into(),
                        ],
                        ..Default::default()
                    }
                    .into()
                ]
            );
        }
        {
            let service_name = "";
            let span_kind = None;
            let span_name = "";
            let event_name = "Failed to ...";
            let tags = HashMap::from_iter([("event".to_string(), event_name.to_string())]);
            let min_span_start_timestamp_secs = None;
            let max_span_start_timestamp_secs = None;
            let min_span_duration_secs = None;
            let max_span_duration_secs = None;
            assert_eq!(
                get_must(build_search_query(
                    service_name,
                    span_kind,
                    span_name,
                    tags,
                    min_span_start_timestamp_secs,
                    max_span_start_timestamp_secs,
                    min_span_duration_secs,
                    max_span_duration_secs
                )),
                vec![
                    TermQuery {
                        field: "events.event_name".to_string(),
                        value: event_name.to_string(),
                    }
                    .into()
                ]
            );
        }
        {
            let service_name = "";
            let span_kind = None;
            let span_name = "";
            let tag_value = "bar";
            let event_name = "Failed to ...";
            let tags = HashMap::from_iter([
                ("event".to_string(), event_name.to_string()),
                ("foo".to_string(), tag_value.to_string()),
            ]);
            let min_span_start_timestamp_secs = None;
            let max_span_start_timestamp_secs = None;
            let min_span_duration_secs = None;
            let max_span_duration_secs = None;
            assert_eq!(
                get_must(build_search_query(
                    service_name,
                    span_kind,
                    span_name,
                    tags,
                    min_span_start_timestamp_secs,
                    max_span_start_timestamp_secs,
                    min_span_duration_secs,
                    max_span_duration_secs
                )),
                vec![
                    TermQuery {
                        field: "events.event_name".to_string(),
                        value: event_name.to_string(),
                    }
                    .into(),
                    BoolQuery {
                        should: vec![
                            TermQuery {
                                field: "resource_attributes.foo".to_string(),
                                value: tag_value.to_string(),
                            }
                            .into(),
                            TermQuery {
                                field: "span_attributes.foo".to_string(),
                                value: tag_value.to_string(),
                            }
                            .into(),
                            TermQuery {
                                field: "events.event_attributes.foo".to_string(),
                                value: tag_value.to_string(),
                            }
                            .into(),
                        ],
                        ..Default::default()
                    }
                    .into()
                ]
            );
        }
        {
            let service_name = "";
            let span_kind = None;
            let span_name = "";
            let tags = HashMap::from_iter([
                ("baz".to_string(), "qux".to_string()),
                ("foo".to_string(), "bar".to_string()),
            ]);
            let min_span_start_timestamp_secs = None;
            let max_span_start_timestamp_secs = None;
            let min_span_duration_secs = None;
            let max_span_duration_secs = None;
            assert_eq!(
                get_must(build_search_query(
                    service_name,
                    span_kind,
                    span_name,
                    tags,
                    min_span_start_timestamp_secs,
                    max_span_start_timestamp_secs,
                    min_span_duration_secs,
                    max_span_duration_secs
                )),
                vec![
                    BoolQuery {
                        should: vec![
                            TermQuery {
                                field: "resource_attributes.baz".to_string(),
                                value: "qux".to_string(),
                            }
                            .into(),
                            TermQuery {
                                field: "span_attributes.baz".to_string(),
                                value: "qux".to_string(),
                            }
                            .into(),
                            TermQuery {
                                field: "events.event_attributes.baz".to_string(),
                                value: "qux".to_string(),
                            }
                            .into(),
                        ],
                        ..Default::default()
                    }
                    .into(),
                    BoolQuery {
                        should: vec![
                            TermQuery {
                                field: "resource_attributes.foo".to_string(),
                                value: "bar".to_string(),
                            }
                            .into(),
                            TermQuery {
                                field: "span_attributes.foo".to_string(),
                                value: "bar".to_string(),
                            }
                            .into(),
                            TermQuery {
                                field: "events.event_attributes.foo".to_string(),
                                value: "bar".to_string(),
                            }
                            .into(),
                        ],
                        ..Default::default()
                    }
                    .into()
                ]
            );
        }
        {
            let service_name = "";
            let span_kind = None;
            let span_name = "";
            let tags = HashMap::new();
            let min_span_start_timestamp_secs = Some(3);
            let max_span_start_timestamp_secs = None;
            let min_span_duration_secs = None;
            let max_span_duration_secs = None;
            assert_eq!(
                get_must(build_search_query(
                    service_name,
                    span_kind,
                    span_name,
                    tags,
                    min_span_start_timestamp_secs,
                    max_span_start_timestamp_secs,
                    min_span_duration_secs,
                    max_span_duration_secs
                )),
                vec![
                    RangeQuery {
                        field: "span_start_timestamp_nanos".to_string(),
                        lower_bound: Bound::Included("1970-01-01T00:00:03Z".to_string().into()),
                        upper_bound: Bound::Unbounded
                    }
                    .into()
                ]
            );
        }
        {
            let service_name = "";
            let span_kind = None;
            let span_name = "";
            let tags = HashMap::new();
            let min_span_start_timestamp_secs = None;
            let max_span_start_timestamp_secs = Some(33);
            let min_span_duration_secs = None;
            let max_span_duration_secs = None;
            assert_eq!(
                get_must(build_search_query(
                    service_name,
                    span_kind,
                    span_name,
                    tags,
                    min_span_start_timestamp_secs,
                    max_span_start_timestamp_secs,
                    min_span_duration_secs,
                    max_span_duration_secs
                )),
                vec![
                    RangeQuery {
                        field: "span_start_timestamp_nanos".to_string(),
                        lower_bound: Bound::Unbounded,
                        upper_bound: Bound::Included("1970-01-01T00:00:33Z".to_string().into()),
                    }
                    .into()
                ]
            );
        }
        {
            let service_name = "";
            let span_kind = None;
            let span_name = "";
            let tags = HashMap::new();
            let min_span_start_timestamp_secs = Some(3);
            let max_span_start_timestamp_secs = Some(33);
            let min_span_duration_secs = None;
            let max_span_duration_secs = None;
            assert_eq!(
                get_must(build_search_query(
                    service_name,
                    span_kind,
                    span_name,
                    tags,
                    min_span_start_timestamp_secs,
                    max_span_start_timestamp_secs,
                    min_span_duration_secs,
                    max_span_duration_secs
                )),
                vec![
                    RangeQuery {
                        field: "span_start_timestamp_nanos".to_string(),
                        lower_bound: Bound::Included("1970-01-01T00:00:03Z".to_string().into()),
                        upper_bound: Bound::Included("1970-01-01T00:00:33Z".to_string().into()),
                    }
                    .into()
                ]
            );
        }
        {
            let service_name = "";
            let span_kind = None;
            let span_name = "";
            let tags = HashMap::new();
            let min_span_start_timestamp_secs = None;
            let max_span_start_timestamp_secs = None;
            let min_span_duration_secs = Some(7);
            let max_span_duration_secs = None;
            assert_eq!(
                get_must(build_search_query(
                    service_name,
                    span_kind,
                    span_name,
                    tags,
                    min_span_start_timestamp_secs,
                    max_span_start_timestamp_secs,
                    min_span_duration_secs,
                    max_span_duration_secs
                )),
                vec![
                    RangeQuery {
                        field: "span_duration_millis".to_string(),
                        lower_bound: Bound::Included(7u64.into()),
                        upper_bound: Bound::Unbounded
                    }
                    .into()
                ]
            );
        }
        {
            let service_name = "";
            let span_kind = None;
            let span_name = "";
            let tags = HashMap::new();
            let min_span_start_timestamp_secs = None;
            let max_span_start_timestamp_secs = None;
            let min_span_duration_secs = None;
            let max_span_duration_secs = Some(77);
            assert_eq!(
                get_must(build_search_query(
                    service_name,
                    span_kind,
                    span_name,
                    tags,
                    min_span_start_timestamp_secs,
                    max_span_start_timestamp_secs,
                    min_span_duration_secs,
                    max_span_duration_secs
                )),
                vec![
                    RangeQuery {
                        field: "span_duration_millis".to_string(),
                        lower_bound: Bound::Unbounded,
                        upper_bound: Bound::Included(77u64.into()),
                    }
                    .into()
                ]
            );
        }
        {
            let service_name = "";
            let span_kind = None;
            let span_name = "";
            let tags = HashMap::new();
            let min_span_start_timestamp_secs = None;
            let max_span_start_timestamp_secs = None;
            let min_span_duration_secs = Some(7);
            let max_span_duration_secs = Some(77);
            assert_eq!(
                get_must(build_search_query(
                    service_name,
                    span_kind,
                    span_name,
                    tags,
                    min_span_start_timestamp_secs,
                    max_span_start_timestamp_secs,
                    min_span_duration_secs,
                    max_span_duration_secs
                )),
                vec![
                    RangeQuery {
                        field: "span_duration_millis".to_string(),
                        lower_bound: Bound::Included(7u64.into()),
                        upper_bound: Bound::Included(77u64.into()),
                    }
                    .into()
                ]
            );
        }
        {
            let service_name = "quickwit";
            let span_kind = None;
            let span_name = "";
            let tag_value = "bar";
            let tags = HashMap::from_iter([("foo".to_string(), tag_value.to_string())]);
            let min_span_start_timestamp_secs = None;
            let max_span_start_timestamp_secs = None;
            let min_span_duration_secs = None;
            let max_span_duration_secs = None;
            assert_eq!(
                get_must(build_search_query(
                    service_name,
                    span_kind,
                    span_name,
                    tags,
                    min_span_start_timestamp_secs,
                    max_span_start_timestamp_secs,
                    min_span_duration_secs,
                    max_span_duration_secs
                )),
                vec![
                    TermQuery {
                        field: "service_name".to_string(),
                        value: service_name.to_string(),
                    }
                    .into(),
                    BoolQuery {
                        should: vec![
                            TermQuery {
                                field: "resource_attributes.foo".to_string(),
                                value: tag_value.to_string(),
                            }
                            .into(),
                            TermQuery {
                                field: "span_attributes.foo".to_string(),
                                value: tag_value.to_string(),
                            }
                            .into(),
                            TermQuery {
                                field: "events.event_attributes.foo".to_string(),
                                value: tag_value.to_string(),
                            }
                            .into(),
                        ],
                        ..Default::default()
                    }
                    .into()
                ]
            );
        }
        {
            let service_name = "quickwit";
            let span_kind = "client".parse().ok();
            let span_name = "";
            let tag_value = "bar";
            let tags = HashMap::from_iter([("foo".to_string(), tag_value.to_string())]);
            let min_span_start_timestamp_secs = None;
            let max_span_start_timestamp_secs = None;
            let min_span_duration_secs = None;
            let max_span_duration_secs = None;
            assert_eq!(
                get_must(build_search_query(
                    service_name,
                    span_kind,
                    span_name,
                    tags,
                    min_span_start_timestamp_secs,
                    max_span_start_timestamp_secs,
                    min_span_duration_secs,
                    max_span_duration_secs
                )),
                vec![
                    TermQuery {
                        field: "service_name".to_string(),
                        value: service_name.to_string(),
                    }
                    .into(),
                    TermQuery {
                        field: "span_kind".to_string(),
                        value: "3".to_string()
                    }
                    .into(),
                    BoolQuery {
                        should: vec![
                            TermQuery {
                                field: "resource_attributes.foo".to_string(),
                                value: tag_value.to_string(),
                            }
                            .into(),
                            TermQuery {
                                field: "span_attributes.foo".to_string(),
                                value: tag_value.to_string(),
                            }
                            .into(),
                            TermQuery {
                                field: "events.event_attributes.foo".to_string(),
                                value: tag_value.to_string(),
                            }
                            .into(),
                        ],
                        ..Default::default()
                    }
                    .into()
                ]
            );
        }
        {
            let service_name = "quickwit";
            let span_kind = "client".parse().ok();
            let span_name = "leaf_search";
            let tag_value = "bar";
            let tags = HashMap::from_iter([("foo".to_string(), tag_value.to_string())]);
            let min_span_start_timestamp_secs = None;
            let max_span_start_timestamp_secs = None;
            let min_span_duration_secs = None;
            let max_span_duration_secs = None;
            assert_eq!(
                get_must(build_search_query(
                    service_name,
                    span_kind,
                    span_name,
                    tags,
                    min_span_start_timestamp_secs,
                    max_span_start_timestamp_secs,
                    min_span_duration_secs,
                    max_span_duration_secs
                )),
                vec![
                    TermQuery {
                        field: "service_name".to_string(),
                        value: service_name.to_string(),
                    }
                    .into(),
                    TermQuery {
                        field: "span_kind".to_string(),
                        value: "3".to_string()
                    }
                    .into(),
                    TermQuery {
                        field: "span_name".to_string(),
                        value: span_name.to_string(),
                    }
                    .into(),
                    BoolQuery {
                        should: vec![
                            TermQuery {
                                field: "resource_attributes.foo".to_string(),
                                value: tag_value.to_string(),
                            }
                            .into(),
                            TermQuery {
                                field: "span_attributes.foo".to_string(),
                                value: tag_value.to_string(),
                            }
                            .into(),
                            TermQuery {
                                field: "events.event_attributes.foo".to_string(),
                                value: tag_value.to_string(),
                            }
                            .into(),
                        ],
                        ..Default::default()
                    }
                    .into()
                ]
            );
        }
        {
            let service_name = "quickwit";
            let span_kind = "client".parse().ok();
            let span_name = "leaf_search";
            let tag_value = "bar";
            let tags = HashMap::from_iter([("foo".to_string(), tag_value.to_string())]);
            let min_span_start_timestamp_secs = Some(3);
            let max_span_start_timestamp_secs = Some(33);
            let min_span_duration_secs = Some(7);
            let max_span_duration_secs = Some(77);
            assert_eq!(
                get_must(build_search_query(
                    service_name,
                    span_kind,
                    span_name,
                    tags,
                    min_span_start_timestamp_secs,
                    max_span_start_timestamp_secs,
                    min_span_duration_secs,
                    max_span_duration_secs
                )),
                vec![
                    TermQuery {
                        field: "service_name".to_string(),
                        value: service_name.to_string(),
                    }
                    .into(),
                    TermQuery {
                        field: "span_kind".to_string(),
                        value: "3".to_string()
                    }
                    .into(),
                    TermQuery {
                        field: "span_name".to_string(),
                        value: span_name.to_string(),
                    }
                    .into(),
                    BoolQuery {
                        should: vec![
                            TermQuery {
                                field: "resource_attributes.foo".to_string(),
                                value: tag_value.to_string(),
                            }
                            .into(),
                            TermQuery {
                                field: "span_attributes.foo".to_string(),
                                value: tag_value.to_string(),
                            }
                            .into(),
                            TermQuery {
                                field: "events.event_attributes.foo".to_string(),
                                value: tag_value.to_string(),
                            }
                            .into(),
                        ],
                        ..Default::default()
                    }
                    .into(),
                    RangeQuery {
                        field: "span_start_timestamp_nanos".to_string(),
                        lower_bound: Bound::Included("1970-01-01T00:00:03Z".to_string().into()),
                        upper_bound: Bound::Included("1970-01-01T00:00:33Z".to_string().into()),
                    }
                    .into(),
                    RangeQuery {
                        field: "span_duration_millis".to_string(),
                        lower_bound: Bound::Included(7u64.into()),
                        upper_bound: Bound::Included(77u64.into()),
                    }
                    .into(),
                ]
            );
        }
    }

    #[test]
    fn test_build_aggregations_query() {
        let aggregations_query = build_aggregations_query(77);
        let aggregations: QuickwitAggregations = serde_json::from_str(&aggregations_query).unwrap();
        let QuickwitAggregations::FindTraceIdsAggregation(collector) = aggregations else {
            panic!("Expected find trace IDs aggregation!");
        };
        assert_eq!(collector.num_traces, 77);
        assert_eq!(collector.trace_id_field_name, "trace_id");
        assert_eq!(
            collector.span_timestamp_field_name,
            "span_start_timestamp_nanos"
        );
    }

    #[test]
    fn test_to_duration_millis() {
        {
            let duration = WellKnownDuration {
                seconds: 0,
                nanos: 1,
            };
            let duration_millis = to_duration_millis(&duration);
            assert!(duration_millis.is_none())
        }
        {
            let duration = WellKnownDuration {
                seconds: 1,
                nanos: 1_000_000,
            };
            let duration_millis = to_duration_millis(&duration).unwrap();
            assert_eq!(duration_millis, 1001)
        }
    }

    #[test]
    fn test_to_well_known_duration() {
        let duration = to_well_known_duration(1_000_000_001, 2_000_000_002);
        assert_eq!(duration.seconds, 1);
        assert_eq!(duration.nanos, 1);
    }

    #[test]
    fn test_to_well_known_timestamp() {
        let timestamp = to_well_known_timestamp(1_000_000_001);
        assert_eq!(timestamp.seconds, 1);
        assert_eq!(timestamp.nanos, 1);
    }

    #[test]
    fn test_otlp_attributes_to_jaeger_tags() {
        let mut tags = otlp_attributes_to_jaeger_tags([
            ("array_int".to_string(), json!([1, 2])),
            ("array_str".to_string(), json!(["foo", "bar"])),
            ("bool".to_string(), json!(true)),
            ("float".to_string(), json!(1.0)),
            ("integer".to_string(), json!(1)),
            ("string".to_string(), json!("foo")),
            (
                "object".to_string(),
                json!({
                    "array_int": [1,2],
                    "array_str": ["foo", "bar"],
                    "bool": true,
                    "float": 1.0,
                    "integer": 1,
                    "string": "foo",
                }),
            ),
        ]);
        tags.sort_by(|left, right| left.key.cmp(&right.key));

        // a tag for the 6 keys in the root, plus 6 more for the nested keys
        assert_eq!(tags.len(), 12);

        assert_eq!(tags[0].key, "array_int");
        assert_eq!(tags[0].v_type(), ValueType::String);
        assert_eq!(tags[0].v_str, "[1,2]");

        assert_eq!(tags[1].key, "array_str");
        assert_eq!(tags[1].v_type(), ValueType::String);
        assert_eq!(tags[1].v_str, r#"["foo","bar"]"#);

        assert_eq!(tags[2].key, "bool");
        assert_eq!(tags[2].v_type(), ValueType::Bool);
        assert!(tags[2].v_bool);

        assert_eq!(tags[3].key, "float");
        assert_eq!(tags[3].v_type(), ValueType::Float64);
        assert_eq!(tags[3].v_float64, 1.0);

        assert_eq!(tags[4].key, "integer");
        assert_eq!(tags[4].v_type(), ValueType::Int64);
        assert_eq!(tags[4].v_int64, 1);

        assert_eq!(tags[5].key, "object.array_int");
        assert_eq!(tags[5].v_type(), ValueType::String);
        assert_eq!(tags[5].v_str, "[1,2]");

        assert_eq!(tags[6].key, "object.array_str");
        assert_eq!(tags[6].v_type(), ValueType::String);
        assert_eq!(tags[6].v_str, r#"["foo","bar"]"#);

        assert_eq!(tags[7].key, "object.bool");
        assert_eq!(tags[7].v_type(), ValueType::Bool);
        assert!(tags[7].v_bool);

        assert_eq!(tags[8].key, "object.float");
        assert_eq!(tags[8].v_type(), ValueType::Float64);
        assert_eq!(tags[8].v_float64, 1.0);

        assert_eq!(tags[9].key, "object.integer");
        assert_eq!(tags[9].v_type(), ValueType::Int64);
        assert_eq!(tags[9].v_int64, 1);

        assert_eq!(tags[10].key, "object.string");
        assert_eq!(tags[10].v_type(), ValueType::String);
        assert_eq!(tags[10].v_str, "foo");

        assert_eq!(tags[11].key, "string");
        assert_eq!(tags[11].v_type(), ValueType::String);
        assert_eq!(tags[11].v_str, "foo");
    }

    #[test]
    fn test_inject_dropped_attribute_tag() {
        let mut tags = Vec::new();

        inject_dropped_count_tags(&mut tags, 0, 0, 0);
        assert!(tags.is_empty());

        inject_dropped_count_tags(&mut tags, 1, 2, 3);
        assert_eq!(tags.len(), 3);

        assert_eq!(tags[0].key, "otel.dropped_attributes_count");
        assert_eq!(tags[0].v_type(), ValueType::Int64);
        assert_eq!(tags[0].v_int64, 1);

        assert_eq!(tags[1].key, "otel.dropped_events_count");
        assert_eq!(tags[1].v_type(), ValueType::Int64);
        assert_eq!(tags[1].v_int64, 2);

        assert_eq!(tags[2].key, "otel.dropped_links_count");
        assert_eq!(tags[2].v_type(), ValueType::Int64);
        assert_eq!(tags[2].v_int64, 3);
    }

    #[test]
    fn test_inject_span_kind_tag() {
        {
            let mut tags = Vec::new();
            inject_span_kind_tag(&mut tags, 0);
            assert!(tags.is_empty());
        }
        {
            let mut tags = Vec::new();
            inject_span_kind_tag(&mut tags, 1);
            assert!(tags.is_empty());
        }
        {
            for (expected_span_kind, span_kind_id) in ["server", "client", "producer", "consumer"]
                .iter()
                .zip(2..6)
            {
                let mut tags = Vec::new();
                inject_span_kind_tag(&mut tags, span_kind_id);
                assert_eq!(tags.len(), 1);

                assert_eq!(tags[0].key, "span.kind");
                assert_eq!(tags[0].v_type(), ValueType::String);
                assert_eq!(tags[0].v_str, *expected_span_kind);
            }
        }
    }

    #[test]
    fn test_inject_status_code_tag() {
        {
            let mut tags = Vec::new();
            let span_status = QwSpanStatus {
                code: OtlpStatusCode::Unset,
                message: None,
            };
            inject_span_status_tags(&mut tags, span_status);
            assert!(tags.is_empty());
        }
        {
            let mut tags = Vec::new();
            let span_status = QwSpanStatus {
                code: OtlpStatusCode::Ok,
                message: None,
            };
            inject_span_status_tags(&mut tags, span_status);
            assert_eq!(tags.len(), 1);
            assert_eq!(tags[0].key, "otel.status_code");
            assert_eq!(tags[0].v_type(), ValueType::String);
            assert_eq!(tags[0].v_str, "OK");
        }
        {
            let mut tags = Vec::new();
            let span_status = QwSpanStatus {
                code: OtlpStatusCode::Error,
                message: Some("An error occurred.".to_string()),
            };
            inject_span_status_tags(&mut tags, span_status);
            assert_eq!(tags.len(), 3);

            assert_eq!(tags[0].key, "otel.status_code");
            assert_eq!(tags[0].v_type(), ValueType::String);
            assert_eq!(tags[0].v_str, "ERROR");

            assert_eq!(tags[1].key, "otel.status_description");
            assert_eq!(tags[1].v_type(), ValueType::String);
            assert_eq!(tags[1].v_str, "An error occurred.");

            assert_eq!(tags[2].key, "error");
            assert_eq!(tags[2].v_type(), ValueType::Bool);
            assert!(tags[2].v_bool);
        }
    }

    #[test]
    fn test_qw_event_to_jaeger_logs() {
        {
            let event = QwEvent {
                event_timestamp_nanos: 1_000_000_001,
                event_name: "".to_string(),
                event_attributes: HashMap::from_iter([("foo".to_string(), json!("bar"))]),
                event_dropped_attributes_count: 0,
            };
            let log = qw_event_to_jaeger_log(event).unwrap();
            assert_eq!(
                log.timestamp.unwrap(),
                to_well_known_timestamp(1_000_000_001)
            );
            assert_eq!(log.fields.len(), 1);

            assert_eq!(log.fields[0].key, "foo");
            assert_eq!(log.fields[0].v_type(), ValueType::String);
            assert_eq!(log.fields[0].v_str, "bar");
        }
        {
            let event = QwEvent {
                event_timestamp_nanos: 1_000_000_001,
                event_name: "Failed to ...".to_string(),
                event_attributes: HashMap::from_iter([("foo".to_string(), json!("bar"))]),
                event_dropped_attributes_count: 1,
            };
            let log = qw_event_to_jaeger_log(event).unwrap();
            assert_eq!(log.fields.len(), 3);

            assert_eq!(log.fields[0].key, "foo");
            assert_eq!(log.fields[0].v_type(), ValueType::String);
            assert_eq!(log.fields[0].v_str, "bar");

            assert_eq!(log.fields[1].key, "event");
            assert_eq!(log.fields[1].v_type(), ValueType::String);
            assert_eq!(log.fields[1].v_str, "Failed to ...");

            assert_eq!(log.fields[2].key, "otel.dropped_attributes_count");
            assert_eq!(log.fields[2].v_type(), ValueType::Int64);
            assert_eq!(log.fields[2].v_int64, 1);
        }
        {
            let event = QwEvent {
                event_timestamp_nanos: 1_000_000_001,
                event_name: "Failed to ...".to_string(),
                event_attributes: HashMap::from_iter([("event".to_string(), json!("foo"))]),
                event_dropped_attributes_count: 0,
            };
            let log = qw_event_to_jaeger_log(event).unwrap();
            assert_eq!(log.fields.len(), 1);
            assert_eq!(log.fields[0].key, "event");
            assert_eq!(log.fields[0].v_type(), ValueType::String);
            assert_eq!(log.fields[0].v_str, "foo");
        }
    }

    #[test]
    fn test_qw_span_to_jaeger_span() {
        let qw_span = QwSpan {
            trace_id: TraceId::new([1; 16]),
            trace_state: Some("key1=value1,key2=value2".to_string()),
            service_name: "quickwit".to_string(),
            resource_attributes: HashMap::from_iter([(
                "resource_key".to_string(),
                json!("resource_value"),
            )]),
            resource_dropped_attributes_count: 1,
            scope_name: Some("vector.dev".to_string()),
            scope_version: Some("1.0.0".to_string()),
            scope_attributes: HashMap::from_iter([("scope_key".to_string(), json!("scope_value"))]),
            scope_dropped_attributes_count: 2,
            span_id: SpanId::new([2; 8]),
            span_kind: 2,
            span_name: "publish_split".to_string(),
            span_fingerprint: Some(SpanFingerprint::new("quickwit", 2.into(), "publish_split")),
            span_start_timestamp_nanos: 1_000_000_001,
            span_end_timestamp_nanos: 2_000_000_002,
            span_duration_millis: Some(1_001),
            span_attributes: HashMap::from_iter([("span_key".to_string(), json!("span_value"))]),
            span_dropped_attributes_count: 3,
            span_dropped_events_count: 4,
            span_dropped_links_count: 5,
            span_status: QwSpanStatus {
                code: OtlpStatusCode::Error,
                message: Some("An error occurred.".to_string()),
            },
            parent_span_id: Some(SpanId::new([3; 8])),
            is_root: Some(false),
            events: vec![QwEvent {
                event_timestamp_nanos: 1000500003,
                event_name: "event_name".to_string(),
                event_attributes: HashMap::from_iter([(
                    "event_key".to_string(),
                    json!("event_value"),
                )]),
                event_dropped_attributes_count: 6,
            }],
            event_names: vec!["event_name".to_string()],
            links: vec![QwLink {
                link_trace_id: TraceId::new([4; 16]),
                link_trace_state: Some("link_key1=link_value1,link_key2=link_value2".to_string()),
                link_span_id: SpanId::new([5; 8]),
                link_attributes: HashMap::from_iter([(
                    "link_key".to_string(),
                    json!("link_value"),
                )]),
                link_dropped_attributes_count: 7,
            }],
        };
        let qw_span_json = serde_json::to_string(&qw_span).unwrap();
        let jaeger_span = qw_span_to_jaeger_span(&qw_span_json).unwrap();
        assert_eq!(jaeger_span.trace_id, [1; 16]);
        assert_eq!(jaeger_span.span_id, [2; 8]);
        assert_eq!(jaeger_span.operation_name, "publish_split");
        assert_eq!(
            jaeger_span.references,
            vec![
                JaegerSpanRef {
                    trace_id: vec![1; 16],
                    span_id: vec![3; 8],
                    ref_type: 0,
                },
                JaegerSpanRef {
                    trace_id: vec![4; 16],
                    span_id: vec![5; 8],
                    ref_type: 1,
                }
            ]
        );
        assert_eq!(jaeger_span.flags, 0);
        assert_eq!(
            jaeger_span.start_time.unwrap(),
            WellKnownTimestamp {
                seconds: 1,
                nanos: 1,
            }
        );
        assert_eq!(
            jaeger_span.duration.unwrap(),
            WellKnownDuration {
                seconds: 1,
                nanos: 1,
            }
        );
        assert_eq!(
            jaeger_span.tags,
            vec![
                JaegerKeyValue {
                    key: "span_key".to_string(),
                    v_type: 0,
                    v_str: "span_value".to_string(),
                    v_bool: false,
                    v_int64: 0,
                    v_float64: 0.0,
                    v_binary: Vec::new()
                },
                JaegerKeyValue {
                    key: "otel.dropped_attributes_count".to_string(),
                    v_type: 2,
                    v_str: String::new(),
                    v_bool: false,
                    v_int64: 3,
                    v_float64: 0.0,
                    v_binary: Vec::new()
                },
                JaegerKeyValue {
                    key: "otel.dropped_events_count".to_string(),
                    v_type: 2,
                    v_str: String::new(),
                    v_bool: false,
                    v_int64: 4,
                    v_float64: 0.0,
                    v_binary: Vec::new()
                },
                JaegerKeyValue {
                    key: "otel.dropped_links_count".to_string(),
                    v_type: 2,
                    v_str: String::new(),
                    v_bool: false,
                    v_int64: 5,
                    v_float64: 0.0,
                    v_binary: Vec::new()
                },
                JaegerKeyValue {
                    key: "span.kind".to_string(),
                    v_type: 0,
                    v_str: "server".to_string(),
                    v_bool: false,
                    v_int64: 0,
                    v_float64: 0.0,
                    v_binary: Vec::new()
                },
                JaegerKeyValue {
                    key: "otel.status_code".to_string(),
                    v_type: 0,
                    v_str: "ERROR".to_string(),
                    v_bool: false,
                    v_int64: 0,
                    v_float64: 0.0,
                    v_binary: Vec::new()
                },
                JaegerKeyValue {
                    key: "otel.status_description".to_string(),
                    v_type: 0,
                    v_str: "An error occurred.".to_string(),
                    v_bool: false,
                    v_int64: 0,
                    v_float64: 0.0,
                    v_binary: Vec::new()
                },
                JaegerKeyValue {
                    key: "error".to_string(),
                    v_type: 1,
                    v_str: String::new(),
                    v_bool: true,
                    v_int64: 0,
                    v_float64: 0.0,
                    v_binary: Vec::new()
                },
            ]
        );
        assert_eq!(
            jaeger_span.logs,
            vec![JaegerLog {
                timestamp: Some(WellKnownTimestamp {
                    seconds: 1,
                    nanos: 500003,
                }),
                fields: vec![
                    JaegerKeyValue {
                        key: "event_key".to_string(),
                        v_type: 0,
                        v_str: "event_value".to_string(),
                        v_bool: false,
                        v_int64: 0,
                        v_float64: 0.0,
                        v_binary: Vec::new()
                    },
                    JaegerKeyValue {
                        key: "event".to_string(),
                        v_type: 0,
                        v_str: "event_name".to_string(),
                        v_bool: false,
                        v_int64: 0,
                        v_float64: 0.0,
                        v_binary: Vec::new()
                    },
                    JaegerKeyValue {
                        key: "otel.dropped_attributes_count".to_string(),
                        v_type: 2,
                        v_str: String::new(),
                        v_bool: false,
                        v_int64: 6,
                        v_float64: 0.0,
                        v_binary: Vec::new()
                    },
                ],
            }]
        );
        assert_eq!(
            jaeger_span.process.unwrap(),
            JaegerProcess {
                service_name: "quickwit".to_string(),
                tags: vec![JaegerKeyValue {
                    key: "resource_key".to_string(),
                    v_type: 0,
                    v_str: "resource_value".to_string(),
                    v_bool: false,
                    v_int64: 0,
                    v_float64: 0.0,
                    v_binary: Vec::new()
                }]
            }
        );
        assert!(jaeger_span.warnings.is_empty());
    }

    #[test]
    fn test_otlp_links_to_jaeger_references() {
        let trace_id = TraceId::new([1; 16]);
        let parent_span_id = SpanId::new([3; 8]);
        let links = vec![QwLink {
            link_trace_id: TraceId::new([4; 16]),
            link_trace_state: Some("link_key1=link_value1,link_key2=link_value2".to_string()),
            link_span_id: SpanId::new([5; 8]),
            link_attributes: HashMap::from_iter([("link_key".to_string(), json!("link_value"))]),
            link_dropped_attributes_count: 7,
        }];
        let jaeger_references =
            otlp_links_to_jaeger_references(&trace_id, Some(parent_span_id), links).unwrap();
        assert_eq!(
            jaeger_references,
            vec![
                JaegerSpanRef {
                    trace_id: vec![1; 16],
                    span_id: vec![3; 8],
                    ref_type: 0,
                },
                JaegerSpanRef {
                    trace_id: vec![4; 16],
                    span_id: vec![5; 8],
                    ref_type: 1,
                }
            ]
        );
    }

    #[test]
    fn test_collect_trace_ids() {
        use quickwit_opentelemetry::otlp::TraceId;
        use quickwit_search::Span;
        use tantivy::DateTime;
        {
            let agg_result: Vec<Span> = Vec::new();
            let agg_result_postcard = postcard::to_stdvec(&agg_result).unwrap();
            let (trace_ids, _span_timestamps_range) =
                collect_trace_ids(&agg_result_postcard).unwrap();
            assert!(trace_ids.is_empty());
        }
        {
            let agg_result = vec![Span {
                trace_id: TraceId::new([
                    0x01, 0x01, 0x01, 0x01, 0x01, 0x01, 0x01, 0x01, 0x01, 0x01, 0x01, 0x01, 0x01,
                    0x01, 0x01, 0x01,
                ]),
                span_timestamp: DateTime::from_timestamp_nanos(1684857492783747000),
            }];
            let agg_result_postcard = postcard::to_stdvec(&agg_result).unwrap();
            let (trace_ids, span_timestamps_range) =
                collect_trace_ids(&agg_result_postcard).unwrap();
            assert_eq!(trace_ids.len(), 1);
            assert_eq!(span_timestamps_range, 1684857492..=1684857492);
        }
        {
            let agg_result = vec![
                Span {
                    trace_id: TraceId::new([
                        0x01, 0x02, 0x03, 0x04, 0x05, 0x06, 0x07, 0x08, 0x09, 0x0a, 0x0b, 0x0c,
                        0x0d, 0x0e, 0x0f, 0x10,
                    ]),
                    span_timestamp: DateTime::from_timestamp_nanos(1684857492783747000),
                },
                Span {
                    trace_id: TraceId::new([
                        0x02, 0x02, 0x02, 0x02, 0x02, 0x02, 0x02, 0x02, 0x02, 0x02, 0x02, 0x02,
                        0x02, 0x02, 0x02, 0x02,
                    ]),
                    span_timestamp: DateTime::from_timestamp_nanos(1684857826019627000),
                },
            ];
            let agg_result_postcard = postcard::to_stdvec(&agg_result).unwrap();
            let (trace_ids, span_timestamps_range) =
                collect_trace_ids(&agg_result_postcard).unwrap();
            assert_eq!(trace_ids.len(), 2);
            assert_eq!(span_timestamps_range, 1684857492..=1684857826);
        }
    }

    #[tokio::test]
    async fn test_get_services() {
        let mut service = MockSearchService::new();
        service
            .expect_root_list_terms()
            .withf(|req| {
                req.index_id_patterns == vec![OTEL_TRACES_INDEX_ID_PATTERN]
                    && req.field == "service_name"
                    && req.start_timestamp.is_some()
            })
            .return_once(|_| {
                Ok(quickwit_proto::search::ListTermsResponse {
                    num_hits: 3,
                    terms: vec![
                        encode_term_for_test!("service1"),
                        encode_term_for_test!("service2"),
                        encode_term_for_test!("service3"),
                    ],
                    elapsed_time_micros: 0,
                    errors: Vec::new(),
                })
            });

        let service = Arc::new(service);
        let jaeger = JaegerService::new(JaegerConfig::default(), service);

        let request = tonic::Request::new(GetServicesRequest {});
        let response = jaeger.get_services(request).await.unwrap().into_inner();
        assert_eq!(response.services, &["service1", "service2", "service3"]);
    }

    #[tokio::test]
    async fn test_get_services_on_custom_indexes() {
        let mut service = MockSearchService::new();
        service
            .expect_root_list_terms()
            .withf(|req| {
                req.index_id_patterns == vec!["index-1", "index-3*"]
                    && req.field == "service_name"
                    && req.start_timestamp.is_some()
            })
            .return_once(|_| {
                Ok(quickwit_proto::search::ListTermsResponse {
                    num_hits: 3,
                    terms: vec![
                        encode_term_for_test!("service1"),
                        encode_term_for_test!("service2"),
                        encode_term_for_test!("service3"),
                    ],
                    elapsed_time_micros: 0,
                    errors: Vec::new(),
                })
            });

        let service = Arc::new(service);
        let jaeger = JaegerService::new(JaegerConfig::default(), service);

        let mut request = tonic::Request::new(GetServicesRequest {});
        request.metadata_mut().insert(
            OtelSignal::Traces.header_name(),
            "index-1,index-3*".parse().unwrap(),
        );
        let response = jaeger.get_services(request).await.unwrap().into_inner();
        assert_eq!(response.services, &["service1", "service2", "service3"]);
    }

    #[tokio::test]
    async fn test_v2_get_services() {
        let mut service = MockSearchService::new();
        service
            .expect_root_list_terms()
            .withf(|req| {
                req.index_id_patterns == vec![OTEL_TRACES_INDEX_ID_PATTERN]
                    && req.field == "service_name"
                    && req.start_timestamp.is_some()
            })
            .return_once(|_| {
                Ok(quickwit_proto::search::ListTermsResponse {
                    num_hits: 3,
                    terms: vec![
                        encode_term_for_test!("service1"),
                        encode_term_for_test!("service2"),
                        encode_term_for_test!("service3"),
                    ],
                    elapsed_time_micros: 0,
                    errors: Vec::new(),
                })
            });

        let service = Arc::new(service);
        let jaeger = JaegerService::new(JaegerConfig::default(), service);

        let request =
            tonic::Request::new(quickwit_proto::jaeger::storage::v2::GetServicesRequest {});
        let response =
            quickwit_proto::jaeger::storage::v2::trace_reader_server::TraceReader::get_services(
                &jaeger, request,
            )
            .await
            .unwrap()
            .into_inner();
        assert_eq!(response.services, &["service1", "service2", "service3"]);
    }

    #[tokio::test]
    async fn test_v2_get_operations() {
        let mut service = MockSearchService::new();
        service
            .expect_root_list_terms()
            .withf(|req| {
                req.index_id_patterns == vec![OTEL_TRACES_INDEX_ID_PATTERN]
                    && req.field == "span_fingerprint"
                    && req.start_timestamp.is_some()
            })
            .return_once(|_| {
                let fingerprint1 =
                    SpanFingerprint::new("test-service", QwSpanKind::from(2), "GET /api");
                let fingerprint2 =
                    SpanFingerprint::new("test-service", QwSpanKind::from(3), "POST /data");

                Ok(quickwit_proto::search::ListTermsResponse {
                    num_hits: 2,
                    terms: vec![
                        encode_term_for_test!(fingerprint1.as_str()),
                        encode_term_for_test!(fingerprint2.as_str()),
                    ],
                    elapsed_time_micros: 0,
                    errors: Vec::new(),
                })
            });

        let service = Arc::new(service);
        let jaeger = JaegerService::new(JaegerConfig::default(), service);

        let request =
            tonic::Request::new(quickwit_proto::jaeger::storage::v2::GetOperationsRequest {
                service: "test-service".to_string(),
                span_kind: String::new(),
            });
        let response =
            quickwit_proto::jaeger::storage::v2::trace_reader_server::TraceReader::get_operations(
                &jaeger, request,
            )
            .await
            .unwrap()
            .into_inner();
        assert_eq!(response.operations.len(), 2);
        assert_eq!(response.operations[0].name, "GET /api");
        assert_eq!(response.operations[0].span_kind, "server");
        assert_eq!(response.operations[1].name, "POST /data");
        assert_eq!(response.operations[1].span_kind, "client");
    }

    #[tokio::test]
    async fn test_v2_find_trace_ids() {
        let mut service = MockSearchService::new();
        service
            .expect_root_search()
            .withf(|req| {
                req.index_id_patterns == vec![OTEL_TRACES_INDEX_ID_PATTERN]
                    && req.start_timestamp.is_some()
                    && req.end_timestamp.is_some()
            })
            .return_once(|_| {
                use quickwit_search::Span as TraceSpan;
                use tantivy::DateTime;

                let trace_id_1 =
                    TraceId::new([1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16]);
                let trace_id_2 = TraceId::new([
                    17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32,
                ]);

                let spans = vec![
                    TraceSpan {
                        trace_id: trace_id_1,
                        span_timestamp: DateTime::from_timestamp_secs(1500),
                    },
                    TraceSpan {
                        trace_id: trace_id_2,
                        span_timestamp: DateTime::from_timestamp_secs(1600),
                    },
                ];

                let aggregation_postcard = postcard::to_allocvec(&spans).unwrap();

                Ok(quickwit_proto::search::SearchResponse {
                    num_hits: 2,
                    hits: vec![],
                    elapsed_time_micros: 100,
                    errors: Vec::new(),
                    aggregation_postcard: Some(aggregation_postcard),
                    scroll_id: None,
                    failed_splits: Vec::new(),
                    num_successful_splits: 1,
                })
            });

        let service = Arc::new(service);
        let jaeger = JaegerService::new(JaegerConfig::default(), service);

        let request = tonic::Request::new(quickwit_proto::jaeger::storage::v2::FindTracesRequest {
            query: Some(quickwit_proto::jaeger::storage::v2::TraceQueryParameters {
                service_name: "test-service".to_string(),
                operation_name: String::new(),
                attributes: vec![],
                start_time_min: Some(prost_types::Timestamp {
                    seconds: 1000,
                    nanos: 0,
                }),
                start_time_max: Some(prost_types::Timestamp {
                    seconds: 2000,
                    nanos: 0,
                }),
                duration_min: None,
                duration_max: None,
                search_depth: 10,
            }),
        });
        let response =
            quickwit_proto::jaeger::storage::v2::trace_reader_server::TraceReader::find_trace_i_ds(
                &jaeger, request,
            )
            .await
            .unwrap()
            .into_inner();
        assert_eq!(response.trace_ids.len(), 2);
        assert_eq!(response.trace_ids[0].trace_id.len(), 16);
        assert_eq!(response.trace_ids[1].trace_id.len(), 16);
    }

    #[test]
    fn test_convert_v2_attributes_to_v1_tags() {
        let attributes = vec![
            quickwit_proto::jaeger::storage::v2::KeyValue {
                key: "http.method".to_string(),
                value: Some(quickwit_proto::jaeger::storage::v2::AnyValue {
                    value: Some(
                        quickwit_proto::jaeger::storage::v2::any_value::Value::StringValue(
                            "GET".to_string(),
                        ),
                    ),
                }),
            },
            quickwit_proto::jaeger::storage::v2::KeyValue {
                key: "http.status_code".to_string(),
                value: Some(quickwit_proto::jaeger::storage::v2::AnyValue {
                    value: Some(
                        quickwit_proto::jaeger::storage::v2::any_value::Value::IntValue(200),
                    ),
                }),
            },
            quickwit_proto::jaeger::storage::v2::KeyValue {
                key: "error".to_string(),
                value: Some(quickwit_proto::jaeger::storage::v2::AnyValue {
                    value: Some(
                        quickwit_proto::jaeger::storage::v2::any_value::Value::BoolValue(false),
                    ),
                }),
            },
        ];

        let tags = crate::v2::convert_v2_attributes_to_v1_tags(attributes);
        assert_eq!(tags.len(), 3);
        assert_eq!(tags.get("http.method"), Some(&"GET".to_string()));
        assert_eq!(tags.get("http.status_code"), Some(&"200".to_string()));
        assert_eq!(tags.get("error"), Some(&"false".to_string()));
    }

    // Note: test_spans_to_otel_traces_data was removed as v2 now works directly with
    // native OpenTelemetry format (QwSpan) instead of converting from Jaeger v1 format
}


================================================
FILE: quickwit/quickwit-jaeger/src/metrics.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use once_cell::sync::Lazy;
use quickwit_common::metrics::{
    HistogramVec, IntCounterVec, exponential_buckets, new_counter_vec, new_histogram_vec,
};

pub struct JaegerServiceMetrics {
    pub requests_total: IntCounterVec<2>,
    pub request_errors_total: IntCounterVec<2>,
    pub request_duration_seconds: HistogramVec<3>,
    pub fetched_traces_total: IntCounterVec<2>,
    pub fetched_spans_total: IntCounterVec<2>,
    pub transferred_bytes_total: IntCounterVec<2>,
}

impl Default for JaegerServiceMetrics {
    fn default() -> Self {
        Self {
            requests_total: new_counter_vec(
                "requests_total",
                "Number of requests",
                "jaeger",
                &[],
                ["operation", "index"],
            ),
            request_errors_total: new_counter_vec(
                "request_errors_total",
                "Number of failed requests",
                "jaeger",
                &[],
                ["operation", "index"],
            ),
            request_duration_seconds: new_histogram_vec(
                "request_duration_seconds",
                "Duration of requests",
                "jaeger",
                &[],
                ["operation", "index", "error"],
                exponential_buckets(0.02, 2.0, 8).unwrap(),
            ),
            fetched_traces_total: new_counter_vec(
                "fetched_traces_total",
                "Number of traces retrieved from storage",
                "jaeger",
                &[],
                ["operation", "index"],
            ),
            fetched_spans_total: new_counter_vec(
                "fetched_spans_total",
                "Number of spans retrieved from storage",
                "jaeger",
                &[],
                ["operation", "index"],
            ),
            transferred_bytes_total: new_counter_vec(
                "transferred_bytes_total",
                "Number of bytes transferred",
                "jaeger",
                &[],
                ["operation", "index"],
            ),
        }
    }
}

pub static JAEGER_SERVICE_METRICS: Lazy<JaegerServiceMetrics> =
    Lazy::new(JaegerServiceMetrics::default);


================================================
FILE: quickwit/quickwit-jaeger/src/v1.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

//! Jaeger v1 API implementation (SpanReaderPlugin)

use std::time::Instant;

use async_trait::async_trait;
use quickwit_opentelemetry::otlp::{
    OTEL_TRACES_INDEX_ID, extract_otel_traces_index_id_patterns_from_metadata,
};
use quickwit_proto::jaeger::storage::v1::span_reader_plugin_server::SpanReaderPlugin;
use quickwit_proto::jaeger::storage::v1::{
    FindTraceIDsRequest, FindTraceIDsResponse, FindTracesRequest, GetOperationsRequest,
    GetOperationsResponse, GetServicesRequest, GetServicesResponse, GetTraceRequest,
};
use tonic::{Request, Response, Status};

use crate::metrics::JAEGER_SERVICE_METRICS;
use crate::{JaegerService, SpanStream};

macro_rules! metrics {
    ($expr:expr, [$operation:ident, $($label:expr),*]) => {
        let start = std::time::Instant::now();
        let labels = [stringify!($operation), $($label,)*];
        JAEGER_SERVICE_METRICS.requests_total.with_label_values(labels).inc();
        let (res, is_error) = match $expr {
            ok @ Ok(_) => {
                (ok, "false")
            },
            err @ Err(_) => {
                JAEGER_SERVICE_METRICS.request_errors_total.with_label_values(labels).inc();
                (err, "true")
            },
        };
        let elapsed = start.elapsed().as_secs_f64();
        let labels = [stringify!($operation), $($label,)* is_error];
        JAEGER_SERVICE_METRICS.request_duration_seconds.with_label_values(labels).observe(elapsed);

        return res.map(Response::new);
    };
}

#[async_trait]
impl SpanReaderPlugin for JaegerService {
    type GetTraceStream = SpanStream;

    type FindTracesStream = SpanStream;

    async fn get_services(
        &self,
        request: Request<GetServicesRequest>,
    ) -> Result<Response<GetServicesResponse>, Status> {
        let index_id_patterns =
            extract_otel_traces_index_id_patterns_from_metadata(request.metadata())?;
        metrics!(
            self.get_services_for_indexes(request.into_inner(), index_id_patterns)
                .await,
            [get_services, OTEL_TRACES_INDEX_ID]
        );
    }

    async fn get_operations(
        &self,
        request: Request<GetOperationsRequest>,
    ) -> Result<Response<GetOperationsResponse>, Status> {
        let index_id_patterns =
            extract_otel_traces_index_id_patterns_from_metadata(request.metadata())?;
        metrics!(
            self.get_operations_for_indexes(request.into_inner(), index_id_patterns)
                .await,
            [get_operations, OTEL_TRACES_INDEX_ID]
        );
    }

    async fn find_trace_i_ds(
        &self,
        request: Request<FindTraceIDsRequest>,
    ) -> Result<Response<FindTraceIDsResponse>, Status> {
        let index_id_patterns =
            extract_otel_traces_index_id_patterns_from_metadata(request.metadata())?;
        metrics!(
            self.find_trace_ids_for_indexes(request.into_inner(), index_id_patterns)
                .await,
            [find_trace_ids, OTEL_TRACES_INDEX_ID]
        );
    }

    async fn find_traces(
        &self,
        request: Request<FindTracesRequest>,
    ) -> Result<Response<Self::FindTracesStream>, Status> {
        let index_id_patterns =
            extract_otel_traces_index_id_patterns_from_metadata(request.metadata())?;
        self.find_traces_for_indexes(
            request.into_inner(),
            "find_traces",
            Instant::now(),
            index_id_patterns,
            false, /* if we use true, Jaeger will display "1 Span", and display an empty trace
                    * when clicking on the ui (but display the full trace after reloading the
                    * page) */
        )
        .await
        .map(Response::new)
    }

    async fn get_trace(
        &self,
        request: Request<GetTraceRequest>,
    ) -> Result<Response<Self::GetTraceStream>, Status> {
        let index_id_patterns =
            extract_otel_traces_index_id_patterns_from_metadata(request.metadata())?;
        self.get_trace_for_indexes(
            request.into_inner(),
            "get_trace",
            Instant::now(),
            index_id_patterns,
        )
        .await
        .map(Response::new)
    }
}


================================================
FILE: quickwit/quickwit-jaeger/src/v2.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

// Jaeger v2 API implementation (TraceReader)
use std::collections::HashMap;
use std::sync::Arc;
use std::time::Instant;

use async_trait::async_trait;
use prost_types::Timestamp as WellKnownTimestamp;
use quickwit_opentelemetry::otlp::{
    OTEL_TRACES_INDEX_ID, Span as QwSpan, TraceId,
    extract_otel_traces_index_id_patterns_from_metadata,
};
use quickwit_proto::jaeger::storage::v2::trace_reader_server::TraceReader;
use quickwit_proto::jaeger::storage::v2::{
    FindTracesRequest, FoundTraceId, GetOperationsRequest, GetOperationsResponse,
    GetServicesRequest, GetServicesResponse, GetTracesRequest, Operation,
};
use quickwit_proto::opentelemetry::proto::common::v1::any_value::Value as OtelValue;
use quickwit_proto::opentelemetry::proto::common::v1::{
    AnyValue as OtelAnyValue, InstrumentationScope, KeyValue as OtelKeyValue,
};
use quickwit_proto::opentelemetry::proto::resource::v1::Resource as OtelResource;
use quickwit_proto::opentelemetry::proto::trace::v1 as otel_trace;
use quickwit_proto::opentelemetry::proto::trace::v1::status::StatusCode as OtelStatusCode;
use quickwit_proto::opentelemetry::proto::trace::v1::{
    ResourceSpans, ScopeSpans, Span as OtelSpan, Status as OtelStatus,
};
use quickwit_proto::search::{CountHits, SearchRequest};
use quickwit_query::BooleanOperand;
use quickwit_query::query_ast::{BoolQuery, QueryAst, TermQuery, UserInputQuery};
use quickwit_search::SearchService;
use serde_json::Value as JsonValue;
use time::OffsetDateTime;
use tokio::sync::mpsc;
use tokio_stream::wrappers::ReceiverStream;
use tonic::{Request, Response, Status};
use tracing::field::Empty;
use tracing::{Span as RuntimeSpan, debug, error, instrument};

use crate::metrics::JAEGER_SERVICE_METRICS;
use crate::{
    JaegerService, TimeIntervalSecs, TracesDataStream, get_operations_impl, get_services_impl,
    json_deserialize, record_error, record_send, to_duration_millis,
};

macro_rules! metrics {
    ($expr:expr, [$operation:ident, $($label:expr),*]) => {
        let start = std::time::Instant::now();
        let labels = [stringify!($operation), $($label,)*];
        JAEGER_SERVICE_METRICS.requests_total.with_label_values(labels).inc();
        let (res, is_error) = match $expr {
            ok @ Ok(_) => {
                (ok, "false")
            },
            err @ Err(_) => {
                JAEGER_SERVICE_METRICS.request_errors_total.with_label_values(labels).inc();
                (err, "true")
            },
        };
        let elapsed = start.elapsed().as_secs_f64();
        let labels = [stringify!($operation), $($label,)* is_error];
        JAEGER_SERVICE_METRICS.request_duration_seconds.with_label_values(labels).observe(elapsed);

        return res.map(Response::new);
    };
}

#[async_trait]
impl TraceReader for JaegerService {
    async fn get_services(
        &self,
        request: Request<GetServicesRequest>,
    ) -> Result<Response<GetServicesResponse>, Status> {
        let index_id_patterns =
            extract_otel_traces_index_id_patterns_from_metadata(request.metadata())?;

        let services = get_services_impl(
            self.search_service.clone(),
            self.lookback_period_secs,
            index_id_patterns,
        )
        .await?;

        let response = GetServicesResponse { services };
        metrics!(Ok(response), [get_services_v2, OTEL_TRACES_INDEX_ID]);
    }

    async fn get_operations(
        &self,
        request: Request<GetOperationsRequest>,
    ) -> Result<Response<GetOperationsResponse>, Status> {
        let index_id_patterns =
            extract_otel_traces_index_id_patterns_from_metadata(request.metadata())?;

        let req = request.into_inner();

        let operations = get_operations_impl(
            self.search_service.clone(),
            self.lookback_period_secs,
            req.service,
            req.span_kind,
            index_id_patterns,
        )
        .await?
        .into_iter()
        .map(|op| Operation {
            name: op.name,
            span_kind: op.span_kind,
        })
        .collect();

        let response = GetOperationsResponse { operations };
        metrics!(Ok(response), [get_operations_v2, OTEL_TRACES_INDEX_ID]);
    }

    type GetTracesStream = TracesDataStream;

    async fn get_traces(
        &self,
        request: Request<GetTracesRequest>,
    ) -> Result<Response<Self::GetTracesStream>, Status> {
        let request_start = Instant::now();
        let index_id_patterns =
            extract_otel_traces_index_id_patterns_from_metadata(request.metadata())?;

        let (tx, rx) = mpsc::channel(2);
        let search_service = self.search_service.clone();
        let max_fetch_spans = self.max_fetch_spans;
        let lookback_period_secs = self.lookback_period_secs;
        let query_list = request.into_inner().query;

        tokio::task::spawn(async move {
            for query_params in query_list {
                let trace_id = match TraceId::try_from(query_params.trace_id) {
                    Ok(id) => id,
                    Err(error) => {
                        let _ = tx
                            .send(Err(Status::invalid_argument(error.to_string())))
                            .await;
                        return;
                    }
                };

                let end = OffsetDateTime::now_utc().unix_timestamp();
                let search_window = (end - lookback_period_secs)..=end;

                let otel_spans = match stream_otel_spans_impl(
                    search_service.clone(),
                    max_fetch_spans,
                    &[trace_id],
                    search_window,
                    "get_traces_v2",
                    request_start,
                    index_id_patterns.clone(),
                    false,
                )
                .await
                {
                    Ok(spans) => spans,
                    Err(e) => {
                        let _ = tx.send(Err(e)).await;
                        return;
                    }
                };

                if tx
                    .send(Ok(qw_spans_to_otel_traces_data(otel_spans)))
                    .await
                    .is_err()
                {
                    return;
                }
            }
        });

        Ok(Response::new(ReceiverStream::new(rx)))
    }

    type FindTracesStream = TracesDataStream;

    async fn find_traces(
        &self,
        request: Request<FindTracesRequest>,
    ) -> Result<Response<Self::FindTracesStream>, Status> {
        let request_start = Instant::now();

        let index_id_patterns =
            extract_otel_traces_index_id_patterns_from_metadata(request.metadata())?;

        let query = request
            .into_inner()
            .query
            .ok_or_else(|| Status::invalid_argument("Query is empty."))?;

        let (trace_ids, span_timestamps_range) = find_trace_ids_impl(
            self.search_service.clone(),
            self.max_trace_duration_secs,
            query,
            index_id_patterns.clone(),
        )
        .await?;

        let search_window = (span_timestamps_range.start() - self.max_trace_duration_secs)
            ..=(span_timestamps_range.end() + self.max_trace_duration_secs);

        let (tx, rx) = mpsc::channel(2);
        let search_service = self.search_service.clone();
        let max_fetch_spans = self.max_fetch_spans;

        tokio::task::spawn(async move {
            let all_spans = match stream_otel_spans_impl(
                search_service,
                max_fetch_spans,
                &trace_ids,
                search_window,
                "find_traces_v2",
                request_start,
                index_id_patterns,
                false,
            )
            .await
            {
                Ok(spans) => spans,
                Err(e) => {
                    let _ = tx.send(Err(e)).await;
                    return;
                }
            };

            // Group by trace_id and send each trace
            let mut spans_by_trace: HashMap<Vec<u8>, Vec<QwSpan>> = HashMap::new();
            for span in all_spans {
                spans_by_trace
                    .entry(span.trace_id.to_vec())
                    .or_default()
                    .push(span);
            }

            for spans in spans_by_trace.into_values() {
                if tx
                    .send(Ok(qw_spans_to_otel_traces_data(spans)))
                    .await
                    .is_err()
                {
                    return;
                }
            }
        });

        Ok(Response::new(ReceiverStream::new(rx)))
    }

    async fn find_trace_i_ds(
        &self,
        request: Request<quickwit_proto::jaeger::storage::v2::FindTracesRequest>,
    ) -> Result<Response<quickwit_proto::jaeger::storage::v2::FindTraceIDsResponse>, Status> {
        let index_id_patterns =
            extract_otel_traces_index_id_patterns_from_metadata(request.metadata())?;

        let query = request
            .into_inner()
            .query
            .ok_or_else(|| Status::invalid_argument("Query is empty."))?;

        let (trace_ids, time_range) = find_trace_ids_impl(
            self.search_service.clone(),
            self.max_trace_duration_secs,
            query,
            index_id_patterns,
        )
        .await?;

        let trace_ids = trace_ids
            .into_iter()
            .map(|trace_id| FoundTraceId {
                trace_id: trace_id.to_vec(),
                start: Some(WellKnownTimestamp {
                    seconds: *time_range.start(),
                    nanos: 0,
                }),
                end: Some(WellKnownTimestamp {
                    seconds: *time_range.end(),
                    nanos: 0,
                }),
            })
            .collect();

        let response = quickwit_proto::jaeger::storage::v2::FindTraceIDsResponse { trace_ids };
        metrics!(Ok(response), [find_trace_ids_v2, OTEL_TRACES_INDEX_ID]);
    }
}

// === Helper functions ===
#[instrument("find_trace_ids", skip_all)]
async fn find_trace_ids_impl(
    search_service: Arc<dyn SearchService>,
    _max_trace_duration_secs: i64,
    query: quickwit_proto::jaeger::storage::v2::TraceQueryParameters,
    index_id_patterns: Vec<String>,
) -> Result<(Vec<TraceId>, TimeIntervalSecs), Status> {
    debug!(service_name=%query.service_name, operation_name=%query.operation_name, "`find_trace_ids` request");

    let min_start_secs = query.start_time_min.as_ref().map(|ts| ts.seconds);
    let max_start_secs = query.start_time_max.as_ref().map(|ts| ts.seconds);
    let min_duration_millis = query.duration_min.as_ref().and_then(to_duration_millis);
    let max_duration_millis = query.duration_max.as_ref().and_then(to_duration_millis);
    let tags = convert_v2_attributes_to_v1_tags(query.attributes);

    crate::find_trace_ids_common(
        search_service,
        &query.service_name,
        &query.operation_name,
        tags,
        min_start_secs,
        max_start_secs,
        min_duration_millis,
        max_duration_millis,
        query.search_depth as usize,
        index_id_patterns,
    )
    .await
}

#[instrument("stream_otel_spans", skip_all, fields(num_traces=%trace_ids.len(), num_spans=Empty, num_bytes=Empty))]
#[allow(clippy::too_many_arguments)]
async fn stream_otel_spans_impl(
    search_service: Arc<dyn SearchService>,
    max_fetch_spans: u64,
    trace_ids: &[TraceId],
    search_window: TimeIntervalSecs,
    operation_name: &'static str,
    request_start: Instant,
    index_id_patterns: Vec<String>,
    root_only: bool,
) -> Result<Vec<QwSpan>, Status> {
    if trace_ids.is_empty() {
        return Ok(Vec::new());
    }

    let mut query = BoolQuery::default();

    for trace_id in trace_ids {
        let value = trace_id.hex_display();
        let term_query = TermQuery {
            field: "trace_id".to_string(),
            value,
        };
        query.should.push(term_query.into());
    }

    if root_only {
        let is_root = UserInputQuery {
            user_text: "NOT is_root:false".to_string(),
            default_fields: None,
            default_operator: BooleanOperand::And,
            lenient: true,
        };
        let mut new_query = BoolQuery::default();
        new_query.must.push(query.into());
        new_query.must.push(is_root.into());
        query = new_query;
    }

    let query_ast: QueryAst = query.into();
    let query_ast =
        serde_json::to_string(&query_ast).map_err(|err| Status::internal(err.to_string()))?;

    let search_request = SearchRequest {
        index_id_patterns,
        query_ast,
        start_timestamp: Some(*search_window.start()),
        end_timestamp: Some(*search_window.end()),
        max_hits: max_fetch_spans,
        count_hits: CountHits::Underestimate.into(),
        ..Default::default()
    };

    let search_response = match search_service.root_search(search_request).await {
        Ok(search_response) => search_response,
        Err(search_error) => {
            error!(search_error=?search_error, "failed to fetch spans");
            record_error(operation_name, request_start);
            return Err(Status::internal("Failed to fetch spans."));
        }
    };

    let mut qw_spans: Vec<QwSpan> = Vec::with_capacity(search_response.hits.len());

    for hit in search_response.hits {
        match qw_span_from_json(&hit.json) {
            Ok(span) => {
                qw_spans.push(span);
            }
            Err(status) => {
                record_error(operation_name, request_start);
                return Err(status);
            }
        };
    }

    if trace_ids.len() > 1 {
        qw_spans.sort_unstable_by(|left, right| left.trace_id.cmp(&right.trace_id));
    }

    let num_spans = qw_spans.len();
    let num_bytes = qw_spans
        .iter()
        .map(|span| serde_json::to_string(span).unwrap_or_default().len())
        .sum::<usize>();

    RuntimeSpan::current().record("num_spans", num_spans);
    RuntimeSpan::current().record("num_bytes", num_bytes);

    record_send(operation_name, num_spans, num_bytes);

    JAEGER_SERVICE_METRICS
        .fetched_traces_total
        .with_label_values([operation_name, OTEL_TRACES_INDEX_ID])
        .inc_by(trace_ids.len() as u64);

    let elapsed = request_start.elapsed().as_secs_f64();
    JAEGER_SERVICE_METRICS
        .request_duration_seconds
        .with_label_values([operation_name, OTEL_TRACES_INDEX_ID, "false"])
        .observe(elapsed);

    Ok(qw_spans)
}

// === Conversion functions ===
// Note: record_error and record_send are now shared in lib.rs

/// Direct conversion from Quickwit's native OpenTelemetry span to Jaeger v2's OpenTelemetry format
fn qw_spans_to_otel_traces_data(
    qw_spans: Vec<QwSpan>,
) -> quickwit_proto::opentelemetry::proto::trace::v1::TracesData {
    // Group spans by service
    let mut spans_by_service: HashMap<String, Vec<QwSpan>> = HashMap::new();
    for span in qw_spans {
        spans_by_service
            .entry(span.service_name.clone())
            .or_default()
            .push(span);
    }

    let resource_spans = spans_by_service
        .into_iter()
        .map(|(service_name, spans)| {
            // Get resource attributes from first span before grouping
            let first_span_attrs = spans
                .first()
                .map(|span| span.resource_attributes.clone())
                .unwrap_or_default();

            // Group by scope
            let mut spans_by_scope: HashMap<(Option<String>, Option<String>), Vec<QwSpan>> =
                HashMap::new();
            for span in spans {
                let key = (span.scope_name.clone(), span.scope_version.clone());
                spans_by_scope.entry(key).or_default().push(span);
            }

            let scope_spans = spans_by_scope
                .into_iter()
                .map(|((scope_name, scope_version), spans)| {
                    let otel_spans = spans.into_iter().map(qw_span_to_otel_span).collect();

                    ScopeSpans {
                        scope: Some(InstrumentationScope {
                            name: scope_name.unwrap_or_default(),
                            version: scope_version.unwrap_or_default(),
                            attributes: vec![],
                            dropped_attributes_count: 0,
                        }),
                        spans: otel_spans,
                        schema_url: String::new(),
                    }
                })
                .collect();

            let mut resource_attrs = vec![OtelKeyValue {
                key: "service.name".to_string(),
                value: Some(OtelAnyValue {
                    value: Some(OtelValue::StringValue(service_name)),
                }),
            }];

            // Add other resource attributes
            for (key, value) in first_span_attrs {
                resource_attrs.push(json_value_to_otel_kv(key, value));
            }

            ResourceSpans {
                resource: Some(OtelResource {
                    attributes: resource_attrs,
                    dropped_attributes_count: 0,
                }),
                scope_spans,
                schema_url: String::new(),
            }
        })
        .collect();

    quickwit_proto::opentelemetry::proto::trace::v1::TracesData { resource_spans }
}

/// Convert a Quickwit span (native OTEL format) to Jaeger v2 OTEL span
fn qw_span_to_otel_span(qw_span: QwSpan) -> OtelSpan {
    OtelSpan {
        trace_id: qw_span.trace_id.to_vec(),
        span_id: qw_span.span_id.to_vec(),
        trace_state: qw_span.trace_state.unwrap_or_default(),
        parent_span_id: qw_span
            .parent_span_id
            .map(|id| id.to_vec())
            .unwrap_or_default(),
        name: qw_span.span_name,
        kind: qw_span.span_kind as i32,
        start_time_unix_nano: qw_span.span_start_timestamp_nanos,
        end_time_unix_nano: qw_span.span_end_timestamp_nanos,
        attributes: qw_span
            .span_attributes
            .into_iter()
            .map(|(k, v)| json_value_to_otel_kv(k, v))
            .collect(),
        dropped_attributes_count: qw_span.span_dropped_attributes_count,
        events: qw_span
            .events
            .into_iter()
            .map(|event| otel_trace::span::Event {
                time_unix_nano: event.event_timestamp_nanos,
                name: event.event_name,
                attributes: event
                    .event_attributes
                    .into_iter()
                    .map(|(k, v)| json_value_to_otel_kv(k, v))
                    .collect(),
                dropped_attributes_count: event.event_dropped_attributes_count,
            })
            .collect(),
        dropped_events_count: qw_span.span_dropped_events_count,
        links: qw_span
            .links
            .into_iter()
            .map(|link| otel_trace::span::Link {
                trace_id: link.link_trace_id.to_vec(),
                span_id: link.link_span_id.to_vec(),
                trace_state: link.link_trace_state.unwrap_or_default(),
                attributes: link
                    .link_attributes
                    .into_iter()
                    .map(|(k, v)| json_value_to_otel_kv(k, v))
                    .collect(),
                dropped_attributes_count: link.link_dropped_attributes_count,
            })
            .collect(),
        dropped_links_count: qw_span.span_dropped_links_count,
        status: Some(OtelStatus {
            message: qw_span.span_status.message.unwrap_or_default(),
            code: match qw_span.span_status.code {
                quickwit_proto::opentelemetry::proto::trace::v1::status::StatusCode::Unset => {
                    OtelStatusCode::Unset as i32
                }
                quickwit_proto::opentelemetry::proto::trace::v1::status::StatusCode::Ok => {
                    OtelStatusCode::Ok as i32
                }
                quickwit_proto::opentelemetry::proto::trace::v1::status::StatusCode::Error => {
                    OtelStatusCode::Error as i32
                }
            },
        }),
    }
}

fn json_value_to_otel_kv(key: String, value: JsonValue) -> OtelKeyValue {
    let otel_value = match value {
        JsonValue::String(s) => OtelValue::StringValue(s),
        JsonValue::Number(n) => {
            if let Some(i) = n.as_i64() {
                OtelValue::IntValue(i)
            } else if let Some(f) = n.as_f64() {
                OtelValue::DoubleValue(f)
            } else {
                OtelValue::StringValue(n.to_string())
            }
        }
        JsonValue::Bool(b) => OtelValue::BoolValue(b),
        JsonValue::Array(_) | JsonValue::Object(_) => OtelValue::StringValue(value.to_string()),
        JsonValue::Null => OtelValue::StringValue(String::new()),
    };

    OtelKeyValue {
        key,
        value: Some(OtelAnyValue {
            value: Some(otel_value),
        }),
    }
}

#[allow(clippy::result_large_err)]
fn qw_span_from_json(qw_span_json: &str) -> Result<QwSpan, Status> {
    json_deserialize(qw_span_json, "span")
}

pub(crate) fn convert_v2_attributes_to_v1_tags(
    attributes: Vec<quickwit_proto::jaeger::storage::v2::KeyValue>,
) -> HashMap<String, String> {
    attributes
        .into_iter()
        .filter_map(|kv| {
            let value = kv.value?.value?;
            let string_value = match value {
                quickwit_proto::jaeger::storage::v2::any_value::Value::StringValue(s) => s,
                quickwit_proto::jaeger::storage::v2::any_value::Value::IntValue(i) => i.to_string(),
                quickwit_proto::jaeger::storage::v2::any_value::Value::DoubleValue(d) => {
                    d.to_string()
                }
                quickwit_proto::jaeger::storage::v2::any_value::Value::BoolValue(b) => {
                    b.to_string()
                }
                _ => return None,
            };
            Some((kv.key, string_value))
        })
        .collect()
}


================================================
FILE: quickwit/quickwit-janitor/Cargo.toml
================================================
[package]
name = "quickwit-janitor"
description = "Janitor service implementation"

version.workspace = true
edition.workspace = true
homepage.workspace = true
documentation.workspace = true
repository.workspace = true
authors.workspace = true
license.workspace = true

[dependencies]
anyhow = { workspace = true }
async-trait = { workspace = true }
futures = { workspace = true }
itertools = { workspace = true }
once_cell = { workspace = true }
serde = { workspace = true }
serde_json = { workspace = true }
tantivy = { workspace = true }
thiserror = { workspace = true }
time = { workspace = true }
tokio = { workspace = true }
tracing = { workspace = true }
utoipa = { workspace = true }

quickwit-actors = { workspace = true }
quickwit-common = { workspace = true }
quickwit-config = { workspace = true }
quickwit-doc-mapper = { workspace = true }
quickwit-index-management = { workspace = true }
quickwit-indexing = { workspace = true }
quickwit-metastore = { workspace = true }
quickwit-proto = { workspace = true }
quickwit-query = { workspace = true }
quickwit-search = { workspace = true }
quickwit-storage = { workspace = true }

[features]
testsuite = []

[dev-dependencies]
mockall = { workspace = true }
tempfile = { workspace = true }

quickwit-actors = { workspace = true, features = ["testsuite"] }
quickwit-common = { workspace = true, features = ["testsuite"] }
quickwit-config = { workspace = true, features = ["testsuite"] }
quickwit-indexing = { workspace = true, features = ["testsuite"] }
quickwit-metastore = { workspace = true, features = ["testsuite"] }
quickwit-proto = { workspace = true, features = ["testsuite"] }
quickwit-search = { workspace = true, features = ["testsuite"] }
quickwit-storage = { workspace = true, features = ["testsuite"] }


================================================
FILE: quickwit/quickwit-janitor/src/actors/delete_task_pipeline.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::path::PathBuf;
use std::sync::Arc;
use std::time::Duration;

use async_trait::async_trait;
use quickwit_actors::{
    Actor, ActorContext, ActorExitStatus, ActorHandle, Handler, Mailbox, Supervisor,
    SupervisorState,
};
use quickwit_common::io::IoControls;
use quickwit_common::pubsub::EventBroker;
use quickwit_common::temp_dir::{self};
use quickwit_common::uri::Uri;
use quickwit_config::build_doc_mapper;
use quickwit_indexing::actors::{
    MergeExecutor, MergeSchedulerService, MergeSplitDownloader, Packager, Publisher,
    PublisherCounters, Uploader, UploaderCounters, UploaderType,
};
use quickwit_indexing::merge_policy::merge_policy_from_settings;
use quickwit_indexing::{IndexingSplitStore, PublisherType, SplitsUpdateMailbox};
use quickwit_metastore::IndexMetadataResponseExt;
use quickwit_proto::indexing::MergePipelineId;
use quickwit_proto::metastore::{IndexMetadataRequest, MetastoreService, MetastoreServiceClient};
use quickwit_proto::types::{IndexUid, NodeId};
use quickwit_search::SearchJobPlacer;
use quickwit_storage::Storage;
use serde::Serialize;
use tokio::join;
use tracing::info;

use super::delete_task_planner::DeleteTaskPlanner;
use crate::actors::delete_task_planner::DeleteTaskPlannerState;

const OBSERVE_PIPELINE_INTERVAL: Duration = if cfg!(any(test, feature = "testsuite")) {
    Duration::from_millis(500)
} else {
    // 1 minute.
    // This is only for observation purpose, not supervision.
    Duration::from_secs(60)
};

struct DeletePipelineHandle {
    pub delete_task_planner: ActorHandle<Supervisor<DeleteTaskPlanner>>,
    pub downloader: ActorHandle<Supervisor<MergeSplitDownloader>>,
    pub delete_task_executor: ActorHandle<Supervisor<MergeExecutor>>,
    pub packager: ActorHandle<Supervisor<Packager>>,
    pub uploader: ActorHandle<Supervisor<Uploader>>,
    pub publisher: ActorHandle<Supervisor<Publisher>>,
}

/// A Struct to hold all statistical data about deletes.
#[derive(Clone, Debug, Default, Serialize)]
pub struct DeleteTaskPipelineState {
    pub delete_task_planner: SupervisorState<DeleteTaskPlannerState>,
    pub downloader: SupervisorState<()>,
    pub delete_task_executor: SupervisorState<()>,
    pub packager: SupervisorState<()>,
    pub uploader: SupervisorState<UploaderCounters>,
    pub publisher: SupervisorState<PublisherCounters>,
}

pub struct DeleteTaskPipeline {
    index_uid: IndexUid,
    metastore: MetastoreServiceClient,
    search_job_placer: SearchJobPlacer,
    index_storage: Arc<dyn Storage>,
    delete_service_task_dir: PathBuf,
    handles: Option<DeletePipelineHandle>,
    max_concurrent_split_uploads: usize,
    state: DeleteTaskPipelineState,
    merge_scheduler_service: Mailbox<MergeSchedulerService>,
    event_broker: EventBroker,
}

#[async_trait]
impl Actor for DeleteTaskPipeline {
    type ObservableState = DeleteTaskPipelineState;

    fn observable_state(&self) -> Self::ObservableState {
        self.state.clone()
    }

    fn name(&self) -> String {
        "DeleteTaskPipeline".to_string()
    }

    async fn initialize(&mut self, ctx: &ActorContext<Self>) -> Result<(), ActorExitStatus> {
        self.spawn_pipeline(ctx).await?;
        self.handle(Observe, ctx).await?;
        Ok(())
    }

    async fn finalize(
        &mut self,
        _exit_status: &ActorExitStatus,
        _ctx: &ActorContext<Self>,
    ) -> anyhow::Result<()> {
        if let Some(handles) = self.handles.take() {
            join!(
                handles.delete_task_planner.quit(),
                handles.downloader.quit(),
                handles.delete_task_executor.quit(),
                handles.packager.quit(),
                handles.uploader.quit(),
                handles.publisher.quit(),
            );
        };
        Ok(())
    }
}

impl DeleteTaskPipeline {
    #[allow(clippy::too_many_arguments)]
    pub fn new(
        index_uid: IndexUid,
        metastore: MetastoreServiceClient,
        search_job_placer: SearchJobPlacer,
        index_storage: Arc<dyn Storage>,
        delete_service_task_dir: PathBuf,
        max_concurrent_split_uploads: usize,
        merge_scheduler_service: Mailbox<MergeSchedulerService>,
        event_broker: EventBroker,
    ) -> Self {
        Self {
            index_uid,
            metastore,
            search_job_placer,
            index_storage,
            delete_service_task_dir,
            handles: Default::default(),
            max_concurrent_split_uploads,
            state: DeleteTaskPipelineState::default(),
            merge_scheduler_service,
            event_broker,
        }
    }

    pub async fn spawn_pipeline(&mut self, ctx: &ActorContext<Self>) -> anyhow::Result<()> {
        info!(
            index_uid=%self.index_uid,
            root_dir=%self.delete_service_task_dir.to_str().unwrap(),
            "spawning delete tasks pipeline",
        );
        let index_config = self
            .metastore
            .index_metadata(IndexMetadataRequest::for_index_uid(self.index_uid.clone()))
            .await?
            .deserialize_index_metadata()?
            .into_index_config();
        let publisher = Publisher::new(
            PublisherType::MergePublisher,
            self.metastore.clone(),
            None,
            None,
        );
        let (publisher_mailbox, publisher_supervisor_handler) =
            ctx.spawn_actor().supervise(publisher);
        let split_store =
            IndexingSplitStore::create_without_local_store_for_test(self.index_storage.clone());
        let merge_policy = merge_policy_from_settings(&index_config.indexing_settings);
        let uploader = Uploader::new(
            UploaderType::DeleteUploader,
            self.metastore.clone(),
            merge_policy,
            index_config.retention_policy_opt.clone(),
            split_store.clone(),
            SplitsUpdateMailbox::Publisher(publisher_mailbox),
            self.max_concurrent_split_uploads,
            self.event_broker.clone(),
        );
        let (uploader_mailbox, uploader_supervisor_handler) = ctx.spawn_actor().supervise(uploader);

        let doc_mapper =
            build_doc_mapper(&index_config.doc_mapping, &index_config.search_settings)?;
        let tag_fields = doc_mapper.tag_named_fields()?;
        let packager = Packager::new("MergePackager", tag_fields, uploader_mailbox);
        let (packager_mailbox, packager_supervisor_handler) = ctx.spawn_actor().supervise(packager);
        let pipeline_id = MergePipelineId {
            node_id: NodeId::from("unknown"),
            index_uid: self.index_uid.clone(),
            source_id: "unknown".to_string(),
        };

        let delete_executor_io_controls = IoControls::default().set_component("deleter");

        let split_download_io_controls = delete_executor_io_controls
            .clone()
            .set_component("split_downloader_delete");
        let delete_executor = MergeExecutor::new(
            pipeline_id,
            self.metastore.clone(),
            doc_mapper.clone(),
            delete_executor_io_controls,
            packager_mailbox,
        );
        let (delete_executor_mailbox, task_executor_supervisor_handler) =
            ctx.spawn_actor().supervise(delete_executor);
        let scratch_directory = temp_dir::Builder::default()
            .join(&self.index_uid.index_id)
            .join(&self.index_uid.incarnation_id.to_string())
            .tempdir_in(&self.delete_service_task_dir)?;
        let merge_split_downloader = MergeSplitDownloader {
            scratch_directory,
            split_store,
            executor_mailbox: delete_executor_mailbox,
            io_controls: split_download_io_controls,
        };
        let (downloader_mailbox, downloader_supervisor_handler) =
            ctx.spawn_actor().supervise(merge_split_downloader);
        let doc_mapper_str = serde_json::to_string(&doc_mapper)?;
        let index_uri: &Uri = &index_config.index_uri;
        let task_planner = DeleteTaskPlanner::new(
            self.index_uid.clone(),
            index_uri.clone(),
            doc_mapper_str,
            self.metastore.clone(),
            self.search_job_placer.clone(),
            downloader_mailbox,
            self.merge_scheduler_service.clone(),
        );
        let (_, task_planner_supervisor_handler) = ctx.spawn_actor().supervise(task_planner);
        self.handles = Some(DeletePipelineHandle {
            delete_task_planner: task_planner_supervisor_handler,
            downloader: downloader_supervisor_handler,
            delete_task_executor: task_executor_supervisor_handler,
            packager: packager_supervisor_handler,
            uploader: uploader_supervisor_handler,
            publisher: publisher_supervisor_handler,
        });
        Ok(())
    }
}

#[derive(Debug)]
struct Observe;

#[async_trait]
impl Handler<Observe> for DeleteTaskPipeline {
    type Reply = ();
    async fn handle(
        &mut self,
        _: Observe,
        ctx: &ActorContext<Self>,
    ) -> Result<(), ActorExitStatus> {
        if let Some(handles) = &self.handles {
            handles.delete_task_planner.refresh_observe();
            handles.downloader.refresh_observe();
            handles.delete_task_executor.refresh_observe();
            handles.packager.refresh_observe();
            handles.uploader.refresh_observe();
            handles.publisher.refresh_observe();
            self.state = DeleteTaskPipelineState {
                delete_task_planner: handles.delete_task_planner.last_observation().clone(),
                downloader: handles.downloader.last_observation().clone(),
                delete_task_executor: handles.delete_task_executor.last_observation().clone(),
                packager: handles.packager.last_observation().clone(),
                uploader: handles.uploader.last_observation().clone(),
                publisher: handles.publisher.last_observation().clone(),
            }
        }
        ctx.schedule_self_msg(OBSERVE_PIPELINE_INTERVAL, Observe);
        Ok(())
    }
}

#[cfg(test)]
mod tests {
    use async_trait::async_trait;
    use quickwit_actors::{Handler, Universe};
    use quickwit_common::pubsub::EventBroker;
    use quickwit_common::temp_dir::TempDirectory;
    use quickwit_indexing::TestSandbox;
    use quickwit_indexing::actors::MergeSchedulerService;
    use quickwit_metastore::{ListSplitsRequestExt, MetastoreServiceStreamSplitsExt, SplitState};
    use quickwit_proto::metastore::{DeleteQuery, ListSplitsRequest, MetastoreService};
    use quickwit_proto::search::{LeafSearchRequest, LeafSearchResponse};
    use quickwit_search::{
        MockSearchService, SearchError, SearchJobPlacer, searcher_pool_for_test,
    };

    use super::{ActorContext, ActorExitStatus, DeleteTaskPipeline, OBSERVE_PIPELINE_INTERVAL};

    #[derive(Debug)]
    struct GracefulShutdown;

    #[async_trait]
    impl Handler<GracefulShutdown> for DeleteTaskPipeline {
        type Reply = ();
        async fn handle(
            &mut self,
            _: GracefulShutdown,
            _: &ActorContext<Self>,
        ) -> Result<(), ActorExitStatus> {
            if let Some(handles) = self.handles.take() {
                handles.delete_task_planner.quit().await;
                handles.publisher.join().await;
            }
            // Nothing to do.
            Err(ActorExitStatus::Success)
        }
    }

    #[tokio::test]
    async fn test_delete_pipeline_simple() -> anyhow::Result<()> {
        quickwit_common::setup_logging_for_tests();
        let index_id = "test-delete-pipeline-simple";
        let doc_mapping_yaml = r#"
            field_mappings:
              - name: body
                type: text
              - name: ts
                type: i64
                fast: true
        "#;
        let indexing_settings_yaml = r#"
            merge_policy:
                type: no_merge
        "#;
        let test_sandbox = TestSandbox::create(
            index_id,
            doc_mapping_yaml,
            indexing_settings_yaml,
            &["body"],
        )
        .await
        .unwrap();
        let universe: &Universe = test_sandbox.universe();
        let merge_scheduler_service = universe.get_or_spawn_one::<MergeSchedulerService>();
        let index_uid = test_sandbox.index_uid();
        let docs = vec![
            serde_json::json!({"body": "info", "ts": 0 }),
            serde_json::json!({"body": "info", "ts": 0 }),
            serde_json::json!({"body": "delete", "ts": 0 }),
        ];
        test_sandbox.add_documents(docs).await?;
        let metastore = test_sandbox.metastore();
        metastore
            .create_delete_task(DeleteQuery {
                index_uid: Some(index_uid.clone()),
                start_timestamp: None,
                end_timestamp: None,
                query_ast: quickwit_query::query_ast::qast_json_helper("body:delete", &[]),
            })
            .await
            .unwrap();
        let mut mock_search_service = MockSearchService::new();
        let mut leaf_search_num_failures = 1;
        mock_search_service
            .expect_leaf_search()
            .withf(|leaf_request| -> bool {
                leaf_request
                    .search_request
                    .as_ref()
                    .unwrap()
                    .index_id_patterns
                    == vec!["test-delete-pipeline-simple".to_string()]
            })
            .times(2)
            .returning(move |_: LeafSearchRequest| {
                if leaf_search_num_failures > 0 {
                    leaf_search_num_failures -= 1;
                    return Err(SearchError::Internal("leaf search error".to_string()));
                }
                Ok(LeafSearchResponse {
                    num_hits: 1,
                    ..Default::default()
                })
            });
        let searcher_pool = searcher_pool_for_test([("127.0.0.1:1001", mock_search_service)]);
        let search_job_placer = SearchJobPlacer::new(searcher_pool);
        let delete_service_task_dir = TempDirectory::for_test();
        let pipeline = DeleteTaskPipeline::new(
            test_sandbox.index_uid(),
            metastore.clone(),
            search_job_placer,
            test_sandbox.storage(),
            delete_service_task_dir.path().into(),
            4,
            merge_scheduler_service,
            EventBroker::default(),
        );

        let (pipeline_mailbox, pipeline_handler) = universe.spawn_builder().spawn(pipeline);
        // Ensure that the message sent by initialize method is processed.
        let _ = pipeline_handler.process_pending_and_observe().await.state;
        // Pipeline will first fail and we need to wait a OBSERVE_PIPELINE_INTERVAL * some number
        // for the pipeline state to be updated.
        universe.sleep(OBSERVE_PIPELINE_INTERVAL * 5).await;
        let pipeline_state = pipeline_handler.process_pending_and_observe().await.state;
        assert_eq!(pipeline_state.delete_task_planner.metrics.num_errors, 1);
        assert_eq!(pipeline_state.downloader.metrics.num_errors, 0);
        assert_eq!(pipeline_state.delete_task_executor.metrics.num_errors, 0);
        assert_eq!(pipeline_state.packager.metrics.num_errors, 0);
        assert_eq!(pipeline_state.uploader.metrics.num_errors, 0);
        assert_eq!(pipeline_state.publisher.metrics.num_errors, 0);
        let _ = pipeline_mailbox.ask(GracefulShutdown).await;

        let splits = metastore
            .list_splits(ListSplitsRequest::try_from_index_uid(index_uid).unwrap())
            .await
            .unwrap()
            .collect_splits()
            .await
            .unwrap();
        assert_eq!(splits.len(), 2);
        let published_split = splits
            .iter()
            .find(|split| split.split_state == SplitState::Published)
            .unwrap();
        assert_eq!(published_split.split_metadata.delete_opstamp, 1);
        test_sandbox.assert_quit().await;
        Ok(())
    }

    #[tokio::test]
    async fn test_delete_pipeline_shut_down() -> anyhow::Result<()> {
        quickwit_common::setup_logging_for_tests();
        let index_id = "test-delete-pipeline-shut-down";
        let doc_mapping_yaml = r#"
            field_mappings:
              - name: body
                type: text
              - name: ts
                type: i64
                fast: true
        "#;
        let test_sandbox = TestSandbox::create(index_id, doc_mapping_yaml, "{}", &["body"])
            .await
            .unwrap();
        let universe: &Universe = test_sandbox.universe();
        let merge_scheduler_mailbox = universe.get_or_spawn_one::<MergeSchedulerService>();
        let metastore = test_sandbox.metastore();
        let mut mock_search_service = MockSearchService::new();
        mock_search_service
            .expect_leaf_search()
            .withf(|leaf_request| -> bool {
                leaf_request
                    .search_request
                    .as_ref()
                    .unwrap()
                    .index_id_patterns
                    == vec!["test-delete-pipeline-shut-down".to_string()]
            })
            .returning(move |_: LeafSearchRequest| {
                Ok(LeafSearchResponse {
                    num_hits: 0,
                    ..Default::default()
                })
            });
        let searcher_pool = searcher_pool_for_test([("127.0.0.1:1001", mock_search_service)]);
        let search_job_placer = SearchJobPlacer::new(searcher_pool);
        let delete_service_task_dir = TempDirectory::for_test();
        let pipeline = DeleteTaskPipeline::new(
            test_sandbox.index_uid(),
            metastore.clone(),
            search_job_placer,
            test_sandbox.storage(),
            delete_service_task_dir.path().into(),
            4,
            merge_scheduler_mailbox,
            EventBroker::default(),
        );

        let (_pipeline_mailbox, pipeline_handler) = universe.spawn_builder().spawn(pipeline);
        pipeline_handler.quit().await;
        let observations = universe.observe(OBSERVE_PIPELINE_INTERVAL).await;
        assert!(observations.into_iter().all(
            |observation| observation.type_name != std::any::type_name::<DeleteTaskPipeline>()
        ));
        test_sandbox.assert_quit().await;
        Ok(())
    }
}


================================================
FILE: quickwit/quickwit-janitor/src/actors/delete_task_planner.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::{HashMap, HashSet};
use std::str::FromStr;
use std::time::Duration;

use anyhow::Context;
use async_trait::async_trait;
use itertools::Itertools;
use quickwit_actors::{Actor, ActorContext, ActorExitStatus, Handler, Mailbox, QueueCapacity};
use quickwit_common::extract_time_range;
use quickwit_common::uri::Uri;
use quickwit_doc_mapper::tag_pruning::extract_tags_from_query;
use quickwit_indexing::actors::{MergeSchedulerService, MergeSplitDownloader, schedule_merge};
use quickwit_indexing::merge_policy::MergeOperation;
use quickwit_metastore::{ListSplitsResponseExt, Split, split_tag_filter, split_time_range_filter};
use quickwit_proto::metastore::{
    DeleteTask, LastDeleteOpstampRequest, ListDeleteTasksRequest, ListStaleSplitsRequest,
    MetastoreResult, MetastoreService, MetastoreServiceClient, UpdateSplitsDeleteOpstampRequest,
};
use quickwit_proto::search::SearchRequest;
use quickwit_proto::types::IndexUid;
use quickwit_search::{IndexMetasForLeafSearch, SearchJob, SearchJobPlacer, jobs_to_leaf_request};
use serde::Serialize;
use tantivy::Inventory;
use tracing::{debug, info};

use crate::metrics::JANITOR_METRICS;

const PLANNER_REFRESH_INTERVAL: Duration = Duration::from_secs(60);
const NUM_STALE_SPLITS_TO_FETCH: usize = 1000;

/// The `DeleteTaskPlanner` plans delete operations on splits for a given index.
/// For each split, the planner checks if there is some documents to delete:
/// - If this is the case, it sends a [`MergeOperation`] to the `MergeExecutor` `MergeOperation` to
///   the `MergeExecutor`.
/// - If there is no document to delete, it updates the split `delete_opstamp` to the latest delete
///   task opstamp.
///
/// Pseudo-algorithm for a given index:
/// 1. Fetches the delete tasks and deduce the last `opstamp`.
/// 2. Fetches the last `N` stale splits ordered by their `delete_opstamp`. A stale split is a split
///    a `delete_opstamp` inferior to the last `opstamp` In theory, this works but... there is one
///    difficulty:
///    - Delete operations do not run on immature splits and they are excluded after fetching stale
///      splits from the metastore as the metastore has no knowledge about the merge policy. If
///      there are more than `N` immature stale splits, the planner will plan no operations.
///      However, this is mitigated by the fact that a merge policy should consider "old split" as
///      mature and an index should not have many immature splits.
///      See tracked issue <https://github.com/quickwit-oss/quickwit/issues/2147>.
/// 3. If there is no stale splits, stop.
/// 4. If there are stale splits, for each split, do:
///    - Get the list of delete queries to apply to this split.
///    - Keep only delete queries that match the split metadata (time range and tags).
///    - If no delete queries remains, then update the split `delete_opstamp` to the latest
///      `opstamp`.
///    - If there are delete queries that match the metadata, do: + Execute delete queries
///      (`leaf_request`) one by one to check if there is a match. + As soon as a hit is returned
///      for a given query, the split is sent to the `MergeExecutor`. + If no delete queries match
///      documents, update the split `delete_opstamp` to the last `opstamp`.
#[derive(Clone)]
pub struct DeleteTaskPlanner {
    index_uid: IndexUid,
    index_uri: Uri,
    doc_mapper_str: String,
    metastore: MetastoreServiceClient,
    search_job_placer: SearchJobPlacer,
    merge_split_downloader_mailbox: Mailbox<MergeSplitDownloader>,
    merge_scheduler_service: Mailbox<MergeSchedulerService>,
    /// Inventory of ongoing delete operations. If everything goes well,
    /// a merge operation is dropped after the publish of the split that underwent
    /// the delete operation.
    /// The inventory is used to avoid sending twice the same delete operation.
    ongoing_delete_operations_inventory: Inventory<MergeOperation>,
}

#[async_trait]
impl Actor for DeleteTaskPlanner {
    type ObservableState = DeleteTaskPlannerState;

    fn observable_state(&self) -> Self::ObservableState {
        let ongoing_delete_operations = self
            .ongoing_delete_operations_inventory
            .list()
            .iter()
            .map(|tracked_operation| tracked_operation.as_ref().clone())
            .collect_vec();
        DeleteTaskPlannerState {
            ongoing_delete_operations,
        }
    }

    fn name(&self) -> String {
        "DeleteTaskPlanner".to_string()
    }

    fn queue_capacity(&self) -> QueueCapacity {
        QueueCapacity::Bounded(0)
    }

    async fn initialize(&mut self, ctx: &ActorContext<Self>) -> Result<(), ActorExitStatus> {
        self.handle(PlanDeleteLoop, ctx).await
    }
}

impl DeleteTaskPlanner {
    pub fn new(
        index_uid: IndexUid,
        index_uri: Uri,
        doc_mapper_str: String,
        metastore: MetastoreServiceClient,
        search_job_placer: SearchJobPlacer,
        merge_split_downloader_mailbox: Mailbox<MergeSplitDownloader>,
        merge_scheduler_service: Mailbox<MergeSchedulerService>,
    ) -> Self {
        Self {
            index_uid,
            index_uri,
            doc_mapper_str,
            metastore,
            search_job_placer,
            merge_split_downloader_mailbox,
            merge_scheduler_service,
            ongoing_delete_operations_inventory: Inventory::new(),
        }
    }

    /// Send delete operations for a given `index_id`.
    async fn send_delete_operations(&mut self, ctx: &ActorContext<Self>) -> anyhow::Result<()> {
        // Loop until there is no more stale splits.
        loop {
            let last_delete_opstamp_request = LastDeleteOpstampRequest {
                index_uid: Some(self.index_uid.clone()),
            };
            let last_delete_opstamp = self
                .metastore
                .last_delete_opstamp(last_delete_opstamp_request)
                .await?
                .last_delete_opstamp;
            let stale_splits = self
                .get_relevant_stale_splits(self.index_uid.clone(), last_delete_opstamp, ctx)
                .await?;
            ctx.record_progress();
            debug!(
                index_id = self.index_uid.index_id,
                last_delete_opstamp = last_delete_opstamp,
                num_stale_splits = stale_splits.len()
            );

            if stale_splits.is_empty() {
                break;
            }

            let (splits_with_deletes, splits_without_deletes) =
                self.partition_splits_by_deletes(&stale_splits, ctx).await?;

            info!(
                "{} splits with deletes, {} splits without deletes.",
                splits_with_deletes.len(),
                splits_without_deletes.len()
            );
            ctx.record_progress();

            // Updates `delete_opstamp` of splits that won't undergo delete operations.
            let split_ids_without_delete = splits_without_deletes
                .iter()
                .map(|split| split.split_id().to_string())
                .collect_vec();
            let update_splits_delete_opstamp_request = UpdateSplitsDeleteOpstampRequest {
                index_uid: Some(self.index_uid.clone()),
                split_ids: split_ids_without_delete.clone(),
                delete_opstamp: last_delete_opstamp,
            };
            ctx.protect_future(
                self.metastore
                    .update_splits_delete_opstamp(update_splits_delete_opstamp_request),
            )
            .await?;

            // Sends delete operations.
            for split_with_deletes in splits_with_deletes {
                let delete_operation = MergeOperation::new_delete_and_merge_operation(
                    split_with_deletes.split_metadata,
                );
                info!(delete_operation=?delete_operation, "planned delete operation");
                let tracked_delete_operation = self
                    .ongoing_delete_operations_inventory
                    .track(delete_operation);
                schedule_merge(
                    &self.merge_scheduler_service,
                    tracked_delete_operation,
                    self.merge_split_downloader_mailbox.clone(),
                )
                .await?;
                let index_label =
                    quickwit_common::metrics::index_label(self.index_uid.index_id.as_str());
                JANITOR_METRICS
                    .ongoing_num_delete_operations_total
                    .with_label_values([index_label])
                    .set(self.ongoing_delete_operations_inventory.list().len() as i64);
            }
        }

        Ok(())
    }

    /// Identifies splits that contain documents to delete and
    /// splits that do not and returns the two groups.
    async fn partition_splits_by_deletes(
        &mut self,
        stale_splits: &[Split],
        ctx: &ActorContext<Self>,
    ) -> anyhow::Result<(Vec<Split>, Vec<Split>)> {
        let mut splits_without_deletes: Vec<Split> = Vec::new();
        let mut splits_with_deletes: Vec<Split> = Vec::new();

        for stale_split in stale_splits {
            let list_delete_tasks_request = ListDeleteTasksRequest::new(
                self.index_uid.clone(),
                stale_split.split_metadata.delete_opstamp,
            );
            let pending_tasks = ctx
                .protect_future(self.metastore.list_delete_tasks(list_delete_tasks_request))
                .await?
                .delete_tasks;

            // Keep only delete tasks that matches the split metadata.
            let pending_and_matching_metadata_tasks = pending_tasks
                .into_iter()
                .filter(|delete_task| {
                    let delete_query = delete_task
                        .delete_query
                        .as_ref()
                        .expect("Delete task must have a delete query.");
                    let time_range = extract_time_range(
                        delete_query.start_timestamp,
                        delete_query.end_timestamp,
                    );
                    // TODO: validate the query at the beginning and return an appropriate error.
                    let delete_query_ast = serde_json::from_str(&delete_query.query_ast)
                        .expect("Failed to deserialize query_ast json");
                    let tags_filter = extract_tags_from_query(delete_query_ast);
                    split_time_range_filter(&stale_split.split_metadata, time_range.as_ref())
                        && split_tag_filter(&stale_split.split_metadata, tags_filter.as_ref())
                })
                .collect_vec();

            // If there is no matching delete tasks,
            // there is no document to delete on this split.
            if pending_and_matching_metadata_tasks.is_empty() {
                splits_without_deletes.push(stale_split.clone());
                continue;
            }

            let has_split_docs_to_delete = self
                .has_split_docs_to_delete(
                    stale_split,
                    &pending_and_matching_metadata_tasks,
                    &self.doc_mapper_str,
                    self.index_uri.as_str(),
                    ctx,
                )
                .await?;
            ctx.record_progress();

            if has_split_docs_to_delete {
                splits_with_deletes.push(stale_split.clone());
            } else {
                splits_without_deletes.push(stale_split.clone());
            }
        }

        Ok((splits_with_deletes, splits_without_deletes))
    }

    /// Executes a `LeafSearchRequest` on the split and returns true
    /// if it matches documents.
    async fn has_split_docs_to_delete(
        &self,
        stale_split: &Split,
        delete_tasks: &[DeleteTask],
        doc_mapper_str: &str,
        index_uri: &str,
        ctx: &ActorContext<Self>,
    ) -> anyhow::Result<bool> {
        let search_job = SearchJob::from(&stale_split.split_metadata);
        let mut search_client = self
            .search_job_placer
            .assign_job(search_job.clone(), &HashSet::new())
            .await?;
        for delete_task in delete_tasks {
            let delete_query = delete_task
                .delete_query
                .as_ref()
                .expect("Delete task must have a delete query.");
            // TODO: resolve with the default fields.
            let search_request = SearchRequest {
                index_id_patterns: vec![delete_query.index_uid().index_id.to_string()],
                query_ast: delete_query.query_ast.clone(),
                start_timestamp: delete_query.start_timestamp,
                end_timestamp: delete_query.end_timestamp,
                ..Default::default()
            };
            let mut search_indexes_metas = HashMap::new();
            let index_uri = Uri::from_str(index_uri).context("invalid index URI")?;
            search_indexes_metas.insert(
                delete_query.index_uid().clone(),
                IndexMetasForLeafSearch {
                    doc_mapper_str: doc_mapper_str.to_string(),
                    index_uri,
                },
            );
            let leaf_search_request = jobs_to_leaf_request(
                &search_request,
                &search_indexes_metas,
                vec![search_job.clone()],
            )?;
            let response = search_client.leaf_search(leaf_search_request).await?;
            ctx.record_progress();
            if response.num_hits > 0 {
                return Ok(true);
            }
        }
        Ok(false)
    }

    /// Fetches stale splits from [`quickwit_metastore::Metastore`] and excludes immature splits and
    /// split already among ongoing delete operations.
    async fn get_relevant_stale_splits(
        &mut self,
        index_uid: IndexUid,
        last_delete_opstamp: u64,
        ctx: &ActorContext<Self>,
    ) -> MetastoreResult<Vec<Split>> {
        let list_stale_splits_request = ListStaleSplitsRequest {
            index_uid: Some(index_uid.clone()),
            delete_opstamp: last_delete_opstamp,
            num_splits: NUM_STALE_SPLITS_TO_FETCH as u64,
        };
        let stale_splits = ctx
            .protect_future(self.metastore.list_stale_splits(list_stale_splits_request))
            .await?
            .deserialize_splits()
            .await?;
        debug!(
            index_id = index_uid.index_id,
            last_delete_opstamp = last_delete_opstamp,
            num_stale_splits_from_metastore = stale_splits.len()
        );
        let ongoing_delete_operations = self.ongoing_delete_operations_inventory.list();
        let filtered_splits = stale_splits
            .into_iter()
            .filter(|stale_split| {
                !ongoing_delete_operations.iter().any(|operation| {
                    operation
                        .splits
                        .first()
                        .unwrap() // <- This is safe as we know for sure that an operation is on one split.
                        .split_id()
                        == stale_split.split_id()
                })
            })
            .collect_vec();
        Ok(filtered_splits)
    }
}

#[derive(Clone, Debug, Serialize)]
pub struct DeleteTaskPlannerState {
    ongoing_delete_operations: Vec<MergeOperation>,
}

#[derive(Debug)]
struct PlanDeleteOperations;

#[async_trait]
impl Handler<PlanDeleteOperations> for DeleteTaskPlanner {
    type Reply = ();

    async fn handle(
        &mut self,
        _: PlanDeleteOperations,
        ctx: &ActorContext<Self>,
    ) -> Result<(), ActorExitStatus> {
        self.send_delete_operations(ctx).await?;
        Ok(())
    }
}

#[derive(Debug)]
struct PlanDeleteLoop;

#[async_trait]
impl Handler<PlanDeleteLoop> for DeleteTaskPlanner {
    type Reply = ();

    async fn handle(
        &mut self,
        _: PlanDeleteLoop,
        ctx: &ActorContext<Self>,
    ) -> Result<(), ActorExitStatus> {
        self.handle(PlanDeleteOperations, ctx).await?;
        ctx.schedule_self_msg(PLANNER_REFRESH_INTERVAL, PlanDeleteLoop);
        Ok(())
    }
}

#[cfg(test)]
mod tests {
    use quickwit_config::build_doc_mapper;
    use quickwit_indexing::TestSandbox;
    use quickwit_indexing::merge_policy::MergeTask;
    use quickwit_metastore::{
        IndexMetadataResponseExt, ListSplitsRequestExt, MetastoreServiceStreamSplitsExt,
        SplitMetadata,
    };
    use quickwit_proto::metastore::{DeleteQuery, IndexMetadataRequest, ListSplitsRequest};
    use quickwit_proto::search::{LeafSearchRequest, LeafSearchResponse};
    use quickwit_search::{MockSearchService, searcher_pool_for_test};

    use super::*;

    #[tokio::test]
    async fn test_delete_task_planner() -> anyhow::Result<()> {
        quickwit_common::setup_logging_for_tests();
        let index_id = "test-delete-task-planner";
        let doc_mapping_yaml = r#"
            field_mappings:
              - name: body
                type: text
              - name: ts
                type: i64
                fast: true
        "#;
        let indexing_settings_yaml = r#"
            merge_policy:
                type: no_merge
        "#;
        let test_sandbox = TestSandbox::create(
            index_id,
            doc_mapping_yaml,
            indexing_settings_yaml,
            &["body"],
        )
        .await?;
        let universe = test_sandbox.universe();
        let docs = [
            serde_json::json!({"body": "info", "ts": 0 }),
            serde_json::json!({"body": "info", "ts": 0 }),
            serde_json::json!({"body": "delete", "ts": 0 }),
        ];
        // Creates 3 splits
        for doc in docs {
            test_sandbox.add_documents(vec![doc]).await?;
        }
        let metastore = test_sandbox.metastore();
        let index_metadata_request = IndexMetadataRequest::for_index_id(index_id.to_string());
        let index_metadata = metastore
            .index_metadata(index_metadata_request)
            .await
            .unwrap()
            .deserialize_index_metadata()
            .unwrap();
        let index_uid = index_metadata.index_uid.clone();
        let index_config = index_metadata.into_index_config();
        let split_metas: Vec<SplitMetadata> = metastore
            .list_splits(ListSplitsRequest::try_from_index_uid(index_uid.clone()).unwrap())
            .await
            .unwrap()
            .collect_splits_metadata()
            .await
            .unwrap();
        assert_eq!(split_metas.len(), 3);
        let doc_mapper =
            build_doc_mapper(&index_config.doc_mapping, &index_config.search_settings)?;
        let doc_mapper_str = serde_json::to_string(&doc_mapper)?;

        // Creates 2 delete tasks, one that will match 1 document,
        // the other that will match no document.

        let body_delete_ast = quickwit_query::query_ast::qast_json_helper("body:delete", &[]);
        let match_nothing_ast =
            quickwit_query::query_ast::qast_json_helper("body:matchnothing", &[]);
        metastore
            .create_delete_task(DeleteQuery {
                index_uid: Some(index_uid.clone()),
                start_timestamp: None,
                end_timestamp: None,
                query_ast: body_delete_ast.clone(),
            })
            .await?;
        metastore
            .create_delete_task(DeleteQuery {
                index_uid: Some(index_uid.clone()),
                start_timestamp: None,
                end_timestamp: None,
                query_ast: match_nothing_ast,
            })
            .await?;
        let mut mock_search_service = MockSearchService::new();

        // We have 2 delete tasks. Each one will trigger a leaf request for each
        // of the 3 splits. This makes 6 requests.
        let split_id_with_doc_to_delete = split_metas[2].split_id().to_string();
        mock_search_service.expect_leaf_search().times(6).returning(
            move |request: LeafSearchRequest| {
                // Search on body:delete should return one hit only on the last split
                // that should contains the doc.
                if request.leaf_requests[0].split_offsets[0].split_id == split_id_with_doc_to_delete
                    && request.search_request.as_ref().unwrap().query_ast == body_delete_ast
                {
                    return Ok(LeafSearchResponse {
                        num_hits: 1,
                        ..Default::default()
                    });
                }
                Ok(LeafSearchResponse {
                    num_hits: 0,
                    ..Default::default()
                })
            },
        );
        let searcher_pool = searcher_pool_for_test([("127.0.0.1:1000", mock_search_service)]);
        let search_job_placer = SearchJobPlacer::new(searcher_pool);
        let merge_scheduler_mailbox = universe.get_or_spawn_one();
        let (merge_split_downloader_mailbox, merge_split_downloader_inbox) =
            universe.create_test_mailbox();
        let delete_planner = DeleteTaskPlanner::new(
            index_uid.clone(),
            index_config.index_uri.clone(),
            doc_mapper_str,
            metastore.clone(),
            search_job_placer,
            merge_split_downloader_mailbox,
            merge_scheduler_mailbox,
        );
        let (delete_planner_mailbox, delete_planner_handle) = test_sandbox
            .universe()
            .spawn_builder()
            .spawn(delete_planner);
        delete_planner_handle.process_pending_and_observe().await;
        let downloader_msgs: Vec<MergeTask> = merge_split_downloader_inbox.drain_for_test_typed();
        assert_eq!(downloader_msgs.len(), 1);
        // The last split will undergo a delete operation.
        assert_eq!(
            downloader_msgs[0].splits[0].split_id(),
            split_metas[2].split_id()
        );
        // Check planner state is inline.
        let delete_planner_state = delete_planner_handle.observe().await;
        assert_eq!(
            delete_planner_state.ongoing_delete_operations[0].splits[0].split_id(),
            split_metas[2].split_id()
        );
        // Trigger new plan evaluation and check that we don't have new merge operation.
        delete_planner_mailbox
            .ask(PlanDeleteOperations)
            .await
            .unwrap();
        assert!(merge_split_downloader_inbox.drain_for_test().is_empty());
        // Now drop the current merge operation and check that the planner will plan a new
        // operation.
        drop(downloader_msgs.into_iter().next().unwrap());
        // Check planner state is inline.
        assert!(
            delete_planner_handle
                .observe()
                .await
                .ongoing_delete_operations
                .is_empty()
        );

        // Trigger operations planning.
        delete_planner_mailbox
            .ask(PlanDeleteOperations)
            .await
            .unwrap();
        let downloader_last_msgs = merge_split_downloader_inbox.drain_for_test_typed::<MergeTask>();
        assert_eq!(downloader_last_msgs.len(), 1);
        assert_eq!(
            downloader_last_msgs[0].splits[0].split_id(),
            split_metas[2].split_id()
        );
        // The other splits has just their delete opstamps updated to the last opstamps which is 2
        // as there are 2 delete tasks. The last split
        let all_splits = metastore
            .list_splits(ListSplitsRequest::try_from_index_uid(index_uid).unwrap())
            .await
            .unwrap()
            .collect_splits_metadata()
            .await
            .unwrap();
        assert_eq!(all_splits[0].delete_opstamp, 2);
        assert_eq!(all_splits[1].delete_opstamp, 2);
        // The last split has not yet its delete opstamp updated.
        assert_eq!(all_splits[2].delete_opstamp, 0);
        test_sandbox.assert_quit().await;
        Ok(())
    }
}


================================================
FILE: quickwit/quickwit-janitor/src/actors/delete_task_service.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::{HashMap, HashSet};
use std::path::PathBuf;
use std::time::Duration;

use async_trait::async_trait;
use quickwit_actors::{Actor, ActorContext, ActorExitStatus, ActorHandle, Handler, Mailbox};
use quickwit_common::pubsub::EventBroker;
use quickwit_common::temp_dir::{self};
use quickwit_config::IndexConfig;
use quickwit_indexing::actors::MergeSchedulerService;
use quickwit_metastore::{IndexMetadataResponseExt, ListIndexesMetadataResponseExt};
use quickwit_proto::metastore::{
    IndexMetadataRequest, ListIndexesMetadataRequest, MetastoreService, MetastoreServiceClient,
};
use quickwit_proto::types::IndexUid;
use quickwit_search::SearchJobPlacer;
use quickwit_storage::StorageResolver;
use serde::Serialize;
use tracing::{error, info, warn};

use super::delete_task_pipeline::DeleteTaskPipeline;

pub const DELETE_SERVICE_TASK_DIR_NAME: &str = "delete_task_service";

const UPDATE_PIPELINES_INTERVAL: Duration = if cfg!(any(test, feature = "testsuite")) {
    Duration::from_millis(200)
} else {
    // Each update triggers a call to the metastore. Deletes are not frequent operation and
    // it's fine to wait a bit before updating the pipelines.
    Duration::from_secs(30)
};

#[derive(Debug, Clone, Serialize)]
pub struct DeleteTaskServiceState {
    pub num_running_pipelines: usize,
}

pub struct DeleteTaskService {
    metastore: MetastoreServiceClient,
    search_job_placer: SearchJobPlacer,
    storage_resolver: StorageResolver,
    delete_service_task_dir: PathBuf,
    pipeline_handles_by_index_uid: HashMap<IndexUid, ActorHandle<DeleteTaskPipeline>>,
    max_concurrent_split_uploads: usize,
    event_broker: EventBroker,
    merge_scheduler_service: Mailbox<MergeSchedulerService>,
}

impl DeleteTaskService {
    pub async fn new(
        metastore: MetastoreServiceClient,
        search_job_placer: SearchJobPlacer,
        storage_resolver: StorageResolver,
        data_dir_path: PathBuf,
        max_concurrent_split_uploads: usize,
        merge_scheduler_service: Mailbox<MergeSchedulerService>,
        event_broker: EventBroker,
    ) -> anyhow::Result<Self> {
        let delete_service_task_path = data_dir_path.join(DELETE_SERVICE_TASK_DIR_NAME);
        let delete_service_task_dir =
            temp_dir::create_or_purge_directory(delete_service_task_path.as_path()).await?;
        Ok(Self {
            metastore,
            search_job_placer,
            storage_resolver,
            delete_service_task_dir,
            pipeline_handles_by_index_uid: Default::default(),
            max_concurrent_split_uploads,
            merge_scheduler_service,
            event_broker,
        })
    }
}

#[async_trait]
impl Actor for DeleteTaskService {
    type ObservableState = DeleteTaskServiceState;

    fn observable_state(&self) -> Self::ObservableState {
        DeleteTaskServiceState {
            num_running_pipelines: self.pipeline_handles_by_index_uid.len(),
        }
    }

    fn name(&self) -> String {
        "DeleteTaskService".to_string()
    }

    async fn initialize(&mut self, ctx: &ActorContext<Self>) -> Result<(), ActorExitStatus> {
        self.handle(UpdatePipelines, ctx).await?;
        Ok(())
    }
}

impl DeleteTaskService {
    pub async fn update_pipeline_handles(
        &mut self,
        ctx: &ActorContext<Self>,
    ) -> anyhow::Result<()> {
        let mut index_config_by_index_id: HashMap<IndexUid, IndexConfig> = self
            .metastore
            .list_indexes_metadata(ListIndexesMetadataRequest::all())
            .await?
            .deserialize_indexes_metadata()
            .await?
            .into_iter()
            .map(|index_metadata| {
                (
                    index_metadata.index_uid.clone(),
                    index_metadata.into_index_config(),
                )
            })
            .collect();
        let index_uids: HashSet<IndexUid> = index_config_by_index_id.keys().cloned().collect();
        let pipeline_index_uids: HashSet<IndexUid> =
            self.pipeline_handles_by_index_uid.keys().cloned().collect();

        // Remove pipelines on deleted indexes.
        for deleted_index_uid in pipeline_index_uids.difference(&index_uids) {
            info!(
                deleted_index_id = deleted_index_uid.index_id,
                "Remove deleted index from delete task pipelines."
            );
            let pipeline_handle = self
                .pipeline_handles_by_index_uid
                .remove(deleted_index_uid)
                .expect("Handle must be present.");
            // Kill the pipeline, this avoids to wait a long time for a delete operation to finish.
            pipeline_handle.kill().await;
        }

        // Start new pipelines and add them to the handles hashmap.
        for index_uid in index_uids.difference(&pipeline_index_uids) {
            let index_config = index_config_by_index_id
                .remove(index_uid)
                .expect("index metadata should be present");
            if self.spawn_pipeline(index_config, ctx).await.is_err() {
                warn!("failed to spawn delete pipeline for {}", index_uid.index_id);
            }
        }

        Ok(())
    }

    pub async fn spawn_pipeline(
        &mut self,
        index_config: IndexConfig,
        ctx: &ActorContext<Self>,
    ) -> anyhow::Result<()> {
        let index_uri = index_config.index_uri.clone();
        let index_storage = self.storage_resolver.resolve(&index_uri).await?;
        let index_metadata_request =
            IndexMetadataRequest::for_index_id(index_config.index_id.to_string());
        let index_metadata = self
            .metastore
            .index_metadata(index_metadata_request)
            .await?
            .deserialize_index_metadata()?;
        let pipeline = DeleteTaskPipeline::new(
            index_metadata.index_uid.clone(),
            self.metastore.clone(),
            self.search_job_placer.clone(),
            index_storage,
            self.delete_service_task_dir.clone(),
            self.max_concurrent_split_uploads,
            self.merge_scheduler_service.clone(),
            self.event_broker.clone(),
        );
        let (_pipeline_mailbox, pipeline_handler) = ctx.spawn_actor().spawn(pipeline);
        self.pipeline_handles_by_index_uid
            .insert(index_metadata.index_uid, pipeline_handler);
        Ok(())
    }
}

#[derive(Debug)]
struct UpdatePipelines;

#[async_trait]
impl Handler<UpdatePipelines> for DeleteTaskService {
    type Reply = ();

    async fn handle(
        &mut self,
        _: UpdatePipelines,
        ctx: &ActorContext<Self>,
    ) -> Result<(), ActorExitStatus> {
        let result = self.update_pipeline_handles(ctx).await;
        if let Err(error) = result {
            error!(error=%error, "delete task pipelines update failed");
        }
        ctx.schedule_self_msg(UPDATE_PIPELINES_INTERVAL, UpdatePipelines);
        Ok(())
    }
}

#[cfg(test)]
mod tests {
    use quickwit_actors::Universe;
    use quickwit_common::pubsub::EventBroker;
    use quickwit_indexing::TestSandbox;
    use quickwit_proto::metastore::{
        DeleteIndexRequest, DeleteQuery, ListDeleteTasksRequest, MetastoreService,
    };
    use quickwit_search::{MockSearchService, SearchJobPlacer, searcher_pool_for_test};
    use quickwit_storage::StorageResolver;

    use super::{DeleteTaskService, UPDATE_PIPELINES_INTERVAL};

    #[tokio::test]
    async fn test_delete_task_service() -> anyhow::Result<()> {
        quickwit_common::setup_logging_for_tests();
        let index_id = "test-delete-task-service-index";
        let doc_mapping_yaml = r#"
            field_mappings:
              - name: body
                type: text
              - name: ts
                type: i64
                fast: true
        "#;
        let test_sandbox = TestSandbox::create(index_id, doc_mapping_yaml, "{}", &["body"]).await?;
        let index_uid = test_sandbox.index_uid();
        let metastore = test_sandbox.metastore();
        let mock_search_service = MockSearchService::new();
        let searcher_pool = searcher_pool_for_test([("127.0.0.1:1000", mock_search_service)]);
        let search_job_placer = SearchJobPlacer::new(searcher_pool);
        let temp_dir = tempfile::tempdir().unwrap();
        let data_dir_path = temp_dir.path().to_path_buf();
        let universe: &Universe = test_sandbox.universe();
        let delete_task_service = DeleteTaskService::new(
            metastore.clone(),
            search_job_placer,
            StorageResolver::unconfigured(),
            data_dir_path,
            4,
            universe.get_or_spawn_one(),
            EventBroker::default(),
        )
        .await
        .unwrap();
        let (_delete_task_service_mailbox, delete_task_service_handler) =
            universe.spawn_builder().spawn(delete_task_service);
        let state = delete_task_service_handler
            .process_pending_and_observe()
            .await;
        assert_eq!(state.num_running_pipelines, 1);
        let delete_query = DeleteQuery {
            index_uid: Some(index_uid.clone()),
            start_timestamp: None,
            end_timestamp: None,
            query_ast: r#"{"type": "MatchAll"}"#.to_string(),
        };
        metastore.create_delete_task(delete_query).await.unwrap();
        // Just test creation of delete query.
        assert_eq!(
            metastore
                .list_delete_tasks(ListDeleteTasksRequest::new(index_uid.clone(), 0))
                .await
                .unwrap()
                .delete_tasks
                .len(),
            1
        );
        metastore
            .delete_index(DeleteIndexRequest {
                index_uid: Some(index_uid.clone()),
            })
            .await
            .unwrap();
        universe.sleep(UPDATE_PIPELINES_INTERVAL * 2).await;
        let state_after_deletion = delete_task_service_handler
            .process_pending_and_observe()
            .await;
        assert_eq!(state_after_deletion.num_running_pipelines, 0);
        assert!(universe.get_one::<DeleteTaskService>().is_some());
        let actors_observations = universe.observe(UPDATE_PIPELINES_INTERVAL).await;
        assert!(
            actors_observations
                .into_iter()
                .any(|observation| observation.type_name
                    == std::any::type_name::<DeleteTaskService>())
        );
        assert!(universe.get_one::<DeleteTaskService>().is_some());
        test_sandbox.assert_quit().await;
        Ok(())
    }
}


================================================
FILE: quickwit/quickwit-janitor/src/actors/garbage_collector.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::{HashMap, HashSet};
use std::path::Path;
use std::sync::Arc;
use std::time::{Duration, Instant};

use async_trait::async_trait;
use futures::{StreamExt, stream};
use quickwit_actors::{Actor, ActorContext, Handler};
use quickwit_common::shared_consts::split_deletion_grace_period;
use quickwit_index_management::{GcMetrics, run_garbage_collect};
use quickwit_metastore::ListIndexesMetadataResponseExt;
use quickwit_proto::metastore::{
    ListIndexesMetadataRequest, MetastoreService, MetastoreServiceClient,
};
use quickwit_proto::types::IndexUid;
use quickwit_storage::{Storage, StorageResolver};
use serde::Serialize;
use tracing::{debug, error, info};

use crate::metrics::JANITOR_METRICS;

const RUN_INTERVAL: Duration = Duration::from_secs(10 * 60); // 10 minutes

/// Staged files needs to be deleted if there was a failure.
/// TODO ideally we want clean up all staged splits every time we restart the indexing pipeline, but
/// the grace period strategy should do the job for the moment.
const STAGED_GRACE_PERIOD: Duration = Duration::from_secs(60 * 60 * 24); // 24 hours

#[derive(Clone, Debug, Default, Serialize)]
pub struct GarbageCollectorCounters {
    /// The number of passes the garbage collector has performed.
    pub num_passes: usize,
    /// The number of deleted files.
    pub num_deleted_files: usize,
    /// The number of bytes deleted.
    pub num_deleted_bytes: usize,
    /// The number of failed garbage collection run.
    pub num_failed_gc_run: usize,
    /// The number of successful garbage collection run.
    pub num_successful_gc_run: usize,
    /// The number or failed storage resolution.
    pub num_failed_storage_resolution: usize,
    /// The number of splits that were unable to be removed.
    pub num_failed_splits: usize,
}

#[derive(Debug)]
struct Loop;

/// An actor for collecting garbage periodically from an index.
pub struct GarbageCollector {
    metastore: MetastoreServiceClient,
    storage_resolver: StorageResolver,
    counters: GarbageCollectorCounters,
}

impl GarbageCollector {
    pub fn new(metastore: MetastoreServiceClient, storage_resolver: StorageResolver) -> Self {
        Self {
            metastore,
            storage_resolver,
            counters: GarbageCollectorCounters::default(),
        }
    }

    /// Gc Loop handler logic.
    /// Should not return an error to prevent the actor from crashing.
    async fn handle_inner(&mut self, ctx: &ActorContext<Self>) {
        debug!("loading indexes from the metastore");
        self.counters.num_passes += 1;

        let start = Instant::now();

        let response = match self
            .metastore
            .list_indexes_metadata(ListIndexesMetadataRequest::all())
            .await
        {
            Ok(response) => response,
            Err(error) => {
                error!(%error, "failed to list indexes from the metastore");
                return;
            }
        };
        let indexes = match response.deserialize_indexes_metadata().await {
            Ok(indexes) => indexes,
            Err(error) => {
                error!(%error, "failed to deserialize indexes metadata");
                return;
            }
        };
        info!("loaded {} indexes from the metastore", indexes.len());

        let expected_count = indexes.len();
        let index_storages: HashMap<IndexUid, Arc<dyn Storage>> = stream::iter(indexes).filter_map(|index| {
            let storage_resolver = self.storage_resolver.clone();
            async move {
                let index_uid = index.index_uid.clone();
                let index_uri = index.index_uri();
                let storage = match storage_resolver.resolve(index_uri).await {
                    Ok(storage) => storage,
                    Err(error) => {
                        error!(index=%index.index_id(), error=?error, "failed to resolve the index storage Uri");
                        return None;
                    }
                };
                Some((index_uid, storage))
            }}).collect()
            .await;

        let storage_got_count = index_storages.len();
        self.counters.num_failed_storage_resolution += expected_count - storage_got_count;

        if index_storages.is_empty() {
            return;
        }

        let gc_res = run_garbage_collect(
            index_storages,
            self.metastore.clone(),
            STAGED_GRACE_PERIOD,
            split_deletion_grace_period(),
            false,
            Some(ctx.progress()),
            Some(GcMetrics {
                deleted_splits: JANITOR_METRICS
                    .gc_deleted_splits
                    .with_label_values(["success"])
                    .clone(),
                deleted_bytes: JANITOR_METRICS.gc_deleted_bytes.clone(),
                failed_splits: JANITOR_METRICS
                    .gc_deleted_splits
                    .with_label_values(["error"])
                    .clone(),
            }),
        )
        .await;

        let run_duration = start.elapsed().as_secs();
        JANITOR_METRICS.gc_seconds_total.inc_by(run_duration);

        let deleted_file_entries = match gc_res {
            Ok(removal_info) => {
                self.counters.num_successful_gc_run += 1;
                JANITOR_METRICS.gc_runs.with_label_values(["success"]).inc();
                self.counters.num_failed_splits += removal_info.failed_splits.len();
                removal_info.removed_split_entries
            }
            Err(error) => {
                self.counters.num_failed_gc_run += 1;
                JANITOR_METRICS.gc_runs.with_label_values(["error"]).inc();
                error!(error=?error, "failed to run garbage collection");
                return;
            }
        };
        if !deleted_file_entries.is_empty() {
            let num_deleted_splits = deleted_file_entries.len();
            let num_deleted_bytes = deleted_file_entries
                .iter()
                .map(|entry| entry.file_size_bytes.as_u64() as usize)
                .sum::<usize>();
            let deleted_files: HashSet<&Path> = deleted_file_entries
                .iter()
                .map(|deleted_entry| deleted_entry.file_name.as_path())
                .take(5)
                .collect();
            info!(
                num_deleted_splits = num_deleted_splits,
                "Janitor deleted {:?} and {} other splits.", deleted_files, num_deleted_splits,
            );
            self.counters.num_deleted_files += num_deleted_splits;
            self.counters.num_deleted_bytes += num_deleted_bytes;
        }
    }
}

#[async_trait]
impl Actor for GarbageCollector {
    type ObservableState = GarbageCollectorCounters;

    fn observable_state(&self) -> Self::ObservableState {
        self.counters.clone()
    }

    fn name(&self) -> String {
        "GarbageCollector".to_string()
    }

    async fn initialize(
        &mut self,
        ctx: &ActorContext<Self>,
    ) -> Result<(), quickwit_actors::ActorExitStatus> {
        self.handle(Loop, ctx).await?;
        Ok(())
    }
}

#[async_trait]
impl Handler<Loop> for GarbageCollector {
    type Reply = ();

    async fn handle(
        &mut self,
        _: Loop,
        ctx: &ActorContext<Self>,
    ) -> Result<(), quickwit_actors::ActorExitStatus> {
        self.handle_inner(ctx).await;
        ctx.schedule_self_msg(RUN_INTERVAL, Loop);
        Ok(())
    }
}

#[cfg(test)]
mod tests {
    use std::ops::Bound;
    use std::path::Path;
    use std::sync::Arc;

    use quickwit_actors::Universe;
    use quickwit_common::ServiceStream;
    use quickwit_common::shared_consts::split_deletion_grace_period;
    use quickwit_metastore::{
        IndexMetadata, ListSplitsRequestExt, ListSplitsResponseExt, Split, SplitMetadata,
        SplitState,
    };
    use quickwit_proto::metastore::{
        EmptyResponse, ListIndexesMetadataResponse, ListSplitsResponse, MetastoreError,
        MockMetastoreService,
    };
    use quickwit_proto::types::IndexUid;
    use quickwit_storage::MockStorage;
    use time::OffsetDateTime;

    use super::*;

    fn hashmap<K: Eq + std::hash::Hash, V>(key: K, value: V) -> HashMap<K, V> {
        let mut map = HashMap::new();
        map.insert(key, value);
        map
    }

    fn make_splits(index_id: &str, split_ids: &[&str], split_state: SplitState) -> Vec<Split> {
        split_ids
            .iter()
            .map(|split_id| Split {
                split_metadata: SplitMetadata {
                    split_id: split_id.to_string(),
                    index_uid: IndexUid::for_test(index_id, 0),
                    footer_offsets: 5..20,
                    ..Default::default()
                },
                split_state,
                update_timestamp: 0i64,
                publish_timestamp: None,
            })
            .collect()
    }

    #[tokio::test]
    async fn test_run_garbage_collect_calls_dependencies_appropriately() {
        let index_uid = IndexUid::for_test("test-index", 0);
        let mut mock_storage = MockStorage::default();
        mock_storage
            .expect_bulk_delete()
            .times(1)
            .returning(|paths: &[&Path]| {
                let actual: HashSet<&Path> = HashSet::from_iter(paths.iter().copied());
                let expected: HashSet<&Path> = HashSet::from_iter([
                    Path::new("a.split"),
                    Path::new("b.split"),
                    Path::new("c.split"),
                ]);

                assert_eq!(actual, expected);

                Ok(())
            });

        let mut mock_metastore = MockMetastoreService::new();
        let index_uid_clone = index_uid.clone();
        mock_metastore
            .expect_list_splits()
            .times(2)
            .returning(move |list_splits_request| {
                let query = list_splits_request.deserialize_list_splits_query().unwrap();
                let splits = match query.split_states[0] {
                    SplitState::Staged => {
                        assert_eq!(query.index_uids.unwrap()[0], index_uid_clone);
                        make_splits("test-index", &["a"], SplitState::Staged)
                    }
                    SplitState::MarkedForDeletion => {
                        assert!(query.index_uids.is_none());
                        let expected_deletion_timestamp = OffsetDateTime::now_utc()
                            .unix_timestamp()
                            - split_deletion_grace_period().as_secs() as i64;
                        assert_eq!(
                            query.update_timestamp.end,
                            Bound::Included(expected_deletion_timestamp),
                            "Expected splits query to only select splits which have not been \
                             updated since the expected deletion timestamp.",
                        );
                        assert_eq!(
                            query.update_timestamp.start,
                            Bound::Unbounded,
                            "Expected the lower bound to be unbounded when filtering splits.",
                        );

                        make_splits(
                            "test-index",
                            &["a", "b", "c"],
                            SplitState::MarkedForDeletion,
                        )
                    }
                    _ => panic!("only Staged and MarkedForDeletion expected."),
                };
                let splits = ListSplitsResponse::try_from_splits(splits).unwrap();
                Ok(ServiceStream::from(vec![Ok(splits)]))
            });
        let index_uid_clone = index_uid.clone();
        mock_metastore
            .expect_mark_splits_for_deletion()
            .times(1)
            .returning(move |mark_splits_for_deletion_request| {
                assert_eq!(
                    mark_splits_for_deletion_request.index_uid(),
                    &index_uid_clone
                );
                assert_eq!(mark_splits_for_deletion_request.split_ids, vec!["a"]);
                Ok(EmptyResponse {})
            });
        let index_uid_clone = index_uid.clone();
        mock_metastore
            .expect_delete_splits()
            .times(1)
            .returning(move |delete_splits_request| {
                assert_eq!(delete_splits_request.index_uid(), &index_uid_clone);
                let split_ids = HashSet::<&str>::from_iter(
                    delete_splits_request
                        .split_ids
                        .iter()
                        .map(|split_id| split_id.as_str()),
                );
                let expected_split_ids = HashSet::<&str>::from_iter(["a", "b", "c"]);
                assert_eq!(split_ids, expected_split_ids);

                Ok(EmptyResponse {})
            });

        let result = run_garbage_collect(
            hashmap(index_uid, Arc::new(mock_storage)),
            MetastoreServiceClient::from_mock(mock_metastore),
            STAGED_GRACE_PERIOD,
            split_deletion_grace_period(),
            false,
            None,
            None,
        )
        .await;
        assert!(result.is_ok());
    }

    #[tokio::test]
    async fn test_garbage_collect_calls_dependencies_appropriately() {
        let storage_resolver = StorageResolver::unconfigured();
        let mut mock_metastore = MockMetastoreService::new();
        mock_metastore
            .expect_list_indexes_metadata()
            .times(1)
            .returning(|_list_indexes_request| {
                let indexes_metadata = vec![IndexMetadata::for_test(
                    "test-index",
                    "ram://indexes/test-index",
                )];
                Ok(ListIndexesMetadataResponse::for_test(indexes_metadata))
            });
        mock_metastore
            .expect_list_splits()
            .times(2)
            .returning(|list_splits_request| {
                let query = list_splits_request.deserialize_list_splits_query().unwrap();
                let splits = match query.split_states[0] {
                    SplitState::Staged => {
                        assert_eq!(&query.index_uids.unwrap()[0].index_id, "test-index");
                        make_splits("test-index", &["a"], SplitState::Staged)
                    }
                    SplitState::MarkedForDeletion => {
                        assert!(query.index_uids.is_none());
                        make_splits(
                            "test-index",
                            &["a", "b", "c"],
                            SplitState::MarkedForDeletion,
                        )
                    }
                    _ => panic!("only Staged and MarkedForDeletion expected."),
                };
                let splits = ListSplitsResponse::try_from_splits(splits).unwrap();
                Ok(ServiceStream::from(vec![Ok(splits)]))
            });
        mock_metastore
            .expect_mark_splits_for_deletion()
            .times(1)
            .returning(|mark_splits_for_deletion_request| {
                let index_uid: IndexUid = mark_splits_for_deletion_request.index_uid().clone();
                assert_eq!(&index_uid.index_id, "test-index");
                assert_eq!(mark_splits_for_deletion_request.split_ids, vec!["a"]);
                Ok(EmptyResponse {})
            });
        mock_metastore
            .expect_delete_splits()
            .times(1)
            .returning(|delete_splits_request| {
                let index_uid: IndexUid = delete_splits_request.index_uid().clone();
                assert_eq!(&index_uid.index_id, "test-index");

                let split_ids = HashSet::<&str>::from_iter(
                    delete_splits_request
                        .split_ids
                        .iter()
                        .map(|split_id| split_id.as_str()),
                );
                let expected_split_ids = HashSet::<&str>::from_iter(["a", "b", "c"]);

                assert_eq!(split_ids, expected_split_ids);
                Ok(EmptyResponse {})
            });

        let garbage_collect_actor = GarbageCollector::new(
            MetastoreServiceClient::from_mock(mock_metastore),
            storage_resolver,
        );
        let universe = Universe::with_accelerated_time();
        let (_mailbox, handler) = universe.spawn_builder().spawn(garbage_collect_actor);

        let state_after_initialization = handler.process_pending_and_observe().await.state;
        assert_eq!(state_after_initialization.num_passes, 1);
        assert_eq!(state_after_initialization.num_deleted_files, 3);
        assert_eq!(state_after_initialization.num_deleted_bytes, 60);
        assert_eq!(state_after_initialization.num_failed_splits, 0);
        universe.assert_quit().await;
    }

    #[tokio::test]
    async fn test_garbage_collect_get_calls_repeatedly() {
        let storage_resolver = StorageResolver::unconfigured();
        let mut mock_metastore = MockMetastoreService::new();
        mock_metastore
            .expect_list_indexes_metadata()
            .times(3)
            .returning(|_list_indexes_metadata| {
                let indexes_metadata = vec![IndexMetadata::for_test(
                    "test-index",
                    "ram://indexes/test-index",
                )];
                Ok(ListIndexesMetadataResponse::for_test(indexes_metadata))
            });
        mock_metastore
            .expect_list_splits()
            .times(6)
            .returning(|list_splits_request| {
                let query = list_splits_request.deserialize_list_splits_query().unwrap();
                let splits = match query.split_states[0] {
                    SplitState::Staged => {
                        assert_eq!(&query.index_uids.unwrap()[0].index_id, "test-index");
                        make_splits("test-index", &["a"], SplitState::Staged)
                    }
                    SplitState::MarkedForDeletion => {
                        assert!(&query.index_uids.is_none());
                        make_splits("test-index", &["a", "b"], SplitState::MarkedForDeletion)
                    }
                    _ => panic!("only Staged and MarkedForDeletion expected."),
                };
                let splits = ListSplitsResponse::try_from_splits(splits).unwrap();
                Ok(ServiceStream::from(vec![Ok(splits)]))
            });
        mock_metastore
            .expect_mark_splits_for_deletion()
            .times(3)
            .returning(|mark_splits_for_deletion_request| {
                let index_uid: IndexUid = mark_splits_for_deletion_request.index_uid().clone();
                assert_eq!(&index_uid.index_id, "test-index");
                assert_eq!(mark_splits_for_deletion_request.split_ids, vec!["a"]);
                Ok(EmptyResponse {})
            });
        mock_metastore
            .expect_delete_splits()
            .times(3)
            .returning(|delete_splits_request| {
                let index_uid: IndexUid = delete_splits_request.index_uid().clone();
                assert_eq!(&index_uid.index_id, "test-index");

                let split_ids = HashSet::<&str>::from_iter(
                    delete_splits_request
                        .split_ids
                        .iter()
                        .map(|split_id| split_id.as_str()),
                );
                let expected_split_ids = HashSet::<&str>::from_iter(["a", "b"]);

                assert_eq!(split_ids, expected_split_ids);
                Ok(EmptyResponse {})
            });

        let garbage_collect_actor = GarbageCollector::new(
            MetastoreServiceClient::from_mock(mock_metastore),
            storage_resolver,
        );
        let universe = Universe::with_accelerated_time();
        let (_mailbox, handle) = universe.spawn_builder().spawn(garbage_collect_actor);

        let counters = handle.process_pending_and_observe().await.state;
        assert_eq!(counters.num_passes, 1);
        assert_eq!(counters.num_deleted_files, 2);
        assert_eq!(counters.num_deleted_bytes, 40);
        assert_eq!(counters.num_successful_gc_run, 1);
        assert_eq!(counters.num_failed_storage_resolution, 0);
        assert_eq!(counters.num_failed_gc_run, 0);
        assert_eq!(counters.num_failed_splits, 0);

        // 30 secs later
        universe.sleep(Duration::from_secs(30)).await;
        let counters = handle.process_pending_and_observe().await.state;
        assert_eq!(counters.num_passes, 1);
        assert_eq!(counters.num_deleted_files, 2);
        assert_eq!(counters.num_deleted_bytes, 40);
        assert_eq!(counters.num_successful_gc_run, 1);
        assert_eq!(counters.num_failed_storage_resolution, 0);
        assert_eq!(counters.num_failed_gc_run, 0);
        assert_eq!(counters.num_failed_splits, 0);

        // 60 secs later
        universe.sleep(RUN_INTERVAL).await;
        let counters = handle.process_pending_and_observe().await.state;
        assert_eq!(counters.num_passes, 2);
        assert_eq!(counters.num_deleted_files, 4);
        assert_eq!(counters.num_deleted_bytes, 80);
        assert_eq!(counters.num_successful_gc_run, 2);
        assert_eq!(counters.num_failed_storage_resolution, 0);
        assert_eq!(counters.num_failed_gc_run, 0);
        assert_eq!(counters.num_failed_splits, 0);
        universe.assert_quit().await;
    }

    #[tokio::test]
    async fn test_garbage_collect_get_called_repeatedly_on_failure() {
        let storage_resolver = StorageResolver::unconfigured();
        let mut mock_metastore = MockMetastoreService::new();
        mock_metastore
            .expect_list_indexes_metadata()
            .times(4)
            .returning(|_list_indexes_request| {
                Err(MetastoreError::Db {
                    message: "fail to list indexes".to_string(),
                })
            });

        let garbage_collect_actor = GarbageCollector::new(
            MetastoreServiceClient::from_mock(mock_metastore),
            storage_resolver,
        );
        let universe = Universe::with_accelerated_time();
        let (_mailbox, handle) = universe.spawn_builder().spawn(garbage_collect_actor);

        let counters = handle.process_pending_and_observe().await.state;
        assert_eq!(counters.num_passes, 1);

        universe.sleep(RUN_INTERVAL).await;
        let counters = handle.process_pending_and_observe().await.state;
        assert_eq!(counters.num_passes, 2);

        universe.sleep(RUN_INTERVAL).await;
        let counters = handle.process_pending_and_observe().await.state;
        assert_eq!(counters.num_passes, 3);
        universe.assert_quit().await;
    }

    #[tokio::test]
    async fn test_garbage_collect_fails_to_resolve_storage() {
        let storage_resolver = StorageResolver::unconfigured();
        let mut mock_metastore = MockMetastoreService::new();
        mock_metastore
            .expect_list_indexes_metadata()
            .times(1)
            .returning(move |_list_indexes_request| {
                let indexes_metadata = vec![IndexMetadata::for_test(
                    "test-index",
                    "postgresql://indexes/test-index",
                )];
                Ok(ListIndexesMetadataResponse::for_test(indexes_metadata))
            });

        let garbage_collect_actor = GarbageCollector::new(
            MetastoreServiceClient::from_mock(mock_metastore),
            storage_resolver,
        );
        let universe = Universe::with_accelerated_time();
        let (_mailbox, handle) = universe.spawn_builder().spawn(garbage_collect_actor);

        let counters = handle.process_pending_and_observe().await.state;
        assert_eq!(counters.num_passes, 1);
        assert_eq!(counters.num_deleted_files, 0);
        assert_eq!(counters.num_deleted_bytes, 0);
        assert_eq!(counters.num_successful_gc_run, 0);
        assert_eq!(counters.num_failed_storage_resolution, 1);
        assert_eq!(counters.num_failed_gc_run, 0);
        assert_eq!(counters.num_failed_splits, 0);
        universe.assert_quit().await;
    }

    #[tokio::test]
    async fn test_garbage_collect_fails_to_run_delete_on_one_index() {
        let storage_resolver = StorageResolver::unconfigured();
        let mut mock_metastore = MockMetastoreService::new();
        mock_metastore
            .expect_list_indexes_metadata()
            .times(1)
            .returning(|_list_indexes_request| {
                let indexes_metadata = vec![
                    IndexMetadata::for_test("test-index-1", "ram://indexes/test-index-1"),
                    IndexMetadata::for_test("test-index-2", "ram://indexes/test-index-2"),
                ];
                Ok(ListIndexesMetadataResponse::for_test(indexes_metadata))
            });
        mock_metastore
            .expect_list_splits()
            .times(3)
            .returning(|list_splits_request| {
                let query = list_splits_request.deserialize_list_splits_query().unwrap();
                let splits_ids_string: Vec<String> =
                    (0..8000).map(|seq| format!("split-{seq:04}")).collect();
                let splits_ids: Vec<&str> = splits_ids_string
                    .iter()
                    .map(|string| string.as_str())
                    .collect();
                let mut splits = match query.split_states[0] {
                    SplitState::Staged => {
                        let index_uids = query.index_uids.unwrap();
                        assert_eq!(index_uids.len(), 2);
                        assert!(
                            ["test-index-1", "test-index-2"]
                                .contains(&index_uids[0].index_id.as_ref())
                        );
                        assert!(
                            ["test-index-1", "test-index-2"]
                                .contains(&index_uids[1].index_id.as_ref())
                        );
                        let mut splits = make_splits("test-index-1", &["a"], SplitState::Staged);
                        splits.append(&mut make_splits("test-index-2", &["a"], SplitState::Staged));
                        splits
                    }
                    SplitState::MarkedForDeletion => {
                        assert!(query.index_uids.is_none());
                        assert_eq!(query.limit, Some(10_000));
                        let mut splits =
                            make_splits("test-index-1", &splits_ids, SplitState::MarkedForDeletion);
                        splits.append(&mut make_splits(
                            "test-index-2",
                            &splits_ids,
                            SplitState::MarkedForDeletion,
                        ));
                        splits
                    }
                    _ => panic!("only Staged and MarkedForDeletion expected."),
                };
                if let Some((index_uid, split_id)) = query.after_split {
                    splits.retain(|split| {
                        (
                            &split.split_metadata.index_uid,
                            &split.split_metadata.split_id,
                        ) > (&index_uid, &split_id)
                    });
                }
                splits.truncate(10_000);
                let splits = ListSplitsResponse::try_from_splits(splits).unwrap();
                Ok(ServiceStream::from(vec![Ok(splits)]))
            });
        mock_metastore
            .expect_mark_splits_for_deletion()
            .times(2)
            .returning(|mark_splits_for_deletion_request| {
                let index_uid: IndexUid = mark_splits_for_deletion_request.index_uid().clone();
                assert!(["test-index-1", "test-index-2"].contains(&index_uid.index_id.as_ref()));
                assert_eq!(mark_splits_for_deletion_request.split_ids, vec!["a"]);
                Ok(EmptyResponse {})
            });
        mock_metastore
            .expect_delete_splits()
            .times(3)
            .returning(|delete_splits_request| {
                let index_uid: IndexUid = delete_splits_request.index_uid().clone();
                let split_ids = HashSet::<&str>::from_iter(
                    delete_splits_request
                        .split_ids
                        .iter()
                        .map(|split_id| split_id.as_str()),
                );
                if index_uid.index_id == "test-index-1" {
                    assert_eq!(split_ids.len(), 8000);
                    for seq in 0..8000 {
                        let split_id = format!("split-{seq:04}");
                        assert!(split_ids.contains(&*split_id));
                    }
                } else if split_ids.len() == 2000 {
                    for seq in 0..2000 {
                        let split_id = format!("split-{seq:04}");
                        assert!(split_ids.contains(&*split_id));
                    }
                } else if split_ids.len() == 6000 {
                    for seq in 2000..8000 {
                        let split_id = format!("split-{seq:04}");
                        assert!(split_ids.contains(&*split_id));
                    }
                } else {
                    panic!();
                }

                // This should not cause the whole run to fail and return an error,
                // instead this should simply get logged and return the list of splits
                // which have successfully been deleted.
                if index_uid.index_id == "test-index-2" && split_ids.len() == 2000 {
                    Err(MetastoreError::Db {
                        message: "fail to delete".to_string(),
                    })
                } else {
                    Ok(EmptyResponse {})
                }
            });

        let garbage_collect_actor = GarbageCollector::new(
            MetastoreServiceClient::from_mock(mock_metastore),
            storage_resolver,
        );
        let universe = Universe::with_accelerated_time();
        let (_mailbox, handle) = universe.spawn_builder().spawn(garbage_collect_actor);

        let counters = handle.process_pending_and_observe().await.state;
        assert_eq!(counters.num_passes, 1);
        assert_eq!(counters.num_deleted_files, 14000);
        assert_eq!(counters.num_deleted_bytes, 20 * 14000);
        assert_eq!(counters.num_successful_gc_run, 1);
        assert_eq!(counters.num_failed_storage_resolution, 0);
        assert_eq!(counters.num_failed_gc_run, 0);
        assert_eq!(counters.num_failed_splits, 2000);
        universe.assert_quit().await;
    }
}


================================================
FILE: quickwit/quickwit-janitor/src/actors/mod.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

mod delete_task_pipeline;
mod delete_task_planner;
mod delete_task_service;
mod garbage_collector;
mod retention_policy_executor;

pub use delete_task_service::{DELETE_SERVICE_TASK_DIR_NAME, DeleteTaskService};
pub use garbage_collector::GarbageCollector;
pub use retention_policy_executor::RetentionPolicyExecutor;


================================================
FILE: quickwit/quickwit-janitor/src/actors/retention_policy_executor.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::{HashMap, HashSet};
use std::time::Duration;

use async_trait::async_trait;
use itertools::Itertools;
use quickwit_actors::{Actor, ActorContext, Handler};
use quickwit_config::IndexConfig;
use quickwit_metastore::ListIndexesMetadataResponseExt;
use quickwit_proto::metastore::{
    ListIndexesMetadataRequest, MetastoreService, MetastoreServiceClient,
};
use quickwit_proto::types::IndexUid;
use serde::Serialize;
use tracing::{debug, error, info};

use crate::retention_policy_execution::run_execute_retention_policy;

const RUN_INTERVAL: Duration = Duration::from_secs(60 * 60); // 1 hours

#[derive(Clone, Debug, Default, Serialize)]
pub struct RetentionPolicyExecutorCounters {
    /// The number of refresh the config passes.
    pub num_refresh_passes: usize,

    /// The number of execution passes.
    pub num_execution_passes: usize,

    /// The number of expired splits.
    pub num_expired_splits: usize,
}

#[derive(Debug)]
struct Loop;

#[derive(Debug)]
struct Execute {
    index_uid: IndexUid,
}

/// An actor for scheduling retention policy execution on all indexes.
/// It keeps a list of indexes that have retention policy configured
/// in a cache and periodically update this list.
pub struct RetentionPolicyExecutor {
    metastore: MetastoreServiceClient,
    /// A map of index_id to index metadata that are managed by this executor.
    /// This act as local cache that is periodically updated while taking into
    /// account deleted indexes, updated or removed retention policy on indexes.
    index_configs: HashMap<String, IndexConfig>,
    counters: RetentionPolicyExecutorCounters,
}

impl RetentionPolicyExecutor {
    pub fn new(metastore: MetastoreServiceClient) -> Self {
        Self {
            metastore,
            index_configs: HashMap::new(),
            counters: RetentionPolicyExecutorCounters::default(),
        }
    }

    /// Indexes refresh Loop handler logic.
    /// Should not return an error to prevent the actor from crashing.
    async fn handle_refresh_loop(&mut self, ctx: &ActorContext<Self>) {
        debug!("loading indexes from the metastore");
        self.counters.num_refresh_passes += 1;

        let response = match self
            .metastore
            .list_indexes_metadata(ListIndexesMetadataRequest::all())
            .await
        {
            Ok(response) => response,
            Err(error) => {
                error!(%error, "failed to list indexes from the metastore");
                return;
            }
        };
        let indexes = match response.deserialize_indexes_metadata().await {
            Ok(indexes) => indexes,
            Err(error) => {
                error!(%error, "failed to deserialize indexes metadata");
                return;
            }
        };
        info!("loaded {} indexes from the metastore", indexes.len());

        let deleted_indexes = compute_deleted_indexes(
            self.index_configs.keys().map(String::as_str),
            indexes
                .iter()
                .map(|index_metadata| index_metadata.index_id()),
        );
        if !deleted_indexes.is_empty() {
            debug!(index_ids=%deleted_indexes.iter().join(", "), "deleting indexes from cache");
            for index_id in deleted_indexes {
                self.index_configs.remove(&index_id);
            }
        }
        for index_metadata in indexes {
            let index_uid = index_metadata.index_uid.clone();
            let index_config = index_metadata.into_index_config();
            // We only care about indexes with a retention policy configured.
            let retention_policy = match &index_config.retention_policy_opt {
                Some(policy) => policy,
                None => {
                    // Remove the index from the cache if it exist.
                    // In case where the retention policy was removed this index might have
                    // been inserted in the cache from a previous iteration.
                    self.index_configs.remove(&index_config.index_id);
                    continue;
                }
            };

            // Insert or update the index in the cache.
            if let Some(value) = self.index_configs.get_mut(&index_config.index_id) {
                // Update the cache index entry in case the retention policy was updated.
                *value = index_config;
                continue;
            }

            if let Ok(next_interval) = retention_policy.duration_until_next_evaluation() {
                let message = Execute { index_uid };
                info!(index_id=?index_config.index_id, scheduled_in=?next_interval, "retention-policy-schedule-operation");
                // Inserts & schedule the index's first retention policy execution.
                self.index_configs
                    .insert(index_config.index_id.clone(), index_config);
                ctx.schedule_self_msg(next_interval, message);
            } else {
                error!(index_id=%index_config.index_id, "Couldn't extract the index next schedule time.")
            }
        }
    }
}

#[async_trait]
impl Actor for RetentionPolicyExecutor {
    type ObservableState = RetentionPolicyExecutorCounters;

    fn observable_state(&self) -> Self::ObservableState {
        self.counters.clone()
    }

    fn name(&self) -> String {
        "RetentionPolicyExecutor".to_string()
    }

    async fn initialize(
        &mut self,
        ctx: &ActorContext<Self>,
    ) -> Result<(), quickwit_actors::ActorExitStatus> {
        self.handle(Loop, ctx).await?;
        Ok(())
    }
}

#[async_trait]
impl Handler<Loop> for RetentionPolicyExecutor {
    type Reply = ();

    async fn handle(
        &mut self,
        _: Loop,
        ctx: &ActorContext<Self>,
    ) -> Result<(), quickwit_actors::ActorExitStatus> {
        self.handle_refresh_loop(ctx).await;
        ctx.schedule_self_msg(RUN_INTERVAL, Loop);
        Ok(())
    }
}

#[async_trait]
impl Handler<Execute> for RetentionPolicyExecutor {
    type Reply = ();

    async fn handle(
        &mut self,
        message: Execute,
        ctx: &ActorContext<Self>,
    ) -> Result<(), quickwit_actors::ActorExitStatus> {
        info!(index_id=%message.index_uid.index_id, "retention-policy-execute-operation");
        self.counters.num_execution_passes += 1;

        let index_config = match self.index_configs.get(&message.index_uid.index_id) {
            Some(config) => config,
            None => {
                debug!(index_id=%message.index_uid.index_id, "the index might have been deleted");
                return Ok(());
            }
        };

        let retention_policy = index_config
            .retention_policy_opt
            .as_ref()
            .expect("Expected index to have retention policy configure.");

        let execution_result = run_execute_retention_policy(
            message.index_uid.clone(),
            self.metastore.clone(),
            retention_policy,
            ctx,
        )
        .await;
        match execution_result {
            Ok(splits) => self.counters.num_expired_splits += splits.len(),
            Err(error) => {
                error!(index_id=%message.index_uid.index_id, error=?error, "Failed to execute the retention policy on the index.")
            }
        }

        if let Ok(next_interval) = retention_policy.duration_until_next_evaluation() {
            info!(index_id=?index_config.index_id, scheduled_in=?next_interval, "retention-policy-schedule-operation");
            ctx.schedule_self_msg(next_interval, message);
        } else {
            // Since we have failed to schedule next execution for this index,
            // we remove it from the cache for it to be retried next time it gets
            // added back by the RetentionPolicyExecutor cache refresh loop.
            self.index_configs.remove(&message.index_uid.index_id);
            error!(index_id=%message.index_uid.index_id, "couldn't extract the index next schedule interval");
        }
        Ok(())
    }
}

/// Extract the list of deleted indexes.
fn compute_deleted_indexes<'a>(
    cached_indexes: impl Iterator<Item = &'a str>,
    indexes: impl Iterator<Item = &'a str>,
) -> HashSet<String> {
    let cached_set: HashSet<_> = cached_indexes.collect();
    let indexes_set: HashSet<_> = indexes.collect();
    (&cached_set - &indexes_set)
        .into_iter()
        .map(ToString::to_string)
        .collect()
}

#[cfg(test)]
mod tests {
    use std::ops::RangeInclusive;

    use mockall::Sequence;
    use quickwit_actors::Universe;
    use quickwit_common::ServiceStream;
    use quickwit_config::RetentionPolicy;
    use quickwit_metastore::{
        IndexMetadata, ListSplitsRequestExt, ListSplitsResponseExt, Split, SplitMetadata,
        SplitState,
    };
    use quickwit_proto::metastore::{
        EmptyResponse, ListIndexesMetadataResponse, ListSplitsResponse, MockMetastoreService,
    };

    use super::*;

    #[derive(Debug)]
    struct AssertState(Vec<(&'static str, Option<&'static str>)>);

    #[async_trait]
    impl Handler<AssertState> for RetentionPolicyExecutor {
        type Reply = ();

        async fn handle(
            &mut self,
            message: AssertState,
            _ctx: &ActorContext<Self>,
        ) -> Result<Self::Reply, quickwit_actors::ActorExitStatus> {
            let indexes_set: HashSet<_> = self
                .index_configs
                .values()
                .map(|im| (&im.index_id, &im.retention_policy_opt))
                .collect();

            let expected_indexes: Vec<IndexConfig> = make_indexes(&message.0)
                .into_iter()
                .map(IndexMetadata::into_index_config)
                .collect();
            let expected_indexes_set: HashSet<_> = expected_indexes
                .iter()
                .map(|im| (&im.index_id, &im.retention_policy_opt))
                .collect();
            assert_eq!(
                indexes_set, expected_indexes_set,
                "Mismatch set of indexes."
            );
            Ok(())
        }
    }

    const EVALUATION_SCHEDULE: &str = "hourly";

    fn make_index(index_id: &str, retention_period_opt: Option<&str>) -> IndexConfig {
        let mut index = IndexConfig::for_test(index_id, &format!("ram://indexes/{index_id}"));
        if let Some(retention_period) = retention_period_opt {
            index.retention_policy_opt = Some(RetentionPolicy {
                retention_period: retention_period.to_string(),
                evaluation_schedule: EVALUATION_SCHEDULE.to_string(),
            })
        }
        index
    }

    fn make_indexes(index_ids: &[(&str, Option<&str>)]) -> Vec<IndexMetadata> {
        index_ids
            .iter()
            .map(|(index_id, retention_period_opt)| make_index(index_id, *retention_period_opt))
            .map(IndexMetadata::new)
            .collect()
    }

    fn make_split(split_id: &str, time_range: Option<RangeInclusive<i64>>) -> Split {
        Split {
            split_metadata: SplitMetadata {
                split_id: split_id.to_string(),
                footer_offsets: 5..20,
                time_range,
                ..Default::default()
            },
            split_state: SplitState::Published,
            update_timestamp: 0,
            publish_timestamp: Some(100),
        }
    }

    // Uses the retention policy scheduler to calculate
    // how much time to advance for the execution to take place.
    fn shift_time_by() -> Duration {
        let scheduler = RetentionPolicy {
            retention_period: "".to_string(),
            evaluation_schedule: EVALUATION_SCHEDULE.to_string(),
        };

        scheduler.duration_until_next_evaluation().unwrap() + Duration::from_secs(1)
    }

    #[tokio::test]
    async fn test_retention_executor_refresh() -> anyhow::Result<()> {
        let mut mock_metastore = MockMetastoreService::new();

        let mut sequence = Sequence::new();
        mock_metastore
            .expect_list_splits()
            .times(..)
            .returning(|_| Ok(ServiceStream::empty()));
        mock_metastore
            .expect_list_indexes_metadata()
            .times(1)
            .in_sequence(&mut sequence)
            .returning(|_list_indexes_request| {
                let indexes_metadata = make_indexes(&[
                    ("index-1", Some("1 hour")),
                    ("index-2", Some("1 hour")),
                    ("index-3", None),
                ]);
                Ok(ListIndexesMetadataResponse::for_test(indexes_metadata))
            });

        mock_metastore
            .expect_list_indexes_metadata()
            .times(1)
            .in_sequence(&mut sequence)
            .returning(|_list_indexes_request| {
                let indexes_metadata = make_indexes(&[
                    ("index-1", Some("1 hour")),
                    ("index-2", Some("2 hour")),
                    ("index-3", Some("1 hour")),
                ]);
                Ok(ListIndexesMetadataResponse::for_test(indexes_metadata))
            });

        mock_metastore
            .expect_list_indexes_metadata()
            .times(1)
            .in_sequence(&mut sequence)
            .returning(|_list_indexes_request| {
                let indexes_metadata = make_indexes(&[
                    ("index-2", Some("1 hour")),
                    ("index-4", Some("1 hour")),
                    ("index-5", None),
                ]);
                Ok(ListIndexesMetadataResponse::for_test(indexes_metadata))
            });

        let retention_policy_executor =
            RetentionPolicyExecutor::new(MetastoreServiceClient::from_mock(mock_metastore));
        let universe = Universe::with_accelerated_time();
        let (mailbox, handle) = universe.spawn_builder().spawn(retention_policy_executor);

        let counters = handle.process_pending_and_observe().await.state;
        assert_eq!(counters.num_refresh_passes, 1);
        mailbox
            .ask(AssertState(vec![
                ("index-1", Some("1 hour")),
                ("index-2", Some("1 hour")),
            ]))
            .await?;

        universe.sleep(RUN_INTERVAL + Duration::from_secs(5)).await;
        let counters = handle.process_pending_and_observe().await.state;
        assert_eq!(counters.num_refresh_passes, 2);
        mailbox
            .ask(AssertState(vec![
                ("index-1", Some("1 hour")),
                ("index-2", Some("2 hour")),
                ("index-3", Some("1 hour")),
            ]))
            .await?;

        universe.sleep(RUN_INTERVAL + Duration::from_secs(5)).await;
        let counters = handle.process_pending_and_observe().await.state;
        assert_eq!(counters.num_refresh_passes, 3);
        mailbox
            .ask(AssertState(vec![
                ("index-2", Some("1 hour")),
                ("index-4", Some("1 hour")),
            ]))
            .await?;
        universe.assert_quit().await;

        Ok(())
    }

    #[tokio::test]
    async fn test_retention_policy_execution_calls_dependencies() -> anyhow::Result<()> {
        let mut mock_metastore = MockMetastoreService::new();
        mock_metastore
            .expect_list_indexes_metadata()
            .times(..)
            .returning(|_list_indexes_request| {
                let indexes_metadata = make_indexes(&[
                    ("index-1", Some("2 hour")),
                    ("index-2", Some("1 hour")),
                    ("index-3", None),
                ]);
                Ok(ListIndexesMetadataResponse::for_test(indexes_metadata))
            });

        mock_metastore
            .expect_list_splits()
            .times(2..=4)
            .returning(|list_splits_request| {
                let query = list_splits_request.deserialize_list_splits_query().unwrap();
                assert_eq!(query.split_states, &[SplitState::Published]);
                let splits = match query.index_uids.unwrap()[0].index_id.as_ref() {
                    "index-1" => {
                        vec![
                            make_split("split-1", Some(1000..=5000)),
                            make_split("split-2", Some(2000..=6000)),
                            make_split("split-3", None),
                        ]
                    }
                    "index-2" => Vec::new(),
                    unknown => panic!("Unknown index: `{unknown}`."),
                };
                let splits_response = ListSplitsResponse::try_from_splits(splits).unwrap();
                Ok(ServiceStream::from(vec![Ok(splits_response)]))
            });

        mock_metastore
            .expect_mark_splits_for_deletion()
            .times(1..=3)
            .returning(|mark_splits_for_deletion_request| {
                let index_uid: IndexUid = mark_splits_for_deletion_request.index_uid().clone();
                assert_eq!(index_uid.index_id, "index-1");
                assert_eq!(
                    mark_splits_for_deletion_request.split_ids,
                    ["split-1", "split-2"]
                );
                Ok(EmptyResponse {})
            });

        let retention_policy_executor =
            RetentionPolicyExecutor::new(MetastoreServiceClient::from_mock(mock_metastore));
        let universe = Universe::with_accelerated_time();
        let (_mailbox, handle) = universe.spawn_builder().spawn(retention_policy_executor);

        let counters = handle.process_pending_and_observe().await.state;
        assert_eq!(counters.num_execution_passes, 0);
        assert_eq!(counters.num_expired_splits, 0);

        universe.sleep(shift_time_by()).await;
        let counters = handle.process_pending_and_observe().await.state;
        assert_eq!(counters.num_execution_passes, 2);
        assert_eq!(counters.num_expired_splits, 2);
        universe.assert_quit().await;

        Ok(())
    }
}


================================================
FILE: quickwit/quickwit-janitor/src/error.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use quickwit_common::rate_limited_error;
use quickwit_proto::metastore::MetastoreError;
use quickwit_proto::{ServiceError, ServiceErrorCode};
use serde::{Deserialize, Serialize};
use thiserror::Error;

/// Janitor errors.
#[allow(missing_docs)]
#[derive(Error, Debug, Serialize, Deserialize)]
pub enum JanitorError {
    #[error("internal error: `{0}`")]
    Internal(String),
    #[error("invalid delete query: `{0}`")]
    InvalidDeleteQuery(String),
    #[error("metastore error: `{0}`")]
    Metastore(#[from] MetastoreError),
}

impl ServiceError for JanitorError {
    fn error_code(&self) -> ServiceErrorCode {
        match self {
            Self::Internal(err_msg) => {
                rate_limited_error!(limit_per_min = 6, "janitor internal error {err_msg}");
                ServiceErrorCode::Internal
            }
            Self::InvalidDeleteQuery(_) => ServiceErrorCode::BadRequest,
            Self::Metastore(metastore_error) => metastore_error.error_code(),
        }
    }
}


================================================
FILE: quickwit/quickwit-janitor/src/janitor_service.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use async_trait::async_trait;
use quickwit_actors::{
    Actor, ActorContext, ActorExitStatus, ActorHandle, ActorState, Handler, Healthz,
};
use serde_json::{Value as JsonValue, json};

use crate::actors::{DeleteTaskService, GarbageCollector, RetentionPolicyExecutor};

pub struct JanitorService {
    delete_task_service_handle: Option<ActorHandle<DeleteTaskService>>,
    garbage_collector_handle: ActorHandle<GarbageCollector>,
    retention_policy_executor_handle: ActorHandle<RetentionPolicyExecutor>,
}

impl JanitorService {
    pub fn new(
        delete_task_service_handle: Option<ActorHandle<DeleteTaskService>>,
        garbage_collector_handle: ActorHandle<GarbageCollector>,
        retention_policy_executor_handle: ActorHandle<RetentionPolicyExecutor>,
    ) -> Self {
        Self {
            delete_task_service_handle,
            garbage_collector_handle,
            retention_policy_executor_handle,
        }
    }

    fn is_healthy(&self) -> bool {
        let delete_task_is_not_failure: bool =
            if let Some(delete_task_service_handle) = &self.delete_task_service_handle {
                delete_task_service_handle.state() != ActorState::Failure
            } else {
                true
            };
        delete_task_is_not_failure
            && self.garbage_collector_handle.state() != ActorState::Failure
            && self.retention_policy_executor_handle.state() != ActorState::Failure
    }
}

#[async_trait]
impl Actor for JanitorService {
    type ObservableState = JsonValue;

    fn name(&self) -> String {
        "JanitorService".to_string()
    }

    fn observable_state(&self) -> Self::ObservableState {
        json!({})
    }
}

#[async_trait]
impl Handler<Healthz> for JanitorService {
    type Reply = bool;

    async fn handle(
        &mut self,
        _message: Healthz,
        _ctx: &ActorContext<Self>,
    ) -> Result<Self::Reply, ActorExitStatus> {
        Ok(self.is_healthy())
    }
}


================================================
FILE: quickwit/quickwit-janitor/src/lib.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#![deny(clippy::disallowed_methods)]

use quickwit_actors::{Mailbox, Universe};
use quickwit_common::pubsub::EventBroker;
use quickwit_config::NodeConfig;
use quickwit_indexing::actors::MergeSchedulerService;
use quickwit_metastore::SplitInfo;
use quickwit_proto::metastore::MetastoreServiceClient;
use quickwit_search::SearchJobPlacer;
use quickwit_storage::StorageResolver;
use tracing::info;

pub mod actors;
pub mod error;
mod janitor_service;
mod metrics;
mod retention_policy_execution;

pub use janitor_service::JanitorService;

use crate::actors::{DeleteTaskService, GarbageCollector, RetentionPolicyExecutor};

#[derive(utoipa::OpenApi)]
#[openapi(components(schemas(SplitInfo)))]
/// Schema used for the OpenAPI generation which are apart of this crate.
pub struct JanitorApiSchemas;

pub async fn start_janitor_service(
    universe: &Universe,
    config: &NodeConfig,
    metastore: MetastoreServiceClient,
    search_job_placer: SearchJobPlacer,
    storage_resolver: StorageResolver,
    event_broker: EventBroker,
    run_delete_task_service: bool,
) -> anyhow::Result<Mailbox<JanitorService>> {
    info!("starting janitor service");
    let garbage_collector = GarbageCollector::new(metastore.clone(), storage_resolver.clone());
    let (_, garbage_collector_handle) = universe.spawn_builder().spawn(garbage_collector);

    let retention_policy_executor = RetentionPolicyExecutor::new(metastore.clone());
    let (_, retention_policy_executor_handle) =
        universe.spawn_builder().spawn(retention_policy_executor);
    let delete_task_service_handle = if run_delete_task_service {
        let delete_task_service = DeleteTaskService::new(
            metastore,
            search_job_placer,
            storage_resolver,
            config.data_dir_path.clone(),
            config.indexer_config.max_concurrent_split_uploads,
            universe.get_or_spawn_one::<MergeSchedulerService>(),
            event_broker,
        )
        .await?;
        let (_, delete_task_service_handle) = universe.spawn_builder().spawn(delete_task_service);
        Some(delete_task_service_handle)
    } else {
        tracing::warn!("delete task service is disabled: delete queries will not be processed");
        None
    };

    let janitor_service = JanitorService::new(
        delete_task_service_handle,
        garbage_collector_handle,
        retention_policy_executor_handle,
    );
    let (janitor_service_mailbox, _janitor_service_handle) =
        universe.spawn_builder().spawn(janitor_service);
    Ok(janitor_service_mailbox)
}


================================================
FILE: quickwit/quickwit-janitor/src/metrics.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use once_cell::sync::Lazy;
use quickwit_common::metrics::{
    IntCounter, IntCounterVec, IntGaugeVec, new_counter, new_counter_vec, new_gauge_vec,
};

pub struct JanitorMetrics {
    pub ongoing_num_delete_operations_total: IntGaugeVec<1>,
    pub gc_deleted_splits: IntCounterVec<1>,
    pub gc_deleted_bytes: IntCounter,
    pub gc_runs: IntCounterVec<1>,
    pub gc_seconds_total: IntCounter,
    // TODO having a current run duration which is 0|undefined out of run, and returns `now -
    // start_time` during a run would be nice
}

impl Default for JanitorMetrics {
    fn default() -> Self {
        JanitorMetrics {
            ongoing_num_delete_operations_total: new_gauge_vec(
                "ongoing_num_delete_operations_total",
                "Num of ongoing delete operations (per index).",
                "quickwit_janitor",
                &[],
                ["index"],
            ),
            gc_deleted_splits: new_counter_vec(
                "gc_deleted_splits_total",
                "Total number of splits deleted by the garbage collector.",
                "quickwit_janitor",
                &[],
                ["result"],
            ),
            gc_deleted_bytes: new_counter(
                "gc_deleted_bytes_total",
                "Total number of bytes deleted by the garbage collector.",
                "quickwit_janitor",
                &[],
            ),
            gc_runs: new_counter_vec(
                "gc_runs_total",
                "Total number of garbage collector execition.",
                "quickwit_janitor",
                &[],
                ["result"],
            ),
            gc_seconds_total: new_counter(
                "gc_seconds_total",
                "Total time spent running the garbage collector",
                "quickwit_janitor",
                &[],
            ),
        }
    }
}

/// `JANITOR_METRICS` exposes a bunch of related metrics through a prometheus
/// endpoint.
pub static JANITOR_METRICS: Lazy<JanitorMetrics> = Lazy::new(JanitorMetrics::default);


================================================
FILE: quickwit/quickwit-janitor/src/retention_policy_execution.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use quickwit_actors::ActorContext;
use quickwit_common::pretty::PrettySample;
use quickwit_config::RetentionPolicy;
use quickwit_metastore::{
    ListSplitsQuery, ListSplitsRequestExt, MetastoreServiceStreamSplitsExt, SplitMetadata,
    SplitState,
};
use quickwit_proto::metastore::{
    ListSplitsRequest, MarkSplitsForDeletionRequest, MetastoreService, MetastoreServiceClient,
};
use quickwit_proto::types::{IndexUid, SplitId};
use time::OffsetDateTime;
use tracing::{info, warn};

use crate::actors::RetentionPolicyExecutor;

/// Detect all expired splits based a retention policy and
/// only mark them as `MarkedForDeletion`. Actual split deletion
/// is taken care of by the garbage collector.
///
/// * `index_id` - The target index id.
/// * `metastore` - The metastore managing the target index.
/// * `retention_policy` - The retention policy to used to evaluate the splits.
/// * `ctx_opt` - A context for reporting progress (only useful within quickwit actor).
pub async fn run_execute_retention_policy(
    index_uid: IndexUid,
    metastore: MetastoreServiceClient,
    retention_policy: &RetentionPolicy,
    ctx: &ActorContext<RetentionPolicyExecutor>,
) -> anyhow::Result<Vec<SplitMetadata>> {
    // Select splits that are published and older than the retention period.
    let retention_period = retention_policy.retention_period()?;
    let current_timestamp = OffsetDateTime::now_utc().unix_timestamp();
    let max_retention_timestamp = current_timestamp - retention_period.as_secs() as i64;
    let query = ListSplitsQuery::for_index(index_uid.clone())
        .with_split_state(SplitState::Published)
        .with_max_time_range_end(max_retention_timestamp);

    let list_splits_request = ListSplitsRequest::try_from_list_splits_query(&query)?;
    let (expired_splits, ignored_splits): (Vec<SplitMetadata>, Vec<SplitMetadata>) = ctx
        .protect_future(metastore.list_splits(list_splits_request))
        .await?
        .collect_splits_metadata()
        .await?
        .into_iter()
        .partition(|split_metadata| split_metadata.time_range.is_some());

    if !ignored_splits.is_empty() {
        let ignored_split_ids: Vec<String> = ignored_splits
            .into_iter()
            .map(|split_metadata| split_metadata.split_id)
            .collect();
        warn!(
            index_id=%index_uid.index_id,
            split_ids=?PrettySample::new(&ignored_split_ids, 5),
            "Retention policy could not be applied to {} splits because they lack a timestamp range.",
            ignored_split_ids.len()
        );
    }
    if expired_splits.is_empty() {
        return Ok(expired_splits);
    }
    // Mark the expired splits for deletion.
    let expired_split_ids: Vec<SplitId> = expired_splits
        .iter()
        .map(|split_metadata| split_metadata.split_id.to_string())
        .collect();
    info!(
        index_id=%index_uid.index_id,
        split_ids=?PrettySample::new(&expired_split_ids, 5),
        "Marking {} splits for deletion based on retention policy.",
        expired_split_ids.len()
    );
    let mark_splits_for_deletion_request =
        MarkSplitsForDeletionRequest::new(index_uid, expired_split_ids);
    ctx.protect_future(metastore.mark_splits_for_deletion(mark_splits_for_deletion_request))
        .await?;
    Ok(expired_splits)
}


================================================
FILE: quickwit/quickwit-lambda-client/Cargo.toml
================================================
[package]
name = "quickwit-lambda-client"
description = "AWS Lambda client for Quickwit leaf search invocation and deployment"

version.workspace = true
edition.workspace = true
homepage.workspace = true
documentation.workspace = true
repository.workspace = true
authors.workspace = true
license.workspace = true

[dependencies]
anyhow = { workspace = true }
async-trait = { workspace = true }
aws-config = { workspace = true }
aws-sdk-lambda = { workspace = true }
base64 = { workspace = true }
md5 = { workspace = true }
prost = { workspace = true }
serde_json = { workspace = true }
once_cell = { workspace = true }
tokio = { workspace = true }
tracing = { workspace = true }

quickwit-common = { workspace = true }
quickwit-config = { workspace = true }
quickwit-lambda-server = { workspace = true }
quickwit-proto = { workspace = true }
quickwit-search = { workspace = true }

[dev-dependencies]
aws-smithy-mocks = { workspace = true }
aws-sdk-lambda = { workspace = true, features = ["test-util"] }
bytesize = { workspace = true }
tokio = { workspace = true, features = ["test-util", "macros"] }

# Required for complicated reasons. quickwit-storage checks that we
# do use preserve order with serde. aws forces that feature. We disable
# the check by switching on its testsuite feature.
quickwit-storage = { workspace = true, features = ["testsuite"] }

[build-dependencies]
sha2 = { workspace = true }
ureq = { workspace = true }


================================================
FILE: quickwit/quickwit-lambda-client/README.md
================================================
# Quickwit Lambda

Quickwit supports offloading leaf search to AWS Lambda for horizontal scaling.
The Lambda function is built separately and embedded into Quickwit's binary,
allowing Quickwit to auto-deploy the function at startup.

## Architecture

- **quickwit-lambda-server**: The Lambda function binary that executes leaf searches
- **quickwit-lambda-client**: The client that invokes Lambda and embeds the Lambda zip for auto-deployment

## Release Process

### 1. Tag the release

Push a tag with the `lambda-` prefix:

```bash
git tag lambda-v0.8.0
git push origin lambda-v0.8.0
```

This triggers the `publish_lambda.yaml` GitHub Action which:
- Cross-compiles the Lambda binary for ARM64
- Creates a zip file named `quickwit-aws-lambda-v0.8.0-aarch64.zip`
- Uploads it as a **draft** GitHub release

### 2. Publish the release

Go to GitHub releases and manually publish the draft release to make the
artifact URL publicly accessible.

### 3. Update the embedded Lambda URL

Update `LAMBDA_ZIP_URL` in `quickwit-lambda-client/build.rs` to point to the
new release:

```rust
const LAMBDA_ZIP_URL: &str = "https://github.com/quickwit-oss/quickwit/releases/download/lambda-v0.8.0/quickwit-aws-lambda-v0.8.0-aarch64.zip";
```

### 4. Versioning

The Lambda client uses content-based versioning:
- An MD5 hash of the Lambda zip is computed at build time
- This hash is embedded in the Lambda function description as `quickwit:{version}-{hash_short}`
- When Quickwit starts, it checks if a matching version exists before deploying

This ensures that:
- Different Quickwit builds with the same Lambda binary share the same Lambda version
- Updating the Lambda binary automatically triggers a new deployment


================================================
FILE: quickwit/quickwit-lambda-client/build.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

//! Build script for quickwit-lambda-client.
//!
//! This script downloads the pre-built Lambda zip from a GitHub release
//! and places it in OUT_DIR for embedding via include_bytes!
//!
//! The Lambda binary is built separately in CI and published as a GitHub release.

use std::env;
use std::path::{Path, PathBuf};

use sha2::{Digest, Sha256};

/// URL to download the pre-built Lambda zip from GitHub releases.
/// This should be updated when a new Lambda binary is released.
const LAMBDA_ZIP_URL: &str = "https://github.com/quickwit-oss/quickwit/releases/download/lambda-ff6fdfa5/quickwit-aws-lambda--aarch64.zip";

/// Expected SHA256 hash of the Lambda zip artifact.
/// Must be updated alongside LAMBDA_ZIP_URL when a new Lambda binary is released.
const LAMBDA_ZIP_SHA256: &str = "fa940f44178e28460c21e44bb2610b776542b9b97db66a53bc65b10cad653b90";

/// AWS Lambda direct upload limit is 50MB.
/// Larger artifacts must be uploaded via S3.
const MAX_LAMBDA_ZIP_SIZE: usize = 50 * 1024 * 1024;

fn main() {
    println!("cargo:rerun-if-changed=build.rs");

    let out_dir = PathBuf::from(env::var("OUT_DIR").expect("OUT_DIR not set"));
    let zip_path = out_dir.join("lambda_bootstrap.zip");

    fetch_lambda_zip(&zip_path);

    // Export first 8 hex chars of the SHA256 as environment variable.
    // This is used to create a unique qualifier for Lambda versioning.
    let hash_short = &LAMBDA_ZIP_SHA256[..8];
    println!("cargo:rustc-env=LAMBDA_BINARY_HASH={}", hash_short);
    println!("lambda binary hash (short): {}", hash_short);
}

/// Fetch the Lambda zip and save it to `local_cache_path`.
///
/// If a cached file already exists with the correct SHA256, this is a no-op.
/// If the hash doesn't match (stale artifact), the file is deleted and re-downloaded.
/// If no cached file exists, the artifact is downloaded fresh.
///
/// This function panics if a problem happens.
fn fetch_lambda_zip(local_cache_path: &Path) {
    // Try the cache first.
    if let Ok(data) = std::fs::read(local_cache_path) {
        let actual_hash = sha256_hex(&data);
        if actual_hash == LAMBDA_ZIP_SHA256 {
            println!("using cached Lambda zip from {:?}", local_cache_path);
            return;
        }
        println!("cargo:warning=cached Lambda zip has wrong SHA256, re-downloading");
        std::fs::remove_file(local_cache_path).expect("failed to delete stale cached zip");
    }

    // Download from the remote URL.
    println!(
        "cargo:warning=downloading Lambda zip from: {}",
        LAMBDA_ZIP_URL
    );
    let data = download_lambda_zip(LAMBDA_ZIP_URL).expect("failed to download Lambda zip");

    // Verify SHA256 BEFORE writing to disk.
    let actual_hash = sha256_hex(&data);
    if actual_hash != LAMBDA_ZIP_SHA256 {
        panic!(
            "SHA256 mismatch for Lambda zip!\n  expected: {LAMBDA_ZIP_SHA256}\n  actual:   \
             {actual_hash}\nThe artifact at {LAMBDA_ZIP_URL} may have been tampered with."
        );
    }

    std::fs::write(local_cache_path, &data).expect("failed to write zip file");
    println!(
        "cargo:warning=downloaded Lambda zip to {:?} ({} bytes)",
        local_cache_path,
        data.len()
    );
}

fn sha256_hex(data: &[u8]) -> String {
    format!("{:x}", Sha256::digest(data))
}

fn download_lambda_zip(url: &str) -> Result<Vec<u8>, String> {
    let response = ureq::get(url)
        .call()
        .map_err(|err| format!("HTTP request failed: {err}"))?;
    // Set limit higher than MAX_LAMBDA_ZIP_SIZE so we can detect oversized artifacts.
    let data = response
        .into_body()
        .with_config()
        .limit(MAX_LAMBDA_ZIP_SIZE as u64 + 1)
        .read_to_vec()
        .map_err(|err| format!("failed to read response body: {err}"))?;
    if data.len() > MAX_LAMBDA_ZIP_SIZE {
        return Err(format!(
            "Lambda zip is too large ({} bytes, max {} bytes).\nAWS Lambda does not support \
             direct upload of binaries larger than 50MB.\nWorkaround: upload the Lambda zip to S3 \
             and deploy from there instead.",
            data.len(),
            MAX_LAMBDA_ZIP_SIZE
        ));
    }
    Ok(data)
}


================================================
FILE: quickwit/quickwit-lambda-client/src/deploy.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

//! Lambda function deployment for auto-deploy feature.
//!
//! This module provides functionality to automatically deploy or update
//! the Lambda function used for leaf search operations.
//!
//! # Versioning Strategy
//!
//! We use AWS Lambda published versions with description-based identification:
//! - Each published version has a description like `quickwit:0_8_0-fa752891`
//! - We list versions to find one matching our qualifier
//! - We invoke the specific version number (not $LATEST)
//! - Old versions are garbage collected (keep current + top 5 most recent)

use std::collections::HashMap;
use std::sync::OnceLock;

use anyhow::{Context, anyhow};
use aws_sdk_lambda::Client as LambdaClient;
use aws_sdk_lambda::error::SdkError;
use aws_sdk_lambda::primitives::Blob;
use aws_sdk_lambda::types::{
    Architecture, Environment, FunctionCode, LastUpdateStatus, Runtime, State,
};
use quickwit_config::{LambdaConfig, LambdaDeployConfig};
use quickwit_search::LambdaLeafSearchInvoker;
use tracing::{debug, info};

use crate::invoker::create_lambda_invoker_for_version;

/// Embedded Lambda binary (arm64, compressed).
/// This is included at compile time.
const LAMBDA_BINARY: &[u8] = include_bytes!(concat!(env!("OUT_DIR"), "/lambda_bootstrap.zip"));

/// Prefix for version descriptions to identify Quickwit-managed versions.
const VERSION_DESCRIPTION_PREFIX: &str = "quickwit";

/// Number of recent versions to keep during garbage collection (in addition to current).
const GC_KEEP_RECENT_VERSIONS: usize = 5;

/// Returns the Lambda qualifier combining version and binary hash.
/// Format: "{quickwit_version}-{hash_short}" with dots replaced by underscores.
/// Example: "0_8_0-fa752891"
fn lambda_qualifier() -> &'static str {
    static LAMBDA_QUALIFIER: OnceLock<String> = OnceLock::new();
    LAMBDA_QUALIFIER
        .get_or_init(|| {
            format!(
                "{}_{}",
                env!("CARGO_PKG_VERSION").replace('.', "_"),
                env!("LAMBDA_BINARY_HASH")
            )
        })
        .as_str()
}

/// Returns the version description for our qualifier.
///
/// We also pass the deploy config, as we want the function to be redeployed
/// if the deploy config is changed.
fn version_description(deploy_config_opt: Option<&LambdaDeployConfig>) -> String {
    if let Some(deploy_config) = deploy_config_opt {
        let memory_size_mib = deploy_config.memory_size.as_mib() as u64;
        let execution_role_arn_digest: String = format!(
            "{:x}",
            md5::compute(deploy_config.execution_role_arn.as_bytes())
        );
        format!(
            "{}_{}_{}_{}s_{}",
            VERSION_DESCRIPTION_PREFIX,
            lambda_qualifier(),
            memory_size_mib,
            deploy_config.invocation_timeout_secs,
            &execution_role_arn_digest[..5]
        )
    } else {
        format!(
            "{}_{}_nodeploy",
            VERSION_DESCRIPTION_PREFIX,
            lambda_qualifier()
        )
    }
}

/// Get or deploy the Lambda function and return an invoker.
///
/// This function:
/// 1. Lists existing Lambda versions to find one matching our description
/// 2. If not found, (and if a deploy config is provided) attempt to deploy the embedded Lambda
///    binary
/// 3. Garbage collects old versions (keeps current + 5 most recent)
/// 4. Returns an invoker configured to call the specific version
///
/// The qualifier is computed from the Quickwit version and Lambda binary hash,
/// ensuring the deployed Lambda matches the embedded binary.
pub async fn try_get_or_deploy_invoker(
    lambda_config: &LambdaConfig,
) -> anyhow::Result<impl LambdaLeafSearchInvoker> {
    let aws_config = aws_config::load_defaults(aws_config::BehaviorVersion::latest()).await;
    let client = LambdaClient::new(&aws_config);
    let function_name = &lambda_config.function_name;
    let target_description = version_description(lambda_config.auto_deploy.as_ref());

    info!(
        function_name = %function_name,
        qualifier = %lambda_qualifier(),
        "looking for Lambda function version"
    );

    let version = find_or_deploy_version(
        &client,
        function_name,
        &target_description,
        lambda_config.auto_deploy.as_ref(),
    )
    .await?;

    // Spawn background garbage collection (best effort, non-blocking)
    let gc_client = client.clone();
    let gc_function_name = function_name.clone();
    let gc_version = version.clone();
    tokio::spawn(async move {
        if let Err(e) =
            garbage_collect_old_versions(&gc_client, &gc_function_name, &gc_version).await
        {
            info!(error = %e, "failed to garbage collect old Lambda versions");
        }
    });

    // Create and return the invoker
    let invoker = create_lambda_invoker_for_version(function_name.clone(), version)
        .await
        .context("failed to create Lambda invoker")?;

    info!("created the lambda invoker");

    Ok(invoker)
}

/// Find a Lambda version with a description matching our qualifier.
///
/// If none is found and a deploy config is provided, attempt to deploy a new version.
///
/// Returns the version number as a string (because it is a string on AWS side, e.g.: "7") if found.
async fn find_or_deploy_version(
    client: &LambdaClient,
    function_name: &str,
    target_description: &str,
    deploy_config: Option<&LambdaDeployConfig>,
) -> anyhow::Result<String> {
    if let Some(version) = find_matching_version(client, function_name, target_description).await? {
        info!(
            function_name = %function_name,
            version = %version,
            "found existing Lambda version"
        );
        return Ok(version);
    }

    let deploy_config = deploy_config.with_context(|| {
        format!(
            "no Lambda version found with description '{}' and auto_deploy is not configured. \
             Either deploy the Lambda function manually or enable auto_deploy.",
            target_description
        )
    })?;

    info!(
        function_name = %function_name,
        "no matching version found, deploying Lambda function"
    );

    deploy_lambda_function(client, function_name, deploy_config).await
}

async fn find_matching_version(
    client: &LambdaClient,
    function_name: &str,
    target_description: &str,
) -> anyhow::Result<Option<String>> {
    let mut marker: Option<String> = None;

    loop {
        let mut request = client
            .list_versions_by_function()
            .function_name(function_name);

        if let Some(m) = marker {
            request = request.marker(m);
        }

        let response = match request.send().await {
            Ok(resp) => resp,
            Err(SdkError::ServiceError(err)) if err.err().is_resource_not_found_exception() => {
                info!(
                    function_name = %function_name,
                    "lambda function does not exist yet"
                );
                return Ok(None);
            }
            Err(e) => {
                return Err(anyhow!(
                    "failed to list Lambda versions for '{}': {}",
                    function_name,
                    e
                ));
            }
        };

        for version in response.versions() {
            if let Some(description) = version.description()
                && description == target_description
                && let Some(ver) = version.version()
                && ver != "$LATEST"
            {
                return Ok(Some(ver.to_string()));
            }
        }

        marker = response.next_marker().map(|s| s.to_string());
        if marker.is_none() {
            break;
        }
    }

    Ok(None)
}

/// Deploy the Lambda function and publish a new version.
/// AWS's API is pretty terrible.
///
/// Lambda's version are integer generated by AWS (we don't have control over them).
/// To publish a new version, we need to implement two paths:
/// - If the function doesn't exist yet, `create_function(publish=true)` atomically creates it and
///   publishes a version in one call.
/// - If the function already exists, we first update the code. We do not publish because strangely
///   the API call does not make it possible to change the description. Updating the code has the
///   effect of create a version $LATEST.
/// - We publish the version $LATEST. That's the moment AWS attributes a version number. That call
///   allows us to change the description. We pass the sha256 hash of the code to ensure that
///   $LATEST has not been overwritten by another concurrent update.
async fn deploy_lambda_function(
    client: &LambdaClient,
    function_name: &str,
    deploy_config: &LambdaDeployConfig,
) -> anyhow::Result<String> {
    // This looks overly complicated but this is not AI slop.
    // The AWS API forces us to go through a bunch of hoops to update our function
    // in a safe manner.
    let description = version_description(Some(deploy_config));

    // Fast path: if the function does not exist, we can create and publish the function atomically.
    if let Some(version) =
        try_create_function(client, function_name, deploy_config, &description).await?
    {
        return Ok(version);
    }

    // Function already exists — we need to update the code.
    // This will create or update a version called "$LATEST" (that's the actual string)
    //
    // We cannot directly publish here, because updating the function code does not allow
    // us to pass a different description.
    let code_sha256 = update_function_code(client, function_name).await?;

    // We can now publish that new uploaded version.
    // We pass the code_sha256 guard to make sure a race condition does not cause
    // us to publish a different version.
    //
    // Publishing will create an actual version (a number as a string) and return it.
    publish_version(client, function_name, &code_sha256, &description).await
}

/// Try to create the Lambda function with `publish=true`.
///
/// Returns `Some(version)` if the function was created and published.
/// Returns `None` if the function already exists (`ResourceConflictException`).
async fn try_create_function(
    client: &LambdaClient,
    function_name: &str,
    deploy_config: &LambdaDeployConfig,
    description: &str,
) -> anyhow::Result<Option<String>> {
    let memory_size_mb = deploy_config
        .memory_size
        .as_u64()
        .div_ceil(1024u64 * 1024u64) as i32;
    let timeout_secs = deploy_config.invocation_timeout_secs as i32;

    info!(
        function_name = %function_name,
        memory_size_mb = memory_size_mb,
        timeout_secs = timeout_secs,
        "attempting to create Lambda function"
    );

    let function_code = FunctionCode::builder()
        .zip_file(Blob::new(LAMBDA_BINARY))
        .build();

    let create_result = client
        .create_function()
        .function_name(function_name)
        .runtime(Runtime::Providedal2023)
        .role(&deploy_config.execution_role_arn)
        .handler("bootstrap")
        .description(description)
        .code(function_code)
        .architectures(Architecture::Arm64)
        .memory_size(memory_size_mb)
        .timeout(timeout_secs)
        .environment(build_environment())
        .set_tags(Some(build_tags()))
        .publish(true)
        .send()
        .await;

    match create_result {
        Ok(output) => {
            let version = output
                .version()
                .ok_or_else(|| anyhow!("created function has no version number"))?
                .to_string();
            info!(
                function_name = %function_name,
                version = %version,
                "lambda function created and published"
            );
            Ok(Some(version))
        }
        Err(SdkError::ServiceError(err)) if err.err().is_resource_conflict_exception() => {
            debug!(
                function_name = %function_name,
                "lambda function already exists"
            );
            Ok(None)
        }
        Err(e) => Err(anyhow!(
            "failed to create Lambda function '{}': {}",
            function_name,
            e
        )),
    }
}

/// Update `$LATEST` to our embedded binary.
///
/// Returns the `code_sha256` of the uploaded code, to be used as a guard
/// when publishing the version (detects if another process overwrote `$LATEST`
/// between our update and publish).
async fn update_function_code(
    client: &LambdaClient,
    function_name: &str,
) -> anyhow::Result<String> {
    info!(
        function_name = %function_name,
        "updating Lambda function code to current binary"
    );

    let response = client
        .update_function_code()
        .function_name(function_name)
        .zip_file(Blob::new(LAMBDA_BINARY))
        .architectures(Architecture::Arm64)
        .send()
        .await
        .context("failed to update Lambda function code")?;

    let code_sha256 = response
        .code_sha256()
        .ok_or_else(|| anyhow!("update_function_code response missing code_sha256"))?
        .to_string();

    wait_for_function_ready(client, function_name).await?;

    Ok(code_sha256)
}

/// Publish a new immutable version from `$LATEST` with our description.
///
/// The `code_sha256` parameter guards against races: if another process
/// overwrote `$LATEST` since our `update_function_code` call, AWS will
/// reject the publish.
///
/// Returns the version number (e.g., "8").
async fn publish_version(
    client: &LambdaClient,
    function_name: &str,
    code_sha256: &str,
    description: &str,
) -> anyhow::Result<String> {
    info!(
        function_name = %function_name,
        description = %description,
        "publishing new Lambda version"
    );

    let publish_response = client
        .publish_version()
        .function_name(function_name)
        .description(description)
        .code_sha256(code_sha256)
        .send()
        .await
        .context(
            "failed to publish Lambda version (code_sha256 mismatch means a concurrent deploy \
             race)",
        )?;

    let version = publish_response
        .version()
        .context("published version has no version number")?
        .to_string();

    info!(
        function_name = %function_name,
        version = %version,
        "lambda version published successfully"
    );

    Ok(version)
}

/// Wait for the Lambda function to be ready.
///
/// "Ready" means `State == Active` and no update is in progress
/// (`LastUpdateStatus` is absent or `Successful`).
///
/// This matters because:
/// - After `create_function`: `State` transitions `Pending → Active`
/// - After `update_function_code`: `State` stays `Active` but `LastUpdateStatus` transitions
///   `InProgress → Successful`
async fn wait_for_function_ready(client: &LambdaClient, function_name: &str) -> anyhow::Result<()> {
    const MAX_WAIT_ATTEMPTS: u32 = 30;
    const WAIT_INTERVAL: tokio::time::Duration = tokio::time::Duration::from_secs(1);

    let mut interval = tokio::time::interval(WAIT_INTERVAL);

    for attempt in 0..MAX_WAIT_ATTEMPTS {
        interval.tick().await;

        let response = client
            .get_function()
            .function_name(function_name)
            .send()
            .await
            .context("failed to get function status")?;

        let Some(config) = response.configuration() else {
            continue;
        };

        // Check for terminal failure states.
        if config.state() == Some(&State::Failed) {
            let reason = config.state_reason().unwrap_or("unknown reason");
            anyhow::bail!(
                "lambda function '{}' is in Failed state: {}",
                function_name,
                reason
            );
        }

        let last_update_status: &LastUpdateStatus = config
            .last_update_status()
            .unwrap_or(&LastUpdateStatus::Successful);

        if last_update_status == &LastUpdateStatus::Failed {
            let reason = config
                .last_update_status_reason()
                .unwrap_or("unknown reason");
            anyhow::bail!(
                "lambda function '{}' last update failed: {}",
                function_name,
                reason
            );
        }

        // Ready = Active state with no update in progress.
        let is_active = config.state() == Some(&State::Active);
        if is_active && last_update_status == &LastUpdateStatus::Successful {
            info!(
                function_name = %function_name,
                attempts = attempt + 1,
                "lambda function is ready"
            );
            return Ok(());
        }

        info!(
            function_name = %function_name,
            state = ?config.state(),
            last_update_status = ?config.last_update_status(),
            attempt = attempt + 1,
            "waiting for Lambda function to be ready"
        );
    }

    anyhow::bail!(
        "lambda function '{}' did not become ready within {} seconds",
        function_name,
        MAX_WAIT_ATTEMPTS as u64 * WAIT_INTERVAL.as_secs()
    )
}

/// Garbage collect old Lambda versions, keeping the current + 5 most recent.
async fn garbage_collect_old_versions(
    client: &LambdaClient,
    function_name: &str,
    current_version: &str,
) -> anyhow::Result<()> {
    let mut quickwit_lambda_versions: Vec<(u64, String)> = Vec::new();
    let mut marker: Option<String> = None;

    // Collect all Quickwit-managed versions
    loop {
        let mut request = client
            .list_versions_by_function()
            .function_name(function_name);

        if let Some(m) = marker {
            request = request.marker(m);
        }

        let response = request
            .send()
            .await
            .context("failed to list Lambda versions for garbage collection")?;

        for version in response.versions() {
            let Some(version_str) = version.version() else {
                continue;
            };
            if version_str == "$LATEST" {
                continue;
            }
            // Only consider Quickwit-managed versions
            let Some(description) = version.description() else {
                continue;
            };
            if description.starts_with(VERSION_DESCRIPTION_PREFIX)
                && let Ok(version_num) = version_str.parse::<u64>()
            {
                quickwit_lambda_versions.push((version_num, version_str.to_string()));
            }
        }

        marker = response.next_marker().map(ToString::to_string);
        if marker.is_none() {
            break;
        }
    }

    // Sort by version number ascending (oldest first)
    quickwit_lambda_versions.sort();

    // We keep the last 5 versions.
    quickwit_lambda_versions.truncate(
        quickwit_lambda_versions
            .len()
            .saturating_sub(GC_KEEP_RECENT_VERSIONS),
    );

    if let Some(pos) = quickwit_lambda_versions
        .iter()
        .position(|(_version, version_str)| version_str == current_version)
    {
        quickwit_lambda_versions.swap_remove(pos);
    }

    // Delete old versions
    for (version, version_str) in quickwit_lambda_versions {
        info!(
            function_name = %function_name,
            version = %version_str,
            "deleting old Lambda version"
        );

        if let Err(e) = client
            .delete_function()
            .function_name(function_name)
            .qualifier(&version_str)
            .send()
            .await
        {
            info!(
                function_name = %function_name,
                version = %version,
                error = %e,
                "failed to delete old Lambda version"
            );
        }
    }

    Ok(())
}

/// Build environment variables for the Lambda function.
fn build_environment() -> Environment {
    let mut env_vars = HashMap::new();
    env_vars.insert("RUST_LOG".to_string(), "info".to_string());
    env_vars.insert("RUST_BACKTRACE".to_string(), "1".to_string());
    Environment::builder().set_variables(Some(env_vars)).build()
}

/// Build tags for the Lambda function.
fn build_tags() -> HashMap<String, String> {
    let mut tags = HashMap::new();
    tags.insert("managed_by".to_string(), "quickwit".to_string());
    tags
}

#[cfg(test)]
mod tests {
    use aws_sdk_lambda::operation::create_function::{CreateFunctionError, CreateFunctionOutput};
    use aws_sdk_lambda::operation::delete_function::DeleteFunctionOutput;
    use aws_sdk_lambda::operation::get_function::GetFunctionOutput;
    use aws_sdk_lambda::operation::list_versions_by_function::{
        ListVersionsByFunctionError, ListVersionsByFunctionOutput,
    };
    use aws_sdk_lambda::operation::publish_version::PublishVersionOutput;
    use aws_sdk_lambda::operation::update_function_code::UpdateFunctionCodeOutput;
    use aws_sdk_lambda::types::FunctionConfiguration;
    use aws_sdk_lambda::types::error::{ResourceConflictException, ResourceNotFoundException};
    use aws_smithy_mocks::{RuleMode, mock, mock_client};
    use bytesize::ByteSize;

    use super::*;

    fn make_version(version: &str, description: &str) -> FunctionConfiguration {
        FunctionConfiguration::builder()
            .version(version)
            .description(description)
            .build()
    }

    fn test_deploy_config() -> LambdaDeployConfig {
        LambdaDeployConfig {
            execution_role_arn: "arn:aws:iam::123456789:role/test-role".to_string(),
            memory_size: ByteSize::gib(5),
            invocation_timeout_secs: 60,
        }
    }

    fn test_description() -> String {
        version_description(None)
    }

    #[test]
    fn test_version_description() {
        let lambda_deploy_config = test_deploy_config();
        let description = version_description(Some(&lambda_deploy_config));
        assert!(description.ends_with("_60s_6c3b2"));
        let description = version_description(None);
        assert!(description.ends_with("_nodeploy"));
    }

    // --- find_matching_version tests ---

    #[tokio::test]
    async fn test_find_matching_version_found() {
        let target = "quickwit:test_version";
        let rule = mock!(aws_sdk_lambda::Client::list_versions_by_function).then_output(|| {
            ListVersionsByFunctionOutput::builder()
                .versions(make_version("$LATEST", ""))
                .versions(make_version("1", "quickwit:old_version"))
                .versions(make_version("7", "quickwit:test_version"))
                .build()
        });
        let client = mock_client!(aws_sdk_lambda, [&rule]);

        let matching_version_opt = find_matching_version(&client, "my-fn", target)
            .await
            .unwrap();
        assert_eq!(matching_version_opt, Some("7".to_string()));
    }

    #[tokio::test]
    async fn test_find_matching_version_not_found() {
        let rule = mock!(aws_sdk_lambda::Client::list_versions_by_function).then_output(|| {
            ListVersionsByFunctionOutput::builder()
                .versions(make_version("$LATEST", ""))
                .versions(make_version("1", "quickwit:other"))
                .build()
        });
        let client = mock_client!(aws_sdk_lambda, [&rule]);

        let result = find_matching_version(&client, "my-fn", "quickwit:no_match")
            .await
            .unwrap();
        assert_eq!(result, None);
    }

    #[tokio::test]
    async fn test_find_matching_version_function_does_not_exist() {
        let rule = mock!(aws_sdk_lambda::Client::list_versions_by_function).then_error(|| {
            ListVersionsByFunctionError::ResourceNotFoundException(
                ResourceNotFoundException::builder().build(),
            )
        });
        let client = mock_client!(aws_sdk_lambda, [&rule]);

        let result = find_matching_version(&client, "no-such-fn", "quickwit:x")
            .await
            .unwrap();
        assert_eq!(result, None);
    }

    #[tokio::test]
    async fn test_find_matching_version_skips_latest_even_if_description_matches() {
        let rule = mock!(aws_sdk_lambda::Client::list_versions_by_function).then_output(|| {
            ListVersionsByFunctionOutput::builder()
                .versions(make_version("$LATEST", "quickwit:match"))
                .build()
        });
        let client = mock_client!(aws_sdk_lambda, [&rule]);

        let result = find_matching_version(&client, "my-fn", "quickwit:match")
            .await
            .unwrap();
        assert_eq!(result, None);
    }

    // --- try_create_function tests ---

    #[tokio::test]
    async fn test_try_create_function_success() {
        let rule = mock!(aws_sdk_lambda::Client::create_function).then_output(|| {
            CreateFunctionOutput::builder()
                .version("1")
                .function_name("my-fn")
                .build()
        });
        let client = mock_client!(aws_sdk_lambda, [&rule]);
        let config = test_deploy_config();

        let result = try_create_function(&client, "my-fn", &config, &test_description())
            .await
            .unwrap();
        assert_eq!(result, Some("1".to_string()));
    }

    #[tokio::test]
    async fn test_try_create_function_already_exists() {
        let rule = mock!(aws_sdk_lambda::Client::create_function).then_error(|| {
            CreateFunctionError::ResourceConflictException(
                ResourceConflictException::builder().build(),
            )
        });
        let client = mock_client!(aws_sdk_lambda, [&rule]);
        let config = test_deploy_config();

        let result = try_create_function(&client, "my-fn", &config, &test_description())
            .await
            .unwrap();
        assert_eq!(result, None);
    }

    // --- deploy (update path) tests ---

    #[tokio::test]
    async fn test_deploy_update_path() {
        // create_function → conflict (function exists)
        let create_rule = mock!(aws_sdk_lambda::Client::create_function).then_error(|| {
            CreateFunctionError::ResourceConflictException(
                ResourceConflictException::builder().build(),
            )
        });
        // update_function_code → success with code_sha256
        let update_rule = mock!(aws_sdk_lambda::Client::update_function_code).then_output(|| {
            UpdateFunctionCodeOutput::builder()
                .code_sha256("abc123hash")
                .build()
        });
        // get_function → active and ready (for wait_for_function_ready)
        let get_rule = mock!(aws_sdk_lambda::Client::get_function).then_output(|| {
            GetFunctionOutput::builder()
                .configuration(
                    FunctionConfiguration::builder()
                        .state(State::Active)
                        .last_update_status(LastUpdateStatus::Successful)
                        .build(),
                )
                .build()
        });
        // publish_version → success
        let publish_rule = mock!(aws_sdk_lambda::Client::publish_version)
            .then_output(|| PublishVersionOutput::builder().version("8").build());

        let client = mock_client!(
            aws_sdk_lambda,
            RuleMode::MatchAny,
            [&create_rule, &update_rule, &get_rule, &publish_rule]
        );
        let config = test_deploy_config();

        tokio::time::pause();
        let version = deploy_lambda_function(&client, "my-fn", &config)
            .await
            .unwrap();
        assert_eq!(version, "8");
    }

    // --- wait_for_function_ready tests ---

    #[tokio::test]
    async fn test_wait_for_function_ready_immediate() {
        let rule = mock!(aws_sdk_lambda::Client::get_function).then_output(|| {
            GetFunctionOutput::builder()
                .configuration(
                    FunctionConfiguration::builder()
                        .state(State::Active)
                        .last_update_status(LastUpdateStatus::Successful)
                        .build(),
                )
                .build()
        });
        let client = mock_client!(aws_sdk_lambda, [&rule]);

        tokio::time::pause();
        wait_for_function_ready(&client, "my-fn").await.unwrap();
    }

    #[tokio::test]
    async fn test_wait_for_function_ready_after_update_in_progress() {
        let rule = mock!(aws_sdk_lambda::Client::get_function)
            .sequence()
            .output(|| {
                GetFunctionOutput::builder()
                    .configuration(
                        FunctionConfiguration::builder()
                            .state(State::Active)
                            .last_update_status(LastUpdateStatus::InProgress)
                            .build(),
                    )
                    .build()
            })
            .output(|| {
                GetFunctionOutput::builder()
                    .configuration(
                        FunctionConfiguration::builder()
                            .state(State::Active)
                            .last_update_status(LastUpdateStatus::Successful)
                            .build(),
                    )
                    .build()
            })
            .build();
        let client = mock_client!(aws_sdk_lambda, RuleMode::Sequential, [&rule]);

        tokio::time::pause();
        wait_for_function_ready(&client, "my-fn").await.unwrap();
        assert_eq!(rule.num_calls(), 2);
    }

    #[tokio::test]
    async fn test_wait_for_function_ready_fails_on_failed_state() {
        let rule = mock!(aws_sdk_lambda::Client::get_function).then_output(|| {
            GetFunctionOutput::builder()
                .configuration(
                    FunctionConfiguration::builder()
                        .state(State::Failed)
                        .state_reason("Something broke")
                        .build(),
                )
                .build()
        });
        let client = mock_client!(aws_sdk_lambda, [&rule]);

        tokio::time::pause();
        let err = wait_for_function_ready(&client, "my-fn").await.unwrap_err();
        assert!(
            err.to_string().contains("Failed state"),
            "unexpected error: {}",
            err
        );
    }

    #[tokio::test]
    async fn test_wait_for_function_ready_fails_on_last_update_failed() {
        let rule = mock!(aws_sdk_lambda::Client::get_function).then_output(|| {
            GetFunctionOutput::builder()
                .configuration(
                    FunctionConfiguration::builder()
                        .state(State::Active)
                        .last_update_status(LastUpdateStatus::Failed)
                        .last_update_status_reason("Update broke")
                        .build(),
                )
                .build()
        });
        let client = mock_client!(aws_sdk_lambda, [&rule]);

        tokio::time::pause();
        let err = wait_for_function_ready(&client, "my-fn").await.unwrap_err();
        assert!(
            err.to_string().contains("last update failed"),
            "unexpected error: {}",
            err
        );
    }

    // --- garbage_collect_old_versions tests ---

    #[tokio::test]
    async fn test_gc_deletes_old_versions_keeps_recent() {
        // 8 quickwit versions (1..=8) + $LATEST + one non-quickwit version
        let list_rule =
            mock!(aws_sdk_lambda::Client::list_versions_by_function).then_output(|| {
                let mut builder = ListVersionsByFunctionOutput::builder()
                    .versions(make_version("$LATEST", ""))
                    .versions(make_version("99", "not-quickwit"));
                for i in 1..=8 {
                    builder = builder
                        .versions(make_version(&i.to_string(), &format!("quickwit:ver_{}", i)));
                }
                builder.build()
            });

        let delete_rule = mock!(aws_sdk_lambda::Client::delete_function)
            .then_output(|| DeleteFunctionOutput::builder().build());

        let client = mock_client!(
            aws_sdk_lambda,
            RuleMode::MatchAny,
            [&list_rule, &delete_rule]
        );

        // Current version is "7", so keep 7 + the 5 most recent (4,5,6,7,8).
        // Should delete versions 1, 2, 3.
        garbage_collect_old_versions(&client, "my-fn", "7")
            .await
            .unwrap();

        assert_eq!(delete_rule.num_calls(), 3);
    }

    #[tokio::test]
    async fn test_gc_nothing_to_delete() {
        // Only 3 quickwit versions — below the GC_KEEP_RECENT_VERSIONS threshold.
        let list_rule =
            mock!(aws_sdk_lambda::Client::list_versions_by_function).then_output(|| {
                ListVersionsByFunctionOutput::builder()
                    .versions(make_version("$LATEST", ""))
                    .versions(make_version("1", "quickwit:v1"))
                    .versions(make_version("2", "quickwit:v2"))
                    .versions(make_version("3", "quickwit:v3"))
                    .build()
            });

        let delete_rule = mock!(aws_sdk_lambda::Client::delete_function)
            .then_output(|| DeleteFunctionOutput::builder().build());

        let client = mock_client!(
            aws_sdk_lambda,
            RuleMode::MatchAny,
            [&list_rule, &delete_rule]
        );

        garbage_collect_old_versions(&client, "my-fn", "3")
            .await
            .unwrap();

        assert_eq!(delete_rule.num_calls(), 0);
    }

    #[tokio::test]
    async fn test_gc_does_not_delete_current_version() {
        // 7 quickwit versions, current is "1" (the oldest).
        // Without the current-version guard, version 1 would be deleted.
        let list_rule =
            mock!(aws_sdk_lambda::Client::list_versions_by_function).then_output(|| {
                let mut builder =
                    ListVersionsByFunctionOutput::builder().versions(make_version("$LATEST", ""));
                for i in 1..=7 {
                    builder = builder
                        .versions(make_version(&i.to_string(), &format!("quickwit:ver_{}", i)));
                }
                builder.build()
            });

        let delete_rule = mock!(aws_sdk_lambda::Client::delete_function)
            .then_output(|| DeleteFunctionOutput::builder().build());

        let client = mock_client!(
            aws_sdk_lambda,
            RuleMode::MatchAny,
            [&list_rule, &delete_rule]
        );

        // Current version is "1". Without guard: would delete 1,2. With guard: only deletes 2.
        garbage_collect_old_versions(&client, "my-fn", "1")
            .await
            .unwrap();

        assert_eq!(delete_rule.num_calls(), 1);
    }
}


================================================
FILE: quickwit/quickwit-lambda-client/src/invoker.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::time::Duration;

use anyhow::Context as _;
use async_trait::async_trait;
use aws_sdk_lambda::Client as LambdaClient;
use aws_sdk_lambda::error::{DisplayErrorContext, SdkError};
use aws_sdk_lambda::operation::invoke::InvokeError;
use aws_sdk_lambda::primitives::Blob;
use aws_sdk_lambda::types::InvocationType;
use base64::prelude::*;
use prost::Message;
use quickwit_common::retry::RetryParams;
use quickwit_lambda_server::{LambdaSearchRequestPayload, LambdaSearchResponsePayload};
use quickwit_proto::search::{LambdaSearchResponses, LambdaSingleSplitResult, LeafSearchRequest};
use quickwit_search::{LambdaLeafSearchInvoker, SearchError};
use tracing::{debug, info, instrument, warn};

use crate::metrics::LAMBDA_METRICS;

/// Upper bound on the retry-after hint we will honor from Lambda rate-limit responses.
const MAX_RETRY_AFTER: Duration = Duration::from_secs(10);

/// Richer error type used internally by the invoker so that rate-limit retry-after hints
/// are not lost before the retry loop can consume them.
enum LambdaInvokeError {
    /// Lambda returned a throttling error. The optional duration is the `Retry-After` hint
    /// provided by Lambda; `None` means no hint was present.
    RateLimited(Option<Duration>),
    /// The invocation timed out.
    Timeout(String),
    /// A non-retryable error.
    Permanent(SearchError),
}

impl LambdaInvokeError {
    fn into_search_error(self) -> SearchError {
        match self {
            Self::RateLimited(_) => SearchError::TooManyRequests,
            Self::Timeout(msg) => SearchError::Timeout(msg),
            Self::Permanent(err) => err,
        }
    }
}

impl From<SearchError> for LambdaInvokeError {
    fn from(err: SearchError) -> Self {
        LambdaInvokeError::Permanent(err)
    }
}

fn invoke_error_to_lambda_error(error: SdkError<InvokeError>) -> LambdaInvokeError {
    if let SdkError::ServiceError(ref service_error) = error {
        match service_error.err() {
            InvokeError::TooManyRequestsException(exc) => {
                let retry_after = exc
                    .retry_after_seconds()
                    .and_then(|raw| raw.parse::<f64>().ok())
                    .filter(|secs| secs.is_finite() && *secs > 0.0)
                    .map(|secs| Duration::from_secs_f64(secs).min(MAX_RETRY_AFTER));
                return LambdaInvokeError::RateLimited(retry_after);
            }
            InvokeError::EniLimitReachedException(_)
            | InvokeError::SubnetIpAddressLimitReachedException(_)
            | InvokeError::Ec2ThrottledException(_)
            | InvokeError::ResourceConflictException(_) => {
                return LambdaInvokeError::RateLimited(None);
            }
            _ => {}
        }
    }

    let is_timeout = match &error {
        SdkError::TimeoutError(_) => true,
        SdkError::DispatchFailure(failure) => failure.is_timeout(),
        SdkError::ServiceError(service_error) => matches!(
            service_error.err(),
            InvokeError::EfsMountTimeoutException(_) | InvokeError::SnapStartTimeoutException(_)
        ),
        _ => false,
    };

    let error_msg = format!("lambda invocation failed: {}", DisplayErrorContext(&error));

    if is_timeout {
        LambdaInvokeError::Timeout(error_msg)
    } else {
        LambdaInvokeError::Permanent(SearchError::Internal(error_msg))
    }
}

/// Create a Lambda invoker for a specific version.
///
/// The version number is used as the qualifier when invoking, ensuring we call
/// the exact published version (not $LATEST).
pub(crate) async fn create_lambda_invoker_for_version(
    function_name: String,
    version: String,
) -> anyhow::Result<AwsLambdaInvoker> {
    let aws_config = aws_config::load_defaults(aws_config::BehaviorVersion::latest()).await;
    let client = LambdaClient::new(&aws_config);
    let invoker = AwsLambdaInvoker {
        client,
        function_name,
        version,
    };
    invoker.validate().await?;
    Ok(invoker)
}

/// AWS Lambda implementation of RemoteFunctionInvoker.
pub(crate) struct AwsLambdaInvoker {
    client: LambdaClient,
    function_name: String,
    /// The version number to invoke (e.g., "7", "12").
    version: String,
}

impl AwsLambdaInvoker {
    /// Validate that the Lambda function version exists and is invocable.
    /// Uses DryRun invocation type - validates without executing.
    async fn validate(&self) -> anyhow::Result<()> {
        info!("lambda invoker dry run");
        let request = self
            .client
            .invoke()
            .function_name(&self.function_name)
            .qualifier(&self.version)
            .invocation_type(InvocationType::DryRun);

        request.send().await.with_context(|| {
            format!(
                "failed to validate Lambda function '{}:{}'",
                self.function_name, self.version
            )
        })?;

        info!("the lambda invoker dry run was successful");
        Ok(())
    }
}

/// Retry parameters used for exponential backoff when no `Retry-After` hint is available.
const LAMBDA_RETRY_PARAMS: RetryParams = RetryParams {
    base_delay: Duration::from_secs(1),
    max_delay: Duration::from_secs(10),
    max_attempts: 3,
};

#[async_trait]
impl LambdaLeafSearchInvoker for AwsLambdaInvoker {
    #[instrument(skip(self, request), fields(function_name = %self.function_name, version = %self.version))]
    async fn invoke_leaf_search(
        &self,
        request: LeafSearchRequest,
    ) -> Result<Vec<LambdaSingleSplitResult>, SearchError> {
        let start = std::time::Instant::now();
        let result = self.invoke_leaf_search_with_retry(request).await;
        let elapsed = start.elapsed().as_secs_f64();
        let status = if result.is_ok() { "success" } else { "error" };
        LAMBDA_METRICS
            .leaf_search_requests_total
            .with_label_values([status])
            .inc();
        LAMBDA_METRICS
            .leaf_search_duration_seconds
            .with_label_values([status])
            .observe(elapsed);
        result
    }
}

impl AwsLambdaInvoker {
    async fn invoke_leaf_search_with_retry(
        &self,
        request: LeafSearchRequest,
    ) -> Result<Vec<LambdaSingleSplitResult>, SearchError> {
        let mut error = match self.invoke_leaf_search_once(request.clone()).await {
            Ok(results) => return Ok(results),
            Err(error) => error,
        };

        for num_attempts in 1..LAMBDA_RETRY_PARAMS.max_attempts {
            // Determine whether to retry and how long to wait.
            let delay = match &error {
                LambdaInvokeError::RateLimited(retry_after) => {
                    retry_after.unwrap_or_else(|| LAMBDA_RETRY_PARAMS.compute_delay(num_attempts))
                }
                LambdaInvokeError::Timeout(_) => LAMBDA_RETRY_PARAMS.compute_delay(num_attempts),
                LambdaInvokeError::Permanent(_) => return Err(error.into_search_error()),
            };

            warn!(
                num_attempts = num_attempts,
                delay_ms = delay.as_millis(),
                "lambda invocation failed, retrying"
            );
            tokio::time::sleep(delay).await;

            match self.invoke_leaf_search_once(request.clone()).await {
                Ok(results) => return Ok(results),
                Err(e) => error = e,
            };
        }

        Err(error.into_search_error())
    }

    async fn invoke_leaf_search_once(
        &self,
        request: LeafSearchRequest,
    ) -> Result<Vec<LambdaSingleSplitResult>, LambdaInvokeError> {
        // Serialize request to protobuf bytes, then base64 encode
        let request_bytes = request.encode_to_vec();
        let payload = LambdaSearchRequestPayload {
            payload: BASE64_STANDARD.encode(&request_bytes),
        };

        let payload_json = serde_json::to_vec(&payload)
            .map_err(|e| SearchError::Internal(format!("JSON serialization error: {}", e)))?;

        LAMBDA_METRICS
            .leaf_search_request_payload_size_bytes
            .observe(payload_json.len() as f64);

        debug!(
            payload_size = payload_json.len(),
            version = %self.version,
            "invoking Lambda function"
        );

        // Invoke the specific version
        let invoke_builder = self
            .client
            .invoke()
            .function_name(&self.function_name)
            .qualifier(&self.version)
            .invocation_type(InvocationType::RequestResponse)
            .payload(Blob::new(payload_json));

        let response = invoke_builder
            .send()
            .await
            .map_err(invoke_error_to_lambda_error)?;

        // Check for function error
        if let Some(error) = response.function_error() {
            let error_payload = response
                .payload()
                .map(|b| String::from_utf8_lossy(b.as_ref()).to_string())
                .unwrap_or_default();
            return Err(SearchError::Internal(format!(
                "lambda function error: {}: {}",
                error, error_payload
            ))
            .into());
        }

        // Deserialize response
        let response_payload = response
            .payload()
            .ok_or_else(|| SearchError::Internal("no response payload from Lambda".into()))?;

        LAMBDA_METRICS
            .leaf_search_response_payload_size_bytes
            .observe(response_payload.as_ref().len() as f64);

        let lambda_response: LambdaSearchResponsePayload =
            serde_json::from_slice(response_payload.as_ref())
                .map_err(|e| SearchError::Internal(format!("json deserialization error: {}", e)))?;

        let response_bytes = BASE64_STANDARD
            .decode(&lambda_response.payload)
            .map_err(|e| SearchError::Internal(format!("base64 decode error: {}", e)))?;

        let leaf_responses = LambdaSearchResponses::decode(&response_bytes[..])
            .map_err(|e| SearchError::Internal(format!("protobuf decode error: {}", e)))?;

        debug!(
            num_results = leaf_responses.split_results.len(),
            "lambda invocation completed"
        );

        Ok(leaf_responses.split_results)
    }
}


================================================
FILE: quickwit/quickwit-lambda-client/src/lib.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

//! AWS Lambda client for Quickwit leaf search operations.
//!
//! This crate provides:
//! - An AWS Lambda implementation of the `LambdaLeafSearchInvoker` trait used by `quickwit-search`
//! - Auto-deployment functionality for Lambda functions
//!
//! # Usage
//!
//! Use `try_get_or_deploy_invoker` to get an invoker that will automatically deploy
//! the Lambda function if needed:
//!
//! ```ignore
//! let invoker = try_get_or_deploy_invoker(&function_name, &deploy_config).await?;
//! ```

mod deploy;
mod invoker;
mod metrics;

pub use deploy::try_get_or_deploy_invoker;
pub use metrics::LAMBDA_METRICS;
// Re-export payload types from server crate for convenience
pub use quickwit_lambda_server::{LambdaSearchRequestPayload, LambdaSearchResponsePayload};


================================================
FILE: quickwit/quickwit-lambda-client/src/metrics.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

// See https://prometheus.io/docs/practices/naming/

use once_cell::sync::Lazy;
use quickwit_common::metrics::{
    Histogram, HistogramVec, IntCounterVec, exponential_buckets, new_counter_vec, new_histogram,
    new_histogram_vec,
};

/// From 100ms to 73s seconds
fn duration_buckets() -> Vec<f64> {
    exponential_buckets(0.100, 3f64.sqrt(), 13).unwrap()
}

/// From 1KB to 16MB
fn payload_size_buckets() -> Vec<f64> {
    exponential_buckets(1024.0, 4.0, 8).unwrap()
}

pub struct LambdaMetrics {
    pub leaf_search_requests_total: IntCounterVec<1>,
    pub leaf_search_duration_seconds: HistogramVec<1>,
    pub leaf_search_request_payload_size_bytes: Histogram,
    pub leaf_search_response_payload_size_bytes: Histogram,
}

impl Default for LambdaMetrics {
    fn default() -> Self {
        LambdaMetrics {
            leaf_search_requests_total: new_counter_vec(
                "leaf_search_requests_total",
                "Total number of Lambda leaf search invocations.",
                "lambda",
                &[],
                ["status"],
            ),
            leaf_search_duration_seconds: new_histogram_vec(
                "leaf_search_duration_seconds",
                "Duration of Lambda leaf search invocations in seconds.",
                "lambda",
                &[],
                ["status"],
                duration_buckets(),
            ),
            leaf_search_request_payload_size_bytes: new_histogram(
                "leaf_search_request_payload_size_bytes",
                "Size of the request payload sent to Lambda in bytes.",
                "lambda",
                payload_size_buckets(),
            ),
            leaf_search_response_payload_size_bytes: new_histogram(
                "leaf_search_response_payload_size_bytes",
                "Size of the response payload received from Lambda in bytes.",
                "lambda",
                payload_size_buckets(),
            ),
        }
    }
}

pub static LAMBDA_METRICS: Lazy<LambdaMetrics> = Lazy::new(LambdaMetrics::default);


================================================
FILE: quickwit/quickwit-lambda-server/Cargo.toml
================================================
[package]
name = "quickwit-lambda-server"
description = "AWS Lambda handler for Quickwit leaf search"

version.workspace = true
edition.workspace = true
homepage.workspace = true
documentation.workspace = true
repository.workspace = true
authors.workspace = true
license.workspace = true

[package.metadata.cargo-machete]
# Its here even though it is not useful, in order to enable its "vendor" feature,
# allowing the cross-build.
ignored = ["openssl"]

[dependencies]
anyhow = { workspace = true }
base64 = { workspace = true }
bytesize = { workspace = true }
lambda_runtime = { workspace = true }
prost = { workspace = true }
serde = { workspace = true }
serde_json = { workspace = true }
thiserror = { workspace = true }
tokio = { workspace = true }
tracing = { workspace = true }
tracing-subscriber = { workspace = true, features = ["env-filter", "json"] }

openssl = { workspace = true, optional = true }

quickwit-common = { workspace = true }
quickwit-config = { workspace = true }
quickwit-doc-mapper = { workspace = true }
quickwit-proto = { workspace = true }
quickwit-search = { workspace = true }
quickwit-storage = { workspace = true }

[[bin]]
name = "quickwit-aws-lambda-leaf-search"
path = "src/bin/leaf_search.rs"

[features]
default = []
testsuite = []

# Keep this in sync with quickwit-cli!
lambda-release = [
    # The vendored OpenSSL will be compiled from source during the
    # build, avoiding the pkg-config dependency issue during
    # cross-compilation.
    "openssl/vendored",
]


================================================
FILE: quickwit/quickwit-lambda-server/src/bin/leaf_search.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

//! AWS Lambda binary entry point for Quickwit leaf search.

use std::sync::Arc;

use lambda_runtime::{Error, LambdaEvent, service_fn};
use quickwit_lambda_server::{
    LambdaSearchRequestPayload, LambdaSearcherContext, handle_leaf_search,
};
use tracing::info;
use tracing_subscriber::EnvFilter;

#[tokio::main]
async fn main() -> Result<(), Error> {
    // Initialize tracing with JSON output for CloudWatch
    tracing_subscriber::fmt()
        .with_env_filter(EnvFilter::from_default_env())
        .json()
        .init();

    // Initialize context on cold start (wrapped in Arc for sharing across invocations)
    let context = Arc::new(LambdaSearcherContext::try_from_env()?);

    info!("lambda context initialized, starting handler loop");

    // Run the Lambda handler
    lambda_runtime::run(service_fn(
        |event: LambdaEvent<LambdaSearchRequestPayload>| {
            let ctx = Arc::clone(&context);
            async move {
                let (payload, _event_ctx) = event.into_parts();
                handle_leaf_search(payload, &ctx)
                    .await
                    .map_err(|e| lambda_runtime::Error::from(e.to_string()))
            }
        },
    ))
    .await
}


================================================
FILE: quickwit/quickwit-lambda-server/src/context.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::sync::Arc;

use anyhow::Context as _;
use bytesize::ByteSize;
use quickwit_config::{CacheConfig, SearcherConfig};
use quickwit_search::SearcherContext;
use quickwit_storage::StorageResolver;
use tracing::info;

/// Lambda-specific searcher context that holds resources for search execution.
pub struct LambdaSearcherContext {
    pub searcher_context: Arc<SearcherContext>,
    pub storage_resolver: StorageResolver,
}

impl LambdaSearcherContext {
    /// Create a new Lambda searcher context from environment variables.
    pub fn try_from_env() -> anyhow::Result<Self> {
        info!("initializing lambda searcher context");

        let searcher_config = try_searcher_config_from_env()?;
        let searcher_context =
            Arc::new(SearcherContext::new_without_invoker(searcher_config, None));
        let storage_resolver = StorageResolver::configured(&Default::default());

        Ok(Self {
            searcher_context,
            storage_resolver,
        })
    }
}

/// Create a Lambda-optimized searcher config based on the `AWS_LAMBDA_FUNCTION_MEMORY_SIZE`
/// environment variable.
fn try_searcher_config_from_env() -> anyhow::Result<SearcherConfig> {
    let lambda_memory_mib: u64 = quickwit_common::get_from_env_opt(
        "AWS_LAMBDA_FUNCTION_MEMORY_SIZE",
        /* sensitive */ false,
    )
    .context("could not get aws lambda function memory size from ENV")?;
    let lambda_memory = ByteSize::mib(lambda_memory_mib);
    anyhow::ensure!(
        lambda_memory >= ByteSize::gib(1u64),
        "lambda memory must be at least 1GB"
    );
    let warmup_memory_budget = ByteSize::b(lambda_memory.as_u64() - ByteSize::mib(500).as_u64());

    let mut searcher_config = SearcherConfig::default();
    searcher_config.max_num_concurrent_split_searches = 20;
    searcher_config.warmup_memory_budget = warmup_memory_budget;
    searcher_config.fast_field_cache = CacheConfig::no_cache();
    searcher_config.split_footer_cache = CacheConfig::no_cache();
    searcher_config.predicate_cache = CacheConfig::no_cache();
    searcher_config.partial_request_cache = CacheConfig::no_cache();
    Ok(searcher_config)
}


================================================
FILE: quickwit/quickwit-lambda-server/src/error.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use quickwit_search::SearchError;
use thiserror::Error;

/// Result type for Lambda operations.
pub type LambdaResult<T> = Result<T, LambdaError>;

/// Errors that can occur during Lambda handler operations.
#[derive(Debug, Error)]
pub enum LambdaError {
    /// Error serializing/deserializing protobuf.
    #[error("serialization error: {0}")]
    Serialization(String),
    /// Error from the search operation.
    #[error("search error: {0}")]
    Search(#[from] SearchError),
    /// Internal error.
    #[error("internal error: {0}")]
    Internal(String),
    /// Task was cancelled.
    #[error("cancelled")]
    Cancelled,
}

impl From<prost::DecodeError> for LambdaError {
    fn from(err: prost::DecodeError) -> Self {
        LambdaError::Serialization(format!("protobuf decode error: {}", err))
    }
}

impl From<prost::EncodeError> for LambdaError {
    fn from(err: prost::EncodeError) -> Self {
        LambdaError::Serialization(format!("protobuf encode error: {}", err))
    }
}

impl From<base64::DecodeError> for LambdaError {
    fn from(err: base64::DecodeError) -> Self {
        LambdaError::Serialization(format!("base64 decode error: {}", err))
    }
}

impl From<serde_json::Error> for LambdaError {
    fn from(err: serde_json::Error) -> Self {
        LambdaError::Serialization(format!("json error: {}", err))
    }
}

impl From<LambdaError> for SearchError {
    fn from(err: LambdaError) -> Self {
        match err {
            LambdaError::Search(search_err) => search_err,
            other => SearchError::Internal(other.to_string()),
        }
    }
}


================================================
FILE: quickwit/quickwit-lambda-server/src/handler.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::str::FromStr;
use std::sync::Arc;

use base64::prelude::*;
use prost::Message;
use quickwit_common::uri::Uri;
use quickwit_doc_mapper::DocMapper;
use quickwit_proto::search::lambda_single_split_result::Outcome;
use quickwit_proto::search::{
    LambdaSearchResponses, LambdaSingleSplitResult, LeafRequestRef, LeafSearchRequest,
    SearchRequest,
};
use quickwit_search::leaf::single_doc_mapping_leaf_search;
use quickwit_storage::Storage;
use serde::{Deserialize, Serialize};
use tracing::{error, info, instrument, warn};

use crate::context::LambdaSearcherContext;
use crate::error::{LambdaError, LambdaResult};

/// Payload for leaf search Lambda invocation.
#[derive(Debug, Serialize, Deserialize)]
pub struct LambdaSearchRequestPayload {
    /// Base64-encoded serialized LeafSearchRequest protobuf.
    pub payload: String,
}

/// Response from leaf search Lambda invocation.
#[derive(Debug, Serialize, Deserialize)]
pub struct LambdaSearchResponsePayload {
    /// Base64-encoded serialized `LambdaSearchResponses` protobuf (one per split).
    pub payload: String,
}

/// Handle a leaf search request in Lambda.
///
/// Returns one `LambdaSingleSplitResult` per split, each tagged with its
/// split_id. Individual split failures are reported per-split rather than
/// failing the entire invocation, so the caller can retry only failed splits.
#[instrument(skip(ctx), fields(request_id))]
pub async fn handle_leaf_search(
    event: LambdaSearchRequestPayload,
    ctx: &LambdaSearcherContext,
) -> LambdaResult<LambdaSearchResponsePayload> {
    // Decode base64 payload
    let request_bytes: Vec<u8> = BASE64_STANDARD
        .decode(&event.payload)
        .map_err(|err| LambdaError::Serialization(format!("base64 decode error: {}", err)))?;

    // Deserialize LeafSearchRequest
    let leaf_search_request = LeafSearchRequest::decode(&request_bytes[..])?;

    // Unpack the shared fields once instead of cloning per split.
    let search_request: Arc<SearchRequest> = leaf_search_request
        .search_request
        .ok_or_else(|| LambdaError::Internal("no search request".to_string()))?
        .into();

    let doc_mappers: Vec<Arc<DocMapper>> = leaf_search_request
        .doc_mappers
        .iter()
        .map(String::as_str)
        .map(serde_json::from_str::<Arc<DocMapper>>)
        .collect::<Result<Vec<_>, _>>()
        .map_err(|err| {
            LambdaError::Internal(format!("failed to deserialize doc mapper: `{err}`"))
        })?;

    // Resolve storage for every index URI upfront.
    let mut storages: Vec<Arc<dyn quickwit_storage::Storage>> =
        Vec::with_capacity(leaf_search_request.index_uris.len());
    for uri_str in &leaf_search_request.index_uris {
        let uri = Uri::from_str(uri_str)
            .map_err(|err| LambdaError::Internal(format!("invalid index uri: {err}")))?;
        let storage =
            ctx.storage_resolver.resolve(&uri).await.map_err(|err| {
                LambdaError::Internal(format!("failed to resolve storage: {err}"))
            })?;
        storages.push(storage);
    }

    let split_results: Vec<LambdaSingleSplitResult> = lambda_leaf_search(
        search_request,
        leaf_search_request.leaf_requests,
        &doc_mappers[..],
        &storages[..],
        ctx,
    )
    .await?;
    let wrapper = LambdaSearchResponses { split_results };
    let response_bytes = wrapper.encode_to_vec();
    let payload = BASE64_STANDARD.encode(&response_bytes);

    Ok(LambdaSearchResponsePayload { payload })
}

/// Lambda leaf search returns individual split results.
async fn lambda_leaf_search(
    search_request: Arc<SearchRequest>,
    leaf_req_ref: Vec<LeafRequestRef>,
    doc_mappers: &[Arc<DocMapper>],
    storages: &[Arc<dyn Storage>],
    ctx: &LambdaSearcherContext,
) -> LambdaResult<Vec<LambdaSingleSplitResult>> {
    // Flatten leaf_requests into per-split tasks using pre-resolved Arc references.
    let mut split_search_joinset: tokio::task::JoinSet<(String, Result<_, String>)> =
        tokio::task::JoinSet::new();

    for leaf_req in leaf_req_ref {
        let doc_mapper = doc_mappers
            .get(leaf_req.doc_mapper_ord as usize)
            .ok_or_else(|| {
                LambdaError::Internal(format!(
                    "doc_mapper_ord out of bounds: {}",
                    leaf_req.doc_mapper_ord
                ))
            })?
            .clone();
        let storage = storages[leaf_req.index_uri_ord as usize].clone();

        for split_id_and_footer_offsets in leaf_req.split_offsets {
            let split_id = split_id_and_footer_offsets.split_id.clone();
            let searcher_context = ctx.searcher_context.clone();
            let search_request = search_request.clone();
            let doc_mapper = doc_mapper.clone();
            let storage = storage.clone();
            let split = split_id_and_footer_offsets.clone();
            split_search_joinset.spawn(async move {
                let result = single_doc_mapping_leaf_search(
                    searcher_context,
                    search_request,
                    storage,
                    vec![split],
                    doc_mapper,
                )
                .await
                .map_err(|err| format!("{err}"));
                (split_id, result)
            });
        }
    }

    let num_splits = split_search_joinset.len();
    info!(num_splits, "processing leaf search request (per-split)");

    // Collect results. Order is irrelevant: each result is tagged with its split_id.
    let mut split_results: Vec<LambdaSingleSplitResult> = Vec::with_capacity(num_splits);
    let mut num_successes: usize = 0;
    let mut num_failures: usize = 0;
    while let Some(join_result) = split_search_joinset.join_next().await {
        match join_result {
            Ok((split_id, Ok(response))) => {
                num_successes += 1;
                split_results.push(LambdaSingleSplitResult {
                    split_id,
                    outcome: Some(Outcome::Response(response)),
                });
            }
            Ok((split_id, Err(error_msg))) => {
                num_failures += 1;
                warn!(split_id = %split_id, error = %error_msg, "split search failed");
                split_results.push(LambdaSingleSplitResult {
                    split_id,
                    outcome: Some(Outcome::Error(error_msg)),
                });
            }
            Err(join_error) if join_error.is_cancelled() => {
                warn!("search task was cancelled");
                return Err(LambdaError::Cancelled);
            }
            Err(join_error) => {
                // Panics lose the captured split_id, so we fail the entire invocation.
                error!(error = %join_error, "search task panicked");
                return Err(LambdaError::Internal(format!(
                    "search task panicked: {join_error}"
                )));
            }
        }
    }
    info!(
        num_successes,
        num_failures, "leaf search completed (per-split)"
    );

    Ok(split_results)
}


================================================
FILE: quickwit/quickwit-lambda-server/src/lib.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

//! AWS Lambda handler for Quickwit leaf search operations.
//!
//! This crate provides the Lambda handler that executes leaf search requests.
//! It is designed to be deployed as an AWS Lambda function.

mod context;
mod error;
mod handler;

pub use context::LambdaSearcherContext;
pub use error::{LambdaError, LambdaResult};
pub use handler::{LambdaSearchRequestPayload, LambdaSearchResponsePayload, handle_leaf_search};


================================================
FILE: quickwit/quickwit-macros/Cargo.toml
================================================
[package]
name = "quickwit-macros"
description =  "Proc macro definitions"

version.workspace = true
edition.workspace = true
homepage.workspace = true
documentation.workspace = true
repository.workspace = true
authors.workspace = true
license.workspace = true

[lib]
proc-macro = true

[dependencies]
proc-macro2 = { workspace = true }
quote = { workspace = true }
syn = { workspace = true }


================================================
FILE: quickwit/quickwit-macros/src/lib.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::mem;

use proc_macro::TokenStream;
use proc_macro2::{Span, TokenStream as TokenStream2};
use quote::quote;
use syn::parse::{Parse, ParseStream, Parser};
use syn::punctuated::Punctuated;
use syn::{
    Attribute, Error, Field, Fields, FieldsNamed, Ident, ItemStruct, Meta, Path, Token, Visibility,
    parenthesized,
};

#[proc_macro_attribute]
pub fn serde_multikey(attr: TokenStream, item: TokenStream) -> TokenStream {
    match serde_multikey_inner(attr, item) {
        Ok(ts) => ts,
        Err(e) => e.to_compile_error().into(),
    }
}

fn serde_multikey_inner(_attr: TokenStream, item: TokenStream) -> Result<TokenStream, Error> {
    let Ok(input) = syn::parse::<ItemStruct>(item) else {
        return Err(Error::new(
            Span::call_site(),
            "the attribute can only be applied to struct",
        ));
    };

    let main_struct = generate_main_struct(input.clone())?;

    let proxy_struct = generate_proxy_struct(input)?;

    Ok(quote!(
    #main_struct
    #proxy_struct
    )
    .into())
}

/// Generate the main struct. It's a copy of the original struct, but with most
/// ser/de attributes removed, and serde try_from/into `__MultiKey{}` added.
fn generate_main_struct(mut input: ItemStruct) -> Result<TokenStream2, Error> {
    let (serialize, deserialize) = get_ser_de(&input.attrs)?;
    let has_utoipa_schema = get_and_remove_utoipa_schema(&mut input.attrs)?;

    if !deserialize && !serialize {
        return Err(Error::new(
            Span::call_site(),
            "`serde_multikey` was applied to a non Serialize/Deserialize struct",
        ));
    }

    // remove serde and utoipa attributes from fields
    for field in input.fields.iter_mut() {
        let attrs = mem::take(&mut field.attrs);
        field.attrs = attrs
            .into_iter()
            .filter(|attr| {
                !(attr.path().is_ident("serde_multikey")
                    || attr.path().is_ident("serde")
                    || attr.path().is_ident("serde_as")
                    || attr.path().is_ident("schema"))
            })
            .collect();
    }

    // remove serde attributes from struct
    let attrs = mem::take(&mut input.attrs);
    input.attrs = attrs
        .into_iter()
        .filter(|attr| !(attr.path().is_ident("serde") || attr.path().is_ident("serde_as")))
        .collect();

    if deserialize {
        let mut attr = Attribute::parse_outer
            .parse_str(&format!(
                r#"#[serde(try_from = "__MultiKey{}")]"#,
                input.ident
            ))
            .unwrap();
        input.attrs.append(&mut attr);
    }

    if serialize {
        let mut attr = Attribute::parse_outer
            .parse_str(&format!(r#"#[serde(into = "__MultiKey{}")]"#, input.ident))
            .unwrap();
        input.attrs.append(&mut attr);
    }

    let utoipa = if has_utoipa_schema {
        let main_ident = input.ident.clone();
        let main_ident_str = main_ident.to_string();
        let proxy_ident = Ident::new(&format!("__MultiKey{}", input.ident), input.ident.span());

        Some(quote!(
            impl<'__s> utoipa::ToSchema<'__s> for #main_ident {
                fn schema() -> (
                    &'__s str,
                    utoipa::openapi::RefOr<utoipa::openapi::schema::Schema>,
                ) {
                    (
                        #main_ident_str,
                        <#proxy_ident as utoipa::ToSchema>::schema().1,
                    )
                }
            }
        ))
    } else {
        None
    };

    Ok(quote!(
        #input

        #utoipa
    ))
}

/// Generate the proxy struct. It is a copy of the original struct, but fields marked
/// with `serde_multikey` have been replaced with the fields the correspond to.
/// Also generate TryFrom/Into as required.
fn generate_proxy_struct(mut input: ItemStruct) -> Result<TokenStream2, Error> {
    let main_ident = input.ident.clone();
    let proxy_ident = Ident::new(&format!("__MultiKey{}", input.ident), input.ident.span());

    input.ident = proxy_ident.clone();
    input.vis = Visibility::Inherited;
    // TODO wait for https://github.com/juhaku/utoipa/issues/704 to re-enable
    // input.attrs.append(&mut Attribute::parse_outer
    // .parse_str(&"#[doc(hidden)]")
    // .unwrap());

    let (ser, de) = get_ser_de(&input.attrs)?;

    let mut pass_through = Vec::<Ident>::new();
    let mut final_fields = Punctuated::<Field, Token![,]>::new();
    let mut try_from_conv = Vec::<TokenStream2>::new();
    let mut into_pre_conv = Vec::<TokenStream2>::new();
    let mut into_in_conv = Vec::<TokenStream2>::new();

    let Fields::Named(FieldsNamed { brace_token, named }) = input.fields else {
        return Err(Error::new(
            Span::call_site(),
            "`serde_multikey` was applied to a tuple-struct or an empty struct",
        ));
    };
    for pair in named.into_pairs() {
        let (mut field, ponct) = pair.into_tuple();
        // we are in a "normal" struct, not a tuple-struct, unwrap is fine.
        let field_name = field.ident.clone().unwrap();

        let (field_config, attrs) = parse_attributes(field.attrs, &field_name)?;
        field.attrs = attrs;

        if let Some(field_config) = field_config {
            let value = Ident::new("value", Span::call_site());
            for field in &field_config.proxy_fields {
                final_fields.push(field.clone());
            }
            match (ser, field_config.get_into(&value)) {
                (true, Some((pre_conv, in_conv))) => {
                    into_pre_conv.push(pre_conv);
                    into_in_conv.push(in_conv);
                }
                (false, None) => (),
                (true, None) => {
                    return Err(Error::new(
                        field_name.span(),
                        "structure implement serialize but no serializer defined",
                    ));
                }
                (false, Some(_)) => {
                    return Err(Error::new(
                        field_name.span(),
                        "structure doesn't implement serialize but a serializer is defined",
                    ));
                }
            }
            match (de, field_config.get_try_from(&value)) {
                (true, Some(conv)) => {
                    try_from_conv.push(conv);
                }
                (false, None) => (),
                (true, None) => {
                    return Err(Error::new(
                        field_name.span(),
                        "structure implement deserialize but no deserializer defined",
                    ));
                }
                (false, Some(_)) => {
                    return Err(Error::new(
                        field_name.span(),
                        "structure doesn't implement deserialize but a deserializer is defined",
                    ));
                }
            }
        } else {
            pass_through.push(field_name);
            final_fields.push(field);
            if let Some(ponct) = ponct {
                final_fields.push_punct(ponct);
            }
        }
    }
    input.fields = Fields::Named(FieldsNamed {
        brace_token,
        named: final_fields,
    });

    let into = if ser {
        Some(quote!(
            impl From<#main_ident> for #proxy_ident {
                fn from(value: #main_ident) -> #proxy_ident {
                    #(#into_pre_conv)*
                    #proxy_ident {
                        #(#pass_through: value.#pass_through,)*
                        #(#into_in_conv)*
                    }
                }
            }
        ))
    } else {
        None
    };
    let try_from = if de {
        Some(quote!(
            impl TryFrom<#proxy_ident> for #main_ident {
                type Error = String;

                fn try_from(value: #proxy_ident) -> Result<Self, Self::Error> {
                    Ok(#main_ident {
                        #(#pass_through: value.#pass_through,)*
                        #(#try_from_conv)*
                    })
                }
            }
        ))
    } else {
        None
    };
    Ok(quote!(
        #input

        #into
        #try_from
    ))
}

fn get_ser_de(attributes: &[Attribute]) -> Result<(bool, bool), Error> {
    let mut ser = false;
    let mut de = false;

    for attr in attributes {
        if !attr.path().is_ident("derive") {
            continue;
        }
        let Meta::List(ref derives) = attr.meta else {
            continue;
        };
        let derives =
            Punctuated::<Path, Token![,]>::parse_terminated.parse2(derives.tokens.clone())?;

        for path in derives.iter() {
            ser |= path_equiv(path, &["serde", "Serialize"]);
            de |= path_equiv(path, &["serde", "Deserialize"]);
        }
    }
    Ok((ser, de))
}

fn get_and_remove_utoipa_schema(attributes: &mut [Attribute]) -> Result<bool, Error> {
    let mut has_schema = false;
    for attr in attributes {
        if !attr.path().is_ident("derive") {
            continue;
        }
        let Meta::List(ref mut derives) = attr.meta else {
            continue;
        };

        let derive_list =
            Punctuated::<Path, Token![,]>::parse_terminated.parse2(derives.tokens.clone())?;
        let mut new_derives = Punctuated::<Path, Token![,]>::new();
        for path in derive_list {
            if path_equiv(&path, &["utoipa", "ToSchema"]) {
                has_schema = true;
            } else {
                new_derives.push(path);
            }
        }
        derives.tokens = quote!(#new_derives);
    }

    Ok(has_schema)
}

fn path_equiv(path: &Path, reference: &[&str]) -> bool {
    if path.segments.is_empty() || reference.is_empty() {
        return false;
    }

    path.segments
        .iter()
        .rev()
        .zip(reference.iter().rev())
        .fold(true, |equal, (path_part, ref_part)| {
            equal && path_part.ident == ref_part
        })
}

#[derive(Debug)]
struct MultiKeyOptions {
    main_field_name: Ident,
    deserializer: Option<Path>,
    serializer: Option<Path>,
    proxy_fields: Vec<Field>,
}

impl MultiKeyOptions {
    fn get_into(&self, this: &Ident) -> Option<(TokenStream2, TokenStream2)> {
        if let Some(ref serializer) = self.serializer {
            let field_names: Vec<_> = self
                .proxy_fields
                .iter()
                .map(|field| field.ident.clone().unwrap())
                .collect();
            let main_field_name = &self.main_field_name;

            let pre = quote!(
                let (#(#field_names,)*) = #serializer(#this.#main_field_name);
            );
            let in_struct = quote!(
                #(
                    #field_names,
                )*
            );
            Some((pre, in_struct))
        } else {
            None
        }
    }

    fn get_try_from(&self, this: &Ident) -> Option<TokenStream2> {
        if let Some(ref deserializer) = self.deserializer {
            let field_names: Vec<_> = self
                .proxy_fields
                .iter()
                .map(|field| field.ident.clone().unwrap())
                .collect();
            let main_field_name = &self.main_field_name;

            Some(quote!(
                #main_field_name: match #deserializer( #(#this.#field_names,)* ) {
                    Ok(val) => val,
                    Err(e) => return Err(e.to_string()),
                },
            ))
        } else {
            None
        }
    }
}

enum MultiKeyOption {
    Deserializer(Path),
    Serializer(Path),
    Fields(Vec<Field>),
}

impl Parse for MultiKeyOption {
    fn parse(input: ParseStream) -> Result<Self, Error> {
        let ident: Ident = input.parse()?;
        match ident.to_string().as_str() {
            "serializer" => {
                input.parse::<Token![=]>()?;
                Ok(MultiKeyOption::Serializer(input.parse::<Path>()?))
            }
            "deserializer" => {
                input.parse::<Token![=]>()?;
                Ok(MultiKeyOption::Deserializer(input.parse::<Path>()?))
            }
            "fields" => {
                input.parse::<Token![=]>()?;
                let content;
                parenthesized!(content in input);
                let fields = content.parse_terminated(Field::parse_named, Token![,])?;
                Ok(MultiKeyOption::Fields(fields.into_iter().collect()))
            }
            _ => Err(Error::new(ident.span(), "unknown field")),
        }
    }
}

impl Parse for MultiKeyOptions {
    fn parse(input: ParseStream) -> Result<Self, Error> {
        let mut res = MultiKeyOptions {
            main_field_name: Ident::new("tmp_name", Span::call_site()),
            deserializer: None,
            serializer: None,
            proxy_fields: Vec::new(),
        };

        let options = Punctuated::<MultiKeyOption, Token![,]>::parse_terminated(input)?;
        for option in options {
            match option {
                MultiKeyOption::Deserializer(path) => {
                    if res.deserializer.is_none() {
                        res.deserializer = Some(path);
                    } else {
                        todo!("throw error");
                    }
                }
                MultiKeyOption::Serializer(path) => {
                    if res.serializer.is_none() {
                        res.serializer = Some(path);
                    } else {
                        todo!("throw error");
                    }
                }
                MultiKeyOption::Fields(fields) => {
                    if res.proxy_fields.is_empty() {
                        res.proxy_fields = fields;
                    } else {
                        todo!("throw error");
                    }
                }
            }
        }

        if res.proxy_fields.is_empty() {
            todo!("throw error")
        }

        Ok(res)
    }
}

fn parse_attributes(
    attributes: Vec<Attribute>,
    field_name: &Ident,
) -> Result<(Option<MultiKeyOptions>, Vec<Attribute>), Error> {
    let (mut multikey_attributes, normal_attributes): (Vec<_>, _) = attributes
        .into_iter()
        .partition(|attr| attr.path().is_ident("serde_multikey"));

    if multikey_attributes.len() > 1 {
        let last = multikey_attributes.last().unwrap();
        return Err(Error::new(
            last.pound_token.spans[0],
            "`serde_multikey` was applied multiple time to the same field",
        ));
    }
    let options = if let Some(multikey_attribute) = multikey_attributes.pop() {
        let Meta::List(meta_list) = multikey_attribute.meta else {
            return Err(Error::new(
                multikey_attribute.pound_token.spans[0],
                "`serde_multikey` require list-style arguments",
            ));
        };
        let mut options: MultiKeyOptions = syn::parse2(meta_list.tokens)?;
        options.main_field_name = field_name.clone();
        Some(options)
    } else {
        None
    };

    Ok((options, normal_attributes))
}


================================================
FILE: quickwit/quickwit-metastore/Cargo.toml
================================================
[package]
name = "quickwit-metastore"

version.workspace = true
edition.workspace = true
homepage.workspace = true
documentation.workspace = true
repository.workspace = true
authors.workspace = true
license.workspace = true

[dependencies]
anyhow = { workspace = true }
async-trait = { workspace = true }
bytes = { workspace = true }
bytesize = { workspace = true }
futures = { workspace = true }
http = { workspace = true }
itertools = { workspace = true }
mockall = { workspace = true, optional = true }
once_cell = { workspace = true }
ouroboros = { workspace = true }
rand = { workspace = true }
regex = { workspace = true }
regex-syntax = { workspace = true }
sea-query = { workspace = true, optional = true }
sea-query-binder = { workspace = true, optional = true }
serde = { workspace = true }
serde_json = { workspace = true }
serde_with = { workspace = true }
sqlx = { workspace = true, optional = true }
tempfile = { workspace = true, optional = true }
thiserror = { workspace = true }
time = { workspace = true }
tokio = { workspace = true }
tokio-stream = { workspace = true }
tower = { workspace = true }
tracing = { workspace = true }
ulid = { workspace = true, features = ["serde"] }
uuid = { workspace = true }
utoipa = { workspace = true }

quickwit-common = { workspace = true }
quickwit-config = { workspace = true }
quickwit-doc-mapper = { workspace = true }
quickwit-proto = { workspace = true }
quickwit-query = { workspace = true }
quickwit-storage = { workspace = true }

[dev-dependencies]
dotenvy = { workspace = true }
futures = { workspace = true }
hyper-util = { workspace = true }
md5 = { workspace = true }
mockall = { workspace = true }
rand = { workspace = true }
serial_test = { workspace = true }
tempfile = { workspace = true }
tracing-subscriber = { workspace = true }

quickwit-common = { workspace = true, features = ["testsuite"] }
quickwit-config = { workspace = true, features = ["testsuite"] }
quickwit-doc-mapper = { workspace = true, features = ["testsuite"] }
quickwit-proto = { workspace = true, features = ["testsuite"] }
quickwit-storage = { workspace = true, features = ["testsuite"] }

[features]
ci-test = []
postgres = ["quickwit-proto/postgres", "sea-query", "sea-query-binder", "sqlx"]
testsuite = ["mockall", "tempfile", "quickwit-config/testsuite"]


================================================
FILE: quickwit/quickwit-metastore/README.md
================================================
# quickwit-metastore

## Starting postgres

The following command starts a postgresql server
locally to test the postgres metastore implementation.

`docker-compose up postgres`

Its data is saved in the tmp directory, and
is not necessarily cleaned up between two runs.

You can execute `make rm-postgres` to remove the
data of this postgresql database.

## Testing quickwit-metastore

To test FileBackedMetastore only, use the following command.

```
$ cargo test
```

To test including PostgresqlMetastore, you need to start PostgreSQL beforehand.
Start PostgreSQL for testing with the following command in `quickwit` project root.

```
$ make docker-compose-up DOCKER_SERVICES=postgres
```

Once PostgreSQL is up and running, you can run tests including PostgresqlMetastore with the following command.

```
$ cargo test --features=postgres
```

You can stop PostgreSQL with the following command.

```
$ docker-compose down
```

## Sqlx-cli and migrations

This sqlx-cli can be useful (but is not necessary) to work with migrations.

```
cargo install sqlx-cli
```

You can then use the following commands to apply/revert your postgresql migrations.
```
sqlx migrate run  --database-url postgres://quickwit-dev:quickwit-dev@localhost:5432/quickwit-metastore-dev --source migrations/postgresql
sqlx migrate revert  --database-url postgres://quickwit-dev:quickwit-dev@localhost:5432/quickwit-metastore-dev --source migrations/postgresql
```


================================================
FILE: quickwit/quickwit-metastore/build.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

fn main() {
    println!("cargo:rerun-if-changed=migrations/postgresql");
}


================================================
FILE: quickwit/quickwit-metastore/migrations/postgresql/10_add-split-incarnation-id.down.sql
================================================
ALTER TABLE indexes ALTER COLUMN index_uid TYPE VARCHAR(64);
ALTER TABLE indexes ALTER COLUMN index_id TYPE VARCHAR(50);
ALTER TABLE splits ALTER COLUMN index_uid TYPE VARCHAR(64);
ALTER TABLE delete_tasks ALTER COLUMN index_uid TYPE VARCHAR(64);


================================================
FILE: quickwit/quickwit-metastore/migrations/postgresql/10_add-split-incarnation-id.up.sql
================================================
ALTER TABLE indexes ALTER COLUMN index_uid TYPE VARCHAR(282);
ALTER TABLE indexes ALTER COLUMN index_id TYPE VARCHAR(255);
ALTER TABLE splits ALTER COLUMN index_uid TYPE VARCHAR(282);
ALTER TABLE delete_tasks ALTER COLUMN index_uid TYPE VARCHAR(282);


================================================
FILE: quickwit/quickwit-metastore/migrations/postgresql/11_add-split-maturity-timestamp-field.down.sql
================================================
ALTER TABLE splits
  DROP COLUMN maturity_timestamp;


================================================
FILE: quickwit/quickwit-metastore/migrations/postgresql/11_add-split-maturity-timestamp-field.up.sql
================================================
ALTER TABLE splits
    ADD COLUMN maturity_timestamp TIMESTAMP DEFAULT TO_TIMESTAMP(0);


================================================
FILE: quickwit/quickwit-metastore/migrations/postgresql/12_create-shards.down.sql
================================================
DROP TABLE shards;

DROP TYPE IF EXISTS SHARD_STATE;

================================================
FILE: quickwit/quickwit-metastore/migrations/postgresql/12_create-shards.up.sql
================================================
CREATE TYPE SHARD_STATE AS ENUM ('unspecified', 'open', 'unavailable', 'closed');

CREATE TABLE IF NOT EXISTS shards (
    index_uid VARCHAR(282) NOT NULL,
    source_id VARCHAR(255) NOT NULL,
    shard_id BIGSERIAL,
    leader_id VARCHAR(255) NOT NULL,
    follower_id VARCHAR(255),
    shard_state SHARD_STATE NOT NULL,
    publish_position_inclusive VARCHAR(255) NOT NULL,
    publish_token VARCHAR(255),
    PRIMARY KEY (index_uid, source_id, shard_id),
    FOREIGN KEY (index_uid) REFERENCES indexes (index_uid)
);

================================================
FILE: quickwit/quickwit-metastore/migrations/postgresql/13_migrate-otel-indexes-v0_6.down.sql
================================================
UPDATE 
   indexes
SET 
   index_metadata_json = REPLACE(
      REPLACE(index_metadata_json, '"output_format":"hex"', '"output_format":"base64"'),
      '"input_format":"hex"', '"input_format":"base64"'
   )
WHERE 
    index_id in ('otel-logs-v0_6', 'otel-traces-v0_6');


================================================
FILE: quickwit/quickwit-metastore/migrations/postgresql/13_migrate-otel-indexes-v0_6.up.sql
================================================
UPDATE 
   indexes
SET 
   index_metadata_json = REPLACE(
      REPLACE(index_metadata_json, '"output_format":"base64"', '"output_format":"hex"'),
      '"input_format":"base64"', '"input_format":"hex"'
   )
WHERE 
    index_id in ('otel-logs-v0_6', 'otel-traces-v0_6');


================================================
FILE: quickwit/quickwit-metastore/migrations/postgresql/14_update-shard-id.down.sql
================================================
ALTER TABLE shards
    ALTER COLUMN shard_id TYPE BIGSERIAL,
    ALTER COLUMN shard_id DROP NOT NULL,
    ALTER COLUMN shard_state DROP DEFAULT,
    ALTER COLUMN publish_position_inclusive DROP DEFAULT,
    DROP CONSTRAINT shards_index_uid_fkey,
    ADD CONSTRAINT shards_index_uid_fkey FOREIGN KEY (index_uid) REFERENCES indexes(index_uid)


================================================
FILE: quickwit/quickwit-metastore/migrations/postgresql/14_update-shard-id.up.sql
================================================
ALTER TABLE shards
    ALTER COLUMN shard_id TYPE VARCHAR(255),
    ALTER COLUMN shard_id SET NOT NULL,
    ALTER COLUMN shard_state SET DEFAULT 'open',
    ALTER COLUMN publish_position_inclusive SET DEFAULT '',
    DROP CONSTRAINT shards_index_uid_fkey,
    ADD CONSTRAINT shards_index_uid_fkey FOREIGN KEY (index_uid) REFERENCES indexes(index_uid) ON DELETE CASCADE


================================================
FILE: quickwit/quickwit-metastore/migrations/postgresql/15_create-templates.down.sql
================================================
DROP TABLE index_templates;


================================================
FILE: quickwit/quickwit-metastore/migrations/postgresql/15_create-templates.up.sql
================================================
CREATE TABLE IF NOT EXISTS index_templates (
    template_id VARCHAR(255) NOT NULL,
    positive_index_id_patterns VARCHAR(255)[] NOT NULL,
    negative_index_id_patterns VARCHAR(255)[] NOT NULL,
    priority INTEGER NOT NULL DEFAULT 0,
    index_template_json TEXT NOT NULL,
    PRIMARY KEY (template_id)
);


================================================
FILE: quickwit/quickwit-metastore/migrations/postgresql/16_create-index-split-uid.down.sql
================================================
DROP INDEX IF EXISTS splits_index_uid_idx;


================================================
FILE: quickwit/quickwit-metastore/migrations/postgresql/16_create-index-split-uid.up.sql
================================================
CREATE INDEX IF NOT EXISTS splits_index_uid_idx ON splits USING HASH(index_uid);


================================================
FILE: quickwit/quickwit-metastore/migrations/postgresql/17_create-index-split-timestamp.down.sql
================================================
DROP INDEX IF EXISTS splits_time_range_start_idx;
DROP INDEX IF EXISTS splits_time_range_end_idx;


================================================
FILE: quickwit/quickwit-metastore/migrations/postgresql/17_create-index-split-timestamp.up.sql
================================================
CREATE INDEX IF NOT EXISTS splits_time_range_start_idx ON splits (time_range_start);
CREATE INDEX IF NOT EXISTS splits_time_range_end_idx ON splits (time_range_end);


================================================
FILE: quickwit/quickwit-metastore/migrations/postgresql/18_create-index-shard-index-uid.down.sql
================================================
CREATE INDEX IF NOT EXISTS shards_index_uid_idx ON shards USING HASH(index_uid);


================================================
FILE: quickwit/quickwit-metastore/migrations/postgresql/18_create-index-shard-index-uid.up.sql
================================================
DROP INDEX IF EXISTS shards_index_uid_idx;


================================================
FILE: quickwit/quickwit-metastore/migrations/postgresql/19_add-split-node-id-field.down.sql
================================================
DROP INDEX IF EXISTS splits_node_id_idx;

ALTER TABLE splits
    DROP IF EXISTS COLUMN node_id;


================================================
FILE: quickwit/quickwit-metastore/migrations/postgresql/19_add-split-node-id-field.up.sql
================================================
ALTER TABLE splits
    ADD COLUMN node_id VARCHAR(253);

-- Split metadata has been stable for quite a while, so we allow ourselves to do this,
-- but please, reader of the future, do not reapply this pattern without careful consideration.
UPDATE
    splits
SET
    node_id = splits.split_metadata_json::json ->> 'node_id';

ALTER TABLE splits
    ALTER COLUMN node_id SET NOT NULL;

CREATE INDEX IF NOT EXISTS splits_node_id_idx ON splits USING HASH (node_id);


================================================
FILE: quickwit/quickwit-metastore/migrations/postgresql/1_create-indexes.down.sql
================================================
DROP TABLE indexes;

DROP FUNCTION IF EXISTS quickwit_manage_update_timestamp(_tbl regclass);
DROP FUNCTION IF EXISTS quickwit_set_update_timestamp();


================================================
FILE: quickwit/quickwit-metastore/migrations/postgresql/1_create-indexes.up.sql
================================================
DO $$
BEGIN
    IF EXISTS (SELECT * FROM pg_tables WHERE tablename  = '__diesel_schema_migrations')
	THEN
	    -- We are migrating from a diesel table.
	    -- That's ok, but let's make sure we are at the last version.
	    --
	    -- If you hit this Assert, the workaround is to download Quickwit 0.3.1
	    -- and run the missing migrations.
	    ASSERT EXISTS (
		    SELECT FROM __diesel_schema_migrations
		    WHERE version = '20211217102648'
		);
		DROP TABLE __diesel_schema_migrations;
	END IF;
END $$;


CREATE TABLE IF NOT EXISTS indexes (
    index_id VARCHAR(50) PRIMARY KEY,
    index_metadata_json TEXT NOT NULL,
    create_timestamp TIMESTAMP NOT NULL DEFAULT (CURRENT_TIMESTAMP AT TIME ZONE 'UTC'),
    update_timestamp TIMESTAMP NOT NULL DEFAULT (CURRENT_TIMESTAMP AT TIME ZONE 'UTC')
);

CREATE OR REPLACE FUNCTION quickwit_manage_update_timestamp(_tbl regclass) RETURNS VOID AS $$
BEGIN
    EXECUTE format('DROP TRIGGER IF EXISTS set_update_timestamp ON %s CASCADE', _tbl);
    EXECUTE format('CREATE TRIGGER set_update_timestamp BEFORE UPDATE ON %s
                    FOR EACH ROW EXECUTE PROCEDURE quickwit_set_update_timestamp()', _tbl);
END;
$$ LANGUAGE plpgsql;

CREATE OR REPLACE FUNCTION quickwit_set_update_timestamp() RETURNS trigger AS $$
BEGIN
    IF (
        NEW IS DISTINCT FROM OLD AND
        NEW.update_timestamp IS NOT DISTINCT FROM OLD.update_timestamp
    ) THEN
        NEW.update_timestamp := (CURRENT_TIMESTAMP AT TIME ZONE 'UTC');
    END IF;
    RETURN NEW;
END;
$$ LANGUAGE plpgsql;

-- Apply the `update_timestamp` trigger to the `indexes` table
SELECT quickwit_manage_update_timestamp('indexes');

-- We also want to update an index `update_timestamp` field whenever a related split
-- is modified.
CREATE OR REPLACE FUNCTION set_index_update_timestamp_for_split() RETURNS trigger AS $$
BEGIN
    IF (TG_OP = 'INSERT' OR TG_OP = 'UPDATE') THEN
        UPDATE indexes SET update_timestamp = NEW.update_timestamp
        WHERE indexes.index_id = NEW.index_id;
    ELSIF (TG_OP = 'DELETE') THEN
        UPDATE indexes SET update_timestamp = (CURRENT_TIMESTAMP AT TIME ZONE 'UTC')
        WHERE indexes.index_id = OLD.index_id;
    END IF;
    RETURN NULL;
END;
$$ LANGUAGE plpgsql;


================================================
FILE: quickwit/quickwit-metastore/migrations/postgresql/20_add-shard-doc-mapping-uid-field.down.sql
================================================
ALTER TABLE shards
    DROP IF EXISTS COLUMN doc_mapping_uid;


================================================
FILE: quickwit/quickwit-metastore/migrations/postgresql/20_add-shard-doc-mapping-uid-field.up.sql
================================================
ALTER TABLE shards
    ADD COLUMN IF NOT EXISTS doc_mapping_uid VARCHAR(26);

-- Index metadata has been stable for quite a while, so we allow ourselves to do this,
-- but please, reader of the future, do not reapply this pattern without careful consideration.
UPDATE
    shards
SET
    doc_mapping_uid = '00000000000000000000000000';

ALTER TABLE shards
    ALTER COLUMN doc_mapping_uid SET NOT NULL;


================================================
FILE: quickwit/quickwit-metastore/migrations/postgresql/21_add-shard-update-timestamp-field.down.sql
================================================
ALTER TABLE shards
    DROP IF EXISTS update_timestamp;


================================================
FILE: quickwit/quickwit-metastore/migrations/postgresql/21_add-shard-update-timestamp-field.up.sql
================================================
ALTER TABLE shards
    -- We prefer a fix value here because it makes  tests simpler. 
    -- Very few users use the shard API in versions <0.9 anyway.
    ADD COLUMN IF NOT EXISTS update_timestamp TIMESTAMP NOT NULL DEFAULT '2024-01-01 00:00:00+00';


================================================
FILE: quickwit/quickwit-metastore/migrations/postgresql/22_change-splits-pkey.down.sql
================================================
CREATE INDEX IF NOT EXISTS splits_index_uid_idx ON splits USING HASH(index_uid);
ALTER TABLE splits DROP CONSTRAINT splits_pkey, ADD PRIMARY KEY (split_id);


================================================
FILE: quickwit/quickwit-metastore/migrations/postgresql/22_change-splits-pkey.up.sql
================================================
ALTER TABLE splits DROP CONSTRAINT splits_pkey, ADD PRIMARY KEY (index_uid, split_id);
DROP INDEX IF EXISTS splits_index_uid_idx;


================================================
FILE: quickwit/quickwit-metastore/migrations/postgresql/23_change-indexes-unique-index.down.sql
================================================
DROP INDEX IF EXISTS indexes_index_id_unique;
ALTER TABLE indexes ADD CONSTRAINT indexes_index_id_unique UNIQUE (index_id);


================================================
FILE: quickwit/quickwit-metastore/migrations/postgresql/23_change-indexes-unique-index.up.sql
================================================
ALTER TABLE indexes DROP CONSTRAINT IF EXISTS indexes_index_id_unique;

CREATE UNIQUE INDEX IF NOT EXISTS indexes_index_id_unique
  ON indexes USING btree ("index_id" varchar_pattern_ops);


================================================
FILE: quickwit/quickwit-metastore/migrations/postgresql/24_add-arbitrary-kv.down.sql
================================================
DROP TABLE kv;


================================================
FILE: quickwit/quickwit-metastore/migrations/postgresql/24_add-arbitrary-kv.up.sql
================================================
CREATE TABLE IF NOT EXISTS kv (
    key VARCHAR(50) PRIMARY KEY,
    value TEXT NOT NULL
);


================================================
FILE: quickwit/quickwit-metastore/migrations/postgresql/25_add-split-size.down.sql
================================================
DROP INDEX IF EXISTS idx_splits_stats;

ALTER TABLE splits DROP COLUMN IF EXISTS split_size_bytes;


================================================
FILE: quickwit/quickwit-metastore/migrations/postgresql/25_add-split-size.up.sql
================================================
ALTER TABLE splits ADD COLUMN IF NOT EXISTS split_size_bytes BIGINT NOT NULL GENERATED ALWAYS AS ((split_metadata_json::json->'footer_offsets'->>'end')::bigint) STORED;

CREATE INDEX IF NOT EXISTS idx_splits_stats ON splits (index_uid, split_state) INCLUDE (split_size_bytes);


================================================
FILE: quickwit/quickwit-metastore/migrations/postgresql/2_create-splits.down.sql
================================================
DROP TABLE splits;

DROP FUNCTION IF EXISTS set_index_update_timestamp_for_split();


================================================
FILE: quickwit/quickwit-metastore/migrations/postgresql/2_create-splits.up.sql
================================================
CREATE TABLE IF NOT EXISTS splits (
    split_id VARCHAR(50) PRIMARY KEY,
    split_state VARCHAR(30) NOT NULL,
    time_range_start BIGINT,
    time_range_end BIGINT,
    tags TEXT[] NOT NULL,
    split_metadata_json TEXT NOT NULL,
    index_id VARCHAR(50) NOT NULL,
    create_timestamp TIMESTAMP NOT NULL DEFAULT (CURRENT_TIMESTAMP AT TIME ZONE 'UTC'),
    update_timestamp TIMESTAMP NOT NULL DEFAULT (CURRENT_TIMESTAMP AT TIME ZONE 'UTC'),

    FOREIGN KEY(index_id) REFERENCES indexes(index_id)
);

DROP TRIGGER IF EXISTS quickwit_set_index_update_timestamp_on_split_change ON splits CASCADE;
CREATE TRIGGER quickwit_set_index_update_timestamp_on_split_change
    AFTER INSERT OR DELETE OR UPDATE ON splits
    FOR EACH ROW
    EXECUTE PROCEDURE set_index_update_timestamp_for_split();

-- We also want to update an index `update_timestamp` field whenever a related split
-- is modified.
CREATE OR REPLACE FUNCTION set_index_update_timestamp_for_split() RETURNS trigger AS $$
BEGIN
    IF (TG_OP = 'INSERT' OR TG_OP = 'UPDATE') THEN
        UPDATE indexes SET update_timestamp = NEW.update_timestamp
        WHERE indexes.index_id = NEW.index_id;
    ELSIF (TG_OP = 'DELETE') THEN
        UPDATE indexes SET update_timestamp = (CURRENT_TIMESTAMP AT TIME ZONE 'UTC')
        WHERE indexes.index_id = OLD.index_id;
    END IF;
    RETURN NULL;
END;

$$ LANGUAGE plpgsql;


-- apply the trigger to the `splits` table
SELECT quickwit_manage_update_timestamp('splits');


================================================
FILE: quickwit/quickwit-metastore/migrations/postgresql/3_add-split-publish-timestamp-field.down.sql
================================================
ALTER TABLE splits
  DROP COLUMN publish_timestamp;


DROP FUNCTION IF EXISTS set_split_publish_timestamp_on_split_publish();
DROP TRIGGER IF EXISTS set_split_publish_timestamp_on_split_publish ON splits CASCADE;
DROP FUNCTION IF EXISTS set_split_publish_timestamp_for_split(); 


================================================
FILE: quickwit/quickwit-metastore/migrations/postgresql/3_add-split-publish-timestamp-field.up.sql
================================================
ALTER TABLE splits
    ADD COLUMN publish_timestamp TIMESTAMP DEFAULT NULL;

-- We want to update the split `publish_timestamp` field whenever the split
-- being is published.
CREATE OR REPLACE FUNCTION set_split_publish_timestamp_for_split() RETURNS trigger AS $$
BEGIN
    IF (TG_OP = 'UPDATE') AND (NEW.split_state = 'Published') AND (OLD.split_state = 'Staged') THEN
        NEW.publish_timestamp := (CURRENT_TIMESTAMP AT TIME ZONE 'UTC');
    END IF;
    RETURN NEW;
END;

$$ LANGUAGE plpgsql;

DROP TRIGGER IF EXISTS set_split_publish_timestamp_on_split_publish ON splits CASCADE;
CREATE TRIGGER set_split_publish_timestamp_on_split_publish
    BEFORE UPDATE ON splits
    FOR EACH ROW
    EXECUTE PROCEDURE set_split_publish_timestamp_for_split();


================================================
FILE: quickwit/quickwit-metastore/migrations/postgresql/4_create-delete_tasks.down.sql
================================================
DROP TABLE delete_tasks;


================================================
FILE: quickwit/quickwit-metastore/migrations/postgresql/4_create-delete_tasks.up.sql
================================================
CREATE TABLE IF NOT EXISTS delete_tasks (
    create_timestamp TIMESTAMP NOT NULL DEFAULT (CURRENT_TIMESTAMP AT TIME ZONE 'UTC'),
    opstamp BIGSERIAL PRIMARY KEY,
    index_id VARCHAR(50) NOT NULL,
    delete_query_json TEXT NOT NULL,

    FOREIGN KEY(index_id) REFERENCES indexes(index_id) ON DELETE CASCADE
);


================================================
FILE: quickwit/quickwit-metastore/migrations/postgresql/5_add-delete-opstamp-splits.down.sql
================================================
ALTER TABLE splits DROP COLUMN delete_opstamp;

================================================
FILE: quickwit/quickwit-metastore/migrations/postgresql/5_add-delete-opstamp-splits.up.sql
================================================
ALTER TABLE splits ADD COLUMN delete_opstamp BIGINT CHECK (delete_opstamp >= 0) DEFAULT 0;


================================================
FILE: quickwit/quickwit-metastore/migrations/postgresql/6_delete-update-index-update-timestamp-on-split-update-trigger.up.sql
================================================
DROP TRIGGER IF EXISTS quickwit_set_index_update_timestamp_on_split_change ON splits CASCADE;


================================================
FILE: quickwit/quickwit-metastore/migrations/postgresql/7_delete-split-table-triggers.up.sql
================================================
DROP TRIGGER IF EXISTS set_split_publish_timestamp_on_split_publish ON splits CASCADE;
DROP TRIGGER IF EXISTS set_update_timestamp ON splits CASCADE;


================================================
FILE: quickwit/quickwit-metastore/migrations/postgresql/8_delete-update-timestamp-on-indexes-table.up.sql
================================================
ALTER TABLE indexes DROP COLUMN IF EXISTS update_timestamp;
DROP TRIGGER IF EXISTS set_update_timestamp ON indexes;

================================================
FILE: quickwit/quickwit-metastore/migrations/postgresql/9_add-split-incarnation-id.down.sql
================================================

ALTER TABLE delete_tasks DROP CONSTRAINT IF EXISTS delete_tasks_index_uid_fkey;
UPDATE delete_tasks set index_uid = split_part(index_uid,':',1);
ALTER TABLE delete_tasks ALTER COLUMN index_uid TYPE VARCHAR(50);
ALTER TABLE delete_tasks RENAME COLUMN index_uid TO index_id;

ALTER TABLE splits DROP CONSTRAINT IF EXISTS splits_index_uid_fkey;
ALTER TABLE splits ADD COLUMN incarnation_id VARCHAR(26) NOT NULL DEFAULT '00000000000000000000000000';
UPDATE splits set index_uid = split_part(index_uid,':',1);
ALTER TABLE splits ALTER COLUMN index_uid TYPE VARCHAR(50);
ALTER TABLE splits RENAME COLUMN index_uid TO index_id;

ALTER TABLE indexes DROP COLUMN index_id;
UPDATE indexes set index_uid = split_part(index_uid,':',1);
ALTER TABLE indexes ALTER COLUMN index_uid TYPE VARCHAR(50);
ALTER TABLE indexes RENAME COLUMN index_uid TO index_id;

ALTER TABLE delete_tasks ADD CONSTRAINT delete_tasks_index_id_fkey FOREIGN KEY (index_id) REFERENCES indexes(index_id) ON DELETE CASCADE;
ALTER TABLE splits ADD CONSTRAINT splits_index_id_fkey FOREIGN KEY (index_id) REFERENCES indexes(index_id) ON DELETE CASCADE;


================================================
FILE: quickwit/quickwit-metastore/migrations/postgresql/9_add-split-incarnation-id.up.sql
================================================
ALTER TABLE indexes RENAME COLUMN index_id TO index_uid;
ALTER TABLE indexes ADD COLUMN index_id VARCHAR(50) NOT NULL DEFAULT '';
UPDATE indexes set index_id = index_uid;
ALTER TABLE indexes ADD CONSTRAINT indexes_index_id_unique UNIQUE (index_id);
ALTER TABLE indexes ALTER COLUMN index_uid TYPE VARCHAR(64);

ALTER TABLE splits DROP CONSTRAINT IF EXISTS splits_index_id_fkey;
ALTER TABLE splits RENAME COLUMN index_id TO index_uid;
ALTER TABLE splits ALTER COLUMN index_uid TYPE VARCHAR(64);
ALTER TABLE splits ADD CONSTRAINT splits_index_uid_fkey FOREIGN KEY (index_uid) REFERENCES indexes(index_uid) ON DELETE CASCADE;

ALTER TABLE delete_tasks DROP CONSTRAINT IF EXISTS delete_tasks_index_id_fkey;
ALTER TABLE delete_tasks RENAME COLUMN index_id TO index_uid;
ALTER TABLE delete_tasks ALTER COLUMN index_uid TYPE VARCHAR(64);
ALTER TABLE delete_tasks ADD CONSTRAINT delete_tasks_index_uid_fkey FOREIGN KEY (index_uid) REFERENCES indexes(index_uid) ON DELETE CASCADE;


================================================
FILE: quickwit/quickwit-metastore/src/backward_compatibility_tests/README.md
================================================
See docs/internals/backward-compatibility.md.


================================================
FILE: quickwit/quickwit-metastore/src/backward_compatibility_tests/mod.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::fs;
use std::path::{Path, PathBuf};

use anyhow::{Context, bail};
use quickwit_config::{IndexConfig, IndexTemplate, SourceConfig, TestableForRegression};
use serde::{Deserialize, Serialize};
use serde_json::Value as JsonValue;

use crate::file_backed::file_backed_index::FileBackedIndex;
use crate::file_backed::manifest::Manifest;
use crate::{IndexMetadata, SplitMetadata};

/// In order to avoid confusion, we need to make sure that the
/// resource versions is the same for all resources.
///
/// We don't want to confuse quickwit users with different source_config /
/// index_config versions.
///
/// If you bump this version, makes sure to update all resources.
/// Of course some resource may not have any config change.
///
/// You can just reuse the same versioned object in that case.
/// ```
/// enum MyResource {
///     #[serde(rename="0.1")]
///     V0_1(MyResourceV1),
///     #[serde(rename="0.2")]
///     V0_2(MyResourceV1) //< there was no change in this version.
/// }
const GLOBAL_QUICKWIT_RESOURCE_VERSION: &str = "0.9";

/// This test makes sure that the resource is using the current `GLOBAL_QUICKWIT_RESOURCE_VERSION`.
fn test_global_version<T: Serialize>(serializable: &T) -> anyhow::Result<()> {
    let json = serde_json::to_value(serializable).unwrap();
    let version_value = json.get("version").context("no version tag")?;
    let version_str = version_value.as_str().context("version should be a str")?;
    if version_str != GLOBAL_QUICKWIT_RESOURCE_VERSION {
        bail!(
            "version `{version_str}` is not the global quickwit resource version \
             ({GLOBAL_QUICKWIT_RESOURCE_VERSION})"
        );
    }
    Ok(())
}

fn deserialize_json_file<T>(path: &Path) -> anyhow::Result<T>
where for<'a> T: Deserialize<'a> {
    let payload = std::fs::read(path)?;
    let deserialized: T = serde_json::from_slice(&payload)?;
    Ok(deserialized)
}

fn test_backward_compatibility_single_case<T>(path: &Path) -> anyhow::Result<()>
where T: TestableForRegression + std::fmt::Debug {
    println!("---\nTest deserialization of {}", path.display());
    let deserialized: T = deserialize_json_file(path)?;
    let expected_path = path.to_string_lossy().replace(".json", ".expected.json");
    let expected: T = deserialize_json_file(Path::new(&expected_path))?;
    println!("---\nTest equality of {expected:?}");
    println!("---\nwith {deserialized:?}");
    deserialized.assert_equality(&expected);
    Ok(())
}

/// For each pair of `x.json` and `x.expected.json` in `test_dir`, assert that the deserialized
/// versions are equal according to `T::assert_equality`.
fn test_backward_compatibility<T>(test_dir: &Path) -> anyhow::Result<()>
where T: TestableForRegression + std::fmt::Debug {
    for entry in
        fs::read_dir(test_dir).with_context(|| format!("failed to read {}", test_dir.display()))?
    {
        let entry = entry?;
        let path = entry.path();
        if path.to_string_lossy().ends_with(".expected.json")
            || path.to_string_lossy().ends_with(".modified.json")
        {
            continue;
        }
        test_backward_compatibility_single_case::<T>(&path)
            .with_context(|| format!("test path {}", path.display()))?;
    }
    Ok(())
}

fn test_and_update_expected_files_single_case<T>(expected_path: &Path) -> anyhow::Result<bool>
where for<'a> T: std::fmt::Debug + Serialize + Deserialize<'a> {
    let expected: T = deserialize_json_file(Path::new(&expected_path))?;
    let expected_old_json_value: JsonValue = deserialize_json_file(Path::new(&expected_path))?;
    let expected_new_json_value: JsonValue = serde_json::to_value(&expected)?;
    // We compare json Value, so we don't detect format change like a change in the field order.
    if expected_old_json_value == expected_new_json_value {
        // No modification
        return Ok(false);
    }
    println!("---\nTest deserialization of {}", expected_path.display());
    println!("---\nexpected {expected:?}");
    println!("---\nwith {expected_new_json_value:?}");
    let mut expected_new_json = serde_json::to_string_pretty(&expected_new_json_value)?;
    expected_new_json.push('\n');
    std::fs::write(
        expected_path.with_extension("modified.json"),
        expected_new_json.as_bytes(),
    )?;
    Ok(true)
}

/// For versions different (older) than the current [GLOBAL_QUICKWIT_RESOURCE_VERSION],
/// assert whether the expected.json files need to be changed.
///
/// Returns the proposed updated files (xxx.expected.modified.json).
fn test_and_update_old_expected_files<T>(test_dir: &Path) -> anyhow::Result<Vec<PathBuf>>
where for<'a> T: std::fmt::Debug + Deserialize<'a> + Serialize {
    let mut updated_expected_files = Vec::new();
    for entry in fs::read_dir(test_dir)? {
        let entry = entry?;
        let path = entry.path();
        if !path.to_string_lossy().ends_with(".expected.json") {
            continue;
        }
        if path.to_string_lossy().ends_with(&format!(
            "v{GLOBAL_QUICKWIT_RESOURCE_VERSION}.expected.json"
        )) {
            continue;
        }
        if test_and_update_expected_files_single_case::<T>(&path)
            .with_context(|| format!("test filepath {}", path.display()))?
        {
            updated_expected_files.push(path.with_extension("modified.json"));
        }
    }
    Ok(updated_expected_files)
}

/// Asserts whether the serialized version of the `sample` is the same as the existing
/// `v{GLOBAL_QUICKWIT_RESOURCE_VERSION}.json`.
///
/// Returns the created serialized files if they didn't exist (x.json and x.expected.json) or the
/// proposed updated files (.modified.json) if they changed.
///
/// Both generated files have identical contents.
fn test_and_create_new_test<T>(test_dir: &Path, sample: T) -> anyhow::Result<Vec<PathBuf>>
where for<'a> T: Serialize {
    let sample_json_value = serde_json::to_value(&sample)?;
    let mut sample_json = serde_json::to_string_pretty(&sample_json_value)?;
    sample_json.push('\n');

    let file_regression_test_path_str = format!(
        "{}/v{GLOBAL_QUICKWIT_RESOURCE_VERSION}.json",
        test_dir.display()
    );
    let mut file_regression_test_path = PathBuf::from(file_regression_test_path_str);

    let (changes_detected, file_created) = if file_regression_test_path.try_exists()? {
        let expected_old_json_value: JsonValue = deserialize_json_file(&file_regression_test_path)?;
        let expected_new_json_value: JsonValue = serde_json::from_str(&sample_json)?;
        (expected_old_json_value != expected_new_json_value, false)
    } else {
        (false, true)
    };

    let mut file_regression_expected_path =
        file_regression_test_path.with_extension("expected.json");

    if !file_created {
        file_regression_test_path = file_regression_test_path.with_extension("modified.json");
        file_regression_expected_path =
            file_regression_expected_path.with_extension("modified.json")
    }

    if changes_detected || file_created {
        std::fs::write(&file_regression_test_path, sample_json.as_bytes())?;
        std::fs::write(&file_regression_expected_path, sample_json.as_bytes())?;
        Ok(vec![
            file_regression_test_path,
            file_regression_expected_path,
        ])
    } else {
        Ok(vec![])
    }
}

/// This helper function scans the `test-data/{test_name}`
/// for JSON deserialization regression tests and runs them sequentially.
///
/// - `test_name` is just the subdirectory name, for the type being test.
pub(crate) fn test_json_backward_compatibility_helper<T>(test_name: &str) -> anyhow::Result<()>
where T: TestableForRegression + std::fmt::Debug {
    let sample_instance: T = T::sample_for_regression();
    test_global_version(&sample_instance).unwrap();

    let test_dir = Path::new("test-data").join(test_name);
    test_backward_compatibility::<T>(&test_dir).context("backward-compatibility")?;
    let updated_files =
        test_and_update_old_expected_files::<T>(&test_dir).context("test-and-update")?;

    let mut updated_or_new_files = test_and_create_new_test::<T>(&test_dir, sample_instance)
        .context("test-and-create-new-test")?;

    updated_or_new_files.extend(updated_files);

    if !updated_or_new_files.is_empty() {
        panic!(
            "Some files have been updated or created. Please check the diff and replace their \
             counterparts when appropriate: {updated_or_new_files:?}"
        );
    }

    Ok(())
}

#[test]
fn test_split_metadata_backward_compatibility() {
    test_json_backward_compatibility_helper::<SplitMetadata>("split-metadata").unwrap();
}

#[test]
fn test_index_metadata_backward_compatibility() {
    test_json_backward_compatibility_helper::<IndexMetadata>("index-metadata").unwrap();
}

#[test]
fn test_index_config_global_version() {
    let sample_instance = IndexConfig::sample_for_regression();
    test_global_version(&sample_instance).unwrap();
}

#[test]
fn test_source_config_global_version() {
    let sample_instance = SourceConfig::sample_for_regression();
    test_global_version(&sample_instance).unwrap();
}

#[test]
fn test_file_backed_index_backward_compatibility() {
    test_json_backward_compatibility_helper::<FileBackedIndex>("file-backed-index").unwrap();
}

#[test]
fn test_file_backed_metastore_manifest_backward_compatibility() {
    test_json_backward_compatibility_helper::<Manifest>("manifest").unwrap();
}

#[test]
fn test_index_template_global_version() {
    let sample_instance = IndexTemplate::sample_for_regression();
    test_global_version(&sample_instance).unwrap();
}

/// Testing the tests
///
/// A simplified example that helps understanding the backward compatibility tests.
#[cfg(test)]
mod tests {
    use std::panic::catch_unwind;

    use serde_json::json;

    use super::*;

    #[derive(Serialize, Deserialize, Debug, Clone)]
    #[serde(into = "VersionedTestEntity")]
    #[serde(from = "VersionedTestEntity")]
    struct TestEntity {
        field_already_in_0_7: u16,
        field_added_in_0_8: u16,
    }

    #[derive(Serialize, Deserialize, Debug, Clone)]
    struct TestEntityV0_8 {
        field_already_in_0_7: u16,
        field_added_in_0_8: u16,
    }

    #[derive(Deserialize, Debug, Clone)]
    struct TestEntityV0_7 {
        field_already_in_0_7: u16,
    }

    #[derive(Clone, Debug, Serialize, Deserialize, utoipa::ToSchema)]
    #[serde(tag = "version")]
    enum VersionedTestEntity {
        #[serde(rename = "0.9")]
        #[serde(alias = "0.8")]
        V0_8(TestEntityV0_8),
        #[serde(alias = "0.7", skip_serializing)]
        V0_7(TestEntityV0_7),
    }

    impl From<VersionedTestEntity> for TestEntity {
        fn from(versioned_test_entity: VersionedTestEntity) -> Self {
            match versioned_test_entity {
                VersionedTestEntity::V0_8(v0_9) => TestEntity {
                    field_added_in_0_8: v0_9.field_added_in_0_8,
                    field_already_in_0_7: v0_9.field_already_in_0_7,
                },
                VersionedTestEntity::V0_7(v0_7) => TestEntity {
                    field_already_in_0_7: v0_7.field_already_in_0_7,
                    field_added_in_0_8: 1,
                },
            }
        }
    }

    impl From<TestEntity> for VersionedTestEntity {
        fn from(test_entity: TestEntity) -> Self {
            VersionedTestEntity::V0_8(TestEntityV0_8 {
                field_added_in_0_8: test_entity.field_added_in_0_8,
                field_already_in_0_7: test_entity.field_already_in_0_7,
            })
        }
    }

    impl TestableForRegression for TestEntity {
        fn sample_for_regression() -> Self {
            TestEntity {
                field_added_in_0_8: 43,
                field_already_in_0_7: 42,
            }
        }

        fn assert_equality(&self, other: &Self) {
            assert_eq!(self.field_added_in_0_8, other.field_added_in_0_8);
            assert_eq!(self.field_already_in_0_7, other.field_already_in_0_7);
        }
    }

    #[test]
    fn test_test_json_backward_compatibility_helper_create() {
        let temp_dir = tempfile::tempdir().unwrap();
        let temp_path = temp_dir.path();

        let json_sample_0_7 = json!({"version": "0.7", "field_already_in_0_7": 42});
        let json_sample_0_8 = json!({"version": GLOBAL_QUICKWIT_RESOURCE_VERSION,
"field_already_in_0_7": 42, "field_added_in_0_8": 43});

        let json_sample_0_7_str = serde_json::to_string_pretty(&json_sample_0_7).unwrap();
        let json_sample_0_8_str = serde_json::to_string_pretty(&json_sample_0_8).unwrap();

        std::fs::write(temp_path.join("v0.7.json"), json_sample_0_7_str.as_bytes()).unwrap();
        std::fs::write(
            temp_path.join("v0.7.expected.json"),
            json_sample_0_7_str.as_bytes(),
        )
        .unwrap();
        std::fs::write(temp_path.join("v0.8.json"), json_sample_0_8_str.as_bytes()).unwrap();
        std::fs::write(
            temp_path.join("v0.8.expected.json"),
            json_sample_0_8_str.as_bytes(),
        )
        .unwrap();

        let test_panic = catch_unwind(|| {
            test_json_backward_compatibility_helper::<TestEntity>(&temp_path.to_string_lossy())
                .unwrap();
        });
        let test_panic_msg = format!(
            "{:?}",
            test_panic.unwrap_err().downcast::<String>().unwrap()
        );
        let latest_version_filename = format!("v{GLOBAL_QUICKWIT_RESOURCE_VERSION}.json");
        let latest_version_expected_filename =
            format!("v{GLOBAL_QUICKWIT_RESOURCE_VERSION}.expected.json");
        assert!(test_panic_msg.contains(&latest_version_filename));
        assert!(test_panic_msg.contains(&latest_version_expected_filename));
        assert!(test_panic_msg.contains("v0.7.expected.modified.json"));

        // assert on the directory
        let nb_files = fs::read_dir(temp_path).unwrap().count();
        assert_eq!(nb_files, 4 + 3);
        let created_last_version =
            deserialize_json_file::<JsonValue>(&temp_path.join(latest_version_filename)).unwrap();
        assert_eq!(created_last_version, json_sample_0_8);
        let created_expected_last_version =
            deserialize_json_file::<JsonValue>(&temp_path.join(latest_version_expected_filename))
                .unwrap();
        assert_eq!(created_expected_last_version, json_sample_0_8);
        let created_expected_modified_0_7 =
            deserialize_json_file::<JsonValue>(&temp_path.join("v0.7.expected.modified.json"))
                .unwrap();
        assert_eq!(
            created_expected_modified_0_7,
            json!({
                "version": GLOBAL_QUICKWIT_RESOURCE_VERSION,
                "field_already_in_0_7": 42,
                // use TestEntity::From<VersionedTestEntity>
                "field_added_in_0_8": 1,
            })
        );

        // assert idempotency
        let test_panic = catch_unwind(|| {
            test_json_backward_compatibility_helper::<TestEntity>(&temp_path.to_string_lossy())
                .unwrap();
        });
        test_panic.unwrap_err();
        let nb_files = fs::read_dir(temp_path).unwrap().count();
        assert_eq!(nb_files, 4 + 3);
    }
}


================================================
FILE: quickwit/quickwit-metastore/src/checkpoint.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::cmp::Ordering;
use std::collections::BTreeMap;
use std::collections::btree_map::Entry;
use std::fmt;
use std::iter::FromIterator;
use std::ops::Range;
use std::sync::Arc;

use quickwit_proto::types::{Position, SourceId};
use serde::ser::SerializeMap;
use serde::{Deserialize, Serialize};
/// Updates running indexing tasks in chitchat cluster state.
use thiserror::Error;
use tracing::{debug, warn};

/// A `PartitionId` uniquely identifies a partition for a given source.
#[derive(Clone, Debug, Default, Eq, PartialEq, Ord, PartialOrd, Serialize, Deserialize, Hash)]
pub struct PartitionId(pub Arc<String>);

impl PartitionId {
    /// Returns the partition ID as a `i64`.
    pub fn as_i64(&self) -> Option<i64> {
        self.0.parse::<i64>().ok()
    }

    /// Returns the partition ID as a `u64`.
    pub fn as_u64(&self) -> Option<u64> {
        self.0.parse().ok()
    }

    pub fn as_str(&self) -> &str {
        &self.0
    }
}

impl fmt::Display for PartitionId {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        write!(f, "{}", &self.0)
    }
}

impl From<String> for PartitionId {
    fn from(partition_id_str: String) -> Self {
        PartitionId(Arc::new(partition_id_str))
    }
}

impl From<&str> for PartitionId {
    fn from(partition_id_str: &str) -> Self {
        PartitionId(Arc::new(partition_id_str.to_string()))
    }
}

impl From<u64> for PartitionId {
    fn from(partition_id: u64) -> Self {
        let partition_id_str = format!("{partition_id:0>20}");
        PartitionId(Arc::new(partition_id_str))
    }
}

impl From<i64> for PartitionId {
    fn from(partition_id: i64) -> Self {
        let partition_id_str = format!("{partition_id:0>20}");
        PartitionId(Arc::new(partition_id_str))
    }
}

/// A partition delta represents an interval (from, to] over a partition of a source.
#[derive(Clone, Debug, Eq, PartialEq, Serialize, Deserialize)]
pub struct PartitionDelta {
    pub from: Position,
    pub to: Position,
}

#[derive(Default, Clone, Eq, PartialEq, Serialize, Deserialize)]
pub struct IndexCheckpoint {
    #[serde(flatten)]
    per_source: BTreeMap<SourceId, SourceCheckpoint>,
}

impl fmt::Debug for IndexCheckpoint {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        let json = serde_json::to_string_pretty(&self).map_err(|_| fmt::Error)?;
        write!(f, "{json}")?;
        Ok(())
    }
}

impl From<BTreeMap<SourceId, SourceCheckpoint>> for IndexCheckpoint {
    fn from(per_source: BTreeMap<SourceId, SourceCheckpoint>) -> Self {
        Self { per_source }
    }
}

impl IndexCheckpoint {
    /// Updates a checkpoint in place. Returns whether the checkpoint was modified.
    ///
    /// If the checkpoint delta is not compatible with the
    /// current checkpoint, an error is returned, and the
    /// checkpoint remains unchanged.
    ///
    /// See [`SourceCheckpoint::try_apply_delta`] for more details.
    pub fn try_apply_delta(
        &mut self,
        delta: IndexCheckpointDelta,
    ) -> Result<bool, IncompatibleCheckpointDelta> {
        if delta.is_empty() {
            return Ok(false);
        }
        self.per_source
            .entry(delta.source_id)
            .or_default()
            .try_apply_delta(delta.source_delta)?;
        Ok(true)
    }

    /// Resets the checkpoint of the source identified by `source_id`. Returns whether a mutation
    /// occurred.
    pub(crate) fn reset_source(&mut self, source_id: &str) -> bool {
        self.per_source.remove(source_id).is_some()
    }

    /// Returns the checkpoint associated with a given source.
    ///
    /// All registered source have an associated checkpoint (that is possibly empty).
    ///
    /// Some non-registered source may also have checkpoint (due to backward compatibility
    /// and the ingest command).
    pub fn source_checkpoint(&self, source_id: &str) -> Option<&SourceCheckpoint> {
        self.per_source.get(source_id)
    }

    /// Adds a new source. If the source was already here, this
    /// method returns successfully and does not override the existing checkpoint.
    pub fn add_source(&mut self, source_id: &str) {
        self.per_source.entry(source_id.to_string()).or_default();
    }

    /// Removes a source.
    /// Returns successfully regardless of whether the source was present or not.
    pub fn remove_source(&mut self, source_id: &str) {
        self.per_source.remove(source_id);
    }

    /// Returns [`true`] if the checkpoint is empty.
    pub fn is_empty(&self) -> bool {
        self.per_source.is_empty()
    }
}

/// A source checkpoint is a map of the last processed position for every partition.
///
/// If a partition is missing, it implicitly means that none of its message
/// has been processed.
#[derive(Default, Clone, Eq, PartialEq)]
pub struct SourceCheckpoint {
    per_partition: BTreeMap<PartitionId, Position>,
}
impl SourceCheckpoint {
    /// Adds a partition to the checkpoint.
    pub fn add_partition(&mut self, partition_id: PartitionId, position: Position) {
        self.per_partition.insert(partition_id, position);
    }

    /// Returns the number of partitions covered by the checkpoint.
    pub fn num_partitions(&self) -> usize {
        self.per_partition.len()
    }

    /// Returns [`true`] if the checkpoint is empty.
    pub fn is_empty(&self) -> bool {
        self.per_partition.is_empty()
    }
}

/// Creates a checkpoint from an iterator of `(PartitionId, Position)` tuples.
/// ```
/// use quickwit_metastore::checkpoint::{SourceCheckpoint, PartitionId};
/// use quickwit_proto::types::Position;
///
/// let checkpoint: SourceCheckpoint = [(0u64, 0u64), (1u64, 2u64)]
///     .into_iter()
///     .map(|(partition_id, offset)| {
///         (PartitionId::from(partition_id), Position::offset(offset))
///     })
///     .collect();
/// ```
impl FromIterator<(PartitionId, Position)> for SourceCheckpoint {
    fn from_iter<I>(iter: I) -> SourceCheckpoint
    where I: IntoIterator<Item = (PartitionId, Position)> {
        SourceCheckpoint {
            per_partition: iter.into_iter().collect(),
        }
    }
}

impl Serialize for SourceCheckpoint {
    fn serialize<S>(&self, serializer: S) -> Result<S::Ok, S::Error>
    where S: serde::Serializer {
        let mut map = serializer.serialize_map(Some(self.per_partition.len()))?;
        for (partition, position) in &self.per_partition {
            map.serialize_entry(&*partition.0, position)?;
        }
        map.end()
    }
}

impl<'de> Deserialize<'de> for SourceCheckpoint {
    fn deserialize<D>(deserializer: D) -> Result<Self, D::Error>
    where D: serde::Deserializer<'de> {
        let string_to_string_map: BTreeMap<String, String> = BTreeMap::deserialize(deserializer)?;
        let per_partition: BTreeMap<PartitionId, Position> = string_to_string_map
            .into_iter()
            .map(|(partition_id, position)| {
                (PartitionId::from(partition_id), Position::from(position))
            })
            .collect();
        Ok(SourceCheckpoint { per_partition })
    }
}

/// Error returned when trying to apply a checkpoint delta to a checkpoint that is not
/// compatible. ie: the checkpoint delta starts from a point anterior to
/// the checkpoint.
#[derive(Clone, Debug, Error, Eq, PartialEq, Serialize, Deserialize)]
#[error(
    "incompatible checkpoint delta at partition `{partition_id}`: end position is \
     `{partition_position:?}` (inclusive), whereas delta starts at `{delta_from_position:?}` \
     (exclusive)"
)]
pub struct IncompatibleCheckpointDelta {
    /// The partition ID for which the incompatibility has been detected.
    pub partition_id: PartitionId,
    /// The current position (inclusive) within this partition.
    pub partition_position: Position,
    /// The start position (exclusive) for the delta.
    pub delta_from_position: Position,
}

#[derive(Clone, Debug, Error, Serialize, Deserialize, PartialEq, Eq)]
pub enum PartitionDeltaError {
    #[error(transparent)]
    IncompatibleCheckpointDelta(#[from] IncompatibleCheckpointDelta),
    #[error(
        "empty or negative delta at partition `{partition_id}`: {from_position:?} >= \
         {to_position:?}"
    )]
    EmptyOrNegativeDelta {
        /// One PartitionId for which the negative delta has been detected.
        partition_id: PartitionId,
        /// Delta from position.
        from_position: Position,
        /// Delta to position.
        to_position: Position,
    },
}

impl SourceCheckpoint {
    /// Returns the position reached for a given partition.
    pub fn position_for_partition(&self, partition_id: &PartitionId) -> Option<&Position> {
        self.per_partition.get(partition_id)
    }

    /// Returns an iterator with the reached position for each partition.
    pub fn iter(&self) -> impl Iterator<Item = (PartitionId, Position)> + '_ {
        self.per_partition
            .iter()
            .map(|(partition_id, position)| (partition_id.clone(), position.clone()))
    }

    pub fn check_compatibility(
        &self,
        delta: &SourceCheckpointDelta,
    ) -> Result<(), IncompatibleCheckpointDelta> {
        for (delta_partition, delta_position) in &delta.per_partition {
            let Some(position) = self.per_partition.get(delta_partition) else {
                continue;
            };
            match position.cmp(&delta_position.from) {
                Ordering::Equal => {}
                Ordering::Less => {
                    warn!(cur_pos=?position, delta_pos_from=?delta_position.from,partition=?delta_partition, "some positions were skipped");
                }
                Ordering::Greater => {
                    return Err(IncompatibleCheckpointDelta {
                        partition_id: delta_partition.clone(),
                        partition_position: position.clone(),
                        delta_from_position: delta_position.from.clone(),
                    });
                }
            }
        }
        Ok(())
    }

    /// Try and apply a delta.
    ///
    /// We accept a delta as long as it comes after the current checkpoint,
    /// for all partitions.
    ///
    /// We accept a delta that is not perfected chained after a checkpoint,
    /// as gaps may happen. For instance, assuming a Kafka source, if the indexing
    /// pipeline is down for more than the retention period.
    ///
    ///   |    Checkpoint & Delta        | Outcome                     |
    ///   |------------------------------|-----------------------------|
    ///   |  (..a] (b..c] with a = b     | Compatible                  |
    ///   |  (..a] (b..c] with b > a     | Compatible                  |
    ///   |  (..a] (b..c] with b < a     | Incompatible                |
    ///
    /// If the delta is incompatible, returns an error without modifying the original checkpoint.
    pub fn try_apply_delta(
        &mut self,
        delta: SourceCheckpointDelta,
    ) -> Result<(), IncompatibleCheckpointDelta> {
        self.check_compatibility(&delta)?;
        debug!(delta=?delta, checkpoint=?self, "applying delta to checkpoint");
        for (partition_id, partition_position) in delta.per_partition {
            self.per_partition
                .insert(partition_id, partition_position.to);
        }
        Ok(())
    }
}

impl fmt::Debug for SourceCheckpoint {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        f.write_str("Ckpt(")?;
        for (i, (partition_id, position)) in self.per_partition.iter().enumerate() {
            f.write_str(&partition_id.0)?;
            f.write_str(":")?;
            write!(f, "{position}")?;
            let is_last = i == self.per_partition.len() - 1;
            if !is_last {
                f.write_str(" ")?;
            }
        }
        f.write_str(")")?;
        Ok(())
    }
}

/// A checkpoint delta represents a checkpoint update.
///
/// It is shipped as part of a split to convey the update
/// that should be applied to the index checkpoint once the split
/// is published.
///
/// The `CheckpointDelta` not only ships for each
/// partition not only a new position, but also an expected
/// `from` position. This makes it possible to defensively check that
/// we are not trying to add documents to the index that were already indexed.
#[derive(Clone, PartialEq, Eq, Serialize, Deserialize)]
pub struct IndexCheckpointDelta {
    pub source_id: SourceId,
    pub source_delta: SourceCheckpointDelta,
}

impl IndexCheckpointDelta {
    pub fn is_empty(&self) -> bool {
        self.source_delta.is_empty()
    }

    #[cfg(any(test, feature = "testsuite"))]
    pub fn for_test(source_id: &str, pos_range: Range<u64>) -> Self {
        Self {
            source_id: source_id.to_string(),
            source_delta: SourceCheckpointDelta::from_range(pos_range),
        }
    }
}

impl fmt::Debug for IndexCheckpointDelta {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        write!(f, "{}:{:?}", &self.source_id, self.source_delta)?;
        Ok(())
    }
}

#[derive(Default, Clone, Eq, PartialEq, Serialize, Deserialize)]
pub struct SourceCheckpointDelta {
    per_partition: BTreeMap<PartitionId, PartitionDelta>,
}

impl fmt::Debug for SourceCheckpointDelta {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        f.write_str("∆(")?;
        for (i, (partition_id, partition_delta)) in self.per_partition.iter().enumerate() {
            write!(
                f,
                "{}:({}..{}]",
                partition_id.0, partition_delta.from, partition_delta.to,
            )?;
            if i != self.per_partition.len() - 1 {
                f.write_str(" ")?;
            }
        }
        f.write_str(")")?;
        Ok(())
    }
}

impl TryFrom<Range<u64>> for SourceCheckpointDelta {
    type Error = PartitionDeltaError;

    fn try_from(range: Range<u64>) -> Result<Self, Self::Error> {
        // Checkpoint delta are expressed as (from, to] intervals while ranges
        // are [start, end) intervals
        let from_position = if range.start == 0 {
            Position::Beginning
        } else {
            Position::offset(range.start - 1)
        };
        let to_position = if range.end == 0 {
            Position::Beginning
        } else {
            Position::offset(range.end - 1)
        };
        SourceCheckpointDelta::from_partition_delta(
            PartitionId::default(),
            from_position,
            to_position,
        )
    }
}

impl SourceCheckpointDelta {
    /// Used for tests only.
    /// Panics if the range is not strictly increasing.
    #[cfg(any(test, feature = "testsuite"))]
    pub fn from_range(range: Range<u64>) -> Self {
        SourceCheckpointDelta::try_from(range).expect("Invalid position range")
    }

    /// Creates a new checkpoint delta initialized with a single partition delta.
    pub fn from_partition_delta(
        partition_id: PartitionId,
        from_position: Position,
        to_position: Position,
    ) -> Result<Self, PartitionDeltaError> {
        let mut delta = SourceCheckpointDelta::default();
        delta.record_partition_delta(partition_id, from_position, to_position)?;
        Ok(delta)
    }

    /// Returns the checkpoint associated with the endpoint of the delta.
    pub fn get_source_checkpoint(&self) -> SourceCheckpoint {
        let mut source_checkpoint = SourceCheckpoint::default();
        source_checkpoint.try_apply_delta(self.clone()).unwrap();
        source_checkpoint
    }

    /// Returns an iterator of partition IDs and associated deltas.
    pub fn iter(&self) -> impl Iterator<Item = (PartitionId, PartitionDelta)> + '_ {
        self.per_partition
            .iter()
            .map(|(partition_id, partition_delta)| (partition_id.clone(), partition_delta.clone()))
    }

    /// Records a `(from, to]` partition delta for a given partition.
    pub fn record_partition_delta(
        &mut self,
        partition_id: PartitionId,
        from_position: Position,
        to_position: Position,
    ) -> Result<(), PartitionDeltaError> {
        // `from_position == to_position` means delta is empty.
        if from_position >= to_position {
            return Err(PartitionDeltaError::EmptyOrNegativeDelta {
                partition_id,
                from_position,
                to_position,
            });
        }
        let entry = self.per_partition.entry(partition_id);
        match entry {
            Entry::Occupied(mut occupied_entry) => {
                if occupied_entry.get().to == from_position {
                    occupied_entry.get_mut().to = to_position;
                } else {
                    return Err(PartitionDeltaError::from(IncompatibleCheckpointDelta {
                        partition_id: occupied_entry.key().clone(),
                        partition_position: occupied_entry.get().to.clone(),
                        delta_from_position: from_position,
                    }));
                }
            }
            Entry::Vacant(vacant_entry) => {
                let partition_delta = PartitionDelta {
                    from: from_position,
                    to: to_position,
                };
                vacant_entry.insert(partition_delta);
            }
        }
        Ok(())
    }

    /// Extends the current checkpoint delta in-place with the provided checkpoint delta.
    ///
    /// Contrary to checkpoint update, the two deltas here need to chain perfectly.
    pub fn extend(&mut self, delta: SourceCheckpointDelta) -> Result<(), PartitionDeltaError> {
        for (partition_id, partition_delta) in delta.per_partition {
            self.record_partition_delta(partition_id, partition_delta.from, partition_delta.to)?;
        }
        Ok(())
    }

    /// Returns the number of partitions covered by the checkpoint delta.
    pub fn num_partitions(&self) -> usize {
        self.per_partition.len()
    }

    /// Returns an iterator over the partition_ids.
    pub fn partitions(&self) -> impl Iterator<Item = &PartitionId> {
        self.per_partition.keys()
    }

    /// Returns `true` if the checkpoint delta is empty.
    pub fn is_empty(&self) -> bool {
        self.per_partition.is_empty()
    }
}

#[cfg(test)]
mod tests {
    use super::*;

    #[test]
    fn test_delta_from_range() {
        let checkpoint_delta = SourceCheckpointDelta::from_range(0..3);
        assert_eq!(
            format!("{checkpoint_delta:?}"),
            "∆(:(..00000000000000000002])"
        );
        let checkpoint_delta = SourceCheckpointDelta::from_range(1..4);
        assert_eq!(
            format!("{checkpoint_delta:?}"),
            "∆(:(00000000000000000000..00000000000000000003])"
        );
    }

    #[test]
    fn test_checkpoint_simple() {
        let mut checkpoint = SourceCheckpoint::default();
        assert_eq!(format!("{checkpoint:?}"), "Ckpt()");

        let delta = {
            let mut delta = SourceCheckpointDelta::from_partition_delta(
                PartitionId::from("a"),
                Position::offset(123u64),
                Position::offset(128u64),
            )
            .unwrap();
            delta
                .record_partition_delta(
                    PartitionId::from("b"),
                    Position::offset(60002u64),
                    Position::offset(60187u64),
                )
                .unwrap();
            delta
        };
        checkpoint.try_apply_delta(delta.clone()).unwrap();
        assert_eq!(
            format!("{checkpoint:?}"),
            "Ckpt(a:00000000000000000128 b:00000000000000060187)"
        );
        // `try_apply_delta` is not idempotent.
        checkpoint.try_apply_delta(delta).unwrap_err();
        assert_eq!(
            format!("{checkpoint:?}"),
            "Ckpt(a:00000000000000000128 b:00000000000000060187)"
        );
    }

    #[test]
    fn test_partially_incompatible_does_not_update() -> anyhow::Result<()> {
        let mut checkpoint = SourceCheckpoint::default();
        let delta1 = {
            let mut delta = SourceCheckpointDelta::from_partition_delta(
                PartitionId::from("a"),
                Position::offset("00123"),
                Position::offset("00128"),
            )
            .unwrap();
            delta.record_partition_delta(
                PartitionId::from("b"),
                Position::offset("60002"),
                Position::offset("60187"),
            )?;
            delta
        };
        assert!(checkpoint.try_apply_delta(delta1).is_ok());
        let delta2 = {
            let mut delta = SourceCheckpointDelta::from_partition_delta(
                PartitionId::from("a"),
                Position::offset("00128"),
                Position::offset("00129"),
            )
            .unwrap();
            delta.record_partition_delta(
                PartitionId::from("b"),
                Position::offset("50099"),
                Position::offset("60002"),
            )?;
            delta
        };
        assert!(matches!(
            checkpoint.try_apply_delta(delta2),
            Err(IncompatibleCheckpointDelta { .. })
        ));
        // checkpoint was unchanged
        assert_eq!(format!("{checkpoint:?}"), "Ckpt(a:00128 b:60187)");
        Ok(())
    }

    #[test]
    fn test_adding_new_partition() -> anyhow::Result<()> {
        let mut checkpoint = SourceCheckpoint::default();
        let delta1 = {
            let mut delta = SourceCheckpointDelta::from_partition_delta(
                PartitionId::from("a"),
                Position::offset("00123"),
                Position::offset("00128"),
            )
            .unwrap();
            delta.record_partition_delta(
                PartitionId::from("b"),
                Position::offset("60002"),
                Position::offset("60187"),
            )?;
            delta
        };
        assert!(checkpoint.try_apply_delta(delta1).is_ok());
        let delta3 = {
            let mut delta = SourceCheckpointDelta::from_partition_delta(
                PartitionId::from("b"),
                Position::offset("60187"),
                Position::offset("60190"),
            )
            .unwrap();
            delta.record_partition_delta(
                PartitionId::from("c"),
                Position::offset("20001"),
                Position::offset("20008"),
            )?;
            delta
        };
        assert!(checkpoint.try_apply_delta(delta3).is_ok());
        assert_eq!(format!("{checkpoint:?}"), "Ckpt(a:00128 b:60190 c:20008)");
        Ok(())
    }

    #[test]
    fn test_extend_checkpoint_delta() {
        let mut delta1 = {
            let mut delta = SourceCheckpointDelta::from_partition_delta(
                PartitionId::from("a"),
                Position::offset("00123"),
                Position::offset("00128"),
            )
            .unwrap();
            delta
                .record_partition_delta(
                    PartitionId::from("b"),
                    Position::offset("60002"),
                    Position::offset("60187"),
                )
                .unwrap();
            delta
        };
        let delta2 = {
            let mut delta = SourceCheckpointDelta::from_partition_delta(
                PartitionId::from("b"),
                Position::offset("60187"),
                Position::offset("60348"),
            )
            .unwrap();
            delta
                .record_partition_delta(
                    PartitionId::from("c"),
                    Position::offset("20001"),
                    Position::offset("20008"),
                )
                .unwrap();
            delta
        };
        let delta3 = {
            let mut delta = SourceCheckpointDelta::from_partition_delta(
                PartitionId::from("a"),
                Position::offset("00123"),
                Position::offset("00128"),
            )
            .unwrap();
            delta
                .record_partition_delta(
                    PartitionId::from("b"),
                    Position::offset("60002"),
                    Position::offset("60348"),
                )
                .unwrap();
            delta
                .record_partition_delta(
                    PartitionId::from("c"),
                    Position::offset("20001"),
                    Position::offset("20008"),
                )
                .unwrap();
            delta
        };
        delta1.extend(delta2).unwrap();
        assert_eq!(delta1, delta3);

        let delta4 = SourceCheckpointDelta::from_partition_delta(
            PartitionId::from("a"),
            Position::offset("00130"),
            Position::offset("00142"),
        )
        .unwrap();
        let result = delta1.extend(delta4);
        assert_eq!(
            result,
            Err(PartitionDeltaError::from(IncompatibleCheckpointDelta {
                partition_id: PartitionId::from("a"),
                partition_position: Position::offset("00128"),
                delta_from_position: Position::offset("00130")
            }))
        );
    }

    #[test]
    fn test_record_negative_partition_delta_is_failing() {
        {
            let delta_error = SourceCheckpointDelta::from_partition_delta(
                PartitionId::from("a"),
                Position::offset("20"),
                Position::offset("20"),
            )
            .unwrap_err();
            matches!(
                delta_error,
                PartitionDeltaError::EmptyOrNegativeDelta { .. }
            );
        }
        {
            let mut delta = SourceCheckpointDelta::from_range(10..20);
            let delta_error = delta
                .record_partition_delta(
                    PartitionId::from("a"),
                    Position::offset("20"),
                    Position::offset("10"),
                )
                .unwrap_err();
            matches!(
                delta_error,
                PartitionDeltaError::EmptyOrNegativeDelta { .. }
            );
        }
    }

    #[test]
    fn test_index_checkpoint() {
        let mut index_checkpoint = IndexCheckpoint::default();
        assert!(
            index_checkpoint
                .source_checkpoint("missing_source")
                .is_none()
        );
        index_checkpoint.add_source("existing_source_with_empty_checkpoint");
        assert!(
            index_checkpoint
                .source_checkpoint("existing_source_with_empty_checkpoint")
                .is_some()
        );
        index_checkpoint.remove_source("missing_source"); //< we just check this does not fail
        assert!(
            index_checkpoint
                .source_checkpoint("missing_source")
                .is_none()
        );
        assert!(
            index_checkpoint
                .source_checkpoint("existing_source_with_empty_checkpoint")
                .is_some()
        );
        index_checkpoint.remove_source("existing_source_with_empty_checkpoint"); //< we just check this does not fail
        assert!(
            index_checkpoint
                .source_checkpoint("existing_source_with_empty_checkpoint")
                .is_none()
        );
    }

    #[test]
    fn test_get_source_checkpoint() {
        let partition = PartitionId::from("a");
        let delta = SourceCheckpointDelta::from_partition_delta(
            partition.clone(),
            Position::offset(42u64),
            Position::offset(43u64),
        )
        .unwrap();
        let checkpoint: SourceCheckpoint = delta.get_source_checkpoint();
        assert_eq!(
            checkpoint.position_for_partition(&partition).unwrap(),
            &Position::offset(43u64)
        );
    }
}


================================================
FILE: quickwit/quickwit-metastore/src/error.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use quickwit_proto::metastore::MetastoreError;

/// Generic Storage Resolver error.
#[derive(Debug, thiserror::Error)]
pub enum MetastoreResolverError {
    /// The metastore config is invalid.
    #[error("invalid metastore config: `{0}`")]
    InvalidConfig(String),

    /// The URI does not contain sufficient information to connect to the metastore.
    #[error("invalid metastore URI: `{0}`")]
    InvalidUri(String),

    /// The requested backend is unsupported or unavailable.
    #[error("unsupported metastore backend: `{0}`")]
    UnsupportedBackend(String),

    /// The config and URI are valid, and are meant to be handled by this resolver, but the
    /// resolver failed to actually connect to the backend. e.g. connection error, credentials
    /// error, incompatible version, internal error in a third party, etc.
    #[error("failed to connect to metastore: `{0}`")]
    Initialization(#[from] MetastoreError),
}


================================================
FILE: quickwit/quickwit-metastore/src/lib.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#![warn(missing_docs)]
#![allow(clippy::bool_assert_comparison)]
#![deny(clippy::disallowed_methods)]
#![allow(rustdoc::invalid_html_tags)]

//! `quickwit-metastore` is the abstraction used in Quickwit to interface itself to different
//! metastore:
//! - file-backed metastore
//! - PostgreSQL metastore
//! - etc.

#[allow(missing_docs)]
pub mod checkpoint;
mod error;
mod metastore;
mod metastore_factory;
mod metastore_resolver;
mod split_metadata;
mod split_metadata_version;
#[cfg(test)]
pub(crate) mod tests;

use std::ops::Range;

pub use error::MetastoreResolverError;
pub use metastore::control_plane_metastore::ControlPlaneMetastore;
pub use metastore::file_backed::FileBackedMetastore;
pub(crate) use metastore::index_metadata::serialize::{IndexMetadataV0_8, VersionedIndexMetadata};
#[cfg(feature = "postgres")]
pub use metastore::postgres::PostgresqlMetastore;
pub use metastore::{
    AddSourceRequestExt, CreateIndexRequestExt, CreateIndexResponseExt, IndexMetadata,
    IndexMetadataResponseExt, IndexesMetadataResponseExt, ListIndexesMetadataResponseExt,
    ListSplitsQuery, ListSplitsRequestExt, ListSplitsResponseExt, MetastoreServiceExt,
    MetastoreServiceStreamSplitsExt, PublishSplitsRequestExt, StageSplitsRequestExt,
    UpdateIndexRequestExt, UpdateSourceRequestExt, file_backed,
};
pub use metastore_factory::{MetastoreFactory, UnsupportedMetastore};
pub use metastore_resolver::MetastoreResolver;
use quickwit_common::is_disjoint;
use quickwit_doc_mapper::tag_pruning::TagFilterAst;
pub use split_metadata::{Split, SplitInfo, SplitMaturity, SplitMetadata, SplitState};
pub(crate) use split_metadata_version::{SplitMetadataV0_8, VersionedSplitMetadata};

#[derive(utoipa::OpenApi)]
#[openapi(components(schemas(
    IndexMetadataV0_8,
    Split,
    SplitMetadataV0_8,
    SplitState,
    VersionedIndexMetadata,
    VersionedSplitMetadata,
)))]
/// Schema used for the OpenAPI generation which are apart of this crate.
pub struct MetastoreApiSchemas;

/// Returns `true` if the split time range is included in `time_range_opt`.
/// If `time_range_opt` is None, returns always true.
pub fn split_time_range_filter(
    split_metadata: &SplitMetadata,
    time_range_opt: Option<&Range<i64>>,
) -> bool {
    match (time_range_opt, split_metadata.time_range.as_ref()) {
        (Some(filter_time_range), Some(split_time_range)) => {
            !is_disjoint(filter_time_range, split_time_range)
        }
        _ => true, // Return `true` if `time_range` is omitted or the split has no time range.
    }
}
/// Returns `true` if the tags filter evaluation is true.
/// If `tags_filter_opt` is None, returns always true.
pub fn split_tag_filter(
    split_metadata: &SplitMetadata,
    tags_filter_opt: Option<&TagFilterAst>,
) -> bool {
    tags_filter_opt
        .map(|tags_filter_ast| tags_filter_ast.evaluate(&split_metadata.tags))
        .unwrap_or(true)
}

#[cfg(test)]
mod backward_compatibility_tests;

#[cfg(any(test, feature = "testsuite"))]
/// Returns a metastore backed by an "in-memory file" for testing.
pub fn metastore_for_test() -> quickwit_proto::metastore::MetastoreServiceClient {
    quickwit_proto::metastore::MetastoreServiceClient::new(FileBackedMetastore::for_test(
        std::sync::Arc::new(quickwit_storage::RamStorage::default()),
    ))
}


================================================
FILE: quickwit/quickwit-metastore/src/metastore/control_plane_metastore.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::fmt;

use async_trait::async_trait;
use quickwit_common::uri::Uri;
use quickwit_proto::control_plane::{ControlPlaneService, ControlPlaneServiceClient};
use quickwit_proto::metastore::{
    AcquireShardsRequest, AcquireShardsResponse, AddSourceRequest, CreateIndexRequest,
    CreateIndexResponse, CreateIndexTemplateRequest, DeleteIndexRequest,
    DeleteIndexTemplatesRequest, DeleteQuery, DeleteShardsRequest, DeleteShardsResponse,
    DeleteSourceRequest, DeleteSplitsRequest, DeleteTask, EmptyResponse,
    FindIndexTemplateMatchesRequest, FindIndexTemplateMatchesResponse, GetClusterIdentityRequest,
    GetClusterIdentityResponse, GetIndexTemplateRequest, GetIndexTemplateResponse,
    IndexMetadataRequest, IndexMetadataResponse, IndexesMetadataRequest, IndexesMetadataResponse,
    LastDeleteOpstampRequest, LastDeleteOpstampResponse, ListDeleteTasksRequest,
    ListDeleteTasksResponse, ListIndexStatsRequest, ListIndexStatsResponse,
    ListIndexTemplatesRequest, ListIndexTemplatesResponse, ListIndexesMetadataRequest,
    ListIndexesMetadataResponse, ListShardsRequest, ListShardsResponse, ListSplitsRequest,
    ListSplitsResponse, ListStaleSplitsRequest, MarkSplitsForDeletionRequest, MetastoreResult,
    MetastoreService, MetastoreServiceClient, MetastoreServiceStream, OpenShardsRequest,
    OpenShardsResponse, PruneShardsRequest, PublishSplitsRequest, ResetSourceCheckpointRequest,
    StageSplitsRequest, ToggleSourceRequest, UpdateIndexRequest, UpdateSourceRequest,
    UpdateSplitsDeleteOpstampRequest, UpdateSplitsDeleteOpstampResponse,
};

/// A [`MetastoreService`] implementation that proxies some requests to the control plane so it can
/// track the state of the metastore accurately and react to events in real-time.
#[derive(Clone)]
pub struct ControlPlaneMetastore {
    control_plane: ControlPlaneServiceClient,
    metastore: MetastoreServiceClient,
}

impl fmt::Debug for ControlPlaneMetastore {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        f.debug_struct("ControlPlaneMetastore").finish()
    }
}

impl ControlPlaneMetastore {
    /// Creates a new [`ControlPlaneMetastore`].
    pub fn new(
        control_plane: ControlPlaneServiceClient,
        metastore: MetastoreServiceClient,
    ) -> Self {
        Self {
            control_plane,
            metastore,
        }
    }
}

#[async_trait]
impl MetastoreService for ControlPlaneMetastore {
    fn endpoints(&self) -> Vec<Uri> {
        self.metastore.endpoints()
    }

    async fn check_connectivity(&self) -> anyhow::Result<()> {
        self.metastore.check_connectivity().await
    }

    // Proxied metastore API calls.

    async fn create_index(
        &self,
        request: CreateIndexRequest,
    ) -> MetastoreResult<CreateIndexResponse> {
        let response = self.control_plane.create_index(request).await?;
        Ok(response)
    }

    async fn update_index(
        &self,
        request: UpdateIndexRequest,
    ) -> MetastoreResult<IndexMetadataResponse> {
        let response = self.control_plane.update_index(request).await?;
        Ok(response)
    }

    async fn delete_index(&self, request: DeleteIndexRequest) -> MetastoreResult<EmptyResponse> {
        let response = self.control_plane.delete_index(request).await?;
        Ok(response)
    }

    async fn add_source(&self, request: AddSourceRequest) -> MetastoreResult<EmptyResponse> {
        let response = self.control_plane.add_source(request).await?;
        Ok(response)
    }

    async fn update_source(&self, request: UpdateSourceRequest) -> MetastoreResult<EmptyResponse> {
        let response = self.control_plane.update_source(request).await?;
        Ok(response)
    }

    async fn toggle_source(&self, request: ToggleSourceRequest) -> MetastoreResult<EmptyResponse> {
        let response = self.control_plane.toggle_source(request).await?;
        Ok(response)
    }

    async fn delete_source(&self, request: DeleteSourceRequest) -> MetastoreResult<EmptyResponse> {
        let response = self.control_plane.delete_source(request).await?;
        Ok(response)
    }

    // Proxy through the control plane to debounce queries
    async fn prune_shards(&self, request: PruneShardsRequest) -> MetastoreResult<EmptyResponse> {
        self.control_plane.prune_shards(request).await?;
        Ok(EmptyResponse {})
    }

    // Other metastore API calls.

    async fn index_metadata(
        &self,
        request: IndexMetadataRequest,
    ) -> MetastoreResult<IndexMetadataResponse> {
        self.metastore.index_metadata(request).await
    }

    async fn indexes_metadata(
        &self,
        request: IndexesMetadataRequest,
    ) -> MetastoreResult<IndexesMetadataResponse> {
        self.metastore.indexes_metadata(request).await
    }

    async fn list_indexes_metadata(
        &self,
        request: ListIndexesMetadataRequest,
    ) -> MetastoreResult<ListIndexesMetadataResponse> {
        self.metastore.list_indexes_metadata(request).await
    }

    async fn stage_splits(&self, request: StageSplitsRequest) -> MetastoreResult<EmptyResponse> {
        self.metastore.stage_splits(request).await
    }

    async fn publish_splits(
        &self,
        request: PublishSplitsRequest,
    ) -> MetastoreResult<EmptyResponse> {
        self.metastore.publish_splits(request).await
    }

    async fn list_splits(
        &self,
        request: ListSplitsRequest,
    ) -> MetastoreResult<MetastoreServiceStream<ListSplitsResponse>> {
        self.metastore.list_splits(request).await
    }

    async fn list_index_stats(
        &self,
        request: ListIndexStatsRequest,
    ) -> MetastoreResult<ListIndexStatsResponse> {
        self.metastore.list_index_stats(request).await
    }

    async fn list_stale_splits(
        &self,
        request: ListStaleSplitsRequest,
    ) -> MetastoreResult<ListSplitsResponse> {
        self.metastore.list_stale_splits(request).await
    }

    async fn mark_splits_for_deletion(
        &self,
        request: MarkSplitsForDeletionRequest,
    ) -> MetastoreResult<EmptyResponse> {
        self.metastore.mark_splits_for_deletion(request).await
    }

    async fn delete_splits(&self, request: DeleteSplitsRequest) -> MetastoreResult<EmptyResponse> {
        self.metastore.delete_splits(request).await
    }

    async fn reset_source_checkpoint(
        &self,
        request: ResetSourceCheckpointRequest,
    ) -> MetastoreResult<EmptyResponse> {
        self.metastore.reset_source_checkpoint(request).await
    }

    // Delete tasks API

    async fn create_delete_task(&self, delete_query: DeleteQuery) -> MetastoreResult<DeleteTask> {
        self.metastore.create_delete_task(delete_query).await
    }

    async fn last_delete_opstamp(
        &self,
        request: LastDeleteOpstampRequest,
    ) -> MetastoreResult<LastDeleteOpstampResponse> {
        self.metastore.last_delete_opstamp(request).await
    }

    async fn update_splits_delete_opstamp(
        &self,
        request: UpdateSplitsDeleteOpstampRequest,
    ) -> MetastoreResult<UpdateSplitsDeleteOpstampResponse> {
        self.metastore.update_splits_delete_opstamp(request).await
    }

    async fn list_delete_tasks(
        &self,
        request: ListDeleteTasksRequest,
    ) -> MetastoreResult<ListDeleteTasksResponse> {
        self.metastore.list_delete_tasks(request).await
    }

    // Shard API

    async fn open_shards(&self, request: OpenShardsRequest) -> MetastoreResult<OpenShardsResponse> {
        self.metastore.open_shards(request).await
    }

    async fn acquire_shards(
        &self,
        request: AcquireShardsRequest,
    ) -> MetastoreResult<AcquireShardsResponse> {
        self.metastore.acquire_shards(request).await
    }

    async fn list_shards(&self, request: ListShardsRequest) -> MetastoreResult<ListShardsResponse> {
        self.metastore.list_shards(request).await
    }

    async fn delete_shards(
        &self,
        request: DeleteShardsRequest,
    ) -> MetastoreResult<DeleteShardsResponse> {
        self.metastore.delete_shards(request).await
    }

    // Index Template API

    async fn create_index_template(
        &self,
        request: CreateIndexTemplateRequest,
    ) -> MetastoreResult<EmptyResponse> {
        self.metastore.create_index_template(request).await
    }

    async fn get_index_template(
        &self,
        request: GetIndexTemplateRequest,
    ) -> MetastoreResult<GetIndexTemplateResponse> {
        self.metastore.get_index_template(request).await
    }

    async fn find_index_template_matches(
        &self,
        request: FindIndexTemplateMatchesRequest,
    ) -> MetastoreResult<FindIndexTemplateMatchesResponse> {
        self.metastore.find_index_template_matches(request).await
    }

    async fn list_index_templates(
        &self,
        request: ListIndexTemplatesRequest,
    ) -> MetastoreResult<ListIndexTemplatesResponse> {
        self.metastore.list_index_templates(request).await
    }

    async fn delete_index_templates(
        &self,
        request: DeleteIndexTemplatesRequest,
    ) -> MetastoreResult<EmptyResponse> {
        self.metastore.delete_index_templates(request).await
    }

    async fn get_cluster_identity(
        &self,
        request: GetClusterIdentityRequest,
    ) -> MetastoreResult<GetClusterIdentityResponse> {
        self.metastore.get_cluster_identity(request).await
    }
}


================================================
FILE: quickwit/quickwit-metastore/src/metastore/file_backed/file_backed_index/mod.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

//! [`FileBackedIndex`] module. It is public so that the crate `quickwit-backward-compat` can
//! import [`FileBackedIndex`] and run backward-compatibility tests. You should not have to import
//! anything from here directly.

mod serialize;
mod shards;

use std::collections::HashMap;
use std::fmt::Debug;
use std::ops::Bound;

use itertools::Itertools;
use quickwit_common::pretty::PrettySample;
use quickwit_config::{
    DocMapping, IndexingSettings, IngestSettings, RetentionPolicy, SearchSettings, SourceConfig,
};
use quickwit_proto::metastore::{
    AcquireShardsRequest, AcquireShardsResponse, DeleteQuery, DeleteShardsRequest,
    DeleteShardsResponse, DeleteTask, EntityKind, IndexStats, ListShardsSubrequest,
    ListShardsSubresponse, MetastoreError, MetastoreResult, OpenShardSubrequest,
    OpenShardSubresponse, PruneShardsRequest, SplitStats,
};
use quickwit_proto::types::{IndexUid, PublishToken, SourceId, SplitId};
use serde::{Deserialize, Serialize};
use serialize::VersionedFileBackedIndex;
use shards::Shards;
use time::OffsetDateTime;
use tracing::{info, warn};

use super::MutationOccurred;
use crate::checkpoint::IndexCheckpointDelta;
use crate::metastore::{SortBy, use_shard_api};
use crate::{IndexMetadata, ListSplitsQuery, Split, SplitMetadata, SplitState, split_tag_filter};

/// A `FileBackedIndex` object carries an index metadata and its split metadata.
// This struct is meant to be used only within the [`FileBackedMetastore`]. The public visibility is
#[derive(Clone, Debug, Serialize, Deserialize)]
#[serde(into = "VersionedFileBackedIndex")]
#[serde(from = "VersionedFileBackedIndex")]
pub(crate) struct FileBackedIndex {
    /// Metadata specific to the index.
    metadata: IndexMetadata,
    /// List of splits belonging to the index.
    splits: HashMap<SplitId, Split>,
    /// Shards of each source.
    per_source_shards: HashMap<SourceId, Shards>,
    /// Delete tasks.
    delete_tasks: Vec<DeleteTask>,
    /// Stamper.
    stamper: Stamper,
    /// Flag used to avoid polling the metastore if
    /// the process is actually writing the metastore.
    ///
    /// The logic is "soft". We avoid the polling step
    /// if the metastore wrote some value since the last
    /// polling loop.
    recently_modified: bool,
    /// Has been discarded. This field exists to make
    /// it possible to discard this entry if there is an error
    /// while mutating the Index.
    pub discarded: bool,
}

#[cfg(any(test, feature = "testsuite"))]
impl quickwit_config::TestableForRegression for FileBackedIndex {
    fn sample_for_regression() -> Self {
        use quickwit_config::INGEST_V2_SOURCE_ID;
        use quickwit_proto::ingest::{Shard, ShardState};
        use quickwit_proto::types::{DocMappingUid, Position, ShardId};

        let index_metadata = IndexMetadata::sample_for_regression();
        let index_uid = index_metadata.index_uid.clone();
        let source_id = INGEST_V2_SOURCE_ID.to_string();

        let split_metadata = SplitMetadata::sample_for_regression();
        let split = Split {
            split_state: SplitState::Published,
            split_metadata,
            update_timestamp: 1789,
            publish_timestamp: Some(1789),
        };
        let splits = vec![split];

        let shard = Shard {
            index_uid: index_uid.clone().into(),
            source_id: source_id.clone(),
            shard_id: Some(ShardId::from(1)),
            shard_state: ShardState::Open as i32,
            leader_id: "leader-ingester".to_string(),
            follower_id: Some("follower-ingester".to_string()),
            doc_mapping_uid: Some(DocMappingUid::for_test(1)),
            publish_position_inclusive: Some(Position::Beginning),
            update_timestamp: 1724240908,
            ..Default::default()
        };
        let shards = Shards::from_shards_vec(index_uid.clone(), source_id.clone(), vec![shard]);
        let per_source_shards = HashMap::from_iter([(source_id, shards)]);

        let delete_task = DeleteTask {
            create_timestamp: 0,
            opstamp: 10,
            delete_query: Some(DeleteQuery {
                index_uid: index_uid.into(),
                start_timestamp: None,
                end_timestamp: None,
                query_ast: quickwit_query::query_ast::qast_json_helper("Harry Potter", &["body"]),
            }),
        };
        let delete_tasks = vec![delete_task];
        FileBackedIndex::new(index_metadata, splits, per_source_shards, delete_tasks)
    }

    fn assert_equality(&self, other: &Self) {
        self.metadata().assert_equality(other.metadata());
        assert_eq!(self.splits, other.splits);
        assert_eq!(self.per_source_shards, other.per_source_shards);
        assert_eq!(self.delete_tasks, other.delete_tasks);
    }
}

impl From<IndexMetadata> for FileBackedIndex {
    fn from(index_metadata: IndexMetadata) -> Self {
        let per_source_shards = index_metadata
            .sources
            .keys()
            .map(|source_id| {
                let shards = Shards::empty(index_metadata.index_uid.clone(), source_id.clone());
                (source_id.clone(), shards)
            })
            .collect();

        Self {
            metadata: index_metadata,
            splits: Default::default(),
            per_source_shards,
            delete_tasks: Default::default(),
            stamper: Default::default(),
            recently_modified: false,
            discarded: false,
        }
    }
}

enum DeleteSplitOutcome {
    Success,
    SplitNotFound,
    // The split is in another state than marked for deletion.
    Forbidden,
}

impl FileBackedIndex {
    /// Constructor.
    pub fn new(
        metadata: IndexMetadata,
        splits: Vec<Split>,
        per_source_shards: HashMap<SourceId, Shards>,
        delete_tasks: Vec<DeleteTask>,
    ) -> Self {
        let last_opstamp = delete_tasks
            .iter()
            .map(|delete_task| delete_task.opstamp)
            .max()
            .unwrap_or(0) as usize;
        let splits = splits
            .into_iter()
            .map(|split| (split.split_id().to_string(), split))
            .collect();
        Self {
            metadata,
            splits,
            per_source_shards,
            delete_tasks,
            stamper: Stamper::new(last_opstamp),
            recently_modified: false,
            discarded: false,
        }
    }

    /// Sets the `recently_modified` flag to false and returns the previous value.
    pub fn flip_recently_modified_down(&mut self) -> bool {
        std::mem::replace(&mut self.recently_modified, false)
    }

    /// Marks the file as `recently_modified`.
    pub fn set_recently_modified(&mut self) {
        self.recently_modified = true;
    }

    /// Index ID accessor.
    pub fn index_id(&self) -> &str {
        self.metadata.index_id()
    }

    /// Index UID accessor.
    pub fn index_uid(&self) -> &IndexUid {
        &self.metadata.index_uid
    }

    /// Index metadata accessor.
    pub fn metadata(&self) -> &IndexMetadata {
        &self.metadata
    }

    pub fn update_index_config(
        &mut self,
        doc_mapping: DocMapping,
        indexing_settings: IndexingSettings,
        ingest_settings: IngestSettings,
        search_settings: SearchSettings,
        retention_policy_opt: Option<RetentionPolicy>,
    ) -> MetastoreResult<bool> {
        self.metadata.update_index_config(
            doc_mapping,
            indexing_settings,
            ingest_settings,
            search_settings,
            retention_policy_opt,
        )
    }

    /// Stages a single split.
    ///
    /// If a split already exists and is in the [SplitState::Staged] state,
    /// it is simply updated/overwritten.
    ///
    /// If a split already exists and is *not* in the [SplitState::Staged] state, a
    /// [MetastoreError::NotFound] error is returned providing the split ID to go with
    /// it.
    pub(crate) fn stage_split(
        &mut self,
        split_metadata: SplitMetadata,
    ) -> Result<(), MetastoreError> {
        // Check whether the split exists.
        // If the split exists, we check what state it is in. If it's anything other than `Staged`
        // something has gone very wrong and we should abort the operation.
        if let Some(split) = self.splits.get(split_metadata.split_id())
            && split.split_state != SplitState::Staged
        {
            let entity = EntityKind::Split {
                split_id: split.split_id().to_string(),
            };
            let message = "split is not staged".to_string();
            return Err(MetastoreError::FailedPrecondition { entity, message });
        }
        let now_timestamp = OffsetDateTime::now_utc().unix_timestamp();
        let split = Split {
            split_state: SplitState::Staged,
            update_timestamp: now_timestamp,
            publish_timestamp: None,
            split_metadata,
        };
        self.splits.insert(split.split_id().to_string(), split);
        Ok(())
    }

    /// Marks the splits for deletion. Returns whether a mutation occurred.
    pub(crate) fn mark_splits_for_deletion(
        &mut self,
        split_ids: impl IntoIterator<Item = impl AsRef<str>>,
        deletable_split_states: &[SplitState],
        return_error_on_splits_not_found: bool,
    ) -> MetastoreResult<bool> {
        let mut mutation_occurred = false;
        let mut split_not_found_ids = Vec::new();
        let mut non_deletable_split_ids = Vec::new();
        let now_timestamp = OffsetDateTime::now_utc().unix_timestamp();

        for split_id in split_ids {
            let split_id_ref = split_id.as_ref();
            // Check for the existence of split.
            let metadata = match self.splits.get_mut(split_id_ref) {
                Some(metadata) => metadata,
                None => {
                    split_not_found_ids.push(split_id_ref.to_string());
                    continue;
                }
            };
            if !deletable_split_states.contains(&metadata.split_state) {
                non_deletable_split_ids.push(split_id_ref.to_string());
                continue;
            };
            if metadata.split_state == SplitState::MarkedForDeletion {
                // If the split is already marked for deletion, This is fine, we just skip it.
                continue;
            }
            metadata.split_state = SplitState::MarkedForDeletion;
            metadata.update_timestamp = now_timestamp;
            mutation_occurred = true;
        }
        if !split_not_found_ids.is_empty() {
            if return_error_on_splits_not_found {
                return Err(MetastoreError::NotFound(EntityKind::Splits {
                    split_ids: split_not_found_ids,
                }));
            } else {
                warn!(
                    index_id=%self.index_id(),
                    split_ids=?PrettySample::new(&split_not_found_ids, 5),
                    "{} splits were not found and could not be marked for deletion.",
                    split_not_found_ids.len()
                );
            }
        }
        if !non_deletable_split_ids.is_empty() {
            let entity = EntityKind::Splits {
                split_ids: non_deletable_split_ids,
            };
            let message = "splits are not deletable".to_string();
            return Err(MetastoreError::FailedPrecondition { entity, message });
        }
        Ok(mutation_occurred)
    }

    /// Helper to mark a list of splits as published.
    /// This function however does not update the checkpoint.
    fn mark_splits_as_published_helper(
        &mut self,
        staged_split_ids: impl IntoIterator<Item = impl AsRef<str>>,
    ) -> MetastoreResult<()> {
        let mut split_not_found_ids = Vec::new();
        let mut split_not_staged_ids = Vec::new();

        let now_timestamp = OffsetDateTime::now_utc().unix_timestamp();

        for staged_plit_id in staged_split_ids {
            let staged_split_id_ref = staged_plit_id.as_ref();
            // Check for the existence of split.
            let Some(metadata) = self.splits.get_mut(staged_split_id_ref) else {
                split_not_found_ids.push(staged_split_id_ref.to_string());
                continue;
            };
            if metadata.split_state == SplitState::Staged {
                metadata.split_state = SplitState::Published;
                metadata.update_timestamp = now_timestamp;
                metadata.publish_timestamp = Some(now_timestamp);
            } else {
                split_not_staged_ids.push(staged_split_id_ref.to_string());
            }
        }
        if !split_not_found_ids.is_empty() {
            return Err(MetastoreError::NotFound(EntityKind::Splits {
                split_ids: split_not_found_ids,
            }));
        }
        if !split_not_staged_ids.is_empty() {
            let entity = EntityKind::Splits {
                split_ids: split_not_staged_ids,
            };
            let message = "splits are not staged".to_string();
            return Err(MetastoreError::FailedPrecondition { entity, message });
        }
        Ok(())
    }

    /// Publishes splits.
    pub(crate) fn publish_splits(
        &mut self,
        staged_split_ids: impl IntoIterator<Item = impl AsRef<str>>,
        replaced_split_ids: impl IntoIterator<Item = impl AsRef<str>>,
        checkpoint_delta_opt: Option<IndexCheckpointDelta>,
        publish_token_opt: Option<PublishToken>,
    ) -> MetastoreResult<()> {
        if let Some(checkpoint_delta) = checkpoint_delta_opt {
            let source_id = checkpoint_delta.source_id.clone();
            let source = self.metadata.sources.get(&source_id).ok_or_else(|| {
                MetastoreError::NotFound(EntityKind::Source {
                    index_id: self.index_id().to_string(),
                    source_id: source_id.clone(),
                })
            })?;

            if use_shard_api(&source.source_params) {
                let publish_token = publish_token_opt.ok_or_else(|| {
                    let message = format!(
                        "publish token is required for publishing splits for source `{source_id}`"
                    );
                    MetastoreError::InvalidArgument { message }
                })?;
                self.try_apply_delta_v2(checkpoint_delta, publish_token)?;
            } else {
                self.metadata
                    .checkpoint
                    .try_apply_delta(checkpoint_delta)
                    .map_err(|error| {
                        quickwit_common::rate_limited_error!(
                            limit_per_min = 6,
                            index = self.index_id(),
                            "failed to apply checkpoint delta"
                        );
                        let entity = EntityKind::CheckpointDelta {
                            index_id: self.index_id().to_string(),
                            source_id,
                        };
                        let message = error.to_string();
                        MetastoreError::FailedPrecondition { entity, message }
                    })?;
            }
        }
        self.mark_splits_as_published_helper(staged_split_ids)?;
        self.mark_splits_for_deletion(replaced_split_ids, &[SplitState::Published], true)?;
        Ok(())
    }

    /// Lists splits.
    pub(crate) fn list_splits(&self, query: &ListSplitsQuery) -> MetastoreResult<Vec<Split>> {
        let limit = query
            .limit
            .map(|limit| limit + query.offset.unwrap_or_default())
            .unwrap_or(usize::MAX);
        // skip is done at a higher layer in case other indexes give spltis that would go before
        // ours

        let results = if query.sort_by == SortBy::None {
            // internally sorted_unstable_by collect everything to an intermediary vec. When not
            // sorting at all, skip that.
            self.splits
                .values()
                .filter(|split| split_query_predicate(split, query))
                .take(limit)
                .cloned()
                .collect()
        } else {
            self.splits
                .values()
                .filter(|split| split_query_predicate(split, query))
                .sorted_unstable_by(|lhs, rhs| query.sort_by.compare(lhs, rhs))
                .take(limit)
                .cloned()
                .collect()
        };
        Ok(results)
    }

    /// Deletes a split.
    fn delete_split(&mut self, split_id: &str) -> DeleteSplitOutcome {
        match self.splits.get(split_id).map(|split| split.split_state) {
            Some(SplitState::MarkedForDeletion) => {
                self.splits.remove(split_id);
                DeleteSplitOutcome::Success
            }
            Some(SplitState::Staged | SplitState::Published) => DeleteSplitOutcome::Forbidden,
            None => DeleteSplitOutcome::SplitNotFound,
        }
    }

    /// Deletes multiple splits.
    pub(crate) fn delete_splits(
        &mut self,
        split_ids: impl IntoIterator<Item = impl AsRef<str>>,
    ) -> MetastoreResult<()> {
        let num_deleted_splits = 0;
        let mut split_not_found_ids = Vec::new();
        let mut split_not_deletable_ids = Vec::new();

        for split_id in split_ids {
            let split_id_ref = split_id.as_ref();
            match self.delete_split(split_id_ref) {
                DeleteSplitOutcome::Success => {}
                DeleteSplitOutcome::SplitNotFound => {
                    split_not_found_ids.push(split_id_ref.to_string());
                }
                DeleteSplitOutcome::Forbidden => {
                    split_not_deletable_ids.push(split_id_ref.to_string());
                }
            }
        }
        if !split_not_deletable_ids.is_empty() {
            let entity = EntityKind::Splits {
                split_ids: split_not_deletable_ids,
            };
            let message = "splits are not deletable".to_string();
            return Err(MetastoreError::FailedPrecondition { entity, message });
        }
        info!(index_id=%self.index_id(), "deleted {num_deleted_splits} splits from index");

        if !split_not_found_ids.is_empty() {
            warn!(
                index_id=self.index_id().to_string(),
                split_ids=?PrettySample::new(&split_not_found_ids, 5),
                "{} splits were not found and could not be deleted",
                split_not_found_ids.len()
            );
        }
        Ok(())
    }

    /// Gets IndexStats for this index
    pub(crate) fn get_stats(&self) -> MetastoreResult<IndexStats> {
        let mut staged_stats = SplitStats::default();
        let mut published_stats = SplitStats::default();
        let mut marked_for_deletion_stats = SplitStats::default();

        for split in self.splits.values() {
            match split.split_state {
                SplitState::Staged => {
                    staged_stats.add_split(split.split_metadata.footer_offsets.end)
                }
                SplitState::Published => {
                    published_stats.add_split(split.split_metadata.footer_offsets.end)
                }
                SplitState::MarkedForDeletion => {
                    marked_for_deletion_stats.add_split(split.split_metadata.footer_offsets.end)
                }
            }
        }

        Ok(IndexStats {
            index_uid: Some(self.index_uid().clone()),
            staged: Some(staged_stats),
            published: Some(published_stats),
            marked_for_deletion: Some(marked_for_deletion_stats),
        })
    }

    /// Adds a source.
    pub(crate) fn add_source(&mut self, source_config: SourceConfig) -> MetastoreResult<()> {
        let index_uid = self.index_uid().clone();
        let source_id = source_config.source_id.clone();

        self.metadata.add_source(source_config)?;

        let shards = Shards::empty(index_uid, source_id.clone());
        self.per_source_shards.insert(source_id, shards);
        Ok(())
    }

    /// Updates a source. Returns whether a mutation occurred.
    pub(crate) fn update_source(&mut self, source_config: SourceConfig) -> MetastoreResult<bool> {
        self.metadata.update_source(source_config)
    }

    /// Enables or disables a source. Returns whether a mutation occurred.
    pub(crate) fn toggle_source(&mut self, source_id: &str, enable: bool) -> MetastoreResult<bool> {
        self.metadata.toggle_source(source_id, enable)
    }

    /// Deletes the source. Returns whether a mutation occurred.
    pub(crate) fn delete_source(&mut self, source_id: &str) -> MetastoreResult<()> {
        self.metadata.delete_source(source_id)
    }

    /// Resets the checkpoint of a source. Returns whether a mutation occurred.
    pub(crate) fn reset_source_checkpoint(&mut self, source_id: &str) -> MetastoreResult<bool> {
        Ok(self.metadata.checkpoint.reset_source(source_id))
    }

    /// Creates [`DeleteTask`] from a [`DeleteQuery`].
    pub(crate) fn create_delete_task(
        &mut self,
        delete_query: DeleteQuery,
    ) -> MetastoreResult<DeleteTask> {
        let now_timestamp = OffsetDateTime::now_utc().unix_timestamp();
        let delete_task = DeleteTask {
            create_timestamp: now_timestamp,
            opstamp: self.stamper.stamp() as u64,
            delete_query: Some(delete_query),
        };
        self.delete_tasks.push(delete_task.clone());
        Ok(delete_task)
    }

    /// Returns index last delete opstamp.
    pub(crate) fn last_delete_opstamp(&self) -> u64 {
        self.delete_tasks
            .iter()
            .map(|delete_task| delete_task.opstamp)
            .max()
            .unwrap_or(0)
    }

    /// Updates splits delete opstamp. Returns that a mutation occurred (true).
    pub(crate) fn update_splits_delete_opstamp(
        &mut self,
        split_ids: &[&str],
        delete_opstamp: u64,
    ) -> MetastoreResult<bool> {
        for split_id in split_ids {
            let split = self.splits.get_mut(*split_id).ok_or_else(|| {
                MetastoreError::NotFound(EntityKind::Splits {
                    split_ids: vec![split_id.to_string()],
                })
            })?;
            split.split_metadata.delete_opstamp = delete_opstamp;
        }
        Ok(true)
    }

    /// Lists delete tasks with opstamp > `opstamp_start`.
    pub(crate) fn list_delete_tasks(&self, opstamp_start: u64) -> MetastoreResult<Vec<DeleteTask>> {
        let delete_tasks = self
            .delete_tasks
            .iter()
            .filter(|delete_task| delete_task.opstamp > opstamp_start)
            .cloned()
            .collect();
        Ok(delete_tasks)
    }

    // Shard API

    fn get_shards_for_source(&self, source_id: &str) -> MetastoreResult<&Shards> {
        self.per_source_shards.get(source_id).ok_or_else(|| {
            MetastoreError::NotFound(EntityKind::Source {
                index_id: self.index_id().to_string(),
                source_id: source_id.to_string(),
            })
        })
    }

    fn get_shards_for_source_mut(&mut self, source_id: &str) -> MetastoreResult<&mut Shards> {
        self.per_source_shards.get_mut(source_id).ok_or_else(|| {
            MetastoreError::NotFound(EntityKind::Source {
                index_id: self.metadata.index_id().to_string(),
                source_id: source_id.to_string(),
            })
        })
    }

    pub(crate) fn open_shards(
        &mut self,
        subrequests: Vec<OpenShardSubrequest>,
    ) -> MetastoreResult<MutationOccurred<Vec<OpenShardSubresponse>>> {
        let mut mutation_occurred = false;
        let mut subresponses = Vec::with_capacity(subrequests.len());

        for subrequest in subrequests {
            let subresponse = match self
                .get_shards_for_source_mut(&subrequest.source_id)?
                .open_shard(subrequest)?
            {
                MutationOccurred::Yes(subresponse) => {
                    mutation_occurred = true;
                    subresponse
                }
                MutationOccurred::No(subresponse) => subresponse,
            };
            subresponses.push(subresponse);
        }
        if mutation_occurred {
            Ok(MutationOccurred::Yes(subresponses))
        } else {
            Ok(MutationOccurred::No(subresponses))
        }
    }

    pub(crate) fn acquire_shards(
        &mut self,
        request: AcquireShardsRequest,
    ) -> MetastoreResult<MutationOccurred<AcquireShardsResponse>> {
        self.get_shards_for_source_mut(&request.source_id)?
            .acquire_shards(request)
    }

    pub(crate) fn delete_shards(
        &mut self,
        request: DeleteShardsRequest,
    ) -> MetastoreResult<MutationOccurred<DeleteShardsResponse>> {
        self.get_shards_for_source_mut(&request.source_id)?
            .delete_shards(request)
    }

    pub(crate) fn prune_shards(
        &mut self,
        request: PruneShardsRequest,
    ) -> MetastoreResult<MutationOccurred<()>> {
        self.get_shards_for_source_mut(&request.source_id)?
            .prune_shards(request)
    }

    pub(crate) fn list_shards(
        &self,
        subrequest: ListShardsSubrequest,
    ) -> MetastoreResult<ListShardsSubresponse> {
        self.get_shards_for_source(&subrequest.source_id)?
            .list_shards(subrequest)
    }

    pub(crate) fn try_apply_delta_v2(
        &mut self,
        checkpoint_delta: IndexCheckpointDelta,
        publish_token: PublishToken,
    ) -> MetastoreResult<MutationOccurred<()>> {
        self.get_shards_for_source_mut(&checkpoint_delta.source_id)?
            .try_apply_delta(checkpoint_delta.source_delta, publish_token)
    }
}

/// Stamper provides Opstamps, which is just an auto-increment id to label
/// a delete operation.
#[derive(Clone, Default)]
struct Stamper(usize);

impl Stamper {
    /// Creates a new [`Stamper`].
    pub fn new(initial_opstamp: usize) -> Self {
        Self(initial_opstamp)
    }

    /// Increments the stamper by 1 and returns the incremented value.
    pub fn stamp(&mut self) -> usize {
        self.0 += 1;
        self.0
    }
}

impl Debug for Stamper {
    fn fmt(&self, fmt: &mut std::fmt::Formatter) -> std::fmt::Result {
        fmt.debug_struct("Stamper").field("stamp", &self.0).finish()
    }
}

fn split_query_predicate(split: &&Split, query: &ListSplitsQuery) -> bool {
    if !split_tag_filter(&split.split_metadata, query.tags.as_ref()) {
        return false;
    }

    if !query.split_states.is_empty() && !query.split_states.contains(&split.split_state) {
        return false;
    }

    if !query
        .delete_opstamp
        .contains(&split.split_metadata.delete_opstamp)
    {
        return false;
    }

    if !query.update_timestamp.contains(&split.update_timestamp) {
        return false;
    }

    if !query
        .create_timestamp
        .contains(&split.split_metadata.create_timestamp)
    {
        return false;
    }

    match &query.mature {
        Bound::Included(evaluation_datetime) => {
            return split.split_metadata.is_mature(*evaluation_datetime);
        }
        Bound::Excluded(evaluation_datetime) => {
            return !split.split_metadata.is_mature(*evaluation_datetime);
        }
        Bound::Unbounded => {}
    }

    if let Some(range) = &split.split_metadata.time_range {
        if !query.time_range.overlaps_with(range.clone()) {
            return false;
        }
        if let Some(v) = query.max_time_range_end
            && range.end() > &v
        {
            return false;
        }
    }

    if let Some(node_id) = &query.node_id
        && split.split_metadata.node_id != *node_id
    {
        return false;
    }

    if let Some((index_uid, split_id)) = &query.after_split {
        if *index_uid > split.split_metadata.index_uid {
            return false;
        }
        if *index_uid == split.split_metadata.index_uid
            && *split_id >= split.split_metadata.split_id
        {
            return false;
        }
    }

    true
}

#[cfg(test)]
mod tests {
    use std::collections::{BTreeSet, HashMap};

    use quickwit_doc_mapper::tag_pruning::TagFilterAst;
    use quickwit_proto::ingest::Shard;
    use quickwit_proto::metastore::{ListShardsSubrequest, SplitStats};
    use quickwit_proto::types::{IndexUid, SourceId};

    use super::FileBackedIndex;
    use crate::file_backed::file_backed_index::split_query_predicate;
    use crate::{IndexMetadata, ListSplitsQuery, Split, SplitMetadata, SplitState};

    impl FileBackedIndex {
        pub(crate) fn insert_shards(&mut self, source_id: &SourceId, shards: Vec<Shard>) {
            self.per_source_shards
                .get_mut(source_id)
                .unwrap()
                .insert_shards(shards)
        }

        pub(crate) fn list_all_shards(&self, source_id: &SourceId) -> Vec<Shard> {
            self.per_source_shards
                .get(source_id)
                .unwrap()
                .list_shards(ListShardsSubrequest {
                    ..Default::default()
                })
                .unwrap()
                .shards
        }
    }

    fn make_splits() -> [Split; 3] {
        [
            Split {
                split_metadata: SplitMetadata {
                    split_id: "split-1".to_string(),
                    delete_opstamp: 9,
                    time_range: Some(32..=40),
                    tags: BTreeSet::from(["tag-1".to_string()]),
                    create_timestamp: 12,
                    footer_offsets: 0..2048,
                    ..Default::default()
                },
                split_state: SplitState::Staged,
                update_timestamp: 70i64,
                publish_timestamp: None,
            },
            Split {
                split_metadata: SplitMetadata {
                    split_id: "split-2".to_string(),
                    delete_opstamp: 4,
                    time_range: None,
                    tags: BTreeSet::from(["tag-2".to_string(), "tag-3".to_string()]),
                    create_timestamp: 5,
                    footer_offsets: 0..1024,
                    ..Default::default()
                },
                split_state: SplitState::MarkedForDeletion,
                update_timestamp: 50i64,
                publish_timestamp: None,
            },
            Split {
                split_metadata: SplitMetadata {
                    split_id: "split-3".to_string(),
                    delete_opstamp: 0,
                    time_range: Some(0..=90),
                    tags: BTreeSet::from(["tag-2".to_string(), "tag-4".to_string()]),
                    create_timestamp: 64,
                    footer_offsets: 0..512,
                    ..Default::default()
                },
                split_state: SplitState::Published,
                update_timestamp: 0i64,
                publish_timestamp: Some(10i64),
            },
        ]
    }

    #[test]
    fn test_single_filter_behaviour() {
        let [split_1, split_2, split_3] = make_splits();

        let query = ListSplitsQuery::for_index(IndexUid::new_with_random_ulid("test-index"))
            .with_split_state(SplitState::Staged);
        assert!(split_query_predicate(&&split_1, &query));

        let query = ListSplitsQuery::for_index(IndexUid::new_with_random_ulid("test-index"))
            .with_split_state(SplitState::Published);
        assert!(!split_query_predicate(&&split_2, &query));

        let query = ListSplitsQuery::for_index(IndexUid::new_with_random_ulid("test-index"))
            .with_split_states([SplitState::Published, SplitState::MarkedForDeletion]);
        assert!(!split_query_predicate(&&split_1, &query));
        assert!(split_query_predicate(&&split_3, &query));

        let query = ListSplitsQuery::for_index(IndexUid::new_with_random_ulid("test-index"))
            .with_update_timestamp_lt(51);
        assert!(!split_query_predicate(&&split_1, &query));
        assert!(split_query_predicate(&&split_2, &query));
        assert!(split_query_predicate(&&split_3, &query));

        let query = ListSplitsQuery::for_index(IndexUid::new_with_random_ulid("test-index"))
            .with_create_timestamp_gte(51);
        assert!(!split_query_predicate(&&split_1, &query));
        assert!(!split_query_predicate(&&split_2, &query));
        assert!(split_query_predicate(&&split_3, &query));

        let query = ListSplitsQuery::for_index(IndexUid::new_with_random_ulid("test-index"))
            .with_delete_opstamp_gte(4);
        assert!(split_query_predicate(&&split_1, &query));
        assert!(split_query_predicate(&&split_2, &query));
        assert!(!split_query_predicate(&&split_3, &query));

        let query = ListSplitsQuery::for_index(IndexUid::new_with_random_ulid("test-index"))
            .with_time_range_start_gt(45);
        assert!(!split_query_predicate(&&split_1, &query));
        assert!(split_query_predicate(&&split_2, &query));
        assert!(split_query_predicate(&&split_3, &query));

        let query = ListSplitsQuery::for_index(IndexUid::new_with_random_ulid("test-index"))
            .with_time_range_end_lt(45);
        assert!(split_query_predicate(&&split_1, &query));
        assert!(split_query_predicate(&&split_2, &query));
        assert!(split_query_predicate(&&split_3, &query));

        let query = ListSplitsQuery::for_index(IndexUid::new_with_random_ulid("test-index"))
            .with_tags_filter(TagFilterAst::Tag {
                is_present: false,
                tag: "tag-2".to_string(),
            });
        assert!(split_query_predicate(&&split_1, &query));
        assert!(!split_query_predicate(&&split_2, &query));
        assert!(!split_query_predicate(&&split_3, &query));

        let query = ListSplitsQuery::for_index(IndexUid::new_with_random_ulid("test-index"))
            .with_max_time_range_end(50);
        assert!(split_query_predicate(&&split_1, &query));
        assert!(split_query_predicate(&&split_2, &query));
        assert!(!split_query_predicate(&&split_3, &query));
    }

    #[test]
    fn test_combination_filter() {
        let [split_1, split_2, split_3] = make_splits();

        let query = ListSplitsQuery::for_index(IndexUid::new_with_random_ulid("test-index"))
            .with_time_range_start_gt(0)
            .with_time_range_end_lt(40);
        assert!(split_query_predicate(&&split_1, &query));
        assert!(split_query_predicate(&&split_2, &query));
        assert!(split_query_predicate(&&split_3, &query));

        let query = ListSplitsQuery::for_index(IndexUid::new_with_random_ulid("test-index"))
            .with_time_range_start_gt(45)
            .with_delete_opstamp_gt(0);
        assert!(!split_query_predicate(&&split_1, &query));
        assert!(split_query_predicate(&&split_2, &query));
        assert!(!split_query_predicate(&&split_3, &query));

        let query = ListSplitsQuery::for_index(IndexUid::new_with_random_ulid("test-index"))
            .with_update_timestamp_lt(51)
            .with_split_states([SplitState::Published, SplitState::MarkedForDeletion]);
        assert!(!split_query_predicate(&&split_1, &query));
        assert!(split_query_predicate(&&split_2, &query));
        assert!(split_query_predicate(&&split_3, &query));

        let query = ListSplitsQuery::for_index(IndexUid::new_with_random_ulid("test-index"))
            .with_update_timestamp_lt(51)
            .with_create_timestamp_lte(63);
        assert!(!split_query_predicate(&&split_1, &query));
        assert!(split_query_predicate(&&split_2, &query));
        assert!(!split_query_predicate(&&split_3, &query));

        let query = ListSplitsQuery::for_index(IndexUid::new_with_random_ulid("test-index"))
            .with_time_range_start_gt(90)
            .with_tags_filter(TagFilterAst::Tag {
                is_present: true,
                tag: "tag-1".to_string(),
            });
        assert!(!split_query_predicate(&&split_1, &query));
        assert!(!split_query_predicate(&&split_2, &query));
        assert!(!split_query_predicate(&&split_3, &query));
    }

    #[test]
    fn test_get_stats() {
        let index_id = "test-index";
        let index_metadata = IndexMetadata::for_test(index_id, "file:///qwdata/indexes/test-index");
        let index =
            FileBackedIndex::new(index_metadata, make_splits().into(), HashMap::new(), vec![]);

        let expected_staged = Some(SplitStats {
            num_splits: 1,
            total_size_bytes: 2048,
        });
        let expected_published = Some(SplitStats {
            num_splits: 1,
            total_size_bytes: 512,
        });
        let expected_marked_for_deletion = Some(SplitStats {
            num_splits: 1,
            total_size_bytes: 1024,
        });
        let stats = index.get_stats().unwrap();

        assert_eq!(stats.staged, expected_staged);
        assert_eq!(stats.published, expected_published);
        assert_eq!(stats.marked_for_deletion, expected_marked_for_deletion);
    }
}


================================================
FILE: quickwit/quickwit-metastore/src/metastore/file_backed/file_backed_index/serialize.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::HashMap;

use itertools::Itertools;
use quickwit_proto::ingest::Shard;
use quickwit_proto::metastore::SourceType;
use quickwit_proto::types::{DocMappingUid, SourceId};
use serde::{Deserialize, Serialize};

use super::shards::Shards;
use crate::file_backed::file_backed_index::FileBackedIndex;
use crate::metastore::DeleteTask;
use crate::{IndexMetadata, Split};

#[derive(Clone, Debug, Serialize, Deserialize)]
#[serde(tag = "version")]
pub(crate) enum VersionedFileBackedIndex {
    #[serde(rename = "0.9")]
    V0_9(FileBackedIndexV0_8),
    // Retro compatibility.
    #[serde(alias = "0.8")]
    #[serde(alias = "0.7")]
    V0_8(FileBackedIndexV0_8),
}

impl From<FileBackedIndex> for VersionedFileBackedIndex {
    fn from(index: FileBackedIndex) -> Self {
        VersionedFileBackedIndex::V0_9(index.into())
    }
}

impl From<VersionedFileBackedIndex> for FileBackedIndex {
    fn from(index: VersionedFileBackedIndex) -> Self {
        match index {
            VersionedFileBackedIndex::V0_8(mut v0_8) => {
                for shards in v0_8.shards.values_mut() {
                    for shard in shards {
                        shard.doc_mapping_uid = Some(DocMappingUid::default());
                    }
                }
                v0_8.into()
            }
            VersionedFileBackedIndex::V0_9(v0_8) => v0_8.into(),
        }
    }
}

#[derive(Clone, Debug, Serialize, Deserialize)]
pub(crate) struct FileBackedIndexV0_8 {
    #[serde(rename = "index")]
    metadata: IndexMetadata,
    splits: Vec<Split>,
    // TODO: Remove `skip_serializing_if` when we release ingest v2.
    #[serde(default, skip_serializing_if = "HashMap::is_empty")]
    shards: HashMap<SourceId, Vec<Shard>>,
    #[serde(default)]
    delete_tasks: Vec<DeleteTask>,
}

impl From<FileBackedIndex> for FileBackedIndexV0_8 {
    fn from(index: FileBackedIndex) -> Self {
        let splits = index
            .splits
            .into_values()
            .sorted_by_key(|split| split.update_timestamp)
            .collect();
        let shards = index
            .per_source_shards
            .into_iter()
            .filter_map(|(source_id, shards)| {
                // TODO: Remove this filter when we release ingest v2.
                // Skip serializing empty shards since the feature is hidden and disabled by
                // default. This way, we can still modify the serialization format without worrying
                // about backward compatibility post `0.7`.
                if !shards.is_empty() {
                    Some((source_id, shards.into_shards_vec()))
                } else {
                    None
                }
            })
            .collect();
        let delete_tasks = index
            .delete_tasks
            .into_iter()
            .sorted_by_key(|delete_task| delete_task.opstamp)
            .collect();
        Self {
            metadata: index.metadata,
            splits,
            shards,
            delete_tasks,
        }
    }
}

impl From<FileBackedIndexV0_8> for FileBackedIndex {
    fn from(index: FileBackedIndexV0_8) -> Self {
        let mut per_source_shards: HashMap<SourceId, Shards> = index
            .shards
            .into_iter()
            .map(|(source_id, shards_vec)| {
                let index_uid = index.metadata.index_uid.clone();
                (
                    source_id.clone(),
                    Shards::from_shards_vec(index_uid, source_id, shards_vec),
                )
            })
            .collect();
        // TODO: Remove this when we release ingest v2.
        for source in index.metadata.sources.values() {
            if source.source_type() == SourceType::IngestV2
                && !per_source_shards.contains_key(&source.source_id)
            {
                let index_uid = index.metadata.index_uid.clone();
                let source_id = source.source_id.clone();
                per_source_shards.insert(source_id.clone(), Shards::empty(index_uid, source_id));
            }
        }
        Self::new(
            index.metadata,
            index.splits,
            per_source_shards,
            index.delete_tasks,
        )
    }
}


================================================
FILE: quickwit/quickwit-metastore/src/metastore/file_backed/file_backed_index/shards.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::HashMap;
use std::collections::hash_map::Entry;
use std::fmt;

use itertools::Itertools;
use quickwit_proto::ingest::{Shard, ShardState};
use quickwit_proto::metastore::{
    AcquireShardsRequest, AcquireShardsResponse, DeleteShardsRequest, DeleteShardsResponse,
    EntityKind, ListShardsSubrequest, ListShardsSubresponse, MetastoreError, MetastoreResult,
    OpenShardSubrequest, OpenShardSubresponse, PruneShardsRequest,
};
use quickwit_proto::types::{IndexUid, Position, PublishToken, ShardId, SourceId, queue_id};
use time::OffsetDateTime;
use tracing::{info, warn};

use crate::checkpoint::{PartitionId, SourceCheckpoint, SourceCheckpointDelta};
use crate::file_backed::MutationOccurred;

// TODO: Rename `SourceShards`
/// Manages the shards of a source.
#[derive(Clone, Eq, PartialEq)]
pub(crate) struct Shards {
    index_uid: IndexUid,
    source_id: SourceId,
    checkpoint: SourceCheckpoint,
    shards: HashMap<ShardId, Shard>,
}

impl fmt::Debug for Shards {
    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
        f.debug_struct("Shards")
            .field("index_uid", &self.index_uid)
            .field("source_id", &self.source_id)
            .field("num_shards", &self.shards.len())
            .field("shards", &self.shards)
            .finish()
    }
}

impl Shards {
    pub(super) fn empty(index_uid: IndexUid, source_id: SourceId) -> Self {
        Self {
            index_uid,
            source_id,
            checkpoint: SourceCheckpoint::default(),
            shards: HashMap::new(),
        }
    }

    pub(super) fn from_shards_vec(
        index_uid: IndexUid,
        source_id: SourceId,
        shards_vec: Vec<Shard>,
    ) -> Self {
        let mut shards: HashMap<ShardId, Shard> = HashMap::with_capacity(shards_vec.len());
        let mut checkpoint = SourceCheckpoint::default();

        for shard in shards_vec {
            let shard_id = shard.shard_id().clone();
            let partition_id = PartitionId::from(shard_id.as_str());
            let position = shard.publish_position_inclusive();
            checkpoint.add_partition(partition_id, position);
            shards.insert(shard_id, shard);
        }

        Self {
            index_uid,
            source_id,
            checkpoint,
            shards,
        }
    }

    pub fn into_shards_vec(self) -> Vec<Shard> {
        self.shards.into_values().collect()
    }

    pub fn is_empty(&self) -> bool {
        self.shards.is_empty()
    }

    fn get_shard(&self, shard_id: &ShardId) -> MetastoreResult<&Shard> {
        self.shards.get(shard_id).ok_or_else(|| {
            let queue_id = queue_id(&self.index_uid, &self.source_id, shard_id);
            MetastoreError::NotFound(EntityKind::Shard { queue_id })
        })
    }

    fn get_shard_mut(&mut self, shard_id: &ShardId) -> MetastoreResult<&mut Shard> {
        self.shards.get_mut(shard_id).ok_or_else(|| {
            let queue_id = queue_id(&self.index_uid, &self.source_id, shard_id);
            MetastoreError::NotFound(EntityKind::Shard { queue_id })
        })
    }

    pub(super) fn open_shard(
        &mut self,
        subrequest: OpenShardSubrequest,
    ) -> MetastoreResult<MutationOccurred<OpenShardSubresponse>> {
        let mut mutation_occurred = false;

        let shard_id = subrequest.shard_id().clone();
        let entry = self.shards.entry(shard_id.clone());
        let shard = match entry {
            Entry::Occupied(entry) => entry.get().clone(),
            Entry::Vacant(entry) => {
                let shard = Shard {
                    index_uid: Some(self.index_uid.clone()),
                    source_id: self.source_id.clone(),
                    shard_id: Some(shard_id.clone()),
                    shard_state: ShardState::Open as i32,
                    leader_id: subrequest.leader_id,
                    follower_id: subrequest.follower_id,
                    doc_mapping_uid: subrequest.doc_mapping_uid,
                    publish_position_inclusive: Some(Position::Beginning),
                    publish_token: subrequest.publish_token.clone(),
                    update_timestamp: OffsetDateTime::now_utc().unix_timestamp(),
                };
                mutation_occurred = true;
                entry.insert(shard.clone());

                info!(
                    index_uid=%self.index_uid,
                    source_id=%self.source_id,
                    %shard_id,
                    leader_id=%shard.leader_id,
                    follower_id=?shard.follower_id,
                    "opened shard"
                );
                shard
            }
        };
        let response = OpenShardSubresponse {
            subrequest_id: subrequest.subrequest_id,
            open_shard: Some(shard),
        };
        if mutation_occurred {
            Ok(MutationOccurred::Yes(response))
        } else {
            Ok(MutationOccurred::No(response))
        }
    }

    pub(super) fn acquire_shards(
        &mut self,
        request: AcquireShardsRequest,
    ) -> MetastoreResult<MutationOccurred<AcquireShardsResponse>> {
        let mut mutation_occurred = false;
        let mut acquired_shards = Vec::with_capacity(request.shard_ids.len());

        for shard_id in &request.shard_ids {
            if let Some(shard) = self.shards.get_mut(shard_id) {
                if shard.publish_token() != request.publish_token {
                    shard.publish_token = Some(request.publish_token.clone());
                    mutation_occurred = true;
                }
                acquired_shards.push(shard.clone());
            } else {
                warn!(
                    index_uid=%self.index_uid,
                    source_id=%self.source_id,
                    %shard_id,
                    "shard not found"
                );
            }
        }
        let response = AcquireShardsResponse { acquired_shards };

        if mutation_occurred {
            Ok(MutationOccurred::Yes(response))
        } else {
            Ok(MutationOccurred::No(response))
        }
    }

    pub(super) fn delete_shards(
        &mut self,
        request: DeleteShardsRequest,
    ) -> MetastoreResult<MutationOccurred<DeleteShardsResponse>> {
        let mut successes = Vec::with_capacity(request.shard_ids.len());
        let mut failures = Vec::new();
        let mut mutation_occurred = false;

        for shard_id in request.shard_ids {
            if let Entry::Occupied(entry) = self.shards.entry(shard_id.clone()) {
                let shard = entry.get();
                if !request.force && !shard.publish_position_inclusive().is_eof() {
                    failures.push(shard_id);
                    continue;
                }
                info!(
                    index_uid=%self.index_uid,
                    source_id=%self.source_id,
                    %shard_id,
                    "deleted shard",
                );
                entry.remove();
                mutation_occurred = true;
            }
            successes.push(shard_id);
        }
        if !failures.is_empty() {
            warn!(
                index_uid=%self.index_uid,
                source_id=%self.source_id,
                "failed to delete shards `{}`: shards are not fully indexed",
                failures.iter().join(", ")
            );
        }
        let response = DeleteShardsResponse {
            index_uid: request.index_uid,
            source_id: request.source_id,
            successes,
            failures,
        };
        if mutation_occurred {
            Ok(MutationOccurred::Yes(response))
        } else {
            Ok(MutationOccurred::No(response))
        }
    }

    pub(super) fn prune_shards(
        &mut self,
        request: PruneShardsRequest,
    ) -> MetastoreResult<MutationOccurred<()>> {
        let initial_shard_count = self.shards.len();

        if let Some(max_age_secs) = request.max_age_secs {
            self.shards.retain(|_, shard| {
                let gc_deadline = shard.update_timestamp + max_age_secs as i64;
                let now = OffsetDateTime::now_utc().unix_timestamp();
                gc_deadline >= now
            });
        };
        if let Some(max_count) = request.max_count {
            let max_count = max_count as usize;
            if max_count < self.shards.len() {
                let num_to_remove = self.shards.len() - max_count;
                let shard_ids_to_delete = self
                    .shards
                    .values()
                    .sorted_by_key(|shard| shard.update_timestamp)
                    .take(num_to_remove)
                    .map(|shard| shard.shard_id().clone())
                    .collect_vec();
                for shard_id in shard_ids_to_delete {
                    self.shards.remove(&shard_id);
                }
            }
        }
        if initial_shard_count > self.shards.len() {
            Ok(MutationOccurred::Yes(()))
        } else {
            Ok(MutationOccurred::No(()))
        }
    }

    pub(super) fn list_shards(
        &self,
        subrequest: ListShardsSubrequest,
    ) -> MetastoreResult<ListShardsSubresponse> {
        let shards = self.list_shards_inner(subrequest.shard_state);
        let response = ListShardsSubresponse {
            index_uid: subrequest.index_uid,
            source_id: subrequest.source_id,
            shards,
        };
        Ok(response)
    }

    pub(super) fn try_apply_delta(
        &mut self,
        checkpoint_delta: SourceCheckpointDelta,
        publish_token: PublishToken,
    ) -> MetastoreResult<MutationOccurred<()>> {
        if checkpoint_delta.is_empty() {
            return Ok(MutationOccurred::No(()));
        }
        self.checkpoint
            .check_compatibility(&checkpoint_delta)
            .map_err(|error| MetastoreError::InvalidArgument {
                message: error.to_string(),
            })?;

        let mut shard_ids = Vec::with_capacity(checkpoint_delta.num_partitions());

        for (partition_id, partition_delta) in checkpoint_delta.iter() {
            let shard_id = ShardId::from(partition_id.as_str());
            let shard = self.get_shard(&shard_id)?;

            if shard.publish_token() != publish_token {
                let message = "failed to apply checkpoint delta: invalid publish token".to_string();
                return Err(MetastoreError::InvalidArgument { message });
            }
            let publish_position_inclusive = partition_delta.to;
            shard_ids.push((shard_id, publish_position_inclusive))
        }
        self.checkpoint
            .try_apply_delta(checkpoint_delta)
            .expect("delta compatibility should have been checked");

        for (shard_id, publish_position_inclusive) in shard_ids {
            let shard = self.get_shard_mut(&shard_id).expect("shard should exist");

            if publish_position_inclusive.is_eof() {
                shard.shard_state = ShardState::Closed as i32;
            }
            shard.publish_position_inclusive = Some(publish_position_inclusive);
            shard.update_timestamp = OffsetDateTime::now_utc().unix_timestamp();
        }
        Ok(MutationOccurred::Yes(()))
    }

    fn list_shards_inner(&self, shard_state: Option<i32>) -> Vec<Shard> {
        if let Some(shard_state) = shard_state {
            self.shards
                .values()
                .filter(|shard| shard.shard_state == shard_state)
                .cloned()
                .collect()
        } else {
            self.shards.values().cloned().collect()
        }
    }
}

#[cfg(test)]
mod tests {
    use quickwit_proto::ingest::ShardState;
    use quickwit_proto::types::DocMappingUid;

    use super::*;

    impl Shards {
        pub(crate) fn insert_shards(&mut self, shards: Vec<Shard>) {
            for shard in shards {
                let shard_id = shard.shard_id().clone();
                self.shards.insert(shard_id, shard);
            }
        }
    }

    #[test]
    fn test_open_shards() {
        let index_uid: IndexUid = IndexUid::for_test("test-index", 0);
        let source_id = "test-source".to_string();
        let mut shards = Shards::empty(index_uid.clone(), source_id.clone());

        let subrequest = OpenShardSubrequest {
            subrequest_id: 0,
            index_uid: Some(index_uid.clone()),
            source_id: source_id.clone(),
            shard_id: Some(ShardId::from(1)),
            leader_id: "leader_id".to_string(),
            follower_id: None,
            doc_mapping_uid: Some(DocMappingUid::default()),
            publish_token: None,
        };
        let MutationOccurred::Yes(subresponse) = shards.open_shard(subrequest.clone()).unwrap()
        else {
            panic!("expected `MutationOccurred::Yes`");
        };
        assert_eq!(subresponse.subrequest_id, 0);

        let shard = subresponse.open_shard();
        assert_eq!(shard.index_uid(), &index_uid);
        assert_eq!(shard.source_id, source_id);
        assert_eq!(shard.shard_id(), ShardId::from(1));
        assert_eq!(shard.shard_state(), ShardState::Open);
        assert_eq!(shard.leader_id, "leader_id");
        assert_eq!(shard.follower_id, None);
        assert_eq!(shard.publish_token, None);
        assert_eq!(shard.publish_position_inclusive(), Position::Beginning);

        let MutationOccurred::No(subresponse) = shards.open_shard(subrequest).unwrap() else {
            panic!("Expected `MutationOccurred::No`");
        };
        assert_eq!(subresponse.subrequest_id, 0);

        let shard = subresponse.open_shard();
        assert_eq!(shards.shards.get(&ShardId::from(1)).unwrap(), shard);

        let subrequest = OpenShardSubrequest {
            subrequest_id: 0,
            index_uid: Some(index_uid.clone()),
            source_id: source_id.clone(),
            shard_id: Some(ShardId::from(2)),
            leader_id: "leader_id".to_string(),
            follower_id: Some("follower_id".to_string()),
            doc_mapping_uid: Some(DocMappingUid::default()),
            publish_token: Some("publish_token".to_string()),
        };
        let MutationOccurred::Yes(subresponse) = shards.open_shard(subrequest).unwrap() else {
            panic!("Expected `MutationOccurred::No`");
        };
        assert_eq!(subresponse.subrequest_id, 0);

        let shard = subresponse.open_shard();
        assert_eq!(shard.index_uid(), &index_uid);
        assert_eq!(shard.source_id, source_id);
        assert_eq!(shard.shard_id(), ShardId::from(2));
        assert_eq!(shard.shard_state(), ShardState::Open);
        assert_eq!(shard.leader_id, "leader_id");
        assert_eq!(shard.follower_id.as_ref().unwrap(), "follower_id");
        assert_eq!(shard.publish_position_inclusive(), Position::Beginning);

        assert_eq!(shards.shards.get(&ShardId::from(2)).unwrap(), shard);
    }

    #[test]
    fn test_list_shards() {
        let index_uid: IndexUid = IndexUid::for_test("test-index", 0);
        let source_id = "test-source".to_string();
        let mut shards = Shards::empty(index_uid.clone(), source_id.clone());

        let subrequest = ListShardsSubrequest {
            index_uid: Some(index_uid.clone()),
            source_id: source_id.clone(),
            shard_state: None,
        };
        let subresponse = shards.list_shards(subrequest).unwrap();
        assert_eq!(subresponse.index_uid(), &index_uid);
        assert_eq!(subresponse.source_id, source_id);
        assert_eq!(subresponse.shards.len(), 0);

        let shard_0 = Shard {
            index_uid: Some(index_uid.clone()),
            source_id: source_id.clone(),
            shard_id: Some(ShardId::from(0)),
            shard_state: ShardState::Open as i32,
            ..Default::default()
        };
        let shard_1 = Shard {
            index_uid: Some(index_uid.clone()),
            source_id: source_id.clone(),
            shard_id: Some(ShardId::from(1)),
            shard_state: ShardState::Closed as i32,
            ..Default::default()
        };
        shards.shards.insert(ShardId::from(0), shard_0);
        shards.shards.insert(ShardId::from(1), shard_1);

        let subrequest = ListShardsSubrequest {
            index_uid: Some(index_uid.clone()),
            source_id: source_id.clone(),
            shard_state: None,
        };
        let mut subresponse = shards.list_shards(subrequest).unwrap();
        subresponse
            .shards
            .sort_unstable_by(|left, right| left.shard_id.cmp(&right.shard_id));
        assert_eq!(subresponse.shards.len(), 2);
        assert_eq!(subresponse.shards[0].shard_id(), ShardId::from(0));
        assert_eq!(subresponse.shards[1].shard_id(), ShardId::from(1));

        let subrequest = ListShardsSubrequest {
            index_uid: index_uid.into(),
            source_id,
            shard_state: Some(ShardState::Closed as i32),
        };
        let subresponse = shards.list_shards(subrequest).unwrap();
        assert_eq!(subresponse.shards.len(), 1);
        assert_eq!(subresponse.shards[0].shard_id(), ShardId::from(1));
    }

    #[test]
    fn test_acquire_shards() {
        let index_uid = IndexUid::for_test("test-index", 0);
        let source_id = "test-source".to_string();
        let mut shards = Shards::empty(index_uid.clone(), source_id.clone());

        let request = AcquireShardsRequest {
            index_uid: Some(index_uid.clone()),
            source_id: source_id.clone(),
            shard_ids: Vec::new(),
            publish_token: "test-publish-token".to_string(),
        };
        let MutationOccurred::No(response) = shards.acquire_shards(request).unwrap() else {
            panic!("Expected `MutationOccurred::No`");
        };
        assert!(response.acquired_shards.is_empty());

        let request = AcquireShardsRequest {
            index_uid: Some(index_uid.clone()),
            source_id: source_id.clone(),
            shard_ids: vec![ShardId::from(0), ShardId::from(1)],
            publish_token: "test-publish-token".to_string(),
        };
        let MutationOccurred::No(response) = shards.acquire_shards(request.clone()).unwrap() else {
            panic!("Expected `MutationOccurred::No`");
        };
        assert!(response.acquired_shards.is_empty());

        shards.shards.insert(
            ShardId::from(0),
            Shard {
                index_uid: Some(index_uid.clone()),
                source_id: source_id.clone(),
                shard_id: Some(ShardId::from(0)),
                shard_state: ShardState::Open as i32,
                publish_position_inclusive: Some(Position::eof(0u64)),
                ..Default::default()
            },
        );
        let MutationOccurred::Yes(response) = shards.acquire_shards(request.clone()).unwrap()
        else {
            panic!("expected `MutationOccurred::Yes`");
        };
        assert_eq!(response.acquired_shards.len(), 1);
        let acquired_shard = &response.acquired_shards[0];
        assert_eq!(acquired_shard.shard_id(), ShardId::from(0));

        assert_eq!(
            shards
                .shards
                .get(&ShardId::from(0))
                .unwrap()
                .publish_token(),
            "test-publish-token"
        );
    }

    #[test]
    fn test_delete_shards() {
        let index_uid = IndexUid::for_test("test-index", 0);
        let source_id = "test-source".to_string();
        let mut shards = Shards::empty(index_uid.clone(), source_id.clone());

        let request = DeleteShardsRequest {
            index_uid: Some(index_uid.clone()),
            source_id: source_id.clone(),
            shard_ids: Vec::new(),
            force: false,
        };
        let MutationOccurred::No(response) = shards.delete_shards(request).unwrap() else {
            panic!("expected `MutationOccurred::No`");
        };
        assert_eq!(response.index_uid(), &index_uid);
        assert_eq!(response.source_id, source_id);
        assert!(response.successes.is_empty());
        assert!(response.failures.is_empty());

        let request = DeleteShardsRequest {
            index_uid: Some(index_uid.clone()),
            source_id: source_id.clone(),
            shard_ids: vec![ShardId::from(0)],
            force: false,
        };
        let MutationOccurred::No(response) = shards.delete_shards(request).unwrap() else {
            panic!("expected `MutationOccurred::No`");
        };
        assert_eq!(response.index_uid(), &index_uid);
        assert_eq!(response.source_id, source_id);
        assert_eq!(response.successes.len(), 1);
        assert_eq!(response.successes[0], ShardId::from(0));
        assert!(response.failures.is_empty());

        shards.shards.insert(
            ShardId::from(0),
            Shard {
                index_uid: Some(index_uid.clone()),
                source_id: source_id.clone(),
                shard_id: Some(ShardId::from(0)),
                shard_state: ShardState::Open as i32,
                publish_position_inclusive: Some(Position::eof(0u64)),
                ..Default::default()
            },
        );
        shards.shards.insert(
            ShardId::from(1),
            Shard {
                index_uid: Some(index_uid.clone()),
                source_id: source_id.clone(),
                shard_id: Some(ShardId::from(1)),
                shard_state: ShardState::Open as i32,
                publish_position_inclusive: Some(Position::offset(0u64)),
                ..Default::default()
            },
        );
        let request = DeleteShardsRequest {
            index_uid: Some(index_uid.clone()),
            source_id: source_id.clone(),
            shard_ids: vec![ShardId::from(0), ShardId::from(1)],
            force: false,
        };
        let MutationOccurred::Yes(response) = shards.delete_shards(request).unwrap() else {
            panic!("expected `MutationOccurred::Yes`");
        };
        assert_eq!(response.index_uid(), &index_uid);
        assert_eq!(response.source_id, source_id);
        assert_eq!(response.successes.len(), 1);
        assert_eq!(response.successes[0], ShardId::from(0));
        assert_eq!(response.failures.len(), 1);
        assert_eq!(response.failures[0], ShardId::from(1));

        let request = DeleteShardsRequest {
            index_uid: Some(index_uid.clone()),
            source_id: source_id.clone(),
            shard_ids: vec![ShardId::from(1)],
            force: true,
        };
        let MutationOccurred::Yes(response) = shards.delete_shards(request).unwrap() else {
            panic!("expected `MutationOccurred::Yes`");
        };
        assert_eq!(response.index_uid(), &index_uid);
        assert_eq!(response.source_id, source_id);
        assert_eq!(response.successes.len(), 1);
        assert_eq!(response.successes[0], ShardId::from(1));
        assert!(response.failures.is_empty());

        assert!(shards.shards.is_empty());
    }

    #[test]
    fn test_prune_shards() {
        let index_uid = IndexUid::for_test("test-index", 0);
        let source_id = "test-source".to_string();
        let mut shards = Shards::empty(index_uid.clone(), source_id.clone());

        let request = PruneShardsRequest {
            index_uid: Some(index_uid.clone()),
            source_id: source_id.clone(),
            max_age_secs: None,
            max_count: None,
            interval_secs: None,
        };
        let MutationOccurred::No(()) = shards.prune_shards(request).unwrap() else {
            panic!("expected `MutationOccurred::No`");
        };

        let request = PruneShardsRequest {
            index_uid: Some(index_uid.clone()),
            source_id: source_id.clone(),
            max_age_secs: Some(50),
            max_count: None,
            interval_secs: None,
        };
        let MutationOccurred::No(()) = shards.prune_shards(request).unwrap() else {
            panic!("expected `MutationOccurred::No`");
        };

        let current_timestamp = OffsetDateTime::now_utc().unix_timestamp();
        shards.shards.insert(
            ShardId::from(0),
            Shard {
                index_uid: Some(index_uid.clone()),
                source_id: source_id.clone(),
                shard_id: Some(ShardId::from(0)),
                shard_state: ShardState::Open as i32,
                publish_position_inclusive: Some(Position::eof(0u64)),
                update_timestamp: current_timestamp - 200,
                ..Default::default()
            },
        );
        shards.shards.insert(
            ShardId::from(1),
            Shard {
                index_uid: Some(index_uid.clone()),
                source_id: source_id.clone(),
                shard_id: Some(ShardId::from(1)),
                shard_state: ShardState::Open as i32,
                publish_position_inclusive: Some(Position::offset(0u64)),
                update_timestamp: current_timestamp - 100,
                ..Default::default()
            },
        );

        let request = PruneShardsRequest {
            index_uid: Some(index_uid.clone()),
            source_id: source_id.clone(),
            max_age_secs: Some(150),
            max_count: None,
            interval_secs: None,
        };
        let MutationOccurred::Yes(()) = shards.prune_shards(request).unwrap() else {
            panic!("expected `MutationOccurred::Yes`");
        };

        let request = PruneShardsRequest {
            index_uid: Some(index_uid.clone()),
            source_id: source_id.clone(),
            max_age_secs: Some(150),
            max_count: None,
            interval_secs: None,
        };
        let MutationOccurred::No(()) = shards.prune_shards(request).unwrap() else {
            panic!("expected `MutationOccurred::No`");
        };
    }
}


================================================
FILE: quickwit/quickwit-metastore/src/metastore/file_backed/file_backed_metastore_factory.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::HashMap;
use std::str::FromStr;
use std::sync::Arc;
use std::time::Duration;

use async_trait::async_trait;
use once_cell::sync::OnceCell;
use quickwit_common::uri::Uri;
use quickwit_config::{MetastoreBackend, MetastoreConfig};
use quickwit_proto::metastore::{MetastoreError, MetastoreServiceClient};
use quickwit_storage::{StorageResolver, StorageResolverError};
use regex::Regex;
use tokio::sync::Mutex;
use tracing::debug;

use crate::{FileBackedMetastore, MetastoreFactory, MetastoreResolverError};

/// A file-backed metastore factory.
///
/// The implementation ensures that there is only
/// one living instance of `FileBasedMetastore` per metastore URI.
/// As a result, within a same process as long as we keep a single
/// FileBasedMetastoreFactory, it is safe to use the file based
/// metastore, even from different threads.
#[derive(Clone)]
pub struct FileBackedMetastoreFactory {
    storage_resolver: StorageResolver,
    // We never garbage collect unused metastore client instances. This should not be a problem
    // because during normal use this cache will hold at most a single instance.
    cache: Arc<Mutex<HashMap<Uri, MetastoreServiceClient>>>,
}

fn extract_polling_interval_from_uri(uri: &str) -> (String, Option<Duration>) {
    static URI_FRAGMENT_PATTERN: OnceCell<Regex> = OnceCell::new();
    if let Some(captures) = URI_FRAGMENT_PATTERN
        .get_or_init(|| Regex::new("(.*)#polling_interval=([1-9][0-9]{0,8})s").unwrap())
        .captures(uri)
    {
        let uri_without_fragment = captures.get(1).unwrap().as_str().to_string();
        let polling_interval_in_secs: u64 =
            captures.get(2).unwrap().as_str().parse::<u64>().unwrap();
        (
            uri_without_fragment,
            Some(Duration::from_secs(polling_interval_in_secs)),
        )
    } else {
        (uri.to_string(), None)
    }
}

impl FileBackedMetastoreFactory {
    /// Creates a new [`FileBackedMetastoreFactory`].
    pub fn new(storage_resolver: StorageResolver) -> Self {
        Self {
            storage_resolver,
            cache: Default::default(),
        }
    }

    async fn get_from_cache(&self, uri: &Uri) -> Option<MetastoreServiceClient> {
        self.cache.lock().await.get(uri).cloned()
    }

    /// If there is a valid entry in the cache to begin with, we ignore the new
    /// metastore and return the old one.
    ///
    /// This way we make sure that we keep only one instance associated
    /// to the key `uri` outside of this struct.
    async fn cache_metastore(
        &self,
        uri: Uri,
        metastore: MetastoreServiceClient,
    ) -> MetastoreServiceClient {
        self.cache
            .lock()
            .await
            .entry(uri)
            .or_insert(metastore)
            .clone()
    }
}

#[async_trait]
impl MetastoreFactory for FileBackedMetastoreFactory {
    fn backend(&self) -> MetastoreBackend {
        MetastoreBackend::File
    }

    async fn resolve(
        &self,
        _metastore_config: &MetastoreConfig,
        uri: &Uri,
    ) -> Result<MetastoreServiceClient, MetastoreResolverError> {
        let (uri_stripped, polling_interval_opt) = extract_polling_interval_from_uri(uri.as_str());
        let uri = Uri::from_str(&uri_stripped).map_err(|_| {
            MetastoreResolverError::InvalidConfig(format!("invalid URI: `{uri_stripped}`"))
        })?;
        if let Some(metastore) = self.get_from_cache(&uri).await {
            debug!("using metastore from cache");
            return Ok(metastore);
        }
        debug!("metastore not found in cache");
        let storage = self
            .storage_resolver
            .resolve(&uri)
            .await
            .map_err(|err| match err {
                StorageResolverError::InvalidConfig(message) => {
                    MetastoreResolverError::InvalidConfig(message)
                }
                StorageResolverError::InvalidUri(message) => {
                    MetastoreResolverError::InvalidUri(message)
                }
                StorageResolverError::UnsupportedBackend(message) => {
                    MetastoreResolverError::UnsupportedBackend(message)
                }
                StorageResolverError::FailedToOpenStorage { kind, message } => {
                    MetastoreResolverError::Initialization(MetastoreError::Internal {
                        message: format!("failed to open metastore file `{uri}`"),
                        cause: format!("StorageError {kind:?}: {message}"),
                    })
                }
            })?;
        let file_backed_metastore = FileBackedMetastore::try_new(storage, polling_interval_opt)
            .await
            .map(MetastoreServiceClient::new)
            .map_err(MetastoreResolverError::Initialization)?;
        let unique_metastore_for_uri = self.cache_metastore(uri, file_backed_metastore).await;
        Ok(unique_metastore_for_uri)
    }
}

#[cfg(test)]
mod tests {
    use std::time::Duration;

    use crate::metastore::file_backed::file_backed_metastore_factory::extract_polling_interval_from_uri;

    #[test]
    fn test_extract_polling_interval_from_uri() {
        assert_eq!(
            extract_polling_interval_from_uri("file://some-uri#polling_interval=23s"),
            ("file://some-uri".to_string(), Some(Duration::from_secs(23)))
        );
        assert_eq!(
            extract_polling_interval_from_uri(
                "file://some-uri#polling_interval=18446744073709551616s"
            ),
            (
                "file://some-uri#polling_interval=18446744073709551616s".to_string(),
                None
            )
        );
        assert_eq!(
            extract_polling_interval_from_uri("file://some-uri#polling_interval=0s"),
            ("file://some-uri#polling_interval=0s".to_string(), None)
        );
        assert_eq!(
            extract_polling_interval_from_uri("file://some-uri#otherfragment#polling_interval=10s"),
            (
                "file://some-uri#otherfragment".to_string(),
                Some(Duration::from_secs(10))
            )
        );
    }
}


================================================
FILE: quickwit/quickwit-metastore/src/metastore/file_backed/index_id_matcher.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use quickwit_config::validate_index_id_pattern;
use quickwit_proto::metastore::{MetastoreError, MetastoreResult};
use regex::RegexSet;
use regex_syntax::escape_into;

pub(super) type IndexIdPattern = String;

#[derive(Debug)]
pub(super) struct IndexIdMatcher {
    positive_matcher: RegexSet,
    negative_matcher: RegexSet,
}

impl IndexIdMatcher {
    /// Builds an [`IndexIdMatcher`] from an set of index ID patterns using the following rules:
    /// - If the given pattern does not contain a `*` char, it matches the exact pattern.
    /// - If the given pattern contains one or more `*`, it matches the regex built from a regex
    ///   where `*` is replaced by `.*`. All other regular expression meta characters are escaped.
    pub fn try_from_index_id_patterns(
        index_id_patterns: &[IndexIdPattern],
    ) -> MetastoreResult<Self> {
        let mut positive_patterns: Vec<&str> = Vec::new();
        let mut negative_patterns: Vec<&str> = Vec::new();

        for pattern in index_id_patterns {
            if let Some(negative_pattern) = pattern.strip_prefix('-') {
                negative_patterns.push(negative_pattern);
            } else {
                positive_patterns.push(pattern);
            }
        }
        if positive_patterns.is_empty() {
            let message = "failed to build index ID matcher: at least one positive index ID \
                           pattern must be provided"
                .to_string();
            return Err(MetastoreError::InvalidArgument { message });
        }
        let positive_matcher = build_regex_set(&positive_patterns)?;
        let negative_matcher = build_regex_set(&negative_patterns)?;

        let matcher = IndexIdMatcher {
            positive_matcher,
            negative_matcher,
        };
        Ok(matcher)
    }

    pub fn is_match(&self, index_id: &str) -> bool {
        self.positive_matcher.is_match(index_id) && !self.negative_matcher.is_match(index_id)
    }
}

fn build_regex_set(patterns: &[&str]) -> MetastoreResult<RegexSet> {
    for pattern in patterns {
        if *pattern == "*" {
            let regex_set = RegexSet::new([".*"]).expect("regular expression set should compile");
            return Ok(regex_set);
        }
        validate_index_id_pattern(pattern, false).map_err(|error| {
            let message = format!("failed to build index ID matcher: {error}");
            MetastoreError::InvalidArgument { message }
        })?;
    }
    let regexes = patterns.iter().map(|pattern| build_regex(pattern));

    let regex_set = RegexSet::new(regexes).map_err(|error| {
        let message = format!("failed to build index ID matcher: {error}");
        MetastoreError::InvalidArgument { message }
    })?;
    Ok(regex_set)
}

fn build_regex(pattern: &str) -> String {
    let mut regex = String::new();
    regex.push('^');

    for (idx, part) in pattern.split('*').enumerate() {
        if idx > 0 {
            regex.push_str(".*");
        }
        escape_into(part, &mut regex);
    }
    regex.push('$');
    regex
}

#[cfg(test)]
mod tests {
    use super::*;

    #[test]
    fn test_build_regex() {
        let regex = build_regex("");
        assert_eq!(regex, r"^$");

        let regex = build_regex("*");
        assert_eq!(regex, r"^.*$");

        let regex = build_regex("index-1");
        assert_eq!(regex, r"^index\-1$");

        let regex = build_regex("*-index-*-1");
        assert_eq!(regex, r"^.*\-index\-.*\-1$");

        let regex = build_regex("INDEX.2*-1");
        assert_eq!(regex, r"^INDEX\.2.*\-1$");
    }

    #[test]
    fn test_build_regex_set() {
        let error = build_regex_set(&["_index-1"]).unwrap_err();
        assert!(matches!(error, MetastoreError::InvalidArgument { .. }));

        let regex_set = build_regex_set(&["index-1"]).unwrap();
        assert!(regex_set.is_match("index-1"));
        assert!(!regex_set.is_match("index-2"));

        let regex_set = build_regex_set(&["index-1", "index-2"]).unwrap();
        assert!(regex_set.is_match("index-1"));
        assert!(regex_set.is_match("index-2"));
        assert!(!regex_set.is_match("index-3"));

        let regex_set = build_regex_set(&["index-1*"]).unwrap();
        assert!(regex_set.is_match("index-1"));
        assert!(regex_set.is_match("index-10"));
        assert!(!regex_set.is_match("index-2"));
    }

    #[test]
    fn test_index_id_matcher() {
        let error = IndexIdMatcher::try_from_index_id_patterns(&[]).unwrap_err();
        assert!(matches!(error, MetastoreError::InvalidArgument { .. }));

        let matcher = IndexIdMatcher::try_from_index_id_patterns(&[
            "index-foo*".to_string(),
            "-index-foobar".to_string(),
        ])
        .unwrap();
        assert!(matcher.is_match("index-foo"));
        assert!(matcher.is_match("index-fooo"));
        assert!(!matcher.is_match("index-foobar"));
    }
}


================================================
FILE: quickwit/quickwit-metastore/src/metastore/file_backed/index_template_matcher.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use quickwit_config::{IndexTemplate, IndexTemplateId};
use quickwit_proto::metastore::MetastoreResult;

use super::index_id_matcher::IndexIdMatcher;

struct InnerMatcher {
    template_id: IndexTemplateId,
    priority: usize,
    matcher: IndexIdMatcher,
}

impl InnerMatcher {
    /// Compares two matchers by (-<priority>, <template ID>)
    fn cmp_by_priority_desc(&self, other: &Self) -> std::cmp::Ordering {
        self.priority
            .cmp(&other.priority)
            .reverse()
            .then_with(|| self.template_id.cmp(&other.template_id))
    }

    fn is_match(&self, index_id: &str) -> bool {
        self.matcher.is_match(index_id)
    }
}

/// Finds the best matching index template for a given index ID. The matching algorithm is naive and
/// should be improved to support a large number of templates, should the need arise. It maintains a
/// list of index templates matchers sorted by priority and performs a linear search returning the
/// first match.
#[derive(Default)]
pub(super) struct IndexTemplateMatcher {
    inner_matchers: Vec<InnerMatcher>,
}

impl IndexTemplateMatcher {
    pub fn try_from_index_templates<'a>(
        templates: impl Iterator<Item = &'a IndexTemplate> + 'a,
    ) -> MetastoreResult<Self> {
        let mut inner_matchers = Vec::new();

        for template in templates {
            let matcher = IndexIdMatcher::try_from_index_id_patterns(&template.index_id_patterns)?;
            let inner_matcher = InnerMatcher {
                template_id: template.template_id.clone(),
                priority: template.priority,
                matcher,
            };
            inner_matchers.push(inner_matcher);
        }
        let mut matcher = Self { inner_matchers };
        matcher.sort_by_priority_desc();

        Ok(matcher)
    }

    pub fn insert(&mut self, template: &IndexTemplate) -> MetastoreResult<()> {
        let matcher = IndexIdMatcher::try_from_index_id_patterns(&template.index_id_patterns)?;
        let inner_matcher = InnerMatcher {
            template_id: template.template_id.clone(),
            priority: template.priority,
            matcher,
        };
        self.inner_matchers.push(inner_matcher);
        self.sort_by_priority_desc();

        Ok(())
    }

    pub fn remove(&mut self, template_id: &str) {
        self.inner_matchers
            .retain(|matcher| matcher.template_id != *template_id);
    }

    pub fn find_match(&self, index_id: &str) -> Option<IndexTemplateId> {
        self.inner_matchers
            .iter()
            .find(|inner_matcher| inner_matcher.is_match(index_id))
            .map(|inner_matcher| inner_matcher.template_id.clone())
    }

    fn sort_by_priority_desc(&mut self) {
        self.inner_matchers
            .sort_unstable_by(InnerMatcher::cmp_by_priority_desc)
    }
}

#[cfg(test)]
mod tests {
    use super::*;

    #[test]
    fn test_index_template_matcher() {
        let index_template_bar =
            IndexTemplate::for_test("test-template-bar", &["test-index-bar*"], 0);
        let index_template_foo =
            IndexTemplate::for_test("test-template-foo", &["test-index-foo*"], 100);
        let index_template_foobar =
            IndexTemplate::for_test("test-template-foobar", &["test-index-foobar*"], 200);

        let mut matcher = IndexTemplateMatcher::default();
        matcher.insert(&index_template_foo).unwrap();
        matcher.insert(&index_template_bar).unwrap();

        assert_eq!(
            matcher.find_match("test-index-bar-1").unwrap(),
            "test-template-bar"
        );
        assert_eq!(
            matcher.find_match("test-index-foobar").unwrap(),
            "test-template-foo"
        );
        assert_eq!(
            matcher.find_match("test-index-foo").unwrap(),
            "test-template-foo"
        );

        matcher.insert(&index_template_foobar).unwrap();
        assert_eq!(
            matcher.find_match("test-index-foobar").unwrap(),
            "test-template-foobar"
        );

        matcher.remove("test-template-foobar");
        assert_eq!(
            matcher.find_match("test-index-foobar").unwrap(),
            "test-template-foo"
        );

        matcher.remove("test-template-foo");
        assert!(matcher.find_match("test-index-foobar").is_none())
    }
}


================================================
FILE: quickwit/quickwit-metastore/src/metastore/file_backed/lazy_file_backed_index.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::sync::{Arc, Weak};
use std::time::Duration;

use quickwit_proto::metastore::{EntityKind, MetastoreError, MetastoreResult};
use quickwit_proto::types::IndexId;
use quickwit_storage::Storage;
use tokio::sync::{Mutex, OnceCell};
use tracing::error;

use super::file_backed_index::FileBackedIndex;
use super::store_operations::{METASTORE_FILE_NAME, load_index};

/// Lazy [`FileBackedIndex`]. It loads a `FileBackedIndex` on demand. When the index is first
/// loaded, it optionally spawns a task to periodically poll the storage and update the index.
pub(crate) struct LazyFileBackedIndex {
    index_id: IndexId,
    storage: Arc<dyn Storage>,
    polling_interval_opt: Option<Duration>,
    lazy_index: OnceCell<Arc<Mutex<FileBackedIndex>>>,
}

impl LazyFileBackedIndex {
    /// Create `LazyFileBackedIndex`.
    pub fn new(
        storage: Arc<dyn Storage>,
        index_id: IndexId,
        polling_interval_opt: Option<Duration>,
        file_backed_index: Option<FileBackedIndex>,
    ) -> Self {
        let index_mutex_opt = file_backed_index.map(|index| Arc::new(Mutex::new(index)));
        // If the polling interval is configured and the index is already loaded,
        // spawn immediately the polling task
        if let Some(index_mutex) = &index_mutex_opt
            && let Some(polling_interval) = polling_interval_opt
        {
            spawn_index_metadata_polling_task(
                storage.clone(),
                index_id.clone(),
                Arc::downgrade(index_mutex),
                polling_interval,
            );
        }
        Self {
            index_id,
            storage,
            polling_interval_opt,
            lazy_index: OnceCell::new_with(index_mutex_opt),
        }
    }

    /// Gets a synchronized `FileBackedIndex`. If the index wasn't provided on creation, we load it
    /// lazily on the first call of this method.
    pub async fn get(&self) -> MetastoreResult<Arc<Mutex<FileBackedIndex>>> {
        self.lazy_index
            .get_or_try_init(|| async move {
                let index = load_index(&*self.storage, &self.index_id).await?;
                let index_mutex = Arc::new(Mutex::new(index));
                // When the index is loaded lazily, the polling task is not started in the
                // constructor so we do it here when the index is actually loaded.
                if let Some(polling_interval) = self.polling_interval_opt {
                    spawn_index_metadata_polling_task(
                        self.storage.clone(),
                        self.index_id.clone(),
                        Arc::downgrade(&index_mutex),
                        polling_interval,
                    );
                }
                Ok(index_mutex)
            })
            .await
            .cloned()
    }
}

async fn poll_index_metadata_once(
    storage: &dyn Storage,
    index_id: &str,
    index_mutex: &Mutex<FileBackedIndex>,
) {
    let mut locked_index = index_mutex.lock().await;
    if locked_index.flip_recently_modified_down() {
        return;
    }
    let load_index_result = load_index(storage, index_id).await;

    match load_index_result {
        Ok(index) => {
            *locked_index = index;
        }
        Err(MetastoreError::NotFound(EntityKind::Index { .. })) => {
            // The index has been deleted by the file-backed metastore holding a reference to this
            // index. When it removes an index, it does so without holding the lock on the target
            // index. As a result, the associated polling task may run for one
            // more iteration before exiting and `load_index` returns a `NotFound` error.
        }
        Err(metastore_error) => {
            error!(
                error=%metastore_error,
                "failed to load index metadata from metastore file located at `{}/{index_id}/{METASTORE_FILE_NAME}`",
                storage.uri()
            );
        }
    }
}

fn spawn_index_metadata_polling_task(
    storage: Arc<dyn Storage>,
    index_id: IndexId,
    metastore_weak: Weak<Mutex<FileBackedIndex>>,
    polling_interval: Duration,
) {
    tokio::task::spawn(async move {
        let mut interval = tokio::time::interval(polling_interval);
        interval.set_missed_tick_behavior(tokio::time::MissedTickBehavior::Delay);
        interval.tick().await; //< this is to prevent fetch right after the first population of the data.

        while let Some(metadata_mutex) = metastore_weak.upgrade() {
            interval.tick().await;
            poll_index_metadata_once(&*storage, &index_id, &metadata_mutex).await;
        }
    });
}


================================================
FILE: quickwit/quickwit-metastore/src/metastore/file_backed/manifest.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::{BTreeMap, HashMap};
use std::path::Path;

use itertools::Itertools;
use quickwit_common::uri::Uri;
use quickwit_config::{IndexTemplate, IndexTemplateId};
use quickwit_proto::metastore::{MetastoreError, MetastoreResult, serde_utils};
use quickwit_proto::types::{DocMappingUid, IndexId};
use quickwit_storage::{OwnedBytes, Storage, StorageError, StorageErrorKind, StorageResult};
use serde::{Deserialize, Serialize};
use tracing::error;
use uuid::Uuid;

pub(super) const MANIFEST_FILE_NAME: &str = "manifest.json";

// The legacy manifest file was deprecated in 0.8.0, we can drop support for it in 0.10.0 or 0.11.0.
const LEGACY_MANIFEST_FILE_NAME: &str = "indexes_states.json";

#[derive(Clone, Debug, Deserialize)]
struct LegacyManifest {
    #[serde(default, flatten)]
    indexes: BTreeMap<IndexId, IndexStatus>,
}

impl LegacyManifest {
    fn into_manifest(self) -> Manifest {
        Manifest {
            indexes: self.indexes,
            templates: HashMap::new(),
            identity: Uuid::nil(),
        }
    }
}

// TODO: Remove the aliases once we drop support for the legacy manifest file.
#[derive(Clone, Copy, Debug, Eq, PartialEq, Serialize, Deserialize)]
#[serde(rename_all = "snake_case")]
pub(crate) enum IndexStatus {
    #[serde(alias = "Creating")]
    Creating,
    #[serde(alias = "Alive")]
    Active,
    #[serde(alias = "Deleting")]
    Deleting,
}

#[derive(Clone, Debug, Default, PartialEq, Serialize, Deserialize)]
#[serde(into = "VersionedManifest")]
#[serde(from = "VersionedManifest")]
pub(crate) struct Manifest {
    pub indexes: BTreeMap<IndexId, IndexStatus>,
    // The templates are serialized as a sorted `Vec<IndexTemplate>` so the btree map is
    // unnecessary here and we can pass the hash map as is to the `MetastoreState`
    pub templates: HashMap<IndexTemplateId, IndexTemplate>,
    pub identity: Uuid,
}

#[derive(Clone, Debug, Serialize, Deserialize)]
#[serde(tag = "version")]
enum VersionedManifest {
    // The two versions use the same format but for v0.8 and below, we need to set the
    // `doc_mapping_uid` to the nil value upon deserialization.
    #[serde(rename = "0.9")]
    V0_9(ManifestV0_8),
    #[serde(alias = "0.8")]
    #[serde(alias = "0.7")]
    V0_8(ManifestV0_8),
}

impl From<Manifest> for VersionedManifest {
    fn from(manifest: Manifest) -> Self {
        VersionedManifest::V0_9(manifest.into())
    }
}

impl From<VersionedManifest> for Manifest {
    fn from(versioned_manifest: VersionedManifest) -> Self {
        match versioned_manifest {
            VersionedManifest::V0_8(mut manifest) => {
                for template in &mut manifest.templates {
                    // Override the randomly generated doc mapping UID with the nil value.
                    template.doc_mapping.doc_mapping_uid = DocMappingUid::default();
                }
                manifest.into()
            }
            VersionedManifest::V0_9(manifest) => manifest.into(),
        }
    }
}

#[derive(Clone, Debug, Serialize, Deserialize)]
struct ManifestV0_8 {
    indexes: BTreeMap<IndexId, IndexStatus>,
    templates: Vec<IndexTemplate>,
    #[serde(default, skip_serializing_if = "Uuid::is_nil")]
    identity: Uuid,
}

impl From<Manifest> for ManifestV0_8 {
    fn from(manifest: Manifest) -> Self {
        let templates = manifest
            .templates
            .into_values()
            .sorted_unstable_by(|left, right| left.template_id.cmp(&right.template_id))
            .collect();
        ManifestV0_8 {
            indexes: manifest.indexes,
            templates,
            identity: manifest.identity,
        }
    }
}

impl From<ManifestV0_8> for Manifest {
    fn from(manifest: ManifestV0_8) -> Self {
        let indexes = manifest.indexes.into_iter().collect();
        let templates = manifest
            .templates
            .into_iter()
            .map(|template| (template.template_id.clone(), template))
            .collect();
        Manifest {
            indexes,
            templates,
            identity: manifest.identity,
        }
    }
}

#[cfg(any(test, feature = "testsuite"))]
impl quickwit_config::TestableForRegression for Manifest {
    fn sample_for_regression() -> Self {
        let mut indexes = BTreeMap::new();
        indexes.insert("test-index-1".to_string(), IndexStatus::Creating);
        indexes.insert("test-index-2".to_string(), IndexStatus::Active);
        indexes.insert("test-index-3".to_string(), IndexStatus::Deleting);

        let mut templates = HashMap::new();
        templates.insert(
            "test-template-1".to_string(),
            IndexTemplate::sample_for_regression(),
        );
        Manifest {
            indexes,
            templates,
            identity: Uuid::nil(),
        }
    }

    fn assert_equality(&self, other: &Self) {
        assert_eq!(self.indexes, other.indexes);
        assert_eq!(self.templates, other.templates);
    }
}

pub(super) async fn load_or_create_manifest(storage: &dyn Storage) -> MetastoreResult<Manifest> {
    if file_exists(storage, MANIFEST_FILE_NAME).await? {
        let manifest_json = get_bytes(storage, MANIFEST_FILE_NAME).await?;
        let manifest: Manifest = serde_utils::from_json_bytes(&manifest_json)?;
        return Ok(manifest);
    }
    if file_exists(storage, LEGACY_MANIFEST_FILE_NAME).await? {
        let legacy_manifest_json = get_bytes(storage, LEGACY_MANIFEST_FILE_NAME).await?;
        let legacy_manifest: LegacyManifest = serde_utils::from_json_bytes(&legacy_manifest_json)?;
        let manifest = legacy_manifest.into_manifest();
        save_manifest(storage, &manifest).await?;

        if let Err(storage_error) = delete_file(storage, LEGACY_MANIFEST_FILE_NAME).await {
            error!(
                error=%storage_error,
                "failed to delete legacy manifest file located at `{}/{LEGACY_MANIFEST_FILE_NAME}`", storage.uri()
            );
        }
        return Ok(manifest);
    }
    let manifest = Manifest::default();
    save_manifest(storage, &manifest).await?;
    Ok(manifest)
}

pub(super) async fn save_manifest(
    storage: &dyn Storage,
    manifest: &Manifest,
) -> MetastoreResult<()> {
    let manifest_json_bytes = serde_utils::to_json_bytes_pretty(manifest)?;
    put_bytes(storage, MANIFEST_FILE_NAME, manifest_json_bytes).await?;
    Ok(())
}

async fn delete_file(storage: &dyn Storage, path: &str) -> StorageResult<()> {
    storage.delete(Path::new(path)).await?;
    Ok(())
}

async fn file_exists(storage: &dyn Storage, path_str: &str) -> MetastoreResult<bool> {
    let path = Path::new(path_str);
    let exists = storage.exists(path).await.map_err(|storage_error| {
        into_metastore_error(storage_error, storage.uri(), path, "list")
    })?;
    Ok(exists)
}

async fn get_bytes(storage: &dyn Storage, path_str: &str) -> MetastoreResult<OwnedBytes> {
    let path = Path::new(path_str);
    let bytes = storage.get_all(path).await.map_err(|storage_error| {
        into_metastore_error(storage_error, storage.uri(), path, "load")
    })?;
    Ok(bytes)
}

async fn put_bytes(storage: &dyn Storage, path_str: &str, content: Vec<u8>) -> MetastoreResult<()> {
    let path = Path::new(path_str);
    storage
        .put(path, Box::new(content))
        .await
        .map_err(|storage_error| {
            into_metastore_error(storage_error, storage.uri(), path, "save")
        })?;
    Ok(())
}

fn into_metastore_error(
    storage_error: StorageError,
    uri: &Uri,
    path: &Path,
    operation_name: &str,
) -> MetastoreError {
    match storage_error.kind() {
        StorageErrorKind::Unauthorized => MetastoreError::Forbidden {
            message: format!(
                "failed to access manifest file located at `{uri}/{}`: unauthorized",
                path.display()
            ),
        },
        _ => MetastoreError::Internal {
            message: format!(
                "failed to {operation_name} manifest file located at `{uri}/{}`",
                path.display()
            ),
            cause: storage_error.to_string(),
        },
    }
}

#[cfg(test)]
mod tests {
    use serde_json::json;

    use super::*;

    #[test]
    fn test_legacy_manifest_deserialization() {
        let legacy_manifest_json = r#"{
            "test-index-1": "Creating",
            "test-index-2": "Alive",
            "test-index-3": "Deleting"
        }
        "#;
        let legacy_manifest: LegacyManifest = serde_json::from_str(legacy_manifest_json).unwrap();
        assert_eq!(legacy_manifest.indexes.len(), 3);

        assert_eq!(
            legacy_manifest.indexes.get("test-index-1").unwrap(),
            &IndexStatus::Creating
        );
        assert_eq!(
            legacy_manifest.indexes.get("test-index-2").unwrap(),
            &IndexStatus::Active
        );
        assert_eq!(
            legacy_manifest.indexes.get("test-index-3").unwrap(),
            &IndexStatus::Deleting
        );
    }

    #[test]
    fn test_legacy_manifest_into_manifest() {
        let legacy_manifest = LegacyManifest {
            indexes: vec![
                ("test-index-1".to_string(), IndexStatus::Creating),
                ("test-index-2".to_string(), IndexStatus::Active),
                ("test-index-3".to_string(), IndexStatus::Deleting),
            ]
            .into_iter()
            .collect(),
        };
        let manifest = legacy_manifest.into_manifest();

        assert_eq!(manifest.indexes.len(), 3);
        assert_eq!(manifest.templates.len(), 0);

        assert_eq!(
            manifest.indexes.get("test-index-1").unwrap(),
            &IndexStatus::Creating
        );
        assert_eq!(
            manifest.indexes.get("test-index-2").unwrap(),
            &IndexStatus::Active
        );
        assert_eq!(
            manifest.indexes.get("test-index-3").unwrap(),
            &IndexStatus::Deleting
        );
    }

    #[test]
    fn test_manifest_serde() {
        let indexes = BTreeMap::from_iter([
            ("test-index-1".to_string(), IndexStatus::Creating),
            ("test-index-2".to_string(), IndexStatus::Active),
            ("test-index-3".to_string(), IndexStatus::Deleting),
        ]);
        let templates = HashMap::from_iter([
            (
                "test-template-1".to_string(),
                IndexTemplate::for_test("test-template-1", &["test-index-foo*"], 100),
            ),
            (
                "test-template-2".to_string(),
                IndexTemplate::for_test("test-template-2", &["test-index-bar*"], 200),
            ),
        ]);
        let manifest = Manifest {
            indexes,
            templates,
            identity: Uuid::nil(),
        };
        let manifest_json = serde_json::to_string_pretty(&manifest).unwrap();
        let manifest_deserialized: Manifest = serde_json::from_str(&manifest_json).unwrap();
        assert_eq!(manifest, manifest_deserialized);
    }

    #[tokio::test]
    async fn test_create_mutate_save_load_manifest() {
        let storage = quickwit_storage::storage_for_test();
        let mut manifest = load_or_create_manifest(&*storage).await.unwrap();

        assert_eq!(manifest.indexes.len(), 0);
        assert_eq!(manifest.templates.len(), 0);

        let empty_manifest_size = storage
            .get_all(Path::new(MANIFEST_FILE_NAME))
            .await
            .unwrap()
            .len();
        assert!(empty_manifest_size > 0);

        manifest
            .indexes
            .insert("test-index".to_string(), IndexStatus::Creating);
        manifest.templates.insert(
            "test-template".to_string(),
            IndexTemplate::for_test("test-template", &["test-index-*"], 100),
        );

        save_manifest(&*storage, &manifest).await.unwrap();

        let populated_manifest_size = storage
            .get_all(Path::new(MANIFEST_FILE_NAME))
            .await
            .unwrap()
            .len();
        assert!(populated_manifest_size > empty_manifest_size);

        let manifest = load_or_create_manifest(&*storage).await.unwrap();
        assert_eq!(manifest.indexes.len(), 1);
        assert_eq!(
            manifest.indexes.get("test-index").unwrap(),
            &IndexStatus::Creating
        );

        assert_eq!(manifest.templates.len(), 1);

        let template = manifest.templates.get("test-template").unwrap();
        assert_eq!(template.template_id, "test-template");
        assert_eq!(template.index_id_patterns, ["test-index-*"]);
        assert_eq!(template.priority, 100);
    }

    #[tokio::test]
    async fn test_legacy_manifest_migration() {
        let storage = quickwit_storage::storage_for_test();
        let legacy_manifest_json = json!(
            {
                "test-index-1": "Creating",
                "test-index-2": "Alive",
                "test-index-3": "Deleting"
            }
        );
        let legacy_manifest_json_bytes = serde_json::to_vec(&legacy_manifest_json).unwrap();

        put_bytes(
            &*storage,
            LEGACY_MANIFEST_FILE_NAME,
            legacy_manifest_json_bytes,
        )
        .await
        .unwrap();

        let manifest = load_or_create_manifest(&*storage).await.unwrap();
        assert_eq!(manifest.indexes.len(), 3);
        assert_eq!(manifest.templates.len(), 0);

        assert_eq!(
            manifest.indexes.get("test-index-1").unwrap(),
            &IndexStatus::Creating
        );
        assert_eq!(
            manifest.indexes.get("test-index-2").unwrap(),
            &IndexStatus::Active
        );
        assert_eq!(
            manifest.indexes.get("test-index-3").unwrap(),
            &IndexStatus::Deleting
        );

        let legacy_manifest_exists = file_exists(&*storage, LEGACY_MANIFEST_FILE_NAME)
            .await
            .unwrap();
        assert!(!legacy_manifest_exists);

        let manifest_exists = file_exists(&*storage, MANIFEST_FILE_NAME).await.unwrap();
        assert!(manifest_exists);
    }
}


================================================
FILE: quickwit/quickwit-metastore/src/metastore/file_backed/mod.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

//! Module for [`FileBackedMetastore`]. It is public so that the crate `quickwit-backward-compat`
//! can import [`FileBackedIndex`] and run backward-compatibility tests. You should not have to
//! import anything from here directly.

pub mod file_backed_index;
mod file_backed_metastore_factory;
mod index_id_matcher;
mod index_template_matcher;
mod lazy_file_backed_index;
pub(crate) mod manifest;
mod state;
mod store_operations;

use core::fmt;
use std::collections::HashMap;
use std::collections::hash_map::Entry;
use std::path::Path;
use std::sync::Arc;
use std::time::Duration;

use async_trait::async_trait;
use futures::StreamExt;
use futures::future::try_join_all;
use futures::stream::FuturesUnordered;
use itertools::Itertools;
use quickwit_common::ServiceStream;
use quickwit_config::IndexTemplate;
use quickwit_proto::metastore::{
    AcquireShardsRequest, AcquireShardsResponse, AddSourceRequest, CreateIndexRequest,
    CreateIndexResponse, CreateIndexTemplateRequest, DeleteIndexRequest,
    DeleteIndexTemplatesRequest, DeleteQuery, DeleteShardsRequest, DeleteShardsResponse,
    DeleteSourceRequest, DeleteSplitsRequest, DeleteTask, EmptyResponse, EntityKind,
    FindIndexTemplateMatchesRequest, FindIndexTemplateMatchesResponse, GetClusterIdentityRequest,
    GetClusterIdentityResponse, GetIndexTemplateRequest, GetIndexTemplateResponse,
    IndexMetadataFailure, IndexMetadataFailureReason, IndexMetadataRequest, IndexMetadataResponse,
    IndexTemplateMatch, IndexesMetadataRequest, IndexesMetadataResponse, LastDeleteOpstampRequest,
    LastDeleteOpstampResponse, ListDeleteTasksRequest, ListDeleteTasksResponse,
    ListIndexStatsRequest, ListIndexStatsResponse, ListIndexTemplatesRequest,
    ListIndexTemplatesResponse, ListIndexesMetadataRequest, ListIndexesMetadataResponse,
    ListShardsRequest, ListShardsResponse, ListSplitsRequest, ListSplitsResponse,
    ListStaleSplitsRequest, MarkSplitsForDeletionRequest, MetastoreError, MetastoreResult,
    MetastoreService, MetastoreServiceStream, OpenShardSubrequest, OpenShardsRequest,
    OpenShardsResponse, PruneShardsRequest, PublishSplitsRequest, ResetSourceCheckpointRequest,
    StageSplitsRequest, ToggleSourceRequest, UpdateIndexRequest, UpdateSourceRequest,
    UpdateSplitsDeleteOpstampRequest, UpdateSplitsDeleteOpstampResponse, serde_utils,
};
use quickwit_proto::types::{IndexId, IndexUid};
use quickwit_storage::Storage;
use time::OffsetDateTime;
use tokio::sync::{Mutex, OwnedMutexGuard, RwLock};
use ulid::Ulid;
use uuid::Uuid;

use self::file_backed_index::FileBackedIndex;
pub use self::file_backed_metastore_factory::FileBackedMetastoreFactory;
use self::index_id_matcher::IndexIdMatcher;
use self::lazy_file_backed_index::LazyFileBackedIndex;
use self::manifest::{MANIFEST_FILE_NAME, load_or_create_manifest, save_manifest};
use self::state::MetastoreState;
use self::store_operations::{delete_index, index_exists, load_index, put_index};
use super::{
    AddSourceRequestExt, CreateIndexRequestExt, IndexMetadataResponseExt,
    IndexesMetadataResponseExt, ListIndexesMetadataResponseExt, ListSplitsRequestExt,
    ListSplitsResponseExt, PublishSplitsRequestExt, STREAM_SPLITS_CHUNK_SIZE,
    StageSplitsRequestExt, UpdateIndexRequestExt, UpdateSourceRequestExt,
};
use crate::checkpoint::IndexCheckpointDelta;
use crate::{IndexMetadata, ListSplitsQuery, MetastoreServiceExt, Split, SplitState};

/// Status of an index tracked by the metastore.
pub(crate) enum LazyIndexStatus {
    /// The index is being created but its metadata have yet to be written on the storage.
    Creating,
    /// The index is created and available.
    Active(LazyFileBackedIndex),
    /// The index is being deleted and but its index metadata file has not yet been removed from
    /// storage.
    Deleting,
}

#[derive(Debug)]
pub(crate) enum MutationOccurred<T> {
    Yes(T),
    No(T),
}

impl From<bool> for MutationOccurred<()> {
    fn from(mutation_occurred: bool) -> Self {
        if mutation_occurred {
            Self::Yes(())
        } else {
            Self::No(())
        }
    }
}

/// A metastore implementation that stores all the metadata associated to each index
/// into as many files and stores a map of indexes
/// (index_id, index_status) in a dedicated file `manifest.json`.
///
/// A [`LazyIndexStatus`] describes the lifecycle of an index: [`LazyIndexStatus::Creating`] and
/// [`LazyIndexStatus::Deleting`] are transitioning states that indicates that the index is not
/// yet available. On the contrary, the [`LazyIndexStatus::Active`] status indicates the index is
/// ready to be fetched and updated.
///
/// Transitioning states are useful to track inconsistencies between the in-memory and on-disk data
/// structures when error(s) occur during index creations and deletions:
/// - `Creating` indicates that the metastore updated the manifest file with this state but not yet
///   the index metadata file;
/// - `Deleting` indicates that the metastore updated the manifest file with this state but the
///   index metadata file is not yet deleted.
///
/// !!! Important note: the indexes map manifest does not
/// guarantee exhaustivity: an index metadata file can be on the storage
/// but not present in the states map. As the map is incomplete, the metastore
/// does not rely on it to check index existence, this leads to following
/// implementations:
/// - on creation, the metastore always checks if an index metadata file is already present on the
///   storage even if the index is not in the indexes map;
/// - on get/update of an index, same story, the metastore checks if index is on the storage and if
///   present, the index is loaded in the map and returned /modified;
/// - on deletion, same story, the metastore deletes an index metadata file present on the storage
///   even if the index is not in the map.
///
/// !!! Important note 2: it is strongly advised to restrict the `FileBackedMetastore`
/// usage to the following use cases:
/// - testing;
/// - single-node environment;
/// - multiple-nodes environment with only one writer and readers. In this case, you must be very
///   cautious and ensure that your readers are really readers.
#[derive(Clone)]
pub struct FileBackedMetastore {
    state: Arc<RwLock<MetastoreState>>,
    storage: Arc<dyn Storage>,
    polling_interval_opt: Option<Duration>,
}

impl fmt::Debug for FileBackedMetastore {
    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
        f.debug_struct("FileBackedMetastore")
            .field("storage_uri", self.storage.uri())
            .field("polling_interval_opt", &self.polling_interval_opt)
            .finish()
    }
}

impl FileBackedMetastore {
    /// Creates a [`FileBackedMetastore`] for tests.
    #[doc(hidden)]
    pub fn for_test(storage: Arc<dyn Storage>) -> Self {
        Self {
            state: Default::default(),
            storage,
            polling_interval_opt: None,
        }
    }

    /// Sets the polling interval.
    ///
    /// Only newly accessed indexes will be affected by the change of this setting.
    pub fn set_polling_interval(&mut self, polling_interval_opt: Option<Duration>) {
        self.polling_interval_opt = polling_interval_opt;
    }

    /// Return the underlying storage.
    ///
    /// This is only build in tests to verify the metastore did indeed store what it should.
    /// It shouldn't be relied uppon elsewhere as to not break abstractions.
    #[cfg(test)]
    pub fn storage(&self) -> Arc<dyn Storage> {
        self.storage.clone()
    }

    /// Creates a [`FileBackedMetastore`] for a specified storage, immediately loading the manifest
    /// file.
    pub async fn try_new(
        storage: Arc<dyn Storage>,
        polling_interval_opt: Option<Duration>,
    ) -> MetastoreResult<Self> {
        let manifest = load_or_create_manifest(&*storage).await?;
        let state =
            MetastoreState::try_from_manifest(storage.clone(), manifest, polling_interval_opt)?;
        let metastore = Self {
            state: Arc::new(RwLock::new(state)),
            storage,
            polling_interval_opt,
        };
        Ok(metastore)
    }

    async fn mutate<T>(
        &self,
        index_uid: &IndexUid,
        mutate_fn: impl FnOnce(&mut FileBackedIndex) -> MetastoreResult<MutationOccurred<T>>,
    ) -> MetastoreResult<T> {
        let index_id = &index_uid.index_id;
        let mut locked_index = self.get_locked_index(index_id).await?;
        if locked_index.index_uid() != index_uid {
            return Err(MetastoreError::NotFound(EntityKind::Index {
                index_id: index_id.to_string(),
            }));
        }
        let mut index = locked_index.clone();

        let value = match mutate_fn(&mut index)? {
            MutationOccurred::Yes(value) => value,
            MutationOccurred::No(value) => {
                return Ok(value);
            }
        };
        locked_index.set_recently_modified();

        let put_result = put_index(&*self.storage, &index).await;
        match put_result {
            Ok(()) => {
                *locked_index = index;
                Ok(value)
            }
            Err(error) => {
                // For some of the error type here, we cannot know for sure
                // whether the content was written or not.
                //
                // Just to be sure, let's discard the cache.
                let mut state_wlock_guard = self.state.write().await;

                // At this point, we hold both locks.
                state_wlock_guard.indexes.insert(
                    index_id.to_string(),
                    LazyIndexStatus::Active(LazyFileBackedIndex::new(
                        self.storage.clone(),
                        index_id.to_string(),
                        self.polling_interval_opt,
                        None,
                    )),
                );
                locked_index.discarded = true;
                Err(error)
            }
        }
    }

    async fn read<T, F>(&self, index_uid: &IndexUid, view: F) -> MetastoreResult<T>
    where F: FnOnce(&FileBackedIndex) -> MetastoreResult<T> {
        self.read_any(
            index_uid.index_id.as_str(),
            Some(index_uid.incarnation_id),
            view,
        )
        .await
    }

    /// Reads the index metadata given an `index_id`. The difference with `read` it that
    /// this function does necessarily take a incarnation id, so that it is less strict.
    async fn read_any<T>(
        &self,
        index_id: &str,
        incarnation_id_opt: Option<Ulid>,
        view: impl FnOnce(&FileBackedIndex) -> MetastoreResult<T>,
    ) -> MetastoreResult<T> {
        let locked_index = self.get_locked_index(index_id).await?;
        if let Some(incarnation_id) = incarnation_id_opt
            && locked_index.index_uid().incarnation_id != incarnation_id
        {
            return Err(MetastoreError::NotFound(EntityKind::Index {
                index_id: index_id.to_string(),
            }));
        }
        view(&locked_index)
    }

    /// Returns a valid locked index.
    ///
    /// This function guarantees that it has not been
    /// marked as discarded.
    async fn get_locked_index(
        &self,
        index_id: &str,
    ) -> MetastoreResult<OwnedMutexGuard<FileBackedIndex>> {
        loop {
            let index = self.index(index_id).await?;
            let locked_index = index.lock_owned().await;

            if !locked_index.discarded {
                return Ok(locked_index);
            }
        }
    }

    /// Returns a FileBackedIndex for the given index_id.
    ///
    /// If `index_id` is in a transitioning state `Creating` or `Deleting`, it will
    /// trigger an error.
    /// If `index_id` is not yet in `per_index_metastores` map,
    /// a fetch to the storage will be initiated and might trigger an error.
    ///
    /// For a given index_id, only copies of the same index_view are returned.
    async fn index(&self, index_id: &str) -> MetastoreResult<Arc<Mutex<FileBackedIndex>>> {
        {
            // Happy path!
            // If the object is already in our cache then we just return a copy
            let inner_rlock_guard = self.state.read().await;
            if let Some(index_state) = inner_rlock_guard.indexes.get(index_id) {
                return get_index_mutex(index_id, index_state).await;
            }
        }
        // At this point we do not hold our mutex, so we need to do a little dance
        // to make sure we return the same instance.
        //
        // If there is an error here, note we do not return right away.
        // That's because we want to observe the property that after one success
        // all subsequent calls will succeed.
        let index_result = load_index(&*self.storage, index_id).await;

        // Here we retake the lock, still no io ongoing.
        let mut state_wlock_guard = self.state.write().await;

        // At this point, some other client might have added another instance of the Metadataet in
        // the map. We want to avoid two copies to exist in the application, so we keep only
        // one.
        if let Some(index_state) = state_wlock_guard.indexes.get(index_id) {
            return get_index_mutex(index_id, index_state).await;
        }

        // We need to instantiate a `LazyFileBackedIndex` that will hold the mutex
        // and take care of spawning the polling if needed.
        let index = index_result?;
        let lazy_index = LazyFileBackedIndex::new(
            self.storage.clone(),
            index_id.to_string(),
            self.polling_interval_opt,
            Some(index),
        );
        let index_mutex = lazy_index.get().await?;
        state_wlock_guard
            .indexes
            .insert(index_id.to_string(), LazyIndexStatus::Active(lazy_index));
        Ok(index_mutex)
    }

    async fn index_metadata_inner(
        &self,
        index_id_opt: Option<IndexId>,
        index_uid_opt: Option<IndexUid>,
    ) -> Result<IndexMetadata, (MetastoreError, Option<IndexId>, Option<IndexUid>)> {
        let index_id = if let Some(index_id) = &index_id_opt {
            index_id
        } else if let Some(index_uid) = &index_uid_opt {
            &index_uid.index_id
        } else {
            let message = "invalid request: neither `index_id` nor `index_uid` is set".to_string();
            let metastore_error = MetastoreError::Internal {
                message,
                cause: "".to_string(),
            };
            return Err((metastore_error, index_id_opt, index_uid_opt));
        };
        let index_metadata = match self
            .read_any(index_id, None, |index| Ok(index.metadata().clone()))
            .await
        {
            Ok(index_metadata) => index_metadata,
            Err(metastore_error) => {
                return Err((metastore_error, index_id_opt, index_uid_opt));
            }
        };
        if let Some(index_uid) = &index_uid_opt
            && index_metadata.index_uid != *index_uid
        {
            let metastore_error = MetastoreError::NotFound(EntityKind::Index {
                index_id: index_id.to_string(),
            });
            return Err((metastore_error, index_id_opt, index_uid_opt));
        }
        Ok(index_metadata)
    }

    async fn list_splits_aux(
        &self,
        index_id_with_incarnation_id_opts: &[(IndexId, Option<Ulid>)],
        list_splits_query: ListSplitsQuery,
    ) -> MetastoreResult<Vec<Split>> {
        let mut splits_per_index = Vec::with_capacity(index_id_with_incarnation_id_opts.len());
        for (index_id, incarnation_id_opt) in index_id_with_incarnation_id_opts {
            match self
                .read_any(index_id, *incarnation_id_opt, |index| {
                    index.list_splits(&list_splits_query)
                })
                .await
            {
                Ok(splits) => {
                    splits_per_index.push(splits);
                }
                Err(MetastoreError::NotFound(_)) => {
                    // If the index does not exist, we just skip it.
                    continue;
                }
                Err(error) => return Err(error),
            }
        }

        let limit = list_splits_query.limit.unwrap_or(usize::MAX);
        let offset = list_splits_query.offset.unwrap_or_default();

        let merged_results = splits_per_index
            .into_iter()
            .kmerge_by(|lhs, rhs| list_splits_query.sort_by.compare(lhs, rhs).is_lt())
            .skip(offset)
            .take(limit)
            .collect();

        Ok(merged_results)
    }

    /// Returns the list of splits for the given request.
    /// No error is returned if any of the requested `index_uid` does not exist.
    async fn list_splits_inner(&self, request: ListSplitsRequest) -> MetastoreResult<Vec<Split>> {
        let mut list_splits_query = request.deserialize_list_splits_query()?;

        let index_id_incarnation_id_opts: Vec<(IndexId, Option<Ulid>)> =
            if let Some(index_uids) = list_splits_query.index_uids.take() {
                index_uids
                    .into_iter()
                    .map(|index_uid| (index_uid.index_id, Some(index_uid.incarnation_id)))
                    .collect()
            } else {
                // We do not have an explicit list of index_uids with the query, so we search for
                // all indexes.
                let inner_rlock_guard = self.state.read().await;
                inner_rlock_guard
                    .indexes
                    .iter()
                    .filter_map(|(index_id, index_state)| match index_state {
                        LazyIndexStatus::Active(_) => Some(index_id),
                        _ => None,
                    })
                    .map(|index_id| (index_id.clone(), None))
                    .collect()
            };

        self.list_splits_aux(&index_id_incarnation_id_opts, list_splits_query)
            .await
    }

    /// Helper used for testing to obtain the data associated with the given index.
    #[cfg(test)]
    async fn get_index(&self, index_uid: &IndexUid) -> MetastoreResult<FileBackedIndex> {
        self.read(index_uid, |index| Ok(index.clone())).await
    }
}

#[async_trait]
impl MetastoreService for FileBackedMetastore {
    async fn check_connectivity(&self) -> anyhow::Result<()> {
        self.storage.exists(Path::new(MANIFEST_FILE_NAME)).await?;
        Ok(())
    }

    fn endpoints(&self) -> Vec<quickwit_common::uri::Uri> {
        vec![self.storage.uri().clone()]
    }

    // -------------------------------------------------------------------------------
    // Mutations over the high-level index.

    async fn create_index(
        &self,
        request: CreateIndexRequest,
    ) -> MetastoreResult<CreateIndexResponse> {
        let index_config = request.deserialize_index_config()?;
        let source_configs = request.deserialize_source_configs()?;

        let mut index_metadata = IndexMetadata::new(index_config);

        for source_config in source_configs {
            index_metadata.add_source(source_config)?;
        }
        let index_uid = index_metadata.index_uid.clone();
        let index_id = &index_uid.index_id;

        let index_metadata_json = serde_utils::to_json_str(&index_metadata)?;
        let index = FileBackedIndex::from(index_metadata);

        let mut state_wlock_guard = self.state.write().await;

        // Checking if index already exists is a bit tedious:
        // - first we check the index state: if it's `Active`, return `IndexAlreadyExists` error,
        //   and if it's `Creating` or `Deleting`, it's ok to override them as these are
        //   transitioning states.
        // - if the index is not in the index states map, we still need to check the storage as we
        //   don't want to override an existing metadata file.
        if let Some(index_status) = state_wlock_guard.indexes.get(index_id) {
            if let LazyIndexStatus::Active(_) = index_status {
                return Err(MetastoreError::AlreadyExists(EntityKind::Index {
                    index_id: index_id.to_string(),
                }));
            }
        } else if index_exists(&*self.storage, index_id).await? {
            return Err(MetastoreError::Internal {
                message: format!("index {index_id} cannot be created"),
                cause: format!(
                    "index {index_id} is not present in the manifest file but its file \
                     `{index_id}/metastore.json` is on the storage"
                ),
            });
        }
        // Set state to `Creating` and rollback on metastore error.
        state_wlock_guard
            .indexes
            .insert(index_id.clone(), LazyIndexStatus::Creating);

        let manifest = state_wlock_guard.as_manifest();

        if let Err(error) = save_manifest(&*self.storage, &manifest).await {
            state_wlock_guard.indexes.remove(index_id);
            return Err(error);
        }
        put_index(&*self.storage, &index).await?;

        state_wlock_guard.indexes.insert(
            index_id.clone(),
            LazyIndexStatus::Active(LazyFileBackedIndex::new(
                self.storage.clone(),
                index_id.clone(),
                self.polling_interval_opt,
                Some(index),
            )),
        );
        // Set state to `Active` and rollback on metastore error.
        let manifest = state_wlock_guard.as_manifest();

        if let Err(error) = save_manifest(&*self.storage, &manifest).await {
            state_wlock_guard
                .indexes
                .insert(index_id.clone(), LazyIndexStatus::Creating);
            return Err(error);
        }

        let response = CreateIndexResponse {
            index_uid: index_uid.into(),
            index_metadata_json,
        };
        Ok(response)
    }

    async fn update_index(
        &self,
        request: UpdateIndexRequest,
    ) -> MetastoreResult<IndexMetadataResponse> {
        let index_uid = request.index_uid();
        let doc_mapping = request.deserialize_doc_mapping()?;
        let indexing_settings = request.deserialize_indexing_settings()?;
        let ingest_settings = request.deserialize_ingest_settings()?;
        let search_settings = request.deserialize_search_settings()?;
        let retention_policy_opt = request.deserialize_retention_policy()?;

        let index_metadata = self
            .mutate(index_uid, |index| {
                let mutation_occurred = index.update_index_config(
                    doc_mapping,
                    indexing_settings,
                    ingest_settings,
                    search_settings,
                    retention_policy_opt,
                )?;
                let index_metadata = index.metadata().clone();

                if mutation_occurred {
                    Ok(MutationOccurred::Yes(index_metadata))
                } else {
                    Ok(MutationOccurred::No(index_metadata))
                }
            })
            .await?;
        IndexMetadataResponse::try_from_index_metadata(&index_metadata)
    }

    async fn delete_index(&self, request: DeleteIndexRequest) -> MetastoreResult<EmptyResponse> {
        // We pick the outer lock here, so that we enter a critical section.
        let mut state_wlock_guard = self.state.write().await;

        let index_id = &request.index_uid().index_id;
        // If index is neither in `per_index_metastores_wlock` nor on the storage, it does not
        // exist.
        if !state_wlock_guard.indexes.contains_key(index_id)
            && !index_exists(&*self.storage, index_id).await?
        {
            return Err(MetastoreError::NotFound(EntityKind::Index {
                index_id: index_id.to_string(),
            }));
        }
        // Set state to `Deleting` and keep the previous state in memory in case we need to insert
        // if an error occurs.
        let index_state_opt = state_wlock_guard
            .indexes
            .insert(index_id.to_string(), LazyIndexStatus::Deleting);
        let manifest = state_wlock_guard.as_manifest();
        // On a put error, reinsert the previous state if any.
        if let Err(error) = save_manifest(&*self.storage, &manifest).await {
            if let Some(index_state) = index_state_opt {
                state_wlock_guard
                    .indexes
                    .insert(index_id.to_string(), index_state);
            } else {
                state_wlock_guard.indexes.remove(index_id);
            }
            return Err(error);
        }

        let delete_result = delete_index(&*self.storage, index_id).await;

        if matches!(
            &delete_result,
            Ok(()) | Err(MetastoreError::NotFound(EntityKind::Index { .. }))
        ) {
            state_wlock_guard.indexes.remove(index_id);
            let manifest = state_wlock_guard.as_manifest();

            if let Err(error) = save_manifest(&*self.storage, &manifest).await {
                state_wlock_guard
                    .indexes
                    .insert(index_id.to_string(), LazyIndexStatus::Deleting);
                return Err(error);
            }
        }
        delete_result.map(|_| EmptyResponse {})
    }

    // -------------------------------------------------------------------------------
    // Mutations over a single index

    async fn stage_splits(&self, request: StageSplitsRequest) -> MetastoreResult<EmptyResponse> {
        let index_uid = request.index_uid().clone();
        let splits_metadata = request.deserialize_splits_metadata()?;

        self.mutate(&index_uid, |index| {
            let mut failed_split_ids = Vec::new();

            for split_metadata in splits_metadata {
                match index.stage_split(split_metadata) {
                    Ok(()) => {}
                    Err(MetastoreError::FailedPrecondition {
                        entity: EntityKind::Split { split_id },
                        ..
                    }) => {
                        failed_split_ids.push(split_id);
                    }
                    Err(error) => return Err(error),
                };
            }
            if !failed_split_ids.is_empty() {
                let entity = EntityKind::Splits {
                    split_ids: failed_split_ids,
                };
                let message = "splits are not staged".to_string();
                Err(MetastoreError::FailedPrecondition { entity, message })
            } else {
                Ok(MutationOccurred::Yes(()))
            }
        })
        .await?;
        Ok(EmptyResponse {})
    }

    async fn publish_splits(
        &self,
        request: PublishSplitsRequest,
    ) -> MetastoreResult<EmptyResponse> {
        let index_checkpoint_delta: Option<IndexCheckpointDelta> =
            request.deserialize_index_checkpoint()?;
        let index_uid = request.index_uid().clone();
        self.mutate(&index_uid, |index| {
            index.publish_splits(
                request.staged_split_ids,
                request.replaced_split_ids,
                index_checkpoint_delta,
                request.publish_token_opt,
            )?;
            Ok(MutationOccurred::Yes(()))
        })
        .await?;
        Ok(EmptyResponse {})
    }

    async fn mark_splits_for_deletion(
        &self,
        request: MarkSplitsForDeletionRequest,
    ) -> MetastoreResult<EmptyResponse> {
        let index_uid = request.index_uid().clone();

        self.mutate(&index_uid, |index| {
            index
                .mark_splits_for_deletion(
                    request.split_ids,
                    &[
                        SplitState::Staged,
                        SplitState::Published,
                        SplitState::MarkedForDeletion,
                    ],
                    false,
                )
                .map(MutationOccurred::from)
        })
        .await?;
        Ok(EmptyResponse {})
    }

    async fn delete_splits(&self, request: DeleteSplitsRequest) -> MetastoreResult<EmptyResponse> {
        let index_uid = request.index_uid().clone();

        self.mutate(&index_uid, |index| {
            index.delete_splits(request.split_ids)?;
            Ok(MutationOccurred::Yes(EmptyResponse {}))
        })
        .await?;
        Ok(EmptyResponse {})
    }

    async fn add_source(&self, request: AddSourceRequest) -> MetastoreResult<EmptyResponse> {
        let source_config = request.deserialize_source_config()?;
        let index_uid = request.index_uid();

        self.mutate(index_uid, |index| {
            index.add_source(source_config)?;
            Ok(MutationOccurred::Yes(()))
        })
        .await?;
        Ok(EmptyResponse {})
    }

    async fn update_source(&self, request: UpdateSourceRequest) -> MetastoreResult<EmptyResponse> {
        let source_config = request.deserialize_source_config()?;
        let index_uid = request.index_uid();

        self.mutate(index_uid, |index| {
            let mutation_occurred = index.update_source(source_config)?;
            Ok(MutationOccurred::from(mutation_occurred))
        })
        .await?;
        Ok(EmptyResponse {})
    }

    async fn toggle_source(&self, request: ToggleSourceRequest) -> MetastoreResult<EmptyResponse> {
        let index_uid = request.index_uid();

        self.mutate(index_uid, |index| {
            index
                .toggle_source(&request.source_id, request.enable)
                .map(MutationOccurred::from)
        })
        .await?;
        Ok(EmptyResponse {})
    }

    async fn delete_source(&self, request: DeleteSourceRequest) -> MetastoreResult<EmptyResponse> {
        let index_uid = request.index_uid();

        self.mutate(index_uid, |index| {
            index.delete_source(&request.source_id)?;
            Ok(MutationOccurred::Yes(()))
        })
        .await?;
        Ok(EmptyResponse {})
    }

    async fn reset_source_checkpoint(
        &self,
        request: ResetSourceCheckpointRequest,
    ) -> MetastoreResult<EmptyResponse> {
        let index_uid = request.index_uid();

        self.mutate(index_uid, |index| {
            index
                .reset_source_checkpoint(&request.source_id)
                .map(MutationOccurred::from)
        })
        .await?;
        Ok(EmptyResponse {})
    }

    // -------------------------------------------------------------------------------
    // Read-only accessors

    /// Streams of splits for the given request.
    /// No error is returned if any of the requested `index_uid` does not exist.
    async fn list_splits(
        &self,
        request: ListSplitsRequest,
    ) -> MetastoreResult<MetastoreServiceStream<ListSplitsResponse>> {
        let splits = self.list_splits_inner(request).await?;
        let splits_responses: Vec<MetastoreResult<ListSplitsResponse>> = splits
            .chunks(STREAM_SPLITS_CHUNK_SIZE)
            .map(|chunk| ListSplitsResponse::try_from_splits(chunk.to_vec()))
            .collect();
        let splits_responses_stream = Box::pin(futures::stream::iter(splits_responses));
        Ok(ServiceStream::new(splits_responses_stream))
    }

    async fn list_index_stats(
        &self,
        request: ListIndexStatsRequest,
    ) -> MetastoreResult<ListIndexStatsResponse> {
        let index_id_matcher =
            IndexIdMatcher::try_from_index_id_patterns(&request.index_id_patterns)?;
        let index_ids: Vec<IndexId> = {
            let inner_rlock_guard = self.state.read().await;
            inner_rlock_guard
                .indexes
                .iter()
                .filter_map(|(index_id, index_state)| match index_state {
                    LazyIndexStatus::Active(_) if index_id_matcher.is_match(index_id) => {
                        Some(index_id)
                    }
                    _ => None,
                })
                .cloned()
                .collect()
        };

        let mut index_read_futures = FuturesUnordered::new();
        for index_id in index_ids {
            let index_read_future = async move {
                self.read_any(&index_id, None, |index| index.get_stats())
                    .await
            };
            index_read_futures.push(index_read_future);
        }

        let mut index_stats = Vec::new();
        while let Some(index_read_result) = index_read_futures.next().await {
            match index_read_result {
                Ok(stats) => index_stats.push(stats),
                Err(MetastoreError::NotFound(_)) => {
                    // If the index does not exist, we just skip it.
                    continue;
                }
                Err(error) => return Err(error),
            }
        }

        Ok(ListIndexStatsResponse { index_stats })
    }

    async fn list_stale_splits(
        &self,
        request: ListStaleSplitsRequest,
    ) -> MetastoreResult<ListSplitsResponse> {
        let list_splits_query = ListSplitsQuery::for_index(request.index_uid().clone())
            .with_delete_opstamp_lt(request.delete_opstamp)
            .with_split_state(SplitState::Published)
            .retain_mature(OffsetDateTime::now_utc())
            .sort_by_staleness()
            .with_limit(request.num_splits as usize);
        let list_splits_request =
            ListSplitsRequest::try_from_list_splits_query(&list_splits_query)?;
        let splits = self.list_splits_inner(list_splits_request).await?;
        ListSplitsResponse::try_from_splits(splits)
    }

    async fn index_metadata(
        &self,
        request: IndexMetadataRequest,
    ) -> MetastoreResult<IndexMetadataResponse> {
        let index_metadata = self
            .index_metadata_inner(request.index_id, request.index_uid)
            .await
            .map_err(|(metastore_error, _index_id_opt, _index_uid_opt)| metastore_error)?;
        let response = IndexMetadataResponse::try_from_index_metadata(&index_metadata)?;
        Ok(response)
    }

    async fn indexes_metadata(
        &self,
        request: IndexesMetadataRequest,
    ) -> MetastoreResult<IndexesMetadataResponse> {
        let mut indexes_metadata: Vec<IndexMetadata> =
            Vec::with_capacity(request.subrequests.len());
        let mut failures: Vec<IndexMetadataFailure> = Vec::new();

        let mut index_metadata_futures = FuturesUnordered::new();

        for subrequest in request.subrequests {
            let metastore = self.clone();
            let index_metadata_future = async move {
                metastore
                    .index_metadata_inner(subrequest.index_id, subrequest.index_uid)
                    .await
            };
            index_metadata_futures.push(index_metadata_future);
        }
        while let Some(index_metadata_result) = index_metadata_futures.next().await {
            match index_metadata_result {
                Ok(index_metadata) => indexes_metadata.push(index_metadata),
                Err((MetastoreError::NotFound(_), index_id, index_uid)) => {
                    let failure = IndexMetadataFailure {
                        index_id,
                        index_uid,
                        reason: IndexMetadataFailureReason::NotFound as i32,
                    };
                    failures.push(failure)
                }
                // All other errors are considered internal errors.
                Err((_metastore_error, index_id, index_uid)) => {
                    let failure = IndexMetadataFailure {
                        index_id,
                        index_uid,
                        reason: IndexMetadataFailureReason::Internal as i32,
                    };
                    failures.push(failure)
                }
            }
        }
        let response =
            IndexesMetadataResponse::try_from_indexes_metadata(indexes_metadata, failures).await?;
        Ok(response)
    }

    async fn list_indexes_metadata(
        &self,
        request: ListIndexesMetadataRequest,
    ) -> MetastoreResult<ListIndexesMetadataResponse> {
        // Done in two steps:
        // 1) Get index IDs and release the lock on `per_index_metastores`.
        // 2) Get each index metadata. Note that each get will take a read lock on
        // `per_index_metastores`. Lock is released in 1) to let a concurrent task/thread to
        // take a write lock on `per_index_metastores`.
        let index_id_matcher =
            IndexIdMatcher::try_from_index_id_patterns(&request.index_id_patterns)?;
        let inner_rlock_guard = self.state.read().await;
        let index_ids: Vec<IndexId> = inner_rlock_guard
            .indexes
            .iter()
            .filter_map(|(index_id, index_state)| match index_state {
                LazyIndexStatus::Active(_) if index_id_matcher.is_match(index_id) => Some(index_id),
                _ => None,
            })
            .cloned()
            .collect();
        drop(inner_rlock_guard);

        let metastore = self.clone();
        let indexes_metadata: Vec<IndexMetadata> = try_join_all(
            index_ids
                .into_iter()
                .map(|index_id| get_index_metadata(metastore.clone(), index_id)),
        )
        .await?
        .into_iter()
        .flatten()
        .collect();
        let response =
            ListIndexesMetadataResponse::try_from_indexes_metadata(indexes_metadata).await?;
        Ok(response)
    }

    // Shard API

    async fn open_shards(&self, request: OpenShardsRequest) -> MetastoreResult<OpenShardsResponse> {
        let mut response = OpenShardsResponse {
            subresponses: Vec::with_capacity(request.subrequests.len()),
        };
        // We must group the subrequests by `index_uid` to mutate each index only once, since each
        // mutation triggers an IO.
        let per_index_uid_subrequests: HashMap<IndexUid, Vec<OpenShardSubrequest>> = request
            .subrequests
            .into_iter()
            .into_group_map_by(|subrequest| subrequest.index_uid().clone());

        for (index_uid, subrequests) in per_index_uid_subrequests {
            let subresponses = self
                .mutate(&index_uid, |index| index.open_shards(subrequests))
                .await?;
            response.subresponses.extend(subresponses);
        }
        Ok(response)
    }

    async fn acquire_shards(
        &self,
        request: AcquireShardsRequest,
    ) -> MetastoreResult<AcquireShardsResponse> {
        let index_uid = request.index_uid().clone();
        let response = self
            .mutate(&index_uid, |index| index.acquire_shards(request))
            .await?;
        Ok(response)
    }

    async fn delete_shards(
        &self,
        request: DeleteShardsRequest,
    ) -> MetastoreResult<DeleteShardsResponse> {
        let index_uid = request.index_uid().clone();
        let response = self
            .mutate(&index_uid, |index| index.delete_shards(request))
            .await?;
        Ok(response)
    }

    async fn prune_shards(&self, request: PruneShardsRequest) -> MetastoreResult<EmptyResponse> {
        let index_uid = request.index_uid().clone();
        self.mutate(&index_uid, |index| index.prune_shards(request))
            .await?;
        Ok(EmptyResponse {})
    }

    async fn list_shards(&self, request: ListShardsRequest) -> MetastoreResult<ListShardsResponse> {
        let mut subresponses = Vec::with_capacity(request.subrequests.len());

        for subrequest in request.subrequests {
            let index_uid = subrequest.index_uid().clone();
            let subresponse = self
                .read(&index_uid, |index| index.list_shards(subrequest))
                .await?;
            subresponses.push(subresponse);
        }
        let response = ListShardsResponse { subresponses };
        Ok(response)
    }

    // -------------------------------------------------------------------------------
    // Delete tasks

    async fn last_delete_opstamp(
        &self,
        request: LastDeleteOpstampRequest,
    ) -> MetastoreResult<LastDeleteOpstampResponse> {
        let last_delete_opstamp = self
            .read(request.index_uid(), |index| Ok(index.last_delete_opstamp()))
            .await?;
        Ok(LastDeleteOpstampResponse::new(last_delete_opstamp))
    }

    async fn create_delete_task(&self, delete_query: DeleteQuery) -> MetastoreResult<DeleteTask> {
        let index_uid = delete_query.index_uid().clone();
        let delete_task = self
            .mutate(&index_uid, |index| {
                index
                    .create_delete_task(delete_query)
                    .map(MutationOccurred::Yes)
            })
            .await?;
        Ok(delete_task)
    }

    async fn update_splits_delete_opstamp(
        &self,
        request: UpdateSplitsDeleteOpstampRequest,
    ) -> MetastoreResult<UpdateSplitsDeleteOpstampResponse> {
        let index_uid = request.index_uid();

        self.mutate(index_uid, |index| {
            let split_ids_str = request
                .split_ids
                .iter()
                .map(|split_id| split_id.as_str())
                .collect::<Vec<_>>();
            index
                .update_splits_delete_opstamp(&split_ids_str, request.delete_opstamp)
                .map(MutationOccurred::from)
        })
        .await?;
        Ok(UpdateSplitsDeleteOpstampResponse {})
    }

    async fn list_delete_tasks(
        &self,
        request: ListDeleteTasksRequest,
    ) -> MetastoreResult<ListDeleteTasksResponse> {
        let index_uid = request.index_uid();

        let delete_tasks = self
            .read(index_uid, |index| {
                Ok(index.list_delete_tasks(request.opstamp_start))
            })
            .await??;
        let response = ListDeleteTasksResponse { delete_tasks };
        Ok(response)
    }

    // Index Template API

    async fn create_index_template(
        &self,
        request: CreateIndexTemplateRequest,
    ) -> MetastoreResult<EmptyResponse> {
        let index_template: IndexTemplate =
            serde_utils::from_json_str(&request.index_template_json)?;
        let template_id = index_template.template_id.clone();

        let mut state_wlock_guard = self.state.write().await;

        let evicted_template_opt = match state_wlock_guard.templates.entry(template_id.clone()) {
            Entry::Vacant(entry) => {
                entry.insert(index_template.clone());
                None
            }
            Entry::Occupied(mut entry) if request.overwrite => {
                let evicted_template = entry.insert(index_template.clone());
                Some(evicted_template)
            }
            Entry::Occupied(_) => {
                return Err(MetastoreError::AlreadyExists(EntityKind::IndexTemplate {
                    template_id,
                }));
            }
        };
        if let Err(error) = state_wlock_guard.template_matcher.insert(&index_template) {
            if let Some(evicted_template) = evicted_template_opt {
                state_wlock_guard
                    .templates
                    .insert(evicted_template.template_id.clone(), evicted_template);
            } else {
                state_wlock_guard.templates.remove(&template_id);
            }
            return Err(error);
        }
        let manifest = state_wlock_guard.as_manifest();
        let save_result = save_manifest(&*self.storage, &manifest).await;

        // Rollback on error.
        if let Err(error) = save_result {
            if let Some(evicted_template) = evicted_template_opt {
                state_wlock_guard
                    .template_matcher
                    .insert(&evicted_template)
                    .expect("evicted template should be valid");
                state_wlock_guard
                    .templates
                    .insert(evicted_template.template_id.clone(), evicted_template);
            } else {
                state_wlock_guard.templates.remove(&template_id);
                state_wlock_guard.template_matcher.remove(&template_id);
            }
            return Err(error);
        }
        Ok(EmptyResponse {})
    }

    async fn get_index_template(
        &self,
        request: GetIndexTemplateRequest,
    ) -> MetastoreResult<GetIndexTemplateResponse> {
        let inner_rlock_guard = self.state.read().await;
        let index_template = inner_rlock_guard
            .templates
            .get(&request.template_id)
            .ok_or({
                MetastoreError::NotFound(EntityKind::IndexTemplate {
                    template_id: request.template_id,
                })
            })?;
        let index_template_json = serde_utils::to_json_str(index_template)?;
        let response = GetIndexTemplateResponse {
            index_template_json,
        };
        Ok(response)
    }

    async fn find_index_template_matches(
        &self,
        request: FindIndexTemplateMatchesRequest,
    ) -> MetastoreResult<FindIndexTemplateMatchesResponse> {
        let inner_rlock_guard = self.state.read().await;

        let mut matches = Vec::new();

        for index_id in request.index_ids {
            if let Some(template_id) = inner_rlock_guard
                .template_matcher
                .find_match(&index_id)
                .clone()
            {
                let index_template = inner_rlock_guard
                    .templates
                    .get(&template_id)
                    .expect("template should exist");
                let index_template_json = serde_utils::to_json_str(index_template)?;
                let index_template_match = IndexTemplateMatch {
                    index_id,
                    template_id,
                    index_template_json,
                };
                matches.push(index_template_match);
            };
        }
        let response = FindIndexTemplateMatchesResponse { matches };
        Ok(response)
    }

    async fn list_index_templates(
        &self,
        _request: ListIndexTemplatesRequest,
    ) -> MetastoreResult<ListIndexTemplatesResponse> {
        let inner_rlock_guard = self.state.read().await;

        let index_templates_json: Vec<String> = inner_rlock_guard
            .templates
            .values()
            .map(serde_utils::to_json_str)
            .collect::<MetastoreResult<_>>()?;
        let response = ListIndexTemplatesResponse {
            index_templates_json,
        };
        Ok(response)
    }

    async fn delete_index_templates(
        &self,
        request: DeleteIndexTemplatesRequest,
    ) -> MetastoreResult<EmptyResponse> {
        let mut evicted_templates = Vec::with_capacity(request.template_ids.len());
        let mut state_wlock_guard = self.state.write().await;

        for template_id in &request.template_ids {
            if let Some(evicted_template) = state_wlock_guard.templates.remove(template_id) {
                evicted_templates.push(evicted_template);
                state_wlock_guard.template_matcher.remove(template_id);
            }
        }
        let manifest = state_wlock_guard.as_manifest();
        let save_result = save_manifest(&*self.storage, &manifest).await;

        // Rollback on error.
        if let Err(error) = save_result {
            for evicted_template in evicted_templates {
                state_wlock_guard
                    .template_matcher
                    .insert(&evicted_template)
                    .expect("evicted template should be valid");
                state_wlock_guard
                    .templates
                    .insert(evicted_template.template_id.clone(), evicted_template);
            }
            return Err(error);
        }
        Ok(EmptyResponse {})
    }

    // Get cluster identity api

    // this returns a constant uuid. on first call, it generate said uuid if it doesn't already
    // exists
    async fn get_cluster_identity(
        &self,
        _: GetClusterIdentityRequest,
    ) -> MetastoreResult<GetClusterIdentityResponse> {
        let mut state_wlock_guard = self.state.write().await;

        if state_wlock_guard.identity.is_nil() {
            state_wlock_guard.identity = Uuid::new_v4();

            let manifest = state_wlock_guard.as_manifest();

            if let Err(error) = save_manifest(&*self.storage, &manifest).await {
                state_wlock_guard.identity = Uuid::nil();
                return Err(error);
            }
        }

        Ok(GetClusterIdentityResponse {
            uuid: state_wlock_guard.identity.hyphenated().to_string(),
        })
    }
}

impl MetastoreServiceExt for FileBackedMetastore {}

async fn get_index_mutex(
    index_id: &str,
    lazy_index_status: &LazyIndexStatus,
) -> MetastoreResult<Arc<Mutex<FileBackedIndex>>> {
    match lazy_index_status {
        LazyIndexStatus::Active(lazy_index) => lazy_index.get().await,
        LazyIndexStatus::Creating => Err(MetastoreError::Internal {
            message: format!("index `{index_id}` cannot be retrieved"),
            cause: "index `{index_id}` is in transitioning state `creating` and this should not \
                    happened. either recreate or delete it"
                .to_string(),
        }),
        LazyIndexStatus::Deleting => Err(MetastoreError::Internal {
            message: format!("index `{index_id}` cannot be retrieved"),
            cause: "index `{index_id}` is in transitioning state `deleting` and this should not \
                    happened. try to delete it again"
                .to_string(),
        }),
    }
}

async fn get_index_metadata(
    metastore: FileBackedMetastore,
    index_id: IndexId,
) -> MetastoreResult<Option<IndexMetadata>> {
    let request = IndexMetadataRequest::for_index_id(index_id);
    let index_metadata_result = metastore
        .index_metadata(request)
        .await
        .and_then(|response| response.deserialize_index_metadata());
    match index_metadata_result {
        Ok(index_metadata) => Ok(Some(index_metadata)),
        Err(MetastoreError::NotFound { .. }) => Ok(None),
        Err(MetastoreError::Internal { message, cause }) => {
            // Indexes can be in transient states `Creating` or `Deleting`.
            // It is fine to ignore those errors.
            if message.contains("transient state") {
                Ok(None)
            } else {
                Err(MetastoreError::Internal { message, cause })
            }
        }
        Err(error) => Err(error),
    }
}

#[cfg(test)]
#[async_trait]
impl crate::tests::DefaultForTest for FileBackedMetastore {
    async fn default_for_test() -> Self {
        use quickwit_storage::RamStorage;
        FileBackedMetastore::try_new(Arc::new(RamStorage::default()), None)
            .await
            .unwrap()
    }
}

#[cfg(test)]
mod tests {

    use std::ops::RangeInclusive;
    use std::path::Path;
    use std::sync::Arc;

    use futures::executor::block_on;
    use quickwit_common::uri::{Protocol, Uri};
    use quickwit_config::IndexConfig;
    use quickwit_proto::ingest::Shard;
    use quickwit_proto::metastore::{DeleteQuery, MetastoreError};
    use quickwit_proto::types::SourceId;
    use quickwit_query::query_ast::qast_helper;
    use quickwit_storage::{MockStorage, RamStorage, Storage, StorageErrorKind};
    use rand::Rng;
    use tests::manifest::{IndexStatus, Manifest};
    use time::OffsetDateTime;
    use tokio::time::Duration;

    use super::store_operations::{metastore_filepath, put_index_given_index_id};
    use super::*;
    use crate::metastore::MetastoreServiceStreamSplitsExt;
    use crate::tests::DefaultForTest;
    use crate::tests::shard::ReadWriteShardsForTest;
    use crate::{IndexMetadata, ListSplitsQuery, SplitMetadata, SplitState, metastore_test_suite};

    #[async_trait]
    impl ReadWriteShardsForTest for FileBackedMetastore {
        async fn insert_shards(
            &self,
            index_uid: &IndexUid,
            source_id: &SourceId,
            shards: Vec<Shard>,
        ) {
            self.mutate(index_uid, |index| {
                index.insert_shards(source_id, shards);
                Ok(MutationOccurred::Yes(()))
            })
            .await
            .unwrap();
        }

        async fn list_all_shards(&self, index_uid: &IndexUid, source_id: &SourceId) -> Vec<Shard> {
            self.read(index_uid, |index| {
                let shards = index.list_all_shards(source_id);
                Ok(shards)
            })
            .await
            .unwrap()
        }
    }

    metastore_test_suite!(crate::FileBackedMetastore);

    #[tokio::test]
    async fn test_metastore_connectivity_and_endpoints() {
        let metastore = FileBackedMetastore::default_for_test().await;
        metastore.check_connectivity().await.unwrap();
        assert_eq!(metastore.endpoints()[0].protocol(), Protocol::Ram);
    }

    #[tokio::test]
    async fn test_file_backed_metastore_connectivity_fails_if_states_file_does_not_exist() {
        let mut mock_storage = MockStorage::default();
        let ram_storage = RamStorage::default();
        let ram_storage_clone = ram_storage.clone();
        mock_storage // remove this if we end up changing the semantics of create.
            .expect_exists()
            .times(3)
            .returning(|_| Ok(false));
        mock_storage
            .expect_put()
            .times(1)
            .returning(move |path, put_payload| {
                assert!(path == Path::new("manifest.json"));
                block_on(ram_storage_clone.put(path, put_payload))
            });
        let metastore = FileBackedMetastore::try_new(Arc::new(mock_storage), None)
            .await
            .unwrap();

        metastore.check_connectivity().await.unwrap();
    }

    #[tokio::test]
    async fn test_file_backed_metastore_index_exists() {
        let index_id = "test-index";
        let mut metastore = FileBackedMetastore::default_for_test().await;
        assert!(!metastore.index_exists(index_id).await.unwrap());

        let index_config = IndexConfig::for_test(index_id, "ram:///indexes/test-index");
        let create_index_request =
            CreateIndexRequest::try_from_index_config(&index_config).unwrap();
        metastore.create_index(create_index_request).await.unwrap();

        assert!(metastore.index_exists(index_id).await.unwrap());
    }

    #[tokio::test]
    async fn test_file_backed_metastore_get_index() {
        let metastore = FileBackedMetastore::default_for_test().await;

        // Create index
        let index_id = "test-index";
        let index_config = IndexConfig::for_test(index_id, "ram:///indexes/test-index");
        let create_index_request =
            CreateIndexRequest::try_from_index_config(&index_config).unwrap();
        let index_uid: IndexUid = metastore
            .create_index(create_index_request)
            .await
            .unwrap()
            .index_uid()
            .clone();

        // Open index and check its metadata
        let created_index = metastore.get_index(&index_uid).await.unwrap();
        assert_eq!(created_index.index_id(), index_config.index_id);
        assert_eq!(
            created_index.metadata().index_uri(),
            &index_config.index_uri
        );

        // Check index is returned by list indexes.
        let indexes_metadata = metastore
            .list_indexes_metadata(ListIndexesMetadataRequest::all())
            .await
            .unwrap()
            .deserialize_indexes_metadata()
            .await
            .unwrap();
        assert_eq!(indexes_metadata.len(), 1);

        // Open a non-existent index.
        let metastore_error = metastore
            .get_index(&IndexUid::new_with_random_ulid("index-does-not-exist"))
            .await
            .unwrap_err();
        assert!(matches!(metastore_error, MetastoreError::NotFound { .. }));

        // Open a index with a different incarnation_id.
        let metastore_error = metastore
            .get_index(&IndexUid::new_with_random_ulid(index_id))
            .await
            .unwrap_err();
        assert!(matches!(metastore_error, MetastoreError::NotFound { .. }));
    }

    #[tokio::test]
    async fn test_file_backed_metastore_storage_failing() {
        // The file-backed metastore should not update its internal state if the storage fails.
        let mut mock_storage = MockStorage::default();

        let current_timestamp = OffsetDateTime::now_utc().unix_timestamp();

        let ram_storage = RamStorage::default();
        let ram_storage_clone = ram_storage.clone();

        mock_storage // remove this if we end up changing the semantics of create.
            .expect_exists()
            .returning(|_| Ok(false));
        mock_storage
            .expect_put()
            .times(4)
            .returning(move |path, put_payload| {
                assert!(
                    path == Path::new("manifest.json") || path == metastore_filepath("test-index")
                );
                block_on(ram_storage_clone.put(path, put_payload))
            });
        mock_storage
            .expect_get_all()
            .times(1)
            .returning(move |path| block_on(ram_storage.get_all(path)));
        mock_storage.expect_put().times(1).returning(|_uri, _| {
            Err(StorageErrorKind::Io
                .with_error(anyhow::anyhow!("Oops. Some network problem maybe?")))
        });
        let metastore = FileBackedMetastore::for_test(Arc::new(mock_storage));

        let index_config = IndexConfig::for_test("test-index", "ram:///indexes/test-index");
        let create_index_request =
            CreateIndexRequest::try_from_index_config(&index_config).unwrap();
        let index_uid: IndexUid = metastore
            .create_index(create_index_request)
            .await
            .unwrap()
            .index_uid()
            .clone();

        let split_id = "split-one";
        let split_metadata = SplitMetadata {
            footer_offsets: 1000..2000,
            split_id: split_id.to_string(),
            num_docs: 1,
            uncompressed_docs_size_in_bytes: 2,
            time_range: Some(RangeInclusive::new(0, 99)),
            create_timestamp: current_timestamp,
            ..Default::default()
        };
        let stage_splits_request =
            StageSplitsRequest::try_from_split_metadata(index_uid.clone(), &split_metadata)
                .unwrap();
        metastore.stage_splits(stage_splits_request).await.unwrap();

        // publish split fails
        let publish_splits_request = PublishSplitsRequest {
            index_uid: Some(index_uid.clone()),
            staged_split_ids: vec![split_id.to_string()],
            ..Default::default()
        };
        metastore
            .publish_splits(publish_splits_request)
            .await
            .unwrap_err();

        let list_splits_query =
            ListSplitsQuery::for_index(index_uid.clone()).with_split_state(SplitState::Published);
        let list_splits_request =
            ListSplitsRequest::try_from_list_splits_query(&list_splits_query).unwrap();
        let splits = metastore
            .list_splits(list_splits_request)
            .await
            .unwrap()
            .collect_splits()
            .await
            .unwrap();
        assert!(splits.is_empty());

        let list_splits_query =
            ListSplitsQuery::for_index(index_uid.clone()).with_split_state(SplitState::Staged);
        let list_splits_request =
            ListSplitsRequest::try_from_list_splits_query(&list_splits_query).unwrap();
        let splits = metastore
            .list_splits(list_splits_request)
            .await
            .unwrap()
            .collect_splits()
            .await
            .unwrap();
        assert!(!splits.is_empty());
    }

    #[tokio::test]
    async fn test_file_backed_metastore_get_index_checks_for_inconsistent_index_id()
    -> MetastoreResult<()> {
        let storage = Arc::new(RamStorage::default());
        let index_id = "test-index";
        let index_metadata =
            IndexMetadata::for_test("my-inconsistent-index", "ram:///indexes/test-index");

        // Put inconsistent index and manifest into storage.
        let index = FileBackedIndex::from(index_metadata);
        put_index_given_index_id(&*storage, &index, index_id).await?;
        let mut manifest = Manifest::default();
        manifest
            .indexes
            .insert(index_id.to_string(), IndexStatus::Active);
        save_manifest(&*storage, &manifest).await.unwrap();

        let metastore = FileBackedMetastore::try_new(storage.clone(), None)
            .await
            .unwrap();

        // Getting index with inconsistent index ID should raise an error.
        let metastore_error = metastore
            .get_index(&IndexUid::new_with_random_ulid(index_id))
            .await
            .unwrap_err();
        assert!(matches!(metastore_error, MetastoreError::Internal { .. }));

        Ok(())
    }

    #[tokio::test]
    async fn test_file_backed_metastore_write_directly_visible() -> MetastoreResult<()> {
        let metastore = FileBackedMetastore::default_for_test().await;

        let index_config = IndexConfig::for_test("test-index", "ram:///indexes/test-index");
        let create_index_request =
            CreateIndexRequest::try_from_index_config(&index_config).unwrap();
        let create_index_response = metastore.create_index(create_index_request).await.unwrap();
        let index_uid: IndexUid = create_index_response.index_uid().clone();

        let splits = metastore
            .list_splits(ListSplitsRequest::try_from_index_uid(index_uid.clone()).unwrap())
            .await
            .unwrap()
            .collect_splits()
            .await
            .unwrap();
        assert!(splits.is_empty());

        let split_metadata = SplitMetadata {
            footer_offsets: 1000..2000,
            split_id: "split1".to_string(),
            num_docs: 1,
            uncompressed_docs_size_in_bytes: 2,
            time_range: Some(0..=99),
            ..Default::default()
        };
        let stage_splits_request =
            StageSplitsRequest::try_from_split_metadata(index_uid.clone(), &split_metadata)
                .unwrap();
        metastore.stage_splits(stage_splits_request).await?;

        let splits = metastore
            .list_splits(ListSplitsRequest::try_from_index_uid(index_uid).unwrap())
            .await
            .unwrap()
            .collect_splits()
            .await
            .unwrap();
        assert_eq!(splits.len(), 1);
        Ok(())
    }

    #[tokio::test]
    async fn test_file_backed_metastore_polling() -> MetastoreResult<()> {
        let storage = Arc::new(RamStorage::default());

        let metastore_write = FileBackedMetastore::try_new(storage.clone(), None)
            .await
            .unwrap();
        let polling_interval = Duration::from_millis(20);
        let metastore_read = FileBackedMetastore::try_new(storage, Some(polling_interval))
            .await
            .unwrap();

        let index_config = IndexConfig::for_test("test-index", "ram:///indexes/test-index");
        let create_index_request =
            CreateIndexRequest::try_from_index_config(&index_config).unwrap();
        let create_index_response = metastore_write
            .create_index(create_index_request)
            .await
            .unwrap();
        let index_uid: IndexUid = create_index_response.index_uid().clone();

        let splits = metastore_write
            .list_splits(ListSplitsRequest::try_from_index_uid(index_uid.clone()).unwrap())
            .await
            .unwrap()
            .collect_splits()
            .await
            .unwrap();
        assert!(splits.is_empty());

        let splits = metastore_read
            .list_splits(ListSplitsRequest::try_from_index_uid(index_uid.clone()).unwrap())
            .await
            .unwrap()
            .collect_splits()
            .await
            .unwrap();
        assert!(splits.is_empty());

        let split_metadata = SplitMetadata {
            footer_offsets: 1000..2000,
            split_id: "split1".to_string(),
            num_docs: 1,
            uncompressed_docs_size_in_bytes: 2,
            time_range: Some(0..=99),
            ..Default::default()
        };
        let stage_splits_request =
            StageSplitsRequest::try_from_split_metadata(index_uid.clone(), &split_metadata)
                .unwrap();
        metastore_write.stage_splits(stage_splits_request).await?;

        let splits = metastore_read
            .list_splits(ListSplitsRequest::try_from_index_uid(index_uid.clone()).unwrap())
            .await
            .unwrap()
            .collect_splits()
            .await
            .unwrap();
        assert!(splits.is_empty());

        for _ in 0..10 {
            tokio::time::sleep(polling_interval).await;

            let splits = metastore_read
                .list_splits(ListSplitsRequest::try_from_index_uid(index_uid.clone()).unwrap())
                .await
                .unwrap()
                .collect_splits()
                .await
                .unwrap();
            if !splits.is_empty() {
                return Ok(());
            }
        }
        panic!("The metastore should have been updated.");
    }

    #[tokio::test(flavor = "multi_thread", worker_threads = 3)]
    async fn test_file_backed_metastore_race_condition() {
        let metastore = FileBackedMetastore::default_for_test().await;

        let index_config = IndexConfig::for_test("test-index", "ram:///indexes/test-index");
        let create_index_request =
            CreateIndexRequest::try_from_index_config(&index_config).unwrap();
        let create_index_response = metastore.create_index(create_index_request).await.unwrap();
        let index_uid: IndexUid = create_index_response.index_uid().clone();

        // Stage splits in multiple threads
        let mut handles = Vec::new();
        let mut random_generator = rand::rng();
        for i in 1..=20 {
            let sleep_duration = Duration::from_millis(random_generator.random_range(0..=200));
            let metastore = metastore.clone();
            let current_timestamp = OffsetDateTime::now_utc().unix_timestamp();
            let handle = tokio::spawn({
                let index_uid = index_uid.clone();
                async move {
                    let split_metadata = SplitMetadata {
                        footer_offsets: 1000..2000,
                        split_id: format!("split-{i}"),
                        num_docs: 1,
                        uncompressed_docs_size_in_bytes: 2,
                        time_range: Some(RangeInclusive::new(0, 99)),
                        create_timestamp: current_timestamp,
                        ..Default::default()
                    };
                    // stage split
                    let stage_splits_request = StageSplitsRequest::try_from_split_metadata(
                        index_uid.clone(),
                        &split_metadata,
                    )
                    .unwrap();
                    metastore.stage_splits(stage_splits_request).await.unwrap();

                    tokio::time::sleep(sleep_duration).await;

                    // publish split
                    let split_id = format!("split-{i}");
                    let publish_splits_request = PublishSplitsRequest {
                        index_uid: Some(index_uid.clone()),
                        staged_split_ids: vec![split_id.to_string()],
                        ..Default::default()
                    };
                    metastore
                        .publish_splits(publish_splits_request)
                        .await
                        .unwrap();
                }
            });
            handles.push(handle);
        }

        futures::future::try_join_all(handles).await.unwrap();

        let list_splits_query =
            ListSplitsQuery::for_index(index_uid.clone()).with_split_state(SplitState::Published);
        let list_splits_request =
            ListSplitsRequest::try_from_list_splits_query(&list_splits_query).unwrap();
        let splits = metastore
            .list_splits(list_splits_request)
            .await
            .unwrap()
            .collect_splits()
            .await
            .unwrap();

        // Make sure that all 20 splits are in `Published` state.
        assert_eq!(splits.len(), 20);
    }

    #[tokio::test(flavor = "multi_thread", worker_threads = 3)]
    async fn test_file_backed_metastore_list_indexes_race_condition() {
        let metastore = FileBackedMetastore::default_for_test().await;
        let mut index_uids = Vec::new();
        for idx in 0..10 {
            let index_uid = IndexUid::new_with_random_ulid(&format!("test-index-{idx}"));
            let index_config =
                IndexConfig::for_test(&index_uid.index_id, "ram:///indexes/test-index");
            let create_index_request =
                CreateIndexRequest::try_from_index_config(&index_config).unwrap();
            let index_uid: IndexUid = metastore
                .create_index(create_index_request)
                .await
                .unwrap()
                .index_uid()
                .clone();
            index_uids.push(index_uid);
        }
        // Delete indexes + call to list_indexes_metadata.
        let mut handles = Vec::new();
        for index_uid in index_uids {
            let delete_request = DeleteIndexRequest {
                index_uid: Some(index_uid.clone()),
            };
            {
                let metastore = metastore.clone();
                let handle = tokio::spawn(async move {
                    metastore
                        .list_indexes_metadata(ListIndexesMetadataRequest::all())
                        .await
                        .unwrap();
                });
                handles.push(handle);
            }
            {
                let metastore = metastore.clone();
                let handle = tokio::spawn(async move {
                    metastore.delete_index(delete_request).await.unwrap();
                });
                handles.push(handle);
            }
        }
        tokio::time::timeout(
            Duration::from_secs(2),
            futures::future::try_join_all(handles),
        )
        .await
        .unwrap()
        .unwrap();
    }

    #[tokio::test]
    async fn test_file_backed_metastore_create_index_when_storage_failing_on_indexes_states_put() {
        let mut mock_storage = MockStorage::default();
        let ram_storage = RamStorage::default();
        let index_id = "test-index";

        mock_storage
            .expect_uri()
            .return_const(Uri::for_test("ram:///indexes"));
        mock_storage.expect_exists().returning(|_| Ok(false));
        mock_storage
            .expect_put()
            .times(1)
            .returning(move |path, _| {
                assert!(path == Path::new("manifest.json"));
                Err(StorageErrorKind::Io
                    .with_error(anyhow::anyhow!("Oops. Some network problem maybe?")))
            });
        mock_storage
            .expect_get_all()
            .times(1)
            .returning(move |path| block_on(ram_storage.get_all(path)));

        let metastore = FileBackedMetastore::for_test(Arc::new(mock_storage));
        let index_config = IndexConfig::for_test(index_id, "ram:///indexes/test-index");

        // Create index.
        let create_index_request =
            CreateIndexRequest::try_from_index_config(&index_config).unwrap();
        let metastore_error = metastore
            .create_index(create_index_request)
            .await
            .unwrap_err();
        assert!(matches!(metastore_error, MetastoreError::Internal { .. }));
        // Try fetch the not created index.
        let created_index_error = metastore
            .get_index(&IndexUid::new_with_random_ulid(index_id))
            .await
            .unwrap_err();
        assert!(matches!(
            created_index_error,
            MetastoreError::NotFound { .. }
        ));
    }

    #[tokio::test]
    async fn test_file_backed_metastore_create_index_when_storage_failing_before_metadata_put() {
        let mut mock_storage = MockStorage::default();
        let ram_storage = RamStorage::default();
        let ram_storage_clone = ram_storage.clone();
        let ram_storage_clone_2 = ram_storage.clone();
        let index_id = "test-index";
        let index_uid = IndexUid::new_with_random_ulid(index_id);

        mock_storage // remove this if we end up changing the semantics of create.
            .expect_exists()
            .returning(|_| Ok(false));
        mock_storage
            .expect_put()
            .times(4)
            .returning(move |path, put_payload| {
                assert!(
                    path == Path::new("manifest.json") || path == metastore_filepath("test-index")
                );
                if path == Path::new("manifest.json") {
                    return block_on(ram_storage_clone.put(path, put_payload));
                }
                Err(StorageErrorKind::Io
                    .with_error(anyhow::anyhow!("Oops. Some network problem maybe?")))
            });
        mock_storage
            .expect_get_all()
            .times(1)
            .returning(move |path| block_on(ram_storage.get_all(path)));
        let metastore = FileBackedMetastore::for_test(Arc::new(mock_storage));
        let index_config = IndexConfig::for_test(index_id, "ram:///indexes/test-index");

        // Create index
        let create_index_request =
            CreateIndexRequest::try_from_index_config(&index_config).unwrap();
        let metastore_error = metastore
            .create_index(create_index_request)
            .await
            .unwrap_err();
        assert!(matches!(metastore_error, MetastoreError::Internal { .. }));
        // Let's fetch the index, we expect an internal error as the index state is in `Creating`
        // state.
        let created_index_error = metastore.get_index(&index_uid.clone()).await.unwrap_err();
        assert!(matches!(
            created_index_error,
            MetastoreError::Internal { .. }
        ));
        // Check index state is in `Creating` in the manifest file.
        let storage = Arc::new(ram_storage_clone_2.clone());
        let manifest = load_or_create_manifest(&*storage).await.unwrap();
        assert!(matches!(
            *manifest.indexes.get(index_id).unwrap(),
            IndexStatus::Creating
        ));
        // Let's delete the index to clean states.
        let delete_request = DeleteIndexRequest {
            index_uid: Some(index_uid.clone()),
        };
        let deleted_index_error = metastore.delete_index(delete_request).await.unwrap_err();
        assert!(matches!(
            deleted_index_error,
            MetastoreError::NotFound { .. }
        ));
        let manifest = load_or_create_manifest(&*storage).await.unwrap();
        assert!(!manifest.indexes.contains_key(index_id));
        // Now we can expect an `IndexDoesNotExist` error.
        let created_index_error = metastore.get_index(&index_uid).await.unwrap_err();
        assert!(matches!(
            created_index_error,
            MetastoreError::NotFound { .. }
        ));
    }

    #[tokio::test]
    async fn test_file_backed_metastore_create_index_when_storage_failing_before_last_indexes_states_put()
     {
        let mut mock_storage = MockStorage::default();
        let ram_storage = RamStorage::default();
        let ram_storage_clone = ram_storage.clone();
        let index_id = "test-index";
        let mut indexes_json_valid_put = 1;

        mock_storage
            .expect_uri()
            .return_const(Uri::for_test("ram:///indexes"));
        mock_storage // remove this if we end up changing the semantics of create.
            .expect_exists()
            .returning(|_| Ok(false));
        mock_storage
            .expect_put()
            .times(3)
            .returning(move |path, put_payload| {
                assert!(
                    path == Path::new("manifest.json") || path == metastore_filepath("test-index")
                );
                if path == Path::new("manifest.json") {
                    if indexes_json_valid_put == 0 {
                        return Err(StorageErrorKind::Io.with_error(anyhow::anyhow!(
                            "oops. perhaps there are some network problems"
                        )));
                    }
                    indexes_json_valid_put -= 1;
                }
                block_on(ram_storage_clone.put(path, put_payload))
            });
        let metastore = FileBackedMetastore::for_test(Arc::new(mock_storage));
        let index_config = IndexConfig::for_test(index_id, "ram:///indexes/test-index");

        // Create index
        let metastore_error = metastore
            .create_index(CreateIndexRequest::try_from_index_config(&index_config).unwrap())
            .await
            .unwrap_err();
        assert!(matches!(metastore_error, MetastoreError::Internal { .. }));
        // Let's fetch the index, we expect an internal error as the index state is in `Creating`
        // state.
        let created_index_error = metastore
            .get_index(&IndexUid::new_with_random_ulid(index_id))
            .await
            .unwrap_err();
        assert!(matches!(
            created_index_error,
            MetastoreError::Internal { .. }
        ));
    }

    #[tokio::test]
    async fn test_file_backed_metastore_delete_index_when_storage_failing_before_metadata_delete() {
        let mut mock_storage = MockStorage::default();
        let ram_storage = RamStorage::default();
        let ram_storage_clone = ram_storage.clone();
        let index_id = "test-index";
        let index_uid = IndexUid::new_with_random_ulid(index_id);
        let index_metadata =
            IndexMetadata::for_test(&index_uid.index_id, "ram:///indexes/test-index");
        let index = FileBackedIndex::from(index_metadata);
        put_index_given_index_id(&ram_storage, &index, &index_uid.index_id)
            .await
            .unwrap();

        mock_storage
            .expect_uri()
            .return_const(Uri::for_test("ram:///indexes"));
        mock_storage // remove this if we end up changing the semantics of create.
            .expect_exists()
            .returning(|_| Ok(true));
        mock_storage // remove this if we end up changing the semantics of create.
            .expect_delete()
            .returning(|_| {
                Err(StorageErrorKind::Io
                    .with_error(anyhow::anyhow!("Oops. Some network problem maybe?")))
            });
        mock_storage
            .expect_put()
            .times(1)
            .returning(move |path, put_payload| block_on(ram_storage_clone.put(path, put_payload)));
        let metastore = FileBackedMetastore::for_test(Arc::new(mock_storage));

        // Delete index
        let delete_request = DeleteIndexRequest {
            index_uid: Some(index_uid.clone()),
        };
        let metastore_error = metastore.delete_index(delete_request).await.unwrap_err();
        assert!(matches!(metastore_error, MetastoreError::Internal { .. }));
        // Let's fetch the index, we expect an internal error as the index state is in `Deleting`
        // state.
        let created_index_error = metastore.get_index(&index_uid).await.unwrap_err();
        assert!(matches!(
            created_index_error,
            MetastoreError::Internal { .. }
        ));
    }

    #[tokio::test]
    async fn test_file_backed_metastore_delete_index_storage_failing_before_last_indexes_states_put()
     {
        let mut mock_storage = MockStorage::default();
        let ram_storage = RamStorage::default();
        let ram_storage_clone = ram_storage.clone();
        let index_id = "test-index";
        let index_uid = IndexUid::new_with_random_ulid(index_id);
        let index_metadata =
            IndexMetadata::for_test(&index_uid.index_id, "ram:///indexes/test-index");
        let index = FileBackedIndex::from(index_metadata);
        put_index_given_index_id(&ram_storage, &index, &index_uid.index_id)
            .await
            .unwrap();
        let mut indexes_json_valid_put = 1;
        mock_storage
            .expect_uri()
            .return_const(Uri::for_test("ram:///indexes"));
        mock_storage // remove this if we end up changing the semantics of create.
            .expect_exists()
            .returning(|_| Ok(true));
        mock_storage // remove this if we end up changing the semantics of create.
            .expect_delete()
            .returning(|_| Ok(()));
        mock_storage
            .expect_put()
            .times(2)
            .returning(move |path, put_payload| {
                assert!(path == Path::new("manifest.json"));
                if path == Path::new("manifest.json") {
                    if indexes_json_valid_put == 0 {
                        return Err(StorageErrorKind::Io.with_error(anyhow::anyhow!(
                            "oops. perhaps there are some network problems"
                        )));
                    }
                    indexes_json_valid_put -= 1;
                }
                block_on(ram_storage_clone.put(path, put_payload))
            });
        let metastore = FileBackedMetastore::for_test(Arc::new(mock_storage));

        // Delete index
        let delete_request = DeleteIndexRequest {
            index_uid: Some(index_uid.clone()),
        };
        let metastore_error = metastore.delete_index(delete_request).await.unwrap_err();
        assert!(matches!(metastore_error, MetastoreError::Internal { .. }));
        // Let's fetch the index, we expect an internal error as the index state is in `Deleting`
        // state.
        let created_index_error = metastore.get_index(&index_uid).await.unwrap_err();
        assert!(matches!(
            created_index_error,
            MetastoreError::Internal { .. }
        ));
    }

    #[tokio::test]
    async fn test_file_backed_metastore_get_list_indexes() -> MetastoreResult<()> {
        let index_id_creating = "test-index--creating";
        let index_id_alive = "testing-index--alive";
        let index_id_unregistered = "test-index--unregistered";
        let index_id_deleting = "test-index--deleting";

        let index_metadata_alive =
            IndexMetadata::for_test(index_id_alive, "ram:///indexes/test-index--alive");
        let index_metadata_unregistered = IndexMetadata::for_test(
            index_id_unregistered,
            "ram:///indexes/test-index--unregistered",
        );

        // Put index states into storage.
        let ram_storage = Arc::new(RamStorage::default());
        let mut manifest = Manifest::default();
        manifest
            .indexes
            .insert(index_id_creating.to_string(), IndexStatus::Creating);
        manifest
            .indexes
            .insert(index_id_alive.to_string(), IndexStatus::Active);
        manifest
            .indexes
            .insert(index_id_deleting.to_string(), IndexStatus::Deleting);
        save_manifest(&*ram_storage, &manifest).await.unwrap();

        let index_alive = FileBackedIndex::from(index_metadata_alive);
        let index_alive_unregistered = FileBackedIndex::from(index_metadata_unregistered);
        let index_uid_alive = index_alive.index_uid();
        let index_uid_unregistered = index_alive_unregistered.index_uid();

        // Put indexes metadatas.
        put_index_given_index_id(&*ram_storage, &index_alive, index_id_alive).await?;
        put_index_given_index_id(
            &*ram_storage,
            &index_alive_unregistered,
            index_id_unregistered,
        )
        .await?;

        // Fetch alive indexes metadatas.
        let metastore = FileBackedMetastore::try_new(ram_storage.clone(), None)
            .await
            .unwrap();
        let indexes_metadata = metastore
            .list_indexes_metadata(ListIndexesMetadataRequest::all())
            .await
            .unwrap()
            .deserialize_indexes_metadata()
            .await
            .unwrap();
        assert_eq!(indexes_metadata.len(), 1);

        // Fetch the index metadata not registered in index states json.
        metastore
            .get_index(&index_uid_unregistered.clone())
            .await
            .unwrap();

        // Now list indexes return 2 indexes metadatas as the metastore is now aware of
        // 2 alive indexes.
        let indexes_metadata = metastore
            .list_indexes_metadata(ListIndexesMetadataRequest::all())
            .await
            .unwrap()
            .deserialize_indexes_metadata()
            .await
            .unwrap();
        assert_eq!(indexes_metadata.len(), 2);

        // Let's delete indexes.
        let delete_request = DeleteIndexRequest {
            index_uid: Some(index_uid_alive.clone()),
        };
        metastore.delete_index(delete_request).await.unwrap();

        let delete_request = DeleteIndexRequest {
            index_uid: Some(index_uid_unregistered.clone()),
        };
        metastore.delete_index(delete_request).await.unwrap();
        let indexes_metadata = metastore
            .list_indexes_metadata(ListIndexesMetadataRequest::all())
            .await
            .unwrap()
            .deserialize_indexes_metadata()
            .await
            .unwrap();
        assert!(indexes_metadata.is_empty());

        Ok(())
    }

    #[tokio::test]
    async fn test_monotically_increasing_stamps_by_index() {
        let storage = RamStorage::default();
        let metastore = FileBackedMetastore::try_new(Arc::new(storage.clone()), None)
            .await
            .unwrap();
        let index_id = "test-index-increasing-stamps-by-index";
        let index_config = IndexConfig::for_test(
            index_id,
            "ram:///indexes/test-index-increasing-stamps-by-index",
        );
        let create_index_request =
            CreateIndexRequest::try_from_index_config(&index_config).unwrap();
        let create_index_response = metastore.create_index(create_index_request).await.unwrap();
        let index_uid = create_index_response.index_uid;

        let delete_query = DeleteQuery {
            start_timestamp: None,
            end_timestamp: None,
            index_uid,
            query_ast: serde_json::to_string(&qast_helper("harry potter", &["body"])).unwrap(),
        };

        let delete_task_1 = metastore
            .create_delete_task(delete_query.clone())
            .await
            .unwrap();
        assert_eq!(delete_task_1.opstamp, 1);
        let delete_task_2 = metastore
            .create_delete_task(delete_query.clone())
            .await
            .unwrap();
        assert_eq!(delete_task_2.opstamp, 2);

        // Create metastore with data already in the storage.
        let new_metastore = FileBackedMetastore::try_new(Arc::new(storage), None)
            .await
            .unwrap();
        let delete_task_3 = new_metastore
            .create_delete_task(delete_query.clone())
            .await
            .unwrap();
        assert_eq!(delete_task_3.opstamp, 3);

        // Create delete tasks on new index.
        let index_id_2 = "test-index-increasing-stamps-by-index-2";
        let index_config = IndexConfig::for_test(
            index_id_2,
            "ram:///indexes/test-index-increasing-stamps-by-index-2",
        );
        let create_index_request =
            CreateIndexRequest::try_from_index_config(&index_config).unwrap();
        let create_index_response = metastore.create_index(create_index_request).await.unwrap();
        let index_uid = create_index_response.index_uid;

        let delete_query = DeleteQuery {
            start_timestamp: None,
            end_timestamp: None,
            index_uid,
            query_ast: serde_json::to_string(&qast_helper("harry potter", &["body"])).unwrap(),
        };
        let delete_task_4 = metastore.create_delete_task(delete_query).await.unwrap();
        assert_eq!(delete_task_4.opstamp, 1);
    }

    #[tokio::test]
    async fn test_create_index_template_rollback() {
        let mut mock_storage = MockStorage::default();

        mock_storage
            .expect_uri()
            .return_const(Uri::for_test("ram:///indexes"));

        mock_storage
            .expect_put()
            .once()
            .returning(|path, _payload| {
                assert_eq!(path, Path::new(MANIFEST_FILE_NAME));
                Ok(())
            });

        mock_storage
            .expect_put()
            .once()
            .returning(|path, _payload| {
                assert_eq!(path, Path::new(MANIFEST_FILE_NAME));
                let io_error = StorageErrorKind::Io.with_error(anyhow::anyhow!("IO error"));
                Err(io_error)
            });

        let metastore = FileBackedMetastore::for_test(Arc::new(mock_storage));

        let index_template = IndexTemplate::for_test("test-template", &["test-index-foo*"], 100);
        let index_template_json = serde_json::to_string(&index_template).unwrap();
        let create_index_template_request = CreateIndexTemplateRequest {
            index_template_json,
            overwrite: false,
        };
        metastore
            .create_index_template(create_index_template_request)
            .await
            .unwrap();
        {
            let state = metastore.state.read().await;
            assert_eq!(state.templates.len(), 1);
            state.template_matcher.find_match("test-index-foo").unwrap();
        }
        let index_template = IndexTemplate::for_test("test-template", &["test-index-bar*"], 100);
        let index_template_json = serde_json::to_string(&index_template).unwrap();
        let create_index_template_request = CreateIndexTemplateRequest {
            index_template_json,
            overwrite: true,
        };
        metastore
            .create_index_template(create_index_template_request)
            .await
            .unwrap_err();
        {
            let state = metastore.state.read().await;
            assert_eq!(state.templates.len(), 1);
            state.template_matcher.find_match("test-index-foo").unwrap();
        }
    }

    #[tokio::test]
    async fn test_delete_index_templates_rollback() {
        let mut mock_storage = MockStorage::default();

        mock_storage
            .expect_uri()
            .return_const(Uri::for_test("ram:///indexes"));

        mock_storage
            .expect_put()
            .once()
            .returning(|path, _payload| {
                assert_eq!(path, Path::new(MANIFEST_FILE_NAME));
                Ok(())
            });

        mock_storage
            .expect_put()
            .once()
            .returning(|path, _payload| {
                assert_eq!(path, Path::new(MANIFEST_FILE_NAME));
                let io_error = StorageErrorKind::Io.with_error(anyhow::anyhow!("IO error"));
                Err(io_error)
            });

        let metastore = FileBackedMetastore::for_test(Arc::new(mock_storage));

        let index_template = IndexTemplate::for_test("test-template", &["test-index-foo*"], 100);
        let index_template_json = serde_json::to_string(&index_template).unwrap();
        let create_index_template_request = CreateIndexTemplateRequest {
            index_template_json,
            overwrite: false,
        };
        metastore
            .create_index_template(create_index_template_request)
            .await
            .unwrap();
        {
            let state = metastore.state.read().await;
            assert_eq!(state.templates.len(), 1);
            state.template_matcher.find_match("test-index-foo").unwrap();
        }
        let delete_index_templates_request = DeleteIndexTemplatesRequest {
            template_ids: vec![index_template.template_id],
        };
        metastore
            .delete_index_templates(delete_index_templates_request)
            .await
            .unwrap_err();
        {
            let state = metastore.state.read().await;
            assert_eq!(state.templates.len(), 1);
            state.template_matcher.find_match("test-index-foo").unwrap();

            assert!(
                state
                    .template_matcher
                    .find_match("test-index-bar")
                    .is_none()
            );
        }
    }
}


================================================
FILE: quickwit/quickwit-metastore/src/metastore/file_backed/state.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::HashMap;
use std::sync::Arc;
use std::time::Duration;

use quickwit_config::{IndexTemplate, IndexTemplateId};
use quickwit_proto::metastore::MetastoreResult;
use quickwit_proto::types::IndexId;
use quickwit_storage::Storage;
use uuid::Uuid;

use super::LazyIndexStatus;
use super::index_template_matcher::IndexTemplateMatcher;
use super::lazy_file_backed_index::LazyFileBackedIndex;
use super::manifest::{IndexStatus, Manifest};

#[derive(Default)]
pub(super) struct MetastoreState {
    pub indexes: HashMap<IndexId, LazyIndexStatus>,
    pub templates: HashMap<IndexTemplateId, IndexTemplate>,
    pub template_matcher: IndexTemplateMatcher,
    pub identity: Uuid,
}

impl MetastoreState {
    pub fn try_from_manifest(
        storage: Arc<dyn Storage>,
        manifest: Manifest,
        polling_interval_opt: Option<Duration>,
    ) -> MetastoreResult<Self> {
        let indexes = manifest
            .indexes
            .into_iter()
            .map(|(index_id, index_status)| match index_status {
                IndexStatus::Creating => (index_id, LazyIndexStatus::Creating),
                IndexStatus::Deleting => (index_id, LazyIndexStatus::Deleting),
                IndexStatus::Active => {
                    let lazy_index = LazyFileBackedIndex::new(
                        storage.clone(),
                        index_id.clone(),
                        polling_interval_opt,
                        None,
                    );
                    (index_id, LazyIndexStatus::Active(lazy_index))
                }
            })
            .collect();

        let template_matcher =
            IndexTemplateMatcher::try_from_index_templates(manifest.templates.values())?;

        let state = Self {
            indexes,
            templates: manifest.templates,
            template_matcher,
            identity: manifest.identity,
        };
        Ok(state)
    }

    pub fn as_manifest(&self) -> Manifest {
        let indexes = self
            .indexes
            .iter()
            .map(|(index_id, index_state)| {
                let index_status = match index_state {
                    LazyIndexStatus::Creating => IndexStatus::Creating,
                    LazyIndexStatus::Active(_) => IndexStatus::Active,
                    LazyIndexStatus::Deleting => IndexStatus::Deleting,
                };
                (index_id.clone(), index_status)
            })
            .collect();
        let templates = self.templates.clone();
        Manifest {
            indexes,
            templates,
            identity: self.identity,
        }
    }
}


================================================
FILE: quickwit/quickwit-metastore/src/metastore/file_backed/store_operations.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::path::{Path, PathBuf};

use quickwit_proto::metastore::{EntityKind, MetastoreError, MetastoreResult, serde_utils};
use quickwit_storage::{Storage, StorageError, StorageErrorKind};

use crate::metastore::file_backed::file_backed_index::FileBackedIndex;

/// Index metastore file managed by [`FileBackedMetastore`](crate::FileBackedMetastore).
pub(super) const METASTORE_FILE_NAME: &str = "metastore.json";

/// Path to the metadata file from the given index ID.
pub(super) fn metastore_filepath(index_id: &str) -> PathBuf {
    Path::new(index_id).join(METASTORE_FILE_NAME)
}

fn convert_error(index_id: &str, storage_error: StorageError) -> MetastoreError {
    match storage_error.kind() {
        StorageErrorKind::NotFound => MetastoreError::NotFound(EntityKind::Index {
            index_id: index_id.to_string(),
        }),
        StorageErrorKind::Unauthorized => MetastoreError::Forbidden {
            message: "the request credentials do not allow for this operation".to_string(),
        },
        _ => MetastoreError::Internal {
            message: "failed to get index files".to_string(),
            cause: storage_error.to_string(),
        },
    }
}

pub(super) async fn load_index(
    storage: &dyn Storage,
    index_id: &str,
) -> MetastoreResult<FileBackedIndex> {
    let metastore_filepath = metastore_filepath(index_id);

    let content = storage
        .get_all(&metastore_filepath)
        .await
        .map_err(|storage_err| convert_error(index_id, storage_err))?;

    let index: FileBackedIndex = serde_utils::from_json_bytes(&content)?;

    if index.index_id() != index_id {
        return Err(MetastoreError::Internal {
            message: "inconsistent manifest: index_id mismatch".to_string(),
            cause: format!(
                "expected index_id `{}`, but found `{}`",
                index_id,
                index.index_id()
            ),
        });
    }
    Ok(index)
}

pub(super) async fn index_exists(storage: &dyn Storage, index_id: &str) -> MetastoreResult<bool> {
    let metastore_filepath = metastore_filepath(index_id);
    let exists = storage
        .exists(&metastore_filepath)
        .await
        .map_err(|storage_error| convert_error(index_id, storage_error))?;
    Ok(exists)
}

/// Serializes the `Index` object and stores the data on the storage.
///
/// Do not call this method. Instead, call `put_index`.
/// The point of having two methods here is just to make it usable in a unit test.
pub(super) async fn put_index_given_index_id(
    storage: &dyn Storage,
    index: &FileBackedIndex,
    index_id: &str,
) -> MetastoreResult<()> {
    // Serialize Index.
    let content: Vec<u8> = serde_utils::to_json_bytes_pretty(index)?;
    let metastore_filepath = metastore_filepath(index_id);
    // Put data back into storage.
    storage
        .put(&metastore_filepath, Box::new(content))
        .await
        .map_err(|storage_err| convert_error(index_id, storage_err))?;
    Ok(())
}

/// Serializes the `Index` object and stores the data on the storage.
pub(super) async fn put_index(
    storage: &dyn Storage,
    index: &FileBackedIndex,
) -> MetastoreResult<()> {
    put_index_given_index_id(storage, index, index.index_id()).await
}

/// Serializes the Index and stores the data on the storage.
pub(super) async fn delete_index(storage: &dyn Storage, index_id: &str) -> MetastoreResult<()> {
    let metastore_filepath = metastore_filepath(index_id);

    let file_exists = storage
        .exists(&metastore_filepath)
        .await
        .map_err(|storage_err| convert_error(index_id, storage_err))?;

    if !file_exists {
        return Err(MetastoreError::NotFound(EntityKind::Index {
            index_id: index_id.to_string(),
        }));
    }
    // Put data back into storage.
    storage
        .delete(&metastore_filepath)
        .await
        .map_err(|storage_error| match storage_error.kind() {
            StorageErrorKind::Unauthorized => MetastoreError::Forbidden {
                message: "the request credentials do not allow for this operation".to_string(),
            },
            _ => MetastoreError::Internal {
                message: format!(
                    "failed to delete metastore file located at `{}/{}`",
                    storage.uri(),
                    metastore_filepath.display()
                ),
                cause: storage_error.to_string(),
            },
        })?;
    Ok(())
}


================================================
FILE: quickwit/quickwit-metastore/src/metastore/index_metadata/mod.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

pub(crate) mod serialize;

use std::collections::HashMap;
use std::collections::hash_map::Entry;

use quickwit_common::uri::Uri;
use quickwit_config::{
    DocMapping, IndexConfig, IndexingSettings, IngestSettings, RetentionPolicy, SearchSettings,
    SourceConfig, prepare_doc_mapping_update,
};
use quickwit_proto::metastore::{EntityKind, MetastoreError, MetastoreResult};
use quickwit_proto::types::{IndexUid, SourceId};
use serde::{Deserialize, Serialize};
use serialize::VersionedIndexMetadata;
use time::OffsetDateTime;

use crate::checkpoint::IndexCheckpoint;

/// An index metadata carries all meta data about an index.
#[derive(Clone, Debug, Serialize, Deserialize, PartialEq)]
#[serde(into = "VersionedIndexMetadata")]
#[serde(try_from = "VersionedIndexMetadata")]
pub struct IndexMetadata {
    /// Index incarnation id
    pub index_uid: IndexUid,
    /// Index configuration
    pub index_config: IndexConfig,
    /// Per-source map of checkpoint for the given index.
    pub checkpoint: IndexCheckpoint,
    /// Time at which the index was created.
    pub create_timestamp: i64,
    /// Sources
    pub sources: HashMap<SourceId, SourceConfig>,
}

impl IndexMetadata {
    /// Panics if `index_config` is missing `index_uri`.
    pub fn new(index_config: IndexConfig) -> Self {
        let index_uid = IndexUid::new_with_random_ulid(&index_config.index_id);
        IndexMetadata::new_with_index_uid(index_uid, index_config)
    }

    /// Panics if `index_config` is missing `index_uri`.
    pub fn new_with_index_uid(index_uid: IndexUid, index_config: IndexConfig) -> Self {
        IndexMetadata {
            index_uid,
            index_config,
            checkpoint: Default::default(),
            create_timestamp: OffsetDateTime::now_utc().unix_timestamp(),
            sources: HashMap::default(),
        }
    }

    /// Returns an [`IndexMetadata`] object with multiple hard coded values for tests.
    ///
    /// An incarnation id of `0` will be used to complete the index id into a index uuid.
    #[cfg(any(test, feature = "testsuite"))]
    pub fn for_test(index_id: &str, index_uri: &str) -> Self {
        let index_uid = IndexUid::for_test(index_id, 0);
        let mut index_metadata = IndexMetadata::new(IndexConfig::for_test(index_id, index_uri));
        index_metadata.index_uid = index_uid;
        index_metadata
    }

    /// Extracts the index config from the index metadata object.
    pub fn into_index_config(self) -> IndexConfig {
        self.index_config
    }

    /// Accessor to the index config.
    pub fn index_config(&self) -> &IndexConfig {
        &self.index_config
    }

    /// Accessor to the index config's index id for convenience.
    pub fn index_id(&self) -> &str {
        &self.index_config.index_id
    }

    /// Accessor to the index config's index uri for convenience.
    pub fn index_uri(&self) -> &Uri {
        &self.index_config().index_uri
    }

    /// Updates the index config.
    ///
    /// Returns whether a mutation occurred.
    pub fn update_index_config(
        &mut self,
        doc_mapping: DocMapping,
        indexing_settings: IndexingSettings,
        ingest_settings: IngestSettings,
        search_settings: SearchSettings,
        retention_policy_opt: Option<RetentionPolicy>,
    ) -> MetastoreResult<bool> {
        let (updated_doc_mapping, mut mutation_occurred) = prepare_doc_mapping_update(
            doc_mapping,
            &self.index_config.doc_mapping,
            &search_settings,
        )
        .map_err(|error| MetastoreError::InvalidArgument {
            message: error.to_string(),
        })?;
        self.index_config.doc_mapping = updated_doc_mapping;
        if indexing_settings != self.index_config.indexing_settings {
            self.index_config.indexing_settings = indexing_settings;
            mutation_occurred = true;
        }
        if ingest_settings != self.index_config.ingest_settings {
            self.index_config.ingest_settings = ingest_settings;
            mutation_occurred = true;
        }
        if search_settings != self.index_config.search_settings {
            self.index_config.search_settings = search_settings;
            mutation_occurred = true;
        }
        if retention_policy_opt != self.index_config.retention_policy_opt {
            self.index_config.retention_policy_opt = retention_policy_opt;
            mutation_occurred = true;
        }
        Ok(mutation_occurred)
    }

    /// Adds a source to the index. Returns an error if the source already exists.
    pub fn add_source(&mut self, source_config: SourceConfig) -> MetastoreResult<()> {
        match self.sources.entry(source_config.source_id.clone()) {
            Entry::Occupied(_) => Err(MetastoreError::AlreadyExists(EntityKind::Source {
                index_id: self.index_id().to_string(),
                source_id: source_config.source_id,
            })),
            Entry::Vacant(entry) => {
                self.checkpoint.add_source(&source_config.source_id);
                entry.insert(source_config);
                Ok(())
            }
        }
    }

    /// Adds a source to the index. Returns whether a mutation occurred and an
    /// error if the source doesn't exist.
    pub fn update_source(&mut self, source_config: SourceConfig) -> MetastoreResult<bool> {
        match self.sources.entry(source_config.source_id.clone()) {
            Entry::Occupied(mut entry) => {
                if entry.get() == &source_config {
                    return Ok(false);
                }
                entry.insert(source_config);
                Ok(true)
            }
            Entry::Vacant(_) => Err(MetastoreError::NotFound(EntityKind::Source {
                index_id: self.index_id().to_string(),
                source_id: source_config.source_id,
            })),
        }
    }

    pub(crate) fn toggle_source(&mut self, source_id: &str, enable: bool) -> MetastoreResult<bool> {
        let Some(source_config) = self.sources.get_mut(source_id) else {
            return Err(MetastoreError::NotFound(EntityKind::Source {
                index_id: self.index_id().to_string(),
                source_id: source_id.to_string(),
            }));
        };
        let mutation_occurred = source_config.enabled != enable;
        source_config.enabled = enable;
        Ok(mutation_occurred)
    }

    /// Deletes a source from the index.
    pub(crate) fn delete_source(&mut self, source_id: &str) -> MetastoreResult<()> {
        self.sources.remove(source_id).ok_or_else(|| {
            MetastoreError::NotFound(EntityKind::Source {
                index_id: self.index_id().to_string(),
                source_id: source_id.to_string(),
            })
        })?;
        self.checkpoint.remove_source(source_id);
        Ok(())
    }
}

#[cfg(any(test, feature = "testsuite"))]
impl quickwit_config::TestableForRegression for IndexMetadata {
    fn sample_for_regression() -> IndexMetadata {
        use std::collections::BTreeMap;

        use quickwit_proto::types::Position;

        use crate::checkpoint::{PartitionId, SourceCheckpoint, SourceCheckpointDelta};

        let index_config = IndexConfig::sample_for_regression();

        let mut source_checkpoint = SourceCheckpoint::default();
        let delta = SourceCheckpointDelta::from_partition_delta(
            PartitionId::from(0i64),
            Position::Beginning,
            Position::offset(42u64),
        )
        .unwrap();
        source_checkpoint.try_apply_delta(delta).unwrap();

        let per_source_checkpoint: BTreeMap<String, SourceCheckpoint> =
            BTreeMap::from_iter([("kafka-source".to_string(), source_checkpoint)]);
        let checkpoint = IndexCheckpoint::from(per_source_checkpoint);

        let mut index_metadata = IndexMetadata {
            index_uid: IndexUid::for_test(&index_config.index_id, 1),
            index_config,
            checkpoint,
            create_timestamp: 1789,
            sources: Default::default(),
        };
        index_metadata
            .add_source(SourceConfig::sample_for_regression())
            .unwrap();
        index_metadata
    }

    fn assert_equality(&self, other: &Self) {
        self.index_config().assert_equality(other.index_config());
        assert_eq!(self.checkpoint, other.checkpoint);
        assert_eq!(self.create_timestamp, other.create_timestamp);
        assert_eq!(self.sources, other.sources);
    }
}

#[cfg(test)]
mod tests {
    use quickwit_doc_mapper::Mode;
    use quickwit_proto::types::DocMappingUid;

    use super::*;

    #[test]
    fn test_update_index_config() {
        let current_index_config = IndexConfig::for_test("test-index", "s3://test-index");
        let mut current_index_metadata = IndexMetadata::new(current_index_config.clone());

        let mutation_occurred = current_index_metadata
            .update_index_config(
                current_index_config.doc_mapping.clone(),
                current_index_config.indexing_settings.clone(),
                current_index_config.ingest_settings.clone(),
                current_index_config.search_settings.clone(),
                current_index_config.retention_policy_opt.clone(),
            )
            .unwrap();
        assert!(!mutation_occurred);

        let new_search_settings = SearchSettings {
            default_search_fields: vec!["message".to_string(), "status".to_string()],
        };
        let mutation_occurred = current_index_metadata
            .update_index_config(
                current_index_config.doc_mapping.clone(),
                current_index_config.indexing_settings.clone(),
                current_index_config.ingest_settings.clone(),
                new_search_settings,
                current_index_config.retention_policy_opt.clone(),
            )
            .unwrap();
        assert!(mutation_occurred);
        assert_eq!(
            current_index_metadata
                .index_config()
                .search_settings
                .default_search_fields,
            ["message", "status"]
        );
    }

    #[test]
    fn test_update_doc_mapping() {
        let current_index_config = IndexConfig::for_test("test-index", "s3://test-index");
        let mut current_index_metadata = IndexMetadata::new(current_index_config.clone());

        let mut new_doc_mapping = current_index_config.doc_mapping.clone();
        new_doc_mapping.doc_mapping_uid = DocMappingUid::random();
        new_doc_mapping.timestamp_field = Some("ts".to_string()); // This is set to `timestamp` for the current doc mapping.

        current_index_metadata
            .update_index_config(
                new_doc_mapping,
                current_index_config.indexing_settings.clone(),
                current_index_config.ingest_settings.clone(),
                current_index_config.search_settings.clone(),
                current_index_config.retention_policy_opt.clone(),
            )
            .unwrap_err();

        let mut new_doc_mapping = current_index_config.doc_mapping.clone();
        let new_doc_mapping_uid = DocMappingUid::random();
        new_doc_mapping.doc_mapping_uid = new_doc_mapping_uid;
        new_doc_mapping.mode = Mode::Strict;

        let mutation_occurred = current_index_metadata
            .update_index_config(
                new_doc_mapping,
                current_index_config.indexing_settings,
                current_index_config.ingest_settings,
                current_index_config.search_settings,
                current_index_config.retention_policy_opt,
            )
            .unwrap();
        assert!(mutation_occurred);
        assert_eq!(
            current_index_metadata
                .index_config()
                .doc_mapping
                .doc_mapping_uid,
            new_doc_mapping_uid
        );
        assert_eq!(
            current_index_metadata.index_config().doc_mapping.mode,
            Mode::Strict
        );
    }
}


================================================
FILE: quickwit/quickwit-metastore/src/metastore/index_metadata/serialize.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::HashMap;

use quickwit_config::{IndexConfig, SourceConfig};
use quickwit_proto::types::IndexUid;
use serde::{self, Deserialize, Serialize};

use crate::IndexMetadata;
use crate::checkpoint::IndexCheckpoint;
use crate::split_metadata::utc_now_timestamp;

#[derive(Clone, Debug, Serialize, Deserialize, utoipa::ToSchema)]
#[serde(tag = "version")]
pub(crate) enum VersionedIndexMetadata {
    #[serde(rename = "0.9")]
    // Retro compatibility.
    #[serde(alias = "0.8")]
    #[serde(alias = "0.7")]
    V0_8(IndexMetadataV0_8),
}

impl From<IndexMetadata> for VersionedIndexMetadata {
    fn from(index_metadata: IndexMetadata) -> Self {
        VersionedIndexMetadata::V0_8(index_metadata.into())
    }
}

impl TryFrom<VersionedIndexMetadata> for IndexMetadata {
    type Error = anyhow::Error;

    fn try_from(index_metadata: VersionedIndexMetadata) -> anyhow::Result<Self> {
        match index_metadata {
            // When we have more than one version, you should chain version conversion.
            // ie. Implement conversion from V_k -> V_{k+1}
            VersionedIndexMetadata::V0_8(v8) => v8.try_into(),
        }
    }
}

impl From<IndexMetadata> for IndexMetadataV0_8 {
    fn from(index_metadata: IndexMetadata) -> Self {
        let sources: Vec<SourceConfig> = index_metadata.sources.values().cloned().collect();
        Self {
            index_uid: index_metadata.index_uid,
            index_config: index_metadata.index_config,
            checkpoint: index_metadata.checkpoint,
            create_timestamp: index_metadata.create_timestamp,
            sources,
        }
    }
}

#[derive(Clone, Debug, Serialize, Deserialize, utoipa::ToSchema)]
pub(crate) struct IndexMetadataV0_8 {
    #[schema(value_type = String)]
    pub index_uid: IndexUid,
    #[schema(value_type = VersionedIndexConfig)]
    pub index_config: IndexConfig,
    #[schema(value_type = Object)]
    pub checkpoint: IndexCheckpoint,
    #[serde(default = "utc_now_timestamp")]
    pub create_timestamp: i64,
    #[schema(value_type = Vec<VersionedSourceConfig>)]
    pub sources: Vec<SourceConfig>,
}

impl TryFrom<IndexMetadataV0_8> for IndexMetadata {
    type Error = anyhow::Error;

    fn try_from(v0_8: IndexMetadataV0_8) -> anyhow::Result<Self> {
        let mut sources: HashMap<String, SourceConfig> = Default::default();
        for source in v0_8.sources {
            if sources.contains_key(&source.source_id) {
                anyhow::bail!("source `{}` is defined more than once", source.source_id);
            }
            sources.insert(source.source_id.clone(), source);
        }
        Ok(Self {
            index_uid: v0_8.index_uid,
            index_config: v0_8.index_config,
            checkpoint: v0_8.checkpoint,
            create_timestamp: v0_8.create_timestamp,
            sources,
        })
    }
}


================================================
FILE: quickwit/quickwit-metastore/src/metastore/mod.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

pub mod file_backed;
pub(crate) mod index_metadata;
#[cfg(feature = "postgres")]
pub mod postgres;

pub mod control_plane_metastore;

use std::cmp::Ordering;
use std::ops::{Bound, RangeInclusive};

use async_trait::async_trait;
use bytes::Bytes;
use futures::TryStreamExt;
pub use index_metadata::IndexMetadata;
use itertools::Itertools;
use quickwit_common::thread_pool::run_cpu_intensive;
use quickwit_config::{
    DocMapping, FileSourceParams, IndexConfig, IndexingSettings, IngestSettings, RetentionPolicy,
    SearchSettings, SourceConfig, SourceParams,
};
use quickwit_doc_mapper::tag_pruning::TagFilterAst;
use quickwit_proto::metastore::{
    AddSourceRequest, CreateIndexRequest, CreateIndexResponse, DeleteTask, IndexMetadataFailure,
    IndexMetadataRequest, IndexMetadataResponse, IndexesMetadataResponse,
    ListIndexesMetadataResponse, ListSplitsRequest, ListSplitsResponse, MetastoreError,
    MetastoreResult, MetastoreService, MetastoreServiceClient, MetastoreServiceStream,
    PublishSplitsRequest, StageSplitsRequest, UpdateIndexRequest, UpdateSourceRequest, serde_utils,
};
use quickwit_proto::types::{IndexUid, NodeId, SplitId};
use time::OffsetDateTime;

use crate::checkpoint::IndexCheckpointDelta;
use crate::{Split, SplitMetadata, SplitState};

/// Splits batch size returned by the stream splits API
pub(crate) const STREAM_SPLITS_CHUNK_SIZE: usize = 100;

/// An extended trait for [`MetastoreService`].
#[async_trait]
pub trait MetastoreServiceExt: MetastoreService {
    /// Returns whether the index `index_id` exists in the metastore.
    async fn index_exists(&mut self, index_id: &str) -> MetastoreResult<bool> {
        let request = IndexMetadataRequest::for_index_id(index_id.to_string());
        match self.index_metadata(request).await {
            Ok(_) => Ok(true),
            Err(MetastoreError::NotFound { .. }) => Ok(false),
            Err(error) => Err(error),
        }
    }
}

impl MetastoreServiceExt for MetastoreServiceClient {}

/// Helper trait to collect splits from a [`MetastoreServiceStream<ListSplitsResponse>`].
#[async_trait]
pub trait MetastoreServiceStreamSplitsExt {
    /// Collects all splits from a [`MetastoreServiceStream<ListSplitsResponse>`].
    async fn collect_splits(mut self) -> MetastoreResult<Vec<Split>>;

    /// Collects all splits metadata from a [`MetastoreServiceStream<ListSplitsResponse>`].
    async fn collect_splits_metadata(mut self) -> MetastoreResult<Vec<SplitMetadata>>;

    /// Collects all splits IDs from a [`MetastoreServiceStream<ListSplitsResponse>`].
    async fn collect_split_ids(mut self) -> MetastoreResult<Vec<SplitId>>;
}

#[async_trait]
impl MetastoreServiceStreamSplitsExt for MetastoreServiceStream<ListSplitsResponse> {
    async fn collect_splits(mut self) -> MetastoreResult<Vec<Split>> {
        let mut all_splits = Vec::new();
        while let Some(list_splits_response) = self.try_next().await? {
            let splits = list_splits_response.deserialize_splits().await?;
            all_splits.extend(splits);
        }
        Ok(all_splits)
    }

    async fn collect_splits_metadata(mut self) -> MetastoreResult<Vec<SplitMetadata>> {
        let mut all_splits_metadata = Vec::new();
        while let Some(list_splits_response) = self.try_next().await? {
            let splits_metadata = list_splits_response.deserialize_splits_metadata().await?;
            all_splits_metadata.extend(splits_metadata);
        }
        Ok(all_splits_metadata)
    }

    async fn collect_split_ids(mut self) -> MetastoreResult<Vec<SplitId>> {
        let mut all_splits = Vec::new();
        while let Some(list_splits_response) = self.try_next().await? {
            let splits = list_splits_response.deserialize_split_ids().await?;
            all_splits.extend(splits);
        }
        Ok(all_splits)
    }
}

/// Helper trait to build a [`CreateIndexRequest`] and deserialize its payload.
pub trait CreateIndexRequestExt {
    /// Creates a new [`CreateIndexRequest`] from an [`IndexConfig`].
    fn try_from_index_config(index_config: &IndexConfig) -> MetastoreResult<CreateIndexRequest>;

    /// Creates a new [`CreateIndexRequest`] from an [`IndexConfig`] and a list of [`SourceConfig`].
    fn try_from_index_and_source_configs(
        index_config: &IndexConfig,
        source_configs: &[SourceConfig],
    ) -> MetastoreResult<CreateIndexRequest>;

    /// Deserializes the `index_config_json` field of a [`CreateIndexRequest`] into an
    /// [`IndexConfig`].
    fn deserialize_index_config(&self) -> MetastoreResult<IndexConfig>;

    /// Deserializes the `source_configs_json` field of a [`CreateIndexRequest`] into an
    /// `Vec` of [`SourceConfig`].
    fn deserialize_source_configs(&self) -> MetastoreResult<Vec<SourceConfig>>;
}

impl CreateIndexRequestExt for CreateIndexRequest {
    fn try_from_index_config(index_config: &IndexConfig) -> MetastoreResult<CreateIndexRequest> {
        let index_config_json = serde_utils::to_json_str(index_config)?;
        let source_configs_json = Vec::new();
        let request = Self {
            index_config_json,
            source_configs_json,
        };
        Ok(request)
    }

    fn try_from_index_and_source_configs(
        index_config: &IndexConfig,
        source_configs: &[SourceConfig],
    ) -> MetastoreResult<CreateIndexRequest> {
        let index_config_json = serde_utils::to_json_str(index_config)?;
        let source_configs_json: Vec<String> = source_configs
            .iter()
            .map(serde_utils::to_json_str)
            .collect::<MetastoreResult<_>>()?;
        let request = Self {
            index_config_json,
            source_configs_json,
        };
        Ok(request)
    }

    fn deserialize_index_config(&self) -> MetastoreResult<IndexConfig> {
        serde_utils::from_json_str(&self.index_config_json)
    }

    fn deserialize_source_configs(&self) -> MetastoreResult<Vec<SourceConfig>> {
        self.source_configs_json
            .iter()
            .map(|source_config_json| serde_utils::from_json_str(source_config_json))
            .collect()
    }
}

/// Helper trait to deserialize the payload of a [`CreateIndexResponse`].
pub trait CreateIndexResponseExt {
    /// Deserializes the `index_metadata_json` field of a [`CreateIndexResponse`] into an
    /// [`IndexMetadata`].
    fn deserialize_index_metadata(&self) -> MetastoreResult<IndexMetadata>;
}

impl CreateIndexResponseExt for CreateIndexResponse {
    fn deserialize_index_metadata(&self) -> MetastoreResult<IndexMetadata> {
        serde_utils::from_json_str(&self.index_metadata_json)
    }
}

/// Helper trait to build a [`UpdateIndexRequest`] and deserialize its payload.
pub trait UpdateIndexRequestExt {
    /// Creates a new [`UpdateIndexRequest`] from the different updated fields.
    fn try_from_updates(
        index_uid: impl Into<IndexUid>,
        doc_mapping: &DocMapping,
        indexing_settings: &IndexingSettings,
        ingest_settings: &IngestSettings,
        search_settings: &SearchSettings,
        retention_policy_opt: &Option<RetentionPolicy>,
    ) -> MetastoreResult<UpdateIndexRequest>;

    /// Deserializes the `doc_mapping_json` field of an `[UpdateIndexRequest]` into a
    /// [`DocMapping`] object.
    fn deserialize_doc_mapping(&self) -> MetastoreResult<DocMapping>;

    /// Deserializes the `indexing_settings_json` field of an [`UpdateIndexRequest`] into a
    /// [`IndexingSettings`] object.
    fn deserialize_indexing_settings(&self) -> MetastoreResult<IndexingSettings>;

    /// Deserializes the `ingest_settings_json` field of an [`UpdateIndexRequest`] into a
    /// [`IngestSettings`] object.
    fn deserialize_ingest_settings(&self) -> MetastoreResult<IngestSettings>;

    /// Deserializes the `search_settings_json` field of an [`UpdateIndexRequest`] into a
    /// [`SearchSettings`] object.
    fn deserialize_search_settings(&self) -> MetastoreResult<SearchSettings>;

    /// Deserializes the `retention_policy_json` field of an [`UpdateIndexRequest`] into a
    /// [`RetentionPolicy`] object.
    fn deserialize_retention_policy(&self) -> MetastoreResult<Option<RetentionPolicy>>;
}

impl UpdateIndexRequestExt for UpdateIndexRequest {
    fn try_from_updates(
        index_uid: impl Into<IndexUid>,
        doc_mapping: &DocMapping,
        indexing_settings: &IndexingSettings,
        ingest_settings: &IngestSettings,
        search_settings: &SearchSettings,
        retention_policy_opt: &Option<RetentionPolicy>,
    ) -> MetastoreResult<UpdateIndexRequest> {
        let doc_mapping_json = serde_utils::to_json_str(doc_mapping)?;
        let indexing_settings_json = serde_utils::to_json_str(indexing_settings)?;
        let ingest_settings_json = serde_utils::to_json_str(ingest_settings)?;
        let search_settings_json = serde_utils::to_json_str(search_settings)?;
        let retention_policy_json_opt = retention_policy_opt
            .as_ref()
            .map(serde_utils::to_json_str)
            .transpose()?;

        let update_request = UpdateIndexRequest {
            index_uid: Some(index_uid.into()),
            doc_mapping_json,
            indexing_settings_json,
            ingest_settings_json,
            search_settings_json,
            retention_policy_json_opt,
        };
        Ok(update_request)
    }
    fn deserialize_doc_mapping(&self) -> MetastoreResult<DocMapping> {
        serde_utils::from_json_str(&self.doc_mapping_json)
    }

    fn deserialize_indexing_settings(&self) -> MetastoreResult<IndexingSettings> {
        serde_utils::from_json_str(&self.indexing_settings_json)
    }

    fn deserialize_ingest_settings(&self) -> MetastoreResult<IngestSettings> {
        serde_utils::from_json_str(&self.ingest_settings_json)
    }

    fn deserialize_search_settings(&self) -> MetastoreResult<SearchSettings> {
        serde_utils::from_json_str(&self.search_settings_json)
    }

    fn deserialize_retention_policy(&self) -> MetastoreResult<Option<RetentionPolicy>> {
        self.retention_policy_json_opt
            .as_ref()
            .map(|policy_json| serde_utils::from_json_str(policy_json))
            .transpose()
    }
}

/// Helper trait to build a [`IndexMetadataResponse`] and deserialize its payload.
pub trait IndexMetadataResponseExt {
    /// Creates a new [`IndexMetadataResponse`] from an [`IndexMetadata`].
    fn try_from_index_metadata(
        index_metadata: &IndexMetadata,
    ) -> MetastoreResult<IndexMetadataResponse>;

    /// Deserializes the `index_metadata_serialized_json` field of a [`IndexMetadataResponse`] into
    /// an [`IndexMetadata`].
    fn deserialize_index_metadata(&self) -> MetastoreResult<IndexMetadata>;
}

impl IndexMetadataResponseExt for IndexMetadataResponse {
    fn try_from_index_metadata(index_metadata: &IndexMetadata) -> MetastoreResult<Self> {
        let index_metadata_serialized_json = serde_utils::to_json_str(index_metadata)?;
        let response = Self {
            index_metadata_serialized_json,
        };
        Ok(response)
    }

    fn deserialize_index_metadata(&self) -> MetastoreResult<IndexMetadata> {
        serde_utils::from_json_str(&self.index_metadata_serialized_json)
    }
}

/// Helper trait to build a [`IndexesMetadataResponse`] and deserialize its payload.
#[async_trait]
pub trait IndexesMetadataResponseExt {
    /// Creates a new `IndexesMetadataResponse` from a `Vec` of [`IndexMetadata`].
    async fn try_from_indexes_metadata(
        indexes_metadata: Vec<IndexMetadata>,
        failures: Vec<IndexMetadataFailure>,
    ) -> MetastoreResult<IndexesMetadataResponse>;

    /// Deserializes the payload of an `IndexesMetadataResponse` into a `Vec`` of [`IndexMetadata`].
    async fn deserialize_indexes_metadata(self) -> MetastoreResult<Vec<IndexMetadata>>;

    /// Creates a new `IndexesMetadataResponse` from a `Vec` of [`IndexMetadata`] synchronously.
    #[cfg(any(test, feature = "testsuite"))]
    fn for_test(
        indexes_metadata: Vec<IndexMetadata>,
        failures: Vec<IndexMetadataFailure>,
    ) -> IndexesMetadataResponse {
        use futures::executor;

        executor::block_on(Self::try_from_indexes_metadata(indexes_metadata, failures)).unwrap()
    }
}

#[async_trait]
impl IndexesMetadataResponseExt for IndexesMetadataResponse {
    async fn try_from_indexes_metadata(
        indexes_metadata: Vec<IndexMetadata>,
        failures: Vec<IndexMetadataFailure>,
    ) -> MetastoreResult<Self> {
        let indexes_metadata_json_zstd = run_cpu_intensive(move || {
            serde_utils::to_json_zstd(&indexes_metadata, 0).map(Bytes::from)
        })
        .await
        .map_err(|join_error| MetastoreError::Internal {
            message: "failed to serialize indexes metadata".to_string(),
            cause: join_error.to_string(),
        })??;
        let response = Self {
            indexes_metadata_json_zstd,
            failures,
        };
        Ok(response)
    }

    async fn deserialize_indexes_metadata(self) -> MetastoreResult<Vec<IndexMetadata>> {
        run_cpu_intensive(move || serde_utils::from_json_zstd(&self.indexes_metadata_json_zstd))
            .await
            .map_err(|join_error| MetastoreError::Internal {
                message: "failed to deserialize indexes metadata".to_string(),
                cause: join_error.to_string(),
            })?
    }
}

/// Helper trait to build a `ListIndexesResponse` and deserialize its payload.
#[async_trait]
pub trait ListIndexesMetadataResponseExt {
    /// Creates a new `ListIndexesMetadataResponse` from a `Vec` of [`IndexMetadata`].
    async fn try_from_indexes_metadata(
        indexes_metadata: Vec<IndexMetadata>,
    ) -> MetastoreResult<ListIndexesMetadataResponse>;

    /// Deserializes the payload of a `ListIndexesResponse` into a `Vec`` of [`IndexMetadata`].
    async fn deserialize_indexes_metadata(self) -> MetastoreResult<Vec<IndexMetadata>>;

    /// Creates a new `ListIndexesMetadataResponse` from a `Vec` of [`IndexMetadata`] synchronously.
    #[cfg(any(test, feature = "testsuite"))]
    fn for_test(indexes_metadata: Vec<IndexMetadata>) -> ListIndexesMetadataResponse {
        use futures::executor;

        executor::block_on(Self::try_from_indexes_metadata(indexes_metadata)).unwrap()
    }
}

#[async_trait]
impl ListIndexesMetadataResponseExt for ListIndexesMetadataResponse {
    async fn try_from_indexes_metadata(
        indexes_metadata: Vec<IndexMetadata>,
    ) -> MetastoreResult<Self> {
        let indexes_metadata_json_zstd = run_cpu_intensive(move || {
            serde_utils::to_json_zstd(&indexes_metadata, 0).map(Bytes::from)
        })
        .await
        .map_err(|join_error| MetastoreError::Internal {
            message: "failed to serialize indexes metadata".to_string(),
            cause: join_error.to_string(),
        })??;
        let response = Self {
            indexes_metadata_json_zstd,
            indexes_metadata_json_opt: None,
        };
        Ok(response)
    }

    async fn deserialize_indexes_metadata(self) -> MetastoreResult<Vec<IndexMetadata>> {
        run_cpu_intensive(move || {
            if let Some(indexes_metadata_json) = &self.indexes_metadata_json_opt {
                return serde_utils::from_json_str(indexes_metadata_json);
            };
            serde_utils::from_json_zstd(&self.indexes_metadata_json_zstd)
        })
        .await
        .map_err(|join_error| MetastoreError::Internal {
            message: "failed to deserialize indexes metadata".to_string(),
            cause: join_error.to_string(),
        })?
    }
}

/// Helper trait to build a [`AddSourceRequest`] and deserialize its payload.
pub trait AddSourceRequestExt {
    /// Creates a new [`AddSourceRequest`] from a [`SourceConfig`].
    fn try_from_source_config(
        index_uid: impl Into<IndexUid>,
        source_config: &SourceConfig,
    ) -> MetastoreResult<AddSourceRequest>;

    /// Deserializes the `source_config_json` field of a [`AddSourceRequest`] into a
    /// [`SourceConfig`].
    fn deserialize_source_config(&self) -> MetastoreResult<SourceConfig>;
}

impl AddSourceRequestExt for AddSourceRequest {
    fn try_from_source_config(
        index_uid: impl Into<IndexUid>,
        source_config: &SourceConfig,
    ) -> MetastoreResult<AddSourceRequest> {
        let source_config_json = serde_utils::to_json_str(&source_config)?;
        let request = Self {
            index_uid: Some(index_uid.into()),
            source_config_json,
        };
        Ok(request)
    }

    fn deserialize_source_config(&self) -> MetastoreResult<SourceConfig> {
        serde_utils::from_json_str(&self.source_config_json)
    }
}

/// Helper trait to build a [`UpdateSourceRequest`] and deserialize its payload.
pub trait UpdateSourceRequestExt {
    /// Creates a new [`UpdateSourceRequest`] from a [`SourceConfig`].
    fn try_from_source_config(
        index_uid: impl Into<IndexUid>,
        source_config: &SourceConfig,
    ) -> MetastoreResult<UpdateSourceRequest>;

    /// Deserializes the `source_config_json` field of a [`UpdateSourceRequest`] into a
    /// [`SourceConfig`].
    fn deserialize_source_config(&self) -> MetastoreResult<SourceConfig>;
}

impl UpdateSourceRequestExt for UpdateSourceRequest {
    fn try_from_source_config(
        index_uid: impl Into<IndexUid>,
        source_config: &SourceConfig,
    ) -> MetastoreResult<UpdateSourceRequest> {
        let source_config_json = serde_utils::to_json_str(&source_config)?;
        let request = Self {
            index_uid: Some(index_uid.into()),
            source_config_json,
        };
        Ok(request)
    }

    fn deserialize_source_config(&self) -> MetastoreResult<SourceConfig> {
        serde_utils::from_json_str(&self.source_config_json)
    }
}
/// Helper trait to build a [`DeleteTask`] and deserialize its payload.
pub trait StageSplitsRequestExt {
    /// Creates a new [`StageSplitsRequest`] from a [`SplitMetadata`].
    fn try_from_split_metadata(
        index_uid: impl Into<IndexUid>,
        split_metadata: &SplitMetadata,
    ) -> MetastoreResult<StageSplitsRequest>;

    /// Creates a new [`StageSplitsRequest`] from a list of [`SplitMetadata`].
    fn try_from_splits_metadata(
        index_uid: impl Into<IndexUid>,
        splits_metadata: impl IntoIterator<Item = SplitMetadata>,
    ) -> MetastoreResult<StageSplitsRequest>;

    /// Deserializes the `split_metadata_list_serialized_json` field of a [`StageSplitsRequest`]
    /// into a list of [`SplitMetadata`].
    fn deserialize_splits_metadata(&self) -> MetastoreResult<Vec<SplitMetadata>>;
}

impl StageSplitsRequestExt for StageSplitsRequest {
    fn try_from_split_metadata(
        index_uid: impl Into<IndexUid>,
        split_metadata: &SplitMetadata,
    ) -> MetastoreResult<StageSplitsRequest> {
        let split_metadata_list_serialized_json = serde_utils::to_json_str(&[split_metadata])?;
        let request = Self {
            index_uid: Some(index_uid.into()),
            split_metadata_list_serialized_json,
        };
        Ok(request)
    }

    fn try_from_splits_metadata(
        index_uid: impl Into<IndexUid>,
        splits_metadata: impl IntoIterator<Item = SplitMetadata>,
    ) -> MetastoreResult<StageSplitsRequest> {
        let splits_metadata: Vec<SplitMetadata> = splits_metadata.into_iter().collect();
        let split_metadata_list_serialized_json = serde_utils::to_json_str(&splits_metadata)?;
        let request = Self {
            index_uid: Some(index_uid.into()),
            split_metadata_list_serialized_json,
        };
        Ok(request)
    }

    fn deserialize_splits_metadata(&self) -> MetastoreResult<Vec<SplitMetadata>> {
        serde_utils::from_json_str(&self.split_metadata_list_serialized_json)
    }
}

/// Helper trait to build a [`ListSplitsRequest`] and deserialize its payload.
pub trait ListSplitsRequestExt {
    /// Creates a new [`ListSplitsRequest`] from an [`IndexUid`].
    fn try_from_index_uid(index_uid: IndexUid) -> MetastoreResult<ListSplitsRequest>;

    /// Creates a new [`ListSplitsRequest`] from a [`ListSplitsQuery`].
    fn try_from_list_splits_query(
        list_splits_query: &ListSplitsQuery,
    ) -> MetastoreResult<ListSplitsRequest>;

    /// Deserializes the `query_json` field of a [`ListSplitsRequest`] into a [`ListSplitsQuery`].
    fn deserialize_list_splits_query(&self) -> MetastoreResult<ListSplitsQuery>;
}

impl ListSplitsRequestExt for ListSplitsRequest {
    fn try_from_index_uid(index_uid: IndexUid) -> MetastoreResult<ListSplitsRequest> {
        let list_splits_query = ListSplitsQuery::for_index(index_uid);
        Self::try_from_list_splits_query(&list_splits_query)
    }

    fn try_from_list_splits_query(
        list_splits_query: &ListSplitsQuery,
    ) -> MetastoreResult<ListSplitsRequest> {
        let query_json = serde_utils::to_json_str(&list_splits_query)?;
        let request = Self { query_json };
        Ok(request)
    }

    fn deserialize_list_splits_query(&self) -> MetastoreResult<ListSplitsQuery> {
        let list_splits_query = serde_utils::from_json_str(&self.query_json)?;
        Ok(list_splits_query)
    }
}

/// Helper trait to build a [`ListSplitsResponse`] and deserialize its payload.
#[async_trait]
pub trait ListSplitsResponseExt {
    /// Creates a new [`ListSplitsResponse`] from a list of [`Split`].
    fn try_from_splits(
        splits: impl IntoIterator<Item = Split>,
    ) -> MetastoreResult<ListSplitsResponse>;

    /// Deserializes the `splits_serialized_json` field of a [`ListSplitsResponse`] into a list of
    /// [`Split`].
    async fn deserialize_splits(self) -> MetastoreResult<Vec<Split>>;

    /// Deserializes the `splits_serialized_json` field of a [`ListSplitsResponse`] into a list of
    /// [`SplitMetadata`].
    async fn deserialize_splits_metadata(self) -> MetastoreResult<Vec<SplitMetadata>>;

    /// Deserializes the `splits_serialized_json` field of a [`ListSplitsResponse`] into a list of
    /// [`SplitId`].
    async fn deserialize_split_ids(self) -> MetastoreResult<Vec<SplitId>>;

    /// Creates an empty [`ListSplitsResponse`].
    fn empty() -> Self;
}

/// Helper trait for [`PublishSplitsRequest`] to deserialize its payload.
pub trait PublishSplitsRequestExt {
    /// Deserializes the `index_checkpoint_delta_json_opt` field of a [`PublishSplitsRequest`] into
    /// an [`Option<IndexCheckpointDelta>`].
    fn deserialize_index_checkpoint(&self) -> MetastoreResult<Option<IndexCheckpointDelta>>;
}

impl PublishSplitsRequestExt for PublishSplitsRequest {
    fn deserialize_index_checkpoint(&self) -> MetastoreResult<Option<IndexCheckpointDelta>> {
        self.index_checkpoint_delta_json_opt
            .as_ref()
            .map(|value| serde_utils::from_json_str(value))
            .transpose()
    }
}

#[async_trait]
impl ListSplitsResponseExt for ListSplitsResponse {
    fn empty() -> Self {
        Self {
            splits_serialized_json: "[]".to_string(),
        }
    }

    fn try_from_splits(splits: impl IntoIterator<Item = Split>) -> MetastoreResult<Self> {
        let splits_serialized_json = serde_utils::to_json_str(&splits.into_iter().collect_vec())?;
        let response = Self {
            splits_serialized_json,
        };
        Ok(response)
    }

    async fn deserialize_splits(self) -> MetastoreResult<Vec<Split>> {
        run_cpu_intensive(move || serde_utils::from_json_str(&self.splits_serialized_json))
            .await
            .map_err(|join_error| MetastoreError::Internal {
                message: "failed to deserialize splits".to_string(),
                cause: join_error.to_string(),
            })?
    }

    async fn deserialize_splits_metadata(self) -> MetastoreResult<Vec<SplitMetadata>> {
        let splits = self.deserialize_splits().await?;
        let splits_metadata = splits
            .into_iter()
            .map(|split| split.split_metadata)
            .collect();
        Ok(splits_metadata)
    }

    async fn deserialize_split_ids(self) -> MetastoreResult<Vec<SplitId>> {
        let splits = self.deserialize_splits().await?;
        let split_ids = splits
            .into_iter()
            .map(|split| split.split_metadata.split_id)
            .collect();
        Ok(split_ids)
    }
}

#[derive(Debug, Clone, serde::Serialize, serde::Deserialize)]
/// A query builder for listing splits within the metastore.
pub struct ListSplitsQuery {
    /// A non-empty list of index UIDs for which to fetch the splits, or
    /// None if we want splits from all indexes.
    pub index_uids: Option<Vec<IndexUid>>,

    /// A specific node ID to filter by.
    pub node_id: Option<NodeId>,

    /// The maximum number of splits to retrieve.
    pub limit: Option<usize>,

    /// The number of splits to skip.
    pub offset: Option<usize>,

    /// A specific split state(s) to filter by.
    pub split_states: Vec<SplitState>,

    /// A specific set of tag(s) to filter by.
    pub tags: Option<TagFilterAst>,

    /// The time range to filter by.
    pub time_range: FilterRange<i64>,

    /// The maximum time range end to filter by.
    pub max_time_range_end: Option<i64>,

    /// The delete opstamp range to filter by.
    pub delete_opstamp: FilterRange<u64>,

    /// The update timestamp range to filter by.
    pub update_timestamp: FilterRange<i64>,

    /// The create timestamp range to filter by.
    pub create_timestamp: FilterRange<i64>,

    /// The datetime at which you include or exclude mature splits.
    pub mature: Bound<OffsetDateTime>,

    /// Sorts the splits by staleness, i.e. by delete opstamp and publish timestamp in ascending
    /// order.
    pub sort_by: SortBy,

    /// Only return splits whose (index_uid, split_id) are lexicographically after this split
    pub after_split: Option<(IndexUid, SplitId)>,
}

#[derive(Debug, Clone, PartialEq, serde::Serialize, serde::Deserialize)]
pub enum SortBy {
    None,
    Staleness,
    IndexUid,
}

impl SortBy {
    fn compare(&self, left_split: &Split, right_split: &Split) -> Ordering {
        match self {
            SortBy::None => Ordering::Equal,
            SortBy::Staleness => left_split
                .split_metadata
                .delete_opstamp
                .cmp(&right_split.split_metadata.delete_opstamp)
                .then_with(|| {
                    left_split
                        .publish_timestamp
                        .cmp(&right_split.publish_timestamp)
                }),
            SortBy::IndexUid => left_split
                .split_metadata
                .index_uid
                .cmp(&right_split.split_metadata.index_uid)
                .then_with(|| {
                    left_split
                        .split_metadata
                        .split_id
                        .cmp(&right_split.split_metadata.split_id)
                }),
        }
    }
}

#[allow(unused_attributes)]
impl ListSplitsQuery {
    /// Creates a new [`ListSplitsQuery`] for the designated index.
    pub fn for_index(index_uid: IndexUid) -> Self {
        Self {
            index_uids: Some(vec![index_uid]),
            node_id: None,
            limit: None,
            offset: None,
            split_states: Vec::new(),
            tags: None,
            time_range: Default::default(),
            max_time_range_end: None,
            delete_opstamp: Default::default(),
            update_timestamp: Default::default(),
            create_timestamp: Default::default(),
            mature: Bound::Unbounded,
            sort_by: SortBy::None,
            after_split: None,
        }
    }

    /// Creates a new [`ListSplitsQuery`] from a non-empty list of index UIDs.
    /// Returns None if the list is empty.
    pub fn try_from_index_uids(index_uids: Vec<IndexUid>) -> Option<Self> {
        if index_uids.is_empty() {
            return None;
        }
        Some(Self {
            index_uids: Some(index_uids),
            node_id: None,
            limit: None,
            offset: None,
            split_states: Vec::new(),
            tags: None,
            time_range: Default::default(),
            max_time_range_end: None,
            delete_opstamp: Default::default(),
            update_timestamp: Default::default(),
            create_timestamp: Default::default(),
            mature: Bound::Unbounded,
            sort_by: SortBy::None,
            after_split: None,
        })
    }

    /// Creates a new [`ListSplitsQuery`] for all indexes.
    pub fn for_all_indexes() -> Self {
        Self {
            index_uids: None,
            node_id: None,
            limit: None,
            offset: None,
            split_states: Vec::new(),
            tags: None,
            time_range: Default::default(),
            max_time_range_end: None,
            delete_opstamp: Default::default(),
            update_timestamp: Default::default(),
            create_timestamp: Default::default(),
            mature: Bound::Unbounded,
            sort_by: SortBy::None,
            after_split: None,
        }
    }

    /// Selects splits produced by the specified node.
    pub fn with_node_id(mut self, node_id: NodeId) -> Self {
        self.node_id = Some(node_id);
        self
    }

    /// Sets the maximum number of splits to retrieve.
    pub fn with_limit(mut self, n: usize) -> Self {
        self.limit = Some(n);
        self
    }

    /// Sets the number of splits to skip.
    pub fn with_offset(mut self, n: usize) -> Self {
        self.offset = Some(n);
        self
    }

    /// Selects splits which have the given split state.
    pub fn with_split_state(mut self, state: SplitState) -> Self {
        self.split_states.push(state);
        self
    }

    /// Selects splits which have the any of the following split state.
    pub fn with_split_states(mut self, states: impl AsRef<[SplitState]>) -> Self {
        self.split_states.extend_from_slice(states.as_ref());
        self
    }

    /// Selects splits which match the given tag filter.
    pub fn with_tags_filter(mut self, tags: TagFilterAst) -> Self {
        self.tags = Some(tags);
        self
    }

    /// Sets the field's lower bound to match values that are
    /// *less than or equal to* the provided value.
    pub fn with_time_range_end_lte(mut self, v: i64) -> Self {
        self.time_range.end = Bound::Included(v);
        self
    }

    /// Sets the field's lower bound to match values that are
    /// *less than* the provided value.
    pub fn with_time_range_end_lt(mut self, v: i64) -> Self {
        self.time_range.end = Bound::Excluded(v);
        self
    }

    /// Sets the field's upper bound to match values that are
    /// *greater than or equal to* the provided value.
    pub fn with_time_range_start_gte(mut self, v: i64) -> Self {
        self.time_range.start = Bound::Included(v);
        self
    }

    /// Sets the field's upper bound to match values that are
    /// *greater than* the provided value.
    pub fn with_time_range_start_gt(mut self, v: i64) -> Self {
        self.time_range.start = Bound::Excluded(v);
        self
    }

    /// Retains only splits with a time range end that is
    /// *less than or equal to* the provided value.
    pub fn with_max_time_range_end(mut self, v: i64) -> Self {
        self.max_time_range_end = Some(v);
        self
    }

    /// Sets the field's lower bound to match values that are
    /// *less than or equal to* the provided value.
    pub fn with_delete_opstamp_lte(mut self, v: u64) -> Self {
        self.delete_opstamp.end = Bound::Included(v);
        self
    }

    /// Sets the field's lower bound to match values that are
    /// *less than* the provided value.
    pub fn with_delete_opstamp_lt(mut self, v: u64) -> Self {
        self.delete_opstamp.end = Bound::Excluded(v);
        self
    }

    /// Sets the field's upper bound to match values that are
    /// *greater than or equal to* the provided value.
    pub fn with_delete_opstamp_gte(mut self, v: u64) -> Self {
        self.delete_opstamp.start = Bound::Included(v);
        self
    }

    /// Sets the field's upper bound to match values that are
    /// *greater than* the provided value.
    pub fn with_delete_opstamp_gt(mut self, v: u64) -> Self {
        self.delete_opstamp.start = Bound::Excluded(v);
        self
    }

    /// Sets the field's lower bound to match values that are
    /// *less than or equal to* the provided value.
    pub fn with_update_timestamp_lte(mut self, v: i64) -> Self {
        self.update_timestamp.end = Bound::Included(v);
        self
    }

    /// Sets the field's lower bound to match values that are
    /// *less than* the provided value.
    pub fn with_update_timestamp_lt(mut self, v: i64) -> Self {
        self.update_timestamp.end = Bound::Excluded(v);
        self
    }

    /// Sets the field's upper bound to match values that are
    /// *greater than or equal to* the provided value.
    pub fn with_update_timestamp_gte(mut self, v: i64) -> Self {
        self.update_timestamp.start = Bound::Included(v);
        self
    }

    /// Sets the field's upper bound to match values that are
    /// *greater than* the provided value.
    pub fn with_update_timestamp_gt(mut self, v: i64) -> Self {
        self.update_timestamp.start = Bound::Excluded(v);
        self
    }

    /// Sets the field's lower bound to match values that are
    /// *less than or equal to* the provided value.
    pub fn with_create_timestamp_lte(mut self, v: i64) -> Self {
        self.create_timestamp.end = Bound::Included(v);
        self
    }

    /// Sets the field's lower bound to match values that are
    /// *less than* the provided value.
    pub fn with_create_timestamp_lt(mut self, v: i64) -> Self {
        self.create_timestamp.end = Bound::Excluded(v);
        self
    }

    /// Sets the field's upper bound to match values that are
    /// *greater than or equal to* the provided value.
    pub fn with_create_timestamp_gte(mut self, v: i64) -> Self {
        self.create_timestamp.start = Bound::Included(v);
        self
    }

    /// Sets the field's upper bound to match values that are
    /// *greater than* the provided value.
    pub fn with_create_timestamp_gt(mut self, v: i64) -> Self {
        self.create_timestamp.start = Bound::Excluded(v);
        self
    }

    /// Retains splits that are mature at the given datetime.
    pub fn retain_mature(mut self, now: OffsetDateTime) -> Self {
        self.mature = Bound::Included(now);
        self
    }

    /// Retains splits that are immature at the given datetime.
    pub fn retain_immature(mut self, now: OffsetDateTime) -> Self {
        self.mature = Bound::Excluded(now);
        self
    }

    /// Sorts the splits by staleness, i.e. by delete opstamp and publish timestamp in ascending
    /// order.
    pub fn sort_by_staleness(mut self) -> Self {
        self.sort_by = SortBy::Staleness;
        self
    }

    /// Sorts the splits by index_uid and split_id.
    pub fn sort_by_index_uid(mut self) -> Self {
        self.sort_by = SortBy::IndexUid;
        self
    }

    /// Only return splits whose (index_uid, split_id) are lexicographically after this split.
    /// This is only useful if results are sorted by index_uid and split_id.
    pub fn after_split(mut self, split_meta: &SplitMetadata) -> Self {
        self.after_split = Some((split_meta.index_uid.clone(), split_meta.split_id.clone()));
        self
    }
}

#[derive(Debug, Clone, serde::Serialize, serde::Deserialize)]
/// A range containing the upper and lower bounds to filter documents by.
pub struct FilterRange<T> {
    /// The lower bound of the filter.
    pub start: Bound<T>,
    /// The upper bound of the filter.
    pub end: Bound<T>,
}

impl<T: PartialEq + PartialOrd> FilterRange<T> {
    /// Checks if both the upper and lower bound are `Bound::Unbounded`.
    pub fn is_unbounded(&self) -> bool {
        self.start == Bound::Unbounded && self.end == Bound::Unbounded
    }

    /// Checks if the provided value lies within the upper and lower bounds
    /// of the range.
    pub fn contains(&self, value: &T) -> bool {
        if self.is_unbounded() {
            return true;
        }

        let lower_check = match &self.start {
            Bound::Unbounded => true,
            Bound::Included(left) => left <= value,
            Bound::Excluded(left) => left < value,
        };

        let upper_check = match &self.end {
            Bound::Unbounded => true,
            Bound::Included(left) => left >= value,
            Bound::Excluded(left) => left > value,
        };

        lower_check && upper_check
    }

    /// Checks if the provided range overlaps with the range.
    pub fn overlaps_with(&self, range: RangeInclusive<T>) -> bool {
        if self.is_unbounded() {
            return true;
        }

        let lower_check = match &self.start {
            Bound::Unbounded => true,
            Bound::Included(left) => left <= range.end(),
            Bound::Excluded(left) => left < range.end(),
        };

        let upper_check = match &self.end {
            Bound::Unbounded => true,
            Bound::Included(left) => left >= range.start(),
            Bound::Excluded(left) => left > range.start(),
        };

        lower_check && upper_check
    }
}

// The `Default` derive implementation imposes a restriction
// for `T` to also implement Default when this is not required.
impl<T> Default for FilterRange<T> {
    fn default() -> Self {
        Self {
            start: Bound::Unbounded,
            end: Bound::Unbounded,
        }
    }
}

/// Maps the given source params to whether checkpoints should be stored in the index metadata
/// (false) or the shard table (true)
fn use_shard_api(params: &SourceParams) -> bool {
    match params {
        SourceParams::File(FileSourceParams::Filepath(_)) => false,
        SourceParams::File(FileSourceParams::Notifications(_)) => true,
        SourceParams::Ingest => true,
        SourceParams::IngestApi => false,
        SourceParams::IngestCli => false,
        SourceParams::Kafka(_) => false,
        SourceParams::Kinesis(_) => false,
        SourceParams::PubSub(_) => false,
        SourceParams::Pulsar(_) => false,
        SourceParams::Stdin => panic!("stdin cannot be checkpointed"),
        SourceParams::Vec(_) => false,
        SourceParams::Void(_) => false,
    }
}

#[cfg(test)]
mod tests {
    use super::*;

    #[test]
    fn test_filter_contains() {
        let filter = FilterRange {
            start: Bound::Unbounded,
            end: Bound::Excluded(50),
        };
        assert!(!filter.contains(&50));
        assert!(filter.contains(&0));
        assert!(filter.contains(&49));

        let filter = FilterRange {
            start: Bound::Included(50),
            end: Bound::Unbounded,
        };
        assert!(filter.contains(&50));
        assert!(filter.contains(&51));
        assert!(!filter.contains(&0));

        let filter = FilterRange {
            start: Bound::Included(50),
            end: Bound::Excluded(75),
        };
        assert!(filter.contains(&50));
        assert!(filter.contains(&51));
        assert!(!filter.contains(&0));
        assert!(!filter.contains(&75));
        assert!(filter.contains(&74));
    }

    #[test]
    fn test_overlaps_with() {
        let filter = FilterRange {
            start: Bound::Unbounded,
            end: Bound::Excluded(50),
        };
        assert!(filter.overlaps_with(0..=50));
        assert!(filter.overlaps_with(0..=51));
        assert!(filter.overlaps_with(32..=63));
        assert!(filter.overlaps_with(32..=32));
        assert!(!filter.overlaps_with(51..=76));
        assert!(!filter.overlaps_with(50..=76));

        let filter = FilterRange {
            start: Bound::Unbounded,
            end: Bound::Included(50),
        };
        assert!(filter.overlaps_with(0..=50));
        assert!(filter.overlaps_with(0..=51));
        assert!(filter.overlaps_with(50..=76));
        assert!(!filter.overlaps_with(51..=76));

        let filter = FilterRange {
            start: Bound::Excluded(50),
            end: Bound::Unbounded,
        };
        assert!(filter.overlaps_with(51..=75));
        assert!(filter.overlaps_with(0..=51));
        assert!(filter.overlaps_with(51..=76));
        assert!(filter.overlaps_with(50..=76));
        assert!(!filter.overlaps_with(0..=49));
        assert!(!filter.overlaps_with(0..=50));

        let filter = FilterRange {
            start: Bound::Included(50),
            end: Bound::Unbounded,
        };
        assert!(filter.overlaps_with(51..=75));
        assert!(filter.overlaps_with(0..=51));
        assert!(filter.overlaps_with(51..=76));
        assert!(filter.overlaps_with(50..=76));
        assert!(filter.overlaps_with(0..=50));
        assert!(!filter.overlaps_with(0..=49));

        let filter = FilterRange {
            start: Bound::Included(50),
            end: Bound::Excluded(75),
        };
        assert!(filter.overlaps_with(51..=75));
        assert!(filter.overlaps_with(0..=51));
        assert!(filter.overlaps_with(45..=76));
        assert!(filter.overlaps_with(50..=76));
        assert!(filter.overlaps_with(0..=50));
        assert!(filter.overlaps_with(74..=124));
        assert!(!filter.overlaps_with(0..=49));
        assert!(!filter.overlaps_with(75..=124));
    }

    #[tokio::test]
    async fn test_list_splits_response_empty() {
        let response = ListSplitsResponse::empty();
        let splits = response.deserialize_splits().await.unwrap();
        assert!(splits.is_empty());
    }

    #[tokio::test]
    async fn test_list_indexes_metadata_response_serde() {
        let response = ListIndexesMetadataResponse::try_from_indexes_metadata(Vec::new())
            .await
            .unwrap();
        let indexes_metadata = response.deserialize_indexes_metadata().await.unwrap();
        assert!(indexes_metadata.is_empty());

        let index_metadata = IndexMetadata::for_test("test-index", "ram:///test-index");
        let response = ListIndexesMetadataResponse::for_test(vec![index_metadata.clone()]);
        let indexes_metadata = response.deserialize_indexes_metadata().await.unwrap();
        assert_eq!(indexes_metadata.len(), 1);
        assert_eq!(indexes_metadata[0], index_metadata);
    }

    #[tokio::test]
    async fn test_list_indexes_metadata_backward_compatible_serde() {
        let indexes_metadata_json = serde_json::to_string(&Vec::<IndexMetadata>::new()).unwrap();
        let response = ListIndexesMetadataResponse {
            indexes_metadata_json_opt: Some(indexes_metadata_json),
            indexes_metadata_json_zstd: Bytes::from_static(b""),
        };
        let indexes_metadata = response.deserialize_indexes_metadata().await.unwrap();
        assert!(indexes_metadata.is_empty());

        let index_metadata = IndexMetadata::for_test("test-index", "ram:///test-index");
        let indexes_metadata_json = serde_json::to_string(&vec![index_metadata.clone()]).unwrap();
        let response = ListIndexesMetadataResponse {
            indexes_metadata_json_opt: Some(indexes_metadata_json),
            indexes_metadata_json_zstd: Bytes::from_static(b""),
        };
        let indexes_metadata = response.deserialize_indexes_metadata().await.unwrap();
        assert_eq!(indexes_metadata.len(), 1);
        assert_eq!(indexes_metadata[0], index_metadata);
    }
}


================================================
FILE: quickwit/quickwit-metastore/src/metastore/postgres/error.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use quickwit_proto::metastore::{EntityKind, MetastoreError};
use sqlx::postgres::PgDatabaseError;
use tracing::error;

// https://www.postgresql.org/docs/current/errcodes-appendix.html
mod pg_error_codes {
    pub const FOREIGN_KEY_VIOLATION: &str = "23503";
    pub const UNIQUE_VIOLATION: &str = "23505";
}

pub(super) fn convert_sqlx_err(index_id: &str, sqlx_error: sqlx::Error) -> MetastoreError {
    match &sqlx_error {
        sqlx::Error::Database(boxed_db_error) => {
            let pg_db_error = boxed_db_error.downcast_ref::<PgDatabaseError>();
            let pg_error_code = pg_db_error.code();
            let pg_error_table = pg_db_error.table();

            match (pg_error_code, pg_error_table) {
                (pg_error_codes::FOREIGN_KEY_VIOLATION, _) => {
                    MetastoreError::NotFound(EntityKind::Index {
                        index_id: index_id.to_string(),
                    })
                }
                (pg_error_codes::UNIQUE_VIOLATION, Some(table)) if table.starts_with("indexes") => {
                    MetastoreError::AlreadyExists(EntityKind::Index {
                        index_id: index_id.to_string(),
                    })
                }
                (pg_error_codes::UNIQUE_VIOLATION, _) => {
                    error!(error=?boxed_db_error, "postgresql-error");
                    MetastoreError::Internal {
                        message: "unique key violation".to_string(),
                        cause: format!("DB error {boxed_db_error:?}"),
                    }
                }
                _ => {
                    error!(error=?boxed_db_error, "postgresql-error");
                    MetastoreError::Db {
                        message: boxed_db_error.to_string(),
                    }
                }
            }
        }
        _ => {
            error!(error=?sqlx_error, "an error has occurred in the database operation");
            MetastoreError::Db {
                message: sqlx_error.to_string(),
            }
        }
    }
}


================================================
FILE: quickwit/quickwit-metastore/src/metastore/postgres/factory.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::HashMap;
use std::sync::Arc;

use async_trait::async_trait;
use quickwit_common::uri::Uri;
use quickwit_config::{MetastoreBackend, MetastoreConfig};
use quickwit_proto::metastore::MetastoreServiceClient;
use tokio::sync::Mutex;
use tracing::debug;

use crate::{MetastoreFactory, MetastoreResolverError, PostgresqlMetastore};

#[derive(Clone, Default)]
pub struct PostgresqlMetastoreFactory {
    // Under normal conditions of use, this cache will contain a single `Metastore`.
    //
    // In contrast to the file-backed metastore, we use a strong pointer here, so that the
    // `Metastore` doesn't get dropped. This is done in order to keep the underlying connection
    // pool to Postgres alive.
    cache: Arc<Mutex<HashMap<Uri, MetastoreServiceClient>>>,
}

impl PostgresqlMetastoreFactory {
    async fn get_from_cache(&self, uri: &Uri) -> Option<MetastoreServiceClient> {
        let cache_lock = self.cache.lock().await;
        cache_lock.get(uri).cloned()
    }

    /// If there is a valid entry in the cache to begin with, we trash the new
    /// one and return the old one.
    ///
    /// This way we make sure that we keep only one instance associated
    /// to the key `uri` outside of this struct.
    async fn cache_metastore(
        &self,
        uri: Uri,
        metastore: MetastoreServiceClient,
    ) -> MetastoreServiceClient {
        let mut cache_lock = self.cache.lock().await;
        if let Some(metastore) = cache_lock.get(&uri) {
            return metastore.clone();
        }
        cache_lock.insert(uri, metastore.clone());
        metastore
    }
}

#[async_trait]
impl MetastoreFactory for PostgresqlMetastoreFactory {
    fn backend(&self) -> MetastoreBackend {
        MetastoreBackend::PostgreSQL
    }

    async fn resolve(
        &self,
        metastore_config: &MetastoreConfig,
        uri: &Uri,
    ) -> Result<MetastoreServiceClient, MetastoreResolverError> {
        if let Some(metastore) = self.get_from_cache(uri).await {
            debug!("using metastore from cache");
            return Ok(metastore);
        }
        debug!("metastore not found in cache");
        let postgresql_metastore_config = metastore_config.as_postgres().ok_or_else(|| {
            let message = format!(
                "expected PostgreSQL metastore config, got `{:?}`",
                metastore_config.backend()
            );
            MetastoreResolverError::InvalidConfig(message)
        })?;
        let postgresql_metastore = PostgresqlMetastore::new(postgresql_metastore_config, uri)
            .await
            .map(MetastoreServiceClient::new)
            .map_err(MetastoreResolverError::Initialization)?;
        let unique_metastore_for_uri = self
            .cache_metastore(uri.clone(), postgresql_metastore)
            .await;
        Ok(unique_metastore_for_uri)
    }
}


================================================
FILE: quickwit/quickwit-metastore/src/metastore/postgres/metastore.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::HashMap;
use std::fmt::{self, Write};
use std::str::FromStr;
use std::time::Duration;

use async_trait::async_trait;
use futures::StreamExt;
use itertools::Itertools;
use quickwit_common::pretty::PrettySample;
use quickwit_common::uri::Uri;
use quickwit_common::{ServiceStream, get_bool_from_env, rate_limited_error};
use quickwit_config::{
    IndexTemplate, IndexTemplateId, PostgresMetastoreConfig, validate_index_id_pattern,
};
use quickwit_proto::ingest::{Shard, ShardState};
use quickwit_proto::metastore::{
    AcquireShardsRequest, AcquireShardsResponse, AddSourceRequest, CreateIndexRequest,
    CreateIndexResponse, CreateIndexTemplateRequest, DeleteIndexRequest,
    DeleteIndexTemplatesRequest, DeleteQuery, DeleteShardsRequest, DeleteShardsResponse,
    DeleteSourceRequest, DeleteSplitsRequest, DeleteTask, EmptyResponse, EntityKind,
    FindIndexTemplateMatchesRequest, FindIndexTemplateMatchesResponse, GetClusterIdentityRequest,
    GetClusterIdentityResponse, GetIndexTemplateRequest, GetIndexTemplateResponse,
    IndexMetadataFailure, IndexMetadataFailureReason, IndexMetadataRequest, IndexMetadataResponse,
    IndexStats, IndexTemplateMatch, IndexesMetadataRequest, IndexesMetadataResponse,
    LastDeleteOpstampRequest, LastDeleteOpstampResponse, ListDeleteTasksRequest,
    ListDeleteTasksResponse, ListIndexStatsRequest, ListIndexStatsResponse,
    ListIndexTemplatesRequest, ListIndexTemplatesResponse, ListIndexesMetadataRequest,
    ListIndexesMetadataResponse, ListShardsRequest, ListShardsResponse, ListShardsSubresponse,
    ListSplitsRequest, ListSplitsResponse, ListStaleSplitsRequest, MarkSplitsForDeletionRequest,
    MetastoreError, MetastoreResult, MetastoreService, MetastoreServiceStream, OpenShardSubrequest,
    OpenShardSubresponse, OpenShardsRequest, OpenShardsResponse, PruneShardsRequest,
    PublishSplitsRequest, ResetSourceCheckpointRequest, SplitStats, StageSplitsRequest,
    ToggleSourceRequest, UpdateIndexRequest, UpdateSourceRequest, UpdateSplitsDeleteOpstampRequest,
    UpdateSplitsDeleteOpstampResponse, serde_utils,
};
use quickwit_proto::types::{IndexId, IndexUid, Position, PublishToken, ShardId, SourceId};
use sea_query::{Alias, Asterisk, Expr, Func, PostgresQueryBuilder, Query, UnionType};
use sea_query_binder::SqlxBinder;
use sqlx::{Acquire, Executor, Postgres, Transaction};
use time::OffsetDateTime;
use tracing::{debug, info, instrument, warn};
use uuid::Uuid;

use super::error::convert_sqlx_err;
use super::migrator::run_migrations;
use super::model::{PgDeleteTask, PgIndex, PgIndexTemplate, PgShard, PgSplit, Splits};
use super::pool::TrackedPool;
use super::split_stream::SplitStream;
use super::utils::{append_query_filters_and_order_by, establish_connection};
use super::{
    QW_POSTGRES_READ_ONLY_ENV_KEY, QW_POSTGRES_SKIP_MIGRATION_LOCKING_ENV_KEY,
    QW_POSTGRES_SKIP_MIGRATIONS_ENV_KEY,
};
use crate::checkpoint::{
    IndexCheckpointDelta, PartitionId, SourceCheckpoint, SourceCheckpointDelta,
};
use crate::file_backed::MutationOccurred;
use crate::metastore::postgres::model::Shards;
use crate::metastore::postgres::utils::split_maturity_timestamp;
use crate::metastore::{
    IndexesMetadataResponseExt, PublishSplitsRequestExt, STREAM_SPLITS_CHUNK_SIZE,
    UpdateSourceRequestExt, use_shard_api,
};
use crate::{
    AddSourceRequestExt, CreateIndexRequestExt, IndexMetadata, IndexMetadataResponseExt,
    ListIndexesMetadataResponseExt, ListSplitsRequestExt, ListSplitsResponseExt,
    MetastoreServiceExt, Split, SplitState, StageSplitsRequestExt, UpdateIndexRequestExt,
};

/// PostgreSQL metastore implementation.
#[derive(Clone)]
pub struct PostgresqlMetastore {
    uri: Uri,
    connection_pool: TrackedPool<Postgres>,
}

impl fmt::Debug for PostgresqlMetastore {
    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
        f.debug_struct("PostgresqlMetastore")
            .field("uri", &self.uri)
            .finish()
    }
}

impl PostgresqlMetastore {
    /// Creates a metastore given a database URI.
    pub async fn new(
        postgres_metastore_config: &PostgresMetastoreConfig,
        connection_uri: &Uri,
    ) -> MetastoreResult<Self> {
        let min_connections = postgres_metastore_config.min_connections;
        let max_connections = postgres_metastore_config.max_connections.get();
        let acquire_timeout = postgres_metastore_config
            .acquire_connection_timeout()
            .expect("PostgreSQL metastore config should have been validated");
        let idle_timeout_opt = postgres_metastore_config
            .idle_connection_timeout_opt()
            .expect("PostgreSQL metastore config should have been validated");
        let max_lifetime_opt = postgres_metastore_config
            .max_connection_lifetime_opt()
            .expect("PostgreSQL metastore config should have been validated");

        let read_only = get_bool_from_env(QW_POSTGRES_READ_ONLY_ENV_KEY, false);
        let skip_migrations = get_bool_from_env(QW_POSTGRES_SKIP_MIGRATIONS_ENV_KEY, false);
        let skip_locking = get_bool_from_env(QW_POSTGRES_SKIP_MIGRATION_LOCKING_ENV_KEY, false);

        let connection_pool = establish_connection(
            connection_uri,
            min_connections,
            max_connections,
            acquire_timeout,
            idle_timeout_opt,
            max_lifetime_opt,
            read_only,
        )
        .await?;

        run_migrations(&connection_pool, skip_migrations, skip_locking).await?;

        let metastore = PostgresqlMetastore {
            uri: connection_uri.clone(),
            connection_pool,
        };
        Ok(metastore)
    }
}

/// Returns an Index object given an index_id or None if it does not exist.
async fn index_opt<'a, E>(
    executor: E,
    index_id: &str,
    lock: bool,
) -> MetastoreResult<Option<PgIndex>>
where
    E: sqlx::Executor<'a, Database = Postgres>,
{
    let index_opt: Option<PgIndex> = sqlx::query_as::<_, PgIndex>(&format!(
        r#"
        SELECT *
        FROM indexes
        WHERE index_id = $1
        {}
        "#,
        if lock { "FOR UPDATE" } else { "" }
    ))
    .bind(index_id)
    .fetch_optional(executor)
    .await?;
    Ok(index_opt)
}

/// Returns an Index object given an index_uid or None if it does not exist.
async fn index_opt_for_uid<'a, E>(
    executor: E,
    index_uid: IndexUid,
    lock: bool,
) -> MetastoreResult<Option<PgIndex>>
where
    E: sqlx::Executor<'a, Database = Postgres>,
{
    let index_opt: Option<PgIndex> = sqlx::query_as::<_, PgIndex>(&format!(
        r#"
        SELECT *
        FROM indexes
        WHERE index_uid = $1
        {}
        "#,
        if lock { "FOR UPDATE" } else { "" }
    ))
    .bind(&index_uid)
    .fetch_optional(executor)
    .await?;
    Ok(index_opt)
}

async fn index_metadata(
    tx: &mut Transaction<'_, Postgres>,
    index_id: &str,
    lock: bool,
) -> MetastoreResult<IndexMetadata> {
    index_opt(tx.as_mut(), index_id, lock)
        .await?
        .ok_or_else(|| {
            MetastoreError::NotFound(EntityKind::Index {
                index_id: index_id.to_string(),
            })
        })?
        .index_metadata()
}

async fn try_apply_delta_v2(
    tx: &mut Transaction<'_, Postgres>,
    index_uid: &IndexUid,
    source_id: &SourceId,
    checkpoint_delta: SourceCheckpointDelta,
    publish_token: PublishToken,
) -> MetastoreResult<()> {
    let num_partitions = checkpoint_delta.num_partitions();
    let shard_ids: Vec<String> = checkpoint_delta
        .partitions()
        .map(|partition_id| partition_id.to_string())
        .collect();

    let shards: Vec<(String, String, Option<PublishToken>)> = sqlx::query_as(
        r#"
        SELECT
            shard_id, publish_position_inclusive, publish_token
        FROM
            shards
        WHERE
            index_uid = $1
            AND source_id = $2
            AND shard_id = ANY($3)
        FOR UPDATE
        "#,
    )
    .bind(index_uid)
    .bind(source_id)
    .bind(shard_ids)
    .fetch_all(tx.as_mut())
    .await?;

    if shards.len() != num_partitions {
        let queue_id = format!("{index_uid}/{source_id}"); // FIXME
        let entity_kind = EntityKind::Shard { queue_id };
        return Err(MetastoreError::NotFound(entity_kind));
    }
    let mut current_checkpoint = SourceCheckpoint::default();

    for (shard_id, current_position, current_publish_token_opt) in shards {
        if current_publish_token_opt.is_none()
            || current_publish_token_opt.unwrap() != publish_token
        {
            let message = "failed to apply checkpoint delta: invalid publish token".to_string();
            return Err(MetastoreError::InvalidArgument { message });
        }
        let partition_id = PartitionId::from(shard_id);
        let current_position = Position::from(current_position);
        current_checkpoint.add_partition(partition_id, current_position);
    }
    current_checkpoint
        .try_apply_delta(checkpoint_delta)
        .map_err(|error| MetastoreError::InvalidArgument {
            message: error.to_string(),
        })?;

    let mut shard_ids = Vec::with_capacity(num_partitions);
    let mut new_positions = Vec::with_capacity(num_partitions);

    for (partition_id, new_position) in current_checkpoint.iter() {
        let shard_id = partition_id.to_string();
        shard_ids.push(shard_id.to_string());
        new_positions.push(new_position.to_string());
    }

    sqlx::query(
        r#"
            UPDATE
                shards
            SET
                publish_position_inclusive = new_positions.position,
                shard_state = CASE WHEN new_positions.position LIKE '~%' THEN 'closed' ELSE shards.shard_state END,
                update_timestamp = $5
            FROM
                UNNEST($3, $4)
                AS new_positions(shard_id, position)
            WHERE
                index_uid = $1
                AND source_id = $2
                AND shards.shard_id = new_positions.shard_id
            "#,
    )
    .bind(index_uid)
    .bind(source_id)
    .bind(shard_ids)
    .bind(new_positions)
    // Use a timestamp generated by the metastore node to avoid clock drift issues
    .bind(OffsetDateTime::now_utc())
    .execute(tx.as_mut())
    .await?;
    Ok(())
}

/// This macro is used to systematically wrap the metastore
/// into transaction, commit them on Result::Ok and rollback on Error.
///
/// Note this is suboptimal.
/// Some of the methods actually did not require a transaction.
///
/// We still use this macro for them in order to make the code
/// "trivially correct".
macro_rules! run_with_tx {
    ($connection_pool:expr, $tx_refmut:ident, $label:literal, $x:block) => {{
        let mut tx: Transaction<'_, Postgres> = $connection_pool.begin().await?;
        let $tx_refmut = &mut tx;
        let op_fut = move || async move { $x };
        let op_result: MetastoreResult<_> = op_fut().await;
        match &op_result {
            Ok(_) => {
                debug!("committing transaction");
                tx.commit().await?;
            }
            Err(error) => {
                rate_limited_error!(limit_per_min = 60, error=%error, "failed to {}, rolling transaction back" , $label);
                tx.rollback().await?;
            }
        }
        op_result
    }};
}

async fn mutate_index_metadata<E, M>(
    tx: &mut Transaction<'_, Postgres>,
    index_uid: IndexUid,
    mutate_fn: M,
) -> MetastoreResult<IndexMetadata>
where
    MetastoreError: From<E>,
    M: FnOnce(&mut IndexMetadata) -> Result<MutationOccurred<()>, E>,
{
    let index_id = &index_uid.index_id;
    let mut index_metadata = index_metadata(tx, index_id, true).await?;

    if index_metadata.index_uid != index_uid {
        return Err(MetastoreError::NotFound(EntityKind::Index {
            index_id: index_id.to_string(),
        }));
    }
    if let MutationOccurred::No(()) = mutate_fn(&mut index_metadata)? {
        return Ok(index_metadata);
    }
    let index_metadata_json = serde_utils::to_json_str(&index_metadata)?;

    let update_index_res = sqlx::query(
        r#"
        UPDATE indexes
        SET index_metadata_json = $1
        WHERE index_uid = $2
        "#,
    )
    .bind(index_metadata_json)
    .bind(&index_uid)
    .execute(tx.as_mut())
    .await?;
    if update_index_res.rows_affected() == 0 {
        return Err(MetastoreError::NotFound(EntityKind::Index {
            index_id: index_id.to_string(),
        }));
    }
    Ok(index_metadata)
}

#[async_trait]
impl MetastoreService for PostgresqlMetastore {
    async fn check_connectivity(&self) -> anyhow::Result<()> {
        self.connection_pool.acquire().await?;
        Ok(())
    }

    fn endpoints(&self) -> Vec<quickwit_common::uri::Uri> {
        vec![self.uri.clone()]
    }

    // Index API:
    // - `create_index`
    // - `update_index`
    // - `index_metadata`
    // - `indexes_metadata`
    // - `list_indexes_metadata`

    #[instrument(skip(self))]
    async fn create_index(
        &self,
        request: CreateIndexRequest,
    ) -> MetastoreResult<CreateIndexResponse> {
        let index_config = request.deserialize_index_config()?;
        let mut index_metadata = IndexMetadata::new(index_config);

        let source_configs = request.deserialize_source_configs()?;

        for source_config in source_configs {
            index_metadata.add_source(source_config)?;
        }
        let index_metadata_json = serde_utils::to_json_str(&index_metadata)?;

        sqlx::query(
            "INSERT INTO indexes (index_uid, index_id, index_metadata_json) VALUES ($1, $2, $3)",
        )
        .bind(index_metadata.index_uid.to_string())
        .bind(&index_metadata.index_uid.index_id)
        .bind(&index_metadata_json)
        .execute(&self.connection_pool)
        .await
        .map_err(|sqlx_error| convert_sqlx_err(index_metadata.index_id(), sqlx_error))?;

        let response = CreateIndexResponse {
            index_uid: index_metadata.index_uid.into(),
            index_metadata_json,
        };
        Ok(response)
    }

    async fn update_index(
        &self,
        request: UpdateIndexRequest,
    ) -> MetastoreResult<IndexMetadataResponse> {
        let doc_mapping = request.deserialize_doc_mapping()?;
        let indexing_settings = request.deserialize_indexing_settings()?;
        let ingest_settings = request.deserialize_ingest_settings()?;
        let search_settings = request.deserialize_search_settings()?;
        let retention_policy_opt = request.deserialize_retention_policy()?;

        let index_uid: IndexUid = request.index_uid().clone();
        let updated_index_metadata = run_with_tx!(self.connection_pool, tx, "update index", {
            mutate_index_metadata::<MetastoreError, _>(tx, index_uid, |index_metadata| {
                let mutation_occurred = index_metadata.update_index_config(
                    doc_mapping,
                    indexing_settings,
                    ingest_settings,
                    search_settings,
                    retention_policy_opt,
                )?;
                Ok(MutationOccurred::from(mutation_occurred))
            })
            .await
        })?;
        IndexMetadataResponse::try_from_index_metadata(&updated_index_metadata)
    }

    #[instrument(skip(self))]
    async fn index_metadata(
        &self,
        request: IndexMetadataRequest,
    ) -> MetastoreResult<IndexMetadataResponse> {
        let pg_index_opt = if let Some(index_uid) = &request.index_uid {
            index_opt_for_uid(&self.connection_pool, index_uid.clone(), false).await?
        } else if let Some(index_id) = &request.index_id {
            index_opt(&self.connection_pool, index_id, false).await?
        } else {
            let message = "invalid request: neither `index_id` nor `index_uid` is set".to_string();
            return Err(MetastoreError::Internal {
                message,
                cause: "".to_string(),
            });
        };
        let index_metadata = pg_index_opt
            .ok_or(MetastoreError::NotFound(EntityKind::Index {
                index_id: request
                    .into_index_id()
                    .expect("`index_id` or `index_uid` should be set"),
            }))?
            .index_metadata()?;
        let response = IndexMetadataResponse::try_from_index_metadata(&index_metadata)?;
        Ok(response)
    }

    #[instrument(skip(self))]
    async fn indexes_metadata(
        &self,
        request: IndexesMetadataRequest,
    ) -> MetastoreResult<IndexesMetadataResponse> {
        const INDEXES_METADATA_QUERY: &str = include_str!("queries/indexes_metadata.sql");

        let num_subrequests = request.subrequests.len();

        if num_subrequests == 0 {
            return Ok(Default::default());
        }
        let mut index_ids: Vec<IndexId> = Vec::new();
        let mut index_uids: Vec<IndexUid> = Vec::with_capacity(num_subrequests);
        let mut failures: Vec<IndexMetadataFailure> = Vec::new();

        for subrequest in request.subrequests {
            if let Some(index_id) = subrequest.index_id {
                index_ids.push(index_id);
            } else if let Some(index_uid) = subrequest.index_uid {
                index_uids.push(index_uid);
            } else {
                let failure = IndexMetadataFailure {
                    index_id: subrequest.index_id,
                    index_uid: subrequest.index_uid,
                    reason: IndexMetadataFailureReason::Internal as i32,
                };
                failures.push(failure);
            }
        }
        let pg_indexes: Vec<PgIndex> = sqlx::query_as::<_, PgIndex>(INDEXES_METADATA_QUERY)
            .bind(&index_ids)
            .bind(&index_uids)
            .fetch_all(&self.connection_pool)
            .await?;

        let indexes_metadata: Vec<IndexMetadata> = pg_indexes
            .iter()
            .map(|pg_index| pg_index.index_metadata())
            .collect::<MetastoreResult<_>>()?;

        if pg_indexes.len() + failures.len() < num_subrequests {
            for index_id in index_ids {
                if pg_indexes
                    .iter()
                    .all(|pg_index| pg_index.index_id != index_id)
                {
                    let failure = IndexMetadataFailure {
                        index_id: Some(index_id),
                        index_uid: None,
                        reason: IndexMetadataFailureReason::NotFound as i32,
                    };
                    failures.push(failure);
                }
            }
            for index_uid in index_uids {
                if pg_indexes
                    .iter()
                    .all(|pg_index| pg_index.index_uid != index_uid)
                {
                    let failure = IndexMetadataFailure {
                        index_id: None,
                        index_uid: Some(index_uid),
                        reason: IndexMetadataFailureReason::NotFound as i32,
                    };
                    failures.push(failure);
                }
            }
        }
        let response =
            IndexesMetadataResponse::try_from_indexes_metadata(indexes_metadata, failures).await?;
        Ok(response)
    }

    #[instrument(skip(self))]
    async fn list_indexes_metadata(
        &self,
        request: ListIndexesMetadataRequest,
    ) -> MetastoreResult<ListIndexesMetadataResponse> {
        let sql =
            build_index_id_patterns_sql_query(&request.index_id_patterns).map_err(|error| {
                MetastoreError::Internal {
                    message: "failed to build `list_indexes_metadata` SQL query".to_string(),
                    cause: error.to_string(),
                }
            })?;
        let pg_indexes = sqlx::query_as::<_, PgIndex>(&sql)
            .fetch_all(&self.connection_pool)
            .await?;
        let indexes_metadata: Vec<IndexMetadata> = pg_indexes
            .into_iter()
            .map(|pg_index| pg_index.index_metadata())
            .collect::<MetastoreResult<_>>()?;
        let response =
            ListIndexesMetadataResponse::try_from_indexes_metadata(indexes_metadata).await?;
        Ok(response)
    }

    #[instrument(skip_all, fields(index_id=%request.index_uid()))]
    async fn delete_index(&self, request: DeleteIndexRequest) -> MetastoreResult<EmptyResponse> {
        let index_uid: IndexUid = request.index_uid().clone();
        let delete_result = sqlx::query("DELETE FROM indexes WHERE index_uid = $1")
            .bind(&index_uid)
            .execute(&self.connection_pool)
            .await?;
        // FIXME: This is not idempotent.
        if delete_result.rows_affected() == 0 {
            return Err(MetastoreError::NotFound(EntityKind::Index {
                index_id: index_uid.index_id,
            }));
        }
        info!(index_id = index_uid.index_id, "deleted index successfully");
        Ok(EmptyResponse {})
    }

    #[instrument(skip_all, fields(split_ids))]
    async fn stage_splits(&self, request: StageSplitsRequest) -> MetastoreResult<EmptyResponse> {
        let index_uid: IndexUid = request.index_uid().clone();
        let splits_metadata = request.deserialize_splits_metadata()?;

        if splits_metadata.is_empty() {
            return Ok(Default::default());
        }
        let mut split_ids = Vec::with_capacity(splits_metadata.len());
        let mut time_range_start_list = Vec::with_capacity(splits_metadata.len());
        let mut time_range_end_list = Vec::with_capacity(splits_metadata.len());
        let mut tags_list = Vec::with_capacity(splits_metadata.len());
        let mut splits_metadata_json = Vec::with_capacity(splits_metadata.len());
        let mut delete_opstamps = Vec::with_capacity(splits_metadata.len());
        let mut maturity_timestamps = Vec::with_capacity(splits_metadata.len());
        let mut node_ids = Vec::with_capacity(splits_metadata.len());

        for split_metadata in splits_metadata {
            let split_metadata_json = serde_utils::to_json_str(&split_metadata)?;
            splits_metadata_json.push(split_metadata_json);

            let time_range_start = split_metadata
                .time_range
                .as_ref()
                .map(|range| *range.start());
            time_range_start_list.push(time_range_start);
            maturity_timestamps.push(split_maturity_timestamp(&split_metadata));

            let time_range_end = split_metadata.time_range.map(|range| *range.end());
            time_range_end_list.push(time_range_end);

            let tags: Vec<String> = split_metadata.tags.into_iter().collect();
            tags_list.push(sqlx::types::Json(tags));
            split_ids.push(split_metadata.split_id);
            delete_opstamps.push(split_metadata.delete_opstamp as i64);
            node_ids.push(split_metadata.node_id);
        }
        tracing::Span::current().record("split_ids", format!("{split_ids:?}"));

        // TODO: Remove transaction.
        run_with_tx!(self.connection_pool, tx, "stage splits", {
            let upserted_split_ids: Vec<String> = sqlx::query_scalar(r#"
                INSERT INTO splits
                    (split_id, time_range_start, time_range_end, tags, split_metadata_json, delete_opstamp, maturity_timestamp, split_state, index_uid, node_id)
                SELECT
                    split_id,
                    time_range_start,
                    time_range_end,
                    ARRAY(SELECT json_array_elements_text(tags_json::json)) as tags,
                    split_metadata_json,
                    delete_opstamp,
                    to_timestamp(maturity_timestamp),
                    $9 as split_state,
                    $10 as index_uid,
                    node_id
                FROM
                    UNNEST($1, $2, $3, $4, $5, $6, $7, $8)
                    AS staged_splits (split_id, time_range_start, time_range_end, tags_json, split_metadata_json, delete_opstamp, maturity_timestamp, node_id)
                ON CONFLICT(index_uid, split_id) DO UPDATE
                    SET
                        time_range_start = excluded.time_range_start,
                        time_range_end = excluded.time_range_end,
                        tags = excluded.tags,
                        split_metadata_json = excluded.split_metadata_json,
                        delete_opstamp = excluded.delete_opstamp,
                        maturity_timestamp = excluded.maturity_timestamp,
                        node_id = excluded.node_id,
                        update_timestamp = CURRENT_TIMESTAMP,
                        create_timestamp = CURRENT_TIMESTAMP
                    WHERE splits.split_id = excluded.split_id AND splits.split_state = 'Staged'
                RETURNING split_id;
                "#)
                .bind(&split_ids)
                .bind(time_range_start_list)
                .bind(time_range_end_list)
                .bind(tags_list)
                .bind(splits_metadata_json)
                .bind(delete_opstamps)
                .bind(maturity_timestamps)
                .bind(&node_ids)
                .bind(SplitState::Staged.as_str())
                .bind(&index_uid)
                .fetch_all(tx.as_mut())
                .await
                .map_err(|sqlx_error| convert_sqlx_err(&index_uid.index_id, sqlx_error))?;

            if upserted_split_ids.len() != split_ids.len() {
                let failed_split_ids: Vec<String> = split_ids
                    .into_iter()
                    .filter(|split_id| !upserted_split_ids.contains(split_id))
                    .collect();
                let entity = EntityKind::Splits {
                    split_ids: failed_split_ids,
                };
                let message = "splits are not staged".to_string();
                return Err(MetastoreError::FailedPrecondition { entity, message });
            }
            info!(
                %index_uid,
                "staged `{}` splits successfully", split_ids.len()
            );
            Ok(EmptyResponse {})
        })
    }

    #[instrument(skip(self))]
    async fn publish_splits(
        &self,
        request: PublishSplitsRequest,
    ) -> MetastoreResult<EmptyResponse> {
        let checkpoint_delta_opt: Option<IndexCheckpointDelta> =
            request.deserialize_index_checkpoint()?;
        let index_uid: IndexUid = request.index_uid().clone();
        let staged_split_ids = request.staged_split_ids;
        let replaced_split_ids = request.replaced_split_ids;

        run_with_tx!(self.connection_pool, tx, "publish splits", {
            let mut index_metadata = index_metadata(tx, &index_uid.index_id, true).await?;
            if index_metadata.index_uid != index_uid {
                return Err(MetastoreError::NotFound(EntityKind::Index {
                    index_id: index_uid.index_id,
                }));
            }
            if let Some(checkpoint_delta) = checkpoint_delta_opt {
                let source_id = checkpoint_delta.source_id.clone();
                let source = index_metadata.sources.get(&source_id).ok_or_else(|| {
                    MetastoreError::NotFound(EntityKind::Source {
                        index_id: index_uid.index_id.to_string(),
                        source_id: source_id.to_string(),
                    })
                })?;

                if use_shard_api(&source.source_params) {
                    let publish_token = request.publish_token_opt.ok_or_else(|| {
                        let message = format!(
                            "publish token is required for publishing splits for source \
                             `{source_id}`"
                        );
                        MetastoreError::InvalidArgument { message }
                    })?;
                    try_apply_delta_v2(
                        tx,
                        &index_uid,
                        &source_id,
                        checkpoint_delta.source_delta,
                        publish_token,
                    )
                    .await?;
                } else {
                    index_metadata
                        .checkpoint
                        .try_apply_delta(checkpoint_delta)
                        .map_err(|error| {
                            let entity = EntityKind::CheckpointDelta {
                                index_id: index_uid.index_id.to_string(),
                                source_id,
                            };
                            let message = error.to_string();
                            MetastoreError::FailedPrecondition { entity, message }
                        })?;
                }
            }
            let index_metadata_json = serde_utils::to_json_str(&index_metadata)?;

            const PUBLISH_SPLITS_QUERY: &str = r#"
            -- Select the splits to update, regardless of their state.
            -- The left join make it possible to identify the splits that do not exist.
            WITH input_splits AS (
                SELECT input_splits.split_id, input_splits.expected_split_state, splits.actual_split_state
                FROM (
                    SELECT split_id, 'Staged' AS expected_split_state
                    FROM UNNEST($3) AS staged_splits(split_id)
                    UNION
                    SELECT split_id, 'Published' AS expected_split_state
                    FROM UNNEST($4) AS published_splits(split_id)
                ) input_splits
                LEFT JOIN (
                    SELECT split_id, split_state AS actual_split_state
                    FROM splits
                    WHERE
                        index_uid = $1
                        AND (split_id = ANY($3) OR split_id = ANY($4))
                    FOR UPDATE
                    ) AS splits
                USING (split_id)
            ),
            -- Update the index metadata with the new checkpoint.
            updated_index_metadata AS (
                UPDATE indexes
                SET
                    index_metadata_json = $2
                WHERE
                    index_uid = $1
                    AND NOT EXISTS (
                        SELECT 1
                        FROM input_splits
                        WHERE
                            actual_split_state != expected_split_state
                        )
            ),
            -- Publish the staged splits and mark the published splits for deletion.
            updated_splits AS (
                UPDATE splits
                SET
                    split_state = CASE split_state
                        WHEN 'Staged' THEN 'Published'
                        ELSE 'MarkedForDeletion'
                    END,
                    update_timestamp = (CURRENT_TIMESTAMP AT TIME ZONE 'UTC'),
                    publish_timestamp = (CURRENT_TIMESTAMP AT TIME ZONE 'UTC')
                FROM input_splits
                WHERE
                    splits.index_uid = $1
                    AND splits.split_id = input_splits.split_id
                    AND NOT EXISTS (
                        SELECT 1
                        FROM input_splits
                        WHERE
                            actual_split_state != expected_split_state
                    )
            )
            -- Report the outcome of the update query.
            SELECT
                COUNT(1) FILTER (WHERE actual_split_state = 'Staged' AND expected_split_state = 'Staged'),
                COUNT(1) FILTER (WHERE actual_split_state = 'Published' AND expected_split_state = 'Published'),
                COALESCE(ARRAY_AGG(split_id) FILTER (WHERE actual_split_state IS NULL), ARRAY[]::TEXT[]),
                COALESCE(ARRAY_AGG(split_id) FILTER (WHERE actual_split_state != 'Staged' AND expected_split_state = 'Staged'), ARRAY[]::TEXT[]),
                COALESCE(ARRAY_AGG(split_id) FILTER (WHERE actual_split_state != 'Published' AND expected_split_state = 'Published'), ARRAY[]::TEXT[])
                FROM input_splits
        "#;
            let (
                num_published_splits,
                num_marked_splits,
                not_found_split_ids,
                not_staged_split_ids,
                not_marked_split_ids,
            ): (i64, i64, Vec<String>, Vec<String>, Vec<String>) =
                sqlx::query_as(PUBLISH_SPLITS_QUERY)
                    .bind(&index_uid)
                    .bind(index_metadata_json)
                    .bind(staged_split_ids)
                    .bind(replaced_split_ids)
                    .fetch_one(tx.as_mut())
                    .await
                    .map_err(|sqlx_error| convert_sqlx_err(&index_uid.index_id, sqlx_error))?;

            if !not_found_split_ids.is_empty() {
                return Err(MetastoreError::NotFound(EntityKind::Splits {
                    split_ids: not_found_split_ids,
                }));
            }
            if !not_staged_split_ids.is_empty() {
                let entity = EntityKind::Splits {
                    split_ids: not_staged_split_ids,
                };
                let message = "splits are not staged".to_string();
                return Err(MetastoreError::FailedPrecondition { entity, message });
            }
            if !not_marked_split_ids.is_empty() {
                let entity = EntityKind::Splits {
                    split_ids: not_marked_split_ids,
                };
                let message = "splits are not marked for deletion".to_string();
                return Err(MetastoreError::FailedPrecondition { entity, message });
            }
            info!(
                %index_uid,
                "published {num_published_splits} splits and marked {num_marked_splits} for deletion successfully"
            );
            Ok(EmptyResponse {})
        })
    }

    #[instrument(skip(self))]
    async fn list_splits(
        &self,
        request: ListSplitsRequest,
    ) -> MetastoreResult<MetastoreServiceStream<ListSplitsResponse>> {
        let list_splits_query = request.deserialize_list_splits_query()?;
        let mut sql_query_builder = Query::select();
        sql_query_builder.column(Asterisk).from(Splits::Table);
        append_query_filters_and_order_by(&mut sql_query_builder, &list_splits_query);

        let (sql_query, values) = sql_query_builder.build_sqlx(PostgresQueryBuilder);
        let pg_split_stream = SplitStream::new(
            self.connection_pool.clone(),
            sql_query,
            |connection_pool: &TrackedPool<Postgres>, sql_query: &String| {
                sqlx::query_as_with::<_, PgSplit, _>(sql_query, values).fetch(connection_pool)
            },
        );
        let split_stream =
            pg_split_stream
                .chunks(STREAM_SPLITS_CHUNK_SIZE)
                .map(|pg_splits_results| {
                    let mut splits = Vec::with_capacity(pg_splits_results.len());
                    for pg_split_result in pg_splits_results {
                        let pg_split = match pg_split_result {
                            Ok(pg_split) => pg_split,
                            Err(error) => {
                                return Err(MetastoreError::Internal {
                                    message: "failed to fetch splits".to_string(),
                                    cause: error.to_string(),
                                });
                            }
                        };
                        let split: Split = match pg_split.try_into() {
                            Ok(split) => split,
                            Err(error) => {
                                return Err(MetastoreError::Internal {
                                    message: "failed to convert `PgSplit` to `Split`".to_string(),
                                    cause: error.to_string(),
                                });
                            }
                        };
                        splits.push(split);
                    }
                    ListSplitsResponse::try_from_splits(splits)
                });
        let service_stream = ServiceStream::new(Box::pin(split_stream));
        Ok(service_stream)
    }

    async fn list_index_stats(
        &self,
        request: ListIndexStatsRequest,
    ) -> MetastoreResult<ListIndexStatsResponse> {
        let index_pattern_sql = build_index_id_patterns_sql_query(&request.index_id_patterns)
            .map_err(|error| MetastoreError::Internal {
                message: "failed to build `list_index_stats` SQL query".to_string(),
                cause: error.to_string(),
            })?;
        let sql = format!(
            "SELECT
                i.index_uid,
                s.split_state,
                COUNT(s.split_state) AS num_splits,
                COALESCE(SUM(s.split_size_bytes)::BIGINT, 0) AS total_size_bytes
            FROM ({index_pattern_sql}) i
            LEFT JOIN splits s ON s.index_uid = i.index_uid
            GROUP BY i.index_uid, s.split_state"
        );

        let rows: Vec<(String, Option<String>, i64, i64)> = sqlx::query_as(&sql)
            .fetch_all(&self.connection_pool)
            .await?;

        let mut index_stats = HashMap::new();
        for (index_uid_str, split_state, num_splits, total_size_bytes) in rows {
            let Ok(index_uid) = IndexUid::from_str(&index_uid_str) else {
                return Err(MetastoreError::Internal {
                    message: "failed to parse index_uid".to_string(),
                    cause: index_uid_str.to_string(),
                });
            };
            let stats = index_stats
                .entry(index_uid_str)
                .or_insert_with(|| IndexStats {
                    index_uid: Some(index_uid),
                    staged: Some(SplitStats::default()),
                    published: Some(SplitStats::default()),
                    marked_for_deletion: Some(SplitStats::default()),
                });
            let num_splits = num_splits as u64;
            let total_size_bytes = total_size_bytes as u64;
            match split_state.as_deref() {
                Some("Staged") => {
                    stats.staged = Some(SplitStats {
                        num_splits,
                        total_size_bytes,
                    });
                }
                Some("Published") => {
                    stats.published = Some(SplitStats {
                        num_splits,
                        total_size_bytes,
                    });
                }
                Some("MarkedForDeletion") => {
                    stats.marked_for_deletion = Some(SplitStats {
                        num_splits,
                        total_size_bytes,
                    });
                }
                None => {} // if an index has no splits, we can keep the defaults
                Some(split_state) => {
                    return Err(MetastoreError::Internal {
                        message: "invalid split state".to_string(),
                        cause: split_state.to_string(),
                    });
                }
            }
        }

        Ok(ListIndexStatsResponse {
            index_stats: index_stats.into_values().collect(),
        })
    }

    #[instrument(skip(self))]
    async fn mark_splits_for_deletion(
        &self,
        request: MarkSplitsForDeletionRequest,
    ) -> MetastoreResult<EmptyResponse> {
        let index_uid: IndexUid = request.index_uid().clone();
        let split_ids = request.split_ids;
        const MARK_SPLITS_FOR_DELETION_QUERY: &str = r#"
            -- Select the splits to update, regardless of their state.
            -- The left join make it possible to identify the splits that do not exist.
            WITH input_splits AS (
                SELECT input_splits.split_id, splits.split_state
                FROM UNNEST($2) AS input_splits(split_id)
                LEFT JOIN (
                    SELECT split_id, split_state
                    FROM splits
                    WHERE
                        index_uid = $1
                        AND split_id = ANY($2)
                    FOR UPDATE
                    ) AS splits
                USING (split_id)
            ),
            -- Mark the staged and published splits for deletion.
            marked_splits AS (
                UPDATE splits
                SET
                    split_state = 'MarkedForDeletion',
                    update_timestamp = (CURRENT_TIMESTAMP AT TIME ZONE 'UTC')
                FROM input_splits
                WHERE
                    splits.index_uid = $1
                    AND splits.split_id = input_splits.split_id
                    AND splits.split_state IN ('Staged', 'Published')
            )
            -- Report the outcome of the update query.
            SELECT
                COUNT(split_state),
                COUNT(1) FILTER (WHERE split_state IN ('Staged', 'Published')),
                COALESCE(ARRAY_AGG(split_id) FILTER (WHERE split_state IS NULL), ARRAY[]::TEXT[])
                FROM input_splits
        "#;
        let (num_found_splits, num_marked_splits, not_found_split_ids): (i64, i64, Vec<String>) =
            sqlx::query_as(MARK_SPLITS_FOR_DELETION_QUERY)
                .bind(&index_uid)
                .bind(split_ids.clone())
                .fetch_one(&self.connection_pool)
                .await
                .map_err(|sqlx_error| convert_sqlx_err(&index_uid.index_id, sqlx_error))?;

        if num_found_splits == 0
            && index_opt(&self.connection_pool, &index_uid.index_id, false)
                .await?
                .is_none()
        {
            return Err(MetastoreError::NotFound(EntityKind::Index {
                index_id: index_uid.index_id,
            }));
        }
        info!(
            %index_uid,
            "Marked {} splits for deletion, among which {} were newly marked.",
            split_ids.len() - not_found_split_ids.len(),
            num_marked_splits
        );
        if !not_found_split_ids.is_empty() {
            warn!(
                %index_uid,
                split_ids=?PrettySample::new(&not_found_split_ids, 5),
                "{} splits were not found and could not be marked for deletion.",
                not_found_split_ids.len()
            );
        }
        Ok(EmptyResponse {})
    }

    #[instrument(skip(self))]
    async fn delete_splits(&self, request: DeleteSplitsRequest) -> MetastoreResult<EmptyResponse> {
        let index_uid: IndexUid = request.index_uid().clone();
        let split_ids = request.split_ids;
        const DELETE_SPLITS_QUERY: &str = r#"
            -- Select the splits to delete, regardless of their state.
            -- The left join make it possible to identify the splits that do not exist.
            WITH input_splits AS (
                SELECT input_splits.split_id, splits.split_state
                FROM UNNEST($2) AS input_splits(split_id)
                LEFT JOIN (
                    SELECT split_id, split_state
                    FROM splits
                    WHERE
                        index_uid = $1
                        AND split_id = ANY($2)
                    FOR UPDATE
                    ) AS splits
                USING (split_id)
            ),
            -- Delete the splits if and only if all the splits are marked for deletion.
            deleted_splits AS (
                DELETE FROM splits
                USING input_splits
                WHERE
                    splits.index_uid = $1
                    AND splits.split_id = input_splits.split_id
                    AND NOT EXISTS (
                        SELECT 1
                        FROM input_splits
                        WHERE
                            split_state IN ('Staged', 'Published')
                    )
            )
            -- Report the outcome of the delete query.
            SELECT
                COUNT(split_state),
                COUNT(1) FILTER (WHERE split_state = 'MarkedForDeletion'),
                COALESCE(ARRAY_AGG(split_id) FILTER (WHERE split_state IN ('Staged', 'Published')), ARRAY[]::TEXT[]),
                COALESCE(ARRAY_AGG(split_id) FILTER (WHERE split_state IS NULL), ARRAY[]::TEXT[])
                FROM input_splits
        "#;
        let (num_found_splits, num_deleted_splits, not_deletable_split_ids, not_found_split_ids): (
            i64,
            i64,
            Vec<String>,
            Vec<String>,
        ) = sqlx::query_as(DELETE_SPLITS_QUERY)
            .bind(&index_uid)
            .bind(split_ids)
            .fetch_one(&self.connection_pool)
            .await
            .map_err(|sqlx_error| convert_sqlx_err(&index_uid.index_id, sqlx_error))?;

        if num_found_splits == 0
            && index_opt_for_uid(&self.connection_pool, index_uid.clone(), false)
                .await?
                .is_none()
        {
            return Err(MetastoreError::NotFound(EntityKind::Index {
                index_id: index_uid.index_id,
            }));
        }
        if !not_deletable_split_ids.is_empty() {
            let message = format!(
                "splits `{}` are not deletable",
                not_deletable_split_ids.join(", ")
            );
            let entity = EntityKind::Splits {
                split_ids: not_deletable_split_ids,
            };
            return Err(MetastoreError::FailedPrecondition { entity, message });
        }
        info!(%index_uid, "deleted {} splits from index", num_deleted_splits);

        if !not_found_split_ids.is_empty() {
            warn!(
                %index_uid,
                split_ids=?PrettySample::new(&not_found_split_ids, 5),
                "{} splits were not found and could not be deleted.",
                not_found_split_ids.len()
            );
        }
        Ok(EmptyResponse {})
    }

    #[instrument(skip(self))]
    async fn add_source(&self, request: AddSourceRequest) -> MetastoreResult<EmptyResponse> {
        let source_config = request.deserialize_source_config()?;
        let index_uid: IndexUid = request.index_uid().clone();
        run_with_tx!(self.connection_pool, tx, "add source", {
            mutate_index_metadata::<MetastoreError, _>(tx, index_uid, |index_metadata| {
                index_metadata.add_source(source_config)?;
                Ok(MutationOccurred::Yes(()))
            })
            .await?;
            Ok(())
        })?;
        Ok(EmptyResponse {})
    }

    #[instrument(skip(self))]
    async fn update_source(&self, request: UpdateSourceRequest) -> MetastoreResult<EmptyResponse> {
        let source_config = request.deserialize_source_config()?;
        let index_uid: IndexUid = request.index_uid().clone();
        run_with_tx!(self.connection_pool, tx, "update source", {
            mutate_index_metadata::<MetastoreError, _>(tx, index_uid, |index_metadata| {
                let mutation_occurred = index_metadata.update_source(source_config)?;
                Ok(MutationOccurred::from(mutation_occurred))
            })
            .await?;
            Ok(())
        })?;
        Ok(EmptyResponse {})
    }

    #[instrument(skip(self))]
    async fn toggle_source(&self, request: ToggleSourceRequest) -> MetastoreResult<EmptyResponse> {
        let index_uid: IndexUid = request.index_uid().clone();
        run_with_tx!(self.connection_pool, tx, "toggle source", {
            mutate_index_metadata(tx, index_uid, |index_metadata| {
                if index_metadata.toggle_source(&request.source_id, request.enable)? {
                    Ok::<_, MetastoreError>(MutationOccurred::Yes(()))
                } else {
                    Ok::<_, MetastoreError>(MutationOccurred::No(()))
                }
            })
            .await?;
            Ok(())
        })?;
        Ok(EmptyResponse {})
    }

    #[instrument(skip(self))]
    async fn delete_source(&self, request: DeleteSourceRequest) -> MetastoreResult<EmptyResponse> {
        let index_uid: IndexUid = request.index_uid().clone();
        let source_id = request.source_id.clone();
        run_with_tx!(self.connection_pool, tx, "delete source", {
            mutate_index_metadata(tx, index_uid.clone(), |index_metadata| {
                index_metadata.delete_source(&source_id)?;
                Ok::<_, MetastoreError>(MutationOccurred::Yes(()))
            })
            .await?;
            sqlx::query(
                r#"
                    DELETE FROM shards
                    WHERE
                        index_uid = $1
                        AND source_id = $2
                "#,
            )
            .bind(&index_uid)
            .bind(source_id)
            .execute(tx.as_mut())
            .await?;
            Ok(())
        })?;
        Ok(EmptyResponse {})
    }

    #[instrument(skip(self))]
    async fn reset_source_checkpoint(
        &self,
        request: ResetSourceCheckpointRequest,
    ) -> MetastoreResult<EmptyResponse> {
        let index_uid: IndexUid = request.index_uid().clone();
        run_with_tx!(self.connection_pool, tx, "reset source checkpoint", {
            mutate_index_metadata(tx, index_uid, |index_metadata| {
                if index_metadata.checkpoint.reset_source(&request.source_id) {
                    Ok::<_, MetastoreError>(MutationOccurred::Yes(()))
                } else {
                    Ok::<_, MetastoreError>(MutationOccurred::No(()))
                }
            })
            .await?;
            Ok(())
        })?;
        Ok(EmptyResponse {})
    }

    /// Retrieves the last delete opstamp for a given `index_id`.
    #[instrument(skip(self))]
    async fn last_delete_opstamp(
        &self,
        request: LastDeleteOpstampRequest,
    ) -> MetastoreResult<LastDeleteOpstampResponse> {
        let max_opstamp: i64 = sqlx::query_scalar(
            r#"
            SELECT COALESCE(MAX(opstamp), 0)
            FROM delete_tasks
            WHERE index_uid = $1
        "#,
        )
        .bind(request.index_uid())
        .fetch_one(&self.connection_pool)
        .await
        .map_err(|error| MetastoreError::Db {
            message: error.to_string(),
        })?;

        Ok(LastDeleteOpstampResponse::new(max_opstamp as u64))
    }

    /// Creates a delete task from a delete query.
    #[instrument(skip(self))]
    async fn create_delete_task(&self, delete_query: DeleteQuery) -> MetastoreResult<DeleteTask> {
        let delete_query_json = serde_utils::to_json_str(&delete_query)?;
        let (create_timestamp, opstamp): (sqlx::types::time::PrimitiveDateTime, i64) =
            sqlx::query_as(
                r#"
                INSERT INTO delete_tasks (index_uid, delete_query_json) VALUES ($1, $2)
                RETURNING create_timestamp, opstamp
            "#,
            )
            .bind(delete_query.index_uid().to_string())
            .bind(&delete_query_json)
            .fetch_one(&self.connection_pool)
            .await
            .map_err(|error| convert_sqlx_err(&delete_query.index_uid().index_id, error))?;

        Ok(DeleteTask {
            create_timestamp: create_timestamp.assume_utc().unix_timestamp(),
            opstamp: opstamp as u64,
            delete_query: Some(delete_query),
        })
    }

    /// Update splits delete opstamps.
    #[instrument(skip(self))]
    async fn update_splits_delete_opstamp(
        &self,
        request: UpdateSplitsDeleteOpstampRequest,
    ) -> MetastoreResult<UpdateSplitsDeleteOpstampResponse> {
        let index_uid: IndexUid = request.index_uid().clone();
        let split_ids = request.split_ids;
        if split_ids.is_empty() {
            return Ok(UpdateSplitsDeleteOpstampResponse {});
        }
        let update_result = sqlx::query(
            r#"
            UPDATE splits
            SET
                delete_opstamp = $1,
                -- The values we compare with are *before* the modification:
                update_timestamp = CASE
                    WHEN delete_opstamp != $1 THEN (CURRENT_TIMESTAMP AT TIME ZONE 'UTC')
                    ELSE update_timestamp
                END
            WHERE
                index_uid = $2
                AND split_id = ANY($3)
        "#,
        )
        .bind(request.delete_opstamp as i64)
        .bind(&index_uid)
        .bind(split_ids)
        .execute(&self.connection_pool)
        .await?;

        // If no splits were updated, maybe the index does not exist in the first place?
        if update_result.rows_affected() == 0
            && index_opt_for_uid(&self.connection_pool, index_uid.clone(), false)
                .await?
                .is_none()
        {
            return Err(MetastoreError::NotFound(EntityKind::Index {
                index_id: index_uid.index_id,
            }));
        }
        Ok(UpdateSplitsDeleteOpstampResponse {})
    }

    /// Lists the delete tasks with opstamp > `opstamp_start`.
    #[instrument(skip(self))]
    async fn list_delete_tasks(
        &self,
        request: ListDeleteTasksRequest,
    ) -> MetastoreResult<ListDeleteTasksResponse> {
        let index_uid: IndexUid = request.index_uid().clone();
        let pg_delete_tasks: Vec<PgDeleteTask> = sqlx::query_as::<_, PgDeleteTask>(
            r#"
                SELECT * FROM delete_tasks
                WHERE
                    index_uid = $1
                    AND opstamp > $2
                "#,
        )
        .bind(&index_uid)
        .bind(request.opstamp_start as i64)
        .fetch_all(&self.connection_pool)
        .await?;
        let delete_tasks: Vec<DeleteTask> = pg_delete_tasks
            .into_iter()
            .map(|pg_delete_task| pg_delete_task.try_into())
            .collect::<MetastoreResult<_>>()?;
        Ok(ListDeleteTasksResponse { delete_tasks })
    }

    /// Returns `num_splits` published splits with `split.delete_opstamp` < `delete_opstamp`.
    /// Results are ordered by ascending `split.delete_opstamp` and `split.publish_timestamp`
    /// values.
    #[instrument(skip(self))]
    async fn list_stale_splits(
        &self,
        request: ListStaleSplitsRequest,
    ) -> MetastoreResult<ListSplitsResponse> {
        let index_uid: IndexUid = request.index_uid().clone();
        let stale_pg_splits: Vec<PgSplit> = sqlx::query_as::<_, PgSplit>(
            r#"
                SELECT *
                FROM splits
                WHERE
                    index_uid = $1
                    AND delete_opstamp < $2
                    AND split_state = $3
                    AND (maturity_timestamp = to_timestamp(0) OR (CURRENT_TIMESTAMP AT TIME ZONE 'UTC') >= maturity_timestamp)
                ORDER BY delete_opstamp ASC, publish_timestamp ASC
                LIMIT $4
            "#,
        )
        .bind(&index_uid)
        .bind(request.delete_opstamp as i64)
        .bind(SplitState::Published.as_str())
        .bind(request.num_splits as i64)
        .fetch_all(&self.connection_pool)
        .await?;

        let stale_splits: Vec<Split> = stale_pg_splits
            .into_iter()
            .map(|pg_split| pg_split.try_into())
            .collect::<MetastoreResult<_>>()?;
        let response = ListSplitsResponse::try_from_splits(stale_splits)?;
        Ok(response)
    }

    // TODO: Issue a single SQL query.
    async fn open_shards(&self, request: OpenShardsRequest) -> MetastoreResult<OpenShardsResponse> {
        let mut subresponses = Vec::with_capacity(request.subrequests.len());

        for subrequest in request.subrequests {
            let open_shard: Shard = open_or_fetch_shard(&self.connection_pool, &subrequest).await?;
            let subresponse = OpenShardSubresponse {
                subrequest_id: subrequest.subrequest_id,
                open_shard: Some(open_shard),
            };
            subresponses.push(subresponse);
        }
        Ok(OpenShardsResponse { subresponses })
    }

    async fn acquire_shards(
        &self,
        request: AcquireShardsRequest,
    ) -> MetastoreResult<AcquireShardsResponse> {
        const ACQUIRE_SHARDS_QUERY: &str = include_str!("queries/shards/acquire.sql");

        if request.shard_ids.is_empty() {
            return Ok(Default::default());
        }
        let pg_shards: Vec<PgShard> = sqlx::query_as(ACQUIRE_SHARDS_QUERY)
            .bind(request.index_uid())
            .bind(&request.source_id)
            .bind(&request.shard_ids)
            .bind(&request.publish_token)
            .fetch_all(&self.connection_pool)
            .await?;
        let acquired_shards = pg_shards
            .into_iter()
            .map(|pg_shard| pg_shard.into())
            .collect();
        let response = AcquireShardsResponse { acquired_shards };
        Ok(response)
    }

    async fn list_shards(&self, request: ListShardsRequest) -> MetastoreResult<ListShardsResponse> {
        if request.subrequests.is_empty() {
            return Ok(Default::default());
        }
        let mut sql_query_builder = Query::select();

        for (idx, subrequest) in request.subrequests.iter().enumerate() {
            let mut sql_subquery_builder = Query::select();

            sql_subquery_builder
                .column(Asterisk)
                .from(Shards::Table)
                .and_where(Expr::col(Shards::IndexUid).eq(subrequest.index_uid()))
                .and_where(Expr::col(Shards::SourceId).eq(&subrequest.source_id));

            let shard_state = subrequest.shard_state();

            if shard_state != ShardState::Unspecified {
                let shard_state_str = shard_state.as_json_str_name();
                let shard_state_alias = Alias::new("SHARD_STATE");
                let cast_expr = Func::cast_as(shard_state_str, shard_state_alias);
                sql_subquery_builder.and_where(Expr::col(Shards::ShardState).eq(cast_expr));
            }
            if idx == 0 {
                sql_query_builder = sql_subquery_builder;
            } else {
                sql_query_builder.union(UnionType::All, sql_subquery_builder);
            }
        }
        let (sql_query, values) = sql_query_builder.build_sqlx(PostgresQueryBuilder);

        let pg_shards: Vec<PgShard> = sqlx::query_as_with::<_, PgShard, _>(&sql_query, values)
            .fetch_all(&self.connection_pool)
            .await?;

        let mut per_source_subresponses: HashMap<(IndexUid, SourceId), ListShardsSubresponse> =
            request
                .subrequests
                .into_iter()
                .map(|subrequest| {
                    let index_uid = subrequest.index_uid().clone();
                    let source_id = subrequest.source_id.clone();
                    (
                        (index_uid, source_id),
                        ListShardsSubresponse {
                            index_uid: subrequest.index_uid,
                            source_id: subrequest.source_id,
                            shards: Vec::new(),
                        },
                    )
                })
                .collect();

        for pg_shard in pg_shards {
            let shard: Shard = pg_shard.into();
            let source_key = (shard.index_uid().clone(), shard.source_id.clone());

            let Some(subresponse) = per_source_subresponses.get_mut(&source_key) else {
                warn!(
                    index_uid=%shard.index_uid(),
                    source_id=%shard.source_id,
                    "could not find source in subresponses: this should never happen, please report"
                );
                continue;
            };
            subresponse.shards.push(shard);
        }
        let subresponses = per_source_subresponses.into_values().collect();
        let response = ListShardsResponse { subresponses };
        Ok(response)
    }

    async fn delete_shards(
        &self,
        request: DeleteShardsRequest,
    ) -> MetastoreResult<DeleteShardsResponse> {
        const DELETE_SHARDS_QUERY: &str = include_str!("queries/shards/delete.sql");

        const FIND_NOT_DELETABLE_SHARDS_QUERY: &str =
            include_str!("queries/shards/find_not_deletable.sql");

        if request.shard_ids.is_empty() {
            return Ok(Default::default());
        }
        let query_result = sqlx::query(DELETE_SHARDS_QUERY)
            .bind(request.index_uid())
            .bind(&request.source_id)
            .bind(&request.shard_ids)
            .bind(request.force)
            .execute(&self.connection_pool)
            .await?;

        // Happy path: all shards were deleted.
        if request.force || query_result.rows_affected() == request.shard_ids.len() as u64 {
            let response = DeleteShardsResponse {
                index_uid: request.index_uid,
                source_id: request.source_id,
                successes: request.shard_ids,
                failures: Vec::new(),
            };
            return Ok(response);
        }
        // Unhappy path: some shards were not deleted because they do not exist or are not fully
        // indexed.
        let not_deletable_pg_shards: Vec<PgShard> = sqlx::query_as(FIND_NOT_DELETABLE_SHARDS_QUERY)
            .bind(request.index_uid())
            .bind(&request.source_id)
            .bind(&request.shard_ids)
            .fetch_all(&self.connection_pool)
            .await?;

        if not_deletable_pg_shards.is_empty() {
            let response = DeleteShardsResponse {
                index_uid: request.index_uid,
                source_id: request.source_id,
                successes: request.shard_ids,
                failures: Vec::new(),
            };
            return Ok(response);
        }
        let failures: Vec<ShardId> = not_deletable_pg_shards
            .into_iter()
            .map(|pg_shard| pg_shard.shard_id)
            .collect();
        warn!(
            index_uid=%request.index_uid(),
            source_id=%request.source_id,
            "failed to delete shards `{}`: shards are not fully indexed",
            failures.iter().join(", ")
        );
        let successes: Vec<ShardId> = request
            .shard_ids
            .into_iter()
            .filter(|shard_id| !failures.contains(shard_id))
            .collect();
        let response = DeleteShardsResponse {
            index_uid: request.index_uid,
            source_id: request.source_id,
            successes,
            failures,
        };
        Ok(response)
    }

    async fn prune_shards(&self, request: PruneShardsRequest) -> MetastoreResult<EmptyResponse> {
        const PRUNE_AGE_SHARDS_QUERY: &str = include_str!("queries/shards/prune_age.sql");
        const PRUNE_COUNT_SHARDS_QUERY: &str = include_str!("queries/shards/prune_count.sql");

        if let Some(max_age_secs) = request.max_age_secs {
            let limit_datetime =
                OffsetDateTime::now_utc() - Duration::from_secs(max_age_secs as u64);
            sqlx::query(PRUNE_AGE_SHARDS_QUERY)
                .bind(request.index_uid())
                .bind(&request.source_id)
                .bind(limit_datetime)
                .execute(&self.connection_pool)
                .await?;
        }

        if let Some(max_count) = request.max_count {
            sqlx::query(PRUNE_COUNT_SHARDS_QUERY)
                .bind(request.index_uid())
                .bind(&request.source_id)
                .bind(max_count as i64)
                .execute(&self.connection_pool)
                .await?;
        }
        Ok(EmptyResponse {})
    }

    // Index Template API

    async fn create_index_template(
        &self,
        request: CreateIndexTemplateRequest,
    ) -> MetastoreResult<EmptyResponse> {
        const INSERT_INDEX_TEMPLATE_QUERY: &str =
            include_str!("queries/index_templates/insert.sql");
        const UPSERT_INDEX_TEMPLATE_QUERY: &str =
            include_str!("queries/index_templates/upsert.sql");

        let index_template: IndexTemplate =
            serde_utils::from_json_str(&request.index_template_json)?;

        index_template
            .validate()
            .map_err(|error| MetastoreError::InvalidArgument {
                message: format!(
                    "invalid index template `{}`: `{error}`",
                    index_template.template_id
                ),
            })?;

        let mut positive_patterns = Vec::new();
        let mut negative_patterns = Vec::new();

        for pattern in &index_template.index_id_patterns {
            if let Some(negative_pattern) = pattern.strip_prefix('-') {
                negative_patterns.push(negative_pattern.replace('*', "%"));
            } else {
                positive_patterns.push(pattern.replace('*', "%"));
            }
        }
        if request.overwrite {
            sqlx::query(UPSERT_INDEX_TEMPLATE_QUERY)
                .bind(&index_template.template_id)
                .bind(positive_patterns)
                .bind(negative_patterns)
                .bind(index_template.priority as i32)
                .bind(&request.index_template_json)
                .execute(&self.connection_pool)
                .await?;

            return Ok(EmptyResponse {});
        }
        let pg_query_result = sqlx::query(INSERT_INDEX_TEMPLATE_QUERY)
            .bind(&index_template.template_id)
            .bind(positive_patterns)
            .bind(negative_patterns)
            .bind(index_template.priority as i32)
            .bind(&request.index_template_json)
            .execute(&self.connection_pool)
            .await?;

        if pg_query_result.rows_affected() == 0 {
            return Err(MetastoreError::AlreadyExists(EntityKind::IndexTemplate {
                template_id: index_template.template_id,
            }));
        }
        Ok(EmptyResponse {})
    }

    async fn get_index_template(
        &self,
        request: GetIndexTemplateRequest,
    ) -> MetastoreResult<GetIndexTemplateResponse> {
        let pg_index_template_json: PgIndexTemplate =
            sqlx::query_as("SELECT * FROM index_templates WHERE template_id = $1")
                .bind(&request.template_id)
                .fetch_optional(&self.connection_pool)
                .await?
                .ok_or({
                    MetastoreError::NotFound(EntityKind::IndexTemplate {
                        template_id: request.template_id,
                    })
                })?;
        let response = GetIndexTemplateResponse {
            index_template_json: pg_index_template_json.index_template_json,
        };
        Ok(response)
    }

    async fn find_index_template_matches(
        &self,
        request: FindIndexTemplateMatchesRequest,
    ) -> MetastoreResult<FindIndexTemplateMatchesResponse> {
        if request.index_ids.is_empty() {
            return Ok(Default::default());
        }
        const FIND_INDEX_TEMPLATE_MATCHES_QUERY: &str =
            include_str!("queries/index_templates/find.sql");

        let sql_matches: Vec<(IndexId, IndexTemplateId, String)> =
            sqlx::query_as(FIND_INDEX_TEMPLATE_MATCHES_QUERY)
                .bind(&request.index_ids)
                .fetch_all(&self.connection_pool)
                .await?;

        let matches = sql_matches
            .into_iter()
            .map(
                |(index_id, template_id, index_template_json)| IndexTemplateMatch {
                    index_id,
                    template_id,
                    index_template_json,
                },
            )
            .collect();
        let response = FindIndexTemplateMatchesResponse { matches };
        Ok(response)
    }

    async fn list_index_templates(
        &self,
        _request: ListIndexTemplatesRequest,
    ) -> MetastoreResult<ListIndexTemplatesResponse> {
        let pg_index_templates_json: Vec<(String,)> = sqlx::query_as(
            "SELECT index_template_json FROM index_templates ORDER BY template_id ASC",
        )
        .fetch_all(&self.connection_pool)
        .await?;
        let index_templates_json: Vec<String> = pg_index_templates_json
            .into_iter()
            .map(|(index_template_json,)| index_template_json)
            .collect();
        let response = ListIndexTemplatesResponse {
            index_templates_json,
        };
        Ok(response)
    }

    async fn delete_index_templates(
        &self,
        request: DeleteIndexTemplatesRequest,
    ) -> MetastoreResult<EmptyResponse> {
        sqlx::query("DELETE FROM index_templates WHERE template_id = ANY($1)")
            .bind(&request.template_ids)
            .execute(&self.connection_pool)
            .await?;
        Ok(EmptyResponse {})
    }

    async fn get_cluster_identity(
        &self,
        _: GetClusterIdentityRequest,
    ) -> MetastoreResult<GetClusterIdentityResponse> {
        // `ON CONFLICT DO NOTHING RETURNING` returns NULL if no insert happens.
        // To always get the value, we use this pattern:
        let (uuid,) = sqlx::query_as(
            r"
                INSERT INTO kv (key, value)
                VALUES ('cluster_identity', $1)
                ON CONFLICT (key) DO UPDATE SET key = EXCLUDED.key
                RETURNING value
            ",
        )
        .bind(Uuid::new_v4().hyphenated().to_string())
        .fetch_one(&self.connection_pool)
        .await?;
        Ok(GetClusterIdentityResponse { uuid })
    }
}

async fn open_or_fetch_shard<'e>(
    executor: impl Executor<'e, Database = Postgres> + Clone,
    subrequest: &OpenShardSubrequest,
) -> MetastoreResult<Shard> {
    const OPEN_SHARDS_QUERY: &str = include_str!("queries/shards/open.sql");

    let pg_shard_opt: Option<PgShard> = sqlx::query_as(OPEN_SHARDS_QUERY)
        .bind(subrequest.index_uid())
        .bind(&subrequest.source_id)
        .bind(subrequest.shard_id().as_str())
        .bind(&subrequest.leader_id)
        .bind(&subrequest.follower_id)
        .bind(subrequest.doc_mapping_uid)
        .bind(&subrequest.publish_token)
        // Use a timestamp generated by the metastore node to avoid clock drift issues
        .bind(OffsetDateTime::now_utc())
        .fetch_optional(executor.clone())
        .await?;

    if let Some(pg_shard) = pg_shard_opt {
        let shard: Shard = pg_shard.into();
        info!(
            index_uid=%shard.index_uid(),
            source_id=%shard.source_id,
            shard_id=%shard.shard_id(),
            leader_id=%shard.leader_id,
            follower_id=?shard.follower_id,
            "opened shard"
        );
        return Ok(shard);
    }
    const FETCH_SHARD_QUERY: &str = include_str!("queries/shards/fetch.sql");

    let pg_shard_opt: Option<PgShard> = sqlx::query_as(FETCH_SHARD_QUERY)
        .bind(subrequest.index_uid())
        .bind(&subrequest.source_id)
        .bind(subrequest.shard_id().as_str())
        .fetch_optional(executor)
        .await?;

    if let Some(pg_shard) = pg_shard_opt {
        return Ok(pg_shard.into());
    }
    Err(MetastoreError::NotFound(EntityKind::Source {
        index_id: subrequest.index_uid().to_string(),
        source_id: subrequest.source_id.clone(),
    }))
}

impl MetastoreServiceExt for PostgresqlMetastore {}

/// Builds the SQL query that returns indexes matching at least one pattern in
/// `index_id_patterns`, and none of the patterns starting with '-'
///
/// For each pattern, we check whether the pattern is valid and replace `*` by `%`
/// to build a SQL `LIKE` query.
fn build_index_id_patterns_sql_query(index_id_patterns: &[String]) -> anyhow::Result<String> {
    let mut positive_patterns = Vec::new();
    let mut negative_patterns = Vec::new();
    for pattern in index_id_patterns {
        if let Some(negative_pattern) = pattern.strip_prefix('-') {
            negative_patterns.push(negative_pattern.to_string());
        } else {
            positive_patterns.push(pattern);
        }
    }

    if positive_patterns.is_empty() {
        anyhow::bail!("The list of index id patterns may not be empty.");
    }

    if index_id_patterns.iter().any(|pattern| pattern == "*") && negative_patterns.is_empty() {
        return Ok("SELECT * FROM indexes".to_string());
    }

    let mut where_like_query = String::new();
    for (index_id_pattern_idx, index_id_pattern) in positive_patterns.iter().enumerate() {
        validate_index_id_pattern(index_id_pattern, false).map_err(|error| {
            MetastoreError::Internal {
                message: "failed to build list indexes query".to_string(),
                cause: error.to_string(),
            }
        })?;
        if index_id_pattern_idx != 0 {
            where_like_query.push_str(" OR ");
        }
        if index_id_pattern.contains('*') {
            let sql_pattern = index_id_pattern.replace('*', "%");
            let _ = write!(where_like_query, "index_id LIKE '{sql_pattern}'");
        } else {
            let _ = write!(where_like_query, "index_id = '{index_id_pattern}'");
        }
    }
    let mut negative_like_query = String::new();
    for index_id_pattern in negative_patterns.iter() {
        validate_index_id_pattern(index_id_pattern, false).map_err(|error| {
            MetastoreError::Internal {
                message: "failed to build list indexes query".to_string(),
                cause: error.to_string(),
            }
        })?;
        negative_like_query.push_str(" AND ");
        if index_id_pattern.contains('*') {
            let sql_pattern = index_id_pattern.replace('*', "%");
            let _ = write!(negative_like_query, "index_id NOT LIKE '{sql_pattern}'");
        } else {
            let _ = write!(negative_like_query, "index_id <> '{index_id_pattern}'");
        }
    }

    Ok(format!(
        "SELECT * FROM indexes WHERE ({where_like_query}){negative_like_query}"
    ))
}

/// A postgres metastore factory
#[cfg(test)]
#[async_trait]
impl crate::tests::DefaultForTest for PostgresqlMetastore {
    async fn default_for_test() -> Self {
        // We cannot use a singleton here,
        // because sqlx needs the runtime used to create a connection to
        // not being dropped.
        //
        // Each unit test runs its own tokio Runtime, so a singleton would mean
        // tying the connection pool to the runtime of one unit test.
        // Concretely this results in a "IO driver has terminated"
        // once the first unit test finishes and its runtime is dropped.
        //
        // The number of connections to Postgres should not be
        // too catastrophic, as it is limited by the number of concurrent
        // unit tests running (= number of test-threads).
        dotenvy::dotenv().ok();
        let uri: Uri = std::env::var("QW_TEST_DATABASE_URL")
            .expect("environment variable `QW_TEST_DATABASE_URL` should be set")
            .parse()
            .expect("environment variable `QW_TEST_DATABASE_URL` should be a valid URI");
        PostgresqlMetastore::new(&PostgresMetastoreConfig::default(), &uri)
            .await
            .expect("failed to initialize PostgreSQL metastore test")
    }
}

#[cfg(test)]
mod tests {
    use async_trait::async_trait;
    use quickwit_common::uri::Protocol;
    use quickwit_doc_mapper::tag_pruning::TagFilterAst;
    use quickwit_proto::ingest::Shard;
    use quickwit_proto::metastore::MetastoreService;
    use quickwit_proto::types::{IndexUid, SourceId};
    use sea_query::{Asterisk, PostgresQueryBuilder, Query};
    use time::OffsetDateTime;

    use super::*;
    use crate::metastore::postgres::metastore::build_index_id_patterns_sql_query;
    use crate::metastore::postgres::model::{PgShard, Splits};
    use crate::tests::DefaultForTest;
    use crate::tests::shard::ReadWriteShardsForTest;
    use crate::{ListSplitsQuery, SplitState, metastore_test_suite};

    #[async_trait]
    impl ReadWriteShardsForTest for PostgresqlMetastore {
        async fn insert_shards(
            &self,
            index_uid: &IndexUid,
            source_id: &SourceId,
            shards: Vec<Shard>,
        ) {
            const INSERT_SHARD_QUERY: &str = include_str!("queries/shards/insert.sql");

            for shard in shards {
                assert_eq!(&shard.source_id, source_id);
                assert_eq!(shard.index_uid(), index_uid);
                // explicit destructuring to ensure new fields are properly handled
                let Shard {
                    doc_mapping_uid,
                    follower_id,
                    index_uid,
                    leader_id,
                    publish_position_inclusive,
                    publish_token,
                    shard_id,
                    shard_state,
                    source_id,
                    update_timestamp,
                } = shard;
                let shard_state_name = ShardState::try_from(shard_state)
                    .unwrap()
                    .as_json_str_name();
                let update_timestamp = OffsetDateTime::from_unix_timestamp(update_timestamp)
                    .expect("Bad timestamp format");
                sqlx::query(INSERT_SHARD_QUERY)
                    .bind(index_uid)
                    .bind(source_id)
                    .bind(shard_id.unwrap())
                    .bind(shard_state_name)
                    .bind(leader_id)
                    .bind(follower_id)
                    .bind(doc_mapping_uid)
                    .bind(publish_position_inclusive.unwrap().to_string())
                    .bind(publish_token)
                    .bind(update_timestamp)
                    .execute(&self.connection_pool)
                    .await
                    .unwrap();
            }
        }

        async fn list_all_shards(&self, index_uid: &IndexUid, source_id: &SourceId) -> Vec<Shard> {
            let pg_shards: Vec<PgShard> = sqlx::query_as(
                r#"
                SELECT *
                FROM shards
                WHERE
                    index_uid = $1
                    AND source_id = $2
                "#,
            )
            .bind(index_uid)
            .bind(source_id)
            .fetch_all(&self.connection_pool)
            .await
            .unwrap();

            pg_shards
                .into_iter()
                .map(|pg_shard| pg_shard.into())
                .collect()
        }
    }

    metastore_test_suite!(crate::PostgresqlMetastore);

    #[tokio::test]
    async fn test_metastore_connectivity_and_endpoints() {
        let metastore = PostgresqlMetastore::default_for_test().await;
        metastore.check_connectivity().await.unwrap();
        assert_eq!(metastore.endpoints()[0].protocol(), Protocol::PostgreSQL);
    }

    #[test]
    fn test_single_sql_query_builder() {
        let mut select_statement = Query::select();

        let sql = select_statement.column(Asterisk).from(Splits::Table);
        let index_uid = IndexUid::new_with_random_ulid("test-index");
        let query =
            ListSplitsQuery::for_index(index_uid.clone()).with_split_state(SplitState::Staged);
        append_query_filters_and_order_by(sql, &query);

        assert_eq!(
            sql.to_string(PostgresQueryBuilder),
            format!(
                r#"SELECT * FROM "splits" WHERE "index_uid" IN ('{index_uid}') AND "split_state" IN ('Staged')"#
            )
        );

        let mut select_statement = Query::select();
        let sql = select_statement.column(Asterisk).from(Splits::Table);

        let query =
            ListSplitsQuery::for_index(index_uid.clone()).with_split_state(SplitState::Published);
        append_query_filters_and_order_by(sql, &query);

        assert_eq!(
            sql.to_string(PostgresQueryBuilder),
            format!(
                r#"SELECT * FROM "splits" WHERE "index_uid" IN ('{index_uid}') AND "split_state" IN ('Published')"#
            )
        );

        let mut select_statement = Query::select();
        let sql = select_statement.column(Asterisk).from(Splits::Table);

        let query = ListSplitsQuery::for_index(index_uid.clone())
            .with_split_states([SplitState::Published, SplitState::MarkedForDeletion]);
        append_query_filters_and_order_by(sql, &query);
        assert_eq!(
            sql.to_string(PostgresQueryBuilder),
            format!(
                r#"SELECT * FROM "splits" WHERE "index_uid" IN ('{index_uid}') AND "split_state" IN ('Published', 'MarkedForDeletion')"#
            )
        );

        let mut select_statement = Query::select();
        let sql = select_statement.column(Asterisk).from(Splits::Table);

        let query = ListSplitsQuery::for_index(index_uid.clone()).with_update_timestamp_lt(51);
        append_query_filters_and_order_by(sql, &query);
        assert_eq!(
            sql.to_string(PostgresQueryBuilder),
            format!(
                r#"SELECT * FROM "splits" WHERE "index_uid" IN ('{index_uid}') AND "update_timestamp" < TO_TIMESTAMP(51)"#
            )
        );

        let mut select_statement = Query::select();
        let sql = select_statement.column(Asterisk).from(Splits::Table);

        let query = ListSplitsQuery::for_index(index_uid.clone()).with_create_timestamp_lte(55);
        append_query_filters_and_order_by(sql, &query);
        assert_eq!(
            sql.to_string(PostgresQueryBuilder),
            format!(
                r#"SELECT * FROM "splits" WHERE "index_uid" IN ('{index_uid}') AND "create_timestamp" <= TO_TIMESTAMP(55)"#
            )
        );

        let mut select_statement = Query::select();
        let sql = select_statement.column(Asterisk).from(Splits::Table);

        let maturity_evaluation_datetime = OffsetDateTime::from_unix_timestamp(55).unwrap();
        let query = ListSplitsQuery::for_index(index_uid.clone())
            .retain_mature(maturity_evaluation_datetime);
        append_query_filters_and_order_by(sql, &query);

        assert_eq!(
            sql.to_string(PostgresQueryBuilder),
            format!(
                r#"SELECT * FROM "splits" WHERE "index_uid" IN ('{index_uid}') AND ("maturity_timestamp" = TO_TIMESTAMP(0) OR "maturity_timestamp" <= TO_TIMESTAMP(55))"#
            )
        );

        let mut select_statement = Query::select();
        let sql = select_statement.column(Asterisk).from(Splits::Table);

        let query = ListSplitsQuery::for_index(index_uid.clone())
            .retain_immature(maturity_evaluation_datetime);
        append_query_filters_and_order_by(sql, &query);
        assert_eq!(
            sql.to_string(PostgresQueryBuilder),
            format!(
                r#"SELECT * FROM "splits" WHERE "index_uid" IN ('{index_uid}') AND "maturity_timestamp" > TO_TIMESTAMP(55)"#
            )
        );

        let mut select_statement = Query::select();
        let sql = select_statement.column(Asterisk).from(Splits::Table);

        let query = ListSplitsQuery::for_index(index_uid.clone()).with_delete_opstamp_gte(4);
        append_query_filters_and_order_by(sql, &query);
        assert_eq!(
            sql.to_string(PostgresQueryBuilder),
            format!(
                r#"SELECT * FROM "splits" WHERE "index_uid" IN ('{index_uid}') AND "delete_opstamp" >= 4"#
            )
        );

        let mut select_statement = Query::select();
        let sql = select_statement.column(Asterisk).from(Splits::Table);

        let query = ListSplitsQuery::for_index(index_uid.clone()).with_time_range_start_gt(45);
        append_query_filters_and_order_by(sql, &query);
        assert_eq!(
            sql.to_string(PostgresQueryBuilder),
            format!(
                r#"SELECT * FROM "splits" WHERE "index_uid" IN ('{index_uid}') AND ("time_range_end" > 45 OR "time_range_end" IS NULL)"#
            )
        );

        let mut select_statement = Query::select();
        let sql = select_statement.column(Asterisk).from(Splits::Table);

        let query = ListSplitsQuery::for_index(index_uid.clone()).with_time_range_end_lt(45);
        append_query_filters_and_order_by(sql, &query);
        assert_eq!(
            sql.to_string(PostgresQueryBuilder),
            format!(
                r#"SELECT * FROM "splits" WHERE "index_uid" IN ('{index_uid}') AND ("time_range_start" < 45 OR "time_range_start" IS NULL)"#
            )
        );

        let mut select_statement = Query::select();
        let sql = select_statement.column(Asterisk).from(Splits::Table);

        let query =
            ListSplitsQuery::for_index(index_uid.clone()).with_tags_filter(TagFilterAst::Tag {
                is_present: false,
                tag: "tag-2".to_string(),
            });
        append_query_filters_and_order_by(sql, &query);

        assert_eq!(
            sql.to_string(PostgresQueryBuilder),
            format!(
                r#"SELECT * FROM "splits" WHERE "index_uid" IN ('{index_uid}') AND (NOT ($$tag-2$$ = ANY(tags)))"#
            )
        );

        let mut select_statement = Query::select();
        let sql = select_statement.column(Asterisk).from(Splits::Table);

        let query = ListSplitsQuery::for_index(index_uid.clone()).with_offset(4);
        append_query_filters_and_order_by(sql, &query);

        assert_eq!(
            sql.to_string(PostgresQueryBuilder),
            format!(
                r#"SELECT * FROM "splits" WHERE "index_uid" IN ('{index_uid}') ORDER BY "split_id" ASC OFFSET 4"#
            )
        );

        let mut select_statement = Query::select();
        let sql = select_statement.column(Asterisk).from(Splits::Table);

        let query = ListSplitsQuery::for_index(index_uid.clone()).sort_by_index_uid();
        append_query_filters_and_order_by(sql, &query);

        assert_eq!(
            sql.to_string(PostgresQueryBuilder),
            format!(
                r#"SELECT * FROM "splits" WHERE "index_uid" IN ('{index_uid}') ORDER BY "index_uid" ASC, "split_id" ASC"#
            )
        );

        let mut select_statement = Query::select();
        let sql = select_statement.column(Asterisk).from(Splits::Table);

        let query =
            ListSplitsQuery::for_index(index_uid.clone()).after_split(&crate::SplitMetadata {
                index_uid: index_uid.clone(),
                split_id: "my_split".to_string(),
                ..Default::default()
            });
        append_query_filters_and_order_by(sql, &query);

        assert_eq!(
            sql.to_string(PostgresQueryBuilder),
            format!(
                r#"SELECT * FROM "splits" WHERE "index_uid" IN ('{index_uid}') AND ("index_uid", "split_id") > ('{index_uid}', 'my_split')"#
            )
        );

        let mut select_statement = Query::select();
        let sql = select_statement.column(Asterisk).from(Splits::Table);

        let query = ListSplitsQuery::for_all_indexes().with_split_state(SplitState::Staged);
        append_query_filters_and_order_by(sql, &query);

        assert_eq!(
            sql.to_string(PostgresQueryBuilder),
            r#"SELECT * FROM "splits" WHERE "split_state" IN ('Staged')"#
        );

        let mut select_statement = Query::select();
        let sql = select_statement.column(Asterisk).from(Splits::Table);

        let query = ListSplitsQuery::for_all_indexes().with_max_time_range_end(42);
        append_query_filters_and_order_by(sql, &query);

        assert_eq!(
            sql.to_string(PostgresQueryBuilder),
            r#"SELECT * FROM "splits" WHERE "time_range_end" <= 42"#
        );
    }

    #[test]
    fn test_combination_sql_query_builder() {
        let mut select_statement = Query::select();
        let sql = select_statement.column(Asterisk).from(Splits::Table);

        let index_uid = IndexUid::new_with_random_ulid("test-index");
        let query = ListSplitsQuery::for_index(index_uid.clone())
            .with_time_range_start_gt(0)
            .with_time_range_end_lt(40);
        append_query_filters_and_order_by(sql, &query);
        assert_eq!(
            sql.to_string(PostgresQueryBuilder),
            format!(
                r#"SELECT * FROM "splits" WHERE "index_uid" IN ('{index_uid}') AND ("time_range_end" > 0 OR "time_range_end" IS NULL) AND ("time_range_start" < 40 OR "time_range_start" IS NULL)"#
            )
        );

        let mut select_statement = Query::select();
        let sql = select_statement.column(Asterisk).from(Splits::Table);

        let query = ListSplitsQuery::for_index(index_uid.clone())
            .with_time_range_start_gt(45)
            .with_delete_opstamp_gt(0);
        append_query_filters_and_order_by(sql, &query);
        assert_eq!(
            sql.to_string(PostgresQueryBuilder),
            format!(
                r#"SELECT * FROM "splits" WHERE "index_uid" IN ('{index_uid}') AND ("time_range_end" > 45 OR "time_range_end" IS NULL) AND "delete_opstamp" > 0"#
            )
        );

        let mut select_statement = Query::select();
        let sql = select_statement.column(Asterisk).from(Splits::Table);

        let query = ListSplitsQuery::for_index(index_uid.clone())
            .with_update_timestamp_lt(51)
            .with_create_timestamp_lte(63);
        append_query_filters_and_order_by(sql, &query);
        assert_eq!(
            sql.to_string(PostgresQueryBuilder),
            format!(
                r#"SELECT * FROM "splits" WHERE "index_uid" IN ('{index_uid}') AND "update_timestamp" < TO_TIMESTAMP(51) AND "create_timestamp" <= TO_TIMESTAMP(63)"#
            )
        );

        let mut select_statement = Query::select();
        let sql = select_statement.column(Asterisk).from(Splits::Table);

        let query = ListSplitsQuery::for_index(index_uid.clone())
            .with_time_range_start_gt(90)
            .with_tags_filter(TagFilterAst::Tag {
                is_present: true,
                tag: "tag-1".to_string(),
            });
        append_query_filters_and_order_by(sql, &query);
        assert_eq!(
            sql.to_string(PostgresQueryBuilder),
            format!(
                r#"SELECT * FROM "splits" WHERE "index_uid" IN ('{index_uid}') AND ($$tag-1$$ = ANY(tags)) AND ("time_range_end" > 90 OR "time_range_end" IS NULL)"#
            )
        );

        let mut select_statement = Query::select();
        let sql = select_statement.column(Asterisk).from(Splits::Table);

        let index_uid_2 = IndexUid::new_with_random_ulid("test-index-2");
        let query =
            ListSplitsQuery::try_from_index_uids(vec![index_uid.clone(), index_uid_2.clone()])
                .unwrap();
        append_query_filters_and_order_by(sql, &query);
        assert_eq!(
            sql.to_string(PostgresQueryBuilder),
            format!(
                r#"SELECT * FROM "splits" WHERE "index_uid" IN ('{index_uid}', '{index_uid_2}')"#
            )
        );
    }

    #[test]
    fn test_index_id_pattern_like_query() {
        assert_eq!(
            &build_index_id_patterns_sql_query(&["*-index-*-last*".to_string()]).unwrap(),
            "SELECT * FROM indexes WHERE (index_id LIKE '%-index-%-last%')"
        );
        assert_eq!(
            &build_index_id_patterns_sql_query(&[
                "*-index-*-last*".to_string(),
                "another-index".to_string()
            ])
            .unwrap(),
            "SELECT * FROM indexes WHERE (index_id LIKE '%-index-%-last%' OR index_id = \
             'another-index')"
        );
        assert_eq!(
            &build_index_id_patterns_sql_query(&[
                "*-index-*-last**".to_string(),
                "another-index".to_string(),
                "*".to_string()
            ])
            .unwrap(),
            "SELECT * FROM indexes"
        );
        assert_eq!(
            build_index_id_patterns_sql_query(&["*-index-*-&-last**".to_string()])
                .unwrap_err()
                .to_string(),
            "internal error: failed to build list indexes query; cause: `index ID pattern \
             `*-index-*-&-last**` is invalid: patterns must match the following regular \
             expression: `^[a-zA-Z\\*][a-zA-Z0-9-_\\.\\*]{0,254}$``"
        );

        assert_eq!(
            &build_index_id_patterns_sql_query(&["*".to_string(), "-index-name".to_string()])
                .unwrap(),
            "SELECT * FROM indexes WHERE (index_id LIKE '%') AND index_id <> 'index-name'"
        );

        assert_eq!(
            &build_index_id_patterns_sql_query(&[
                "*-index-*-last*".to_string(),
                "another-index".to_string(),
                "-*-index-1-last*".to_string(),
                "-index-2-last".to_string(),
            ])
            .unwrap(),
            "SELECT * FROM indexes WHERE (index_id LIKE '%-index-%-last%' OR index_id = \
             'another-index') AND index_id NOT LIKE '%-index-1-last%' AND index_id <> \
             'index-2-last'"
        );
    }
}


================================================
FILE: quickwit/quickwit-metastore/src/metastore/postgres/metrics.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use once_cell::sync::Lazy;
use quickwit_common::metrics::{IntGauge, new_gauge};

#[derive(Clone)]
pub(super) struct PostgresMetrics {
    pub acquire_connections: IntGauge,
    pub active_connections: IntGauge,
    pub idle_connections: IntGauge,
}

impl Default for PostgresMetrics {
    fn default() -> Self {
        Self {
            acquire_connections: new_gauge(
                "acquire_connections",
                "Number of connections being acquired.",
                "metastore",
                &[],
            ),
            active_connections: new_gauge(
                "active_connections",
                "Number of active (used + idle) connections.",
                "metastore",
                &[],
            ),
            idle_connections: new_gauge(
                "idle_connections",
                "Number of idle connections.",
                "metastore",
                &[],
            ),
        }
    }
}

pub(super) static POSTGRES_METRICS: Lazy<PostgresMetrics> = Lazy::new(PostgresMetrics::default);


================================================
FILE: quickwit/quickwit-metastore/src/metastore/postgres/migrator.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::BTreeMap;

use quickwit_proto::metastore::{MetastoreError, MetastoreResult};
use sqlx::migrate::{Migrate, Migrator};
use sqlx::{Acquire, PgConnection, Postgres};
use tracing::{error, instrument};

use super::pool::TrackedPool;

fn get_migrations() -> Migrator {
    sqlx::migrate!("migrations/postgresql")
}

/// Initializes the database and runs the SQL migrations stored in the
/// `quickwit-metastore/migrations` directory.
#[instrument(skip_all)]
pub(super) async fn run_migrations(
    pool: &TrackedPool<Postgres>,
    skip_migrations: bool,
    skip_locking: bool,
) -> MetastoreResult<()> {
    let mut tx = pool.begin().await?;
    let conn = tx.acquire().await?;

    let mut migrator = get_migrations();

    if skip_locking {
        migrator.set_locking(false);
    }

    if !skip_migrations {
        // this is an hidden function, made to get "around the annoying "implementation of `Acquire`
        // is not general enough" error", which is the error we get otherwise.
        let migrate_result = migrator.run_direct(conn).await;

        let Err(migrate_error) = migrate_result else {
            tx.commit().await?;
            return Ok(());
        };
        tx.rollback().await?;
        error!(error=%migrate_error, "failed to run PostgreSQL migrations");

        Err(MetastoreError::Internal {
            message: "failed to run PostgreSQL migrations".to_string(),
            cause: migrate_error.to_string(),
        })
    } else {
        check_migrations(migrator, conn).await
    }
}

async fn check_migrations(migrator: Migrator, conn: &mut PgConnection) -> MetastoreResult<()> {
    let dirty = match conn.dirty_version().await {
        Ok(dirty) => dirty,
        Err(migrate_error) => {
            error!(error=%migrate_error, "failed to validate PostgreSQL migrations");

            return Err(MetastoreError::Internal {
                message: "failed to validate PostgreSQL migrations".to_string(),
                cause: migrate_error.to_string(),
            });
        }
    };
    if let Some(dirty) = dirty {
        error!("migration {dirty} is dirty");

        return Err(MetastoreError::Internal {
            message: "failed to validate PostgreSQL migrations".to_string(),
            cause: format!("migration {dirty} is dirty"),
        });
    };
    let applied_migrations = match conn.list_applied_migrations().await {
        Ok(applied_migrations) => applied_migrations,
        Err(migrate_error) => {
            error!(error=%migrate_error, "failed to validate PostgreSQL migrations");

            return Err(MetastoreError::Internal {
                message: "failed to validate PostgreSQL migrations".to_string(),
                cause: migrate_error.to_string(),
            });
        }
    };
    let expected_migrations: BTreeMap<_, _> = migrator
        .iter()
        .filter(|migration| migration.migration_type.is_up_migration())
        .map(|migration| (migration.version, migration))
        .collect();
    if applied_migrations.len() < expected_migrations.len() {
        error!(
            "missing migrations, expected {} migrations, only {} present in database",
            expected_migrations.len(),
            applied_migrations.len()
        );

        return Err(MetastoreError::Internal {
            message: "failed to validate PostgreSQL migrations".to_string(),
            cause: format!(
                "missing migrations, expected {} migrations, only {} present in database",
                expected_migrations.len(),
                applied_migrations.len()
            ),
        });
    }
    for applied_migration in applied_migrations {
        let Some(migration) = expected_migrations.get(&applied_migration.version) else {
            error!(
                "found unknown migration {} in database",
                applied_migration.version
            );

            return Err(MetastoreError::Internal {
                message: "failed to validate PostgreSQL migrations".to_string(),
                cause: format!(
                    "found unknown migration {} in database",
                    applied_migration.version
                ),
            });
        };
        if migration.checksum != applied_migration.checksum {
            error!(
                "migration {} differ between database and expected value",
                applied_migration.version
            );

            return Err(MetastoreError::Internal {
                message: "failed to validate PostgreSQL migrations".to_string(),
                cause: format!(
                    "migration {} differ between database and expected value",
                    applied_migration.version
                ),
            });
        }
    }
    Ok(())
}

#[cfg(test)]
mod tests {
    use std::time::Duration;

    use quickwit_common::uri::Uri;
    use sqlx::Acquire;
    use sqlx::migrate::Migrate;

    use super::{get_migrations, run_migrations};
    use crate::metastore::postgres::utils::establish_connection;

    #[tokio::test]
    #[serial_test::file_serial]
    async fn test_metastore_check_migration() {
        let _ = tracing_subscriber::fmt::try_init();

        dotenvy::dotenv().ok();
        let uri: Uri = std::env::var("QW_TEST_DATABASE_URL")
            .expect("environment variable `QW_TEST_DATABASE_URL` should be set")
            .parse()
            .expect("environment variable `QW_TEST_DATABASE_URL` should be a valid URI");

        {
            let connection_pool =
                establish_connection(&uri, 1, 5, Duration::from_secs(2), None, None, false)
                    .await
                    .unwrap();
            // make sure migrations are run
            run_migrations(&connection_pool, false, false)
                .await
                .unwrap();

            // we just ran migration, nothing else to run
            run_migrations(&connection_pool, true, false).await.unwrap();

            let migrations = get_migrations();
            let last_migration = migrations
                .iter()
                .map(|migration| migration.version)
                .max()
                .expect("no migration exists?");
            let up_migration = migrations
                .iter()
                .find(|migration| {
                    migration.version == last_migration
                        && migration.migration_type.is_up_migration()
                })
                .unwrap();
            let down_migration = migrations
                .iter()
                .find(|migration| {
                    migration.version == last_migration
                        && migration.migration_type.is_down_migration()
                })
                .unwrap();
            let mut conn = connection_pool.acquire().await.unwrap();

            conn.revert(down_migration).await.unwrap();

            run_migrations(&connection_pool, true, false)
                .await
                .unwrap_err();

            conn.apply(up_migration).await.unwrap();
        }

        {
            let connection_pool =
                establish_connection(&uri, 1, 5, Duration::from_secs(2), None, None, true)
                    .await
                    .unwrap();
            // error because we are in read only mode, and we try to run migrations
            run_migrations(&connection_pool, false, false)
                .await
                .unwrap_err();
            // okay because all migrations were already run before
            run_migrations(&connection_pool, true, false).await.unwrap();
        }
    }
}


================================================
FILE: quickwit/quickwit-metastore/src/metastore/postgres/mod.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

mod error;
mod factory;
mod metastore;
mod metrics;
mod migrator;
mod model;
mod pool;
mod split_stream;
mod tags;
mod utils;

pub use factory::PostgresqlMetastoreFactory;
pub use metastore::PostgresqlMetastore;

const QW_POSTGRES_SKIP_MIGRATIONS_ENV_KEY: &str = "QW_POSTGRES_SKIP_MIGRATIONS";
const QW_POSTGRES_SKIP_MIGRATION_LOCKING_ENV_KEY: &str = "QW_POSTGRES_SKIP_MIGRATION_LOCKING";
const QW_POSTGRES_READ_ONLY_ENV_KEY: &str = "QW_POSTGRES_READ_ONLY";


================================================
FILE: quickwit/quickwit-metastore/src/metastore/postgres/model.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#![allow(dead_code)]

use std::convert::TryInto;
use std::str::FromStr;

use quickwit_proto::ingest::{Shard, ShardState};
use quickwit_proto::metastore::{DeleteQuery, DeleteTask, MetastoreError, MetastoreResult};
use quickwit_proto::types::{DocMappingUid, IndexId, IndexUid, ShardId, SourceId, SplitId};
use sea_query::{Iden, Write};
use tracing::error;

use crate::{IndexMetadata, Split, SplitMetadata, SplitState};

#[derive(Iden, Clone, Copy)]
#[allow(dead_code)]
pub enum Indexes {
    Table,
    IndexUid,
    IndexId,
    IndexMetadataJson,
    CreateTimestamp,
}

/// A model structure for handling index metadata in a database.
#[derive(sqlx::FromRow)]
pub(super) struct PgIndex {
    /// Index UID. The index UID identifies the index when querying the metastore from the
    /// application.
    #[sqlx(try_from = "String")]
    pub index_uid: IndexUid,
    /// Index ID. The index ID is used to resolve user queries.
    pub index_id: IndexId,
    // A JSON string containing all of the IndexMetadata.
    pub index_metadata_json: String,
    /// Timestamp for tracking when the split was created.
    pub create_timestamp: sqlx::types::time::PrimitiveDateTime,
}

impl PgIndex {
    /// Deserializes index metadata from JSON string stored in column and sets appropriate
    /// timestamps.
    pub fn index_metadata(&self) -> MetastoreResult<IndexMetadata> {
        let mut index_metadata = serde_json::from_str::<IndexMetadata>(&self.index_metadata_json)
            .map_err(|error| {
            error!(index_id=%self.index_id, error=?error, "failed to deserialize index metadata");

            MetastoreError::JsonDeserializeError {
                struct_name: "IndexMetadata".to_string(),
                message: error.to_string(),
            }
        })?;
        // `create_timestamp` and `update_timestamp` are stored in dedicated columns but are also
        // duplicated in [`IndexMetadata`]. We must override the duplicates with the authentic
        // values upon deserialization.
        index_metadata.create_timestamp = self.create_timestamp.assume_utc().unix_timestamp();
        Ok(index_metadata)
    }
}

#[derive(Iden, Clone, Copy)]
#[allow(dead_code)]
pub enum Splits {
    Table,
    SplitId,
    SplitState,
    TimeRangeStart,
    TimeRangeEnd,
    CreateTimestamp,
    UpdateTimestamp,
    PublishTimestamp,
    MaturityTimestamp,
    Tags,
    SplitMetadataJson,
    IndexUid,
    NodeId,
    DeleteOpstamp,
}

pub(super) struct ToTimestampFunc;

impl Iden for ToTimestampFunc {
    fn unquoted(&self, s: &mut dyn Write) {
        write!(s, "TO_TIMESTAMP").unwrap()
    }
}

/// A model structure for handling split metadata in a database.
#[derive(sqlx::FromRow)]
pub(super) struct PgSplit {
    /// Split ID.
    pub split_id: SplitId,
    /// The state of the split. With `update_timestamp`, this is the only mutable attribute of the
    /// split.
    pub split_state: String,
    /// If a timestamp field is available, the min timestamp of the split.
    pub time_range_start: Option<i64>,
    /// If a timestamp field is available, the max timestamp of the split.
    pub time_range_end: Option<i64>,
    /// Timestamp for tracking when the split was created.
    pub create_timestamp: sqlx::types::time::PrimitiveDateTime,
    /// Timestamp for tracking when the split was last updated.
    pub update_timestamp: sqlx::types::time::PrimitiveDateTime,
    /// Timestamp for tracking when the split was published.
    pub publish_timestamp: Option<sqlx::types::time::PrimitiveDateTime>,
    /// Timestamp for tracking when the split becomes mature.
    /// If a split is already mature, this timestamp is set to 0.
    pub maturity_timestamp: sqlx::types::time::PrimitiveDateTime,
    /// A list of tags for categorizing and searching group of splits.
    pub tags: Vec<String>,
    // The split's metadata serialized as a JSON string.
    pub split_metadata_json: String,
    /// Index UID. It is used as a foreign key in the database.
    #[sqlx(try_from = "String")]
    pub index_uid: IndexUid,
    /// Delete opstamp.
    pub delete_opstamp: i64,
}

impl PgSplit {
    /// Deserializes and returns the split's metadata.
    fn split_metadata(&self) -> MetastoreResult<SplitMetadata> {
        serde_json::from_str::<SplitMetadata>(&self.split_metadata_json).map_err(|error| {
            error!(index_id=%self.index_uid.index_id, split_id=%self.split_id, error=?error, "failed to deserialize split metadata");

            MetastoreError::JsonDeserializeError {
                struct_name: "SplitMetadata".to_string(),
                message: error.to_string(),
            }
        })
    }

    /// Deserializes and returns the split's state.
    fn split_state(&self) -> MetastoreResult<SplitState> {
        SplitState::from_str(&self.split_state).map_err(|error| {
            error!(index_id=%self.index_uid.index_id, split_id=%self.split_id, split_state=?self.split_state, error=?error, "failed to deserialize split state");
            MetastoreError::JsonDeserializeError {
                struct_name: "SplitState".to_string(),
                message: error,
            }
        })
    }
}

impl TryInto<Split> for PgSplit {
    type Error = MetastoreError;

    fn try_into(self) -> Result<Split, Self::Error> {
        let mut split_metadata = self.split_metadata()?;
        // `create_timestamp` and `delete_opstamp` are duplicated in `SplitMetadata` and needs to be
        // overridden with the "true" value stored in a column.
        split_metadata.create_timestamp = self.create_timestamp.assume_utc().unix_timestamp();
        let split_state = self.split_state()?;
        let update_timestamp = self.update_timestamp.assume_utc().unix_timestamp();
        let publish_timestamp = self
            .publish_timestamp
            .map(|publish_timestamp| publish_timestamp.assume_utc().unix_timestamp());
        split_metadata.index_uid = self.index_uid;
        split_metadata.delete_opstamp = self.delete_opstamp as u64;
        Ok(Split {
            split_metadata,
            split_state,
            update_timestamp,
            publish_timestamp,
        })
    }
}

/// A model structure for handling split metadata in a database.
#[derive(sqlx::FromRow)]
pub(super) struct PgDeleteTask {
    /// Create timestamp.
    pub create_timestamp: sqlx::types::time::PrimitiveDateTime,
    /// Monotonic increasing unique opstamp.
    pub opstamp: i64,
    /// Index uid.
    #[sqlx(try_from = "String")]
    pub index_uid: IndexUid,
    /// Query serialized as a JSON string.
    pub delete_query_json: String,
}

impl PgDeleteTask {
    /// Deserializes and returns the split's metadata.
    fn delete_query(&self) -> MetastoreResult<DeleteQuery> {
        serde_json::from_str::<DeleteQuery>(&self.delete_query_json).map_err(|error| {
            error!(index_id=%self.index_uid.index_id, opstamp=%self.opstamp, error=?error, "failed to deserialize delete query");

            MetastoreError::JsonDeserializeError {
                struct_name: "DeleteQuery".to_string(),
                message: error.to_string(),
            }
        })
    }
}

impl TryInto<DeleteTask> for PgDeleteTask {
    type Error = MetastoreError;

    fn try_into(self) -> Result<DeleteTask, Self::Error> {
        let delete_query = self.delete_query()?;
        Ok(DeleteTask {
            create_timestamp: self.create_timestamp.assume_utc().unix_timestamp(),
            opstamp: self.opstamp as u64,
            delete_query: Some(delete_query),
        })
    }
}

#[derive(Iden, Clone, Copy)]
pub(super) enum Shards {
    Table,
    IndexUid,
    SourceId,
    ShardId,
    ShardState,
    LeaderId,
    FollowerId,
    PublishPositionInclusive,
    PublishToken,
}

#[derive(sqlx::Type, PartialEq, Debug)]
#[sqlx(type_name = "SHARD_STATE", rename_all = "snake_case")]
pub(super) enum PgShardState {
    Unspecified,
    Open,
    Unavailable,
    Closed,
}

impl From<PgShardState> for ShardState {
    fn from(pg_shard_state: PgShardState) -> Self {
        match pg_shard_state {
            PgShardState::Unspecified => ShardState::Unspecified,
            PgShardState::Open => ShardState::Open,
            PgShardState::Unavailable => ShardState::Unavailable,
            PgShardState::Closed => ShardState::Closed,
        }
    }
}

#[derive(sqlx::FromRow, Debug)]
pub(super) struct PgShard {
    #[sqlx(try_from = "String")]
    pub index_uid: IndexUid,
    #[sqlx(try_from = "String")]
    pub source_id: SourceId,
    #[sqlx(try_from = "String")]
    pub shard_id: ShardId,
    pub leader_id: String,
    pub follower_id: Option<String>,
    pub shard_state: PgShardState,
    #[sqlx(try_from = "String")]
    pub doc_mapping_uid: DocMappingUid,
    pub publish_position_inclusive: String,
    pub publish_token: Option<String>,
    pub update_timestamp: sqlx::types::time::PrimitiveDateTime,
}

impl From<PgShard> for Shard {
    fn from(pg_shard: PgShard) -> Self {
        Shard {
            index_uid: Some(pg_shard.index_uid),
            source_id: pg_shard.source_id,
            shard_id: Some(pg_shard.shard_id),
            shard_state: ShardState::from(pg_shard.shard_state) as i32,
            leader_id: pg_shard.leader_id,
            follower_id: pg_shard.follower_id,
            doc_mapping_uid: Some(pg_shard.doc_mapping_uid),
            publish_position_inclusive: Some(pg_shard.publish_position_inclusive.into()),
            publish_token: pg_shard.publish_token,
            update_timestamp: pg_shard.update_timestamp.assume_utc().unix_timestamp(),
        }
    }
}

#[derive(sqlx::FromRow, Debug)]
pub(super) struct PgIndexTemplate {
    pub index_template_json: String,
}


================================================
FILE: quickwit/quickwit-metastore/src/metastore/postgres/pool.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use futures::future::BoxFuture;
use futures::stream::BoxStream;
use quickwit_common::metrics::GaugeGuard;
use sqlx::pool::PoolConnection;
use sqlx::pool::maybe::MaybePoolConnection;
use sqlx::{
    Acquire, Database, Describe, Either, Error, Execute, Executor, Pool, Postgres, Transaction,
};

use super::metrics::POSTGRES_METRICS;

#[derive(Debug)]
pub(super) struct TrackedPool<DB: Database> {
    inner_pool: Pool<DB>,
}

impl TrackedPool<Postgres> {
    pub fn new(inner_pool: Pool<Postgres>) -> Self {
        Self { inner_pool }
    }
}

impl<DB: Database> Clone for TrackedPool<DB> {
    fn clone(&self) -> Self {
        Self {
            inner_pool: self.inner_pool.clone(),
        }
    }
}

impl<'a, DB: Database> Acquire<'a> for &TrackedPool<DB> {
    type Database = DB;

    type Connection = PoolConnection<DB>;

    fn acquire(self) -> BoxFuture<'static, Result<Self::Connection, Error>> {
        let acquire_conn_fut = self.inner_pool.acquire();

        POSTGRES_METRICS
            .active_connections
            .set(self.inner_pool.size() as i64);
        POSTGRES_METRICS
            .idle_connections
            .set(self.inner_pool.num_idle() as i64);

        Box::pin(async move {
            let mut gauge_guard = GaugeGuard::from_gauge(&POSTGRES_METRICS.acquire_connections);
            gauge_guard.add(1);

            let conn = acquire_conn_fut.await?;
            Ok(conn)
        })
    }

    fn begin(self) -> BoxFuture<'static, Result<Transaction<'a, DB>, Error>> {
        let acquire_conn_fut = self.acquire();

        Box::pin(async move {
            Transaction::begin(
                MaybePoolConnection::PoolConnection(acquire_conn_fut.await?),
                None,
            )
            .await
        })
    }
}

impl<DB: Database> Executor<'_> for &TrackedPool<DB>
where for<'c> &'c mut DB::Connection: Executor<'c, Database = DB>
{
    type Database = DB;

    fn fetch_many<'e, 'q: 'e, E>(
        self,
        query: E,
    ) -> BoxStream<'e, Result<Either<DB::QueryResult, DB::Row>, Error>>
    where
        E: Execute<'q, Self::Database> + 'q,
    {
        self.inner_pool.fetch_many(query)
    }

    fn fetch_optional<'e, 'q: 'e, E>(
        self,
        query: E,
    ) -> BoxFuture<'e, Result<Option<DB::Row>, Error>>
    where
        E: Execute<'q, Self::Database> + 'q,
    {
        self.inner_pool.fetch_optional(query)
    }

    fn prepare_with<'e, 'q: 'e>(
        self,
        sql: &'q str,
        parameters: &'e [<Self::Database as Database>::TypeInfo],
    ) -> BoxFuture<'e, Result<<Self::Database as Database>::Statement<'q>, Error>> {
        self.inner_pool.prepare_with(sql, parameters)
    }

    #[doc(hidden)]
    fn describe<'e, 'q: 'e>(
        self,
        sql: &'q str,
    ) -> BoxFuture<'e, Result<Describe<Self::Database>, Error>> {
        self.inner_pool.describe(sql)
    }
}


================================================
FILE: quickwit/quickwit-metastore/src/metastore/postgres/queries/index_templates/find.sql
================================================
SELECT DISTINCT ON (index_id)
    index_id,
    template_id,
    index_template_json
FROM
    unnest($1) AS index_ids(index_id)
    JOIN index_templates ON index_ids.index_id LIKE ANY (index_templates.positive_index_id_patterns)
        AND (cardinality(index_templates.negative_index_id_patterns) = 0
            OR index_ids.index_id NOT LIKE ANY (index_templates.negative_index_id_patterns))
    ORDER BY
        index_id,
        - priority,
        template_id ASC


================================================
FILE: quickwit/quickwit-metastore/src/metastore/postgres/queries/index_templates/insert.sql
================================================
INSERT INTO index_templates(template_id, positive_index_id_patterns, negative_index_id_patterns, priority, index_template_json)
    VALUES ($1, $2, $3, $4, $5)
ON CONFLICT (template_id)
    DO NOTHING


================================================
FILE: quickwit/quickwit-metastore/src/metastore/postgres/queries/index_templates/upsert.sql
================================================
INSERT INTO index_templates(template_id, positive_index_id_patterns, negative_index_id_patterns, priority, index_template_json)
    VALUES ($1, $2, $3, $4, $5)
ON CONFLICT (template_id)
    DO UPDATE SET
        positive_index_id_patterns = $2, negative_index_id_patterns = $3, priority = $4, index_template_json = $5


================================================
FILE: quickwit/quickwit-metastore/src/metastore/postgres/queries/indexes_metadata.sql
================================================
SELECT
    *
FROM
    indexes
WHERE
    index_id = ANY ($1)
    OR index_uid = ANY ($2)


================================================
FILE: quickwit/quickwit-metastore/src/metastore/postgres/queries/shards/acquire.sql
================================================
UPDATE
    shards
SET
    publish_token = $4
WHERE
    index_uid = $1
    AND source_id = $2
    AND shard_id = ANY ($3)
RETURNING
    *


================================================
FILE: quickwit/quickwit-metastore/src/metastore/postgres/queries/shards/delete.sql
================================================
DELETE FROM shards
WHERE index_uid = $1
    AND source_id = $2
    AND shard_id = ANY ($3)
    AND ($4
        OR publish_position_inclusive LIKE '~%')


================================================
FILE: quickwit/quickwit-metastore/src/metastore/postgres/queries/shards/fetch.sql
================================================
SELECT
    *
FROM
    shards
WHERE
    index_uid = $1
    AND source_id = $2
    AND shard_id = $3


================================================
FILE: quickwit/quickwit-metastore/src/metastore/postgres/queries/shards/find_not_deletable.sql
================================================
SELECT
    *
FROM
    shards
WHERE
    index_uid = $1
    AND source_id = $2
    AND shard_id = ANY ($3)
    AND publish_position_inclusive NOT LIKE '~%'


================================================
FILE: quickwit/quickwit-metastore/src/metastore/postgres/queries/shards/insert.sql
================================================
INSERT INTO shards(index_uid, source_id, shard_id, shard_state, leader_id, follower_id, doc_mapping_uid, publish_position_inclusive, publish_token, update_timestamp)
    VALUES ($1, $2, $3, CAST($4 AS SHARD_STATE), $5, $6, $7, $8, $9, $10)


================================================
FILE: quickwit/quickwit-metastore/src/metastore/postgres/queries/shards/open.sql
================================================
INSERT INTO shards(index_uid, source_id, shard_id, leader_id, follower_id, doc_mapping_uid, publish_token, update_timestamp)
    VALUES ($1, $2, $3, $4, $5, $6, $7, $8)
ON CONFLICT
    DO NOTHING
RETURNING
    *


================================================
FILE: quickwit/quickwit-metastore/src/metastore/postgres/queries/shards/prune_age.sql
================================================
DELETE FROM shards
WHERE index_uid = $1
    AND source_id = $2
    AND update_timestamp < $3


================================================
FILE: quickwit/quickwit-metastore/src/metastore/postgres/queries/shards/prune_count.sql
================================================
WITH recent_shards AS (
    SELECT shard_id
    FROM shards
    WHERE index_uid = $1
        AND source_id = $2
    ORDER BY update_timestamp DESC
    LIMIT $3
)
DELETE FROM shards
WHERE index_uid = $1
    AND source_id = $2
    AND shard_id NOT IN (SELECT shard_id FROM recent_shards)


================================================
FILE: quickwit/quickwit-metastore/src/metastore/postgres/split_stream.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::pin::Pin;
use std::task::{Context, Poll};

use futures::stream::BoxStream;
use ouroboros::self_referencing;
use sqlx::Postgres;
use tokio_stream::Stream;

use super::pool::TrackedPool;

#[self_referencing(pub_extras)]
pub struct SplitStream<T> {
    connection_pool: TrackedPool<Postgres>,
    sql: String,
    #[borrows(connection_pool, sql)]
    #[covariant]
    inner: BoxStream<'this, Result<T, sqlx::Error>>,
}

impl<T> Stream for SplitStream<T> {
    type Item = Result<T, sqlx::Error>;

    fn poll_next(mut self: Pin<&mut Self>, cx: &mut Context<'_>) -> Poll<Option<Self::Item>> {
        SplitStream::with_inner_mut(&mut self, |this| Pin::new(&mut this.as_mut()).poll_next(cx))
    }
}


================================================
FILE: quickwit/quickwit-metastore/src/metastore/postgres/tags.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use quickwit_doc_mapper::tag_pruning::TagFilterAst;
use sea_query::{Cond, Expr, all};

// We use dollar-quoted strings in PostgreSQL.
//
// In order to ensure that we do not risk SQL injection,
// we need to generate a string that does not appear in
// the literal we want to dollar quote.
fn generate_dollar_guard(tag: &str) -> String {
    if !tag.contains('$') {
        // That's our happy path here.
        return String::new();
    }
    let mut dollar_guard = String::new();
    loop {
        dollar_guard.push_str("QuickwitGuard");
        // This terminates because `dollar_guard`
        // will eventually be longer than `tag`.
        if !tag.contains(&dollar_guard) {
            return dollar_guard;
        }
    }
}

/// Takes a tag filter AST and returns a SQL expression that can be used as
/// a filter.
pub(super) fn generate_sql_condition(tag_ast: &TagFilterAst) -> Cond {
    match tag_ast {
        TagFilterAst::And(child_asts) => {
            if child_asts.is_empty() {
                return all![Expr::cust("TRUE")];
            }
            child_asts
                .iter()
                .map(generate_sql_condition)
                .fold(Cond::all(), |cond, child_cond| cond.add(child_cond))
        }
        TagFilterAst::Or(child_asts) => {
            if child_asts.is_empty() {
                return all![Expr::cust("TRUE")];
            }
            child_asts
                .iter()
                .map(generate_sql_condition)
                .fold(Cond::any(), |cond, child_cond| cond.add(child_cond))
        }
        TagFilterAst::Tag { tag, is_present } => {
            let dollar_guard = generate_dollar_guard(tag);
            let expr_str = format!("${dollar_guard}${tag}${dollar_guard}$ = ANY(tags)");
            let expr = if *is_present {
                Expr::cust(expr_str)
            } else {
                Expr::cust(expr_str).not()
            };
            all![expr]
        }
    }
}

#[cfg(test)]
mod tests {
    use quickwit_doc_mapper::tag_pruning::{no_tag, tag};
    use sea_query::any;

    use super::*;

    fn test_tags_filter_expression_helper(tags_ast: TagFilterAst, expected: Cond) {
        assert_eq!(generate_sql_condition(&tags_ast), expected);
    }

    #[test]
    fn test_tags_filter_expression_single_tag() {
        let tags_ast = tag("my_field:titi");

        let expected = all![Expr::cust("$$my_field:titi$$ = ANY(tags)")];

        test_tags_filter_expression_helper(tags_ast, expected);
    }

    #[test]
    fn test_tags_filter_expression_not_tag() {
        let expected = all![Expr::cust("$$my_field:titi$$ = ANY(tags)").not()];

        test_tags_filter_expression_helper(no_tag("my_field:titi"), expected);
    }

    #[test]
    fn test_tags_filter_expression_ands() {
        let tags_ast = TagFilterAst::And(vec![tag("tag:val1"), tag("tag:val2"), tag("tag:val3")]);

        let expected = all![
            Expr::cust("$$tag:val1$$ = ANY(tags)"),
            Expr::cust("$$tag:val2$$ = ANY(tags)"),
            Expr::cust("$$tag:val3$$ = ANY(tags)"),
        ];

        test_tags_filter_expression_helper(tags_ast, expected);
    }

    #[test]
    fn test_tags_filter_expression_and_or() {
        let tags_ast = TagFilterAst::Or(vec![
            TagFilterAst::And(vec![tag("tag:val1"), tag("tag:val2")]),
            tag("tag:val3"),
        ]);

        let expected = any![
            all![
                Expr::cust("$$tag:val1$$ = ANY(tags)"),
                Expr::cust("$$tag:val2$$ = ANY(tags)"),
            ],
            Expr::cust("$$tag:val3$$ = ANY(tags)"),
        ];

        test_tags_filter_expression_helper(tags_ast, expected);
    }

    #[test]
    fn test_tags_filter_expression_and_or_correct_parenthesis() {
        let tags_ast = TagFilterAst::And(vec![
            TagFilterAst::Or(vec![tag("tag:val1"), tag("tag:val2")]),
            tag("tag:val3"),
        ]);

        let expected = all![
            any![
                Expr::cust("$$tag:val1$$ = ANY(tags)"),
                Expr::cust("$$tag:val2$$ = ANY(tags)"),
            ],
            Expr::cust("$$tag:val3$$ = ANY(tags)"),
        ];

        test_tags_filter_expression_helper(tags_ast, expected);
    }

    #[test]
    fn test_tags_sql_injection_attempt() {
        let tags_ast = tag("tag:$$;DELETE FROM something_evil");

        let expected = all![Expr::cust(
            "$QuickwitGuard$tag:$$;DELETE FROM something_evil$QuickwitGuard$ = ANY(tags)"
        ),];

        test_tags_filter_expression_helper(tags_ast, expected);

        let tags_ast = tag("tag:$QuickwitGuard$;DELETE FROM something_evil");

        let expected = all![Expr::cust(
            "$QuickwitGuardQuickwitGuard$tag:$QuickwitGuard$;DELETE FROM \
             something_evil$QuickwitGuardQuickwitGuard$ = ANY(tags)"
        )];

        test_tags_filter_expression_helper(tags_ast, expected);
    }
}


================================================
FILE: quickwit/quickwit-metastore/src/metastore/postgres/utils.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::fmt::Display;
use std::ops::Bound;
use std::str::FromStr;
use std::time::Duration;

use quickwit_common::uri::Uri;
use quickwit_proto::metastore::{MetastoreError, MetastoreResult};
use sea_query::{Expr, Func, Order, SelectStatement, any};
use sqlx::postgres::{PgConnectOptions, PgPoolOptions};
use sqlx::{ConnectOptions, Postgres};
use tracing::error;
use tracing::log::LevelFilter;

use super::model::{Splits, ToTimestampFunc};
use super::pool::TrackedPool;
use super::tags::generate_sql_condition;
use crate::metastore::{FilterRange, SortBy};
use crate::{ListSplitsQuery, SplitMaturity, SplitMetadata};

/// Establishes a connection to the given database URI.
pub(super) async fn establish_connection(
    connection_uri: &Uri,
    min_connections: usize,
    max_connections: usize,
    acquire_timeout: Duration,
    idle_timeout_opt: Option<Duration>,
    max_lifetime_opt: Option<Duration>,
    read_only: bool,
) -> MetastoreResult<TrackedPool<Postgres>> {
    let pool_options = PgPoolOptions::new()
        .min_connections(min_connections as u32)
        .max_connections(max_connections as u32)
        .acquire_timeout(acquire_timeout)
        .idle_timeout(idle_timeout_opt)
        .max_lifetime(max_lifetime_opt);

    let mut connect_options: PgConnectOptions =
        PgConnectOptions::from_str(connection_uri.as_str())?
            .application_name("quickwit-metastore")
            .log_statements(LevelFilter::Info);

    if read_only {
        // this isn't a security mechanism, only a safeguard against involontary missuse
        connect_options = connect_options.options([("default_transaction_read_only", "on")]);
    }
    let sqlx_pool = pool_options
        .connect_with(connect_options)
        .await
        .map_err(|error| {
            error!(connection_uri=%connection_uri, error=?error, "failed to establish connection to database");
            MetastoreError::Connection {
                message: error.to_string(),
            }
        })?;
    let tracked_pool = TrackedPool::new(sqlx_pool);
    Ok(tracked_pool)
}

/// Extends an existing SQL string with the generated filter range appended to the query.
///
/// This method is **not** SQL injection proof and should not be used with user-defined values.
pub(super) fn append_range_filters<V: Display>(
    sql: &mut SelectStatement,
    field_name: Splits,
    filter_range: &FilterRange<V>,
    value_formatter: impl Fn(&V) -> Expr,
) {
    if let Bound::Included(value) = &filter_range.start {
        sql.cond_where(Expr::col(field_name).gte((value_formatter)(value)));
    };

    if let Bound::Excluded(value) = &filter_range.start {
        sql.cond_where(Expr::col(field_name).gt((value_formatter)(value)));
    };

    if let Bound::Included(value) = &filter_range.end {
        sql.cond_where(Expr::col(field_name).lte((value_formatter)(value)));
    };

    if let Bound::Excluded(value) = &filter_range.end {
        sql.cond_where(Expr::col(field_name).lt((value_formatter)(value)));
    };
}

pub(super) fn append_query_filters_and_order_by(
    sql: &mut SelectStatement,
    query: &ListSplitsQuery,
) {
    if let Some(index_uids) = &query.index_uids {
        // Note: `ListSplitsQuery` builder enforces a non empty `index_uids` list.
        // TODO we should explore IN VALUES, = ANY and similar constructs in case they perform
        // better.
        sql.cond_where(Expr::col(Splits::IndexUid).is_in(index_uids));
    }

    if let Some(node_id) = &query.node_id {
        sql.cond_where(Expr::col(Splits::NodeId).eq(node_id));
    };

    if !query.split_states.is_empty() {
        sql.cond_where(
            Expr::col(Splits::SplitState)
                .is_in(query.split_states.iter().map(|val| val.to_string())),
        );
    };

    if let Some(tags) = &query.tags {
        sql.cond_where(generate_sql_condition(tags));
    };

    if let Some(v) = query.max_time_range_end {
        sql.cond_where(Expr::col(Splits::TimeRangeEnd).lte(v));
    }

    match query.time_range.start {
        Bound::Included(v) => {
            sql.cond_where(any![
                Expr::col(Splits::TimeRangeEnd).gte(v),
                Expr::col(Splits::TimeRangeEnd).is_null()
            ]);
        }
        Bound::Excluded(v) => {
            sql.cond_where(any![
                Expr::col(Splits::TimeRangeEnd).gt(v),
                Expr::col(Splits::TimeRangeEnd).is_null()
            ]);
        }
        Bound::Unbounded => {}
    };

    match query.time_range.end {
        Bound::Included(v) => {
            sql.cond_where(any![
                Expr::col(Splits::TimeRangeStart).lte(v),
                Expr::col(Splits::TimeRangeStart).is_null()
            ]);
        }
        Bound::Excluded(v) => {
            sql.cond_where(any![
                Expr::col(Splits::TimeRangeStart).lt(v),
                Expr::col(Splits::TimeRangeStart).is_null()
            ]);
        }
        Bound::Unbounded => {}
    };

    match &query.mature {
        Bound::Included(evaluation_datetime) => {
            sql.cond_where(any![
                Expr::col(Splits::MaturityTimestamp)
                    .eq(Func::cust(ToTimestampFunc).arg(Expr::val(0))),
                Expr::col(Splits::MaturityTimestamp).lte(
                    Func::cust(ToTimestampFunc)
                        .arg(Expr::val(evaluation_datetime.unix_timestamp()))
                )
            ]);
        }
        Bound::Excluded(evaluation_datetime) => {
            sql.cond_where(Expr::col(Splits::MaturityTimestamp).gt(
                Func::cust(ToTimestampFunc).arg(Expr::val(evaluation_datetime.unix_timestamp())),
            ));
        }
        Bound::Unbounded => {}
    };
    append_range_filters(
        sql,
        Splits::UpdateTimestamp,
        &query.update_timestamp,
        |&val| Expr::expr(Func::cust(ToTimestampFunc).arg(Expr::val(val))),
    );
    append_range_filters(
        sql,
        Splits::CreateTimestamp,
        &query.create_timestamp,
        |&val| Expr::expr(Func::cust(ToTimestampFunc).arg(Expr::val(val))),
    );
    append_range_filters(sql, Splits::DeleteOpstamp, &query.delete_opstamp, |&val| {
        Expr::expr(val)
    });

    if let Some((index_uid, split_id)) = &query.after_split {
        sql.cond_where(
            Expr::tuple([
                Expr::col(Splits::IndexUid).into(),
                Expr::col(Splits::SplitId).into(),
            ])
            .gt(Expr::tuple([Expr::value(index_uid), Expr::value(split_id)])),
        );
    }

    match query.sort_by {
        SortBy::Staleness => {
            sql.order_by(Splits::DeleteOpstamp, Order::Asc)
                .order_by(Splits::PublishTimestamp, Order::Asc);
        }
        SortBy::IndexUid => {
            sql.order_by(Splits::IndexUid, Order::Asc)
                .order_by(Splits::SplitId, Order::Asc);
        }
        SortBy::None => (),
    }

    if let Some(limit) = query.limit {
        sql.limit(limit as u64);
    }

    if let Some(offset) = query.offset {
        sql.order_by(Splits::SplitId, Order::Asc)
            .offset(offset as u64);
    }
}

/// Returns the unix timestamp at which the split becomes mature.
/// If the split is mature (`SplitMaturity::Mature`), we return 0
/// as we don't want the maturity to depend on datetime.
pub(super) fn split_maturity_timestamp(split_metadata: &SplitMetadata) -> i64 {
    match split_metadata.maturity {
        SplitMaturity::Mature => 0,
        SplitMaturity::Immature { maturation_period } => {
            split_metadata.create_timestamp + maturation_period.as_secs() as i64
        }
    }
}


================================================
FILE: quickwit/quickwit-metastore/src/metastore_factory.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use async_trait::async_trait;
use quickwit_common::uri::Uri;
use quickwit_config::{MetastoreBackend, MetastoreConfig};
use quickwit_proto::metastore::MetastoreServiceClient;

use crate::MetastoreResolverError;

/// A metastore factory builds a [`MetastoreServiceClient`] object for a target [`MetastoreBackend`]
/// from a [`MetastoreConfig`] and a [`Uri`].
#[cfg_attr(any(test, feature = "testsuite"), mockall::automock)]
#[async_trait]
pub trait MetastoreFactory: Send + Sync + 'static {
    /// Returns the metastore backend targeted by the factory.
    fn backend(&self) -> MetastoreBackend;

    /// Returns the appropriate [`MetastoreServiceClient`] object for the `uri`.
    async fn resolve(
        &self,
        metastore_config: &MetastoreConfig,
        uri: &Uri,
    ) -> Result<MetastoreServiceClient, MetastoreResolverError>;
}

/// A metastore factory for handling unsupported or unavailable metastore backends.
#[derive(Clone)]
pub struct UnsupportedMetastore {
    backend: MetastoreBackend,
    message: &'static str,
}

impl UnsupportedMetastore {
    /// Creates a new [`UnsupportedMetastore`].
    pub fn new(backend: MetastoreBackend, message: &'static str) -> Self {
        Self { backend, message }
    }
}

#[async_trait]
impl MetastoreFactory for UnsupportedMetastore {
    fn backend(&self) -> MetastoreBackend {
        self.backend
    }

    async fn resolve(
        &self,
        _metastore_config: &MetastoreConfig,
        _uri: &Uri,
    ) -> Result<MetastoreServiceClient, MetastoreResolverError> {
        Err(MetastoreResolverError::UnsupportedBackend(
            self.message.to_string(),
        ))
    }
}


================================================
FILE: quickwit/quickwit-metastore/src/metastore_resolver.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::HashMap;
use std::fmt;
use std::sync::Arc;

use anyhow::ensure;
use once_cell::sync::Lazy;
use quickwit_common::uri::{Protocol, Uri};
use quickwit_config::{MetastoreBackend, MetastoreConfig, MetastoreConfigs};
use quickwit_proto::metastore::MetastoreServiceClient;
use quickwit_storage::StorageResolver;

use crate::metastore::file_backed::FileBackedMetastoreFactory;
#[cfg(feature = "postgres")]
use crate::metastore::postgres::PostgresqlMetastoreFactory;
use crate::{MetastoreFactory, MetastoreResolverError};

type FactoryAndConfig = (Box<dyn MetastoreFactory>, MetastoreConfig);

/// Returns the [`MetastoreServiceClient`] instance associated with the protocol of a URI. The
/// actual creation of metastore objects is delegated to pre-registered [`MetastoreFactory`]. The
/// resolver is only responsible for dispatching to the appropriate factory.
#[derive(Clone)]
pub struct MetastoreResolver {
    per_backend_factories: Arc<HashMap<MetastoreBackend, FactoryAndConfig>>,
}

impl fmt::Debug for MetastoreResolver {
    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
        f.debug_struct("MetastoreResolver").finish()
    }
}

impl MetastoreResolver {
    /// Creates an empty [`MetastoreResolverBuilder`].
    pub fn builder() -> MetastoreResolverBuilder {
        MetastoreResolverBuilder::default()
    }

    /// Resolves the given `uri`.
    pub async fn resolve(
        &self,
        uri: &Uri,
    ) -> Result<MetastoreServiceClient, MetastoreResolverError> {
        let backend = match uri.protocol() {
            Protocol::Azure => MetastoreBackend::File,
            Protocol::Google => MetastoreBackend::File,
            Protocol::File => MetastoreBackend::File,
            Protocol::Ram => MetastoreBackend::File,
            Protocol::S3 => MetastoreBackend::File,
            Protocol::PostgreSQL => MetastoreBackend::PostgreSQL,
            _ => {
                return Err(MetastoreResolverError::UnsupportedBackend(
                    "no implementation exists for this backend".to_string(),
                ));
            }
        };
        let (metastore_factory, metastore_config) = self
            .per_backend_factories
            .get(&backend)
            .ok_or(MetastoreResolverError::UnsupportedBackend(
                "no metastore factory is registered for this backend".to_string(),
            ))?;
        let metastore = metastore_factory.resolve(metastore_config, uri).await?;
        Ok(metastore)
    }

    /// Creates and returns a [`MetastoreResolver`] holding the default configuration for each
    /// backend. Note that if the environment (env vars, instance metadata, ...) fails
    /// to provide the necessary credentials, the default Azure or S3 file-backed metastores
    /// returned by this resolver will not work.
    pub fn unconfigured() -> Self {
        static METASTORE_RESOLVER: Lazy<MetastoreResolver> = Lazy::new(|| {
            MetastoreResolver::configured(
                StorageResolver::unconfigured(),
                &MetastoreConfigs::default(),
            )
        });
        METASTORE_RESOLVER.clone()
    }

    /// Creates and returns a [`MetastoreResolver`].
    pub fn configured(
        storage_resolver: StorageResolver,
        metastore_configs: &MetastoreConfigs,
    ) -> Self {
        let mut builder = MetastoreResolver::builder().register(
            FileBackedMetastoreFactory::new(storage_resolver),
            metastore_configs
                .find_file()
                .cloned()
                .unwrap_or_default()
                .into(),
        );
        #[cfg(feature = "postgres")]
        {
            builder = builder.register(
                PostgresqlMetastoreFactory::default(),
                metastore_configs
                    .find_postgres()
                    .cloned()
                    .unwrap_or_default()
                    .into(),
            );
        }
        #[cfg(not(feature = "postgres"))]
        {
            use quickwit_config::PostgresMetastoreConfig;

            use crate::UnsupportedMetastore;

            builder = builder.register(
                UnsupportedMetastore::new(
                    MetastoreBackend::PostgreSQL,
                    "Quickwit was compiled without the `postgres` feature",
                ),
                PostgresMetastoreConfig::default().into(),
            );
        }
        builder
            .build()
            .expect("metastore factory and config backends should match")
    }
}

#[derive(Default)]
pub struct MetastoreResolverBuilder {
    per_protocol_factories: HashMap<MetastoreBackend, (Box<dyn MetastoreFactory>, MetastoreConfig)>,
}

impl MetastoreResolverBuilder {
    pub fn register<S: MetastoreFactory>(
        mut self,
        metastore_factory: S,
        metastore_config: MetastoreConfig,
    ) -> Self {
        self.per_protocol_factories.insert(
            metastore_factory.backend(),
            (Box::new(metastore_factory), metastore_config),
        );
        self
    }

    pub fn build(self) -> anyhow::Result<MetastoreResolver> {
        for (metastore_factory, metastore_config) in self.per_protocol_factories.values() {
            ensure!(
                metastore_factory.backend() == metastore_config.backend(),
                "metastore factory and config backends do not match: {:?} vs. {:?}",
                metastore_factory.backend(),
                metastore_config.backend(),
            );
        }
        let metastore_resolver = MetastoreResolver {
            per_backend_factories: Arc::new(self.per_protocol_factories),
        };
        Ok(metastore_resolver)
    }
}

#[cfg(test)]
mod tests {
    use std::str::FromStr;

    use super::*;

    #[tokio::test]
    async fn test_metastore_resolver_should_not_raise_errors_on_file() {
        let metastore_resolver = MetastoreResolver::unconfigured();
        let tmp_dir = tempfile::tempdir().unwrap();
        let metastore_filepath = format!("file://{}/metastore", tmp_dir.path().display());
        let metastore_uri = Uri::from_str(&metastore_filepath).unwrap();
        metastore_resolver.resolve(&metastore_uri).await.unwrap();
    }

    #[cfg(feature = "postgres")]
    #[tokio::test]
    async fn test_postgres_and_postgresql_protocol_accepted() {
        use std::env;
        let metastore_resolver = MetastoreResolver::unconfigured();
        // If the database defined in the env var or the default one is not up, the
        // test block after making 10 attempts with a timeout of 10s each = 100s.
        let test_database_url = env::var("QW_TEST_DATABASE_URL").unwrap_or_else(|_| {
            "postgres://quickwit-dev:quickwit-dev@localhost/quickwit-metastore-dev".to_string()
        });
        let (_uri_protocol, uri_path) = test_database_url.split_once("://").unwrap();
        for protocol in &["postgres", "postgresql"] {
            let postgres_uri = Uri::from_str(&format!("{protocol}://{uri_path}")).unwrap();
            metastore_resolver.resolve(&postgres_uri).await.unwrap();
        }
    }
}


================================================
FILE: quickwit/quickwit-metastore/src/split_metadata.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::BTreeSet;
use std::fmt;
use std::ops::{Range, RangeInclusive};
use std::path::PathBuf;
use std::str::FromStr;
use std::time::Duration;

use bytesize::ByteSize;
use quickwit_proto::types::{DocMappingUid, IndexUid, SourceId, SplitId};
use serde::{Deserialize, Serialize};
use serde_with::{DurationMilliSeconds, serde_as};
use time::OffsetDateTime;

use crate::split_metadata_version::VersionedSplitMetadata;

/// Carries split metadata.
#[derive(Clone, Debug, Eq, PartialEq, Serialize, Deserialize, utoipa::ToSchema)]
pub struct Split {
    /// The state of the split.
    pub split_state: SplitState,

    /// Timestamp for tracking when the split was last updated.
    pub update_timestamp: i64,

    /// Timestamp for tracking when the split was published.
    pub publish_timestamp: Option<i64>,

    #[serde(flatten)]
    #[schema(value_type = VersionedSplitMetadata)]
    /// Immutable part of the split.
    pub split_metadata: SplitMetadata,
}

impl Split {
    /// Returns the split_id.
    pub fn split_id(&self) -> &str {
        &self.split_metadata.split_id
    }
}

/// Carries immutable split metadata.
/// This struct can deserialize older format automatically
/// but can only serialize to the last version.
#[derive(Clone, Default, Eq, PartialEq, Serialize, Deserialize, utoipa::ToSchema)]
#[serde(into = "VersionedSplitMetadata")]
#[serde(try_from = "VersionedSplitMetadata")]
pub struct SplitMetadata {
    /// Split ID. Joined with the index URI (<index URI>/<split ID>), this ID
    /// should be enough to uniquely identify a split.
    /// In reality, some information may be implicitly configured
    /// in the storage resolver: for instance, the Amazon S3 region.
    #[schema(value_type = String)]
    pub split_id: SplitId,

    /// Id of the index this split belongs to.
    pub index_uid: IndexUid,

    /// Partition to which the split belongs to.
    ///
    /// Partitions are usually meant to isolate documents based on some field like
    /// `tenant_id`. For this reason, ideally splits with a different `partition_id`
    /// should not be merged together. Merging two splits with different `partition_id`
    /// does not hurt correctness however.
    pub partition_id: u64,

    /// Source ID.
    pub source_id: SourceId,

    /// Node ID.
    pub node_id: String,

    /// Number of records (or documents) in the split.
    /// TODO make u64
    pub num_docs: usize,

    /// Sum of the size (in bytes) of the raw documents in this split.
    ///
    /// Note this is not the split file size. It is the size of the original
    /// JSON payloads.
    pub uncompressed_docs_size_in_bytes: u64,

    /// If a timestamp field is available, the min / max timestamp in
    /// the split, expressed in seconds.
    pub time_range: Option<RangeInclusive<i64>>,

    /// Timestamp for tracking when the split was created.
    pub create_timestamp: i64,

    /// Split maturity either `Mature` or `Immature` with a given maturation period.
    pub maturity: SplitMaturity,

    /// Set of unique tags values of form `{field_name}:{field_value}`.
    /// The set is filled at indexing with values from each field registered
    /// in the [`DocMapping`](quickwit_config::DocMapping) `tag_fields` attribute and only when
    /// cardinality of a given field is less or equal to [`MAX_VALUES_PER_TAG_FIELD`].
    /// An additional special tag of the form `{field_name}!` is added to the set
    /// to indicate that this field `field_name` was indeed registered in `tag_fields`.
    /// When cardinality is strictly higher than [`MAX_VALUES_PER_TAG_FIELD`],
    /// no field value is added to the set.
    ///
    /// [`MAX_VALUES_PER_TAG_FIELD`]: https://github.com/quickwit-oss/quickwit/blob/main/quickwit-indexing/src/actors/packager.rs#L36
    pub tags: BTreeSet<String>,

    /// Contains the range of bytes of the footer that needs to be downloaded
    /// in order to open a split.
    ///
    /// The footer offsets
    /// make it possible to download the footer in a single call to `.get_slice(...)`.
    pub footer_offsets: Range<u64>,

    /// Delete opstamp.
    pub delete_opstamp: u64,

    /// Number of merge operations that was involved to create
    /// this split.
    pub num_merge_ops: usize,

    /// Doc mapping UID used when creating this split. This split may only be merged with other
    /// splits using the same doc mapping UID.
    pub doc_mapping_uid: DocMappingUid,
}

impl fmt::Debug for SplitMetadata {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        let mut debug_struct = f.debug_struct("SplitMetadata");
        debug_struct.field("split_id", &self.split_id);
        debug_struct.field("index_uid", &self.index_uid);
        debug_struct.field("partition_id", &self.partition_id);
        debug_struct.field("source_id", &self.source_id);
        debug_struct.field("node_id", &self.node_id);
        debug_struct.field("num_docs", &self.num_docs);
        debug_struct.field(
            "uncompressed_docs_size_in_bytes",
            &self.uncompressed_docs_size_in_bytes,
        );
        debug_struct.field("time_range", &self.time_range);
        debug_struct.field("create_timestamp", &self.create_timestamp);
        debug_struct.field("maturity", &self.maturity);
        if !self.tags.is_empty() {
            let mut tags_iter = self.tags.iter();
            let mut tags_str = String::new();
            tags_str.push('{');
            for _ in 0..4 {
                if let Some(tag) = tags_iter.next() {
                    tags_str.push('"');
                    tags_str.push_str(tag);
                    tags_str.push_str("\", ");
                } else {
                    break;
                }
            }
            if tags_iter.next().is_some() {
                let remaining_count = self.tags.len() - 4;
                tags_str.push_str(&format!("and {remaining_count} more"));
            } else {
                tags_str.pop();
                tags_str.pop();
            }
            tags_str.push('}');
            debug_struct.field("tags", &tags_str);
        }
        debug_struct.field("footer_offsets", &self.footer_offsets);
        debug_struct.field("delete_opstamp", &self.delete_opstamp);
        debug_struct.field("num_merge_ops", &self.num_merge_ops);
        debug_struct.finish()
    }
}

impl SplitMetadata {
    /// Creates a new instance of split metadata.
    pub fn new(
        split_id: SplitId,
        index_uid: IndexUid,
        partition_id: u64,
        source_id: SourceId,
        node_id: String,
    ) -> Self {
        Self {
            split_id,
            index_uid,
            partition_id,
            source_id,
            node_id,
            create_timestamp: utc_now_timestamp(),
            ..Default::default()
        }
    }

    /// Returns the split_id.
    pub fn split_id(&self) -> &str {
        &self.split_id
    }

    /// Returns true if the split is mature at the unix `timestamp`.
    pub fn is_mature(&self, datetime: OffsetDateTime) -> bool {
        match self.maturity {
            SplitMaturity::Mature => true,
            SplitMaturity::Immature {
                maturation_period: time_to_maturity,
            } => {
                self.create_timestamp + time_to_maturity.as_secs() as i64
                    <= datetime.unix_timestamp()
            }
        }
    }

    #[cfg(any(test, feature = "testsuite"))]
    /// Returns an instance of `SplitMetadata` for testing.
    pub fn for_test(split_id: SplitId) -> SplitMetadata {
        SplitMetadata {
            split_id,
            ..Default::default()
        }
    }

    /// Converts the split metadata into a [`SplitInfo`].
    pub fn as_split_info(&self) -> SplitInfo {
        let file_name = quickwit_common::split_file(self.split_id());

        SplitInfo {
            uncompressed_docs_size_bytes: ByteSize(self.uncompressed_docs_size_in_bytes),
            file_name: PathBuf::from(file_name),
            file_size_bytes: ByteSize(self.footer_offsets.end),
            split_id: self.split_id.clone(),
            num_docs: self.num_docs,
        }
    }
}

/// A summarized version of the split metadata for display purposes.
#[derive(Debug, Clone, Eq, PartialEq, Serialize, Deserialize, utoipa::ToSchema)]
pub struct SplitInfo {
    /// The split ID.
    #[schema(value_type = String)]
    pub split_id: SplitId,
    /// The number of documents in the split.
    pub num_docs: usize,
    /// The sum of the sizes of the original JSON payloads in bytes.
    #[schema(value_type = u64)]
    pub uncompressed_docs_size_bytes: ByteSize,
    /// The name of the split file on disk.
    #[schema(value_type = String)]
    pub file_name: PathBuf,
    /// The size of the split file on disk in bytes.
    #[schema(value_type = u64)]
    pub file_size_bytes: ByteSize,
}

#[cfg(any(test, feature = "testsuite"))]
impl quickwit_config::TestableForRegression for SplitMetadata {
    fn sample_for_regression() -> Self {
        SplitMetadata {
            split_id: "split".to_string(),
            index_uid: IndexUid::for_test("my-index", 1),
            source_id: "source".to_string(),
            node_id: "node".to_string(),
            delete_opstamp: 10,
            partition_id: 7u64,
            num_docs: 12303,
            uncompressed_docs_size_in_bytes: 234234,
            time_range: Some(121000..=130198),
            create_timestamp: 3,
            maturity: SplitMaturity::Immature {
                maturation_period: Duration::from_secs(4),
            },
            tags: ["234".to_string(), "aaa".to_string()].into_iter().collect(),
            footer_offsets: 1000..2000,
            num_merge_ops: 3,
            doc_mapping_uid: DocMappingUid::default(),
        }
    }

    fn assert_equality(&self, other: &Self) {
        assert_eq!(self, other);
    }
}

/// A split state.
#[derive(Clone, Copy, Debug, Serialize, Deserialize, Eq, PartialEq, utoipa::ToSchema)]
pub enum SplitState {
    /// The split is almost ready. Some of its files may have been uploaded in the storage.
    Staged,

    /// The split is ready and published.
    Published,

    /// The split is marked for deletion.
    MarkedForDeletion,
}

impl fmt::Display for SplitState {
    fn fmt(&self, f: &mut fmt::Formatter) -> std::fmt::Result {
        write!(f, "{self:?}")
    }
}

impl SplitState {
    /// Returns a string representation of the given enum.
    pub fn as_str(&self) -> &'static str {
        match self {
            SplitState::Staged => "Staged",
            SplitState::Published => "Published",
            SplitState::MarkedForDeletion => "MarkedForDeletion",
        }
    }
}

impl FromStr for SplitState {
    type Err = String;

    fn from_str(input: &str) -> Result<SplitState, Self::Err> {
        let split_state = match input {
            "Staged" => SplitState::Staged,
            "Published" => SplitState::Published,
            "MarkedForDeletion" => SplitState::MarkedForDeletion,
            "ScheduledForDeletion" => SplitState::MarkedForDeletion, // Deprecated
            "New" => SplitState::Staged,                             // Deprecated
            _ => return Err(format!("unknown split state `{input}`")),
        };
        Ok(split_state)
    }
}

/// `SplitMaturity` defines the maturity of a split, it is either `Mature`
/// or `Immature` with a given maturation period.
/// The maturity is determined by the `MergePolicy`.
#[serde_as]
#[derive(Clone, Copy, Debug, Default, Eq, Serialize, Deserialize, PartialEq, PartialOrd, Ord)]
#[serde(tag = "type")]
#[serde(rename_all = "snake_case")]
pub enum SplitMaturity {
    /// The split is mature and no longer a candidates for merges.
    #[default]
    Mature,
    /// The split is immature and can undergo merges until `maturation_period` passes,
    /// measured relatively from the split's creation timestamp.
    Immature {
        /// Maturation period.
        #[serde_as(as = "DurationMilliSeconds<u64>")]
        #[serde(rename = "maturation_period_millis")]
        maturation_period: Duration,
    },
}

/// Helper function to provide a UTC now timestamp to use
/// as a default in deserialization.
///
/// During unit test, the value is constant.
pub fn utc_now_timestamp() -> i64 {
    if cfg!(any(test, feature = "testsuite")) {
        1640577000
    } else {
        OffsetDateTime::now_utc().unix_timestamp()
    }
}

#[cfg(test)]
mod tests {
    use super::*;

    #[test]
    fn test_split_maturity_serialization() {
        {
            let split_maturity = super::SplitMaturity::Immature {
                maturation_period: std::time::Duration::from_millis(10),
            };
            let serialized = serde_json::to_string(&split_maturity).unwrap();
            assert_eq!(
                serialized,
                r#"{"type":"immature","maturation_period_millis":10}"#
            );
            let deserialized: super::SplitMaturity = serde_json::from_str(&serialized).unwrap();
            assert_eq!(deserialized, split_maturity);
        }
        {
            let split_maturity = super::SplitMaturity::Mature;
            let serialized = serde_json::to_string(&split_maturity).unwrap();
            assert_eq!(serialized, r#"{"type":"mature"}"#);
            let deserialized: super::SplitMaturity = serde_json::from_str(&serialized).unwrap();
            assert_eq!(deserialized, split_maturity);
        }
    }

    #[test]
    fn test_split_metadata_debug() {
        let split_metadata = SplitMetadata {
            split_id: "split-1".to_string(),
            index_uid: IndexUid::for_test("00000000-0000-0000-0000-000000000000", 0),
            partition_id: 0,
            source_id: "source-1".to_string(),
            node_id: "node-1".to_string(),
            num_docs: 100,
            uncompressed_docs_size_in_bytes: 1024,
            time_range: Some(0..=100),
            create_timestamp: 1629867600,
            maturity: SplitMaturity::Mature,
            tags: {
                let mut tags = BTreeSet::new();
                tags.insert("🐱".to_string());
                tags.insert("🙀".to_string());
                tags.insert("😻".to_string());
                tags.insert("😼".to_string());
                tags.insert("😿".to_string());
                tags
            },
            footer_offsets: 0..1024,
            delete_opstamp: 0,
            num_merge_ops: 0,
            doc_mapping_uid: DocMappingUid::default(),
        };

        let expected_output = "SplitMetadata { split_id: \"split-1\", index_uid: IndexUid { \
                               index_id: \"00000000-0000-0000-0000-000000000000\", \
                               incarnation_id: Ulid(0) }, partition_id: 0, source_id: \
                               \"source-1\", node_id: \"node-1\", num_docs: 100, \
                               uncompressed_docs_size_in_bytes: 1024, time_range: Some(0..=100), \
                               create_timestamp: 1629867600, maturity: Mature, tags: \
                               \"{\\\"🐱\\\", \\\"😻\\\", \\\"😼\\\", \\\"😿\\\", and 1 more}\", \
                               footer_offsets: 0..1024, delete_opstamp: 0, num_merge_ops: 0 }";

        assert_eq!(format!("{split_metadata:?}"), expected_output);
    }

    #[test]
    fn test_spit_maturity_order() {
        assert!(
            SplitMaturity::Mature
                < SplitMaturity::Immature {
                    maturation_period: Duration::from_secs(0)
                }
        );
        assert!(
            SplitMaturity::Immature {
                maturation_period: Duration::from_secs(0)
            } < SplitMaturity::Immature {
                maturation_period: Duration::from_secs(1)
            }
        );
    }
}


================================================
FILE: quickwit/quickwit-metastore/src/split_metadata_version.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::BTreeSet;
use std::ops::{Range, RangeInclusive};

use quickwit_proto::types::{DocMappingUid, IndexUid, SplitId};
use serde::{Deserialize, Serialize};

use crate::SplitMetadata;
use crate::split_metadata::{SplitMaturity, utc_now_timestamp};

#[derive(Clone, Debug, Default, Eq, PartialEq, Serialize, Deserialize, utoipa::ToSchema)]
pub(crate) struct SplitMetadataV0_8 {
    /// Split ID. Joined with the index URI (<index URI>/<split ID>), this ID
    /// should be enough to uniquely identify a split.
    /// In reality, some information may be implicitly configured
    /// in the storage resolver: for instance, the Amazon S3 region.
    #[schema(value_type = String)]
    pub split_id: SplitId,

    /// Uid of the index this split belongs to.
    #[schema(value_type = String)]
    #[serde(alias = "index_id")]
    pub index_uid: IndexUid,

    #[serde(default)]
    pub partition_id: u64,

    #[serde(default)]
    pub source_id: Option<String>,

    #[serde(default)]
    pub node_id: Option<String>,

    /// Number of records (or documents) in the split.
    pub num_docs: usize,

    /// Sum of the size (in bytes) of the raw documents in this split.
    ///
    /// Note this is not the split file size. It is the size of the original
    /// JSON payloads.
    #[serde(alias = "size_in_bytes")]
    pub uncompressed_docs_size_in_bytes: u64,

    #[schema(value_type = Option<Object>)]
    /// If a timestamp field is available, the min / max timestamp in
    /// the split.
    pub time_range: Option<RangeInclusive<i64>>,

    /// Timestamp for tracking when the split was created.
    #[serde(default = "utc_now_timestamp")]
    pub create_timestamp: i64,

    /// Split maturity either `Mature` or `Immature` with a given maturation period.
    #[serde(default)]
    #[schema(value_type = Value)]
    pub maturity: SplitMaturity,

    #[serde(default)]
    #[schema(value_type = Vec<String>)]
    /// A set of tags for categorizing and searching group of splits.
    pub tags: BTreeSet<String>,

    #[schema(value_type = Object)]
    /// Contains the range of bytes of the footer that needs to be downloaded
    /// in order to open a split.
    ///
    /// The footer offsets
    /// make it possible to download the footer in a single call to `.get_slice(...)`.
    pub footer_offsets: Range<u64>,

    /// Split delete opstamp.
    #[serde(default)]
    pub delete_opstamp: u64,

    #[serde(default)]
    num_merge_ops: usize,

    // we default fill with zero: we don't know the right uid, and it's correct to assume all
    // splits before when updates first appeared are compatible with each other.
    #[serde(default)]
    doc_mapping_uid: DocMappingUid,
}

impl From<SplitMetadataV0_8> for SplitMetadata {
    fn from(v8: SplitMetadataV0_8) -> Self {
        let source_id = v8.source_id.unwrap_or_else(|| "unknown".to_string());

        let node_id = if let Some(node_id) = v8.node_id {
            // The previous version encoded `v1.node_id` as `{node_id}/{pipeline_ord}`.
            // Since pipeline_ord is no longer needed, we only extract the `node_id` portion
            // to keep backward compatibility.  This has the advantage of avoiding a
            // brand new version.
            if let Some((node_id, _)) = node_id.rsplit_once('/') {
                node_id.to_string()
            } else {
                node_id
            }
        } else {
            "unknown".to_string()
        };

        SplitMetadata {
            split_id: v8.split_id,
            index_uid: v8.index_uid,
            partition_id: v8.partition_id,
            source_id,
            node_id,
            delete_opstamp: v8.delete_opstamp,
            num_docs: v8.num_docs,
            uncompressed_docs_size_in_bytes: v8.uncompressed_docs_size_in_bytes,
            time_range: v8.time_range,
            create_timestamp: v8.create_timestamp,
            maturity: v8.maturity,
            tags: v8.tags,
            footer_offsets: v8.footer_offsets,
            num_merge_ops: v8.num_merge_ops,
            doc_mapping_uid: v8.doc_mapping_uid,
        }
    }
}

impl From<SplitMetadata> for SplitMetadataV0_8 {
    fn from(split: SplitMetadata) -> Self {
        SplitMetadataV0_8 {
            split_id: split.split_id,
            index_uid: split.index_uid,
            partition_id: split.partition_id,
            source_id: Some(split.source_id),
            node_id: Some(split.node_id),
            delete_opstamp: split.delete_opstamp,
            num_docs: split.num_docs,
            uncompressed_docs_size_in_bytes: split.uncompressed_docs_size_in_bytes,
            time_range: split.time_range,
            create_timestamp: split.create_timestamp,
            maturity: split.maturity,
            tags: split.tags,
            footer_offsets: split.footer_offsets,
            num_merge_ops: split.num_merge_ops,
            doc_mapping_uid: split.doc_mapping_uid,
        }
    }
}

#[derive(Serialize, Deserialize, utoipa::ToSchema)]
#[serde(tag = "version")]
pub(crate) enum VersionedSplitMetadata {
    #[serde(rename = "0.9")]
    // Retro compatibility.
    #[serde(alias = "0.8")]
    #[serde(alias = "0.7")]
    V0_8(SplitMetadataV0_8),
}

impl From<VersionedSplitMetadata> for SplitMetadata {
    fn from(versioned_helper: VersionedSplitMetadata) -> Self {
        match versioned_helper {
            VersionedSplitMetadata::V0_8(v0_8) => v0_8.into(),
        }
    }
}

impl From<SplitMetadata> for VersionedSplitMetadata {
    fn from(split_metadata: SplitMetadata) -> Self {
        VersionedSplitMetadata::V0_8(split_metadata.into())
    }
}


================================================
FILE: quickwit/quickwit-metastore/src/tests/delete_task.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use quickwit_common::rand::append_random_suffix;
use quickwit_config::IndexConfig;
use quickwit_proto::metastore::{
    CreateIndexRequest, DeleteIndexRequest, DeleteQuery, EntityKind, LastDeleteOpstampRequest,
    ListDeleteTasksRequest, MetastoreError,
};
use quickwit_proto::types::IndexUid;
use quickwit_query::query_ast::qast_json_helper;

use super::DefaultForTest;
use crate::tests::cleanup_index;
use crate::{CreateIndexRequestExt, MetastoreServiceExt};

pub async fn test_metastore_create_delete_task<
    MetastoreToTest: MetastoreServiceExt + DefaultForTest,
>() {
    let mut metastore = MetastoreToTest::default_for_test().await;
    let index_id = append_random_suffix("add-delete-task");
    let index_uri = format!("ram:///indexes/{index_id}");
    let index_config = IndexConfig::for_test(&index_id, &index_uri);
    let create_index_request = CreateIndexRequest::try_from_index_config(&index_config).unwrap();
    let index_uid = metastore
        .create_index(create_index_request)
        .await
        .unwrap()
        .index_uid()
        .clone();
    let delete_query = DeleteQuery {
        index_uid: Some(index_uid.clone()),
        query_ast: qast_json_helper("my_field:my_value", &[]),
        start_timestamp: Some(1),
        end_timestamp: Some(2),
    };

    // Create a delete task on non-existing index.
    let error = metastore
        .create_delete_task(DeleteQuery {
            index_uid: Some(IndexUid::new_with_random_ulid("does-not-exist")),
            ..delete_query.clone()
        })
        .await
        .unwrap_err();
    assert!(matches!(
        error,
        MetastoreError::NotFound(EntityKind::Index { .. })
    ));

    // Create a delete task on an index with wrong incarnation_id
    let error = metastore
        .create_delete_task(DeleteQuery {
            index_uid: Some(IndexUid::for_test(&index_id, 12345)),
            ..delete_query.clone()
        })
        .await
        .unwrap_err();
    assert!(matches!(
        error,
        MetastoreError::NotFound(EntityKind::Index { .. })
    ));

    // Create a delete task.
    let delete_task_1 = metastore
        .create_delete_task(delete_query.clone())
        .await
        .unwrap();
    assert!(delete_task_1.opstamp > 0);
    let delete_query_1 = delete_task_1.delete_query.unwrap();
    assert_eq!(delete_query_1.index_uid, delete_query.index_uid);
    assert_eq!(delete_query_1.start_timestamp, delete_query.start_timestamp);
    assert_eq!(delete_query_1.end_timestamp, delete_query.end_timestamp);
    let delete_task_2 = metastore
        .create_delete_task(delete_query.clone())
        .await
        .unwrap();
    assert!(delete_task_2.opstamp > delete_task_1.opstamp);

    cleanup_index(&mut metastore, index_uid).await;
}

pub async fn test_metastore_last_delete_opstamp<
    MetastoreToTest: MetastoreServiceExt + DefaultForTest,
>() {
    let mut metastore = MetastoreToTest::default_for_test().await;
    let index_id_1 = append_random_suffix("test-last-delete-opstamp-1");
    let index_uri_1 = format!("ram:///indexes/{index_id_1}");
    let index_config_1 = IndexConfig::for_test(&index_id_1, &index_uri_1);
    let index_id_2 = append_random_suffix("test-last-delete-opstamp-2");
    let index_uri_2 = format!("ram:///indexes/{index_id_2}");
    let index_config_2 = IndexConfig::for_test(&index_id_2, &index_uri_2);
    let index_uid_1 = metastore
        .create_index(CreateIndexRequest::try_from_index_config(&index_config_1).unwrap())
        .await
        .unwrap()
        .index_uid()
        .clone();
    let index_uid_2 = metastore
        .create_index(CreateIndexRequest::try_from_index_config(&index_config_2).unwrap())
        .await
        .unwrap()
        .index_uid()
        .clone();

    let delete_query_index_1 = DeleteQuery {
        index_uid: Some(index_uid_1.clone()),
        query_ast: qast_json_helper("my_field:my_value", &[]),
        start_timestamp: Some(1),
        end_timestamp: Some(2),
    };
    let delete_query_index_2 = DeleteQuery {
        index_uid: Some(index_uid_2.clone()),
        query_ast: qast_json_helper("my_field:my_value", &[]),
        start_timestamp: Some(1),
        end_timestamp: Some(2),
    };

    let last_opstamp_index_1_with_no_task = metastore
        .last_delete_opstamp(LastDeleteOpstampRequest {
            index_uid: Some(index_uid_1.clone()),
        })
        .await
        .unwrap()
        .last_delete_opstamp;
    assert_eq!(last_opstamp_index_1_with_no_task, 0);

    // Create a delete task.
    metastore
        .create_delete_task(delete_query_index_1.clone())
        .await
        .unwrap();
    let delete_task_2 = metastore
        .create_delete_task(delete_query_index_1.clone())
        .await
        .unwrap();
    let delete_task_3 = metastore
        .create_delete_task(delete_query_index_2.clone())
        .await
        .unwrap();

    let last_opstamp_index_1 = metastore
        .last_delete_opstamp(LastDeleteOpstampRequest {
            index_uid: Some(index_uid_1.clone()),
        })
        .await
        .unwrap()
        .last_delete_opstamp;
    let last_opstamp_index_2 = metastore
        .last_delete_opstamp(LastDeleteOpstampRequest {
            index_uid: Some(index_uid_2.clone()),
        })
        .await
        .unwrap()
        .last_delete_opstamp;
    assert_eq!(last_opstamp_index_1, delete_task_2.opstamp);
    assert_eq!(last_opstamp_index_2, delete_task_3.opstamp);
    cleanup_index(&mut metastore, index_uid_1).await;
    cleanup_index(&mut metastore, index_uid_2).await;
}

pub async fn test_metastore_delete_index_with_tasks<
    MetastoreToTest: MetastoreServiceExt + DefaultForTest,
>() {
    let metastore = MetastoreToTest::default_for_test().await;
    let index_id = append_random_suffix("delete-delete-tasks");
    let index_uri = format!("ram:///indexes/{index_id}");
    let index_config = IndexConfig::for_test(&index_id, &index_uri);
    let create_index_request = CreateIndexRequest::try_from_index_config(&index_config).unwrap();
    let index_uid = metastore
        .create_index(create_index_request)
        .await
        .unwrap()
        .index_uid()
        .clone();
    let delete_query = DeleteQuery {
        index_uid: Some(index_uid.clone()),
        query_ast: qast_json_helper("my_field:my_value", &[]),
        start_timestamp: Some(1),
        end_timestamp: Some(2),
    };
    let _ = metastore
        .create_delete_task(delete_query.clone())
        .await
        .unwrap();
    let _ = metastore
        .create_delete_task(delete_query.clone())
        .await
        .unwrap();

    metastore
        .delete_index(DeleteIndexRequest {
            index_uid: Some(index_uid),
        })
        .await
        .unwrap();
}

pub async fn test_metastore_list_delete_tasks<
    MetastoreToTest: MetastoreServiceExt + DefaultForTest,
>() {
    let mut metastore = MetastoreToTest::default_for_test().await;
    let index_id_1 = append_random_suffix("test-list-delete-tasks-1");
    let index_uri_1 = format!("ram:///indexes/{index_id_1}");
    let index_config_1 = IndexConfig::for_test(&index_id_1, &index_uri_1);
    let index_id_2 = append_random_suffix("test-list-delete-tasks-2");
    let index_uri_2 = format!("ram:///indexes/{index_id_2}");
    let index_config_2 = IndexConfig::for_test(&index_id_2, &index_uri_2);
    let index_uid_1 = metastore
        .create_index(CreateIndexRequest::try_from_index_config(&index_config_1).unwrap())
        .await
        .unwrap()
        .index_uid()
        .clone();
    let index_uid_2 = metastore
        .create_index(CreateIndexRequest::try_from_index_config(&index_config_2).unwrap())
        .await
        .unwrap()
        .index_uid()
        .clone();
    let delete_query_index_1 = DeleteQuery {
        index_uid: Some(index_uid_1.clone()),
        query_ast: qast_json_helper("my_field:my_value", &[]),
        start_timestamp: Some(1),
        end_timestamp: Some(2),
    };
    let delete_query_index_2 = DeleteQuery {
        index_uid: Some(index_uid_2.clone()),
        query_ast: qast_json_helper("my_field:my_value", &[]),
        start_timestamp: Some(1),
        end_timestamp: Some(2),
    };

    // Create a delete task.
    let delete_task_1 = metastore
        .create_delete_task(delete_query_index_1.clone())
        .await
        .unwrap();
    let delete_task_2 = metastore
        .create_delete_task(delete_query_index_1.clone())
        .await
        .unwrap();
    let _ = metastore
        .create_delete_task(delete_query_index_2.clone())
        .await
        .unwrap();

    let all_index_id_1_delete_tasks = metastore
        .list_delete_tasks(ListDeleteTasksRequest::new(index_uid_1.clone(), 0))
        .await
        .unwrap()
        .delete_tasks;
    assert_eq!(all_index_id_1_delete_tasks.len(), 2);

    let recent_index_id_1_delete_tasks = metastore
        .list_delete_tasks(ListDeleteTasksRequest::new(
            index_uid_1.clone(),
            delete_task_1.opstamp,
        ))
        .await
        .unwrap()
        .delete_tasks;
    assert_eq!(recent_index_id_1_delete_tasks.len(), 1);
    assert_eq!(
        recent_index_id_1_delete_tasks[0].opstamp,
        delete_task_2.opstamp
    );
    cleanup_index(&mut metastore, index_uid_1).await;
    cleanup_index(&mut metastore, index_uid_2).await;
}


================================================
FILE: quickwit/quickwit-metastore/src/tests/get_identity.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

// Index API tests
//
//  - create_index
//  - index_exists
//  - index_metadata
//  - list_indexes
//  - delete_index

use quickwit_proto::metastore::{GetClusterIdentityRequest, MetastoreService};
use uuid::Uuid;

use super::DefaultForTest;
use crate::MetastoreServiceExt;

pub async fn test_metastore_get_identity<
    MetastoreToTest: MetastoreService + MetastoreServiceExt + DefaultForTest,
>() {
    let metastore = MetastoreToTest::default_for_test().await;

    let identity_1 = metastore
        .get_cluster_identity(GetClusterIdentityRequest {})
        .await
        .unwrap()
        .uuid;

    let identity_2 = metastore
        .get_cluster_identity(GetClusterIdentityRequest {})
        .await
        .unwrap()
        .uuid;

    assert_eq!(identity_1, identity_2);
    assert_ne!(identity_1, Uuid::nil().hyphenated().to_string());
}


================================================
FILE: quickwit/quickwit-metastore/src/tests/index.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

// Index API tests
//
//  - create_index
//  - index_exists
//  - index_metadata
//  - list_indexes
//  - delete_index

use std::num::NonZeroUsize;

use quickwit_common::rand::append_random_suffix;
use quickwit_config::merge_policy_config::{MergePolicyConfig, StableLogMergePolicyConfig};
use quickwit_config::{
    CLI_SOURCE_ID, INGEST_V2_SOURCE_ID, IndexConfig, IndexingSettings, IngestSettings,
    RetentionPolicy, SearchSettings, SourceConfig,
};
use quickwit_doc_mapper::{Cardinality, FieldMappingEntry, FieldMappingType, QuickwitJsonOptions};
use quickwit_proto::metastore::{
    CreateIndexRequest, DeleteIndexRequest, EntityKind, IndexMetadataFailure,
    IndexMetadataFailureReason, IndexMetadataRequest, IndexMetadataSubrequest, IndexStats,
    IndexesMetadataRequest, ListIndexStatsRequest, ListIndexesMetadataRequest, MetastoreError,
    MetastoreService, PublishSplitsRequest, SplitStats, StageSplitsRequest, UpdateIndexRequest,
};
use quickwit_proto::types::{DocMappingUid, IndexUid};

use super::DefaultForTest;
use crate::tests::cleanup_index;
use crate::{
    CreateIndexRequestExt, IndexMetadataResponseExt, IndexesMetadataResponseExt,
    ListIndexesMetadataResponseExt, MetastoreServiceExt, SplitMetadata, StageSplitsRequestExt,
    UpdateIndexRequestExt,
};

pub async fn test_metastore_create_index<
    MetastoreToTest: MetastoreService + MetastoreServiceExt + DefaultForTest,
>() {
    let mut metastore = MetastoreToTest::default_for_test().await;

    let index_id = append_random_suffix("test-create-index");
    let index_uri = format!("ram:///indexes/{index_id}");
    let index_config = IndexConfig::for_test(&index_id, &index_uri);

    let create_index_request = CreateIndexRequest::try_from_index_config(&index_config).unwrap();
    let index_uid = metastore
        .create_index(create_index_request.clone())
        .await
        .unwrap()
        .index_uid()
        .clone();

    assert!(metastore.index_exists(&index_id).await.unwrap());

    let index_metadata = metastore
        .index_metadata(IndexMetadataRequest::for_index_id(index_id.to_string()))
        .await
        .unwrap()
        .deserialize_index_metadata()
        .unwrap();

    assert_eq!(index_metadata.index_id(), index_id);
    assert_eq!(index_metadata.index_uri(), &index_uri);

    let error = metastore
        .create_index(create_index_request)
        .await
        .unwrap_err();
    assert!(matches!(error, MetastoreError::AlreadyExists { .. }));

    cleanup_index(&mut metastore, index_uid).await;
}

async fn setup_metastore_for_update<
    MetastoreToTest: MetastoreService + MetastoreServiceExt + DefaultForTest,
>() -> (MetastoreToTest, IndexUid, IndexConfig) {
    let metastore = MetastoreToTest::default_for_test().await;

    let index_id = append_random_suffix("test-update-index");
    let index_uri = format!("ram:///indexes/{index_id}");
    let index_config = IndexConfig::for_test(&index_id, &index_uri);
    let create_index_request = CreateIndexRequest::try_from_index_config(&index_config).unwrap();
    let index_uid = metastore
        .create_index(create_index_request.clone())
        .await
        .unwrap()
        .index_uid()
        .clone();

    (metastore, index_uid, index_config)
}

pub async fn test_metastore_update_retention_policy<
    MetastoreToTest: MetastoreService + MetastoreServiceExt + DefaultForTest,
>() {
    let (mut metastore, index_uid, index_config) =
        setup_metastore_for_update::<MetastoreToTest>().await;
    let new_retention_policy_opt = Some(RetentionPolicy {
        retention_period: String::from("3 days"),
        evaluation_schedule: String::from("daily"),
    });

    // set and unset retention policy multiple times
    for loop_retention_policy_opt in [
        None,
        new_retention_policy_opt.clone(),
        new_retention_policy_opt.clone(),
        None,
    ] {
        let index_update = UpdateIndexRequest::try_from_updates(
            index_uid.clone(),
            &index_config.doc_mapping,
            &index_config.indexing_settings,
            &index_config.ingest_settings,
            &index_config.search_settings,
            &loop_retention_policy_opt,
        )
        .unwrap();
        let response_metadata = metastore
            .update_index(index_update)
            .await
            .unwrap()
            .deserialize_index_metadata()
            .unwrap();
        assert_eq!(response_metadata.index_uid, index_uid);
        assert_eq!(
            response_metadata.index_config.retention_policy_opt,
            loop_retention_policy_opt
        );
        let updated_metadata = metastore
            .index_metadata(IndexMetadataRequest::for_index_id(
                index_uid.index_id.to_string(),
            ))
            .await
            .unwrap()
            .deserialize_index_metadata()
            .unwrap();
        assert_eq!(response_metadata, updated_metadata);
    }
    cleanup_index(&mut metastore, index_uid).await;
}

pub async fn test_metastore_update_ingest_settings<
    MetastoreToTest: MetastoreService + MetastoreServiceExt + DefaultForTest,
>() {
    let (mut metastore, index_uid, index_config) =
        setup_metastore_for_update::<MetastoreToTest>().await;

    let ingest_settings = IngestSettings {
        min_shards: NonZeroUsize::new(12).unwrap(),
        ..Default::default()
    };
    let index_update_request = UpdateIndexRequest::try_from_updates(
        index_uid.clone(),
        &index_config.doc_mapping,
        &index_config.indexing_settings,
        &ingest_settings,
        &index_config.search_settings,
        &index_config.retention_policy_opt,
    )
    .unwrap();

    let min_shards = metastore
        .update_index(index_update_request)
        .await
        .unwrap()
        .deserialize_index_metadata()
        .unwrap()
        .index_config
        .ingest_settings
        .min_shards
        .get();
    assert_eq!(min_shards, 12);

    let index_metadata_request = IndexMetadataRequest::for_index_uid(index_uid.clone());

    let min_shards = metastore
        .index_metadata(index_metadata_request)
        .await
        .unwrap()
        .deserialize_index_metadata()
        .unwrap()
        .index_config
        .ingest_settings
        .min_shards
        .get();
    assert_eq!(min_shards, 12);

    cleanup_index(&mut metastore, index_uid).await;
}

pub async fn test_metastore_update_search_settings<
    MetastoreToTest: MetastoreService + MetastoreServiceExt + DefaultForTest,
>() {
    let (mut metastore, index_uid, index_config) =
        setup_metastore_for_update::<MetastoreToTest>().await;

    for default_search_fields in [
        Vec::new(),
        vec!["body".to_string()],
        vec!["body".to_string()],
        vec!["body".to_string(), "owner".to_string()],
        Vec::new(),
    ] {
        let search_settings = SearchSettings {
            default_search_fields: default_search_fields.clone(),
        };
        let index_update = UpdateIndexRequest::try_from_updates(
            index_uid.clone(),
            &index_config.doc_mapping,
            &index_config.indexing_settings,
            &index_config.ingest_settings,
            &search_settings,
            &index_config.retention_policy_opt,
        )
        .unwrap();
        let response_metadata = metastore
            .update_index(index_update)
            .await
            .unwrap()
            .deserialize_index_metadata()
            .unwrap();
        assert_eq!(
            response_metadata
                .index_config
                .search_settings
                .default_search_fields,
            default_search_fields
        );
        let updated_metadata = metastore
            .index_metadata(IndexMetadataRequest::for_index_id(
                index_uid.index_id.to_string(),
            ))
            .await
            .unwrap()
            .deserialize_index_metadata()
            .unwrap();
        assert_eq!(
            updated_metadata
                .index_config
                .search_settings
                .default_search_fields,
            default_search_fields
        );
    }
    cleanup_index(&mut metastore, index_uid).await;
}

pub async fn test_metastore_update_indexing_settings<
    MetastoreToTest: MetastoreService + MetastoreServiceExt + DefaultForTest,
>() {
    let (mut metastore, index_uid, index_config) =
        setup_metastore_for_update::<MetastoreToTest>().await;

    for merge_policy in [
        MergePolicyConfig::Nop,
        MergePolicyConfig::Nop,
        MergePolicyConfig::StableLog(StableLogMergePolicyConfig {
            merge_factor: 5,
            ..Default::default()
        }),
    ] {
        let indexing_settings = IndexingSettings {
            merge_policy: merge_policy.clone(),
            ..Default::default()
        };
        let index_update = UpdateIndexRequest::try_from_updates(
            index_uid.clone(),
            &index_config.doc_mapping,
            &indexing_settings,
            &index_config.ingest_settings,
            &index_config.search_settings,
            &index_config.retention_policy_opt,
        )
        .unwrap();
        let resp_metadata = metastore
            .update_index(index_update)
            .await
            .unwrap()
            .deserialize_index_metadata()
            .unwrap();
        assert_eq!(
            resp_metadata.index_config.indexing_settings.merge_policy,
            merge_policy
        );
        let updated_metadata = metastore
            .index_metadata(IndexMetadataRequest::for_index_id(
                index_uid.index_id.to_string(),
            ))
            .await
            .unwrap()
            .deserialize_index_metadata()
            .unwrap();
        assert_eq!(
            updated_metadata.index_config.indexing_settings.merge_policy,
            merge_policy
        );
    }
    cleanup_index(&mut metastore, index_uid).await;
}

pub async fn test_metastore_update_doc_mapping<
    MetastoreToTest: MetastoreService + MetastoreServiceExt + DefaultForTest,
>() {
    let (mut metastore, index_uid, index_config) =
        setup_metastore_for_update::<MetastoreToTest>().await;

    let json_options = QuickwitJsonOptions {
        description: None,
        stored: false,
        indexing_options: None,
        expand_dots: false,
        fast: Default::default(),
    };

    let initial = index_config.doc_mapping.clone();
    let mut new_field = initial.clone();
    new_field.field_mappings.push(FieldMappingEntry {
        name: "new_field".to_string(),
        mapping_type: FieldMappingType::Json(json_options.clone(), Cardinality::SingleValued),
    });
    new_field.doc_mapping_uid = DocMappingUid::random();
    let mut new_field_stored = initial.clone();
    new_field_stored.field_mappings.push(FieldMappingEntry {
        name: "new_field".to_string(),
        mapping_type: FieldMappingType::Json(
            QuickwitJsonOptions {
                stored: true,
                ..json_options
            },
            Cardinality::SingleValued,
        ),
    });
    new_field_stored.doc_mapping_uid = DocMappingUid::random();

    for loop_doc_mapping in [initial.clone(), new_field, new_field_stored, initial] {
        let index_update = UpdateIndexRequest::try_from_updates(
            index_uid.clone(),
            &loop_doc_mapping,
            &index_config.indexing_settings,
            &index_config.ingest_settings,
            &index_config.search_settings,
            &index_config.retention_policy_opt,
        )
        .unwrap();
        let resp_metadata = metastore
            .update_index(index_update)
            .await
            .unwrap()
            .deserialize_index_metadata()
            .unwrap();
        assert_eq!(resp_metadata.index_config.doc_mapping, loop_doc_mapping);
        let updated_metadata = metastore
            .index_metadata(IndexMetadataRequest::for_index_id(
                index_uid.index_id.to_string(),
            ))
            .await
            .unwrap()
            .deserialize_index_metadata()
            .unwrap();
        assert_eq!(updated_metadata.index_config.doc_mapping, loop_doc_mapping);
    }
    cleanup_index(&mut metastore, index_uid).await;
}

pub async fn test_metastore_create_index_with_sources<
    MetastoreToTest: MetastoreService + MetastoreServiceExt + DefaultForTest,
>() {
    let mut metastore = MetastoreToTest::default_for_test().await;

    let index_id = append_random_suffix("test-create-index-with-sources");
    let index_uri = format!("ram:///indexes/{index_id}");
    let index_config = IndexConfig::for_test(&index_id, &index_uri);
    let index_config_json = serde_json::to_string(&index_config).unwrap();

    let source_configs_json = vec![
        serde_json::to_string(&SourceConfig::cli()).unwrap(),
        serde_json::to_string(&SourceConfig::ingest_v2()).unwrap(),
    ];
    let create_index_request = CreateIndexRequest {
        index_config_json,
        source_configs_json,
    };
    let index_uid: IndexUid = metastore
        .create_index(create_index_request.clone())
        .await
        .unwrap()
        .index_uid()
        .clone();

    assert!(metastore.index_exists(&index_id).await.unwrap());

    let index_metadata = metastore
        .index_metadata(IndexMetadataRequest::for_index_id(index_id.to_string()))
        .await
        .unwrap()
        .deserialize_index_metadata()
        .unwrap();

    assert_eq!(index_metadata.index_id(), index_id);
    assert_eq!(index_metadata.index_uri(), &index_uri);

    assert_eq!(index_metadata.sources.len(), 2);
    assert!(index_metadata.sources.contains_key(CLI_SOURCE_ID));
    assert!(index_metadata.sources.contains_key(INGEST_V2_SOURCE_ID));

    cleanup_index(&mut metastore, index_uid).await;
}

pub async fn test_metastore_create_index_enforces_index_id_maximum_length<
    MetastoreToTest: MetastoreService + MetastoreServiceExt + DefaultForTest,
>() {
    let mut metastore = MetastoreToTest::default_for_test().await;

    let index_id = append_random_suffix(format!("very-long-index-{}", "a".repeat(233)).as_str());
    assert_eq!(index_id.len(), 255);
    let index_uri = format!("ram:///indexes/{index_id}");

    let index_config = IndexConfig::for_test(&index_id, &index_uri);

    let create_index_request = CreateIndexRequest::try_from_index_config(&index_config).unwrap();
    let index_uid: IndexUid = metastore
        .create_index(create_index_request)
        .await
        .unwrap()
        .index_uid()
        .clone();

    assert!(metastore.index_exists(&index_id).await.unwrap());

    cleanup_index(&mut metastore, index_uid).await;
}

pub async fn test_metastore_index_exists<
    MetastoreToTest: MetastoreService + MetastoreServiceExt + DefaultForTest,
>() {
    let mut metastore = MetastoreToTest::default_for_test().await;

    let index_id = append_random_suffix("test-index-exists");
    let index_uri = format!("ram:///indexes/{index_id}");
    let index_config = IndexConfig::for_test(&index_id, &index_uri);
    let create_index_request = CreateIndexRequest::try_from_index_config(&index_config).unwrap();

    assert!(!metastore.index_exists(&index_id).await.unwrap());

    let index_uid = metastore
        .create_index(create_index_request)
        .await
        .unwrap()
        .index_uid()
        .clone();

    assert!(metastore.index_exists(&index_id).await.unwrap());

    cleanup_index(&mut metastore, index_uid).await;
}

pub async fn test_metastore_index_metadata<
    MetastoreToTest: MetastoreServiceExt + DefaultForTest,
>() {
    let mut metastore = MetastoreToTest::default_for_test().await;

    let index_id = append_random_suffix("test-index-metadata");
    let index_uri = format!("ram:///indexes/{index_id}");
    let index_config = IndexConfig::for_test(&index_id, &index_uri);

    let error = metastore
        .index_metadata(IndexMetadataRequest::for_index_id(index_id.to_string()))
        .await
        .unwrap_err();
    assert!(matches!(
        error,
        MetastoreError::NotFound(EntityKind::Index { .. })
    ));

    let create_index_request = CreateIndexRequest::try_from_index_config(&index_config).unwrap();
    let index_uid: IndexUid = metastore
        .create_index(create_index_request)
        .await
        .unwrap()
        .index_uid()
        .clone();

    let index_metadata = metastore
        .index_metadata(IndexMetadataRequest::for_index_id(index_id.to_string()))
        .await
        .unwrap()
        .deserialize_index_metadata()
        .unwrap();

    assert_eq!(index_metadata.index_id(), index_id);
    assert_eq!(index_metadata.index_uri(), &index_uri);

    cleanup_index(&mut metastore, index_uid).await;
}

pub async fn test_metastore_indexes_metadata<
    MetastoreToTest: MetastoreServiceExt + DefaultForTest,
>() {
    let mut metastore = MetastoreToTest::default_for_test().await;

    let index_id_0 = append_random_suffix("test-indexes-metadata-0");
    let index_uri_0 = format!("ram:///indexes/{index_id_0}");
    let index_config_0 = IndexConfig::for_test(&index_id_0, &index_uri_0);

    let create_index_request = CreateIndexRequest::try_from_index_config(&index_config_0).unwrap();
    let index_uid_0: IndexUid = metastore
        .create_index(create_index_request)
        .await
        .unwrap()
        .index_uid()
        .clone();

    let index_id_1 = append_random_suffix("test-indexes-metadata-1");
    let index_uri_1 = format!("ram:///indexes/{index_id_1}");
    let index_config_1 = IndexConfig::for_test(&index_id_1, &index_uri_1);

    let create_index_request = CreateIndexRequest::try_from_index_config(&index_config_1).unwrap();
    let index_uid_1: IndexUid = metastore
        .create_index(create_index_request)
        .await
        .unwrap()
        .index_uid()
        .clone();

    let indexes_metadata_request = IndexesMetadataRequest {
        subrequests: vec![
            IndexMetadataSubrequest {
                index_id: None,
                index_uid: None,
            },
            IndexMetadataSubrequest {
                index_id: Some(index_id_0.clone()),
                index_uid: None,
            },
            IndexMetadataSubrequest {
                index_id: Some("test-indexes-metadata-foo".to_string()),
                index_uid: None,
            },
            IndexMetadataSubrequest {
                index_id: None,
                index_uid: Some(index_uid_1.clone()),
            },
            IndexMetadataSubrequest {
                index_id: None,
                index_uid: Some(IndexUid::for_test("test-indexes-metadata-bar", 123)),
            },
        ],
    };
    let mut indexes_metadata_response = metastore
        .indexes_metadata(indexes_metadata_request)
        .await
        .unwrap();

    let failures = &mut indexes_metadata_response.failures;
    assert_eq!(failures.len(), 3);

    failures.sort_by(|left, right| left.index_id().cmp(right.index_id()));

    let expected_failure_0 = IndexMetadataFailure {
        index_id: None,
        index_uid: None,
        reason: IndexMetadataFailureReason::Internal as i32,
    };
    assert_eq!(failures[0], expected_failure_0);

    let expected_failure_1 = IndexMetadataFailure {
        index_id: None,
        index_uid: Some(IndexUid::for_test("test-indexes-metadata-bar", 123)),
        reason: IndexMetadataFailureReason::NotFound as i32,
    };
    assert_eq!(failures[1], expected_failure_1);

    let expected_failure_2 = IndexMetadataFailure {
        index_id: Some("test-indexes-metadata-foo".to_string()),
        index_uid: None,
        reason: IndexMetadataFailureReason::NotFound as i32,
    };
    assert_eq!(failures[2], expected_failure_2);

    let mut indexes_metadata = indexes_metadata_response
        .deserialize_indexes_metadata()
        .await
        .unwrap();
    assert_eq!(indexes_metadata.len(), 2);

    indexes_metadata.sort_by(|left, right| left.index_id().cmp(right.index_id()));
    assert_eq!(indexes_metadata[0].index_id(), index_id_0);
    assert_eq!(indexes_metadata[1].index_id(), index_id_1);

    cleanup_index(&mut metastore, index_uid_0).await;
    cleanup_index(&mut metastore, index_uid_1).await;
}

pub async fn test_metastore_list_all_indexes<
    MetastoreToTest: MetastoreServiceExt + DefaultForTest,
>() {
    let mut metastore = MetastoreToTest::default_for_test().await;

    let index_id_prefix = append_random_suffix("test-list-all-indexes");
    let index_id_1 = format!("{index_id_prefix}-1");
    let index_uri_1 = format!("ram:///indexes/{index_id_1}");
    let index_config_1 = IndexConfig::for_test(&index_id_1, &index_uri_1);

    let index_id_2 = format!("{index_id_prefix}-2");
    let index_uri_2 = format!("ram:///indexes/{index_id_2}");
    let index_config_2 = IndexConfig::for_test(&index_id_2, &index_uri_2);
    let indexes_count = metastore
        .list_indexes_metadata(ListIndexesMetadataRequest::all())
        .await
        .unwrap()
        .deserialize_indexes_metadata()
        .await
        .unwrap()
        .into_iter()
        .filter(|index| index.index_id().starts_with(&index_id_prefix))
        .count();
    assert_eq!(indexes_count, 0);

    let index_uid_1 = metastore
        .create_index(CreateIndexRequest::try_from_index_config(&index_config_1).unwrap())
        .await
        .unwrap()
        .index_uid()
        .clone();
    let index_uid_2 = metastore
        .create_index(CreateIndexRequest::try_from_index_config(&index_config_2).unwrap())
        .await
        .unwrap()
        .index_uid()
        .clone();

    let indexes_count = metastore
        .list_indexes_metadata(ListIndexesMetadataRequest::all())
        .await
        .unwrap()
        .deserialize_indexes_metadata()
        .await
        .unwrap()
        .into_iter()
        .filter(|index| index.index_id().starts_with(&index_id_prefix))
        .count();
    assert_eq!(indexes_count, 2);

    cleanup_index(&mut metastore, index_uid_1).await;
    cleanup_index(&mut metastore, index_uid_2).await;
}

pub async fn test_metastore_list_indexes<MetastoreToTest: MetastoreServiceExt + DefaultForTest>() {
    let mut metastore = MetastoreToTest::default_for_test().await;

    let index_id_fragment = append_random_suffix("test-list-indexes");
    let index_id_1 = format!("prefix-1-{index_id_fragment}-suffix-1");
    let index_uri_1 = format!("ram:///indexes/{index_id_1}");
    let index_config_1 = IndexConfig::for_test(&index_id_1, &index_uri_1);

    let index_id_2 = format!("prefix-2-{index_id_fragment}-suffix-2");
    let index_uri_2 = format!("ram:///indexes/{index_id_2}");
    let index_config_2 = IndexConfig::for_test(&index_id_2, &index_uri_2);

    let index_id_3 = format!("prefix.3.{index_id_fragment}.3");
    let index_uri_3 = format!("ram:///indexes/{index_id_3}");
    let index_config_3 = IndexConfig::for_test(&index_id_3, &index_uri_3);

    let index_id_4 = format!("p-4-{index_id_fragment}-suffix-4");
    let index_uri_4 = format!("ram:///indexes/{index_id_4}");
    let index_config_4 = IndexConfig::for_test(&index_id_4, &index_uri_4);

    let index_id_5 = format!("my-exact-index-{index_id_fragment}-5");
    let index_uri_5 = format!("ram:///indexes/{index_id_5}");
    let index_config_5 = IndexConfig::for_test(&index_id_5, &index_uri_5);

    let index_id_patterns = vec![
        format!("prefix-*-{index_id_fragment}-suffix-*"),
        format!("prefix*{index_id_fragment}*suffix-*"),
        format!("my-exact-index-{index_id_fragment}-5"),
    ];
    let indexes_count = metastore
        .list_indexes_metadata(ListIndexesMetadataRequest { index_id_patterns })
        .await
        .unwrap()
        .deserialize_indexes_metadata()
        .await
        .unwrap()
        .len();
    assert_eq!(indexes_count, 0);

    let index_uid_1 = metastore
        .create_index(CreateIndexRequest::try_from_index_config(&index_config_1).unwrap())
        .await
        .unwrap()
        .index_uid()
        .clone();
    let index_uid_2 = metastore
        .create_index(CreateIndexRequest::try_from_index_config(&index_config_2).unwrap())
        .await
        .unwrap()
        .index_uid()
        .clone();
    let index_uid_3 = metastore
        .create_index(CreateIndexRequest::try_from_index_config(&index_config_3).unwrap())
        .await
        .unwrap()
        .index_uid()
        .clone();
    let index_uid_4 = metastore
        .create_index(CreateIndexRequest::try_from_index_config(&index_config_4).unwrap())
        .await
        .unwrap()
        .index_uid()
        .clone();
    let index_uid_5 = metastore
        .create_index(CreateIndexRequest::try_from_index_config(&index_config_5).unwrap())
        .await
        .unwrap()
        .index_uid()
        .clone();

    let index_id_patterns = vec![
        format!("prefix-*-{index_id_fragment}-suffix-*"),
        format!("my-exact-index-{index_id_fragment}-5"),
    ];
    let indexes_count = metastore
        .list_indexes_metadata(ListIndexesMetadataRequest { index_id_patterns })
        .await
        .unwrap()
        .deserialize_indexes_metadata()
        .await
        .unwrap()
        .len();
    assert_eq!(indexes_count, 3);

    cleanup_index(&mut metastore, index_uid_1).await;
    cleanup_index(&mut metastore, index_uid_2).await;
    cleanup_index(&mut metastore, index_uid_3).await;
    cleanup_index(&mut metastore, index_uid_4).await;
    cleanup_index(&mut metastore, index_uid_5).await;
}

pub async fn test_metastore_delete_index<
    MetastoreToTest: MetastoreService + MetastoreServiceExt + DefaultForTest,
>() {
    let mut metastore = MetastoreToTest::default_for_test().await;

    let index_id = append_random_suffix("test-delete-index");
    let index_uri = format!("ram:///indexes/{index_id}");
    let index_config = IndexConfig::for_test(&index_id, &index_uri);

    let index_uid_not_existing = IndexUid::new_with_random_ulid("index-not-found");
    let error = metastore
        .delete_index(DeleteIndexRequest {
            index_uid: Some(index_uid_not_existing.clone()),
        })
        .await
        .unwrap_err();
    assert!(matches!(
        error,
        MetastoreError::NotFound(EntityKind::Index { .. })
    ));

    let error = metastore
        .delete_index(DeleteIndexRequest {
            index_uid: Some(index_uid_not_existing),
        })
        .await
        .unwrap_err();
    assert!(matches!(
        error,
        MetastoreError::NotFound(EntityKind::Index { .. })
    ));

    let create_index_request = CreateIndexRequest::try_from_index_config(&index_config).unwrap();
    let index_uid: IndexUid = metastore
        .create_index(create_index_request)
        .await
        .unwrap()
        .index_uid()
        .clone();

    metastore
        .delete_index(DeleteIndexRequest {
            index_uid: index_uid.clone().into(),
        })
        .await
        .unwrap();

    assert!(!metastore.index_exists(&index_id).await.unwrap());

    let split_id = format!("{index_id}--split");
    let split_metadata = SplitMetadata {
        split_id: split_id.clone(),
        index_uid: index_uid.clone(),
        ..Default::default()
    };

    let create_index_request = CreateIndexRequest::try_from_index_config(&index_config).unwrap();
    let index_uid: IndexUid = metastore
        .create_index(create_index_request)
        .await
        .unwrap()
        .index_uid
        .unwrap();

    let stage_splits_request =
        StageSplitsRequest::try_from_split_metadata(index_uid.clone(), &split_metadata).unwrap();
    metastore.stage_splits(stage_splits_request).await.unwrap();

    // TODO: We should not be able to delete an index that has remaining splits, at least not as
    // a default behavior. Let's implement the logic that allows this test to pass.
    // let error = metastore.delete_index(index_uid).await.unwrap_err();
    // assert!(matches!(error, MetastoreError::IndexNotEmpty { .. }));
    // let splits = metastore.list_all_splits(index_uid.clone()).await.unwrap();
    // assert_eq!(splits.len(), 1)

    cleanup_index(&mut metastore, index_uid).await;
}

pub async fn test_metastore_list_index_stats<
    MetastoreToTest: MetastoreServiceExt + DefaultForTest,
>() {
    let metastore = MetastoreToTest::default_for_test().await;

    let index_id_1 = append_random_suffix("test-list-index-stats");
    let index_uid_1 = IndexUid::new_with_random_ulid(&index_id_1);
    let index_uri_1 = format!("ram:///indexes/{index_id_1}");
    let index_config_1 = IndexConfig::for_test(&index_id_1, &index_uri_1);

    let index_id_2 = append_random_suffix("test-list-index-stats");
    let index_uid_2 = IndexUid::new_with_random_ulid(&index_id_2);
    let index_uri_2 = format!("ram:///indexes/{index_id_2}");
    let index_config_2 = IndexConfig::for_test(&index_id_2, &index_uri_2);

    let split_id_1 = format!("{index_id_1}--split-1");
    let split_metadata_1 = SplitMetadata {
        split_id: split_id_1.clone(),
        index_uid: index_uid_1.clone(),
        footer_offsets: 0..2048,
        ..Default::default()
    };

    let split_id_2 = format!("{index_id_1}--split-2");
    let split_metadata_2 = SplitMetadata {
        split_id: split_id_2.clone(),
        index_uid: index_uid_1.clone(),
        footer_offsets: 0..2048,
        ..Default::default()
    };

    let split_id_3 = format!("{index_id_1}--split-3");
    let split_metadata_3 = SplitMetadata {
        split_id: split_id_3.clone(),
        index_uid: index_uid_2.clone(),
        footer_offsets: 0..1000,
        ..Default::default()
    };

    // add split-1 and split-2 to index-1
    let create_index_request = CreateIndexRequest::try_from_index_config(&index_config_1).unwrap();
    let index_uid_1: IndexUid = metastore
        .create_index(create_index_request)
        .await
        .unwrap()
        .index_uid()
        .clone();

    let stage_splits_request = StageSplitsRequest::try_from_splits_metadata(
        index_uid_1.clone(),
        vec![split_metadata_1.clone(), split_metadata_2.clone()],
    )
    .unwrap();
    metastore.stage_splits(stage_splits_request).await.unwrap();

    let publish_splits_request = PublishSplitsRequest {
        index_uid: Some(index_uid_1.clone()),
        staged_split_ids: vec![split_id_1.clone(), split_id_2.clone()],
        ..Default::default()
    };
    metastore
        .publish_splits(publish_splits_request)
        .await
        .unwrap();

    // add split-3 to index-2
    let create_index_request = CreateIndexRequest::try_from_index_config(&index_config_2).unwrap();
    let index_uid_2: IndexUid = metastore
        .create_index(create_index_request)
        .await
        .unwrap()
        .index_uid()
        .clone();

    let stage_splits_request = StageSplitsRequest::try_from_splits_metadata(
        index_uid_2.clone(),
        vec![split_metadata_3.clone()],
    )
    .unwrap();
    metastore.stage_splits(stage_splits_request).await.unwrap();

    let expected_stats_1 = IndexStats {
        index_uid: Some(index_uid_1.clone()),
        staged: Some(SplitStats {
            num_splits: 0,
            total_size_bytes: 0,
        }),
        published: Some(SplitStats {
            num_splits: 2,
            total_size_bytes: 4096,
        }),
        marked_for_deletion: Some(SplitStats {
            num_splits: 0,
            total_size_bytes: 0,
        }),
    };
    let expected_stats_2 = IndexStats {
        index_uid: Some(index_uid_2.clone()),
        staged: Some(SplitStats {
            num_splits: 1,
            total_size_bytes: 1000,
        }),
        published: Some(SplitStats {
            num_splits: 0,
            total_size_bytes: 0,
        }),
        marked_for_deletion: Some(SplitStats {
            num_splits: 0,
            total_size_bytes: 0,
        }),
    };

    let response = metastore
        .list_index_stats(ListIndexStatsRequest {
            index_id_patterns: vec!["test-list-index-stats*".to_string()],
        })
        .await
        .unwrap();

    let index_stats_1 = response
        .index_stats
        .iter()
        .find(|index| index.index_uid == Some(index_uid_1.clone()))
        .expect("Should find index 1");

    assert_eq!(index_stats_1, &expected_stats_1);

    let index_stats_2 = response
        .index_stats
        .iter()
        .find(|index| index.index_uid == Some(index_uid_2.clone()))
        .expect("Should find index 2");
    assert_eq!(index_stats_2, &expected_stats_2);
}

pub async fn test_metastore_list_index_stats_no_splits<
    MetastoreToTest: MetastoreServiceExt + DefaultForTest,
>() {
    let metastore = MetastoreToTest::default_for_test().await;

    let index_id = append_random_suffix("test-list-index-stats-no-splits");
    let index_uri = format!("ram:///indexes/{index_id}");
    let index_config = IndexConfig::for_test(&index_id, &index_uri);
    let create_index_request = CreateIndexRequest::try_from_index_config(&index_config).unwrap();

    let index_uid: IndexUid = metastore
        .create_index(create_index_request)
        .await
        .unwrap()
        .index_uid()
        .clone();

    let expected_stats = IndexStats {
        index_uid: Some(index_uid.clone()),
        staged: Some(SplitStats {
            num_splits: 0,
            total_size_bytes: 0,
        }),
        published: Some(SplitStats {
            num_splits: 0,
            total_size_bytes: 0,
        }),
        marked_for_deletion: Some(SplitStats {
            num_splits: 0,
            total_size_bytes: 0,
        }),
    };

    let response = metastore
        .list_index_stats(ListIndexStatsRequest {
            index_id_patterns: vec!["test-list-index-stats-no-splits*".to_string()],
        })
        .await
        .unwrap();

    let index_stats = response
        .index_stats
        .iter()
        .find(|index| index.index_uid == Some(index_uid.clone()))
        .expect("Should find index");

    assert_eq!(index_stats, &expected_stats);
}


================================================
FILE: quickwit/quickwit-metastore/src/tests/list_splits.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::time::Duration;

use futures::TryStreamExt;
use itertools::Itertools;
use quickwit_common::rand::append_random_suffix;
use quickwit_config::IndexConfig;
use quickwit_doc_mapper::tag_pruning::{TagFilterAst, no_tag, tag};
use quickwit_proto::metastore::{
    CreateIndexRequest, ListSplitsRequest, ListStaleSplitsRequest, MarkSplitsForDeletionRequest,
    PublishSplitsRequest, StageSplitsRequest,
};
use quickwit_proto::types::{IndexUid, NodeId, SplitId};
use time::OffsetDateTime;
use tokio::time::sleep;
use tracing::info;

use super::{DefaultForTest, to_btree_set};
use crate::metastore::MetastoreServiceStreamSplitsExt;
use crate::tests::{cleanup_index, collect_split_ids};
use crate::{
    CreateIndexRequestExt, ListSplitsQuery, ListSplitsRequestExt, ListSplitsResponseExt,
    MetastoreServiceExt, SplitMaturity, SplitMetadata, SplitState, StageSplitsRequestExt,
};

pub async fn test_metastore_list_all_splits<
    MetastoreToTest: MetastoreServiceExt + DefaultForTest,
>() {
    let mut metastore = MetastoreToTest::default_for_test().await;

    let index_id = append_random_suffix("test-list-all-splits");
    let index_uid = IndexUid::new_with_random_ulid(&index_id);
    let index_uri = format!("ram:///indexes/{index_id}");
    let index_config = IndexConfig::for_test(&index_id, &index_uri);

    let split_id_1 = format!("{index_id}--split-1");
    let split_metadata_1 = SplitMetadata {
        split_id: split_id_1.clone(),
        index_uid: index_uid.clone(),
        ..Default::default()
    };
    let split_id_2 = format!("{index_id}--split-2");
    let split_metadata_2 = SplitMetadata {
        split_id: split_id_2.clone(),
        index_uid: index_uid.clone(),
        ..Default::default()
    };
    let split_id_3 = format!("{index_id}--split-3");
    let split_metadata_3 = SplitMetadata {
        split_id: split_id_3.clone(),
        index_uid: index_uid.clone(),
        ..Default::default()
    };
    let split_id_4 = format!("{index_id}--split-4");
    let split_metadata_4 = SplitMetadata {
        split_id: split_id_4.clone(),
        index_uid: index_uid.clone(),
        ..Default::default()
    };
    let split_id_5 = format!("{index_id}--split-5");
    let split_metadata_5 = SplitMetadata {
        split_id: split_id_5.clone(),
        index_uid: index_uid.clone(),
        ..Default::default()
    };
    let split_id_6 = format!("{index_id}--split-6");
    let split_metadata_6 = SplitMetadata {
        split_id: split_id_6.clone(),
        index_uid: index_uid.clone(),
        ..Default::default()
    };

    let no_splits = metastore
        .list_splits(
            ListSplitsRequest::try_from_index_uid(IndexUid::new_with_random_ulid(
                "index-not-found",
            ))
            .unwrap(),
        )
        .await
        .unwrap()
        .collect_splits()
        .await
        .unwrap();
    assert!(no_splits.is_empty());

    let create_index_request = CreateIndexRequest::try_from_index_config(&index_config).unwrap();
    let index_uid: IndexUid = metastore
        .create_index(create_index_request)
        .await
        .unwrap()
        .index_uid()
        .clone();

    let stage_splits_request = StageSplitsRequest::try_from_splits_metadata(
        index_uid.clone(),
        vec![
            split_metadata_1,
            split_metadata_2,
            split_metadata_3,
            split_metadata_4,
            split_metadata_5,
            split_metadata_6,
        ],
    )
    .unwrap();
    metastore.stage_splits(stage_splits_request).await.unwrap();

    let publish_splits_request = PublishSplitsRequest {
        index_uid: Some(index_uid.clone()),
        staged_split_ids: vec![split_id_1.clone(), split_id_2.clone()],
        ..Default::default()
    };
    metastore
        .publish_splits(publish_splits_request)
        .await
        .unwrap();

    let mark_splits_for_deletion = MarkSplitsForDeletionRequest::new(
        index_uid.clone(),
        vec![split_id_3.clone(), split_id_4.clone()],
    );
    metastore
        .mark_splits_for_deletion(mark_splits_for_deletion)
        .await
        .unwrap();

    let splits = metastore
        .list_splits(ListSplitsRequest::try_from_index_uid(index_uid.clone()).unwrap())
        .await
        .unwrap()
        .collect_splits()
        .await
        .unwrap();
    let split_ids = collect_split_ids(&splits);
    assert_eq!(
        split_ids,
        &[
            &split_id_1,
            &split_id_2,
            &split_id_3,
            &split_id_4,
            &split_id_5,
            &split_id_6
        ]
    );

    cleanup_index(&mut metastore, index_uid.clone()).await;
}

pub async fn test_metastore_stream_splits<MetastoreToTest: MetastoreServiceExt + DefaultForTest>() {
    let metastore = MetastoreToTest::default_for_test().await;

    let index_id = append_random_suffix("test-stream-splits");
    let index_uri = format!("ram:///indexes/{index_id}");
    let index_config = IndexConfig::for_test(&index_id, &index_uri);

    let create_index_request = CreateIndexRequest::try_from_index_config(&index_config).unwrap();
    let index_uid: IndexUid = metastore
        .create_index(create_index_request)
        .await
        .unwrap()
        .index_uid()
        .clone();

    let mut split_metadatas_to_create = Vec::new();
    for split_idx in 1..1001 {
        let split_id = format!("{index_id}--split-{split_idx:0>4}");
        let split_metadata = SplitMetadata {
            split_id: split_id.clone(),
            index_uid: index_uid.clone(),
            ..Default::default()
        };
        split_metadatas_to_create.push(split_metadata);

        if split_idx > 0 && split_idx % 100 == 0 {
            let staged_split_ids: Vec<SplitId> = split_metadatas_to_create
                .iter()
                .map(|split_metadata| split_metadata.split_id.clone())
                .collect();
            let stage_splits_request = StageSplitsRequest::try_from_splits_metadata(
                index_uid.clone(),
                split_metadatas_to_create.clone(),
            )
            .unwrap();
            metastore.stage_splits(stage_splits_request).await.unwrap();
            let publish_splits_request = PublishSplitsRequest {
                index_uid: Some(index_uid.clone()),
                staged_split_ids,
                ..Default::default()
            };
            metastore
                .publish_splits(publish_splits_request)
                .await
                .unwrap();
            split_metadatas_to_create.clear();
        }
    }

    let stream_splits_request = ListSplitsRequest::try_from_index_uid(index_uid.clone()).unwrap();
    let mut stream_response = metastore.list_splits(stream_splits_request).await.unwrap();
    let mut all_splits = Vec::new();
    for _ in 0..10 {
        let mut splits = stream_response
            .try_next()
            .await
            .unwrap()
            .unwrap()
            .deserialize_splits()
            .await
            .unwrap();
        assert_eq!(splits.len(), 100);
        all_splits.append(&mut splits);
    }
    all_splits.sort_by_key(|split| split.split_id().to_string());
    assert_eq!(all_splits[0].split_id(), format!("{index_id}--split-0001"));
    assert_eq!(
        all_splits[all_splits.len() - 1].split_id(),
        format!("{index_id}--split-1000")
    );
}

pub async fn test_metastore_list_splits<MetastoreToTest: MetastoreServiceExt + DefaultForTest>() {
    let mut metastore = MetastoreToTest::default_for_test().await;

    let current_timestamp = OffsetDateTime::now_utc().unix_timestamp();

    let index_id = append_random_suffix("test-list-splits");
    let index_uid = IndexUid::new_with_random_ulid(&index_id);
    let index_uri = format!("ram:///indexes/{index_id}");
    let index_config = IndexConfig::for_test(&index_id, &index_uri);

    let split_id_1 = format!("{index_id}--split-1");
    let split_metadata_1 = SplitMetadata {
        split_id: split_id_1.clone(),
        index_uid: index_uid.clone(),
        time_range: Some(0..=99),
        create_timestamp: current_timestamp,
        maturity: SplitMaturity::Immature {
            maturation_period: Duration::from_secs(0),
        },
        tags: to_btree_set(&["tag!", "tag:foo", "$tag!", "$tag:bar"]),
        delete_opstamp: 3,
        ..Default::default()
    };

    let split_id_2 = format!("{index_id}--split-2");
    let split_metadata_2 = SplitMetadata {
        split_id: split_id_2.clone(),
        index_uid: index_uid.clone(),
        time_range: Some(100..=199),
        create_timestamp: current_timestamp,
        maturity: SplitMaturity::Immature {
            maturation_period: Duration::from_secs(10),
        },
        tags: to_btree_set(&["tag!", "$tag!", "$tag:bar"]),
        delete_opstamp: 1,
        ..Default::default()
    };

    let split_id_3 = format!("{index_id}--split-3");
    let split_metadata_3 = SplitMetadata {
        split_id: split_id_3.clone(),
        index_uid: index_uid.clone(),
        time_range: Some(200..=299),
        create_timestamp: current_timestamp,
        maturity: SplitMaturity::Immature {
            maturation_period: Duration::from_secs(20),
        },
        tags: to_btree_set(&["tag!", "tag:foo", "tag:baz", "$tag!"]),
        delete_opstamp: 5,
        ..Default::default()
    };

    let split_id_4 = format!("{index_id}--split-4");
    let split_metadata_4 = SplitMetadata {
        split_id: split_id_4.clone(),
        index_uid: index_uid.clone(),
        time_range: Some(300..=399),
        tags: to_btree_set(&["tag!", "tag:foo", "$tag!"]),
        delete_opstamp: 7,
        ..Default::default()
    };

    let split_id_5 = format!("{index_id}--split-5");
    let split_metadata_5 = SplitMetadata {
        split_id: split_id_5.clone(),
        index_uid: index_uid.clone(),
        time_range: None,
        create_timestamp: current_timestamp,
        tags: to_btree_set(&["tag!", "tag:baz", "tag:biz", "$tag!"]),
        delete_opstamp: 9,
        ..Default::default()
    };

    {
        let query =
            ListSplitsQuery::for_index(index_uid.clone()).with_split_state(SplitState::Staged);
        let splits = metastore
            .list_splits(ListSplitsRequest::try_from_list_splits_query(&query).unwrap())
            .await
            .unwrap()
            .collect_splits()
            .await
            .unwrap();
        assert!(splits.is_empty());
    }
    {
        let create_index_request =
            CreateIndexRequest::try_from_index_config(&index_config).unwrap();
        let index_uid: IndexUid = metastore
            .create_index(create_index_request)
            .await
            .unwrap()
            .index_uid()
            .clone();

        let stage_splits_request = StageSplitsRequest::try_from_splits_metadata(
            index_uid.clone(),
            vec![
                split_metadata_1.clone(),
                split_metadata_2.clone(),
                split_metadata_3.clone(),
                split_metadata_4.clone(),
                split_metadata_5.clone(),
            ],
        )
        .unwrap();
        metastore.stage_splits(stage_splits_request).await.unwrap();

        let query = ListSplitsQuery::for_index(index_uid.clone()).with_limit(3);
        let splits = metastore
            .list_splits(ListSplitsRequest::try_from_list_splits_query(&query).unwrap())
            .await
            .unwrap()
            .collect_splits()
            .await
            .unwrap();
        assert_eq!(
            splits.len(),
            3,
            "Expected number of splits returned to match limit.",
        );

        let query = ListSplitsQuery::for_index(index_uid.clone()).with_offset(3);
        let splits = metastore
            .list_splits(ListSplitsRequest::try_from_list_splits_query(&query).unwrap())
            .await
            .unwrap()
            .collect_splits()
            .await
            .unwrap();
        assert_eq!(
            splits.len(),
            2,
            "Expected 3 splits to be skipped out of the 5 provided splits.",
        );

        let query = ListSplitsQuery::for_index(index_uid.clone())
            .with_split_state(SplitState::Staged)
            .with_time_range_start_gte(0)
            .with_time_range_end_lt(99);

        let splits = metastore
            .list_splits(ListSplitsRequest::try_from_list_splits_query(&query).unwrap())
            .await
            .unwrap()
            .collect_splits()
            .await
            .unwrap();
        let split_ids: Vec<&str> = splits
            .iter()
            .map(|split| split.split_id())
            .sorted()
            .collect();
        assert_eq!(split_ids, &[&split_id_1, &split_id_5]);

        let query = ListSplitsQuery::for_index(index_uid.clone())
            .with_split_state(SplitState::Staged)
            .with_time_range_start_gte(200);

        let splits = metastore
            .list_splits(ListSplitsRequest::try_from_list_splits_query(&query).unwrap())
            .await
            .unwrap()
            .collect_splits()
            .await
            .unwrap();
        let split_ids = collect_split_ids(&splits);
        assert_eq!(split_ids, &[&split_id_3, &split_id_4, &split_id_5]);

        let query = ListSplitsQuery::for_index(index_uid.clone())
            .with_split_state(SplitState::Staged)
            .with_time_range_end_lt(200);
        let splits = metastore
            .list_splits(ListSplitsRequest::try_from_list_splits_query(&query).unwrap())
            .await
            .unwrap()
            .collect_splits()
            .await
            .unwrap();
        let split_ids = collect_split_ids(&splits);
        assert_eq!(split_ids, &[&split_id_1, &split_id_2, &split_id_5]);

        let query = ListSplitsQuery::for_index(index_uid.clone())
            .with_split_state(SplitState::Staged)
            .with_time_range_start_gte(0)
            .with_time_range_end_lt(100);
        let splits = metastore
            .list_splits(ListSplitsRequest::try_from_list_splits_query(&query).unwrap())
            .await
            .unwrap()
            .collect_splits()
            .await
            .unwrap();
        let split_ids = collect_split_ids(&splits);
        assert_eq!(split_ids, &[&split_id_1, &split_id_5]);

        let query = ListSplitsQuery::for_index(index_uid.clone())
            .with_split_state(SplitState::Staged)
            .with_time_range_start_gte(0)
            .with_time_range_end_lt(101);
        let splits = metastore
            .list_splits(ListSplitsRequest::try_from_list_splits_query(&query).unwrap())
            .await
            .unwrap()
            .collect_splits()
            .await
            .unwrap();
        let split_ids = collect_split_ids(&splits);
        assert_eq!(split_ids, &[&split_id_1, &split_id_2, &split_id_5]);

        let query = ListSplitsQuery::for_index(index_uid.clone())
            .with_split_state(SplitState::Staged)
            .with_time_range_start_gte(0)
            .with_time_range_end_lt(199);
        let splits = metastore
            .list_splits(ListSplitsRequest::try_from_list_splits_query(&query).unwrap())
            .await
            .unwrap()
            .collect_splits()
            .await
            .unwrap();
        let split_ids = collect_split_ids(&splits);
        assert_eq!(split_ids, &[&split_id_1, &split_id_2, &split_id_5]);

        let query = ListSplitsQuery::for_index(index_uid.clone())
            .with_split_state(SplitState::Staged)
            .with_time_range_start_gte(0)
            .with_time_range_end_lt(200);
        let splits = metastore
            .list_splits(ListSplitsRequest::try_from_list_splits_query(&query).unwrap())
            .await
            .unwrap()
            .collect_splits()
            .await
            .unwrap();
        let split_ids = collect_split_ids(&splits);
        assert_eq!(split_ids, &[&split_id_1, &split_id_2, &split_id_5]);

        let query = ListSplitsQuery::for_index(index_uid.clone())
            .with_split_state(SplitState::Staged)
            .with_time_range_start_gte(0)
            .with_time_range_end_lt(201);
        let splits = metastore
            .list_splits(ListSplitsRequest::try_from_list_splits_query(&query).unwrap())
            .await
            .unwrap()
            .collect_splits()
            .await
            .unwrap();
        let split_ids = collect_split_ids(&splits);
        assert_eq!(
            split_ids,
            &[&split_id_1, &split_id_2, &split_id_3, &split_id_5]
        );

        let query = ListSplitsQuery::for_index(index_uid.clone())
            .with_split_state(SplitState::Staged)
            .with_time_range_start_gte(0)
            .with_time_range_end_lt(299);
        let splits = metastore
            .list_splits(ListSplitsRequest::try_from_list_splits_query(&query).unwrap())
            .await
            .unwrap()
            .collect_splits()
            .await
            .unwrap();
        let split_ids = collect_split_ids(&splits);
        assert_eq!(
            split_ids,
            &[&split_id_1, &split_id_2, &split_id_3, &split_id_5]
        );

        let query = ListSplitsQuery::for_index(index_uid.clone())
            .with_split_state(SplitState::Staged)
            .with_time_range_start_gte(0)
            .with_time_range_end_lt(300);
        let splits = metastore
            .list_splits(ListSplitsRequest::try_from_list_splits_query(&query).unwrap())
            .await
            .unwrap()
            .collect_splits()
            .await
            .unwrap();
        let split_ids = collect_split_ids(&splits);
        assert_eq!(
            split_ids,
            &[&split_id_1, &split_id_2, &split_id_3, &split_id_5]
        );

        let query = ListSplitsQuery::for_index(index_uid.clone())
            .with_split_state(SplitState::Staged)
            .with_time_range_start_gte(0)
            .with_time_range_end_lt(301);
        let splits = metastore
            .list_splits(ListSplitsRequest::try_from_list_splits_query(&query).unwrap())
            .await
            .unwrap()
            .collect_splits()
            .await
            .unwrap();
        let split_ids = collect_split_ids(&splits);
        assert_eq!(
            split_ids,
            &[
                &split_id_1,
                &split_id_2,
                &split_id_3,
                &split_id_4,
                &split_id_5
            ]
        );

        let query = ListSplitsQuery::for_index(index_uid.clone())
            .with_split_state(SplitState::Staged)
            .with_time_range_start_gte(301)
            .with_time_range_end_lt(400);
        let splits = metastore
            .list_splits(ListSplitsRequest::try_from_list_splits_query(&query).unwrap())
            .await
            .unwrap()
            .collect_splits()
            .await
            .unwrap();
        let split_ids = collect_split_ids(&splits);
        assert_eq!(split_ids, &[&split_id_4, &split_id_5]);

        let query = ListSplitsQuery::for_index(index_uid.clone())
            .with_split_state(SplitState::Staged)
            .with_time_range_start_gte(300)
            .with_time_range_end_lt(400);
        let splits = metastore
            .list_splits(ListSplitsRequest::try_from_list_splits_query(&query).unwrap())
            .await
            .unwrap()
            .collect_splits()
            .await
            .unwrap();
        let split_ids = collect_split_ids(&splits);
        assert_eq!(split_ids, &[&split_id_4, &split_id_5]);

        let query = ListSplitsQuery::for_index(index_uid.clone())
            .with_split_state(SplitState::Staged)
            .with_time_range_start_gte(299)
            .with_time_range_end_lt(400);
        let splits = metastore
            .list_splits(ListSplitsRequest::try_from_list_splits_query(&query).unwrap())
            .await
            .unwrap()
            .collect_splits()
            .await
            .unwrap();
        let split_ids = collect_split_ids(&splits);
        assert_eq!(split_ids, &[&split_id_3, &split_id_4, &split_id_5]);

        let query = ListSplitsQuery::for_index(index_uid.clone())
            .with_split_state(SplitState::Staged)
            .with_time_range_start_gte(201)
            .with_time_range_end_lt(400);
        let splits = metastore
            .list_splits(ListSplitsRequest::try_from_list_splits_query(&query).unwrap())
            .await
            .unwrap()
            .collect_splits()
            .await
            .unwrap();
        let split_ids = collect_split_ids(&splits);
        assert_eq!(split_ids, &[&split_id_3, &split_id_4, &split_id_5]);

        let query = ListSplitsQuery::for_index(index_uid.clone())
            .with_split_state(SplitState::Staged)
            .with_time_range_start_gte(200)
            .with_time_range_end_lt(400);
        let splits = metastore
            .list_splits(ListSplitsRequest::try_from_list_splits_query(&query).unwrap())
            .await
            .unwrap()
            .collect_splits()
            .await
            .unwrap();
        let split_ids = collect_split_ids(&splits);
        assert_eq!(split_ids, &[&split_id_3, &split_id_4, &split_id_5]);

        let query = ListSplitsQuery::for_index(index_uid.clone())
            .with_split_state(SplitState::Staged)
            .with_time_range_start_gte(199)
            .with_time_range_end_lt(400);
        let splits = metastore
            .list_splits(ListSplitsRequest::try_from_list_splits_query(&query).unwrap())
            .await
            .unwrap()
            .collect_splits()
            .await
            .unwrap();
        let split_ids = collect_split_ids(&splits);
        assert_eq!(
            split_ids,
            &[&split_id_2, &split_id_3, &split_id_4, &split_id_5]
        );

        let query = ListSplitsQuery::for_index(index_uid.clone())
            .with_split_state(SplitState::Staged)
            .with_time_range_start_gte(101)
            .with_time_range_end_lt(400);
        let splits = metastore
            .list_splits(ListSplitsRequest::try_from_list_splits_query(&query).unwrap())
            .await
            .unwrap()
            .collect_splits()
            .await
            .unwrap();
        let split_ids = collect_split_ids(&splits);
        assert_eq!(
            split_ids,
            &[&split_id_2, &split_id_3, &split_id_4, &split_id_5]
        );

        let query = ListSplitsQuery::for_index(index_uid.clone())
            .with_split_state(SplitState::Staged)
            .with_time_range_start_gte(101)
            .with_time_range_end_lt(400);
        let splits = metastore
            .list_splits(ListSplitsRequest::try_from_list_splits_query(&query).unwrap())
            .await
            .unwrap()
            .collect_splits()
            .await
            .unwrap();
        let split_ids = collect_split_ids(&splits);
        assert_eq!(
            split_ids,
            &[&split_id_2, &split_id_3, &split_id_4, &split_id_5]
        );

        let query = ListSplitsQuery::for_index(index_uid.clone())
            .with_split_state(SplitState::Staged)
            .with_time_range_start_gte(100)
            .with_time_range_end_lt(400);
        let splits = metastore
            .list_splits(ListSplitsRequest::try_from_list_splits_query(&query).unwrap())
            .await
            .unwrap()
            .collect_splits()
            .await
            .unwrap();
        let split_ids = collect_split_ids(&splits);

        assert_eq!(
            split_ids,
            &[&split_id_2, &split_id_3, &split_id_4, &split_id_5]
        );

        let query = ListSplitsQuery::for_index(index_uid.clone())
            .with_split_state(SplitState::Staged)
            .with_time_range_start_gte(99)
            .with_time_range_end_lt(400);
        let splits = metastore
            .list_splits(ListSplitsRequest::try_from_list_splits_query(&query).unwrap())
            .await
            .unwrap()
            .collect_splits()
            .await
            .unwrap();
        let split_ids = collect_split_ids(&splits);
        assert_eq!(
            split_ids,
            &[
                &split_id_1,
                &split_id_2,
                &split_id_3,
                &split_id_4,
                &split_id_5
            ]
        );

        let query = ListSplitsQuery::for_index(index_uid.clone())
            .with_split_state(SplitState::Staged)
            .with_time_range_start_gte(1000)
            .with_time_range_end_lt(1100);
        let splits = metastore
            .list_splits(ListSplitsRequest::try_from_list_splits_query(&query).unwrap())
            .await
            .unwrap()
            .collect_splits()
            .await
            .unwrap();
        let split_ids = collect_split_ids(&splits);
        assert_eq!(split_ids, &[&split_id_5]);

        // Artificially increase the create_timestamp
        sleep(Duration::from_secs(1)).await;
        // add a split without tag
        let split_id_6 = format!("{index_id}--split-6");
        let split_metadata_6 = SplitMetadata {
            split_id: split_id_6.clone(),
            index_uid: index_uid.clone(),
            time_range: None,
            create_timestamp: OffsetDateTime::now_utc().unix_timestamp(),
            ..Default::default()
        };
        let stage_splits_request = StageSplitsRequest::try_from_splits_metadata(
            index_uid.clone(),
            vec![split_metadata_6.clone()],
        )
        .unwrap();
        metastore.stage_splits(stage_splits_request).await.unwrap();

        let query =
            ListSplitsQuery::for_index(index_uid.clone()).with_split_state(SplitState::Staged);
        let splits = metastore
            .list_splits(ListSplitsRequest::try_from_list_splits_query(&query).unwrap())
            .await
            .unwrap()
            .collect_splits()
            .await
            .unwrap();
        let split_ids = collect_split_ids(&splits);
        assert_eq!(
            split_ids,
            &[
                &split_id_1,
                &split_id_2,
                &split_id_3,
                &split_id_4,
                &split_id_5,
                &split_id_6,
            ]
        );

        let tag_filter_ast = TagFilterAst::Or(vec![
            TagFilterAst::Or(vec![no_tag("$tag!"), tag("$tag:bar")]),
            TagFilterAst::Or(vec![no_tag("tag!"), tag("tag:baz")]),
        ]);
        let query = ListSplitsQuery::for_index(index_uid.clone())
            .with_split_state(SplitState::Staged)
            .with_tags_filter(tag_filter_ast);
        let splits = metastore
            .list_splits(ListSplitsRequest::try_from_list_splits_query(&query).unwrap())
            .await
            .unwrap()
            .collect_splits()
            .await
            .unwrap();
        let split_ids = collect_split_ids(&splits);
        assert_eq!(
            split_ids,
            &[
                &split_id_1,
                &split_id_2,
                &split_id_3,
                &split_id_5,
                &split_id_6,
            ]
        );

        let query = ListSplitsQuery::for_index(index_uid.clone())
            .with_update_timestamp_gte(current_timestamp);
        let splits = metastore
            .list_splits(ListSplitsRequest::try_from_list_splits_query(&query).unwrap())
            .await
            .unwrap()
            .collect_splits()
            .await
            .unwrap();
        let split_ids = collect_split_ids(&splits);
        assert_eq!(
            split_ids,
            &[
                &split_id_1,
                &split_id_2,
                &split_id_3,
                &split_id_4,
                &split_id_5,
                &split_id_6,
            ]
        );

        let query = ListSplitsQuery::for_index(index_uid.clone())
            .with_update_timestamp_gte(split_metadata_6.create_timestamp);
        let splits = metastore
            .list_splits(ListSplitsRequest::try_from_list_splits_query(&query).unwrap())
            .await
            .unwrap()
            .collect_splits()
            .await
            .unwrap();
        let split_ids: Vec<&String> = splits
            .iter()
            .map(|split| &split.split_metadata.split_id)
            .sorted()
            .collect();
        assert_eq!(split_ids, vec![&split_id_6]);

        let query = ListSplitsQuery::for_index(index_uid.clone())
            .with_create_timestamp_lt(split_metadata_6.create_timestamp);
        let splits = metastore
            .list_splits(ListSplitsRequest::try_from_list_splits_query(&query).unwrap())
            .await
            .unwrap()
            .collect_splits()
            .await
            .unwrap();
        let split_ids = collect_split_ids(&splits);
        assert_eq!(
            split_ids,
            &[
                &split_id_1,
                &split_id_2,
                &split_id_3,
                &split_id_4,
                &split_id_5,
            ]
        );

        let query = ListSplitsQuery::for_index(index_uid.clone()).with_delete_opstamp_lt(6);
        let splits = metastore
            .list_splits(ListSplitsRequest::try_from_list_splits_query(&query).unwrap())
            .await
            .unwrap()
            .collect_splits()
            .await
            .unwrap();
        let split_ids = collect_split_ids(&splits);
        assert_eq!(
            split_ids,
            &[&split_id_1, &split_id_2, &split_id_3, &split_id_6,]
        );

        // Test maturity filter
        let maturity_evaluation_timestamp =
            OffsetDateTime::from_unix_timestamp(current_timestamp).unwrap();
        let query = ListSplitsQuery::for_index(index_uid.clone())
            .retain_mature(maturity_evaluation_timestamp);
        let splits = metastore
            .list_splits(ListSplitsRequest::try_from_list_splits_query(&query).unwrap())
            .await
            .unwrap()
            .collect_splits()
            .await
            .unwrap();
        let split_ids = collect_split_ids(&splits);
        assert_eq!(
            split_ids,
            &[&split_id_1, &split_id_4, &split_id_5, &split_id_6,]
        );

        let query = ListSplitsQuery::for_index(index_uid.clone())
            .retain_immature(maturity_evaluation_timestamp);
        let splits = metastore
            .list_splits(ListSplitsRequest::try_from_list_splits_query(&query).unwrap())
            .await
            .unwrap()
            .collect_splits()
            .await
            .unwrap();
        let split_ids = collect_split_ids(&splits);
        assert_eq!(split_ids, &[&split_id_2, &split_id_3]);

        cleanup_index(&mut metastore, index_uid).await;
    }
}

pub async fn test_metastore_list_splits_by_node_id<
    MetastoreToTest: MetastoreServiceExt + DefaultForTest,
>() {
    let metastore = MetastoreToTest::default_for_test().await;

    let current_timestamp = OffsetDateTime::now_utc().unix_timestamp();
    let index_id = append_random_suffix("test-list-splits-by-node-id");
    let index_uri = format!("ram:///indexes/{index_id}");
    let index_config = IndexConfig::for_test(&index_id, &index_uri);

    let create_index_request = CreateIndexRequest::try_from_index_config(&index_config).unwrap();
    let index_uid: IndexUid = metastore
        .create_index(create_index_request)
        .await
        .unwrap()
        .index_uid
        .unwrap();

    let split_id_1 = format!("{index_id}--split-1");
    let split_metadata_1 = SplitMetadata {
        split_id: split_id_1.clone(),
        index_uid: index_uid.clone(),
        create_timestamp: current_timestamp,
        delete_opstamp: 20,
        node_id: "test-node-1".to_string(),
        ..Default::default()
    };
    let split_id_2 = format!("{index_id}--split-2");
    let split_metadata_2 = SplitMetadata {
        split_id: split_id_2.clone(),
        index_uid: index_uid.clone(),
        create_timestamp: current_timestamp,
        delete_opstamp: 10,
        node_id: "test-node-2".to_string(),
        ..Default::default()
    };
    let stage_splits_request = StageSplitsRequest::try_from_splits_metadata(
        index_uid.clone(),
        vec![split_metadata_1.clone(), split_metadata_2.clone()],
    )
    .unwrap();

    metastore.stage_splits(stage_splits_request).await.unwrap();

    let list_splits_query =
        ListSplitsQuery::for_index(index_uid.clone()).with_node_id(NodeId::from("test-node-1"));
    let list_splits_request =
        ListSplitsRequest::try_from_list_splits_query(&list_splits_query).unwrap();

    let splits = metastore
        .list_splits(list_splits_request)
        .await
        .unwrap()
        .collect_splits()
        .await
        .unwrap();

    assert_eq!(splits.len(), 1);
    assert_eq!(splits[0].split_metadata.split_id, split_id_1);
    assert_eq!(splits[0].split_metadata.node_id, "test-node-1");
}

pub async fn test_metastore_list_stale_splits<
    MetastoreToTest: MetastoreServiceExt + DefaultForTest,
>() {
    let mut metastore = MetastoreToTest::default_for_test().await;
    let current_timestamp = OffsetDateTime::now_utc().unix_timestamp();
    let index_id = append_random_suffix("test-list-stale-splits");
    let index_uid = IndexUid::new_with_random_ulid(&index_id);
    let index_uri = format!("ram:///indexes/{index_id}");
    let index_config = IndexConfig::for_test(&index_id, &index_uri);

    let split_id_1 = format!("{index_id}--split-1");
    let split_metadata_1 = SplitMetadata {
        split_id: split_id_1.clone(),
        index_uid: index_uid.clone(),
        create_timestamp: current_timestamp,
        delete_opstamp: 20,
        ..Default::default()
    };
    let split_id_2 = format!("{index_id}--split-2");
    let split_metadata_2 = SplitMetadata {
        split_id: split_id_2.clone(),
        index_uid: index_uid.clone(),
        create_timestamp: current_timestamp,
        delete_opstamp: 10,
        ..Default::default()
    };
    let split_id_3 = format!("{index_id}--split-3");
    let split_metadata_3 = SplitMetadata {
        split_id: split_id_3.clone(),
        index_uid: index_uid.clone(),
        create_timestamp: current_timestamp,
        delete_opstamp: 0,
        ..Default::default()
    };
    let split_id_4 = format!("{index_id}--split-4");
    let split_metadata_4 = SplitMetadata {
        split_id: split_id_4.clone(),
        index_uid: index_uid.clone(),
        create_timestamp: current_timestamp,
        delete_opstamp: 20,
        ..Default::default()
    };
    // immature split
    let split_id_5 = format!("{index_id}--split-5");
    let split_metadata_5 = SplitMetadata {
        split_id: split_id_5.clone(),
        index_uid: index_uid.clone(),
        create_timestamp: current_timestamp,
        maturity: SplitMaturity::Immature {
            maturation_period: Duration::from_secs(100),
        },
        delete_opstamp: 0,
        ..Default::default()
    };

    let list_stale_splits_request = ListStaleSplitsRequest {
        index_uid: Some(IndexUid::new_with_random_ulid("index-not-found")),
        delete_opstamp: 0,
        num_splits: 100,
    };
    let no_splits = metastore
        .list_stale_splits(list_stale_splits_request)
        .await
        .unwrap()
        .deserialize_splits()
        .await
        .unwrap();
    assert!(no_splits.is_empty());

    {
        info!("list stale splits on an index");
        let create_index_request =
            CreateIndexRequest::try_from_index_config(&index_config).unwrap();
        let index_uid: IndexUid = metastore
            .create_index(create_index_request)
            .await
            .unwrap()
            .index_uid()
            .clone();

        let stage_splits_request = StageSplitsRequest::try_from_splits_metadata(
            index_uid.clone(),
            vec![
                split_metadata_1.clone(),
                split_metadata_2.clone(),
                split_metadata_3.clone(),
                split_metadata_5.clone(),
            ],
        )
        .unwrap();
        metastore.stage_splits(stage_splits_request).await.unwrap();

        // Sleep for 1 second to have different publish timestamps.
        sleep(Duration::from_secs(1)).await;

        let stage_splits_request = StageSplitsRequest::try_from_splits_metadata(
            index_uid.clone(),
            vec![split_metadata_4.clone()],
        )
        .unwrap();
        metastore.stage_splits(stage_splits_request).await.unwrap();
        let publish_splits_request = PublishSplitsRequest {
            index_uid: index_uid.clone().into(),
            staged_split_ids: vec![split_id_4.clone()],
            ..Default::default()
        };
        metastore
            .publish_splits(publish_splits_request)
            .await
            .unwrap();
        // Sleep for 1 second to have different publish timestamps.
        tokio::time::sleep(Duration::from_secs(1)).await;
        let publish_splits_request = PublishSplitsRequest {
            index_uid: index_uid.clone().into(),
            staged_split_ids: vec![split_id_1.clone(), split_id_2.clone(), split_id_5.clone()],
            ..Default::default()
        };
        metastore
            .publish_splits(publish_splits_request)
            .await
            .unwrap();
        let list_stale_splits_request = ListStaleSplitsRequest {
            index_uid: index_uid.clone().into(),
            delete_opstamp: 100,
            num_splits: 1,
        };
        let splits = metastore
            .list_stale_splits(list_stale_splits_request)
            .await
            .unwrap()
            .deserialize_splits()
            .await
            .unwrap();
        assert_eq!(splits.len(), 1);
        assert_eq!(
            splits[0].split_metadata.delete_opstamp,
            split_metadata_2.delete_opstamp
        );

        let list_stale_splits_request = ListStaleSplitsRequest {
            index_uid: index_uid.clone().into(),
            delete_opstamp: 100,
            num_splits: 4,
        };
        let splits = metastore
            .list_stale_splits(list_stale_splits_request)
            .await
            .unwrap()
            .deserialize_splits()
            .await
            .unwrap();
        assert_eq!(splits.len(), 3);
        assert_eq!(splits[0].split_id(), split_metadata_2.split_id());
        assert_eq!(splits[1].split_id(), split_metadata_4.split_id());
        assert_eq!(splits[2].split_id(), split_metadata_1.split_id());
        assert_eq!(
            splits[2].split_metadata.delete_opstamp,
            split_metadata_1.delete_opstamp
        );

        let list_stale_splits_request = ListStaleSplitsRequest {
            index_uid: index_uid.clone().into(),
            delete_opstamp: 20,
            num_splits: 2,
        };
        let splits = metastore
            .list_stale_splits(list_stale_splits_request)
            .await
            .unwrap()
            .deserialize_splits()
            .await
            .unwrap();
        assert_eq!(splits.len(), 1);
        assert_eq!(
            splits[0].split_metadata.delete_opstamp,
            split_metadata_2.delete_opstamp
        );

        let list_stale_splits_request = ListStaleSplitsRequest {
            index_uid: index_uid.clone().into(),
            delete_opstamp: 10,
            num_splits: 2,
        };
        let splits = metastore
            .list_stale_splits(list_stale_splits_request)
            .await
            .unwrap()
            .deserialize_splits()
            .await
            .unwrap();
        assert!(splits.is_empty());
        cleanup_index(&mut metastore, index_uid).await;
    }
}

pub async fn test_metastore_list_sorted_splits<
    MetastoreToTest: MetastoreServiceExt + DefaultForTest,
>() {
    let mut metastore = MetastoreToTest::default_for_test().await;

    let split_id = append_random_suffix("test-list-sorted-splits-");
    let index_id_1 = append_random_suffix("test-list-sorted-splits-1");
    let index_uid_1 = IndexUid::new_with_random_ulid(&index_id_1);
    let index_uri_1 = format!("ram:///indexes/{index_id_1}");
    let index_config_1 = IndexConfig::for_test(&index_id_1, &index_uri_1);

    let index_id_2 = append_random_suffix("test-list-sorted-splits-2");
    let index_uid_2 = IndexUid::new_with_random_ulid(&index_id_2);
    let index_uri_2 = format!("ram:///indexes/{index_id_2}");
    let index_config_2 = IndexConfig::for_test(&index_id_2, &index_uri_2);

    let split_id_1 = format!("{split_id}--split-1");
    let split_metadata_1 = SplitMetadata {
        split_id: split_id_1.clone(),
        index_uid: index_uid_1.clone(),
        delete_opstamp: 5,
        ..Default::default()
    };
    let split_id_2 = format!("{split_id}--split-2");
    let split_metadata_2 = SplitMetadata {
        split_id: split_id_2.clone(),
        index_uid: index_uid_2.clone(),
        delete_opstamp: 3,
        ..Default::default()
    };
    let split_id_3 = format!("{split_id}--split-3");
    let split_metadata_3 = SplitMetadata {
        split_id: split_id_3.clone(),
        index_uid: index_uid_1.clone(),
        delete_opstamp: 1,
        ..Default::default()
    };
    let split_id_4 = format!("{split_id}--split-4");
    let split_metadata_4 = SplitMetadata {
        split_id: split_id_4.clone(),
        index_uid: index_uid_2.clone(),
        delete_opstamp: 0,
        ..Default::default()
    };
    let split_id_5 = format!("{split_id}--split-5");
    let split_metadata_5 = SplitMetadata {
        split_id: split_id_5.clone(),
        index_uid: index_uid_1.clone(),
        delete_opstamp: 2,
        ..Default::default()
    };
    let split_id_6 = format!("{split_id}--split-6");
    let split_metadata_6 = SplitMetadata {
        split_id: split_id_6.clone(),
        index_uid: index_uid_2.clone(),
        delete_opstamp: 4,
        ..Default::default()
    };

    let create_index_request = CreateIndexRequest::try_from_index_config(&index_config_1).unwrap();
    let index_uid_1: IndexUid = metastore
        .create_index(create_index_request)
        .await
        .unwrap()
        .index_uid()
        .clone();
    let create_index_request = CreateIndexRequest::try_from_index_config(&index_config_2).unwrap();
    let index_uid_2: IndexUid = metastore
        .create_index(create_index_request)
        .await
        .unwrap()
        .index_uid()
        .clone();

    {
        let stage_splits_request = StageSplitsRequest::try_from_splits_metadata(
            index_uid_1.clone(),
            vec![split_metadata_1, split_metadata_3, split_metadata_5],
        )
        .unwrap();
        metastore.stage_splits(stage_splits_request).await.unwrap();

        let publish_splits_request = PublishSplitsRequest {
            index_uid: Some(index_uid_1.clone()),
            staged_split_ids: vec![split_id_1.clone()],
            ..Default::default()
        };
        metastore
            .publish_splits(publish_splits_request)
            .await
            .unwrap();

        let mark_splits_for_deletion =
            MarkSplitsForDeletionRequest::new(index_uid_1.clone(), vec![split_id_3.clone()]);
        metastore
            .mark_splits_for_deletion(mark_splits_for_deletion)
            .await
            .unwrap();

        let stage_splits_request = StageSplitsRequest::try_from_splits_metadata(
            index_uid_2.clone(),
            vec![split_metadata_2, split_metadata_4, split_metadata_6],
        )
        .unwrap();
        metastore.stage_splits(stage_splits_request).await.unwrap();

        let publish_splits_request = PublishSplitsRequest {
            index_uid: Some(index_uid_2.clone()),
            staged_split_ids: vec![split_id_2.clone()],
            ..Default::default()
        };
        metastore
            .publish_splits(publish_splits_request)
            .await
            .unwrap();

        let mark_splits_for_deletion =
            MarkSplitsForDeletionRequest::new(index_uid_2.clone(), vec![split_id_4.clone()]);
        metastore
            .mark_splits_for_deletion(mark_splits_for_deletion)
            .await
            .unwrap();
    }

    let query =
        ListSplitsQuery::try_from_index_uids(vec![index_uid_1.clone(), index_uid_2.clone()])
            .unwrap()
            .sort_by_staleness();
    let splits = metastore
        .list_splits(ListSplitsRequest::try_from_list_splits_query(&query).unwrap())
        .await
        .unwrap()
        .collect_splits()
        .await
        .unwrap();
    // we don't use collect_split_ids because it sorts splits internally
    let split_ids = splits
        .iter()
        .map(|split| split.split_id())
        .collect::<Vec<_>>();
    assert_eq!(
        split_ids,
        &[
            &split_id_4,
            &split_id_3,
            &split_id_5,
            &split_id_2,
            &split_id_6,
            &split_id_1,
        ]
    );

    let query =
        ListSplitsQuery::try_from_index_uids(vec![index_uid_1.clone(), index_uid_2.clone()])
            .unwrap()
            .sort_by_index_uid();
    let splits = metastore
        .list_splits(ListSplitsRequest::try_from_list_splits_query(&query).unwrap())
        .await
        .unwrap()
        .collect_splits()
        .await
        .unwrap();
    // we don't use collect_split_ids because it sorts splits internally
    let split_ids = splits
        .iter()
        .map(|split| split.split_id())
        .collect::<Vec<_>>();
    assert_eq!(
        split_ids,
        &[
            &split_id_1,
            &split_id_3,
            &split_id_5,
            &split_id_2,
            &split_id_4,
            &split_id_6,
        ]
    );

    cleanup_index(&mut metastore, index_uid_1.clone()).await;
    cleanup_index(&mut metastore, index_uid_2.clone()).await;
}

pub async fn test_metastore_list_after_split<
    MetastoreToTest: MetastoreServiceExt + DefaultForTest,
>() {
    let mut metastore = MetastoreToTest::default_for_test().await;

    let split_id = append_random_suffix("test-list-sorted-splits-");
    let index_id_1 = append_random_suffix("test-list-sorted-splits-1");
    let index_uri_1 = format!("ram:///indexes/{index_id_1}");
    let index_config_1 = IndexConfig::for_test(&index_id_1, &index_uri_1);

    let index_id_2 = append_random_suffix("test-list-sorted-splits-2");
    let index_uri_2 = format!("ram:///indexes/{index_id_2}");
    let index_config_2 = IndexConfig::for_test(&index_id_2, &index_uri_2);

    let create_index_request = CreateIndexRequest::try_from_index_config(&index_config_1).unwrap();
    let index_uid_1: IndexUid = metastore
        .create_index(create_index_request)
        .await
        .unwrap()
        .index_uid()
        .clone();
    let create_index_request = CreateIndexRequest::try_from_index_config(&index_config_2).unwrap();
    let index_uid_2: IndexUid = metastore
        .create_index(create_index_request)
        .await
        .unwrap()
        .index_uid()
        .clone();

    let split_id_1 = format!("{split_id}--split-1");
    let split_metadata_1 = SplitMetadata {
        split_id: split_id_1.clone(),
        index_uid: index_uid_1.clone(),
        ..Default::default()
    };
    let split_id_2 = format!("{split_id}--split-2");
    let split_metadata_2 = SplitMetadata {
        split_id: split_id_2.clone(),
        index_uid: index_uid_2.clone(),
        ..Default::default()
    };
    let split_id_3 = format!("{split_id}--split-3");
    let split_metadata_3 = SplitMetadata {
        split_id: split_id_3.clone(),
        index_uid: index_uid_1.clone(),
        ..Default::default()
    };
    let split_id_4 = format!("{split_id}--split-4");
    let split_metadata_4 = SplitMetadata {
        split_id: split_id_4.clone(),
        index_uid: index_uid_2.clone(),
        ..Default::default()
    };
    let split_id_5 = format!("{split_id}--split-5");
    let split_metadata_5 = SplitMetadata {
        split_id: split_id_5.clone(),
        index_uid: index_uid_1.clone(),
        ..Default::default()
    };
    let split_id_6 = format!("{split_id}--split-6");
    let split_metadata_6 = SplitMetadata {
        split_id: split_id_6.clone(),
        index_uid: index_uid_2.clone(),
        ..Default::default()
    };

    {
        let stage_splits_request = StageSplitsRequest::try_from_splits_metadata(
            index_uid_1.clone(),
            vec![
                split_metadata_1.clone(),
                split_metadata_3.clone(),
                split_metadata_5.clone(),
            ],
        )
        .unwrap();
        metastore.stage_splits(stage_splits_request).await.unwrap();

        let publish_splits_request = PublishSplitsRequest {
            index_uid: Some(index_uid_1.clone()),
            staged_split_ids: vec![split_id_1.clone()],
            ..Default::default()
        };
        metastore
            .publish_splits(publish_splits_request)
            .await
            .unwrap();

        let mark_splits_for_deletion =
            MarkSplitsForDeletionRequest::new(index_uid_1.clone(), vec![split_id_3.clone()]);
        metastore
            .mark_splits_for_deletion(mark_splits_for_deletion)
            .await
            .unwrap();

        let stage_splits_request = StageSplitsRequest::try_from_splits_metadata(
            index_uid_2.clone(),
            vec![
                split_metadata_2.clone(),
                split_metadata_4.clone(),
                split_metadata_6.clone(),
            ],
        )
        .unwrap();
        metastore.stage_splits(stage_splits_request).await.unwrap();

        let publish_splits_request = PublishSplitsRequest {
            index_uid: Some(index_uid_2.clone()),
            staged_split_ids: vec![split_id_2.clone()],
            ..Default::default()
        };
        metastore
            .publish_splits(publish_splits_request)
            .await
            .unwrap();

        let mark_splits_for_deletion =
            MarkSplitsForDeletionRequest::new(index_uid_2.clone(), vec![split_id_4.clone()]);
        metastore
            .mark_splits_for_deletion(mark_splits_for_deletion)
            .await
            .unwrap();
    }

    let expected_all = [
        &split_metadata_1,
        &split_metadata_3,
        &split_metadata_5,
        &split_metadata_2,
        &split_metadata_4,
        &split_metadata_6,
    ];

    for i in 0..expected_all.len() {
        let after = expected_all[i];
        let expected_res = expected_all[(i + 1)..]
            .iter()
            .map(|split| (&split.index_uid, &split.split_id))
            .collect::<Vec<_>>();

        let query =
            ListSplitsQuery::try_from_index_uids(vec![index_uid_1.clone(), index_uid_2.clone()])
                .unwrap()
                .sort_by_index_uid()
                .after_split(after);
        let splits = metastore
            .list_splits(ListSplitsRequest::try_from_list_splits_query(&query).unwrap())
            .await
            .unwrap()
            .collect_splits()
            .await
            .unwrap();
        // we don't use collect_split_ids because it sorts splits internally
        let split_ids = splits
            .iter()
            .map(|split| {
                (
                    &split.split_metadata.index_uid,
                    &split.split_metadata.split_id,
                )
            })
            .collect::<Vec<_>>();
        assert_eq!(split_ids, expected_res,);
    }

    cleanup_index(&mut metastore, index_uid_1.clone()).await;
    cleanup_index(&mut metastore, index_uid_2.clone()).await;
}

pub async fn test_metastore_list_splits_from_all_indexes<
    MetastoreToTest: MetastoreServiceExt + DefaultForTest,
>() {
    let mut metastore = MetastoreToTest::default_for_test().await;

    let split_id = append_random_suffix("test-list-sorted-splits-");
    let index_id_1 = append_random_suffix("test-list-sorted-splits-1");
    let index_uri_1 = format!("ram:///indexes/{index_id_1}");
    let index_config_1 = IndexConfig::for_test(&index_id_1, &index_uri_1);

    let index_id_2 = append_random_suffix("test-list-sorted-splits-2");
    let index_uri_2 = format!("ram:///indexes/{index_id_2}");
    let index_config_2 = IndexConfig::for_test(&index_id_2, &index_uri_2);

    let create_index_request = CreateIndexRequest::try_from_index_config(&index_config_1).unwrap();
    let index_uid_1: IndexUid = metastore
        .create_index(create_index_request)
        .await
        .unwrap()
        .index_uid()
        .clone();
    let create_index_request = CreateIndexRequest::try_from_index_config(&index_config_2).unwrap();
    let index_uid_2: IndexUid = metastore
        .create_index(create_index_request)
        .await
        .unwrap()
        .index_uid()
        .clone();

    let split_id_1 = format!("{split_id}--split-1");
    let split_metadata_1 = SplitMetadata {
        split_id: split_id_1.clone(),
        index_uid: index_uid_1.clone(),
        ..Default::default()
    };
    let split_id_2 = format!("{split_id}--split-2");
    let split_metadata_2 = SplitMetadata {
        split_id: split_id_2.clone(),
        index_uid: index_uid_2.clone(),
        ..Default::default()
    };
    let split_id_3 = format!("{split_id}--split-3");
    let split_metadata_3 = SplitMetadata {
        split_id: split_id_3.clone(),
        index_uid: index_uid_1.clone(),
        ..Default::default()
    };
    let split_id_4 = format!("{split_id}--split-4");
    let split_metadata_4 = SplitMetadata {
        split_id: split_id_4.clone(),
        index_uid: index_uid_2.clone(),
        ..Default::default()
    };
    let split_id_5 = format!("{split_id}--split-5");
    let split_metadata_5 = SplitMetadata {
        split_id: split_id_5.clone(),
        index_uid: index_uid_1.clone(),
        ..Default::default()
    };
    let split_id_6 = format!("{split_id}--split-6");
    let split_metadata_6 = SplitMetadata {
        split_id: split_id_6.clone(),
        index_uid: index_uid_2.clone(),
        ..Default::default()
    };

    {
        let stage_splits_request = StageSplitsRequest::try_from_splits_metadata(
            index_uid_1.clone(),
            vec![
                split_metadata_1.clone(),
                split_metadata_3.clone(),
                split_metadata_5.clone(),
            ],
        )
        .unwrap();
        metastore.stage_splits(stage_splits_request).await.unwrap();

        let publish_splits_request = PublishSplitsRequest {
            index_uid: Some(index_uid_1.clone()),
            staged_split_ids: vec![split_id_1.clone()],
            ..Default::default()
        };
        metastore
            .publish_splits(publish_splits_request)
            .await
            .unwrap();

        let mark_splits_for_deletion =
            MarkSplitsForDeletionRequest::new(index_uid_1.clone(), vec![split_id_3.clone()]);
        metastore
            .mark_splits_for_deletion(mark_splits_for_deletion)
            .await
            .unwrap();

        let stage_splits_request = StageSplitsRequest::try_from_splits_metadata(
            index_uid_2.clone(),
            vec![
                split_metadata_2.clone(),
                split_metadata_4.clone(),
                split_metadata_6.clone(),
            ],
        )
        .unwrap();
        metastore.stage_splits(stage_splits_request).await.unwrap();

        let publish_splits_request = PublishSplitsRequest {
            index_uid: Some(index_uid_2.clone()),
            staged_split_ids: vec![split_id_2.clone()],
            ..Default::default()
        };
        metastore
            .publish_splits(publish_splits_request)
            .await
            .unwrap();

        let mark_splits_for_deletion =
            MarkSplitsForDeletionRequest::new(index_uid_2.clone(), vec![split_id_4.clone()]);
        metastore
            .mark_splits_for_deletion(mark_splits_for_deletion)
            .await
            .unwrap();
    }

    let expected_all = [
        &split_metadata_1,
        &split_metadata_3,
        &split_metadata_5,
        &split_metadata_2,
        &split_metadata_4,
        &split_metadata_6,
    ];

    let expected_res = expected_all[1..]
        .iter()
        .map(|split| (&split.index_uid, &split.split_id))
        .collect::<Vec<_>>();

    let query = ListSplitsQuery::for_all_indexes()
        .sort_by_index_uid()
        .after_split(expected_all[0]);
    let splits = metastore
        .list_splits(ListSplitsRequest::try_from_list_splits_query(&query).unwrap())
        .await
        .unwrap()
        .collect_splits()
        .await
        .unwrap();
    // we don't use collect_split_ids because it sorts splits internally
    let split_ids = splits
        .iter()
        .map(|split| {
            (
                &split.split_metadata.index_uid,
                &split.split_metadata.split_id,
            )
        })
        // when running this test against a clean database, this line isn't needed. In practice,
        // any test that leaves any split behind breaks this test if we remove this filter
        .filter(|(index_uid, _split_id)| {
            [index_uid_1.clone(), index_uid_2.clone()].contains(index_uid)
        })
        .collect::<Vec<_>>();
    assert_eq!(split_ids, expected_res);

    cleanup_index(&mut metastore, index_uid_1.clone()).await;
    cleanup_index(&mut metastore, index_uid_2.clone()).await;
}


================================================
FILE: quickwit/quickwit-metastore/src/tests/mod.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::BTreeSet;

use async_trait::async_trait;
use bytesize::ByteSize;
use itertools::Itertools;
use quickwit_proto::metastore::metastore_service_grpc_client::MetastoreServiceGrpcClient;
use quickwit_proto::metastore::{
    DeleteIndexRequest, DeleteSplitsRequest, ListSplitsRequest, MarkSplitsForDeletionRequest,
    MetastoreServiceClient, MetastoreServiceGrpcClientAdapter,
};
use quickwit_proto::tonic::transport::Channel;
use quickwit_proto::types::IndexUid;

pub(crate) mod delete_task;
pub(crate) mod get_identity;
pub(crate) mod index;
pub(crate) mod list_splits;
pub(crate) mod shard;
pub(crate) mod source;
pub(crate) mod split;
pub(crate) mod template;

use crate::metastore::MetastoreServiceStreamSplitsExt;
use crate::{ListSplitsRequestExt, MetastoreServiceExt, Split};

const MAX_GRPC_MESSAGE_SIZE: ByteSize = ByteSize::mib(1);

#[async_trait]
pub trait DefaultForTest {
    async fn default_for_test() -> Self;
}

// We implement the trait to test the gRPC adapter backed by a file backed metastore.
#[async_trait]
impl DefaultForTest for MetastoreServiceGrpcClientAdapter<MetastoreServiceGrpcClient<Channel>> {
    async fn default_for_test() -> Self {
        use quickwit_proto::tonic::transport::Server;
        use quickwit_storage::RamStorage;

        use crate::FileBackedMetastore;
        let metastore =
            FileBackedMetastore::try_new(std::sync::Arc::new(RamStorage::default()), None)
                .await
                .unwrap();
        let (client, server) = tokio::io::duplex(1024);
        tokio::spawn(async move {
            Server::builder()
                .add_service(
                    MetastoreServiceClient::new(metastore).as_grpc_service(MAX_GRPC_MESSAGE_SIZE),
                )
                .serve_with_incoming(futures::stream::iter(vec![Ok::<_, std::io::Error>(server)]))
                .await
        });
        let channel = create_channel(client).await.unwrap();
        let (_, connection_keys_watcher) =
            tokio::sync::watch::channel(std::collections::HashSet::new());

        MetastoreServiceGrpcClientAdapter::new(
            MetastoreServiceGrpcClient::new(channel),
            connection_keys_watcher,
        )
    }
}

impl MetastoreServiceExt
    for MetastoreServiceGrpcClientAdapter<MetastoreServiceGrpcClient<Channel>>
{
}

async fn create_channel(client: tokio::io::DuplexStream) -> anyhow::Result<Channel> {
    use http::Uri;
    use quickwit_proto::tonic::transport::Endpoint;

    let mut outer_client_opt = Some(client);
    let channel = Endpoint::try_from("http://test.server")?
        .connect_with_connector(tower::service_fn(move |_: Uri| {
            let inner_client_opt = outer_client_opt.take();
            async move {
                let client = inner_client_opt
                    .ok_or_else(|| std::io::Error::other("client already taken"))?;
                std::io::Result::Ok(hyper_util::rt::TokioIo::new(client))
            }
        }))
        .await?;
    Ok(channel)
}

// crate::metastore_test_suite!(
//     quickwit_proto::metastore::MetastoreServiceGrpcClientAdapter<
//         quickwit_proto::metastore::metastore_service_grpc_client::MetastoreServiceGrpcClient<
//             quickwit_proto::tonic::transport::Channel,
//         >,
//     >
// );

fn collect_split_ids(splits: &[Split]) -> Vec<&str> {
    splits
        .iter()
        .map(|split| split.split_id())
        .sorted()
        .collect()
}

fn to_btree_set(tags: &[&str]) -> BTreeSet<String> {
    tags.iter().map(|tag| tag.to_string()).collect()
}

async fn cleanup_index(metastore: &mut dyn MetastoreServiceExt, index_uid: IndexUid) {
    // List all splits.
    let all_splits = metastore
        .list_splits(ListSplitsRequest::try_from_index_uid(index_uid.clone()).unwrap())
        .await
        .unwrap()
        .collect_splits()
        .await
        .unwrap();

    if !all_splits.is_empty() {
        let all_split_ids: Vec<String> = all_splits
            .iter()
            .map(|split| split.split_id().to_string())
            .collect();

        // Mark splits for deletion.
        let mark_splits_for_deletion_request =
            MarkSplitsForDeletionRequest::new(index_uid.clone(), all_split_ids.clone());
        metastore
            .mark_splits_for_deletion(mark_splits_for_deletion_request)
            .await
            .unwrap();

        // Delete splits.
        let delete_splits_request = DeleteSplitsRequest {
            index_uid: index_uid.clone().into(),
            split_ids: all_split_ids,
        };
        metastore
            .delete_splits(delete_splits_request)
            .await
            .unwrap();
    }
    // Delete index.
    metastore
        .delete_index(DeleteIndexRequest {
            index_uid: index_uid.clone().into(),
        })
        .await
        .unwrap();
}

/// macro used to generate a testsuite for an implementation of Metastore
#[macro_export]
macro_rules! metastore_test_suite {
    ($metastore_type:ty) => {
        #[cfg(test)]
        mod common_tests {

            // Index API tests
            //
            //  - create_index
            //  - update_index
            //  - index_exists
            //  - index_metadata
            //  - indexes_metadata
            //  - list_indexes
            //  - delete_index
            //  - list_index_stats

            #[tokio::test]
            #[serial_test::file_serial]
            async fn test_metastore_create_index() {
                let _ = tracing_subscriber::fmt::try_init();
                $crate::tests::index::test_metastore_create_index::<$metastore_type>().await;
            }

            #[tokio::test]
            #[serial_test::file_serial]
            async fn test_metastore_create_index_with_sources() {
                let _ = tracing_subscriber::fmt::try_init();
                $crate::tests::index::test_metastore_create_index_with_sources::<$metastore_type>().await;
            }

            #[tokio::test]
            #[serial_test::file_serial]
            async fn test_metastore_update_retention_policy() {
                let _ = tracing_subscriber::fmt::try_init();
                $crate::tests::index::test_metastore_update_retention_policy::<$metastore_type>().await;
            }

            #[tokio::test]
            #[serial_test::file_serial]
            async fn test_metastore_update_search_settings() {
                let _ = tracing_subscriber::fmt::try_init();
                $crate::tests::index::test_metastore_update_search_settings::<$metastore_type>().await;
            }

            #[tokio::test]
            #[serial_test::file_serial]
            async fn test_metastore_update_doc_mapping() {
                let _ = tracing_subscriber::fmt::try_init();
                $crate::tests::index::test_metastore_update_doc_mapping::<$metastore_type>().await;
            }

            #[tokio::test]
            #[serial_test::file_serial]
            async fn test_metastore_update_indexing_settings() {
                let _ = tracing_subscriber::fmt::try_init();
                $crate::tests::index::test_metastore_update_indexing_settings::<$metastore_type>().await;
            }

            #[tokio::test]
            #[serial_test::file_serial]
            async fn test_metastore_update_ingest_settings() {
                let _ = tracing_subscriber::fmt::try_init();
                $crate::tests::index::test_metastore_update_ingest_settings::<$metastore_type>().await;
            }

            #[tokio::test]
            #[serial_test::file_serial]
            async fn test_metastore_create_index_enforces_index_id_maximum_length() {
                let _ = tracing_subscriber::fmt::try_init();
                $crate::tests::index::test_metastore_create_index_enforces_index_id_maximum_length::<
                    $metastore_type,
                >()
                .await;
            }

            #[tokio::test]
            #[serial_test::file_serial]
            async fn test_metastore_index_exists() {
                let _ = tracing_subscriber::fmt::try_init();
                $crate::tests::index::test_metastore_index_exists::<$metastore_type>().await;
            }

            #[tokio::test]
            #[serial_test::file_serial]
            async fn test_metastore_index_metadata() {
                let _ = tracing_subscriber::fmt::try_init();
                $crate::tests::index::test_metastore_index_metadata::<$metastore_type>().await;
            }

            #[tokio::test]
            #[serial_test::file_serial]
            async fn test_metastore_indexes_metadata() {
                let _ = tracing_subscriber::fmt::try_init();
                $crate::tests::index::test_metastore_indexes_metadata::<$metastore_type>().await;
            }

            #[tokio::test]
            #[serial_test::file_serial]
            async fn test_metastore_list_indexes() {
                let _ = tracing_subscriber::fmt::try_init();
                $crate::tests::index::test_metastore_list_indexes::<$metastore_type>().await;
            }

            #[tokio::test]
            #[serial_test::file_serial]
            async fn test_metastore_list_all_indexes() {
                let _ = tracing_subscriber::fmt::try_init();
                $crate::tests::index::test_metastore_list_all_indexes::<$metastore_type>().await;
            }

            #[tokio::test]
            #[serial_test::file_serial]
            async fn test_metastore_delete_index() {
                let _ = tracing_subscriber::fmt::try_init();
                $crate::tests::index::test_metastore_delete_index::<$metastore_type>().await;
            }

            #[tokio::test]
            #[serial_test::file_serial]
            async fn test_metastore_list_index_stats() {
                let _ = tracing_subscriber::fmt::try_init();
                $crate::tests::index::test_metastore_list_index_stats::<$metastore_type>().await;
            }

            #[tokio::test]
            #[serial_test::file_serial]
            async fn test_metastore_list_index_stats_no_splits() {
                let _ = tracing_subscriber::fmt::try_init();
                $crate::tests::index::test_metastore_list_index_stats_no_splits::<$metastore_type>().await;
            }

            // Split API tests
            //
            //  - stage_splits
            //  - publish_splits
            //  - stream_splits
            //  - mark_splits_for_deletion
            //  - delete_splits

            #[tokio::test]
            #[serial_test::file_serial]
            async fn test_metastore_publish_splits() {
                let _ = tracing_subscriber::fmt::try_init();
                $crate::tests::split::test_metastore_publish_splits::<$metastore_type>().await;
            }

            #[tokio::test]
            #[serial_test::file_serial]
            async fn test_metastore_publish_splits_concurrency() {
                let _ = tracing_subscriber::fmt::try_init();
                $crate::tests::split::test_metastore_publish_splits_concurrency::<$metastore_type>(
                )
                .await;
            }

            #[tokio::test]
            #[serial_test::file_serial]
            async fn test_metastore_publish_splits_empty_splits_array_is_allowed() {
                $crate::tests::split::test_metastore_publish_splits_empty_splits_array_is_allowed::<
                            $metastore_type,
                        >()
                        .await;
            }

            #[tokio::test]
            #[serial_test::file_serial]
            async fn test_metastore_replace_splits() {
                let _ = tracing_subscriber::fmt::try_init();
                $crate::tests::split::test_metastore_replace_splits::<$metastore_type>().await;
            }

            #[tokio::test]
            #[serial_test::file_serial]
            async fn test_metastore_mark_splits_for_deletion() {
                let _ = tracing_subscriber::fmt::try_init();
                $crate::tests::split::test_metastore_mark_splits_for_deletion::<$metastore_type>()
                    .await;
            }

            #[tokio::test]
            #[serial_test::file_serial]
            async fn test_metastore_delete_splits() {
                let _ = tracing_subscriber::fmt::try_init();
                $crate::tests::split::test_metastore_delete_splits::<$metastore_type>().await;
            }

            #[tokio::test]
            #[serial_test::file_serial]
            async fn test_metastore_stream_splits() {
                let _ = tracing_subscriber::fmt::try_init();
                $crate::tests::list_splits::test_metastore_stream_splits::<$metastore_type>().await;
            }

            #[tokio::test]
            #[serial_test::file_serial]
            async fn test_metastore_list_all_splits() {
                let _ = tracing_subscriber::fmt::try_init();
                $crate::tests::list_splits::test_metastore_list_all_splits::<$metastore_type>().await;
            }

            #[tokio::test]
            #[serial_test::file_serial]
            async fn test_metastore_list_splits() {
                let _ = tracing_subscriber::fmt::try_init();
                $crate::tests::list_splits::test_metastore_list_splits::<$metastore_type>().await;
            }


            #[tokio::test]
            #[serial_test::file_serial]
            async fn test_metastore_list_splits_by_node() {
                let _ = tracing_subscriber::fmt::try_init();
                $crate::tests::list_splits::test_metastore_list_splits_by_node_id::<$metastore_type>().await;
            }

            #[tokio::test]
            #[serial_test::file_serial]
            async fn test_metastore_split_update_timestamp() {
                let _ = tracing_subscriber::fmt::try_init();
                $crate::tests::split::test_metastore_split_update_timestamp::<$metastore_type>()
                    .await;
            }

            #[tokio::test]
            #[serial_test::file_serial]
            async fn test_metastore_add_source() {
                let _ = tracing_subscriber::fmt::try_init();
                $crate::tests::source::test_metastore_add_source::<$metastore_type>().await;
            }

            #[tokio::test]
            #[serial_test::file_serial]
            async fn test_metastore_update_source() {
                let _ = tracing_subscriber::fmt::try_init();
                $crate::tests::source::test_metastore_update_source::<$metastore_type>().await;
            }

            #[tokio::test]
            #[serial_test::file_serial]
            async fn test_metastore_toggle_source() {
                let _ = tracing_subscriber::fmt::try_init();
                $crate::tests::source::test_metastore_toggle_source::<$metastore_type>().await;
            }

            #[tokio::test]
            #[serial_test::file_serial]
            async fn test_metastore_delete_source() {
                let _ = tracing_subscriber::fmt::try_init();
                $crate::tests::source::test_metastore_delete_source::<$metastore_type>().await;
            }

            #[tokio::test]
            #[serial_test::file_serial]
            async fn test_metastore_reset_checkpoint() {
                let _ = tracing_subscriber::fmt::try_init();
                $crate::tests::source::test_metastore_reset_checkpoint::<$metastore_type>().await;
            }

            #[tokio::test]
            #[serial_test::file_serial]
            async fn test_metastore_create_delete_task() {
                let _ = tracing_subscriber::fmt::try_init();
                $crate::tests::delete_task::test_metastore_create_delete_task::<$metastore_type>().await;
            }

            #[tokio::test]
            #[serial_test::file_serial]
            async fn test_metastore_last_delete_opstamp() {
                let _ = tracing_subscriber::fmt::try_init();
                $crate::tests::delete_task::test_metastore_last_delete_opstamp::<$metastore_type>().await;
            }

            #[tokio::test]
            #[serial_test::file_serial]
            async fn test_metastore_delete_index_with_tasks() {
                let _ = tracing_subscriber::fmt::try_init();
                $crate::tests::delete_task::test_metastore_delete_index_with_tasks::<$metastore_type>().await;
            }

            #[tokio::test]
            #[serial_test::file_serial]
            async fn test_metastore_list_delete_tasks() {
                let _ = tracing_subscriber::fmt::try_init();
                $crate::tests::delete_task::test_metastore_list_delete_tasks::<$metastore_type>().await;
            }

            #[tokio::test]
            #[serial_test::file_serial]
            async fn test_metastore_list_stale_splits() {
                let _ = tracing_subscriber::fmt::try_init();
                $crate::tests::list_splits::test_metastore_list_stale_splits::<$metastore_type>().await;
            }

            #[tokio::test]
            #[serial_test::file_serial]
            async fn test_metastore_list_sorted_splits() {
                let _ = tracing_subscriber::fmt::try_init();
                $crate::tests::list_splits::test_metastore_list_sorted_splits::<$metastore_type>().await;
            }

            #[tokio::test]
            #[serial_test::file_serial]
            async fn test_metastore_list_after_split() {
                let _ = tracing_subscriber::fmt::try_init();
                $crate::tests::list_splits::test_metastore_list_after_split::<$metastore_type>().await;
            }

            #[tokio::test]
            #[serial_test::file_serial]
            async fn test_metastore_list_splits_from_all_indexes() {
                let _ = tracing_subscriber::fmt::try_init();
                $crate::tests::list_splits::test_metastore_list_splits_from_all_indexes::<$metastore_type>().await;
            }

            #[tokio::test]
            #[serial_test::file_serial]
            async fn test_metastore_update_splits_delete_opstamp() {
                let _ = tracing_subscriber::fmt::try_init();
                $crate::tests::split::test_metastore_update_splits_delete_opstamp::<$metastore_type>()
                    .await;
            }

            #[tokio::test]
            #[serial_test::file_serial]
            async fn test_metastore_stage_splits() {
                let _ = tracing_subscriber::fmt::try_init();
                $crate::tests::split::test_metastore_stage_splits::<$metastore_type>().await;
            }

            /// Shard API tests

            #[tokio::test]
            #[serial_test::file_serial]
            async fn test_metastore_open_shards() {
                $crate::tests::shard::test_metastore_open_shards::<$metastore_type>().await;
            }

            #[tokio::test]
            #[serial_test::file_serial]
            async fn test_metastore_acquire_shards() {
                $crate::tests::shard::test_metastore_acquire_shards::<$metastore_type>().await;
            }

            #[tokio::test]
            #[serial_test::file_serial]
            async fn test_metastore_list_shards() {
                $crate::tests::shard::test_metastore_list_shards::<$metastore_type>().await;
            }

            #[tokio::test]
            #[serial_test::file_serial]
            async fn test_metastore_delete_shards() {
                $crate::tests::shard::test_metastore_delete_shards::<$metastore_type>().await;
            }

            #[tokio::test]
            #[serial_test::file_serial]
            async fn test_metastore_prune_shards() {
                $crate::tests::shard::test_metastore_prune_shards::<$metastore_type>().await;
            }

            #[tokio::test]
            #[serial_test::serial]
            async fn test_metastore_apply_checkpoint_delta_v2_single_shard() {
                $crate::tests::shard::test_metastore_apply_checkpoint_delta_v2_single_shard::<$metastore_type>().await;
            }

            #[tokio::test]
            #[serial_test::file_serial]
            async fn test_metastore_apply_checkpoint_delta_v2_multi_shards() {
                $crate::tests::shard::test_metastore_apply_checkpoint_delta_v2_multi_shards::<$metastore_type>().await;
            }

            /// Index Template API tests

            #[tokio::test]
            #[serial_test::file_serial]
            async fn test_metastore_create_index_template() {
                $crate::tests::template::test_metastore_create_index_template::<$metastore_type>().await;
            }

            #[tokio::test]
            #[serial_test::file_serial]
            async fn test_metastore_get_index_template() {
                $crate::tests::template::test_metastore_get_index_template::<$metastore_type>().await;
            }

            #[tokio::test]
            #[serial_test::file_serial]
            async fn test_metastore_find_index_template_matches() {
                $crate::tests::template::test_metastore_find_index_template_matches::<$metastore_type>().await;
            }

            #[tokio::test]
            #[serial_test::file_serial]
            async fn test_metastore_list_index_templates() {
                $crate::tests::template::test_metastore_list_index_templates::<$metastore_type>().await;
            }

            #[tokio::test]
            #[serial_test::file_serial]
            async fn test_metastore_delete_index_templates() {
                $crate::tests::template::test_metastore_delete_index_templates::<$metastore_type>().await;
            }

            #[tokio::test]
            #[serial_test::file_serial]
            async fn test_metastore_get_identity() {
                let _ = tracing_subscriber::fmt::try_init();
                $crate::tests::get_identity::test_metastore_get_identity::<$metastore_type>().await;
            }
        }
    };
}


================================================
FILE: quickwit/quickwit-metastore/src/tests/shard.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use async_trait::async_trait;
use itertools::Itertools;
use quickwit_common::rand::append_random_suffix;
use quickwit_config::{IndexConfig, SourceConfig};
use quickwit_proto::compatibility_shard_update_timestamp;
use quickwit_proto::ingest::{Shard, ShardState};
use quickwit_proto::metastore::{
    AcquireShardsRequest, AddSourceRequest, CreateIndexRequest, DeleteShardsRequest, EntityKind,
    ListShardsRequest, ListShardsSubrequest, MetastoreError, MetastoreService, OpenShardSubrequest,
    OpenShardsRequest, PruneShardsRequest, PublishSplitsRequest,
};
use quickwit_proto::types::{DocMappingUid, IndexUid, Position, ShardId, SourceId};
use time::OffsetDateTime;

use super::DefaultForTest;
use crate::checkpoint::{IndexCheckpointDelta, PartitionId, SourceCheckpointDelta};
use crate::tests::cleanup_index;
use crate::{AddSourceRequestExt, CreateIndexRequestExt, MetastoreServiceExt};

#[async_trait]
pub trait ReadWriteShardsForTest {
    async fn insert_shards(&self, index_uid: &IndexUid, source_id: &SourceId, shards: Vec<Shard>);

    async fn list_all_shards(&self, index_uid: &IndexUid, source_id: &SourceId) -> Vec<Shard>;
}

struct TestIndex {
    index_uid: IndexUid,
    source_id: SourceId,
}

impl TestIndex {
    async fn create_index_with_source(
        metastore: &mut dyn MetastoreService,
        index_id: &str,
        source_config: SourceConfig,
    ) -> Self {
        let index_id = append_random_suffix(index_id);
        let index_uri = format!("ram:///indexes/{index_id}");
        let index_config = IndexConfig::for_test(&index_id, &index_uri);

        let create_index_request =
            CreateIndexRequest::try_from_index_config(&index_config).unwrap();
        let create_index_response = metastore.create_index(create_index_request).await.unwrap();
        let index_uid: IndexUid = create_index_response.index_uid().clone();

        let add_source_request =
            AddSourceRequest::try_from_source_config(index_uid.clone(), &source_config).unwrap();
        metastore.add_source(add_source_request).await.unwrap();

        Self {
            index_uid,
            source_id: source_config.source_id,
        }
    }
}

pub async fn test_metastore_open_shards<
    MetastoreUnderTest: MetastoreService + MetastoreServiceExt + DefaultForTest + ReadWriteShardsForTest,
>() {
    let mut metastore = MetastoreUnderTest::default_for_test().await;

    let test_index = TestIndex::create_index_with_source(
        &mut metastore,
        "test-open-shards",
        SourceConfig::ingest_v2(),
    )
    .await;

    // Test empty request.
    let open_shards_request = OpenShardsRequest {
        subrequests: Vec::new(),
    };
    let open_shards_response = metastore.open_shards(open_shards_request).await.unwrap();
    assert!(open_shards_response.subresponses.is_empty());

    // Test index not found.
    // let open_shards_request = OpenShardsRequest {
    //     subrequests: vec![OpenShardSubrequest {
    //         index_uid: "index-does-not-exist:0".to_string(),
    //         source_id: test_index.source_id.clone(),
    //         leader_id: "test-ingester-foo".to_string(),
    //         ..Default::default()
    //     }],
    // };
    // let error = metastore
    //     .open_shards(open_shards_request)
    //     .await
    //     .unwrap_err();
    // assert!(
    //     matches!(error, MetastoreError::NotFound(EntityKind::Index { index_id }) if index_id ==
    // "index-does-not-exist") );

    // // Test source not found.
    // let open_shards_request = OpenShardsRequest {
    //     subrequests: vec![OpenShardSubrequest {
    //         index_uid: Some(test_index.index_uid.clone()),
    //         source_id: "source-does-not-exist".to_string(),
    //         leader_id: "test-ingester-foo".to_string(),
    //         ..Default::default()
    //     }],
    // };
    // let error = metastore
    //     .open_shards(open_shards_request)
    //     .await
    //     .unwrap_err();
    // assert!(
    //     matches!(error, MetastoreError::NotFound(EntityKind::Source { source_id, ..}) if
    // source_id == "source-does-not-exist") );

    // Test open shard #1.
    let open_shards_request = OpenShardsRequest {
        subrequests: vec![OpenShardSubrequest {
            subrequest_id: 0,
            index_uid: Some(test_index.index_uid.clone()),
            source_id: test_index.source_id.clone(),
            shard_id: Some(ShardId::from(1)),
            leader_id: "test-ingester-foo".to_string(),
            follower_id: Some("test-ingester-bar".to_string()),
            doc_mapping_uid: Some(DocMappingUid::default()),
            publish_token: None,
        }],
    };
    let open_shards_response = metastore.open_shards(open_shards_request).await.unwrap();
    assert_eq!(open_shards_response.subresponses.len(), 1);

    let subresponse = &open_shards_response.subresponses[0];
    assert_eq!(subresponse.subrequest_id, 0);

    let shard = subresponse.open_shard();
    assert_eq!(shard.index_uid(), &test_index.index_uid);
    assert_eq!(shard.source_id, test_index.source_id);
    assert_eq!(shard.shard_id(), ShardId::from(1));
    assert_eq!(shard.shard_state(), ShardState::Open);
    assert_eq!(shard.leader_id, "test-ingester-foo");
    assert_eq!(shard.follower_id(), "test-ingester-bar");
    assert_eq!(shard.doc_mapping_uid(), DocMappingUid::default(),);
    assert_eq!(shard.publish_position_inclusive(), Position::Beginning);
    let shard_ts = shard.update_timestamp;
    assert_ne!(shard_ts, compatibility_shard_update_timestamp());
    assert_ne!(shard_ts, 0);
    assert!(shard.publish_token.is_none());

    // Test open shard #1 is idempotent.
    let open_shards_request = OpenShardsRequest {
        subrequests: vec![OpenShardSubrequest {
            subrequest_id: 0,
            index_uid: Some(test_index.index_uid.clone()),
            source_id: test_index.source_id.clone(),
            shard_id: Some(ShardId::from(1)),
            leader_id: "test-ingester-foo".to_string(),
            follower_id: Some("test-ingester-bar".to_string()),
            doc_mapping_uid: Some(DocMappingUid::default()),
            publish_token: Some("publish-token-baz".to_string()),
        }],
    };
    let open_shards_response = metastore.open_shards(open_shards_request).await.unwrap();
    assert_eq!(open_shards_response.subresponses.len(), 1);

    let subresponse = &open_shards_response.subresponses[0];
    assert_eq!(subresponse.subrequest_id, 0);

    let shard = subresponse.open_shard();
    assert_eq!(shard.index_uid(), &test_index.index_uid);
    assert_eq!(shard.source_id, test_index.source_id);
    assert_eq!(shard.shard_id(), ShardId::from(1));
    assert_eq!(shard.shard_state(), ShardState::Open);
    assert_eq!(shard.leader_id, "test-ingester-foo");
    assert_eq!(shard.follower_id(), "test-ingester-bar");
    assert_eq!(shard.publish_position_inclusive(), Position::Beginning);
    assert_eq!(shard.update_timestamp, shard_ts);
    assert!(shard.publish_token.is_none());

    // Test open shard #2.
    let open_shards_request = OpenShardsRequest {
        subrequests: vec![OpenShardSubrequest {
            subrequest_id: 0,
            index_uid: Some(test_index.index_uid.clone()),
            source_id: test_index.source_id.clone(),
            shard_id: Some(ShardId::from(2)),
            leader_id: "test-ingester-foo".to_string(),
            follower_id: None,
            doc_mapping_uid: Some(DocMappingUid::default()),
            publish_token: Some("publish-token-open".to_string()),
        }],
    };
    let open_shards_response = metastore.open_shards(open_shards_request).await.unwrap();
    assert_eq!(open_shards_response.subresponses.len(), 1);

    let subresponse = &open_shards_response.subresponses[0];
    assert_eq!(subresponse.subrequest_id, 0);

    let shard = subresponse.open_shard();
    assert_eq!(shard.index_uid(), &test_index.index_uid);
    assert_eq!(shard.source_id, test_index.source_id);
    assert_eq!(shard.shard_id(), ShardId::from(2));
    assert_eq!(shard.shard_state(), ShardState::Open);
    assert_eq!(shard.leader_id, "test-ingester-foo");
    assert!(shard.follower_id.is_none());
    assert_eq!(shard.publish_position_inclusive(), Position::Beginning);
    assert_eq!(shard.publish_token(), "publish-token-open");

    cleanup_index(&mut metastore, test_index.index_uid).await;
}

pub async fn test_metastore_acquire_shards<
    MetastoreUnderTest: MetastoreService + MetastoreServiceExt + DefaultForTest + ReadWriteShardsForTest,
>() {
    let mut metastore = MetastoreUnderTest::default_for_test().await;

    let test_index = TestIndex::create_index_with_source(
        &mut metastore,
        "test-acquire-shards",
        SourceConfig::ingest_v2(),
    )
    .await;

    let shards = vec![
        Shard {
            index_uid: Some(test_index.index_uid.clone()),
            source_id: test_index.source_id.clone(),
            shard_id: Some(ShardId::from(1)),
            shard_state: ShardState::Closed as i32,
            leader_id: "test-ingester-foo".to_string(),
            follower_id: Some("test-ingester-bar".to_string()),
            doc_mapping_uid: Some(DocMappingUid::default()),
            publish_position_inclusive: Some(Position::Beginning),
            publish_token: Some("test-publish-token-foo".to_string()),
            update_timestamp: 1724158996,
        },
        Shard {
            index_uid: Some(test_index.index_uid.clone()),
            source_id: test_index.source_id.clone(),
            shard_id: Some(ShardId::from(2)),
            shard_state: ShardState::Open as i32,
            leader_id: "test-ingester-bar".to_string(),
            follower_id: Some("test-ingester-qux".to_string()),
            doc_mapping_uid: Some(DocMappingUid::default()),
            publish_position_inclusive: Some(Position::Beginning),
            publish_token: Some("test-publish-token-bar".to_string()),
            update_timestamp: 1724158996,
        },
        Shard {
            index_uid: Some(test_index.index_uid.clone()),
            source_id: test_index.source_id.clone(),
            shard_id: Some(ShardId::from(3)),
            shard_state: ShardState::Open as i32,
            leader_id: "test-ingester-qux".to_string(),
            follower_id: Some("test-ingester-baz".to_string()),
            doc_mapping_uid: Some(DocMappingUid::default()),
            publish_position_inclusive: Some(Position::Beginning),
            publish_token: None,
            update_timestamp: 1724158996,
        },
        Shard {
            index_uid: Some(test_index.index_uid.clone()),
            source_id: test_index.source_id.clone(),
            shard_id: Some(ShardId::from(4)),
            shard_state: ShardState::Open as i32,
            leader_id: "test-ingester-baz".to_string(),
            follower_id: Some("test-ingester-tux".to_string()),
            doc_mapping_uid: Some(DocMappingUid::default()),
            publish_position_inclusive: Some(Position::Beginning),
            publish_token: None,
            update_timestamp: 1724158996,
        },
    ];
    metastore
        .insert_shards(&test_index.index_uid, &test_index.source_id, shards)
        .await;

    // Test acquire shards.
    let acquire_shards_request = AcquireShardsRequest {
        index_uid: Some(test_index.index_uid.clone()),
        source_id: test_index.source_id.clone(),
        shard_ids: vec![
            ShardId::from(1),
            ShardId::from(2),
            ShardId::from(3),
            ShardId::from(666),
        ], // shard 666 does not exist
        publish_token: "test-publish-token-foo".to_string(),
    };
    let mut acquire_shards_response = metastore
        .acquire_shards(acquire_shards_request)
        .await
        .unwrap();

    acquire_shards_response
        .acquired_shards
        .sort_unstable_by(|left, right| left.shard_id().cmp(right.shard_id()));

    let shard = &acquire_shards_response.acquired_shards[0];
    assert_eq!(shard.index_uid(), &test_index.index_uid);
    assert_eq!(shard.source_id, test_index.source_id);
    assert_eq!(shard.shard_id(), ShardId::from(1));
    assert_eq!(shard.shard_state(), ShardState::Closed);
    assert_eq!(shard.leader_id, "test-ingester-foo");
    assert_eq!(shard.follower_id(), "test-ingester-bar");
    assert_eq!(shard.publish_position_inclusive(), Position::Beginning);
    assert_eq!(shard.publish_token(), "test-publish-token-foo");

    let shard = &acquire_shards_response.acquired_shards[1];
    assert_eq!(shard.index_uid(), &test_index.index_uid);
    assert_eq!(shard.source_id, test_index.source_id);
    assert_eq!(shard.shard_id(), ShardId::from(2));
    assert_eq!(shard.shard_state(), ShardState::Open);
    assert_eq!(shard.leader_id, "test-ingester-bar");
    assert_eq!(shard.follower_id(), "test-ingester-qux");
    assert_eq!(shard.publish_position_inclusive(), Position::Beginning);
    assert_eq!(shard.publish_token(), "test-publish-token-foo");

    let shard = &acquire_shards_response.acquired_shards[2];
    assert_eq!(shard.index_uid(), &test_index.index_uid);
    assert_eq!(shard.source_id, test_index.source_id);
    assert_eq!(shard.shard_id(), ShardId::from(3));
    assert_eq!(shard.shard_state(), ShardState::Open);
    assert_eq!(shard.leader_id, "test-ingester-qux");
    assert_eq!(shard.follower_id(), "test-ingester-baz");
    assert_eq!(shard.publish_position_inclusive(), Position::Beginning);
    assert_eq!(shard.publish_token(), "test-publish-token-foo");

    cleanup_index(&mut metastore, test_index.index_uid).await;
}

pub async fn test_metastore_list_shards<
    MetastoreUnderTest: MetastoreService + MetastoreServiceExt + DefaultForTest + ReadWriteShardsForTest,
>() {
    let mut metastore = MetastoreUnderTest::default_for_test().await;

    let test_index_0 = TestIndex::create_index_with_source(
        &mut metastore,
        "test-list-shards-0",
        SourceConfig::ingest_v2(),
    )
    .await;

    let test_index_1 = TestIndex::create_index_with_source(
        &mut metastore,
        "test-list-shards-1",
        SourceConfig::ingest_v2(),
    )
    .await;

    for test_index in [&test_index_0, &test_index_1] {
        let shards = vec![
            Shard {
                index_uid: Some(test_index.index_uid.clone()),
                source_id: test_index.source_id.clone(),
                shard_id: Some(ShardId::from(1)),
                shard_state: ShardState::Open as i32,
                leader_id: "test-ingester-foo".to_string(),
                follower_id: Some("test-ingester-bar".to_string()),
                doc_mapping_uid: Some(DocMappingUid::default()),
                publish_position_inclusive: Some(Position::Beginning),
                publish_token: Some("test-publish-token-foo".to_string()),
                update_timestamp: 1724158996,
            },
            Shard {
                index_uid: Some(test_index.index_uid.clone()),
                source_id: test_index.source_id.clone(),
                shard_id: Some(ShardId::from(2)),
                shard_state: ShardState::Closed as i32,
                leader_id: "test-ingester-bar".to_string(),
                follower_id: Some("test-ingester-qux".to_string()),
                doc_mapping_uid: Some(DocMappingUid::default()),
                publish_position_inclusive: Some(Position::Beginning),
                publish_token: Some("test-publish-token-bar".to_string()),
                update_timestamp: 1724158997,
            },
        ];
        metastore
            .insert_shards(&test_index.index_uid, &test_index.source_id, shards)
            .await;
    }

    // Test list shards.
    let list_shards_request = ListShardsRequest {
        subrequests: vec![
            ListShardsSubrequest {
                index_uid: Some(test_index_0.index_uid.clone()),
                source_id: test_index_0.source_id.clone(),
                shard_state: None,
            },
            ListShardsSubrequest {
                index_uid: Some(test_index_1.index_uid.clone()),
                source_id: test_index_1.source_id.clone(),
                shard_state: None,
            },
        ],
    };
    let mut list_shards_response = metastore.list_shards(list_shards_request).await.unwrap();
    assert_eq!(list_shards_response.subresponses.len(), 2);

    list_shards_response
        .subresponses
        .sort_unstable_by(|left, right| left.index_uid().cmp(right.index_uid()));

    for (idx, test_index) in [&test_index_0, &test_index_1].into_iter().enumerate() {
        let subresponse = &mut list_shards_response.subresponses[idx];
        assert_eq!(subresponse.index_uid(), &test_index.index_uid);
        assert_eq!(subresponse.source_id, test_index.source_id);
        assert_eq!(subresponse.shards.len(), 2);

        subresponse
            .shards
            .sort_unstable_by(|left, right| left.shard_id.cmp(&right.shard_id));

        let shard = &subresponse.shards[0];
        assert_eq!(shard.index_uid(), &test_index.index_uid);
        assert_eq!(shard.source_id, test_index.source_id);
        assert_eq!(shard.shard_id(), ShardId::from(1));
        assert_eq!(shard.shard_state(), ShardState::Open);
        assert_eq!(shard.leader_id, "test-ingester-foo");
        assert_eq!(shard.follower_id(), "test-ingester-bar");
        assert_eq!(shard.publish_position_inclusive(), Position::Beginning);
        assert_eq!(shard.publish_token(), "test-publish-token-foo");
        assert_eq!(shard.update_timestamp, 1724158996);

        let shard = &subresponse.shards[1];
        assert_eq!(shard.index_uid(), &test_index.index_uid);
        assert_eq!(shard.source_id, test_index.source_id);
        assert_eq!(shard.shard_id(), ShardId::from(2));
        assert_eq!(shard.shard_state(), ShardState::Closed);
        assert_eq!(shard.leader_id, "test-ingester-bar");
        assert_eq!(shard.follower_id(), "test-ingester-qux");
        assert_eq!(shard.publish_position_inclusive(), Position::Beginning);
        assert_eq!(shard.publish_token(), "test-publish-token-bar");
        assert_eq!(shard.update_timestamp, 1724158997);
    }

    // Test list shards with shard state filter.
    let list_shards_request = ListShardsRequest {
        subrequests: vec![
            ListShardsSubrequest {
                index_uid: Some(test_index_0.index_uid.clone()),
                source_id: test_index_0.source_id.clone(),
                shard_state: Some(ShardState::Open as i32),
            },
            ListShardsSubrequest {
                index_uid: Some(test_index_1.index_uid.clone()),
                source_id: test_index_1.source_id.clone(),
                shard_state: Some(ShardState::Closed as i32),
            },
        ],
    };
    let mut list_shards_response = metastore.list_shards(list_shards_request).await.unwrap();
    assert_eq!(list_shards_response.subresponses.len(), 2);

    list_shards_response
        .subresponses
        .sort_unstable_by(|left, right| left.index_uid().cmp(right.index_uid()));

    assert_eq!(list_shards_response.subresponses[0].shards.len(), 1);

    let shard = &list_shards_response.subresponses[0].shards[0];
    assert_eq!(shard.shard_id(), ShardId::from(1));
    assert_eq!(shard.shard_state(), ShardState::Open);

    assert_eq!(list_shards_response.subresponses[1].shards.len(), 1);

    let shard = &list_shards_response.subresponses[1].shards[0];
    assert_eq!(shard.shard_id(), ShardId::from(2));
    assert_eq!(shard.shard_state(), ShardState::Closed);

    let list_shards_request = ListShardsRequest {
        subrequests: vec![ListShardsSubrequest {
            index_uid: Some(test_index_0.index_uid.clone()),
            source_id: test_index_0.source_id.clone(),
            shard_state: Some(ShardState::Unavailable as i32),
        }],
    };
    let list_shards_response = metastore.list_shards(list_shards_request).await.unwrap();
    assert_eq!(list_shards_response.subresponses.len(), 1);
    assert!(list_shards_response.subresponses[0].shards.is_empty());

    cleanup_index(&mut metastore, test_index_0.index_uid).await;
}

pub async fn test_metastore_delete_shards<
    MetastoreUnderTest: MetastoreService + MetastoreServiceExt + DefaultForTest + ReadWriteShardsForTest,
>() {
    let mut metastore = MetastoreUnderTest::default_for_test().await;

    let test_index = TestIndex::create_index_with_source(
        &mut metastore,
        "test-delete-shards",
        SourceConfig::ingest_v2(),
    )
    .await;

    let shards = vec![
        Shard {
            index_uid: Some(test_index.index_uid.clone()),
            source_id: test_index.source_id.clone(),
            shard_id: Some(ShardId::from(1)),
            shard_state: ShardState::Open as i32,
            doc_mapping_uid: Some(DocMappingUid::default()),
            publish_position_inclusive: Some(Position::Beginning),
            ..Default::default()
        },
        Shard {
            index_uid: Some(test_index.index_uid.clone()),
            source_id: test_index.source_id.clone(),
            shard_id: Some(ShardId::from(2)),
            shard_state: ShardState::Closed as i32,
            doc_mapping_uid: Some(DocMappingUid::default()),
            publish_position_inclusive: Some(Position::Beginning),
            ..Default::default()
        },
        Shard {
            index_uid: Some(test_index.index_uid.clone()),
            source_id: test_index.source_id.clone(),
            shard_id: Some(ShardId::from(3)),
            shard_state: ShardState::Closed as i32,
            doc_mapping_uid: Some(DocMappingUid::default()),
            publish_position_inclusive: Some(Position::Eof(None)),
            ..Default::default()
        },
    ];
    metastore
        .insert_shards(&test_index.index_uid, &test_index.source_id, shards)
        .await;

    // Attempt to delete shards #1, #2, #3, and #4.
    let delete_index_request = DeleteShardsRequest {
        index_uid: Some(test_index.index_uid.clone()),
        source_id: test_index.source_id.clone(),
        shard_ids: vec![
            ShardId::from(1),
            ShardId::from(2),
            ShardId::from(3),
            ShardId::from(4),
        ],
        force: false,
    };
    let mut response = metastore.delete_shards(delete_index_request).await.unwrap();

    assert_eq!(response.index_uid(), &test_index.index_uid);
    assert_eq!(response.source_id, test_index.source_id);
    assert_eq!(response.successes.len(), 2);
    assert_eq!(response.failures.len(), 2);

    response.successes.sort_unstable();
    assert_eq!(response.successes[0], ShardId::from(3));
    assert_eq!(response.successes[1], ShardId::from(4));

    response.failures.sort_unstable();
    assert_eq!(response.failures[0], ShardId::from(1));
    assert_eq!(response.failures[1], ShardId::from(2));

    let mut all_shards = metastore
        .list_all_shards(&test_index.index_uid, &test_index.source_id)
        .await;
    assert_eq!(all_shards.len(), 2);

    all_shards.sort_unstable_by(|left, right| left.shard_id.cmp(&right.shard_id));

    assert_eq!(all_shards[0].shard_id(), ShardId::from(1));
    assert_eq!(all_shards[1].shard_id(), ShardId::from(2));

    // Attempt to delete shards #1, #2, #3, and #4.
    let delete_index_request = DeleteShardsRequest {
        index_uid: Some(test_index.index_uid.clone()),
        source_id: test_index.source_id.clone(),
        shard_ids: vec![
            ShardId::from(1),
            ShardId::from(2),
            ShardId::from(3),
            ShardId::from(4),
        ],
        force: true,
    };
    let mut response = metastore.delete_shards(delete_index_request).await.unwrap();

    assert_eq!(response.index_uid(), &test_index.index_uid);
    assert_eq!(response.source_id, test_index.source_id);

    assert_eq!(response.successes.len(), 4);
    assert_eq!(response.failures.len(), 0);

    response.successes.sort_unstable();
    assert_eq!(response.successes[0], ShardId::from(1));
    assert_eq!(response.successes[1], ShardId::from(2));
    assert_eq!(response.successes[2], ShardId::from(3));
    assert_eq!(response.successes[3], ShardId::from(4));

    let all_shards = metastore
        .list_all_shards(&test_index.index_uid, &test_index.source_id)
        .await;

    assert_eq!(all_shards.len(), 0);

    cleanup_index(&mut metastore, test_index.index_uid).await;
}

pub async fn test_metastore_prune_shards<
    MetastoreUnderTest: MetastoreService + MetastoreServiceExt + DefaultForTest + ReadWriteShardsForTest,
>() {
    let mut metastore = MetastoreUnderTest::default_for_test().await;

    let test_index = TestIndex::create_index_with_source(
        &mut metastore,
        "test-prune-shards",
        SourceConfig::ingest_v2(),
    )
    .await;

    let now_timestamp = OffsetDateTime::now_utc().unix_timestamp();
    let oldest_shard_age = 10000u32;

    // Create shards with timestamp intervals of 100s starting from
    // now_timestamp - oldest_shard_age
    let shards = (0..100)
        .map(|shard_id| Shard {
            index_uid: Some(test_index.index_uid.clone()),
            source_id: test_index.source_id.clone(),
            shard_id: Some(ShardId::from(shard_id)),
            shard_state: ShardState::Closed as i32,
            doc_mapping_uid: Some(DocMappingUid::default()),
            publish_position_inclusive: Some(Position::Beginning),
            update_timestamp: now_timestamp - oldest_shard_age as i64 + shard_id as i64 * 100,
            ..Default::default()
        })
        .collect_vec();

    metastore
        .insert_shards(&test_index.index_uid, &test_index.source_id, shards)
        .await;

    // noop prune request
    {
        let prune_index_request = PruneShardsRequest {
            index_uid: Some(test_index.index_uid.clone()),
            source_id: test_index.source_id.clone(),
            max_age_secs: None,
            max_count: None,
            interval_secs: None,
        };
        metastore.prune_shards(prune_index_request).await.unwrap();
        let all_shards = metastore
            .list_all_shards(&test_index.index_uid, &test_index.source_id)
            .await;
        assert_eq!(all_shards.len(), 100);
    }

    // delete shards 4 last shards with age limit
    {
        let prune_index_request = PruneShardsRequest {
            index_uid: Some(test_index.index_uid.clone()),
            source_id: test_index.source_id.clone(),
            max_age_secs: Some(oldest_shard_age - 350),
            max_count: None,
            interval_secs: None,
        };
        metastore.prune_shards(prune_index_request).await.unwrap();

        let mut all_shards = metastore
            .list_all_shards(&test_index.index_uid, &test_index.source_id)
            .await;
        assert_eq!(all_shards.len(), 96);
        all_shards.sort_unstable_by_key(|shard| shard.update_timestamp);
        assert_eq!(all_shards[0].shard_id(), ShardId::from(4));
        assert_eq!(all_shards[95].shard_id(), ShardId::from(99));
    }

    // delete 6 more shards with count limit
    {
        let prune_index_request = PruneShardsRequest {
            index_uid: Some(test_index.index_uid.clone()),
            source_id: test_index.source_id.clone(),
            max_age_secs: None,
            max_count: Some(90),
            interval_secs: None,
        };
        metastore.prune_shards(prune_index_request).await.unwrap();
        let mut all_shards = metastore
            .list_all_shards(&test_index.index_uid, &test_index.source_id)
            .await;
        assert_eq!(all_shards.len(), 90);
        all_shards.sort_unstable_by_key(|shard| shard.update_timestamp);
        assert_eq!(all_shards[0].shard_id(), ShardId::from(10));
        assert_eq!(all_shards[89].shard_id(), ShardId::from(99));
    }

    // age limit is the limiting factor, delete 10 more shards
    let prune_index_request = PruneShardsRequest {
        index_uid: Some(test_index.index_uid.clone()),
        source_id: test_index.source_id.clone(),
        max_age_secs: Some(oldest_shard_age - 2950),
        max_count: Some(80),
        interval_secs: None,
    };
    metastore.prune_shards(prune_index_request).await.unwrap();
    let all_shards = metastore
        .list_all_shards(&test_index.index_uid, &test_index.source_id)
        .await;
    assert_eq!(all_shards.len(), 70);

    // count limit is the limiting factor, delete 20 more shards
    let prune_index_request = PruneShardsRequest {
        index_uid: Some(test_index.index_uid.clone()),
        source_id: test_index.source_id.clone(),
        max_age_secs: Some(oldest_shard_age - 4000),
        max_count: Some(50),
        interval_secs: None,
    };
    metastore.prune_shards(prune_index_request).await.unwrap();
    let all_shards = metastore
        .list_all_shards(&test_index.index_uid, &test_index.source_id)
        .await;
    assert_eq!(all_shards.len(), 50);

    cleanup_index(&mut metastore, test_index.index_uid).await;
}

pub async fn test_metastore_apply_checkpoint_delta_v2_single_shard<
    MetastoreUnderTest: MetastoreService + MetastoreServiceExt + DefaultForTest + ReadWriteShardsForTest,
>() {
    let mut metastore = MetastoreUnderTest::default_for_test().await;

    let test_index = TestIndex::create_index_with_source(
        &mut metastore,
        "test-delete-shards",
        SourceConfig::ingest_v2(),
    )
    .await;

    let mut source_delta = SourceCheckpointDelta::default();
    source_delta
        .record_partition_delta(
            PartitionId::from(0u64),
            Position::Beginning,
            Position::offset(0u64),
        )
        .unwrap();
    let index_checkpoint_delta = IndexCheckpointDelta {
        source_id: test_index.source_id.clone(),
        source_delta,
    };
    let index_checkpoint_delta_json = serde_json::to_string(&index_checkpoint_delta).unwrap();
    let publish_splits_request = PublishSplitsRequest {
        index_uid: Some(test_index.index_uid.clone()),
        staged_split_ids: Vec::new(),
        replaced_split_ids: Vec::new(),
        index_checkpoint_delta_json_opt: Some(index_checkpoint_delta_json),
        publish_token_opt: Some("test-publish-token-foo".to_string()),
    };
    let error = metastore
        .publish_splits(publish_splits_request)
        .await
        .unwrap_err();
    assert!(matches!(
        error,
        MetastoreError::NotFound(EntityKind::Shard { .. })
    ));

    let dummy_create_timestamp = 1;
    let shards = vec![Shard {
        index_uid: Some(test_index.index_uid.clone()),
        source_id: test_index.source_id.clone(),
        shard_id: Some(ShardId::from(0)),
        shard_state: ShardState::Open as i32,
        doc_mapping_uid: Some(DocMappingUid::default()),
        publish_position_inclusive: Some(Position::Beginning),
        publish_token: Some("test-publish-token-bar".to_string()),
        update_timestamp: dummy_create_timestamp,
        ..Default::default()
    }];
    metastore
        .insert_shards(&test_index.index_uid, &test_index.source_id, shards)
        .await;

    let index_checkpoint_delta_json = serde_json::to_string(&index_checkpoint_delta).unwrap();
    let publish_splits_request = PublishSplitsRequest {
        index_uid: Some(test_index.index_uid.clone()),
        staged_split_ids: Vec::new(),
        replaced_split_ids: Vec::new(),
        index_checkpoint_delta_json_opt: Some(index_checkpoint_delta_json),
        publish_token_opt: Some("test-publish-token-foo".to_string()),
    };
    let error = metastore
        .publish_splits(publish_splits_request.clone())
        .await
        .unwrap_err();
    assert!(
        matches!(error, MetastoreError::InvalidArgument { message } if message.contains("token"))
    );

    let index_checkpoint_delta_json = serde_json::to_string(&index_checkpoint_delta).unwrap();
    let publish_splits_request = PublishSplitsRequest {
        index_uid: Some(test_index.index_uid.clone()),
        staged_split_ids: Vec::new(),
        replaced_split_ids: Vec::new(),
        index_checkpoint_delta_json_opt: Some(index_checkpoint_delta_json),
        publish_token_opt: Some("test-publish-token-bar".to_string()),
    };
    metastore
        .publish_splits(publish_splits_request.clone())
        .await
        .unwrap();

    let shards = metastore
        .list_all_shards(&test_index.index_uid, &test_index.source_id)
        .await;
    assert_eq!(shards.len(), 1);
    assert_eq!(shards[0].shard_state(), ShardState::Open);
    assert_eq!(
        shards[0].publish_position_inclusive(),
        Position::offset(0u64)
    );
    assert!(
        shards[0].update_timestamp > dummy_create_timestamp,
        "shard timestamp was not updated"
    );

    let index_checkpoint_delta_json = serde_json::to_string(&index_checkpoint_delta).unwrap();
    let publish_splits_request = PublishSplitsRequest {
        index_uid: Some(test_index.index_uid.clone()),
        staged_split_ids: Vec::new(),
        replaced_split_ids: Vec::new(),
        index_checkpoint_delta_json_opt: Some(index_checkpoint_delta_json),
        publish_token_opt: Some("test-publish-token-bar".to_string()),
    };
    let error = metastore
        .publish_splits(publish_splits_request.clone())
        .await
        .unwrap_err();
    assert!(
        matches!(error, MetastoreError::InvalidArgument { message } if message.contains("checkpoint"))
    );

    let mut source_delta = SourceCheckpointDelta::default();
    source_delta
        .record_partition_delta(
            PartitionId::from(0u64),
            Position::offset(0u64),
            Position::eof(1u64),
        )
        .unwrap();
    let index_checkpoint_delta = IndexCheckpointDelta {
        source_id: test_index.source_id.clone(),
        source_delta,
    };
    let index_checkpoint_delta_json = serde_json::to_string(&index_checkpoint_delta).unwrap();
    let publish_splits_request = PublishSplitsRequest {
        index_uid: Some(test_index.index_uid.clone()),
        staged_split_ids: Vec::new(),
        replaced_split_ids: Vec::new(),
        index_checkpoint_delta_json_opt: Some(index_checkpoint_delta_json),
        publish_token_opt: Some("test-publish-token-bar".to_string()),
    };
    metastore
        .publish_splits(publish_splits_request)
        .await
        .unwrap();

    let shards = metastore
        .list_all_shards(&test_index.index_uid, &test_index.source_id)
        .await;
    assert_eq!(shards.len(), 1);
    assert_eq!(shards[0].shard_state(), ShardState::Closed);
    assert_eq!(shards[0].publish_position_inclusive(), Position::eof(1u64));
    cleanup_index(&mut metastore, test_index.index_uid).await;
}

pub async fn test_metastore_apply_checkpoint_delta_v2_multi_shards<
    MetastoreUnderTest: MetastoreService + MetastoreServiceExt + DefaultForTest + ReadWriteShardsForTest,
>() {
    let mut metastore = MetastoreUnderTest::default_for_test().await;

    let test_index = TestIndex::create_index_with_source(
        &mut metastore,
        "test-delete-shards",
        SourceConfig::ingest_v2(),
    )
    .await;

    let dummy_create_timestamp = 1;
    let shards = vec![
        Shard {
            index_uid: Some(test_index.index_uid.clone()),
            source_id: test_index.source_id.clone(),
            shard_id: Some(ShardId::from(0)),
            shard_state: ShardState::Open as i32,
            doc_mapping_uid: Some(DocMappingUid::default()),
            publish_position_inclusive: Some(Position::offset(0u64)),
            publish_token: Some("test-publish-token-foo".to_string()),
            update_timestamp: dummy_create_timestamp,
            ..Default::default()
        },
        Shard {
            index_uid: Some(test_index.index_uid.clone()),
            source_id: test_index.source_id.clone(),
            shard_id: Some(ShardId::from(1)),
            shard_state: ShardState::Open as i32,
            doc_mapping_uid: Some(DocMappingUid::default()),
            publish_position_inclusive: Some(Position::offset(1u64)),
            publish_token: Some("test-publish-token-foo".to_string()),
            update_timestamp: dummy_create_timestamp,
            ..Default::default()
        },
        Shard {
            index_uid: Some(test_index.index_uid.clone()),
            source_id: test_index.source_id.clone(),
            shard_id: Some(ShardId::from(2)),
            shard_state: ShardState::Open as i32,
            doc_mapping_uid: Some(DocMappingUid::default()),
            publish_position_inclusive: Some(Position::offset(2u64)),
            publish_token: Some("test-publish-token-foo".to_string()),
            update_timestamp: dummy_create_timestamp,
            ..Default::default()
        },
        Shard {
            index_uid: Some(test_index.index_uid.clone()),
            source_id: test_index.source_id.clone(),
            shard_id: Some(ShardId::from(3)),
            shard_state: ShardState::Open as i32,
            doc_mapping_uid: Some(DocMappingUid::default()),
            publish_position_inclusive: Some(Position::offset(3u64)),
            publish_token: Some("test-publish-token-bar".to_string()),
            update_timestamp: dummy_create_timestamp,
            ..Default::default()
        },
    ];
    metastore
        .insert_shards(&test_index.index_uid, &test_index.source_id, shards)
        .await;

    let mut source_delta = SourceCheckpointDelta::default();
    source_delta
        .record_partition_delta(
            PartitionId::from(0u64),
            Position::offset(0u64),
            Position::offset(10u64),
        )
        .unwrap();
    source_delta
        .record_partition_delta(
            PartitionId::from(1u64),
            Position::offset(1u64),
            Position::offset(11u64),
        )
        .unwrap();
    source_delta
        .record_partition_delta(
            PartitionId::from(2u64),
            Position::offset(2u64),
            Position::eof(12u64),
        )
        .unwrap();
    let index_checkpoint_delta = IndexCheckpointDelta {
        source_id: test_index.source_id.clone(),
        source_delta,
    };
    let index_checkpoint_delta_json = serde_json::to_string(&index_checkpoint_delta).unwrap();
    let publish_splits_request = PublishSplitsRequest {
        index_uid: Some(test_index.index_uid.clone()),
        staged_split_ids: Vec::new(),
        replaced_split_ids: Vec::new(),
        index_checkpoint_delta_json_opt: Some(index_checkpoint_delta_json),
        publish_token_opt: Some("test-publish-token-foo".to_string()),
    };
    metastore
        .publish_splits(publish_splits_request)
        .await
        .unwrap();

    let mut shards = metastore
        .list_all_shards(&test_index.index_uid, &test_index.source_id)
        .await;
    assert_eq!(shards.len(), 4);

    shards.sort_unstable_by(|left, right| left.shard_id.cmp(&right.shard_id));

    let shard = &shards[0];
    assert_eq!(shard.shard_id(), ShardId::from(0));
    assert_eq!(shard.shard_state(), ShardState::Open);
    assert_eq!(shard.publish_position_inclusive(), Position::offset(10u64));
    assert!(shard.update_timestamp > dummy_create_timestamp);

    let shard = &shards[1];
    assert_eq!(shard.shard_id(), ShardId::from(1));
    assert_eq!(shard.shard_state(), ShardState::Open);
    assert_eq!(shard.publish_position_inclusive(), Position::offset(11u64));
    assert!(shard.update_timestamp > dummy_create_timestamp);

    let shard = &shards[2];
    assert_eq!(shard.shard_id(), ShardId::from(2));
    assert_eq!(shard.shard_state(), ShardState::Closed);
    assert_eq!(shard.publish_position_inclusive(), Position::eof(12u64));
    assert!(shard.update_timestamp > dummy_create_timestamp);

    let shard = &shards[3];
    assert_eq!(shard.shard_id(), ShardId::from(3));
    assert_eq!(shard.shard_state(), ShardState::Open);
    assert_eq!(shard.publish_position_inclusive(), Position::offset(3u64));
    assert_eq!(shard.update_timestamp, dummy_create_timestamp);

    cleanup_index(&mut metastore, test_index.index_uid).await;
}


================================================
FILE: quickwit/quickwit-metastore/src/tests/source.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::num::NonZeroUsize;

use quickwit_common::rand::append_random_suffix;
use quickwit_config::{
    IndexConfig, SourceConfig, SourceInputFormat, SourceParams, TransformConfig,
};
use quickwit_proto::metastore::{
    AddSourceRequest, CreateIndexRequest, DeleteSourceRequest, EntityKind, IndexMetadataRequest,
    MetastoreError, PublishSplitsRequest, ResetSourceCheckpointRequest, SourceType,
    StageSplitsRequest, ToggleSourceRequest, UpdateSourceRequest,
};
use quickwit_proto::types::IndexUid;

use super::DefaultForTest;
use crate::checkpoint::SourceCheckpoint;
use crate::metastore::UpdateSourceRequestExt;
use crate::tests::cleanup_index;
use crate::{
    AddSourceRequestExt, CreateIndexRequestExt, IndexMetadataResponseExt, MetastoreServiceExt,
    SplitMetadata, StageSplitsRequestExt,
};

pub async fn test_metastore_add_source<MetastoreToTest: MetastoreServiceExt + DefaultForTest>() {
    let mut metastore = MetastoreToTest::default_for_test().await;

    let index_id = append_random_suffix("test-add-source");
    let index_uri = format!("ram:///indexes/{index_id}");
    let index_config = IndexConfig::for_test(&index_id, &index_uri);

    let create_index_request = CreateIndexRequest::try_from_index_config(&index_config).unwrap();
    let index_uid: IndexUid = metastore
        .create_index(create_index_request)
        .await
        .unwrap()
        .index_uid()
        .clone();

    let source_id = format!("{index_id}--source");

    let source = SourceConfig {
        source_id: source_id.to_string(),
        num_pipelines: NonZeroUsize::MIN,
        enabled: true,
        source_params: SourceParams::void(),
        transform_config: None,
        input_format: SourceInputFormat::Json,
    };

    assert_eq!(
        metastore
            .index_metadata(IndexMetadataRequest::for_index_id(index_id.to_string()))
            .await
            .unwrap()
            .deserialize_index_metadata()
            .unwrap()
            .checkpoint
            .source_checkpoint(&source_id),
        None
    );

    let add_source_request =
        AddSourceRequest::try_from_source_config(index_uid.clone(), &source).unwrap();
    metastore.add_source(add_source_request).await.unwrap();

    let index_metadata = metastore
        .index_metadata(IndexMetadataRequest::for_index_id(index_id.to_string()))
        .await
        .unwrap()
        .deserialize_index_metadata()
        .unwrap();

    let sources = &index_metadata.sources;
    assert_eq!(sources.len(), 1);
    assert!(sources.contains_key(&source_id));
    assert_eq!(sources.get(&source_id).unwrap().source_id, source_id);
    assert_eq!(
        sources.get(&source_id).unwrap().source_type(),
        SourceType::Void
    );
    assert_eq!(
        index_metadata.checkpoint.source_checkpoint(&source_id),
        Some(&SourceCheckpoint::default())
    );

    assert!(matches!(
        metastore
            .add_source(
                AddSourceRequest::try_from_source_config(index_uid.clone(), &source).unwrap()
            )
            .await
            .unwrap_err(),
        MetastoreError::AlreadyExists(EntityKind::Source { .. })
    ));
    assert!(matches!(
        metastore
            .add_source(
                AddSourceRequest::try_from_source_config(
                    IndexUid::new_with_random_ulid("index-not-found"),
                    &source
                )
                .unwrap()
            )
            .await
            .unwrap_err(),
        MetastoreError::NotFound(EntityKind::Index { .. })
    ));
    assert!(matches!(
        metastore
            .add_source(
                AddSourceRequest::try_from_source_config(
                    IndexUid::new_with_random_ulid(&index_id),
                    &source
                )
                .unwrap()
            )
            .await
            .unwrap_err(),
        MetastoreError::NotFound(EntityKind::Index { .. })
    ));
    cleanup_index(&mut metastore, index_uid).await;
}

pub async fn test_metastore_update_source<MetastoreToTest: MetastoreServiceExt + DefaultForTest>() {
    let mut metastore = MetastoreToTest::default_for_test().await;

    let index_id = append_random_suffix("test-add-source");
    let index_uri = format!("ram:///indexes/{index_id}");
    let index_config = IndexConfig::for_test(&index_id, &index_uri);

    let create_index_request = CreateIndexRequest::try_from_index_config(&index_config).unwrap();
    let index_uid: IndexUid = metastore
        .create_index(create_index_request)
        .await
        .unwrap()
        .index_uid()
        .clone();

    let source_id = format!("{index_id}--source");

    let mut source = SourceConfig {
        source_id: source_id.to_string(),
        num_pipelines: NonZeroUsize::MIN,
        enabled: true,
        source_params: SourceParams::void(),
        transform_config: None,
        input_format: SourceInputFormat::Json,
    };

    assert_eq!(
        metastore
            .index_metadata(IndexMetadataRequest::for_index_id(index_id.to_string()))
            .await
            .unwrap()
            .deserialize_index_metadata()
            .unwrap()
            .checkpoint
            .source_checkpoint(&source_id),
        None
    );

    let add_source_request =
        AddSourceRequest::try_from_source_config(index_uid.clone(), &source).unwrap();
    metastore.add_source(add_source_request).await.unwrap();

    source.transform_config = Some(TransformConfig::new("del(.username)".to_string(), None));

    // Update the source twice with the same value to validate indempotency
    for _ in 0..2 {
        let update_source_request =
            UpdateSourceRequest::try_from_source_config(index_uid.clone(), &source).unwrap();
        metastore
            .update_source(update_source_request)
            .await
            .unwrap();

        let index_metadata = metastore
            .index_metadata(IndexMetadataRequest::for_index_id(index_id.to_string()))
            .await
            .unwrap()
            .deserialize_index_metadata()
            .unwrap();

        let sources = &index_metadata.sources;
        assert_eq!(sources.len(), 1);
        assert!(sources.contains_key(&source_id));
        assert_eq!(sources.get(&source_id).unwrap().source_id, source_id);
        assert_eq!(
            sources.get(&source_id).unwrap().source_type(),
            SourceType::Void
        );
        assert_eq!(
            sources.get(&source_id).unwrap().transform_config,
            Some(TransformConfig::new("del(.username)".to_string(), None))
        );
        assert_eq!(
            index_metadata.checkpoint.source_checkpoint(&source_id),
            Some(&SourceCheckpoint::default())
        );
    }

    source.source_id = "unknown-src-id".to_string();
    assert!(matches!(
        metastore
            .update_source(
                UpdateSourceRequest::try_from_source_config(index_uid.clone(), &source).unwrap()
            )
            .await
            .unwrap_err(),
        MetastoreError::NotFound(EntityKind::Source { .. })
    ));
    source.source_id = source_id;
    assert!(matches!(
        metastore
            .add_source(
                AddSourceRequest::try_from_source_config(
                    IndexUid::new_with_random_ulid("index-not-found"),
                    &source
                )
                .unwrap()
            )
            .await
            .unwrap_err(),
        MetastoreError::NotFound(EntityKind::Index { .. })
    ));

    cleanup_index(&mut metastore, index_uid).await;
}

pub async fn test_metastore_toggle_source<MetastoreToTest: MetastoreServiceExt + DefaultForTest>() {
    let mut metastore = MetastoreToTest::default_for_test().await;

    let index_id = append_random_suffix("test-toggle-source");
    let index_uri = format!("ram:///indexes/{index_id}");
    let index_config = IndexConfig::for_test(&index_id, &index_uri);

    let create_index_request = CreateIndexRequest::try_from_index_config(&index_config).unwrap();
    let index_uid: IndexUid = metastore
        .create_index(create_index_request)
        .await
        .unwrap()
        .index_uid()
        .clone();

    let source_id = format!("{index_id}--source");
    let source = SourceConfig {
        source_id: source_id.to_string(),
        num_pipelines: NonZeroUsize::MIN,
        enabled: true,
        source_params: SourceParams::void(),
        transform_config: None,
        input_format: SourceInputFormat::Json,
    };
    let add_source_request =
        AddSourceRequest::try_from_source_config(index_uid.clone(), &source).unwrap();
    metastore.add_source(add_source_request).await.unwrap();
    let index_metadata = metastore
        .index_metadata(IndexMetadataRequest::for_index_id(index_id.to_string()))
        .await
        .unwrap()
        .deserialize_index_metadata()
        .unwrap();
    let source = index_metadata.sources.get(&source_id).unwrap();
    assert_eq!(source.enabled, true);

    // Disable source.
    metastore
        .toggle_source(ToggleSourceRequest {
            index_uid: index_uid.clone().into(),
            source_id: source.source_id.clone(),
            enable: false,
        })
        .await
        .unwrap();
    let index_metadata = metastore
        .index_metadata(IndexMetadataRequest::for_index_id(index_id.to_string()))
        .await
        .unwrap()
        .deserialize_index_metadata()
        .unwrap();
    let source = index_metadata.sources.get(&source_id).unwrap();
    assert_eq!(source.enabled, false);

    // Enable source.
    metastore
        .toggle_source(ToggleSourceRequest {
            index_uid: index_uid.clone().into(),
            source_id: source.source_id.clone(),
            enable: true,
        })
        .await
        .unwrap();
    let index_metadata = metastore
        .index_metadata(IndexMetadataRequest::for_index_id(index_id.to_string()))
        .await
        .unwrap()
        .deserialize_index_metadata()
        .unwrap();
    let source = index_metadata.sources.get(&source_id).unwrap();
    assert_eq!(source.enabled, true);

    cleanup_index(&mut metastore, index_uid).await;
}

pub async fn test_metastore_delete_source<MetastoreToTest: MetastoreServiceExt + DefaultForTest>() {
    let mut metastore = MetastoreToTest::default_for_test().await;

    let index_id = append_random_suffix("test-delete-source");
    let index_uri = format!("ram:///indexes/{index_id}");
    let source_id = format!("{index_id}--source");

    let source = SourceConfig {
        source_id: source_id.to_string(),
        num_pipelines: NonZeroUsize::MIN,
        enabled: true,
        source_params: SourceParams::void(),
        transform_config: None,
        input_format: SourceInputFormat::Json,
    };

    let index_config = IndexConfig::for_test(&index_id, index_uri.as_str());

    let create_index_request = CreateIndexRequest::try_from_index_config(&index_config).unwrap();
    let index_uid: IndexUid = metastore
        .create_index(create_index_request)
        .await
        .unwrap()
        .index_uid()
        .clone();
    assert!(matches!(
        metastore
            .add_source(
                AddSourceRequest::try_from_source_config(
                    IndexUid::new_with_random_ulid("index-not-found"),
                    &source
                )
                .unwrap()
            )
            .await
            .unwrap_err(),
        MetastoreError::NotFound(EntityKind::Index { .. })
    ));
    assert!(matches!(
        metastore
            .add_source(
                AddSourceRequest::try_from_source_config(
                    IndexUid::new_with_random_ulid(&index_id),
                    &source
                )
                .unwrap()
            )
            .await
            .unwrap_err(),
        MetastoreError::NotFound(EntityKind::Index { .. })
    ));

    metastore
        .add_source(AddSourceRequest::try_from_source_config(index_uid.clone(), &source).unwrap())
        .await
        .unwrap();
    metastore
        .delete_source(DeleteSourceRequest {
            index_uid: index_uid.clone().into(),
            source_id: source_id.clone(),
        })
        .await
        .unwrap();

    let sources = metastore
        .index_metadata(IndexMetadataRequest::for_index_id(index_id.to_string()))
        .await
        .unwrap()
        .deserialize_index_metadata()
        .unwrap()
        .sources;
    assert!(sources.is_empty());

    assert!(matches!(
        metastore
            .delete_source(DeleteSourceRequest {
                index_uid: index_uid.clone().into(),
                source_id: source_id.to_string()
            })
            .await
            .unwrap_err(),
        MetastoreError::NotFound(EntityKind::Source { .. })
    ));
    assert!(matches!(
        metastore
            .delete_source(DeleteSourceRequest {
                index_uid: Some(IndexUid::new_with_random_ulid("index-not-found")),
                source_id: source_id.to_string()
            })
            .await
            .unwrap_err(),
        MetastoreError::NotFound(EntityKind::Index { .. })
    ));
    assert!(matches!(
        metastore
            .delete_source(DeleteSourceRequest {
                index_uid: Some(IndexUid::new_with_random_ulid(&index_id)),
                source_id: source_id.to_string()
            })
            .await
            .unwrap_err(),
        MetastoreError::NotFound(EntityKind::Index { .. })
    ));

    cleanup_index(&mut metastore, index_uid).await;
}

pub async fn test_metastore_reset_checkpoint<
    MetastoreToTest: MetastoreServiceExt + DefaultForTest,
>() {
    let mut metastore = MetastoreToTest::default_for_test().await;

    let index_id = append_random_suffix("test-reset-checkpoint");
    let index_uri = format!("ram:///indexes/{index_id}");
    let index_config = IndexConfig::for_test(&index_id, &index_uri);

    let create_index_request = CreateIndexRequest::try_from_index_config(&index_config).unwrap();
    let index_uid: IndexUid = metastore
        .create_index(create_index_request)
        .await
        .unwrap()
        .index_uid()
        .clone();

    let source_ids: Vec<String> = (0..2).map(|i| format!("{index_id}--source-{i}")).collect();
    let split_ids: Vec<String> = (0..2).map(|i| format!("{index_id}--split-{i}")).collect();

    for (source_id, split_id) in source_ids.iter().zip(split_ids.iter()) {
        let source = SourceConfig {
            source_id: source_id.clone(),
            num_pipelines: NonZeroUsize::MIN,
            enabled: true,
            source_params: SourceParams::void(),
            transform_config: None,
            input_format: SourceInputFormat::Json,
        };
        metastore
            .add_source(
                AddSourceRequest::try_from_source_config(index_uid.clone(), &source).unwrap(),
            )
            .await
            .unwrap();

        let split_metadata = SplitMetadata {
            split_id: split_id.clone(),
            index_uid: index_uid.clone(),
            ..Default::default()
        };
        let stage_splits_request =
            StageSplitsRequest::try_from_split_metadata(index_uid.clone(), &split_metadata)
                .unwrap();
        metastore.stage_splits(stage_splits_request).await.unwrap();
        let publish_splits_request = PublishSplitsRequest {
            index_uid: Some(index_uid.clone()),
            staged_split_ids: vec![split_id.clone()],
            ..Default::default()
        };
        metastore
            .publish_splits(publish_splits_request)
            .await
            .unwrap();
    }
    assert!(
        !metastore
            .index_metadata(IndexMetadataRequest::for_index_id(index_id.to_string()))
            .await
            .unwrap()
            .deserialize_index_metadata()
            .unwrap()
            .checkpoint
            .is_empty()
    );

    metastore
        .reset_source_checkpoint(ResetSourceCheckpointRequest {
            index_uid: index_uid.clone().into(),
            source_id: source_ids[0].clone(),
        })
        .await
        .unwrap();

    let index_metadata = metastore
        .index_metadata(IndexMetadataRequest::for_index_id(index_id.to_string()))
        .await
        .unwrap()
        .deserialize_index_metadata()
        .unwrap();
    assert!(
        index_metadata
            .checkpoint
            .source_checkpoint(&source_ids[0])
            .is_none()
    );

    assert!(
        index_metadata
            .checkpoint
            .source_checkpoint(&source_ids[1])
            .is_some()
    );

    assert!(matches!(
        metastore
            .reset_source_checkpoint(ResetSourceCheckpointRequest {
                index_uid: Some(IndexUid::new_with_random_ulid("index-not-found")),
                source_id: source_ids[1].clone(),
            })
            .await
            .unwrap_err(),
        MetastoreError::NotFound(EntityKind::Index { .. })
    ));

    assert!(matches!(
        metastore
            .reset_source_checkpoint(ResetSourceCheckpointRequest {
                index_uid: Some(IndexUid::new_with_random_ulid(&index_id)),
                source_id: source_ids[1].to_string(),
            })
            .await
            .unwrap_err(),
        MetastoreError::NotFound(EntityKind::Index { .. })
    ));

    metastore
        .reset_source_checkpoint(ResetSourceCheckpointRequest {
            index_uid: index_uid.clone().into(),
            source_id: source_ids[1].to_string(),
        })
        .await
        .unwrap();

    assert!(
        metastore
            .index_metadata(IndexMetadataRequest::for_index_id(index_id.to_string()))
            .await
            .unwrap()
            .deserialize_index_metadata()
            .unwrap()
            .checkpoint
            .is_empty()
    );

    cleanup_index(&mut metastore, index_uid).await;
}


================================================
FILE: quickwit/quickwit-metastore/src/tests/split.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::time::Duration;

use futures::future::try_join_all;
use quickwit_common::rand::append_random_suffix;
use quickwit_config::{IndexConfig, SourceConfig, SourceParams};
use quickwit_proto::metastore::{
    CreateIndexRequest, DeleteSplitsRequest, EntityKind, IndexMetadataRequest, ListSplitsRequest,
    ListStaleSplitsRequest, MarkSplitsForDeletionRequest, MetastoreError, PublishSplitsRequest,
    StageSplitsRequest, UpdateSplitsDeleteOpstampRequest,
};
use quickwit_proto::types::{IndexUid, Position};
use time::OffsetDateTime;
use tokio::time::sleep;
use tracing::{error, info};

use super::DefaultForTest;
use crate::checkpoint::{IndexCheckpointDelta, PartitionId, SourceCheckpointDelta};
use crate::metastore::MetastoreServiceStreamSplitsExt;
use crate::tests::cleanup_index;
use crate::{
    CreateIndexRequestExt, IndexMetadataResponseExt, ListSplitsQuery, ListSplitsRequestExt,
    ListSplitsResponseExt, MetastoreServiceExt, SplitMetadata, SplitState, StageSplitsRequestExt,
};

pub async fn test_metastore_publish_splits_empty_splits_array_is_allowed<
    MetastoreToTest: MetastoreServiceExt + DefaultForTest,
>() {
    let mut metastore = MetastoreToTest::default_for_test().await;

    let index_id = append_random_suffix("test-publish-splits-empty");
    let non_existent_index_uid = IndexUid::new_with_random_ulid(&index_id);
    let index_uri = format!("ram:///indexes/{index_id}");

    let source_id = format!("{index_id}--source");

    // Publish a split on a non-existent index
    {
        let publish_splits_request = PublishSplitsRequest {
            index_uid: Some(non_existent_index_uid),
            index_checkpoint_delta_json_opt: Some({
                let offsets = 1..10;
                let checkpoint_delta = IndexCheckpointDelta::for_test(&source_id, offsets);
                serde_json::to_string(&checkpoint_delta).unwrap()
            }),
            ..Default::default()
        };
        let error = metastore
            .publish_splits(publish_splits_request)
            .await
            .unwrap_err();
        assert!(matches!(
            error,
            MetastoreError::NotFound(EntityKind::Index { .. })
        ));
    }

    // Update the checkpoint, by publishing an empty array of splits with a non-empty
    // checkpoint. This operation is allowed and used in the Indexer.
    {
        let index_config = IndexConfig::for_test(&index_id, &index_uri);
        let source_configs = &[SourceConfig::for_test(&source_id, SourceParams::void())];
        let create_index_request =
            CreateIndexRequest::try_from_index_and_source_configs(&index_config, source_configs)
                .unwrap();
        let index_uid: IndexUid = metastore
            .create_index(create_index_request)
            .await
            .unwrap()
            .index_uid()
            .clone();
        let publish_splits_request = PublishSplitsRequest {
            index_uid: Some(index_uid.clone()),
            index_checkpoint_delta_json_opt: Some({
                let offsets = 0..100;
                let checkpoint_delta = IndexCheckpointDelta::for_test(&source_id, offsets);
                serde_json::to_string(&checkpoint_delta).unwrap()
            }),
            ..Default::default()
        };
        metastore
            .publish_splits(publish_splits_request)
            .await
            .unwrap();

        let index_metadata = metastore
            .index_metadata(IndexMetadataRequest::for_index_id(index_id.to_string()))
            .await
            .unwrap()
            .deserialize_index_metadata()
            .unwrap();
        let source_checkpoint = index_metadata
            .checkpoint
            .source_checkpoint(&source_id)
            .unwrap();
        assert_eq!(source_checkpoint.num_partitions(), 1);
        assert_eq!(
            source_checkpoint
                .position_for_partition(&PartitionId::default())
                .unwrap(),
            &Position::offset(100u64 - 1)
        );
        cleanup_index(&mut metastore, index_uid).await;
    }
}

pub async fn test_metastore_publish_splits<
    MetastoreToTest: MetastoreServiceExt + DefaultForTest,
>() {
    let mut metastore = MetastoreToTest::default_for_test().await;

    let current_timestamp = OffsetDateTime::now_utc().unix_timestamp();

    let index_id = append_random_suffix("test-publish-splits");
    let index_uid = IndexUid::new_with_random_ulid(&index_id);
    let index_uri = format!("ram:///indexes/{index_id}");
    let index_config = IndexConfig::for_test(&index_id, &index_uri);

    let source_id = format!("{index_id}--source");
    let source_configs = &[SourceConfig::for_test(&source_id, SourceParams::void())];

    let split_id_1 = format!("{index_id}--split-1");
    let split_metadata_1 = SplitMetadata {
        split_id: split_id_1.clone(),
        index_uid: index_uid.clone(),
        time_range: Some(0..=99),
        create_timestamp: current_timestamp,
        ..Default::default()
    };

    let split_id_2 = format!("{index_id}--split-2");
    let split_metadata_2 = SplitMetadata {
        split_id: split_id_2.clone(),
        index_uid: index_uid.clone(),
        time_range: Some(30..=99),
        create_timestamp: current_timestamp,
        ..Default::default()
    };

    // Publish a split on a non-existent index
    {
        let publish_splits_request = PublishSplitsRequest {
            index_uid: Some(IndexUid::new_with_random_ulid("index-not-found")),
            staged_split_ids: vec!["split-not-found".to_string()],
            index_checkpoint_delta_json_opt: Some({
                let offsets = 0..10;
                let checkpoint_delta = IndexCheckpointDelta::for_test(&source_id, offsets);
                serde_json::to_string(&checkpoint_delta).unwrap()
            }),
            ..Default::default()
        };
        let error = metastore
            .publish_splits(publish_splits_request)
            .await
            .unwrap_err();
        assert!(matches!(
            error,
            MetastoreError::NotFound(EntityKind::Index { .. })
        ));
    }

    // Publish a split on a wrong index uid
    {
        let publish_splits_request = PublishSplitsRequest {
            index_uid: Some(IndexUid::new_with_random_ulid(&index_id)),
            staged_split_ids: vec!["split-not-found".to_string()],
            index_checkpoint_delta_json_opt: Some({
                let offsets = 0..10;
                let checkpoint_delta = IndexCheckpointDelta::for_test(&source_id, offsets);
                serde_json::to_string(&checkpoint_delta).unwrap()
            }),
            ..Default::default()
        };
        let error = metastore
            .publish_splits(publish_splits_request)
            .await
            .unwrap_err();
        assert!(matches!(
            error,
            MetastoreError::NotFound(EntityKind::Index { .. })
        ));
    }

    // Publish a non-existent split on an index
    {
        let create_index_request =
            CreateIndexRequest::try_from_index_and_source_configs(&index_config, source_configs)
                .unwrap();
        let index_uid: IndexUid = metastore
            .create_index(create_index_request)
            .await
            .unwrap()
            .index_uid()
            .clone();
        let publish_splits_request = PublishSplitsRequest {
            index_uid: Some(index_uid.clone()),
            staged_split_ids: vec!["split-not-found".to_string()],
            ..Default::default()
        };
        let error = metastore
            .publish_splits(publish_splits_request)
            .await
            .unwrap_err();
        assert!(matches!(
            error,
            MetastoreError::NotFound(EntityKind::Splits { .. })
        ));

        cleanup_index(&mut metastore, index_uid).await;
    }

    // Publish a staged split on an index
    {
        let create_index_request =
            CreateIndexRequest::try_from_index_and_source_configs(&index_config, source_configs)
                .unwrap();
        let index_uid: IndexUid = metastore
            .create_index(create_index_request)
            .await
            .unwrap()
            .index_uid()
            .clone();

        let stage_splits_request =
            StageSplitsRequest::try_from_split_metadata(index_uid.clone(), &split_metadata_1)
                .unwrap();
        metastore.stage_splits(stage_splits_request).await.unwrap();

        let publish_splits_request = PublishSplitsRequest {
            index_uid: Some(index_uid.clone()),
            staged_split_ids: vec![split_id_1.clone()],
            ..Default::default()
        };
        metastore
            .publish_splits(publish_splits_request)
            .await
            .unwrap();

        cleanup_index(&mut metastore, index_uid).await;
    }

    // Publish a published split on an index
    {
        let create_index_request =
            CreateIndexRequest::try_from_index_and_source_configs(&index_config, source_configs)
                .unwrap();
        let index_uid: IndexUid = metastore
            .create_index(create_index_request)
            .await
            .unwrap()
            .index_uid()
            .clone();

        let stage_splits_request =
            StageSplitsRequest::try_from_split_metadata(index_uid.clone(), &split_metadata_1)
                .unwrap();
        metastore.stage_splits(stage_splits_request).await.unwrap();

        let publish_splits_request = PublishSplitsRequest {
            index_uid: Some(index_uid.clone()),
            staged_split_ids: vec![split_id_1.clone()],
            ..Default::default()
        };
        metastore
            .publish_splits(publish_splits_request)
            .await
            .unwrap();

        let publish_splits_request = PublishSplitsRequest {
            index_uid: Some(index_uid.clone()),
            staged_split_ids: vec![split_id_1.clone()],
            index_checkpoint_delta_json_opt: Some({
                let offsets = 1..12;
                let checkpoint_delta = IndexCheckpointDelta::for_test(&source_id, offsets);
                serde_json::to_string(&checkpoint_delta).unwrap()
            }),
            ..Default::default()
        };
        let error = metastore
            .publish_splits(publish_splits_request)
            .await
            .unwrap_err();
        assert!(matches!(
            error,
            MetastoreError::FailedPrecondition {
                entity: EntityKind::Splits { .. },
                ..
            }
        ));

        cleanup_index(&mut metastore, index_uid).await;
    }

    // Publish a non-staged split on an index
    {
        let create_index_request =
            CreateIndexRequest::try_from_index_and_source_configs(&index_config, source_configs)
                .unwrap();
        let index_uid: IndexUid = metastore
            .create_index(create_index_request)
            .await
            .unwrap()
            .index_uid()
            .clone();

        let stage_splits_request =
            StageSplitsRequest::try_from_split_metadata(index_uid.clone(), &split_metadata_1)
                .unwrap();
        metastore.stage_splits(stage_splits_request).await.unwrap();

        let publish_splits_request = PublishSplitsRequest {
            index_uid: Some(index_uid.clone()),
            staged_split_ids: vec![split_id_1.clone()],
            index_checkpoint_delta_json_opt: Some({
                let offsets = 12..15;
                let checkpoint_delta = IndexCheckpointDelta::for_test(&source_id, offsets);
                serde_json::to_string(&checkpoint_delta).unwrap()
            }),
            ..Default::default()
        };
        metastore
            .publish_splits(publish_splits_request)
            .await
            .unwrap();

        let mark_splits_for_deletion_request =
            MarkSplitsForDeletionRequest::new(index_uid.clone(), vec![split_id_1.clone()]);
        metastore
            .mark_splits_for_deletion(mark_splits_for_deletion_request)
            .await
            .unwrap();

        let publish_splits_request = PublishSplitsRequest {
            index_uid: Some(index_uid.clone()),
            staged_split_ids: vec![split_id_1.clone()],
            index_checkpoint_delta_json_opt: Some({
                let offsets = 15..18;
                let checkpoint_delta = IndexCheckpointDelta::for_test(&source_id, offsets);
                serde_json::to_string(&checkpoint_delta).unwrap()
            }),
            ..Default::default()
        };
        let error = metastore
            .publish_splits(publish_splits_request)
            .await
            .unwrap_err();
        assert!(matches!(
            error,
            MetastoreError::FailedPrecondition {
                entity: EntityKind::Splits { .. },
                ..
            }
        ));

        cleanup_index(&mut metastore, index_uid).await;
    }

    // Publish a staged split and non-existent split on an index
    {
        let create_index_request =
            CreateIndexRequest::try_from_index_and_source_configs(&index_config, source_configs)
                .unwrap();
        let index_uid: IndexUid = metastore
            .create_index(create_index_request)
            .await
            .unwrap()
            .index_uid()
            .clone();

        let stage_splits_request =
            StageSplitsRequest::try_from_split_metadata(index_uid.clone(), &split_metadata_1)
                .unwrap();
        metastore.stage_splits(stage_splits_request).await.unwrap();

        let publish_splits_request = PublishSplitsRequest {
            index_uid: Some(index_uid.clone()),
            staged_split_ids: vec![split_id_1.clone(), "split-not-found".to_string()],
            index_checkpoint_delta_json_opt: Some({
                let offsets = 15..18;
                let checkpoint_delta = IndexCheckpointDelta::for_test(&source_id, offsets);
                serde_json::to_string(&checkpoint_delta).unwrap()
            }),
            ..Default::default()
        };
        let error = metastore
            .publish_splits(publish_splits_request)
            .await
            .unwrap_err();
        assert!(matches!(
            error,
            MetastoreError::NotFound(EntityKind::Splits { .. })
        ));

        cleanup_index(&mut metastore, index_uid).await;
    }

    // Publish a published split and non-existent split on an index
    {
        let create_index_request =
            CreateIndexRequest::try_from_index_and_source_configs(&index_config, source_configs)
                .unwrap();
        let index_uid: IndexUid = metastore
            .create_index(create_index_request)
            .await
            .unwrap()
            .index_uid()
            .clone();

        let stage_splits_request =
            StageSplitsRequest::try_from_split_metadata(index_uid.clone(), &split_metadata_1)
                .unwrap();
        metastore.stage_splits(stage_splits_request).await.unwrap();

        let publish_splits_request = PublishSplitsRequest {
            index_uid: Some(index_uid.clone()),
            staged_split_ids: vec![split_id_1.clone()],
            index_checkpoint_delta_json_opt: Some({
                let offsets = 15..18;
                let checkpoint_delta = IndexCheckpointDelta::for_test(&source_id, offsets);
                serde_json::to_string(&checkpoint_delta).unwrap()
            }),
            ..Default::default()
        };
        metastore
            .publish_splits(publish_splits_request)
            .await
            .unwrap();

        let publish_splits_request = PublishSplitsRequest {
            index_uid: Some(index_uid.clone()),
            staged_split_ids: vec![split_id_1.clone(), "split-not-found".to_string()],
            index_checkpoint_delta_json_opt: Some({
                let offsets = 18..24;
                let checkpoint_delta = IndexCheckpointDelta::for_test(&source_id, offsets);
                serde_json::to_string(&checkpoint_delta).unwrap()
            }),
            ..Default::default()
        };
        let error = metastore
            .publish_splits(publish_splits_request)
            .await
            .unwrap_err();
        assert!(matches!(
            error,
            MetastoreError::NotFound(EntityKind::Splits { .. })
        ));

        cleanup_index(&mut metastore, index_uid).await;
    }

    // Publish a non-staged split and non-existent split on an index
    {
        let create_index_request =
            CreateIndexRequest::try_from_index_and_source_configs(&index_config, source_configs)
                .unwrap();
        let index_uid: IndexUid = metastore
            .create_index(create_index_request)
            .await
            .unwrap()
            .index_uid()
            .clone();

        let stage_splits_request =
            StageSplitsRequest::try_from_split_metadata(index_uid.clone(), &split_metadata_1)
                .unwrap();
        metastore.stage_splits(stage_splits_request).await.unwrap();

        let publish_splits_request = PublishSplitsRequest {
            index_uid: Some(index_uid.clone()),
            staged_split_ids: vec![split_id_1.clone()],
            index_checkpoint_delta_json_opt: Some({
                let offsets = 18..24;
                let checkpoint_delta = IndexCheckpointDelta::for_test(&source_id, offsets);
                serde_json::to_string(&checkpoint_delta).unwrap()
            }),
            ..Default::default()
        };
        metastore
            .publish_splits(publish_splits_request)
            .await
            .unwrap();

        let mark_splits_for_deletion_request =
            MarkSplitsForDeletionRequest::new(index_uid.clone(), vec![split_id_1.clone()]);
        metastore
            .mark_splits_for_deletion(mark_splits_for_deletion_request)
            .await
            .unwrap();

        let publish_splits_request = PublishSplitsRequest {
            index_uid: Some(index_uid.clone()),
            staged_split_ids: vec![split_id_1.clone(), "split-not-found".to_string()],
            index_checkpoint_delta_json_opt: Some({
                let offsets = 24..26;
                let checkpoint_delta = IndexCheckpointDelta::for_test(&source_id, offsets);
                serde_json::to_string(&checkpoint_delta).unwrap()
            }),
            ..Default::default()
        };
        let error = metastore
            .publish_splits(publish_splits_request)
            .await
            .unwrap_err();
        assert!(matches!(
            error,
            MetastoreError::NotFound(EntityKind::Splits { .. })
        ));

        cleanup_index(&mut metastore, index_uid).await;
    }

    // Publish staged splits on an index
    {
        let create_index_request =
            CreateIndexRequest::try_from_index_and_source_configs(&index_config, source_configs)
                .unwrap();
        let index_uid: IndexUid = metastore
            .create_index(create_index_request)
            .await
            .unwrap()
            .index_uid()
            .clone();

        let stage_splits_request =
            StageSplitsRequest::try_from_split_metadata(index_uid.clone(), &split_metadata_1)
                .unwrap();
        metastore.stage_splits(stage_splits_request).await.unwrap();

        let stage_splits_request =
            StageSplitsRequest::try_from_split_metadata(index_uid.clone(), &split_metadata_2)
                .unwrap();
        metastore.stage_splits(stage_splits_request).await.unwrap();

        let publish_splits_request = PublishSplitsRequest {
            index_uid: Some(index_uid.clone()),
            staged_split_ids: vec![split_id_1.clone(), split_id_2.clone()],
            index_checkpoint_delta_json_opt: Some({
                let offsets = 24..26;
                let checkpoint_delta = IndexCheckpointDelta::for_test(&source_id, offsets);
                serde_json::to_string(&checkpoint_delta).unwrap()
            }),
            ..Default::default()
        };
        metastore
            .publish_splits(publish_splits_request)
            .await
            .unwrap();

        cleanup_index(&mut metastore, index_uid).await;
    }

    // Publish a staged split and published split on an index
    {
        let create_index_request =
            CreateIndexRequest::try_from_index_and_source_configs(&index_config, source_configs)
                .unwrap();
        let index_uid: IndexUid = metastore
            .create_index(create_index_request)
            .await
            .unwrap()
            .index_uid()
            .clone();

        let stage_splits_request = StageSplitsRequest::try_from_splits_metadata(
            index_uid.clone(),
            [split_metadata_1.clone(), split_metadata_2.clone()],
        )
        .unwrap();
        metastore.stage_splits(stage_splits_request).await.unwrap();

        let publish_splits_request = PublishSplitsRequest {
            index_uid: Some(index_uid.clone()),
            staged_split_ids: vec![split_id_2.clone()],
            index_checkpoint_delta_json_opt: Some({
                let offsets = 26..28;
                let checkpoint_delta = IndexCheckpointDelta::for_test(&source_id, offsets);
                serde_json::to_string(&checkpoint_delta).unwrap()
            }),
            ..Default::default()
        };
        metastore
            .publish_splits(publish_splits_request)
            .await
            .unwrap();

        let publish_splits_request = PublishSplitsRequest {
            index_uid: Some(index_uid.clone()),
            staged_split_ids: vec![split_id_1.clone(), split_id_2.clone()],
            index_checkpoint_delta_json_opt: Some({
                let offsets = 28..30;
                let checkpoint_delta = IndexCheckpointDelta::for_test(&source_id, offsets);
                serde_json::to_string(&checkpoint_delta).unwrap()
            }),
            ..Default::default()
        };
        let error = metastore
            .publish_splits(publish_splits_request)
            .await
            .unwrap_err();
        assert!(matches!(
            error,
            MetastoreError::FailedPrecondition {
                entity: EntityKind::Splits { .. },
                ..
            }
        ));

        cleanup_index(&mut metastore, index_uid).await;
    }

    // Publish published splits on an index
    {
        let create_index_request =
            CreateIndexRequest::try_from_index_and_source_configs(&index_config, source_configs)
                .unwrap();
        let index_uid: IndexUid = metastore
            .create_index(create_index_request)
            .await
            .unwrap()
            .index_uid()
            .clone();

        let stage_splits_request = StageSplitsRequest::try_from_splits_metadata(
            index_uid.clone(),
            [split_metadata_1.clone(), split_metadata_2.clone()],
        )
        .unwrap();
        metastore.stage_splits(stage_splits_request).await.unwrap();

        let publish_splits_request = PublishSplitsRequest {
            index_uid: Some(index_uid.clone()),
            staged_split_ids: vec![split_id_1.clone(), split_id_2.clone()],
            index_checkpoint_delta_json_opt: Some({
                let offsets = 30..31;
                let checkpoint_delta = IndexCheckpointDelta::for_test(&source_id, offsets);
                serde_json::to_string(&checkpoint_delta).unwrap()
            }),
            ..Default::default()
        };
        metastore
            .publish_splits(publish_splits_request)
            .await
            .unwrap();

        let publish_splits_request = PublishSplitsRequest {
            index_uid: Some(index_uid.clone()),
            staged_split_ids: vec![split_id_1.clone(), split_id_2.clone()],
            index_checkpoint_delta_json_opt: Some({
                let offsets = 30..31;
                let checkpoint_delta = IndexCheckpointDelta::for_test(&source_id, offsets);
                serde_json::to_string(&checkpoint_delta).unwrap()
            }),
            ..Default::default()
        };
        let error = metastore
            .publish_splits(publish_splits_request)
            .await
            .unwrap_err();
        assert!(matches!(
            error,
            MetastoreError::FailedPrecondition {
                entity: EntityKind::CheckpointDelta { .. },
                ..
            }
        ));

        cleanup_index(&mut metastore, index_uid).await;
    }
}

pub async fn test_metastore_publish_splits_concurrency<
    MetastoreToTest: MetastoreServiceExt + DefaultForTest + Clone,
>() {
    let mut metastore = MetastoreToTest::default_for_test().await;

    let index_id = append_random_suffix("test-publish-concurrency");
    let index_uri = format!("ram:///indexes/{index_id}");
    let index_config = IndexConfig::for_test(&index_id, &index_uri);
    let source_id = format!("{index_id}--source");

    let source_config = SourceConfig::for_test(&source_id, SourceParams::void());
    let create_index_request =
        CreateIndexRequest::try_from_index_and_source_configs(&index_config, &[source_config])
            .unwrap();

    let index_uid: IndexUid = metastore
        .create_index(create_index_request)
        .await
        .unwrap()
        .index_uid()
        .clone();

    let mut join_handles = Vec::with_capacity(10);

    for partition_id in 0..10 {
        let metastore_clone = metastore.clone();
        let index_id = index_id.clone();
        let source_id = source_id.clone();

        let join_handle = tokio::spawn({
            let index_uid = index_uid.clone();
            async move {
                let split_id = format!("{index_id}--split-{partition_id}");
                let split_metadata = SplitMetadata {
                    split_id: split_id.clone(),
                    index_uid: index_uid.clone(),
                    ..Default::default()
                };
                let stage_splits_request =
                    StageSplitsRequest::try_from_split_metadata(index_uid.clone(), &split_metadata)
                        .unwrap();
                metastore_clone
                    .stage_splits(stage_splits_request)
                    .await
                    .unwrap();
                let source_delta = SourceCheckpointDelta::from_partition_delta(
                    PartitionId::from(partition_id as u64),
                    Position::Beginning,
                    Position::offset(partition_id as u64),
                )
                .unwrap();
                let checkpoint_delta = IndexCheckpointDelta {
                    source_id,
                    source_delta,
                };
                let publish_splits_request = PublishSplitsRequest {
                    index_uid: Some(index_uid.clone()),
                    staged_split_ids: vec![split_id.clone()],
                    index_checkpoint_delta_json_opt: Some(
                        serde_json::to_string(&checkpoint_delta).unwrap(),
                    ),
                    ..Default::default()
                };
                metastore_clone
                    .publish_splits(publish_splits_request)
                    .await
                    .unwrap();
            }
        });
        join_handles.push(join_handle);
    }
    try_join_all(join_handles).await.unwrap();

    let index_metadata = metastore
        .index_metadata(IndexMetadataRequest::for_index_id(index_id.to_string()))
        .await
        .unwrap()
        .deserialize_index_metadata()
        .unwrap();
    let source_checkpoint = index_metadata
        .checkpoint
        .source_checkpoint(&source_id)
        .unwrap();

    assert_eq!(source_checkpoint.num_partitions(), 10);

    cleanup_index(&mut metastore, index_uid).await
}

pub async fn test_metastore_replace_splits<
    MetastoreToTest: MetastoreServiceExt + DefaultForTest,
>() {
    let mut metastore = MetastoreToTest::default_for_test().await;

    let current_timestamp = OffsetDateTime::now_utc().unix_timestamp();

    let index_id = append_random_suffix("test-replace-splits");
    let index_uid = IndexUid::new_with_random_ulid(&index_id);
    let index_uri = format!("ram:///indexes/{index_id}");
    let index_config = IndexConfig::for_test(&index_id, &index_uri);

    let split_id_1 = format!("{index_id}--split-1");
    let split_metadata_1 = SplitMetadata {
        split_id: split_id_1.clone(),
        index_uid: index_uid.clone(),
        time_range: None,
        create_timestamp: current_timestamp,
        ..Default::default()
    };

    let split_id_2 = format!("{index_id}--split-2");
    let split_metadata_2 = SplitMetadata {
        split_id: split_id_2.clone(),
        index_uid: index_uid.clone(),
        time_range: None,
        create_timestamp: current_timestamp,
        ..Default::default()
    };

    let split_id_3 = format!("{index_id}--split-3");
    let split_metadata_3 = SplitMetadata {
        split_id: split_id_3.clone(),
        index_uid: index_uid.clone(),
        time_range: None,
        create_timestamp: current_timestamp,
        ..Default::default()
    };

    // Replace splits on a non-existent index
    {
        let publish_splits_request = PublishSplitsRequest {
            index_uid: Some(IndexUid::new_with_random_ulid("index-not-found")),
            staged_split_ids: vec!["split-not-found-1".to_string()],
            replaced_split_ids: vec!["split-not-found-2".to_string()],
            ..Default::default()
        };
        let error = metastore
            .publish_splits(publish_splits_request)
            .await
            .unwrap_err();
        assert!(matches!(
            error,
            MetastoreError::NotFound(EntityKind::Index { .. })
        ));
    }

    // Replace a non-existent split on an index
    {
        let create_index_request =
            CreateIndexRequest::try_from_index_config(&index_config).unwrap();
        let index_uid: IndexUid = metastore
            .create_index(create_index_request)
            .await
            .unwrap()
            .index_uid()
            .clone();

        let publish_splits_request = PublishSplitsRequest {
            index_uid: Some(index_uid.clone()),
            staged_split_ids: vec!["split-not-found-1".to_string()],
            replaced_split_ids: vec!["split-not-found-2".to_string()],
            ..Default::default()
        };
        // TODO source id
        let error = metastore
            .publish_splits(publish_splits_request)
            .await
            .unwrap_err();
        assert!(matches!(
            error,
            MetastoreError::NotFound(EntityKind::Splits { .. })
        ));

        cleanup_index(&mut metastore, index_uid).await;
    }

    // Replace a publish split with a non existing split
    {
        let create_index_request =
            CreateIndexRequest::try_from_index_config(&index_config).unwrap();
        let index_uid: IndexUid = metastore
            .create_index(create_index_request)
            .await
            .unwrap()
            .index_uid()
            .clone();

        let stage_splits_request =
            StageSplitsRequest::try_from_split_metadata(index_uid.clone(), &split_metadata_1)
                .unwrap();
        metastore.stage_splits(stage_splits_request).await.unwrap();

        let publish_splits_request = PublishSplitsRequest {
            index_uid: Some(index_uid.clone()),
            staged_split_ids: vec![split_id_1.clone()],
            ..Default::default()
        };
        metastore
            .publish_splits(publish_splits_request)
            .await
            .unwrap();

        // TODO Source id
        let publish_splits_request = PublishSplitsRequest {
            index_uid: Some(index_uid.clone()),
            staged_split_ids: vec![split_id_2.clone()],
            replaced_split_ids: vec![split_id_1.clone()],
            ..Default::default()
        };
        let error = metastore
            .publish_splits(publish_splits_request)
            .await
            .unwrap_err();
        assert!(matches!(
            error,
            MetastoreError::NotFound(EntityKind::Splits { .. })
        ));

        cleanup_index(&mut metastore, index_uid).await;
    }

    // Replace a publish split with a deleted split
    {
        let create_index_request =
            CreateIndexRequest::try_from_index_config(&index_config).unwrap();
        let index_uid: IndexUid = metastore
            .create_index(create_index_request)
            .await
            .unwrap()
            .index_uid()
            .clone();

        let stage_splits_request = StageSplitsRequest::try_from_splits_metadata(
            index_uid.clone(),
            [split_metadata_1.clone(), split_metadata_2.clone()],
        )
        .unwrap();
        metastore.stage_splits(stage_splits_request).await.unwrap();

        let publish_splits_request = PublishSplitsRequest {
            index_uid: Some(index_uid.clone()),
            staged_split_ids: vec![split_id_1.clone(), split_id_2.clone()],
            ..Default::default()
        };
        metastore
            .publish_splits(publish_splits_request)
            .await
            .unwrap();

        let mark_splits_for_deletion_request =
            MarkSplitsForDeletionRequest::new(index_uid.clone(), vec![split_id_2.clone()]);
        metastore
            .mark_splits_for_deletion(mark_splits_for_deletion_request)
            .await
            .unwrap();

        // TODO source_id
        let publish_splits_request = PublishSplitsRequest {
            index_uid: Some(index_uid.clone()),
            staged_split_ids: vec![split_id_2.clone()],
            replaced_split_ids: vec![split_id_1.clone()],
            ..Default::default()
        };
        let error = metastore
            .publish_splits(publish_splits_request)
            .await
            .unwrap_err();
        assert!(matches!(
            error,
            MetastoreError::FailedPrecondition {
                entity: EntityKind::Splits { .. },
                ..
            }
        ));

        cleanup_index(&mut metastore, index_uid).await;
    }

    // Replace a publish split with mixed splits
    {
        let create_index_request =
            CreateIndexRequest::try_from_index_config(&index_config).unwrap();
        let index_uid: IndexUid = metastore
            .create_index(create_index_request)
            .await
            .unwrap()
            .index_uid()
            .clone();

        let stage_splits_request =
            StageSplitsRequest::try_from_split_metadata(index_uid.clone(), &split_metadata_1)
                .unwrap();
        metastore.stage_splits(stage_splits_request).await.unwrap();

        let publish_splits_request = PublishSplitsRequest {
            index_uid: Some(index_uid.clone()),
            staged_split_ids: vec![split_id_1.clone()],
            ..Default::default()
        };
        metastore
            .publish_splits(publish_splits_request)
            .await
            .unwrap();

        let stage_splits_request =
            StageSplitsRequest::try_from_split_metadata(index_uid.clone(), &split_metadata_2)
                .unwrap();
        metastore.stage_splits(stage_splits_request).await.unwrap();

        let publish_splits_request = PublishSplitsRequest {
            index_uid: Some(index_uid.clone()),
            staged_split_ids: vec![split_id_2.clone(), split_id_3.clone()],
            replaced_split_ids: vec![split_id_1.clone()],
            ..Default::default()
        };
        let error = metastore
            .publish_splits(publish_splits_request) // TODO source id
            .await
            .unwrap_err();
        assert!(matches!(
            error,
            MetastoreError::NotFound(EntityKind::Splits { .. })
        ));

        cleanup_index(&mut metastore, index_uid).await;
    }

    // Replace a deleted split with a new split
    {
        let create_index_request =
            CreateIndexRequest::try_from_index_config(&index_config).unwrap();
        let index_uid: IndexUid = metastore
            .create_index(create_index_request)
            .await
            .unwrap()
            .index_uid()
            .clone();

        let stage_splits_request =
            StageSplitsRequest::try_from_split_metadata(index_uid.clone(), &split_metadata_1)
                .unwrap();
        metastore.stage_splits(stage_splits_request).await.unwrap();

        let publish_splits_request = PublishSplitsRequest {
            index_uid: Some(index_uid.clone()),
            staged_split_ids: vec![split_id_1.clone()],
            ..Default::default()
        };
        metastore
            .publish_splits(publish_splits_request)
            .await
            .unwrap();

        let mark_splits_for_deletion_request =
            MarkSplitsForDeletionRequest::new(index_uid.clone(), vec![split_id_1.clone()]);
        metastore
            .mark_splits_for_deletion(mark_splits_for_deletion_request)
            .await
            .unwrap();

        let stage_splits_request =
            StageSplitsRequest::try_from_split_metadata(index_uid.clone(), &split_metadata_2)
                .unwrap();
        metastore.stage_splits(stage_splits_request).await.unwrap();

        let publish_splits_request = PublishSplitsRequest {
            index_uid: Some(index_uid.clone()),
            staged_split_ids: vec![split_id_2.clone()],
            replaced_split_ids: vec![split_id_1.clone()],
            ..Default::default()
        };
        let error = metastore
            .publish_splits(publish_splits_request)
            .await
            .unwrap_err();
        assert!(
            matches!(error, MetastoreError::FailedPrecondition { entity: EntityKind::Splits { split_ids }, .. } if split_ids == [split_id_1.clone()])
        );

        cleanup_index(&mut metastore, index_uid).await;
    }

    // Replace a publish split with staged splits
    {
        let create_index_request =
            CreateIndexRequest::try_from_index_config(&index_config).unwrap();
        let index_uid: IndexUid = metastore
            .create_index(create_index_request)
            .await
            .unwrap()
            .index_uid()
            .clone();

        let stage_splits_request =
            StageSplitsRequest::try_from_split_metadata(index_uid.clone(), &split_metadata_1)
                .unwrap();
        metastore.stage_splits(stage_splits_request).await.unwrap();

        let publish_splits_request = PublishSplitsRequest {
            index_uid: Some(index_uid.clone()),
            staged_split_ids: vec![split_id_1.clone()],
            ..Default::default()
        };
        metastore
            .publish_splits(publish_splits_request)
            .await
            .unwrap();

        let stage_splits_request = StageSplitsRequest::try_from_splits_metadata(
            index_uid.clone(),
            [split_metadata_2.clone(), split_metadata_3.clone()],
        )
        .unwrap();
        metastore.stage_splits(stage_splits_request).await.unwrap();

        // TODO Source id
        let publish_splits_request = PublishSplitsRequest {
            index_uid: Some(index_uid.clone()),
            staged_split_ids: vec![split_id_2.clone(), split_id_3.clone()],
            replaced_split_ids: vec![split_id_1.clone()],
            ..Default::default()
        };
        metastore
            .publish_splits(publish_splits_request)
            .await
            .unwrap();

        cleanup_index(&mut metastore, index_uid).await;
    }
}

pub async fn test_metastore_mark_splits_for_deletion<
    MetastoreToTest: MetastoreServiceExt + DefaultForTest,
>() {
    let mut metastore = MetastoreToTest::default_for_test().await;

    let current_timestamp = OffsetDateTime::now_utc().unix_timestamp();

    let index_id = append_random_suffix("test-mark-splits-for-deletion");
    let index_uri = format!("ram:///indexes/{index_id}");
    let index_config = IndexConfig::for_test(&index_id, &index_uri);
    let create_index_request = CreateIndexRequest::try_from_index_config(&index_config).unwrap();

    let index_uid: IndexUid = metastore
        .create_index(create_index_request)
        .await
        .unwrap()
        .index_uid()
        .clone();

    let mark_splits_for_deletion_request = MarkSplitsForDeletionRequest::new(
        "index-not-found:00000000000000000000000000"
            .parse()
            .unwrap(),
        Vec::new(),
    );
    let error = metastore
        .mark_splits_for_deletion(mark_splits_for_deletion_request)
        .await
        .unwrap_err();
    assert!(matches!(
        error,
        MetastoreError::NotFound(EntityKind::Index { .. })
    ));

    let mark_splits_for_deletion_request =
        MarkSplitsForDeletionRequest::new(index_uid.clone(), vec!["split-not-found".to_string()]);
    metastore
        .mark_splits_for_deletion(mark_splits_for_deletion_request)
        .await
        .unwrap();

    let split_id_1 = format!("{index_id}--split-1");
    let split_metadata_1 = SplitMetadata {
        split_id: split_id_1.clone(),
        index_uid: index_uid.clone(),
        create_timestamp: current_timestamp,
        ..Default::default()
    };
    let stage_splits_request =
        StageSplitsRequest::try_from_split_metadata(index_uid.clone(), &split_metadata_1).unwrap();
    metastore.stage_splits(stage_splits_request).await.unwrap();

    let split_id_2 = format!("{index_id}--split-2");
    let split_metadata_2 = SplitMetadata {
        split_id: split_id_2.clone(),
        index_uid: index_uid.clone(),
        create_timestamp: current_timestamp,
        ..Default::default()
    };
    let stage_splits_request =
        StageSplitsRequest::try_from_split_metadata(index_uid.clone(), &split_metadata_2).unwrap();
    metastore.stage_splits(stage_splits_request).await.unwrap();
    let publish_splits_request = PublishSplitsRequest {
        index_uid: Some(index_uid.clone()),
        staged_split_ids: vec![split_id_2.clone()],
        ..Default::default()
    };
    metastore
        .publish_splits(publish_splits_request)
        .await
        .unwrap();

    let split_id_3 = format!("{index_id}--split-3");
    let split_metadata_3 = SplitMetadata {
        split_id: split_id_3.clone(),
        index_uid: index_uid.clone(),
        create_timestamp: current_timestamp,
        ..Default::default()
    };
    let stage_splits_request =
        StageSplitsRequest::try_from_split_metadata(index_uid.clone(), &split_metadata_3).unwrap();
    metastore.stage_splits(stage_splits_request).await.unwrap();
    let publish_splits_request = PublishSplitsRequest {
        index_uid: Some(index_uid.clone()),
        staged_split_ids: vec![split_id_3.clone()],
        ..Default::default()
    };
    metastore
        .publish_splits(publish_splits_request)
        .await
        .unwrap();

    // Sleep for 1s so we can observe the timestamp update.
    sleep(Duration::from_secs(1)).await;

    let mark_splits_for_deletion_request =
        MarkSplitsForDeletionRequest::new(index_uid.clone(), vec![split_id_3.clone()]);
    metastore
        .mark_splits_for_deletion(mark_splits_for_deletion_request)
        .await
        .unwrap();

    let list_splits_request = ListSplitsRequest::try_from_list_splits_query(
        &ListSplitsQuery::for_index(index_uid.clone())
            .with_split_state(SplitState::MarkedForDeletion),
    )
    .unwrap();
    let marked_splits = metastore
        .list_splits(list_splits_request)
        .await
        .unwrap()
        .collect_splits()
        .await
        .unwrap();

    assert_eq!(marked_splits.len(), 1);
    assert_eq!(marked_splits[0].split_id(), split_id_3);

    let split_3_update_timestamp = marked_splits[0].update_timestamp;
    assert!(current_timestamp < split_3_update_timestamp);

    // Sleep for 1s so we can observe the timestamp update.
    sleep(Duration::from_secs(1)).await;

    let mark_splits_for_deletion_request = MarkSplitsForDeletionRequest::new(
        index_uid.clone(),
        vec![
            split_id_1.clone(),
            split_id_2.clone(),
            split_id_3.clone(),
            "split-not-found".to_string(),
        ],
    );
    metastore
        .mark_splits_for_deletion(mark_splits_for_deletion_request)
        .await
        .unwrap();

    let list_splits_request = ListSplitsRequest::try_from_list_splits_query(
        &ListSplitsQuery::for_index(index_uid.clone())
            .with_split_state(SplitState::MarkedForDeletion),
    )
    .unwrap();
    let mut marked_splits = metastore
        .list_splits(list_splits_request)
        .await
        .unwrap()
        .collect_splits()
        .await
        .unwrap();

    marked_splits.sort_by_key(|split| split.split_id().to_string());

    assert_eq!(marked_splits.len(), 3);

    assert_eq!(marked_splits[0].split_id(), split_id_1);
    assert!(current_timestamp + 2 <= marked_splits[0].update_timestamp);

    assert_eq!(marked_splits[1].split_id(), split_id_2);
    assert!(current_timestamp + 2 <= marked_splits[1].update_timestamp);

    assert_eq!(marked_splits[2].split_id(), split_id_3);
    assert_eq!(marked_splits[2].update_timestamp, split_3_update_timestamp);

    cleanup_index(&mut metastore, index_uid).await;
}

pub async fn test_metastore_delete_splits<MetastoreToTest: MetastoreServiceExt + DefaultForTest>() {
    let mut metastore = MetastoreToTest::default_for_test().await;

    let index_id = append_random_suffix("test-delete-splits");
    let index_uri = format!("ram:///indexes/{index_id}");
    let index_config = IndexConfig::for_test(&index_id, &index_uri);

    let create_index_request = CreateIndexRequest::try_from_index_config(&index_config).unwrap();
    let index_uid: IndexUid = metastore
        .create_index(create_index_request)
        .await
        .unwrap()
        .index_uid()
        .clone();

    let delete_splits_request = DeleteSplitsRequest {
        index_uid: Some(IndexUid::new_with_random_ulid("index-not-found")),
        split_ids: Vec::new(),
    };
    let error = metastore
        .delete_splits(delete_splits_request)
        .await
        .unwrap_err();

    assert!(matches!(
        error,
        MetastoreError::NotFound(EntityKind::Index { .. })
    ));

    let index_not_existing_uid = IndexUid::new_with_random_ulid(&index_id);
    // Check error if index does not exist.
    let delete_splits_request = DeleteSplitsRequest {
        index_uid: Some(index_not_existing_uid),
        split_ids: Vec::new(),
    };
    let error = metastore
        .delete_splits(delete_splits_request)
        .await
        .unwrap_err();

    assert!(matches!(
        error,
        MetastoreError::NotFound(EntityKind::Index { .. })
    ));

    let delete_splits_request = DeleteSplitsRequest {
        index_uid: Some(index_uid.clone()),
        split_ids: vec!["split-not-found".to_string()],
    };
    metastore
        .delete_splits(delete_splits_request)
        .await
        .unwrap();

    let split_id_1 = format!("{index_id}--split-1");
    let split_metadata_1 = SplitMetadata {
        split_id: split_id_1.clone(),
        index_uid: index_uid.clone(),
        ..Default::default()
    };
    let stage_splits_request =
        StageSplitsRequest::try_from_split_metadata(index_uid.clone(), &split_metadata_1).unwrap();
    metastore.stage_splits(stage_splits_request).await.unwrap();
    let publish_splits_request = PublishSplitsRequest {
        index_uid: Some(index_uid.clone()),
        staged_split_ids: vec![split_id_1.clone()],
        ..Default::default()
    };
    metastore
        .publish_splits(publish_splits_request)
        .await
        .unwrap();

    let split_id_2 = format!("{index_id}--split-2");
    let split_metadata_2 = SplitMetadata {
        split_id: split_id_2.clone(),
        index_uid: index_uid.clone(),
        ..Default::default()
    };
    let stage_splits_request =
        StageSplitsRequest::try_from_split_metadata(index_uid.clone(), &split_metadata_2).unwrap();
    metastore.stage_splits(stage_splits_request).await.unwrap();

    let delete_splits_request = DeleteSplitsRequest {
        index_uid: Some(index_uid.clone()),
        split_ids: vec![split_id_1.clone(), split_id_2.clone()],
    };
    let error = metastore
        .delete_splits(delete_splits_request)
        .await
        .unwrap_err();

    assert!(matches!(
        error,
        MetastoreError::FailedPrecondition {
            entity: EntityKind::Splits { .. },
            ..
        }
    ));

    assert_eq!(
        metastore
            .list_splits(ListSplitsRequest::try_from_index_uid(index_uid.clone()).unwrap())
            .await
            .unwrap()
            .collect_splits()
            .await
            .unwrap()
            .len(),
        2
    );

    let mark_splits_for_deletion_request = MarkSplitsForDeletionRequest::new(
        index_uid.clone(),
        vec![split_id_1.clone(), split_id_2.clone()],
    );
    metastore
        .mark_splits_for_deletion(mark_splits_for_deletion_request)
        .await
        .unwrap();

    let delete_splits_request = DeleteSplitsRequest {
        index_uid: Some(index_uid.clone()),
        split_ids: vec![
            split_id_1.clone(),
            split_id_2.clone(),
            "split-not-found".to_string(),
        ],
    };
    metastore
        .delete_splits(delete_splits_request)
        .await
        .unwrap();

    assert_eq!(
        metastore
            .list_splits(ListSplitsRequest::try_from_index_uid(index_uid.clone()).unwrap())
            .await
            .unwrap()
            .collect_splits()
            .await
            .unwrap()
            .len(),
        0
    );

    cleanup_index(&mut metastore, index_uid).await;
}

pub async fn test_metastore_split_update_timestamp<
    MetastoreToTest: MetastoreServiceExt + DefaultForTest,
>() {
    let mut metastore = MetastoreToTest::default_for_test().await;

    let mut current_timestamp = OffsetDateTime::now_utc().unix_timestamp();

    let index_id = append_random_suffix("split-update-timestamp");
    let index_uid = IndexUid::new_with_random_ulid(&index_id);
    let index_uri = format!("ram:///indexes/{index_id}");
    let index_config = IndexConfig::for_test(&index_id, &index_uri);

    let source_id = format!("{index_id}--source");
    let source_config = SourceConfig::for_test(&source_id, SourceParams::void());

    let split_id = format!("{index_id}--split");
    let split_metadata = SplitMetadata {
        split_id: split_id.clone(),
        index_uid: index_uid.clone(),
        create_timestamp: current_timestamp,
        ..Default::default()
    };

    // Create an index
    let create_index_request =
        CreateIndexRequest::try_from_index_and_source_configs(&index_config, &[source_config])
            .unwrap();
    let index_uid: IndexUid = metastore
        .create_index(create_index_request)
        .await
        .unwrap()
        .index_uid()
        .clone();

    // wait for 1s, stage split & check `update_timestamp`
    sleep(Duration::from_secs(1)).await;
    let stage_splits_request =
        StageSplitsRequest::try_from_splits_metadata(index_uid.clone(), [split_metadata.clone()])
            .unwrap();
    metastore.stage_splits(stage_splits_request).await.unwrap();

    sleep(Duration::from_secs(1)).await;
    let split_meta = metastore
        .list_splits(ListSplitsRequest::try_from_index_uid(index_uid.clone()).unwrap())
        .await
        .unwrap()
        .collect_splits()
        .await
        .unwrap()[0]
        .clone();
    assert!(split_meta.update_timestamp > current_timestamp);
    assert!(split_meta.publish_timestamp.is_none());

    current_timestamp = split_meta.update_timestamp;

    // wait for 1s, publish split & check `update_timestamp`
    sleep(Duration::from_secs(1)).await;
    let publish_splits_request = PublishSplitsRequest {
        index_uid: Some(index_uid.clone()),
        staged_split_ids: vec![split_id.clone()],
        index_checkpoint_delta_json_opt: Some({
            let offsets = 0..5;
            let checkpoint_delta = IndexCheckpointDelta::for_test(&source_id, offsets);
            serde_json::to_string(&checkpoint_delta).unwrap()
        }),
        ..Default::default()
    };
    metastore
        .publish_splits(publish_splits_request)
        .await
        .unwrap();
    let split_meta = metastore
        .list_splits(ListSplitsRequest::try_from_index_uid(index_uid.clone()).unwrap())
        .await
        .unwrap()
        .collect_splits()
        .await
        .unwrap()[0]
        .clone();
    assert!(split_meta.update_timestamp > current_timestamp);
    assert_eq!(
        split_meta.publish_timestamp,
        Some(split_meta.update_timestamp)
    );
    current_timestamp = split_meta.update_timestamp;

    // wait for 1s, mark split for deletion & check `update_timestamp`
    sleep(Duration::from_secs(1)).await;
    let mark_splits_for_deletion_request =
        MarkSplitsForDeletionRequest::new(index_uid.clone(), vec![split_id.clone()]);
    metastore
        .mark_splits_for_deletion(mark_splits_for_deletion_request)
        .await
        .unwrap();
    let split_meta = metastore
        .list_splits(ListSplitsRequest::try_from_index_uid(index_uid.clone()).unwrap())
        .await
        .unwrap()
        .collect_splits()
        .await
        .unwrap()[0]
        .clone();
    assert!(split_meta.update_timestamp > current_timestamp);
    assert!(split_meta.publish_timestamp.is_some());

    cleanup_index(&mut metastore, index_uid).await;
}

pub async fn test_metastore_stage_splits<MetastoreToTest: MetastoreServiceExt + DefaultForTest>() {
    let mut metastore = MetastoreToTest::default_for_test().await;
    let current_timestamp = OffsetDateTime::now_utc().unix_timestamp();
    let index_id = append_random_suffix("test-stage-splits");
    let index_uid = IndexUid::new_with_random_ulid(&index_id);
    let index_uri = format!("ram:///indexes/{index_id}");
    let index_config = IndexConfig::for_test(&index_id, &index_uri);

    let split_id_1 = format!("{index_id}--split-1");
    let split_metadata_1 = SplitMetadata {
        split_id: split_id_1.clone(),
        index_uid: index_uid.clone(),
        create_timestamp: current_timestamp,
        delete_opstamp: 20,
        node_id: "node-1".to_string(),
        ..Default::default()
    };
    let split_id_2 = format!("{index_id}--split-2");
    let split_metadata_2 = SplitMetadata {
        split_id: split_id_2.clone(),
        index_uid: index_uid.clone(),
        create_timestamp: current_timestamp,
        delete_opstamp: 10,
        node_id: "node-2".to_string(),
        ..Default::default()
    };

    // Stage a splits on a non-existent index
    let stage_splits_request = StageSplitsRequest::try_from_splits_metadata(
        IndexUid::new_with_random_ulid("index-not-found"),
        [split_metadata_1.clone()],
    )
    .unwrap();
    let error = metastore
        .stage_splits(stage_splits_request)
        .await
        .unwrap_err();
    assert!(matches!(
        error,
        MetastoreError::NotFound(EntityKind::Index { .. })
    ));

    let create_index_request = CreateIndexRequest::try_from_index_config(&index_config).unwrap();
    let index_uid: IndexUid = metastore
        .create_index(create_index_request)
        .await
        .unwrap()
        .index_uid()
        .clone();

    // Stage a split on an index
    let stage_splits_request = StageSplitsRequest::try_from_splits_metadata(
        index_uid.clone(),
        [split_metadata_1.clone(), split_metadata_2.clone()],
    )
    .unwrap();
    metastore.stage_splits(stage_splits_request).await.unwrap();

    let query = ListSplitsQuery::for_index(index_uid.clone()).with_split_state(SplitState::Staged);
    let mut splits = metastore
        .list_splits(ListSplitsRequest::try_from_list_splits_query(&query).unwrap())
        .await
        .unwrap()
        .collect_splits()
        .await
        .unwrap();

    assert_eq!(splits.len(), 2);
    splits.sort_unstable_by(|left, right| left.split_id().cmp(right.split_id()));

    assert_eq!(splits[0].split_id(), &split_id_1);
    assert_eq!(splits[0].split_metadata.node_id, "node-1");

    assert_eq!(splits[1].split_id(), &split_id_2);
    assert_eq!(splits[1].split_metadata.node_id, "node-2");

    // Stage a existent-staged-split on an index
    let stage_splits_request =
        StageSplitsRequest::try_from_splits_metadata(index_uid.clone(), [split_metadata_1.clone()])
            .unwrap();
    metastore
        .stage_splits(stage_splits_request)
        .await
        .expect("Pre-existing staged splits should be updated.");

    let publish_splits_request = PublishSplitsRequest {
        index_uid: Some(index_uid.clone()),
        staged_split_ids: vec![split_id_1.clone(), split_id_2.clone()],
        ..Default::default()
    };
    metastore
        .publish_splits(publish_splits_request)
        .await
        .unwrap();
    let stage_splits_request =
        StageSplitsRequest::try_from_splits_metadata(index_uid.clone(), [split_metadata_1.clone()])
            .unwrap();
    let error = metastore
        .stage_splits(stage_splits_request)
        .await
        .expect_err("Metastore should not allow splits which are not `Staged` to be overwritten.");
    assert!(matches!(
        error,
        MetastoreError::FailedPrecondition {
            entity: EntityKind::Splits { .. },
            ..
        }
    ),);

    let mark_splits_for_deletion_request =
        MarkSplitsForDeletionRequest::new(index_uid.clone(), vec![split_id_2.clone()]);
    metastore
        .mark_splits_for_deletion(mark_splits_for_deletion_request)
        .await
        .unwrap();
    let stage_splits_request =
        StageSplitsRequest::try_from_splits_metadata(index_uid.clone(), [split_metadata_2.clone()])
            .unwrap();
    let error = metastore
        .stage_splits(stage_splits_request)
        .await
        .expect_err("Metastore should not allow splits which are not `Staged` to be overwritten.");
    assert!(matches!(
        error,
        MetastoreError::FailedPrecondition {
            entity: EntityKind::Splits { .. },
            ..
        }
    ),);

    cleanup_index(&mut metastore, index_uid).await;
}

pub async fn test_metastore_update_splits_delete_opstamp<
    MetastoreToTest: MetastoreServiceExt + DefaultForTest,
>() {
    let mut metastore = MetastoreToTest::default_for_test().await;
    let current_timestamp = OffsetDateTime::now_utc().unix_timestamp();
    let index_id = append_random_suffix("update-splits-delete-opstamp");
    let index_uid = IndexUid::new_with_random_ulid(&index_id);
    let index_uri = format!("ram:///indexes/{index_id}");
    let index_config = IndexConfig::for_test(&index_id, &index_uri);

    let split_id_1 = format!("{index_id}--split-1");
    let split_metadata_1 = SplitMetadata {
        split_id: split_id_1.clone(),
        index_uid: index_uid.clone(),
        create_timestamp: current_timestamp,
        delete_opstamp: 20,
        ..Default::default()
    };
    let split_id_2 = format!("{index_id}--split-2");
    let split_metadata_2 = SplitMetadata {
        split_id: split_id_2.clone(),
        index_uid: index_uid.clone(),
        create_timestamp: current_timestamp,
        delete_opstamp: 10,
        ..Default::default()
    };
    let split_id_3 = format!("{index_id}--split-3");
    let split_metadata_3 = SplitMetadata {
        split_id: split_id_3.clone(),
        index_uid: index_uid.clone(),
        create_timestamp: current_timestamp,
        delete_opstamp: 0,
        ..Default::default()
    };

    {
        info!("update splits delete opstamp on a non-existent index");
        let update_splits_delete_opstamp_request = UpdateSplitsDeleteOpstampRequest {
            index_uid: Some(IndexUid::new_with_random_ulid("index-not-found")),
            split_ids: vec![split_id_1.clone()],
            delete_opstamp: 10,
        };
        let metastore_err = metastore
            .update_splits_delete_opstamp(update_splits_delete_opstamp_request)
            .await
            .unwrap_err();
        error!(err=?metastore_err);
        assert!(matches!(
            metastore_err,
            MetastoreError::NotFound(EntityKind::Index { .. })
        ));
    }

    {
        info!("update splits delete opstamp on an index");
        let create_index_request =
            CreateIndexRequest::try_from_index_config(&index_config).unwrap();
        let index_uid: IndexUid = metastore
            .create_index(create_index_request)
            .await
            .unwrap()
            .index_uid()
            .clone();

        let stage_splits_request = StageSplitsRequest::try_from_splits_metadata(
            index_uid.clone(),
            [split_metadata_1, split_metadata_2, split_metadata_3],
        )
        .unwrap();
        metastore.stage_splits(stage_splits_request).await.unwrap();
        let publish_splits_request = PublishSplitsRequest {
            index_uid: Some(index_uid.clone()),
            staged_split_ids: vec![split_id_1.clone(), split_id_2.clone()],
            ..Default::default()
        };
        metastore
            .publish_splits(publish_splits_request)
            .await
            .unwrap();

        let list_stale_splits_request = ListStaleSplitsRequest {
            index_uid: Some(index_uid.clone()),
            delete_opstamp: 100,
            num_splits: 2,
        };
        let splits = metastore
            .list_stale_splits(list_stale_splits_request)
            .await
            .unwrap()
            .deserialize_splits()
            .await
            .unwrap();
        assert_eq!(splits.len(), 2);

        let update_splits_delete_opstamp_request = UpdateSplitsDeleteOpstampRequest {
            index_uid: Some(index_uid.clone()),
            split_ids: vec![split_id_1.clone(), split_id_2.clone()],
            delete_opstamp: 100,
        };
        metastore
            .update_splits_delete_opstamp(update_splits_delete_opstamp_request)
            .await
            .unwrap();

        let list_stale_splits_request = ListStaleSplitsRequest {
            index_uid: Some(index_uid.clone()),
            delete_opstamp: 100,
            num_splits: 2,
        };
        let splits = metastore
            .list_stale_splits(list_stale_splits_request)
            .await
            .unwrap()
            .deserialize_splits()
            .await
            .unwrap();
        assert_eq!(splits.len(), 0);

        let list_stale_splits_request = ListStaleSplitsRequest {
            index_uid: Some(index_uid.clone()),
            delete_opstamp: 200,
            num_splits: 2,
        };
        let splits = metastore
            .list_stale_splits(list_stale_splits_request)
            .await
            .unwrap()
            .deserialize_splits()
            .await
            .unwrap();
        assert_eq!(splits.len(), 2);
        assert_eq!(splits[0].split_metadata.delete_opstamp, 100);
        assert_eq!(splits[1].split_metadata.delete_opstamp, 100);

        cleanup_index(&mut metastore, index_uid).await;
    }
}


================================================
FILE: quickwit/quickwit-metastore/src/tests/template.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use quickwit_common::rand::append_random_suffix;
use quickwit_config::IndexTemplate;
use quickwit_proto::metastore::{
    CreateIndexTemplateRequest, DeleteIndexTemplatesRequest, EntityKind,
    FindIndexTemplateMatchesRequest, GetIndexTemplateRequest, ListIndexTemplatesRequest,
    MetastoreError, MetastoreResult, MetastoreService, serde_utils,
};

use super::DefaultForTest;
use crate::MetastoreServiceExt;

async fn list_all_index_templates(
    metastore: &mut dyn MetastoreService,
) -> MetastoreResult<Vec<IndexTemplate>> {
    let list_index_templates_request = ListIndexTemplatesRequest {};
    let list_index_templates_response = metastore
        .list_index_templates(list_index_templates_request)
        .await?;
    list_index_templates_response
        .index_templates_json
        .into_iter()
        .map(|index_template_json| serde_utils::from_json_str(&index_template_json))
        .collect()
}

async fn cleanup_templates(metastore: &mut dyn MetastoreService) {
    let template_ids = list_all_index_templates(metastore)
        .await
        .unwrap()
        .into_iter()
        .map(|index_template| index_template.template_id)
        .collect::<Vec<_>>();

    let delete_templates_request = DeleteIndexTemplatesRequest { template_ids };
    metastore
        .delete_index_templates(delete_templates_request)
        .await
        .unwrap();
}

pub async fn test_metastore_create_index_template<
    MetastoreUnderTest: MetastoreService + MetastoreServiceExt + DefaultForTest,
>() {
    let mut metastore = MetastoreUnderTest::default_for_test().await;
    cleanup_templates(&mut metastore).await;

    let template_id = append_random_suffix("test-create-template");
    let index_template = IndexTemplate::for_test(&template_id, &["test-template-*"], 100);
    let index_template_json = serde_json::to_string(&index_template).unwrap();

    let create_index_template_request = CreateIndexTemplateRequest {
        index_template_json: index_template_json.clone(),
        overwrite: false,
    };
    metastore
        .create_index_template(create_index_template_request)
        .await
        .unwrap();

    let index_templates = list_all_index_templates(&mut metastore).await.unwrap();
    assert_eq!(index_templates.len(), 1);

    assert_eq!(index_templates[0].template_id, template_id);
    assert_eq!(index_templates[0].index_id_patterns, ["test-template-*"]);
    assert_eq!(index_templates[0].priority, 100);

    let create_index_template_request = CreateIndexTemplateRequest {
        index_template_json: index_template_json.clone(),
        overwrite: false,
    };
    let error = metastore
        .create_index_template(create_index_template_request)
        .await
        .unwrap_err();
    assert!(
        matches!(error, MetastoreError::AlreadyExists(EntityKind::IndexTemplate { template_id }) if template_id.starts_with("test-create-template"))
    );

    let index_template = IndexTemplate::for_test(&template_id, &["test-template-*"], 200);
    let index_template_json = serde_json::to_string(&index_template).unwrap();

    let create_index_template_request = CreateIndexTemplateRequest {
        index_template_json: index_template_json.clone(),
        overwrite: true,
    };
    metastore
        .create_index_template(create_index_template_request)
        .await
        .unwrap();

    let index_templates = list_all_index_templates(&mut metastore).await.unwrap();
    assert_eq!(index_templates.len(), 1);

    let index_templates = list_all_index_templates(&mut metastore).await.unwrap();
    assert_eq!(index_templates.len(), 1);
    assert_eq!(index_templates[0].priority, 200);
}

pub async fn test_metastore_get_index_template<
    MetastoreUnderTest: MetastoreService + MetastoreServiceExt + DefaultForTest,
>() {
    let mut metastore = MetastoreUnderTest::default_for_test().await;
    cleanup_templates(&mut metastore).await;

    let template_id = append_random_suffix("test-get-template");
    let index_template = IndexTemplate::for_test(&template_id, &["test-template"], 100);
    let index_template_json = serde_json::to_string(&index_template).unwrap();

    let get_index_template_request = GetIndexTemplateRequest {
        template_id: template_id.clone(),
    };
    let error = metastore
        .get_index_template(get_index_template_request.clone())
        .await
        .unwrap_err();
    assert!(
        matches!(error, MetastoreError::NotFound(EntityKind::IndexTemplate { template_id }) if template_id.starts_with("test-get-template"))
    );

    let create_index_template_request = CreateIndexTemplateRequest {
        index_template_json,
        overwrite: false,
    };
    metastore
        .create_index_template(create_index_template_request)
        .await
        .unwrap();

    let get_index_template_response = metastore
        .get_index_template(get_index_template_request.clone())
        .await
        .unwrap();
    let index_template: IndexTemplate =
        serde_utils::from_json_str(&get_index_template_response.index_template_json).unwrap();

    assert_eq!(index_template.template_id, template_id);
    assert_eq!(index_template.index_id_patterns, ["test-template"]);
    assert_eq!(index_template.priority, 100);
}

pub async fn test_metastore_find_index_template_matches<
    MetastoreUnderTest: MetastoreService + MetastoreServiceExt + DefaultForTest,
>() {
    let mut metastore = MetastoreUnderTest::default_for_test().await;
    cleanup_templates(&mut metastore).await;

    let foo_template_id = append_random_suffix("test-template-foo");
    let foo_index_template = IndexTemplate::for_test(
        &foo_template_id,
        &["test-index-foo*", "-test-index-fool"],
        200,
    );
    let foo_index_template_json = serde_json::to_string(&foo_index_template).unwrap();

    let create_index_template_request = CreateIndexTemplateRequest {
        index_template_json: foo_index_template_json,
        overwrite: false,
    };
    metastore
        .create_index_template(create_index_template_request)
        .await
        .unwrap();

    let foobar_template_id = append_random_suffix("test-template-foobar");
    let foobar_index_template =
        IndexTemplate::for_test(&foobar_template_id, &["test-index-foobar*"], 100);
    let foobar_index_template_json = serde_json::to_string(&foobar_index_template).unwrap();

    let create_index_template_request = CreateIndexTemplateRequest {
        index_template_json: foobar_index_template_json,
        overwrite: false,
    };
    metastore
        .create_index_template(create_index_template_request)
        .await
        .unwrap();

    let bar_template_id = append_random_suffix("test-template-bar");
    let bar_index_template = IndexTemplate::for_test(&bar_template_id, &["test-index-bar*"], 100);
    let bar_index_template_json = serde_json::to_string(&bar_index_template).unwrap();

    let create_index_template_request = CreateIndexTemplateRequest {
        index_template_json: bar_index_template_json,
        overwrite: false,
    };
    metastore
        .create_index_template(create_index_template_request)
        .await
        .unwrap();

    let find_index_template_matches = FindIndexTemplateMatchesRequest {
        index_ids: vec![
            "test-index-foo".to_string(),
            "test-index-fool".to_string(),
            "test-index-foobar".to_string(),
            "test-index-bar".to_string(),
            "test-index-qux".to_string(),
        ],
    };
    let find_index_template_matches_response = metastore
        .find_index_template_matches(find_index_template_matches)
        .await
        .unwrap();
    let mut matches = find_index_template_matches_response.matches;
    matches.sort_unstable_by(|left, right| left.index_id.cmp(&right.index_id));

    assert_eq!(matches.len(), 3);

    assert_eq!(matches[0].index_id, "test-index-bar");
    assert_eq!(matches[0].template_id, bar_template_id);

    assert_eq!(matches[1].index_id, "test-index-foo");
    assert_eq!(matches[1].template_id, foo_template_id);

    assert_eq!(matches[2].index_id, "test-index-foobar");
    assert_eq!(matches[2].template_id, foo_template_id);
}

pub async fn test_metastore_list_index_templates<
    MetastoreUnderTest: MetastoreService + MetastoreServiceExt + DefaultForTest,
>() {
    let mut metastore = MetastoreUnderTest::default_for_test().await;
    cleanup_templates(&mut metastore).await;

    let list_index_templates_request = ListIndexTemplatesRequest {};
    let list_index_templates_response = metastore
        .list_index_templates(list_index_templates_request)
        .await
        .unwrap();
    assert_eq!(list_index_templates_response.index_templates_json.len(), 0);

    let template_id = append_random_suffix("test-list-template");
    let index_template = IndexTemplate::for_test(&template_id, &["test-template"], 100);
    let index_template_json = serde_json::to_string(&index_template).unwrap();

    let create_index_template_request = CreateIndexTemplateRequest {
        index_template_json,
        overwrite: false,
    };
    metastore
        .create_index_template(create_index_template_request)
        .await
        .unwrap();

    let list_index_templates_request = ListIndexTemplatesRequest {};
    let list_index_templates_response = metastore
        .list_index_templates(list_index_templates_request)
        .await
        .unwrap();
    assert_eq!(list_index_templates_response.index_templates_json.len(), 1);

    let index_template: IndexTemplate =
        serde_utils::from_json_str(&list_index_templates_response.index_templates_json[0]).unwrap();

    assert_eq!(index_template.template_id, template_id);
    assert_eq!(index_template.index_id_patterns, ["test-template"]);
    assert_eq!(
        index_template.index_root_uri.unwrap().as_str(),
        "ram:///indexes"
    );
    assert_eq!(index_template.priority, 100);
    assert_eq!(index_template.description.unwrap(), "Test description.");
    assert_eq!(index_template.doc_mapping.timestamp_field.unwrap(), "ts");
}

pub async fn test_metastore_delete_index_templates<
    MetastoreUnderTest: MetastoreService + MetastoreServiceExt + DefaultForTest,
>() {
    let mut metastore = MetastoreUnderTest::default_for_test().await;
    cleanup_templates(&mut metastore).await;

    let foo_template_id = append_random_suffix("test-template-foo");
    let foo_index_template = IndexTemplate::for_test(&foo_template_id, &["test-index-foo*"], 100);
    let foo_index_template_json = serde_json::to_string(&foo_index_template).unwrap();

    let create_index_template_request = CreateIndexTemplateRequest {
        index_template_json: foo_index_template_json,
        overwrite: false,
    };
    metastore
        .create_index_template(create_index_template_request)
        .await
        .unwrap();

    let bar_template_id = append_random_suffix("test-template-bar");
    let bar_index_template = IndexTemplate::for_test(&bar_template_id, &["test-index-bar*"], 100);
    let bar_index_template_json = serde_json::to_string(&bar_index_template).unwrap();

    let create_index_template_request = CreateIndexTemplateRequest {
        index_template_json: bar_index_template_json,
        overwrite: false,
    };
    metastore
        .create_index_template(create_index_template_request)
        .await
        .unwrap();

    let qux_template_id = append_random_suffix("test-template-qux");
    let qux_index_template = IndexTemplate::for_test(&qux_template_id, &["test-index-qux*"], 100);
    let qux_index_template_json = serde_json::to_string(&qux_index_template).unwrap();

    let create_index_template_request = CreateIndexTemplateRequest {
        index_template_json: qux_index_template_json,
        overwrite: false,
    };
    metastore
        .create_index_template(create_index_template_request)
        .await
        .unwrap();

    let delete_index_templates_request = DeleteIndexTemplatesRequest {
        template_ids: vec![foo_template_id.clone(), bar_template_id.clone()],
    };
    metastore
        .delete_index_templates(delete_index_templates_request.clone())
        .await
        .unwrap();

    // Test idempotency.
    metastore
        .delete_index_templates(delete_index_templates_request.clone())
        .await
        .unwrap();

    let index_templates = list_all_index_templates(&mut metastore).await.unwrap();
    assert_eq!(index_templates.len(), 1);
    assert_eq!(index_templates[0].template_id, qux_template_id);
}


================================================
FILE: quickwit/quickwit-metastore/test-data/.gitignore
================================================
*.modified.json


================================================
FILE: quickwit/quickwit-metastore/test-data/file-backed-index/v0.7.expected.json
================================================
{
  "version": "0.9",
  "index": {
    "version": "0.9",
    "index_uid": "my-index:00000000000000000000000000",
    "index_config": {
      "version": "0.9",
      "index_id": "my-index",
      "index_uri": "s3://quickwit-indexes/my-index",
      "doc_mapping": {
        "doc_mapping_uid": "00000000000000000000000000",
        "mode": "dynamic",
        "dynamic_mapping": {
          "indexed": true,
          "tokenizer": "raw",
          "record": "basic",
          "stored": true,
          "expand_dots": true,
          "fast": {
            "normalizer": "raw"
          }
        },
        "field_mappings": [
          {
            "name": "tenant_id",
            "type": "u64",
            "stored": true,
            "indexed": true,
            "fast": true,
            "coerce": true,
            "output_format": "number"
          },
          {
            "name": "timestamp",
            "type": "datetime",
            "input_formats": [
              "rfc3339",
              "unix_timestamp"
            ],
            "output_format": "rfc3339",
            "fast_precision": "seconds",
            "indexed": true,
            "stored": true,
            "fast": true
          },
          {
            "name": "log_level",
            "type": "text",
            "indexed": true,
            "tokenizer": "raw",
            "record": "basic",
            "fieldnorms": false,
            "stored": true,
            "fast": false
          },
          {
            "name": "message",
            "type": "text",
            "indexed": true,
            "tokenizer": "default",
            "record": "position",
            "fieldnorms": false,
            "stored": true,
            "fast": false
          }
        ],
        "timestamp_field": "timestamp",
        "tag_fields": [
          "log_level",
          "tenant_id"
        ],
        "partition_key": "tenant_id",
        "max_num_partitions": 100,
        "index_field_presence": true,
        "store_document_size": false,
        "store_source": true,
        "tokenizers": [
          {
            "name": "custom_tokenizer",
            "type": "regex",
            "pattern": "[^\\p{L}\\p{N}]+",
            "filters": []
          }
        ]
      },
      "indexing_settings": {
        "commit_timeout_secs": 301,
        "docstore_compression_level": 8,
        "docstore_blocksize": 1000000,
        "split_num_docs_target": 10000001,
        "merge_policy": {
          "type": "stable_log",
          "min_level_num_docs": 100000,
          "merge_factor": 9,
          "max_merge_factor": 11,
          "maturation_period": "2days"
        },
        "resources": {
          "heap_size": 50000000
        }
      },
      "ingest_settings": {
        "min_shards": 1
      },
      "search_settings": {
        "default_search_fields": [
          "message"
        ]
      },
      "retention": {
        "period": "90 days",
        "schedule": "daily"
      }
    },
    "checkpoint": {
      "kafka-source": {
        "00000000000000000000": "00000000000000000042"
      }
    },
    "create_timestamp": 1789,
    "sources": [
      {
        "version": "0.9",
        "source_id": "kafka-source",
        "num_pipelines": 2,
        "enabled": true,
        "source_type": "kafka",
        "params": {
          "topic": "kafka-topic",
          "client_params": {}
        },
        "transform": {
          "script": ".message = downcase(string!(.message))",
          "timezone": "UTC"
        },
        "input_format": "json"
      }
    ]
  },
  "splits": [
    {
      "split_state": "Published",
      "update_timestamp": 1789,
      "publish_timestamp": 1789,
      "version": "0.9",
      "split_id": "split",
      "index_uid": "my-index:00000000000000000000000000",
      "partition_id": 7,
      "source_id": "source",
      "node_id": "node",
      "num_docs": 12303,
      "uncompressed_docs_size_in_bytes": 234234,
      "time_range": {
        "start": 121000,
        "end": 130198
      },
      "create_timestamp": 3,
      "maturity": {
        "type": "immature",
        "maturation_period_millis": 4000
      },
      "tags": [
        "234",
        "aaa"
      ],
      "footer_offsets": {
        "start": 1000,
        "end": 2000
      },
      "delete_opstamp": 10,
      "num_merge_ops": 3,
      "doc_mapping_uid": "00000000000000000000000000"
    }
  ],
  "shards": {
    "_ingest-source": [
      {
        "index_uid": "my-index:00000000000000000000000000",
        "source_id": "_ingest-source",
        "shard_id": "00000000000000000001",
        "leader_id": "leader-ingester",
        "follower_id": "follower-ingester",
        "shard_state": 1,
        "publish_position_inclusive": "",
        "doc_mapping_uid": "00000000000000000000000000",
        "update_timestamp": 1704067200
      }
    ]
  },
  "delete_tasks": [
    {
      "create_timestamp": 0,
      "opstamp": 10,
      "delete_query": {
        "index_uid": "my-index:00000000000000000000000000",
        "query_ast": "{\"type\":\"bool\",\"must\":[{\"type\":\"full_text\",\"field\":\"body\",\"text\":\"Harry\",\"params\":{\"mode\":{\"type\":\"phrase_fallback_to_intersection\"}}},{\"type\":\"full_text\",\"field\":\"body\",\"text\":\"Potter\",\"params\":{\"mode\":{\"type\":\"phrase_fallback_to_intersection\"}}}]}"
      }
    }
  ]
}


================================================
FILE: quickwit/quickwit-metastore/test-data/file-backed-index/v0.7.json
================================================
{
  "delete_tasks": [
    {
      "create_timestamp": 0,
      "delete_query": {
        "index_uid": "my-index:00000000000000000000000000",
        "query_ast": "{\"type\":\"bool\",\"must\":[{\"type\":\"full_text\",\"field\":\"body\",\"text\":\"Harry\",\"params\":{\"mode\":{\"type\":\"phrase_fallback_to_intersection\"}}},{\"type\":\"full_text\",\"field\":\"body\",\"text\":\"Potter\",\"params\":{\"mode\":{\"type\":\"phrase_fallback_to_intersection\"}}}]}"
      },
      "opstamp": 10
    }
  ],
  "index": {
    "checkpoint": {
      "kafka-source": {
        "00000000000000000000": "00000000000000000042"
      }
    },
    "create_timestamp": 1789,
    "index_config": {
      "doc_mapping": {
        "dynamic_mapping": {
          "expand_dots": true,
          "fast": {
            "normalizer": "raw"
          },
          "indexed": true,
          "record": "basic",
          "stored": true,
          "tokenizer": "raw"
        },
        "field_mappings": [
          {
            "coerce": true,
            "fast": true,
            "indexed": true,
            "name": "tenant_id",
            "output_format": "number",
            "stored": true,
            "type": "u64"
          },
          {
            "fast": true,
            "fast_precision": "seconds",
            "indexed": true,
            "input_formats": [
              "rfc3339",
              "unix_timestamp"
            ],
            "name": "timestamp",
            "output_format": "rfc3339",
            "stored": true,
            "type": "datetime"
          },
          {
            "fast": false,
            "fieldnorms": false,
            "indexed": true,
            "name": "log_level",
            "record": "basic",
            "stored": true,
            "tokenizer": "raw",
            "type": "text"
          },
          {
            "fast": false,
            "fieldnorms": false,
            "indexed": true,
            "name": "message",
            "record": "position",
            "stored": true,
            "tokenizer": "default",
            "type": "text"
          }
        ],
        "index_field_presence": true,
        "max_num_partitions": 100,
        "mode": "dynamic",
        "partition_key": "tenant_id",
        "store_source": true,
        "tag_fields": [
          "log_level",
          "tenant_id"
        ],
        "timestamp_field": "timestamp",
        "tokenizers": [
          {
            "filters": [],
            "name": "custom_tokenizer",
            "pattern": "[^\\p{L}\\p{N}]+",
            "type": "regex"
          }
        ]
      },
      "index_id": "my-index",
      "index_uri": "s3://quickwit-indexes/my-index",
      "indexing_settings": {
        "commit_timeout_secs": 301,
        "docstore_blocksize": 1000000,
        "docstore_compression_level": 8,
        "merge_policy": {
          "maturation_period": "2days",
          "max_merge_factor": 11,
          "merge_factor": 9,
          "min_level_num_docs": 100000,
          "type": "stable_log"
        },
        "resources": {
          "heap_size": "50.0 MB"
        },
        "split_num_docs_target": 10000001
      },
      "retention": {
        "period": "90 days",
        "schedule": "daily"
      },
      "search_settings": {
        "default_search_fields": [
          "message"
        ]
      },
      "version": "0.7"
    },
    "index_uid": "my-index:00000000000000000000000000",
    "sources": [
      {
        "desired_num_pipelines": 2,
        "enabled": true,
        "input_format": "json",
        "max_num_pipelines_per_indexer": 2,
        "params": {
          "client_params": {},
          "topic": "kafka-topic"
        },
        "source_id": "kafka-source",
        "source_type": "kafka",
        "transform": {
          "script": ".message = downcase(string!(.message))",
          "timezone": "UTC"
        },
        "version": "0.7"
      }
    ],
    "version": "0.7"
  },
  "shards": {
    "_ingest-source": [
      {
        "index_uid": "my-index:00000000000000000000000000",
        "shard_id": "00000000000000000001",
        "source_id": "_ingest-source",
        "shard_state": 1,
        "leader_id": "leader-ingester",
        "follower_id": "follower-ingester",
        "publish_position_inclusive": ""
      }
    ]
  },
  "splits": [
    {
      "create_timestamp": 3,
      "delete_opstamp": 10,
      "footer_offsets": {
        "end": 2000,
        "start": 1000
      },
      "index_uid": "my-index:00000000000000000000000000",
      "maturity": {
        "maturation_period_millis": 4000,
        "type": "immature"
      },
      "node_id": "node",
      "num_docs": 12303,
      "num_merge_ops": 3,
      "partition_id": 7,
      "publish_timestamp": 1789,
      "source_id": "source",
      "split_id": "split",
      "split_state": "Published",
      "tags": [
        "234",
        "aaa"
      ],
      "time_range": {
        "end": 130198,
        "start": 121000
      },
      "uncompressed_docs_size_in_bytes": 234234,
      "update_timestamp": 1789,
      "version": "0.7"
    }
  ],
  "version": "0.7"
}


================================================
FILE: quickwit/quickwit-metastore/test-data/file-backed-index/v0.8.expected.json
================================================
{
  "version": "0.9",
  "index": {
    "version": "0.9",
    "index_uid": "my-index:00000000000000000000000000",
    "index_config": {
      "version": "0.9",
      "index_id": "my-index",
      "index_uri": "s3://quickwit-indexes/my-index",
      "doc_mapping": {
        "doc_mapping_uid": "00000000000000000000000000",
        "mode": "dynamic",
        "dynamic_mapping": {
          "indexed": true,
          "tokenizer": "raw",
          "record": "basic",
          "stored": true,
          "expand_dots": true,
          "fast": {
            "normalizer": "raw"
          }
        },
        "field_mappings": [
          {
            "name": "tenant_id",
            "type": "u64",
            "stored": true,
            "indexed": true,
            "fast": true,
            "coerce": true,
            "output_format": "number"
          },
          {
            "name": "timestamp",
            "type": "datetime",
            "input_formats": [
              "rfc3339",
              "unix_timestamp"
            ],
            "output_format": "rfc3339",
            "fast_precision": "seconds",
            "indexed": true,
            "stored": true,
            "fast": true
          },
          {
            "name": "log_level",
            "type": "text",
            "indexed": true,
            "tokenizer": "raw",
            "record": "basic",
            "fieldnorms": false,
            "stored": true,
            "fast": false
          },
          {
            "name": "message",
            "type": "text",
            "indexed": true,
            "tokenizer": "default",
            "record": "position",
            "fieldnorms": false,
            "stored": true,
            "fast": false
          }
        ],
        "timestamp_field": "timestamp",
        "tag_fields": [
          "log_level",
          "tenant_id"
        ],
        "partition_key": "tenant_id",
        "max_num_partitions": 100,
        "index_field_presence": true,
        "store_document_size": false,
        "store_source": true,
        "tokenizers": [
          {
            "name": "custom_tokenizer",
            "type": "regex",
            "pattern": "[^\\p{L}\\p{N}]+",
            "filters": []
          }
        ]
      },
      "indexing_settings": {
        "commit_timeout_secs": 301,
        "docstore_compression_level": 8,
        "docstore_blocksize": 1000000,
        "split_num_docs_target": 10000001,
        "merge_policy": {
          "type": "stable_log",
          "min_level_num_docs": 100000,
          "merge_factor": 9,
          "max_merge_factor": 11,
          "maturation_period": "2days"
        },
        "resources": {
          "heap_size": 50000000
        }
      },
      "ingest_settings": {
        "min_shards": 1
      },
      "search_settings": {
        "default_search_fields": [
          "message"
        ]
      },
      "retention": {
        "period": "90 days",
        "schedule": "daily"
      }
    },
    "checkpoint": {
      "kafka-source": {
        "00000000000000000000": "00000000000000000042"
      }
    },
    "create_timestamp": 1789,
    "sources": [
      {
        "version": "0.9",
        "source_id": "kafka-source",
        "num_pipelines": 2,
        "enabled": true,
        "source_type": "kafka",
        "params": {
          "topic": "kafka-topic",
          "client_params": {}
        },
        "transform": {
          "script": ".message = downcase(string!(.message))",
          "timezone": "UTC"
        },
        "input_format": "json"
      }
    ]
  },
  "splits": [
    {
      "split_state": "Published",
      "update_timestamp": 1789,
      "publish_timestamp": 1789,
      "version": "0.9",
      "split_id": "split",
      "index_uid": "my-index:00000000000000000000000000",
      "partition_id": 7,
      "source_id": "source",
      "node_id": "node",
      "num_docs": 12303,
      "uncompressed_docs_size_in_bytes": 234234,
      "time_range": {
        "start": 121000,
        "end": 130198
      },
      "create_timestamp": 3,
      "maturity": {
        "type": "immature",
        "maturation_period_millis": 4000
      },
      "tags": [
        "234",
        "aaa"
      ],
      "footer_offsets": {
        "start": 1000,
        "end": 2000
      },
      "delete_opstamp": 10,
      "num_merge_ops": 3,
      "doc_mapping_uid": "00000000000000000000000000"
    }
  ],
  "shards": {
    "_ingest-source": [
      {
        "index_uid": "my-index:00000000000000000000000000",
        "source_id": "_ingest-source",
        "shard_id": "00000000000000000001",
        "leader_id": "leader-ingester",
        "follower_id": "follower-ingester",
        "shard_state": 1,
        "publish_position_inclusive": "",
        "doc_mapping_uid": "00000000000000000000000000",
        "update_timestamp": 1704067200
      }
    ]
  },
  "delete_tasks": [
    {
      "create_timestamp": 0,
      "opstamp": 10,
      "delete_query": {
        "index_uid": "my-index:00000000000000000000000000",
        "query_ast": "{\"type\":\"bool\",\"must\":[{\"type\":\"full_text\",\"field\":\"body\",\"text\":\"Harry\",\"params\":{\"mode\":{\"type\":\"phrase_fallback_to_intersection\"}}},{\"type\":\"full_text\",\"field\":\"body\",\"text\":\"Potter\",\"params\":{\"mode\":{\"type\":\"phrase_fallback_to_intersection\"}}}]}"
      }
    }
  ]
}


================================================
FILE: quickwit/quickwit-metastore/test-data/file-backed-index/v0.8.json
================================================
{
  "delete_tasks": [
    {
      "create_timestamp": 0,
      "delete_query": {
        "index_uid": "my-index:00000000000000000000000000",
        "query_ast": "{\"type\":\"bool\",\"must\":[{\"type\":\"full_text\",\"field\":\"body\",\"text\":\"Harry\",\"params\":{\"mode\":{\"type\":\"phrase_fallback_to_intersection\"}}},{\"type\":\"full_text\",\"field\":\"body\",\"text\":\"Potter\",\"params\":{\"mode\":{\"type\":\"phrase_fallback_to_intersection\"}}}]}"
      },
      "opstamp": 10
    }
  ],
  "index": {
    "checkpoint": {
      "kafka-source": {
        "00000000000000000000": "00000000000000000042"
      }
    },
    "create_timestamp": 1789,
    "index_config": {
      "doc_mapping": {
        "dynamic_mapping": {
          "expand_dots": true,
          "fast": {
            "normalizer": "raw"
          },
          "indexed": true,
          "record": "basic",
          "stored": true,
          "tokenizer": "raw"
        },
        "field_mappings": [
          {
            "coerce": true,
            "fast": true,
            "indexed": true,
            "name": "tenant_id",
            "output_format": "number",
            "stored": true,
            "type": "u64"
          },
          {
            "fast": true,
            "fast_precision": "seconds",
            "indexed": true,
            "input_formats": [
              "rfc3339",
              "unix_timestamp"
            ],
            "name": "timestamp",
            "output_format": "rfc3339",
            "stored": true,
            "type": "datetime"
          },
          {
            "fast": false,
            "fieldnorms": false,
            "indexed": true,
            "name": "log_level",
            "record": "basic",
            "stored": true,
            "tokenizer": "raw",
            "type": "text"
          },
          {
            "fast": false,
            "fieldnorms": false,
            "indexed": true,
            "name": "message",
            "record": "position",
            "stored": true,
            "tokenizer": "default",
            "type": "text"
          }
        ],
        "index_field_presence": true,
        "max_num_partitions": 100,
        "mode": "dynamic",
        "partition_key": "tenant_id",
        "store_document_size": false,
        "store_source": true,
        "tag_fields": [
          "log_level",
          "tenant_id"
        ],
        "timestamp_field": "timestamp",
        "tokenizers": [
          {
            "filters": [],
            "name": "custom_tokenizer",
            "pattern": "[^\\p{L}\\p{N}]+",
            "type": "regex"
          }
        ]
      },
      "index_id": "my-index",
      "index_uri": "s3://quickwit-indexes/my-index",
      "indexing_settings": {
        "commit_timeout_secs": 301,
        "docstore_blocksize": 1000000,
        "docstore_compression_level": 8,
        "merge_policy": {
          "maturation_period": "2days",
          "max_merge_factor": 11,
          "merge_factor": 9,
          "min_level_num_docs": 100000,
          "type": "stable_log"
        },
        "resources": {
          "heap_size": "50.0 MB"
        },
        "split_num_docs_target": 10000001
      },
      "retention": {
        "period": "90 days",
        "schedule": "daily"
      },
      "search_settings": {
        "default_search_fields": [
          "message"
        ]
      },
      "version": "0.8"
    },
    "index_uid": "my-index:00000000000000000000000000",
    "sources": [
      {
        "enabled": true,
        "input_format": "json",
        "num_pipelines": 2,
        "params": {
          "client_params": {},
          "topic": "kafka-topic"
        },
        "source_id": "kafka-source",
        "source_type": "kafka",
        "transform": {
          "script": ".message = downcase(string!(.message))",
          "timezone": "UTC"
        },
        "version": "0.8"
      }
    ],
    "version": "0.8"
  },
  "shards": {
    "_ingest-source": [
      {
        "index_uid": "my-index:00000000000000000000000000",
        "shard_id": "00000000000000000001",
        "source_id": "_ingest-source",
        "shard_state": 1,
        "leader_id": "leader-ingester",
        "follower_id": "follower-ingester",
        "publish_position_inclusive": ""
      }
    ]
  },
  "splits": [
    {
      "create_timestamp": 3,
      "delete_opstamp": 10,
      "footer_offsets": {
        "end": 2000,
        "start": 1000
      },
      "index_uid": "my-index:00000000000000000000000000",
      "maturity": {
        "maturation_period_millis": 4000,
        "type": "immature"
      },
      "node_id": "node",
      "num_docs": 12303,
      "num_merge_ops": 3,
      "partition_id": 7,
      "publish_timestamp": 1789,
      "source_id": "source",
      "split_id": "split",
      "split_state": "Published",
      "tags": [
        "234",
        "aaa"
      ],
      "time_range": {
        "end": 130198,
        "start": 121000
      },
      "uncompressed_docs_size_in_bytes": 234234,
      "update_timestamp": 1789,
      "version": "0.8"
    }
  ],
  "version": "0.8"
}


================================================
FILE: quickwit/quickwit-metastore/test-data/file-backed-index/v0.9.expected.json
================================================
{
  "version": "0.9",
  "index": {
    "version": "0.9",
    "index_uid": "my-index:00000000000000000000000001",
    "index_config": {
      "version": "0.9",
      "index_id": "my-index",
      "index_uri": "s3://quickwit-indexes/my-index",
      "doc_mapping": {
        "doc_mapping_uid": "00000000000000000000000001",
        "mode": "dynamic",
        "dynamic_mapping": {
          "indexed": true,
          "tokenizer": "raw",
          "record": "basic",
          "stored": true,
          "expand_dots": true,
          "fast": {
            "normalizer": "raw"
          }
        },
        "field_mappings": [
          {
            "name": "tenant_id",
            "type": "u64",
            "stored": true,
            "indexed": true,
            "fast": true,
            "coerce": true,
            "output_format": "number"
          },
          {
            "name": "timestamp",
            "type": "datetime",
            "input_formats": [
              "rfc3339",
              "unix_timestamp"
            ],
            "output_format": "rfc3339",
            "fast_precision": "seconds",
            "indexed": true,
            "stored": true,
            "fast": true
          },
          {
            "name": "log_level",
            "type": "text",
            "indexed": true,
            "tokenizer": "raw",
            "record": "basic",
            "fieldnorms": false,
            "stored": true,
            "fast": false
          },
          {
            "name": "message",
            "type": "text",
            "indexed": true,
            "tokenizer": "default",
            "record": "position",
            "fieldnorms": false,
            "stored": true,
            "fast": false
          }
        ],
        "timestamp_field": "timestamp",
        "tag_fields": [
          "log_level",
          "tenant_id"
        ],
        "partition_key": "tenant_id",
        "max_num_partitions": 100,
        "index_field_presence": true,
        "store_document_size": false,
        "store_source": true,
        "tokenizers": [
          {
            "name": "custom_tokenizer",
            "type": "regex",
            "pattern": "[^\\p{L}\\p{N}]+",
            "filters": []
          }
        ]
      },
      "indexing_settings": {
        "commit_timeout_secs": 301,
        "docstore_compression_level": 8,
        "docstore_blocksize": 1000000,
        "split_num_docs_target": 10000001,
        "merge_policy": {
          "type": "stable_log",
          "min_level_num_docs": 100000,
          "merge_factor": 9,
          "max_merge_factor": 11,
          "maturation_period": "2days"
        },
        "resources": {
          "heap_size": 50000000
        }
      },
      "ingest_settings": {
        "min_shards": 12
      },
      "search_settings": {
        "default_search_fields": [
          "message"
        ]
      },
      "retention": {
        "period": "90 days",
        "schedule": "daily"
      }
    },
    "checkpoint": {
      "kafka-source": {
        "00000000000000000000": "00000000000000000042"
      }
    },
    "create_timestamp": 1789,
    "sources": [
      {
        "version": "0.9",
        "source_id": "kafka-source",
        "num_pipelines": 2,
        "enabled": true,
        "source_type": "kafka",
        "params": {
          "topic": "kafka-topic",
          "client_params": {}
        },
        "transform": {
          "script": ".message = downcase(string!(.message))",
          "timezone": "UTC"
        },
        "input_format": "json"
      }
    ]
  },
  "splits": [
    {
      "split_state": "Published",
      "update_timestamp": 1789,
      "publish_timestamp": 1789,
      "version": "0.9",
      "split_id": "split",
      "index_uid": "my-index:00000000000000000000000001",
      "partition_id": 7,
      "source_id": "source",
      "node_id": "node",
      "num_docs": 12303,
      "uncompressed_docs_size_in_bytes": 234234,
      "time_range": {
        "start": 121000,
        "end": 130198
      },
      "create_timestamp": 3,
      "maturity": {
        "type": "immature",
        "maturation_period_millis": 4000
      },
      "tags": [
        "234",
        "aaa"
      ],
      "footer_offsets": {
        "start": 1000,
        "end": 2000
      },
      "delete_opstamp": 10,
      "num_merge_ops": 3,
      "doc_mapping_uid": "00000000000000000000000000"
    }
  ],
  "shards": {
    "_ingest-source": [
      {
        "index_uid": "my-index:00000000000000000000000001",
        "source_id": "_ingest-source",
        "shard_id": "00000000000000000001",
        "leader_id": "leader-ingester",
        "follower_id": "follower-ingester",
        "shard_state": 1,
        "publish_position_inclusive": "",
        "doc_mapping_uid": "00000000000000000000000001",
        "update_timestamp": 1724240908
      }
    ]
  },
  "delete_tasks": [
    {
      "create_timestamp": 0,
      "opstamp": 10,
      "delete_query": {
        "index_uid": "my-index:00000000000000000000000001",
        "query_ast": "{\"type\":\"bool\",\"must\":[{\"type\":\"full_text\",\"field\":\"body\",\"text\":\"Harry\",\"params\":{\"mode\":{\"type\":\"phrase_fallback_to_intersection\"}},\"lenient\":false},{\"type\":\"full_text\",\"field\":\"body\",\"text\":\"Potter\",\"params\":{\"mode\":{\"type\":\"phrase_fallback_to_intersection\"}},\"lenient\":false}]}"
      }
    }
  ]
}


================================================
FILE: quickwit/quickwit-metastore/test-data/file-backed-index/v0.9.json
================================================
{
  "version": "0.9",
  "index": {
    "version": "0.9",
    "index_uid": "my-index:00000000000000000000000001",
    "index_config": {
      "version": "0.9",
      "index_id": "my-index",
      "index_uri": "s3://quickwit-indexes/my-index",
      "doc_mapping": {
        "doc_mapping_uid": "00000000000000000000000001",
        "mode": "dynamic",
        "dynamic_mapping": {
          "indexed": true,
          "tokenizer": "raw",
          "record": "basic",
          "stored": true,
          "expand_dots": true,
          "fast": {
            "normalizer": "raw"
          }
        },
        "field_mappings": [
          {
            "name": "tenant_id",
            "type": "u64",
            "stored": true,
            "indexed": true,
            "fast": true,
            "coerce": true,
            "output_format": "number"
          },
          {
            "name": "timestamp",
            "type": "datetime",
            "input_formats": [
              "rfc3339",
              "unix_timestamp"
            ],
            "output_format": "rfc3339",
            "fast_precision": "seconds",
            "indexed": true,
            "stored": true,
            "fast": true
          },
          {
            "name": "log_level",
            "type": "text",
            "indexed": true,
            "tokenizer": "raw",
            "record": "basic",
            "fieldnorms": false,
            "stored": true,
            "fast": false
          },
          {
            "name": "message",
            "type": "text",
            "indexed": true,
            "tokenizer": "default",
            "record": "position",
            "fieldnorms": false,
            "stored": true,
            "fast": false
          }
        ],
        "timestamp_field": "timestamp",
        "tag_fields": [
          "log_level",
          "tenant_id"
        ],
        "partition_key": "tenant_id",
        "max_num_partitions": 100,
        "index_field_presence": true,
        "store_document_size": false,
        "store_source": true,
        "tokenizers": [
          {
            "name": "custom_tokenizer",
            "type": "regex",
            "pattern": "[^\\p{L}\\p{N}]+",
            "filters": []
          }
        ]
      },
      "indexing_settings": {
        "commit_timeout_secs": 301,
        "docstore_compression_level": 8,
        "docstore_blocksize": 1000000,
        "split_num_docs_target": 10000001,
        "merge_policy": {
          "type": "stable_log",
          "min_level_num_docs": 100000,
          "merge_factor": 9,
          "max_merge_factor": 11,
          "maturation_period": "2days"
        },
        "resources": {
          "heap_size": 50000000
        }
      },
      "ingest_settings": {
        "min_shards": 12
      },
      "search_settings": {
        "default_search_fields": [
          "message"
        ]
      },
      "retention": {
        "period": "90 days",
        "schedule": "daily"
      }
    },
    "checkpoint": {
      "kafka-source": {
        "00000000000000000000": "00000000000000000042"
      }
    },
    "create_timestamp": 1789,
    "sources": [
      {
        "version": "0.9",
        "source_id": "kafka-source",
        "num_pipelines": 2,
        "enabled": true,
        "source_type": "kafka",
        "params": {
          "topic": "kafka-topic",
          "client_params": {}
        },
        "transform": {
          "script": ".message = downcase(string!(.message))",
          "timezone": "UTC"
        },
        "input_format": "json"
      }
    ]
  },
  "splits": [
    {
      "split_state": "Published",
      "update_timestamp": 1789,
      "publish_timestamp": 1789,
      "version": "0.9",
      "split_id": "split",
      "index_uid": "my-index:00000000000000000000000001",
      "partition_id": 7,
      "source_id": "source",
      "node_id": "node",
      "num_docs": 12303,
      "uncompressed_docs_size_in_bytes": 234234,
      "time_range": {
        "start": 121000,
        "end": 130198
      },
      "create_timestamp": 3,
      "maturity": {
        "type": "immature",
        "maturation_period_millis": 4000
      },
      "tags": [
        "234",
        "aaa"
      ],
      "footer_offsets": {
        "start": 1000,
        "end": 2000
      },
      "delete_opstamp": 10,
      "num_merge_ops": 3,
      "doc_mapping_uid": "00000000000000000000000000"
    }
  ],
  "shards": {
    "_ingest-source": [
      {
        "index_uid": "my-index:00000000000000000000000001",
        "source_id": "_ingest-source",
        "shard_id": "00000000000000000001",
        "leader_id": "leader-ingester",
        "follower_id": "follower-ingester",
        "shard_state": 1,
        "publish_position_inclusive": "",
        "doc_mapping_uid": "00000000000000000000000001",
        "update_timestamp": 1724240908
      }
    ]
  },
  "delete_tasks": [
    {
      "create_timestamp": 0,
      "opstamp": 10,
      "delete_query": {
        "index_uid": "my-index:00000000000000000000000001",
        "query_ast": "{\"type\":\"bool\",\"must\":[{\"type\":\"full_text\",\"field\":\"body\",\"text\":\"Harry\",\"params\":{\"mode\":{\"type\":\"phrase_fallback_to_intersection\"}},\"lenient\":false},{\"type\":\"full_text\",\"field\":\"body\",\"text\":\"Potter\",\"params\":{\"mode\":{\"type\":\"phrase_fallback_to_intersection\"}},\"lenient\":false}]}"
      }
    }
  ]
}


================================================
FILE: quickwit/quickwit-metastore/test-data/index-metadata/v0.7.expected.json
================================================
{
  "checkpoint": {
    "kafka-source": {
      "00000000000000000000": "00000000000000000042"
    }
  },
  "create_timestamp": 1789,
  "index_config": {
    "doc_mapping": {
      "doc_mapping_uid": "00000000000000000000000000",
      "dynamic_mapping": {
        "expand_dots": true,
        "fast": {
          "normalizer": "raw"
        },
        "indexed": true,
        "record": "basic",
        "stored": true,
        "tokenizer": "raw"
      },
      "field_mappings": [
        {
          "coerce": true,
          "fast": true,
          "indexed": true,
          "name": "tenant_id",
          "output_format": "number",
          "stored": true,
          "type": "u64"
        },
        {
          "fast": true,
          "fast_precision": "seconds",
          "indexed": true,
          "input_formats": [
            "rfc3339",
            "unix_timestamp"
          ],
          "name": "timestamp",
          "output_format": "rfc3339",
          "stored": true,
          "type": "datetime"
        },
        {
          "fast": false,
          "fieldnorms": false,
          "indexed": true,
          "name": "log_level",
          "record": "basic",
          "stored": true,
          "tokenizer": "raw",
          "type": "text"
        },
        {
          "fast": false,
          "fieldnorms": false,
          "indexed": true,
          "name": "message",
          "record": "position",
          "stored": true,
          "tokenizer": "default",
          "type": "text"
        }
      ],
      "index_field_presence": true,
      "max_num_partitions": 100,
      "mode": "dynamic",
      "partition_key": "tenant_id",
      "store_document_size": false,
      "store_source": true,
      "tag_fields": [
        "log_level",
        "tenant_id"
      ],
      "timestamp_field": "timestamp",
      "tokenizers": [
        {
          "filters": [],
          "name": "custom_tokenizer",
          "pattern": "[^\\p{L}\\p{N}]+",
          "type": "regex"
        }
      ]
    },
    "index_id": "my-index",
    "index_uri": "s3://quickwit-indexes/my-index",
    "indexing_settings": {
      "commit_timeout_secs": 301,
      "docstore_blocksize": 1000000,
      "docstore_compression_level": 8,
      "merge_policy": {
        "maturation_period": "2days",
        "max_merge_factor": 11,
        "merge_factor": 9,
        "min_level_num_docs": 100000,
        "type": "stable_log"
      },
      "resources": {
        "heap_size": 50000000
      },
      "split_num_docs_target": 10000001
    },
    "ingest_settings": {
      "min_shards": 1
    },
    "retention": {
      "period": "90 days",
      "schedule": "daily"
    },
    "search_settings": {
      "default_search_fields": [
        "message"
      ]
    },
    "version": "0.9"
  },
  "index_uid": "my-index:00000000000000000000000000",
  "sources": [
    {
      "enabled": true,
      "input_format": "json",
      "num_pipelines": 2,
      "params": {
        "client_params": {},
        "topic": "kafka-topic"
      },
      "source_id": "kafka-source",
      "source_type": "kafka",
      "transform": {
        "script": ".message = downcase(string!(.message))",
        "timezone": "UTC"
      },
      "version": "0.9"
    }
  ],
  "version": "0.9"
}


================================================
FILE: quickwit/quickwit-metastore/test-data/index-metadata/v0.7.json
================================================
{
  "checkpoint": {
    "kafka-source": {
      "00000000000000000000": "00000000000000000042"
    }
  },
  "create_timestamp": 1789,
  "index_config": {
    "doc_mapping": {
      "dynamic_mapping": {
        "expand_dots": true,
        "fast": {
          "normalizer": "raw"
        },
        "indexed": true,
        "record": "basic",
        "stored": true,
        "tokenizer": "raw"
      },
      "field_mappings": [
        {
          "coerce": true,
          "fast": true,
          "indexed": true,
          "name": "tenant_id",
          "output_format": "number",
          "stored": true,
          "type": "u64"
        },
        {
          "fast": true,
          "fast_precision": "seconds",
          "indexed": true,
          "input_formats": [
            "rfc3339",
            "unix_timestamp"
          ],
          "name": "timestamp",
          "output_format": "rfc3339",
          "stored": true,
          "type": "datetime"
        },
        {
          "fast": false,
          "fieldnorms": false,
          "indexed": true,
          "name": "log_level",
          "record": "basic",
          "stored": true,
          "tokenizer": "raw",
          "type": "text"
        },
        {
          "fast": false,
          "fieldnorms": false,
          "indexed": true,
          "name": "message",
          "record": "position",
          "stored": true,
          "tokenizer": "default",
          "type": "text"
        }
      ],
      "index_field_presence": true,
      "max_num_partitions": 100,
      "mode": "dynamic",
      "partition_key": "tenant_id",
      "store_source": true,
      "tag_fields": [
        "log_level",
        "tenant_id"
      ],
      "timestamp_field": "timestamp",
      "tokenizers": [
        {
          "filters": [],
          "name": "custom_tokenizer",
          "pattern": "[^\\p{L}\\p{N}]+",
          "type": "regex"
        }
      ]
    },
    "index_id": "my-index",
    "index_uri": "s3://quickwit-indexes/my-index",
    "indexing_settings": {
      "commit_timeout_secs": 301,
      "docstore_blocksize": 1000000,
      "docstore_compression_level": 8,
      "merge_policy": {
        "maturation_period": "2days",
        "max_merge_factor": 11,
        "merge_factor": 9,
        "min_level_num_docs": 100000,
        "type": "stable_log"
      },
      "resources": {
        "heap_size": "50.0 MB"
      },
      "split_num_docs_target": 10000001
    },
    "retention": {
      "period": "90 days",
      "schedule": "daily"
    },
    "search_settings": {
      "default_search_fields": [
        "message"
      ]
    },
    "version": "0.7"
  },
  "index_uid": "my-index:00000000000000000000000000",
  "sources": [
    {
      "desired_num_pipelines": 2,
      "enabled": true,
      "input_format": "json",
      "max_num_pipelines_per_indexer": 2,
      "params": {
        "client_params": {},
        "topic": "kafka-topic"
      },
      "source_id": "kafka-source",
      "source_type": "kafka",
      "transform": {
        "script": ".message = downcase(string!(.message))",
        "timezone": "UTC"
      },
      "version": "0.7"
    }
  ],
  "version": "0.7"
}


================================================
FILE: quickwit/quickwit-metastore/test-data/index-metadata/v0.8.expected.json
================================================
{
  "checkpoint": {
    "kafka-source": {
      "00000000000000000000": "00000000000000000042"
    }
  },
  "create_timestamp": 1789,
  "index_config": {
    "doc_mapping": {
      "doc_mapping_uid": "00000000000000000000000000",
      "dynamic_mapping": {
        "expand_dots": true,
        "fast": {
          "normalizer": "raw"
        },
        "indexed": true,
        "record": "basic",
        "stored": true,
        "tokenizer": "raw"
      },
      "field_mappings": [
        {
          "coerce": true,
          "fast": true,
          "indexed": true,
          "name": "tenant_id",
          "output_format": "number",
          "stored": true,
          "type": "u64"
        },
        {
          "fast": true,
          "fast_precision": "seconds",
          "indexed": true,
          "input_formats": [
            "rfc3339",
            "unix_timestamp"
          ],
          "name": "timestamp",
          "output_format": "rfc3339",
          "stored": true,
          "type": "datetime"
        },
        {
          "fast": false,
          "fieldnorms": false,
          "indexed": true,
          "name": "log_level",
          "record": "basic",
          "stored": true,
          "tokenizer": "raw",
          "type": "text"
        },
        {
          "fast": false,
          "fieldnorms": false,
          "indexed": true,
          "name": "message",
          "record": "position",
          "stored": true,
          "tokenizer": "default",
          "type": "text"
        }
      ],
      "index_field_presence": true,
      "max_num_partitions": 100,
      "mode": "dynamic",
      "partition_key": "tenant_id",
      "store_document_size": false,
      "store_source": true,
      "tag_fields": [
        "log_level",
        "tenant_id"
      ],
      "timestamp_field": "timestamp",
      "tokenizers": [
        {
          "filters": [],
          "name": "custom_tokenizer",
          "pattern": "[^\\p{L}\\p{N}]+",
          "type": "regex"
        }
      ]
    },
    "index_id": "my-index",
    "index_uri": "s3://quickwit-indexes/my-index",
    "indexing_settings": {
      "commit_timeout_secs": 301,
      "docstore_blocksize": 1000000,
      "docstore_compression_level": 8,
      "merge_policy": {
        "maturation_period": "2days",
        "max_merge_factor": 11,
        "merge_factor": 9,
        "min_level_num_docs": 100000,
        "type": "stable_log"
      },
      "resources": {
        "heap_size": 50000000
      },
      "split_num_docs_target": 10000001
    },
    "ingest_settings": {
      "min_shards": 1
    },
    "retention": {
      "period": "90 days",
      "schedule": "daily"
    },
    "search_settings": {
      "default_search_fields": [
        "message"
      ]
    },
    "version": "0.9"
  },
  "index_uid": "my-index:00000000000000000000000000",
  "sources": [
    {
      "enabled": true,
      "input_format": "json",
      "num_pipelines": 2,
      "params": {
        "client_params": {},
        "topic": "kafka-topic"
      },
      "source_id": "kafka-source",
      "source_type": "kafka",
      "transform": {
        "script": ".message = downcase(string!(.message))",
        "timezone": "UTC"
      },
      "version": "0.9"
    }
  ],
  "version": "0.9"
}


================================================
FILE: quickwit/quickwit-metastore/test-data/index-metadata/v0.8.json
================================================
{
  "checkpoint": {
    "kafka-source": {
      "00000000000000000000": "00000000000000000042"
    }
  },
  "create_timestamp": 1789,
  "index_config": {
    "doc_mapping": {
      "dynamic_mapping": {
        "expand_dots": true,
        "fast": {
          "normalizer": "raw"
        },
        "indexed": true,
        "record": "basic",
        "stored": true,
        "tokenizer": "raw"
      },
      "field_mappings": [
        {
          "coerce": true,
          "fast": true,
          "indexed": true,
          "name": "tenant_id",
          "output_format": "number",
          "stored": true,
          "type": "u64"
        },
        {
          "fast": true,
          "fast_precision": "seconds",
          "indexed": true,
          "input_formats": [
            "rfc3339",
            "unix_timestamp"
          ],
          "name": "timestamp",
          "output_format": "rfc3339",
          "stored": true,
          "type": "datetime"
        },
        {
          "fast": false,
          "fieldnorms": false,
          "indexed": true,
          "name": "log_level",
          "record": "basic",
          "stored": true,
          "tokenizer": "raw",
          "type": "text"
        },
        {
          "fast": false,
          "fieldnorms": false,
          "indexed": true,
          "name": "message",
          "record": "position",
          "stored": true,
          "tokenizer": "default",
          "type": "text"
        }
      ],
      "index_field_presence": true,
      "max_num_partitions": 100,
      "mode": "dynamic",
      "partition_key": "tenant_id",
      "store_document_size": false,
      "store_source": true,
      "tag_fields": [
        "log_level",
        "tenant_id"
      ],
      "timestamp_field": "timestamp",
      "tokenizers": [
        {
          "filters": [],
          "name": "custom_tokenizer",
          "pattern": "[^\\p{L}\\p{N}]+",
          "type": "regex"
        }
      ]
    },
    "index_id": "my-index",
    "index_uri": "s3://quickwit-indexes/my-index",
    "indexing_settings": {
      "commit_timeout_secs": 301,
      "docstore_blocksize": 1000000,
      "docstore_compression_level": 8,
      "merge_policy": {
        "maturation_period": "2days",
        "max_merge_factor": 11,
        "merge_factor": 9,
        "min_level_num_docs": 100000,
        "type": "stable_log"
      },
      "resources": {
        "heap_size": "50.0 MB"
      },
      "split_num_docs_target": 10000001
    },
    "retention": {
      "period": "90 days",
      "schedule": "daily"
    },
    "search_settings": {
      "default_search_fields": [
        "message"
      ]
    },
    "version": "0.8"
  },
  "index_uid": "my-index:00000000000000000000000000",
  "sources": [
    {
      "enabled": true,
      "input_format": "json",
      "num_pipelines": 2,
      "params": {
        "client_params": {},
        "topic": "kafka-topic"
      },
      "source_id": "kafka-source",
      "source_type": "kafka",
      "transform": {
        "script": ".message = downcase(string!(.message))",
        "timezone": "UTC"
      },
      "version": "0.8"
    }
  ],
  "version": "0.8"
}


================================================
FILE: quickwit/quickwit-metastore/test-data/index-metadata/v0.9.expected.json
================================================
{
  "checkpoint": {
    "kafka-source": {
      "00000000000000000000": "00000000000000000042"
    }
  },
  "create_timestamp": 1789,
  "index_config": {
    "doc_mapping": {
      "doc_mapping_uid": "00000000000000000000000001",
      "dynamic_mapping": {
        "expand_dots": true,
        "fast": {
          "normalizer": "raw"
        },
        "indexed": true,
        "record": "basic",
        "stored": true,
        "tokenizer": "raw"
      },
      "field_mappings": [
        {
          "coerce": true,
          "fast": true,
          "indexed": true,
          "name": "tenant_id",
          "output_format": "number",
          "stored": true,
          "type": "u64"
        },
        {
          "fast": true,
          "fast_precision": "seconds",
          "indexed": true,
          "input_formats": [
            "rfc3339",
            "unix_timestamp"
          ],
          "name": "timestamp",
          "output_format": "rfc3339",
          "stored": true,
          "type": "datetime"
        },
        {
          "fast": false,
          "fieldnorms": false,
          "indexed": true,
          "name": "log_level",
          "record": "basic",
          "stored": true,
          "tokenizer": "raw",
          "type": "text"
        },
        {
          "fast": false,
          "fieldnorms": false,
          "indexed": true,
          "name": "message",
          "record": "position",
          "stored": true,
          "tokenizer": "default",
          "type": "text"
        }
      ],
      "index_field_presence": true,
      "max_num_partitions": 100,
      "mode": "dynamic",
      "partition_key": "tenant_id",
      "store_document_size": false,
      "store_source": true,
      "tag_fields": [
        "log_level",
        "tenant_id"
      ],
      "timestamp_field": "timestamp",
      "tokenizers": [
        {
          "filters": [],
          "name": "custom_tokenizer",
          "pattern": "[^\\p{L}\\p{N}]+",
          "type": "regex"
        }
      ]
    },
    "index_id": "my-index",
    "index_uri": "s3://quickwit-indexes/my-index",
    "indexing_settings": {
      "commit_timeout_secs": 301,
      "docstore_blocksize": 1000000,
      "docstore_compression_level": 8,
      "merge_policy": {
        "maturation_period": "2days",
        "max_merge_factor": 11,
        "merge_factor": 9,
        "min_level_num_docs": 100000,
        "type": "stable_log"
      },
      "resources": {
        "heap_size": 50000000
      },
      "split_num_docs_target": 10000001
    },
    "retention": {
      "period": "90 days",
      "schedule": "daily"
    },
    "ingest_settings": {
      "min_shards": 12
    },
    "search_settings": {
      "default_search_fields": [
        "message"
      ]
    },
    "version": "0.9"
  },
  "index_uid": "my-index:00000000000000000000000001",
  "sources": [
    {
      "enabled": true,
      "input_format": "json",
      "num_pipelines": 2,
      "params": {
        "client_params": {},
        "topic": "kafka-topic"
      },
      "source_id": "kafka-source",
      "source_type": "kafka",
      "transform": {
        "script": ".message = downcase(string!(.message))",
        "timezone": "UTC"
      },
      "version": "0.9"
    }
  ],
  "version": "0.9"
}


================================================
FILE: quickwit/quickwit-metastore/test-data/index-metadata/v0.9.json
================================================
{
  "checkpoint": {
    "kafka-source": {
      "00000000000000000000": "00000000000000000042"
    }
  },
  "create_timestamp": 1789,
  "index_config": {
    "doc_mapping": {
      "doc_mapping_uid": "00000000000000000000000001",
      "dynamic_mapping": {
        "expand_dots": true,
        "fast": {
          "normalizer": "raw"
        },
        "indexed": true,
        "record": "basic",
        "stored": true,
        "tokenizer": "raw"
      },
      "field_mappings": [
        {
          "coerce": true,
          "fast": true,
          "indexed": true,
          "name": "tenant_id",
          "output_format": "number",
          "stored": true,
          "type": "u64"
        },
        {
          "fast": true,
          "fast_precision": "seconds",
          "indexed": true,
          "input_formats": [
            "rfc3339",
            "unix_timestamp"
          ],
          "name": "timestamp",
          "output_format": "rfc3339",
          "stored": true,
          "type": "datetime"
        },
        {
          "fast": false,
          "fieldnorms": false,
          "indexed": true,
          "name": "log_level",
          "record": "basic",
          "stored": true,
          "tokenizer": "raw",
          "type": "text"
        },
        {
          "fast": false,
          "fieldnorms": false,
          "indexed": true,
          "name": "message",
          "record": "position",
          "stored": true,
          "tokenizer": "default",
          "type": "text"
        }
      ],
      "index_field_presence": true,
      "max_num_partitions": 100,
      "mode": "dynamic",
      "partition_key": "tenant_id",
      "store_document_size": false,
      "store_source": true,
      "tag_fields": [
        "log_level",
        "tenant_id"
      ],
      "timestamp_field": "timestamp",
      "tokenizers": [
        {
          "filters": [],
          "name": "custom_tokenizer",
          "pattern": "[^\\p{L}\\p{N}]+",
          "type": "regex"
        }
      ]
    },
    "index_id": "my-index",
    "index_uri": "s3://quickwit-indexes/my-index",
    "indexing_settings": {
      "commit_timeout_secs": 301,
      "docstore_blocksize": 1000000,
      "docstore_compression_level": 8,
      "merge_policy": {
        "maturation_period": "2days",
        "max_merge_factor": 11,
        "merge_factor": 9,
        "min_level_num_docs": 100000,
        "type": "stable_log"
      },
      "resources": {
        "heap_size": 50000000
      },
      "split_num_docs_target": 10000001
    },
    "retention": {
      "period": "90 days",
      "schedule": "daily"
    },
    "ingest_settings": {
      "min_shards": 12
    },
    "search_settings": {
      "default_search_fields": [
        "message"
      ]
    },
    "version": "0.9"
  },
  "index_uid": "my-index:00000000000000000000000001",
  "sources": [
    {
      "enabled": true,
      "input_format": "json",
      "num_pipelines": 2,
      "params": {
        "client_params": {},
        "topic": "kafka-topic"
      },
      "source_id": "kafka-source",
      "source_type": "kafka",
      "transform": {
        "script": ".message = downcase(string!(.message))",
        "timezone": "UTC"
      },
      "version": "0.9"
    }
  ],
  "version": "0.9"
}


================================================
FILE: quickwit/quickwit-metastore/test-data/manifest/v0.7.expected.json
================================================
{
  "indexes": {
    "test-index-1": "creating",
    "test-index-2": "active",
    "test-index-3": "deleting"
  },
  "templates": [
    {
      "description": "Test description.",
      "doc_mapping": {
        "doc_mapping_uid": "00000000000000000000000000",
        "dynamic_mapping": {
          "expand_dots": true,
          "fast": {
            "normalizer": "raw"
          },
          "indexed": true,
          "record": "basic",
          "stored": true,
          "tokenizer": "raw"
        },
        "field_mappings": [
          {
            "fast": true,
            "fast_precision": "seconds",
            "indexed": true,
            "input_formats": [
              "rfc3339",
              "unix_timestamp"
            ],
            "name": "ts",
            "output_format": "rfc3339",
            "stored": true,
            "type": "datetime"
          },
          {
            "expand_dots": true,
            "fast": false,
            "indexed": true,
            "name": "message",
            "record": "basic",
            "stored": true,
            "tokenizer": "raw",
            "type": "json"
          }
        ],
        "index_field_presence": false,
        "max_num_partitions": 200,
        "mode": "dynamic",
        "store_document_size": false,
        "store_source": false,
        "tag_fields": [],
        "timestamp_field": "ts",
        "tokenizers": []
      },
      "index_id_patterns": [
        "test-index-foo*",
        "-test-index-foobar"
      ],
      "index_root_uri": "ram:///indexes",
      "indexing_settings": {
        "commit_timeout_secs": 60,
        "docstore_blocksize": 1000000,
        "docstore_compression_level": 8,
        "merge_policy": {
          "maturation_period": "2days",
          "max_merge_factor": 12,
          "merge_factor": 10,
          "min_level_num_docs": 100000,
          "type": "stable_log"
        },
        "resources": {
          "heap_size": 2000000000
        },
        "split_num_docs_target": 10000000
      },
      "priority": 100,
      "retention": {
        "period": "42 days",
        "schedule": "daily"
      },
      "ingest_settings": {
        "min_shards": 1
      },
      "search_settings": {
        "default_search_fields": []
      },
      "template_id": "test-template",
      "version": "0.9"
    }
  ],
  "version": "0.9"
}


================================================
FILE: quickwit/quickwit-metastore/test-data/manifest/v0.7.json
================================================
{
  "indexes": {
    "test-index-1": "creating",
    "test-index-2": "active",
    "test-index-3": "deleting"
  },
  "templates": [
    {
      "description": "Test description.",
      "doc_mapping": {
        "dynamic_mapping": {
          "expand_dots": true,
          "fast": {
            "normalizer": "raw"
          },
          "indexed": true,
          "record": "basic",
          "stored": true,
          "tokenizer": "raw"
        },
        "field_mappings": [
          {
            "fast": true,
            "fast_precision": "seconds",
            "indexed": true,
            "input_formats": [
              "rfc3339",
              "unix_timestamp"
            ],
            "name": "ts",
            "output_format": "rfc3339",
            "stored": true,
            "type": "datetime"
          },
          {
            "expand_dots": true,
            "fast": false,
            "indexed": true,
            "name": "message",
            "record": "basic",
            "stored": true,
            "tokenizer": "raw",
            "type": "json"
          }
        ],
        "index_field_presence": false,
        "max_num_partitions": 200,
        "mode": "dynamic",
        "store_source": false,
        "tag_fields": [],
        "timestamp_field": "ts",
        "tokenizers": []
      },
      "index_id_patterns": [
        "test-index-foo*",
        "-test-index-foobar"
      ],
      "index_root_uri": "ram:///indexes",
      "indexing_settings": {
        "commit_timeout_secs": 60,
        "docstore_blocksize": 1000000,
        "docstore_compression_level": 8,
        "merge_policy": {
          "maturation_period": "2days",
          "max_merge_factor": 12,
          "merge_factor": 10,
          "min_level_num_docs": 100000,
          "type": "stable_log"
        },
        "resources": {
          "heap_size": "2.0 GB"
        },
        "split_num_docs_target": 10000000
      },
      "priority": 100,
      "retention": {
        "period": "42 days",
        "schedule": "daily"
      },
      "search_settings": {
        "default_search_fields": []
      },
      "template_id": "test-template",
      "version": "0.7"
    }
  ],
  "version": "0.7"
}


================================================
FILE: quickwit/quickwit-metastore/test-data/manifest/v0.8.expected.json
================================================
{
  "indexes": {
    "test-index-1": "creating",
    "test-index-2": "active",
    "test-index-3": "deleting"
  },
  "templates": [
    {
      "description": "Test description.",
      "doc_mapping": {
        "doc_mapping_uid": "00000000000000000000000000",
        "dynamic_mapping": {
          "expand_dots": true,
          "fast": {
            "normalizer": "raw"
          },
          "indexed": true,
          "record": "basic",
          "stored": true,
          "tokenizer": "raw"
        },
        "field_mappings": [
          {
            "fast": true,
            "fast_precision": "seconds",
            "indexed": true,
            "input_formats": [
              "rfc3339",
              "unix_timestamp"
            ],
            "name": "ts",
            "output_format": "rfc3339",
            "stored": true,
            "type": "datetime"
          },
          {
            "expand_dots": true,
            "fast": false,
            "indexed": true,
            "name": "message",
            "record": "basic",
            "stored": true,
            "tokenizer": "raw",
            "type": "json"
          }
        ],
        "index_field_presence": false,
        "max_num_partitions": 200,
        "mode": "dynamic",
        "store_document_size": false,
        "store_source": false,
        "tag_fields": [],
        "timestamp_field": "ts",
        "tokenizers": []
      },
      "index_id_patterns": [
        "test-index-foo*",
        "-test-index-foobar"
      ],
      "index_root_uri": "ram:///indexes",
      "indexing_settings": {
        "commit_timeout_secs": 60,
        "docstore_blocksize": 1000000,
        "docstore_compression_level": 8,
        "merge_policy": {
          "maturation_period": "2days",
          "max_merge_factor": 12,
          "merge_factor": 10,
          "min_level_num_docs": 100000,
          "type": "stable_log"
        },
        "resources": {
          "heap_size": 2000000000
        },
        "split_num_docs_target": 10000000
      },
      "priority": 100,
      "ingest_settings": {
        "min_shards": 1
      },
      "retention": {
        "period": "42 days",
        "schedule": "daily"
      },
      "search_settings": {
        "default_search_fields": []
      },
      "template_id": "test-template",
      "version": "0.9"
    }
  ],
  "version": "0.9"
}


================================================
FILE: quickwit/quickwit-metastore/test-data/manifest/v0.8.json
================================================
{
  "indexes": {
    "test-index-1": "creating",
    "test-index-2": "active",
    "test-index-3": "deleting"
  },
  "templates": [
    {
      "description": "Test description.",
      "doc_mapping": {
        "dynamic_mapping": {
          "expand_dots": true,
          "fast": {
            "normalizer": "raw"
          },
          "indexed": true,
          "record": "basic",
          "stored": true,
          "tokenizer": "raw"
        },
        "field_mappings": [
          {
            "fast": true,
            "fast_precision": "seconds",
            "indexed": true,
            "input_formats": [
              "rfc3339",
              "unix_timestamp"
            ],
            "name": "ts",
            "output_format": "rfc3339",
            "stored": true,
            "type": "datetime"
          },
          {
            "expand_dots": true,
            "fast": false,
            "indexed": true,
            "name": "message",
            "record": "basic",
            "stored": true,
            "tokenizer": "raw",
            "type": "json"
          }
        ],
        "index_field_presence": false,
        "max_num_partitions": 200,
        "mode": "dynamic",
        "store_document_size": false,
        "store_source": false,
        "tag_fields": [],
        "timestamp_field": "ts",
        "tokenizers": []
      },
      "index_id_patterns": [
        "test-index-foo*",
        "-test-index-foobar"
      ],
      "index_root_uri": "ram:///indexes",
      "indexing_settings": {
        "commit_timeout_secs": 60,
        "docstore_blocksize": 1000000,
        "docstore_compression_level": 8,
        "merge_policy": {
          "maturation_period": "2days",
          "max_merge_factor": 12,
          "merge_factor": 10,
          "min_level_num_docs": 100000,
          "type": "stable_log"
        },
        "resources": {
          "heap_size": "2.0 GB"
        },
        "split_num_docs_target": 10000000
      },
      "priority": 100,
      "retention": {
        "period": "42 days",
        "schedule": "daily"
      },
      "search_settings": {
        "default_search_fields": []
      },
      "template_id": "test-template",
      "version": "0.8"
    }
  ],
  "version": "0.8"
}


================================================
FILE: quickwit/quickwit-metastore/test-data/manifest/v0.9.expected.json
================================================
{
  "indexes": {
    "test-index-1": "creating",
    "test-index-2": "active",
    "test-index-3": "deleting"
  },
  "templates": [
    {
      "description": "Test description.",
      "doc_mapping": {
        "doc_mapping_uid": "00000000000000000000000001",
        "dynamic_mapping": {
          "expand_dots": true,
          "fast": {
            "normalizer": "raw"
          },
          "indexed": true,
          "record": "basic",
          "stored": true,
          "tokenizer": "raw"
        },
        "field_mappings": [
          {
            "fast": true,
            "fast_precision": "seconds",
            "indexed": true,
            "input_formats": [
              "rfc3339",
              "unix_timestamp"
            ],
            "name": "ts",
            "output_format": "rfc3339",
            "stored": true,
            "type": "datetime"
          },
          {
            "expand_dots": true,
            "fast": false,
            "indexed": true,
            "name": "message",
            "record": "basic",
            "stored": true,
            "tokenizer": "raw",
            "type": "json"
          }
        ],
        "index_field_presence": false,
        "max_num_partitions": 200,
        "mode": "dynamic",
        "store_document_size": false,
        "store_source": false,
        "tag_fields": [],
        "timestamp_field": "ts",
        "tokenizers": []
      },
      "index_id_patterns": [
        "test-index-foo*",
        "-test-index-foobar"
      ],
      "index_root_uri": "ram:///indexes",
      "indexing_settings": {
        "commit_timeout_secs": 60,
        "docstore_blocksize": 1000000,
        "docstore_compression_level": 8,
        "merge_policy": {
          "maturation_period": "2days",
          "max_merge_factor": 12,
          "merge_factor": 10,
          "min_level_num_docs": 100000,
          "type": "stable_log"
        },
        "resources": {
          "heap_size": 2000000000
        },
        "split_num_docs_target": 10000000
      },
      "ingest_settings": {
        "min_shards": 1
      },
      "priority": 100,
      "retention": {
        "period": "42 days",
        "schedule": "daily"
      },
      "search_settings": {
        "default_search_fields": []
      },
      "template_id": "test-template",
      "version": "0.9"
    }
  ],
  "version": "0.9"
}


================================================
FILE: quickwit/quickwit-metastore/test-data/manifest/v0.9.json
================================================
{
  "indexes": {
    "test-index-1": "creating",
    "test-index-2": "active",
    "test-index-3": "deleting"
  },
  "templates": [
    {
      "description": "Test description.",
      "doc_mapping": {
        "doc_mapping_uid": "00000000000000000000000001",
        "dynamic_mapping": {
          "expand_dots": true,
          "fast": {
            "normalizer": "raw"
          },
          "indexed": true,
          "record": "basic",
          "stored": true,
          "tokenizer": "raw"
        },
        "field_mappings": [
          {
            "fast": true,
            "fast_precision": "seconds",
            "indexed": true,
            "input_formats": [
              "rfc3339",
              "unix_timestamp"
            ],
            "name": "ts",
            "output_format": "rfc3339",
            "stored": true,
            "type": "datetime"
          },
          {
            "expand_dots": true,
            "fast": false,
            "indexed": true,
            "name": "message",
            "record": "basic",
            "stored": true,
            "tokenizer": "raw",
            "type": "json"
          }
        ],
        "index_field_presence": false,
        "max_num_partitions": 200,
        "mode": "dynamic",
        "store_document_size": false,
        "store_source": false,
        "tag_fields": [],
        "timestamp_field": "ts",
        "tokenizers": []
      },
      "index_id_patterns": [
        "test-index-foo*",
        "-test-index-foobar"
      ],
      "index_root_uri": "ram:///indexes",
      "indexing_settings": {
        "commit_timeout_secs": 60,
        "docstore_blocksize": 1000000,
        "docstore_compression_level": 8,
        "merge_policy": {
          "maturation_period": "2days",
          "max_merge_factor": 12,
          "merge_factor": 10,
          "min_level_num_docs": 100000,
          "type": "stable_log"
        },
        "resources": {
          "heap_size": 2000000000
        },
        "split_num_docs_target": 10000000
      },
      "priority": 100,
      "retention": {
        "period": "42 days",
        "schedule": "daily"
      },
      "ingest_settings": {
        "min_shards": 1
      },
      "search_settings": {
        "default_search_fields": []
      },
      "template_id": "test-template",
      "version": "0.9"
    }
  ],
  "version": "0.9"
}


================================================
FILE: quickwit/quickwit-metastore/test-data/split-metadata/v0.7.expected.json
================================================
{
  "version": "0.9",
  "split_id": "split",
  "index_uid": "my-index:00000000000000000000000000",
  "partition_id": 7,
  "source_id": "source",
  "node_id": "node",
  "num_docs": 12303,
  "uncompressed_docs_size_in_bytes": 234234,
  "time_range": {
    "start": 121000,
    "end": 130198
  },
  "create_timestamp": 3,
  "maturity": {
    "type": "immature",
    "maturation_period_millis": 4000
  },
  "tags": [
    "234",
    "aaa"
  ],
  "footer_offsets": {
    "start": 1000,
    "end": 2000
  },
  "delete_opstamp": 10,
  "num_merge_ops": 3,
  "doc_mapping_uid": "00000000000000000000000000"
}


================================================
FILE: quickwit/quickwit-metastore/test-data/split-metadata/v0.7.json
================================================
{
  "create_timestamp": 3,
  "delete_opstamp": 10,
  "footer_offsets": {
    "end": 2000,
    "start": 1000
  },
  "index_uid": "my-index:00000000000000000000000000",
  "maturity": {
    "maturation_period_millis": 4000,
    "type": "immature"
  },
  "node_id": "node",
  "num_docs": 12303,
  "num_merge_ops": 3,
  "partition_id": 7,
  "source_id": "source",
  "split_id": "split",
  "tags": [
    "234",
    "aaa"
  ],
  "time_range": {
    "end": 130198,
    "start": 121000
  },
  "uncompressed_docs_size_in_bytes": 234234,
  "version": "0.7"
}


================================================
FILE: quickwit/quickwit-metastore/test-data/split-metadata/v0.8.expected.json
================================================
{
  "version": "0.9",
  "split_id": "split",
  "index_uid": "my-index:00000000000000000000000000",
  "partition_id": 7,
  "source_id": "source",
  "node_id": "node",
  "num_docs": 12303,
  "uncompressed_docs_size_in_bytes": 234234,
  "time_range": {
    "start": 121000,
    "end": 130198
  },
  "create_timestamp": 3,
  "maturity": {
    "type": "immature",
    "maturation_period_millis": 4000
  },
  "tags": [
    "234",
    "aaa"
  ],
  "footer_offsets": {
    "start": 1000,
    "end": 2000
  },
  "delete_opstamp": 10,
  "num_merge_ops": 3,
  "doc_mapping_uid": "00000000000000000000000000"
}


================================================
FILE: quickwit/quickwit-metastore/test-data/split-metadata/v0.8.json
================================================
{
  "create_timestamp": 3,
  "delete_opstamp": 10,
  "footer_offsets": {
    "end": 2000,
    "start": 1000
  },
  "index_uid": "my-index:00000000000000000000000000",
  "maturity": {
    "maturation_period_millis": 4000,
    "type": "immature"
  },
  "node_id": "node",
  "num_docs": 12303,
  "num_merge_ops": 3,
  "partition_id": 7,
  "source_id": "source",
  "split_id": "split",
  "tags": [
    "234",
    "aaa"
  ],
  "time_range": {
    "end": 130198,
    "start": 121000
  },
  "uncompressed_docs_size_in_bytes": 234234,
  "version": "0.8"
}


================================================
FILE: quickwit/quickwit-metastore/test-data/split-metadata/v0.9.expected.json
================================================
{
  "version": "0.9",
  "split_id": "split",
  "index_uid": "my-index:00000000000000000000000001",
  "partition_id": 7,
  "source_id": "source",
  "node_id": "node",
  "num_docs": 12303,
  "uncompressed_docs_size_in_bytes": 234234,
  "time_range": {
    "start": 121000,
    "end": 130198
  },
  "create_timestamp": 3,
  "maturity": {
    "type": "immature",
    "maturation_period_millis": 4000
  },
  "tags": [
    "234",
    "aaa"
  ],
  "footer_offsets": {
    "start": 1000,
    "end": 2000
  },
  "delete_opstamp": 10,
  "num_merge_ops": 3,
  "doc_mapping_uid": "00000000000000000000000000"
}


================================================
FILE: quickwit/quickwit-metastore/test-data/split-metadata/v0.9.json
================================================
{
  "version": "0.9",
  "split_id": "split",
  "index_uid": "my-index:00000000000000000000000001",
  "partition_id": 7,
  "source_id": "source",
  "node_id": "node",
  "num_docs": 12303,
  "uncompressed_docs_size_in_bytes": 234234,
  "time_range": {
    "start": 121000,
    "end": 130198
  },
  "create_timestamp": 3,
  "maturity": {
    "type": "immature",
    "maturation_period_millis": 4000
  },
  "tags": [
    "234",
    "aaa"
  ],
  "footer_offsets": {
    "start": 1000,
    "end": 2000
  },
  "delete_opstamp": 10,
  "num_merge_ops": 3,
  "doc_mapping_uid": "00000000000000000000000000"
}


================================================
FILE: quickwit/quickwit-metastore-utils/Cargo.toml
================================================
[package]
name = "quickwit-metastore-utils"
description = "Metastore utilities"

version.workspace = true
edition.workspace = true
homepage.workspace = true
documentation.workspace = true
repository.workspace = true
authors.workspace = true
license.workspace = true

[[bin]]
name = "replay"

[[bin]]
name = "proxy"

[dependencies]
anyhow = { workspace = true }
async-trait = { workspace = true }
quickwit-proto = { workspace = true }
serde = "1"
serde_json = { workspace = true }
structopt = "0.3"
tokio = { workspace = true }


================================================
FILE: quickwit/quickwit-metastore-utils/src/bin/README.md
================================================
# Replay

Replay is a small util that sequentially replays a bunch of gRPC calls made to the
quickwit metastore, as fast as possible.

Right now, both the grpc address and the file are hardcoded.

To run it:

- run `cargo run --release --bin replay` from the `quickwit-metastore` directory.

It assumes a quickwit metastore service is running on `localhost:7280`

To get that, simply run:
`./quickwit run --service metastore`

A minimal `quickwit.yaml` to run against the postgres could be

```yaml
version: "0.7"
metastore_uri: postgres://quickwit-dev:quickwit-dev@localhost/quickwit-metastore-dev
```

To run postgres

`docker-compose up postgres` from the quickwit root directory.

# Warning

The replay file first request is creating the index.
That request actually includes an index_config json data, and this part is about to be heavily changed.

For the moment, I recommend experimenting on top of quickwit rev 2b0e3963f67303f4e6a362d53fa8bebd3cbad33e.

# Warning 2

The replay data does not delete the index and the splits.

It is required to run
`TRUNCATE TABLE indexes CASCADE;`
via
`psql -h localhost -U quickwit-dev quickwit-metastore-dev`

to rerun the replay data.


================================================
FILE: quickwit/quickwit-metastore-utils/src/bin/proxy.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::net::SocketAddr;
use std::path::PathBuf;
use std::sync::Arc;

use async_trait::async_trait;
use quickwit_metastore_utils::{GrpcCall, GrpcRequest};
use quickwit_proto::metastore::*;
use quickwit_proto::tonic;
use quickwit_proto::tonic::transport::Channel;
use quickwit_proto::tonic::{Request, Response, Status};
use structopt::StructOpt;
use tokio::fs::File;
use tokio::io::{AsyncWriteExt, BufWriter};
use tokio::sync::Mutex;
use tokio::time::Instant;

struct Inner {
    start: Instant,
    client: MetastoreServiceClient,
    file: BufWriter<File>,
}

struct MetastoreProxyService {
    inner: Arc<Mutex<Inner>>,
}

impl MetastoreProxyService {
    pub fn new(client: MetastoreServiceClient, record_file: File) -> Self {
        let inner = Inner {
            start: Instant::now(),
            client,
            file: BufWriter::new(record_file),
        };
        Self {
            inner: Arc::new(Mutex::new(inner)),
        }
    }
}

impl Inner {
    async fn record<T: Into<GrpcRequest>>(&mut self, req: T) -> anyhow::Result<()> {
        let now = Instant::now();
        let grpc_request = req.into();
        let elapsed = now - self.start;
        let grpc_call = GrpcCall {
            ts: elapsed.as_millis() as u64,
            grpc_request,
        };
        let mut buf = serde_json::to_vec(&grpc_call)?;
        buf.push(b'\n');
        self.file.write_all(&buf).await?;
        Ok(())
    }
}

#[async_trait]
impl MetastoreService for MetastoreProxyService {
    /// Creates an index.
    async fn create_index(
        &self,
        request: tonic::Request<CreateIndexRequest>,
    ) -> Result<tonic::Response<CreateIndexResponse>, tonic::Status> {
        let mut lock = self.inner.lock().await;
        lock.record(request.get_ref().clone()).await.unwrap();
        let resp = lock.client.create_index(request).await?;
        Ok(resp)
    }
    /// Gets an index metadata.
    async fn index_metadata(
        &self,
        request: tonic::Request<IndexMetadataRequest>,
    ) -> Result<tonic::Response<IndexMetadataResponse>, tonic::Status> {
        let mut lock = self.inner.lock().await;
        lock.record(request.get_ref().clone()).await.unwrap();
        let resp = lock.client.index_metadata(request).await?;
        Ok(resp)
    }
    /// Gets an indexes metadatas.
    async fn list_indexes_metadata(
        &self,
        request: tonic::Request<ListIndexesMetadataRequest>,
    ) -> Result<tonic::Response<ListIndexesMetadataResponse>, tonic::Status> {
        let mut lock = self.inner.lock().await;
        lock.record(request.get_ref().clone()).await.unwrap();
        let resp = lock.client.list_indexes_metadata(request).await?;
        Ok(resp)
    }
    /// Deletes an index
    async fn delete_index(
        &self,
        request: tonic::Request<DeleteIndexRequest>,
    ) -> Result<tonic::Response<DeleteIndexResponse>, tonic::Status> {
        let mut lock = self.inner.lock().await;
        lock.record(request.get_ref().clone()).await.unwrap();
        let resp = lock.client.delete_index(request).await?;
        Ok(resp)
    }
    /// Gets splits from index.
    async fn list_splits(
        &self,
        request: tonic::Request<ListSplitsRequest>,
    ) -> Result<tonic::Response<ListSplitsResponse>, tonic::Status> {
        let mut lock = self.inner.lock().await;
        lock.record(request.get_ref().clone()).await.unwrap();
        let resp = lock.client.list_splits(request).await?;
        Ok(resp)
    }
    /// Stages several splits.
    async fn stage_splits(
        &self,
        request: Request<StageSplitsRequest>,
    ) -> Result<Response<SplitResponse>, Status> {
        let mut lock = self.inner.lock().await;
        lock.record(request.get_ref().clone()).await.unwrap();
        let resp = lock.client.stage_splits(request).await?;
        Ok(resp)
    }
    /// Publishes split.
    async fn publish_splits(
        &self,
        request: tonic::Request<PublishSplitsRequest>,
    ) -> Result<tonic::Response<SplitResponse>, tonic::Status> {
        let mut lock = self.inner.lock().await;
        lock.record(request.get_ref().clone()).await.unwrap();
        let resp = lock.client.publish_splits(request).await?;
        Ok(resp)
    }
    /// Marks splits for deletion.
    async fn mark_splits_for_deletion(
        &self,
        request: tonic::Request<MarkSplitsForDeletionRequest>,
    ) -> Result<tonic::Response<SplitResponse>, tonic::Status> {
        let mut lock = self.inner.lock().await;
        lock.record(request.get_ref().clone()).await.unwrap();
        let resp = lock.client.mark_splits_for_deletion(request).await?;
        Ok(resp)
    }
    /// Deletes splits.
    async fn delete_splits(
        &self,
        request: tonic::Request<DeleteSplitsRequest>,
    ) -> Result<tonic::Response<SplitResponse>, tonic::Status> {
        let mut lock = self.inner.lock().await;
        lock.record(request.get_ref().clone()).await.unwrap();
        let resp = lock.client.delete_splits(request).await?;
        Ok(resp)
    }
    /// Adds source.
    async fn add_source(
        &self,
        request: tonic::Request<AddSourceRequest>,
    ) -> Result<tonic::Response<SourceResponse>, tonic::Status> {
        let mut lock = self.inner.lock().await;
        lock.record(request.get_ref().clone()).await.unwrap();
        let resp = lock.client.add_source(request).await?;
        Ok(resp)
    }
    /// Toggles source.
    async fn toggle_source(
        &self,
        request: tonic::Request<ToggleSourceRequest>,
    ) -> Result<tonic::Response<SourceResponse>, tonic::Status> {
        let mut lock = self.inner.lock().await;
        lock.record(request.get_ref().clone()).await.unwrap();
        let resp = lock.client.toggle_source(request).await?;
        Ok(resp)
    }
    /// Removes source.
    async fn delete_source(
        &self,
        request: tonic::Request<DeleteSourceRequest>,
    ) -> Result<tonic::Response<SourceResponse>, tonic::Status> {
        let mut lock = self.inner.lock().await;
        lock.record(request.get_ref().clone()).await.unwrap();
        let resp = lock.client.delete_source(request).await?;
        Ok(resp)
    }
    /// Resets source checkpoint.
    async fn reset_source_checkpoint(
        &self,
        request: tonic::Request<ResetSourceCheckpointRequest>,
    ) -> Result<tonic::Response<SourceResponse>, tonic::Status> {
        let mut lock = self.inner.lock().await;
        lock.record(request.get_ref().clone()).await.unwrap();
        let resp = lock.client.reset_source_checkpoint(request).await?;
        Ok(resp)
    }
    /// Gets last opstamp for a given `index_id`.
    async fn last_delete_opstamp(
        &self,
        request: tonic::Request<LastDeleteOpstampRequest>,
    ) -> Result<tonic::Response<LastDeleteOpstampResponse>, tonic::Status> {
        let mut lock = self.inner.lock().await;
        lock.record(request.get_ref().clone()).await.unwrap();
        let resp = lock.client.last_delete_opstamp(request).await?;
        Ok(resp)
    }
    /// Creates a delete task.
    async fn create_delete_task(
        &self,
        request: tonic::Request<DeleteQuery>,
    ) -> Result<tonic::Response<DeleteTask>, tonic::Status> {
        let mut lock = self.inner.lock().await;
        lock.record(request.get_ref().clone()).await.unwrap();
        let resp = lock.client.create_delete_task(request).await?;
        Ok(resp)
    }
    /// Updates splits `delete_opstamp`.
    async fn update_splits_delete_opstamp(
        &self,
        request: tonic::Request<UpdateSplitsDeleteOpstampRequest>,
    ) -> Result<tonic::Response<UpdateSplitsDeleteOpstampResponse>, tonic::Status> {
        let mut lock = self.inner.lock().await;
        lock.record(request.get_ref().clone()).await.unwrap();
        let resp = lock.client.update_splits_delete_opstamp(request).await?;
        Ok(resp)
    }
    /// Lists delete tasks with `delete_task.opstamp` > `opstamp_start` for a given `index_id`.
    async fn list_delete_tasks(
        &self,
        request: tonic::Request<ListDeleteTasksRequest>,
    ) -> Result<tonic::Response<ListDeleteTasksResponse>, tonic::Status> {
        let mut lock = self.inner.lock().await;
        lock.record(request.get_ref().clone()).await.unwrap();
        let resp = lock.client.list_delete_tasks(request).await?;
        Ok(resp)
    }
    //// Lists splits with `split.delete_opstamp` < `delete_opstamp` for a given `index_id`.
    async fn list_stale_splits(
        &self,
        request: tonic::Request<ListStaleSplitsRequest>,
    ) -> Result<tonic::Response<ListSplitsResponse>, tonic::Status> {
        let mut lock = self.inner.lock().await;
        lock.record(request.get_ref().clone()).await.unwrap();
        let resp = lock.client.list_stale_splits(request).await?;
        Ok(resp)
    }
}

#[derive(Debug, StructOpt)]
#[structopt(name = "proxy", about = "A quickwit-metastore recording proxy.")]
struct Opt {
    #[structopt(default_value = "127.0.0.1:7291")]
    listen_to: SocketAddr,
    #[structopt(long, default_value = "http://127.0.0.1:7281")]
    forward_to: String,
    #[structopt(long, default_value = "./replay.ndjson")]
    file: PathBuf,
}

#[tokio::main]
async fn main() -> anyhow::Result<()> {
    let opt = Opt::from_args();
    let client = MetastoreServiceClient::connect(opt.forward_to.clone()).await?;
    let file = File::create(&opt.file).await?;
    let service = MetastoreProxyService::new(client, file);
    let server = MetastoreServiceServer::new(service);
    println!(
        "Listening to {}, Forwarding to {}",
        opt.listen_to, opt.forward_to
    );
    tonic::transport::Server::builder()
        .add_service(server)
        .serve(opt.listen_to)
        .await?;
    Ok(())
}


================================================
FILE: quickwit/quickwit-metastore-utils/src/bin/replay.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::path::PathBuf;

use quickwit_metastore_utils::{GrpcCall, GrpcRequest};
use quickwit_proto::metastore::metastore_service_client::MetastoreServiceClient;
use quickwit_proto::tonic::transport::Channel;
use structopt::StructOpt;
use tokio::fs::File;
use tokio::io::AsyncBufReadExt;

async fn replay_grpc_request(
    client: &mut MetastoreServiceClient<Channel>,
    req: GrpcRequest,
) -> anyhow::Result<()> {
    match req {
        GrpcRequest::CreateIndexRequest(req) => {
            client.create_index(req).await?;
        }
        GrpcRequest::IndexMetadataRequest(req) => {
            client.index_metadata(req).await?;
        }
        GrpcRequest::ListIndexesMetadataRequest(req) => {
            client.list_indexes_metadata(req).await?;
        }
        GrpcRequest::DeleteIndexRequest(req) => {
            client.delete_index(req).await?;
        }
        GrpcRequest::ListSplitsRequest(req) => {
            client.list_splits(req).await?;
        }
        GrpcRequest::StageSplitsRequest(req) => {
            client.stage_splits(req).await?;
        }
        GrpcRequest::PublishSplitsRequest(req) => {
            client.publish_splits(req).await?;
        }
        GrpcRequest::MarkSplitsForDeletionRequest(req) => {
            client.mark_splits_for_deletion(req).await?;
        }
        GrpcRequest::DeleteSplitsRequest(req) => {
            client.delete_splits(req).await?;
        }
        GrpcRequest::AddSourceRequest(req) => {
            client.add_source(req).await?;
        }
        GrpcRequest::ToggleSourceRequest(req) => {
            client.toggle_source(req).await?;
        }
        GrpcRequest::DeleteSourceRequest(req) => {
            client.delete_source(req).await?;
        }
        GrpcRequest::LastDeleteOpstampRequest(req) => {
            client.last_delete_opstamp(req).await?;
        }
        GrpcRequest::ResetSourceCheckpointRequest(req) => {
            client.reset_source_checkpoint(req).await?;
        }
        GrpcRequest::DeleteQuery(req) => {
            client.create_delete_task(req).await?;
        }
        GrpcRequest::UpdateSplitsDeleteOpstampRequest(req) => {
            client.update_splits_delete_opstamp(req).await?;
        }
        GrpcRequest::ListDeleteTasksRequest(req) => {
            client.list_delete_tasks(req).await?;
        }
        GrpcRequest::ListStaleSplitsRequest(req) => {
            client.list_stale_splits(req).await?;
        }
    }
    Ok(())
}

#[derive(Debug, StructOpt)]
#[structopt(
    name = "replay",
    about = "A quickwit-metastore program to replay request log generated by proxy"
)]
struct Opt {
    #[structopt(
        long,
        default_value = "./replay-data/requests-partition-wikitenant.ndjson"
    )]
    file: PathBuf,
    #[structopt(long, default_value = "http://127.0.0.1:7281")]
    forward_to: String,
}

#[tokio::main]
async fn main() -> anyhow::Result<()> {
    let opt = Opt::from_args();
    let file = File::open(&opt.file).await?;
    let buffered = tokio::io::BufReader::new(file);
    let mut lines = buffered.lines();
    let mut client = MetastoreServiceClient::connect(opt.forward_to.clone()).await?;
    let mut i = 0;
    while let Some(line) = lines.next_line().await? {
        println!("line {i} = {line}");
        let grpc_call: GrpcCall = serde_json::from_str(&line)?;
        replay_grpc_request(&mut client, grpc_call.grpc_request).await?;
        i += 1;
    }
    Ok(())
}


================================================
FILE: quickwit/quickwit-metastore-utils/src/grpc_request.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use quickwit_proto::metastore::*;

// The macros below are generating a req enum of the form
//
// ```
// enum GrpcRequest {
//    CreateIndexRequest(CreateIndexRequest),
//    IndexMetadataRequest(IndexMetadataRequest),
//    ...
// }
// ```
//
// And adds a From<SpecificRequest> implementation for
// every specific request.

macro_rules! build_req_enum {
    ( $($key:ident,)* ) => {
        use serde::{Serialize, Deserialize};
        #[derive(Serialize, Deserialize)]
        #[serde(tag="type")]
        pub enum GrpcRequest {
            $( $key($key), )*
        }
    }
}

macro_rules! generate_req_enum {
    ( $($key:ident,)* ) => {
        build_req_enum!($($key,)*);
        req_from_impls!($($key,)*);
    }
}

macro_rules! req_from_impls {
    ($name:ident,) => {
        impl From<$name> for GrpcRequest {
            fn from(req: $name) -> Self {
                GrpcRequest::$name(req)
            }
        }
    };
    ($name:ident, $($other:ident,)+) => {
        req_from_impls!($name,);
        req_from_impls!($($other,)+);
    }
}

generate_req_enum!(
    CreateIndexRequest,
    IndexMetadataRequest,
    ListIndexesMetadataRequest,
    DeleteIndexRequest,
    ListSplitsRequest,
    StageSplitsRequest,
    PublishSplitsRequest,
    MarkSplitsForDeletionRequest,
    DeleteSplitsRequest,
    AddSourceRequest,
    ToggleSourceRequest,
    DeleteSourceRequest,
    LastDeleteOpstampRequest,
    ResetSourceCheckpointRequest,
    DeleteQuery,
    UpdateSplitsDeleteOpstampRequest,
    ListDeleteTasksRequest,
    ListStaleSplitsRequest,
);


================================================
FILE: quickwit/quickwit-metastore-utils/src/lib.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#![deny(clippy::disallowed_methods)]

mod grpc_request;
pub use grpc_request::GrpcRequest;
use serde::{Deserialize, Serialize};

#[derive(Serialize, Deserialize)]
pub struct GrpcCall {
    pub ts: u64,
    pub grpc_request: GrpcRequest,
}


================================================
FILE: quickwit/quickwit-opentelemetry/Cargo.toml
================================================
[package]
name = "quickwit-opentelemetry"
description = "Telemetry server"

version.workspace = true
edition.workspace = true
homepage.workspace = true
documentation.workspace = true
repository.workspace = true
authors.workspace = true
license.workspace = true

[dependencies]
anyhow = { workspace = true }
async-trait = { workspace = true }
once_cell = { workspace = true }
prost = { workspace = true }
serde = { workspace = true }
serde_json = { workspace = true }
thiserror = { workspace = true }
time = { workspace = true }
tokio = { workspace = true }
tonic = { workspace = true }
tracing = { workspace = true }

quickwit-common = { workspace = true }
quickwit-config = { workspace = true }
quickwit-ingest = { workspace = true }
quickwit-proto = { workspace = true }

[dev-dependencies]
quickwit-common = { workspace = true, features = ["testsuite"] }
quickwit-metastore = { workspace = true, features = ["testsuite"] }
quickwit-proto = { workspace = true, features = ["testsuite"] }

[features]
testsuite = []


================================================
FILE: quickwit/quickwit-opentelemetry/src/lib.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#![deny(clippy::disallowed_methods)]

pub mod otlp;


================================================
FILE: quickwit/quickwit-opentelemetry/src/otlp/logs.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::HashMap;

use async_trait::async_trait;
use prost::Message;
use quickwit_common::thread_pool::run_cpu_intensive;
use quickwit_common::uri::Uri;
use quickwit_config::{ConfigFormat, IndexConfig, load_index_config_from_user_config};
use quickwit_ingest::{CommitType, JsonDocBatchV2Builder};
use quickwit_proto::ingest::DocBatchV2;
use quickwit_proto::ingest::router::IngestRouterServiceClient;
use quickwit_proto::opentelemetry::proto::collector::logs::v1::logs_service_server::LogsService;
use quickwit_proto::opentelemetry::proto::collector::logs::v1::{
    ExportLogsPartialSuccess, ExportLogsServiceRequest, ExportLogsServiceResponse,
};
use quickwit_proto::types::{DocUidGenerator, IndexId};
use serde::{Deserialize, Serialize};
use serde_json::Value as JsonValue;
use time::OffsetDateTime;
use tonic::{Request, Response, Status};
use tracing::field::Empty;
use tracing::{Span as RuntimeSpan, error, instrument, warn};

use super::{
    OtelSignal, SpanId, TraceId, TryFromSpanIdError, TryFromTraceIdError,
    extract_otel_index_id_from_metadata, ingest_doc_batch_v2, is_zero, parse_log_record_body,
};
use crate::otlp::extract_attributes;
use crate::otlp::metrics::OTLP_SERVICE_METRICS;

pub const OTEL_LOGS_INDEX_ID: &str = "otel-logs-v0_9";

const OTEL_LOGS_INDEX_CONFIG: &str = r#"
version: 0.8

index_id: ${INDEX_ID}

doc_mapping:
  mode: strict
  field_mappings:
    - name: timestamp_nanos
      type: datetime
      input_formats: [unix_timestamp]
      output_format: unix_timestamp_nanos
      indexed: false
      fast: true
      fast_precision: milliseconds
    - name: observed_timestamp_nanos
      type: datetime
      input_formats: [unix_timestamp]
      output_format: unix_timestamp_nanos
    - name: service_name
      type: text
      tokenizer: raw
      fast: true
    - name: severity_text
      type: text
      tokenizer: raw
      fast: true
    - name: severity_number
      type: u64
      fast: true
    - name: body
      type: json
      tokenizer: default
    - name: attributes
      type: json
      tokenizer: raw
      fast: true
    - name: dropped_attributes_count
      type: u64
      indexed: false
    - name: trace_id
      type: bytes
      input_format: hex
      output_format: hex
    - name: span_id
      type: bytes
      input_format: hex
      output_format: hex
    - name: trace_flags
      type: u64
      indexed: false
    - name: resource_attributes
      type: json
      tokenizer: raw
      fast: true
    - name: resource_dropped_attributes_count
      type: u64
      indexed: false
    - name: scope_name
      type: text
      indexed: false
    - name: scope_version
      type: text
      indexed: false
    - name: scope_attributes
      type: json
      indexed: false
    - name: scope_dropped_attributes_count
      type: u64
      indexed: false

  timestamp_field: timestamp_nanos

  # partition_key: hash_mod(service_name, 100)
  # tag_fields: [service_name]

indexing_settings:
  commit_timeout_secs: 5

search_settings:
  default_search_fields: [body.message]
"#;

#[derive(Debug, thiserror::Error)]
pub enum OtlpLogsError {
    #[error("failed to deserialize JSON log records: `{0}`")]
    Json(#[from] serde_json::Error),
    #[error("failed to deserialize Protobuf log records: `{0}`")]
    Protobuf(#[from] prost::DecodeError),
    #[error("failed to parse log record: `{0}`")]
    SpanId(#[from] TryFromSpanIdError),
    #[error("failed to parse log record: `{0}`")]
    TraceId(#[from] TryFromTraceIdError),
}

#[derive(Debug, Serialize, Deserialize)]
pub struct LogRecord {
    pub timestamp_nanos: u64,
    pub observed_timestamp_nanos: u64,
    #[serde(default)]
    #[serde(skip_serializing_if = "String::is_empty")]
    pub service_name: String,
    #[serde(default)]
    #[serde(skip_serializing_if = "Option::is_none")]
    pub severity_text: Option<String>,
    pub severity_number: i32,
    #[serde(default)]
    #[serde(skip_serializing_if = "Option::is_none")]
    pub body: Option<JsonValue>,
    #[serde(default)]
    #[serde(skip_serializing_if = "HashMap::is_empty")]
    pub attributes: HashMap<String, JsonValue>,
    #[serde(default)]
    #[serde(skip_serializing_if = "is_zero")]
    pub dropped_attributes_count: u32,
    #[serde(default)]
    #[serde(skip_serializing_if = "Option::is_none")]
    pub trace_id: Option<TraceId>,
    #[serde(default)]
    #[serde(skip_serializing_if = "Option::is_none")]
    pub span_id: Option<SpanId>,
    #[serde(default)]
    #[serde(skip_serializing_if = "Option::is_none")]
    pub trace_flags: Option<u32>,
    #[serde(default)]
    #[serde(skip_serializing_if = "HashMap::is_empty")]
    pub resource_attributes: HashMap<String, JsonValue>,
    #[serde(default)]
    #[serde(skip_serializing_if = "is_zero")]
    pub resource_dropped_attributes_count: u32,
    #[serde(default)]
    #[serde(skip_serializing_if = "Option::is_none")]
    pub scope_name: Option<String>,
    #[serde(default)]
    #[serde(skip_serializing_if = "Option::is_none")]
    pub scope_version: Option<String>,
    #[serde(default)]
    #[serde(skip_serializing_if = "HashMap::is_empty")]
    pub scope_attributes: HashMap<String, JsonValue>,
    #[serde(default)]
    #[serde(skip_serializing_if = "is_zero")]
    pub scope_dropped_attributes_count: u32,
}

struct ParsedLogRecords {
    doc_batch: DocBatchV2,
    num_log_records: u64,
    num_parse_errors: u64,
    error_message: String,
}

#[derive(Clone)]
pub struct OtlpGrpcLogsService {
    ingest_router: IngestRouterServiceClient,
}

impl OtlpGrpcLogsService {
    pub fn new(ingest_router: IngestRouterServiceClient) -> Self {
        Self { ingest_router }
    }

    pub fn index_config(default_index_root_uri: &Uri) -> anyhow::Result<IndexConfig> {
        let index_config_str = OTEL_LOGS_INDEX_CONFIG.replace("${INDEX_ID}", OTEL_LOGS_INDEX_ID);
        let index_config = load_index_config_from_user_config(
            ConfigFormat::Yaml,
            index_config_str.as_bytes(),
            default_index_root_uri,
        )?;
        Ok(index_config)
    }

    async fn export_inner(
        &mut self,
        request: ExportLogsServiceRequest,
        index_id: IndexId,
        labels: [&str; 4],
    ) -> Result<ExportLogsServiceResponse, Status> {
        let ParsedLogRecords {
            doc_batch,
            num_log_records,
            num_parse_errors,
            error_message,
        } = run_cpu_intensive({
            let parent_span = RuntimeSpan::current();
            || Self::parse_logs(request, parent_span)
        })
        .await
        .map_err(|join_error| {
            error!(error=?join_error, "failed to parse log records");
            Status::internal("failed to parse log records")
        })??;
        if num_log_records == num_parse_errors {
            return Err(tonic::Status::internal(error_message));
        }
        let num_bytes = doc_batch.num_bytes() as u64;
        self.store_logs(index_id, doc_batch).await?;

        OTLP_SERVICE_METRICS
            .ingested_log_records_total
            .with_label_values(labels)
            .inc_by(num_log_records);
        OTLP_SERVICE_METRICS
            .ingested_bytes_total
            .with_label_values(labels)
            .inc_by(num_bytes);

        let response = ExportLogsServiceResponse {
            // `rejected_log_records=0` and `error_message=""` is consided a "full" success.
            partial_success: Some(ExportLogsPartialSuccess {
                rejected_log_records: num_parse_errors as i64,
                error_message,
            }),
        };
        Ok(response)
    }

    #[instrument(skip_all, parent = parent_span, fields(num_log_records = Empty, num_bytes = Empty, num_parse_errors = Empty))]
    #[allow(clippy::result_large_err)]
    fn parse_logs(
        request: ExportLogsServiceRequest,
        parent_span: RuntimeSpan,
    ) -> tonic::Result<ParsedLogRecords> {
        let log_records = parse_otlp_logs(request)?;
        let mut num_parse_errors = 0;
        let num_log_records = log_records.len() as u64;
        let mut error_message = String::new();

        let mut doc_batch_builder = JsonDocBatchV2Builder::with_num_docs(num_log_records as usize);
        let mut doc_uid_generator = DocUidGenerator::default();
        for log_record in log_records {
            let doc_uid = doc_uid_generator.next_doc_uid();
            if let Err(error) = doc_batch_builder.add_doc(doc_uid, log_record) {
                error!(error=?error, "failed to JSON serialize span");
                error_message = format!("failed to JSON serialize span: {error:?}");
                num_parse_errors += 1;
            }
        }
        let doc_batch = doc_batch_builder.build();
        let current_span = RuntimeSpan::current();
        current_span.record("num_log_records", num_log_records);
        current_span.record("num_bytes", doc_batch.num_bytes());
        current_span.record("num_parse_errors", num_parse_errors);

        let parsed_logs = ParsedLogRecords {
            doc_batch,
            num_log_records,
            num_parse_errors,
            error_message,
        };
        Ok(parsed_logs)
    }

    #[instrument(skip_all, fields(num_bytes = doc_batch.num_bytes()))]
    async fn store_logs(
        &mut self,
        index_id: String,
        doc_batch: DocBatchV2,
    ) -> Result<(), tonic::Status> {
        ingest_doc_batch_v2(
            self.ingest_router.clone(),
            index_id,
            doc_batch,
            CommitType::Auto,
        )
        .await?;
        Ok(())
    }

    async fn export_instrumented(
        &mut self,
        request: ExportLogsServiceRequest,
        index_id: IndexId,
    ) -> Result<ExportLogsServiceResponse, Status> {
        let start = std::time::Instant::now();

        let labels = ["logs", &index_id, "grpc", "protobuf"];

        OTLP_SERVICE_METRICS
            .requests_total
            .with_label_values(labels)
            .inc();
        let (export_res, is_error) =
            match self.export_inner(request, index_id.clone(), labels).await {
                ok @ Ok(_) => (ok, "false"),
                err @ Err(_) => {
                    OTLP_SERVICE_METRICS
                        .request_errors_total
                        .with_label_values(labels)
                        .inc();
                    (err, "true")
                }
            };
        let elapsed = start.elapsed().as_secs_f64();
        let labels = ["logs", &index_id, "grpc", "protobuf", is_error];
        OTLP_SERVICE_METRICS
            .request_duration_seconds
            .with_label_values(labels)
            .observe(elapsed);

        export_res
    }
}

#[async_trait]
impl LogsService for OtlpGrpcLogsService {
    #[instrument(name = "ingest_logs", skip_all)]
    async fn export(
        &self,
        request: Request<ExportLogsServiceRequest>,
    ) -> Result<Response<ExportLogsServiceResponse>, Status> {
        let index_id = extract_otel_index_id_from_metadata(request.metadata(), OtelSignal::Logs)?;
        let request = request.into_inner();
        self.clone()
            .export_instrumented(request, index_id)
            .await
            .map(Response::new)
    }
}

fn parse_otlp_logs(request: ExportLogsServiceRequest) -> Result<Vec<LogRecord>, OtlpLogsError> {
    let num_log_records = request
        .resource_logs
        .iter()
        .flat_map(|resource_log| resource_log.scope_logs.iter())
        .map(|scope_logs| scope_logs.log_records.len())
        .sum();
    let mut log_records = Vec::with_capacity(num_log_records);

    for resource_logs in request.resource_logs {
        let mut resource_attributes = extract_attributes(
            resource_logs
                .resource
                .clone()
                .map(|rsrc| rsrc.attributes)
                .unwrap_or_default(),
        );
        let resource_dropped_attributes_count = resource_logs
            .resource
            .map(|rsrc| rsrc.dropped_attributes_count)
            .unwrap_or(0);

        let service_name = match resource_attributes.remove("service.name") {
            Some(JsonValue::String(value)) => value.to_string(),
            _ => "unknown_service".to_string(),
        };
        for scope_logs in resource_logs.scope_logs {
            let scope_name = scope_logs
                .scope
                .as_ref()
                .map(|scope| &scope.name)
                .filter(|name| !name.is_empty());
            let scope_version = scope_logs
                .scope
                .as_ref()
                .map(|scope| &scope.version)
                .filter(|version| !version.is_empty());
            let scope_attributes = extract_attributes(
                scope_logs
                    .scope
                    .clone()
                    .map(|scope| scope.attributes)
                    .unwrap_or_default(),
            );
            let scope_dropped_attributes_count = scope_logs
                .scope
                .as_ref()
                .map(|scope| scope.dropped_attributes_count)
                .unwrap_or(0);

            for log_record in scope_logs.log_records {
                let observed_timestamp_nanos = if log_record.observed_time_unix_nano == 0 {
                    // As per OTEL model spec, this field SHOULD be set once the
                    // event is observed by OpenTelemetry. If it's not set, we
                    // consider ourselves as the first OTEL observers.
                    OffsetDateTime::now_utc().unix_timestamp_nanos() as u64
                } else {
                    log_record.observed_time_unix_nano
                };

                let timestamp_nanos = if log_record.time_unix_nano == 0 {
                    observed_timestamp_nanos
                } else {
                    // When only one timestamp is supported by a recipients, the
                    // OTEL spec recommends using the `Timestamp` field if
                    // present, otherwise `ObservedTimestamp`. Even though our
                    // model supports multiple timestamps, we have only one
                    // field that that can be our `timestamp_field` and it
                    // should be the one that is commonly used for queries.
                    log_record.time_unix_nano
                };

                let trace_id = if log_record.trace_id.iter().any(|&byte| byte != 0) {
                    let trace_id = TraceId::try_from(log_record.trace_id)?;
                    Some(trace_id)
                } else {
                    None
                };
                let span_id = if log_record.span_id.iter().any(|&byte| byte != 0) {
                    let span_id = SpanId::try_from(log_record.span_id)?;
                    Some(span_id)
                } else {
                    None
                };
                let trace_flags = Some(log_record.flags);

                let severity_text = if !log_record.severity_text.is_empty() {
                    Some(log_record.severity_text)
                } else {
                    None
                };
                let severity_number = log_record.severity_number;
                let body = log_record.body.and_then(parse_log_record_body);
                let attributes = extract_attributes(log_record.attributes);
                let dropped_attributes_count = log_record.dropped_attributes_count;

                let log_record = LogRecord {
                    timestamp_nanos,
                    observed_timestamp_nanos,
                    service_name: service_name.clone(),
                    severity_text,
                    severity_number,
                    body,
                    attributes,
                    trace_id,
                    span_id,
                    trace_flags,
                    dropped_attributes_count,
                    resource_attributes: resource_attributes.clone(),
                    resource_dropped_attributes_count,
                    scope_name: scope_name.cloned(),
                    scope_version: scope_version.cloned(),
                    scope_attributes: scope_attributes.clone(),
                    scope_dropped_attributes_count,
                };
                log_records.push(log_record);
            }
        }
    }
    Ok(log_records)
}

/// An iterator of JSON OTLP log records for use in the doc processor.
pub struct JsonLogIterator {
    logs: std::vec::IntoIter<LogRecord>,
    current_log_idx: usize,
    num_logs: usize,
    avg_log_size: usize,
    avg_log_size_rem: usize,
}

impl JsonLogIterator {
    fn new(logs: Vec<LogRecord>, num_bytes: usize) -> Self {
        let num_logs = logs.len();
        let avg_log_size = num_bytes.checked_div(num_logs).unwrap_or(0);
        let avg_log_size_rem = avg_log_size + num_bytes.checked_rem(num_logs).unwrap_or(0);

        Self {
            logs: logs.into_iter(),
            current_log_idx: 0,
            num_logs,
            avg_log_size,
            avg_log_size_rem,
        }
    }
}

impl Iterator for JsonLogIterator {
    type Item = (JsonValue, usize);

    fn next(&mut self) -> Option<Self::Item> {
        let log_opt = self
            .logs
            .next()
            .map(|log| serde_json::to_value(log).expect("`LogRecord` should be JSON serializable"));
        if log_opt.is_some() {
            self.current_log_idx += 1;
        }
        if self.current_log_idx < self.num_logs {
            log_opt.map(|span| (span, self.avg_log_size))
        } else {
            log_opt.map(|span| (span, self.avg_log_size_rem))
        }
    }
}

pub fn parse_otlp_logs_json(payload_json: &[u8]) -> Result<JsonLogIterator, OtlpLogsError> {
    let request: ExportLogsServiceRequest = serde_json::from_slice(payload_json)?;
    let log_records = parse_otlp_logs(request)?;
    Ok(JsonLogIterator::new(log_records, payload_json.len()))
}

pub fn parse_otlp_logs_protobuf(payload_proto: &[u8]) -> Result<JsonLogIterator, OtlpLogsError> {
    let request = ExportLogsServiceRequest::decode(payload_proto)?;
    let log_records = parse_otlp_logs(request)?;
    Ok(JsonLogIterator::new(log_records, payload_proto.len()))
}

#[cfg(test)]
mod tests {
    use quickwit_metastore::{CreateIndexRequestExt, metastore_for_test};
    use quickwit_proto::metastore::{CreateIndexRequest, MetastoreService};

    use super::*;

    #[test]
    fn test_index_config_is_valid() {
        let index_config =
            OtlpGrpcLogsService::index_config(&Uri::for_test("ram:///indexes")).unwrap();
        assert_eq!(index_config.index_id, OTEL_LOGS_INDEX_ID);
    }

    #[tokio::test]
    async fn test_create_index() {
        let metastore = metastore_for_test();
        let index_config =
            OtlpGrpcLogsService::index_config(&Uri::for_test("ram:///indexes")).unwrap();
        let create_index_request =
            CreateIndexRequest::try_from_index_config(&index_config).unwrap();
        metastore.create_index(create_index_request).await.unwrap();
    }
}


================================================
FILE: quickwit/quickwit-opentelemetry/src/otlp/metrics.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use once_cell::sync::Lazy;
use quickwit_common::metrics::{
    HistogramVec, IntCounterVec, exponential_buckets, new_counter_vec, new_histogram_vec,
};

pub struct OtlpServiceMetrics {
    pub requests_total: IntCounterVec<4>,
    pub request_errors_total: IntCounterVec<4>,
    pub request_duration_seconds: HistogramVec<5>,
    pub ingested_log_records_total: IntCounterVec<4>,
    pub ingested_spans_total: IntCounterVec<4>,
    pub ingested_bytes_total: IntCounterVec<4>,
}

impl Default for OtlpServiceMetrics {
    fn default() -> Self {
        Self {
            requests_total: new_counter_vec(
                "requests_total",
                "Number of requests",
                "otlp",
                &[],
                ["service", "index", "transport", "format"],
            ),
            request_errors_total: new_counter_vec(
                "request_errors_total",
                "Number of failed requests",
                "otlp",
                &[],
                ["service", "index", "transport", "format"],
            ),
            request_duration_seconds: new_histogram_vec(
                "request_duration_seconds",
                "Duration of requests",
                "otlp",
                &[],
                ["service", "index", "transport", "format", "error"],
                exponential_buckets(0.02, 2.0, 8).unwrap(),
            ),
            ingested_log_records_total: new_counter_vec(
                "ingested_log_records_total",
                "Number of log records ingested",
                "otlp",
                &[],
                ["service", "index", "transport", "format"],
            ),
            ingested_spans_total: new_counter_vec(
                "ingested_spans_total",
                "Number of spans ingested",
                "otlp",
                &[],
                ["service", "index", "transport", "format"],
            ),
            ingested_bytes_total: new_counter_vec(
                "ingested_bytes_total",
                "Number of bytes ingested",
                "otlp",
                &[],
                ["service", "index", "transport", "format"],
            ),
        }
    }
}

/// `OTLP_SERVICE_METRICS` exposes metrics for each OTLP service.
pub static OTLP_SERVICE_METRICS: Lazy<OtlpServiceMetrics> = Lazy::new(OtlpServiceMetrics::default);


================================================
FILE: quickwit/quickwit-opentelemetry/src/otlp/mod.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::HashMap;

use quickwit_common::rate_limited_warn;
use quickwit_config::{INGEST_V2_SOURCE_ID, validate_identifier, validate_index_id_pattern};
use quickwit_ingest::{CommitType, IngestServiceError};
use quickwit_proto::ingest::DocBatchV2;
use quickwit_proto::ingest::router::{
    IngestRequestV2, IngestRouterService, IngestRouterServiceClient, IngestSubrequest,
};
use quickwit_proto::opentelemetry::proto::common::v1::any_value::Value as OtlpValue;
use quickwit_proto::opentelemetry::proto::common::v1::{
    AnyValue as OtlpAnyValue, ArrayValue as OtlpArrayValue, KeyValue as OtlpKeyValue,
};
use serde_json::{Number as JsonNumber, Value as JsonValue};

mod logs;
mod metrics;
#[cfg(any(test, feature = "testsuite"))]
mod test_utils;
mod traces;

pub use logs::{
    JsonLogIterator, OTEL_LOGS_INDEX_ID, OtlpGrpcLogsService, OtlpLogsError, parse_otlp_logs_json,
    parse_otlp_logs_protobuf,
};
pub use quickwit_proto::search::{SpanId, TraceId, TryFromSpanIdError, TryFromTraceIdError};
#[cfg(any(test, feature = "testsuite"))]
pub use test_utils::make_resource_spans_for_test;
use tonic::Status;
pub use traces::{
    Event, JsonSpanIterator, Link, OTEL_TRACES_INDEX_ID, OTEL_TRACES_INDEX_ID_PATTERN,
    OtlpGrpcTracesService, OtlpTracesError, Span, SpanFingerprint, SpanKind, SpanStatus,
    parse_otlp_spans_json, parse_otlp_spans_protobuf,
};

#[derive(Debug, Clone, Copy)]
pub enum OtelSignal {
    Logs,
    Traces,
}

impl OtelSignal {
    pub fn header_name(&self) -> &'static str {
        match self {
            OtelSignal::Logs => "qw-otel-logs-index",
            OtelSignal::Traces => "qw-otel-traces-index",
        }
    }

    pub fn default_index_id(&self) -> &'static str {
        match self {
            OtelSignal::Logs => OTEL_LOGS_INDEX_ID,
            OtelSignal::Traces => OTEL_TRACES_INDEX_ID,
        }
    }
}

impl From<OtlpLogsError> for tonic::Status {
    fn from(error: OtlpLogsError) -> Self {
        tonic::Status::invalid_argument(error.to_string())
    }
}

impl From<OtlpTracesError> for tonic::Status {
    fn from(error: OtlpTracesError) -> Self {
        tonic::Status::invalid_argument(error.to_string())
    }
}

// An `Attribute` is a key-value pair, which MUST have the following properties:
// - The attribute key MUST be a non-null and non-empty string.
// - The attribute value is either:
//  - A primitive type: string, boolean, double precision floating point (IEEE 754-1985) or signed
//    64 bit integer.
//  - An array of primitive type values. The array MUST be homogeneous, i.e., it MUST NOT contain
//    values of different types.
//
// <https://github.com/open-telemetry/opentelemetry-specification/tree/main/specification/common#attribute>
pub(crate) fn extract_attributes(attributes: Vec<OtlpKeyValue>) -> HashMap<String, JsonValue> {
    let mut attrs = HashMap::with_capacity(attributes.len());

    for attribute in attributes {
        if attribute.key.is_empty() {
            continue;
        }
        if let Some(value) = attribute
            .value
            .and_then(|any_value| any_value.value)
            .and_then(oltp_value_to_json_value)
        {
            attrs.insert(attribute.key, value);
        }
    }
    attrs
}

fn oltp_value_to_json_value(value: OtlpValue) -> Option<JsonValue> {
    match value {
        OtlpValue::ArrayValue(OtlpArrayValue { values }) => Some(
            values
                .into_iter()
                .filter_map(|value| match value.value {
                    Some(value) => oltp_value_to_json_value(value),
                    None => None,
                })
                .collect(),
        ),
        OtlpValue::BoolValue(bool_value) => Some(JsonValue::Bool(bool_value)),
        OtlpValue::DoubleValue(double_value) => {
            JsonNumber::from_f64(double_value).map(JsonValue::Number)
        }
        OtlpValue::IntValue(int_value) => Some(JsonValue::Number(JsonNumber::from(int_value))),
        OtlpValue::KvlistValue(key_values) => {
            let mut map = serde_json::Map::with_capacity(key_values.values.len());

            for key_value in key_values.values {
                if let Some(value) = key_value
                    .value
                    .and_then(|any_value| any_value.value)
                    .and_then(oltp_value_to_json_value)
                {
                    map.insert(key_value.key, value);
                }
            }
            Some(JsonValue::Object(map))
        }
        OtlpValue::StringValue(string_value) => Some(JsonValue::String(string_value)),
        OtlpValue::BytesValue(_) => {
            rate_limited_warn!(limit_per_min = 10, "ignoring unsupported OTLP bytes value");
            None
        }
    }
}

pub(crate) fn parse_log_record_body(body: OtlpAnyValue) -> Option<JsonValue> {
    body.value.and_then(oltp_value_to_json_value).map(|value| {
        if value.is_string() {
            let mut map = serde_json::Map::with_capacity(1);
            map.insert("message".to_string(), value);
            JsonValue::Object(map)
        } else {
            value
        }
    })
}

fn is_zero(count: &u32) -> bool {
    *count == 0
}

#[allow(clippy::result_large_err)]
pub fn extract_otel_traces_index_id_patterns_from_metadata(
    metadata: &tonic::metadata::MetadataMap,
) -> Result<Vec<String>, Status> {
    let comma_separated_index_id_patterns = metadata
        .get(OtelSignal::Traces.header_name())
        .map(|index| index.to_str())
        .transpose()
        .map_err(|error| {
            Status::internal(format!(
                "failed to extract index ID from request header: {error}",
            ))
        })?
        .unwrap_or(OTEL_TRACES_INDEX_ID_PATTERN);
    let mut index_id_patterns = Vec::new();
    for index_id_pattern in comma_separated_index_id_patterns.split(',') {
        if index_id_pattern.is_empty() {
            continue;
        }
        validate_index_id_pattern(index_id_pattern, true).map_err(|error| {
            Status::internal(format!(
                "invalid index ID pattern in request header: {error}",
            ))
        })?;
        index_id_patterns.push(index_id_pattern.to_string());
    }
    Ok(index_id_patterns)
}

#[allow(clippy::result_large_err)]
pub(crate) fn extract_otel_index_id_from_metadata(
    metadata: &tonic::metadata::MetadataMap,
    otel_signal: OtelSignal,
) -> Result<String, Status> {
    let index_id = metadata
        .get(otel_signal.header_name())
        .map(|index: &tonic::metadata::MetadataValue<tonic::metadata::Ascii>| index.to_str())
        .transpose()
        .map_err(|error| {
            Status::internal(format!(
                "failed to extract index ID from request metadata: {error}",
            ))
        })?
        .unwrap_or_else(|| otel_signal.default_index_id());
    validate_identifier("index_id", index_id).map_err(|error| {
        Status::internal(format!(
            "invalid index ID pattern in request metadata: {error}",
        ))
    })?;
    Ok(index_id.to_string())
}

async fn ingest_doc_batch_v2(
    ingest_router: IngestRouterServiceClient,
    index_id: String,
    doc_batch: DocBatchV2,
    commit_type: CommitType,
) -> Result<(), IngestServiceError> {
    let subrequest = IngestSubrequest {
        subrequest_id: 0,
        index_id,
        source_id: INGEST_V2_SOURCE_ID.to_string(),
        doc_batch: Some(doc_batch),
    };
    let request = IngestRequestV2 {
        commit_type: commit_type.into(),
        subrequests: vec![subrequest],
    };
    let mut response = ingest_router.ingest(request).await?;
    let num_responses = response.successes.len() + response.failures.len();
    if num_responses != 1 {
        return Err(IngestServiceError::Internal(format!(
            "expected a single failure or success, got {num_responses}"
        )));
    }
    if response.successes.pop().is_some() {
        return Ok(());
    }
    let ingest_failure = response.failures.pop().unwrap();
    Err(ingest_failure.into())
}

#[cfg(test)]
mod tests {
    use quickwit_proto::opentelemetry::proto::common::v1::any_value::{
        Value as OtlpValue, Value as OtlpAnyValueValue,
    };
    use quickwit_proto::opentelemetry::proto::common::v1::{
        ArrayValue as OtlpArrayValue, KeyValueList as OtlpKeyValueList,
    };
    use serde_json::{Value as JsonValue, json};

    use super::*;
    use crate::otlp::{extract_attributes, oltp_value_to_json_value, parse_log_record_body};

    #[test]
    fn test_oltp_value_to_json_value() {
        assert_eq!(
            oltp_value_to_json_value(OtlpValue::ArrayValue(OtlpArrayValue { values: Vec::new() })),
            Some(json!([]))
        );
        assert_eq!(
            oltp_value_to_json_value(OtlpValue::ArrayValue(OtlpArrayValue {
                values: vec![
                    OtlpAnyValue {
                        value: Some(OtlpAnyValueValue::IntValue(1337))
                    },
                    OtlpAnyValue {
                        value: Some(OtlpAnyValueValue::StringValue("1337".to_string()))
                    }
                ]
            })),
            Some(json!([1337, "1337"]))
        );
        assert_eq!(
            oltp_value_to_json_value(OtlpValue::BoolValue(true)),
            Some(json!(true))
        );
        assert_eq!(
            oltp_value_to_json_value(OtlpValue::DoubleValue(12.0)),
            Some(json!(12.0))
        );
        assert_eq!(
            oltp_value_to_json_value(OtlpValue::IntValue(42)),
            Some(json!(42))
        );
        assert_eq!(
            oltp_value_to_json_value(OtlpValue::KvlistValue(OtlpKeyValueList {
                values: Vec::new()
            })),
            Some(json!({}))
        );
        assert_eq!(
            oltp_value_to_json_value(OtlpValue::KvlistValue(OtlpKeyValueList {
                values: vec![
                    OtlpKeyValue {
                        key: "foo".to_string(),
                        value: Some(OtlpAnyValue {
                            value: Some(OtlpAnyValueValue::IntValue(1337))
                        })
                    },
                    OtlpKeyValue {
                        key: "bar".to_string(),
                        value: Some(OtlpAnyValue {
                            value: Some(OtlpAnyValueValue::StringValue("1337".to_string()))
                        })
                    }
                ]
            })),
            Some(json!({
                "foo": 1337,
                "bar": "1337"
            }))
        );
        assert_eq!(
            oltp_value_to_json_value(OtlpValue::StringValue("foo".to_string())),
            Some(json!("foo"))
        );
    }

    #[test]
    fn test_extract_attributes() {
        assert!(extract_attributes(Vec::new()).is_empty());

        let attributes = vec![
            OtlpKeyValue {
                key: "".to_string(),
                value: None,
            },
            OtlpKeyValue {
                key: "".to_string(),
                value: Some(OtlpAnyValue {
                    value: Some(OtlpAnyValueValue::BoolValue(true)),
                }),
            },
            OtlpKeyValue {
                key: "empty_value".to_string(),
                value: None,
            },
            OtlpKeyValue {
                key: "empty_value_value".to_string(),
                value: Some(OtlpAnyValue { value: None }),
            },
        ];
        assert!(extract_attributes(attributes).is_empty());

        let attributes = vec![
            OtlpKeyValue {
                key: "array_key".to_string(),
                value: Some(OtlpAnyValue {
                    value: Some(OtlpAnyValueValue::ArrayValue(OtlpArrayValue {
                        values: vec![OtlpAnyValue {
                            value: Some(OtlpAnyValueValue::IntValue(1337)),
                        }],
                    })),
                }),
            },
            OtlpKeyValue {
                key: "bool_key".to_string(),
                value: Some(OtlpAnyValue {
                    value: Some(OtlpAnyValueValue::BoolValue(true)),
                }),
            },
            OtlpKeyValue {
                key: "double_key".to_string(),
                value: Some(OtlpAnyValue {
                    value: Some(OtlpAnyValueValue::DoubleValue(12.0)),
                }),
            },
            OtlpKeyValue {
                key: "int_key".to_string(),
                value: Some(OtlpAnyValue {
                    value: Some(OtlpAnyValueValue::IntValue(42)),
                }),
            },
            OtlpKeyValue {
                key: "string_key".to_string(),
                value: Some(OtlpAnyValue {
                    value: Some(OtlpAnyValueValue::StringValue("foo".to_string())),
                }),
            },
        ];
        let expected_attributes = HashMap::from_iter([
            ("array_key".to_string(), json!([1337])),
            ("bool_key".to_string(), json!(true)),
            ("double_key".to_string(), json!(12.0)),
            ("int_key".to_string(), json!(42)),
            ("string_key".to_string(), json!("foo")),
        ]);
        assert_eq!(extract_attributes(attributes), expected_attributes);
    }

    #[test]
    fn test_parse_log_record_body() {
        let value = parse_log_record_body(OtlpAnyValue {
            value: Some(OtlpAnyValueValue::StringValue("body".to_string())),
        })
        .unwrap();
        let JsonValue::Object(map) = value else {
            panic!("Expected object, got {value:?}");
        };
        assert_eq!(map.len(), 1);
        assert_eq!(map["message"], json!("body"));
    }

    #[test]
    fn test_extract_otel_index_id_patterns_from_metadata() {
        let mut metadata = tonic::metadata::MetadataMap::new();
        metadata.insert("qw-otel-traces-index", "foo,bar".parse().unwrap());
        let index_id_patterns =
            extract_otel_traces_index_id_patterns_from_metadata(&metadata).unwrap();
        assert_eq!(
            index_id_patterns,
            vec!["foo".to_string(), "bar".to_string()]
        );

        let mut metadata = tonic::metadata::MetadataMap::new();
        metadata.insert("bad-header", "foo,bar".parse().unwrap());
        let index_id_patterns =
            extract_otel_traces_index_id_patterns_from_metadata(&metadata).unwrap();
        assert_eq!(index_id_patterns, vec![OTEL_TRACES_INDEX_ID_PATTERN]);

        let mut metadata = tonic::metadata::MetadataMap::new();
        metadata.insert("qw-otel-traces-index", "foo,bar".parse().unwrap());
        let index_id_patterns =
            extract_otel_traces_index_id_patterns_from_metadata(&metadata).unwrap();
        assert_eq!(
            index_id_patterns,
            vec!["foo".to_string(), "bar".to_string()]
        );

        let mut metadata = tonic::metadata::MetadataMap::new();
        metadata.insert("qw-otel-traces-index", "foo,bar,".parse().unwrap());
        let index_id_patterns =
            extract_otel_traces_index_id_patterns_from_metadata(&metadata).unwrap();
        assert_eq!(
            index_id_patterns,
            vec!["foo".to_string(), "bar".to_string()]
        );

        let mut metadata = tonic::metadata::MetadataMap::new();
        metadata.insert("qw-otel-traces-index", "foo,bar,,".parse().unwrap());
        let index_id_patterns =
            extract_otel_traces_index_id_patterns_from_metadata(&metadata).unwrap();
        assert_eq!(
            index_id_patterns,
            vec!["foo".to_string(), "bar".to_string()]
        );

        // invalid index ID pattern
        let mut metadata = tonic::metadata::MetadataMap::new();
        metadata.insert("qw-otel-traces-index", "foo,bar, ,".parse().unwrap());
        let extract_res = extract_otel_traces_index_id_patterns_from_metadata(&metadata);
        assert!(extract_res.is_err());
    }

    #[test]
    fn test_extract_otel_index_id_from_metadata() {
        let mut metadata = tonic::metadata::MetadataMap::new();
        metadata.insert("qw-otel-logs-index", "foo".parse().unwrap());
        let index_id = extract_otel_index_id_from_metadata(&metadata, OtelSignal::Logs).unwrap();
        assert_eq!(index_id, "foo");

        // default index ID
        let mut metadata = tonic::metadata::MetadataMap::new();
        metadata.insert("wrong-header", "foo".parse().unwrap());
        let index_id = extract_otel_index_id_from_metadata(&metadata, OtelSignal::Logs).unwrap();
        assert_eq!(index_id, OTEL_LOGS_INDEX_ID);

        let mut metadata = tonic::metadata::MetadataMap::new();
        metadata.insert("qw-otel-traces-index", "foo".parse().unwrap());
        let index_id = extract_otel_index_id_from_metadata(&metadata, OtelSignal::Traces).unwrap();
        assert_eq!(index_id, "foo");

        // default index ID
        let mut metadata = tonic::metadata::MetadataMap::new();
        metadata.insert("wrong-header", "foo".parse().unwrap());
        let index_id = extract_otel_index_id_from_metadata(&metadata, OtelSignal::Traces).unwrap();
        assert_eq!(index_id, OTEL_TRACES_INDEX_ID);

        // invalid index ID
        let mut metadata = tonic::metadata::MetadataMap::new();
        metadata.insert("qw-otel-traces-index", "foo bar".parse().unwrap());
        let extract_res = extract_otel_index_id_from_metadata(&metadata, OtelSignal::Traces);
        assert!(extract_res.is_err());
    }
}


================================================
FILE: quickwit/quickwit-opentelemetry/src/otlp/test_utils.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::time::Duration;

use quickwit_proto::opentelemetry::proto::common::v1::any_value::Value as OtlpAnyValueValue;
use quickwit_proto::opentelemetry::proto::common::v1::{
    AnyValue as OtlpAnyValue, ArrayValue, InstrumentationScope, KeyValue as OtlpKeyValue,
};
use quickwit_proto::opentelemetry::proto::resource::v1::Resource;
use quickwit_proto::opentelemetry::proto::trace::v1::span::{Event as OtlpEvent, Link as OtlpLink};
use quickwit_proto::opentelemetry::proto::trace::v1::{
    ResourceSpans, ScopeSpans, Span as OtlpSpan, Status as OtlpStatus,
};
use time::OffsetDateTime;

fn now_minus_x_secs(now: &OffsetDateTime, secs: u64) -> u64 {
    (*now - Duration::from_secs(secs)).unix_timestamp_nanos() as u64
}

pub fn make_resource_spans_for_test() -> Vec<ResourceSpans> {
    let now: OffsetDateTime = OffsetDateTime::now_utc();

    let attributes = vec![OtlpKeyValue {
        key: "span_key".to_string(),
        value: Some(OtlpAnyValue {
            value: Some(OtlpAnyValueValue::StringValue("span_value".to_string())),
        }),
    }];
    let events = vec![OtlpEvent {
        name: "event_name".to_string(),
        time_unix_nano: 1_000_500_003,
        attributes: vec![OtlpKeyValue {
            key: "event_key".to_string(),
            value: Some(OtlpAnyValue {
                value: Some(OtlpAnyValueValue::StringValue("event_value".to_string())),
            }),
        }],
        dropped_attributes_count: 6,
    }];
    let links = vec![OtlpLink {
        trace_id: vec![4; 16],
        span_id: vec![5; 8],
        trace_state: "link_key1=link_value1,link_key2=link_value2".to_string(),
        attributes: vec![OtlpKeyValue {
            key: "link_key".to_string(),
            value: Some(OtlpAnyValue {
                value: Some(OtlpAnyValueValue::StringValue("link_value".to_string())),
            }),
        }],
        dropped_attributes_count: 7,
    }];
    let spans = vec![
        OtlpSpan {
            trace_id: vec![1; 16],
            span_id: vec![1; 8],
            parent_span_id: Vec::new(),
            trace_state: "key1=value1,key2=value2".to_string(),
            name: "stage_splits".to_string(),
            kind: 1, // Internal
            start_time_unix_nano: now_minus_x_secs(&now, 6),
            end_time_unix_nano: now_minus_x_secs(&now, 5),
            attributes: Vec::new(),
            dropped_attributes_count: 0,
            events: Vec::new(),
            dropped_events_count: 0,
            links: Vec::new(),
            dropped_links_count: 0,
            status: None,
        },
        OtlpSpan {
            trace_id: vec![2; 16],
            span_id: vec![2; 8],
            parent_span_id: Vec::new(),
            trace_state: "key1=value1,key2=value2".to_string(),
            name: "publish_splits".to_string(),
            kind: 2, // Server
            start_time_unix_nano: now_minus_x_secs(&now, 4),
            end_time_unix_nano: now_minus_x_secs(&now, 3),
            attributes: Vec::new(),
            dropped_attributes_count: 0,
            events: Vec::new(),
            dropped_events_count: 0,
            links: Vec::new(),
            dropped_links_count: 0,
            status: None,
        },
        OtlpSpan {
            trace_id: vec![3; 16],
            span_id: vec![3; 8],
            parent_span_id: Vec::new(),
            trace_state: "key1=value1,key2=value2".to_string(),
            name: "list_splits".to_string(),
            kind: 3, // Client
            start_time_unix_nano: now_minus_x_secs(&now, 2),
            end_time_unix_nano: now_minus_x_secs(&now, 1),
            attributes,
            dropped_attributes_count: 0,
            events: Vec::new(),
            dropped_events_count: 0,
            links: Vec::new(),
            dropped_links_count: 0,
            status: Some(OtlpStatus {
                code: 1,
                message: "".to_string(),
            }),
        },
        OtlpSpan {
            trace_id: vec![4; 16],
            span_id: vec![4; 8],
            parent_span_id: Vec::new(),
            trace_state: "key1=value1,key2=value2".to_string(),
            name: "list_splits".to_string(),
            kind: 3, // Client
            start_time_unix_nano: now_minus_x_secs(&now, 2),
            end_time_unix_nano: now_minus_x_secs(&now, 1),
            attributes: Vec::new(),
            dropped_attributes_count: 0,
            events: Vec::new(),
            dropped_events_count: 0,
            links: Vec::new(),
            dropped_links_count: 0,
            status: Some(OtlpStatus {
                code: 2,
                message: "An error occurred.".to_string(),
            }),
        },
        OtlpSpan {
            trace_id: vec![5; 16],
            span_id: vec![5; 8],
            parent_span_id: Vec::new(),
            trace_state: "key1=value1,key2=value2".to_string(),
            name: "delete_splits".to_string(),
            kind: 3, // Client
            start_time_unix_nano: now_minus_x_secs(&now, 2),
            end_time_unix_nano: now_minus_x_secs(&now, 1),
            attributes: Vec::new(),
            dropped_attributes_count: 0,
            events,
            dropped_events_count: 0,
            links,
            dropped_links_count: 0,
            status: Some(OtlpStatus {
                code: 2,
                message: "Storage error.".to_string(),
            }),
        },
    ];
    let scope_spans = vec![ScopeSpans {
        scope: Some(InstrumentationScope {
            name: "opentelemetry-otlp".to_string(),
            version: "0.11.0".to_string(),
            attributes: Vec::new(),
            dropped_attributes_count: 0,
        }),
        spans,
        schema_url: "".to_string(),
    }];
    let resource_attributes = vec![
        OtlpKeyValue {
            key: "service.name".to_string(),
            value: Some(OtlpAnyValue {
                value: Some(OtlpAnyValueValue::StringValue("quickwit".to_string())),
            }),
        },
        OtlpKeyValue {
            key: "tags".to_string(),
            value: Some(OtlpAnyValue {
                value: Some(OtlpAnyValueValue::ArrayValue(ArrayValue {
                    values: vec![OtlpAnyValue {
                        value: Some(OtlpAnyValueValue::StringValue("foo".to_string())),
                    }],
                })),
            }),
        },
    ];
    let resource_spans = ResourceSpans {
        resource: Some(Resource {
            attributes: resource_attributes,
            dropped_attributes_count: 0,
        }),
        scope_spans,
        schema_url: "".to_string(),
    };
    vec![resource_spans]
}


================================================
FILE: quickwit/quickwit-opentelemetry/src/otlp/traces.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::cmp::PartialEq;
use std::collections::HashMap;
use std::str::FromStr;

use async_trait::async_trait;
use prost::Message;
use quickwit_common::thread_pool::run_cpu_intensive;
use quickwit_common::uri::Uri;
use quickwit_config::{ConfigFormat, IndexConfig, load_index_config_from_user_config};
use quickwit_ingest::{CommitType, JsonDocBatchV2Builder};
use quickwit_proto::ingest::DocBatchV2;
use quickwit_proto::ingest::router::IngestRouterServiceClient;
use quickwit_proto::opentelemetry::proto::collector::trace::v1::trace_service_server::TraceService;
use quickwit_proto::opentelemetry::proto::collector::trace::v1::{
    ExportTracePartialSuccess, ExportTraceServiceRequest, ExportTraceServiceResponse,
};
use quickwit_proto::opentelemetry::proto::common::v1::InstrumentationScope;
use quickwit_proto::opentelemetry::proto::resource::v1::Resource as OtlpResource;
use quickwit_proto::opentelemetry::proto::trace::v1::span::Link as OtlpLink;
use quickwit_proto::opentelemetry::proto::trace::v1::status::StatusCode as OtlpStatusCode;
use quickwit_proto::opentelemetry::proto::trace::v1::{Span as OtlpSpan, Status as OtlpStatus};
use quickwit_proto::types::{DocUidGenerator, IndexId};
use serde::{Deserialize, Serialize};
use serde_json::Value as JsonValue;
use tonic::{Request, Response, Status};
use tracing::field::Empty;
use tracing::{Span as RuntimeSpan, error, instrument, warn};

use super::{
    OtelSignal, TryFromSpanIdError, TryFromTraceIdError, extract_otel_index_id_from_metadata,
    ingest_doc_batch_v2, is_zero,
};
use crate::otlp::metrics::OTLP_SERVICE_METRICS;
use crate::otlp::{SpanId, TraceId, extract_attributes};

pub const OTEL_TRACES_INDEX_ID: &str = "otel-traces-v0_9";
pub const OTEL_TRACES_INDEX_ID_PATTERN: &str = "otel-traces-v0_*";

const OTEL_TRACES_INDEX_CONFIG: &str = r#"
version: 0.8

index_id: ${INDEX_ID}

doc_mapping:
  mode: strict
  field_mappings:
    - name: trace_id
      type: bytes
      input_format: hex
      output_format: hex
      fast: true
    - name: trace_state
      type: text
      indexed: false
    - name: service_name
      type: text
      tokenizer: raw
      fast: true
    - name: resource_attributes
      type: json
      tokenizer: raw
    - name: resource_dropped_attributes_count
      type: u64
      indexed: false
    - name: scope_name
      type: text
      indexed: false
    - name: scope_version
      type: text
      indexed: false
    - name: scope_attributes
      type: json
      indexed: false
    - name: scope_dropped_attributes_count
      type: u64
      indexed: false
    - name: span_id
      type: bytes
      input_format: hex
      output_format: hex
    - name: span_kind
      type: u64
    - name: span_name
      type: text
      tokenizer: raw
      fast: true
    - name: span_fingerprint
      type: text
      tokenizer: raw
    - name: span_start_timestamp_nanos
      type: datetime
      input_formats: [unix_timestamp]
      output_format: unix_timestamp_nanos
      indexed: false
      fast: true
      fast_precision: milliseconds
    - name: span_end_timestamp_nanos
      type: datetime
      input_formats: [unix_timestamp]
      output_format: unix_timestamp_nanos
      indexed: false
      fast: false
    - name: span_duration_millis
      type: u64
      indexed: false
      fast: true
    - name: span_attributes
      type: json
      tokenizer: raw
      fast: true
    - name: span_dropped_attributes_count
      type: u64
      indexed: false
    - name: span_dropped_events_count
      type: u64
      indexed: false
    - name: span_dropped_links_count
      type: u64
      indexed: false
    - name: span_status
      type: json
      indexed: true
    - name: parent_span_id
      type: bytes
      input_format: hex
      output_format: hex
      indexed: false
    - name: is_root
      type: bool
      indexed: true
      stored: false
    - name: events
      type: array<json>
      tokenizer: raw
      fast: true
    - name: event_names
      type: array<text>
      tokenizer: default
      record: position
      stored: false
    - name: links
      type: array<json>
      tokenizer: raw

  timestamp_field: span_start_timestamp_nanos

  # partition_key: hash_mod(service_name, 100)
  # tag_fields: [service_name]

indexing_settings:
  commit_timeout_secs: 5

search_settings:
  default_search_fields: [service_name, span_name, event_names]
"#;

#[derive(Debug, thiserror::Error)]
pub enum OtlpTracesError {
    #[error("failed to deserialize JSON spans: `{0}`")]
    Json(#[from] serde_json::Error),
    #[error("failed to deserialize Protobuf spans: `{0}`")]
    Protobuf(#[from] prost::DecodeError),
    #[error("failed to parse span: `{0}`")]
    SpanId(#[from] TryFromSpanIdError),
    #[error("failed to parse span: `{0}`")]
    TraceId(#[from] TryFromTraceIdError),
}

#[derive(Debug, Clone, Eq, PartialEq, Serialize, Deserialize)]
pub struct Span {
    pub trace_id: TraceId,
    #[serde(skip_serializing_if = "Option::is_none")]
    pub trace_state: Option<String>,
    pub service_name: String,
    #[serde(default)]
    #[serde(skip_serializing_if = "HashMap::is_empty")]
    pub resource_attributes: HashMap<String, JsonValue>,
    #[serde(default)]
    #[serde(skip_serializing_if = "is_zero")]
    pub resource_dropped_attributes_count: u32,
    #[serde(skip_serializing_if = "Option::is_none")]
    pub scope_name: Option<String>,
    #[serde(skip_serializing_if = "Option::is_none")]
    pub scope_version: Option<String>,
    #[serde(default)]
    #[serde(skip_serializing_if = "HashMap::is_empty")]
    pub scope_attributes: HashMap<String, JsonValue>,
    #[serde(default)]
    #[serde(skip_serializing_if = "is_zero")]
    pub scope_dropped_attributes_count: u32,
    pub span_id: SpanId,
    #[serde(default)]
    #[serde(skip_serializing_if = "is_zero")]
    pub span_kind: u32,
    pub span_name: String,
    #[serde(skip_serializing_if = "Option::is_none")]
    pub span_fingerprint: Option<SpanFingerprint>,
    pub span_start_timestamp_nanos: u64,
    pub span_end_timestamp_nanos: u64,
    #[serde(skip_serializing_if = "Option::is_none")]
    pub span_duration_millis: Option<u64>,
    #[serde(default)]
    #[serde(skip_serializing_if = "HashMap::is_empty")]
    pub span_attributes: HashMap<String, JsonValue>,
    #[serde(default)]
    #[serde(skip_serializing_if = "is_zero")]
    pub span_dropped_attributes_count: u32,
    #[serde(default)]
    #[serde(skip_serializing_if = "is_zero")]
    pub span_dropped_events_count: u32,
    #[serde(default)]
    #[serde(skip_serializing_if = "is_zero")]
    pub span_dropped_links_count: u32,
    #[serde(default)]
    #[serde(skip_serializing_if = "SpanStatus::is_unset")]
    pub span_status: SpanStatus,
    #[serde(skip_serializing_if = "Option::is_none")]
    pub parent_span_id: Option<SpanId>,
    #[serde(skip_serializing_if = "Option::is_none")]
    pub is_root: Option<bool>,
    #[serde(default)]
    #[serde(skip_serializing_if = "Vec::is_empty")]
    pub events: Vec<Event>,
    #[serde(default)]
    #[serde(skip_serializing_if = "Vec::is_empty")]
    pub event_names: Vec<String>,
    #[serde(default)]
    #[serde(skip_serializing_if = "Vec::is_empty")]
    pub links: Vec<Link>,
}

impl Span {
    fn from_otlp(
        span: OtlpSpan,
        resource: &Resource,
        scope: &Scope,
    ) -> Result<Self, OtlpTracesError> {
        let trace_id = TraceId::try_from(span.trace_id)?;
        let span_id = SpanId::try_from(span.span_id)?;
        let parent_span_id = if !span.parent_span_id.is_empty() {
            Some(SpanId::try_from(span.parent_span_id)?)
        } else {
            None
        };
        let span_name = if !span.name.is_empty() {
            span.name
        } else {
            "unknown".to_string()
        };
        let span_fingerprint =
            SpanFingerprint::new(&resource.service_name, span.kind.into(), &span_name);
        let span_duration_nanos = span.end_time_unix_nano - span.start_time_unix_nano;
        let span_duration_millis = Some(span_duration_nanos / 1_000_000);
        let span_attributes = extract_attributes(span.attributes);

        let events: Vec<Event> = span
            .events
            .into_iter()
            .map(|event| Event {
                event_timestamp_nanos: event.time_unix_nano,
                event_name: event.name,
                event_attributes: extract_attributes(event.attributes),
                event_dropped_attributes_count: event.dropped_attributes_count,
            })
            .collect();
        let event_names: Vec<String> = events
            .iter()
            .map(|event| event.event_name.clone())
            .collect();
        let links: Vec<Link> = span
            .links
            .into_iter()
            .map(Link::try_from_otlp)
            .collect::<Result<_, _>>()?;
        let trace_state = if span.trace_state.is_empty() {
            None
        } else {
            Some(span.trace_state)
        };
        let span = Span {
            trace_id,
            trace_state,
            service_name: resource.service_name.clone(),
            resource_attributes: resource.attributes.clone(),
            resource_dropped_attributes_count: resource.dropped_attributes_count,
            scope_name: scope.name.clone(),
            scope_version: scope.version.clone(),
            scope_attributes: scope.attributes.clone(),
            scope_dropped_attributes_count: scope.dropped_attributes_count,
            span_id,
            span_kind: span.kind as u32,
            span_name,
            span_fingerprint: Some(span_fingerprint),
            span_start_timestamp_nanos: span.start_time_unix_nano,
            span_end_timestamp_nanos: span.end_time_unix_nano,
            span_duration_millis,
            span_attributes,
            span_dropped_attributes_count: span.dropped_attributes_count,
            span_dropped_events_count: span.dropped_events_count,
            span_dropped_links_count: span.dropped_links_count,
            span_status: span.status.map(SpanStatus::from_otlp).unwrap_or_default(),
            is_root: Some(parent_span_id.is_none()),
            parent_span_id,
            events,
            event_names,
            links,
        };
        Ok(span)
    }
}

#[derive(Debug, Clone)]
pub struct SpanKind(i32);

impl SpanKind {
    pub fn as_char(&self) -> char {
        match self.0 {
            0 => '0',
            1 => '1',
            2 => '2',
            3 => '3',
            4 => '4',
            5 => '5',
            _ => {
                panic!("Unexpected span kind: {}", self.0);
            }
        }
    }
    pub fn as_jaeger(&self) -> &'static str {
        match self.0 {
            0 => "unspecified",
            1 => "internal",
            2 => "server",
            3 => "client",
            4 => "producer",
            5 => "consumer",
            _ => {
                panic!("Unexpected span kind: {}", self.0);
            }
        }
    }

    pub fn as_otlp(&self) -> &'static str {
        match self.0 {
            0 => "SPAN_KIND_UNSPECIFIED",
            1 => "SPAN_KIND_INTERNAL",
            2 => "SPAN_KIND_SERVER",
            3 => "SPAN_KIND_CLIENT",
            4 => "SPAN_KIND_PRODUCER",
            5 => "SPAN_KIND_CONSUMER",
            _ => {
                panic!("Unexpected span kind: {}", self.0);
            }
        }
    }
}

impl From<i32> for SpanKind {
    fn from(span_kind: i32) -> Self {
        Self(span_kind)
    }
}

impl FromStr for SpanKind {
    type Err = String;

    fn from_str(span_kind: &str) -> Result<Self, Self::Err> {
        let span_kind_i32 = match span_kind {
            "0" | "unspecified" | "SPAN_KIND_UNSPECIFIED" => 0,
            "1" | "internal" | "SPAN_KIND_INTERNAL" => 1,
            "2" | "server" | "SPAN_KIND_SERVER" => 2,
            "3" | "client" | "SPAN_KIND_CLIENT" => 3,
            "4" | "producer" | "SPAN_KIND_PRODUCER" => 4,
            "5" | "consumer" | "SPAN_KIND_CONSUMER" => 5,
            _ => {
                if !span_kind.is_empty() {
                    warn!(span_kind=%span_kind, "unexpected span kind");
                }
                return Err(format!("Unexpected span kind: {span_kind}"));
            }
        };
        Ok(Self(span_kind_i32))
    }
}

/// Concatenation of the service name, span kind, and span name.
#[derive(Debug, Clone, Eq, PartialEq, Serialize, Deserialize)]
pub struct SpanFingerprint(String);

impl SpanFingerprint {
    /// Null character used to separate the service name, span kind, and span name.
    const NULL_CHAR: char = '\u{0}';

    /// Start of heading character, the next character after null.
    const SOH_CHAR: char = '\u{1}';

    pub fn new(service_name: &str, span_kind: SpanKind, span_name: &str) -> Self {
        Self(format!(
            "{service_name}{separator}{span_kind}{separator}{span_name}",
            separator = Self::NULL_CHAR,
            span_kind = span_kind.0
        ))
    }

    pub fn as_str(&self) -> &str {
        self.0.as_str()
    }

    pub fn from_string(fingerprint: String) -> Self {
        Self(fingerprint)
    }

    pub fn service_name(&self) -> Option<&str> {
        self.0.split(Self::NULL_CHAR).next()
    }

    pub fn span_kind(&self) -> Option<SpanKind> {
        self.0
            .split(Self::NULL_CHAR)
            .nth(1)
            .and_then(|span_kind| SpanKind::from_str(span_kind).ok())
    }

    pub fn span_name(&self) -> Option<&str> {
        self.0.split(Self::NULL_CHAR).nth(2)
    }

    pub fn start_key(service_name: &str, span_kind_opt: Option<SpanKind>) -> Option<Vec<u8>> {
        if service_name.is_empty() {
            return None;
        }
        let mut start_key = service_name.as_bytes().to_vec();
        start_key.push(Self::NULL_CHAR as u8);

        if let Some(span_kind) = span_kind_opt {
            start_key.push(span_kind.as_char() as u8);
            start_key.push(Self::NULL_CHAR as u8);
        }
        Some(start_key)
    }

    pub fn end_key(service_name: &str, span_kind_opt: Option<SpanKind>) -> Option<Vec<u8>> {
        if service_name.is_empty() {
            return None;
        }
        let mut end_key = service_name.as_bytes().to_vec();

        if let Some(span_kind) = span_kind_opt {
            end_key.push(Self::NULL_CHAR as u8);
            end_key.push(span_kind.as_char() as u8);
        }
        end_key.push(Self::SOH_CHAR as u8);
        Some(end_key)
    }
}

#[derive(Debug, Clone, Eq, PartialEq, Serialize, Deserialize)]
pub struct SpanStatus {
    pub code: OtlpStatusCode,
    #[serde(skip_serializing_if = "Option::is_none")]
    pub message: Option<String>,
}

impl SpanStatus {
    pub fn is_unset(&self) -> bool {
        self.code == OtlpStatusCode::Unset
    }

    fn from_otlp(span_status: OtlpStatus) -> Self {
        if span_status.code() == OtlpStatusCode::Ok {
            Self {
                code: OtlpStatusCode::Ok,
                message: None,
            }
        } else if span_status.code() == OtlpStatusCode::Error {
            let message = if span_status.message.is_empty() {
                None
            } else {
                Some(span_status.message)
            };
            Self {
                code: OtlpStatusCode::Error,
                message,
            }
        } else {
            Self::default()
        }
    }
}

impl Default for SpanStatus {
    fn default() -> Self {
        Self {
            code: OtlpStatusCode::Unset,
            message: None,
        }
    }
}

const UNKNOWN_SERVICE: &str = "unknown_service";

const SERVICE_NAME_KEY: &str = "service.name";

struct Resource {
    service_name: String,
    attributes: HashMap<String, JsonValue>,
    dropped_attributes_count: u32,
}

impl Default for Resource {
    fn default() -> Self {
        Self {
            service_name: UNKNOWN_SERVICE.to_string(),
            attributes: HashMap::new(),
            dropped_attributes_count: 0,
        }
    }
}

impl Resource {
    fn from_otlp(resource: OtlpResource) -> Self {
        let mut attributes = extract_attributes(resource.attributes);
        let service_name = match attributes.remove(SERVICE_NAME_KEY) {
            Some(JsonValue::String(value)) => value,
            _ => UNKNOWN_SERVICE.to_string(),
        };
        Self {
            service_name,
            attributes,
            dropped_attributes_count: resource.dropped_attributes_count,
        }
    }
}

#[derive(Default)]
struct Scope {
    name: Option<String>,
    version: Option<String>,
    attributes: HashMap<String, JsonValue>,
    dropped_attributes_count: u32,
}

impl Scope {
    fn from_otlp(scope: InstrumentationScope) -> Self {
        let name = Some(scope.name).filter(|name| !name.is_empty());
        let version = Some(scope.version).filter(|version| !version.is_empty());
        let attributes = extract_attributes(scope.attributes);
        Self {
            name,
            version,
            attributes,
            dropped_attributes_count: scope.dropped_attributes_count,
        }
    }
}

#[derive(Debug, Clone, Eq, PartialEq, Serialize, Deserialize)]
pub struct Event {
    pub event_timestamp_nanos: u64,
    pub event_name: String,
    #[serde(default)]
    #[serde(skip_serializing_if = "HashMap::is_empty")]
    pub event_attributes: HashMap<String, JsonValue>,
    #[serde(default)]
    #[serde(skip_serializing_if = "is_zero")]
    pub event_dropped_attributes_count: u32,
}

#[derive(Debug, Clone, Eq, PartialEq, Serialize, Deserialize)]
pub struct Link {
    pub link_trace_id: TraceId,
    #[serde(skip_serializing_if = "Option::is_none")]
    pub link_trace_state: Option<String>,
    pub link_span_id: SpanId,
    #[serde(default)]
    #[serde(skip_serializing_if = "HashMap::is_empty")]
    pub link_attributes: HashMap<String, JsonValue>,
    #[serde(default)]
    #[serde(skip_serializing_if = "is_zero")]
    pub link_dropped_attributes_count: u32,
}

impl Link {
    fn try_from_otlp(link: OtlpLink) -> Result<Link, OtlpTracesError> {
        let link_trace_id = TraceId::try_from(link.trace_id)?;
        let link_span_id = SpanId::try_from(link.span_id)?;
        let link = Link {
            link_trace_id,
            link_trace_state: if !link.trace_state.is_empty() {
                Some(link.trace_state)
            } else {
                None
            },
            link_span_id,
            link_attributes: extract_attributes(link.attributes),
            link_dropped_attributes_count: link.dropped_attributes_count,
        };
        Ok(link)
    }
}

fn parse_otlp_spans(request: ExportTraceServiceRequest) -> Result<Vec<Span>, OtlpTracesError> {
    let num_spans = request
        .resource_spans
        .iter()
        .flat_map(|resource_spans| resource_spans.scope_spans.iter())
        .map(|scope_spans| scope_spans.spans.len())
        .sum();
    let mut spans = Vec::with_capacity(num_spans);

    for resource_spans in request.resource_spans {
        let resource = resource_spans
            .resource
            .map(Resource::from_otlp)
            .unwrap_or_default();
        for scope_spans in resource_spans.scope_spans {
            let scope = scope_spans.scope.map(Scope::from_otlp).unwrap_or_default();
            for span in scope_spans.spans {
                let span = Span::from_otlp(span, &resource, &scope)?;
                spans.push(span);
            }
        }
    }
    Ok(spans)
}

struct ParsedSpans {
    doc_batch: DocBatchV2,
    num_spans: u64,
    num_parse_errors: u64,
    error_message: String,
}

#[derive(Debug, Clone)]
pub struct OtlpGrpcTracesService {
    ingest_router: IngestRouterServiceClient,
    commit_type: CommitType,
}

impl OtlpGrpcTracesService {
    pub fn new(
        ingest_router: IngestRouterServiceClient,
        commit_type_opt: Option<CommitType>,
    ) -> Self {
        Self {
            ingest_router,
            commit_type: commit_type_opt.unwrap_or_default(),
        }
    }

    pub fn index_config(default_index_root_uri: &Uri) -> anyhow::Result<IndexConfig> {
        let index_config_str =
            OTEL_TRACES_INDEX_CONFIG.replace("${INDEX_ID}", OTEL_TRACES_INDEX_ID);
        let index_config = load_index_config_from_user_config(
            ConfigFormat::Yaml,
            index_config_str.as_bytes(),
            default_index_root_uri,
        )?;
        Ok(index_config)
    }

    pub async fn export_inner(
        &mut self,
        request: ExportTraceServiceRequest,
        index_id: IndexId,
        labels: [&str; 4],
    ) -> Result<ExportTraceServiceResponse, Status> {
        let ParsedSpans {
            doc_batch,
            num_spans,
            num_parse_errors,
            error_message,
        } = run_cpu_intensive({
            let parent_span = RuntimeSpan::current();
            || Self::parse_spans(request, parent_span)
        })
        .await
        .map_err(|join_error| {
            error!(error=%join_error, "failed to parse spans");
            Status::internal("failed to parse spans")
        })??;
        if num_spans == 0 {
            return Err(tonic::Status::invalid_argument("request is empty"));
        }
        if num_spans == num_parse_errors {
            return Err(tonic::Status::internal(error_message));
        }
        let num_bytes = doc_batch.num_bytes() as u64;
        self.store_spans(index_id, doc_batch).await?;

        OTLP_SERVICE_METRICS
            .ingested_spans_total
            .with_label_values(labels)
            .inc_by(num_spans);
        OTLP_SERVICE_METRICS
            .ingested_bytes_total
            .with_label_values(labels)
            .inc_by(num_bytes);

        let response = ExportTraceServiceResponse {
            // `rejected_spans=0` and `error_message=""` is considered a "full" success.
            partial_success: Some(ExportTracePartialSuccess {
                rejected_spans: num_parse_errors as i64,
                error_message,
            }),
        };
        Ok(response)
    }

    #[instrument(skip_all, parent = parent_span, fields(num_spans = Empty, num_bytes = Empty, num_parse_errors = Empty))]
    #[allow(clippy::result_large_err)]
    fn parse_spans(
        request: ExportTraceServiceRequest,
        parent_span: RuntimeSpan,
    ) -> tonic::Result<ParsedSpans> {
        let spans = parse_otlp_spans(request)?;
        let num_spans = spans.len() as u64;
        let mut num_parse_errors = 0;
        let mut error_message = String::new();

        let mut doc_batch_builder = JsonDocBatchV2Builder::with_num_docs(num_spans as usize);
        let mut doc_uid_generator = DocUidGenerator::default();
        for span in spans {
            let doc_uid = doc_uid_generator.next_doc_uid();
            if let Err(error) = doc_batch_builder.add_doc(doc_uid, span) {
                error!(error=?error, "failed to JSON serialize span");
                error_message = format!("failed to JSON serialize span: {error:?}");
                num_parse_errors += 1;
            }
        }
        let doc_batch = doc_batch_builder.build();
        let current_span = RuntimeSpan::current();
        current_span.record("num_spans", num_spans);
        current_span.record("num_bytes", doc_batch.num_bytes());
        current_span.record("num_parse_errors", num_parse_errors);

        let parsed_spans = ParsedSpans {
            doc_batch,
            num_spans,
            num_parse_errors,
            error_message,
        };
        Ok(parsed_spans)
    }

    #[instrument(skip_all, fields(num_bytes = doc_batch.num_bytes()))]
    async fn store_spans(
        &mut self,
        index_id: String,
        doc_batch: DocBatchV2,
    ) -> Result<(), tonic::Status> {
        ingest_doc_batch_v2(
            self.ingest_router.clone(),
            index_id,
            doc_batch,
            self.commit_type,
        )
        .await?;
        Ok(())
    }

    async fn export_instrumented(
        &mut self,
        request: ExportTraceServiceRequest,
        index_id: IndexId,
    ) -> Result<ExportTraceServiceResponse, Status> {
        let start = std::time::Instant::now();

        let labels = ["trace", &index_id, "grpc", "protobuf"];

        OTLP_SERVICE_METRICS
            .requests_total
            .with_label_values(labels)
            .inc();
        let (export_res, is_error) =
            match self.export_inner(request, index_id.clone(), labels).await {
                ok @ Ok(_) => (ok, "false"),
                err @ Err(_) => {
                    OTLP_SERVICE_METRICS
                        .request_errors_total
                        .with_label_values(labels)
                        .inc();
                    (err, "true")
                }
            };
        let elapsed = start.elapsed().as_secs_f64();
        let labels = ["trace", &index_id, "grpc", "protobuf", is_error];
        OTLP_SERVICE_METRICS
            .request_duration_seconds
            .with_label_values(labels)
            .observe(elapsed);

        export_res
    }
}

#[async_trait]
impl TraceService for OtlpGrpcTracesService {
    #[instrument(name = "ingest_spans", skip_all)]
    async fn export(
        &self,
        request: Request<ExportTraceServiceRequest>,
    ) -> Result<Response<ExportTraceServiceResponse>, Status> {
        let index_id = extract_otel_index_id_from_metadata(request.metadata(), OtelSignal::Traces)?;
        let request = request.into_inner();
        self.clone()
            .export_instrumented(request, index_id)
            .await
            .map(Response::new)
    }
}

/// An iterator of JSON OTLP spans for use in the doc processor.
pub struct JsonSpanIterator {
    spans: std::vec::IntoIter<Span>,
    current_span_idx: usize,
    num_spans: usize,
    avg_span_size: usize,
    avg_span_size_rem: usize,
}

impl JsonSpanIterator {
    fn new(spans: Vec<Span>, num_bytes: usize) -> Self {
        let num_spans = spans.len();
        let avg_span_size = num_bytes.checked_div(num_spans).unwrap_or(0);
        let avg_span_size_rem = avg_span_size + num_bytes.checked_rem(num_spans).unwrap_or(0);

        Self {
            spans: spans.into_iter(),
            current_span_idx: 0,
            num_spans,
            avg_span_size,
            avg_span_size_rem,
        }
    }
}

impl Iterator for JsonSpanIterator {
    type Item = (JsonValue, usize);

    fn next(&mut self) -> Option<Self::Item> {
        let span_opt = self
            .spans
            .next()
            .map(|span| serde_json::to_value(span).expect("`Span` should be JSON serializable"));
        if span_opt.is_some() {
            self.current_span_idx += 1;
        }
        if self.current_span_idx < self.num_spans {
            span_opt.map(|span| (span, self.avg_span_size))
        } else {
            span_opt.map(|span| (span, self.avg_span_size_rem))
        }
    }
}

pub fn parse_otlp_spans_json(payload_json: &[u8]) -> Result<JsonSpanIterator, OtlpTracesError> {
    let request: ExportTraceServiceRequest = serde_json::from_slice(payload_json)?;
    let spans = parse_otlp_spans(request)?;
    Ok(JsonSpanIterator::new(spans, payload_json.len()))
}

pub fn parse_otlp_spans_protobuf(
    payload_proto: &[u8],
) -> Result<JsonSpanIterator, OtlpTracesError> {
    let request = ExportTraceServiceRequest::decode(payload_proto)?;
    let spans = parse_otlp_spans(request)?;
    Ok(JsonSpanIterator::new(spans, payload_proto.len()))
}

#[cfg(test)]
mod tests {
    use quickwit_metastore::{CreateIndexRequestExt, metastore_for_test};
    use quickwit_proto::metastore::{CreateIndexRequest, MetastoreService};
    use quickwit_proto::opentelemetry::proto::common::v1::any_value::Value as OtlpAnyValueValue;
    use quickwit_proto::opentelemetry::proto::common::v1::{
        AnyValue as OtlpAnyValue, KeyValue as OtlpKeyValue,
    };
    use quickwit_proto::opentelemetry::proto::trace::v1::span::{
        Event as OtlpEvent, Link as OtlpLink,
    };
    use serde_json::json;

    use super::*;

    #[test]
    fn test_index_config_is_valid() {
        let index_config =
            OtlpGrpcTracesService::index_config(&Uri::for_test("ram:///indexes")).unwrap();
        assert_eq!(index_config.index_id, OTEL_TRACES_INDEX_ID);
    }

    #[tokio::test]
    async fn test_create_index() {
        let metastore = metastore_for_test();
        let index_config =
            OtlpGrpcTracesService::index_config(&Uri::for_test("ram:///indexes")).unwrap();
        let create_index_request =
            CreateIndexRequest::try_from_index_config(&index_config).unwrap();
        metastore.create_index(create_index_request).await.unwrap();
    }

    #[test]
    fn test_resource_from_otlp() {
        let otlp_resource = OtlpResource {
            attributes: vec![
                OtlpKeyValue {
                    key: "service.name".to_string(),
                    value: Some(OtlpAnyValue {
                        value: Some(OtlpAnyValueValue::StringValue("quickwit".to_string())),
                    }),
                },
                OtlpKeyValue {
                    key: "key".to_string(),
                    value: Some(OtlpAnyValue {
                        value: Some(OtlpAnyValueValue::StringValue("value".to_string())),
                    }),
                },
            ],
            dropped_attributes_count: 1,
        };
        let resource = Resource::from_otlp(otlp_resource);
        assert_eq!(
            resource.attributes,
            HashMap::from_iter([("key".to_string(), json!("value"))])
        );
        assert_eq!(resource.service_name, "quickwit");
        assert_eq!(resource.dropped_attributes_count, 1);
    }

    #[test]
    fn test_scope_from_otlp() {
        let otlp_scope = InstrumentationScope {
            name: "opentelemetry-otlp".to_string(),
            version: "0.11.0".to_string(),
            attributes: vec![OtlpKeyValue {
                key: "key".to_string(),
                value: Some(OtlpAnyValue {
                    value: Some(OtlpAnyValueValue::StringValue("value".to_string())),
                }),
            }],
            dropped_attributes_count: 1,
        };
        let scope = Scope::from_otlp(otlp_scope);
        assert_eq!(scope.name.unwrap(), "opentelemetry-otlp");
        assert_eq!(scope.version.unwrap(), "0.11.0");
        assert_eq!(
            scope.attributes,
            HashMap::from_iter([("key".to_string(), json!("value"))])
        );
        assert_eq!(scope.dropped_attributes_count, 1);
    }

    #[test]
    fn test_span_from_otlp() {
        {
            // Test minimal span.
            let otlp_span = OtlpSpan {
                trace_id: vec![1; 16],
                span_id: vec![2; 8],
                parent_span_id: vec![3; 8],
                trace_state: "".to_string(),
                name: "publish_splits".to_string(),
                kind: 2, // Server
                start_time_unix_nano: 1_000_000_001,
                end_time_unix_nano: 1_001_000_002,
                attributes: Vec::new(),
                dropped_attributes_count: 3,
                events: Vec::new(),
                dropped_events_count: 4,
                links: Vec::new(),
                dropped_links_count: 5,
                status: None,
            };
            let span = Span::from_otlp(otlp_span, &Resource::default(), &Scope::default()).unwrap();

            assert_eq!(span.service_name, UNKNOWN_SERVICE);
            assert!(span.resource_attributes.is_empty());
            assert_eq!(span.resource_dropped_attributes_count, 0);

            assert!(span.scope_name.is_none());
            assert!(span.scope_version.is_none());
            assert!(span.scope_attributes.is_empty());
            assert_eq!(span.scope_dropped_attributes_count, 0);

            assert_eq!(span.trace_id, TraceId::new([1; 16]));
            assert!(span.trace_state.is_none());

            assert_eq!(span.parent_span_id, Some(SpanId::new([3; 8])));
            assert_eq!(span.span_id, SpanId::new([2; 8]));
            assert_eq!(span.span_kind, 2);
            assert_eq!(span.span_name, "publish_splits");
            assert_eq!(
                span.span_fingerprint.unwrap(),
                SpanFingerprint::new(UNKNOWN_SERVICE, SpanKind(2), "publish_splits")
            );
            assert_eq!(span.span_start_timestamp_nanos, 1_000_000_001);
            assert_eq!(span.span_end_timestamp_nanos, 1_001_000_002);
            assert_eq!(span.span_duration_millis.unwrap(), 1);
            assert!(span.span_attributes.is_empty());
            assert_eq!(span.span_dropped_attributes_count, 3);
            assert_eq!(span.span_status.code, OtlpStatusCode::Unset);

            assert!(span.events.is_empty());
            assert!(span.event_names.is_empty());
            assert_eq!(span.span_dropped_events_count, 4);

            assert!(span.links.is_empty());
            assert_eq!(span.span_dropped_links_count, 5);
        }
        {
            let resource = Resource {
                service_name: "quickwit".to_string(),
                attributes: HashMap::from_iter([(
                    "resource_key".to_string(),
                    json!("resource_value"),
                )]),
                dropped_attributes_count: 1,
            };
            let scope = Scope {
                name: Some("opentelemetry-otlp".to_string()),
                version: Some("0.11.0".to_string()),
                attributes: HashMap::from_iter([("scope_key".to_string(), json!("scope_value"))]),
                dropped_attributes_count: 2,
            };

            let events = vec![OtlpEvent {
                name: "event_name".to_string(),
                time_unix_nano: 1_000_500_003,
                attributes: vec![OtlpKeyValue {
                    key: "event_key".to_string(),
                    value: Some(OtlpAnyValue {
                        value: Some(OtlpAnyValueValue::StringValue("event_value".to_string())),
                    }),
                }],
                dropped_attributes_count: 6,
            }];
            let links = vec![OtlpLink {
                trace_id: vec![4; 16],
                span_id: vec![5; 8],
                trace_state: "link_key1=link_value1,link_key2=link_value2".to_string(),
                attributes: vec![OtlpKeyValue {
                    key: "link_key".to_string(),
                    value: Some(OtlpAnyValue {
                        value: Some(OtlpAnyValueValue::StringValue("link_value".to_string())),
                    }),
                }],
                dropped_attributes_count: 7,
            }];
            let attributes = vec![OtlpKeyValue {
                key: "span_key".to_string(),
                value: Some(OtlpAnyValue {
                    value: Some(OtlpAnyValueValue::StringValue("span_value".to_string())),
                }),
            }];
            let otlp_span = OtlpSpan {
                trace_id: vec![1; 16],
                span_id: vec![2; 8],
                parent_span_id: vec![3; 8],
                trace_state: "key1=value1,key2=value2".to_string(),
                name: "publish_splits".to_string(),
                kind: 2, // Server
                start_time_unix_nano: 1_000_000_001,
                end_time_unix_nano: 1_001_000_002,
                attributes,
                dropped_attributes_count: 3,
                events,
                dropped_events_count: 4,
                links,
                dropped_links_count: 5,
                status: Some(OtlpStatus {
                    code: 2,
                    message: "An error occurred.".to_string(),
                }),
            };
            let span = Span::from_otlp(otlp_span, &resource, &scope).unwrap();

            assert_eq!(span.service_name, "quickwit");
            assert_eq!(
                span.resource_attributes,
                HashMap::from_iter([("resource_key".to_string(), json!("resource_value"))],)
            );
            assert_eq!(span.resource_dropped_attributes_count, 1);

            assert_eq!(span.scope_name.unwrap(), "opentelemetry-otlp");
            assert_eq!(span.scope_version.unwrap(), "0.11.0");
            assert_eq!(
                span.scope_attributes,
                HashMap::from_iter([("scope_key".to_string(), json!("scope_value"))])
            );
            assert_eq!(span.scope_dropped_attributes_count, 2);

            assert_eq!(span.trace_id, TraceId::new([1; 16]));
            assert_eq!(span.trace_state.unwrap(), "key1=value1,key2=value2");

            assert_eq!(span.parent_span_id, Some(SpanId::new([3; 8])));
            assert_eq!(span.span_id, SpanId::new([2; 8]));
            assert_eq!(span.span_kind, 2);
            assert_eq!(span.span_name, "publish_splits");
            assert_eq!(
                span.span_fingerprint.unwrap(),
                SpanFingerprint::new("quickwit", SpanKind(2), "publish_splits")
            );
            assert_eq!(span.span_start_timestamp_nanos, 1_000_000_001);
            assert_eq!(span.span_end_timestamp_nanos, 1_001_000_002);
            assert_eq!(span.span_duration_millis.unwrap(), 1);
            assert_eq!(
                span.span_attributes,
                HashMap::from_iter([("span_key".to_string(), json!("span_value"))])
            );
            assert_eq!(span.span_dropped_attributes_count, 3);
            assert_eq!(span.span_status.code, OtlpStatusCode::Error);
            assert_eq!(span.span_status.message.unwrap(), "An error occurred.");

            assert_eq!(
                span.events,
                vec![Event {
                    event_name: "event_name".to_string(),
                    event_timestamp_nanos: 1_000_500_003,
                    event_attributes: HashMap::from_iter([(
                        "event_key".to_string(),
                        json!("event_value")
                    )]),
                    event_dropped_attributes_count: 6,
                }]
            );
            assert_eq!(span.event_names, vec!["event_name".to_string()]);
            assert_eq!(span.span_dropped_events_count, 4);

            assert_eq!(
                span.links,
                vec![Link {
                    link_trace_id: TraceId::new([4; 16]),
                    link_span_id: SpanId::new([5; 8]),
                    link_trace_state: Some(
                        "link_key1=link_value1,link_key2=link_value2".to_string()
                    ),
                    link_attributes: HashMap::from_iter([(
                        "link_key".to_string(),
                        json!("link_value")
                    )]),
                    link_dropped_attributes_count: 7,
                }]
            );
            assert_eq!(span.span_dropped_links_count, 5);
        }
    }

    #[test]
    fn test_span_fingerprint() {
        let span_fingerprint = SpanFingerprint::new("quickwit", SpanKind(2), "publish_splits");
        assert_eq!(
            span_fingerprint.as_str(),
            "quickwit\u{0}2\u{0}publish_splits"
        );

        let start_key_opt = SpanFingerprint::start_key("", None);
        assert!(start_key_opt.is_none());

        let start_key = SpanFingerprint::start_key("quickwit", None)
            .map(String::from_utf8)
            .unwrap()
            .unwrap();
        assert_eq!(start_key, "quickwit\u{0}");
        let end_key = SpanFingerprint::end_key("quickwit", None)
            .map(String::from_utf8)
            .unwrap()
            .unwrap();
        assert_eq!(end_key, "quickwit\u{1}");

        let start_key = SpanFingerprint::start_key("quickwit", Some(SpanKind::from(1)))
            .map(String::from_utf8)
            .unwrap()
            .unwrap();
        assert_eq!(start_key, "quickwit\u{0}1\u{0}");
        let end_key = SpanFingerprint::end_key("quickwit", Some(SpanKind::from(1)))
            .map(String::from_utf8)
            .unwrap()
            .unwrap();
        assert_eq!(end_key, "quickwit\u{0}1\u{1}");
    }

    #[test]
    fn test_span_status_from_otlp() {
        let otlp_status = OtlpStatus {
            code: 0,
            message: "".to_string(),
        };
        assert!(SpanStatus::from_otlp(otlp_status).is_unset());

        let otlp_status = OtlpStatus {
            code: 1,
            message: "".to_string(),
        };
        let span_status = SpanStatus::from_otlp(otlp_status);
        assert_eq!(span_status.code, OtlpStatusCode::Ok);
        assert!(span_status.message.is_none());

        let otlp_status = OtlpStatus {
            code: 2,
            message: "An error occurred.".to_string(),
        };
        let span_status = SpanStatus::from_otlp(otlp_status);
        assert_eq!(span_status.code, OtlpStatusCode::Error);
        assert_eq!(span_status.message.unwrap(), "An error occurred.");
    }

    #[test]
    fn test_span_serde() {
        {
            let expected_span = Span {
                trace_id: TraceId::new([1; 16]),
                trace_state: None,
                service_name: "quickwit".to_string(),
                resource_attributes: HashMap::new(),
                resource_dropped_attributes_count: 0,
                scope_name: None,
                scope_version: None,
                scope_attributes: HashMap::new(),
                scope_dropped_attributes_count: 0,
                span_id: SpanId::new([2; 8]),
                span_kind: 0,
                span_name: "publish_splits".to_string(),
                span_fingerprint: Some(SpanFingerprint::new(
                    "quickwit",
                    SpanKind(2),
                    "publish_splits",
                )),
                span_start_timestamp_nanos: 0,
                span_end_timestamp_nanos: 1_000,
                span_duration_millis: Some(1),
                span_attributes: HashMap::new(),
                span_dropped_attributes_count: 0,
                span_dropped_events_count: 0,
                span_dropped_links_count: 0,
                span_status: SpanStatus::default(),
                parent_span_id: None,
                is_root: Some(true),
                events: Vec::new(),
                event_names: Vec::new(),
                links: Vec::new(),
            };
            let span_json = serde_json::to_string_pretty(&expected_span).unwrap();
            let span = serde_json::from_str::<Span>(&span_json).unwrap();
            assert_eq!(span, expected_span);
        }
        {
            let expected_span = Span {
                trace_id: TraceId::new([1; 16]),
                trace_state: Some("key1=value1,key2=value2".to_string()),
                service_name: "quickwit".to_string(),
                resource_attributes: HashMap::from([(
                    "resource_key".to_string(),
                    json!("resource_value"),
                )]),
                resource_dropped_attributes_count: 1,
                scope_name: Some("scope_name".to_string()),
                scope_version: Some("scope_version".to_string()),
                scope_attributes: HashMap::from([("scope_key".to_string(), json!("scope_value"))]),
                scope_dropped_attributes_count: 1,
                span_id: SpanId::new([2; 8]),
                span_kind: 1,
                span_name: "publish_splits".to_string(),
                span_fingerprint: Some(SpanFingerprint::new(
                    "quickwit",
                    SpanKind(2),
                    "publish_splits",
                )),
                span_start_timestamp_nanos: 0,
                span_end_timestamp_nanos: 1_000,
                span_duration_millis: Some(1),
                span_attributes: HashMap::from([("span_key".to_string(), json!("span_value"))]),
                span_dropped_attributes_count: 1,
                span_dropped_events_count: 1,
                span_dropped_links_count: 1,
                span_status: SpanStatus {
                    code: OtlpStatusCode::Ok,
                    message: None,
                },
                parent_span_id: Some(SpanId::new([3; 8])),
                is_root: Some(false),
                events: vec![Event {
                    event_timestamp_nanos: 1,
                    event_name: "event_name".to_string(),
                    event_attributes: HashMap::new(),
                    event_dropped_attributes_count: 0,
                }],
                event_names: vec!["event_name".to_string()],
                links: vec![Link {
                    link_trace_id: TraceId::new([1; 16]),
                    link_span_id: SpanId::new([4; 8]),
                    link_trace_state: None,
                    link_attributes: HashMap::new(),
                    link_dropped_attributes_count: 0,
                }],
            };
            let span_json = serde_json::to_string_pretty(&expected_span).unwrap();
            let span = serde_json::from_str::<Span>(&span_json).unwrap();
            assert_eq!(span, expected_span);
        }
    }

    #[test]
    fn test_json_span_iterator() {
        let mut json_span_iterator = JsonSpanIterator::new(Vec::new(), 0);
        assert!(json_span_iterator.next().is_none());

        let span_0 = Span {
            trace_id: TraceId::new([1; 16]),
            trace_state: None,
            service_name: "quickwit".to_string(),
            resource_attributes: HashMap::new(),
            resource_dropped_attributes_count: 0,
            scope_name: None,
            scope_version: None,
            scope_attributes: HashMap::new(),
            scope_dropped_attributes_count: 0,
            span_id: SpanId::new([2; 8]),
            span_kind: 0,
            span_name: "publish_splits".to_string(),
            span_fingerprint: Some(SpanFingerprint::new(
                "quickwit",
                SpanKind(2),
                "publish_splits",
            )),
            span_start_timestamp_nanos: 1_000_000_001,
            span_end_timestamp_nanos: 1_000_000_002,
            span_duration_millis: Some(1),
            span_attributes: HashMap::new(),
            span_dropped_attributes_count: 0,
            span_dropped_events_count: 0,
            span_dropped_links_count: 0,
            span_status: SpanStatus::default(),
            parent_span_id: None,
            is_root: Some(true),
            events: Vec::new(),
            event_names: Vec::new(),
            links: Vec::new(),
        };

        let spans = vec![span_0.clone()];
        let mut json_span_iterator = JsonSpanIterator::new(spans, 3);

        assert_eq!(
            json_span_iterator.next(),
            Some((serde_json::to_value(&span_0).unwrap(), 3))
        );
        assert!(json_span_iterator.next().is_none());

        let mut span_1 = span_0.clone();
        span_1.span_id = SpanId::new([3; 8]);

        let spans = vec![span_0.clone(), span_1.clone()];
        let mut json_span_iterator = JsonSpanIterator::new(spans, 7);

        assert_eq!(
            json_span_iterator.next(),
            Some((serde_json::to_value(&span_0).unwrap(), 3))
        );
        assert_eq!(
            json_span_iterator.next(),
            Some((serde_json::to_value(&span_1).unwrap(), 4))
        );
        assert!(json_span_iterator.next().is_none());
    }
}


================================================
FILE: quickwit/quickwit-proto/.gitignore
================================================
gogoproto.rs
google.protobuf.rs


================================================
FILE: quickwit/quickwit-proto/Cargo.toml
================================================
[package]
name = "quickwit-proto"

version.workspace = true
edition.workspace = true
homepage.workspace = true
documentation.workspace = true
repository.workspace = true
authors.workspace = true
license.workspace = true

[dependencies]
anyhow = { workspace = true }
async-trait = { workspace = true }
bytes = { workspace = true }
bytesize = { workspace = true }
bytestring = { workspace = true }
futures = { workspace = true, optional = true }
hex = { workspace = true  }
http = { workspace = true }
mockall = { workspace = true, optional = true }
opentelemetry = { workspace = true }
prost = { workspace = true }
prost-types = { workspace = true }
sea-query = { workspace = true, optional = true }
serde = { workspace = true }
serde_json = { workspace = true }
sqlx = { workspace = true, optional = true }
thiserror = { workspace = true }
tokio = { workspace = true }
tonic = { workspace = true, features = [
    "tls-native-roots",
    "server",
    "channel",
] }
tonic-prost = { workspace = true }
tower = { workspace = true }
tracing = { workspace = true }
tracing-opentelemetry = { workspace = true }
ulid = { workspace = true }
utoipa = { workspace = true }
zstd = { workspace = true }

quickwit-actors = { workspace = true }
quickwit-common = { workspace = true }

[dev-dependencies]
futures = { workspace = true }
mockall = { workspace = true }

[build-dependencies]
glob = "0.3"
prost-build = { workspace = true }
tonic-build = { workspace = true }
tonic-prost-build = { workspace = true }

quickwit-codegen = { workspace = true }

[features]
postgres = ["sea-query", "sqlx"]
testsuite = ["mockall", "futures"]


================================================
FILE: quickwit/quickwit-proto/build.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::path::PathBuf;

use glob::glob;
use quickwit_codegen::Codegen;

fn main() -> Result<(), Box<dyn std::error::Error>> {
    // Prost + tonic + Quickwit codegen for control plane, indexing, metastore, ingest and search
    // services.
    //
    // Cluster service.
    let mut prost_config = prost_build::Config::default();
    prost_config.file_descriptor_set_path("src/codegen/quickwit/cluster_descriptor.bin");

    Codegen::builder()
        .with_prost_config(prost_config)
        .with_protos(&["protos/quickwit/cluster.proto"])
        .with_output_dir("src/codegen/quickwit")
        .with_result_type_path("crate::cluster::ClusterResult")
        .with_error_type_path("crate::cluster::ClusterError")
        .generate_rpc_name_impls()
        .run()
        .unwrap();

    // Control plane.
    let mut prost_config = prost_build::Config::default();
    prost_config.file_descriptor_set_path("src/codegen/quickwit/control_plane_descriptor.bin");

    prost_config
        .extern_path(
            ".quickwit.common.DocMappingUid",
            "crate::types::DocMappingUid",
        )
        .extern_path(".quickwit.common.IndexUid", "crate::types::IndexUid");

    Codegen::builder()
        .with_prost_config(prost_config)
        .with_protos(&["protos/quickwit/control_plane.proto"])
        .with_includes(&["protos"])
        .with_output_dir("src/codegen/quickwit")
        .with_result_type_path("crate::control_plane::ControlPlaneResult")
        .with_error_type_path("crate::control_plane::ControlPlaneError")
        .run()
        .unwrap();

    // Developer service.
    let mut prost_config = prost_build::Config::default();
    prost_config
        .bytes(["GetDebugInfoResponse.debug_info_json"])
        .file_descriptor_set_path("src/codegen/quickwit/developer_descriptor.bin");

    Codegen::builder()
        .with_prost_config(prost_config)
        .with_protos(&["protos/quickwit/developer.proto"])
        .with_output_dir("src/codegen/quickwit")
        .with_result_type_path("crate::developer::DeveloperResult")
        .with_error_type_path("crate::developer::DeveloperError")
        .generate_rpc_name_impls()
        .run()
        .unwrap();

    // Indexing Service.
    let mut prost_config = prost_build::Config::default();
    prost_config
        .extern_path(
            ".quickwit.indexing.PipelineUid",
            "crate::types::PipelineUid",
        )
        .extern_path(".quickwit.common.IndexUid", "crate::types::IndexUid")
        .extern_path(".quickwit.ingest.ShardId", "crate::types::ShardId")
        .file_descriptor_set_path("src/codegen/quickwit/indexing_descriptor.bin");

    Codegen::builder()
        .with_prost_config(prost_config)
        .with_protos(&["protos/quickwit/indexing.proto"])
        .with_includes(&["protos"])
        .with_output_dir("src/codegen/quickwit")
        .with_result_type_path("crate::indexing::IndexingResult")
        .with_error_type_path("crate::indexing::IndexingError")
        .run()
        .unwrap();

    // Metastore service.
    let mut prost_config = prost_build::Config::default();
    prost_config
        .bytes([
            "IndexesMetadataResponse.indexes_metadata_json_zstd",
            "ListIndexesMetadataResponse.indexes_metadata_json_zstd",
        ])
        .extern_path(
            ".quickwit.common.DocMappingUid",
            "crate::types::DocMappingUid",
        )
        .extern_path(".quickwit.common.IndexUid", "crate::types::IndexUid")
        .extern_path(".quickwit.ingest.ShardId", "crate::types::ShardId")
        .field_attribute("DeleteQuery.index_uid", "#[schema(value_type = String)]")
        .field_attribute("DeleteQuery.index_uid", "#[serde(alias = \"index_id\")]")
        .field_attribute("DeleteQuery.query_ast", "#[serde(alias = \"query\")]")
        .field_attribute(
            "DeleteQuery.start_timestamp",
            "#[serde(skip_serializing_if = \"Option::is_none\")]",
        )
        .field_attribute(
            "DeleteQuery.end_timestamp",
            "#[serde(skip_serializing_if = \"Option::is_none\")]",
        )
        .file_descriptor_set_path("src/codegen/quickwit/metastore_descriptor.bin");

    Codegen::builder()
        .with_prost_config(prost_config)
        .with_protos(&["protos/quickwit/metastore.proto"])
        .with_includes(&["protos"])
        .with_output_dir("src/codegen/quickwit")
        .with_result_type_path("crate::metastore::MetastoreResult")
        .with_error_type_path("crate::metastore::MetastoreError")
        .generate_extra_service_methods()
        .generate_rpc_name_impls()
        .run()
        .unwrap();

    // Ingest service (metastore service proto should be generated before ingest).
    let mut prost_config = prost_build::Config::default();
    prost_config
        .bytes([
            "DocBatchV2.doc_buffer",
            "MRecordBatch.mrecord_buffer",
            "Position.position",
        ])
        .extern_path(
            ".quickwit.common.DocMappingUid",
            "crate::types::DocMappingUid",
        )
        .extern_path(".quickwit.common.DocUid", "crate::types::DocUid")
        .extern_path(".quickwit.common.IndexUid", "crate::types::IndexUid")
        .extern_path(".quickwit.ingest.Position", "crate::types::Position")
        .extern_path(".quickwit.ingest.ShardId", "crate::types::ShardId")
        .field_attribute(
            "Shard.follower_id",
            "#[serde(default, skip_serializing_if = \"Option::is_none\")]",
        )
        .field_attribute(
            "Shard.publish_position_inclusive",
            "#[serde(default, skip_serializing_if = \"Option::is_none\")]",
        )
        .field_attribute(
            "Shard.publish_token",
            "#[serde(default, skip_serializing_if = \"Option::is_none\")]",
        )
        .field_attribute(
            "Shard.replication_position_inclusive",
            "#[serde(default, skip_serializing_if = \"Option::is_none\")]",
        )
        .field_attribute(
            "Shard.update_timestamp",
            "#[serde(default = \"super::compatibility_shard_update_timestamp\")]",
        )
        .file_descriptor_set_path("src/codegen/quickwit/ingest_descriptor.bin");

    Codegen::builder()
        .with_prost_config(prost_config)
        .with_protos(&[
            "protos/quickwit/ingester.proto",
            "protos/quickwit/router.proto",
        ])
        .with_includes(&["protos"])
        .with_output_dir("src/codegen/quickwit")
        .with_result_type_path("crate::ingest::IngestV2Result")
        .with_error_type_path("crate::ingest::IngestV2Error")
        .generate_rpc_name_impls()
        .run()
        .unwrap();

    // Search service.
    let mut prost_config = prost_build::Config::default();
    prost_config
        .file_descriptor_set_path("src/codegen/quickwit/search_descriptor.bin")
        .protoc_arg("--experimental_allow_proto3_optional");

    tonic_prost_build::configure()
        .enum_attribute(".", "#[serde(rename_all=\"snake_case\")]")
        .type_attribute(
            ".",
            "#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]",
        )
        .type_attribute("PartialHit.sort_value", "#[derive(Copy)]")
        .type_attribute("SortByValue", "#[derive(Ord, PartialOrd)]")
        .type_attribute("SearchRequest", "#[derive(Hash, Eq)]")
        .type_attribute("PartialHit", "#[derive(Hash, Eq)]")
        .out_dir("src/codegen/quickwit")
        .compile_with_config(
            prost_config,
            &[std::path::PathBuf::from("protos/quickwit/search.proto")],
            &[std::path::PathBuf::from("protos")],
        )?;

    // Jaeger proto
    let protos = find_protos("protos/third-party/jaeger");

    let mut prost_config = prost_build::Config::default();
    prost_config.type_attribute("Operation", "#[derive(Ord, PartialOrd)]");

    tonic_prost_build::configure()
        .out_dir("src/codegen/jaeger")
        .compile_with_config(
            prost_config,
            &protos,
            &[
                std::path::PathBuf::from("protos/third-party/jaeger"),
                std::path::PathBuf::from("protos/third-party"),
            ],
        )?;

    // OTEL proto
    let mut prost_config = prost_build::Config::default();
    prost_config.protoc_arg("--experimental_allow_proto3_optional");

    let protos = find_protos("protos/third-party/opentelemetry");
    tonic_prost_build::configure()
        .type_attribute(".", "#[derive(serde::Serialize, serde::Deserialize)]")
        .type_attribute("StatusCode", r#"#[serde(rename_all = "snake_case")]"#)
        .type_attribute(
            "ExportLogsServiceResponse",
            r#"#[derive(utoipa::ToSchema)]"#,
        )
        .out_dir("src/codegen/opentelemetry")
        .compile_with_config(
            prost_config,
            &protos,
            &[std::path::PathBuf::from("protos/third-party")],
        )?;
    Ok(())
}

fn find_protos(dir_path: &str) -> Vec<PathBuf> {
    glob(&format!("{dir_path}/**/*.proto"))
        .unwrap()
        .flatten()
        .collect()
}


================================================
FILE: quickwit/quickwit-proto/protos/quickwit/cluster.proto
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

syntax = "proto3";

package quickwit.cluster;

message ChitchatId {
  string node_id = 1;
  uint64 generation_id = 2;
  string gossip_advertise_addr = 3;
}

enum DeletionStatus {
    Set = 0;
    Deleted = 1;
    DeleteAfterTtl = 2;
}

message VersionedKeyValue {
  string key = 1;
  string value = 2;
  uint64 version = 3;
  DeletionStatus status = 4;
}

message NodeState {
  ChitchatId chitchat_id = 1;
  repeated VersionedKeyValue key_values = 2;
  uint64 max_version = 3;
  uint64 last_gc_version = 4;
}

service ClusterService {
  rpc FetchClusterState(FetchClusterStateRequest) returns (FetchClusterStateResponse);
}

message FetchClusterStateRequest {
  string cluster_id = 1;
}

message FetchClusterStateResponse {
  string cluster_id = 1;
  repeated NodeState node_states = 2;
}


================================================
FILE: quickwit/quickwit-proto/protos/quickwit/common.proto
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

syntax = "proto3";

package quickwit.common;

// The corresponding Rust struct [`crate::types::DocMappingUid`] is defined manually and
// externally provided during code generation (see `build.rs`).
//
// Modify at your own risk.
message DocMappingUid {
  // ULID encoded as a sequence of 16 bytes (big-endian u128).
  bytes doc_mapping_uid = 1;
}

// The corresponding Rust struct [`crate::types::DocUid`] is defined manually and
// externally provided during code generation (see `build.rs`).
//
// Modify at your own risk.
message DocUid {
  // ULID encoded as a sequence of 16 bytes (big-endian u128).
  bytes doc_uid = 1;
}

// The corresponding Rust struct [`crate::types::IndexUid`] is defined manually and
// externally provided during code generation (see `build.rs`).
//
// Modify at your own risk.
message IndexUid {
  string index_id = 1;
  // ULID encoded as a sequence of 16 bytes (big-endian u128).
  bytes incarnation_id = 2;
}


================================================
FILE: quickwit/quickwit-proto/protos/quickwit/control_plane.proto
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

syntax = "proto3";

package quickwit.control_plane;

import "quickwit/common.proto";
import "quickwit/indexing.proto";
import "quickwit/ingest.proto";
import "quickwit/metastore.proto";

service ControlPlaneService {
  // The control plane acts as a proxy for the metastore for a subset of the API so it can track the state of the
  // metastore accurately and react to events in real-time.

  // The following RPCs are forwarded and handled by the metastore:
  // - `create_index`
  // - `update_index`
  // - `delete_index`
  // - `add_source`
  // - `toggle_source`
  // - `delete_source`

  // Index API

  // Creates a new index.
  rpc CreateIndex(quickwit.metastore.CreateIndexRequest) returns (quickwit.metastore.CreateIndexResponse);

  // Updates an index.
  rpc UpdateIndex(quickwit.metastore.UpdateIndexRequest) returns (quickwit.metastore.IndexMetadataResponse);

  // Deletes an index.
  rpc DeleteIndex(quickwit.metastore.DeleteIndexRequest) returns (quickwit.metastore.EmptyResponse);

  // Source API

  // Adds a source to an index.
  rpc AddSource(quickwit.metastore.AddSourceRequest) returns (quickwit.metastore.EmptyResponse);

  // Update a source.
  rpc UpdateSource(quickwit.metastore.UpdateSourceRequest) returns (quickwit.metastore.EmptyResponse);

  // Enables or disables a source.
  rpc ToggleSource(quickwit.metastore.ToggleSourceRequest) returns (quickwit.metastore.EmptyResponse);

  // Removes a source from an index.
  rpc DeleteSource(quickwit.metastore.DeleteSourceRequest) returns (quickwit.metastore.EmptyResponse);

  // Shard API

  // Returns the list of open shards for one or several sources. If the control plane is not able to find any
  // for a source, it will pick a pair of leader-follower ingesters and will open a new shard.
  rpc GetOrCreateOpenShards(GetOrCreateOpenShardsRequest) returns (GetOrCreateOpenShardsResponse);

  // Asks the control plane whether the shards listed in the request should be deleted or truncated.
  rpc AdviseResetShards(AdviseResetShardsRequest) returns (AdviseResetShardsResponse);

  // Performs a debounced shard pruning request to the metastore.
  rpc PruneShards(quickwit.metastore.PruneShardsRequest) returns (quickwit.metastore.EmptyResponse);
}

// Shard API

message GetOrCreateOpenShardsRequest {
  // There should be at most one subrequest per index per request.
  repeated GetOrCreateOpenShardsSubrequest subrequests = 1;
  repeated quickwit.ingest.ShardIds closed_shards = 2;
  // The control plane should return shards that are not present on the supplied leaders.
  //
  // The control plane does not change the status of those leaders just from this signal.
  // It will check the status of its own ingester pool.
  repeated string unavailable_leaders = 3;
}

message GetOrCreateOpenShardsSubrequest {
  uint32 subrequest_id = 1;
  string index_id = 2;
  string source_id = 3;
}

message GetOrCreateOpenShardsResponse {
  repeated GetOrCreateOpenShardsSuccess successes = 1;
  repeated GetOrCreateOpenShardsFailure failures = 2;
}

message GetOrCreateOpenShardsSuccess {
  uint32 subrequest_id = 1;
  quickwit.common.IndexUid index_uid = 2;
  string source_id = 3;
  repeated quickwit.ingest.Shard open_shards = 4;
}

enum GetOrCreateOpenShardsFailureReason {
  GET_OR_CREATE_OPEN_SHARDS_FAILURE_REASON_UNSPECIFIED = 0;
  GET_OR_CREATE_OPEN_SHARDS_FAILURE_REASON_INDEX_NOT_FOUND = 1;
  GET_OR_CREATE_OPEN_SHARDS_FAILURE_REASON_SOURCE_NOT_FOUND = 2;
  GET_OR_CREATE_OPEN_SHARDS_FAILURE_REASON_NO_INGESTERS_AVAILABLE = 3;
}

message GetOrCreateOpenShardsFailure {
  uint32 subrequest_id = 1;
  string index_id = 2;
  string source_id = 3;
  GetOrCreateOpenShardsFailureReason reason = 4;
}

message AdviseResetShardsRequest {
  repeated quickwit.ingest.ShardIds shard_ids = 1;
  string ingester_id = 2;
}

message AdviseResetShardsResponse {
  repeated quickwit.ingest.ShardIds shards_to_delete = 1;
  repeated quickwit.ingest.ShardIdPositions shards_to_truncate = 2;
}


================================================
FILE: quickwit/quickwit-proto/protos/quickwit/developer.proto
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

syntax = "proto3";

package quickwit.developer;

service DeveloperService {
  rpc GetDebugInfo(GetDebugInfoRequest) returns (GetDebugInfoResponse);

  // rpc SetLogLevel(SetLogLevelRequest) returns (SetLogLevelResponse);
}

message GetDebugInfoRequest {
  // Restricts the debug info to the given roles.
  repeated string roles = 1;
}

message GetDebugInfoResponse {
  bytes debug_info_json = 1;
}


================================================
FILE: quickwit/quickwit-proto/protos/quickwit/indexing.proto
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

syntax = "proto3";

package quickwit.indexing;

import "quickwit/common.proto";
import "quickwit/ingest.proto";

service IndexingService {
  // Apply an indexing plan on the node.
  rpc ApplyIndexingPlan(ApplyIndexingPlanRequest) returns (ApplyIndexingPlanResponse);
}

message ApplyIndexingPlanRequest {
  repeated IndexingTask indexing_tasks = 1;
}

message PipelineUid {
  bytes pipeline_uid = 1;
}

message IndexingTask {
  // The tasks's index UID.
  quickwit.common.IndexUid index_uid = 1;
  // The task's source ID.
  string source_id = 2;
  // pipeline id
  PipelineUid pipeline_uid = 4;
  // The shards assigned to the indexer.
  repeated quickwit.ingest.ShardId shard_ids = 3;
  // Fingerprint of the pipeline parameters. Anything that should cause a pipeline restart (such
  // as updating indexing settings, the doc mapping or the source) should influence this value.
  uint64 params_fingerprint = 6;
}

message ApplyIndexingPlanResponse {}


================================================
FILE: quickwit/quickwit-proto/protos/quickwit/ingest.proto
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

syntax = "proto3";

package quickwit.ingest;

import "quickwit/common.proto";

// The corresponding Rust struct [`crate::types::Position`] is defined manually and
// externally provided during code generation (see `build.rs`).
//
// Modify at your own risk.
message Position {
  bytes position = 1;
}

// The corresponding Rust struct [`crate::types::ShardId`] is defined manually and
// externally provided during code generation (see `build.rs`).
//
// Modify at your own risk.
message ShardId {
  bytes shard_id = 1;
}

// Shard primary key.
message ShardPKey {
  quickwit.common.IndexUid index_uid = 1;
  string source_id = 2;
  ShardId shard_id = 3;
}

enum CommitTypeV2 {
  COMMIT_TYPE_V2_UNSPECIFIED = 0;
  COMMIT_TYPE_V2_AUTO = 1;
  COMMIT_TYPE_V2_WAIT_FOR = 2;
  COMMIT_TYPE_V2_FORCE = 3;
}

message DocBatchV2 {
  bytes doc_buffer = 1;
  repeated uint32 doc_lengths = 2;
  repeated quickwit.common.DocUid doc_uids = 3;
}

message MRecordBatch {
  // Buffer of encoded and then concatenated mrecords.
  bytes mrecord_buffer = 1;
  // Lengths of the mrecords in the buffer.
  repeated uint32 mrecord_lengths = 2;
}

enum ShardState {
  SHARD_STATE_UNSPECIFIED = 0;
  // The shard is open and accepts write requests.
  SHARD_STATE_OPEN = 1;
  // The ingester hosting the shard is unavailable.
  SHARD_STATE_UNAVAILABLE = 2;
  // The shard is closed and cannot be written to.
  // It can be safely deleted if the publish position is superior or equal to `~eof`.
  SHARD_STATE_CLOSED = 3;
}

message Shard {
  // Immutable fields
  quickwit.common.IndexUid index_uid = 1;
  string source_id = 2;
  ShardId shard_id = 3;
  // The node ID of the ingester to which all the write requests for this shard should be sent to.
  string leader_id = 4;
  // The node ID of the ingester holding a copy of the data.
  optional string follower_id = 5;

  // Mutable fields
  ShardState shard_state = 8;
  // Position up to which indexers have indexed and published the records stored in the shard.
  // It is updated asynchronously in a best effort manner by the indexers and indicates the position up to which the log can be safely truncated.
  Position publish_position_inclusive = 9;
  // A publish token that ensures only one indexer works on a given shard at a time.
  // For instance, if an indexer goes rogue, eventually the control plane will detect it and assign the shard to another indexer, which will override the publish token.
  optional string publish_token = 10;

  // The UID of the index doc mapping when the shard was created.
  quickwit.common.DocMappingUid doc_mapping_uid = 11;

  // Time when the shard was last updated
  int64 update_timestamp = 12;
}

// A group of shards belonging to the same index and source.
message ShardIds {
  quickwit.common.IndexUid index_uid = 1;
  string source_id = 2;
  repeated ShardId shard_ids = 3;
}

message ShardIdPositions {
  quickwit.common.IndexUid index_uid = 1;
  string source_id = 2;
  repeated ShardIdPosition shard_positions = 3;
}

message ShardIdPosition {
  ShardId shard_id = 1;
  Position publish_position_inclusive = 2;
}

enum ParseFailureReason {
  PARSE_FAILURE_REASON_UNSPECIFIED = 0;
  PARSE_FAILURE_REASON_INVALID_JSON = 1;
  PARSE_FAILURE_REASON_INVALID_SCHEMA = 2;
}

message ParseFailure {
  quickwit.common.DocUid doc_uid = 1;
  ParseFailureReason reason = 2;
  string message = 3;
}


================================================
FILE: quickwit/quickwit-proto/protos/quickwit/ingester.proto
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

syntax = "proto3";

package quickwit.ingest.ingester;

import "quickwit/common.proto";
import "quickwit/ingest.proto";

service IngesterService {
  // Persists batches of documents to primary shards hosted on a leader.
  rpc Persist(PersistRequest) returns (PersistResponse);

  // Opens a replication stream from a leader to a follower.
  rpc OpenReplicationStream(stream SynReplicationMessage) returns (stream AckReplicationMessage);

  // Streams records from a leader or a follower. The client can optionally specify a range of positions to fetch,
  // otherwise the stream will go indefinitely or until the shard is closed.
  rpc OpenFetchStream(OpenFetchStreamRequest) returns (stream FetchMessage);

  // Streams status updates, called "observations", from an ingester.
  rpc OpenObservationStream(OpenObservationStreamRequest) returns (stream ObservationMessage);

  // Creates and initializes a set of newly opened shards. This RPC is called by the control plane on leaders.
  rpc InitShards(InitShardsRequest) returns (InitShardsResponse);

  // Only retain the shards that are listed in the request.
  // Other shards are deleted.
  rpc RetainShards(RetainShardsRequest) returns (RetainShardsResponse);

  // Truncates a set of shards at the given positions. This RPC is called by indexers on leaders AND followers.
  rpc TruncateShards(TruncateShardsRequest) returns (TruncateShardsResponse);

  // Closes a set of shards. This RPC is called by the control plane.
  rpc CloseShards(CloseShardsRequest) returns (CloseShardsResponse);

  // Decommissions the ingester.
  rpc Decommission(DecommissionRequest) returns (DecommissionResponse);
}

message RetainShardsForSource {
  quickwit.common.IndexUid index_uid = 1;
  string source_id = 2;
  repeated quickwit.ingest.ShardId shard_ids = 3;
}

message RetainShardsRequest {
  repeated RetainShardsForSource retain_shards_for_sources = 1;
}

message RetainShardsResponse {
}

message PersistRequest {
  string leader_id = 1;
  quickwit.ingest.CommitTypeV2 commit_type = 3;
  repeated PersistSubrequest subrequests = 4;
}

message PersistSubrequest {
  uint32 subrequest_id = 1;
  quickwit.common.IndexUid index_uid = 2;
  string source_id = 3;
  quickwit.ingest.DocBatchV2 doc_batch = 5;
  reserved 4;
}

message PersistResponse {
  string leader_id = 1;
  repeated PersistSuccess successes = 2;
  repeated PersistFailure failures = 3;
  RoutingUpdate routing_update = 4;
}

message RoutingUpdate {
  uint32 capacity_score = 1;
  repeated SourceShardUpdate source_shard_updates = 2;
  repeated quickwit.ingest.ShardIds closed_shards = 3;
}

message SourceShardUpdate {
  quickwit.common.IndexUid index_uid = 1;
  string source_id = 2;
  uint32 open_shard_count = 3;
}

message PersistSuccess {
  uint32 subrequest_id = 1;
  quickwit.common.IndexUid index_uid = 2;
  string source_id = 3;
  quickwit.ingest.ShardId shard_id = 4;
  quickwit.ingest.Position replication_position_inclusive = 5;
  uint32 num_persisted_docs = 6;
  repeated quickwit.ingest.ParseFailure parse_failures = 7;
}


enum PersistFailureReason {
  PERSIST_FAILURE_REASON_UNSPECIFIED = 0;
  PERSIST_FAILURE_REASON_WAL_FULL = 4;
  PERSIST_FAILURE_REASON_TIMEOUT = 5;
  PERSIST_FAILURE_REASON_NO_SHARDS_AVAILABLE = 6;
  PERSIST_FAILURE_REASON_NODE_UNAVAILABLE = 7;
}

message PersistFailure {
  uint32 subrequest_id = 1;
  quickwit.common.IndexUid index_uid = 2;
  string source_id = 3;
  PersistFailureReason reason = 5;
  reserved 4;
}

message SynReplicationMessage {
  oneof message {
    OpenReplicationStreamRequest open_request = 1;
    InitReplicaRequest init_request = 2;
    ReplicateRequest replicate_request = 3;
  }
}

message AckReplicationMessage {
  oneof message {
    OpenReplicationStreamResponse open_response = 1;
    InitReplicaResponse init_response = 2;
    ReplicateResponse replicate_response = 3;
  }
}

message OpenReplicationStreamRequest {
  string leader_id = 1;
  string follower_id = 2;
  // Position of the request in the replication stream.
  uint64 replication_seqno = 3;
}

message OpenReplicationStreamResponse {
  // Position of the response in the replication stream. It should match the position of the request.
  uint64 replication_seqno = 1;
}

message InitReplicaRequest {
  Shard replica_shard = 1;
  uint64 replication_seqno = 2;
}

message InitReplicaResponse {
  uint64 replication_seqno = 1;
}

message ReplicateRequest {
  string leader_id = 1;
  string follower_id = 2;
  quickwit.ingest.CommitTypeV2 commit_type = 3;
  repeated ReplicateSubrequest subrequests = 4;
  // Position of the request in the replication stream.
  uint64 replication_seqno = 5;
}

message ReplicateSubrequest {
  uint32 subrequest_id = 1;
  quickwit.common.IndexUid index_uid = 2;
  string source_id = 3;
  quickwit.ingest.ShardId shard_id = 4;
  quickwit.ingest.Position from_position_exclusive = 5;
  ingest.DocBatchV2 doc_batch = 6;
}

message ReplicateResponse {
  string follower_id = 1;
  repeated ReplicateSuccess successes = 2;
  repeated ReplicateFailure failures = 3;
  // Position of the response in the replication stream. It should match the position of the request.
  uint64 replication_seqno = 4;
}

message ReplicateSuccess {
  uint32 subrequest_id = 1;
  quickwit.common.IndexUid index_uid = 2;
  string source_id = 3;
  quickwit.ingest.ShardId shard_id = 4;
  quickwit.ingest.Position replication_position_inclusive = 5;
}

enum ReplicateFailureReason {
  REPLICATE_FAILURE_REASON_UNSPECIFIED = 0;
  REPLICATE_FAILURE_REASON_SHARD_NOT_FOUND = 1;
  REPLICATE_FAILURE_REASON_SHARD_CLOSED = 2;
  reserved 3; // REPLICATE_FAILURE_REASON_RATE_LIMITED = 3;
  REPLICATE_FAILURE_REASON_WAL_FULL = 4;
}

message ReplicateFailure {
  uint32 subrequest_id = 1;
  quickwit.common.IndexUid index_uid = 2;
  string source_id = 3;
  quickwit.ingest.ShardId shard_id = 4;
  ReplicateFailureReason reason = 5;
}

message TruncateShardsRequest {
  string ingester_id = 1;
  repeated TruncateShardsSubrequest subrequests = 2;
}

message TruncateShardsSubrequest {
  quickwit.common.IndexUid index_uid = 1;
  string source_id = 2;
  quickwit.ingest.ShardId shard_id = 3;
  // The position up to which the shard should be truncated (inclusive).
  quickwit.ingest.Position truncate_up_to_position_inclusive = 4;
}

message TruncateShardsResponse {
  // TODO
}

message OpenFetchStreamRequest {
  string client_id = 1;
  quickwit.common.IndexUid index_uid = 2;
  string source_id = 3;
  quickwit.ingest.ShardId shard_id = 4;
  quickwit.ingest.Position from_position_exclusive = 5;
}

message FetchMessage {
  oneof message {
    FetchPayload payload = 1;
    FetchEof eof = 2;
  }
}

message FetchPayload {
  quickwit.common.IndexUid index_uid = 1;
  string source_id = 2;
  quickwit.ingest.ShardId shard_id = 3;
  quickwit.ingest.MRecordBatch mrecord_batch = 4;
  quickwit.ingest.Position from_position_exclusive = 5;
  quickwit.ingest.Position to_position_inclusive = 6;
}

message FetchEof {
  quickwit.common.IndexUid index_uid = 1;
  string source_id = 2;
  quickwit.ingest.ShardId shard_id = 3;
  quickwit.ingest.Position eof_position = 4;
}

message InitShardsRequest {
  reserved 1;
  repeated InitShardSubrequest subrequests = 2;
}

message InitShardSubrequest {
  uint32 subrequest_id = 1;
  quickwit.ingest.Shard shard = 2;
  string doc_mapping_json = 3;
  bool validate_docs = 4;
}

message InitShardsResponse {
  repeated InitShardSuccess successes = 1;
  repeated InitShardFailure failures = 2;
}

message InitShardSuccess {
  uint32 subrequest_id = 1;
  quickwit.ingest.Shard shard = 2;
}

message InitShardFailure {
  uint32 subrequest_id = 1;
  quickwit.common.IndexUid index_uid = 2;
  string source_id = 3;
  quickwit.ingest.ShardId shard_id = 4;
  // InitShardFailureReason reason = 5;
}

message CloseShardsRequest {
  reserved 1;
  repeated quickwit.ingest.ShardPKey shard_pkeys = 2;
}

message CloseShardsResponse {
  repeated quickwit.ingest.ShardPKey successes = 1;
}

message DecommissionRequest {
}

message DecommissionResponse {
}

message OpenObservationStreamRequest {
}

enum IngesterStatus {
  INGESTER_STATUS_UNSPECIFIED = 0;
  // The ingester is live but not ready yet to accept requests.
  INGESTER_STATUS_INITIALIZING = 1;
  // The ingester is ready and accepts read and write requests.
  INGESTER_STATUS_READY = 2;
  // The ingester is about to be decommissioned. It still accepts read and write requests, but will not accept write requests in a few seconds and should be avoided by future write requests.
  INGESTER_STATUS_RETIRING = 6;
  // The ingester is being decommissioned. It accepts read requests but rejects write requests
  // (open shards, persist, and replicate requests). It will transition to `Decommissioned` once
  // all shards are fully indexed.
  INGESTER_STATUS_DECOMMISSIONING = 3;
  // The ingester no longer accepts read and write requests. It does not hold any data and can
  // be safely removed from the cluster.
  INGESTER_STATUS_DECOMMISSIONED = 4;
  // The ingester failed to initialize and is not ready to accept requests.
  INGESTER_STATUS_FAILED = 5;
}

message ObservationMessage {
  string node_id = 1;
  IngesterStatus Status = 2;
}


================================================
FILE: quickwit/quickwit-proto/protos/quickwit/metastore.proto
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

syntax = "proto3";

package quickwit.metastore;

import "quickwit/common.proto";
import "quickwit/ingest.proto";

enum SourceType {
  SOURCE_TYPE_UNSPECIFIED = 0;
  SOURCE_TYPE_CLI = 1;
  SOURCE_TYPE_FILE = 2;
  SOURCE_TYPE_INGEST_V1 = 4;
  SOURCE_TYPE_INGEST_V2 = 5;
  // Apache Kafka
  SOURCE_TYPE_KAFKA = 6;
  // Amazon Kinesis
  SOURCE_TYPE_KINESIS = 7;
  SOURCE_TYPE_NATS = 8;
  // Google Cloud Pub/Sub
  SOURCE_TYPE_PUB_SUB = 3;
  // Apache Pulsar
  SOURCE_TYPE_PULSAR = 9;
  SOURCE_TYPE_VEC = 10;
  SOURCE_TYPE_VOID = 11;
  SOURCE_TYPE_STDIN = 13;
}

// Metastore meant to manage Quickwit's indexes, their splits and delete tasks.
//
// I. Index and splits management.
//
// Quickwit needs a way to ensure that we can cleanup unused files,
// and this process needs to be resilient to any fail-stop failures.
// We rely on atomically transitioning the status of splits.
//
// The split state goes through the following life cycle:
// 1. `Staged`
//   - Start uploading the split files.
// 2. `Published`
//   - Uploading the split files is complete and the split is searchable.
// 3. `MarkedForDeletion`
//   - Mark the split for deletion.
//
// If a split has a file in the storage, it MUST be registered in the metastore,
// and its state can be as follows:
// - `Staged`: The split is almost ready. Some of its files may have been uploaded in the storage.
// - `Published`: The split is ready and published.
// - `MarkedForDeletion`: The split is marked for deletion.
//
// Before creating any file, we need to stage the split. If there is a failure, upon recovery, we
// schedule for deletion all the staged splits. A client may not necessarily remove files from
// storage right after marking it for deletion. A CLI client may delete files right away, but a
// more serious deployment should probably only delete those files after a grace period so that the
// running search queries can complete.
//
// II. Delete tasks management.
//
// A delete task is defined on a given index and by a search query. It can be
// applied to all the splits of the index.
//
// Quickwit needs a way to track that a delete task has been applied to a split. This is ensured
// by two mechanisms:
// - On creation of a delete task, we give to the task a monotically increasing opstamp (uniqueness
//   and monotonically increasing must be true at the index level).
// - When a delete task is executed on a split, that is when the documents matched by the search
//   query are removed from the splits, we update the split's `delete_opstamp` to the value of the
//   task's opstamp. This marks the split as "up-to-date" regarding this delete task. If new delete
//   tasks are added, we will know that we need to run these delete tasks on the splits as its
//   `delete_optstamp` will be inferior to the `opstamp` of the new tasks.
//
// For splits created after a given delete task, Quickwit's indexing ensures that these splits
// are created with a `delete_opstamp` equal the latest opstamp of the tasks of the
// corresponding index.
service MetastoreService {
  // Creates an index.
  //
  // This API creates a new index in the metastore.
  // An error will occur if an index that already exists in the storage is specified.
  rpc CreateIndex(CreateIndexRequest) returns (CreateIndexResponse);

  // Update an index.
  rpc UpdateIndex(UpdateIndexRequest) returns (IndexMetadataResponse);

  // Returns the `IndexMetadata` of an index identified by its IndexID or its IndexUID.
  rpc IndexMetadata(IndexMetadataRequest) returns (IndexMetadataResponse);

  // Fetches the metadata of a list of indexes identified by their Index IDs or UIDs.
  rpc IndexesMetadata(IndexesMetadataRequest) returns (IndexesMetadataResponse);

  // Gets an indexes metadatas.
  rpc ListIndexesMetadata(ListIndexesMetadataRequest) returns (ListIndexesMetadataResponse);

  // Deletes an index
  rpc DeleteIndex(DeleteIndexRequest) returns (EmptyResponse);

  // Returns a list of size info for each index.
  rpc ListIndexStats(ListIndexStatsRequest) returns (ListIndexStatsResponse);

  // Streams splits from index.
  rpc ListSplits(ListSplitsRequest) returns (stream ListSplitsResponse);

  // Stages several splits.
  rpc StageSplits(StageSplitsRequest) returns (EmptyResponse);

  // Publishes split.
  rpc PublishSplits(PublishSplitsRequest) returns (EmptyResponse);

  // Marks splits for deletion.
  rpc MarkSplitsForDeletion(MarkSplitsForDeletionRequest) returns (EmptyResponse);

  // Deletes splits.
  rpc DeleteSplits(DeleteSplitsRequest) returns (EmptyResponse);

  // Adds a source.
  rpc AddSource(AddSourceRequest) returns (EmptyResponse);

  // Updates a source.
  rpc UpdateSource(UpdateSourceRequest) returns (EmptyResponse);

  // Toggles (turns on or off) source.
  rpc ToggleSource(ToggleSourceRequest) returns (EmptyResponse);

  // Removes source.
  rpc DeleteSource(DeleteSourceRequest) returns (EmptyResponse);

  // Resets source checkpoint.
  rpc ResetSourceCheckpoint(ResetSourceCheckpointRequest) returns (EmptyResponse);

  // Gets last opstamp for a given `index_id`.
  rpc LastDeleteOpstamp(LastDeleteOpstampRequest) returns (LastDeleteOpstampResponse);

  // Creates a delete task.
  rpc CreateDeleteTask(DeleteQuery) returns (DeleteTask);

  // Updates splits `delete_opstamp`.
  rpc UpdateSplitsDeleteOpstamp(UpdateSplitsDeleteOpstampRequest) returns (UpdateSplitsDeleteOpstampResponse);

  // Lists delete tasks with `delete_task.opstamp` > `opstamp_start` for a given `index_id`.
  rpc ListDeleteTasks(ListDeleteTasksRequest) returns (ListDeleteTasksResponse);

  // Lists splits with `split.delete_opstamp` < `delete_opstamp` for a given `index_id`.
  rpc ListStaleSplits(ListStaleSplitsRequest) returns (ListSplitsResponse);

  // Shard API
  //
  // Note that for the file-backed metastore implementation, the requests are not processed atomically.
  // Indeed, each request comprises one or more subrequests that target different indexes and sources processed
  // independently. Responses list the requests that succeeded or failed in the fields `successes` and
  // `failures`.
  rpc OpenShards(OpenShardsRequest) returns (OpenShardsResponse);

  // Acquires a set of shards for indexing. This RPC locks the shards for publishing thanks to a publish token and only
  // the last indexer that has acquired the shards is allowed to publish. The response returns for each subrequest the
  // list of acquired shards along with the positions to index from.
  //
  // If a requested shard is missing, this method does not return an error. It should simply return the list of
  // shards that were actually acquired.
  //
  // For this reason, AcquireShards.acquire_shards may return less subresponse than there was in the request.
  // Also they may be returned in any order.
  rpc AcquireShards(AcquireShardsRequest) returns (AcquireShardsResponse);

  // Deletes a set of shards. This RPC deletes the shards from the metastore.
  // If the shard did not exist to begin with, the operation is successful and does not return any error.
  rpc DeleteShards(DeleteShardsRequest) returns (DeleteShardsResponse);

  // Deletes outdated shards. This RPC deletes the shards from the metastore.
  rpc PruneShards(PruneShardsRequest) returns (EmptyResponse);

  rpc ListShards(ListShardsRequest) returns (ListShardsResponse);

  // Index Template API
  //
  // Index templates are used to create indexes with a predefined configuration.

  // Creates an index template.
  rpc CreateIndexTemplate(CreateIndexTemplateRequest) returns (EmptyResponse);

  // Fetches an index template.
  rpc GetIndexTemplate(GetIndexTemplateRequest) returns (GetIndexTemplateResponse);

  // Finds matching index templates.
  rpc FindIndexTemplateMatches(FindIndexTemplateMatchesRequest) returns (FindIndexTemplateMatchesResponse);

  // Returns all the index templates.
  rpc ListIndexTemplates(ListIndexTemplatesRequest) returns (ListIndexTemplatesResponse);

  // Deletes index templates.
  rpc DeleteIndexTemplates(DeleteIndexTemplatesRequest) returns (EmptyResponse);

  // Get cluster identity
  rpc GetClusterIdentity(GetClusterIdentityRequest) returns (GetClusterIdentityResponse);
}

message EmptyResponse {
}

message CreateIndexRequest {
  string index_config_json = 2;
  repeated string source_configs_json = 3;
}

message CreateIndexResponse {
  quickwit.common.IndexUid index_uid = 1;
  string index_metadata_json = 2;
}

message UpdateIndexRequest {
  quickwit.common.IndexUid index_uid = 1;
  string doc_mapping_json = 5;
  string indexing_settings_json = 4;
  string ingest_settings_json = 6;
  string search_settings_json = 2;
  optional string retention_policy_json_opt = 3;
}

message ListIndexesMetadataRequest {
  reserved  1;
  // List of patterns an index should match or not match to get considered
  // An index must match at least one positive pattern (a pattern not starting
  // with a '-'), and no negative pattern (a pattern starting with a '-').
  repeated string index_id_patterns = 2;
}

message ListIndexesMetadataResponse {
  // Deprecated (v0.9.0), use `indexes_metadata_json_zstd` instead.
  optional string indexes_metadata_json_opt = 1;
  // A JSON serialized then ZSTD compressed list of `IndexMetadata`: `Vec<IndexMetadata> | JSON | ZSTD`.
  // We don't use `repeated` here to increase the compression rate and ratio.
  bytes indexes_metadata_json_zstd = 2;
}

message DeleteIndexRequest {
  quickwit.common.IndexUid index_uid = 1;
}

// Request the metadata of an index.
// Either `index_uid` or `index_id` must be specified.
//
// If both are supplied, `index_uid` is used.
message IndexMetadataRequest {
  optional string index_id = 1;
  optional quickwit.common.IndexUid index_uid = 2;
}

message IndexMetadataResponse {
  string index_metadata_serialized_json = 1;
}

message IndexesMetadataRequest {
  repeated IndexMetadataSubrequest subrequests = 1;
}

message IndexMetadataSubrequest {
  optional string index_id = 1;
  optional quickwit.common.IndexUid index_uid = 2;
}

message IndexesMetadataResponse {
  // A JSON serialized then ZSTD compressed list of `IndexMetadata`: `Vec<IndexMetadata> | JSON | ZSTD`.
  // We don't use `repeated` here to increase the compression rate and ratio.
  bytes indexes_metadata_json_zstd = 1;
  repeated IndexMetadataFailure failures = 2;
}

message IndexMetadataFailure {
  optional string index_id = 1;
  optional quickwit.common.IndexUid index_uid = 2;
  IndexMetadataFailureReason reason = 3;
}

enum IndexMetadataFailureReason {
  INDEX_METADATA_FAILURE_REASON_UNSPECIFIED = 0;
  INDEX_METADATA_FAILURE_REASON_NOT_FOUND = 1;
  INDEX_METADATA_FAILURE_REASON_INTERNAL = 2;
}

message ListIndexStatsRequest {
  // List of patterns an index should match or not match to get considered
  // An index must match at least one positive pattern (a pattern not starting
  // with a '-'), and no negative pattern (a pattern starting with a '-').
  repeated string index_id_patterns = 1;
}

message ListIndexStatsResponse {
  // list of IndexStats. each one has the index id, the number of splits and the total size.
  repeated IndexStats index_stats = 1;
}

message IndexStats {
  quickwit.common.IndexUid index_uid = 1;
  SplitStats staged = 2;
  SplitStats published = 3;
  SplitStats marked_for_deletion = 4;
}

message SplitStats {
  uint64 num_splits = 1;
  uint64 total_size_bytes = 2;
}

message ListSplitsRequest {
  // Predicate used to filter splits.
  // The predicate is expressed as a JSON serialized
  // `ListSplitsQuery`.
  string query_json = 1;
}

message ListSplitsResponse {
  // TODO use repeated and encode splits json individually.
  string splits_serialized_json = 1;
}

message StageSplitsRequest {
  quickwit.common.IndexUid index_uid = 1;
  string split_metadata_list_serialized_json = 2;
}

message PublishSplitsRequest {
  quickwit.common.IndexUid index_uid = 1;
  repeated string staged_split_ids = 2;
  repeated string replaced_split_ids = 3;
  optional string index_checkpoint_delta_json_opt = 4;
  optional string publish_token_opt = 5;
}

message MarkSplitsForDeletionRequest {
  quickwit.common.IndexUid index_uid = 2;
  repeated string split_ids = 3;
}

message DeleteSplitsRequest {
  quickwit.common.IndexUid index_uid = 2;
  repeated string split_ids = 3;
}

message AddSourceRequest {
  quickwit.common.IndexUid index_uid = 1;
  string source_config_json = 2;
}

message UpdateSourceRequest {
  quickwit.common.IndexUid index_uid = 1;
  string source_config_json = 2;
}

message ToggleSourceRequest {
  quickwit.common.IndexUid index_uid = 1;
  string source_id = 2;
  bool enable = 3;
}

message DeleteSourceRequest {
  quickwit.common.IndexUid index_uid = 1;
  string source_id = 2;
}

message ResetSourceCheckpointRequest {
  quickwit.common.IndexUid index_uid = 1;
  string source_id = 2;
}

//
// Delete tasks API.
//

message DeleteTask {
  int64 create_timestamp = 1;
  uint64 opstamp = 2;
  DeleteQuery delete_query = 3;
}

message DeleteQuery {
  reserved 4, 5;

  // Index UID.
  quickwit.common.IndexUid index_uid = 1;
  // If set, restrict search to documents with a `timestamp >= start_timestamp`.
  optional int64 start_timestamp = 2;
  // If set, restrict search to documents with a `timestamp < end_timestamp``.
  optional int64 end_timestamp = 3;
  // Query AST serialized in JSON
  string query_ast = 6;
}

message UpdateSplitsDeleteOpstampRequest {
  quickwit.common.IndexUid index_uid = 1;
  repeated string split_ids = 2;
  uint64 delete_opstamp = 3;
}

message UpdateSplitsDeleteOpstampResponse {}

message LastDeleteOpstampRequest {
  quickwit.common.IndexUid index_uid = 1;
}

message LastDeleteOpstampResponse {
  uint64 last_delete_opstamp = 1;
}

message ListStaleSplitsRequest {
  quickwit.common.IndexUid index_uid = 1;
  uint64 delete_opstamp = 2;
  uint64 num_splits = 3;
}

message ListDeleteTasksRequest {
  quickwit.common.IndexUid index_uid = 1;
  uint64 opstamp_start = 2;
}

message ListDeleteTasksResponse {
  repeated DeleteTask delete_tasks = 1;
}

//
// Shard API
//

message OpenShardsRequest {
  repeated OpenShardSubrequest subrequests = 1;
}

message OpenShardSubrequest {
  uint32 subrequest_id = 1;
  quickwit.common.IndexUid index_uid = 2;
  string source_id = 3;
  quickwit.ingest.ShardId shard_id = 4;
  string leader_id = 5;
  optional string follower_id = 6;
  quickwit.common.DocMappingUid doc_mapping_uid = 7;
  optional string publish_token = 8;
}

message OpenShardsResponse {
  repeated OpenShardSubresponse subresponses = 1;
}

message OpenShardSubresponse {
  reserved 2, 3;

  uint32 subrequest_id = 1;
  quickwit.ingest.Shard open_shard = 4;
}

message AcquireShardsRequest {
  quickwit.common.IndexUid index_uid = 1;
  string source_id = 2;
  repeated quickwit.ingest.ShardId shard_ids = 3;
  string publish_token = 4;
}

message AcquireShardsResponse {
  // List of acquired shards, in no specific order.
  repeated quickwit.ingest.Shard acquired_shards = 3;
}

message DeleteShardsRequest {
  quickwit.common.IndexUid index_uid = 1;
  string source_id = 2;
  repeated quickwit.ingest.ShardId shard_ids = 3;
  // If false, only shards at EOF positions will be deleted.
  bool force = 4;
}

message DeleteShardsResponse {
  quickwit.common.IndexUid index_uid = 1;
  string source_id = 2;
  // List of shard IDs that were successfully deleted.
  repeated quickwit.ingest.ShardId successes = 3;
  // List of shard IDs that could not be deleted because `force` was set to `false` in the request,
  // and the shards are not at EOF, i.e., not fully indexed.
  repeated quickwit.ingest.ShardId failures = 4;
}

message PruneShardsRequest {
  quickwit.common.IndexUid index_uid = 1;
  string source_id = 2;
  // The maximum age of the shards to keep, in seconds.
  optional uint32 max_age_secs = 5;
  // The maximum number of the shards to keep. Delete older shards first.
  optional uint32 max_count = 6;
  // The interval between two pruning operations, in seconds.
  optional uint32 interval_secs = 7;
}

message ListShardsRequest {
  repeated ListShardsSubrequest subrequests = 1;
}

message ListShardsSubrequest {
  quickwit.common.IndexUid index_uid = 1;
  string source_id = 2;
  optional quickwit.ingest.ShardState shard_state = 3;
}

message ListShardsResponse {
  repeated ListShardsSubresponse subresponses = 1;
}

message ListShardsSubresponse {
  quickwit.common.IndexUid index_uid = 1;
  string source_id = 2;
  repeated quickwit.ingest.Shard shards = 3;
}

//
// Index Template API
//

message CreateIndexTemplateRequest {
  string index_template_json = 1;
  bool overwrite = 2;
}

message GetIndexTemplateRequest {
  string template_id = 1;
}

message GetIndexTemplateResponse {
  string index_template_json = 1;
}

message FindIndexTemplateMatchesRequest {
  repeated string index_ids = 1;
}

message FindIndexTemplateMatchesResponse {
  repeated IndexTemplateMatch matches = 1;
}

message IndexTemplateMatch {
  string index_id = 1;
  string template_id = 2;
  string index_template_json = 3;
}

message ListIndexTemplatesRequest {
}

message ListIndexTemplatesResponse {
  repeated string index_templates_json = 1;
}

message DeleteIndexTemplatesRequest {
  repeated string template_ids = 1;
}

message GetClusterIdentityRequest {
}

message GetClusterIdentityResponse {
  string uuid = 1;
}


================================================
FILE: quickwit/quickwit-proto/protos/quickwit/router.proto
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

syntax = "proto3";

package quickwit.ingest.router;

import "quickwit/common.proto";
import "quickwit/ingest.proto";

service IngestRouterService {
  // Ingests batches of documents for one or multiple indexes.
  // TODO: Describe error cases and how to handle them.
  rpc Ingest(IngestRequestV2) returns (IngestResponseV2);
}

message IngestRequestV2 {
  // There should be at most one subrequest per index per request.
  repeated IngestSubrequest subrequests = 1;
  quickwit.ingest.CommitTypeV2 commit_type = 2;
}

message IngestSubrequest {
  // The subrequest ID is used to identify the various subrequests and responses
  // (ingest, persist, replicate) at play during the ingest and replication
  // process.
  uint32 subrequest_id = 1;
  string index_id = 2;
  string source_id = 3;
  quickwit.ingest.DocBatchV2 doc_batch = 4;
}

message IngestResponseV2 {
  repeated IngestSuccess successes  = 1;
  repeated IngestFailure failures  = 2;
}

message IngestSuccess {
  uint32 subrequest_id = 1;
  quickwit.common.IndexUid index_uid = 2;
  string source_id = 3;
  quickwit.ingest.ShardId shard_id = 4;
  // Replication position inclusive.
  quickwit.ingest.Position replication_position_inclusive = 5;
  uint32 num_ingested_docs = 6;
  repeated quickwit.ingest.ParseFailure parse_failures = 7;
}

enum IngestFailureReason {
  INGEST_FAILURE_REASON_UNSPECIFIED = 0;
  INGEST_FAILURE_REASON_INDEX_NOT_FOUND = 1;
  INGEST_FAILURE_REASON_SOURCE_NOT_FOUND = 2;
  INGEST_FAILURE_REASON_INTERNAL = 3;
  INGEST_FAILURE_REASON_NO_SHARDS_AVAILABLE = 4;
  INGEST_FAILURE_REASON_SHARD_RATE_LIMITED = 5;
  INGEST_FAILURE_REASON_WAL_FULL = 6;
  INGEST_FAILURE_REASON_TIMEOUT = 7;
  INGEST_FAILURE_REASON_ROUTER_LOAD_SHEDDING = 8;
  INGEST_FAILURE_REASON_LOAD_SHEDDING = 9;
  INGEST_FAILURE_REASON_CIRCUIT_BREAKER = 10;
}

message IngestFailure {
  uint32 subrequest_id = 1;
  string index_id = 2;
  string source_id = 3;
  IngestFailureReason reason = 5;
}


================================================
FILE: quickwit/quickwit-proto/protos/quickwit/search.proto
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

syntax = "proto3";

package quickwit.search;

service SearchService {
  // Root search API.
  // This RPC identifies the set of splits on which the query should run on,
  // and dispatch the several calls to `LeafSearch`.
  //
  // It is also in charge of merging back the results.
  rpc RootSearch(SearchRequest) returns (SearchResponse);

  // Perform a leaf search on a given set of splits.
  //
  // It is like a regular search except that:
  // - the node should perform the search locally instead of dispatching
  //   it to other nodes.
  // - it should be applied on the given subset of splits
  // - Hit content is not fetched, and we instead return so called `PartialHit`.
  rpc LeafSearch(LeafSearchRequest) returns (LeafSearchResponse);

  /// Fetches the documents contents from the document store.
  /// This methods takes `PartialHit`s and returns `Hit`s.
  rpc FetchDocs(FetchDocsRequest) returns (FetchDocsResponse);

  // Root list terms API.
  // This RPC identifies the set of splits on which the query should run on,
  // and dispatches the several calls to `LeafListTerms`.
  //
  // It is also in charge of merging back the results.
  rpc RootListTerms(ListTermsRequest) returns (ListTermsResponse);

  // Performs a leaf list terms on a given set of splits.
  //
  // It is like a regular list term except that:
  // - the node should perform the listing locally instead of dispatching
  //   it to other nodes.
  // - it should be applied on the given subset of splits
  rpc LeafListTerms(LeafListTermsRequest) returns (LeafListTermsResponse);

  // Performs a scroll request.
  rpc Scroll(ScrollRequest) returns (SearchResponse);

  // gRPC request used to store a key in the local storage of the targeted node.
  // This RPC is used in the mini distributed immutable KV store embedded in quickwit.
  rpc PutKV(PutKVRequest) returns (PutKVResponse);

  // Gets a key from the local storage of the targeted node.
  // This RPC is used in the mini distributed immutable KV store embedded in quickwit.
  rpc GetKV(GetKVRequest) returns (GetKVResponse);

  rpc ReportSplits(ReportSplitsRequest) returns (ReportSplitsResponse);

  rpc ListFields(ListFieldsRequest) returns (ListFieldsResponse);

  rpc LeafListFields(LeafListFieldsRequest) returns (ListFieldsResponse);

  // Describe how a search would be processed.
  rpc SearchPlan(SearchRequest) returns (SearchPlanResponse);
}

/// Scroll Request
message ScrollRequest {
  /// The `scroll_id` is the given in the response of a search request including a scroll.
  string scroll_id = 1;
  optional uint32 scroll_ttl_secs = 2;
}

message PutKVRequest {
  bytes key = 1;
  bytes payload = 2;
  uint32 ttl_secs = 3;
}

message PutKVResponse {}

message GetKVRequest {
  bytes key = 1;
}

message GetKVResponse {
  optional bytes payload = 1;
}


message ReportSplit {
  // Split id (ULID format `01HAV29D4XY3D462FS3D8K5Q2H`)
  string split_id = 2;
  // The storage uri. This URI does NOT include the split id.
  string storage_uri = 1;
}

message ReportSplitsRequest {
  repeated ReportSplit report_splits = 1;
}

message ReportSplitsResponse {}

// -- ListFields -------------------

message ListFieldsRequest {
  // Index ID patterns
  repeated string index_id_patterns = 1;
  // Optional limit query to a list of fields
  // Wildcard expressions are supported.
  repeated string fields = 2;

  // Time filter, expressed in seconds since epoch.
  // That filter is to be interpreted as the semi-open interval:
  // [start_timestamp, end_timestamp).
  optional int64 start_timestamp = 3;
  optional int64 end_timestamp = 4;

  // JSON-serialized QueryAst for index_filter support.
  // When provided, only fields from documents matching this query are returned.
  optional string query_ast = 5;

  // Control if the request will fail if split_ids contains a split that does not exist.
  // optional bool fail_on_missing_index = 6;
}

message LeafListFieldsRequest {
  // The index id
  string index_id = 1;
  // The index uri
  string index_uri = 2;
  // Index split ids to apply the query on.
  // This ids are resolved from the index_uri defined in the search_request.
  repeated SplitIdAndFooterOffsets split_offsets = 3;

  // Optional limit query to a list of fields
  // Wildcard expressions are supported.
  repeated string fields = 4;
}

message ListFieldsResponse {
  repeated ListFieldsEntryResponse fields = 1;
}

message ListFieldsEntryResponse {
  string field_name = 1;
  ListFieldType field_type = 2;
  // The index ids the field exists
  repeated string index_ids = 3;
  // True means the field is searchable (indexed) in at least some indices.
  // False means the field is not searchable in any indices.
  bool searchable = 4;
  // True means the field is aggregatable (fast) in at least some indices.
  // False means the field is not aggregatable in any indices.
  bool aggregatable = 5;
  // The index ids the field exists, but is not searchable.
  repeated string non_searchable_index_ids = 6;
  // The index ids the field exists, but is not aggregatable
  repeated string non_aggregatable_index_ids = 7;
}

enum ListFieldType {
    STR = 0;
    U64 = 1;
    I64 = 2;
    F64 = 3;
    BOOL = 4;
    DATE = 5;
    FACET = 6;
    BYTES = 7;
    IP_ADDR = 8;
    JSON = 9;
}
message ListFields {
  repeated ListFieldsEntryResponse fields = 1;
}
// -- Search -------------------

message SearchRequest {
  // Index ID patterns
  repeated string index_id_patterns = 1;

  // deprecated `query``
  reserved 2;

  // Json object representing Quickwit's QueryAst.
  string query_ast = 13;

  // deprecated `search_fields``
  reserved 3;

  // Time filter, expressed in seconds since epoch.
  // That filter is to be interpreted as the semi-open interval:
  // [start_timestamp, end_timestamp).
  // If the query AST contains a range query over the timestamp field,
  // then the the bounds of the range query are used directly and
  // these two fields are ignored.
  optional int64 start_timestamp = 4;
  optional int64 end_timestamp = 5;

  // Maximum number of hits to return.
  uint64 max_hits = 6;

  // First hit to return. Together with max_hits, this parameter
  // can be used for pagination.
  //
  // E.g.
  // The results with rank [start_offset..start_offset + max_hits) are returned.
  uint64 start_offset = 7;

  // deprecated tag field
  reserved 8;

  // deprecated `sort_order``
  reserved 9;

  // deprecated `sort_by_field``
  reserved 10;

  // json serialized aggregation_request
  optional string aggregation_request = 11;

  // Fields to extract snippet on
  repeated string snippet_fields = 12;

  // Optional sort by one or more fields (limited to 2 at the moment).
  repeated SortField sort_fields = 14;

  // If set, the search response will include a search id
  // that will make it possible to paginate through the results
  // in a consistent manner.
  optional uint32 scroll_ttl_secs = 15;

  // Document with sort tuple smaller or equal to this are discarded to
  // enable pagination.
  // If split_id is empty, no comparison with _shard_doc should be done
  optional PartialHit search_after = 16;

  CountHits count_hits = 17;

  // When an exact index ID is provided (not a pattern), the query fails only if
  // that index is not found and this parameter is set to `false`.
  bool ignore_missing_indexes = 18;

  // When true, skip finalization of aggregation results and return
  // the raw IntermediateAggregationResults bytes instead.
  bool skip_aggregation_finalization = 19;
}

enum CountHits {
  // Count all hits, querying all splits.
  COUNT_ALL = 0;
  // Give an underestimate of the number of hits, possibly skipping entire
  // splits if they are otherwise not needed to fulfull a query.
  UNDERESTIMATE = 1;
}

message SortField {
  string field_name = 1;
  SortOrder sort_order = 2;
  // Optional sort value format for datetime field only.
  // If none, the default output format for datetime field is
  // unix_timestamp_nanos.
  optional SortDatetimeFormat sort_datetime_format = 3;
}

enum SortOrder {
  // Ascending order.
  ASC = 0;
  // Descending order.
  DESC = 1; //< This will be the default value;
}

// Sort value format for datetime field.
// We keep an enum with only one format
// for future extension.
enum SortDatetimeFormat {
  UNIX_TIMESTAMP_MILLIS = 0;
  UNIX_TIMESTAMP_NANOS = 1;
}

message SearchResponse {
  // Number of hits matching the query.
  uint64 num_hits = 1;
  // Matched hits
  repeated Hit hits = 2;
  // Elapsed time to perform the request. This time is measured
  // server-side and expressed in microseconds.
  uint64 elapsed_time_micros = 3;

  // The searcherrors that occurred formatted as string.
  repeated string errors = 4;

  // used to be json-encoded aggregation
  reserved 5;

  // Postcard-encoded aggregation response
  optional bytes aggregation_postcard = 9;

  // Scroll Id (only set if scroll_secs was set in the request)
  optional string scroll_id = 6;

  // Returns the list of splits for which search failed.
  // For the moment, the cause is unknown.
  //
  // It is up to the caller to decide whether to interpret
  // this as an overall failure or to present the partial results
  // to the end user.
  repeated SplitSearchError failed_splits = 7;

  // Total number of successful splits searched.
  uint64 num_successful_splits = 8;
}

message SearchPlanResponse {
  string result = 1;
}

message SplitSearchError {
  // The searcherror that occurred formatted as string.
  string error = 1;

  // Split id that failed.
  string split_id = 2;

  // Flag to indicate if the error can be considered a retryable error
  bool retryable_error = 3;
}

// A LeafSearchRequest can span multiple indices.
message LeafSearchRequest {
  // Search request. This is a perfect copy of the original search request
  // that was sent to root apart from the start_offset, max_hits params and index_id_patterns.
  // index_id_patterns contains the actual index ids queried on that leaf.
  SearchRequest search_request = 1;

  // List of leaf requests, one per index.
  repeated LeafRequestRef leaf_requests = 7;

  // List of unique doc_mappers serialized as json.
  repeated string doc_mappers = 8;

  // List of index uris
  // Index URI. The index URI defines the location of the storage that contains the
  // split files.
  repeated string index_uris = 9;
}

message ResourceStats {
    uint64 short_lived_cache_num_bytes = 1;
    uint64 split_num_docs = 2;
    uint64 warmup_microsecs = 3;
    uint64 cpu_thread_pool_wait_microsecs = 4;
    uint64 cpu_microsecs = 5;
}

// LeafRequestRef references data in LeafSearchRequest to deduplicate data.
message LeafRequestRef {
  // The ordinal of the doc_mapper in `LeafSearchRequest.doc_mappers`
  uint32 doc_mapper_ord = 1;

  // The ordinal of the index uri in LeafSearchRequest.index_uris
  uint32 index_uri_ord = 2;

  // Index split ids to apply the query on.
  // This ids are resolved from the index_uri defined in the search_request.
  repeated SplitIdAndFooterOffsets split_offsets = 3;
}

message SplitIdAndFooterOffsets {
  // Index split id to apply the query on.
  // This id is resolved from the index_uri defined in the search_request.
  string split_id = 1;
  // The offset of the start of footer in the split bundle. The footer contains the file bundle metadata and the hotcache.
  uint64 split_footer_start = 2;
  // The offset of the end of the footer in split bundle. The footer contains the file bundle metadata and the hotcache.
  uint64 split_footer_end = 3;
  // The lowest timestamp appearing in the split, in seconds since epoch
  optional int64 timestamp_start = 4;
  // The highest timestamp appearing in the split, in seconds since epoch
  optional int64 timestamp_end = 5;
  // The number of docs in the split
  uint64 num_docs = 6;
}

// Hits returned by a FetchDocRequest.
//
// The json that is joined is the raw tantivy json doc.
// It is very different from a quickwit json doc.
//
// For instance:
// - it may contain a _source and a _dynamic field.
// - since tantivy has no notion of cardinality,
//  all fields are arrays.
// - since tantivy has no notion of object, the object is
//  flattened by concatenating the path to the root.
//
// See  `quickwit_search::convert_leaf_hit`
message LeafHit {
  // The actual content of the hit/
  string leaf_json = 1;
  // The partial hit (ie: the sorting field + the document address)
  PartialHit partial_hit = 2;
  // A snippet of the matching content
  optional string leaf_snippet_json = 3;
}

message Hit {
  // The actual content of the hit
  string json = 1;
  // The partial hit (ie: the sorting field + the document address)
  PartialHit partial_hit = 2;
  // A snippet of the matching content
  optional string snippet = 3;
  // The index id of the hit
  string index_id = 4;
}


// A partial hit, is a hit for which we have not fetch the content yet.
// Instead, it holds a document_uri which is enough information to
// go and fetch the actual document data, by performing a `get_doc(...)`
// request.
message PartialHit {
  // Value of the sorting key for the given document.
  //
  // Quickwit only computes top-K of this sorting field.
  // If the user requested for a bottom-K of a given fast field, then quickwit simply
  // emits an decreasing mapping of this fast field.
  //
  // In case of a tie, quickwit uses the increasing order of
  // - the split_id,
  // - the segment_ord,
  // - the doc id.

  // Deprecated
  reserved 1;
  // Room for eventual future sorted key types.
  reserved 12 to 20;
  SortByValue sort_value = 10;
  SortByValue sort_value2 = 11;

  string split_id = 2;

  // (segment_ord, doc) form a tantivy DocAddress, which is sufficient to identify a document
  // within a split
  uint32 segment_ord = 3;

  // The DocId identifies a unique document at the scale of a tantivy segment.
  uint32 doc_id = 4;
}

message SortByValue {
  oneof sort_value {
  uint64 u64 = 1;
  int64 i64 = 2;
  double f64 = 3;
  bool boolean = 4;
  }
  // Room for eventual future sorted key types.
  reserved 5 to 20;
}

message LeafSearchResponse {
  // Total number of documents matched by the query.
  uint64 num_hits = 1;

  // List of the best top-K candidates for the given leaf query.
  repeated PartialHit partial_hits = 2;

  // The list of splits that failed. LeafSearchResponse can be an aggregation of results, so there may be multiple.
  repeated SplitSearchError failed_splits = 3;

  // Total number of attempt to search into splits.
  // We do have:
  // `num_splits_requested == num_successful_splits + num_failed_splits.len()`
  // But we do not necessarily have:
  // `num_splits_requested = num_attempted_splits because of retries.`
  uint64 num_attempted_splits = 4;

  // Total number of successful splits searched.
  uint64 num_successful_splits = 7;

  // Deprecated json serialized intermediate aggregation_result.
  reserved 5;

  // postcard serialized intermediate aggregation_result.
  optional bytes intermediate_aggregation_result = 6;

  ResourceStats resource_stats = 8;
}

// The result of searching a single split in a Lambda invocation.
// Each result is tagged with its split_id so that ordering is irrelevant.
message LambdaSingleSplitResult {
  // The split that was searched.
  string split_id = 1;
  oneof outcome {
    // On success, the leaf search response for this split.
    LeafSearchResponse response = 2;
    // On failure, the error message.
    string error = 3;
  }
}

// Wrapper for per-split results from a Lambda invocation.
message LambdaSearchResponses {
  reserved 1; // was: repeated LeafSearchResponse responses
  repeated LambdaSingleSplitResult split_results = 2;
}

message SnippetRequest {
  repeated string snippet_fields = 1;
  string query_ast_resolved = 2;
}

message FetchDocsRequest {
  // Request fetching the content of a given list of partial_hits.
  repeated PartialHit partial_hits = 1;

  // Split footer offsets. They are required for fetch docs to
  // fetch the document content in two reads, when the footer is not
  // cached.
  repeated SplitIdAndFooterOffsets split_offsets = 3;

  // Index URI. The index URI defines the location of the storage that contains the
  // split files.
  string index_uri = 4;

  optional SnippetRequest snippet_request = 7;

  // `DocMapper` as json serialized trait.
  string doc_mapper = 6;

  reserved 5;
}

message FetchDocsResponse {
  // List of complete hits.
  repeated LeafHit hits = 1;
}

message ListTermsRequest {
  // Index ID patterns
  repeated string index_id_patterns = 1;

  // Field to search on
  string field = 3;

  // Time filter
  optional int64 start_timestamp = 4;
  optional int64 end_timestamp = 5;

  // Maximum number of hits to return.
  optional uint64 max_hits = 6;

  // start_key is included, end_key is excluded
  optional bytes start_key = 7;
  optional bytes end_key = 8;
}

message ListTermsResponse {
  // Number of hits matching the query.
  uint64 num_hits = 1;
  // Matched hits
  repeated bytes terms = 2;
  // Elapsed time to perform the request. This time is measured
  // server-side and expressed in microseconds.
  uint64 elapsed_time_micros = 3;

  // The searcherrors that occurred formatted as string.
  repeated string errors = 4;
}

message LeafListTermsRequest {
  // Search request. This is a perfect copy of the original list request,
  ListTermsRequest list_terms_request = 1;

  // Index split ids to apply the query on.
  // This ids are resolved from the index_uri defined in the search_request.
  repeated SplitIdAndFooterOffsets split_offsets = 2;

  // Index URI. The index URI defines the location of the storage that contains the
  // split files.
  string index_uri = 3;
}

message LeafListTermsResponse {
  // Total number of documents matched by the query.
  uint64 num_hits = 1;

  // List of the first K terms the given leaf query.
  repeated bytes terms = 2;

  // The list of splits that failed. LeafSearchResponse can be an aggregation of results, so there may be multiple.
  repeated SplitSearchError failed_splits = 3;

  // Total number of single split search attempted.
  uint64 num_attempted_splits = 4;
}


================================================
FILE: quickwit/quickwit-proto/protos/third-party/gogoproto/gogo.proto
================================================
// Protocol Buffers for Go with Gadgets
//
// Copyright (c) 2013, The GoGo Authors. All rights reserved.
// http://github.com/gogo/protobuf
//
// Redistribution and use in source and binary forms, with or without
// modification, are permitted provided that the following conditions are
// met:
//
//     * Redistributions of source code must retain the above copyright
// notice, this list of conditions and the following disclaimer.
//     * Redistributions in binary form must reproduce the above
// copyright notice, this list of conditions and the following disclaimer
// in the documentation and/or other materials provided with the
// distribution.
//
// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
// "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
// LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
// A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
// OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
// SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
// LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
// DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
// THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

syntax = "proto2";
package gogoproto;

import "google/protobuf/descriptor.proto";

option java_package = "com.google.protobuf";
option java_outer_classname = "GoGoProtos";
option go_package = "github.com/gogo/protobuf/gogoproto";

extend google.protobuf.EnumOptions {
	optional bool goproto_enum_prefix = 62001;
	optional bool goproto_enum_stringer = 62021;
	optional bool enum_stringer = 62022;
	optional string enum_customname = 62023;
	optional bool enumdecl = 62024;
}

extend google.protobuf.EnumValueOptions {
	optional string enumvalue_customname = 66001;
}

extend google.protobuf.FileOptions {
	optional bool goproto_getters_all = 63001;
	optional bool goproto_enum_prefix_all = 63002;
	optional bool goproto_stringer_all = 63003;
	optional bool verbose_equal_all = 63004;
	optional bool face_all = 63005;
	optional bool gostring_all = 63006;
	optional bool populate_all = 63007;
	optional bool stringer_all = 63008;
	optional bool onlyone_all = 63009;

	optional bool equal_all = 63013;
	optional bool description_all = 63014;
	optional bool testgen_all = 63015;
	optional bool benchgen_all = 63016;
	optional bool marshaler_all = 63017;
	optional bool unmarshaler_all = 63018;
	optional bool stable_marshaler_all = 63019;

	optional bool sizer_all = 63020;

	optional bool goproto_enum_stringer_all = 63021;
	optional bool enum_stringer_all = 63022;

	optional bool unsafe_marshaler_all = 63023;
	optional bool unsafe_unmarshaler_all = 63024;

	optional bool goproto_extensions_map_all = 63025;
	optional bool goproto_unrecognized_all = 63026;
	optional bool gogoproto_import = 63027;
	optional bool protosizer_all = 63028;
	optional bool compare_all = 63029;
    optional bool typedecl_all = 63030;
    optional bool enumdecl_all = 63031;

	optional bool goproto_registration = 63032;
	optional bool messagename_all = 63033;

	optional bool goproto_sizecache_all = 63034;
	optional bool goproto_unkeyed_all = 63035;
}

extend google.protobuf.MessageOptions {
	optional bool goproto_getters = 64001;
	optional bool goproto_stringer = 64003;
	optional bool verbose_equal = 64004;
	optional bool face = 64005;
	optional bool gostring = 64006;
	optional bool populate = 64007;
	optional bool stringer = 67008;
	optional bool onlyone = 64009;

	optional bool equal = 64013;
	optional bool description = 64014;
	optional bool testgen = 64015;
	optional bool benchgen = 64016;
	optional bool marshaler = 64017;
	optional bool unmarshaler = 64018;
	optional bool stable_marshaler = 64019;

	optional bool sizer = 64020;

	optional bool unsafe_marshaler = 64023;
	optional bool unsafe_unmarshaler = 64024;

	optional bool goproto_extensions_map = 64025;
	optional bool goproto_unrecognized = 64026;

	optional bool protosizer = 64028;
	optional bool compare = 64029;

	optional bool typedecl = 64030;

	optional bool messagename = 64033;

	optional bool goproto_sizecache = 64034;
	optional bool goproto_unkeyed = 64035;
}

extend google.protobuf.FieldOptions {
	optional bool nullable = 65001;
	optional bool embed = 65002;
	optional string customtype = 65003;
	optional string customname = 65004;
	optional string jsontag = 65005;
	optional string moretags = 65006;
	optional string casttype = 65007;
	optional string castkey = 65008;
	optional string castvalue = 65009;

	optional bool stdtime = 65010;
	optional bool stdduration = 65011;
	optional bool wktpointer = 65012;

}


================================================
FILE: quickwit/quickwit-proto/protos/third-party/google/protobuf/any.proto
================================================
// Protocol Buffers - Google's data interchange format
// Copyright 2008 Google Inc.  All rights reserved.
// https://developers.google.com/protocol-buffers/
//
// Redistribution and use in source and binary forms, with or without
// modification, are permitted provided that the following conditions are
// met:
//
//     * Redistributions of source code must retain the above copyright
// notice, this list of conditions and the following disclaimer.
//     * Redistributions in binary form must reproduce the above
// copyright notice, this list of conditions and the following disclaimer
// in the documentation and/or other materials provided with the
// distribution.
//     * Neither the name of Google Inc. nor the names of its
// contributors may be used to endorse or promote products derived from
// this software without specific prior written permission.
//
// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
// "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
// LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
// A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
// OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
// SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
// LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
// DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
// THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

syntax = "proto3";

package google.protobuf;

option csharp_namespace = "Google.Protobuf.WellKnownTypes";
option go_package = "google.golang.org/protobuf/types/known/anypb";
option java_package = "com.google.protobuf";
option java_outer_classname = "AnyProto";
option java_multiple_files = true;
option objc_class_prefix = "GPB";

// `Any` contains an arbitrary serialized protocol buffer message along with a
// URL that describes the type of the serialized message.
//
// Protobuf library provides support to pack/unpack Any values in the form
// of utility functions or additional generated methods of the Any type.
//
// Example 1: Pack and unpack a message in C++.
//
//     Foo foo = ...;
//     Any any;
//     any.PackFrom(foo);
//     ...
//     if (any.UnpackTo(&foo)) {
//       ...
//     }
//
// Example 2: Pack and unpack a message in Java.
//
//     Foo foo = ...;
//     Any any = Any.pack(foo);
//     ...
//     if (any.is(Foo.class)) {
//       foo = any.unpack(Foo.class);
//     }
//
// Example 3: Pack and unpack a message in Python.
//
//     foo = Foo(...)
//     any = Any()
//     any.Pack(foo)
//     ...
//     if any.Is(Foo.DESCRIPTOR):
//       any.Unpack(foo)
//       ...
//
// Example 4: Pack and unpack a message in Go
//
//      foo := &pb.Foo{...}
//      any, err := anypb.New(foo)
//      if err != nil {
//        ...
//      }
//      ...
//      foo := &pb.Foo{}
//      if err := any.UnmarshalTo(foo); err != nil {
//        ...
//      }
//
// The pack methods provided by protobuf library will by default use
// 'type.googleapis.com/full.type.name' as the type URL and the unpack
// methods only use the fully qualified type name after the last '/'
// in the type URL, for example "foo.bar.com/x/y.z" will yield type
// name "y.z".
//
//
// JSON
//
// The JSON representation of an `Any` value uses the regular
// representation of the deserialized, embedded message, with an
// additional field `@type` which contains the type URL. Example:
//
//     package google.profile;
//     message Person {
//       string first_name = 1;
//       string last_name = 2;
//     }
//
//     {
//       "@type": "type.googleapis.com/google.profile.Person",
//       "firstName": <string>,
//       "lastName": <string>
//     }
//
// If the embedded message type is well-known and has a custom JSON
// representation, that representation will be embedded adding a field
// `value` which holds the custom JSON in addition to the `@type`
// field. Example (for message [google.protobuf.Duration][]):
//
//     {
//       "@type": "type.googleapis.com/google.protobuf.Duration",
//       "value": "1.212s"
//     }
//
message Any {
  // A URL/resource name that uniquely identifies the type of the serialized
  // protocol buffer message. This string must contain at least
  // one "/" character. The last segment of the URL's path must represent
  // the fully qualified name of the type (as in
  // `path/google.protobuf.Duration`). The name should be in a canonical form
  // (e.g., leading "." is not accepted).
  //
  // In practice, teams usually precompile into the binary all types that they
  // expect it to use in the context of Any. However, for URLs which use the
  // scheme `http`, `https`, or no scheme, one can optionally set up a type
  // server that maps type URLs to message definitions as follows:
  //
  // * If no scheme is provided, `https` is assumed.
  // * An HTTP GET on the URL must yield a [google.protobuf.Type][]
  //   value in binary format, or produce an error.
  // * Applications are allowed to cache lookup results based on the
  //   URL, or have them precompiled into a binary to avoid any
  //   lookup. Therefore, binary compatibility needs to be preserved
  //   on changes to types. (Use versioned type names to manage
  //   breaking changes.)
  //
  // Note: this functionality is not currently available in the official
  // protobuf release, and it is not used for type URLs beginning with
  // type.googleapis.com.
  //
  // Schemes other than `http`, `https` (or the empty scheme) might be
  // used with implementation specific semantics.
  //
  string type_url = 1;

  // Must be a valid serialized protocol buffer of the above specified type.
  bytes value = 2;
}


================================================
FILE: quickwit/quickwit-proto/protos/third-party/google/protobuf/api.proto
================================================
// Protocol Buffers - Google's data interchange format
// Copyright 2008 Google Inc.  All rights reserved.
// https://developers.google.com/protocol-buffers/
//
// Redistribution and use in source and binary forms, with or without
// modification, are permitted provided that the following conditions are
// met:
//
//     * Redistributions of source code must retain the above copyright
// notice, this list of conditions and the following disclaimer.
//     * Redistributions in binary form must reproduce the above
// copyright notice, this list of conditions and the following disclaimer
// in the documentation and/or other materials provided with the
// distribution.
//     * Neither the name of Google Inc. nor the names of its
// contributors may be used to endorse or promote products derived from
// this software without specific prior written permission.
//
// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
// "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
// LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
// A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
// OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
// SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
// LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
// DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
// THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

syntax = "proto3";

package google.protobuf;

import "google/protobuf/source_context.proto";
import "google/protobuf/type.proto";

option csharp_namespace = "Google.Protobuf.WellKnownTypes";
option java_package = "com.google.protobuf";
option java_outer_classname = "ApiProto";
option java_multiple_files = true;
option objc_class_prefix = "GPB";
option go_package = "google.golang.org/protobuf/types/known/apipb";

// Api is a light-weight descriptor for an API Interface.
//
// Interfaces are also described as "protocol buffer services" in some contexts,
// such as by the "service" keyword in a .proto file, but they are different
// from API Services, which represent a concrete implementation of an interface
// as opposed to simply a description of methods and bindings. They are also
// sometimes simply referred to as "APIs" in other contexts, such as the name of
// this message itself. See https://cloud.google.com/apis/design/glossary for
// detailed terminology.
message Api {
  // The fully qualified name of this interface, including package name
  // followed by the interface's simple name.
  string name = 1;

  // The methods of this interface, in unspecified order.
  repeated Method methods = 2;

  // Any metadata attached to the interface.
  repeated Option options = 3;

  // A version string for this interface. If specified, must have the form
  // `major-version.minor-version`, as in `1.10`. If the minor version is
  // omitted, it defaults to zero. If the entire version field is empty, the
  // major version is derived from the package name, as outlined below. If the
  // field is not empty, the version in the package name will be verified to be
  // consistent with what is provided here.
  //
  // The versioning schema uses [semantic
  // versioning](http://semver.org) where the major version number
  // indicates a breaking change and the minor version an additive,
  // non-breaking change. Both version numbers are signals to users
  // what to expect from different versions, and should be carefully
  // chosen based on the product plan.
  //
  // The major version is also reflected in the package name of the
  // interface, which must end in `v<major-version>`, as in
  // `google.feature.v1`. For major versions 0 and 1, the suffix can
  // be omitted. Zero major versions must only be used for
  // experimental, non-GA interfaces.
  //
  //
  string version = 4;

  // Source context for the protocol buffer service represented by this
  // message.
  SourceContext source_context = 5;

  // Included interfaces. See [Mixin][].
  repeated Mixin mixins = 6;

  // The source syntax of the service.
  Syntax syntax = 7;
}

// Method represents a method of an API interface.
message Method {
  // The simple name of this method.
  string name = 1;

  // A URL of the input message type.
  string request_type_url = 2;

  // If true, the request is streamed.
  bool request_streaming = 3;

  // The URL of the output message type.
  string response_type_url = 4;

  // If true, the response is streamed.
  bool response_streaming = 5;

  // Any metadata attached to the method.
  repeated Option options = 6;

  // The source syntax of this method.
  Syntax syntax = 7;
}

// Declares an API Interface to be included in this interface. The including
// interface must redeclare all the methods from the included interface, but
// documentation and options are inherited as follows:
//
// - If after comment and whitespace stripping, the documentation
//   string of the redeclared method is empty, it will be inherited
//   from the original method.
//
// - Each annotation belonging to the service config (http,
//   visibility) which is not set in the redeclared method will be
//   inherited.
//
// - If an http annotation is inherited, the path pattern will be
//   modified as follows. Any version prefix will be replaced by the
//   version of the including interface plus the [root][] path if
//   specified.
//
// Example of a simple mixin:
//
//     package google.acl.v1;
//     service AccessControl {
//       // Get the underlying ACL object.
//       rpc GetAcl(GetAclRequest) returns (Acl) {
//         option (google.api.http).get = "/v1/{resource=**}:getAcl";
//       }
//     }
//
//     package google.storage.v2;
//     service Storage {
//       rpc GetAcl(GetAclRequest) returns (Acl);
//
//       // Get a data record.
//       rpc GetData(GetDataRequest) returns (Data) {
//         option (google.api.http).get = "/v2/{resource=**}";
//       }
//     }
//
// Example of a mixin configuration:
//
//     apis:
//     - name: google.storage.v2.Storage
//       mixins:
//       - name: google.acl.v1.AccessControl
//
// The mixin construct implies that all methods in `AccessControl` are
// also declared with same name and request/response types in
// `Storage`. A documentation generator or annotation processor will
// see the effective `Storage.GetAcl` method after inheriting
// documentation and annotations as follows:
//
//     service Storage {
//       // Get the underlying ACL object.
//       rpc GetAcl(GetAclRequest) returns (Acl) {
//         option (google.api.http).get = "/v2/{resource=**}:getAcl";
//       }
//       ...
//     }
//
// Note how the version in the path pattern changed from `v1` to `v2`.
//
// If the `root` field in the mixin is specified, it should be a
// relative path under which inherited HTTP paths are placed. Example:
//
//     apis:
//     - name: google.storage.v2.Storage
//       mixins:
//       - name: google.acl.v1.AccessControl
//         root: acls
//
// This implies the following inherited HTTP annotation:
//
//     service Storage {
//       // Get the underlying ACL object.
//       rpc GetAcl(GetAclRequest) returns (Acl) {
//         option (google.api.http).get = "/v2/acls/{resource=**}:getAcl";
//       }
//       ...
//     }
message Mixin {
  // The fully qualified name of the interface which is included.
  string name = 1;

  // If non-empty specifies a path under which inherited HTTP paths
  // are rooted.
  string root = 2;
}


================================================
FILE: quickwit/quickwit-proto/protos/third-party/google/protobuf/descriptor.proto
================================================
// Protocol Buffers - Google's data interchange format
// Copyright 2008 Google Inc.  All rights reserved.
// https://developers.google.com/protocol-buffers/
//
// Redistribution and use in source and binary forms, with or without
// modification, are permitted provided that the following conditions are
// met:
//
//     * Redistributions of source code must retain the above copyright
// notice, this list of conditions and the following disclaimer.
//     * Redistributions in binary form must reproduce the above
// copyright notice, this list of conditions and the following disclaimer
// in the documentation and/or other materials provided with the
// distribution.
//     * Neither the name of Google Inc. nor the names of its
// contributors may be used to endorse or promote products derived from
// this software without specific prior written permission.
//
// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
// "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
// LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
// A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
// OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
// SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
// LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
// DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
// THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

// Author: kenton@google.com (Kenton Varda)
//  Based on original Protocol Buffers design by
//  Sanjay Ghemawat, Jeff Dean, and others.
//
// The messages in this file describe the definitions found in .proto files.
// A valid .proto file can be translated directly to a FileDescriptorProto
// without any other information (e.g. without reading its imports).


syntax = "proto2";

package google.protobuf;

option go_package = "google.golang.org/protobuf/types/descriptorpb";
option java_package = "com.google.protobuf";
option java_outer_classname = "DescriptorProtos";
option csharp_namespace = "Google.Protobuf.Reflection";
option objc_class_prefix = "GPB";
option cc_enable_arenas = true;

// descriptor.proto must be optimized for speed because reflection-based
// algorithms don't work during bootstrapping.
option optimize_for = SPEED;

// The protocol compiler can output a FileDescriptorSet containing the .proto
// files it parses.
message FileDescriptorSet {
  repeated FileDescriptorProto file = 1;
}

// Describes a complete .proto file.
message FileDescriptorProto {
  optional string name = 1;     // file name, relative to root of source tree
  optional string package = 2;  // e.g. "foo", "foo.bar", etc.

  // Names of files imported by this file.
  repeated string dependency = 3;
  // Indexes of the public imported files in the dependency list above.
  repeated int32 public_dependency = 10;
  // Indexes of the weak imported files in the dependency list.
  // For Google-internal migration only. Do not use.
  repeated int32 weak_dependency = 11;

  // All top-level definitions in this file.
  repeated DescriptorProto message_type = 4;
  repeated EnumDescriptorProto enum_type = 5;
  repeated ServiceDescriptorProto service = 6;
  repeated FieldDescriptorProto extension = 7;

  optional FileOptions options = 8;

  // This field contains optional information about the original source code.
  // You may safely remove this entire field without harming runtime
  // functionality of the descriptors -- the information is needed only by
  // development tools.
  optional SourceCodeInfo source_code_info = 9;

  // The syntax of the proto file.
  // The supported values are "proto2" and "proto3".
  optional string syntax = 12;
}

// Describes a message type.
message DescriptorProto {
  optional string name = 1;

  repeated FieldDescriptorProto field = 2;
  repeated FieldDescriptorProto extension = 6;

  repeated DescriptorProto nested_type = 3;
  repeated EnumDescriptorProto enum_type = 4;

  message ExtensionRange {
    optional int32 start = 1;  // Inclusive.
    optional int32 end = 2;    // Exclusive.

    optional ExtensionRangeOptions options = 3;
  }
  repeated ExtensionRange extension_range = 5;

  repeated OneofDescriptorProto oneof_decl = 8;

  optional MessageOptions options = 7;

  // Range of reserved tag numbers. Reserved tag numbers may not be used by
  // fields or extension ranges in the same message. Reserved ranges may
  // not overlap.
  message ReservedRange {
    optional int32 start = 1;  // Inclusive.
    optional int32 end = 2;    // Exclusive.
  }
  repeated ReservedRange reserved_range = 9;
  // Reserved field names, which may not be used by fields in the same message.
  // A given name may only be reserved once.
  repeated string reserved_name = 10;
}

message ExtensionRangeOptions {
  // The parser stores options it doesn't recognize here. See above.
  repeated UninterpretedOption uninterpreted_option = 999;


  // Clients can define custom options in extensions of this message. See above.
  extensions 1000 to max;
}

// Describes a field within a message.
message FieldDescriptorProto {
  enum Type {
    // 0 is reserved for errors.
    // Order is weird for historical reasons.
    TYPE_DOUBLE = 1;
    TYPE_FLOAT = 2;
    // Not ZigZag encoded.  Negative numbers take 10 bytes.  Use TYPE_SINT64 if
    // negative values are likely.
    TYPE_INT64 = 3;
    TYPE_UINT64 = 4;
    // Not ZigZag encoded.  Negative numbers take 10 bytes.  Use TYPE_SINT32 if
    // negative values are likely.
    TYPE_INT32 = 5;
    TYPE_FIXED64 = 6;
    TYPE_FIXED32 = 7;
    TYPE_BOOL = 8;
    TYPE_STRING = 9;
    // Tag-delimited aggregate.
    // Group type is deprecated and not supported in proto3. However, Proto3
    // implementations should still be able to parse the group wire format and
    // treat group fields as unknown fields.
    TYPE_GROUP = 10;
    TYPE_MESSAGE = 11;  // Length-delimited aggregate.

    // New in version 2.
    TYPE_BYTES = 12;
    TYPE_UINT32 = 13;
    TYPE_ENUM = 14;
    TYPE_SFIXED32 = 15;
    TYPE_SFIXED64 = 16;
    TYPE_SINT32 = 17;  // Uses ZigZag encoding.
    TYPE_SINT64 = 18;  // Uses ZigZag encoding.
  }

  enum Label {
    // 0 is reserved for errors
    LABEL_OPTIONAL = 1;
    LABEL_REQUIRED = 2;
    LABEL_REPEATED = 3;
  }

  optional string name = 1;
  optional int32 number = 3;
  optional Label label = 4;

  // If type_name is set, this need not be set.  If both this and type_name
  // are set, this must be one of TYPE_ENUM, TYPE_MESSAGE or TYPE_GROUP.
  optional Type type = 5;

  // For message and enum types, this is the name of the type.  If the name
  // starts with a '.', it is fully-qualified.  Otherwise, C++-like scoping
  // rules are used to find the type (i.e. first the nested types within this
  // message are searched, then within the parent, on up to the root
  // namespace).
  optional string type_name = 6;

  // For extensions, this is the name of the type being extended.  It is
  // resolved in the same manner as type_name.
  optional string extendee = 2;

  // For numeric types, contains the original text representation of the value.
  // For booleans, "true" or "false".
  // For strings, contains the default text contents (not escaped in any way).
  // For bytes, contains the C escaped value.  All bytes >= 128 are escaped.
  optional string default_value = 7;

  // If set, gives the index of a oneof in the containing type's oneof_decl
  // list.  This field is a member of that oneof.
  optional int32 oneof_index = 9;

  // JSON name of this field. The value is set by protocol compiler. If the
  // user has set a "json_name" option on this field, that option's value
  // will be used. Otherwise, it's deduced from the field's name by converting
  // it to camelCase.
  optional string json_name = 10;

  optional FieldOptions options = 8;

  // If true, this is a proto3 "optional". When a proto3 field is optional, it
  // tracks presence regardless of field type.
  //
  // When proto3_optional is true, this field must be belong to a oneof to
  // signal to old proto3 clients that presence is tracked for this field. This
  // oneof is known as a "synthetic" oneof, and this field must be its sole
  // member (each proto3 optional field gets its own synthetic oneof). Synthetic
  // oneofs exist in the descriptor only, and do not generate any API. Synthetic
  // oneofs must be ordered after all "real" oneofs.
  //
  // For message fields, proto3_optional doesn't create any semantic change,
  // since non-repeated message fields always track presence. However it still
  // indicates the semantic detail of whether the user wrote "optional" or not.
  // This can be useful for round-tripping the .proto file. For consistency we
  // give message fields a synthetic oneof also, even though it is not required
  // to track presence. This is especially important because the parser can't
  // tell if a field is a message or an enum, so it must always create a
  // synthetic oneof.
  //
  // Proto2 optional fields do not set this flag, because they already indicate
  // optional with `LABEL_OPTIONAL`.
  optional bool proto3_optional = 17;
}

// Describes a oneof.
message OneofDescriptorProto {
  optional string name = 1;
  optional OneofOptions options = 2;
}

// Describes an enum type.
message EnumDescriptorProto {
  optional string name = 1;

  repeated EnumValueDescriptorProto value = 2;

  optional EnumOptions options = 3;

  // Range of reserved numeric values. Reserved values may not be used by
  // entries in the same enum. Reserved ranges may not overlap.
  //
  // Note that this is distinct from DescriptorProto.ReservedRange in that it
  // is inclusive such that it can appropriately represent the entire int32
  // domain.
  message EnumReservedRange {
    optional int32 start = 1;  // Inclusive.
    optional int32 end = 2;    // Inclusive.
  }

  // Range of reserved numeric values. Reserved numeric values may not be used
  // by enum values in the same enum declaration. Reserved ranges may not
  // overlap.
  repeated EnumReservedRange reserved_range = 4;

  // Reserved enum value names, which may not be reused. A given name may only
  // be reserved once.
  repeated string reserved_name = 5;
}

// Describes a value within an enum.
message EnumValueDescriptorProto {
  optional string name = 1;
  optional int32 number = 2;

  optional EnumValueOptions options = 3;
}

// Describes a service.
message ServiceDescriptorProto {
  optional string name = 1;
  repeated MethodDescriptorProto method = 2;

  optional ServiceOptions options = 3;
}

// Describes a method of a service.
message MethodDescriptorProto {
  optional string name = 1;

  // Input and output type names.  These are resolved in the same way as
  // FieldDescriptorProto.type_name, but must refer to a message type.
  optional string input_type = 2;
  optional string output_type = 3;

  optional MethodOptions options = 4;

  // Identifies if client streams multiple client messages
  optional bool client_streaming = 5 [default = false];
  // Identifies if server streams multiple server messages
  optional bool server_streaming = 6 [default = false];
}


// ===================================================================
// Options

// Each of the definitions above may have "options" attached.  These are
// just annotations which may cause code to be generated slightly differently
// or may contain hints for code that manipulates protocol messages.
//
// Clients may define custom options as extensions of the *Options messages.
// These extensions may not yet be known at parsing time, so the parser cannot
// store the values in them.  Instead it stores them in a field in the *Options
// message called uninterpreted_option. This field must have the same name
// across all *Options messages. We then use this field to populate the
// extensions when we build a descriptor, at which point all protos have been
// parsed and so all extensions are known.
//
// Extension numbers for custom options may be chosen as follows:
// * For options which will only be used within a single application or
//   organization, or for experimental options, use field numbers 50000
//   through 99999.  It is up to you to ensure that you do not use the
//   same number for multiple options.
// * For options which will be published and used publicly by multiple
//   independent entities, e-mail protobuf-global-extension-registry@google.com
//   to reserve extension numbers. Simply provide your project name (e.g.
//   Objective-C plugin) and your project website (if available) -- there's no
//   need to explain how you intend to use them. Usually you only need one
//   extension number. You can declare multiple options with only one extension
//   number by putting them in a sub-message. See the Custom Options section of
//   the docs for examples:
//   https://developers.google.com/protocol-buffers/docs/proto#options
//   If this turns out to be popular, a web service will be set up
//   to automatically assign option numbers.

message FileOptions {

  // Sets the Java package where classes generated from this .proto will be
  // placed.  By default, the proto package is used, but this is often
  // inappropriate because proto packages do not normally start with backwards
  // domain names.
  optional string java_package = 1;


  // Controls the name of the wrapper Java class generated for the .proto file.
  // That class will always contain the .proto file's getDescriptor() method as
  // well as any top-level extensions defined in the .proto file.
  // If java_multiple_files is disabled, then all the other classes from the
  // .proto file will be nested inside the single wrapper outer class.
  optional string java_outer_classname = 8;

  // If enabled, then the Java code generator will generate a separate .java
  // file for each top-level message, enum, and service defined in the .proto
  // file.  Thus, these types will *not* be nested inside the wrapper class
  // named by java_outer_classname.  However, the wrapper class will still be
  // generated to contain the file's getDescriptor() method as well as any
  // top-level extensions defined in the file.
  optional bool java_multiple_files = 10 [default = false];

  // This option does nothing.
  optional bool java_generate_equals_and_hash = 20 [deprecated=true];

  // If set true, then the Java2 code generator will generate code that
  // throws an exception whenever an attempt is made to assign a non-UTF-8
  // byte sequence to a string field.
  // Message reflection will do the same.
  // However, an extension field still accepts non-UTF-8 byte sequences.
  // This option has no effect on when used with the lite runtime.
  optional bool java_string_check_utf8 = 27 [default = false];


  // Generated classes can be optimized for speed or code size.
  enum OptimizeMode {
    SPEED = 1;         // Generate complete code for parsing, serialization,
                       // etc.
    CODE_SIZE = 2;     // Use ReflectionOps to implement these methods.
    LITE_RUNTIME = 3;  // Generate code using MessageLite and the lite runtime.
  }
  optional OptimizeMode optimize_for = 9 [default = SPEED];

  // Sets the Go package where structs generated from this .proto will be
  // placed. If omitted, the Go package will be derived from the following:
  //   - The basename of the package import path, if provided.
  //   - Otherwise, the package statement in the .proto file, if present.
  //   - Otherwise, the basename of the .proto file, without extension.
  optional string go_package = 11;


  // Should generic services be generated in each language?  "Generic" services
  // are not specific to any particular RPC system.  They are generated by the
  // main code generators in each language (without additional plugins).
  // Generic services were the only kind of service generation supported by
  // early versions of google.protobuf.
  //
  // Generic services are now considered deprecated in favor of using plugins
  // that generate code specific to your particular RPC system.  Therefore,
  // these default to false.  Old code which depends on generic services should
  // explicitly set them to true.
  optional bool cc_generic_services = 16 [default = false];
  optional bool java_generic_services = 17 [default = false];
  optional bool py_generic_services = 18 [default = false];
  optional bool php_generic_services = 42 [default = false];

  // Is this file deprecated?
  // Depending on the target platform, this can emit Deprecated annotations
  // for everything in the file, or it will be completely ignored; in the very
  // least, this is a formalization for deprecating files.
  optional bool deprecated = 23 [default = false];

  // Enables the use of arenas for the proto messages in this file. This applies
  // only to generated classes for C++.
  optional bool cc_enable_arenas = 31 [default = true];


  // Sets the objective c class prefix which is prepended to all objective c
  // generated classes from this .proto. There is no default.
  optional string objc_class_prefix = 36;

  // Namespace for generated classes; defaults to the package.
  optional string csharp_namespace = 37;

  // By default Swift generators will take the proto package and CamelCase it
  // replacing '.' with underscore and use that to prefix the types/symbols
  // defined. When this options is provided, they will use this value instead
  // to prefix the types/symbols defined.
  optional string swift_prefix = 39;

  // Sets the php class prefix which is prepended to all php generated classes
  // from this .proto. Default is empty.
  optional string php_class_prefix = 40;

  // Use this option to change the namespace of php generated classes. Default
  // is empty. When this option is empty, the package name will be used for
  // determining the namespace.
  optional string php_namespace = 41;

  // Use this option to change the namespace of php generated metadata classes.
  // Default is empty. When this option is empty, the proto file name will be
  // used for determining the namespace.
  optional string php_metadata_namespace = 44;

  // Use this option to change the package of ruby generated classes. Default
  // is empty. When this option is not set, the package name will be used for
  // determining the ruby package.
  optional string ruby_package = 45;


  // The parser stores options it doesn't recognize here.
  // See the documentation for the "Options" section above.
  repeated UninterpretedOption uninterpreted_option = 999;

  // Clients can define custom options in extensions of this message.
  // See the documentation for the "Options" section above.
  extensions 1000 to max;

  reserved 38;
}

message MessageOptions {
  // Set true to use the old proto1 MessageSet wire format for extensions.
  // This is provided for backwards-compatibility with the MessageSet wire
  // format.  You should not use this for any other reason:  It's less
  // efficient, has fewer features, and is more complicated.
  //
  // The message must be defined exactly as follows:
  //   message Foo {
  //     option message_set_wire_format = true;
  //     extensions 4 to max;
  //   }
  // Note that the message cannot have any defined fields; MessageSets only
  // have extensions.
  //
  // All extensions of your type must be singular messages; e.g. they cannot
  // be int32s, enums, or repeated messages.
  //
  // Because this is an option, the above two restrictions are not enforced by
  // the protocol compiler.
  optional bool message_set_wire_format = 1 [default = false];

  // Disables the generation of the standard "descriptor()" accessor, which can
  // conflict with a field of the same name.  This is meant to make migration
  // from proto1 easier; new code should avoid fields named "descriptor".
  optional bool no_standard_descriptor_accessor = 2 [default = false];

  // Is this message deprecated?
  // Depending on the target platform, this can emit Deprecated annotations
  // for the message, or it will be completely ignored; in the very least,
  // this is a formalization for deprecating messages.
  optional bool deprecated = 3 [default = false];

  reserved 4, 5, 6;

  // Whether the message is an automatically generated map entry type for the
  // maps field.
  //
  // For maps fields:
  //     map<KeyType, ValueType> map_field = 1;
  // The parsed descriptor looks like:
  //     message MapFieldEntry {
  //         option map_entry = true;
  //         optional KeyType key = 1;
  //         optional ValueType value = 2;
  //     }
  //     repeated MapFieldEntry map_field = 1;
  //
  // Implementations may choose not to generate the map_entry=true message, but
  // use a native map in the target language to hold the keys and values.
  // The reflection APIs in such implementations still need to work as
  // if the field is a repeated message field.
  //
  // NOTE: Do not set the option in .proto files. Always use the maps syntax
  // instead. The option should only be implicitly set by the proto compiler
  // parser.
  optional bool map_entry = 7;

  reserved 8;  // javalite_serializable
  reserved 9;  // javanano_as_lite


  // The parser stores options it doesn't recognize here. See above.
  repeated UninterpretedOption uninterpreted_option = 999;

  // Clients can define custom options in extensions of this message. See above.
  extensions 1000 to max;
}

message FieldOptions {
  // The ctype option instructs the C++ code generator to use a different
  // representation of the field than it normally would.  See the specific
  // options below.  This option is not yet implemented in the open source
  // release -- sorry, we'll try to include it in a future version!
  optional CType ctype = 1 [default = STRING];
  enum CType {
    // Default mode.
    STRING = 0;

    CORD = 1;

    STRING_PIECE = 2;
  }
  // The packed option can be enabled for repeated primitive fields to enable
  // a more efficient representation on the wire. Rather than repeatedly
  // writing the tag and type for each element, the entire array is encoded as
  // a single length-delimited blob. In proto3, only explicit setting it to
  // false will avoid using packed encoding.
  optional bool packed = 2;

  // The jstype option determines the JavaScript type used for values of the
  // field.  The option is permitted only for 64 bit integral and fixed types
  // (int64, uint64, sint64, fixed64, sfixed64).  A field with jstype JS_STRING
  // is represented as JavaScript string, which avoids loss of precision that
  // can happen when a large value is converted to a floating point JavaScript.
  // Specifying JS_NUMBER for the jstype causes the generated JavaScript code to
  // use the JavaScript "number" type.  The behavior of the default option
  // JS_NORMAL is implementation dependent.
  //
  // This option is an enum to permit additional types to be added, e.g.
  // goog.math.Integer.
  optional JSType jstype = 6 [default = JS_NORMAL];
  enum JSType {
    // Use the default type.
    JS_NORMAL = 0;

    // Use JavaScript strings.
    JS_STRING = 1;

    // Use JavaScript numbers.
    JS_NUMBER = 2;
  }

  // Should this field be parsed lazily?  Lazy applies only to message-type
  // fields.  It means that when the outer message is initially parsed, the
  // inner message's contents will not be parsed but instead stored in encoded
  // form.  The inner message will actually be parsed when it is first accessed.
  //
  // This is only a hint.  Implementations are free to choose whether to use
  // eager or lazy parsing regardless of the value of this option.  However,
  // setting this option true suggests that the protocol author believes that
  // using lazy parsing on this field is worth the additional bookkeeping
  // overhead typically needed to implement it.
  //
  // This option does not affect the public interface of any generated code;
  // all method signatures remain the same.  Furthermore, thread-safety of the
  // interface is not affected by this option; const methods remain safe to
  // call from multiple threads concurrently, while non-const methods continue
  // to require exclusive access.
  //
  //
  // Note that implementations may choose not to check required fields within
  // a lazy sub-message.  That is, calling IsInitialized() on the outer message
  // may return true even if the inner message has missing required fields.
  // This is necessary because otherwise the inner message would have to be
  // parsed in order to perform the check, defeating the purpose of lazy
  // parsing.  An implementation which chooses not to check required fields
  // must be consistent about it.  That is, for any particular sub-message, the
  // implementation must either *always* check its required fields, or *never*
  // check its required fields, regardless of whether or not the message has
  // been parsed.
  //
  // As of 2021, lazy does no correctness checks on the byte stream during
  // parsing.  This may lead to crashes if and when an invalid byte stream is
  // finally parsed upon access.
  //
  // TODO(b/211906113):  Enable validation on lazy fields.
  optional bool lazy = 5 [default = false];

  // unverified_lazy does no correctness checks on the byte stream. This should
  // only be used where lazy with verification is prohibitive for performance
  // reasons.
  optional bool unverified_lazy = 15 [default = false];

  // Is this field deprecated?
  // Depending on the target platform, this can emit Deprecated annotations
  // for accessors, or it will be completely ignored; in the very least, this
  // is a formalization for deprecating fields.
  optional bool deprecated = 3 [default = false];

  // For Google-internal migration only. Do not use.
  optional bool weak = 10 [default = false];


  // The parser stores options it doesn't recognize here. See above.
  repeated UninterpretedOption uninterpreted_option = 999;

  // Clients can define custom options in extensions of this message. See above.
  extensions 1000 to max;

  reserved 4;  // removed jtype
}

message OneofOptions {
  // The parser stores options it doesn't recognize here. See above.
  repeated UninterpretedOption uninterpreted_option = 999;

  // Clients can define custom options in extensions of this message. See above.
  extensions 1000 to max;
}

message EnumOptions {

  // Set this option to true to allow mapping different tag names to the same
  // value.
  optional bool allow_alias = 2;

  // Is this enum deprecated?
  // Depending on the target platform, this can emit Deprecated annotations
  // for the enum, or it will be completely ignored; in the very least, this
  // is a formalization for deprecating enums.
  optional bool deprecated = 3 [default = false];

  reserved 5;  // javanano_as_lite

  // The parser stores options it doesn't recognize here. See above.
  repeated UninterpretedOption uninterpreted_option = 999;

  // Clients can define custom options in extensions of this message. See above.
  extensions 1000 to max;
}

message EnumValueOptions {
  // Is this enum value deprecated?
  // Depending on the target platform, this can emit Deprecated annotations
  // for the enum value, or it will be completely ignored; in the very least,
  // this is a formalization for deprecating enum values.
  optional bool deprecated = 1 [default = false];

  // The parser stores options it doesn't recognize here. See above.
  repeated UninterpretedOption uninterpreted_option = 999;

  // Clients can define custom options in extensions of this message. See above.
  extensions 1000 to max;
}

message ServiceOptions {

  // Note:  Field numbers 1 through 32 are reserved for Google's internal RPC
  //   framework.  We apologize for hoarding these numbers to ourselves, but
  //   we were already using them long before we decided to release Protocol
  //   Buffers.

  // Is this service deprecated?
  // Depending on the target platform, this can emit Deprecated annotations
  // for the service, or it will be completely ignored; in the very least,
  // this is a formalization for deprecating services.
  optional bool deprecated = 33 [default = false];

  // The parser stores options it doesn't recognize here. See above.
  repeated UninterpretedOption uninterpreted_option = 999;

  // Clients can define custom options in extensions of this message. See above.
  extensions 1000 to max;
}

message MethodOptions {

  // Note:  Field numbers 1 through 32 are reserved for Google's internal RPC
  //   framework.  We apologize for hoarding these numbers to ourselves, but
  //   we were already using them long before we decided to release Protocol
  //   Buffers.

  // Is this method deprecated?
  // Depending on the target platform, this can emit Deprecated annotations
  // for the method, or it will be completely ignored; in the very least,
  // this is a formalization for deprecating methods.
  optional bool deprecated = 33 [default = false];

  // Is this method side-effect-free (or safe in HTTP parlance), or idempotent,
  // or neither? HTTP based RPC implementation may choose GET verb for safe
  // methods, and PUT verb for idempotent methods instead of the default POST.
  enum IdempotencyLevel {
    IDEMPOTENCY_UNKNOWN = 0;
    NO_SIDE_EFFECTS = 1;  // implies idempotent
    IDEMPOTENT = 2;       // idempotent, but may have side effects
  }
  optional IdempotencyLevel idempotency_level = 34
      [default = IDEMPOTENCY_UNKNOWN];

  // The parser stores options it doesn't recognize here. See above.
  repeated UninterpretedOption uninterpreted_option = 999;

  // Clients can define custom options in extensions of this message. See above.
  extensions 1000 to max;
}


// A message representing a option the parser does not recognize. This only
// appears in options protos created by the compiler::Parser class.
// DescriptorPool resolves these when building Descriptor objects. Therefore,
// options protos in descriptor objects (e.g. returned by Descriptor::options(),
// or produced by Descriptor::CopyTo()) will never have UninterpretedOptions
// in them.
message UninterpretedOption {
  // The name of the uninterpreted option.  Each string represents a segment in
  // a dot-separated name.  is_extension is true iff a segment represents an
  // extension (denoted with parentheses in options specs in .proto files).
  // E.g.,{ ["foo", false], ["bar.baz", true], ["moo", false] } represents
  // "foo.(bar.baz).moo".
  message NamePart {
    required string name_part = 1;
    required bool is_extension = 2;
  }
  repeated NamePart name = 2;

  // The value of the uninterpreted option, in whatever type the tokenizer
  // identified it as during parsing. Exactly one of these should be set.
  optional string identifier_value = 3;
  optional uint64 positive_int_value = 4;
  optional int64 negative_int_value = 5;
  optional double double_value = 6;
  optional bytes string_value = 7;
  optional string aggregate_value = 8;
}

// ===================================================================
// Optional source code info

// Encapsulates information about the original source file from which a
// FileDescriptorProto was generated.
message SourceCodeInfo {
  // A Location identifies a piece of source code in a .proto file which
  // corresponds to a particular definition.  This information is intended
  // to be useful to IDEs, code indexers, documentation generators, and similar
  // tools.
  //
  // For example, say we have a file like:
  //   message Foo {
  //     optional string foo = 1;
  //   }
  // Let's look at just the field definition:
  //   optional string foo = 1;
  //   ^       ^^     ^^  ^  ^^^
  //   a       bc     de  f  ghi
  // We have the following locations:
  //   span   path               represents
  //   [a,i)  [ 4, 0, 2, 0 ]     The whole field definition.
  //   [a,b)  [ 4, 0, 2, 0, 4 ]  The label (optional).
  //   [c,d)  [ 4, 0, 2, 0, 5 ]  The type (string).
  //   [e,f)  [ 4, 0, 2, 0, 1 ]  The name (foo).
  //   [g,h)  [ 4, 0, 2, 0, 3 ]  The number (1).
  //
  // Notes:
  // - A location may refer to a repeated field itself (i.e. not to any
  //   particular index within it).  This is used whenever a set of elements are
  //   logically enclosed in a single code segment.  For example, an entire
  //   extend block (possibly containing multiple extension definitions) will
  //   have an outer location whose path refers to the "extensions" repeated
  //   field without an index.
  // - Multiple locations may have the same path.  This happens when a single
  //   logical declaration is spread out across multiple places.  The most
  //   obvious example is the "extend" block again -- there may be multiple
  //   extend blocks in the same scope, each of which will have the same path.
  // - A location's span is not always a subset of its parent's span.  For
  //   example, the "extendee" of an extension declaration appears at the
  //   beginning of the "extend" block and is shared by all extensions within
  //   the block.
  // - Just because a location's span is a subset of some other location's span
  //   does not mean that it is a descendant.  For example, a "group" defines
  //   both a type and a field in a single declaration.  Thus, the locations
  //   corresponding to the type and field and their components will overlap.
  // - Code which tries to interpret locations should probably be designed to
  //   ignore those that it doesn't understand, as more types of locations could
  //   be recorded in the future.
  repeated Location location = 1;
  message Location {
    // Identifies which part of the FileDescriptorProto was defined at this
    // location.
    //
    // Each element is a field number or an index.  They form a path from
    // the root FileDescriptorProto to the place where the definition occurs.
    // For example, this path:
    //   [ 4, 3, 2, 7, 1 ]
    // refers to:
    //   file.message_type(3)  // 4, 3
    //       .field(7)         // 2, 7
    //       .name()           // 1
    // This is because FileDescriptorProto.message_type has field number 4:
    //   repeated DescriptorProto message_type = 4;
    // and DescriptorProto.field has field number 2:
    //   repeated FieldDescriptorProto field = 2;
    // and FieldDescriptorProto.name has field number 1:
    //   optional string name = 1;
    //
    // Thus, the above path gives the location of a field name.  If we removed
    // the last element:
    //   [ 4, 3, 2, 7 ]
    // this path refers to the whole field declaration (from the beginning
    // of the label to the terminating semicolon).
    repeated int32 path = 1 [packed = true];

    // Always has exactly three or four elements: start line, start column,
    // end line (optional, otherwise assumed same as start line), end column.
    // These are packed into a single field for efficiency.  Note that line
    // and column numbers are zero-based -- typically you will want to add
    // 1 to each before displaying to a user.
    repeated int32 span = 2 [packed = true];

    // If this SourceCodeInfo represents a complete declaration, these are any
    // comments appearing before and after the declaration which appear to be
    // attached to the declaration.
    //
    // A series of line comments appearing on consecutive lines, with no other
    // tokens appearing on those lines, will be treated as a single comment.
    //
    // leading_detached_comments will keep paragraphs of comments that appear
    // before (but not connected to) the current element. Each paragraph,
    // separated by empty lines, will be one comment element in the repeated
    // field.
    //
    // Only the comment content is provided; comment markers (e.g. //) are
    // stripped out.  For block comments, leading whitespace and an asterisk
    // will be stripped from the beginning of each line other than the first.
    // Newlines are included in the output.
    //
    // Examples:
    //
    //   optional int32 foo = 1;  // Comment attached to foo.
    //   // Comment attached to bar.
    //   optional int32 bar = 2;
    //
    //   optional string baz = 3;
    //   // Comment attached to baz.
    //   // Another line attached to baz.
    //
    //   // Comment attached to moo.
    //   //
    //   // Another line attached to moo.
    //   optional double moo = 4;
    //
    //   // Detached comment for corge. This is not leading or trailing comments
    //   // to moo or corge because there are blank lines separating it from
    //   // both.
    //
    //   // Detached comment for corge paragraph 2.
    //
    //   optional string corge = 5;
    //   /* Block comment attached
    //    * to corge.  Leading asterisks
    //    * will be removed. */
    //   /* Block comment attached to
    //    * grault. */
    //   optional int32 grault = 6;
    //
    //   // ignored detached comments.
    optional string leading_comments = 3;
    optional string trailing_comments = 4;
    repeated string leading_detached_comments = 6;
  }
}

// Describes the relationship between generated code and its original source
// file. A GeneratedCodeInfo message is associated with only one generated
// source file, but may contain references to different source .proto files.
message GeneratedCodeInfo {
  // An Annotation connects some span of text in generated code to an element
  // of its generating .proto file.
  repeated Annotation annotation = 1;
  message Annotation {
    // Identifies the element in the original source .proto file. This field
    // is formatted the same as SourceCodeInfo.Location.path.
    repeated int32 path = 1 [packed = true];

    // Identifies the filesystem path to the original source .proto.
    optional string source_file = 2;

    // Identifies the starting offset in bytes in the generated code
    // that relates to the identified object.
    optional int32 begin = 3;

    // Identifies the ending offset in bytes in the generated code that
    // relates to the identified offset. The end offset should be one past
    // the last relevant byte (so the length of the text = end - begin).
    optional int32 end = 4;
  }
}


================================================
FILE: quickwit/quickwit-proto/protos/third-party/google/protobuf/duration.proto
================================================
// Protocol Buffers - Google's data interchange format
// Copyright 2008 Google Inc.  All rights reserved.
// https://developers.google.com/protocol-buffers/
//
// Redistribution and use in source and binary forms, with or without
// modification, are permitted provided that the following conditions are
// met:
//
//     * Redistributions of source code must retain the above copyright
// notice, this list of conditions and the following disclaimer.
//     * Redistributions in binary form must reproduce the above
// copyright notice, this list of conditions and the following disclaimer
// in the documentation and/or other materials provided with the
// distribution.
//     * Neither the name of Google Inc. nor the names of its
// contributors may be used to endorse or promote products derived from
// this software without specific prior written permission.
//
// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
// "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
// LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
// A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
// OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
// SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
// LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
// DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
// THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

syntax = "proto3";

package google.protobuf;

option csharp_namespace = "Google.Protobuf.WellKnownTypes";
option cc_enable_arenas = true;
option go_package = "google.golang.org/protobuf/types/known/durationpb";
option java_package = "com.google.protobuf";
option java_outer_classname = "DurationProto";
option java_multiple_files = true;
option objc_class_prefix = "GPB";

// A Duration represents a signed, fixed-length span of time represented
// as a count of seconds and fractions of seconds at nanosecond
// resolution. It is independent of any calendar and concepts like "day"
// or "month". It is related to Timestamp in that the difference between
// two Timestamp values is a Duration and it can be added or subtracted
// from a Timestamp. Range is approximately +-10,000 years.
//
// # Examples
//
// Example 1: Compute Duration from two Timestamps in pseudo code.
//
//     Timestamp start = ...;
//     Timestamp end = ...;
//     Duration duration = ...;
//
//     duration.seconds = end.seconds - start.seconds;
//     duration.nanos = end.nanos - start.nanos;
//
//     if (duration.seconds < 0 && duration.nanos > 0) {
//       duration.seconds += 1;
//       duration.nanos -= 1000000000;
//     } else if (duration.seconds > 0 && duration.nanos < 0) {
//       duration.seconds -= 1;
//       duration.nanos += 1000000000;
//     }
//
// Example 2: Compute Timestamp from Timestamp + Duration in pseudo code.
//
//     Timestamp start = ...;
//     Duration duration = ...;
//     Timestamp end = ...;
//
//     end.seconds = start.seconds + duration.seconds;
//     end.nanos = start.nanos + duration.nanos;
//
//     if (end.nanos < 0) {
//       end.seconds -= 1;
//       end.nanos += 1000000000;
//     } else if (end.nanos >= 1000000000) {
//       end.seconds += 1;
//       end.nanos -= 1000000000;
//     }
//
// Example 3: Compute Duration from datetime.timedelta in Python.
//
//     td = datetime.timedelta(days=3, minutes=10)
//     duration = Duration()
//     duration.FromTimedelta(td)
//
// # JSON Mapping
//
// In JSON format, the Duration type is encoded as a string rather than an
// object, where the string ends in the suffix "s" (indicating seconds) and
// is preceded by the number of seconds, with nanoseconds expressed as
// fractional seconds. For example, 3 seconds with 0 nanoseconds should be
// encoded in JSON format as "3s", while 3 seconds and 1 nanosecond should
// be expressed in JSON format as "3.000000001s", and 3 seconds and 1
// microsecond should be expressed in JSON format as "3.000001s".
//
//
message Duration {
  // Signed seconds of the span of time. Must be from -315,576,000,000
  // to +315,576,000,000 inclusive. Note: these bounds are computed from:
  // 60 sec/min * 60 min/hr * 24 hr/day * 365.25 days/year * 10000 years
  int64 seconds = 1;

  // Signed fractions of a second at nanosecond resolution of the span
  // of time. Durations less than one second are represented with a 0
  // `seconds` field and a positive or negative `nanos` field. For durations
  // of one second or more, a non-zero value for the `nanos` field must be
  // of the same sign as the `seconds` field. Must be from -999,999,999
  // to +999,999,999 inclusive.
  int32 nanos = 2;
}


================================================
FILE: quickwit/quickwit-proto/protos/third-party/google/protobuf/empty.proto
================================================
// Protocol Buffers - Google's data interchange format
// Copyright 2008 Google Inc.  All rights reserved.
// https://developers.google.com/protocol-buffers/
//
// Redistribution and use in source and binary forms, with or without
// modification, are permitted provided that the following conditions are
// met:
//
//     * Redistributions of source code must retain the above copyright
// notice, this list of conditions and the following disclaimer.
//     * Redistributions in binary form must reproduce the above
// copyright notice, this list of conditions and the following disclaimer
// in the documentation and/or other materials provided with the
// distribution.
//     * Neither the name of Google Inc. nor the names of its
// contributors may be used to endorse or promote products derived from
// this software without specific prior written permission.
//
// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
// "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
// LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
// A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
// OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
// SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
// LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
// DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
// THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

syntax = "proto3";

package google.protobuf;

option csharp_namespace = "Google.Protobuf.WellKnownTypes";
option go_package = "google.golang.org/protobuf/types/known/emptypb";
option java_package = "com.google.protobuf";
option java_outer_classname = "EmptyProto";
option java_multiple_files = true;
option objc_class_prefix = "GPB";
option cc_enable_arenas = true;

// A generic empty message that you can re-use to avoid defining duplicated
// empty messages in your APIs. A typical example is to use it as the request
// or the response type of an API method. For instance:
//
//     service Foo {
//       rpc Bar(google.protobuf.Empty) returns (google.protobuf.Empty);
//     }
//
message Empty {}


================================================
FILE: quickwit/quickwit-proto/protos/third-party/google/protobuf/field_mask.proto
================================================
// Protocol Buffers - Google's data interchange format
// Copyright 2008 Google Inc.  All rights reserved.
// https://developers.google.com/protocol-buffers/
//
// Redistribution and use in source and binary forms, with or without
// modification, are permitted provided that the following conditions are
// met:
//
//     * Redistributions of source code must retain the above copyright
// notice, this list of conditions and the following disclaimer.
//     * Redistributions in binary form must reproduce the above
// copyright notice, this list of conditions and the following disclaimer
// in the documentation and/or other materials provided with the
// distribution.
//     * Neither the name of Google Inc. nor the names of its
// contributors may be used to endorse or promote products derived from
// this software without specific prior written permission.
//
// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
// "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
// LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
// A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
// OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
// SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
// LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
// DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
// THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

syntax = "proto3";

package google.protobuf;

option csharp_namespace = "Google.Protobuf.WellKnownTypes";
option java_package = "com.google.protobuf";
option java_outer_classname = "FieldMaskProto";
option java_multiple_files = true;
option objc_class_prefix = "GPB";
option go_package = "google.golang.org/protobuf/types/known/fieldmaskpb";
option cc_enable_arenas = true;

// `FieldMask` represents a set of symbolic field paths, for example:
//
//     paths: "f.a"
//     paths: "f.b.d"
//
// Here `f` represents a field in some root message, `a` and `b`
// fields in the message found in `f`, and `d` a field found in the
// message in `f.b`.
//
// Field masks are used to specify a subset of fields that should be
// returned by a get operation or modified by an update operation.
// Field masks also have a custom JSON encoding (see below).
//
// # Field Masks in Projections
//
// When used in the context of a projection, a response message or
// sub-message is filtered by the API to only contain those fields as
// specified in the mask. For example, if the mask in the previous
// example is applied to a response message as follows:
//
//     f {
//       a : 22
//       b {
//         d : 1
//         x : 2
//       }
//       y : 13
//     }
//     z: 8
//
// The result will not contain specific values for fields x,y and z
// (their value will be set to the default, and omitted in proto text
// output):
//
//
//     f {
//       a : 22
//       b {
//         d : 1
//       }
//     }
//
// A repeated field is not allowed except at the last position of a
// paths string.
//
// If a FieldMask object is not present in a get operation, the
// operation applies to all fields (as if a FieldMask of all fields
// had been specified).
//
// Note that a field mask does not necessarily apply to the
// top-level response message. In case of a REST get operation, the
// field mask applies directly to the response, but in case of a REST
// list operation, the mask instead applies to each individual message
// in the returned resource list. In case of a REST custom method,
// other definitions may be used. Where the mask applies will be
// clearly documented together with its declaration in the API.  In
// any case, the effect on the returned resource/resources is required
// behavior for APIs.
//
// # Field Masks in Update Operations
//
// A field mask in update operations specifies which fields of the
// targeted resource are going to be updated. The API is required
// to only change the values of the fields as specified in the mask
// and leave the others untouched. If a resource is passed in to
// describe the updated values, the API ignores the values of all
// fields not covered by the mask.
//
// If a repeated field is specified for an update operation, new values will
// be appended to the existing repeated field in the target resource. Note that
// a repeated field is only allowed in the last position of a `paths` string.
//
// If a sub-message is specified in the last position of the field mask for an
// update operation, then new value will be merged into the existing sub-message
// in the target resource.
//
// For example, given the target message:
//
//     f {
//       b {
//         d: 1
//         x: 2
//       }
//       c: [1]
//     }
//
// And an update message:
//
//     f {
//       b {
//         d: 10
//       }
//       c: [2]
//     }
//
// then if the field mask is:
//
//  paths: ["f.b", "f.c"]
//
// then the result will be:
//
//     f {
//       b {
//         d: 10
//         x: 2
//       }
//       c: [1, 2]
//     }
//
// An implementation may provide options to override this default behavior for
// repeated and message fields.
//
// In order to reset a field's value to the default, the field must
// be in the mask and set to the default value in the provided resource.
// Hence, in order to reset all fields of a resource, provide a default
// instance of the resource and set all fields in the mask, or do
// not provide a mask as described below.
//
// If a field mask is not present on update, the operation applies to
// all fields (as if a field mask of all fields has been specified).
// Note that in the presence of schema evolution, this may mean that
// fields the client does not know and has therefore not filled into
// the request will be reset to their default. If this is unwanted
// behavior, a specific service may require a client to always specify
// a field mask, producing an error if not.
//
// As with get operations, the location of the resource which
// describes the updated values in the request message depends on the
// operation kind. In any case, the effect of the field mask is
// required to be honored by the API.
//
// ## Considerations for HTTP REST
//
// The HTTP kind of an update operation which uses a field mask must
// be set to PATCH instead of PUT in order to satisfy HTTP semantics
// (PUT must only be used for full updates).
//
// # JSON Encoding of Field Masks
//
// In JSON, a field mask is encoded as a single string where paths are
// separated by a comma. Fields name in each path are converted
// to/from lower-camel naming conventions.
//
// As an example, consider the following message declarations:
//
//     message Profile {
//       User user = 1;
//       Photo photo = 2;
//     }
//     message User {
//       string display_name = 1;
//       string address = 2;
//     }
//
// In proto a field mask for `Profile` may look as such:
//
//     mask {
//       paths: "user.display_name"
//       paths: "photo"
//     }
//
// In JSON, the same mask is represented as below:
//
//     {
//       mask: "user.displayName,photo"
//     }
//
// # Field Masks and Oneof Fields
//
// Field masks treat fields in oneofs just as regular fields. Consider the
// following message:
//
//     message SampleMessage {
//       oneof test_oneof {
//         string name = 4;
//         SubMessage sub_message = 9;
//       }
//     }
//
// The field mask can be:
//
//     mask {
//       paths: "name"
//     }
//
// Or:
//
//     mask {
//       paths: "sub_message"
//     }
//
// Note that oneof type names ("test_oneof" in this case) cannot be used in
// paths.
//
// ## Field Mask Verification
//
// The implementation of any API method which has a FieldMask type field in the
// request should verify the included field paths, and return an
// `INVALID_ARGUMENT` error if any path is unmappable.
message FieldMask {
  // The set of field mask paths.
  repeated string paths = 1;
}


================================================
FILE: quickwit/quickwit-proto/protos/third-party/google/protobuf/source_context.proto
================================================
// Protocol Buffers - Google's data interchange format
// Copyright 2008 Google Inc.  All rights reserved.
// https://developers.google.com/protocol-buffers/
//
// Redistribution and use in source and binary forms, with or without
// modification, are permitted provided that the following conditions are
// met:
//
//     * Redistributions of source code must retain the above copyright
// notice, this list of conditions and the following disclaimer.
//     * Redistributions in binary form must reproduce the above
// copyright notice, this list of conditions and the following disclaimer
// in the documentation and/or other materials provided with the
// distribution.
//     * Neither the name of Google Inc. nor the names of its
// contributors may be used to endorse or promote products derived from
// this software without specific prior written permission.
//
// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
// "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
// LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
// A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
// OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
// SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
// LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
// DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
// THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

syntax = "proto3";

package google.protobuf;

option csharp_namespace = "Google.Protobuf.WellKnownTypes";
option java_package = "com.google.protobuf";
option java_outer_classname = "SourceContextProto";
option java_multiple_files = true;
option objc_class_prefix = "GPB";
option go_package = "google.golang.org/protobuf/types/known/sourcecontextpb";

// `SourceContext` represents information about the source of a
// protobuf element, like the file in which it is defined.
message SourceContext {
  // The path-qualified name of the .proto file that contained the associated
  // protobuf element.  For example: `"google/protobuf/source_context.proto"`.
  string file_name = 1;
}


================================================
FILE: quickwit/quickwit-proto/protos/third-party/google/protobuf/struct.proto
================================================
// Protocol Buffers - Google's data interchange format
// Copyright 2008 Google Inc.  All rights reserved.
// https://developers.google.com/protocol-buffers/
//
// Redistribution and use in source and binary forms, with or without
// modification, are permitted provided that the following conditions are
// met:
//
//     * Redistributions of source code must retain the above copyright
// notice, this list of conditions and the following disclaimer.
//     * Redistributions in binary form must reproduce the above
// copyright notice, this list of conditions and the following disclaimer
// in the documentation and/or other materials provided with the
// distribution.
//     * Neither the name of Google Inc. nor the names of its
// contributors may be used to endorse or promote products derived from
// this software without specific prior written permission.
//
// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
// "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
// LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
// A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
// OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
// SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
// LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
// DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
// THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

syntax = "proto3";

package google.protobuf;

option csharp_namespace = "Google.Protobuf.WellKnownTypes";
option cc_enable_arenas = true;
option go_package = "google.golang.org/protobuf/types/known/structpb";
option java_package = "com.google.protobuf";
option java_outer_classname = "StructProto";
option java_multiple_files = true;
option objc_class_prefix = "GPB";

// `Struct` represents a structured data value, consisting of fields
// which map to dynamically typed values. In some languages, `Struct`
// might be supported by a native representation. For example, in
// scripting languages like JS a struct is represented as an
// object. The details of that representation are described together
// with the proto support for the language.
//
// The JSON representation for `Struct` is JSON object.
message Struct {
  // Unordered map of dynamically typed values.
  map<string, Value> fields = 1;
}

// `Value` represents a dynamically typed value which can be either
// null, a number, a string, a boolean, a recursive struct value, or a
// list of values. A producer of value is expected to set one of these
// variants. Absence of any variant indicates an error.
//
// The JSON representation for `Value` is JSON value.
message Value {
  // The kind of value.
  oneof kind {
    // Represents a null value.
    NullValue null_value = 1;
    // Represents a double value.
    double number_value = 2;
    // Represents a string value.
    string string_value = 3;
    // Represents a boolean value.
    bool bool_value = 4;
    // Represents a structured value.
    Struct struct_value = 5;
    // Represents a repeated `Value`.
    ListValue list_value = 6;
  }
}

// `NullValue` is a singleton enumeration to represent the null value for the
// `Value` type union.
//
//  The JSON representation for `NullValue` is JSON `null`.
enum NullValue {
  // Null value.
  NULL_VALUE = 0;
}

// `ListValue` is a wrapper around a repeated field of values.
//
// The JSON representation for `ListValue` is JSON array.
message ListValue {
  // Repeated field of dynamically typed values.
  repeated Value values = 1;
}


================================================
FILE: quickwit/quickwit-proto/protos/third-party/google/protobuf/timestamp.proto
================================================
// Protocol Buffers - Google's data interchange format
// Copyright 2008 Google Inc.  All rights reserved.
// https://developers.google.com/protocol-buffers/
//
// Redistribution and use in source and binary forms, with or without
// modification, are permitted provided that the following conditions are
// met:
//
//     * Redistributions of source code must retain the above copyright
// notice, this list of conditions and the following disclaimer.
//     * Redistributions in binary form must reproduce the above
// copyright notice, this list of conditions and the following disclaimer
// in the documentation and/or other materials provided with the
// distribution.
//     * Neither the name of Google Inc. nor the names of its
// contributors may be used to endorse or promote products derived from
// this software without specific prior written permission.
//
// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
// "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
// LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
// A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
// OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
// SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
// LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
// DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
// THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

syntax = "proto3";

package google.protobuf;

option csharp_namespace = "Google.Protobuf.WellKnownTypes";
option cc_enable_arenas = true;
option go_package = "google.golang.org/protobuf/types/known/timestamppb";
option java_package = "com.google.protobuf";
option java_outer_classname = "TimestampProto";
option java_multiple_files = true;
option objc_class_prefix = "GPB";

// A Timestamp represents a point in time independent of any time zone or local
// calendar, encoded as a count of seconds and fractions of seconds at
// nanosecond resolution. The count is relative to an epoch at UTC midnight on
// January 1, 1970, in the proleptic Gregorian calendar which extends the
// Gregorian calendar backwards to year one.
//
// All minutes are 60 seconds long. Leap seconds are "smeared" so that no leap
// second table is needed for interpretation, using a [24-hour linear
// smear](https://developers.google.com/time/smear).
//
// The range is from 0001-01-01T00:00:00Z to 9999-12-31T23:59:59.999999999Z. By
// restricting to that range, we ensure that we can convert to and from [RFC
// 3339](https://www.ietf.org/rfc/rfc3339.txt) date strings.
//
// # Examples
//
// Example 1: Compute Timestamp from POSIX `time()`.
//
//     Timestamp timestamp;
//     timestamp.set_seconds(time(NULL));
//     timestamp.set_nanos(0);
//
// Example 2: Compute Timestamp from POSIX `gettimeofday()`.
//
//     struct timeval tv;
//     gettimeofday(&tv, NULL);
//
//     Timestamp timestamp;
//     timestamp.set_seconds(tv.tv_sec);
//     timestamp.set_nanos(tv.tv_usec * 1000);
//
// Example 3: Compute Timestamp from Win32 `GetSystemTimeAsFileTime()`.
//
//     FILETIME ft;
//     GetSystemTimeAsFileTime(&ft);
//     UINT64 ticks = (((UINT64)ft.dwHighDateTime) << 32) | ft.dwLowDateTime;
//
//     // A Windows tick is 100 nanoseconds. Windows epoch 1601-01-01T00:00:00Z
//     // is 11644473600 seconds before Unix epoch 1970-01-01T00:00:00Z.
//     Timestamp timestamp;
//     timestamp.set_seconds((INT64) ((ticks / 10000000) - 11644473600LL));
//     timestamp.set_nanos((INT32) ((ticks % 10000000) * 100));
//
// Example 4: Compute Timestamp from Java `System.currentTimeMillis()`.
//
//     long millis = System.currentTimeMillis();
//
//     Timestamp timestamp = Timestamp.newBuilder().setSeconds(millis / 1000)
//         .setNanos((int) ((millis % 1000) * 1000000)).build();
//
//
// Example 5: Compute Timestamp from Java `Instant.now()`.
//
//     Instant now = Instant.now();
//
//     Timestamp timestamp =
//         Timestamp.newBuilder().setSeconds(now.getEpochSecond())
//             .setNanos(now.getNano()).build();
//
//
// Example 6: Compute Timestamp from current time in Python.
//
//     timestamp = Timestamp()
//     timestamp.GetCurrentTime()
//
// # JSON Mapping
//
// In JSON format, the Timestamp type is encoded as a string in the
// [RFC 3339](https://www.ietf.org/rfc/rfc3339.txt) format. That is, the
// format is "{year}-{month}-{day}T{hour}:{min}:{sec}[.{frac_sec}]Z"
// where {year} is always expressed using four digits while {month}, {day},
// {hour}, {min}, and {sec} are zero-padded to two digits each. The fractional
// seconds, which can go up to 9 digits (i.e. up to 1 nanosecond resolution),
// are optional. The "Z" suffix indicates the timezone ("UTC"); the timezone
// is required. A proto3 JSON serializer should always use UTC (as indicated by
// "Z") when printing the Timestamp type and a proto3 JSON parser should be
// able to accept both UTC and other timezones (as indicated by an offset).
//
// For example, "2017-01-15T01:30:15.01Z" encodes 15.01 seconds past
// 01:30 UTC on January 15, 2017.
//
// In JavaScript, one can convert a Date object to this format using the
// standard
// [toISOString()](https://developer.mozilla.org/en-US/docs/Web/JavaScript/Reference/Global_Objects/Date/toISOString)
// method. In Python, a standard `datetime.datetime` object can be converted
// to this format using
// [`strftime`](https://docs.python.org/2/library/time.html#time.strftime) with
// the time format spec '%Y-%m-%dT%H:%M:%S.%fZ'. Likewise, in Java, one can use
// the Joda Time's [`ISODateTimeFormat.dateTime()`](
// http://www.joda.org/joda-time/apidocs/org/joda/time/format/ISODateTimeFormat.html#dateTime%2D%2D
// ) to obtain a formatter capable of generating timestamps in this format.
//
//
message Timestamp {
  // Represents seconds of UTC time since Unix epoch
  // 1970-01-01T00:00:00Z. Must be from 0001-01-01T00:00:00Z to
  // 9999-12-31T23:59:59Z inclusive.
  int64 seconds = 1;

  // Non-negative fractions of a second at nanosecond resolution. Negative
  // second values with fractions must still have non-negative nanos values
  // that count forward in time. Must be from 0 to 999,999,999
  // inclusive.
  int32 nanos = 2;
}


================================================
FILE: quickwit/quickwit-proto/protos/third-party/google/protobuf/type.proto
================================================
// Protocol Buffers - Google's data interchange format
// Copyright 2008 Google Inc.  All rights reserved.
// https://developers.google.com/protocol-buffers/
//
// Redistribution and use in source and binary forms, with or without
// modification, are permitted provided that the following conditions are
// met:
//
//     * Redistributions of source code must retain the above copyright
// notice, this list of conditions and the following disclaimer.
//     * Redistributions in binary form must reproduce the above
// copyright notice, this list of conditions and the following disclaimer
// in the documentation and/or other materials provided with the
// distribution.
//     * Neither the name of Google Inc. nor the names of its
// contributors may be used to endorse or promote products derived from
// this software without specific prior written permission.
//
// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
// "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
// LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
// A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
// OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
// SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
// LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
// DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
// THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

syntax = "proto3";

package google.protobuf;

import "google/protobuf/any.proto";
import "google/protobuf/source_context.proto";

option csharp_namespace = "Google.Protobuf.WellKnownTypes";
option cc_enable_arenas = true;
option java_package = "com.google.protobuf";
option java_outer_classname = "TypeProto";
option java_multiple_files = true;
option objc_class_prefix = "GPB";
option go_package = "google.golang.org/protobuf/types/known/typepb";

// A protocol buffer message type.
message Type {
  // The fully qualified message name.
  string name = 1;
  // The list of fields.
  repeated Field fields = 2;
  // The list of types appearing in `oneof` definitions in this type.
  repeated string oneofs = 3;
  // The protocol buffer options.
  repeated Option options = 4;
  // The source context.
  SourceContext source_context = 5;
  // The source syntax.
  Syntax syntax = 6;
}

// A single field of a message type.
message Field {
  // Basic field types.
  enum Kind {
    // Field type unknown.
    TYPE_UNKNOWN = 0;
    // Field type double.
    TYPE_DOUBLE = 1;
    // Field type float.
    TYPE_FLOAT = 2;
    // Field type int64.
    TYPE_INT64 = 3;
    // Field type uint64.
    TYPE_UINT64 = 4;
    // Field type int32.
    TYPE_INT32 = 5;
    // Field type fixed64.
    TYPE_FIXED64 = 6;
    // Field type fixed32.
    TYPE_FIXED32 = 7;
    // Field type bool.
    TYPE_BOOL = 8;
    // Field type string.
    TYPE_STRING = 9;
    // Field type group. Proto2 syntax only, and deprecated.
    TYPE_GROUP = 10;
    // Field type message.
    TYPE_MESSAGE = 11;
    // Field type bytes.
    TYPE_BYTES = 12;
    // Field type uint32.
    TYPE_UINT32 = 13;
    // Field type enum.
    TYPE_ENUM = 14;
    // Field type sfixed32.
    TYPE_SFIXED32 = 15;
    // Field type sfixed64.
    TYPE_SFIXED64 = 16;
    // Field type sint32.
    TYPE_SINT32 = 17;
    // Field type sint64.
    TYPE_SINT64 = 18;
  }

  // Whether a field is optional, required, or repeated.
  enum Cardinality {
    // For fields with unknown cardinality.
    CARDINALITY_UNKNOWN = 0;
    // For optional fields.
    CARDINALITY_OPTIONAL = 1;
    // For required fields. Proto2 syntax only.
    CARDINALITY_REQUIRED = 2;
    // For repeated fields.
    CARDINALITY_REPEATED = 3;
  }

  // The field type.
  Kind kind = 1;
  // The field cardinality.
  Cardinality cardinality = 2;
  // The field number.
  int32 number = 3;
  // The field name.
  string name = 4;
  // The field type URL, without the scheme, for message or enumeration
  // types. Example: `"type.googleapis.com/google.protobuf.Timestamp"`.
  string type_url = 6;
  // The index of the field type in `Type.oneofs`, for message or enumeration
  // types. The first type has index 1; zero means the type is not in the list.
  int32 oneof_index = 7;
  // Whether to use alternative packed wire representation.
  bool packed = 8;
  // The protocol buffer options.
  repeated Option options = 9;
  // The field JSON name.
  string json_name = 10;
  // The string value of the default value of this field. Proto2 syntax only.
  string default_value = 11;
}

// Enum type definition.
message Enum {
  // Enum type name.
  string name = 1;
  // Enum value definitions.
  repeated EnumValue enumvalue = 2;
  // Protocol buffer options.
  repeated Option options = 3;
  // The source context.
  SourceContext source_context = 4;
  // The source syntax.
  Syntax syntax = 5;
}

// Enum value definition.
message EnumValue {
  // Enum value name.
  string name = 1;
  // Enum value number.
  int32 number = 2;
  // Protocol buffer options.
  repeated Option options = 3;
}

// A protocol buffer option, which can be attached to a message, field,
// enumeration, etc.
message Option {
  // The option's name. For protobuf built-in options (options defined in
  // descriptor.proto), this is the short name. For example, `"map_entry"`.
  // For custom options, it should be the fully-qualified name. For example,
  // `"google.api.http"`.
  string name = 1;
  // The option's value packed in an Any message. If the value is a primitive,
  // the corresponding wrapper type defined in google/protobuf/wrappers.proto
  // should be used. If the value is an enum, it should be stored as an int32
  // value using the google.protobuf.Int32Value type.
  Any value = 2;
}

// The syntax in which a protocol buffer element is defined.
enum Syntax {
  // Syntax `proto2`.
  SYNTAX_PROTO2 = 0;
  // Syntax `proto3`.
  SYNTAX_PROTO3 = 1;
}


================================================
FILE: quickwit/quickwit-proto/protos/third-party/google/protobuf/wrappers.proto
================================================
// Protocol Buffers - Google's data interchange format
// Copyright 2008 Google Inc.  All rights reserved.
// https://developers.google.com/protocol-buffers/
//
// Redistribution and use in source and binary forms, with or without
// modification, are permitted provided that the following conditions are
// met:
//
//     * Redistributions of source code must retain the above copyright
// notice, this list of conditions and the following disclaimer.
//     * Redistributions in binary form must reproduce the above
// copyright notice, this list of conditions and the following disclaimer
// in the documentation and/or other materials provided with the
// distribution.
//     * Neither the name of Google Inc. nor the names of its
// contributors may be used to endorse or promote products derived from
// this software without specific prior written permission.
//
// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
// "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
// LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
// A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
// OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
// SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
// LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
// DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
// THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

// Wrappers for primitive (non-message) types. These types are useful
// for embedding primitives in the `google.protobuf.Any` type and for places
// where we need to distinguish between the absence of a primitive
// typed field and its default value.
//
// These wrappers have no meaningful use within repeated fields as they lack
// the ability to detect presence on individual elements.
// These wrappers have no meaningful use within a map or a oneof since
// individual entries of a map or fields of a oneof can already detect presence.

syntax = "proto3";

package google.protobuf;

option csharp_namespace = "Google.Protobuf.WellKnownTypes";
option cc_enable_arenas = true;
option go_package = "google.golang.org/protobuf/types/known/wrapperspb";
option java_package = "com.google.protobuf";
option java_outer_classname = "WrappersProto";
option java_multiple_files = true;
option objc_class_prefix = "GPB";

// Wrapper message for `double`.
//
// The JSON representation for `DoubleValue` is JSON number.
message DoubleValue {
  // The double value.
  double value = 1;
}

// Wrapper message for `float`.
//
// The JSON representation for `FloatValue` is JSON number.
message FloatValue {
  // The float value.
  float value = 1;
}

// Wrapper message for `int64`.
//
// The JSON representation for `Int64Value` is JSON string.
message Int64Value {
  // The int64 value.
  int64 value = 1;
}

// Wrapper message for `uint64`.
//
// The JSON representation for `UInt64Value` is JSON string.
message UInt64Value {
  // The uint64 value.
  uint64 value = 1;
}

// Wrapper message for `int32`.
//
// The JSON representation for `Int32Value` is JSON number.
message Int32Value {
  // The int32 value.
  int32 value = 1;
}

// Wrapper message for `uint32`.
//
// The JSON representation for `UInt32Value` is JSON number.
message UInt32Value {
  // The uint32 value.
  uint32 value = 1;
}

// Wrapper message for `bool`.
//
// The JSON representation for `BoolValue` is JSON `true` and `false`.
message BoolValue {
  // The bool value.
  bool value = 1;
}

// Wrapper message for `string`.
//
// The JSON representation for `StringValue` is JSON string.
message StringValue {
  // The string value.
  string value = 1;
}

// Wrapper message for `bytes`.
//
// The JSON representation for `BytesValue` is JSON string.
message BytesValue {
  // The bytes value.
  bytes value = 1;
}


================================================
FILE: quickwit/quickwit-proto/protos/third-party/jaeger/model.proto
================================================
// Copyright (c) 2018 Uber Technologies, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

syntax="proto3";

package jaeger.api_v2;

import "gogoproto/gogo.proto";
import "google/protobuf/timestamp.proto";
import "google/protobuf/duration.proto";

// TODO: document all types and fields

// TODO: once this moves to jaeger-idl repo, we may want to change Go pkg to api_v2
// and rewrite it to model only in this repo. That should make it easier to generate
// classes in other languages.
option go_package = "model";
option java_package = "io.jaegertracing.api_v2";

// Enable gogoprotobuf extensions (https://github.com/gogo/protobuf/blob/master/extensions.md).
// Enable custom Marshal method.
option (gogoproto.marshaler_all) = true;
// Enable custom Unmarshal method.
option (gogoproto.unmarshaler_all) = true;
// Enable custom Size method (Required by Marshal and Unmarshal).
option (gogoproto.sizer_all) = true;

enum ValueType {
  STRING  = 0;
  BOOL    = 1;
  INT64   = 2;
  FLOAT64 = 3;
  BINARY  = 4;
};

message KeyValue {
  option (gogoproto.equal) = true;
  option (gogoproto.compare) = true;

  string    key      = 1;
  ValueType v_type    = 2;
  string    v_str     = 3;
  bool      v_bool    = 4;
  int64     v_int64   = 5;
  double    v_float64 = 6;
  bytes     v_binary  = 7;
}

message Log {
  google.protobuf.Timestamp timestamp = 1 [
    (gogoproto.stdtime) = true,
    (gogoproto.nullable) = false
  ];
  repeated KeyValue fields = 2 [
    (gogoproto.nullable) = false
  ];
}

enum SpanRefType {
  CHILD_OF = 0;
  FOLLOWS_FROM = 1;
};

message SpanRef {
  bytes trace_id = 1 [
    (gogoproto.nullable) = false,
    (gogoproto.customtype) = "TraceID",
    (gogoproto.customname) = "TraceID"
  ];
  bytes span_id = 2 [
    (gogoproto.nullable) = false,
    (gogoproto.customtype) = "SpanID",
    (gogoproto.customname) = "SpanID"
  ];
  SpanRefType ref_type = 3;
}

message Process {
  string service_name = 1;
  repeated KeyValue tags = 2 [
    (gogoproto.nullable) = false
  ];
}

message Span {
  bytes trace_id = 1 [
    (gogoproto.nullable) = false,
    (gogoproto.customtype) = "TraceID",
    (gogoproto.customname) = "TraceID"
  ];
  bytes span_id = 2 [
    (gogoproto.nullable) = false,
    (gogoproto.customtype) = "SpanID",
    (gogoproto.customname) = "SpanID"
  ];
  string operation_name = 3;
  repeated SpanRef references = 4 [
    (gogoproto.nullable) = false
  ];
  uint32 flags = 5 [
    (gogoproto.nullable) = false,
    (gogoproto.customtype) = "Flags"
  ];
  google.protobuf.Timestamp start_time = 6 [
    (gogoproto.stdtime) = true,
    (gogoproto.nullable) = false
  ];
  google.protobuf.Duration duration = 7 [
    (gogoproto.stdduration) = true,
    (gogoproto.nullable) = false
  ];
  repeated KeyValue tags = 8 [
    (gogoproto.nullable) = false
  ];
  repeated Log logs = 9 [
    (gogoproto.nullable) = false
  ];
  Process process = 10;
  string process_id = 11 [
    (gogoproto.customname) = "ProcessID"
  ];
  repeated string warnings = 12;
}

message Trace {
  message ProcessMapping {
      string process_id = 1 [
        (gogoproto.customname) = "ProcessID"
      ];
      Process process = 2 [
        (gogoproto.nullable) = false
      ];
  }
  repeated Span spans = 1;
  repeated ProcessMapping process_map = 2 [
    (gogoproto.nullable) = false
  ];
  repeated string warnings = 3;
}

// Note that both Span and Batch may contain a Process.
// This is different from the Thrift model which was only used
// for transport, because Proto model is also used by the backend
// as the domain model, where once a batch is received it is split
// into individual spans which are all processed independently,
// and therefore they all need a Process. As far as on-the-wire
// semantics, both Batch and Spans in the same message may contain
// their own instances of Process, with span.Process taking priority
// over batch.Process.
message Batch {
    repeated Span spans = 1;
    Process process = 2 [
      (gogoproto.nullable) = true
    ];
}

message DependencyLink {
  string parent = 1;
  string child = 2;
  uint64 call_count = 3;
  string source = 4;
}


================================================
FILE: quickwit/quickwit-proto/protos/third-party/jaeger/storage/v2/trace_storage.proto
================================================
// Copyright (c) 2024 The Jaeger Authors.
// SPDX-License-Identifier: Apache-2.0

syntax = "proto3";

package jaeger.storage.v2;

import "google/protobuf/duration.proto";
import "google/protobuf/timestamp.proto";
import "opentelemetry/proto/trace/v1/trace.proto";

option go_package = "storage";

// GetTraceParams represents the query for a single trace from the storage backend.
message GetTraceParams {
  // trace_id is a 16 byte array containing the unique identifier for the trace to query.
  bytes trace_id = 1;

  // start_time is the start of the time interval to search for the trace_id.
  //
  // This field is optional.
  google.protobuf.Timestamp start_time = 2;

  // end_time is the end of the time interval to search for the trace_id.
  //
  // This field is optional.
  google.protobuf.Timestamp end_time = 3;
}

// GetTracesRequest represents a request to retrieve multiple traces.
message GetTracesRequest {
  repeated GetTraceParams query = 1;
}

// GetServicesRequest represents a request to get service names.
message GetServicesRequest {}

// GetServicesResponse represents the response for GetServicesRequest.
message GetServicesResponse {
  repeated string services = 1;
}

// GetOperationsRequest represents a request to get operation names.
message GetOperationsRequest {
  // service is the name of the service for which to get operation names.
  //
  // This field is required.
  string service = 1;

  // span_kind is the type of span which is used to distinguish between
  // spans generated in a particular context.
  //
  // This field is optional.
  string span_kind = 2;
}

// Operation contains information about an operation for a given service.
message Operation {
  string name = 1;
  string span_kind = 2;
}

// GetOperationsResponse represents the response for GetOperationsRequest.
message GetOperationsResponse {
  repeated Operation operations = 1;
}

// KeyValue and all its associated types are copied from opentelemetry-proto/common/v1/common.proto
// (https://github.com/open-telemetry/opentelemetry-proto/blob/main/opentelemetry/proto/common/v1/common.proto).
// This type is used to store attributes in traces.
message KeyValue {
  string key = 1;
  AnyValue value = 2;
}

message AnyValue {
  oneof value {
    string string_value = 1;
    bool bool_value = 2;
    int64 int_value = 3;
    double double_value = 4;
    ArrayValue array_value = 5;
    KeyValueList kvlist_value = 6;
    bytes bytes_value = 7;
  }
}

message KeyValueList {
  repeated KeyValue values = 1;
}

message ArrayValue {
  repeated AnyValue values = 1;
}

// TraceQueryParameters contains query parameters to find traces. For a detailed
// definition of each field in this message, refer to `TraceQueryParameters` in `jaeger.api_v3`
// (https://github.com/jaegertracing/jaeger-idl/blob/main/proto/api_v3/query_service.proto).
message TraceQueryParameters {
  string service_name = 1;
  string operation_name = 2;
  repeated KeyValue attributes = 3;
  google.protobuf.Timestamp start_time_min = 4;
  google.protobuf.Timestamp start_time_max = 5;
  google.protobuf.Duration duration_min = 6;
  google.protobuf.Duration duration_max = 7;
  int32 search_depth = 8;
}

// FindTracesRequest represents a request to find traces.
// It can be used to retrieve the traces (FindTraces) or simply
// the trace IDs (FindTraceIDs).
message FindTracesRequest {
  TraceQueryParameters query = 1;
}

// FoundTraceID is a wrapper around trace ID returned from FindTraceIDs
// with an optional time range that may be used in GetTraces calls.
//
// The time range is provided as an optimization hint for some storage backends
// that can perform more efficient queries when they know the approximate time range.
// The value should not be used for precise time-based filtering or assumptions.
// It is meant as a rough boundary and may not be populated in all cases.
message FoundTraceID {
  bytes trace_id = 1;
  google.protobuf.Timestamp start = 2;
  google.protobuf.Timestamp end = 3;
}

// FindTraceIDsResponse represents the response for FindTracesRequest.
message FindTraceIDsResponse {
  repeated FoundTraceID trace_ids = 1;
}

// TraceReader is a service that allows reading traces from storage.
// Note that if you implement this service, you should also implement
// OTEL's TraceService in package opentelemetry.proto.collector.trace.v1
// to allow pushing traces to the storage backend
// (<https://github.com/open-telemetry/opentelemetry-proto/blob/main/opentelemetry/proto/collector/trace/v1/trace_service.proto>)
service TraceReader {
  // GetTraces returns a stream that retrieves all traces with given IDs.
  //
  // Chunking requirements:
  // - A single TracesData chunk MUST NOT contain spans from multiple traces.
  // - Large traces MAY be split across multiple, *consecutive* TracesData chunks.
  // - Each returned TracesData object MUST NOT be empty.
  //
  // Edge cases:
  // - If no spans are found for any given trace ID, the ID is ignored.
  // - If none of the trace IDs are found in the storage, an empty response is returned.
  rpc GetTraces(GetTracesRequest) returns (stream opentelemetry.proto.trace.v1.TracesData) {}

  // GetServices returns all service names known to the backend from traces
  // within its retention period.
  rpc GetServices(GetServicesRequest) returns (GetServicesResponse) {}

  // GetOperations returns all operation names for a given service
  // known to the backend from traces within its retention period.
  rpc GetOperations(GetOperationsRequest) returns (GetOperationsResponse) {}

  // FindTraces returns a stream that retrieves traces matching query parameters.
  //
  // The chunking rules are the same as for GetTraces.
  //
  // If no matching traces are found, an empty stream is returned.
  rpc FindTraces(FindTracesRequest) returns (stream opentelemetry.proto.trace.v1.TracesData) {}

  // FindTraceIDs returns a stream that retrieves IDs of traces matching query parameters.
  //
  // If no matching traces are found, an empty stream is returned.
  //
  // This call behaves identically to FindTraces, except that it returns only the list
  // of matching trace IDs. This is useful in some contexts, such as batch jobs, where a
  // large list of trace IDs may be queried first and then the full traces are loaded
  // in batches.
  rpc FindTraceIDs(FindTracesRequest) returns (FindTraceIDsResponse) {}
}


================================================
FILE: quickwit/quickwit-proto/protos/third-party/jaeger/storage.proto
================================================
// Copyright (c) 2019 The Jaeger Authors
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

syntax = "proto3";

package jaeger.storage.v1;

option go_package = "storage_v1";

import "gogoproto/gogo.proto";
import "google/protobuf/timestamp.proto";
import "google/protobuf/duration.proto";

import "model.proto";

// Enable gogoprotobuf extensions (https://github.com/gogo/protobuf/blob/master/extensions.md).
// Enable custom Marshal method.
option (gogoproto.marshaler_all) = true;
// Enable custom Unmarshal method.
option (gogoproto.unmarshaler_all) = true;
// Enable custom Size method (Required by Marshal and Unmarshal).
option (gogoproto.sizer_all) = true;

message GetDependenciesRequest {
    google.protobuf.Timestamp start_time = 1 [
      (gogoproto.stdtime) = true,
      (gogoproto.nullable) = false
    ];
    google.protobuf.Timestamp end_time = 2 [
      (gogoproto.stdtime) = true,
      (gogoproto.nullable) = false
    ];
}

message GetDependenciesResponse {
    repeated jaeger.api_v2.DependencyLink dependencies = 1 [
      (gogoproto.nullable) = false
    ];
}

message WriteSpanRequest {
    jaeger.api_v2.Span span = 1;
}

// empty; extensible in the future
message WriteSpanResponse {

}

// empty; extensible in the future
message CloseWriterRequest {
}

// empty; extensible in the future
message CloseWriterResponse {
}

message GetTraceRequest {
    bytes trace_id = 1 [
      (gogoproto.nullable) = false,
      (gogoproto.customtype) = "github.com/jaegertracing/jaeger/model.TraceID",
      (gogoproto.customname) = "TraceID"
    ];
}

message GetServicesRequest {}

message GetServicesResponse {
    repeated string services = 1;
}

message GetOperationsRequest {
    string service = 1;
    string span_kind = 2;
}

message Operation {
    string name = 1;
    string span_kind = 2;
}

message GetOperationsResponse {
    repeated string operationNames = 1; // deprecated
    repeated Operation operations = 2;
}

message TraceQueryParameters {
    string service_name = 1;
    string operation_name = 2;
    map<string, string> tags = 3;
    google.protobuf.Timestamp start_time_min = 4 [
      (gogoproto.stdtime) = true,
      (gogoproto.nullable) = false
    ];
    google.protobuf.Timestamp start_time_max = 5 [
      (gogoproto.stdtime) = true,
      (gogoproto.nullable) = false
    ];
    google.protobuf.Duration duration_min = 6 [
      (gogoproto.stdduration) = true,
      (gogoproto.nullable) = false
    ];
    google.protobuf.Duration duration_max = 7 [
      (gogoproto.stdduration) = true,
      (gogoproto.nullable) = false
    ];
    int32 num_traces = 8;
}

message FindTracesRequest {
    TraceQueryParameters query = 1;
}

message SpansResponseChunk {
    repeated jaeger.api_v2.Span spans = 1  [
      (gogoproto.nullable) = false
    ];
}

message FindTraceIDsRequest {
    TraceQueryParameters query = 1;
}

message FindTraceIDsResponse {
    repeated bytes trace_ids = 1 [
      (gogoproto.nullable) = false,
      (gogoproto.customtype) = "github.com/jaegertracing/jaeger/model.TraceID",
      (gogoproto.customname) = "TraceIDs"
    ];
}

service SpanWriterPlugin {
    // spanstore/Writer
    rpc WriteSpan(WriteSpanRequest) returns (WriteSpanResponse);
    rpc Close(CloseWriterRequest) returns (CloseWriterResponse);
}

service StreamingSpanWriterPlugin {
    rpc WriteSpanStream(stream WriteSpanRequest) returns (WriteSpanResponse);
}

service SpanReaderPlugin {
    // spanstore/Reader
    rpc GetTrace(GetTraceRequest) returns (stream SpansResponseChunk);
    rpc GetServices(GetServicesRequest) returns (GetServicesResponse);
    rpc GetOperations(GetOperationsRequest) returns (GetOperationsResponse);
    rpc FindTraces(FindTracesRequest) returns (stream SpansResponseChunk);
    rpc FindTraceIDs(FindTraceIDsRequest) returns (FindTraceIDsResponse);
}

service ArchiveSpanWriterPlugin {
    // spanstore/Writer
    rpc WriteArchiveSpan(WriteSpanRequest) returns (WriteSpanResponse);
}

service ArchiveSpanReaderPlugin {
    // spanstore/Reader
    rpc GetArchiveTrace(GetTraceRequest) returns (stream SpansResponseChunk);
}

service DependenciesReaderPlugin {
    // dependencystore/Reader
    rpc GetDependencies(GetDependenciesRequest) returns (GetDependenciesResponse);
}

// empty; extensible in the future
message CapabilitiesRequest {

}

message CapabilitiesResponse {
    bool archiveSpanReader = 1;
    bool archiveSpanWriter = 2;
    bool streamingSpanWriter = 3;
}

service PluginCapabilities {
    rpc Capabilities(CapabilitiesRequest) returns (CapabilitiesResponse);
}


================================================
FILE: quickwit/quickwit-proto/protos/third-party/opentelemetry/proto/collector/README.md
================================================
# OpenTelemetry Collector Proto

This package describes the OpenTelemetry collector protocol.

## Packages

1. `common` package contains the common messages shared between different services.
2. `trace` package contains the Trace Service protos.
3. `metrics` package contains the Metrics Service protos.
4. `logs` package contains the Logs Service protos.


================================================
FILE: quickwit/quickwit-proto/protos/third-party/opentelemetry/proto/collector/logs/v1/logs_service.proto
================================================
// Copyright 2020, OpenTelemetry Authors
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

syntax = "proto3";

package opentelemetry.proto.collector.logs.v1;

import "opentelemetry/proto/logs/v1/logs.proto";

option csharp_namespace = "OpenTelemetry.Proto.Collector.Logs.V1";
option java_multiple_files = true;
option java_package = "io.opentelemetry.proto.collector.logs.v1";
option java_outer_classname = "LogsServiceProto";
option go_package = "go.opentelemetry.io/proto/otlp/collector/logs/v1";

// Service that can be used to push logs between one Application instrumented with
// OpenTelemetry and an collector, or between an collector and a central collector (in this
// case logs are sent/received to/from multiple Applications).
service LogsService {
  // For performance reasons, it is recommended to keep this RPC
  // alive for the entire life of the application.
  rpc Export(ExportLogsServiceRequest) returns (ExportLogsServiceResponse) {}
}

message ExportLogsServiceRequest {
  // An array of ResourceLogs.
  // For data coming from a single resource this array will typically contain one
  // element. Intermediary nodes (such as OpenTelemetry Collector) that receive
  // data from multiple origins typically batch the data before forwarding further and
  // in that case this array will contain multiple elements.
  repeated opentelemetry.proto.logs.v1.ResourceLogs resource_logs = 1;
}

message ExportLogsServiceResponse {
  // The details of a partially successful export request.
  //
  // If the request is only partially accepted
  // (i.e. when the server accepts only parts of the data and rejects the rest)
  // the server MUST initialize the `partial_success` field and MUST
  // set the `rejected_<signal>` with the number of items it rejected.
  //
  // Servers MAY also make use of the `partial_success` field to convey
  // warnings/suggestions to senders even when the request was fully accepted.
  // In such cases, the `rejected_<signal>` MUST have a value of `0` and
  // the `error_message` MUST be non-empty.
  //
  // A `partial_success` message with an empty value (`rejected_<signal>1 = 0 and
  // `error_message` = "") is equivalent to it not being set/present. Senders
  // SHOULD interpret it the same way as in the full success case.
  ExportLogsPartialSuccess partial_success = 1;
}

message ExportLogsPartialSuccess {
  // The number of rejected log records.
  //
  // A `rejected_<signal>` field holding a `0` value indicates that the
  // request was fully accepted.
  int64 rejected_log_records = 1;

  // A developer-facing human-readable message in English. It should be used
  // either to explain why the server rejected parts of the data during a partial
  // success or to convey warnings/suggestions during a full success. The message
  // should offer guidance on how users can address such issues.
  //
  // error_message is an optional field. An error_message with an empty value
  // is equivalent to it not being set.
  string error_message = 2;
}


================================================
FILE: quickwit/quickwit-proto/protos/third-party/opentelemetry/proto/collector/logs/v1/logs_service_http.yaml
================================================
# This is an API configuration to generate an HTTP/JSON -> gRPC gateway for the
# OpenTelemetry service using github.com/grpc-ecosystem/grpc-gateway.
type: google.api.Service
config_version: 3
http:
 rules:
 - selector: opentelemetry.proto.collector.logs.v1.LogsService.Export
   post: /v1/logs
   body: "*"

================================================
FILE: quickwit/quickwit-proto/protos/third-party/opentelemetry/proto/collector/metrics/v1/metrics_service.proto
================================================
// Copyright 2019, OpenTelemetry Authors
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

syntax = "proto3";

package opentelemetry.proto.collector.metrics.v1;

import "opentelemetry/proto/metrics/v1/metrics.proto";

option csharp_namespace = "OpenTelemetry.Proto.Collector.Metrics.V1";
option java_multiple_files = true;
option java_package = "io.opentelemetry.proto.collector.metrics.v1";
option java_outer_classname = "MetricsServiceProto";
option go_package = "go.opentelemetry.io/proto/otlp/collector/metrics/v1";

// Service that can be used to push metrics between one Application
// instrumented with OpenTelemetry and a collector, or between a collector and a
// central collector.
service MetricsService {
  // For performance reasons, it is recommended to keep this RPC
  // alive for the entire life of the application.
  rpc Export(ExportMetricsServiceRequest) returns (ExportMetricsServiceResponse) {}
}

message ExportMetricsServiceRequest {
  // An array of ResourceMetrics.
  // For data coming from a single resource this array will typically contain one
  // element. Intermediary nodes (such as OpenTelemetry Collector) that receive
  // data from multiple origins typically batch the data before forwarding further and
  // in that case this array will contain multiple elements.
  repeated opentelemetry.proto.metrics.v1.ResourceMetrics resource_metrics = 1;
}

message ExportMetricsServiceResponse {
  // The details of a partially successful export request.
  //
  // If the request is only partially accepted
  // (i.e. when the server accepts only parts of the data and rejects the rest)
  // the server MUST initialize the `partial_success` field and MUST
  // set the `rejected_<signal>` with the number of items it rejected.
  //
  // Servers MAY also make use of the `partial_success` field to convey
  // warnings/suggestions to senders even when the request was fully accepted.
  // In such cases, the `rejected_<signal>` MUST have a value of `0` and
  // the `error_message` MUST be non-empty.
  //
  // A `partial_success` message with an empty value (rejected_<signal> = 0 and
  // `error_message` = "") is equivalent to it not being set/present. Senders
  // SHOULD interpret it the same way as in the full success case.
  ExportMetricsPartialSuccess partial_success = 1;
}

message ExportMetricsPartialSuccess {
  // The number of rejected data points.
  //
  // A `rejected_<signal>` field holding a `0` value indicates that the
  // request was fully accepted.
  int64 rejected_data_points = 1;

  // A developer-facing human-readable message in English. It should be used
  // either to explain why the server rejected parts of the data during a partial
  // success or to convey warnings/suggestions during a full success. The message
  // should offer guidance on how users can address such issues.
  //
  // error_message is an optional field. An error_message with an empty value
  // is equivalent to it not being set.
  string error_message = 2;
}


================================================
FILE: quickwit/quickwit-proto/protos/third-party/opentelemetry/proto/collector/metrics/v1/metrics_service_http.yaml
================================================
# This is an API configuration to generate an HTTP/JSON -> gRPC gateway for the
# OpenTelemetry service using github.com/grpc-ecosystem/grpc-gateway.
type: google.api.Service
config_version: 3
http:
 rules:
 - selector: opentelemetry.proto.collector.metrics.v1.MetricsService.Export
   post: /v1/metrics
   body: "*"

================================================
FILE: quickwit/quickwit-proto/protos/third-party/opentelemetry/proto/collector/trace/v1/trace_service.proto
================================================
// Copyright 2019, OpenTelemetry Authors
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

syntax = "proto3";

package opentelemetry.proto.collector.trace.v1;

import "opentelemetry/proto/trace/v1/trace.proto";

option csharp_namespace = "OpenTelemetry.Proto.Collector.Trace.V1";
option java_multiple_files = true;
option java_package = "io.opentelemetry.proto.collector.trace.v1";
option java_outer_classname = "TraceServiceProto";
option go_package = "go.opentelemetry.io/proto/otlp/collector/trace/v1";

// Service that can be used to push spans between one Application instrumented with
// OpenTelemetry and a collector, or between a collector and a central collector (in this
// case spans are sent/received to/from multiple Applications).
service TraceService {
  // For performance reasons, it is recommended to keep this RPC
  // alive for the entire life of the application.
  rpc Export(ExportTraceServiceRequest) returns (ExportTraceServiceResponse) {}
}

message ExportTraceServiceRequest {
  // An array of ResourceSpans.
  // For data coming from a single resource this array will typically contain one
  // element. Intermediary nodes (such as OpenTelemetry Collector) that receive
  // data from multiple origins typically batch the data before forwarding further and
  // in that case this array will contain multiple elements.
  repeated opentelemetry.proto.trace.v1.ResourceSpans resource_spans = 1;
}

message ExportTraceServiceResponse {
  // The details of a partially successful export request.
  //
  // If the request is only partially accepted
  // (i.e. when the server accepts only parts of the data and rejects the rest)
  // the server MUST initialize the `partial_success` field and MUST
  // set the `rejected_<signal>` with the number of items it rejected.
  //
  // Servers MAY also make use of the `partial_success` field to convey
  // warnings/suggestions to senders even when the request was fully accepted.
  // In such cases, the `rejected_<signal>` MUST have a value of `0` and
  // the `error_message` MUST be non-empty.
  //
  // A `partial_success` message with an empty value (rejected_<signal> = 0 and
  // `error_message` = "") is equivalent to it not being set/present. Senders
  // SHOULD interpret it the same way as in the full success case.
  ExportTracePartialSuccess partial_success = 1;
}

message ExportTracePartialSuccess {
  // The number of rejected spans.
  //
  // A `rejected_<signal>` field holding a `0` value indicates that the
  // request was fully accepted.
  int64 rejected_spans = 1;

  // A developer-facing human-readable message in English. It should be used
  // either to explain why the server rejected parts of the data during a partial
  // success or to convey warnings/suggestions during a full success. The message
  // should offer guidance on how users can address such issues.
  //
  // error_message is an optional field. An error_message with an empty value
  // is equivalent to it not being set.
  string error_message = 2;
}


================================================
FILE: quickwit/quickwit-proto/protos/third-party/opentelemetry/proto/collector/trace/v1/trace_service_http.yaml
================================================
# This is an API configuration to generate an HTTP/JSON -> gRPC gateway for the
# OpenTelemetry service using github.com/grpc-ecosystem/grpc-gateway.
type: google.api.Service
config_version: 3
http:
 rules:
 - selector: opentelemetry.proto.collector.trace.v1.TraceService.Export
   post: /v1/trace
   body: "*"

================================================
FILE: quickwit/quickwit-proto/protos/third-party/opentelemetry/proto/common/v1/common.proto
================================================
// Copyright 2019, OpenTelemetry Authors
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

syntax = "proto3";

package opentelemetry.proto.common.v1;

option csharp_namespace = "OpenTelemetry.Proto.Common.V1";
option java_multiple_files = true;
option java_package = "io.opentelemetry.proto.common.v1";
option java_outer_classname = "CommonProto";
option go_package = "go.opentelemetry.io/proto/otlp/common/v1";

// AnyValue is used to represent any type of attribute value. AnyValue may contain a
// primitive value such as a string or integer or it may contain an arbitrary nested
// object containing arrays, key-value lists and primitives.
message AnyValue {
  // The value is one of the listed fields. It is valid for all values to be unspecified
  // in which case this AnyValue is considered to be "empty".
  oneof value {
    string string_value = 1;
    bool bool_value = 2;
    int64 int_value = 3;
    double double_value = 4;
    ArrayValue array_value = 5;
    KeyValueList kvlist_value = 6;
    bytes bytes_value = 7;
  }
}

// ArrayValue is a list of AnyValue messages. We need ArrayValue as a message
// since oneof in AnyValue does not allow repeated fields.
message ArrayValue {
  // Array of values. The array may be empty (contain 0 elements).
  repeated AnyValue values = 1;
}

// KeyValueList is a list of KeyValue messages. We need KeyValueList as a message
// since `oneof` in AnyValue does not allow repeated fields. Everywhere else where we need
// a list of KeyValue messages (e.g. in Span) we use `repeated KeyValue` directly to
// avoid unnecessary extra wrapping (which slows down the protocol). The 2 approaches
// are semantically equivalent.
message KeyValueList {
  // A collection of key/value pairs of key-value pairs. The list may be empty (may
  // contain 0 elements).
  // The keys MUST be unique (it is not allowed to have more than one
  // value with the same key).
  repeated KeyValue values = 1;
}

// KeyValue is a key-value pair that is used to store Span attributes, Link
// attributes, etc.
message KeyValue {
  string key = 1;
  AnyValue value = 2;
}

// InstrumentationScope is a message representing the instrumentation scope information
// such as the fully qualified name and version. 
message InstrumentationScope {
  // An empty instrumentation scope name means the name is unknown.
  string name = 1;
  string version = 2;
  repeated KeyValue attributes = 3;
  uint32 dropped_attributes_count = 4;
}


================================================
FILE: quickwit/quickwit-proto/protos/third-party/opentelemetry/proto/logs/v1/logs.proto
================================================
// Copyright 2020, OpenTelemetry Authors
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

syntax = "proto3";

package opentelemetry.proto.logs.v1;

import "opentelemetry/proto/common/v1/common.proto";
import "opentelemetry/proto/resource/v1/resource.proto";

option csharp_namespace = "OpenTelemetry.Proto.Logs.V1";
option java_multiple_files = true;
option java_package = "io.opentelemetry.proto.logs.v1";
option java_outer_classname = "LogsProto";
option go_package = "go.opentelemetry.io/proto/otlp/logs/v1";

// LogsData represents the logs data that can be stored in a persistent storage,
// OR can be embedded by other protocols that transfer OTLP logs data but do not
// implement the OTLP protocol.
//
// The main difference between this message and collector protocol is that
// in this message there will not be any "control" or "metadata" specific to
// OTLP protocol.
//
// When new fields are added into this message, the OTLP request MUST be updated
// as well.
message LogsData {
  // An array of ResourceLogs.
  // For data coming from a single resource this array will typically contain
  // one element. Intermediary nodes that receive data from multiple origins
  // typically batch the data before forwarding further and in that case this
  // array will contain multiple elements.
  repeated ResourceLogs resource_logs = 1;
}

// A collection of ScopeLogs from a Resource.
message ResourceLogs {
  reserved 1000;

  // The resource for the logs in this message.
  // If this field is not set then resource info is unknown.
  opentelemetry.proto.resource.v1.Resource resource = 1;

  // A list of ScopeLogs that originate from a resource.
  repeated ScopeLogs scope_logs = 2;

  // This schema_url applies to the data in the "resource" field. It does not apply
  // to the data in the "scope_logs" field which have their own schema_url field.
  string schema_url = 3;
}

// A collection of Logs produced by a Scope.
message ScopeLogs {
  // The instrumentation scope information for the logs in this message.
  // Semantically when InstrumentationScope isn't set, it is equivalent with
  // an empty instrumentation scope name (unknown).
  opentelemetry.proto.common.v1.InstrumentationScope scope = 1;

  // A list of log records.
  repeated LogRecord log_records = 2;

  // This schema_url applies to all logs in the "logs" field.
  string schema_url = 3;
}

// Possible values for LogRecord.SeverityNumber.
enum SeverityNumber {
  // UNSPECIFIED is the default SeverityNumber, it MUST NOT be used.
  SEVERITY_NUMBER_UNSPECIFIED = 0;
  SEVERITY_NUMBER_TRACE  = 1;
  SEVERITY_NUMBER_TRACE2 = 2;
  SEVERITY_NUMBER_TRACE3 = 3;
  SEVERITY_NUMBER_TRACE4 = 4;
  SEVERITY_NUMBER_DEBUG  = 5;
  SEVERITY_NUMBER_DEBUG2 = 6;
  SEVERITY_NUMBER_DEBUG3 = 7;
  SEVERITY_NUMBER_DEBUG4 = 8;
  SEVERITY_NUMBER_INFO   = 9;
  SEVERITY_NUMBER_INFO2  = 10;
  SEVERITY_NUMBER_INFO3  = 11;
  SEVERITY_NUMBER_INFO4  = 12;
  SEVERITY_NUMBER_WARN   = 13;
  SEVERITY_NUMBER_WARN2  = 14;
  SEVERITY_NUMBER_WARN3  = 15;
  SEVERITY_NUMBER_WARN4  = 16;
  SEVERITY_NUMBER_ERROR  = 17;
  SEVERITY_NUMBER_ERROR2 = 18;
  SEVERITY_NUMBER_ERROR3 = 19;
  SEVERITY_NUMBER_ERROR4 = 20;
  SEVERITY_NUMBER_FATAL  = 21;
  SEVERITY_NUMBER_FATAL2 = 22;
  SEVERITY_NUMBER_FATAL3 = 23;
  SEVERITY_NUMBER_FATAL4 = 24;
}

// Masks for LogRecord.flags field.
enum LogRecordFlags {
  LOG_RECORD_FLAG_UNSPECIFIED = 0;
  LOG_RECORD_FLAG_TRACE_FLAGS_MASK = 0x000000FF;
}

// A log record according to OpenTelemetry Log Data Model:
// https://github.com/open-telemetry/oteps/blob/main/text/logs/0097-log-data-model.md
message LogRecord {
  reserved 4;

  // time_unix_nano is the time when the event occurred.
  // Value is UNIX Epoch time in nanoseconds since 00:00:00 UTC on 1 January 1970.
  // Value of 0 indicates unknown or missing timestamp.
  fixed64 time_unix_nano = 1;

  // Time when the event was observed by the collection system.
  // For events that originate in OpenTelemetry (e.g. using OpenTelemetry Logging SDK)
  // this timestamp is typically set at the generation time and is equal to Timestamp.
  // For events originating externally and collected by OpenTelemetry (e.g. using
  // Collector) this is the time when OpenTelemetry's code observed the event measured
  // by the clock of the OpenTelemetry code. This field MUST be set once the event is
  // observed by OpenTelemetry.
  //
  // For converting OpenTelemetry log data to formats that support only one timestamp or
  // when receiving OpenTelemetry log data by recipients that support only one timestamp
  // internally the following logic is recommended:
  //   - Use time_unix_nano if it is present, otherwise use observed_time_unix_nano.
  //
  // Value is UNIX Epoch time in nanoseconds since 00:00:00 UTC on 1 January 1970.
  // Value of 0 indicates unknown or missing timestamp.
  fixed64 observed_time_unix_nano = 11;

  // Numerical value of the severity, normalized to values described in Log Data Model.
  // [Optional].
  SeverityNumber severity_number = 2;

  // The severity text (also known as log level). The original string representation as
  // it is known at the source. [Optional].
  string severity_text = 3;

  // A value containing the body of the log record. Can be for example a human-readable
  // string message (including multi-line) describing the event in a free form or it can
  // be a structured data composed of arrays and maps of other values. [Optional].
  opentelemetry.proto.common.v1.AnyValue body = 5;

  // Additional attributes that describe the specific event occurrence. [Optional].
  // Attribute keys MUST be unique (it is not allowed to have more than one
  // attribute with the same key).
  repeated opentelemetry.proto.common.v1.KeyValue attributes = 6;
  uint32 dropped_attributes_count = 7;

  // Flags, a bit field. 8 least significant bits are the trace flags as
  // defined in W3C Trace Context specification. 24 most significant bits are reserved
  // and must be set to 0. Readers must not assume that 24 most significant bits
  // will be zero and must correctly mask the bits when reading 8-bit trace flag (use
  // flags & TRACE_FLAGS_MASK). [Optional].
  fixed32 flags = 8;

  // A unique identifier for a trace. All logs from the same trace share
  // the same `trace_id`. The ID is a 16-byte array. An ID with all zeroes
  // is considered invalid. Can be set for logs that are part of request processing
  // and have an assigned trace id. [Optional].
  bytes trace_id = 9;

  // A unique identifier for a span within a trace, assigned when the span
  // is created. The ID is an 8-byte array. An ID with all zeroes is considered
  // invalid. Can be set for logs that are part of a particular processing span.
  // If span_id is present trace_id SHOULD be also present. [Optional].
  bytes span_id = 10;
}


================================================
FILE: quickwit/quickwit-proto/protos/third-party/opentelemetry/proto/metrics/v1/metrics.proto
================================================
// Copyright 2019, OpenTelemetry Authors
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

syntax = "proto3";

package opentelemetry.proto.metrics.v1;

import "opentelemetry/proto/common/v1/common.proto";
import "opentelemetry/proto/resource/v1/resource.proto";

option csharp_namespace = "OpenTelemetry.Proto.Metrics.V1";
option java_multiple_files = true;
option java_package = "io.opentelemetry.proto.metrics.v1";
option java_outer_classname = "MetricsProto";
option go_package = "go.opentelemetry.io/proto/otlp/metrics/v1";

// MetricsData represents the metrics data that can be stored in a persistent
// storage, OR can be embedded by other protocols that transfer OTLP metrics
// data but do not implement the OTLP protocol.
//
// The main difference between this message and collector protocol is that
// in this message there will not be any "control" or "metadata" specific to
// OTLP protocol.
//
// When new fields are added into this message, the OTLP request MUST be updated
// as well.
message MetricsData {
  // An array of ResourceMetrics.
  // For data coming from a single resource this array will typically contain
  // one element. Intermediary nodes that receive data from multiple origins
  // typically batch the data before forwarding further and in that case this
  // array will contain multiple elements.
  repeated ResourceMetrics resource_metrics = 1;
}

// A collection of ScopeMetrics from a Resource.
message ResourceMetrics {
  reserved 1000;

  // The resource for the metrics in this message.
  // If this field is not set then no resource info is known.
  opentelemetry.proto.resource.v1.Resource resource = 1;

  // A list of metrics that originate from a resource.
  repeated ScopeMetrics scope_metrics = 2;

  // This schema_url applies to the data in the "resource" field. It does not apply
  // to the data in the "scope_metrics" field which have their own schema_url field.
  string schema_url = 3;
}

// A collection of Metrics produced by an Scope.
message ScopeMetrics {
  // The instrumentation scope information for the metrics in this message.
  // Semantically when InstrumentationScope isn't set, it is equivalent with
  // an empty instrumentation scope name (unknown).
  opentelemetry.proto.common.v1.InstrumentationScope scope = 1;

  // A list of metrics that originate from an instrumentation library.
  repeated Metric metrics = 2;

  // This schema_url applies to all metrics in the "metrics" field.
  string schema_url = 3;
}

// Defines a Metric which has one or more timeseries.  The following is a
// brief summary of the Metric data model.  For more details, see:
//
//   https://github.com/open-telemetry/opentelemetry-specification/blob/main/specification/metrics/data-model.md
//
//
// The data model and relation between entities is shown in the
// diagram below. Here, "DataPoint" is the term used to refer to any
// one of the specific data point value types, and "points" is the term used
// to refer to any one of the lists of points contained in the Metric.
//
// - Metric is composed of a metadata and data.
// - Metadata part contains a name, description, unit.
// - Data is one of the possible types (Sum, Gauge, Histogram, Summary).
// - DataPoint contains timestamps, attributes, and one of the possible value type
//   fields.
//
//     Metric
//  +------------+
//  |name        |
//  |description |
//  |unit        |     +------------------------------------+
//  |data        |---> |Gauge, Sum, Histogram, Summary, ... |
//  +------------+     +------------------------------------+
//
//    Data [One of Gauge, Sum, Histogram, Summary, ...]
//  +-----------+
//  |...        |  // Metadata about the Data.
//  |points     |--+
//  +-----------+  |
//                 |      +---------------------------+
//                 |      |DataPoint 1                |
//                 v      |+------+------+   +------+ |
//              +-----+   ||label |label |...|label | |
//              |  1  |-->||value1|value2|...|valueN| |
//              +-----+   |+------+------+   +------+ |
//              |  .  |   |+-----+                    |
//              |  .  |   ||value|                    |
//              |  .  |   |+-----+                    |
//              |  .  |   +---------------------------+
//              |  .  |                   .
//              |  .  |                   .
//              |  .  |                   .
//              |  .  |   +---------------------------+
//              |  .  |   |DataPoint M                |
//              +-----+   |+------+------+   +------+ |
//              |  M  |-->||label |label |...|label | |
//              +-----+   ||value1|value2|...|valueN| |
//                        |+------+------+   +------+ |
//                        |+-----+                    |
//                        ||value|                    |
//                        |+-----+                    |
//                        +---------------------------+
//
// Each distinct type of DataPoint represents the output of a specific
// aggregation function, the result of applying the DataPoint's
// associated function of to one or more measurements.
//
// All DataPoint types have three common fields:
// - Attributes includes key-value pairs associated with the data point
// - TimeUnixNano is required, set to the end time of the aggregation
// - StartTimeUnixNano is optional, but strongly encouraged for DataPoints
//   having an AggregationTemporality field, as discussed below.
//
// Both TimeUnixNano and StartTimeUnixNano values are expressed as
// UNIX Epoch time in nanoseconds since 00:00:00 UTC on 1 January 1970.
//
// # TimeUnixNano
//
// This field is required, having consistent interpretation across
// DataPoint types.  TimeUnixNano is the moment corresponding to when
// the data point's aggregate value was captured.
//
// Data points with the 0 value for TimeUnixNano SHOULD be rejected
// by consumers.
//
// # StartTimeUnixNano
//
// StartTimeUnixNano in general allows detecting when a sequence of
// observations is unbroken.  This field indicates to consumers the
// start time for points with cumulative and delta
// AggregationTemporality, and it should be included whenever possible
// to support correct rate calculation.  Although it may be omitted
// when the start time is truly unknown, setting StartTimeUnixNano is
// strongly encouraged.
message Metric {
  reserved 4, 6, 8;

  // name of the metric, including its DNS name prefix. It must be unique.
  string name = 1;

  // description of the metric, which can be used in documentation.
  string description = 2;

  // unit in which the metric value is reported. Follows the format
  // described by http://unitsofmeasure.org/ucum.html.
  string unit = 3;

  // Data determines the aggregation type (if any) of the metric, what is the
  // reported value type for the data points, as well as the relatationship to
  // the time interval over which they are reported.
  oneof data {
    Gauge gauge = 5;
    Sum sum = 7;
    Histogram histogram = 9;
    ExponentialHistogram exponential_histogram = 10;
    Summary summary = 11;
  }
}

// Gauge represents the type of a scalar metric that always exports the
// "current value" for every data point. It should be used for an "unknown"
// aggregation.
//
// A Gauge does not support different aggregation temporalities. Given the
// aggregation is unknown, points cannot be combined using the same
// aggregation, regardless of aggregation temporalities. Therefore,
// AggregationTemporality is not included. Consequently, this also means
// "StartTimeUnixNano" is ignored for all data points.
message Gauge {
  repeated NumberDataPoint data_points = 1;
}

// Sum represents the type of a scalar metric that is calculated as a sum of all
// reported measurements over a time interval.
message Sum {
  repeated NumberDataPoint data_points = 1;

  // aggregation_temporality describes if the aggregator reports delta changes
  // since last report time, or cumulative changes since a fixed start time.
  AggregationTemporality aggregation_temporality = 2;

  // If "true" means that the sum is monotonic.
  bool is_monotonic = 3;
}

// Histogram represents the type of a metric that is calculated by aggregating
// as a Histogram of all reported measurements over a time interval.
message Histogram {
  repeated HistogramDataPoint data_points = 1;

  // aggregation_temporality describes if the aggregator reports delta changes
  // since last report time, or cumulative changes since a fixed start time.
  AggregationTemporality aggregation_temporality = 2;
}

// ExponentialHistogram represents the type of a metric that is calculated by aggregating
// as a ExponentialHistogram of all reported double measurements over a time interval.
message ExponentialHistogram {
  repeated ExponentialHistogramDataPoint data_points = 1;

  // aggregation_temporality describes if the aggregator reports delta changes
  // since last report time, or cumulative changes since a fixed start time.
  AggregationTemporality aggregation_temporality = 2;
}

// Summary metric data are used to convey quantile summaries,
// a Prometheus (see: https://prometheus.io/docs/concepts/metric_types/#summary)
// and OpenMetrics (see: https://github.com/OpenObservability/OpenMetrics/blob/4dbf6075567ab43296eed941037c12951faafb92/protos/prometheus.proto#L45)
// data type. These data points cannot always be merged in a meaningful way.
// While they can be useful in some applications, histogram data points are
// recommended for new applications.
message Summary {
  repeated SummaryDataPoint data_points = 1;
}

// AggregationTemporality defines how a metric aggregator reports aggregated
// values. It describes how those values relate to the time interval over
// which they are aggregated.
enum AggregationTemporality {
  // UNSPECIFIED is the default AggregationTemporality, it MUST not be used.
  AGGREGATION_TEMPORALITY_UNSPECIFIED = 0;

  // DELTA is an AggregationTemporality for a metric aggregator which reports
  // changes since last report time. Successive metrics contain aggregation of
  // values from continuous and non-overlapping intervals.
  //
  // The values for a DELTA metric are based only on the time interval
  // associated with one measurement cycle. There is no dependency on
  // previous measurements like is the case for CUMULATIVE metrics.
  //
  // For example, consider a system measuring the number of requests that
  // it receives and reports the sum of these requests every second as a
  // DELTA metric:
  //
  //   1. The system starts receiving at time=t_0.
  //   2. A request is received, the system measures 1 request.
  //   3. A request is received, the system measures 1 request.
  //   4. A request is received, the system measures 1 request.
  //   5. The 1 second collection cycle ends. A metric is exported for the
  //      number of requests received over the interval of time t_0 to
  //      t_0+1 with a value of 3.
  //   6. A request is received, the system measures 1 request.
  //   7. A request is received, the system measures 1 request.
  //   8. The 1 second collection cycle ends. A metric is exported for the
  //      number of requests received over the interval of time t_0+1 to
  //      t_0+2 with a value of 2.
  AGGREGATION_TEMPORALITY_DELTA = 1;

  // CUMULATIVE is an AggregationTemporality for a metric aggregator which
  // reports changes since a fixed start time. This means that current values
  // of a CUMULATIVE metric depend on all previous measurements since the
  // start time. Because of this, the sender is required to retain this state
  // in some form. If this state is lost or invalidated, the CUMULATIVE metric
  // values MUST be reset and a new fixed start time following the last
  // reported measurement time sent MUST be used.
  //
  // For example, consider a system measuring the number of requests that
  // it receives and reports the sum of these requests every second as a
  // CUMULATIVE metric:
  //
  //   1. The system starts receiving at time=t_0.
  //   2. A request is received, the system measures 1 request.
  //   3. A request is received, the system measures 1 request.
  //   4. A request is received, the system measures 1 request.
  //   5. The 1 second collection cycle ends. A metric is exported for the
  //      number of requests received over the interval of time t_0 to
  //      t_0+1 with a value of 3.
  //   6. A request is received, the system measures 1 request.
  //   7. A request is received, the system measures 1 request.
  //   8. The 1 second collection cycle ends. A metric is exported for the
  //      number of requests received over the interval of time t_0 to
  //      t_0+2 with a value of 5.
  //   9. The system experiences a fault and loses state.
  //   10. The system recovers and resumes receiving at time=t_1.
  //   11. A request is received, the system measures 1 request.
  //   12. The 1 second collection cycle ends. A metric is exported for the
  //      number of requests received over the interval of time t_1 to
  //      t_0+1 with a value of 1.
  //
  // Note: Even though, when reporting changes since last report time, using
  // CUMULATIVE is valid, it is not recommended. This may cause problems for
  // systems that do not use start_time to determine when the aggregation
  // value was reset (e.g. Prometheus).
  AGGREGATION_TEMPORALITY_CUMULATIVE = 2;
}

// DataPointFlags is defined as a protobuf 'uint32' type and is to be used as a
// bit-field representing 32 distinct boolean flags.  Each flag defined in this
// enum is a bit-mask.  To test the presence of a single flag in the flags of
// a data point, for example, use an expression like:
//
//   (point.flags & FLAG_NO_RECORDED_VALUE) == FLAG_NO_RECORDED_VALUE
//
enum DataPointFlags {
  FLAG_NONE = 0;

  // This DataPoint is valid but has no recorded value.  This value
  // SHOULD be used to reflect explicitly missing data in a series, as
  // for an equivalent to the Prometheus "staleness marker".
  FLAG_NO_RECORDED_VALUE = 1;

  // Bits 2-31 are reserved for future use.
}

// NumberDataPoint is a single data point in a timeseries that describes the
// time-varying scalar value of a metric.
message NumberDataPoint {
  reserved 1;

  // The set of key/value pairs that uniquely identify the timeseries from
  // where this point belongs. The list may be empty (may contain 0 elements).
  // Attribute keys MUST be unique (it is not allowed to have more than one
  // attribute with the same key).
  repeated opentelemetry.proto.common.v1.KeyValue attributes = 7;

  // StartTimeUnixNano is optional but strongly encouraged, see the
  // the detailed comments above Metric.
  //
  // Value is UNIX Epoch time in nanoseconds since 00:00:00 UTC on 1 January
  // 1970.
  fixed64 start_time_unix_nano = 2;

  // TimeUnixNano is required, see the detailed comments above Metric.
  //
  // Value is UNIX Epoch time in nanoseconds since 00:00:00 UTC on 1 January
  // 1970.
  fixed64 time_unix_nano = 3;

  // The value itself.  A point is considered invalid when one of the recognized
  // value fields is not present inside this oneof.
  oneof value {
    double as_double = 4;
    sfixed64 as_int = 6;
  }

  // (Optional) List of exemplars collected from
  // measurements that were used to form the data point
  repeated Exemplar exemplars = 5;

  // Flags that apply to this specific data point.  See DataPointFlags
  // for the available flags and their meaning.
  uint32 flags = 8;
}

// HistogramDataPoint is a single data point in a timeseries that describes the
// time-varying values of a Histogram. A Histogram contains summary statistics
// for a population of values, it may optionally contain the distribution of
// those values across a set of buckets.
//
// If the histogram contains the distribution of values, then both
// "explicit_bounds" and "bucket counts" fields must be defined.
// If the histogram does not contain the distribution of values, then both
// "explicit_bounds" and "bucket_counts" must be omitted and only "count" and
// "sum" are known.
message HistogramDataPoint {
  reserved 1;

  // The set of key/value pairs that uniquely identify the timeseries from
  // where this point belongs. The list may be empty (may contain 0 elements).
  // Attribute keys MUST be unique (it is not allowed to have more than one
  // attribute with the same key).
  repeated opentelemetry.proto.common.v1.KeyValue attributes = 9;

  // StartTimeUnixNano is optional but strongly encouraged, see the
  // the detailed comments above Metric.
  //
  // Value is UNIX Epoch time in nanoseconds since 00:00:00 UTC on 1 January
  // 1970.
  fixed64 start_time_unix_nano = 2;

  // TimeUnixNano is required, see the detailed comments above Metric.
  //
  // Value is UNIX Epoch time in nanoseconds since 00:00:00 UTC on 1 January
  // 1970.
  fixed64 time_unix_nano = 3;

  // count is the number of values in the population. Must be non-negative. This
  // value must be equal to the sum of the "count" fields in buckets if a
  // histogram is provided.
  fixed64 count = 4;

  // sum of the values in the population. If count is zero then this field
  // must be zero.
  //
  // Note: Sum should only be filled out when measuring non-negative discrete
  // events, and is assumed to be monotonic over the values of these events.
  // Negative events *can* be recorded, but sum should not be filled out when
  // doing so.  This is specifically to enforce compatibility w/ OpenMetrics,
  // see: https://github.com/OpenObservability/OpenMetrics/blob/main/specification/OpenMetrics.md#histogram
  optional double sum = 5;

  // bucket_counts is an optional field contains the count values of histogram
  // for each bucket.
  //
  // The sum of the bucket_counts must equal the value in the count field.
  //
  // The number of elements in bucket_counts array must be by one greater than
  // the number of elements in explicit_bounds array.
  repeated fixed64 bucket_counts = 6;

  // explicit_bounds specifies buckets with explicitly defined bounds for values.
  //
  // The boundaries for bucket at index i are:
  //
  // (-infinity, explicit_bounds[i]] for i == 0
  // (explicit_bounds[i-1], explicit_bounds[i]] for 0 < i < size(explicit_bounds)
  // (explicit_bounds[i-1], +infinity) for i == size(explicit_bounds)
  //
  // The values in the explicit_bounds array must be strictly increasing.
  //
  // Histogram buckets are inclusive of their upper boundary, except the last
  // bucket where the boundary is at infinity. This format is intentionally
  // compatible with the OpenMetrics histogram definition.
  repeated double explicit_bounds = 7;

  // (Optional) List of exemplars collected from
  // measurements that were used to form the data point
  repeated Exemplar exemplars = 8;

  // Flags that apply to this specific data point.  See DataPointFlags
  // for the available flags and their meaning.
  uint32 flags = 10;

  // min is the minimum value over (start_time, end_time].
  optional double min = 11;

  // max is the maximum value over (start_time, end_time].
  optional double max = 12;
}

// ExponentialHistogramDataPoint is a single data point in a timeseries that describes the
// time-varying values of a ExponentialHistogram of double values. A ExponentialHistogram contains
// summary statistics for a population of values, it may optionally contain the
// distribution of those values across a set of buckets.
//
message ExponentialHistogramDataPoint {
  // The set of key/value pairs that uniquely identify the timeseries from
  // where this point belongs. The list may be empty (may contain 0 elements).
  // Attribute keys MUST be unique (it is not allowed to have more than one
  // attribute with the same key).
  repeated opentelemetry.proto.common.v1.KeyValue attributes = 1;

  // StartTimeUnixNano is optional but strongly encouraged, see the
  // the detailed comments above Metric.
  //
  // Value is UNIX Epoch time in nanoseconds since 00:00:00 UTC on 1 January
  // 1970.
  fixed64 start_time_unix_nano = 2;

  // TimeUnixNano is required, see the detailed comments above Metric.
  //
  // Value is UNIX Epoch time in nanoseconds since 00:00:00 UTC on 1 January
  // 1970.
  fixed64 time_unix_nano = 3;

  // count is the number of values in the population. Must be
  // non-negative. This value must be equal to the sum of the "bucket_counts"
  // values in the positive and negative Buckets plus the "zero_count" field.
  fixed64 count = 4;

  // sum of the values in the population. If count is zero then this field
  // must be zero.
  //
  // Note: Sum should only be filled out when measuring non-negative discrete
  // events, and is assumed to be monotonic over the values of these events.
  // Negative events *can* be recorded, but sum should not be filled out when
  // doing so.  This is specifically to enforce compatibility w/ OpenMetrics,
  // see: https://github.com/OpenObservability/OpenMetrics/blob/main/specification/OpenMetrics.md#histogram
  optional double sum = 5;
  
  // scale describes the resolution of the histogram.  Boundaries are
  // located at powers of the base, where:
  //
  //   base = (2^(2^-scale))
  //
  // The histogram bucket identified by `index`, a signed integer,
  // contains values that are greater than (base^index) and
  // less than or equal to (base^(index+1)).
  //
  // The positive and negative ranges of the histogram are expressed
  // separately.  Negative values are mapped by their absolute value
  // into the negative range using the same scale as the positive range.
  //
  // scale is not restricted by the protocol, as the permissible
  // values depend on the range of the data.
  sint32 scale = 6;

  // zero_count is the count of values that are either exactly zero or
  // within the region considered zero by the instrumentation at the
  // tolerated degree of precision.  This bucket stores values that
  // cannot be expressed using the standard exponential formula as
  // well as values that have been rounded to zero.
  //
  // Implementations MAY consider the zero bucket to have probability
  // mass equal to (zero_count / count).
  fixed64 zero_count = 7;

  // positive carries the positive range of exponential bucket counts.
  Buckets positive = 8;

  // negative carries the negative range of exponential bucket counts.
  Buckets negative = 9;

  // Buckets are a set of bucket counts, encoded in a contiguous array
  // of counts.
  message Buckets {
    // Offset is the bucket index of the first entry in the bucket_counts array.
    // 
    // Note: This uses a varint encoding as a simple form of compression.
    sint32 offset = 1;

    // Count is an array of counts, where count[i] carries the count
    // of the bucket at index (offset+i).  count[i] is the count of
    // values greater than base^(offset+i) and less or equal to than
    // base^(offset+i+1).
    //
    // Note: By contrast, the explicit HistogramDataPoint uses
    // fixed64.  This field is expected to have many buckets,
    // especially zeros, so uint64 has been selected to ensure
    // varint encoding.
    repeated uint64 bucket_counts = 2;
  } 

  // Flags that apply to this specific data point.  See DataPointFlags
  // for the available flags and their meaning.
  uint32 flags = 10;

  // (Optional) List of exemplars collected from
  // measurements that were used to form the data point
  repeated Exemplar exemplars = 11;

  // min is the minimum value over (start_time, end_time].
  optional double min = 12;

  // max is the maximum value over (start_time, end_time].
  optional double max = 13;
}

// SummaryDataPoint is a single data point in a timeseries that describes the
// time-varying values of a Summary metric.
message SummaryDataPoint {
  reserved 1;

  // The set of key/value pairs that uniquely identify the timeseries from
  // where this point belongs. The list may be empty (may contain 0 elements).
  // Attribute keys MUST be unique (it is not allowed to have more than one
  // attribute with the same key).
  repeated opentelemetry.proto.common.v1.KeyValue attributes = 7;

  // StartTimeUnixNano is optional but strongly encouraged, see the
  // the detailed comments above Metric.
  //
  // Value is UNIX Epoch time in nanoseconds since 00:00:00 UTC on 1 January
  // 1970.
  fixed64 start_time_unix_nano = 2;

  // TimeUnixNano is required, see the detailed comments above Metric.
  //
  // Value is UNIX Epoch time in nanoseconds since 00:00:00 UTC on 1 January
  // 1970.
  fixed64 time_unix_nano = 3;

  // count is the number of values in the population. Must be non-negative.
  fixed64 count = 4;

  // sum of the values in the population. If count is zero then this field
  // must be zero.
  //
  // Note: Sum should only be filled out when measuring non-negative discrete
  // events, and is assumed to be monotonic over the values of these events.
  // Negative events *can* be recorded, but sum should not be filled out when
  // doing so.  This is specifically to enforce compatibility w/ OpenMetrics,
  // see: https://github.com/OpenObservability/OpenMetrics/blob/main/specification/OpenMetrics.md#summary
  double sum = 5;

  // Represents the value at a given quantile of a distribution.
  //
  // To record Min and Max values following conventions are used:
  // - The 1.0 quantile is equivalent to the maximum value observed.
  // - The 0.0 quantile is equivalent to the minimum value observed.
  //
  // See the following issue for more context:
  // https://github.com/open-telemetry/opentelemetry-proto/issues/125
  message ValueAtQuantile {
    // The quantile of a distribution. Must be in the interval
    // [0.0, 1.0].
    double quantile = 1;

    // The value at the given quantile of a distribution.
    //
    // Quantile values must NOT be negative.
    double value = 2;
  }

  // (Optional) list of values at different quantiles of the distribution calculated
  // from the current snapshot. The quantiles must be strictly increasing.
  repeated ValueAtQuantile quantile_values = 6;

  // Flags that apply to this specific data point.  See DataPointFlags
  // for the available flags and their meaning.
  uint32 flags = 8;
}

// A representation of an exemplar, which is a sample input measurement.
// Exemplars also hold information about the environment when the measurement
// was recorded, for example the span and trace ID of the active span when the
// exemplar was recorded.
message Exemplar {
  reserved 1;

  // The set of key/value pairs that were filtered out by the aggregator, but
  // recorded alongside the original measurement. Only key/value pairs that were
  // filtered out by the aggregator should be included
  repeated opentelemetry.proto.common.v1.KeyValue filtered_attributes = 7;

  // time_unix_nano is the exact time when this exemplar was recorded
  //
  // Value is UNIX Epoch time in nanoseconds since 00:00:00 UTC on 1 January
  // 1970.
  fixed64 time_unix_nano = 2;

  // The value of the measurement that was recorded. An exemplar is
  // considered invalid when one of the recognized value fields is not present
  // inside this oneof.
  oneof value {
    double as_double = 3;
    sfixed64 as_int = 6;
  }

  // (Optional) Span ID of the exemplar trace.
  // span_id may be missing if the measurement is not recorded inside a trace
  // or if the trace is not sampled.
  bytes span_id = 4;

  // (Optional) Trace ID of the exemplar trace.
  // trace_id may be missing if the measurement is not recorded inside a trace
  // or if the trace is not sampled.
  bytes trace_id = 5;
}


================================================
FILE: quickwit/quickwit-proto/protos/third-party/opentelemetry/proto/resource/v1/resource.proto
================================================
// Copyright 2019, OpenTelemetry Authors
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

syntax = "proto3";

package opentelemetry.proto.resource.v1;

import "opentelemetry/proto/common/v1/common.proto";

option csharp_namespace = "OpenTelemetry.Proto.Resource.V1";
option java_multiple_files = true;
option java_package = "io.opentelemetry.proto.resource.v1";
option java_outer_classname = "ResourceProto";
option go_package = "go.opentelemetry.io/proto/otlp/resource/v1";

// Resource information.
message Resource {
  // Set of attributes that describe the resource.
  // Attribute keys MUST be unique (it is not allowed to have more than one
  // attribute with the same key).
  repeated opentelemetry.proto.common.v1.KeyValue attributes = 1;

  // dropped_attributes_count is the number of dropped attributes. If the value is 0, then
  // no attributes were dropped.
  uint32 dropped_attributes_count = 2;
}


================================================
FILE: quickwit/quickwit-proto/protos/third-party/opentelemetry/proto/trace/v1/trace.proto
================================================
// Copyright 2019, OpenTelemetry Authors
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

syntax = "proto3";

package opentelemetry.proto.trace.v1;

import "opentelemetry/proto/common/v1/common.proto";
import "opentelemetry/proto/resource/v1/resource.proto";

option csharp_namespace = "OpenTelemetry.Proto.Trace.V1";
option java_multiple_files = true;
option java_package = "io.opentelemetry.proto.trace.v1";
option java_outer_classname = "TraceProto";
option go_package = "go.opentelemetry.io/proto/otlp/trace/v1";

// TracesData represents the traces data that can be stored in a persistent storage,
// OR can be embedded by other protocols that transfer OTLP traces data but do
// not implement the OTLP protocol.
//
// The main difference between this message and collector protocol is that
// in this message there will not be any "control" or "metadata" specific to
// OTLP protocol.
//
// When new fields are added into this message, the OTLP request MUST be updated
// as well.
message TracesData {
  // An array of ResourceSpans.
  // For data coming from a single resource this array will typically contain
  // one element. Intermediary nodes that receive data from multiple origins
  // typically batch the data before forwarding further and in that case this
  // array will contain multiple elements.
  repeated ResourceSpans resource_spans = 1;
}

// A collection of ScopeSpans from a Resource.
message ResourceSpans {
  reserved 1000;

  // The resource for the spans in this message.
  // If this field is not set then no resource info is known.
  opentelemetry.proto.resource.v1.Resource resource = 1;

  // A list of ScopeSpans that originate from a resource.
  repeated ScopeSpans scope_spans = 2;

  // This schema_url applies to the data in the "resource" field. It does not apply
  // to the data in the "scope_spans" field which have their own schema_url field.
  string schema_url = 3;
}

// A collection of Spans produced by an InstrumentationScope.
message ScopeSpans {
  // The instrumentation scope information for the spans in this message.
  // Semantically when InstrumentationScope isn't set, it is equivalent with
  // an empty instrumentation scope name (unknown).
  opentelemetry.proto.common.v1.InstrumentationScope scope = 1;

  // A list of Spans that originate from an instrumentation scope.
  repeated Span spans = 2;

  // This schema_url applies to all spans and span events in the "spans" field.
  string schema_url = 3;
}

// A Span represents a single operation performed by a single component of the system.
//
// The next available field id is 17.
message Span {
  // A unique identifier for a trace. All spans from the same trace share
  // the same `trace_id`. The ID is a 16-byte array. An ID with all zeroes
  // is considered invalid.
  //
  // This field is semantically required. Receiver should generate new
  // random trace_id if empty or invalid trace_id was received.
  //
  // This field is required.
  bytes trace_id = 1;

  // A unique identifier for a span within a trace, assigned when the span
  // is created. The ID is an 8-byte array. An ID with all zeroes is considered
  // invalid.
  //
  // This field is semantically required. Receiver should generate new
  // random span_id if empty or invalid span_id was received.
  //
  // This field is required.
  bytes span_id = 2;

  // trace_state conveys information about request position in multiple distributed tracing graphs.
  // It is a trace_state in w3c-trace-context format: https://www.w3.org/TR/trace-context/#tracestate-header
  // See also https://github.com/w3c/distributed-tracing for more details about this field.
  string trace_state = 3;

  // The `span_id` of this span's parent span. If this is a root span, then this
  // field must be empty. The ID is an 8-byte array.
  bytes parent_span_id = 4;

  // A description of the span's operation.
  //
  // For example, the name can be a qualified method name or a file name
  // and a line number where the operation is called. A best practice is to use
  // the same display name at the same call point in an application.
  // This makes it easier to correlate spans in different traces.
  //
  // This field is semantically required to be set to non-empty string.
  // Empty value is equivalent to an unknown span name.
  //
  // This field is required.
  string name = 5;

  // SpanKind is the type of span. Can be used to specify additional relationships between spans
  // in addition to a parent/child relationship.
  enum SpanKind {
    // Unspecified. Do NOT use as default.
    // Implementations MAY assume SpanKind to be INTERNAL when receiving UNSPECIFIED.
    SPAN_KIND_UNSPECIFIED = 0;

    // Indicates that the span represents an internal operation within an application,
    // as opposed to an operation happening at the boundaries. Default value.
    SPAN_KIND_INTERNAL = 1;

    // Indicates that the span covers server-side handling of an RPC or other
    // remote network request.
    SPAN_KIND_SERVER = 2;

    // Indicates that the span describes a request to some remote service.
    SPAN_KIND_CLIENT = 3;

    // Indicates that the span describes a producer sending a message to a broker.
    // Unlike CLIENT and SERVER, there is often no direct critical path latency relationship
    // between producer and consumer spans. A PRODUCER span ends when the message was accepted
    // by the broker while the logical processing of the message might span a much longer time.
    SPAN_KIND_PRODUCER = 4;

    // Indicates that the span describes consumer receiving a message from a broker.
    // Like the PRODUCER kind, there is often no direct critical path latency relationship
    // between producer and consumer spans.
    SPAN_KIND_CONSUMER = 5;
  }

  // Distinguishes between spans generated in a particular context. For example,
  // two spans with the same name may be distinguished using `CLIENT` (caller)
  // and `SERVER` (callee) to identify queueing latency associated with the span.
  SpanKind kind = 6;

  // start_time_unix_nano is the start time of the span. On the client side, this is the time
  // kept by the local machine where the span execution starts. On the server side, this
  // is the time when the server's application handler starts running.
  // Value is UNIX Epoch time in nanoseconds since 00:00:00 UTC on 1 January 1970.
  //
  // This field is semantically required and it is expected that end_time >= start_time.
  fixed64 start_time_unix_nano = 7;

  // end_time_unix_nano is the end time of the span. On the client side, this is the time
  // kept by the local machine where the span execution ends. On the server side, this
  // is the time when the server application handler stops running.
  // Value is UNIX Epoch time in nanoseconds since 00:00:00 UTC on 1 January 1970.
  //
  // This field is semantically required and it is expected that end_time >= start_time.
  fixed64 end_time_unix_nano = 8;

  // attributes is a collection of key/value pairs. Note, global attributes
  // like server name can be set using the resource API. Examples of attributes:
  //
  //     "/http/user_agent": "Mozilla/5.0 (Macintosh; Intel Mac OS X 10_14_2) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/71.0.3578.98 Safari/537.36"
  //     "/http/server_latency": 300
  //     "abc.com/myattribute": true
  //     "abc.com/score": 10.239
  //
  // The OpenTelemetry API specification further restricts the allowed value types:
  // https://github.com/open-telemetry/opentelemetry-specification/blob/main/specification/common/README.md#attribute
  // Attribute keys MUST be unique (it is not allowed to have more than one
  // attribute with the same key).
  repeated opentelemetry.proto.common.v1.KeyValue attributes = 9;

  // dropped_attributes_count is the number of attributes that were discarded. Attributes
  // can be discarded because their keys are too long or because there are too many
  // attributes. If this value is 0, then no attributes were dropped.
  uint32 dropped_attributes_count = 10;

  // Event is a time-stamped annotation of the span, consisting of user-supplied
  // text description and key-value pairs.
  message Event {
    // time_unix_nano is the time the event occurred.
    fixed64 time_unix_nano = 1;

    // name of the event.
    // This field is semantically required to be set to non-empty string.
    string name = 2;

    // attributes is a collection of attribute key/value pairs on the event.
    // Attribute keys MUST be unique (it is not allowed to have more than one
    // attribute with the same key).
    repeated opentelemetry.proto.common.v1.KeyValue attributes = 3;

    // dropped_attributes_count is the number of dropped attributes. If the value is 0,
    // then no attributes were dropped.
    uint32 dropped_attributes_count = 4;
  }

  // events is a collection of Event items.
  repeated Event events = 11;

  // dropped_events_count is the number of dropped events. If the value is 0, then no
  // events were dropped.
  uint32 dropped_events_count = 12;

  // A pointer from the current span to another span in the same trace or in a
  // different trace. For example, this can be used in batching operations,
  // where a single batch handler processes multiple requests from different
  // traces or when the handler receives a request from a different project.
  message Link {
    // A unique identifier of a trace that this linked span is part of. The ID is a
    // 16-byte array.
    bytes trace_id = 1;

    // A unique identifier for the linked span. The ID is an 8-byte array.
    bytes span_id = 2;

    // The trace_state associated with the link.
    string trace_state = 3;

    // attributes is a collection of attribute key/value pairs on the link.
    // Attribute keys MUST be unique (it is not allowed to have more than one
    // attribute with the same key).
    repeated opentelemetry.proto.common.v1.KeyValue attributes = 4;

    // dropped_attributes_count is the number of dropped attributes. If the value is 0,
    // then no attributes were dropped.
    uint32 dropped_attributes_count = 5;
  }

  // links is a collection of Links, which are references from this span to a span
  // in the same or different trace.
  repeated Link links = 13;

  // dropped_links_count is the number of dropped links after the maximum size was
  // enforced. If this value is 0, then no links were dropped.
  uint32 dropped_links_count = 14;

  // An optional final status for this span. Semantically when Status isn't set, it means
  // span's status code is unset, i.e. assume STATUS_CODE_UNSET (code = 0).
  Status status = 15;
}

// The Status type defines a logical error model that is suitable for different
// programming environments, including REST APIs and RPC APIs.
message Status {
  reserved 1;

  // A developer-facing human readable error message.
  string message = 2;

  // For the semantics of status codes see
  // https://github.com/open-telemetry/opentelemetry-specification/blob/main/specification/trace/api.md#set-status
  enum StatusCode {
    // The default status.
    STATUS_CODE_UNSET               = 0;
    // The Span has been validated by an Application developer or Operator to 
    // have completed successfully.
    STATUS_CODE_OK                  = 1;
    // The Span contains an error.
    STATUS_CODE_ERROR               = 2;
  };

  // The status code.
  StatusCode code = 3;
}


================================================
FILE: quickwit/quickwit-proto/src/cluster/mod.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use quickwit_common::rate_limited_error;
use quickwit_common::tower::MakeLoadShedError;
use serde::{Deserialize, Serialize};
use thiserror;

use crate::GrpcServiceError;
use crate::error::{ServiceError, ServiceErrorCode};

include!("../codegen/quickwit/quickwit.cluster.rs");

pub const CLUSTER_PLANE_FILE_DESCRIPTOR_SET: &[u8] =
    include_bytes!("../codegen/quickwit/cluster_descriptor.bin");

pub type ClusterResult<T> = std::result::Result<T, ClusterError>;

#[derive(Debug, thiserror::Error, Eq, PartialEq, Serialize, Deserialize)]
#[serde(rename_all = "snake_case")]
pub enum ClusterError {
    #[error("internal error: {0}")]
    Internal(String),
    #[error("request timed out: {0}")]
    Timeout(String),
    #[error("too many requests")]
    TooManyRequests,
    #[error("service unavailable: {0}")]
    Unavailable(String),
}

impl ServiceError for ClusterError {
    fn error_code(&self) -> ServiceErrorCode {
        match self {
            Self::Internal(err_msg) => {
                rate_limited_error!(limit_per_min = 6, "cluster internal error: {err_msg}");
                ServiceErrorCode::Internal
            }
            Self::Timeout(_) => ServiceErrorCode::Timeout,
            Self::TooManyRequests => ServiceErrorCode::TooManyRequests,
            Self::Unavailable(_) => ServiceErrorCode::Unavailable,
        }
    }
}

impl GrpcServiceError for ClusterError {
    fn new_internal(message: String) -> Self {
        Self::Internal(message)
    }

    fn new_timeout(message: String) -> Self {
        Self::Timeout(message)
    }

    fn new_too_many_requests() -> Self {
        Self::TooManyRequests
    }

    fn new_unavailable(message: String) -> Self {
        Self::Unavailable(message)
    }
}

impl MakeLoadShedError for ClusterError {
    fn make_load_shed_error() -> Self {
        ClusterError::TooManyRequests
    }
}


================================================
FILE: quickwit/quickwit-proto/src/codegen/jaeger/jaeger.api_v2.rs
================================================
// This file is @generated by prost-build.
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct KeyValue {
    #[prost(string, tag = "1")]
    pub key: ::prost::alloc::string::String,
    #[prost(enumeration = "ValueType", tag = "2")]
    pub v_type: i32,
    #[prost(string, tag = "3")]
    pub v_str: ::prost::alloc::string::String,
    #[prost(bool, tag = "4")]
    pub v_bool: bool,
    #[prost(int64, tag = "5")]
    pub v_int64: i64,
    #[prost(double, tag = "6")]
    pub v_float64: f64,
    #[prost(bytes = "vec", tag = "7")]
    pub v_binary: ::prost::alloc::vec::Vec<u8>,
}
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct Log {
    #[prost(message, optional, tag = "1")]
    pub timestamp: ::core::option::Option<::prost_types::Timestamp>,
    #[prost(message, repeated, tag = "2")]
    pub fields: ::prost::alloc::vec::Vec<KeyValue>,
}
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct SpanRef {
    #[prost(bytes = "vec", tag = "1")]
    pub trace_id: ::prost::alloc::vec::Vec<u8>,
    #[prost(bytes = "vec", tag = "2")]
    pub span_id: ::prost::alloc::vec::Vec<u8>,
    #[prost(enumeration = "SpanRefType", tag = "3")]
    pub ref_type: i32,
}
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct Process {
    #[prost(string, tag = "1")]
    pub service_name: ::prost::alloc::string::String,
    #[prost(message, repeated, tag = "2")]
    pub tags: ::prost::alloc::vec::Vec<KeyValue>,
}
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct Span {
    #[prost(bytes = "vec", tag = "1")]
    pub trace_id: ::prost::alloc::vec::Vec<u8>,
    #[prost(bytes = "vec", tag = "2")]
    pub span_id: ::prost::alloc::vec::Vec<u8>,
    #[prost(string, tag = "3")]
    pub operation_name: ::prost::alloc::string::String,
    #[prost(message, repeated, tag = "4")]
    pub references: ::prost::alloc::vec::Vec<SpanRef>,
    #[prost(uint32, tag = "5")]
    pub flags: u32,
    #[prost(message, optional, tag = "6")]
    pub start_time: ::core::option::Option<::prost_types::Timestamp>,
    #[prost(message, optional, tag = "7")]
    pub duration: ::core::option::Option<::prost_types::Duration>,
    #[prost(message, repeated, tag = "8")]
    pub tags: ::prost::alloc::vec::Vec<KeyValue>,
    #[prost(message, repeated, tag = "9")]
    pub logs: ::prost::alloc::vec::Vec<Log>,
    #[prost(message, optional, tag = "10")]
    pub process: ::core::option::Option<Process>,
    #[prost(string, tag = "11")]
    pub process_id: ::prost::alloc::string::String,
    #[prost(string, repeated, tag = "12")]
    pub warnings: ::prost::alloc::vec::Vec<::prost::alloc::string::String>,
}
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct Trace {
    #[prost(message, repeated, tag = "1")]
    pub spans: ::prost::alloc::vec::Vec<Span>,
    #[prost(message, repeated, tag = "2")]
    pub process_map: ::prost::alloc::vec::Vec<trace::ProcessMapping>,
    #[prost(string, repeated, tag = "3")]
    pub warnings: ::prost::alloc::vec::Vec<::prost::alloc::string::String>,
}
/// Nested message and enum types in `Trace`.
pub mod trace {
    #[derive(Clone, PartialEq, ::prost::Message)]
    pub struct ProcessMapping {
        #[prost(string, tag = "1")]
        pub process_id: ::prost::alloc::string::String,
        #[prost(message, optional, tag = "2")]
        pub process: ::core::option::Option<super::Process>,
    }
}
/// Note that both Span and Batch may contain a Process.
/// This is different from the Thrift model which was only used
/// for transport, because Proto model is also used by the backend
/// as the domain model, where once a batch is received it is split
/// into individual spans which are all processed independently,
/// and therefore they all need a Process. As far as on-the-wire
/// semantics, both Batch and Spans in the same message may contain
/// their own instances of Process, with span.Process taking priority
/// over batch.Process.
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct Batch {
    #[prost(message, repeated, tag = "1")]
    pub spans: ::prost::alloc::vec::Vec<Span>,
    #[prost(message, optional, tag = "2")]
    pub process: ::core::option::Option<Process>,
}
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct DependencyLink {
    #[prost(string, tag = "1")]
    pub parent: ::prost::alloc::string::String,
    #[prost(string, tag = "2")]
    pub child: ::prost::alloc::string::String,
    #[prost(uint64, tag = "3")]
    pub call_count: u64,
    #[prost(string, tag = "4")]
    pub source: ::prost::alloc::string::String,
}
#[derive(Clone, Copy, Debug, PartialEq, Eq, Hash, PartialOrd, Ord, ::prost::Enumeration)]
#[repr(i32)]
pub enum ValueType {
    String = 0,
    Bool = 1,
    Int64 = 2,
    Float64 = 3,
    Binary = 4,
}
impl ValueType {
    /// String value of the enum field names used in the ProtoBuf definition.
    ///
    /// The values are not transformed in any way and thus are considered stable
    /// (if the ProtoBuf definition does not change) and safe for programmatic use.
    pub fn as_str_name(&self) -> &'static str {
        match self {
            Self::String => "STRING",
            Self::Bool => "BOOL",
            Self::Int64 => "INT64",
            Self::Float64 => "FLOAT64",
            Self::Binary => "BINARY",
        }
    }
    /// Creates an enum from field names used in the ProtoBuf definition.
    pub fn from_str_name(value: &str) -> ::core::option::Option<Self> {
        match value {
            "STRING" => Some(Self::String),
            "BOOL" => Some(Self::Bool),
            "INT64" => Some(Self::Int64),
            "FLOAT64" => Some(Self::Float64),
            "BINARY" => Some(Self::Binary),
            _ => None,
        }
    }
}
#[derive(Clone, Copy, Debug, PartialEq, Eq, Hash, PartialOrd, Ord, ::prost::Enumeration)]
#[repr(i32)]
pub enum SpanRefType {
    ChildOf = 0,
    FollowsFrom = 1,
}
impl SpanRefType {
    /// String value of the enum field names used in the ProtoBuf definition.
    ///
    /// The values are not transformed in any way and thus are considered stable
    /// (if the ProtoBuf definition does not change) and safe for programmatic use.
    pub fn as_str_name(&self) -> &'static str {
        match self {
            Self::ChildOf => "CHILD_OF",
            Self::FollowsFrom => "FOLLOWS_FROM",
        }
    }
    /// Creates an enum from field names used in the ProtoBuf definition.
    pub fn from_str_name(value: &str) -> ::core::option::Option<Self> {
        match value {
            "CHILD_OF" => Some(Self::ChildOf),
            "FOLLOWS_FROM" => Some(Self::FollowsFrom),
            _ => None,
        }
    }
}


================================================
FILE: quickwit/quickwit-proto/src/codegen/jaeger/jaeger.storage.v1.rs
================================================
// This file is @generated by prost-build.
#[derive(Clone, Copy, PartialEq, Eq, Hash, ::prost::Message)]
pub struct GetDependenciesRequest {
    #[prost(message, optional, tag = "1")]
    pub start_time: ::core::option::Option<::prost_types::Timestamp>,
    #[prost(message, optional, tag = "2")]
    pub end_time: ::core::option::Option<::prost_types::Timestamp>,
}
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct GetDependenciesResponse {
    #[prost(message, repeated, tag = "1")]
    pub dependencies: ::prost::alloc::vec::Vec<super::super::api_v2::DependencyLink>,
}
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct WriteSpanRequest {
    #[prost(message, optional, tag = "1")]
    pub span: ::core::option::Option<super::super::api_v2::Span>,
}
/// empty; extensible in the future
#[derive(Clone, Copy, PartialEq, Eq, Hash, ::prost::Message)]
pub struct WriteSpanResponse {}
/// empty; extensible in the future
#[derive(Clone, Copy, PartialEq, Eq, Hash, ::prost::Message)]
pub struct CloseWriterRequest {}
/// empty; extensible in the future
#[derive(Clone, Copy, PartialEq, Eq, Hash, ::prost::Message)]
pub struct CloseWriterResponse {}
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct GetTraceRequest {
    #[prost(bytes = "vec", tag = "1")]
    pub trace_id: ::prost::alloc::vec::Vec<u8>,
}
#[derive(Clone, Copy, PartialEq, Eq, Hash, ::prost::Message)]
pub struct GetServicesRequest {}
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct GetServicesResponse {
    #[prost(string, repeated, tag = "1")]
    pub services: ::prost::alloc::vec::Vec<::prost::alloc::string::String>,
}
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct GetOperationsRequest {
    #[prost(string, tag = "1")]
    pub service: ::prost::alloc::string::String,
    #[prost(string, tag = "2")]
    pub span_kind: ::prost::alloc::string::String,
}
#[derive(Ord, PartialOrd)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct Operation {
    #[prost(string, tag = "1")]
    pub name: ::prost::alloc::string::String,
    #[prost(string, tag = "2")]
    pub span_kind: ::prost::alloc::string::String,
}
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct GetOperationsResponse {
    /// deprecated
    #[prost(string, repeated, tag = "1")]
    pub operation_names: ::prost::alloc::vec::Vec<::prost::alloc::string::String>,
    #[prost(message, repeated, tag = "2")]
    pub operations: ::prost::alloc::vec::Vec<Operation>,
}
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct TraceQueryParameters {
    #[prost(string, tag = "1")]
    pub service_name: ::prost::alloc::string::String,
    #[prost(string, tag = "2")]
    pub operation_name: ::prost::alloc::string::String,
    #[prost(map = "string, string", tag = "3")]
    pub tags: ::std::collections::HashMap<
        ::prost::alloc::string::String,
        ::prost::alloc::string::String,
    >,
    #[prost(message, optional, tag = "4")]
    pub start_time_min: ::core::option::Option<::prost_types::Timestamp>,
    #[prost(message, optional, tag = "5")]
    pub start_time_max: ::core::option::Option<::prost_types::Timestamp>,
    #[prost(message, optional, tag = "6")]
    pub duration_min: ::core::option::Option<::prost_types::Duration>,
    #[prost(message, optional, tag = "7")]
    pub duration_max: ::core::option::Option<::prost_types::Duration>,
    #[prost(int32, tag = "8")]
    pub num_traces: i32,
}
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct FindTracesRequest {
    #[prost(message, optional, tag = "1")]
    pub query: ::core::option::Option<TraceQueryParameters>,
}
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct SpansResponseChunk {
    #[prost(message, repeated, tag = "1")]
    pub spans: ::prost::alloc::vec::Vec<super::super::api_v2::Span>,
}
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct FindTraceIDsRequest {
    #[prost(message, optional, tag = "1")]
    pub query: ::core::option::Option<TraceQueryParameters>,
}
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct FindTraceIDsResponse {
    #[prost(bytes = "vec", repeated, tag = "1")]
    pub trace_ids: ::prost::alloc::vec::Vec<::prost::alloc::vec::Vec<u8>>,
}
/// empty; extensible in the future
#[derive(Clone, Copy, PartialEq, Eq, Hash, ::prost::Message)]
pub struct CapabilitiesRequest {}
#[derive(Clone, Copy, PartialEq, Eq, Hash, ::prost::Message)]
pub struct CapabilitiesResponse {
    #[prost(bool, tag = "1")]
    pub archive_span_reader: bool,
    #[prost(bool, tag = "2")]
    pub archive_span_writer: bool,
    #[prost(bool, tag = "3")]
    pub streaming_span_writer: bool,
}
/// Generated client implementations.
pub mod span_writer_plugin_client {
    #![allow(
        unused_variables,
        dead_code,
        missing_docs,
        clippy::wildcard_imports,
        clippy::let_unit_value,
    )]
    use tonic::codegen::*;
    use tonic::codegen::http::Uri;
    #[derive(Debug, Clone)]
    pub struct SpanWriterPluginClient<T> {
        inner: tonic::client::Grpc<T>,
    }
    impl SpanWriterPluginClient<tonic::transport::Channel> {
        /// Attempt to create a new client by connecting to a given endpoint.
        pub async fn connect<D>(dst: D) -> Result<Self, tonic::transport::Error>
        where
            D: TryInto<tonic::transport::Endpoint>,
            D::Error: Into<StdError>,
        {
            let conn = tonic::transport::Endpoint::new(dst)?.connect().await?;
            Ok(Self::new(conn))
        }
    }
    impl<T> SpanWriterPluginClient<T>
    where
        T: tonic::client::GrpcService<tonic::body::Body>,
        T::Error: Into<StdError>,
        T::ResponseBody: Body<Data = Bytes> + std::marker::Send + 'static,
        <T::ResponseBody as Body>::Error: Into<StdError> + std::marker::Send,
    {
        pub fn new(inner: T) -> Self {
            let inner = tonic::client::Grpc::new(inner);
            Self { inner }
        }
        pub fn with_origin(inner: T, origin: Uri) -> Self {
            let inner = tonic::client::Grpc::with_origin(inner, origin);
            Self { inner }
        }
        pub fn with_interceptor<F>(
            inner: T,
            interceptor: F,
        ) -> SpanWriterPluginClient<InterceptedService<T, F>>
        where
            F: tonic::service::Interceptor,
            T::ResponseBody: Default,
            T: tonic::codegen::Service<
                http::Request<tonic::body::Body>,
                Response = http::Response<
                    <T as tonic::client::GrpcService<tonic::body::Body>>::ResponseBody,
                >,
            >,
            <T as tonic::codegen::Service<
                http::Request<tonic::body::Body>,
            >>::Error: Into<StdError> + std::marker::Send + std::marker::Sync,
        {
            SpanWriterPluginClient::new(InterceptedService::new(inner, interceptor))
        }
        /// Compress requests with the given encoding.
        ///
        /// This requires the server to support it otherwise it might respond with an
        /// error.
        #[must_use]
        pub fn send_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.inner = self.inner.send_compressed(encoding);
            self
        }
        /// Enable decompressing responses.
        #[must_use]
        pub fn accept_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.inner = self.inner.accept_compressed(encoding);
            self
        }
        /// Limits the maximum size of a decoded message.
        ///
        /// Default: `4MB`
        #[must_use]
        pub fn max_decoding_message_size(mut self, limit: usize) -> Self {
            self.inner = self.inner.max_decoding_message_size(limit);
            self
        }
        /// Limits the maximum size of an encoded message.
        ///
        /// Default: `usize::MAX`
        #[must_use]
        pub fn max_encoding_message_size(mut self, limit: usize) -> Self {
            self.inner = self.inner.max_encoding_message_size(limit);
            self
        }
        /// spanstore/Writer
        pub async fn write_span(
            &mut self,
            request: impl tonic::IntoRequest<super::WriteSpanRequest>,
        ) -> std::result::Result<
            tonic::Response<super::WriteSpanResponse>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/jaeger.storage.v1.SpanWriterPlugin/WriteSpan",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new("jaeger.storage.v1.SpanWriterPlugin", "WriteSpan"),
                );
            self.inner.unary(req, path, codec).await
        }
        pub async fn close(
            &mut self,
            request: impl tonic::IntoRequest<super::CloseWriterRequest>,
        ) -> std::result::Result<
            tonic::Response<super::CloseWriterResponse>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/jaeger.storage.v1.SpanWriterPlugin/Close",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(GrpcMethod::new("jaeger.storage.v1.SpanWriterPlugin", "Close"));
            self.inner.unary(req, path, codec).await
        }
    }
}
/// Generated server implementations.
pub mod span_writer_plugin_server {
    #![allow(
        unused_variables,
        dead_code,
        missing_docs,
        clippy::wildcard_imports,
        clippy::let_unit_value,
    )]
    use tonic::codegen::*;
    /// Generated trait containing gRPC methods that should be implemented for use with SpanWriterPluginServer.
    #[async_trait]
    pub trait SpanWriterPlugin: std::marker::Send + std::marker::Sync + 'static {
        /// spanstore/Writer
        async fn write_span(
            &self,
            request: tonic::Request<super::WriteSpanRequest>,
        ) -> std::result::Result<
            tonic::Response<super::WriteSpanResponse>,
            tonic::Status,
        >;
        async fn close(
            &self,
            request: tonic::Request<super::CloseWriterRequest>,
        ) -> std::result::Result<
            tonic::Response<super::CloseWriterResponse>,
            tonic::Status,
        >;
    }
    #[derive(Debug)]
    pub struct SpanWriterPluginServer<T> {
        inner: Arc<T>,
        accept_compression_encodings: EnabledCompressionEncodings,
        send_compression_encodings: EnabledCompressionEncodings,
        max_decoding_message_size: Option<usize>,
        max_encoding_message_size: Option<usize>,
    }
    impl<T> SpanWriterPluginServer<T> {
        pub fn new(inner: T) -> Self {
            Self::from_arc(Arc::new(inner))
        }
        pub fn from_arc(inner: Arc<T>) -> Self {
            Self {
                inner,
                accept_compression_encodings: Default::default(),
                send_compression_encodings: Default::default(),
                max_decoding_message_size: None,
                max_encoding_message_size: None,
            }
        }
        pub fn with_interceptor<F>(
            inner: T,
            interceptor: F,
        ) -> InterceptedService<Self, F>
        where
            F: tonic::service::Interceptor,
        {
            InterceptedService::new(Self::new(inner), interceptor)
        }
        /// Enable decompressing requests with the given encoding.
        #[must_use]
        pub fn accept_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.accept_compression_encodings.enable(encoding);
            self
        }
        /// Compress responses with the given encoding, if the client supports it.
        #[must_use]
        pub fn send_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.send_compression_encodings.enable(encoding);
            self
        }
        /// Limits the maximum size of a decoded message.
        ///
        /// Default: `4MB`
        #[must_use]
        pub fn max_decoding_message_size(mut self, limit: usize) -> Self {
            self.max_decoding_message_size = Some(limit);
            self
        }
        /// Limits the maximum size of an encoded message.
        ///
        /// Default: `usize::MAX`
        #[must_use]
        pub fn max_encoding_message_size(mut self, limit: usize) -> Self {
            self.max_encoding_message_size = Some(limit);
            self
        }
    }
    impl<T, B> tonic::codegen::Service<http::Request<B>> for SpanWriterPluginServer<T>
    where
        T: SpanWriterPlugin,
        B: Body + std::marker::Send + 'static,
        B::Error: Into<StdError> + std::marker::Send + 'static,
    {
        type Response = http::Response<tonic::body::Body>;
        type Error = std::convert::Infallible;
        type Future = BoxFuture<Self::Response, Self::Error>;
        fn poll_ready(
            &mut self,
            _cx: &mut Context<'_>,
        ) -> Poll<std::result::Result<(), Self::Error>> {
            Poll::Ready(Ok(()))
        }
        fn call(&mut self, req: http::Request<B>) -> Self::Future {
            match req.uri().path() {
                "/jaeger.storage.v1.SpanWriterPlugin/WriteSpan" => {
                    #[allow(non_camel_case_types)]
                    struct WriteSpanSvc<T: SpanWriterPlugin>(pub Arc<T>);
                    impl<
                        T: SpanWriterPlugin,
                    > tonic::server::UnaryService<super::WriteSpanRequest>
                    for WriteSpanSvc<T> {
                        type Response = super::WriteSpanResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::WriteSpanRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as SpanWriterPlugin>::write_span(&inner, request).await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = WriteSpanSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/jaeger.storage.v1.SpanWriterPlugin/Close" => {
                    #[allow(non_camel_case_types)]
                    struct CloseSvc<T: SpanWriterPlugin>(pub Arc<T>);
                    impl<
                        T: SpanWriterPlugin,
                    > tonic::server::UnaryService<super::CloseWriterRequest>
                    for CloseSvc<T> {
                        type Response = super::CloseWriterResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::CloseWriterRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as SpanWriterPlugin>::close(&inner, request).await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = CloseSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                _ => {
                    Box::pin(async move {
                        let mut response = http::Response::new(
                            tonic::body::Body::default(),
                        );
                        let headers = response.headers_mut();
                        headers
                            .insert(
                                tonic::Status::GRPC_STATUS,
                                (tonic::Code::Unimplemented as i32).into(),
                            );
                        headers
                            .insert(
                                http::header::CONTENT_TYPE,
                                tonic::metadata::GRPC_CONTENT_TYPE,
                            );
                        Ok(response)
                    })
                }
            }
        }
    }
    impl<T> Clone for SpanWriterPluginServer<T> {
        fn clone(&self) -> Self {
            let inner = self.inner.clone();
            Self {
                inner,
                accept_compression_encodings: self.accept_compression_encodings,
                send_compression_encodings: self.send_compression_encodings,
                max_decoding_message_size: self.max_decoding_message_size,
                max_encoding_message_size: self.max_encoding_message_size,
            }
        }
    }
    /// Generated gRPC service name
    pub const SERVICE_NAME: &str = "jaeger.storage.v1.SpanWriterPlugin";
    impl<T> tonic::server::NamedService for SpanWriterPluginServer<T> {
        const NAME: &'static str = SERVICE_NAME;
    }
}
/// Generated client implementations.
pub mod streaming_span_writer_plugin_client {
    #![allow(
        unused_variables,
        dead_code,
        missing_docs,
        clippy::wildcard_imports,
        clippy::let_unit_value,
    )]
    use tonic::codegen::*;
    use tonic::codegen::http::Uri;
    #[derive(Debug, Clone)]
    pub struct StreamingSpanWriterPluginClient<T> {
        inner: tonic::client::Grpc<T>,
    }
    impl StreamingSpanWriterPluginClient<tonic::transport::Channel> {
        /// Attempt to create a new client by connecting to a given endpoint.
        pub async fn connect<D>(dst: D) -> Result<Self, tonic::transport::Error>
        where
            D: TryInto<tonic::transport::Endpoint>,
            D::Error: Into<StdError>,
        {
            let conn = tonic::transport::Endpoint::new(dst)?.connect().await?;
            Ok(Self::new(conn))
        }
    }
    impl<T> StreamingSpanWriterPluginClient<T>
    where
        T: tonic::client::GrpcService<tonic::body::Body>,
        T::Error: Into<StdError>,
        T::ResponseBody: Body<Data = Bytes> + std::marker::Send + 'static,
        <T::ResponseBody as Body>::Error: Into<StdError> + std::marker::Send,
    {
        pub fn new(inner: T) -> Self {
            let inner = tonic::client::Grpc::new(inner);
            Self { inner }
        }
        pub fn with_origin(inner: T, origin: Uri) -> Self {
            let inner = tonic::client::Grpc::with_origin(inner, origin);
            Self { inner }
        }
        pub fn with_interceptor<F>(
            inner: T,
            interceptor: F,
        ) -> StreamingSpanWriterPluginClient<InterceptedService<T, F>>
        where
            F: tonic::service::Interceptor,
            T::ResponseBody: Default,
            T: tonic::codegen::Service<
                http::Request<tonic::body::Body>,
                Response = http::Response<
                    <T as tonic::client::GrpcService<tonic::body::Body>>::ResponseBody,
                >,
            >,
            <T as tonic::codegen::Service<
                http::Request<tonic::body::Body>,
            >>::Error: Into<StdError> + std::marker::Send + std::marker::Sync,
        {
            StreamingSpanWriterPluginClient::new(
                InterceptedService::new(inner, interceptor),
            )
        }
        /// Compress requests with the given encoding.
        ///
        /// This requires the server to support it otherwise it might respond with an
        /// error.
        #[must_use]
        pub fn send_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.inner = self.inner.send_compressed(encoding);
            self
        }
        /// Enable decompressing responses.
        #[must_use]
        pub fn accept_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.inner = self.inner.accept_compressed(encoding);
            self
        }
        /// Limits the maximum size of a decoded message.
        ///
        /// Default: `4MB`
        #[must_use]
        pub fn max_decoding_message_size(mut self, limit: usize) -> Self {
            self.inner = self.inner.max_decoding_message_size(limit);
            self
        }
        /// Limits the maximum size of an encoded message.
        ///
        /// Default: `usize::MAX`
        #[must_use]
        pub fn max_encoding_message_size(mut self, limit: usize) -> Self {
            self.inner = self.inner.max_encoding_message_size(limit);
            self
        }
        pub async fn write_span_stream(
            &mut self,
            request: impl tonic::IntoStreamingRequest<Message = super::WriteSpanRequest>,
        ) -> std::result::Result<
            tonic::Response<super::WriteSpanResponse>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/jaeger.storage.v1.StreamingSpanWriterPlugin/WriteSpanStream",
            );
            let mut req = request.into_streaming_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new(
                        "jaeger.storage.v1.StreamingSpanWriterPlugin",
                        "WriteSpanStream",
                    ),
                );
            self.inner.client_streaming(req, path, codec).await
        }
    }
}
/// Generated server implementations.
pub mod streaming_span_writer_plugin_server {
    #![allow(
        unused_variables,
        dead_code,
        missing_docs,
        clippy::wildcard_imports,
        clippy::let_unit_value,
    )]
    use tonic::codegen::*;
    /// Generated trait containing gRPC methods that should be implemented for use with StreamingSpanWriterPluginServer.
    #[async_trait]
    pub trait StreamingSpanWriterPlugin: std::marker::Send + std::marker::Sync + 'static {
        async fn write_span_stream(
            &self,
            request: tonic::Request<tonic::Streaming<super::WriteSpanRequest>>,
        ) -> std::result::Result<
            tonic::Response<super::WriteSpanResponse>,
            tonic::Status,
        >;
    }
    #[derive(Debug)]
    pub struct StreamingSpanWriterPluginServer<T> {
        inner: Arc<T>,
        accept_compression_encodings: EnabledCompressionEncodings,
        send_compression_encodings: EnabledCompressionEncodings,
        max_decoding_message_size: Option<usize>,
        max_encoding_message_size: Option<usize>,
    }
    impl<T> StreamingSpanWriterPluginServer<T> {
        pub fn new(inner: T) -> Self {
            Self::from_arc(Arc::new(inner))
        }
        pub fn from_arc(inner: Arc<T>) -> Self {
            Self {
                inner,
                accept_compression_encodings: Default::default(),
                send_compression_encodings: Default::default(),
                max_decoding_message_size: None,
                max_encoding_message_size: None,
            }
        }
        pub fn with_interceptor<F>(
            inner: T,
            interceptor: F,
        ) -> InterceptedService<Self, F>
        where
            F: tonic::service::Interceptor,
        {
            InterceptedService::new(Self::new(inner), interceptor)
        }
        /// Enable decompressing requests with the given encoding.
        #[must_use]
        pub fn accept_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.accept_compression_encodings.enable(encoding);
            self
        }
        /// Compress responses with the given encoding, if the client supports it.
        #[must_use]
        pub fn send_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.send_compression_encodings.enable(encoding);
            self
        }
        /// Limits the maximum size of a decoded message.
        ///
        /// Default: `4MB`
        #[must_use]
        pub fn max_decoding_message_size(mut self, limit: usize) -> Self {
            self.max_decoding_message_size = Some(limit);
            self
        }
        /// Limits the maximum size of an encoded message.
        ///
        /// Default: `usize::MAX`
        #[must_use]
        pub fn max_encoding_message_size(mut self, limit: usize) -> Self {
            self.max_encoding_message_size = Some(limit);
            self
        }
    }
    impl<T, B> tonic::codegen::Service<http::Request<B>>
    for StreamingSpanWriterPluginServer<T>
    where
        T: StreamingSpanWriterPlugin,
        B: Body + std::marker::Send + 'static,
        B::Error: Into<StdError> + std::marker::Send + 'static,
    {
        type Response = http::Response<tonic::body::Body>;
        type Error = std::convert::Infallible;
        type Future = BoxFuture<Self::Response, Self::Error>;
        fn poll_ready(
            &mut self,
            _cx: &mut Context<'_>,
        ) -> Poll<std::result::Result<(), Self::Error>> {
            Poll::Ready(Ok(()))
        }
        fn call(&mut self, req: http::Request<B>) -> Self::Future {
            match req.uri().path() {
                "/jaeger.storage.v1.StreamingSpanWriterPlugin/WriteSpanStream" => {
                    #[allow(non_camel_case_types)]
                    struct WriteSpanStreamSvc<T: StreamingSpanWriterPlugin>(pub Arc<T>);
                    impl<
                        T: StreamingSpanWriterPlugin,
                    > tonic::server::ClientStreamingService<super::WriteSpanRequest>
                    for WriteSpanStreamSvc<T> {
                        type Response = super::WriteSpanResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<
                                tonic::Streaming<super::WriteSpanRequest>,
                            >,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as StreamingSpanWriterPlugin>::write_span_stream(
                                        &inner,
                                        request,
                                    )
                                    .await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = WriteSpanStreamSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.client_streaming(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                _ => {
                    Box::pin(async move {
                        let mut response = http::Response::new(
                            tonic::body::Body::default(),
                        );
                        let headers = response.headers_mut();
                        headers
                            .insert(
                                tonic::Status::GRPC_STATUS,
                                (tonic::Code::Unimplemented as i32).into(),
                            );
                        headers
                            .insert(
                                http::header::CONTENT_TYPE,
                                tonic::metadata::GRPC_CONTENT_TYPE,
                            );
                        Ok(response)
                    })
                }
            }
        }
    }
    impl<T> Clone for StreamingSpanWriterPluginServer<T> {
        fn clone(&self) -> Self {
            let inner = self.inner.clone();
            Self {
                inner,
                accept_compression_encodings: self.accept_compression_encodings,
                send_compression_encodings: self.send_compression_encodings,
                max_decoding_message_size: self.max_decoding_message_size,
                max_encoding_message_size: self.max_encoding_message_size,
            }
        }
    }
    /// Generated gRPC service name
    pub const SERVICE_NAME: &str = "jaeger.storage.v1.StreamingSpanWriterPlugin";
    impl<T> tonic::server::NamedService for StreamingSpanWriterPluginServer<T> {
        const NAME: &'static str = SERVICE_NAME;
    }
}
/// Generated client implementations.
pub mod span_reader_plugin_client {
    #![allow(
        unused_variables,
        dead_code,
        missing_docs,
        clippy::wildcard_imports,
        clippy::let_unit_value,
    )]
    use tonic::codegen::*;
    use tonic::codegen::http::Uri;
    #[derive(Debug, Clone)]
    pub struct SpanReaderPluginClient<T> {
        inner: tonic::client::Grpc<T>,
    }
    impl SpanReaderPluginClient<tonic::transport::Channel> {
        /// Attempt to create a new client by connecting to a given endpoint.
        pub async fn connect<D>(dst: D) -> Result<Self, tonic::transport::Error>
        where
            D: TryInto<tonic::transport::Endpoint>,
            D::Error: Into<StdError>,
        {
            let conn = tonic::transport::Endpoint::new(dst)?.connect().await?;
            Ok(Self::new(conn))
        }
    }
    impl<T> SpanReaderPluginClient<T>
    where
        T: tonic::client::GrpcService<tonic::body::Body>,
        T::Error: Into<StdError>,
        T::ResponseBody: Body<Data = Bytes> + std::marker::Send + 'static,
        <T::ResponseBody as Body>::Error: Into<StdError> + std::marker::Send,
    {
        pub fn new(inner: T) -> Self {
            let inner = tonic::client::Grpc::new(inner);
            Self { inner }
        }
        pub fn with_origin(inner: T, origin: Uri) -> Self {
            let inner = tonic::client::Grpc::with_origin(inner, origin);
            Self { inner }
        }
        pub fn with_interceptor<F>(
            inner: T,
            interceptor: F,
        ) -> SpanReaderPluginClient<InterceptedService<T, F>>
        where
            F: tonic::service::Interceptor,
            T::ResponseBody: Default,
            T: tonic::codegen::Service<
                http::Request<tonic::body::Body>,
                Response = http::Response<
                    <T as tonic::client::GrpcService<tonic::body::Body>>::ResponseBody,
                >,
            >,
            <T as tonic::codegen::Service<
                http::Request<tonic::body::Body>,
            >>::Error: Into<StdError> + std::marker::Send + std::marker::Sync,
        {
            SpanReaderPluginClient::new(InterceptedService::new(inner, interceptor))
        }
        /// Compress requests with the given encoding.
        ///
        /// This requires the server to support it otherwise it might respond with an
        /// error.
        #[must_use]
        pub fn send_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.inner = self.inner.send_compressed(encoding);
            self
        }
        /// Enable decompressing responses.
        #[must_use]
        pub fn accept_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.inner = self.inner.accept_compressed(encoding);
            self
        }
        /// Limits the maximum size of a decoded message.
        ///
        /// Default: `4MB`
        #[must_use]
        pub fn max_decoding_message_size(mut self, limit: usize) -> Self {
            self.inner = self.inner.max_decoding_message_size(limit);
            self
        }
        /// Limits the maximum size of an encoded message.
        ///
        /// Default: `usize::MAX`
        #[must_use]
        pub fn max_encoding_message_size(mut self, limit: usize) -> Self {
            self.inner = self.inner.max_encoding_message_size(limit);
            self
        }
        /// spanstore/Reader
        pub async fn get_trace(
            &mut self,
            request: impl tonic::IntoRequest<super::GetTraceRequest>,
        ) -> std::result::Result<
            tonic::Response<tonic::codec::Streaming<super::SpansResponseChunk>>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/jaeger.storage.v1.SpanReaderPlugin/GetTrace",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new("jaeger.storage.v1.SpanReaderPlugin", "GetTrace"),
                );
            self.inner.server_streaming(req, path, codec).await
        }
        pub async fn get_services(
            &mut self,
            request: impl tonic::IntoRequest<super::GetServicesRequest>,
        ) -> std::result::Result<
            tonic::Response<super::GetServicesResponse>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/jaeger.storage.v1.SpanReaderPlugin/GetServices",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new("jaeger.storage.v1.SpanReaderPlugin", "GetServices"),
                );
            self.inner.unary(req, path, codec).await
        }
        pub async fn get_operations(
            &mut self,
            request: impl tonic::IntoRequest<super::GetOperationsRequest>,
        ) -> std::result::Result<
            tonic::Response<super::GetOperationsResponse>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/jaeger.storage.v1.SpanReaderPlugin/GetOperations",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new(
                        "jaeger.storage.v1.SpanReaderPlugin",
                        "GetOperations",
                    ),
                );
            self.inner.unary(req, path, codec).await
        }
        pub async fn find_traces(
            &mut self,
            request: impl tonic::IntoRequest<super::FindTracesRequest>,
        ) -> std::result::Result<
            tonic::Response<tonic::codec::Streaming<super::SpansResponseChunk>>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/jaeger.storage.v1.SpanReaderPlugin/FindTraces",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new("jaeger.storage.v1.SpanReaderPlugin", "FindTraces"),
                );
            self.inner.server_streaming(req, path, codec).await
        }
        pub async fn find_trace_i_ds(
            &mut self,
            request: impl tonic::IntoRequest<super::FindTraceIDsRequest>,
        ) -> std::result::Result<
            tonic::Response<super::FindTraceIDsResponse>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/jaeger.storage.v1.SpanReaderPlugin/FindTraceIDs",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new("jaeger.storage.v1.SpanReaderPlugin", "FindTraceIDs"),
                );
            self.inner.unary(req, path, codec).await
        }
    }
}
/// Generated server implementations.
pub mod span_reader_plugin_server {
    #![allow(
        unused_variables,
        dead_code,
        missing_docs,
        clippy::wildcard_imports,
        clippy::let_unit_value,
    )]
    use tonic::codegen::*;
    /// Generated trait containing gRPC methods that should be implemented for use with SpanReaderPluginServer.
    #[async_trait]
    pub trait SpanReaderPlugin: std::marker::Send + std::marker::Sync + 'static {
        /// Server streaming response type for the GetTrace method.
        type GetTraceStream: tonic::codegen::tokio_stream::Stream<
                Item = std::result::Result<super::SpansResponseChunk, tonic::Status>,
            >
            + std::marker::Send
            + 'static;
        /// spanstore/Reader
        async fn get_trace(
            &self,
            request: tonic::Request<super::GetTraceRequest>,
        ) -> std::result::Result<tonic::Response<Self::GetTraceStream>, tonic::Status>;
        async fn get_services(
            &self,
            request: tonic::Request<super::GetServicesRequest>,
        ) -> std::result::Result<
            tonic::Response<super::GetServicesResponse>,
            tonic::Status,
        >;
        async fn get_operations(
            &self,
            request: tonic::Request<super::GetOperationsRequest>,
        ) -> std::result::Result<
            tonic::Response<super::GetOperationsResponse>,
            tonic::Status,
        >;
        /// Server streaming response type for the FindTraces method.
        type FindTracesStream: tonic::codegen::tokio_stream::Stream<
                Item = std::result::Result<super::SpansResponseChunk, tonic::Status>,
            >
            + std::marker::Send
            + 'static;
        async fn find_traces(
            &self,
            request: tonic::Request<super::FindTracesRequest>,
        ) -> std::result::Result<tonic::Response<Self::FindTracesStream>, tonic::Status>;
        async fn find_trace_i_ds(
            &self,
            request: tonic::Request<super::FindTraceIDsRequest>,
        ) -> std::result::Result<
            tonic::Response<super::FindTraceIDsResponse>,
            tonic::Status,
        >;
    }
    #[derive(Debug)]
    pub struct SpanReaderPluginServer<T> {
        inner: Arc<T>,
        accept_compression_encodings: EnabledCompressionEncodings,
        send_compression_encodings: EnabledCompressionEncodings,
        max_decoding_message_size: Option<usize>,
        max_encoding_message_size: Option<usize>,
    }
    impl<T> SpanReaderPluginServer<T> {
        pub fn new(inner: T) -> Self {
            Self::from_arc(Arc::new(inner))
        }
        pub fn from_arc(inner: Arc<T>) -> Self {
            Self {
                inner,
                accept_compression_encodings: Default::default(),
                send_compression_encodings: Default::default(),
                max_decoding_message_size: None,
                max_encoding_message_size: None,
            }
        }
        pub fn with_interceptor<F>(
            inner: T,
            interceptor: F,
        ) -> InterceptedService<Self, F>
        where
            F: tonic::service::Interceptor,
        {
            InterceptedService::new(Self::new(inner), interceptor)
        }
        /// Enable decompressing requests with the given encoding.
        #[must_use]
        pub fn accept_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.accept_compression_encodings.enable(encoding);
            self
        }
        /// Compress responses with the given encoding, if the client supports it.
        #[must_use]
        pub fn send_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.send_compression_encodings.enable(encoding);
            self
        }
        /// Limits the maximum size of a decoded message.
        ///
        /// Default: `4MB`
        #[must_use]
        pub fn max_decoding_message_size(mut self, limit: usize) -> Self {
            self.max_decoding_message_size = Some(limit);
            self
        }
        /// Limits the maximum size of an encoded message.
        ///
        /// Default: `usize::MAX`
        #[must_use]
        pub fn max_encoding_message_size(mut self, limit: usize) -> Self {
            self.max_encoding_message_size = Some(limit);
            self
        }
    }
    impl<T, B> tonic::codegen::Service<http::Request<B>> for SpanReaderPluginServer<T>
    where
        T: SpanReaderPlugin,
        B: Body + std::marker::Send + 'static,
        B::Error: Into<StdError> + std::marker::Send + 'static,
    {
        type Response = http::Response<tonic::body::Body>;
        type Error = std::convert::Infallible;
        type Future = BoxFuture<Self::Response, Self::Error>;
        fn poll_ready(
            &mut self,
            _cx: &mut Context<'_>,
        ) -> Poll<std::result::Result<(), Self::Error>> {
            Poll::Ready(Ok(()))
        }
        fn call(&mut self, req: http::Request<B>) -> Self::Future {
            match req.uri().path() {
                "/jaeger.storage.v1.SpanReaderPlugin/GetTrace" => {
                    #[allow(non_camel_case_types)]
                    struct GetTraceSvc<T: SpanReaderPlugin>(pub Arc<T>);
                    impl<
                        T: SpanReaderPlugin,
                    > tonic::server::ServerStreamingService<super::GetTraceRequest>
                    for GetTraceSvc<T> {
                        type Response = super::SpansResponseChunk;
                        type ResponseStream = T::GetTraceStream;
                        type Future = BoxFuture<
                            tonic::Response<Self::ResponseStream>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::GetTraceRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as SpanReaderPlugin>::get_trace(&inner, request).await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = GetTraceSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.server_streaming(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/jaeger.storage.v1.SpanReaderPlugin/GetServices" => {
                    #[allow(non_camel_case_types)]
                    struct GetServicesSvc<T: SpanReaderPlugin>(pub Arc<T>);
                    impl<
                        T: SpanReaderPlugin,
                    > tonic::server::UnaryService<super::GetServicesRequest>
                    for GetServicesSvc<T> {
                        type Response = super::GetServicesResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::GetServicesRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as SpanReaderPlugin>::get_services(&inner, request).await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = GetServicesSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/jaeger.storage.v1.SpanReaderPlugin/GetOperations" => {
                    #[allow(non_camel_case_types)]
                    struct GetOperationsSvc<T: SpanReaderPlugin>(pub Arc<T>);
                    impl<
                        T: SpanReaderPlugin,
                    > tonic::server::UnaryService<super::GetOperationsRequest>
                    for GetOperationsSvc<T> {
                        type Response = super::GetOperationsResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::GetOperationsRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as SpanReaderPlugin>::get_operations(&inner, request)
                                    .await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = GetOperationsSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/jaeger.storage.v1.SpanReaderPlugin/FindTraces" => {
                    #[allow(non_camel_case_types)]
                    struct FindTracesSvc<T: SpanReaderPlugin>(pub Arc<T>);
                    impl<
                        T: SpanReaderPlugin,
                    > tonic::server::ServerStreamingService<super::FindTracesRequest>
                    for FindTracesSvc<T> {
                        type Response = super::SpansResponseChunk;
                        type ResponseStream = T::FindTracesStream;
                        type Future = BoxFuture<
                            tonic::Response<Self::ResponseStream>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::FindTracesRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as SpanReaderPlugin>::find_traces(&inner, request).await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = FindTracesSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.server_streaming(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/jaeger.storage.v1.SpanReaderPlugin/FindTraceIDs" => {
                    #[allow(non_camel_case_types)]
                    struct FindTraceIDsSvc<T: SpanReaderPlugin>(pub Arc<T>);
                    impl<
                        T: SpanReaderPlugin,
                    > tonic::server::UnaryService<super::FindTraceIDsRequest>
                    for FindTraceIDsSvc<T> {
                        type Response = super::FindTraceIDsResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::FindTraceIDsRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as SpanReaderPlugin>::find_trace_i_ds(&inner, request)
                                    .await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = FindTraceIDsSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                _ => {
                    Box::pin(async move {
                        let mut response = http::Response::new(
                            tonic::body::Body::default(),
                        );
                        let headers = response.headers_mut();
                        headers
                            .insert(
                                tonic::Status::GRPC_STATUS,
                                (tonic::Code::Unimplemented as i32).into(),
                            );
                        headers
                            .insert(
                                http::header::CONTENT_TYPE,
                                tonic::metadata::GRPC_CONTENT_TYPE,
                            );
                        Ok(response)
                    })
                }
            }
        }
    }
    impl<T> Clone for SpanReaderPluginServer<T> {
        fn clone(&self) -> Self {
            let inner = self.inner.clone();
            Self {
                inner,
                accept_compression_encodings: self.accept_compression_encodings,
                send_compression_encodings: self.send_compression_encodings,
                max_decoding_message_size: self.max_decoding_message_size,
                max_encoding_message_size: self.max_encoding_message_size,
            }
        }
    }
    /// Generated gRPC service name
    pub const SERVICE_NAME: &str = "jaeger.storage.v1.SpanReaderPlugin";
    impl<T> tonic::server::NamedService for SpanReaderPluginServer<T> {
        const NAME: &'static str = SERVICE_NAME;
    }
}
/// Generated client implementations.
pub mod archive_span_writer_plugin_client {
    #![allow(
        unused_variables,
        dead_code,
        missing_docs,
        clippy::wildcard_imports,
        clippy::let_unit_value,
    )]
    use tonic::codegen::*;
    use tonic::codegen::http::Uri;
    #[derive(Debug, Clone)]
    pub struct ArchiveSpanWriterPluginClient<T> {
        inner: tonic::client::Grpc<T>,
    }
    impl ArchiveSpanWriterPluginClient<tonic::transport::Channel> {
        /// Attempt to create a new client by connecting to a given endpoint.
        pub async fn connect<D>(dst: D) -> Result<Self, tonic::transport::Error>
        where
            D: TryInto<tonic::transport::Endpoint>,
            D::Error: Into<StdError>,
        {
            let conn = tonic::transport::Endpoint::new(dst)?.connect().await?;
            Ok(Self::new(conn))
        }
    }
    impl<T> ArchiveSpanWriterPluginClient<T>
    where
        T: tonic::client::GrpcService<tonic::body::Body>,
        T::Error: Into<StdError>,
        T::ResponseBody: Body<Data = Bytes> + std::marker::Send + 'static,
        <T::ResponseBody as Body>::Error: Into<StdError> + std::marker::Send,
    {
        pub fn new(inner: T) -> Self {
            let inner = tonic::client::Grpc::new(inner);
            Self { inner }
        }
        pub fn with_origin(inner: T, origin: Uri) -> Self {
            let inner = tonic::client::Grpc::with_origin(inner, origin);
            Self { inner }
        }
        pub fn with_interceptor<F>(
            inner: T,
            interceptor: F,
        ) -> ArchiveSpanWriterPluginClient<InterceptedService<T, F>>
        where
            F: tonic::service::Interceptor,
            T::ResponseBody: Default,
            T: tonic::codegen::Service<
                http::Request<tonic::body::Body>,
                Response = http::Response<
                    <T as tonic::client::GrpcService<tonic::body::Body>>::ResponseBody,
                >,
            >,
            <T as tonic::codegen::Service<
                http::Request<tonic::body::Body>,
            >>::Error: Into<StdError> + std::marker::Send + std::marker::Sync,
        {
            ArchiveSpanWriterPluginClient::new(
                InterceptedService::new(inner, interceptor),
            )
        }
        /// Compress requests with the given encoding.
        ///
        /// This requires the server to support it otherwise it might respond with an
        /// error.
        #[must_use]
        pub fn send_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.inner = self.inner.send_compressed(encoding);
            self
        }
        /// Enable decompressing responses.
        #[must_use]
        pub fn accept_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.inner = self.inner.accept_compressed(encoding);
            self
        }
        /// Limits the maximum size of a decoded message.
        ///
        /// Default: `4MB`
        #[must_use]
        pub fn max_decoding_message_size(mut self, limit: usize) -> Self {
            self.inner = self.inner.max_decoding_message_size(limit);
            self
        }
        /// Limits the maximum size of an encoded message.
        ///
        /// Default: `usize::MAX`
        #[must_use]
        pub fn max_encoding_message_size(mut self, limit: usize) -> Self {
            self.inner = self.inner.max_encoding_message_size(limit);
            self
        }
        /// spanstore/Writer
        pub async fn write_archive_span(
            &mut self,
            request: impl tonic::IntoRequest<super::WriteSpanRequest>,
        ) -> std::result::Result<
            tonic::Response<super::WriteSpanResponse>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/jaeger.storage.v1.ArchiveSpanWriterPlugin/WriteArchiveSpan",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new(
                        "jaeger.storage.v1.ArchiveSpanWriterPlugin",
                        "WriteArchiveSpan",
                    ),
                );
            self.inner.unary(req, path, codec).await
        }
    }
}
/// Generated server implementations.
pub mod archive_span_writer_plugin_server {
    #![allow(
        unused_variables,
        dead_code,
        missing_docs,
        clippy::wildcard_imports,
        clippy::let_unit_value,
    )]
    use tonic::codegen::*;
    /// Generated trait containing gRPC methods that should be implemented for use with ArchiveSpanWriterPluginServer.
    #[async_trait]
    pub trait ArchiveSpanWriterPlugin: std::marker::Send + std::marker::Sync + 'static {
        /// spanstore/Writer
        async fn write_archive_span(
            &self,
            request: tonic::Request<super::WriteSpanRequest>,
        ) -> std::result::Result<
            tonic::Response<super::WriteSpanResponse>,
            tonic::Status,
        >;
    }
    #[derive(Debug)]
    pub struct ArchiveSpanWriterPluginServer<T> {
        inner: Arc<T>,
        accept_compression_encodings: EnabledCompressionEncodings,
        send_compression_encodings: EnabledCompressionEncodings,
        max_decoding_message_size: Option<usize>,
        max_encoding_message_size: Option<usize>,
    }
    impl<T> ArchiveSpanWriterPluginServer<T> {
        pub fn new(inner: T) -> Self {
            Self::from_arc(Arc::new(inner))
        }
        pub fn from_arc(inner: Arc<T>) -> Self {
            Self {
                inner,
                accept_compression_encodings: Default::default(),
                send_compression_encodings: Default::default(),
                max_decoding_message_size: None,
                max_encoding_message_size: None,
            }
        }
        pub fn with_interceptor<F>(
            inner: T,
            interceptor: F,
        ) -> InterceptedService<Self, F>
        where
            F: tonic::service::Interceptor,
        {
            InterceptedService::new(Self::new(inner), interceptor)
        }
        /// Enable decompressing requests with the given encoding.
        #[must_use]
        pub fn accept_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.accept_compression_encodings.enable(encoding);
            self
        }
        /// Compress responses with the given encoding, if the client supports it.
        #[must_use]
        pub fn send_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.send_compression_encodings.enable(encoding);
            self
        }
        /// Limits the maximum size of a decoded message.
        ///
        /// Default: `4MB`
        #[must_use]
        pub fn max_decoding_message_size(mut self, limit: usize) -> Self {
            self.max_decoding_message_size = Some(limit);
            self
        }
        /// Limits the maximum size of an encoded message.
        ///
        /// Default: `usize::MAX`
        #[must_use]
        pub fn max_encoding_message_size(mut self, limit: usize) -> Self {
            self.max_encoding_message_size = Some(limit);
            self
        }
    }
    impl<T, B> tonic::codegen::Service<http::Request<B>>
    for ArchiveSpanWriterPluginServer<T>
    where
        T: ArchiveSpanWriterPlugin,
        B: Body + std::marker::Send + 'static,
        B::Error: Into<StdError> + std::marker::Send + 'static,
    {
        type Response = http::Response<tonic::body::Body>;
        type Error = std::convert::Infallible;
        type Future = BoxFuture<Self::Response, Self::Error>;
        fn poll_ready(
            &mut self,
            _cx: &mut Context<'_>,
        ) -> Poll<std::result::Result<(), Self::Error>> {
            Poll::Ready(Ok(()))
        }
        fn call(&mut self, req: http::Request<B>) -> Self::Future {
            match req.uri().path() {
                "/jaeger.storage.v1.ArchiveSpanWriterPlugin/WriteArchiveSpan" => {
                    #[allow(non_camel_case_types)]
                    struct WriteArchiveSpanSvc<T: ArchiveSpanWriterPlugin>(pub Arc<T>);
                    impl<
                        T: ArchiveSpanWriterPlugin,
                    > tonic::server::UnaryService<super::WriteSpanRequest>
                    for WriteArchiveSpanSvc<T> {
                        type Response = super::WriteSpanResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::WriteSpanRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as ArchiveSpanWriterPlugin>::write_archive_span(
                                        &inner,
                                        request,
                                    )
                                    .await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = WriteArchiveSpanSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                _ => {
                    Box::pin(async move {
                        let mut response = http::Response::new(
                            tonic::body::Body::default(),
                        );
                        let headers = response.headers_mut();
                        headers
                            .insert(
                                tonic::Status::GRPC_STATUS,
                                (tonic::Code::Unimplemented as i32).into(),
                            );
                        headers
                            .insert(
                                http::header::CONTENT_TYPE,
                                tonic::metadata::GRPC_CONTENT_TYPE,
                            );
                        Ok(response)
                    })
                }
            }
        }
    }
    impl<T> Clone for ArchiveSpanWriterPluginServer<T> {
        fn clone(&self) -> Self {
            let inner = self.inner.clone();
            Self {
                inner,
                accept_compression_encodings: self.accept_compression_encodings,
                send_compression_encodings: self.send_compression_encodings,
                max_decoding_message_size: self.max_decoding_message_size,
                max_encoding_message_size: self.max_encoding_message_size,
            }
        }
    }
    /// Generated gRPC service name
    pub const SERVICE_NAME: &str = "jaeger.storage.v1.ArchiveSpanWriterPlugin";
    impl<T> tonic::server::NamedService for ArchiveSpanWriterPluginServer<T> {
        const NAME: &'static str = SERVICE_NAME;
    }
}
/// Generated client implementations.
pub mod archive_span_reader_plugin_client {
    #![allow(
        unused_variables,
        dead_code,
        missing_docs,
        clippy::wildcard_imports,
        clippy::let_unit_value,
    )]
    use tonic::codegen::*;
    use tonic::codegen::http::Uri;
    #[derive(Debug, Clone)]
    pub struct ArchiveSpanReaderPluginClient<T> {
        inner: tonic::client::Grpc<T>,
    }
    impl ArchiveSpanReaderPluginClient<tonic::transport::Channel> {
        /// Attempt to create a new client by connecting to a given endpoint.
        pub async fn connect<D>(dst: D) -> Result<Self, tonic::transport::Error>
        where
            D: TryInto<tonic::transport::Endpoint>,
            D::Error: Into<StdError>,
        {
            let conn = tonic::transport::Endpoint::new(dst)?.connect().await?;
            Ok(Self::new(conn))
        }
    }
    impl<T> ArchiveSpanReaderPluginClient<T>
    where
        T: tonic::client::GrpcService<tonic::body::Body>,
        T::Error: Into<StdError>,
        T::ResponseBody: Body<Data = Bytes> + std::marker::Send + 'static,
        <T::ResponseBody as Body>::Error: Into<StdError> + std::marker::Send,
    {
        pub fn new(inner: T) -> Self {
            let inner = tonic::client::Grpc::new(inner);
            Self { inner }
        }
        pub fn with_origin(inner: T, origin: Uri) -> Self {
            let inner = tonic::client::Grpc::with_origin(inner, origin);
            Self { inner }
        }
        pub fn with_interceptor<F>(
            inner: T,
            interceptor: F,
        ) -> ArchiveSpanReaderPluginClient<InterceptedService<T, F>>
        where
            F: tonic::service::Interceptor,
            T::ResponseBody: Default,
            T: tonic::codegen::Service<
                http::Request<tonic::body::Body>,
                Response = http::Response<
                    <T as tonic::client::GrpcService<tonic::body::Body>>::ResponseBody,
                >,
            >,
            <T as tonic::codegen::Service<
                http::Request<tonic::body::Body>,
            >>::Error: Into<StdError> + std::marker::Send + std::marker::Sync,
        {
            ArchiveSpanReaderPluginClient::new(
                InterceptedService::new(inner, interceptor),
            )
        }
        /// Compress requests with the given encoding.
        ///
        /// This requires the server to support it otherwise it might respond with an
        /// error.
        #[must_use]
        pub fn send_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.inner = self.inner.send_compressed(encoding);
            self
        }
        /// Enable decompressing responses.
        #[must_use]
        pub fn accept_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.inner = self.inner.accept_compressed(encoding);
            self
        }
        /// Limits the maximum size of a decoded message.
        ///
        /// Default: `4MB`
        #[must_use]
        pub fn max_decoding_message_size(mut self, limit: usize) -> Self {
            self.inner = self.inner.max_decoding_message_size(limit);
            self
        }
        /// Limits the maximum size of an encoded message.
        ///
        /// Default: `usize::MAX`
        #[must_use]
        pub fn max_encoding_message_size(mut self, limit: usize) -> Self {
            self.inner = self.inner.max_encoding_message_size(limit);
            self
        }
        /// spanstore/Reader
        pub async fn get_archive_trace(
            &mut self,
            request: impl tonic::IntoRequest<super::GetTraceRequest>,
        ) -> std::result::Result<
            tonic::Response<tonic::codec::Streaming<super::SpansResponseChunk>>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/jaeger.storage.v1.ArchiveSpanReaderPlugin/GetArchiveTrace",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new(
                        "jaeger.storage.v1.ArchiveSpanReaderPlugin",
                        "GetArchiveTrace",
                    ),
                );
            self.inner.server_streaming(req, path, codec).await
        }
    }
}
/// Generated server implementations.
pub mod archive_span_reader_plugin_server {
    #![allow(
        unused_variables,
        dead_code,
        missing_docs,
        clippy::wildcard_imports,
        clippy::let_unit_value,
    )]
    use tonic::codegen::*;
    /// Generated trait containing gRPC methods that should be implemented for use with ArchiveSpanReaderPluginServer.
    #[async_trait]
    pub trait ArchiveSpanReaderPlugin: std::marker::Send + std::marker::Sync + 'static {
        /// Server streaming response type for the GetArchiveTrace method.
        type GetArchiveTraceStream: tonic::codegen::tokio_stream::Stream<
                Item = std::result::Result<super::SpansResponseChunk, tonic::Status>,
            >
            + std::marker::Send
            + 'static;
        /// spanstore/Reader
        async fn get_archive_trace(
            &self,
            request: tonic::Request<super::GetTraceRequest>,
        ) -> std::result::Result<
            tonic::Response<Self::GetArchiveTraceStream>,
            tonic::Status,
        >;
    }
    #[derive(Debug)]
    pub struct ArchiveSpanReaderPluginServer<T> {
        inner: Arc<T>,
        accept_compression_encodings: EnabledCompressionEncodings,
        send_compression_encodings: EnabledCompressionEncodings,
        max_decoding_message_size: Option<usize>,
        max_encoding_message_size: Option<usize>,
    }
    impl<T> ArchiveSpanReaderPluginServer<T> {
        pub fn new(inner: T) -> Self {
            Self::from_arc(Arc::new(inner))
        }
        pub fn from_arc(inner: Arc<T>) -> Self {
            Self {
                inner,
                accept_compression_encodings: Default::default(),
                send_compression_encodings: Default::default(),
                max_decoding_message_size: None,
                max_encoding_message_size: None,
            }
        }
        pub fn with_interceptor<F>(
            inner: T,
            interceptor: F,
        ) -> InterceptedService<Self, F>
        where
            F: tonic::service::Interceptor,
        {
            InterceptedService::new(Self::new(inner), interceptor)
        }
        /// Enable decompressing requests with the given encoding.
        #[must_use]
        pub fn accept_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.accept_compression_encodings.enable(encoding);
            self
        }
        /// Compress responses with the given encoding, if the client supports it.
        #[must_use]
        pub fn send_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.send_compression_encodings.enable(encoding);
            self
        }
        /// Limits the maximum size of a decoded message.
        ///
        /// Default: `4MB`
        #[must_use]
        pub fn max_decoding_message_size(mut self, limit: usize) -> Self {
            self.max_decoding_message_size = Some(limit);
            self
        }
        /// Limits the maximum size of an encoded message.
        ///
        /// Default: `usize::MAX`
        #[must_use]
        pub fn max_encoding_message_size(mut self, limit: usize) -> Self {
            self.max_encoding_message_size = Some(limit);
            self
        }
    }
    impl<T, B> tonic::codegen::Service<http::Request<B>>
    for ArchiveSpanReaderPluginServer<T>
    where
        T: ArchiveSpanReaderPlugin,
        B: Body + std::marker::Send + 'static,
        B::Error: Into<StdError> + std::marker::Send + 'static,
    {
        type Response = http::Response<tonic::body::Body>;
        type Error = std::convert::Infallible;
        type Future = BoxFuture<Self::Response, Self::Error>;
        fn poll_ready(
            &mut self,
            _cx: &mut Context<'_>,
        ) -> Poll<std::result::Result<(), Self::Error>> {
            Poll::Ready(Ok(()))
        }
        fn call(&mut self, req: http::Request<B>) -> Self::Future {
            match req.uri().path() {
                "/jaeger.storage.v1.ArchiveSpanReaderPlugin/GetArchiveTrace" => {
                    #[allow(non_camel_case_types)]
                    struct GetArchiveTraceSvc<T: ArchiveSpanReaderPlugin>(pub Arc<T>);
                    impl<
                        T: ArchiveSpanReaderPlugin,
                    > tonic::server::ServerStreamingService<super::GetTraceRequest>
                    for GetArchiveTraceSvc<T> {
                        type Response = super::SpansResponseChunk;
                        type ResponseStream = T::GetArchiveTraceStream;
                        type Future = BoxFuture<
                            tonic::Response<Self::ResponseStream>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::GetTraceRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as ArchiveSpanReaderPlugin>::get_archive_trace(
                                        &inner,
                                        request,
                                    )
                                    .await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = GetArchiveTraceSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.server_streaming(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                _ => {
                    Box::pin(async move {
                        let mut response = http::Response::new(
                            tonic::body::Body::default(),
                        );
                        let headers = response.headers_mut();
                        headers
                            .insert(
                                tonic::Status::GRPC_STATUS,
                                (tonic::Code::Unimplemented as i32).into(),
                            );
                        headers
                            .insert(
                                http::header::CONTENT_TYPE,
                                tonic::metadata::GRPC_CONTENT_TYPE,
                            );
                        Ok(response)
                    })
                }
            }
        }
    }
    impl<T> Clone for ArchiveSpanReaderPluginServer<T> {
        fn clone(&self) -> Self {
            let inner = self.inner.clone();
            Self {
                inner,
                accept_compression_encodings: self.accept_compression_encodings,
                send_compression_encodings: self.send_compression_encodings,
                max_decoding_message_size: self.max_decoding_message_size,
                max_encoding_message_size: self.max_encoding_message_size,
            }
        }
    }
    /// Generated gRPC service name
    pub const SERVICE_NAME: &str = "jaeger.storage.v1.ArchiveSpanReaderPlugin";
    impl<T> tonic::server::NamedService for ArchiveSpanReaderPluginServer<T> {
        const NAME: &'static str = SERVICE_NAME;
    }
}
/// Generated client implementations.
pub mod dependencies_reader_plugin_client {
    #![allow(
        unused_variables,
        dead_code,
        missing_docs,
        clippy::wildcard_imports,
        clippy::let_unit_value,
    )]
    use tonic::codegen::*;
    use tonic::codegen::http::Uri;
    #[derive(Debug, Clone)]
    pub struct DependenciesReaderPluginClient<T> {
        inner: tonic::client::Grpc<T>,
    }
    impl DependenciesReaderPluginClient<tonic::transport::Channel> {
        /// Attempt to create a new client by connecting to a given endpoint.
        pub async fn connect<D>(dst: D) -> Result<Self, tonic::transport::Error>
        where
            D: TryInto<tonic::transport::Endpoint>,
            D::Error: Into<StdError>,
        {
            let conn = tonic::transport::Endpoint::new(dst)?.connect().await?;
            Ok(Self::new(conn))
        }
    }
    impl<T> DependenciesReaderPluginClient<T>
    where
        T: tonic::client::GrpcService<tonic::body::Body>,
        T::Error: Into<StdError>,
        T::ResponseBody: Body<Data = Bytes> + std::marker::Send + 'static,
        <T::ResponseBody as Body>::Error: Into<StdError> + std::marker::Send,
    {
        pub fn new(inner: T) -> Self {
            let inner = tonic::client::Grpc::new(inner);
            Self { inner }
        }
        pub fn with_origin(inner: T, origin: Uri) -> Self {
            let inner = tonic::client::Grpc::with_origin(inner, origin);
            Self { inner }
        }
        pub fn with_interceptor<F>(
            inner: T,
            interceptor: F,
        ) -> DependenciesReaderPluginClient<InterceptedService<T, F>>
        where
            F: tonic::service::Interceptor,
            T::ResponseBody: Default,
            T: tonic::codegen::Service<
                http::Request<tonic::body::Body>,
                Response = http::Response<
                    <T as tonic::client::GrpcService<tonic::body::Body>>::ResponseBody,
                >,
            >,
            <T as tonic::codegen::Service<
                http::Request<tonic::body::Body>,
            >>::Error: Into<StdError> + std::marker::Send + std::marker::Sync,
        {
            DependenciesReaderPluginClient::new(
                InterceptedService::new(inner, interceptor),
            )
        }
        /// Compress requests with the given encoding.
        ///
        /// This requires the server to support it otherwise it might respond with an
        /// error.
        #[must_use]
        pub fn send_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.inner = self.inner.send_compressed(encoding);
            self
        }
        /// Enable decompressing responses.
        #[must_use]
        pub fn accept_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.inner = self.inner.accept_compressed(encoding);
            self
        }
        /// Limits the maximum size of a decoded message.
        ///
        /// Default: `4MB`
        #[must_use]
        pub fn max_decoding_message_size(mut self, limit: usize) -> Self {
            self.inner = self.inner.max_decoding_message_size(limit);
            self
        }
        /// Limits the maximum size of an encoded message.
        ///
        /// Default: `usize::MAX`
        #[must_use]
        pub fn max_encoding_message_size(mut self, limit: usize) -> Self {
            self.inner = self.inner.max_encoding_message_size(limit);
            self
        }
        /// dependencystore/Reader
        pub async fn get_dependencies(
            &mut self,
            request: impl tonic::IntoRequest<super::GetDependenciesRequest>,
        ) -> std::result::Result<
            tonic::Response<super::GetDependenciesResponse>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/jaeger.storage.v1.DependenciesReaderPlugin/GetDependencies",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new(
                        "jaeger.storage.v1.DependenciesReaderPlugin",
                        "GetDependencies",
                    ),
                );
            self.inner.unary(req, path, codec).await
        }
    }
}
/// Generated server implementations.
pub mod dependencies_reader_plugin_server {
    #![allow(
        unused_variables,
        dead_code,
        missing_docs,
        clippy::wildcard_imports,
        clippy::let_unit_value,
    )]
    use tonic::codegen::*;
    /// Generated trait containing gRPC methods that should be implemented for use with DependenciesReaderPluginServer.
    #[async_trait]
    pub trait DependenciesReaderPlugin: std::marker::Send + std::marker::Sync + 'static {
        /// dependencystore/Reader
        async fn get_dependencies(
            &self,
            request: tonic::Request<super::GetDependenciesRequest>,
        ) -> std::result::Result<
            tonic::Response<super::GetDependenciesResponse>,
            tonic::Status,
        >;
    }
    #[derive(Debug)]
    pub struct DependenciesReaderPluginServer<T> {
        inner: Arc<T>,
        accept_compression_encodings: EnabledCompressionEncodings,
        send_compression_encodings: EnabledCompressionEncodings,
        max_decoding_message_size: Option<usize>,
        max_encoding_message_size: Option<usize>,
    }
    impl<T> DependenciesReaderPluginServer<T> {
        pub fn new(inner: T) -> Self {
            Self::from_arc(Arc::new(inner))
        }
        pub fn from_arc(inner: Arc<T>) -> Self {
            Self {
                inner,
                accept_compression_encodings: Default::default(),
                send_compression_encodings: Default::default(),
                max_decoding_message_size: None,
                max_encoding_message_size: None,
            }
        }
        pub fn with_interceptor<F>(
            inner: T,
            interceptor: F,
        ) -> InterceptedService<Self, F>
        where
            F: tonic::service::Interceptor,
        {
            InterceptedService::new(Self::new(inner), interceptor)
        }
        /// Enable decompressing requests with the given encoding.
        #[must_use]
        pub fn accept_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.accept_compression_encodings.enable(encoding);
            self
        }
        /// Compress responses with the given encoding, if the client supports it.
        #[must_use]
        pub fn send_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.send_compression_encodings.enable(encoding);
            self
        }
        /// Limits the maximum size of a decoded message.
        ///
        /// Default: `4MB`
        #[must_use]
        pub fn max_decoding_message_size(mut self, limit: usize) -> Self {
            self.max_decoding_message_size = Some(limit);
            self
        }
        /// Limits the maximum size of an encoded message.
        ///
        /// Default: `usize::MAX`
        #[must_use]
        pub fn max_encoding_message_size(mut self, limit: usize) -> Self {
            self.max_encoding_message_size = Some(limit);
            self
        }
    }
    impl<T, B> tonic::codegen::Service<http::Request<B>>
    for DependenciesReaderPluginServer<T>
    where
        T: DependenciesReaderPlugin,
        B: Body + std::marker::Send + 'static,
        B::Error: Into<StdError> + std::marker::Send + 'static,
    {
        type Response = http::Response<tonic::body::Body>;
        type Error = std::convert::Infallible;
        type Future = BoxFuture<Self::Response, Self::Error>;
        fn poll_ready(
            &mut self,
            _cx: &mut Context<'_>,
        ) -> Poll<std::result::Result<(), Self::Error>> {
            Poll::Ready(Ok(()))
        }
        fn call(&mut self, req: http::Request<B>) -> Self::Future {
            match req.uri().path() {
                "/jaeger.storage.v1.DependenciesReaderPlugin/GetDependencies" => {
                    #[allow(non_camel_case_types)]
                    struct GetDependenciesSvc<T: DependenciesReaderPlugin>(pub Arc<T>);
                    impl<
                        T: DependenciesReaderPlugin,
                    > tonic::server::UnaryService<super::GetDependenciesRequest>
                    for GetDependenciesSvc<T> {
                        type Response = super::GetDependenciesResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::GetDependenciesRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as DependenciesReaderPlugin>::get_dependencies(
                                        &inner,
                                        request,
                                    )
                                    .await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = GetDependenciesSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                _ => {
                    Box::pin(async move {
                        let mut response = http::Response::new(
                            tonic::body::Body::default(),
                        );
                        let headers = response.headers_mut();
                        headers
                            .insert(
                                tonic::Status::GRPC_STATUS,
                                (tonic::Code::Unimplemented as i32).into(),
                            );
                        headers
                            .insert(
                                http::header::CONTENT_TYPE,
                                tonic::metadata::GRPC_CONTENT_TYPE,
                            );
                        Ok(response)
                    })
                }
            }
        }
    }
    impl<T> Clone for DependenciesReaderPluginServer<T> {
        fn clone(&self) -> Self {
            let inner = self.inner.clone();
            Self {
                inner,
                accept_compression_encodings: self.accept_compression_encodings,
                send_compression_encodings: self.send_compression_encodings,
                max_decoding_message_size: self.max_decoding_message_size,
                max_encoding_message_size: self.max_encoding_message_size,
            }
        }
    }
    /// Generated gRPC service name
    pub const SERVICE_NAME: &str = "jaeger.storage.v1.DependenciesReaderPlugin";
    impl<T> tonic::server::NamedService for DependenciesReaderPluginServer<T> {
        const NAME: &'static str = SERVICE_NAME;
    }
}
/// Generated client implementations.
pub mod plugin_capabilities_client {
    #![allow(
        unused_variables,
        dead_code,
        missing_docs,
        clippy::wildcard_imports,
        clippy::let_unit_value,
    )]
    use tonic::codegen::*;
    use tonic::codegen::http::Uri;
    #[derive(Debug, Clone)]
    pub struct PluginCapabilitiesClient<T> {
        inner: tonic::client::Grpc<T>,
    }
    impl PluginCapabilitiesClient<tonic::transport::Channel> {
        /// Attempt to create a new client by connecting to a given endpoint.
        pub async fn connect<D>(dst: D) -> Result<Self, tonic::transport::Error>
        where
            D: TryInto<tonic::transport::Endpoint>,
            D::Error: Into<StdError>,
        {
            let conn = tonic::transport::Endpoint::new(dst)?.connect().await?;
            Ok(Self::new(conn))
        }
    }
    impl<T> PluginCapabilitiesClient<T>
    where
        T: tonic::client::GrpcService<tonic::body::Body>,
        T::Error: Into<StdError>,
        T::ResponseBody: Body<Data = Bytes> + std::marker::Send + 'static,
        <T::ResponseBody as Body>::Error: Into<StdError> + std::marker::Send,
    {
        pub fn new(inner: T) -> Self {
            let inner = tonic::client::Grpc::new(inner);
            Self { inner }
        }
        pub fn with_origin(inner: T, origin: Uri) -> Self {
            let inner = tonic::client::Grpc::with_origin(inner, origin);
            Self { inner }
        }
        pub fn with_interceptor<F>(
            inner: T,
            interceptor: F,
        ) -> PluginCapabilitiesClient<InterceptedService<T, F>>
        where
            F: tonic::service::Interceptor,
            T::ResponseBody: Default,
            T: tonic::codegen::Service<
                http::Request<tonic::body::Body>,
                Response = http::Response<
                    <T as tonic::client::GrpcService<tonic::body::Body>>::ResponseBody,
                >,
            >,
            <T as tonic::codegen::Service<
                http::Request<tonic::body::Body>,
            >>::Error: Into<StdError> + std::marker::Send + std::marker::Sync,
        {
            PluginCapabilitiesClient::new(InterceptedService::new(inner, interceptor))
        }
        /// Compress requests with the given encoding.
        ///
        /// This requires the server to support it otherwise it might respond with an
        /// error.
        #[must_use]
        pub fn send_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.inner = self.inner.send_compressed(encoding);
            self
        }
        /// Enable decompressing responses.
        #[must_use]
        pub fn accept_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.inner = self.inner.accept_compressed(encoding);
            self
        }
        /// Limits the maximum size of a decoded message.
        ///
        /// Default: `4MB`
        #[must_use]
        pub fn max_decoding_message_size(mut self, limit: usize) -> Self {
            self.inner = self.inner.max_decoding_message_size(limit);
            self
        }
        /// Limits the maximum size of an encoded message.
        ///
        /// Default: `usize::MAX`
        #[must_use]
        pub fn max_encoding_message_size(mut self, limit: usize) -> Self {
            self.inner = self.inner.max_encoding_message_size(limit);
            self
        }
        pub async fn capabilities(
            &mut self,
            request: impl tonic::IntoRequest<super::CapabilitiesRequest>,
        ) -> std::result::Result<
            tonic::Response<super::CapabilitiesResponse>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/jaeger.storage.v1.PluginCapabilities/Capabilities",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new(
                        "jaeger.storage.v1.PluginCapabilities",
                        "Capabilities",
                    ),
                );
            self.inner.unary(req, path, codec).await
        }
    }
}
/// Generated server implementations.
pub mod plugin_capabilities_server {
    #![allow(
        unused_variables,
        dead_code,
        missing_docs,
        clippy::wildcard_imports,
        clippy::let_unit_value,
    )]
    use tonic::codegen::*;
    /// Generated trait containing gRPC methods that should be implemented for use with PluginCapabilitiesServer.
    #[async_trait]
    pub trait PluginCapabilities: std::marker::Send + std::marker::Sync + 'static {
        async fn capabilities(
            &self,
            request: tonic::Request<super::CapabilitiesRequest>,
        ) -> std::result::Result<
            tonic::Response<super::CapabilitiesResponse>,
            tonic::Status,
        >;
    }
    #[derive(Debug)]
    pub struct PluginCapabilitiesServer<T> {
        inner: Arc<T>,
        accept_compression_encodings: EnabledCompressionEncodings,
        send_compression_encodings: EnabledCompressionEncodings,
        max_decoding_message_size: Option<usize>,
        max_encoding_message_size: Option<usize>,
    }
    impl<T> PluginCapabilitiesServer<T> {
        pub fn new(inner: T) -> Self {
            Self::from_arc(Arc::new(inner))
        }
        pub fn from_arc(inner: Arc<T>) -> Self {
            Self {
                inner,
                accept_compression_encodings: Default::default(),
                send_compression_encodings: Default::default(),
                max_decoding_message_size: None,
                max_encoding_message_size: None,
            }
        }
        pub fn with_interceptor<F>(
            inner: T,
            interceptor: F,
        ) -> InterceptedService<Self, F>
        where
            F: tonic::service::Interceptor,
        {
            InterceptedService::new(Self::new(inner), interceptor)
        }
        /// Enable decompressing requests with the given encoding.
        #[must_use]
        pub fn accept_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.accept_compression_encodings.enable(encoding);
            self
        }
        /// Compress responses with the given encoding, if the client supports it.
        #[must_use]
        pub fn send_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.send_compression_encodings.enable(encoding);
            self
        }
        /// Limits the maximum size of a decoded message.
        ///
        /// Default: `4MB`
        #[must_use]
        pub fn max_decoding_message_size(mut self, limit: usize) -> Self {
            self.max_decoding_message_size = Some(limit);
            self
        }
        /// Limits the maximum size of an encoded message.
        ///
        /// Default: `usize::MAX`
        #[must_use]
        pub fn max_encoding_message_size(mut self, limit: usize) -> Self {
            self.max_encoding_message_size = Some(limit);
            self
        }
    }
    impl<T, B> tonic::codegen::Service<http::Request<B>> for PluginCapabilitiesServer<T>
    where
        T: PluginCapabilities,
        B: Body + std::marker::Send + 'static,
        B::Error: Into<StdError> + std::marker::Send + 'static,
    {
        type Response = http::Response<tonic::body::Body>;
        type Error = std::convert::Infallible;
        type Future = BoxFuture<Self::Response, Self::Error>;
        fn poll_ready(
            &mut self,
            _cx: &mut Context<'_>,
        ) -> Poll<std::result::Result<(), Self::Error>> {
            Poll::Ready(Ok(()))
        }
        fn call(&mut self, req: http::Request<B>) -> Self::Future {
            match req.uri().path() {
                "/jaeger.storage.v1.PluginCapabilities/Capabilities" => {
                    #[allow(non_camel_case_types)]
                    struct CapabilitiesSvc<T: PluginCapabilities>(pub Arc<T>);
                    impl<
                        T: PluginCapabilities,
                    > tonic::server::UnaryService<super::CapabilitiesRequest>
                    for CapabilitiesSvc<T> {
                        type Response = super::CapabilitiesResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::CapabilitiesRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as PluginCapabilities>::capabilities(&inner, request)
                                    .await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = CapabilitiesSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                _ => {
                    Box::pin(async move {
                        let mut response = http::Response::new(
                            tonic::body::Body::default(),
                        );
                        let headers = response.headers_mut();
                        headers
                            .insert(
                                tonic::Status::GRPC_STATUS,
                                (tonic::Code::Unimplemented as i32).into(),
                            );
                        headers
                            .insert(
                                http::header::CONTENT_TYPE,
                                tonic::metadata::GRPC_CONTENT_TYPE,
                            );
                        Ok(response)
                    })
                }
            }
        }
    }
    impl<T> Clone for PluginCapabilitiesServer<T> {
        fn clone(&self) -> Self {
            let inner = self.inner.clone();
            Self {
                inner,
                accept_compression_encodings: self.accept_compression_encodings,
                send_compression_encodings: self.send_compression_encodings,
                max_decoding_message_size: self.max_decoding_message_size,
                max_encoding_message_size: self.max_encoding_message_size,
            }
        }
    }
    /// Generated gRPC service name
    pub const SERVICE_NAME: &str = "jaeger.storage.v1.PluginCapabilities";
    impl<T> tonic::server::NamedService for PluginCapabilitiesServer<T> {
        const NAME: &'static str = SERVICE_NAME;
    }
}


================================================
FILE: quickwit/quickwit-proto/src/codegen/jaeger/jaeger.storage.v2.rs
================================================
// This file is @generated by prost-build.
/// GetTraceParams represents the query for a single trace from the storage backend.
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct GetTraceParams {
    /// trace_id is a 16 byte array containing the unique identifier for the trace to query.
    #[prost(bytes = "vec", tag = "1")]
    pub trace_id: ::prost::alloc::vec::Vec<u8>,
    /// start_time is the start of the time interval to search for the trace_id.
    ///
    /// This field is optional.
    #[prost(message, optional, tag = "2")]
    pub start_time: ::core::option::Option<::prost_types::Timestamp>,
    /// end_time is the end of the time interval to search for the trace_id.
    ///
    /// This field is optional.
    #[prost(message, optional, tag = "3")]
    pub end_time: ::core::option::Option<::prost_types::Timestamp>,
}
/// GetTracesRequest represents a request to retrieve multiple traces.
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct GetTracesRequest {
    #[prost(message, repeated, tag = "1")]
    pub query: ::prost::alloc::vec::Vec<GetTraceParams>,
}
/// GetServicesRequest represents a request to get service names.
#[derive(Clone, Copy, PartialEq, Eq, Hash, ::prost::Message)]
pub struct GetServicesRequest {}
/// GetServicesResponse represents the response for GetServicesRequest.
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct GetServicesResponse {
    #[prost(string, repeated, tag = "1")]
    pub services: ::prost::alloc::vec::Vec<::prost::alloc::string::String>,
}
/// GetOperationsRequest represents a request to get operation names.
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct GetOperationsRequest {
    /// service is the name of the service for which to get operation names.
    ///
    /// This field is required.
    #[prost(string, tag = "1")]
    pub service: ::prost::alloc::string::String,
    /// span_kind is the type of span which is used to distinguish between
    /// spans generated in a particular context.
    ///
    /// This field is optional.
    #[prost(string, tag = "2")]
    pub span_kind: ::prost::alloc::string::String,
}
/// Operation contains information about an operation for a given service.
#[derive(Ord, PartialOrd)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct Operation {
    #[prost(string, tag = "1")]
    pub name: ::prost::alloc::string::String,
    #[prost(string, tag = "2")]
    pub span_kind: ::prost::alloc::string::String,
}
/// GetOperationsResponse represents the response for GetOperationsRequest.
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct GetOperationsResponse {
    #[prost(message, repeated, tag = "1")]
    pub operations: ::prost::alloc::vec::Vec<Operation>,
}
/// KeyValue and all its associated types are copied from opentelemetry-proto/common/v1/common.proto
/// (<https://github.com/open-telemetry/opentelemetry-proto/blob/main/opentelemetry/proto/common/v1/common.proto>).
/// This type is used to store attributes in traces.
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct KeyValue {
    #[prost(string, tag = "1")]
    pub key: ::prost::alloc::string::String,
    #[prost(message, optional, tag = "2")]
    pub value: ::core::option::Option<AnyValue>,
}
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct AnyValue {
    #[prost(oneof = "any_value::Value", tags = "1, 2, 3, 4, 5, 6, 7")]
    pub value: ::core::option::Option<any_value::Value>,
}
/// Nested message and enum types in `AnyValue`.
pub mod any_value {
    #[derive(Clone, PartialEq, ::prost::Oneof)]
    pub enum Value {
        #[prost(string, tag = "1")]
        StringValue(::prost::alloc::string::String),
        #[prost(bool, tag = "2")]
        BoolValue(bool),
        #[prost(int64, tag = "3")]
        IntValue(i64),
        #[prost(double, tag = "4")]
        DoubleValue(f64),
        #[prost(message, tag = "5")]
        ArrayValue(super::ArrayValue),
        #[prost(message, tag = "6")]
        KvlistValue(super::KeyValueList),
        #[prost(bytes, tag = "7")]
        BytesValue(::prost::alloc::vec::Vec<u8>),
    }
}
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct KeyValueList {
    #[prost(message, repeated, tag = "1")]
    pub values: ::prost::alloc::vec::Vec<KeyValue>,
}
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct ArrayValue {
    #[prost(message, repeated, tag = "1")]
    pub values: ::prost::alloc::vec::Vec<AnyValue>,
}
/// TraceQueryParameters contains query parameters to find traces. For a detailed
/// definition of each field in this message, refer to `TraceQueryParameters` in `jaeger.api_v3`
/// (<https://github.com/jaegertracing/jaeger-idl/blob/main/proto/api_v3/query_service.proto>).
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct TraceQueryParameters {
    #[prost(string, tag = "1")]
    pub service_name: ::prost::alloc::string::String,
    #[prost(string, tag = "2")]
    pub operation_name: ::prost::alloc::string::String,
    #[prost(message, repeated, tag = "3")]
    pub attributes: ::prost::alloc::vec::Vec<KeyValue>,
    #[prost(message, optional, tag = "4")]
    pub start_time_min: ::core::option::Option<::prost_types::Timestamp>,
    #[prost(message, optional, tag = "5")]
    pub start_time_max: ::core::option::Option<::prost_types::Timestamp>,
    #[prost(message, optional, tag = "6")]
    pub duration_min: ::core::option::Option<::prost_types::Duration>,
    #[prost(message, optional, tag = "7")]
    pub duration_max: ::core::option::Option<::prost_types::Duration>,
    #[prost(int32, tag = "8")]
    pub search_depth: i32,
}
/// FindTracesRequest represents a request to find traces.
/// It can be used to retrieve the traces (FindTraces) or simply
/// the trace IDs (FindTraceIDs).
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct FindTracesRequest {
    #[prost(message, optional, tag = "1")]
    pub query: ::core::option::Option<TraceQueryParameters>,
}
/// FoundTraceID is a wrapper around trace ID returned from FindTraceIDs
/// with an optional time range that may be used in GetTraces calls.
///
/// The time range is provided as an optimization hint for some storage backends
/// that can perform more efficient queries when they know the approximate time range.
/// The value should not be used for precise time-based filtering or assumptions.
/// It is meant as a rough boundary and may not be populated in all cases.
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct FoundTraceId {
    #[prost(bytes = "vec", tag = "1")]
    pub trace_id: ::prost::alloc::vec::Vec<u8>,
    #[prost(message, optional, tag = "2")]
    pub start: ::core::option::Option<::prost_types::Timestamp>,
    #[prost(message, optional, tag = "3")]
    pub end: ::core::option::Option<::prost_types::Timestamp>,
}
/// FindTraceIDsResponse represents the response for FindTracesRequest.
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct FindTraceIDsResponse {
    #[prost(message, repeated, tag = "1")]
    pub trace_ids: ::prost::alloc::vec::Vec<FoundTraceId>,
}
/// Generated client implementations.
pub mod trace_reader_client {
    #![allow(
        unused_variables,
        dead_code,
        missing_docs,
        clippy::wildcard_imports,
        clippy::let_unit_value,
    )]
    use tonic::codegen::*;
    use tonic::codegen::http::Uri;
    /// TraceReader is a service that allows reading traces from storage.
    /// Note that if you implement this service, you should also implement
    /// OTEL's TraceService in package opentelemetry.proto.collector.trace.v1
    /// to allow pushing traces to the storage backend
    /// (<https://github.com/open-telemetry/opentelemetry-proto/blob/main/opentelemetry/proto/collector/trace/v1/trace_service.proto>)
    #[derive(Debug, Clone)]
    pub struct TraceReaderClient<T> {
        inner: tonic::client::Grpc<T>,
    }
    impl TraceReaderClient<tonic::transport::Channel> {
        /// Attempt to create a new client by connecting to a given endpoint.
        pub async fn connect<D>(dst: D) -> Result<Self, tonic::transport::Error>
        where
            D: TryInto<tonic::transport::Endpoint>,
            D::Error: Into<StdError>,
        {
            let conn = tonic::transport::Endpoint::new(dst)?.connect().await?;
            Ok(Self::new(conn))
        }
    }
    impl<T> TraceReaderClient<T>
    where
        T: tonic::client::GrpcService<tonic::body::Body>,
        T::Error: Into<StdError>,
        T::ResponseBody: Body<Data = Bytes> + std::marker::Send + 'static,
        <T::ResponseBody as Body>::Error: Into<StdError> + std::marker::Send,
    {
        pub fn new(inner: T) -> Self {
            let inner = tonic::client::Grpc::new(inner);
            Self { inner }
        }
        pub fn with_origin(inner: T, origin: Uri) -> Self {
            let inner = tonic::client::Grpc::with_origin(inner, origin);
            Self { inner }
        }
        pub fn with_interceptor<F>(
            inner: T,
            interceptor: F,
        ) -> TraceReaderClient<InterceptedService<T, F>>
        where
            F: tonic::service::Interceptor,
            T::ResponseBody: Default,
            T: tonic::codegen::Service<
                http::Request<tonic::body::Body>,
                Response = http::Response<
                    <T as tonic::client::GrpcService<tonic::body::Body>>::ResponseBody,
                >,
            >,
            <T as tonic::codegen::Service<
                http::Request<tonic::body::Body>,
            >>::Error: Into<StdError> + std::marker::Send + std::marker::Sync,
        {
            TraceReaderClient::new(InterceptedService::new(inner, interceptor))
        }
        /// Compress requests with the given encoding.
        ///
        /// This requires the server to support it otherwise it might respond with an
        /// error.
        #[must_use]
        pub fn send_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.inner = self.inner.send_compressed(encoding);
            self
        }
        /// Enable decompressing responses.
        #[must_use]
        pub fn accept_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.inner = self.inner.accept_compressed(encoding);
            self
        }
        /// Limits the maximum size of a decoded message.
        ///
        /// Default: `4MB`
        #[must_use]
        pub fn max_decoding_message_size(mut self, limit: usize) -> Self {
            self.inner = self.inner.max_decoding_message_size(limit);
            self
        }
        /// Limits the maximum size of an encoded message.
        ///
        /// Default: `usize::MAX`
        #[must_use]
        pub fn max_encoding_message_size(mut self, limit: usize) -> Self {
            self.inner = self.inner.max_encoding_message_size(limit);
            self
        }
        /// GetTraces returns a stream that retrieves all traces with given IDs.
        ///
        /// Chunking requirements:
        ///
        /// * A single TracesData chunk MUST NOT contain spans from multiple traces.
        /// * Large traces MAY be split across multiple, *consecutive* TracesData chunks.
        /// * Each returned TracesData object MUST NOT be empty.
        ///
        /// Edge cases:
        ///
        /// * If no spans are found for any given trace ID, the ID is ignored.
        /// * If none of the trace IDs are found in the storage, an empty response is returned.
        pub async fn get_traces(
            &mut self,
            request: impl tonic::IntoRequest<super::GetTracesRequest>,
        ) -> std::result::Result<
            tonic::Response<
                tonic::codec::Streaming<
                    super::super::super::super::opentelemetry::proto::trace::v1::TracesData,
                >,
            >,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/jaeger.storage.v2.TraceReader/GetTraces",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(GrpcMethod::new("jaeger.storage.v2.TraceReader", "GetTraces"));
            self.inner.server_streaming(req, path, codec).await
        }
        /// GetServices returns all service names known to the backend from traces
        /// within its retention period.
        pub async fn get_services(
            &mut self,
            request: impl tonic::IntoRequest<super::GetServicesRequest>,
        ) -> std::result::Result<
            tonic::Response<super::GetServicesResponse>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/jaeger.storage.v2.TraceReader/GetServices",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(GrpcMethod::new("jaeger.storage.v2.TraceReader", "GetServices"));
            self.inner.unary(req, path, codec).await
        }
        /// GetOperations returns all operation names for a given service
        /// known to the backend from traces within its retention period.
        pub async fn get_operations(
            &mut self,
            request: impl tonic::IntoRequest<super::GetOperationsRequest>,
        ) -> std::result::Result<
            tonic::Response<super::GetOperationsResponse>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/jaeger.storage.v2.TraceReader/GetOperations",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new("jaeger.storage.v2.TraceReader", "GetOperations"),
                );
            self.inner.unary(req, path, codec).await
        }
        /// FindTraces returns a stream that retrieves traces matching query parameters.
        ///
        /// The chunking rules are the same as for GetTraces.
        ///
        /// If no matching traces are found, an empty stream is returned.
        pub async fn find_traces(
            &mut self,
            request: impl tonic::IntoRequest<super::FindTracesRequest>,
        ) -> std::result::Result<
            tonic::Response<
                tonic::codec::Streaming<
                    super::super::super::super::opentelemetry::proto::trace::v1::TracesData,
                >,
            >,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/jaeger.storage.v2.TraceReader/FindTraces",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(GrpcMethod::new("jaeger.storage.v2.TraceReader", "FindTraces"));
            self.inner.server_streaming(req, path, codec).await
        }
        /// FindTraceIDs returns a stream that retrieves IDs of traces matching query parameters.
        ///
        /// If no matching traces are found, an empty stream is returned.
        ///
        /// This call behaves identically to FindTraces, except that it returns only the list
        /// of matching trace IDs. This is useful in some contexts, such as batch jobs, where a
        /// large list of trace IDs may be queried first and then the full traces are loaded
        /// in batches.
        pub async fn find_trace_i_ds(
            &mut self,
            request: impl tonic::IntoRequest<super::FindTracesRequest>,
        ) -> std::result::Result<
            tonic::Response<super::FindTraceIDsResponse>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/jaeger.storage.v2.TraceReader/FindTraceIDs",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new("jaeger.storage.v2.TraceReader", "FindTraceIDs"),
                );
            self.inner.unary(req, path, codec).await
        }
    }
}
/// Generated server implementations.
pub mod trace_reader_server {
    #![allow(
        unused_variables,
        dead_code,
        missing_docs,
        clippy::wildcard_imports,
        clippy::let_unit_value,
    )]
    use tonic::codegen::*;
    /// Generated trait containing gRPC methods that should be implemented for use with TraceReaderServer.
    #[async_trait]
    pub trait TraceReader: std::marker::Send + std::marker::Sync + 'static {
        /// Server streaming response type for the GetTraces method.
        type GetTracesStream: tonic::codegen::tokio_stream::Stream<
                Item = std::result::Result<
                    super::super::super::super::opentelemetry::proto::trace::v1::TracesData,
                    tonic::Status,
                >,
            >
            + std::marker::Send
            + 'static;
        /// GetTraces returns a stream that retrieves all traces with given IDs.
        ///
        /// Chunking requirements:
        ///
        /// * A single TracesData chunk MUST NOT contain spans from multiple traces.
        /// * Large traces MAY be split across multiple, *consecutive* TracesData chunks.
        /// * Each returned TracesData object MUST NOT be empty.
        ///
        /// Edge cases:
        ///
        /// * If no spans are found for any given trace ID, the ID is ignored.
        /// * If none of the trace IDs are found in the storage, an empty response is returned.
        async fn get_traces(
            &self,
            request: tonic::Request<super::GetTracesRequest>,
        ) -> std::result::Result<tonic::Response<Self::GetTracesStream>, tonic::Status>;
        /// GetServices returns all service names known to the backend from traces
        /// within its retention period.
        async fn get_services(
            &self,
            request: tonic::Request<super::GetServicesRequest>,
        ) -> std::result::Result<
            tonic::Response<super::GetServicesResponse>,
            tonic::Status,
        >;
        /// GetOperations returns all operation names for a given service
        /// known to the backend from traces within its retention period.
        async fn get_operations(
            &self,
            request: tonic::Request<super::GetOperationsRequest>,
        ) -> std::result::Result<
            tonic::Response<super::GetOperationsResponse>,
            tonic::Status,
        >;
        /// Server streaming response type for the FindTraces method.
        type FindTracesStream: tonic::codegen::tokio_stream::Stream<
                Item = std::result::Result<
                    super::super::super::super::opentelemetry::proto::trace::v1::TracesData,
                    tonic::Status,
                >,
            >
            + std::marker::Send
            + 'static;
        /// FindTraces returns a stream that retrieves traces matching query parameters.
        ///
        /// The chunking rules are the same as for GetTraces.
        ///
        /// If no matching traces are found, an empty stream is returned.
        async fn find_traces(
            &self,
            request: tonic::Request<super::FindTracesRequest>,
        ) -> std::result::Result<tonic::Response<Self::FindTracesStream>, tonic::Status>;
        /// FindTraceIDs returns a stream that retrieves IDs of traces matching query parameters.
        ///
        /// If no matching traces are found, an empty stream is returned.
        ///
        /// This call behaves identically to FindTraces, except that it returns only the list
        /// of matching trace IDs. This is useful in some contexts, such as batch jobs, where a
        /// large list of trace IDs may be queried first and then the full traces are loaded
        /// in batches.
        async fn find_trace_i_ds(
            &self,
            request: tonic::Request<super::FindTracesRequest>,
        ) -> std::result::Result<
            tonic::Response<super::FindTraceIDsResponse>,
            tonic::Status,
        >;
    }
    /// TraceReader is a service that allows reading traces from storage.
    /// Note that if you implement this service, you should also implement
    /// OTEL's TraceService in package opentelemetry.proto.collector.trace.v1
    /// to allow pushing traces to the storage backend
    /// (<https://github.com/open-telemetry/opentelemetry-proto/blob/main/opentelemetry/proto/collector/trace/v1/trace_service.proto>)
    #[derive(Debug)]
    pub struct TraceReaderServer<T> {
        inner: Arc<T>,
        accept_compression_encodings: EnabledCompressionEncodings,
        send_compression_encodings: EnabledCompressionEncodings,
        max_decoding_message_size: Option<usize>,
        max_encoding_message_size: Option<usize>,
    }
    impl<T> TraceReaderServer<T> {
        pub fn new(inner: T) -> Self {
            Self::from_arc(Arc::new(inner))
        }
        pub fn from_arc(inner: Arc<T>) -> Self {
            Self {
                inner,
                accept_compression_encodings: Default::default(),
                send_compression_encodings: Default::default(),
                max_decoding_message_size: None,
                max_encoding_message_size: None,
            }
        }
        pub fn with_interceptor<F>(
            inner: T,
            interceptor: F,
        ) -> InterceptedService<Self, F>
        where
            F: tonic::service::Interceptor,
        {
            InterceptedService::new(Self::new(inner), interceptor)
        }
        /// Enable decompressing requests with the given encoding.
        #[must_use]
        pub fn accept_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.accept_compression_encodings.enable(encoding);
            self
        }
        /// Compress responses with the given encoding, if the client supports it.
        #[must_use]
        pub fn send_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.send_compression_encodings.enable(encoding);
            self
        }
        /// Limits the maximum size of a decoded message.
        ///
        /// Default: `4MB`
        #[must_use]
        pub fn max_decoding_message_size(mut self, limit: usize) -> Self {
            self.max_decoding_message_size = Some(limit);
            self
        }
        /// Limits the maximum size of an encoded message.
        ///
        /// Default: `usize::MAX`
        #[must_use]
        pub fn max_encoding_message_size(mut self, limit: usize) -> Self {
            self.max_encoding_message_size = Some(limit);
            self
        }
    }
    impl<T, B> tonic::codegen::Service<http::Request<B>> for TraceReaderServer<T>
    where
        T: TraceReader,
        B: Body + std::marker::Send + 'static,
        B::Error: Into<StdError> + std::marker::Send + 'static,
    {
        type Response = http::Response<tonic::body::Body>;
        type Error = std::convert::Infallible;
        type Future = BoxFuture<Self::Response, Self::Error>;
        fn poll_ready(
            &mut self,
            _cx: &mut Context<'_>,
        ) -> Poll<std::result::Result<(), Self::Error>> {
            Poll::Ready(Ok(()))
        }
        fn call(&mut self, req: http::Request<B>) -> Self::Future {
            match req.uri().path() {
                "/jaeger.storage.v2.TraceReader/GetTraces" => {
                    #[allow(non_camel_case_types)]
                    struct GetTracesSvc<T: TraceReader>(pub Arc<T>);
                    impl<
                        T: TraceReader,
                    > tonic::server::ServerStreamingService<super::GetTracesRequest>
                    for GetTracesSvc<T> {
                        type Response = super::super::super::super::opentelemetry::proto::trace::v1::TracesData;
                        type ResponseStream = T::GetTracesStream;
                        type Future = BoxFuture<
                            tonic::Response<Self::ResponseStream>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::GetTracesRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as TraceReader>::get_traces(&inner, request).await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = GetTracesSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.server_streaming(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/jaeger.storage.v2.TraceReader/GetServices" => {
                    #[allow(non_camel_case_types)]
                    struct GetServicesSvc<T: TraceReader>(pub Arc<T>);
                    impl<
                        T: TraceReader,
                    > tonic::server::UnaryService<super::GetServicesRequest>
                    for GetServicesSvc<T> {
                        type Response = super::GetServicesResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::GetServicesRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as TraceReader>::get_services(&inner, request).await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = GetServicesSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/jaeger.storage.v2.TraceReader/GetOperations" => {
                    #[allow(non_camel_case_types)]
                    struct GetOperationsSvc<T: TraceReader>(pub Arc<T>);
                    impl<
                        T: TraceReader,
                    > tonic::server::UnaryService<super::GetOperationsRequest>
                    for GetOperationsSvc<T> {
                        type Response = super::GetOperationsResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::GetOperationsRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as TraceReader>::get_operations(&inner, request).await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = GetOperationsSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/jaeger.storage.v2.TraceReader/FindTraces" => {
                    #[allow(non_camel_case_types)]
                    struct FindTracesSvc<T: TraceReader>(pub Arc<T>);
                    impl<
                        T: TraceReader,
                    > tonic::server::ServerStreamingService<super::FindTracesRequest>
                    for FindTracesSvc<T> {
                        type Response = super::super::super::super::opentelemetry::proto::trace::v1::TracesData;
                        type ResponseStream = T::FindTracesStream;
                        type Future = BoxFuture<
                            tonic::Response<Self::ResponseStream>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::FindTracesRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as TraceReader>::find_traces(&inner, request).await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = FindTracesSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.server_streaming(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/jaeger.storage.v2.TraceReader/FindTraceIDs" => {
                    #[allow(non_camel_case_types)]
                    struct FindTraceIDsSvc<T: TraceReader>(pub Arc<T>);
                    impl<
                        T: TraceReader,
                    > tonic::server::UnaryService<super::FindTracesRequest>
                    for FindTraceIDsSvc<T> {
                        type Response = super::FindTraceIDsResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::FindTracesRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as TraceReader>::find_trace_i_ds(&inner, request).await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = FindTraceIDsSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                _ => {
                    Box::pin(async move {
                        let mut response = http::Response::new(
                            tonic::body::Body::default(),
                        );
                        let headers = response.headers_mut();
                        headers
                            .insert(
                                tonic::Status::GRPC_STATUS,
                                (tonic::Code::Unimplemented as i32).into(),
                            );
                        headers
                            .insert(
                                http::header::CONTENT_TYPE,
                                tonic::metadata::GRPC_CONTENT_TYPE,
                            );
                        Ok(response)
                    })
                }
            }
        }
    }
    impl<T> Clone for TraceReaderServer<T> {
        fn clone(&self) -> Self {
            let inner = self.inner.clone();
            Self {
                inner,
                accept_compression_encodings: self.accept_compression_encodings,
                send_compression_encodings: self.send_compression_encodings,
                max_decoding_message_size: self.max_decoding_message_size,
                max_encoding_message_size: self.max_encoding_message_size,
            }
        }
    }
    /// Generated gRPC service name
    pub const SERVICE_NAME: &str = "jaeger.storage.v2.TraceReader";
    impl<T> tonic::server::NamedService for TraceReaderServer<T> {
        const NAME: &'static str = SERVICE_NAME;
    }
}


================================================
FILE: quickwit/quickwit-proto/src/codegen/jaeger/opentelemetry.proto.common.v1.rs
================================================
// This file is @generated by prost-build.
/// AnyValue is used to represent any type of attribute value. AnyValue may contain a
/// primitive value such as a string or integer or it may contain an arbitrary nested
/// object containing arrays, key-value lists and primitives.
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct AnyValue {
    /// The value is one of the listed fields. It is valid for all values to be unspecified
    /// in which case this AnyValue is considered to be "empty".
    #[prost(oneof = "any_value::Value", tags = "1, 2, 3, 4, 5, 6, 7")]
    pub value: ::core::option::Option<any_value::Value>,
}
/// Nested message and enum types in `AnyValue`.
pub mod any_value {
    /// The value is one of the listed fields. It is valid for all values to be unspecified
    /// in which case this AnyValue is considered to be "empty".
    #[derive(Clone, PartialEq, ::prost::Oneof)]
    pub enum Value {
        #[prost(string, tag = "1")]
        StringValue(::prost::alloc::string::String),
        #[prost(bool, tag = "2")]
        BoolValue(bool),
        #[prost(int64, tag = "3")]
        IntValue(i64),
        #[prost(double, tag = "4")]
        DoubleValue(f64),
        #[prost(message, tag = "5")]
        ArrayValue(super::ArrayValue),
        #[prost(message, tag = "6")]
        KvlistValue(super::KeyValueList),
        #[prost(bytes, tag = "7")]
        BytesValue(::prost::alloc::vec::Vec<u8>),
    }
}
/// ArrayValue is a list of AnyValue messages. We need ArrayValue as a message
/// since oneof in AnyValue does not allow repeated fields.
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct ArrayValue {
    /// Array of values. The array may be empty (contain 0 elements).
    #[prost(message, repeated, tag = "1")]
    pub values: ::prost::alloc::vec::Vec<AnyValue>,
}
/// KeyValueList is a list of KeyValue messages. We need KeyValueList as a message
/// since `oneof` in AnyValue does not allow repeated fields. Everywhere else where we need
/// a list of KeyValue messages (e.g. in Span) we use `repeated KeyValue` directly to
/// avoid unnecessary extra wrapping (which slows down the protocol). The 2 approaches
/// are semantically equivalent.
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct KeyValueList {
    /// A collection of key/value pairs of key-value pairs. The list may be empty (may
    /// contain 0 elements).
    /// The keys MUST be unique (it is not allowed to have more than one
    /// value with the same key).
    #[prost(message, repeated, tag = "1")]
    pub values: ::prost::alloc::vec::Vec<KeyValue>,
}
/// KeyValue is a key-value pair that is used to store Span attributes, Link
/// attributes, etc.
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct KeyValue {
    #[prost(string, tag = "1")]
    pub key: ::prost::alloc::string::String,
    #[prost(message, optional, tag = "2")]
    pub value: ::core::option::Option<AnyValue>,
}
/// InstrumentationScope is a message representing the instrumentation scope information
/// such as the fully qualified name and version.
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct InstrumentationScope {
    /// An empty instrumentation scope name means the name is unknown.
    #[prost(string, tag = "1")]
    pub name: ::prost::alloc::string::String,
    #[prost(string, tag = "2")]
    pub version: ::prost::alloc::string::String,
    #[prost(message, repeated, tag = "3")]
    pub attributes: ::prost::alloc::vec::Vec<KeyValue>,
    #[prost(uint32, tag = "4")]
    pub dropped_attributes_count: u32,
}


================================================
FILE: quickwit/quickwit-proto/src/codegen/jaeger/opentelemetry.proto.resource.v1.rs
================================================
// This file is @generated by prost-build.
/// Resource information.
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct Resource {
    /// Set of attributes that describe the resource.
    /// Attribute keys MUST be unique (it is not allowed to have more than one
    /// attribute with the same key).
    #[prost(message, repeated, tag = "1")]
    pub attributes: ::prost::alloc::vec::Vec<super::super::common::v1::KeyValue>,
    /// dropped_attributes_count is the number of dropped attributes. If the value is 0, then
    /// no attributes were dropped.
    #[prost(uint32, tag = "2")]
    pub dropped_attributes_count: u32,
}


================================================
FILE: quickwit/quickwit-proto/src/codegen/jaeger/opentelemetry.proto.trace.v1.rs
================================================
// This file is @generated by prost-build.
/// TracesData represents the traces data that can be stored in a persistent storage,
/// OR can be embedded by other protocols that transfer OTLP traces data but do
/// not implement the OTLP protocol.
///
/// The main difference between this message and collector protocol is that
/// in this message there will not be any "control" or "metadata" specific to
/// OTLP protocol.
///
/// When new fields are added into this message, the OTLP request MUST be updated
/// as well.
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct TracesData {
    /// An array of ResourceSpans.
    /// For data coming from a single resource this array will typically contain
    /// one element. Intermediary nodes that receive data from multiple origins
    /// typically batch the data before forwarding further and in that case this
    /// array will contain multiple elements.
    #[prost(message, repeated, tag = "1")]
    pub resource_spans: ::prost::alloc::vec::Vec<ResourceSpans>,
}
/// A collection of ScopeSpans from a Resource.
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct ResourceSpans {
    /// The resource for the spans in this message.
    /// If this field is not set then no resource info is known.
    #[prost(message, optional, tag = "1")]
    pub resource: ::core::option::Option<super::super::resource::v1::Resource>,
    /// A list of ScopeSpans that originate from a resource.
    #[prost(message, repeated, tag = "2")]
    pub scope_spans: ::prost::alloc::vec::Vec<ScopeSpans>,
    /// This schema_url applies to the data in the "resource" field. It does not apply
    /// to the data in the "scope_spans" field which have their own schema_url field.
    #[prost(string, tag = "3")]
    pub schema_url: ::prost::alloc::string::String,
}
/// A collection of Spans produced by an InstrumentationScope.
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct ScopeSpans {
    /// The instrumentation scope information for the spans in this message.
    /// Semantically when InstrumentationScope isn't set, it is equivalent with
    /// an empty instrumentation scope name (unknown).
    #[prost(message, optional, tag = "1")]
    pub scope: ::core::option::Option<super::super::common::v1::InstrumentationScope>,
    /// A list of Spans that originate from an instrumentation scope.
    #[prost(message, repeated, tag = "2")]
    pub spans: ::prost::alloc::vec::Vec<Span>,
    /// This schema_url applies to all spans and span events in the "spans" field.
    #[prost(string, tag = "3")]
    pub schema_url: ::prost::alloc::string::String,
}
/// A Span represents a single operation performed by a single component of the system.
///
/// The next available field id is 17.
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct Span {
    /// A unique identifier for a trace. All spans from the same trace share
    /// the same `trace_id`. The ID is a 16-byte array. An ID with all zeroes
    /// is considered invalid.
    ///
    /// This field is semantically required. Receiver should generate new
    /// random trace_id if empty or invalid trace_id was received.
    ///
    /// This field is required.
    #[prost(bytes = "vec", tag = "1")]
    pub trace_id: ::prost::alloc::vec::Vec<u8>,
    /// A unique identifier for a span within a trace, assigned when the span
    /// is created. The ID is an 8-byte array. An ID with all zeroes is considered
    /// invalid.
    ///
    /// This field is semantically required. Receiver should generate new
    /// random span_id if empty or invalid span_id was received.
    ///
    /// This field is required.
    #[prost(bytes = "vec", tag = "2")]
    pub span_id: ::prost::alloc::vec::Vec<u8>,
    /// trace_state conveys information about request position in multiple distributed tracing graphs.
    /// It is a trace_state in w3c-trace-context format: <https://www.w3.org/TR/trace-context/#tracestate-header>
    /// See also <https://github.com/w3c/distributed-tracing> for more details about this field.
    #[prost(string, tag = "3")]
    pub trace_state: ::prost::alloc::string::String,
    /// The `span_id` of this span's parent span. If this is a root span, then this
    /// field must be empty. The ID is an 8-byte array.
    #[prost(bytes = "vec", tag = "4")]
    pub parent_span_id: ::prost::alloc::vec::Vec<u8>,
    /// A description of the span's operation.
    ///
    /// For example, the name can be a qualified method name or a file name
    /// and a line number where the operation is called. A best practice is to use
    /// the same display name at the same call point in an application.
    /// This makes it easier to correlate spans in different traces.
    ///
    /// This field is semantically required to be set to non-empty string.
    /// Empty value is equivalent to an unknown span name.
    ///
    /// This field is required.
    #[prost(string, tag = "5")]
    pub name: ::prost::alloc::string::String,
    /// Distinguishes between spans generated in a particular context. For example,
    /// two spans with the same name may be distinguished using `CLIENT` (caller)
    /// and `SERVER` (callee) to identify queueing latency associated with the span.
    #[prost(enumeration = "span::SpanKind", tag = "6")]
    pub kind: i32,
    /// start_time_unix_nano is the start time of the span. On the client side, this is the time
    /// kept by the local machine where the span execution starts. On the server side, this
    /// is the time when the server's application handler starts running.
    /// Value is UNIX Epoch time in nanoseconds since 00:00:00 UTC on 1 January 1970.
    ///
    /// This field is semantically required and it is expected that end_time >= start_time.
    #[prost(fixed64, tag = "7")]
    pub start_time_unix_nano: u64,
    /// end_time_unix_nano is the end time of the span. On the client side, this is the time
    /// kept by the local machine where the span execution ends. On the server side, this
    /// is the time when the server application handler stops running.
    /// Value is UNIX Epoch time in nanoseconds since 00:00:00 UTC on 1 January 1970.
    ///
    /// This field is semantically required and it is expected that end_time >= start_time.
    #[prost(fixed64, tag = "8")]
    pub end_time_unix_nano: u64,
    /// attributes is a collection of key/value pairs. Note, global attributes
    /// like server name can be set using the resource API. Examples of attributes:
    ///
    /// ```text
    /// "/http/user_agent": "Mozilla/5.0 (Macintosh; Intel Mac OS X 10_14_2) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/71.0.3578.98 Safari/537.36"
    /// "/http/server_latency": 300
    /// "abc.com/myattribute": true
    /// "abc.com/score": 10.239
    /// ```
    ///
    /// The OpenTelemetry API specification further restricts the allowed value types:
    /// <https://github.com/open-telemetry/opentelemetry-specification/blob/main/specification/common/README.md#attribute>
    /// Attribute keys MUST be unique (it is not allowed to have more than one
    /// attribute with the same key).
    #[prost(message, repeated, tag = "9")]
    pub attributes: ::prost::alloc::vec::Vec<super::super::common::v1::KeyValue>,
    /// dropped_attributes_count is the number of attributes that were discarded. Attributes
    /// can be discarded because their keys are too long or because there are too many
    /// attributes. If this value is 0, then no attributes were dropped.
    #[prost(uint32, tag = "10")]
    pub dropped_attributes_count: u32,
    /// events is a collection of Event items.
    #[prost(message, repeated, tag = "11")]
    pub events: ::prost::alloc::vec::Vec<span::Event>,
    /// dropped_events_count is the number of dropped events. If the value is 0, then no
    /// events were dropped.
    #[prost(uint32, tag = "12")]
    pub dropped_events_count: u32,
    /// links is a collection of Links, which are references from this span to a span
    /// in the same or different trace.
    #[prost(message, repeated, tag = "13")]
    pub links: ::prost::alloc::vec::Vec<span::Link>,
    /// dropped_links_count is the number of dropped links after the maximum size was
    /// enforced. If this value is 0, then no links were dropped.
    #[prost(uint32, tag = "14")]
    pub dropped_links_count: u32,
    /// An optional final status for this span. Semantically when Status isn't set, it means
    /// span's status code is unset, i.e. assume STATUS_CODE_UNSET (code = 0).
    #[prost(message, optional, tag = "15")]
    pub status: ::core::option::Option<Status>,
}
/// Nested message and enum types in `Span`.
pub mod span {
    /// Event is a time-stamped annotation of the span, consisting of user-supplied
    /// text description and key-value pairs.
    #[derive(Clone, PartialEq, ::prost::Message)]
    pub struct Event {
        /// time_unix_nano is the time the event occurred.
        #[prost(fixed64, tag = "1")]
        pub time_unix_nano: u64,
        /// name of the event.
        /// This field is semantically required to be set to non-empty string.
        #[prost(string, tag = "2")]
        pub name: ::prost::alloc::string::String,
        /// attributes is a collection of attribute key/value pairs on the event.
        /// Attribute keys MUST be unique (it is not allowed to have more than one
        /// attribute with the same key).
        #[prost(message, repeated, tag = "3")]
        pub attributes: ::prost::alloc::vec::Vec<
            super::super::super::common::v1::KeyValue,
        >,
        /// dropped_attributes_count is the number of dropped attributes. If the value is 0,
        /// then no attributes were dropped.
        #[prost(uint32, tag = "4")]
        pub dropped_attributes_count: u32,
    }
    /// A pointer from the current span to another span in the same trace or in a
    /// different trace. For example, this can be used in batching operations,
    /// where a single batch handler processes multiple requests from different
    /// traces or when the handler receives a request from a different project.
    #[derive(Clone, PartialEq, ::prost::Message)]
    pub struct Link {
        /// A unique identifier of a trace that this linked span is part of. The ID is a
        /// 16-byte array.
        #[prost(bytes = "vec", tag = "1")]
        pub trace_id: ::prost::alloc::vec::Vec<u8>,
        /// A unique identifier for the linked span. The ID is an 8-byte array.
        #[prost(bytes = "vec", tag = "2")]
        pub span_id: ::prost::alloc::vec::Vec<u8>,
        /// The trace_state associated with the link.
        #[prost(string, tag = "3")]
        pub trace_state: ::prost::alloc::string::String,
        /// attributes is a collection of attribute key/value pairs on the link.
        /// Attribute keys MUST be unique (it is not allowed to have more than one
        /// attribute with the same key).
        #[prost(message, repeated, tag = "4")]
        pub attributes: ::prost::alloc::vec::Vec<
            super::super::super::common::v1::KeyValue,
        >,
        /// dropped_attributes_count is the number of dropped attributes. If the value is 0,
        /// then no attributes were dropped.
        #[prost(uint32, tag = "5")]
        pub dropped_attributes_count: u32,
    }
    /// SpanKind is the type of span. Can be used to specify additional relationships between spans
    /// in addition to a parent/child relationship.
    #[derive(
        Clone,
        Copy,
        Debug,
        PartialEq,
        Eq,
        Hash,
        PartialOrd,
        Ord,
        ::prost::Enumeration
    )]
    #[repr(i32)]
    pub enum SpanKind {
        /// Unspecified. Do NOT use as default.
        /// Implementations MAY assume SpanKind to be INTERNAL when receiving UNSPECIFIED.
        Unspecified = 0,
        /// Indicates that the span represents an internal operation within an application,
        /// as opposed to an operation happening at the boundaries. Default value.
        Internal = 1,
        /// Indicates that the span covers server-side handling of an RPC or other
        /// remote network request.
        Server = 2,
        /// Indicates that the span describes a request to some remote service.
        Client = 3,
        /// Indicates that the span describes a producer sending a message to a broker.
        /// Unlike CLIENT and SERVER, there is often no direct critical path latency relationship
        /// between producer and consumer spans. A PRODUCER span ends when the message was accepted
        /// by the broker while the logical processing of the message might span a much longer time.
        Producer = 4,
        /// Indicates that the span describes consumer receiving a message from a broker.
        /// Like the PRODUCER kind, there is often no direct critical path latency relationship
        /// between producer and consumer spans.
        Consumer = 5,
    }
    impl SpanKind {
        /// String value of the enum field names used in the ProtoBuf definition.
        ///
        /// The values are not transformed in any way and thus are considered stable
        /// (if the ProtoBuf definition does not change) and safe for programmatic use.
        pub fn as_str_name(&self) -> &'static str {
            match self {
                Self::Unspecified => "SPAN_KIND_UNSPECIFIED",
                Self::Internal => "SPAN_KIND_INTERNAL",
                Self::Server => "SPAN_KIND_SERVER",
                Self::Client => "SPAN_KIND_CLIENT",
                Self::Producer => "SPAN_KIND_PRODUCER",
                Self::Consumer => "SPAN_KIND_CONSUMER",
            }
        }
        /// Creates an enum from field names used in the ProtoBuf definition.
        pub fn from_str_name(value: &str) -> ::core::option::Option<Self> {
            match value {
                "SPAN_KIND_UNSPECIFIED" => Some(Self::Unspecified),
                "SPAN_KIND_INTERNAL" => Some(Self::Internal),
                "SPAN_KIND_SERVER" => Some(Self::Server),
                "SPAN_KIND_CLIENT" => Some(Self::Client),
                "SPAN_KIND_PRODUCER" => Some(Self::Producer),
                "SPAN_KIND_CONSUMER" => Some(Self::Consumer),
                _ => None,
            }
        }
    }
}
/// The Status type defines a logical error model that is suitable for different
/// programming environments, including REST APIs and RPC APIs.
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct Status {
    /// A developer-facing human readable error message.
    #[prost(string, tag = "2")]
    pub message: ::prost::alloc::string::String,
    /// The status code.
    #[prost(enumeration = "status::StatusCode", tag = "3")]
    pub code: i32,
}
/// Nested message and enum types in `Status`.
pub mod status {
    /// For the semantics of status codes see
    /// <https://github.com/open-telemetry/opentelemetry-specification/blob/main/specification/trace/api.md#set-status>
    #[derive(
        Clone,
        Copy,
        Debug,
        PartialEq,
        Eq,
        Hash,
        PartialOrd,
        Ord,
        ::prost::Enumeration
    )]
    #[repr(i32)]
    pub enum StatusCode {
        /// The default status.
        Unset = 0,
        /// The Span has been validated by an Application developer or Operator to
        /// have completed successfully.
        Ok = 1,
        /// The Span contains an error.
        Error = 2,
    }
    impl StatusCode {
        /// String value of the enum field names used in the ProtoBuf definition.
        ///
        /// The values are not transformed in any way and thus are considered stable
        /// (if the ProtoBuf definition does not change) and safe for programmatic use.
        pub fn as_str_name(&self) -> &'static str {
            match self {
                Self::Unset => "STATUS_CODE_UNSET",
                Self::Ok => "STATUS_CODE_OK",
                Self::Error => "STATUS_CODE_ERROR",
            }
        }
        /// Creates an enum from field names used in the ProtoBuf definition.
        pub fn from_str_name(value: &str) -> ::core::option::Option<Self> {
            match value {
                "STATUS_CODE_UNSET" => Some(Self::Unset),
                "STATUS_CODE_OK" => Some(Self::Ok),
                "STATUS_CODE_ERROR" => Some(Self::Error),
                _ => None,
            }
        }
    }
}


================================================
FILE: quickwit/quickwit-proto/src/codegen/opentelemetry/opentelemetry.proto.collector.logs.v1.rs
================================================
// This file is @generated by prost-build.
#[derive(serde::Serialize, serde::Deserialize)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct ExportLogsServiceRequest {
    /// An array of ResourceLogs.
    /// For data coming from a single resource this array will typically contain one
    /// element. Intermediary nodes (such as OpenTelemetry Collector) that receive
    /// data from multiple origins typically batch the data before forwarding further and
    /// in that case this array will contain multiple elements.
    #[prost(message, repeated, tag = "1")]
    pub resource_logs: ::prost::alloc::vec::Vec<
        super::super::super::logs::v1::ResourceLogs,
    >,
}
#[derive(serde::Serialize, serde::Deserialize)]
#[derive(utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct ExportLogsServiceResponse {
    /// The details of a partially successful export request.
    ///
    /// If the request is only partially accepted
    /// (i.e. when the server accepts only parts of the data and rejects the rest)
    /// the server MUST initialize the `partial_success` field and MUST
    /// set the `rejected_<signal>` with the number of items it rejected.
    ///
    /// Servers MAY also make use of the `partial_success` field to convey
    /// warnings/suggestions to senders even when the request was fully accepted.
    /// In such cases, the `rejected_<signal>` MUST have a value of `0` and
    /// the `error_message` MUST be non-empty.
    ///
    /// A `partial_success` message with an empty value (`rejected_<signal>1 = 0 and  `error_message\` = "") is equivalent to it not being set/present. Senders
    /// SHOULD interpret it the same way as in the full success case.
    #[prost(message, optional, tag = "1")]
    pub partial_success: ::core::option::Option<ExportLogsPartialSuccess>,
}
#[derive(serde::Serialize, serde::Deserialize)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct ExportLogsPartialSuccess {
    /// The number of rejected log records.
    ///
    /// A `rejected_<signal>` field holding a `0` value indicates that the
    /// request was fully accepted.
    #[prost(int64, tag = "1")]
    pub rejected_log_records: i64,
    /// A developer-facing human-readable message in English. It should be used
    /// either to explain why the server rejected parts of the data during a partial
    /// success or to convey warnings/suggestions during a full success. The message
    /// should offer guidance on how users can address such issues.
    ///
    /// error_message is an optional field. An error_message with an empty value
    /// is equivalent to it not being set.
    #[prost(string, tag = "2")]
    pub error_message: ::prost::alloc::string::String,
}
/// Generated client implementations.
pub mod logs_service_client {
    #![allow(
        unused_variables,
        dead_code,
        missing_docs,
        clippy::wildcard_imports,
        clippy::let_unit_value,
    )]
    use tonic::codegen::*;
    use tonic::codegen::http::Uri;
    /// Service that can be used to push logs between one Application instrumented with
    /// OpenTelemetry and an collector, or between an collector and a central collector (in this
    /// case logs are sent/received to/from multiple Applications).
    #[derive(Debug, Clone)]
    pub struct LogsServiceClient<T> {
        inner: tonic::client::Grpc<T>,
    }
    impl LogsServiceClient<tonic::transport::Channel> {
        /// Attempt to create a new client by connecting to a given endpoint.
        pub async fn connect<D>(dst: D) -> Result<Self, tonic::transport::Error>
        where
            D: TryInto<tonic::transport::Endpoint>,
            D::Error: Into<StdError>,
        {
            let conn = tonic::transport::Endpoint::new(dst)?.connect().await?;
            Ok(Self::new(conn))
        }
    }
    impl<T> LogsServiceClient<T>
    where
        T: tonic::client::GrpcService<tonic::body::Body>,
        T::Error: Into<StdError>,
        T::ResponseBody: Body<Data = Bytes> + std::marker::Send + 'static,
        <T::ResponseBody as Body>::Error: Into<StdError> + std::marker::Send,
    {
        pub fn new(inner: T) -> Self {
            let inner = tonic::client::Grpc::new(inner);
            Self { inner }
        }
        pub fn with_origin(inner: T, origin: Uri) -> Self {
            let inner = tonic::client::Grpc::with_origin(inner, origin);
            Self { inner }
        }
        pub fn with_interceptor<F>(
            inner: T,
            interceptor: F,
        ) -> LogsServiceClient<InterceptedService<T, F>>
        where
            F: tonic::service::Interceptor,
            T::ResponseBody: Default,
            T: tonic::codegen::Service<
                http::Request<tonic::body::Body>,
                Response = http::Response<
                    <T as tonic::client::GrpcService<tonic::body::Body>>::ResponseBody,
                >,
            >,
            <T as tonic::codegen::Service<
                http::Request<tonic::body::Body>,
            >>::Error: Into<StdError> + std::marker::Send + std::marker::Sync,
        {
            LogsServiceClient::new(InterceptedService::new(inner, interceptor))
        }
        /// Compress requests with the given encoding.
        ///
        /// This requires the server to support it otherwise it might respond with an
        /// error.
        #[must_use]
        pub fn send_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.inner = self.inner.send_compressed(encoding);
            self
        }
        /// Enable decompressing responses.
        #[must_use]
        pub fn accept_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.inner = self.inner.accept_compressed(encoding);
            self
        }
        /// Limits the maximum size of a decoded message.
        ///
        /// Default: `4MB`
        #[must_use]
        pub fn max_decoding_message_size(mut self, limit: usize) -> Self {
            self.inner = self.inner.max_decoding_message_size(limit);
            self
        }
        /// Limits the maximum size of an encoded message.
        ///
        /// Default: `usize::MAX`
        #[must_use]
        pub fn max_encoding_message_size(mut self, limit: usize) -> Self {
            self.inner = self.inner.max_encoding_message_size(limit);
            self
        }
        /// For performance reasons, it is recommended to keep this RPC
        /// alive for the entire life of the application.
        pub async fn export(
            &mut self,
            request: impl tonic::IntoRequest<super::ExportLogsServiceRequest>,
        ) -> std::result::Result<
            tonic::Response<super::ExportLogsServiceResponse>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/opentelemetry.proto.collector.logs.v1.LogsService/Export",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new(
                        "opentelemetry.proto.collector.logs.v1.LogsService",
                        "Export",
                    ),
                );
            self.inner.unary(req, path, codec).await
        }
    }
}
/// Generated server implementations.
pub mod logs_service_server {
    #![allow(
        unused_variables,
        dead_code,
        missing_docs,
        clippy::wildcard_imports,
        clippy::let_unit_value,
    )]
    use tonic::codegen::*;
    /// Generated trait containing gRPC methods that should be implemented for use with LogsServiceServer.
    #[async_trait]
    pub trait LogsService: std::marker::Send + std::marker::Sync + 'static {
        /// For performance reasons, it is recommended to keep this RPC
        /// alive for the entire life of the application.
        async fn export(
            &self,
            request: tonic::Request<super::ExportLogsServiceRequest>,
        ) -> std::result::Result<
            tonic::Response<super::ExportLogsServiceResponse>,
            tonic::Status,
        >;
    }
    /// Service that can be used to push logs between one Application instrumented with
    /// OpenTelemetry and an collector, or between an collector and a central collector (in this
    /// case logs are sent/received to/from multiple Applications).
    #[derive(Debug)]
    pub struct LogsServiceServer<T> {
        inner: Arc<T>,
        accept_compression_encodings: EnabledCompressionEncodings,
        send_compression_encodings: EnabledCompressionEncodings,
        max_decoding_message_size: Option<usize>,
        max_encoding_message_size: Option<usize>,
    }
    impl<T> LogsServiceServer<T> {
        pub fn new(inner: T) -> Self {
            Self::from_arc(Arc::new(inner))
        }
        pub fn from_arc(inner: Arc<T>) -> Self {
            Self {
                inner,
                accept_compression_encodings: Default::default(),
                send_compression_encodings: Default::default(),
                max_decoding_message_size: None,
                max_encoding_message_size: None,
            }
        }
        pub fn with_interceptor<F>(
            inner: T,
            interceptor: F,
        ) -> InterceptedService<Self, F>
        where
            F: tonic::service::Interceptor,
        {
            InterceptedService::new(Self::new(inner), interceptor)
        }
        /// Enable decompressing requests with the given encoding.
        #[must_use]
        pub fn accept_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.accept_compression_encodings.enable(encoding);
            self
        }
        /// Compress responses with the given encoding, if the client supports it.
        #[must_use]
        pub fn send_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.send_compression_encodings.enable(encoding);
            self
        }
        /// Limits the maximum size of a decoded message.
        ///
        /// Default: `4MB`
        #[must_use]
        pub fn max_decoding_message_size(mut self, limit: usize) -> Self {
            self.max_decoding_message_size = Some(limit);
            self
        }
        /// Limits the maximum size of an encoded message.
        ///
        /// Default: `usize::MAX`
        #[must_use]
        pub fn max_encoding_message_size(mut self, limit: usize) -> Self {
            self.max_encoding_message_size = Some(limit);
            self
        }
    }
    impl<T, B> tonic::codegen::Service<http::Request<B>> for LogsServiceServer<T>
    where
        T: LogsService,
        B: Body + std::marker::Send + 'static,
        B::Error: Into<StdError> + std::marker::Send + 'static,
    {
        type Response = http::Response<tonic::body::Body>;
        type Error = std::convert::Infallible;
        type Future = BoxFuture<Self::Response, Self::Error>;
        fn poll_ready(
            &mut self,
            _cx: &mut Context<'_>,
        ) -> Poll<std::result::Result<(), Self::Error>> {
            Poll::Ready(Ok(()))
        }
        fn call(&mut self, req: http::Request<B>) -> Self::Future {
            match req.uri().path() {
                "/opentelemetry.proto.collector.logs.v1.LogsService/Export" => {
                    #[allow(non_camel_case_types)]
                    struct ExportSvc<T: LogsService>(pub Arc<T>);
                    impl<
                        T: LogsService,
                    > tonic::server::UnaryService<super::ExportLogsServiceRequest>
                    for ExportSvc<T> {
                        type Response = super::ExportLogsServiceResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::ExportLogsServiceRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as LogsService>::export(&inner, request).await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = ExportSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                _ => {
                    Box::pin(async move {
                        let mut response = http::Response::new(
                            tonic::body::Body::default(),
                        );
                        let headers = response.headers_mut();
                        headers
                            .insert(
                                tonic::Status::GRPC_STATUS,
                                (tonic::Code::Unimplemented as i32).into(),
                            );
                        headers
                            .insert(
                                http::header::CONTENT_TYPE,
                                tonic::metadata::GRPC_CONTENT_TYPE,
                            );
                        Ok(response)
                    })
                }
            }
        }
    }
    impl<T> Clone for LogsServiceServer<T> {
        fn clone(&self) -> Self {
            let inner = self.inner.clone();
            Self {
                inner,
                accept_compression_encodings: self.accept_compression_encodings,
                send_compression_encodings: self.send_compression_encodings,
                max_decoding_message_size: self.max_decoding_message_size,
                max_encoding_message_size: self.max_encoding_message_size,
            }
        }
    }
    /// Generated gRPC service name
    pub const SERVICE_NAME: &str = "opentelemetry.proto.collector.logs.v1.LogsService";
    impl<T> tonic::server::NamedService for LogsServiceServer<T> {
        const NAME: &'static str = SERVICE_NAME;
    }
}


================================================
FILE: quickwit/quickwit-proto/src/codegen/opentelemetry/opentelemetry.proto.collector.metrics.v1.rs
================================================
// This file is @generated by prost-build.
#[derive(serde::Serialize, serde::Deserialize)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct ExportMetricsServiceRequest {
    /// An array of ResourceMetrics.
    /// For data coming from a single resource this array will typically contain one
    /// element. Intermediary nodes (such as OpenTelemetry Collector) that receive
    /// data from multiple origins typically batch the data before forwarding further and
    /// in that case this array will contain multiple elements.
    #[prost(message, repeated, tag = "1")]
    pub resource_metrics: ::prost::alloc::vec::Vec<
        super::super::super::metrics::v1::ResourceMetrics,
    >,
}
#[derive(serde::Serialize, serde::Deserialize)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct ExportMetricsServiceResponse {
    /// The details of a partially successful export request.
    ///
    /// If the request is only partially accepted
    /// (i.e. when the server accepts only parts of the data and rejects the rest)
    /// the server MUST initialize the `partial_success` field and MUST
    /// set the `rejected_<signal>` with the number of items it rejected.
    ///
    /// Servers MAY also make use of the `partial_success` field to convey
    /// warnings/suggestions to senders even when the request was fully accepted.
    /// In such cases, the `rejected_<signal>` MUST have a value of `0` and
    /// the `error_message` MUST be non-empty.
    ///
    /// A `partial_success` message with an empty value (rejected\_<signal> = 0 and
    /// `error_message` = "") is equivalent to it not being set/present. Senders
    /// SHOULD interpret it the same way as in the full success case.
    #[prost(message, optional, tag = "1")]
    pub partial_success: ::core::option::Option<ExportMetricsPartialSuccess>,
}
#[derive(serde::Serialize, serde::Deserialize)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct ExportMetricsPartialSuccess {
    /// The number of rejected data points.
    ///
    /// A `rejected_<signal>` field holding a `0` value indicates that the
    /// request was fully accepted.
    #[prost(int64, tag = "1")]
    pub rejected_data_points: i64,
    /// A developer-facing human-readable message in English. It should be used
    /// either to explain why the server rejected parts of the data during a partial
    /// success or to convey warnings/suggestions during a full success. The message
    /// should offer guidance on how users can address such issues.
    ///
    /// error_message is an optional field. An error_message with an empty value
    /// is equivalent to it not being set.
    #[prost(string, tag = "2")]
    pub error_message: ::prost::alloc::string::String,
}
/// Generated client implementations.
pub mod metrics_service_client {
    #![allow(
        unused_variables,
        dead_code,
        missing_docs,
        clippy::wildcard_imports,
        clippy::let_unit_value,
    )]
    use tonic::codegen::*;
    use tonic::codegen::http::Uri;
    /// Service that can be used to push metrics between one Application
    /// instrumented with OpenTelemetry and a collector, or between a collector and a
    /// central collector.
    #[derive(Debug, Clone)]
    pub struct MetricsServiceClient<T> {
        inner: tonic::client::Grpc<T>,
    }
    impl MetricsServiceClient<tonic::transport::Channel> {
        /// Attempt to create a new client by connecting to a given endpoint.
        pub async fn connect<D>(dst: D) -> Result<Self, tonic::transport::Error>
        where
            D: TryInto<tonic::transport::Endpoint>,
            D::Error: Into<StdError>,
        {
            let conn = tonic::transport::Endpoint::new(dst)?.connect().await?;
            Ok(Self::new(conn))
        }
    }
    impl<T> MetricsServiceClient<T>
    where
        T: tonic::client::GrpcService<tonic::body::Body>,
        T::Error: Into<StdError>,
        T::ResponseBody: Body<Data = Bytes> + std::marker::Send + 'static,
        <T::ResponseBody as Body>::Error: Into<StdError> + std::marker::Send,
    {
        pub fn new(inner: T) -> Self {
            let inner = tonic::client::Grpc::new(inner);
            Self { inner }
        }
        pub fn with_origin(inner: T, origin: Uri) -> Self {
            let inner = tonic::client::Grpc::with_origin(inner, origin);
            Self { inner }
        }
        pub fn with_interceptor<F>(
            inner: T,
            interceptor: F,
        ) -> MetricsServiceClient<InterceptedService<T, F>>
        where
            F: tonic::service::Interceptor,
            T::ResponseBody: Default,
            T: tonic::codegen::Service<
                http::Request<tonic::body::Body>,
                Response = http::Response<
                    <T as tonic::client::GrpcService<tonic::body::Body>>::ResponseBody,
                >,
            >,
            <T as tonic::codegen::Service<
                http::Request<tonic::body::Body>,
            >>::Error: Into<StdError> + std::marker::Send + std::marker::Sync,
        {
            MetricsServiceClient::new(InterceptedService::new(inner, interceptor))
        }
        /// Compress requests with the given encoding.
        ///
        /// This requires the server to support it otherwise it might respond with an
        /// error.
        #[must_use]
        pub fn send_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.inner = self.inner.send_compressed(encoding);
            self
        }
        /// Enable decompressing responses.
        #[must_use]
        pub fn accept_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.inner = self.inner.accept_compressed(encoding);
            self
        }
        /// Limits the maximum size of a decoded message.
        ///
        /// Default: `4MB`
        #[must_use]
        pub fn max_decoding_message_size(mut self, limit: usize) -> Self {
            self.inner = self.inner.max_decoding_message_size(limit);
            self
        }
        /// Limits the maximum size of an encoded message.
        ///
        /// Default: `usize::MAX`
        #[must_use]
        pub fn max_encoding_message_size(mut self, limit: usize) -> Self {
            self.inner = self.inner.max_encoding_message_size(limit);
            self
        }
        /// For performance reasons, it is recommended to keep this RPC
        /// alive for the entire life of the application.
        pub async fn export(
            &mut self,
            request: impl tonic::IntoRequest<super::ExportMetricsServiceRequest>,
        ) -> std::result::Result<
            tonic::Response<super::ExportMetricsServiceResponse>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/opentelemetry.proto.collector.metrics.v1.MetricsService/Export",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new(
                        "opentelemetry.proto.collector.metrics.v1.MetricsService",
                        "Export",
                    ),
                );
            self.inner.unary(req, path, codec).await
        }
    }
}
/// Generated server implementations.
pub mod metrics_service_server {
    #![allow(
        unused_variables,
        dead_code,
        missing_docs,
        clippy::wildcard_imports,
        clippy::let_unit_value,
    )]
    use tonic::codegen::*;
    /// Generated trait containing gRPC methods that should be implemented for use with MetricsServiceServer.
    #[async_trait]
    pub trait MetricsService: std::marker::Send + std::marker::Sync + 'static {
        /// For performance reasons, it is recommended to keep this RPC
        /// alive for the entire life of the application.
        async fn export(
            &self,
            request: tonic::Request<super::ExportMetricsServiceRequest>,
        ) -> std::result::Result<
            tonic::Response<super::ExportMetricsServiceResponse>,
            tonic::Status,
        >;
    }
    /// Service that can be used to push metrics between one Application
    /// instrumented with OpenTelemetry and a collector, or between a collector and a
    /// central collector.
    #[derive(Debug)]
    pub struct MetricsServiceServer<T> {
        inner: Arc<T>,
        accept_compression_encodings: EnabledCompressionEncodings,
        send_compression_encodings: EnabledCompressionEncodings,
        max_decoding_message_size: Option<usize>,
        max_encoding_message_size: Option<usize>,
    }
    impl<T> MetricsServiceServer<T> {
        pub fn new(inner: T) -> Self {
            Self::from_arc(Arc::new(inner))
        }
        pub fn from_arc(inner: Arc<T>) -> Self {
            Self {
                inner,
                accept_compression_encodings: Default::default(),
                send_compression_encodings: Default::default(),
                max_decoding_message_size: None,
                max_encoding_message_size: None,
            }
        }
        pub fn with_interceptor<F>(
            inner: T,
            interceptor: F,
        ) -> InterceptedService<Self, F>
        where
            F: tonic::service::Interceptor,
        {
            InterceptedService::new(Self::new(inner), interceptor)
        }
        /// Enable decompressing requests with the given encoding.
        #[must_use]
        pub fn accept_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.accept_compression_encodings.enable(encoding);
            self
        }
        /// Compress responses with the given encoding, if the client supports it.
        #[must_use]
        pub fn send_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.send_compression_encodings.enable(encoding);
            self
        }
        /// Limits the maximum size of a decoded message.
        ///
        /// Default: `4MB`
        #[must_use]
        pub fn max_decoding_message_size(mut self, limit: usize) -> Self {
            self.max_decoding_message_size = Some(limit);
            self
        }
        /// Limits the maximum size of an encoded message.
        ///
        /// Default: `usize::MAX`
        #[must_use]
        pub fn max_encoding_message_size(mut self, limit: usize) -> Self {
            self.max_encoding_message_size = Some(limit);
            self
        }
    }
    impl<T, B> tonic::codegen::Service<http::Request<B>> for MetricsServiceServer<T>
    where
        T: MetricsService,
        B: Body + std::marker::Send + 'static,
        B::Error: Into<StdError> + std::marker::Send + 'static,
    {
        type Response = http::Response<tonic::body::Body>;
        type Error = std::convert::Infallible;
        type Future = BoxFuture<Self::Response, Self::Error>;
        fn poll_ready(
            &mut self,
            _cx: &mut Context<'_>,
        ) -> Poll<std::result::Result<(), Self::Error>> {
            Poll::Ready(Ok(()))
        }
        fn call(&mut self, req: http::Request<B>) -> Self::Future {
            match req.uri().path() {
                "/opentelemetry.proto.collector.metrics.v1.MetricsService/Export" => {
                    #[allow(non_camel_case_types)]
                    struct ExportSvc<T: MetricsService>(pub Arc<T>);
                    impl<
                        T: MetricsService,
                    > tonic::server::UnaryService<super::ExportMetricsServiceRequest>
                    for ExportSvc<T> {
                        type Response = super::ExportMetricsServiceResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::ExportMetricsServiceRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as MetricsService>::export(&inner, request).await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = ExportSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                _ => {
                    Box::pin(async move {
                        let mut response = http::Response::new(
                            tonic::body::Body::default(),
                        );
                        let headers = response.headers_mut();
                        headers
                            .insert(
                                tonic::Status::GRPC_STATUS,
                                (tonic::Code::Unimplemented as i32).into(),
                            );
                        headers
                            .insert(
                                http::header::CONTENT_TYPE,
                                tonic::metadata::GRPC_CONTENT_TYPE,
                            );
                        Ok(response)
                    })
                }
            }
        }
    }
    impl<T> Clone for MetricsServiceServer<T> {
        fn clone(&self) -> Self {
            let inner = self.inner.clone();
            Self {
                inner,
                accept_compression_encodings: self.accept_compression_encodings,
                send_compression_encodings: self.send_compression_encodings,
                max_decoding_message_size: self.max_decoding_message_size,
                max_encoding_message_size: self.max_encoding_message_size,
            }
        }
    }
    /// Generated gRPC service name
    pub const SERVICE_NAME: &str = "opentelemetry.proto.collector.metrics.v1.MetricsService";
    impl<T> tonic::server::NamedService for MetricsServiceServer<T> {
        const NAME: &'static str = SERVICE_NAME;
    }
}


================================================
FILE: quickwit/quickwit-proto/src/codegen/opentelemetry/opentelemetry.proto.collector.trace.v1.rs
================================================
// This file is @generated by prost-build.
#[derive(serde::Serialize, serde::Deserialize)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct ExportTraceServiceRequest {
    /// An array of ResourceSpans.
    /// For data coming from a single resource this array will typically contain one
    /// element. Intermediary nodes (such as OpenTelemetry Collector) that receive
    /// data from multiple origins typically batch the data before forwarding further and
    /// in that case this array will contain multiple elements.
    #[prost(message, repeated, tag = "1")]
    pub resource_spans: ::prost::alloc::vec::Vec<
        super::super::super::trace::v1::ResourceSpans,
    >,
}
#[derive(serde::Serialize, serde::Deserialize)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct ExportTraceServiceResponse {
    /// The details of a partially successful export request.
    ///
    /// If the request is only partially accepted
    /// (i.e. when the server accepts only parts of the data and rejects the rest)
    /// the server MUST initialize the `partial_success` field and MUST
    /// set the `rejected_<signal>` with the number of items it rejected.
    ///
    /// Servers MAY also make use of the `partial_success` field to convey
    /// warnings/suggestions to senders even when the request was fully accepted.
    /// In such cases, the `rejected_<signal>` MUST have a value of `0` and
    /// the `error_message` MUST be non-empty.
    ///
    /// A `partial_success` message with an empty value (rejected\_<signal> = 0 and
    /// `error_message` = "") is equivalent to it not being set/present. Senders
    /// SHOULD interpret it the same way as in the full success case.
    #[prost(message, optional, tag = "1")]
    pub partial_success: ::core::option::Option<ExportTracePartialSuccess>,
}
#[derive(serde::Serialize, serde::Deserialize)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct ExportTracePartialSuccess {
    /// The number of rejected spans.
    ///
    /// A `rejected_<signal>` field holding a `0` value indicates that the
    /// request was fully accepted.
    #[prost(int64, tag = "1")]
    pub rejected_spans: i64,
    /// A developer-facing human-readable message in English. It should be used
    /// either to explain why the server rejected parts of the data during a partial
    /// success or to convey warnings/suggestions during a full success. The message
    /// should offer guidance on how users can address such issues.
    ///
    /// error_message is an optional field. An error_message with an empty value
    /// is equivalent to it not being set.
    #[prost(string, tag = "2")]
    pub error_message: ::prost::alloc::string::String,
}
/// Generated client implementations.
pub mod trace_service_client {
    #![allow(
        unused_variables,
        dead_code,
        missing_docs,
        clippy::wildcard_imports,
        clippy::let_unit_value,
    )]
    use tonic::codegen::*;
    use tonic::codegen::http::Uri;
    /// Service that can be used to push spans between one Application instrumented with
    /// OpenTelemetry and a collector, or between a collector and a central collector (in this
    /// case spans are sent/received to/from multiple Applications).
    #[derive(Debug, Clone)]
    pub struct TraceServiceClient<T> {
        inner: tonic::client::Grpc<T>,
    }
    impl TraceServiceClient<tonic::transport::Channel> {
        /// Attempt to create a new client by connecting to a given endpoint.
        pub async fn connect<D>(dst: D) -> Result<Self, tonic::transport::Error>
        where
            D: TryInto<tonic::transport::Endpoint>,
            D::Error: Into<StdError>,
        {
            let conn = tonic::transport::Endpoint::new(dst)?.connect().await?;
            Ok(Self::new(conn))
        }
    }
    impl<T> TraceServiceClient<T>
    where
        T: tonic::client::GrpcService<tonic::body::Body>,
        T::Error: Into<StdError>,
        T::ResponseBody: Body<Data = Bytes> + std::marker::Send + 'static,
        <T::ResponseBody as Body>::Error: Into<StdError> + std::marker::Send,
    {
        pub fn new(inner: T) -> Self {
            let inner = tonic::client::Grpc::new(inner);
            Self { inner }
        }
        pub fn with_origin(inner: T, origin: Uri) -> Self {
            let inner = tonic::client::Grpc::with_origin(inner, origin);
            Self { inner }
        }
        pub fn with_interceptor<F>(
            inner: T,
            interceptor: F,
        ) -> TraceServiceClient<InterceptedService<T, F>>
        where
            F: tonic::service::Interceptor,
            T::ResponseBody: Default,
            T: tonic::codegen::Service<
                http::Request<tonic::body::Body>,
                Response = http::Response<
                    <T as tonic::client::GrpcService<tonic::body::Body>>::ResponseBody,
                >,
            >,
            <T as tonic::codegen::Service<
                http::Request<tonic::body::Body>,
            >>::Error: Into<StdError> + std::marker::Send + std::marker::Sync,
        {
            TraceServiceClient::new(InterceptedService::new(inner, interceptor))
        }
        /// Compress requests with the given encoding.
        ///
        /// This requires the server to support it otherwise it might respond with an
        /// error.
        #[must_use]
        pub fn send_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.inner = self.inner.send_compressed(encoding);
            self
        }
        /// Enable decompressing responses.
        #[must_use]
        pub fn accept_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.inner = self.inner.accept_compressed(encoding);
            self
        }
        /// Limits the maximum size of a decoded message.
        ///
        /// Default: `4MB`
        #[must_use]
        pub fn max_decoding_message_size(mut self, limit: usize) -> Self {
            self.inner = self.inner.max_decoding_message_size(limit);
            self
        }
        /// Limits the maximum size of an encoded message.
        ///
        /// Default: `usize::MAX`
        #[must_use]
        pub fn max_encoding_message_size(mut self, limit: usize) -> Self {
            self.inner = self.inner.max_encoding_message_size(limit);
            self
        }
        /// For performance reasons, it is recommended to keep this RPC
        /// alive for the entire life of the application.
        pub async fn export(
            &mut self,
            request: impl tonic::IntoRequest<super::ExportTraceServiceRequest>,
        ) -> std::result::Result<
            tonic::Response<super::ExportTraceServiceResponse>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/opentelemetry.proto.collector.trace.v1.TraceService/Export",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new(
                        "opentelemetry.proto.collector.trace.v1.TraceService",
                        "Export",
                    ),
                );
            self.inner.unary(req, path, codec).await
        }
    }
}
/// Generated server implementations.
pub mod trace_service_server {
    #![allow(
        unused_variables,
        dead_code,
        missing_docs,
        clippy::wildcard_imports,
        clippy::let_unit_value,
    )]
    use tonic::codegen::*;
    /// Generated trait containing gRPC methods that should be implemented for use with TraceServiceServer.
    #[async_trait]
    pub trait TraceService: std::marker::Send + std::marker::Sync + 'static {
        /// For performance reasons, it is recommended to keep this RPC
        /// alive for the entire life of the application.
        async fn export(
            &self,
            request: tonic::Request<super::ExportTraceServiceRequest>,
        ) -> std::result::Result<
            tonic::Response<super::ExportTraceServiceResponse>,
            tonic::Status,
        >;
    }
    /// Service that can be used to push spans between one Application instrumented with
    /// OpenTelemetry and a collector, or between a collector and a central collector (in this
    /// case spans are sent/received to/from multiple Applications).
    #[derive(Debug)]
    pub struct TraceServiceServer<T> {
        inner: Arc<T>,
        accept_compression_encodings: EnabledCompressionEncodings,
        send_compression_encodings: EnabledCompressionEncodings,
        max_decoding_message_size: Option<usize>,
        max_encoding_message_size: Option<usize>,
    }
    impl<T> TraceServiceServer<T> {
        pub fn new(inner: T) -> Self {
            Self::from_arc(Arc::new(inner))
        }
        pub fn from_arc(inner: Arc<T>) -> Self {
            Self {
                inner,
                accept_compression_encodings: Default::default(),
                send_compression_encodings: Default::default(),
                max_decoding_message_size: None,
                max_encoding_message_size: None,
            }
        }
        pub fn with_interceptor<F>(
            inner: T,
            interceptor: F,
        ) -> InterceptedService<Self, F>
        where
            F: tonic::service::Interceptor,
        {
            InterceptedService::new(Self::new(inner), interceptor)
        }
        /// Enable decompressing requests with the given encoding.
        #[must_use]
        pub fn accept_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.accept_compression_encodings.enable(encoding);
            self
        }
        /// Compress responses with the given encoding, if the client supports it.
        #[must_use]
        pub fn send_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.send_compression_encodings.enable(encoding);
            self
        }
        /// Limits the maximum size of a decoded message.
        ///
        /// Default: `4MB`
        #[must_use]
        pub fn max_decoding_message_size(mut self, limit: usize) -> Self {
            self.max_decoding_message_size = Some(limit);
            self
        }
        /// Limits the maximum size of an encoded message.
        ///
        /// Default: `usize::MAX`
        #[must_use]
        pub fn max_encoding_message_size(mut self, limit: usize) -> Self {
            self.max_encoding_message_size = Some(limit);
            self
        }
    }
    impl<T, B> tonic::codegen::Service<http::Request<B>> for TraceServiceServer<T>
    where
        T: TraceService,
        B: Body + std::marker::Send + 'static,
        B::Error: Into<StdError> + std::marker::Send + 'static,
    {
        type Response = http::Response<tonic::body::Body>;
        type Error = std::convert::Infallible;
        type Future = BoxFuture<Self::Response, Self::Error>;
        fn poll_ready(
            &mut self,
            _cx: &mut Context<'_>,
        ) -> Poll<std::result::Result<(), Self::Error>> {
            Poll::Ready(Ok(()))
        }
        fn call(&mut self, req: http::Request<B>) -> Self::Future {
            match req.uri().path() {
                "/opentelemetry.proto.collector.trace.v1.TraceService/Export" => {
                    #[allow(non_camel_case_types)]
                    struct ExportSvc<T: TraceService>(pub Arc<T>);
                    impl<
                        T: TraceService,
                    > tonic::server::UnaryService<super::ExportTraceServiceRequest>
                    for ExportSvc<T> {
                        type Response = super::ExportTraceServiceResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::ExportTraceServiceRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as TraceService>::export(&inner, request).await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = ExportSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                _ => {
                    Box::pin(async move {
                        let mut response = http::Response::new(
                            tonic::body::Body::default(),
                        );
                        let headers = response.headers_mut();
                        headers
                            .insert(
                                tonic::Status::GRPC_STATUS,
                                (tonic::Code::Unimplemented as i32).into(),
                            );
                        headers
                            .insert(
                                http::header::CONTENT_TYPE,
                                tonic::metadata::GRPC_CONTENT_TYPE,
                            );
                        Ok(response)
                    })
                }
            }
        }
    }
    impl<T> Clone for TraceServiceServer<T> {
        fn clone(&self) -> Self {
            let inner = self.inner.clone();
            Self {
                inner,
                accept_compression_encodings: self.accept_compression_encodings,
                send_compression_encodings: self.send_compression_encodings,
                max_decoding_message_size: self.max_decoding_message_size,
                max_encoding_message_size: self.max_encoding_message_size,
            }
        }
    }
    /// Generated gRPC service name
    pub const SERVICE_NAME: &str = "opentelemetry.proto.collector.trace.v1.TraceService";
    impl<T> tonic::server::NamedService for TraceServiceServer<T> {
        const NAME: &'static str = SERVICE_NAME;
    }
}


================================================
FILE: quickwit/quickwit-proto/src/codegen/opentelemetry/opentelemetry.proto.common.v1.rs
================================================
// This file is @generated by prost-build.
/// AnyValue is used to represent any type of attribute value. AnyValue may contain a
/// primitive value such as a string or integer or it may contain an arbitrary nested
/// object containing arrays, key-value lists and primitives.
#[derive(serde::Serialize, serde::Deserialize)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct AnyValue {
    /// The value is one of the listed fields. It is valid for all values to be unspecified
    /// in which case this AnyValue is considered to be "empty".
    #[prost(oneof = "any_value::Value", tags = "1, 2, 3, 4, 5, 6, 7")]
    pub value: ::core::option::Option<any_value::Value>,
}
/// Nested message and enum types in `AnyValue`.
pub mod any_value {
    /// The value is one of the listed fields. It is valid for all values to be unspecified
    /// in which case this AnyValue is considered to be "empty".
    #[derive(serde::Serialize, serde::Deserialize)]
    #[derive(Clone, PartialEq, ::prost::Oneof)]
    pub enum Value {
        #[prost(string, tag = "1")]
        StringValue(::prost::alloc::string::String),
        #[prost(bool, tag = "2")]
        BoolValue(bool),
        #[prost(int64, tag = "3")]
        IntValue(i64),
        #[prost(double, tag = "4")]
        DoubleValue(f64),
        #[prost(message, tag = "5")]
        ArrayValue(super::ArrayValue),
        #[prost(message, tag = "6")]
        KvlistValue(super::KeyValueList),
        #[prost(bytes, tag = "7")]
        BytesValue(::prost::alloc::vec::Vec<u8>),
    }
}
/// ArrayValue is a list of AnyValue messages. We need ArrayValue as a message
/// since oneof in AnyValue does not allow repeated fields.
#[derive(serde::Serialize, serde::Deserialize)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct ArrayValue {
    /// Array of values. The array may be empty (contain 0 elements).
    #[prost(message, repeated, tag = "1")]
    pub values: ::prost::alloc::vec::Vec<AnyValue>,
}
/// KeyValueList is a list of KeyValue messages. We need KeyValueList as a message
/// since `oneof` in AnyValue does not allow repeated fields. Everywhere else where we need
/// a list of KeyValue messages (e.g. in Span) we use `repeated KeyValue` directly to
/// avoid unnecessary extra wrapping (which slows down the protocol). The 2 approaches
/// are semantically equivalent.
#[derive(serde::Serialize, serde::Deserialize)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct KeyValueList {
    /// A collection of key/value pairs of key-value pairs. The list may be empty (may
    /// contain 0 elements).
    /// The keys MUST be unique (it is not allowed to have more than one
    /// value with the same key).
    #[prost(message, repeated, tag = "1")]
    pub values: ::prost::alloc::vec::Vec<KeyValue>,
}
/// KeyValue is a key-value pair that is used to store Span attributes, Link
/// attributes, etc.
#[derive(serde::Serialize, serde::Deserialize)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct KeyValue {
    #[prost(string, tag = "1")]
    pub key: ::prost::alloc::string::String,
    #[prost(message, optional, tag = "2")]
    pub value: ::core::option::Option<AnyValue>,
}
/// InstrumentationScope is a message representing the instrumentation scope information
/// such as the fully qualified name and version.
#[derive(serde::Serialize, serde::Deserialize)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct InstrumentationScope {
    /// An empty instrumentation scope name means the name is unknown.
    #[prost(string, tag = "1")]
    pub name: ::prost::alloc::string::String,
    #[prost(string, tag = "2")]
    pub version: ::prost::alloc::string::String,
    #[prost(message, repeated, tag = "3")]
    pub attributes: ::prost::alloc::vec::Vec<KeyValue>,
    #[prost(uint32, tag = "4")]
    pub dropped_attributes_count: u32,
}


================================================
FILE: quickwit/quickwit-proto/src/codegen/opentelemetry/opentelemetry.proto.logs.v1.rs
================================================
// This file is @generated by prost-build.
/// LogsData represents the logs data that can be stored in a persistent storage,
/// OR can be embedded by other protocols that transfer OTLP logs data but do not
/// implement the OTLP protocol.
///
/// The main difference between this message and collector protocol is that
/// in this message there will not be any "control" or "metadata" specific to
/// OTLP protocol.
///
/// When new fields are added into this message, the OTLP request MUST be updated
/// as well.
#[derive(serde::Serialize, serde::Deserialize)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct LogsData {
    /// An array of ResourceLogs.
    /// For data coming from a single resource this array will typically contain
    /// one element. Intermediary nodes that receive data from multiple origins
    /// typically batch the data before forwarding further and in that case this
    /// array will contain multiple elements.
    #[prost(message, repeated, tag = "1")]
    pub resource_logs: ::prost::alloc::vec::Vec<ResourceLogs>,
}
/// A collection of ScopeLogs from a Resource.
#[derive(serde::Serialize, serde::Deserialize)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct ResourceLogs {
    /// The resource for the logs in this message.
    /// If this field is not set then resource info is unknown.
    #[prost(message, optional, tag = "1")]
    pub resource: ::core::option::Option<super::super::resource::v1::Resource>,
    /// A list of ScopeLogs that originate from a resource.
    #[prost(message, repeated, tag = "2")]
    pub scope_logs: ::prost::alloc::vec::Vec<ScopeLogs>,
    /// This schema_url applies to the data in the "resource" field. It does not apply
    /// to the data in the "scope_logs" field which have their own schema_url field.
    #[prost(string, tag = "3")]
    pub schema_url: ::prost::alloc::string::String,
}
/// A collection of Logs produced by a Scope.
#[derive(serde::Serialize, serde::Deserialize)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct ScopeLogs {
    /// The instrumentation scope information for the logs in this message.
    /// Semantically when InstrumentationScope isn't set, it is equivalent with
    /// an empty instrumentation scope name (unknown).
    #[prost(message, optional, tag = "1")]
    pub scope: ::core::option::Option<super::super::common::v1::InstrumentationScope>,
    /// A list of log records.
    #[prost(message, repeated, tag = "2")]
    pub log_records: ::prost::alloc::vec::Vec<LogRecord>,
    /// This schema_url applies to all logs in the "logs" field.
    #[prost(string, tag = "3")]
    pub schema_url: ::prost::alloc::string::String,
}
/// A log record according to OpenTelemetry Log Data Model:
/// <https://github.com/open-telemetry/oteps/blob/main/text/logs/0097-log-data-model.md>
#[derive(serde::Serialize, serde::Deserialize)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct LogRecord {
    /// time_unix_nano is the time when the event occurred.
    /// Value is UNIX Epoch time in nanoseconds since 00:00:00 UTC on 1 January 1970.
    /// Value of 0 indicates unknown or missing timestamp.
    #[prost(fixed64, tag = "1")]
    pub time_unix_nano: u64,
    /// Time when the event was observed by the collection system.
    /// For events that originate in OpenTelemetry (e.g. using OpenTelemetry Logging SDK)
    /// this timestamp is typically set at the generation time and is equal to Timestamp.
    /// For events originating externally and collected by OpenTelemetry (e.g. using
    /// Collector) this is the time when OpenTelemetry's code observed the event measured
    /// by the clock of the OpenTelemetry code. This field MUST be set once the event is
    /// observed by OpenTelemetry.
    ///
    /// For converting OpenTelemetry log data to formats that support only one timestamp or
    /// when receiving OpenTelemetry log data by recipients that support only one timestamp
    /// internally the following logic is recommended:
    ///
    /// * Use time_unix_nano if it is present, otherwise use observed_time_unix_nano.
    ///
    /// Value is UNIX Epoch time in nanoseconds since 00:00:00 UTC on 1 January 1970.
    /// Value of 0 indicates unknown or missing timestamp.
    #[prost(fixed64, tag = "11")]
    pub observed_time_unix_nano: u64,
    /// Numerical value of the severity, normalized to values described in Log Data Model.
    /// \[Optional\].
    #[prost(enumeration = "SeverityNumber", tag = "2")]
    pub severity_number: i32,
    /// The severity text (also known as log level). The original string representation as
    /// it is known at the source. \[Optional\].
    #[prost(string, tag = "3")]
    pub severity_text: ::prost::alloc::string::String,
    /// A value containing the body of the log record. Can be for example a human-readable
    /// string message (including multi-line) describing the event in a free form or it can
    /// be a structured data composed of arrays and maps of other values. \[Optional\].
    #[prost(message, optional, tag = "5")]
    pub body: ::core::option::Option<super::super::common::v1::AnyValue>,
    /// Additional attributes that describe the specific event occurrence. \[Optional\].
    /// Attribute keys MUST be unique (it is not allowed to have more than one
    /// attribute with the same key).
    #[prost(message, repeated, tag = "6")]
    pub attributes: ::prost::alloc::vec::Vec<super::super::common::v1::KeyValue>,
    #[prost(uint32, tag = "7")]
    pub dropped_attributes_count: u32,
    /// Flags, a bit field. 8 least significant bits are the trace flags as
    /// defined in W3C Trace Context specification. 24 most significant bits are reserved
    /// and must be set to 0. Readers must not assume that 24 most significant bits
    /// will be zero and must correctly mask the bits when reading 8-bit trace flag (use
    /// flags & TRACE_FLAGS_MASK). \[Optional\].
    #[prost(fixed32, tag = "8")]
    pub flags: u32,
    /// A unique identifier for a trace. All logs from the same trace share
    /// the same `trace_id`. The ID is a 16-byte array. An ID with all zeroes
    /// is considered invalid. Can be set for logs that are part of request processing
    /// and have an assigned trace id. \[Optional\].
    #[prost(bytes = "vec", tag = "9")]
    pub trace_id: ::prost::alloc::vec::Vec<u8>,
    /// A unique identifier for a span within a trace, assigned when the span
    /// is created. The ID is an 8-byte array. An ID with all zeroes is considered
    /// invalid. Can be set for logs that are part of a particular processing span.
    /// If span_id is present trace_id SHOULD be also present. \[Optional\].
    #[prost(bytes = "vec", tag = "10")]
    pub span_id: ::prost::alloc::vec::Vec<u8>,
}
/// Possible values for LogRecord.SeverityNumber.
#[derive(serde::Serialize, serde::Deserialize)]
#[derive(Clone, Copy, Debug, PartialEq, Eq, Hash, PartialOrd, Ord, ::prost::Enumeration)]
#[repr(i32)]
pub enum SeverityNumber {
    /// UNSPECIFIED is the default SeverityNumber, it MUST NOT be used.
    Unspecified = 0,
    Trace = 1,
    Trace2 = 2,
    Trace3 = 3,
    Trace4 = 4,
    Debug = 5,
    Debug2 = 6,
    Debug3 = 7,
    Debug4 = 8,
    Info = 9,
    Info2 = 10,
    Info3 = 11,
    Info4 = 12,
    Warn = 13,
    Warn2 = 14,
    Warn3 = 15,
    Warn4 = 16,
    Error = 17,
    Error2 = 18,
    Error3 = 19,
    Error4 = 20,
    Fatal = 21,
    Fatal2 = 22,
    Fatal3 = 23,
    Fatal4 = 24,
}
impl SeverityNumber {
    /// String value of the enum field names used in the ProtoBuf definition.
    ///
    /// The values are not transformed in any way and thus are considered stable
    /// (if the ProtoBuf definition does not change) and safe for programmatic use.
    pub fn as_str_name(&self) -> &'static str {
        match self {
            Self::Unspecified => "SEVERITY_NUMBER_UNSPECIFIED",
            Self::Trace => "SEVERITY_NUMBER_TRACE",
            Self::Trace2 => "SEVERITY_NUMBER_TRACE2",
            Self::Trace3 => "SEVERITY_NUMBER_TRACE3",
            Self::Trace4 => "SEVERITY_NUMBER_TRACE4",
            Self::Debug => "SEVERITY_NUMBER_DEBUG",
            Self::Debug2 => "SEVERITY_NUMBER_DEBUG2",
            Self::Debug3 => "SEVERITY_NUMBER_DEBUG3",
            Self::Debug4 => "SEVERITY_NUMBER_DEBUG4",
            Self::Info => "SEVERITY_NUMBER_INFO",
            Self::Info2 => "SEVERITY_NUMBER_INFO2",
            Self::Info3 => "SEVERITY_NUMBER_INFO3",
            Self::Info4 => "SEVERITY_NUMBER_INFO4",
            Self::Warn => "SEVERITY_NUMBER_WARN",
            Self::Warn2 => "SEVERITY_NUMBER_WARN2",
            Self::Warn3 => "SEVERITY_NUMBER_WARN3",
            Self::Warn4 => "SEVERITY_NUMBER_WARN4",
            Self::Error => "SEVERITY_NUMBER_ERROR",
            Self::Error2 => "SEVERITY_NUMBER_ERROR2",
            Self::Error3 => "SEVERITY_NUMBER_ERROR3",
            Self::Error4 => "SEVERITY_NUMBER_ERROR4",
            Self::Fatal => "SEVERITY_NUMBER_FATAL",
            Self::Fatal2 => "SEVERITY_NUMBER_FATAL2",
            Self::Fatal3 => "SEVERITY_NUMBER_FATAL3",
            Self::Fatal4 => "SEVERITY_NUMBER_FATAL4",
        }
    }
    /// Creates an enum from field names used in the ProtoBuf definition.
    pub fn from_str_name(value: &str) -> ::core::option::Option<Self> {
        match value {
            "SEVERITY_NUMBER_UNSPECIFIED" => Some(Self::Unspecified),
            "SEVERITY_NUMBER_TRACE" => Some(Self::Trace),
            "SEVERITY_NUMBER_TRACE2" => Some(Self::Trace2),
            "SEVERITY_NUMBER_TRACE3" => Some(Self::Trace3),
            "SEVERITY_NUMBER_TRACE4" => Some(Self::Trace4),
            "SEVERITY_NUMBER_DEBUG" => Some(Self::Debug),
            "SEVERITY_NUMBER_DEBUG2" => Some(Self::Debug2),
            "SEVERITY_NUMBER_DEBUG3" => Some(Self::Debug3),
            "SEVERITY_NUMBER_DEBUG4" => Some(Self::Debug4),
            "SEVERITY_NUMBER_INFO" => Some(Self::Info),
            "SEVERITY_NUMBER_INFO2" => Some(Self::Info2),
            "SEVERITY_NUMBER_INFO3" => Some(Self::Info3),
            "SEVERITY_NUMBER_INFO4" => Some(Self::Info4),
            "SEVERITY_NUMBER_WARN" => Some(Self::Warn),
            "SEVERITY_NUMBER_WARN2" => Some(Self::Warn2),
            "SEVERITY_NUMBER_WARN3" => Some(Self::Warn3),
            "SEVERITY_NUMBER_WARN4" => Some(Self::Warn4),
            "SEVERITY_NUMBER_ERROR" => Some(Self::Error),
            "SEVERITY_NUMBER_ERROR2" => Some(Self::Error2),
            "SEVERITY_NUMBER_ERROR3" => Some(Self::Error3),
            "SEVERITY_NUMBER_ERROR4" => Some(Self::Error4),
            "SEVERITY_NUMBER_FATAL" => Some(Self::Fatal),
            "SEVERITY_NUMBER_FATAL2" => Some(Self::Fatal2),
            "SEVERITY_NUMBER_FATAL3" => Some(Self::Fatal3),
            "SEVERITY_NUMBER_FATAL4" => Some(Self::Fatal4),
            _ => None,
        }
    }
}
/// Masks for LogRecord.flags field.
#[derive(serde::Serialize, serde::Deserialize)]
#[derive(Clone, Copy, Debug, PartialEq, Eq, Hash, PartialOrd, Ord, ::prost::Enumeration)]
#[repr(i32)]
pub enum LogRecordFlags {
    LogRecordFlagUnspecified = 0,
    LogRecordFlagTraceFlagsMask = 255,
}
impl LogRecordFlags {
    /// String value of the enum field names used in the ProtoBuf definition.
    ///
    /// The values are not transformed in any way and thus are considered stable
    /// (if the ProtoBuf definition does not change) and safe for programmatic use.
    pub fn as_str_name(&self) -> &'static str {
        match self {
            Self::LogRecordFlagUnspecified => "LOG_RECORD_FLAG_UNSPECIFIED",
            Self::LogRecordFlagTraceFlagsMask => "LOG_RECORD_FLAG_TRACE_FLAGS_MASK",
        }
    }
    /// Creates an enum from field names used in the ProtoBuf definition.
    pub fn from_str_name(value: &str) -> ::core::option::Option<Self> {
        match value {
            "LOG_RECORD_FLAG_UNSPECIFIED" => Some(Self::LogRecordFlagUnspecified),
            "LOG_RECORD_FLAG_TRACE_FLAGS_MASK" => Some(Self::LogRecordFlagTraceFlagsMask),
            _ => None,
        }
    }
}


================================================
FILE: quickwit/quickwit-proto/src/codegen/opentelemetry/opentelemetry.proto.metrics.v1.rs
================================================
// This file is @generated by prost-build.
/// MetricsData represents the metrics data that can be stored in a persistent
/// storage, OR can be embedded by other protocols that transfer OTLP metrics
/// data but do not implement the OTLP protocol.
///
/// The main difference between this message and collector protocol is that
/// in this message there will not be any "control" or "metadata" specific to
/// OTLP protocol.
///
/// When new fields are added into this message, the OTLP request MUST be updated
/// as well.
#[derive(serde::Serialize, serde::Deserialize)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct MetricsData {
    /// An array of ResourceMetrics.
    /// For data coming from a single resource this array will typically contain
    /// one element. Intermediary nodes that receive data from multiple origins
    /// typically batch the data before forwarding further and in that case this
    /// array will contain multiple elements.
    #[prost(message, repeated, tag = "1")]
    pub resource_metrics: ::prost::alloc::vec::Vec<ResourceMetrics>,
}
/// A collection of ScopeMetrics from a Resource.
#[derive(serde::Serialize, serde::Deserialize)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct ResourceMetrics {
    /// The resource for the metrics in this message.
    /// If this field is not set then no resource info is known.
    #[prost(message, optional, tag = "1")]
    pub resource: ::core::option::Option<super::super::resource::v1::Resource>,
    /// A list of metrics that originate from a resource.
    #[prost(message, repeated, tag = "2")]
    pub scope_metrics: ::prost::alloc::vec::Vec<ScopeMetrics>,
    /// This schema_url applies to the data in the "resource" field. It does not apply
    /// to the data in the "scope_metrics" field which have their own schema_url field.
    #[prost(string, tag = "3")]
    pub schema_url: ::prost::alloc::string::String,
}
/// A collection of Metrics produced by an Scope.
#[derive(serde::Serialize, serde::Deserialize)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct ScopeMetrics {
    /// The instrumentation scope information for the metrics in this message.
    /// Semantically when InstrumentationScope isn't set, it is equivalent with
    /// an empty instrumentation scope name (unknown).
    #[prost(message, optional, tag = "1")]
    pub scope: ::core::option::Option<super::super::common::v1::InstrumentationScope>,
    /// A list of metrics that originate from an instrumentation library.
    #[prost(message, repeated, tag = "2")]
    pub metrics: ::prost::alloc::vec::Vec<Metric>,
    /// This schema_url applies to all metrics in the "metrics" field.
    #[prost(string, tag = "3")]
    pub schema_url: ::prost::alloc::string::String,
}
/// Defines a Metric which has one or more timeseries.  The following is a
/// brief summary of the Metric data model.  For more details, see:
///
/// <https://github.com/open-telemetry/opentelemetry-specification/blob/main/specification/metrics/data-model.md>
///
/// The data model and relation between entities is shown in the
/// diagram below. Here, "DataPoint" is the term used to refer to any
/// one of the specific data point value types, and "points" is the term used
/// to refer to any one of the lists of points contained in the Metric.
///
/// * Metric is composed of a metadata and data.
///
/// * Metadata part contains a name, description, unit.
///
/// * Data is one of the possible types (Sum, Gauge, Histogram, Summary).
///
/// * DataPoint contains timestamps, attributes, and one of the possible value type
///   fields.
///
///   Metric
///   +------------+
///   \|name        |
///   \|description |
///   \|unit        |     +------------------------------------+
///   \|data        |---> |Gauge, Sum, Histogram, Summary, ... |
///   +------------+     +------------------------------------+
///
///   Data \[One of Gauge, Sum, Histogram, Summary, ...\]
///   +-----------+
///   \|...        |  // Metadata about the Data.
///   \|points     |--+
///   +-----------+  |
///   \|      +---------------------------+
///   \|      |DataPoint 1                |
///   v      |+------+------+   +------+ |
///   +-----+   ||label |label |...|label | |
///   \|  1  |-->||value1|value2|...|valueN| |
///   +-----+   |+------+------+   +------+ |
///   \|  .  |   |+-----+                    |
///   \|  .  |   ||value|                    |
///   \|  .  |   |+-----+                    |
///   \|  .  |   +---------------------------+
///   \|  .  |                   .
///   \|  .  |                   .
///   \|  .  |                   .
///   \|  .  |   +---------------------------+
///   \|  .  |   |DataPoint M                |
///   +-----+   |+------+------+   +------+ |
///   \|  M  |-->||label |label |...|label | |
///   +-----+   ||value1|value2|...|valueN| |
///   \|+------+------+   +------+ |
///   \|+-----+                    |
///   \||value|                    |
///   \|+-----+                    |
///   +---------------------------+
///
/// Each distinct type of DataPoint represents the output of a specific
/// aggregation function, the result of applying the DataPoint's
/// associated function of to one or more measurements.
///
/// All DataPoint types have three common fields:
///
/// * Attributes includes key-value pairs associated with the data point
/// * TimeUnixNano is required, set to the end time of the aggregation
/// * StartTimeUnixNano is optional, but strongly encouraged for DataPoints
///   having an AggregationTemporality field, as discussed below.
///
/// Both TimeUnixNano and StartTimeUnixNano values are expressed as
/// UNIX Epoch time in nanoseconds since 00:00:00 UTC on 1 January 1970.
///
/// # TimeUnixNano
///
/// This field is required, having consistent interpretation across
/// DataPoint types.  TimeUnixNano is the moment corresponding to when
/// the data point's aggregate value was captured.
///
/// Data points with the 0 value for TimeUnixNano SHOULD be rejected
/// by consumers.
///
/// # StartTimeUnixNano
///
/// StartTimeUnixNano in general allows detecting when a sequence of
/// observations is unbroken.  This field indicates to consumers the
/// start time for points with cumulative and delta
/// AggregationTemporality, and it should be included whenever possible
/// to support correct rate calculation.  Although it may be omitted
/// when the start time is truly unknown, setting StartTimeUnixNano is
/// strongly encouraged.
#[derive(serde::Serialize, serde::Deserialize)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct Metric {
    /// name of the metric, including its DNS name prefix. It must be unique.
    #[prost(string, tag = "1")]
    pub name: ::prost::alloc::string::String,
    /// description of the metric, which can be used in documentation.
    #[prost(string, tag = "2")]
    pub description: ::prost::alloc::string::String,
    /// unit in which the metric value is reported. Follows the format
    /// described by <http://unitsofmeasure.org/ucum.html.>
    #[prost(string, tag = "3")]
    pub unit: ::prost::alloc::string::String,
    /// Data determines the aggregation type (if any) of the metric, what is the
    /// reported value type for the data points, as well as the relatationship to
    /// the time interval over which they are reported.
    #[prost(oneof = "metric::Data", tags = "5, 7, 9, 10, 11")]
    pub data: ::core::option::Option<metric::Data>,
}
/// Nested message and enum types in `Metric`.
pub mod metric {
    /// Data determines the aggregation type (if any) of the metric, what is the
    /// reported value type for the data points, as well as the relatationship to
    /// the time interval over which they are reported.
    #[derive(serde::Serialize, serde::Deserialize)]
    #[derive(Clone, PartialEq, ::prost::Oneof)]
    pub enum Data {
        #[prost(message, tag = "5")]
        Gauge(super::Gauge),
        #[prost(message, tag = "7")]
        Sum(super::Sum),
        #[prost(message, tag = "9")]
        Histogram(super::Histogram),
        #[prost(message, tag = "10")]
        ExponentialHistogram(super::ExponentialHistogram),
        #[prost(message, tag = "11")]
        Summary(super::Summary),
    }
}
/// Gauge represents the type of a scalar metric that always exports the
/// "current value" for every data point. It should be used for an "unknown"
/// aggregation.
///
/// A Gauge does not support different aggregation temporalities. Given the
/// aggregation is unknown, points cannot be combined using the same
/// aggregation, regardless of aggregation temporalities. Therefore,
/// AggregationTemporality is not included. Consequently, this also means
/// "StartTimeUnixNano" is ignored for all data points.
#[derive(serde::Serialize, serde::Deserialize)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct Gauge {
    #[prost(message, repeated, tag = "1")]
    pub data_points: ::prost::alloc::vec::Vec<NumberDataPoint>,
}
/// Sum represents the type of a scalar metric that is calculated as a sum of all
/// reported measurements over a time interval.
#[derive(serde::Serialize, serde::Deserialize)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct Sum {
    #[prost(message, repeated, tag = "1")]
    pub data_points: ::prost::alloc::vec::Vec<NumberDataPoint>,
    /// aggregation_temporality describes if the aggregator reports delta changes
    /// since last report time, or cumulative changes since a fixed start time.
    #[prost(enumeration = "AggregationTemporality", tag = "2")]
    pub aggregation_temporality: i32,
    /// If "true" means that the sum is monotonic.
    #[prost(bool, tag = "3")]
    pub is_monotonic: bool,
}
/// Histogram represents the type of a metric that is calculated by aggregating
/// as a Histogram of all reported measurements over a time interval.
#[derive(serde::Serialize, serde::Deserialize)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct Histogram {
    #[prost(message, repeated, tag = "1")]
    pub data_points: ::prost::alloc::vec::Vec<HistogramDataPoint>,
    /// aggregation_temporality describes if the aggregator reports delta changes
    /// since last report time, or cumulative changes since a fixed start time.
    #[prost(enumeration = "AggregationTemporality", tag = "2")]
    pub aggregation_temporality: i32,
}
/// ExponentialHistogram represents the type of a metric that is calculated by aggregating
/// as a ExponentialHistogram of all reported double measurements over a time interval.
#[derive(serde::Serialize, serde::Deserialize)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct ExponentialHistogram {
    #[prost(message, repeated, tag = "1")]
    pub data_points: ::prost::alloc::vec::Vec<ExponentialHistogramDataPoint>,
    /// aggregation_temporality describes if the aggregator reports delta changes
    /// since last report time, or cumulative changes since a fixed start time.
    #[prost(enumeration = "AggregationTemporality", tag = "2")]
    pub aggregation_temporality: i32,
}
/// Summary metric data are used to convey quantile summaries,
/// a Prometheus (see: <https://prometheus.io/docs/concepts/metric_types/#summary>)
/// and OpenMetrics (see: <https://github.com/OpenObservability/OpenMetrics/blob/4dbf6075567ab43296eed941037c12951faafb92/protos/prometheus.proto#L45>)
/// data type. These data points cannot always be merged in a meaningful way.
/// While they can be useful in some applications, histogram data points are
/// recommended for new applications.
#[derive(serde::Serialize, serde::Deserialize)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct Summary {
    #[prost(message, repeated, tag = "1")]
    pub data_points: ::prost::alloc::vec::Vec<SummaryDataPoint>,
}
/// NumberDataPoint is a single data point in a timeseries that describes the
/// time-varying scalar value of a metric.
#[derive(serde::Serialize, serde::Deserialize)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct NumberDataPoint {
    /// The set of key/value pairs that uniquely identify the timeseries from
    /// where this point belongs. The list may be empty (may contain 0 elements).
    /// Attribute keys MUST be unique (it is not allowed to have more than one
    /// attribute with the same key).
    #[prost(message, repeated, tag = "7")]
    pub attributes: ::prost::alloc::vec::Vec<super::super::common::v1::KeyValue>,
    /// StartTimeUnixNano is optional but strongly encouraged, see the
    /// the detailed comments above Metric.
    ///
    /// Value is UNIX Epoch time in nanoseconds since 00:00:00 UTC on 1 January
    /// 1970.
    #[prost(fixed64, tag = "2")]
    pub start_time_unix_nano: u64,
    /// TimeUnixNano is required, see the detailed comments above Metric.
    ///
    /// Value is UNIX Epoch time in nanoseconds since 00:00:00 UTC on 1 January
    /// 1970.
    #[prost(fixed64, tag = "3")]
    pub time_unix_nano: u64,
    /// (Optional) List of exemplars collected from
    /// measurements that were used to form the data point
    #[prost(message, repeated, tag = "5")]
    pub exemplars: ::prost::alloc::vec::Vec<Exemplar>,
    /// Flags that apply to this specific data point.  See DataPointFlags
    /// for the available flags and their meaning.
    #[prost(uint32, tag = "8")]
    pub flags: u32,
    /// The value itself.  A point is considered invalid when one of the recognized
    /// value fields is not present inside this oneof.
    #[prost(oneof = "number_data_point::Value", tags = "4, 6")]
    pub value: ::core::option::Option<number_data_point::Value>,
}
/// Nested message and enum types in `NumberDataPoint`.
pub mod number_data_point {
    /// The value itself.  A point is considered invalid when one of the recognized
    /// value fields is not present inside this oneof.
    #[derive(serde::Serialize, serde::Deserialize)]
    #[derive(Clone, Copy, PartialEq, ::prost::Oneof)]
    pub enum Value {
        #[prost(double, tag = "4")]
        AsDouble(f64),
        #[prost(sfixed64, tag = "6")]
        AsInt(i64),
    }
}
/// HistogramDataPoint is a single data point in a timeseries that describes the
/// time-varying values of a Histogram. A Histogram contains summary statistics
/// for a population of values, it may optionally contain the distribution of
/// those values across a set of buckets.
///
/// If the histogram contains the distribution of values, then both
/// "explicit_bounds" and "bucket counts" fields must be defined.
/// If the histogram does not contain the distribution of values, then both
/// "explicit_bounds" and "bucket_counts" must be omitted and only "count" and
/// "sum" are known.
#[derive(serde::Serialize, serde::Deserialize)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct HistogramDataPoint {
    /// The set of key/value pairs that uniquely identify the timeseries from
    /// where this point belongs. The list may be empty (may contain 0 elements).
    /// Attribute keys MUST be unique (it is not allowed to have more than one
    /// attribute with the same key).
    #[prost(message, repeated, tag = "9")]
    pub attributes: ::prost::alloc::vec::Vec<super::super::common::v1::KeyValue>,
    /// StartTimeUnixNano is optional but strongly encouraged, see the
    /// the detailed comments above Metric.
    ///
    /// Value is UNIX Epoch time in nanoseconds since 00:00:00 UTC on 1 January
    /// 1970.
    #[prost(fixed64, tag = "2")]
    pub start_time_unix_nano: u64,
    /// TimeUnixNano is required, see the detailed comments above Metric.
    ///
    /// Value is UNIX Epoch time in nanoseconds since 00:00:00 UTC on 1 January
    /// 1970.
    #[prost(fixed64, tag = "3")]
    pub time_unix_nano: u64,
    /// count is the number of values in the population. Must be non-negative. This
    /// value must be equal to the sum of the "count" fields in buckets if a
    /// histogram is provided.
    #[prost(fixed64, tag = "4")]
    pub count: u64,
    /// sum of the values in the population. If count is zero then this field
    /// must be zero.
    ///
    /// Note: Sum should only be filled out when measuring non-negative discrete
    /// events, and is assumed to be monotonic over the values of these events.
    /// Negative events *can* be recorded, but sum should not be filled out when
    /// doing so.  This is specifically to enforce compatibility w/ OpenMetrics,
    /// see: <https://github.com/OpenObservability/OpenMetrics/blob/main/specification/OpenMetrics.md#histogram>
    #[prost(double, optional, tag = "5")]
    pub sum: ::core::option::Option<f64>,
    /// bucket_counts is an optional field contains the count values of histogram
    /// for each bucket.
    ///
    /// The sum of the bucket_counts must equal the value in the count field.
    ///
    /// The number of elements in bucket_counts array must be by one greater than
    /// the number of elements in explicit_bounds array.
    #[prost(fixed64, repeated, tag = "6")]
    pub bucket_counts: ::prost::alloc::vec::Vec<u64>,
    /// explicit_bounds specifies buckets with explicitly defined bounds for values.
    ///
    /// The boundaries for bucket at index i are:
    ///
    /// (-infinity, explicit_bounds\[i\]\] for i == 0
    /// (explicit_bounds\[i-1\], explicit_bounds\[i\]\] for 0 \< i \< size(explicit_bounds)
    /// (explicit_bounds\[i-1\], +infinity) for i == size(explicit_bounds)
    ///
    /// The values in the explicit_bounds array must be strictly increasing.
    ///
    /// Histogram buckets are inclusive of their upper boundary, except the last
    /// bucket where the boundary is at infinity. This format is intentionally
    /// compatible with the OpenMetrics histogram definition.
    #[prost(double, repeated, tag = "7")]
    pub explicit_bounds: ::prost::alloc::vec::Vec<f64>,
    /// (Optional) List of exemplars collected from
    /// measurements that were used to form the data point
    #[prost(message, repeated, tag = "8")]
    pub exemplars: ::prost::alloc::vec::Vec<Exemplar>,
    /// Flags that apply to this specific data point.  See DataPointFlags
    /// for the available flags and their meaning.
    #[prost(uint32, tag = "10")]
    pub flags: u32,
    /// min is the minimum value over (start_time, end_time\].
    #[prost(double, optional, tag = "11")]
    pub min: ::core::option::Option<f64>,
    /// max is the maximum value over (start_time, end_time\].
    #[prost(double, optional, tag = "12")]
    pub max: ::core::option::Option<f64>,
}
/// ExponentialHistogramDataPoint is a single data point in a timeseries that describes the
/// time-varying values of a ExponentialHistogram of double values. A ExponentialHistogram contains
/// summary statistics for a population of values, it may optionally contain the
/// distribution of those values across a set of buckets.
#[derive(serde::Serialize, serde::Deserialize)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct ExponentialHistogramDataPoint {
    /// The set of key/value pairs that uniquely identify the timeseries from
    /// where this point belongs. The list may be empty (may contain 0 elements).
    /// Attribute keys MUST be unique (it is not allowed to have more than one
    /// attribute with the same key).
    #[prost(message, repeated, tag = "1")]
    pub attributes: ::prost::alloc::vec::Vec<super::super::common::v1::KeyValue>,
    /// StartTimeUnixNano is optional but strongly encouraged, see the
    /// the detailed comments above Metric.
    ///
    /// Value is UNIX Epoch time in nanoseconds since 00:00:00 UTC on 1 January
    /// 1970.
    #[prost(fixed64, tag = "2")]
    pub start_time_unix_nano: u64,
    /// TimeUnixNano is required, see the detailed comments above Metric.
    ///
    /// Value is UNIX Epoch time in nanoseconds since 00:00:00 UTC on 1 January
    /// 1970.
    #[prost(fixed64, tag = "3")]
    pub time_unix_nano: u64,
    /// count is the number of values in the population. Must be
    /// non-negative. This value must be equal to the sum of the "bucket_counts"
    /// values in the positive and negative Buckets plus the "zero_count" field.
    #[prost(fixed64, tag = "4")]
    pub count: u64,
    /// sum of the values in the population. If count is zero then this field
    /// must be zero.
    ///
    /// Note: Sum should only be filled out when measuring non-negative discrete
    /// events, and is assumed to be monotonic over the values of these events.
    /// Negative events *can* be recorded, but sum should not be filled out when
    /// doing so.  This is specifically to enforce compatibility w/ OpenMetrics,
    /// see: <https://github.com/OpenObservability/OpenMetrics/blob/main/specification/OpenMetrics.md#histogram>
    #[prost(double, optional, tag = "5")]
    pub sum: ::core::option::Option<f64>,
    /// scale describes the resolution of the histogram.  Boundaries are
    /// located at powers of the base, where:
    ///
    /// base = (2^(2^-scale))
    ///
    /// The histogram bucket identified by `index`, a signed integer,
    /// contains values that are greater than (base^index) and
    /// less than or equal to (base^(index+1)).
    ///
    /// The positive and negative ranges of the histogram are expressed
    /// separately.  Negative values are mapped by their absolute value
    /// into the negative range using the same scale as the positive range.
    ///
    /// scale is not restricted by the protocol, as the permissible
    /// values depend on the range of the data.
    #[prost(sint32, tag = "6")]
    pub scale: i32,
    /// zero_count is the count of values that are either exactly zero or
    /// within the region considered zero by the instrumentation at the
    /// tolerated degree of precision.  This bucket stores values that
    /// cannot be expressed using the standard exponential formula as
    /// well as values that have been rounded to zero.
    ///
    /// Implementations MAY consider the zero bucket to have probability
    /// mass equal to (zero_count / count).
    #[prost(fixed64, tag = "7")]
    pub zero_count: u64,
    /// positive carries the positive range of exponential bucket counts.
    #[prost(message, optional, tag = "8")]
    pub positive: ::core::option::Option<exponential_histogram_data_point::Buckets>,
    /// negative carries the negative range of exponential bucket counts.
    #[prost(message, optional, tag = "9")]
    pub negative: ::core::option::Option<exponential_histogram_data_point::Buckets>,
    /// Flags that apply to this specific data point.  See DataPointFlags
    /// for the available flags and their meaning.
    #[prost(uint32, tag = "10")]
    pub flags: u32,
    /// (Optional) List of exemplars collected from
    /// measurements that were used to form the data point
    #[prost(message, repeated, tag = "11")]
    pub exemplars: ::prost::alloc::vec::Vec<Exemplar>,
    /// min is the minimum value over (start_time, end_time\].
    #[prost(double, optional, tag = "12")]
    pub min: ::core::option::Option<f64>,
    /// max is the maximum value over (start_time, end_time\].
    #[prost(double, optional, tag = "13")]
    pub max: ::core::option::Option<f64>,
}
/// Nested message and enum types in `ExponentialHistogramDataPoint`.
pub mod exponential_histogram_data_point {
    /// Buckets are a set of bucket counts, encoded in a contiguous array
    /// of counts.
    #[derive(serde::Serialize, serde::Deserialize)]
    #[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
    pub struct Buckets {
        /// Offset is the bucket index of the first entry in the bucket_counts array.
        ///
        /// Note: This uses a varint encoding as a simple form of compression.
        #[prost(sint32, tag = "1")]
        pub offset: i32,
        /// Count is an array of counts, where count\[i\] carries the count
        /// of the bucket at index (offset+i).  count\[i\] is the count of
        /// values greater than base^(offset+i) and less or equal to than
        /// base^(offset+i+1).
        ///
        /// Note: By contrast, the explicit HistogramDataPoint uses
        /// fixed64.  This field is expected to have many buckets,
        /// especially zeros, so uint64 has been selected to ensure
        /// varint encoding.
        #[prost(uint64, repeated, tag = "2")]
        pub bucket_counts: ::prost::alloc::vec::Vec<u64>,
    }
}
/// SummaryDataPoint is a single data point in a timeseries that describes the
/// time-varying values of a Summary metric.
#[derive(serde::Serialize, serde::Deserialize)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct SummaryDataPoint {
    /// The set of key/value pairs that uniquely identify the timeseries from
    /// where this point belongs. The list may be empty (may contain 0 elements).
    /// Attribute keys MUST be unique (it is not allowed to have more than one
    /// attribute with the same key).
    #[prost(message, repeated, tag = "7")]
    pub attributes: ::prost::alloc::vec::Vec<super::super::common::v1::KeyValue>,
    /// StartTimeUnixNano is optional but strongly encouraged, see the
    /// the detailed comments above Metric.
    ///
    /// Value is UNIX Epoch time in nanoseconds since 00:00:00 UTC on 1 January
    /// 1970.
    #[prost(fixed64, tag = "2")]
    pub start_time_unix_nano: u64,
    /// TimeUnixNano is required, see the detailed comments above Metric.
    ///
    /// Value is UNIX Epoch time in nanoseconds since 00:00:00 UTC on 1 January
    /// 1970.
    #[prost(fixed64, tag = "3")]
    pub time_unix_nano: u64,
    /// count is the number of values in the population. Must be non-negative.
    #[prost(fixed64, tag = "4")]
    pub count: u64,
    /// sum of the values in the population. If count is zero then this field
    /// must be zero.
    ///
    /// Note: Sum should only be filled out when measuring non-negative discrete
    /// events, and is assumed to be monotonic over the values of these events.
    /// Negative events *can* be recorded, but sum should not be filled out when
    /// doing so.  This is specifically to enforce compatibility w/ OpenMetrics,
    /// see: <https://github.com/OpenObservability/OpenMetrics/blob/main/specification/OpenMetrics.md#summary>
    #[prost(double, tag = "5")]
    pub sum: f64,
    /// (Optional) list of values at different quantiles of the distribution calculated
    /// from the current snapshot. The quantiles must be strictly increasing.
    #[prost(message, repeated, tag = "6")]
    pub quantile_values: ::prost::alloc::vec::Vec<summary_data_point::ValueAtQuantile>,
    /// Flags that apply to this specific data point.  See DataPointFlags
    /// for the available flags and their meaning.
    #[prost(uint32, tag = "8")]
    pub flags: u32,
}
/// Nested message and enum types in `SummaryDataPoint`.
pub mod summary_data_point {
    /// Represents the value at a given quantile of a distribution.
    ///
    /// To record Min and Max values following conventions are used:
    ///
    /// * The 1.0 quantile is equivalent to the maximum value observed.
    /// * The 0.0 quantile is equivalent to the minimum value observed.
    ///
    /// See the following issue for more context:
    /// <https://github.com/open-telemetry/opentelemetry-proto/issues/125>
    #[derive(serde::Serialize, serde::Deserialize)]
    #[derive(Clone, Copy, PartialEq, ::prost::Message)]
    pub struct ValueAtQuantile {
        /// The quantile of a distribution. Must be in the interval
        /// \[0.0, 1.0\].
        #[prost(double, tag = "1")]
        pub quantile: f64,
        /// The value at the given quantile of a distribution.
        ///
        /// Quantile values must NOT be negative.
        #[prost(double, tag = "2")]
        pub value: f64,
    }
}
/// A representation of an exemplar, which is a sample input measurement.
/// Exemplars also hold information about the environment when the measurement
/// was recorded, for example the span and trace ID of the active span when the
/// exemplar was recorded.
#[derive(serde::Serialize, serde::Deserialize)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct Exemplar {
    /// The set of key/value pairs that were filtered out by the aggregator, but
    /// recorded alongside the original measurement. Only key/value pairs that were
    /// filtered out by the aggregator should be included
    #[prost(message, repeated, tag = "7")]
    pub filtered_attributes: ::prost::alloc::vec::Vec<
        super::super::common::v1::KeyValue,
    >,
    /// time_unix_nano is the exact time when this exemplar was recorded
    ///
    /// Value is UNIX Epoch time in nanoseconds since 00:00:00 UTC on 1 January
    /// 1970.
    #[prost(fixed64, tag = "2")]
    pub time_unix_nano: u64,
    /// (Optional) Span ID of the exemplar trace.
    /// span_id may be missing if the measurement is not recorded inside a trace
    /// or if the trace is not sampled.
    #[prost(bytes = "vec", tag = "4")]
    pub span_id: ::prost::alloc::vec::Vec<u8>,
    /// (Optional) Trace ID of the exemplar trace.
    /// trace_id may be missing if the measurement is not recorded inside a trace
    /// or if the trace is not sampled.
    #[prost(bytes = "vec", tag = "5")]
    pub trace_id: ::prost::alloc::vec::Vec<u8>,
    /// The value of the measurement that was recorded. An exemplar is
    /// considered invalid when one of the recognized value fields is not present
    /// inside this oneof.
    #[prost(oneof = "exemplar::Value", tags = "3, 6")]
    pub value: ::core::option::Option<exemplar::Value>,
}
/// Nested message and enum types in `Exemplar`.
pub mod exemplar {
    /// The value of the measurement that was recorded. An exemplar is
    /// considered invalid when one of the recognized value fields is not present
    /// inside this oneof.
    #[derive(serde::Serialize, serde::Deserialize)]
    #[derive(Clone, Copy, PartialEq, ::prost::Oneof)]
    pub enum Value {
        #[prost(double, tag = "3")]
        AsDouble(f64),
        #[prost(sfixed64, tag = "6")]
        AsInt(i64),
    }
}
/// AggregationTemporality defines how a metric aggregator reports aggregated
/// values. It describes how those values relate to the time interval over
/// which they are aggregated.
#[derive(serde::Serialize, serde::Deserialize)]
#[derive(Clone, Copy, Debug, PartialEq, Eq, Hash, PartialOrd, Ord, ::prost::Enumeration)]
#[repr(i32)]
pub enum AggregationTemporality {
    /// UNSPECIFIED is the default AggregationTemporality, it MUST not be used.
    Unspecified = 0,
    /// DELTA is an AggregationTemporality for a metric aggregator which reports
    /// changes since last report time. Successive metrics contain aggregation of
    /// values from continuous and non-overlapping intervals.
    ///
    /// The values for a DELTA metric are based only on the time interval
    /// associated with one measurement cycle. There is no dependency on
    /// previous measurements like is the case for CUMULATIVE metrics.
    ///
    /// For example, consider a system measuring the number of requests that
    /// it receives and reports the sum of these requests every second as a
    /// DELTA metric:
    ///
    /// 1. The system starts receiving at time=t_0.
    /// 1. A request is received, the system measures 1 request.
    /// 1. A request is received, the system measures 1 request.
    /// 1. A request is received, the system measures 1 request.
    /// 1. The 1 second collection cycle ends. A metric is exported for the
    ///    number of requests received over the interval of time t_0 to
    ///    t_0+1 with a value of 3.
    /// 1. A request is received, the system measures 1 request.
    /// 1. A request is received, the system measures 1 request.
    /// 1. The 1 second collection cycle ends. A metric is exported for the
    ///    number of requests received over the interval of time t_0+1 to
    ///    t_0+2 with a value of 2.
    Delta = 1,
    /// CUMULATIVE is an AggregationTemporality for a metric aggregator which
    /// reports changes since a fixed start time. This means that current values
    /// of a CUMULATIVE metric depend on all previous measurements since the
    /// start time. Because of this, the sender is required to retain this state
    /// in some form. If this state is lost or invalidated, the CUMULATIVE metric
    /// values MUST be reset and a new fixed start time following the last
    /// reported measurement time sent MUST be used.
    ///
    /// For example, consider a system measuring the number of requests that
    /// it receives and reports the sum of these requests every second as a
    /// CUMULATIVE metric:
    ///
    /// 1. The system starts receiving at time=t_0.
    /// 1. A request is received, the system measures 1 request.
    /// 1. A request is received, the system measures 1 request.
    /// 1. A request is received, the system measures 1 request.
    /// 1. The 1 second collection cycle ends. A metric is exported for the
    ///    number of requests received over the interval of time t_0 to
    ///    t_0+1 with a value of 3.
    /// 1. A request is received, the system measures 1 request.
    /// 1. A request is received, the system measures 1 request.
    /// 1. The 1 second collection cycle ends. A metric is exported for the
    ///    number of requests received over the interval of time t_0 to
    ///    t_0+2 with a value of 5.
    /// 1. The system experiences a fault and loses state.
    /// 1. The system recovers and resumes receiving at time=t_1.
    /// 1. A request is received, the system measures 1 request.
    /// 1. The 1 second collection cycle ends. A metric is exported for the
    ///    number of requests received over the interval of time t_1 to
    ///    t_0+1 with a value of 1.
    ///
    /// Note: Even though, when reporting changes since last report time, using
    /// CUMULATIVE is valid, it is not recommended. This may cause problems for
    /// systems that do not use start_time to determine when the aggregation
    /// value was reset (e.g. Prometheus).
    Cumulative = 2,
}
impl AggregationTemporality {
    /// String value of the enum field names used in the ProtoBuf definition.
    ///
    /// The values are not transformed in any way and thus are considered stable
    /// (if the ProtoBuf definition does not change) and safe for programmatic use.
    pub fn as_str_name(&self) -> &'static str {
        match self {
            Self::Unspecified => "AGGREGATION_TEMPORALITY_UNSPECIFIED",
            Self::Delta => "AGGREGATION_TEMPORALITY_DELTA",
            Self::Cumulative => "AGGREGATION_TEMPORALITY_CUMULATIVE",
        }
    }
    /// Creates an enum from field names used in the ProtoBuf definition.
    pub fn from_str_name(value: &str) -> ::core::option::Option<Self> {
        match value {
            "AGGREGATION_TEMPORALITY_UNSPECIFIED" => Some(Self::Unspecified),
            "AGGREGATION_TEMPORALITY_DELTA" => Some(Self::Delta),
            "AGGREGATION_TEMPORALITY_CUMULATIVE" => Some(Self::Cumulative),
            _ => None,
        }
    }
}
/// DataPointFlags is defined as a protobuf 'uint32' type and is to be used as a
/// bit-field representing 32 distinct boolean flags.  Each flag defined in this
/// enum is a bit-mask.  To test the presence of a single flag in the flags of
/// a data point, for example, use an expression like:
///
/// (point.flags & FLAG_NO_RECORDED_VALUE) == FLAG_NO_RECORDED_VALUE
#[derive(serde::Serialize, serde::Deserialize)]
#[derive(Clone, Copy, Debug, PartialEq, Eq, Hash, PartialOrd, Ord, ::prost::Enumeration)]
#[repr(i32)]
pub enum DataPointFlags {
    FlagNone = 0,
    /// This DataPoint is valid but has no recorded value.  This value
    /// SHOULD be used to reflect explicitly missing data in a series, as
    /// for an equivalent to the Prometheus "staleness marker".
    FlagNoRecordedValue = 1,
}
impl DataPointFlags {
    /// String value of the enum field names used in the ProtoBuf definition.
    ///
    /// The values are not transformed in any way and thus are considered stable
    /// (if the ProtoBuf definition does not change) and safe for programmatic use.
    pub fn as_str_name(&self) -> &'static str {
        match self {
            Self::FlagNone => "FLAG_NONE",
            Self::FlagNoRecordedValue => "FLAG_NO_RECORDED_VALUE",
        }
    }
    /// Creates an enum from field names used in the ProtoBuf definition.
    pub fn from_str_name(value: &str) -> ::core::option::Option<Self> {
        match value {
            "FLAG_NONE" => Some(Self::FlagNone),
            "FLAG_NO_RECORDED_VALUE" => Some(Self::FlagNoRecordedValue),
            _ => None,
        }
    }
}


================================================
FILE: quickwit/quickwit-proto/src/codegen/opentelemetry/opentelemetry.proto.resource.v1.rs
================================================
// This file is @generated by prost-build.
/// Resource information.
#[derive(serde::Serialize, serde::Deserialize)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct Resource {
    /// Set of attributes that describe the resource.
    /// Attribute keys MUST be unique (it is not allowed to have more than one
    /// attribute with the same key).
    #[prost(message, repeated, tag = "1")]
    pub attributes: ::prost::alloc::vec::Vec<super::super::common::v1::KeyValue>,
    /// dropped_attributes_count is the number of dropped attributes. If the value is 0, then
    /// no attributes were dropped.
    #[prost(uint32, tag = "2")]
    pub dropped_attributes_count: u32,
}


================================================
FILE: quickwit/quickwit-proto/src/codegen/opentelemetry/opentelemetry.proto.trace.v1.rs
================================================
// This file is @generated by prost-build.
/// TracesData represents the traces data that can be stored in a persistent storage,
/// OR can be embedded by other protocols that transfer OTLP traces data but do
/// not implement the OTLP protocol.
///
/// The main difference between this message and collector protocol is that
/// in this message there will not be any "control" or "metadata" specific to
/// OTLP protocol.
///
/// When new fields are added into this message, the OTLP request MUST be updated
/// as well.
#[derive(serde::Serialize, serde::Deserialize)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct TracesData {
    /// An array of ResourceSpans.
    /// For data coming from a single resource this array will typically contain
    /// one element. Intermediary nodes that receive data from multiple origins
    /// typically batch the data before forwarding further and in that case this
    /// array will contain multiple elements.
    #[prost(message, repeated, tag = "1")]
    pub resource_spans: ::prost::alloc::vec::Vec<ResourceSpans>,
}
/// A collection of ScopeSpans from a Resource.
#[derive(serde::Serialize, serde::Deserialize)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct ResourceSpans {
    /// The resource for the spans in this message.
    /// If this field is not set then no resource info is known.
    #[prost(message, optional, tag = "1")]
    pub resource: ::core::option::Option<super::super::resource::v1::Resource>,
    /// A list of ScopeSpans that originate from a resource.
    #[prost(message, repeated, tag = "2")]
    pub scope_spans: ::prost::alloc::vec::Vec<ScopeSpans>,
    /// This schema_url applies to the data in the "resource" field. It does not apply
    /// to the data in the "scope_spans" field which have their own schema_url field.
    #[prost(string, tag = "3")]
    pub schema_url: ::prost::alloc::string::String,
}
/// A collection of Spans produced by an InstrumentationScope.
#[derive(serde::Serialize, serde::Deserialize)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct ScopeSpans {
    /// The instrumentation scope information for the spans in this message.
    /// Semantically when InstrumentationScope isn't set, it is equivalent with
    /// an empty instrumentation scope name (unknown).
    #[prost(message, optional, tag = "1")]
    pub scope: ::core::option::Option<super::super::common::v1::InstrumentationScope>,
    /// A list of Spans that originate from an instrumentation scope.
    #[prost(message, repeated, tag = "2")]
    pub spans: ::prost::alloc::vec::Vec<Span>,
    /// This schema_url applies to all spans and span events in the "spans" field.
    #[prost(string, tag = "3")]
    pub schema_url: ::prost::alloc::string::String,
}
/// A Span represents a single operation performed by a single component of the system.
///
/// The next available field id is 17.
#[derive(serde::Serialize, serde::Deserialize)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct Span {
    /// A unique identifier for a trace. All spans from the same trace share
    /// the same `trace_id`. The ID is a 16-byte array. An ID with all zeroes
    /// is considered invalid.
    ///
    /// This field is semantically required. Receiver should generate new
    /// random trace_id if empty or invalid trace_id was received.
    ///
    /// This field is required.
    #[prost(bytes = "vec", tag = "1")]
    pub trace_id: ::prost::alloc::vec::Vec<u8>,
    /// A unique identifier for a span within a trace, assigned when the span
    /// is created. The ID is an 8-byte array. An ID with all zeroes is considered
    /// invalid.
    ///
    /// This field is semantically required. Receiver should generate new
    /// random span_id if empty or invalid span_id was received.
    ///
    /// This field is required.
    #[prost(bytes = "vec", tag = "2")]
    pub span_id: ::prost::alloc::vec::Vec<u8>,
    /// trace_state conveys information about request position in multiple distributed tracing graphs.
    /// It is a trace_state in w3c-trace-context format: <https://www.w3.org/TR/trace-context/#tracestate-header>
    /// See also <https://github.com/w3c/distributed-tracing> for more details about this field.
    #[prost(string, tag = "3")]
    pub trace_state: ::prost::alloc::string::String,
    /// The `span_id` of this span's parent span. If this is a root span, then this
    /// field must be empty. The ID is an 8-byte array.
    #[prost(bytes = "vec", tag = "4")]
    pub parent_span_id: ::prost::alloc::vec::Vec<u8>,
    /// A description of the span's operation.
    ///
    /// For example, the name can be a qualified method name or a file name
    /// and a line number where the operation is called. A best practice is to use
    /// the same display name at the same call point in an application.
    /// This makes it easier to correlate spans in different traces.
    ///
    /// This field is semantically required to be set to non-empty string.
    /// Empty value is equivalent to an unknown span name.
    ///
    /// This field is required.
    #[prost(string, tag = "5")]
    pub name: ::prost::alloc::string::String,
    /// Distinguishes between spans generated in a particular context. For example,
    /// two spans with the same name may be distinguished using `CLIENT` (caller)
    /// and `SERVER` (callee) to identify queueing latency associated with the span.
    #[prost(enumeration = "span::SpanKind", tag = "6")]
    pub kind: i32,
    /// start_time_unix_nano is the start time of the span. On the client side, this is the time
    /// kept by the local machine where the span execution starts. On the server side, this
    /// is the time when the server's application handler starts running.
    /// Value is UNIX Epoch time in nanoseconds since 00:00:00 UTC on 1 January 1970.
    ///
    /// This field is semantically required and it is expected that end_time >= start_time.
    #[prost(fixed64, tag = "7")]
    pub start_time_unix_nano: u64,
    /// end_time_unix_nano is the end time of the span. On the client side, this is the time
    /// kept by the local machine where the span execution ends. On the server side, this
    /// is the time when the server application handler stops running.
    /// Value is UNIX Epoch time in nanoseconds since 00:00:00 UTC on 1 January 1970.
    ///
    /// This field is semantically required and it is expected that end_time >= start_time.
    #[prost(fixed64, tag = "8")]
    pub end_time_unix_nano: u64,
    /// attributes is a collection of key/value pairs. Note, global attributes
    /// like server name can be set using the resource API. Examples of attributes:
    ///
    /// ```text
    /// "/http/user_agent": "Mozilla/5.0 (Macintosh; Intel Mac OS X 10_14_2) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/71.0.3578.98 Safari/537.36"
    /// "/http/server_latency": 300
    /// "abc.com/myattribute": true
    /// "abc.com/score": 10.239
    /// ```
    ///
    /// The OpenTelemetry API specification further restricts the allowed value types:
    /// <https://github.com/open-telemetry/opentelemetry-specification/blob/main/specification/common/README.md#attribute>
    /// Attribute keys MUST be unique (it is not allowed to have more than one
    /// attribute with the same key).
    #[prost(message, repeated, tag = "9")]
    pub attributes: ::prost::alloc::vec::Vec<super::super::common::v1::KeyValue>,
    /// dropped_attributes_count is the number of attributes that were discarded. Attributes
    /// can be discarded because their keys are too long or because there are too many
    /// attributes. If this value is 0, then no attributes were dropped.
    #[prost(uint32, tag = "10")]
    pub dropped_attributes_count: u32,
    /// events is a collection of Event items.
    #[prost(message, repeated, tag = "11")]
    pub events: ::prost::alloc::vec::Vec<span::Event>,
    /// dropped_events_count is the number of dropped events. If the value is 0, then no
    /// events were dropped.
    #[prost(uint32, tag = "12")]
    pub dropped_events_count: u32,
    /// links is a collection of Links, which are references from this span to a span
    /// in the same or different trace.
    #[prost(message, repeated, tag = "13")]
    pub links: ::prost::alloc::vec::Vec<span::Link>,
    /// dropped_links_count is the number of dropped links after the maximum size was
    /// enforced. If this value is 0, then no links were dropped.
    #[prost(uint32, tag = "14")]
    pub dropped_links_count: u32,
    /// An optional final status for this span. Semantically when Status isn't set, it means
    /// span's status code is unset, i.e. assume STATUS_CODE_UNSET (code = 0).
    #[prost(message, optional, tag = "15")]
    pub status: ::core::option::Option<Status>,
}
/// Nested message and enum types in `Span`.
pub mod span {
    /// Event is a time-stamped annotation of the span, consisting of user-supplied
    /// text description and key-value pairs.
    #[derive(serde::Serialize, serde::Deserialize)]
    #[derive(Clone, PartialEq, ::prost::Message)]
    pub struct Event {
        /// time_unix_nano is the time the event occurred.
        #[prost(fixed64, tag = "1")]
        pub time_unix_nano: u64,
        /// name of the event.
        /// This field is semantically required to be set to non-empty string.
        #[prost(string, tag = "2")]
        pub name: ::prost::alloc::string::String,
        /// attributes is a collection of attribute key/value pairs on the event.
        /// Attribute keys MUST be unique (it is not allowed to have more than one
        /// attribute with the same key).
        #[prost(message, repeated, tag = "3")]
        pub attributes: ::prost::alloc::vec::Vec<
            super::super::super::common::v1::KeyValue,
        >,
        /// dropped_attributes_count is the number of dropped attributes. If the value is 0,
        /// then no attributes were dropped.
        #[prost(uint32, tag = "4")]
        pub dropped_attributes_count: u32,
    }
    /// A pointer from the current span to another span in the same trace or in a
    /// different trace. For example, this can be used in batching operations,
    /// where a single batch handler processes multiple requests from different
    /// traces or when the handler receives a request from a different project.
    #[derive(serde::Serialize, serde::Deserialize)]
    #[derive(Clone, PartialEq, ::prost::Message)]
    pub struct Link {
        /// A unique identifier of a trace that this linked span is part of. The ID is a
        /// 16-byte array.
        #[prost(bytes = "vec", tag = "1")]
        pub trace_id: ::prost::alloc::vec::Vec<u8>,
        /// A unique identifier for the linked span. The ID is an 8-byte array.
        #[prost(bytes = "vec", tag = "2")]
        pub span_id: ::prost::alloc::vec::Vec<u8>,
        /// The trace_state associated with the link.
        #[prost(string, tag = "3")]
        pub trace_state: ::prost::alloc::string::String,
        /// attributes is a collection of attribute key/value pairs on the link.
        /// Attribute keys MUST be unique (it is not allowed to have more than one
        /// attribute with the same key).
        #[prost(message, repeated, tag = "4")]
        pub attributes: ::prost::alloc::vec::Vec<
            super::super::super::common::v1::KeyValue,
        >,
        /// dropped_attributes_count is the number of dropped attributes. If the value is 0,
        /// then no attributes were dropped.
        #[prost(uint32, tag = "5")]
        pub dropped_attributes_count: u32,
    }
    /// SpanKind is the type of span. Can be used to specify additional relationships between spans
    /// in addition to a parent/child relationship.
    #[derive(serde::Serialize, serde::Deserialize)]
    #[derive(
        Clone,
        Copy,
        Debug,
        PartialEq,
        Eq,
        Hash,
        PartialOrd,
        Ord,
        ::prost::Enumeration
    )]
    #[repr(i32)]
    pub enum SpanKind {
        /// Unspecified. Do NOT use as default.
        /// Implementations MAY assume SpanKind to be INTERNAL when receiving UNSPECIFIED.
        Unspecified = 0,
        /// Indicates that the span represents an internal operation within an application,
        /// as opposed to an operation happening at the boundaries. Default value.
        Internal = 1,
        /// Indicates that the span covers server-side handling of an RPC or other
        /// remote network request.
        Server = 2,
        /// Indicates that the span describes a request to some remote service.
        Client = 3,
        /// Indicates that the span describes a producer sending a message to a broker.
        /// Unlike CLIENT and SERVER, there is often no direct critical path latency relationship
        /// between producer and consumer spans. A PRODUCER span ends when the message was accepted
        /// by the broker while the logical processing of the message might span a much longer time.
        Producer = 4,
        /// Indicates that the span describes consumer receiving a message from a broker.
        /// Like the PRODUCER kind, there is often no direct critical path latency relationship
        /// between producer and consumer spans.
        Consumer = 5,
    }
    impl SpanKind {
        /// String value of the enum field names used in the ProtoBuf definition.
        ///
        /// The values are not transformed in any way and thus are considered stable
        /// (if the ProtoBuf definition does not change) and safe for programmatic use.
        pub fn as_str_name(&self) -> &'static str {
            match self {
                Self::Unspecified => "SPAN_KIND_UNSPECIFIED",
                Self::Internal => "SPAN_KIND_INTERNAL",
                Self::Server => "SPAN_KIND_SERVER",
                Self::Client => "SPAN_KIND_CLIENT",
                Self::Producer => "SPAN_KIND_PRODUCER",
                Self::Consumer => "SPAN_KIND_CONSUMER",
            }
        }
        /// Creates an enum from field names used in the ProtoBuf definition.
        pub fn from_str_name(value: &str) -> ::core::option::Option<Self> {
            match value {
                "SPAN_KIND_UNSPECIFIED" => Some(Self::Unspecified),
                "SPAN_KIND_INTERNAL" => Some(Self::Internal),
                "SPAN_KIND_SERVER" => Some(Self::Server),
                "SPAN_KIND_CLIENT" => Some(Self::Client),
                "SPAN_KIND_PRODUCER" => Some(Self::Producer),
                "SPAN_KIND_CONSUMER" => Some(Self::Consumer),
                _ => None,
            }
        }
    }
}
/// The Status type defines a logical error model that is suitable for different
/// programming environments, including REST APIs and RPC APIs.
#[derive(serde::Serialize, serde::Deserialize)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct Status {
    /// A developer-facing human readable error message.
    #[prost(string, tag = "2")]
    pub message: ::prost::alloc::string::String,
    /// The status code.
    #[prost(enumeration = "status::StatusCode", tag = "3")]
    pub code: i32,
}
/// Nested message and enum types in `Status`.
pub mod status {
    /// For the semantics of status codes see
    /// <https://github.com/open-telemetry/opentelemetry-specification/blob/main/specification/trace/api.md#set-status>
    #[derive(serde::Serialize, serde::Deserialize)]
    #[serde(rename_all = "snake_case")]
    #[derive(
        Clone,
        Copy,
        Debug,
        PartialEq,
        Eq,
        Hash,
        PartialOrd,
        Ord,
        ::prost::Enumeration
    )]
    #[repr(i32)]
    pub enum StatusCode {
        /// The default status.
        Unset = 0,
        /// The Span has been validated by an Application developer or Operator to
        /// have completed successfully.
        Ok = 1,
        /// The Span contains an error.
        Error = 2,
    }
    impl StatusCode {
        /// String value of the enum field names used in the ProtoBuf definition.
        ///
        /// The values are not transformed in any way and thus are considered stable
        /// (if the ProtoBuf definition does not change) and safe for programmatic use.
        pub fn as_str_name(&self) -> &'static str {
            match self {
                Self::Unset => "STATUS_CODE_UNSET",
                Self::Ok => "STATUS_CODE_OK",
                Self::Error => "STATUS_CODE_ERROR",
            }
        }
        /// Creates an enum from field names used in the ProtoBuf definition.
        pub fn from_str_name(value: &str) -> ::core::option::Option<Self> {
            match value {
                "STATUS_CODE_UNSET" => Some(Self::Unset),
                "STATUS_CODE_OK" => Some(Self::Ok),
                "STATUS_CODE_ERROR" => Some(Self::Error),
                _ => None,
            }
        }
    }
}


================================================
FILE: quickwit/quickwit-proto/src/codegen/quickwit/quickwit.cluster.rs
================================================
// This file is @generated by prost-build.
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct ChitchatId {
    #[prost(string, tag = "1")]
    pub node_id: ::prost::alloc::string::String,
    #[prost(uint64, tag = "2")]
    pub generation_id: u64,
    #[prost(string, tag = "3")]
    pub gossip_advertise_addr: ::prost::alloc::string::String,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct VersionedKeyValue {
    #[prost(string, tag = "1")]
    pub key: ::prost::alloc::string::String,
    #[prost(string, tag = "2")]
    pub value: ::prost::alloc::string::String,
    #[prost(uint64, tag = "3")]
    pub version: u64,
    #[prost(enumeration = "DeletionStatus", tag = "4")]
    pub status: i32,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct NodeState {
    #[prost(message, optional, tag = "1")]
    pub chitchat_id: ::core::option::Option<ChitchatId>,
    #[prost(message, repeated, tag = "2")]
    pub key_values: ::prost::alloc::vec::Vec<VersionedKeyValue>,
    #[prost(uint64, tag = "3")]
    pub max_version: u64,
    #[prost(uint64, tag = "4")]
    pub last_gc_version: u64,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct FetchClusterStateRequest {
    #[prost(string, tag = "1")]
    pub cluster_id: ::prost::alloc::string::String,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct FetchClusterStateResponse {
    #[prost(string, tag = "1")]
    pub cluster_id: ::prost::alloc::string::String,
    #[prost(message, repeated, tag = "2")]
    pub node_states: ::prost::alloc::vec::Vec<NodeState>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[serde(rename_all = "snake_case")]
#[derive(Clone, Copy, Debug, PartialEq, Eq, Hash, PartialOrd, Ord, ::prost::Enumeration)]
#[repr(i32)]
pub enum DeletionStatus {
    Set = 0,
    Deleted = 1,
    DeleteAfterTtl = 2,
}
impl DeletionStatus {
    /// String value of the enum field names used in the ProtoBuf definition.
    ///
    /// The values are not transformed in any way and thus are considered stable
    /// (if the ProtoBuf definition does not change) and safe for programmatic use.
    pub fn as_str_name(&self) -> &'static str {
        match self {
            Self::Set => "Set",
            Self::Deleted => "Deleted",
            Self::DeleteAfterTtl => "DeleteAfterTtl",
        }
    }
    /// Creates an enum from field names used in the ProtoBuf definition.
    pub fn from_str_name(value: &str) -> ::core::option::Option<Self> {
        match value {
            "Set" => Some(Self::Set),
            "Deleted" => Some(Self::Deleted),
            "DeleteAfterTtl" => Some(Self::DeleteAfterTtl),
            _ => None,
        }
    }
}
/// BEGIN quickwit-codegen
#[allow(unused_imports)]
use std::str::FromStr;
use tower::{Layer, Service, ServiceExt};
use quickwit_common::tower::RpcName;
impl RpcName for FetchClusterStateRequest {
    fn rpc_name() -> &'static str {
        "fetch_cluster_state"
    }
}
#[cfg_attr(any(test, feature = "testsuite"), mockall::automock)]
#[async_trait::async_trait]
pub trait ClusterService: std::fmt::Debug + Send + Sync + 'static {
    async fn fetch_cluster_state(
        &self,
        request: FetchClusterStateRequest,
    ) -> crate::cluster::ClusterResult<FetchClusterStateResponse>;
}
#[derive(Debug, Clone)]
pub struct ClusterServiceClient {
    inner: InnerClusterServiceClient,
}
#[derive(Debug, Clone)]
struct InnerClusterServiceClient(std::sync::Arc<dyn ClusterService>);
impl ClusterServiceClient {
    pub fn new<T>(instance: T) -> Self
    where
        T: ClusterService,
    {
        #[cfg(any(test, feature = "testsuite"))]
        assert!(
            std::any::TypeId::of:: < T > () != std::any::TypeId::of:: <
            MockClusterService > (),
            "`MockClusterService` must be wrapped in a `MockClusterServiceWrapper`: use `ClusterServiceClient::from_mock(mock)` to instantiate the client"
        );
        Self {
            inner: InnerClusterServiceClient(std::sync::Arc::new(instance)),
        }
    }
    pub fn as_grpc_service(
        &self,
        max_message_size: bytesize::ByteSize,
    ) -> cluster_service_grpc_server::ClusterServiceGrpcServer<
        ClusterServiceGrpcServerAdapter,
    > {
        let adapter = ClusterServiceGrpcServerAdapter::new(self.clone());
        cluster_service_grpc_server::ClusterServiceGrpcServer::new(adapter)
            .accept_compressed(tonic::codec::CompressionEncoding::Gzip)
            .accept_compressed(tonic::codec::CompressionEncoding::Zstd)
            .send_compressed(tonic::codec::CompressionEncoding::Gzip)
            .send_compressed(tonic::codec::CompressionEncoding::Zstd)
            .max_decoding_message_size(max_message_size.0 as usize)
            .max_encoding_message_size(max_message_size.0 as usize)
    }
    pub fn from_channel(
        addr: std::net::SocketAddr,
        channel: tonic::transport::Channel,
        max_message_size: bytesize::ByteSize,
        compression_encoding_opt: Option<tonic::codec::CompressionEncoding>,
    ) -> Self {
        let (_, connection_keys_watcher) = tokio::sync::watch::channel(
            std::collections::HashSet::from_iter([addr]),
        );
        let mut client = cluster_service_grpc_client::ClusterServiceGrpcClient::new(
                channel,
            )
            .max_decoding_message_size(max_message_size.0 as usize)
            .max_encoding_message_size(max_message_size.0 as usize);
        if let Some(compression_encoding) = compression_encoding_opt {
            client = client
                .accept_compressed(compression_encoding)
                .send_compressed(compression_encoding);
        }
        let adapter = ClusterServiceGrpcClientAdapter::new(
            client,
            connection_keys_watcher,
        );
        Self::new(adapter)
    }
    pub fn from_balance_channel(
        balance_channel: quickwit_common::tower::BalanceChannel<std::net::SocketAddr>,
        max_message_size: bytesize::ByteSize,
        compression_encoding_opt: Option<tonic::codec::CompressionEncoding>,
    ) -> ClusterServiceClient {
        let connection_keys_watcher = balance_channel.connection_keys_watcher();
        let mut client = cluster_service_grpc_client::ClusterServiceGrpcClient::new(
                balance_channel,
            )
            .max_decoding_message_size(max_message_size.0 as usize)
            .max_encoding_message_size(max_message_size.0 as usize);
        if let Some(compression_encoding) = compression_encoding_opt {
            client = client
                .accept_compressed(compression_encoding)
                .send_compressed(compression_encoding);
        }
        let adapter = ClusterServiceGrpcClientAdapter::new(
            client,
            connection_keys_watcher,
        );
        Self::new(adapter)
    }
    pub fn from_mailbox<A>(mailbox: quickwit_actors::Mailbox<A>) -> Self
    where
        A: quickwit_actors::Actor + std::fmt::Debug + Send + 'static,
        ClusterServiceMailbox<A>: ClusterService,
    {
        ClusterServiceClient::new(ClusterServiceMailbox::new(mailbox))
    }
    pub fn tower() -> ClusterServiceTowerLayerStack {
        ClusterServiceTowerLayerStack::default()
    }
    #[cfg(any(test, feature = "testsuite"))]
    pub fn from_mock(mock: MockClusterService) -> Self {
        let mock_wrapper = mock_cluster_service::MockClusterServiceWrapper {
            inner: tokio::sync::Mutex::new(mock),
        };
        Self::new(mock_wrapper)
    }
    #[cfg(any(test, feature = "testsuite"))]
    pub fn mocked() -> Self {
        Self::from_mock(MockClusterService::new())
    }
}
#[async_trait::async_trait]
impl ClusterService for ClusterServiceClient {
    async fn fetch_cluster_state(
        &self,
        request: FetchClusterStateRequest,
    ) -> crate::cluster::ClusterResult<FetchClusterStateResponse> {
        self.inner.0.fetch_cluster_state(request).await
    }
}
#[cfg(any(test, feature = "testsuite"))]
pub mod mock_cluster_service {
    use super::*;
    #[derive(Debug)]
    pub struct MockClusterServiceWrapper {
        pub(super) inner: tokio::sync::Mutex<MockClusterService>,
    }
    #[async_trait::async_trait]
    impl ClusterService for MockClusterServiceWrapper {
        async fn fetch_cluster_state(
            &self,
            request: super::FetchClusterStateRequest,
        ) -> crate::cluster::ClusterResult<super::FetchClusterStateResponse> {
            self.inner.lock().await.fetch_cluster_state(request).await
        }
    }
}
pub type BoxFuture<T, E> = std::pin::Pin<
    Box<dyn std::future::Future<Output = Result<T, E>> + Send + 'static>,
>;
impl tower::Service<FetchClusterStateRequest> for InnerClusterServiceClient {
    type Response = FetchClusterStateResponse;
    type Error = crate::cluster::ClusterError;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, request: FetchClusterStateRequest) -> Self::Future {
        let svc = self.clone();
        let fut = async move { svc.0.fetch_cluster_state(request).await };
        Box::pin(fut)
    }
}
/// A tower service stack is a set of tower services.
#[derive(Debug)]
struct ClusterServiceTowerServiceStack {
    #[allow(dead_code)]
    inner: InnerClusterServiceClient,
    fetch_cluster_state_svc: quickwit_common::tower::BoxService<
        FetchClusterStateRequest,
        FetchClusterStateResponse,
        crate::cluster::ClusterError,
    >,
}
#[async_trait::async_trait]
impl ClusterService for ClusterServiceTowerServiceStack {
    async fn fetch_cluster_state(
        &self,
        request: FetchClusterStateRequest,
    ) -> crate::cluster::ClusterResult<FetchClusterStateResponse> {
        self.fetch_cluster_state_svc.clone().ready().await?.call(request).await
    }
}
type FetchClusterStateLayer = quickwit_common::tower::BoxLayer<
    quickwit_common::tower::BoxService<
        FetchClusterStateRequest,
        FetchClusterStateResponse,
        crate::cluster::ClusterError,
    >,
    FetchClusterStateRequest,
    FetchClusterStateResponse,
    crate::cluster::ClusterError,
>;
#[derive(Debug, Default)]
pub struct ClusterServiceTowerLayerStack {
    fetch_cluster_state_layers: Vec<FetchClusterStateLayer>,
}
impl ClusterServiceTowerLayerStack {
    pub fn stack_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    FetchClusterStateRequest,
                    FetchClusterStateResponse,
                    crate::cluster::ClusterError,
                >,
            > + Clone + Send + Sync + 'static,
        <L as tower::Layer<
            quickwit_common::tower::BoxService<
                FetchClusterStateRequest,
                FetchClusterStateResponse,
                crate::cluster::ClusterError,
            >,
        >>::Service: tower::Service<
                FetchClusterStateRequest,
                Response = FetchClusterStateResponse,
                Error = crate::cluster::ClusterError,
            > + Clone + Send + Sync + 'static,
        <<L as tower::Layer<
            quickwit_common::tower::BoxService<
                FetchClusterStateRequest,
                FetchClusterStateResponse,
                crate::cluster::ClusterError,
            >,
        >>::Service as tower::Service<FetchClusterStateRequest>>::Future: Send + 'static,
    {
        self.fetch_cluster_state_layers
            .push(quickwit_common::tower::BoxLayer::new(layer.clone()));
        self
    }
    pub fn stack_fetch_cluster_state_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    FetchClusterStateRequest,
                    FetchClusterStateResponse,
                    crate::cluster::ClusterError,
                >,
            > + Send + Sync + 'static,
        L::Service: tower::Service<
                FetchClusterStateRequest,
                Response = FetchClusterStateResponse,
                Error = crate::cluster::ClusterError,
            > + Clone + Send + Sync + 'static,
        <L::Service as tower::Service<FetchClusterStateRequest>>::Future: Send + 'static,
    {
        self.fetch_cluster_state_layers
            .push(quickwit_common::tower::BoxLayer::new(layer));
        self
    }
    pub fn build<T>(self, instance: T) -> ClusterServiceClient
    where
        T: ClusterService,
    {
        let inner_client = InnerClusterServiceClient(std::sync::Arc::new(instance));
        self.build_from_inner_client(inner_client)
    }
    pub fn build_from_channel(
        self,
        addr: std::net::SocketAddr,
        channel: tonic::transport::Channel,
        max_message_size: bytesize::ByteSize,
        compression_encoding_opt: Option<tonic::codec::CompressionEncoding>,
    ) -> ClusterServiceClient {
        let client = ClusterServiceClient::from_channel(
            addr,
            channel,
            max_message_size,
            compression_encoding_opt,
        );
        let inner_client = client.inner;
        self.build_from_inner_client(inner_client)
    }
    pub fn build_from_balance_channel(
        self,
        balance_channel: quickwit_common::tower::BalanceChannel<std::net::SocketAddr>,
        max_message_size: bytesize::ByteSize,
        compression_encoding_opt: Option<tonic::codec::CompressionEncoding>,
    ) -> ClusterServiceClient {
        let client = ClusterServiceClient::from_balance_channel(
            balance_channel,
            max_message_size,
            compression_encoding_opt,
        );
        let inner_client = client.inner;
        self.build_from_inner_client(inner_client)
    }
    pub fn build_from_mailbox<A>(
        self,
        mailbox: quickwit_actors::Mailbox<A>,
    ) -> ClusterServiceClient
    where
        A: quickwit_actors::Actor + std::fmt::Debug + Send + 'static,
        ClusterServiceMailbox<A>: ClusterService,
    {
        let inner_client = InnerClusterServiceClient(
            std::sync::Arc::new(ClusterServiceMailbox::new(mailbox)),
        );
        self.build_from_inner_client(inner_client)
    }
    #[cfg(any(test, feature = "testsuite"))]
    pub fn build_from_mock(self, mock: MockClusterService) -> ClusterServiceClient {
        let client = ClusterServiceClient::from_mock(mock);
        let inner_client = client.inner;
        self.build_from_inner_client(inner_client)
    }
    fn build_from_inner_client(
        self,
        inner_client: InnerClusterServiceClient,
    ) -> ClusterServiceClient {
        let fetch_cluster_state_svc = self
            .fetch_cluster_state_layers
            .into_iter()
            .rev()
            .fold(
                quickwit_common::tower::BoxService::new(inner_client.clone()),
                |svc, layer| layer.layer(svc),
            );
        let tower_svc_stack = ClusterServiceTowerServiceStack {
            inner: inner_client,
            fetch_cluster_state_svc,
        };
        ClusterServiceClient::new(tower_svc_stack)
    }
}
#[derive(Debug, Clone)]
struct MailboxAdapter<A: quickwit_actors::Actor, E> {
    inner: quickwit_actors::Mailbox<A>,
    phantom: std::marker::PhantomData<E>,
}
impl<A, E> std::ops::Deref for MailboxAdapter<A, E>
where
    A: quickwit_actors::Actor,
{
    type Target = quickwit_actors::Mailbox<A>;
    fn deref(&self) -> &Self::Target {
        &self.inner
    }
}
#[derive(Debug)]
pub struct ClusterServiceMailbox<A: quickwit_actors::Actor> {
    inner: MailboxAdapter<A, crate::cluster::ClusterError>,
}
impl<A: quickwit_actors::Actor> ClusterServiceMailbox<A> {
    pub fn new(instance: quickwit_actors::Mailbox<A>) -> Self {
        let inner = MailboxAdapter {
            inner: instance,
            phantom: std::marker::PhantomData,
        };
        Self { inner }
    }
}
impl<A: quickwit_actors::Actor> Clone for ClusterServiceMailbox<A> {
    fn clone(&self) -> Self {
        let inner = MailboxAdapter {
            inner: self.inner.clone(),
            phantom: std::marker::PhantomData,
        };
        Self { inner }
    }
}
impl<A, M, T, E> tower::Service<M> for ClusterServiceMailbox<A>
where
    A: quickwit_actors::Actor
        + quickwit_actors::DeferableReplyHandler<M, Reply = Result<T, E>> + Send
        + 'static,
    M: std::fmt::Debug + Send + 'static,
    T: Send + 'static,
    E: std::fmt::Debug + Send + 'static,
    crate::cluster::ClusterError: From<quickwit_actors::AskError<E>>,
{
    type Response = T;
    type Error = crate::cluster::ClusterError;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        //! This does not work with balance middlewares such as `tower::balance::pool::Pool` because
        //! this always returns `Poll::Ready`. The fix is to acquire a permit from the
        //! mailbox in `poll_ready` and consume it in `call`.
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, message: M) -> Self::Future {
        let mailbox = self.inner.clone();
        let fut = async move {
            mailbox.ask_for_res(message).await.map_err(|error| error.into())
        };
        Box::pin(fut)
    }
}
#[async_trait::async_trait]
impl<A> ClusterService for ClusterServiceMailbox<A>
where
    A: quickwit_actors::Actor + std::fmt::Debug,
    ClusterServiceMailbox<
        A,
    >: tower::Service<
        FetchClusterStateRequest,
        Response = FetchClusterStateResponse,
        Error = crate::cluster::ClusterError,
        Future = BoxFuture<FetchClusterStateResponse, crate::cluster::ClusterError>,
    >,
{
    async fn fetch_cluster_state(
        &self,
        request: FetchClusterStateRequest,
    ) -> crate::cluster::ClusterResult<FetchClusterStateResponse> {
        self.clone().call(request).await
    }
}
#[derive(Debug, Clone)]
pub struct ClusterServiceGrpcClientAdapter<T> {
    inner: T,
    #[allow(dead_code)]
    connection_addrs_rx: tokio::sync::watch::Receiver<
        std::collections::HashSet<std::net::SocketAddr>,
    >,
}
impl<T> ClusterServiceGrpcClientAdapter<T> {
    pub fn new(
        instance: T,
        connection_addrs_rx: tokio::sync::watch::Receiver<
            std::collections::HashSet<std::net::SocketAddr>,
        >,
    ) -> Self {
        Self {
            inner: instance,
            connection_addrs_rx,
        }
    }
}
#[async_trait::async_trait]
impl<T> ClusterService
for ClusterServiceGrpcClientAdapter<
    cluster_service_grpc_client::ClusterServiceGrpcClient<T>,
>
where
    T: tonic::client::GrpcService<tonic::body::Body> + std::fmt::Debug + Clone + Send
        + Sync + 'static,
    T::ResponseBody: tonic::codegen::Body<Data = tonic::codegen::Bytes> + Send + 'static,
    <T::ResponseBody as tonic::codegen::Body>::Error: Into<tonic::codegen::StdError>
        + Send,
    T::Future: Send,
{
    async fn fetch_cluster_state(
        &self,
        request: FetchClusterStateRequest,
    ) -> crate::cluster::ClusterResult<FetchClusterStateResponse> {
        self.inner
            .clone()
            .fetch_cluster_state(request)
            .await
            .map(|response| response.into_inner())
            .map_err(|status| crate::error::grpc_status_to_service_error(
                status,
                FetchClusterStateRequest::rpc_name(),
            ))
    }
}
#[derive(Debug)]
pub struct ClusterServiceGrpcServerAdapter {
    inner: InnerClusterServiceClient,
}
impl ClusterServiceGrpcServerAdapter {
    pub fn new<T>(instance: T) -> Self
    where
        T: ClusterService,
    {
        Self {
            inner: InnerClusterServiceClient(std::sync::Arc::new(instance)),
        }
    }
}
#[async_trait::async_trait]
impl cluster_service_grpc_server::ClusterServiceGrpc
for ClusterServiceGrpcServerAdapter {
    async fn fetch_cluster_state(
        &self,
        request: tonic::Request<FetchClusterStateRequest>,
    ) -> Result<tonic::Response<FetchClusterStateResponse>, tonic::Status> {
        self.inner
            .0
            .fetch_cluster_state(request.into_inner())
            .await
            .map(tonic::Response::new)
            .map_err(crate::error::grpc_error_to_grpc_status)
    }
}
/// Generated client implementations.
pub mod cluster_service_grpc_client {
    #![allow(
        unused_variables,
        dead_code,
        missing_docs,
        clippy::wildcard_imports,
        clippy::let_unit_value,
    )]
    use tonic::codegen::*;
    use tonic::codegen::http::Uri;
    #[derive(Debug, Clone)]
    pub struct ClusterServiceGrpcClient<T> {
        inner: tonic::client::Grpc<T>,
    }
    impl ClusterServiceGrpcClient<tonic::transport::Channel> {
        /// Attempt to create a new client by connecting to a given endpoint.
        pub async fn connect<D>(dst: D) -> Result<Self, tonic::transport::Error>
        where
            D: TryInto<tonic::transport::Endpoint>,
            D::Error: Into<StdError>,
        {
            let conn = tonic::transport::Endpoint::new(dst)?.connect().await?;
            Ok(Self::new(conn))
        }
    }
    impl<T> ClusterServiceGrpcClient<T>
    where
        T: tonic::client::GrpcService<tonic::body::Body>,
        T::Error: Into<StdError>,
        T::ResponseBody: Body<Data = Bytes> + std::marker::Send + 'static,
        <T::ResponseBody as Body>::Error: Into<StdError> + std::marker::Send,
    {
        pub fn new(inner: T) -> Self {
            let inner = tonic::client::Grpc::new(inner);
            Self { inner }
        }
        pub fn with_origin(inner: T, origin: Uri) -> Self {
            let inner = tonic::client::Grpc::with_origin(inner, origin);
            Self { inner }
        }
        pub fn with_interceptor<F>(
            inner: T,
            interceptor: F,
        ) -> ClusterServiceGrpcClient<InterceptedService<T, F>>
        where
            F: tonic::service::Interceptor,
            T::ResponseBody: Default,
            T: tonic::codegen::Service<
                http::Request<tonic::body::Body>,
                Response = http::Response<
                    <T as tonic::client::GrpcService<tonic::body::Body>>::ResponseBody,
                >,
            >,
            <T as tonic::codegen::Service<
                http::Request<tonic::body::Body>,
            >>::Error: Into<StdError> + std::marker::Send + std::marker::Sync,
        {
            ClusterServiceGrpcClient::new(InterceptedService::new(inner, interceptor))
        }
        /// Compress requests with the given encoding.
        ///
        /// This requires the server to support it otherwise it might respond with an
        /// error.
        #[must_use]
        pub fn send_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.inner = self.inner.send_compressed(encoding);
            self
        }
        /// Enable decompressing responses.
        #[must_use]
        pub fn accept_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.inner = self.inner.accept_compressed(encoding);
            self
        }
        /// Limits the maximum size of a decoded message.
        ///
        /// Default: `4MB`
        #[must_use]
        pub fn max_decoding_message_size(mut self, limit: usize) -> Self {
            self.inner = self.inner.max_decoding_message_size(limit);
            self
        }
        /// Limits the maximum size of an encoded message.
        ///
        /// Default: `usize::MAX`
        #[must_use]
        pub fn max_encoding_message_size(mut self, limit: usize) -> Self {
            self.inner = self.inner.max_encoding_message_size(limit);
            self
        }
        pub async fn fetch_cluster_state(
            &mut self,
            request: impl tonic::IntoRequest<super::FetchClusterStateRequest>,
        ) -> std::result::Result<
            tonic::Response<super::FetchClusterStateResponse>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/quickwit.cluster.ClusterService/FetchClusterState",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new(
                        "quickwit.cluster.ClusterService",
                        "FetchClusterState",
                    ),
                );
            self.inner.unary(req, path, codec).await
        }
    }
}
/// Generated server implementations.
pub mod cluster_service_grpc_server {
    #![allow(
        unused_variables,
        dead_code,
        missing_docs,
        clippy::wildcard_imports,
        clippy::let_unit_value,
    )]
    use tonic::codegen::*;
    /// Generated trait containing gRPC methods that should be implemented for use with ClusterServiceGrpcServer.
    #[async_trait]
    pub trait ClusterServiceGrpc: std::marker::Send + std::marker::Sync + 'static {
        async fn fetch_cluster_state(
            &self,
            request: tonic::Request<super::FetchClusterStateRequest>,
        ) -> std::result::Result<
            tonic::Response<super::FetchClusterStateResponse>,
            tonic::Status,
        >;
    }
    #[derive(Debug)]
    pub struct ClusterServiceGrpcServer<T> {
        inner: Arc<T>,
        accept_compression_encodings: EnabledCompressionEncodings,
        send_compression_encodings: EnabledCompressionEncodings,
        max_decoding_message_size: Option<usize>,
        max_encoding_message_size: Option<usize>,
    }
    impl<T> ClusterServiceGrpcServer<T> {
        pub fn new(inner: T) -> Self {
            Self::from_arc(Arc::new(inner))
        }
        pub fn from_arc(inner: Arc<T>) -> Self {
            Self {
                inner,
                accept_compression_encodings: Default::default(),
                send_compression_encodings: Default::default(),
                max_decoding_message_size: None,
                max_encoding_message_size: None,
            }
        }
        pub fn with_interceptor<F>(
            inner: T,
            interceptor: F,
        ) -> InterceptedService<Self, F>
        where
            F: tonic::service::Interceptor,
        {
            InterceptedService::new(Self::new(inner), interceptor)
        }
        /// Enable decompressing requests with the given encoding.
        #[must_use]
        pub fn accept_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.accept_compression_encodings.enable(encoding);
            self
        }
        /// Compress responses with the given encoding, if the client supports it.
        #[must_use]
        pub fn send_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.send_compression_encodings.enable(encoding);
            self
        }
        /// Limits the maximum size of a decoded message.
        ///
        /// Default: `4MB`
        #[must_use]
        pub fn max_decoding_message_size(mut self, limit: usize) -> Self {
            self.max_decoding_message_size = Some(limit);
            self
        }
        /// Limits the maximum size of an encoded message.
        ///
        /// Default: `usize::MAX`
        #[must_use]
        pub fn max_encoding_message_size(mut self, limit: usize) -> Self {
            self.max_encoding_message_size = Some(limit);
            self
        }
    }
    impl<T, B> tonic::codegen::Service<http::Request<B>> for ClusterServiceGrpcServer<T>
    where
        T: ClusterServiceGrpc,
        B: Body + std::marker::Send + 'static,
        B::Error: Into<StdError> + std::marker::Send + 'static,
    {
        type Response = http::Response<tonic::body::Body>;
        type Error = std::convert::Infallible;
        type Future = BoxFuture<Self::Response, Self::Error>;
        fn poll_ready(
            &mut self,
            _cx: &mut Context<'_>,
        ) -> Poll<std::result::Result<(), Self::Error>> {
            Poll::Ready(Ok(()))
        }
        fn call(&mut self, req: http::Request<B>) -> Self::Future {
            match req.uri().path() {
                "/quickwit.cluster.ClusterService/FetchClusterState" => {
                    #[allow(non_camel_case_types)]
                    struct FetchClusterStateSvc<T: ClusterServiceGrpc>(pub Arc<T>);
                    impl<
                        T: ClusterServiceGrpc,
                    > tonic::server::UnaryService<super::FetchClusterStateRequest>
                    for FetchClusterStateSvc<T> {
                        type Response = super::FetchClusterStateResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::FetchClusterStateRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as ClusterServiceGrpc>::fetch_cluster_state(
                                        &inner,
                                        request,
                                    )
                                    .await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = FetchClusterStateSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                _ => {
                    Box::pin(async move {
                        let mut response = http::Response::new(
                            tonic::body::Body::default(),
                        );
                        let headers = response.headers_mut();
                        headers
                            .insert(
                                tonic::Status::GRPC_STATUS,
                                (tonic::Code::Unimplemented as i32).into(),
                            );
                        headers
                            .insert(
                                http::header::CONTENT_TYPE,
                                tonic::metadata::GRPC_CONTENT_TYPE,
                            );
                        Ok(response)
                    })
                }
            }
        }
    }
    impl<T> Clone for ClusterServiceGrpcServer<T> {
        fn clone(&self) -> Self {
            let inner = self.inner.clone();
            Self {
                inner,
                accept_compression_encodings: self.accept_compression_encodings,
                send_compression_encodings: self.send_compression_encodings,
                max_decoding_message_size: self.max_decoding_message_size,
                max_encoding_message_size: self.max_encoding_message_size,
            }
        }
    }
    /// Generated gRPC service name
    pub const SERVICE_NAME: &str = "quickwit.cluster.ClusterService";
    impl<T> tonic::server::NamedService for ClusterServiceGrpcServer<T> {
        const NAME: &'static str = SERVICE_NAME;
    }
}


================================================
FILE: quickwit/quickwit-proto/src/codegen/quickwit/quickwit.common.rs
================================================
// This file is @generated by prost-build.
/// The corresponding Rust struct \[`crate::types::DocUid`\] is defined manually and
/// externally provided during code generation (see `build.rs`).
///
/// Modify at your own risk.
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct DocUid {
    /// ULID encoded as a sequence of 16 bytes (big-endian u128).
    #[prost(bytes = "vec", tag = "1")]
    pub doc_uid: ::prost::alloc::vec::Vec<u8>,
}


================================================
FILE: quickwit/quickwit-proto/src/codegen/quickwit/quickwit.control_plane.rs
================================================
// This file is @generated by prost-build.
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct GetOrCreateOpenShardsRequest {
    /// There should be at most one subrequest per index per request.
    #[prost(message, repeated, tag = "1")]
    pub subrequests: ::prost::alloc::vec::Vec<GetOrCreateOpenShardsSubrequest>,
    #[prost(message, repeated, tag = "2")]
    pub closed_shards: ::prost::alloc::vec::Vec<super::ingest::ShardIds>,
    /// The control plane should return shards that are not present on the supplied leaders.
    ///
    /// The control plane does not change the status of those leaders just from this signal.
    /// It will check the status of its own ingester pool.
    #[prost(string, repeated, tag = "3")]
    pub unavailable_leaders: ::prost::alloc::vec::Vec<::prost::alloc::string::String>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct GetOrCreateOpenShardsSubrequest {
    #[prost(uint32, tag = "1")]
    pub subrequest_id: u32,
    #[prost(string, tag = "2")]
    pub index_id: ::prost::alloc::string::String,
    #[prost(string, tag = "3")]
    pub source_id: ::prost::alloc::string::String,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct GetOrCreateOpenShardsResponse {
    #[prost(message, repeated, tag = "1")]
    pub successes: ::prost::alloc::vec::Vec<GetOrCreateOpenShardsSuccess>,
    #[prost(message, repeated, tag = "2")]
    pub failures: ::prost::alloc::vec::Vec<GetOrCreateOpenShardsFailure>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct GetOrCreateOpenShardsSuccess {
    #[prost(uint32, tag = "1")]
    pub subrequest_id: u32,
    #[prost(message, optional, tag = "2")]
    pub index_uid: ::core::option::Option<crate::types::IndexUid>,
    #[prost(string, tag = "3")]
    pub source_id: ::prost::alloc::string::String,
    #[prost(message, repeated, tag = "4")]
    pub open_shards: ::prost::alloc::vec::Vec<super::ingest::Shard>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct GetOrCreateOpenShardsFailure {
    #[prost(uint32, tag = "1")]
    pub subrequest_id: u32,
    #[prost(string, tag = "2")]
    pub index_id: ::prost::alloc::string::String,
    #[prost(string, tag = "3")]
    pub source_id: ::prost::alloc::string::String,
    #[prost(enumeration = "GetOrCreateOpenShardsFailureReason", tag = "4")]
    pub reason: i32,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct AdviseResetShardsRequest {
    #[prost(message, repeated, tag = "1")]
    pub shard_ids: ::prost::alloc::vec::Vec<super::ingest::ShardIds>,
    #[prost(string, tag = "2")]
    pub ingester_id: ::prost::alloc::string::String,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct AdviseResetShardsResponse {
    #[prost(message, repeated, tag = "1")]
    pub shards_to_delete: ::prost::alloc::vec::Vec<super::ingest::ShardIds>,
    #[prost(message, repeated, tag = "2")]
    pub shards_to_truncate: ::prost::alloc::vec::Vec<super::ingest::ShardIdPositions>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[serde(rename_all = "snake_case")]
#[derive(Clone, Copy, Debug, PartialEq, Eq, Hash, PartialOrd, Ord, ::prost::Enumeration)]
#[repr(i32)]
pub enum GetOrCreateOpenShardsFailureReason {
    Unspecified = 0,
    IndexNotFound = 1,
    SourceNotFound = 2,
    NoIngestersAvailable = 3,
}
impl GetOrCreateOpenShardsFailureReason {
    /// String value of the enum field names used in the ProtoBuf definition.
    ///
    /// The values are not transformed in any way and thus are considered stable
    /// (if the ProtoBuf definition does not change) and safe for programmatic use.
    pub fn as_str_name(&self) -> &'static str {
        match self {
            Self::Unspecified => "GET_OR_CREATE_OPEN_SHARDS_FAILURE_REASON_UNSPECIFIED",
            Self::IndexNotFound => {
                "GET_OR_CREATE_OPEN_SHARDS_FAILURE_REASON_INDEX_NOT_FOUND"
            }
            Self::SourceNotFound => {
                "GET_OR_CREATE_OPEN_SHARDS_FAILURE_REASON_SOURCE_NOT_FOUND"
            }
            Self::NoIngestersAvailable => {
                "GET_OR_CREATE_OPEN_SHARDS_FAILURE_REASON_NO_INGESTERS_AVAILABLE"
            }
        }
    }
    /// Creates an enum from field names used in the ProtoBuf definition.
    pub fn from_str_name(value: &str) -> ::core::option::Option<Self> {
        match value {
            "GET_OR_CREATE_OPEN_SHARDS_FAILURE_REASON_UNSPECIFIED" => {
                Some(Self::Unspecified)
            }
            "GET_OR_CREATE_OPEN_SHARDS_FAILURE_REASON_INDEX_NOT_FOUND" => {
                Some(Self::IndexNotFound)
            }
            "GET_OR_CREATE_OPEN_SHARDS_FAILURE_REASON_SOURCE_NOT_FOUND" => {
                Some(Self::SourceNotFound)
            }
            "GET_OR_CREATE_OPEN_SHARDS_FAILURE_REASON_NO_INGESTERS_AVAILABLE" => {
                Some(Self::NoIngestersAvailable)
            }
            _ => None,
        }
    }
}
/// BEGIN quickwit-codegen
#[allow(unused_imports)]
use std::str::FromStr;
use tower::{Layer, Service, ServiceExt};
#[cfg_attr(any(test, feature = "testsuite"), mockall::automock)]
#[async_trait::async_trait]
pub trait ControlPlaneService: std::fmt::Debug + Send + Sync + 'static {
    ///Creates a new index.
    async fn create_index(
        &self,
        request: super::metastore::CreateIndexRequest,
    ) -> crate::control_plane::ControlPlaneResult<super::metastore::CreateIndexResponse>;
    ///Updates an index.
    async fn update_index(
        &self,
        request: super::metastore::UpdateIndexRequest,
    ) -> crate::control_plane::ControlPlaneResult<
        super::metastore::IndexMetadataResponse,
    >;
    ///Deletes an index.
    async fn delete_index(
        &self,
        request: super::metastore::DeleteIndexRequest,
    ) -> crate::control_plane::ControlPlaneResult<super::metastore::EmptyResponse>;
    ///Adds a source to an index.
    async fn add_source(
        &self,
        request: super::metastore::AddSourceRequest,
    ) -> crate::control_plane::ControlPlaneResult<super::metastore::EmptyResponse>;
    ///Update a source.
    async fn update_source(
        &self,
        request: super::metastore::UpdateSourceRequest,
    ) -> crate::control_plane::ControlPlaneResult<super::metastore::EmptyResponse>;
    ///Enables or disables a source.
    async fn toggle_source(
        &self,
        request: super::metastore::ToggleSourceRequest,
    ) -> crate::control_plane::ControlPlaneResult<super::metastore::EmptyResponse>;
    ///Removes a source from an index.
    async fn delete_source(
        &self,
        request: super::metastore::DeleteSourceRequest,
    ) -> crate::control_plane::ControlPlaneResult<super::metastore::EmptyResponse>;
    ///Returns the list of open shards for one or several sources. If the control plane is not able to find any
    ///for a source, it will pick a pair of leader-follower ingesters and will open a new shard.
    async fn get_or_create_open_shards(
        &self,
        request: GetOrCreateOpenShardsRequest,
    ) -> crate::control_plane::ControlPlaneResult<GetOrCreateOpenShardsResponse>;
    ///Asks the control plane whether the shards listed in the request should be deleted or truncated.
    async fn advise_reset_shards(
        &self,
        request: AdviseResetShardsRequest,
    ) -> crate::control_plane::ControlPlaneResult<AdviseResetShardsResponse>;
    ///Performs a debounced shard pruning request to the metastore.
    async fn prune_shards(
        &self,
        request: super::metastore::PruneShardsRequest,
    ) -> crate::control_plane::ControlPlaneResult<super::metastore::EmptyResponse>;
}
#[derive(Debug, Clone)]
pub struct ControlPlaneServiceClient {
    inner: InnerControlPlaneServiceClient,
}
#[derive(Debug, Clone)]
struct InnerControlPlaneServiceClient(std::sync::Arc<dyn ControlPlaneService>);
impl ControlPlaneServiceClient {
    pub fn new<T>(instance: T) -> Self
    where
        T: ControlPlaneService,
    {
        #[cfg(any(test, feature = "testsuite"))]
        assert!(
            std::any::TypeId::of:: < T > () != std::any::TypeId::of:: <
            MockControlPlaneService > (),
            "`MockControlPlaneService` must be wrapped in a `MockControlPlaneServiceWrapper`: use `ControlPlaneServiceClient::from_mock(mock)` to instantiate the client"
        );
        Self {
            inner: InnerControlPlaneServiceClient(std::sync::Arc::new(instance)),
        }
    }
    pub fn as_grpc_service(
        &self,
        max_message_size: bytesize::ByteSize,
    ) -> control_plane_service_grpc_server::ControlPlaneServiceGrpcServer<
        ControlPlaneServiceGrpcServerAdapter,
    > {
        let adapter = ControlPlaneServiceGrpcServerAdapter::new(self.clone());
        control_plane_service_grpc_server::ControlPlaneServiceGrpcServer::new(adapter)
            .accept_compressed(tonic::codec::CompressionEncoding::Gzip)
            .accept_compressed(tonic::codec::CompressionEncoding::Zstd)
            .send_compressed(tonic::codec::CompressionEncoding::Gzip)
            .send_compressed(tonic::codec::CompressionEncoding::Zstd)
            .max_decoding_message_size(max_message_size.0 as usize)
            .max_encoding_message_size(max_message_size.0 as usize)
    }
    pub fn from_channel(
        addr: std::net::SocketAddr,
        channel: tonic::transport::Channel,
        max_message_size: bytesize::ByteSize,
        compression_encoding_opt: Option<tonic::codec::CompressionEncoding>,
    ) -> Self {
        let (_, connection_keys_watcher) = tokio::sync::watch::channel(
            std::collections::HashSet::from_iter([addr]),
        );
        let mut client = control_plane_service_grpc_client::ControlPlaneServiceGrpcClient::new(
                channel,
            )
            .max_decoding_message_size(max_message_size.0 as usize)
            .max_encoding_message_size(max_message_size.0 as usize);
        if let Some(compression_encoding) = compression_encoding_opt {
            client = client
                .accept_compressed(compression_encoding)
                .send_compressed(compression_encoding);
        }
        let adapter = ControlPlaneServiceGrpcClientAdapter::new(
            client,
            connection_keys_watcher,
        );
        Self::new(adapter)
    }
    pub fn from_balance_channel(
        balance_channel: quickwit_common::tower::BalanceChannel<std::net::SocketAddr>,
        max_message_size: bytesize::ByteSize,
        compression_encoding_opt: Option<tonic::codec::CompressionEncoding>,
    ) -> ControlPlaneServiceClient {
        let connection_keys_watcher = balance_channel.connection_keys_watcher();
        let mut client = control_plane_service_grpc_client::ControlPlaneServiceGrpcClient::new(
                balance_channel,
            )
            .max_decoding_message_size(max_message_size.0 as usize)
            .max_encoding_message_size(max_message_size.0 as usize);
        if let Some(compression_encoding) = compression_encoding_opt {
            client = client
                .accept_compressed(compression_encoding)
                .send_compressed(compression_encoding);
        }
        let adapter = ControlPlaneServiceGrpcClientAdapter::new(
            client,
            connection_keys_watcher,
        );
        Self::new(adapter)
    }
    pub fn from_mailbox<A>(mailbox: quickwit_actors::Mailbox<A>) -> Self
    where
        A: quickwit_actors::Actor + std::fmt::Debug + Send + 'static,
        ControlPlaneServiceMailbox<A>: ControlPlaneService,
    {
        ControlPlaneServiceClient::new(ControlPlaneServiceMailbox::new(mailbox))
    }
    pub fn tower() -> ControlPlaneServiceTowerLayerStack {
        ControlPlaneServiceTowerLayerStack::default()
    }
    #[cfg(any(test, feature = "testsuite"))]
    pub fn from_mock(mock: MockControlPlaneService) -> Self {
        let mock_wrapper = mock_control_plane_service::MockControlPlaneServiceWrapper {
            inner: tokio::sync::Mutex::new(mock),
        };
        Self::new(mock_wrapper)
    }
    #[cfg(any(test, feature = "testsuite"))]
    pub fn mocked() -> Self {
        Self::from_mock(MockControlPlaneService::new())
    }
}
#[async_trait::async_trait]
impl ControlPlaneService for ControlPlaneServiceClient {
    async fn create_index(
        &self,
        request: super::metastore::CreateIndexRequest,
    ) -> crate::control_plane::ControlPlaneResult<
        super::metastore::CreateIndexResponse,
    > {
        self.inner.0.create_index(request).await
    }
    async fn update_index(
        &self,
        request: super::metastore::UpdateIndexRequest,
    ) -> crate::control_plane::ControlPlaneResult<
        super::metastore::IndexMetadataResponse,
    > {
        self.inner.0.update_index(request).await
    }
    async fn delete_index(
        &self,
        request: super::metastore::DeleteIndexRequest,
    ) -> crate::control_plane::ControlPlaneResult<super::metastore::EmptyResponse> {
        self.inner.0.delete_index(request).await
    }
    async fn add_source(
        &self,
        request: super::metastore::AddSourceRequest,
    ) -> crate::control_plane::ControlPlaneResult<super::metastore::EmptyResponse> {
        self.inner.0.add_source(request).await
    }
    async fn update_source(
        &self,
        request: super::metastore::UpdateSourceRequest,
    ) -> crate::control_plane::ControlPlaneResult<super::metastore::EmptyResponse> {
        self.inner.0.update_source(request).await
    }
    async fn toggle_source(
        &self,
        request: super::metastore::ToggleSourceRequest,
    ) -> crate::control_plane::ControlPlaneResult<super::metastore::EmptyResponse> {
        self.inner.0.toggle_source(request).await
    }
    async fn delete_source(
        &self,
        request: super::metastore::DeleteSourceRequest,
    ) -> crate::control_plane::ControlPlaneResult<super::metastore::EmptyResponse> {
        self.inner.0.delete_source(request).await
    }
    async fn get_or_create_open_shards(
        &self,
        request: GetOrCreateOpenShardsRequest,
    ) -> crate::control_plane::ControlPlaneResult<GetOrCreateOpenShardsResponse> {
        self.inner.0.get_or_create_open_shards(request).await
    }
    async fn advise_reset_shards(
        &self,
        request: AdviseResetShardsRequest,
    ) -> crate::control_plane::ControlPlaneResult<AdviseResetShardsResponse> {
        self.inner.0.advise_reset_shards(request).await
    }
    async fn prune_shards(
        &self,
        request: super::metastore::PruneShardsRequest,
    ) -> crate::control_plane::ControlPlaneResult<super::metastore::EmptyResponse> {
        self.inner.0.prune_shards(request).await
    }
}
#[cfg(any(test, feature = "testsuite"))]
pub mod mock_control_plane_service {
    use super::*;
    #[derive(Debug)]
    pub struct MockControlPlaneServiceWrapper {
        pub(super) inner: tokio::sync::Mutex<MockControlPlaneService>,
    }
    #[async_trait::async_trait]
    impl ControlPlaneService for MockControlPlaneServiceWrapper {
        async fn create_index(
            &self,
            request: super::super::metastore::CreateIndexRequest,
        ) -> crate::control_plane::ControlPlaneResult<
            super::super::metastore::CreateIndexResponse,
        > {
            self.inner.lock().await.create_index(request).await
        }
        async fn update_index(
            &self,
            request: super::super::metastore::UpdateIndexRequest,
        ) -> crate::control_plane::ControlPlaneResult<
            super::super::metastore::IndexMetadataResponse,
        > {
            self.inner.lock().await.update_index(request).await
        }
        async fn delete_index(
            &self,
            request: super::super::metastore::DeleteIndexRequest,
        ) -> crate::control_plane::ControlPlaneResult<
            super::super::metastore::EmptyResponse,
        > {
            self.inner.lock().await.delete_index(request).await
        }
        async fn add_source(
            &self,
            request: super::super::metastore::AddSourceRequest,
        ) -> crate::control_plane::ControlPlaneResult<
            super::super::metastore::EmptyResponse,
        > {
            self.inner.lock().await.add_source(request).await
        }
        async fn update_source(
            &self,
            request: super::super::metastore::UpdateSourceRequest,
        ) -> crate::control_plane::ControlPlaneResult<
            super::super::metastore::EmptyResponse,
        > {
            self.inner.lock().await.update_source(request).await
        }
        async fn toggle_source(
            &self,
            request: super::super::metastore::ToggleSourceRequest,
        ) -> crate::control_plane::ControlPlaneResult<
            super::super::metastore::EmptyResponse,
        > {
            self.inner.lock().await.toggle_source(request).await
        }
        async fn delete_source(
            &self,
            request: super::super::metastore::DeleteSourceRequest,
        ) -> crate::control_plane::ControlPlaneResult<
            super::super::metastore::EmptyResponse,
        > {
            self.inner.lock().await.delete_source(request).await
        }
        async fn get_or_create_open_shards(
            &self,
            request: super::GetOrCreateOpenShardsRequest,
        ) -> crate::control_plane::ControlPlaneResult<
            super::GetOrCreateOpenShardsResponse,
        > {
            self.inner.lock().await.get_or_create_open_shards(request).await
        }
        async fn advise_reset_shards(
            &self,
            request: super::AdviseResetShardsRequest,
        ) -> crate::control_plane::ControlPlaneResult<super::AdviseResetShardsResponse> {
            self.inner.lock().await.advise_reset_shards(request).await
        }
        async fn prune_shards(
            &self,
            request: super::super::metastore::PruneShardsRequest,
        ) -> crate::control_plane::ControlPlaneResult<
            super::super::metastore::EmptyResponse,
        > {
            self.inner.lock().await.prune_shards(request).await
        }
    }
}
pub type BoxFuture<T, E> = std::pin::Pin<
    Box<dyn std::future::Future<Output = Result<T, E>> + Send + 'static>,
>;
impl tower::Service<super::metastore::CreateIndexRequest>
for InnerControlPlaneServiceClient {
    type Response = super::metastore::CreateIndexResponse;
    type Error = crate::control_plane::ControlPlaneError;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, request: super::metastore::CreateIndexRequest) -> Self::Future {
        let svc = self.clone();
        let fut = async move { svc.0.create_index(request).await };
        Box::pin(fut)
    }
}
impl tower::Service<super::metastore::UpdateIndexRequest>
for InnerControlPlaneServiceClient {
    type Response = super::metastore::IndexMetadataResponse;
    type Error = crate::control_plane::ControlPlaneError;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, request: super::metastore::UpdateIndexRequest) -> Self::Future {
        let svc = self.clone();
        let fut = async move { svc.0.update_index(request).await };
        Box::pin(fut)
    }
}
impl tower::Service<super::metastore::DeleteIndexRequest>
for InnerControlPlaneServiceClient {
    type Response = super::metastore::EmptyResponse;
    type Error = crate::control_plane::ControlPlaneError;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, request: super::metastore::DeleteIndexRequest) -> Self::Future {
        let svc = self.clone();
        let fut = async move { svc.0.delete_index(request).await };
        Box::pin(fut)
    }
}
impl tower::Service<super::metastore::AddSourceRequest>
for InnerControlPlaneServiceClient {
    type Response = super::metastore::EmptyResponse;
    type Error = crate::control_plane::ControlPlaneError;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, request: super::metastore::AddSourceRequest) -> Self::Future {
        let svc = self.clone();
        let fut = async move { svc.0.add_source(request).await };
        Box::pin(fut)
    }
}
impl tower::Service<super::metastore::UpdateSourceRequest>
for InnerControlPlaneServiceClient {
    type Response = super::metastore::EmptyResponse;
    type Error = crate::control_plane::ControlPlaneError;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, request: super::metastore::UpdateSourceRequest) -> Self::Future {
        let svc = self.clone();
        let fut = async move { svc.0.update_source(request).await };
        Box::pin(fut)
    }
}
impl tower::Service<super::metastore::ToggleSourceRequest>
for InnerControlPlaneServiceClient {
    type Response = super::metastore::EmptyResponse;
    type Error = crate::control_plane::ControlPlaneError;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, request: super::metastore::ToggleSourceRequest) -> Self::Future {
        let svc = self.clone();
        let fut = async move { svc.0.toggle_source(request).await };
        Box::pin(fut)
    }
}
impl tower::Service<super::metastore::DeleteSourceRequest>
for InnerControlPlaneServiceClient {
    type Response = super::metastore::EmptyResponse;
    type Error = crate::control_plane::ControlPlaneError;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, request: super::metastore::DeleteSourceRequest) -> Self::Future {
        let svc = self.clone();
        let fut = async move { svc.0.delete_source(request).await };
        Box::pin(fut)
    }
}
impl tower::Service<GetOrCreateOpenShardsRequest> for InnerControlPlaneServiceClient {
    type Response = GetOrCreateOpenShardsResponse;
    type Error = crate::control_plane::ControlPlaneError;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, request: GetOrCreateOpenShardsRequest) -> Self::Future {
        let svc = self.clone();
        let fut = async move { svc.0.get_or_create_open_shards(request).await };
        Box::pin(fut)
    }
}
impl tower::Service<AdviseResetShardsRequest> for InnerControlPlaneServiceClient {
    type Response = AdviseResetShardsResponse;
    type Error = crate::control_plane::ControlPlaneError;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, request: AdviseResetShardsRequest) -> Self::Future {
        let svc = self.clone();
        let fut = async move { svc.0.advise_reset_shards(request).await };
        Box::pin(fut)
    }
}
impl tower::Service<super::metastore::PruneShardsRequest>
for InnerControlPlaneServiceClient {
    type Response = super::metastore::EmptyResponse;
    type Error = crate::control_plane::ControlPlaneError;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, request: super::metastore::PruneShardsRequest) -> Self::Future {
        let svc = self.clone();
        let fut = async move { svc.0.prune_shards(request).await };
        Box::pin(fut)
    }
}
/// A tower service stack is a set of tower services.
#[derive(Debug)]
struct ControlPlaneServiceTowerServiceStack {
    #[allow(dead_code)]
    inner: InnerControlPlaneServiceClient,
    create_index_svc: quickwit_common::tower::BoxService<
        super::metastore::CreateIndexRequest,
        super::metastore::CreateIndexResponse,
        crate::control_plane::ControlPlaneError,
    >,
    update_index_svc: quickwit_common::tower::BoxService<
        super::metastore::UpdateIndexRequest,
        super::metastore::IndexMetadataResponse,
        crate::control_plane::ControlPlaneError,
    >,
    delete_index_svc: quickwit_common::tower::BoxService<
        super::metastore::DeleteIndexRequest,
        super::metastore::EmptyResponse,
        crate::control_plane::ControlPlaneError,
    >,
    add_source_svc: quickwit_common::tower::BoxService<
        super::metastore::AddSourceRequest,
        super::metastore::EmptyResponse,
        crate::control_plane::ControlPlaneError,
    >,
    update_source_svc: quickwit_common::tower::BoxService<
        super::metastore::UpdateSourceRequest,
        super::metastore::EmptyResponse,
        crate::control_plane::ControlPlaneError,
    >,
    toggle_source_svc: quickwit_common::tower::BoxService<
        super::metastore::ToggleSourceRequest,
        super::metastore::EmptyResponse,
        crate::control_plane::ControlPlaneError,
    >,
    delete_source_svc: quickwit_common::tower::BoxService<
        super::metastore::DeleteSourceRequest,
        super::metastore::EmptyResponse,
        crate::control_plane::ControlPlaneError,
    >,
    get_or_create_open_shards_svc: quickwit_common::tower::BoxService<
        GetOrCreateOpenShardsRequest,
        GetOrCreateOpenShardsResponse,
        crate::control_plane::ControlPlaneError,
    >,
    advise_reset_shards_svc: quickwit_common::tower::BoxService<
        AdviseResetShardsRequest,
        AdviseResetShardsResponse,
        crate::control_plane::ControlPlaneError,
    >,
    prune_shards_svc: quickwit_common::tower::BoxService<
        super::metastore::PruneShardsRequest,
        super::metastore::EmptyResponse,
        crate::control_plane::ControlPlaneError,
    >,
}
#[async_trait::async_trait]
impl ControlPlaneService for ControlPlaneServiceTowerServiceStack {
    async fn create_index(
        &self,
        request: super::metastore::CreateIndexRequest,
    ) -> crate::control_plane::ControlPlaneResult<
        super::metastore::CreateIndexResponse,
    > {
        self.create_index_svc.clone().ready().await?.call(request).await
    }
    async fn update_index(
        &self,
        request: super::metastore::UpdateIndexRequest,
    ) -> crate::control_plane::ControlPlaneResult<
        super::metastore::IndexMetadataResponse,
    > {
        self.update_index_svc.clone().ready().await?.call(request).await
    }
    async fn delete_index(
        &self,
        request: super::metastore::DeleteIndexRequest,
    ) -> crate::control_plane::ControlPlaneResult<super::metastore::EmptyResponse> {
        self.delete_index_svc.clone().ready().await?.call(request).await
    }
    async fn add_source(
        &self,
        request: super::metastore::AddSourceRequest,
    ) -> crate::control_plane::ControlPlaneResult<super::metastore::EmptyResponse> {
        self.add_source_svc.clone().ready().await?.call(request).await
    }
    async fn update_source(
        &self,
        request: super::metastore::UpdateSourceRequest,
    ) -> crate::control_plane::ControlPlaneResult<super::metastore::EmptyResponse> {
        self.update_source_svc.clone().ready().await?.call(request).await
    }
    async fn toggle_source(
        &self,
        request: super::metastore::ToggleSourceRequest,
    ) -> crate::control_plane::ControlPlaneResult<super::metastore::EmptyResponse> {
        self.toggle_source_svc.clone().ready().await?.call(request).await
    }
    async fn delete_source(
        &self,
        request: super::metastore::DeleteSourceRequest,
    ) -> crate::control_plane::ControlPlaneResult<super::metastore::EmptyResponse> {
        self.delete_source_svc.clone().ready().await?.call(request).await
    }
    async fn get_or_create_open_shards(
        &self,
        request: GetOrCreateOpenShardsRequest,
    ) -> crate::control_plane::ControlPlaneResult<GetOrCreateOpenShardsResponse> {
        self.get_or_create_open_shards_svc.clone().ready().await?.call(request).await
    }
    async fn advise_reset_shards(
        &self,
        request: AdviseResetShardsRequest,
    ) -> crate::control_plane::ControlPlaneResult<AdviseResetShardsResponse> {
        self.advise_reset_shards_svc.clone().ready().await?.call(request).await
    }
    async fn prune_shards(
        &self,
        request: super::metastore::PruneShardsRequest,
    ) -> crate::control_plane::ControlPlaneResult<super::metastore::EmptyResponse> {
        self.prune_shards_svc.clone().ready().await?.call(request).await
    }
}
type CreateIndexLayer = quickwit_common::tower::BoxLayer<
    quickwit_common::tower::BoxService<
        super::metastore::CreateIndexRequest,
        super::metastore::CreateIndexResponse,
        crate::control_plane::ControlPlaneError,
    >,
    super::metastore::CreateIndexRequest,
    super::metastore::CreateIndexResponse,
    crate::control_plane::ControlPlaneError,
>;
type UpdateIndexLayer = quickwit_common::tower::BoxLayer<
    quickwit_common::tower::BoxService<
        super::metastore::UpdateIndexRequest,
        super::metastore::IndexMetadataResponse,
        crate::control_plane::ControlPlaneError,
    >,
    super::metastore::UpdateIndexRequest,
    super::metastore::IndexMetadataResponse,
    crate::control_plane::ControlPlaneError,
>;
type DeleteIndexLayer = quickwit_common::tower::BoxLayer<
    quickwit_common::tower::BoxService<
        super::metastore::DeleteIndexRequest,
        super::metastore::EmptyResponse,
        crate::control_plane::ControlPlaneError,
    >,
    super::metastore::DeleteIndexRequest,
    super::metastore::EmptyResponse,
    crate::control_plane::ControlPlaneError,
>;
type AddSourceLayer = quickwit_common::tower::BoxLayer<
    quickwit_common::tower::BoxService<
        super::metastore::AddSourceRequest,
        super::metastore::EmptyResponse,
        crate::control_plane::ControlPlaneError,
    >,
    super::metastore::AddSourceRequest,
    super::metastore::EmptyResponse,
    crate::control_plane::ControlPlaneError,
>;
type UpdateSourceLayer = quickwit_common::tower::BoxLayer<
    quickwit_common::tower::BoxService<
        super::metastore::UpdateSourceRequest,
        super::metastore::EmptyResponse,
        crate::control_plane::ControlPlaneError,
    >,
    super::metastore::UpdateSourceRequest,
    super::metastore::EmptyResponse,
    crate::control_plane::ControlPlaneError,
>;
type ToggleSourceLayer = quickwit_common::tower::BoxLayer<
    quickwit_common::tower::BoxService<
        super::metastore::ToggleSourceRequest,
        super::metastore::EmptyResponse,
        crate::control_plane::ControlPlaneError,
    >,
    super::metastore::ToggleSourceRequest,
    super::metastore::EmptyResponse,
    crate::control_plane::ControlPlaneError,
>;
type DeleteSourceLayer = quickwit_common::tower::BoxLayer<
    quickwit_common::tower::BoxService<
        super::metastore::DeleteSourceRequest,
        super::metastore::EmptyResponse,
        crate::control_plane::ControlPlaneError,
    >,
    super::metastore::DeleteSourceRequest,
    super::metastore::EmptyResponse,
    crate::control_plane::ControlPlaneError,
>;
type GetOrCreateOpenShardsLayer = quickwit_common::tower::BoxLayer<
    quickwit_common::tower::BoxService<
        GetOrCreateOpenShardsRequest,
        GetOrCreateOpenShardsResponse,
        crate::control_plane::ControlPlaneError,
    >,
    GetOrCreateOpenShardsRequest,
    GetOrCreateOpenShardsResponse,
    crate::control_plane::ControlPlaneError,
>;
type AdviseResetShardsLayer = quickwit_common::tower::BoxLayer<
    quickwit_common::tower::BoxService<
        AdviseResetShardsRequest,
        AdviseResetShardsResponse,
        crate::control_plane::ControlPlaneError,
    >,
    AdviseResetShardsRequest,
    AdviseResetShardsResponse,
    crate::control_plane::ControlPlaneError,
>;
type PruneShardsLayer = quickwit_common::tower::BoxLayer<
    quickwit_common::tower::BoxService<
        super::metastore::PruneShardsRequest,
        super::metastore::EmptyResponse,
        crate::control_plane::ControlPlaneError,
    >,
    super::metastore::PruneShardsRequest,
    super::metastore::EmptyResponse,
    crate::control_plane::ControlPlaneError,
>;
#[derive(Debug, Default)]
pub struct ControlPlaneServiceTowerLayerStack {
    create_index_layers: Vec<CreateIndexLayer>,
    update_index_layers: Vec<UpdateIndexLayer>,
    delete_index_layers: Vec<DeleteIndexLayer>,
    add_source_layers: Vec<AddSourceLayer>,
    update_source_layers: Vec<UpdateSourceLayer>,
    toggle_source_layers: Vec<ToggleSourceLayer>,
    delete_source_layers: Vec<DeleteSourceLayer>,
    get_or_create_open_shards_layers: Vec<GetOrCreateOpenShardsLayer>,
    advise_reset_shards_layers: Vec<AdviseResetShardsLayer>,
    prune_shards_layers: Vec<PruneShardsLayer>,
}
impl ControlPlaneServiceTowerLayerStack {
    pub fn stack_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    super::metastore::CreateIndexRequest,
                    super::metastore::CreateIndexResponse,
                    crate::control_plane::ControlPlaneError,
                >,
            > + Clone + Send + Sync + 'static,
        <L as tower::Layer<
            quickwit_common::tower::BoxService<
                super::metastore::CreateIndexRequest,
                super::metastore::CreateIndexResponse,
                crate::control_plane::ControlPlaneError,
            >,
        >>::Service: tower::Service<
                super::metastore::CreateIndexRequest,
                Response = super::metastore::CreateIndexResponse,
                Error = crate::control_plane::ControlPlaneError,
            > + Clone + Send + Sync + 'static,
        <<L as tower::Layer<
            quickwit_common::tower::BoxService<
                super::metastore::CreateIndexRequest,
                super::metastore::CreateIndexResponse,
                crate::control_plane::ControlPlaneError,
            >,
        >>::Service as tower::Service<
            super::metastore::CreateIndexRequest,
        >>::Future: Send + 'static,
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    super::metastore::UpdateIndexRequest,
                    super::metastore::IndexMetadataResponse,
                    crate::control_plane::ControlPlaneError,
                >,
            > + Clone + Send + Sync + 'static,
        <L as tower::Layer<
            quickwit_common::tower::BoxService<
                super::metastore::UpdateIndexRequest,
                super::metastore::IndexMetadataResponse,
                crate::control_plane::ControlPlaneError,
            >,
        >>::Service: tower::Service<
                super::metastore::UpdateIndexRequest,
                Response = super::metastore::IndexMetadataResponse,
                Error = crate::control_plane::ControlPlaneError,
            > + Clone + Send + Sync + 'static,
        <<L as tower::Layer<
            quickwit_common::tower::BoxService<
                super::metastore::UpdateIndexRequest,
                super::metastore::IndexMetadataResponse,
                crate::control_plane::ControlPlaneError,
            >,
        >>::Service as tower::Service<
            super::metastore::UpdateIndexRequest,
        >>::Future: Send + 'static,
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    super::metastore::DeleteIndexRequest,
                    super::metastore::EmptyResponse,
                    crate::control_plane::ControlPlaneError,
                >,
            > + Clone + Send + Sync + 'static,
        <L as tower::Layer<
            quickwit_common::tower::BoxService<
                super::metastore::DeleteIndexRequest,
                super::metastore::EmptyResponse,
                crate::control_plane::ControlPlaneError,
            >,
        >>::Service: tower::Service<
                super::metastore::DeleteIndexRequest,
                Response = super::metastore::EmptyResponse,
                Error = crate::control_plane::ControlPlaneError,
            > + Clone + Send + Sync + 'static,
        <<L as tower::Layer<
            quickwit_common::tower::BoxService<
                super::metastore::DeleteIndexRequest,
                super::metastore::EmptyResponse,
                crate::control_plane::ControlPlaneError,
            >,
        >>::Service as tower::Service<
            super::metastore::DeleteIndexRequest,
        >>::Future: Send + 'static,
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    super::metastore::AddSourceRequest,
                    super::metastore::EmptyResponse,
                    crate::control_plane::ControlPlaneError,
                >,
            > + Clone + Send + Sync + 'static,
        <L as tower::Layer<
            quickwit_common::tower::BoxService<
                super::metastore::AddSourceRequest,
                super::metastore::EmptyResponse,
                crate::control_plane::ControlPlaneError,
            >,
        >>::Service: tower::Service<
                super::metastore::AddSourceRequest,
                Response = super::metastore::EmptyResponse,
                Error = crate::control_plane::ControlPlaneError,
            > + Clone + Send + Sync + 'static,
        <<L as tower::Layer<
            quickwit_common::tower::BoxService<
                super::metastore::AddSourceRequest,
                super::metastore::EmptyResponse,
                crate::control_plane::ControlPlaneError,
            >,
        >>::Service as tower::Service<
            super::metastore::AddSourceRequest,
        >>::Future: Send + 'static,
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    super::metastore::UpdateSourceRequest,
                    super::metastore::EmptyResponse,
                    crate::control_plane::ControlPlaneError,
                >,
            > + Clone + Send + Sync + 'static,
        <L as tower::Layer<
            quickwit_common::tower::BoxService<
                super::metastore::UpdateSourceRequest,
                super::metastore::EmptyResponse,
                crate::control_plane::ControlPlaneError,
            >,
        >>::Service: tower::Service<
                super::metastore::UpdateSourceRequest,
                Response = super::metastore::EmptyResponse,
                Error = crate::control_plane::ControlPlaneError,
            > + Clone + Send + Sync + 'static,
        <<L as tower::Layer<
            quickwit_common::tower::BoxService<
                super::metastore::UpdateSourceRequest,
                super::metastore::EmptyResponse,
                crate::control_plane::ControlPlaneError,
            >,
        >>::Service as tower::Service<
            super::metastore::UpdateSourceRequest,
        >>::Future: Send + 'static,
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    super::metastore::ToggleSourceRequest,
                    super::metastore::EmptyResponse,
                    crate::control_plane::ControlPlaneError,
                >,
            > + Clone + Send + Sync + 'static,
        <L as tower::Layer<
            quickwit_common::tower::BoxService<
                super::metastore::ToggleSourceRequest,
                super::metastore::EmptyResponse,
                crate::control_plane::ControlPlaneError,
            >,
        >>::Service: tower::Service<
                super::metastore::ToggleSourceRequest,
                Response = super::metastore::EmptyResponse,
                Error = crate::control_plane::ControlPlaneError,
            > + Clone + Send + Sync + 'static,
        <<L as tower::Layer<
            quickwit_common::tower::BoxService<
                super::metastore::ToggleSourceRequest,
                super::metastore::EmptyResponse,
                crate::control_plane::ControlPlaneError,
            >,
        >>::Service as tower::Service<
            super::metastore::ToggleSourceRequest,
        >>::Future: Send + 'static,
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    super::metastore::DeleteSourceRequest,
                    super::metastore::EmptyResponse,
                    crate::control_plane::ControlPlaneError,
                >,
            > + Clone + Send + Sync + 'static,
        <L as tower::Layer<
            quickwit_common::tower::BoxService<
                super::metastore::DeleteSourceRequest,
                super::metastore::EmptyResponse,
                crate::control_plane::ControlPlaneError,
            >,
        >>::Service: tower::Service<
                super::metastore::DeleteSourceRequest,
                Response = super::metastore::EmptyResponse,
                Error = crate::control_plane::ControlPlaneError,
            > + Clone + Send + Sync + 'static,
        <<L as tower::Layer<
            quickwit_common::tower::BoxService<
                super::metastore::DeleteSourceRequest,
                super::metastore::EmptyResponse,
                crate::control_plane::ControlPlaneError,
            >,
        >>::Service as tower::Service<
            super::metastore::DeleteSourceRequest,
        >>::Future: Send + 'static,
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    GetOrCreateOpenShardsRequest,
                    GetOrCreateOpenShardsResponse,
                    crate::control_plane::ControlPlaneError,
                >,
            > + Clone + Send + Sync + 'static,
        <L as tower::Layer<
            quickwit_common::tower::BoxService<
                GetOrCreateOpenShardsRequest,
                GetOrCreateOpenShardsResponse,
                crate::control_plane::ControlPlaneError,
            >,
        >>::Service: tower::Service<
                GetOrCreateOpenShardsRequest,
                Response = GetOrCreateOpenShardsResponse,
                Error = crate::control_plane::ControlPlaneError,
            > + Clone + Send + Sync + 'static,
        <<L as tower::Layer<
            quickwit_common::tower::BoxService<
                GetOrCreateOpenShardsRequest,
                GetOrCreateOpenShardsResponse,
                crate::control_plane::ControlPlaneError,
            >,
        >>::Service as tower::Service<
            GetOrCreateOpenShardsRequest,
        >>::Future: Send + 'static,
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    AdviseResetShardsRequest,
                    AdviseResetShardsResponse,
                    crate::control_plane::ControlPlaneError,
                >,
            > + Clone + Send + Sync + 'static,
        <L as tower::Layer<
            quickwit_common::tower::BoxService<
                AdviseResetShardsRequest,
                AdviseResetShardsResponse,
                crate::control_plane::ControlPlaneError,
            >,
        >>::Service: tower::Service<
                AdviseResetShardsRequest,
                Response = AdviseResetShardsResponse,
                Error = crate::control_plane::ControlPlaneError,
            > + Clone + Send + Sync + 'static,
        <<L as tower::Layer<
            quickwit_common::tower::BoxService<
                AdviseResetShardsRequest,
                AdviseResetShardsResponse,
                crate::control_plane::ControlPlaneError,
            >,
        >>::Service as tower::Service<AdviseResetShardsRequest>>::Future: Send + 'static,
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    super::metastore::PruneShardsRequest,
                    super::metastore::EmptyResponse,
                    crate::control_plane::ControlPlaneError,
                >,
            > + Clone + Send + Sync + 'static,
        <L as tower::Layer<
            quickwit_common::tower::BoxService<
                super::metastore::PruneShardsRequest,
                super::metastore::EmptyResponse,
                crate::control_plane::ControlPlaneError,
            >,
        >>::Service: tower::Service<
                super::metastore::PruneShardsRequest,
                Response = super::metastore::EmptyResponse,
                Error = crate::control_plane::ControlPlaneError,
            > + Clone + Send + Sync + 'static,
        <<L as tower::Layer<
            quickwit_common::tower::BoxService<
                super::metastore::PruneShardsRequest,
                super::metastore::EmptyResponse,
                crate::control_plane::ControlPlaneError,
            >,
        >>::Service as tower::Service<
            super::metastore::PruneShardsRequest,
        >>::Future: Send + 'static,
    {
        self.create_index_layers
            .push(quickwit_common::tower::BoxLayer::new(layer.clone()));
        self.update_index_layers
            .push(quickwit_common::tower::BoxLayer::new(layer.clone()));
        self.delete_index_layers
            .push(quickwit_common::tower::BoxLayer::new(layer.clone()));
        self.add_source_layers
            .push(quickwit_common::tower::BoxLayer::new(layer.clone()));
        self.update_source_layers
            .push(quickwit_common::tower::BoxLayer::new(layer.clone()));
        self.toggle_source_layers
            .push(quickwit_common::tower::BoxLayer::new(layer.clone()));
        self.delete_source_layers
            .push(quickwit_common::tower::BoxLayer::new(layer.clone()));
        self.get_or_create_open_shards_layers
            .push(quickwit_common::tower::BoxLayer::new(layer.clone()));
        self.advise_reset_shards_layers
            .push(quickwit_common::tower::BoxLayer::new(layer.clone()));
        self.prune_shards_layers
            .push(quickwit_common::tower::BoxLayer::new(layer.clone()));
        self
    }
    pub fn stack_create_index_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    super::metastore::CreateIndexRequest,
                    super::metastore::CreateIndexResponse,
                    crate::control_plane::ControlPlaneError,
                >,
            > + Send + Sync + 'static,
        L::Service: tower::Service<
                super::metastore::CreateIndexRequest,
                Response = super::metastore::CreateIndexResponse,
                Error = crate::control_plane::ControlPlaneError,
            > + Clone + Send + Sync + 'static,
        <L::Service as tower::Service<
            super::metastore::CreateIndexRequest,
        >>::Future: Send + 'static,
    {
        self.create_index_layers.push(quickwit_common::tower::BoxLayer::new(layer));
        self
    }
    pub fn stack_update_index_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    super::metastore::UpdateIndexRequest,
                    super::metastore::IndexMetadataResponse,
                    crate::control_plane::ControlPlaneError,
                >,
            > + Send + Sync + 'static,
        L::Service: tower::Service<
                super::metastore::UpdateIndexRequest,
                Response = super::metastore::IndexMetadataResponse,
                Error = crate::control_plane::ControlPlaneError,
            > + Clone + Send + Sync + 'static,
        <L::Service as tower::Service<
            super::metastore::UpdateIndexRequest,
        >>::Future: Send + 'static,
    {
        self.update_index_layers.push(quickwit_common::tower::BoxLayer::new(layer));
        self
    }
    pub fn stack_delete_index_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    super::metastore::DeleteIndexRequest,
                    super::metastore::EmptyResponse,
                    crate::control_plane::ControlPlaneError,
                >,
            > + Send + Sync + 'static,
        L::Service: tower::Service<
                super::metastore::DeleteIndexRequest,
                Response = super::metastore::EmptyResponse,
                Error = crate::control_plane::ControlPlaneError,
            > + Clone + Send + Sync + 'static,
        <L::Service as tower::Service<
            super::metastore::DeleteIndexRequest,
        >>::Future: Send + 'static,
    {
        self.delete_index_layers.push(quickwit_common::tower::BoxLayer::new(layer));
        self
    }
    pub fn stack_add_source_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    super::metastore::AddSourceRequest,
                    super::metastore::EmptyResponse,
                    crate::control_plane::ControlPlaneError,
                >,
            > + Send + Sync + 'static,
        L::Service: tower::Service<
                super::metastore::AddSourceRequest,
                Response = super::metastore::EmptyResponse,
                Error = crate::control_plane::ControlPlaneError,
            > + Clone + Send + Sync + 'static,
        <L::Service as tower::Service<
            super::metastore::AddSourceRequest,
        >>::Future: Send + 'static,
    {
        self.add_source_layers.push(quickwit_common::tower::BoxLayer::new(layer));
        self
    }
    pub fn stack_update_source_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    super::metastore::UpdateSourceRequest,
                    super::metastore::EmptyResponse,
                    crate::control_plane::ControlPlaneError,
                >,
            > + Send + Sync + 'static,
        L::Service: tower::Service<
                super::metastore::UpdateSourceRequest,
                Response = super::metastore::EmptyResponse,
                Error = crate::control_plane::ControlPlaneError,
            > + Clone + Send + Sync + 'static,
        <L::Service as tower::Service<
            super::metastore::UpdateSourceRequest,
        >>::Future: Send + 'static,
    {
        self.update_source_layers.push(quickwit_common::tower::BoxLayer::new(layer));
        self
    }
    pub fn stack_toggle_source_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    super::metastore::ToggleSourceRequest,
                    super::metastore::EmptyResponse,
                    crate::control_plane::ControlPlaneError,
                >,
            > + Send + Sync + 'static,
        L::Service: tower::Service<
                super::metastore::ToggleSourceRequest,
                Response = super::metastore::EmptyResponse,
                Error = crate::control_plane::ControlPlaneError,
            > + Clone + Send + Sync + 'static,
        <L::Service as tower::Service<
            super::metastore::ToggleSourceRequest,
        >>::Future: Send + 'static,
    {
        self.toggle_source_layers.push(quickwit_common::tower::BoxLayer::new(layer));
        self
    }
    pub fn stack_delete_source_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    super::metastore::DeleteSourceRequest,
                    super::metastore::EmptyResponse,
                    crate::control_plane::ControlPlaneError,
                >,
            > + Send + Sync + 'static,
        L::Service: tower::Service<
                super::metastore::DeleteSourceRequest,
                Response = super::metastore::EmptyResponse,
                Error = crate::control_plane::ControlPlaneError,
            > + Clone + Send + Sync + 'static,
        <L::Service as tower::Service<
            super::metastore::DeleteSourceRequest,
        >>::Future: Send + 'static,
    {
        self.delete_source_layers.push(quickwit_common::tower::BoxLayer::new(layer));
        self
    }
    pub fn stack_get_or_create_open_shards_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    GetOrCreateOpenShardsRequest,
                    GetOrCreateOpenShardsResponse,
                    crate::control_plane::ControlPlaneError,
                >,
            > + Send + Sync + 'static,
        L::Service: tower::Service<
                GetOrCreateOpenShardsRequest,
                Response = GetOrCreateOpenShardsResponse,
                Error = crate::control_plane::ControlPlaneError,
            > + Clone + Send + Sync + 'static,
        <L::Service as tower::Service<
            GetOrCreateOpenShardsRequest,
        >>::Future: Send + 'static,
    {
        self.get_or_create_open_shards_layers
            .push(quickwit_common::tower::BoxLayer::new(layer));
        self
    }
    pub fn stack_advise_reset_shards_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    AdviseResetShardsRequest,
                    AdviseResetShardsResponse,
                    crate::control_plane::ControlPlaneError,
                >,
            > + Send + Sync + 'static,
        L::Service: tower::Service<
                AdviseResetShardsRequest,
                Response = AdviseResetShardsResponse,
                Error = crate::control_plane::ControlPlaneError,
            > + Clone + Send + Sync + 'static,
        <L::Service as tower::Service<AdviseResetShardsRequest>>::Future: Send + 'static,
    {
        self.advise_reset_shards_layers
            .push(quickwit_common::tower::BoxLayer::new(layer));
        self
    }
    pub fn stack_prune_shards_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    super::metastore::PruneShardsRequest,
                    super::metastore::EmptyResponse,
                    crate::control_plane::ControlPlaneError,
                >,
            > + Send + Sync + 'static,
        L::Service: tower::Service<
                super::metastore::PruneShardsRequest,
                Response = super::metastore::EmptyResponse,
                Error = crate::control_plane::ControlPlaneError,
            > + Clone + Send + Sync + 'static,
        <L::Service as tower::Service<
            super::metastore::PruneShardsRequest,
        >>::Future: Send + 'static,
    {
        self.prune_shards_layers.push(quickwit_common::tower::BoxLayer::new(layer));
        self
    }
    pub fn build<T>(self, instance: T) -> ControlPlaneServiceClient
    where
        T: ControlPlaneService,
    {
        let inner_client = InnerControlPlaneServiceClient(std::sync::Arc::new(instance));
        self.build_from_inner_client(inner_client)
    }
    pub fn build_from_channel(
        self,
        addr: std::net::SocketAddr,
        channel: tonic::transport::Channel,
        max_message_size: bytesize::ByteSize,
        compression_encoding_opt: Option<tonic::codec::CompressionEncoding>,
    ) -> ControlPlaneServiceClient {
        let client = ControlPlaneServiceClient::from_channel(
            addr,
            channel,
            max_message_size,
            compression_encoding_opt,
        );
        let inner_client = client.inner;
        self.build_from_inner_client(inner_client)
    }
    pub fn build_from_balance_channel(
        self,
        balance_channel: quickwit_common::tower::BalanceChannel<std::net::SocketAddr>,
        max_message_size: bytesize::ByteSize,
        compression_encoding_opt: Option<tonic::codec::CompressionEncoding>,
    ) -> ControlPlaneServiceClient {
        let client = ControlPlaneServiceClient::from_balance_channel(
            balance_channel,
            max_message_size,
            compression_encoding_opt,
        );
        let inner_client = client.inner;
        self.build_from_inner_client(inner_client)
    }
    pub fn build_from_mailbox<A>(
        self,
        mailbox: quickwit_actors::Mailbox<A>,
    ) -> ControlPlaneServiceClient
    where
        A: quickwit_actors::Actor + std::fmt::Debug + Send + 'static,
        ControlPlaneServiceMailbox<A>: ControlPlaneService,
    {
        let inner_client = InnerControlPlaneServiceClient(
            std::sync::Arc::new(ControlPlaneServiceMailbox::new(mailbox)),
        );
        self.build_from_inner_client(inner_client)
    }
    #[cfg(any(test, feature = "testsuite"))]
    pub fn build_from_mock(
        self,
        mock: MockControlPlaneService,
    ) -> ControlPlaneServiceClient {
        let client = ControlPlaneServiceClient::from_mock(mock);
        let inner_client = client.inner;
        self.build_from_inner_client(inner_client)
    }
    fn build_from_inner_client(
        self,
        inner_client: InnerControlPlaneServiceClient,
    ) -> ControlPlaneServiceClient {
        let create_index_svc = self
            .create_index_layers
            .into_iter()
            .rev()
            .fold(
                quickwit_common::tower::BoxService::new(inner_client.clone()),
                |svc, layer| layer.layer(svc),
            );
        let update_index_svc = self
            .update_index_layers
            .into_iter()
            .rev()
            .fold(
                quickwit_common::tower::BoxService::new(inner_client.clone()),
                |svc, layer| layer.layer(svc),
            );
        let delete_index_svc = self
            .delete_index_layers
            .into_iter()
            .rev()
            .fold(
                quickwit_common::tower::BoxService::new(inner_client.clone()),
                |svc, layer| layer.layer(svc),
            );
        let add_source_svc = self
            .add_source_layers
            .into_iter()
            .rev()
            .fold(
                quickwit_common::tower::BoxService::new(inner_client.clone()),
                |svc, layer| layer.layer(svc),
            );
        let update_source_svc = self
            .update_source_layers
            .into_iter()
            .rev()
            .fold(
                quickwit_common::tower::BoxService::new(inner_client.clone()),
                |svc, layer| layer.layer(svc),
            );
        let toggle_source_svc = self
            .toggle_source_layers
            .into_iter()
            .rev()
            .fold(
                quickwit_common::tower::BoxService::new(inner_client.clone()),
                |svc, layer| layer.layer(svc),
            );
        let delete_source_svc = self
            .delete_source_layers
            .into_iter()
            .rev()
            .fold(
                quickwit_common::tower::BoxService::new(inner_client.clone()),
                |svc, layer| layer.layer(svc),
            );
        let get_or_create_open_shards_svc = self
            .get_or_create_open_shards_layers
            .into_iter()
            .rev()
            .fold(
                quickwit_common::tower::BoxService::new(inner_client.clone()),
                |svc, layer| layer.layer(svc),
            );
        let advise_reset_shards_svc = self
            .advise_reset_shards_layers
            .into_iter()
            .rev()
            .fold(
                quickwit_common::tower::BoxService::new(inner_client.clone()),
                |svc, layer| layer.layer(svc),
            );
        let prune_shards_svc = self
            .prune_shards_layers
            .into_iter()
            .rev()
            .fold(
                quickwit_common::tower::BoxService::new(inner_client.clone()),
                |svc, layer| layer.layer(svc),
            );
        let tower_svc_stack = ControlPlaneServiceTowerServiceStack {
            inner: inner_client,
            create_index_svc,
            update_index_svc,
            delete_index_svc,
            add_source_svc,
            update_source_svc,
            toggle_source_svc,
            delete_source_svc,
            get_or_create_open_shards_svc,
            advise_reset_shards_svc,
            prune_shards_svc,
        };
        ControlPlaneServiceClient::new(tower_svc_stack)
    }
}
#[derive(Debug, Clone)]
struct MailboxAdapter<A: quickwit_actors::Actor, E> {
    inner: quickwit_actors::Mailbox<A>,
    phantom: std::marker::PhantomData<E>,
}
impl<A, E> std::ops::Deref for MailboxAdapter<A, E>
where
    A: quickwit_actors::Actor,
{
    type Target = quickwit_actors::Mailbox<A>;
    fn deref(&self) -> &Self::Target {
        &self.inner
    }
}
#[derive(Debug)]
pub struct ControlPlaneServiceMailbox<A: quickwit_actors::Actor> {
    inner: MailboxAdapter<A, crate::control_plane::ControlPlaneError>,
}
impl<A: quickwit_actors::Actor> ControlPlaneServiceMailbox<A> {
    pub fn new(instance: quickwit_actors::Mailbox<A>) -> Self {
        let inner = MailboxAdapter {
            inner: instance,
            phantom: std::marker::PhantomData,
        };
        Self { inner }
    }
}
impl<A: quickwit_actors::Actor> Clone for ControlPlaneServiceMailbox<A> {
    fn clone(&self) -> Self {
        let inner = MailboxAdapter {
            inner: self.inner.clone(),
            phantom: std::marker::PhantomData,
        };
        Self { inner }
    }
}
impl<A, M, T, E> tower::Service<M> for ControlPlaneServiceMailbox<A>
where
    A: quickwit_actors::Actor
        + quickwit_actors::DeferableReplyHandler<M, Reply = Result<T, E>> + Send
        + 'static,
    M: std::fmt::Debug + Send + 'static,
    T: Send + 'static,
    E: std::fmt::Debug + Send + 'static,
    crate::control_plane::ControlPlaneError: From<quickwit_actors::AskError<E>>,
{
    type Response = T;
    type Error = crate::control_plane::ControlPlaneError;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        //! This does not work with balance middlewares such as `tower::balance::pool::Pool` because
        //! this always returns `Poll::Ready`. The fix is to acquire a permit from the
        //! mailbox in `poll_ready` and consume it in `call`.
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, message: M) -> Self::Future {
        let mailbox = self.inner.clone();
        let fut = async move {
            mailbox.ask_for_res(message).await.map_err(|error| error.into())
        };
        Box::pin(fut)
    }
}
#[async_trait::async_trait]
impl<A> ControlPlaneService for ControlPlaneServiceMailbox<A>
where
    A: quickwit_actors::Actor + std::fmt::Debug,
    ControlPlaneServiceMailbox<
        A,
    >: tower::Service<
            super::metastore::CreateIndexRequest,
            Response = super::metastore::CreateIndexResponse,
            Error = crate::control_plane::ControlPlaneError,
            Future = BoxFuture<
                super::metastore::CreateIndexResponse,
                crate::control_plane::ControlPlaneError,
            >,
        >
        + tower::Service<
            super::metastore::UpdateIndexRequest,
            Response = super::metastore::IndexMetadataResponse,
            Error = crate::control_plane::ControlPlaneError,
            Future = BoxFuture<
                super::metastore::IndexMetadataResponse,
                crate::control_plane::ControlPlaneError,
            >,
        >
        + tower::Service<
            super::metastore::DeleteIndexRequest,
            Response = super::metastore::EmptyResponse,
            Error = crate::control_plane::ControlPlaneError,
            Future = BoxFuture<
                super::metastore::EmptyResponse,
                crate::control_plane::ControlPlaneError,
            >,
        >
        + tower::Service<
            super::metastore::AddSourceRequest,
            Response = super::metastore::EmptyResponse,
            Error = crate::control_plane::ControlPlaneError,
            Future = BoxFuture<
                super::metastore::EmptyResponse,
                crate::control_plane::ControlPlaneError,
            >,
        >
        + tower::Service<
            super::metastore::UpdateSourceRequest,
            Response = super::metastore::EmptyResponse,
            Error = crate::control_plane::ControlPlaneError,
            Future = BoxFuture<
                super::metastore::EmptyResponse,
                crate::control_plane::ControlPlaneError,
            >,
        >
        + tower::Service<
            super::metastore::ToggleSourceRequest,
            Response = super::metastore::EmptyResponse,
            Error = crate::control_plane::ControlPlaneError,
            Future = BoxFuture<
                super::metastore::EmptyResponse,
                crate::control_plane::ControlPlaneError,
            >,
        >
        + tower::Service<
            super::metastore::DeleteSourceRequest,
            Response = super::metastore::EmptyResponse,
            Error = crate::control_plane::ControlPlaneError,
            Future = BoxFuture<
                super::metastore::EmptyResponse,
                crate::control_plane::ControlPlaneError,
            >,
        >
        + tower::Service<
            GetOrCreateOpenShardsRequest,
            Response = GetOrCreateOpenShardsResponse,
            Error = crate::control_plane::ControlPlaneError,
            Future = BoxFuture<
                GetOrCreateOpenShardsResponse,
                crate::control_plane::ControlPlaneError,
            >,
        >
        + tower::Service<
            AdviseResetShardsRequest,
            Response = AdviseResetShardsResponse,
            Error = crate::control_plane::ControlPlaneError,
            Future = BoxFuture<
                AdviseResetShardsResponse,
                crate::control_plane::ControlPlaneError,
            >,
        >
        + tower::Service<
            super::metastore::PruneShardsRequest,
            Response = super::metastore::EmptyResponse,
            Error = crate::control_plane::ControlPlaneError,
            Future = BoxFuture<
                super::metastore::EmptyResponse,
                crate::control_plane::ControlPlaneError,
            >,
        >,
{
    async fn create_index(
        &self,
        request: super::metastore::CreateIndexRequest,
    ) -> crate::control_plane::ControlPlaneResult<
        super::metastore::CreateIndexResponse,
    > {
        self.clone().call(request).await
    }
    async fn update_index(
        &self,
        request: super::metastore::UpdateIndexRequest,
    ) -> crate::control_plane::ControlPlaneResult<
        super::metastore::IndexMetadataResponse,
    > {
        self.clone().call(request).await
    }
    async fn delete_index(
        &self,
        request: super::metastore::DeleteIndexRequest,
    ) -> crate::control_plane::ControlPlaneResult<super::metastore::EmptyResponse> {
        self.clone().call(request).await
    }
    async fn add_source(
        &self,
        request: super::metastore::AddSourceRequest,
    ) -> crate::control_plane::ControlPlaneResult<super::metastore::EmptyResponse> {
        self.clone().call(request).await
    }
    async fn update_source(
        &self,
        request: super::metastore::UpdateSourceRequest,
    ) -> crate::control_plane::ControlPlaneResult<super::metastore::EmptyResponse> {
        self.clone().call(request).await
    }
    async fn toggle_source(
        &self,
        request: super::metastore::ToggleSourceRequest,
    ) -> crate::control_plane::ControlPlaneResult<super::metastore::EmptyResponse> {
        self.clone().call(request).await
    }
    async fn delete_source(
        &self,
        request: super::metastore::DeleteSourceRequest,
    ) -> crate::control_plane::ControlPlaneResult<super::metastore::EmptyResponse> {
        self.clone().call(request).await
    }
    async fn get_or_create_open_shards(
        &self,
        request: GetOrCreateOpenShardsRequest,
    ) -> crate::control_plane::ControlPlaneResult<GetOrCreateOpenShardsResponse> {
        self.clone().call(request).await
    }
    async fn advise_reset_shards(
        &self,
        request: AdviseResetShardsRequest,
    ) -> crate::control_plane::ControlPlaneResult<AdviseResetShardsResponse> {
        self.clone().call(request).await
    }
    async fn prune_shards(
        &self,
        request: super::metastore::PruneShardsRequest,
    ) -> crate::control_plane::ControlPlaneResult<super::metastore::EmptyResponse> {
        self.clone().call(request).await
    }
}
#[derive(Debug, Clone)]
pub struct ControlPlaneServiceGrpcClientAdapter<T> {
    inner: T,
    #[allow(dead_code)]
    connection_addrs_rx: tokio::sync::watch::Receiver<
        std::collections::HashSet<std::net::SocketAddr>,
    >,
}
impl<T> ControlPlaneServiceGrpcClientAdapter<T> {
    pub fn new(
        instance: T,
        connection_addrs_rx: tokio::sync::watch::Receiver<
            std::collections::HashSet<std::net::SocketAddr>,
        >,
    ) -> Self {
        Self {
            inner: instance,
            connection_addrs_rx,
        }
    }
}
#[async_trait::async_trait]
impl<T> ControlPlaneService
for ControlPlaneServiceGrpcClientAdapter<
    control_plane_service_grpc_client::ControlPlaneServiceGrpcClient<T>,
>
where
    T: tonic::client::GrpcService<tonic::body::Body> + std::fmt::Debug + Clone + Send
        + Sync + 'static,
    T::ResponseBody: tonic::codegen::Body<Data = tonic::codegen::Bytes> + Send + 'static,
    <T::ResponseBody as tonic::codegen::Body>::Error: Into<tonic::codegen::StdError>
        + Send,
    T::Future: Send,
{
    async fn create_index(
        &self,
        request: super::metastore::CreateIndexRequest,
    ) -> crate::control_plane::ControlPlaneResult<
        super::metastore::CreateIndexResponse,
    > {
        self.inner
            .clone()
            .create_index(request)
            .await
            .map(|response| response.into_inner())
            .map_err(|status| crate::error::grpc_status_to_service_error(
                status,
                super::metastore::CreateIndexRequest::rpc_name(),
            ))
    }
    async fn update_index(
        &self,
        request: super::metastore::UpdateIndexRequest,
    ) -> crate::control_plane::ControlPlaneResult<
        super::metastore::IndexMetadataResponse,
    > {
        self.inner
            .clone()
            .update_index(request)
            .await
            .map(|response| response.into_inner())
            .map_err(|status| crate::error::grpc_status_to_service_error(
                status,
                super::metastore::UpdateIndexRequest::rpc_name(),
            ))
    }
    async fn delete_index(
        &self,
        request: super::metastore::DeleteIndexRequest,
    ) -> crate::control_plane::ControlPlaneResult<super::metastore::EmptyResponse> {
        self.inner
            .clone()
            .delete_index(request)
            .await
            .map(|response| response.into_inner())
            .map_err(|status| crate::error::grpc_status_to_service_error(
                status,
                super::metastore::DeleteIndexRequest::rpc_name(),
            ))
    }
    async fn add_source(
        &self,
        request: super::metastore::AddSourceRequest,
    ) -> crate::control_plane::ControlPlaneResult<super::metastore::EmptyResponse> {
        self.inner
            .clone()
            .add_source(request)
            .await
            .map(|response| response.into_inner())
            .map_err(|status| crate::error::grpc_status_to_service_error(
                status,
                super::metastore::AddSourceRequest::rpc_name(),
            ))
    }
    async fn update_source(
        &self,
        request: super::metastore::UpdateSourceRequest,
    ) -> crate::control_plane::ControlPlaneResult<super::metastore::EmptyResponse> {
        self.inner
            .clone()
            .update_source(request)
            .await
            .map(|response| response.into_inner())
            .map_err(|status| crate::error::grpc_status_to_service_error(
                status,
                super::metastore::UpdateSourceRequest::rpc_name(),
            ))
    }
    async fn toggle_source(
        &self,
        request: super::metastore::ToggleSourceRequest,
    ) -> crate::control_plane::ControlPlaneResult<super::metastore::EmptyResponse> {
        self.inner
            .clone()
            .toggle_source(request)
            .await
            .map(|response| response.into_inner())
            .map_err(|status| crate::error::grpc_status_to_service_error(
                status,
                super::metastore::ToggleSourceRequest::rpc_name(),
            ))
    }
    async fn delete_source(
        &self,
        request: super::metastore::DeleteSourceRequest,
    ) -> crate::control_plane::ControlPlaneResult<super::metastore::EmptyResponse> {
        self.inner
            .clone()
            .delete_source(request)
            .await
            .map(|response| response.into_inner())
            .map_err(|status| crate::error::grpc_status_to_service_error(
                status,
                super::metastore::DeleteSourceRequest::rpc_name(),
            ))
    }
    async fn get_or_create_open_shards(
        &self,
        request: GetOrCreateOpenShardsRequest,
    ) -> crate::control_plane::ControlPlaneResult<GetOrCreateOpenShardsResponse> {
        self.inner
            .clone()
            .get_or_create_open_shards(request)
            .await
            .map(|response| response.into_inner())
            .map_err(|status| crate::error::grpc_status_to_service_error(
                status,
                GetOrCreateOpenShardsRequest::rpc_name(),
            ))
    }
    async fn advise_reset_shards(
        &self,
        request: AdviseResetShardsRequest,
    ) -> crate::control_plane::ControlPlaneResult<AdviseResetShardsResponse> {
        self.inner
            .clone()
            .advise_reset_shards(request)
            .await
            .map(|response| response.into_inner())
            .map_err(|status| crate::error::grpc_status_to_service_error(
                status,
                AdviseResetShardsRequest::rpc_name(),
            ))
    }
    async fn prune_shards(
        &self,
        request: super::metastore::PruneShardsRequest,
    ) -> crate::control_plane::ControlPlaneResult<super::metastore::EmptyResponse> {
        self.inner
            .clone()
            .prune_shards(request)
            .await
            .map(|response| response.into_inner())
            .map_err(|status| crate::error::grpc_status_to_service_error(
                status,
                super::metastore::PruneShardsRequest::rpc_name(),
            ))
    }
}
#[derive(Debug)]
pub struct ControlPlaneServiceGrpcServerAdapter {
    inner: InnerControlPlaneServiceClient,
}
impl ControlPlaneServiceGrpcServerAdapter {
    pub fn new<T>(instance: T) -> Self
    where
        T: ControlPlaneService,
    {
        Self {
            inner: InnerControlPlaneServiceClient(std::sync::Arc::new(instance)),
        }
    }
}
#[async_trait::async_trait]
impl control_plane_service_grpc_server::ControlPlaneServiceGrpc
for ControlPlaneServiceGrpcServerAdapter {
    async fn create_index(
        &self,
        request: tonic::Request<super::metastore::CreateIndexRequest>,
    ) -> Result<tonic::Response<super::metastore::CreateIndexResponse>, tonic::Status> {
        self.inner
            .0
            .create_index(request.into_inner())
            .await
            .map(tonic::Response::new)
            .map_err(crate::error::grpc_error_to_grpc_status)
    }
    async fn update_index(
        &self,
        request: tonic::Request<super::metastore::UpdateIndexRequest>,
    ) -> Result<
        tonic::Response<super::metastore::IndexMetadataResponse>,
        tonic::Status,
    > {
        self.inner
            .0
            .update_index(request.into_inner())
            .await
            .map(tonic::Response::new)
            .map_err(crate::error::grpc_error_to_grpc_status)
    }
    async fn delete_index(
        &self,
        request: tonic::Request<super::metastore::DeleteIndexRequest>,
    ) -> Result<tonic::Response<super::metastore::EmptyResponse>, tonic::Status> {
        self.inner
            .0
            .delete_index(request.into_inner())
            .await
            .map(tonic::Response::new)
            .map_err(crate::error::grpc_error_to_grpc_status)
    }
    async fn add_source(
        &self,
        request: tonic::Request<super::metastore::AddSourceRequest>,
    ) -> Result<tonic::Response<super::metastore::EmptyResponse>, tonic::Status> {
        self.inner
            .0
            .add_source(request.into_inner())
            .await
            .map(tonic::Response::new)
            .map_err(crate::error::grpc_error_to_grpc_status)
    }
    async fn update_source(
        &self,
        request: tonic::Request<super::metastore::UpdateSourceRequest>,
    ) -> Result<tonic::Response<super::metastore::EmptyResponse>, tonic::Status> {
        self.inner
            .0
            .update_source(request.into_inner())
            .await
            .map(tonic::Response::new)
            .map_err(crate::error::grpc_error_to_grpc_status)
    }
    async fn toggle_source(
        &self,
        request: tonic::Request<super::metastore::ToggleSourceRequest>,
    ) -> Result<tonic::Response<super::metastore::EmptyResponse>, tonic::Status> {
        self.inner
            .0
            .toggle_source(request.into_inner())
            .await
            .map(tonic::Response::new)
            .map_err(crate::error::grpc_error_to_grpc_status)
    }
    async fn delete_source(
        &self,
        request: tonic::Request<super::metastore::DeleteSourceRequest>,
    ) -> Result<tonic::Response<super::metastore::EmptyResponse>, tonic::Status> {
        self.inner
            .0
            .delete_source(request.into_inner())
            .await
            .map(tonic::Response::new)
            .map_err(crate::error::grpc_error_to_grpc_status)
    }
    async fn get_or_create_open_shards(
        &self,
        request: tonic::Request<GetOrCreateOpenShardsRequest>,
    ) -> Result<tonic::Response<GetOrCreateOpenShardsResponse>, tonic::Status> {
        self.inner
            .0
            .get_or_create_open_shards(request.into_inner())
            .await
            .map(tonic::Response::new)
            .map_err(crate::error::grpc_error_to_grpc_status)
    }
    async fn advise_reset_shards(
        &self,
        request: tonic::Request<AdviseResetShardsRequest>,
    ) -> Result<tonic::Response<AdviseResetShardsResponse>, tonic::Status> {
        self.inner
            .0
            .advise_reset_shards(request.into_inner())
            .await
            .map(tonic::Response::new)
            .map_err(crate::error::grpc_error_to_grpc_status)
    }
    async fn prune_shards(
        &self,
        request: tonic::Request<super::metastore::PruneShardsRequest>,
    ) -> Result<tonic::Response<super::metastore::EmptyResponse>, tonic::Status> {
        self.inner
            .0
            .prune_shards(request.into_inner())
            .await
            .map(tonic::Response::new)
            .map_err(crate::error::grpc_error_to_grpc_status)
    }
}
/// Generated client implementations.
pub mod control_plane_service_grpc_client {
    #![allow(
        unused_variables,
        dead_code,
        missing_docs,
        clippy::wildcard_imports,
        clippy::let_unit_value,
    )]
    use tonic::codegen::*;
    use tonic::codegen::http::Uri;
    #[derive(Debug, Clone)]
    pub struct ControlPlaneServiceGrpcClient<T> {
        inner: tonic::client::Grpc<T>,
    }
    impl ControlPlaneServiceGrpcClient<tonic::transport::Channel> {
        /// Attempt to create a new client by connecting to a given endpoint.
        pub async fn connect<D>(dst: D) -> Result<Self, tonic::transport::Error>
        where
            D: TryInto<tonic::transport::Endpoint>,
            D::Error: Into<StdError>,
        {
            let conn = tonic::transport::Endpoint::new(dst)?.connect().await?;
            Ok(Self::new(conn))
        }
    }
    impl<T> ControlPlaneServiceGrpcClient<T>
    where
        T: tonic::client::GrpcService<tonic::body::Body>,
        T::Error: Into<StdError>,
        T::ResponseBody: Body<Data = Bytes> + std::marker::Send + 'static,
        <T::ResponseBody as Body>::Error: Into<StdError> + std::marker::Send,
    {
        pub fn new(inner: T) -> Self {
            let inner = tonic::client::Grpc::new(inner);
            Self { inner }
        }
        pub fn with_origin(inner: T, origin: Uri) -> Self {
            let inner = tonic::client::Grpc::with_origin(inner, origin);
            Self { inner }
        }
        pub fn with_interceptor<F>(
            inner: T,
            interceptor: F,
        ) -> ControlPlaneServiceGrpcClient<InterceptedService<T, F>>
        where
            F: tonic::service::Interceptor,
            T::ResponseBody: Default,
            T: tonic::codegen::Service<
                http::Request<tonic::body::Body>,
                Response = http::Response<
                    <T as tonic::client::GrpcService<tonic::body::Body>>::ResponseBody,
                >,
            >,
            <T as tonic::codegen::Service<
                http::Request<tonic::body::Body>,
            >>::Error: Into<StdError> + std::marker::Send + std::marker::Sync,
        {
            ControlPlaneServiceGrpcClient::new(
                InterceptedService::new(inner, interceptor),
            )
        }
        /// Compress requests with the given encoding.
        ///
        /// This requires the server to support it otherwise it might respond with an
        /// error.
        #[must_use]
        pub fn send_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.inner = self.inner.send_compressed(encoding);
            self
        }
        /// Enable decompressing responses.
        #[must_use]
        pub fn accept_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.inner = self.inner.accept_compressed(encoding);
            self
        }
        /// Limits the maximum size of a decoded message.
        ///
        /// Default: `4MB`
        #[must_use]
        pub fn max_decoding_message_size(mut self, limit: usize) -> Self {
            self.inner = self.inner.max_decoding_message_size(limit);
            self
        }
        /// Limits the maximum size of an encoded message.
        ///
        /// Default: `usize::MAX`
        #[must_use]
        pub fn max_encoding_message_size(mut self, limit: usize) -> Self {
            self.inner = self.inner.max_encoding_message_size(limit);
            self
        }
        /// Creates a new index.
        pub async fn create_index(
            &mut self,
            request: impl tonic::IntoRequest<super::super::metastore::CreateIndexRequest>,
        ) -> std::result::Result<
            tonic::Response<super::super::metastore::CreateIndexResponse>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/quickwit.control_plane.ControlPlaneService/CreateIndex",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new(
                        "quickwit.control_plane.ControlPlaneService",
                        "CreateIndex",
                    ),
                );
            self.inner.unary(req, path, codec).await
        }
        /// Updates an index.
        pub async fn update_index(
            &mut self,
            request: impl tonic::IntoRequest<super::super::metastore::UpdateIndexRequest>,
        ) -> std::result::Result<
            tonic::Response<super::super::metastore::IndexMetadataResponse>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/quickwit.control_plane.ControlPlaneService/UpdateIndex",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new(
                        "quickwit.control_plane.ControlPlaneService",
                        "UpdateIndex",
                    ),
                );
            self.inner.unary(req, path, codec).await
        }
        /// Deletes an index.
        pub async fn delete_index(
            &mut self,
            request: impl tonic::IntoRequest<super::super::metastore::DeleteIndexRequest>,
        ) -> std::result::Result<
            tonic::Response<super::super::metastore::EmptyResponse>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/quickwit.control_plane.ControlPlaneService/DeleteIndex",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new(
                        "quickwit.control_plane.ControlPlaneService",
                        "DeleteIndex",
                    ),
                );
            self.inner.unary(req, path, codec).await
        }
        /// Adds a source to an index.
        pub async fn add_source(
            &mut self,
            request: impl tonic::IntoRequest<super::super::metastore::AddSourceRequest>,
        ) -> std::result::Result<
            tonic::Response<super::super::metastore::EmptyResponse>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/quickwit.control_plane.ControlPlaneService/AddSource",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new(
                        "quickwit.control_plane.ControlPlaneService",
                        "AddSource",
                    ),
                );
            self.inner.unary(req, path, codec).await
        }
        /// Update a source.
        pub async fn update_source(
            &mut self,
            request: impl tonic::IntoRequest<
                super::super::metastore::UpdateSourceRequest,
            >,
        ) -> std::result::Result<
            tonic::Response<super::super::metastore::EmptyResponse>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/quickwit.control_plane.ControlPlaneService/UpdateSource",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new(
                        "quickwit.control_plane.ControlPlaneService",
                        "UpdateSource",
                    ),
                );
            self.inner.unary(req, path, codec).await
        }
        /// Enables or disables a source.
        pub async fn toggle_source(
            &mut self,
            request: impl tonic::IntoRequest<
                super::super::metastore::ToggleSourceRequest,
            >,
        ) -> std::result::Result<
            tonic::Response<super::super::metastore::EmptyResponse>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/quickwit.control_plane.ControlPlaneService/ToggleSource",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new(
                        "quickwit.control_plane.ControlPlaneService",
                        "ToggleSource",
                    ),
                );
            self.inner.unary(req, path, codec).await
        }
        /// Removes a source from an index.
        pub async fn delete_source(
            &mut self,
            request: impl tonic::IntoRequest<
                super::super::metastore::DeleteSourceRequest,
            >,
        ) -> std::result::Result<
            tonic::Response<super::super::metastore::EmptyResponse>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/quickwit.control_plane.ControlPlaneService/DeleteSource",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new(
                        "quickwit.control_plane.ControlPlaneService",
                        "DeleteSource",
                    ),
                );
            self.inner.unary(req, path, codec).await
        }
        /// Returns the list of open shards for one or several sources. If the control plane is not able to find any
        /// for a source, it will pick a pair of leader-follower ingesters and will open a new shard.
        pub async fn get_or_create_open_shards(
            &mut self,
            request: impl tonic::IntoRequest<super::GetOrCreateOpenShardsRequest>,
        ) -> std::result::Result<
            tonic::Response<super::GetOrCreateOpenShardsResponse>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/quickwit.control_plane.ControlPlaneService/GetOrCreateOpenShards",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new(
                        "quickwit.control_plane.ControlPlaneService",
                        "GetOrCreateOpenShards",
                    ),
                );
            self.inner.unary(req, path, codec).await
        }
        /// Asks the control plane whether the shards listed in the request should be deleted or truncated.
        pub async fn advise_reset_shards(
            &mut self,
            request: impl tonic::IntoRequest<super::AdviseResetShardsRequest>,
        ) -> std::result::Result<
            tonic::Response<super::AdviseResetShardsResponse>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/quickwit.control_plane.ControlPlaneService/AdviseResetShards",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new(
                        "quickwit.control_plane.ControlPlaneService",
                        "AdviseResetShards",
                    ),
                );
            self.inner.unary(req, path, codec).await
        }
        /// Performs a debounced shard pruning request to the metastore.
        pub async fn prune_shards(
            &mut self,
            request: impl tonic::IntoRequest<super::super::metastore::PruneShardsRequest>,
        ) -> std::result::Result<
            tonic::Response<super::super::metastore::EmptyResponse>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/quickwit.control_plane.ControlPlaneService/PruneShards",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new(
                        "quickwit.control_plane.ControlPlaneService",
                        "PruneShards",
                    ),
                );
            self.inner.unary(req, path, codec).await
        }
    }
}
/// Generated server implementations.
pub mod control_plane_service_grpc_server {
    #![allow(
        unused_variables,
        dead_code,
        missing_docs,
        clippy::wildcard_imports,
        clippy::let_unit_value,
    )]
    use tonic::codegen::*;
    /// Generated trait containing gRPC methods that should be implemented for use with ControlPlaneServiceGrpcServer.
    #[async_trait]
    pub trait ControlPlaneServiceGrpc: std::marker::Send + std::marker::Sync + 'static {
        /// Creates a new index.
        async fn create_index(
            &self,
            request: tonic::Request<super::super::metastore::CreateIndexRequest>,
        ) -> std::result::Result<
            tonic::Response<super::super::metastore::CreateIndexResponse>,
            tonic::Status,
        >;
        /// Updates an index.
        async fn update_index(
            &self,
            request: tonic::Request<super::super::metastore::UpdateIndexRequest>,
        ) -> std::result::Result<
            tonic::Response<super::super::metastore::IndexMetadataResponse>,
            tonic::Status,
        >;
        /// Deletes an index.
        async fn delete_index(
            &self,
            request: tonic::Request<super::super::metastore::DeleteIndexRequest>,
        ) -> std::result::Result<
            tonic::Response<super::super::metastore::EmptyResponse>,
            tonic::Status,
        >;
        /// Adds a source to an index.
        async fn add_source(
            &self,
            request: tonic::Request<super::super::metastore::AddSourceRequest>,
        ) -> std::result::Result<
            tonic::Response<super::super::metastore::EmptyResponse>,
            tonic::Status,
        >;
        /// Update a source.
        async fn update_source(
            &self,
            request: tonic::Request<super::super::metastore::UpdateSourceRequest>,
        ) -> std::result::Result<
            tonic::Response<super::super::metastore::EmptyResponse>,
            tonic::Status,
        >;
        /// Enables or disables a source.
        async fn toggle_source(
            &self,
            request: tonic::Request<super::super::metastore::ToggleSourceRequest>,
        ) -> std::result::Result<
            tonic::Response<super::super::metastore::EmptyResponse>,
            tonic::Status,
        >;
        /// Removes a source from an index.
        async fn delete_source(
            &self,
            request: tonic::Request<super::super::metastore::DeleteSourceRequest>,
        ) -> std::result::Result<
            tonic::Response<super::super::metastore::EmptyResponse>,
            tonic::Status,
        >;
        /// Returns the list of open shards for one or several sources. If the control plane is not able to find any
        /// for a source, it will pick a pair of leader-follower ingesters and will open a new shard.
        async fn get_or_create_open_shards(
            &self,
            request: tonic::Request<super::GetOrCreateOpenShardsRequest>,
        ) -> std::result::Result<
            tonic::Response<super::GetOrCreateOpenShardsResponse>,
            tonic::Status,
        >;
        /// Asks the control plane whether the shards listed in the request should be deleted or truncated.
        async fn advise_reset_shards(
            &self,
            request: tonic::Request<super::AdviseResetShardsRequest>,
        ) -> std::result::Result<
            tonic::Response<super::AdviseResetShardsResponse>,
            tonic::Status,
        >;
        /// Performs a debounced shard pruning request to the metastore.
        async fn prune_shards(
            &self,
            request: tonic::Request<super::super::metastore::PruneShardsRequest>,
        ) -> std::result::Result<
            tonic::Response<super::super::metastore::EmptyResponse>,
            tonic::Status,
        >;
    }
    #[derive(Debug)]
    pub struct ControlPlaneServiceGrpcServer<T> {
        inner: Arc<T>,
        accept_compression_encodings: EnabledCompressionEncodings,
        send_compression_encodings: EnabledCompressionEncodings,
        max_decoding_message_size: Option<usize>,
        max_encoding_message_size: Option<usize>,
    }
    impl<T> ControlPlaneServiceGrpcServer<T> {
        pub fn new(inner: T) -> Self {
            Self::from_arc(Arc::new(inner))
        }
        pub fn from_arc(inner: Arc<T>) -> Self {
            Self {
                inner,
                accept_compression_encodings: Default::default(),
                send_compression_encodings: Default::default(),
                max_decoding_message_size: None,
                max_encoding_message_size: None,
            }
        }
        pub fn with_interceptor<F>(
            inner: T,
            interceptor: F,
        ) -> InterceptedService<Self, F>
        where
            F: tonic::service::Interceptor,
        {
            InterceptedService::new(Self::new(inner), interceptor)
        }
        /// Enable decompressing requests with the given encoding.
        #[must_use]
        pub fn accept_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.accept_compression_encodings.enable(encoding);
            self
        }
        /// Compress responses with the given encoding, if the client supports it.
        #[must_use]
        pub fn send_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.send_compression_encodings.enable(encoding);
            self
        }
        /// Limits the maximum size of a decoded message.
        ///
        /// Default: `4MB`
        #[must_use]
        pub fn max_decoding_message_size(mut self, limit: usize) -> Self {
            self.max_decoding_message_size = Some(limit);
            self
        }
        /// Limits the maximum size of an encoded message.
        ///
        /// Default: `usize::MAX`
        #[must_use]
        pub fn max_encoding_message_size(mut self, limit: usize) -> Self {
            self.max_encoding_message_size = Some(limit);
            self
        }
    }
    impl<T, B> tonic::codegen::Service<http::Request<B>>
    for ControlPlaneServiceGrpcServer<T>
    where
        T: ControlPlaneServiceGrpc,
        B: Body + std::marker::Send + 'static,
        B::Error: Into<StdError> + std::marker::Send + 'static,
    {
        type Response = http::Response<tonic::body::Body>;
        type Error = std::convert::Infallible;
        type Future = BoxFuture<Self::Response, Self::Error>;
        fn poll_ready(
            &mut self,
            _cx: &mut Context<'_>,
        ) -> Poll<std::result::Result<(), Self::Error>> {
            Poll::Ready(Ok(()))
        }
        fn call(&mut self, req: http::Request<B>) -> Self::Future {
            match req.uri().path() {
                "/quickwit.control_plane.ControlPlaneService/CreateIndex" => {
                    #[allow(non_camel_case_types)]
                    struct CreateIndexSvc<T: ControlPlaneServiceGrpc>(pub Arc<T>);
                    impl<
                        T: ControlPlaneServiceGrpc,
                    > tonic::server::UnaryService<
                        super::super::metastore::CreateIndexRequest,
                    > for CreateIndexSvc<T> {
                        type Response = super::super::metastore::CreateIndexResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<
                                super::super::metastore::CreateIndexRequest,
                            >,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as ControlPlaneServiceGrpc>::create_index(
                                        &inner,
                                        request,
                                    )
                                    .await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = CreateIndexSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/quickwit.control_plane.ControlPlaneService/UpdateIndex" => {
                    #[allow(non_camel_case_types)]
                    struct UpdateIndexSvc<T: ControlPlaneServiceGrpc>(pub Arc<T>);
                    impl<
                        T: ControlPlaneServiceGrpc,
                    > tonic::server::UnaryService<
                        super::super::metastore::UpdateIndexRequest,
                    > for UpdateIndexSvc<T> {
                        type Response = super::super::metastore::IndexMetadataResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<
                                super::super::metastore::UpdateIndexRequest,
                            >,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as ControlPlaneServiceGrpc>::update_index(
                                        &inner,
                                        request,
                                    )
                                    .await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = UpdateIndexSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/quickwit.control_plane.ControlPlaneService/DeleteIndex" => {
                    #[allow(non_camel_case_types)]
                    struct DeleteIndexSvc<T: ControlPlaneServiceGrpc>(pub Arc<T>);
                    impl<
                        T: ControlPlaneServiceGrpc,
                    > tonic::server::UnaryService<
                        super::super::metastore::DeleteIndexRequest,
                    > for DeleteIndexSvc<T> {
                        type Response = super::super::metastore::EmptyResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<
                                super::super::metastore::DeleteIndexRequest,
                            >,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as ControlPlaneServiceGrpc>::delete_index(
                                        &inner,
                                        request,
                                    )
                                    .await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = DeleteIndexSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/quickwit.control_plane.ControlPlaneService/AddSource" => {
                    #[allow(non_camel_case_types)]
                    struct AddSourceSvc<T: ControlPlaneServiceGrpc>(pub Arc<T>);
                    impl<
                        T: ControlPlaneServiceGrpc,
                    > tonic::server::UnaryService<
                        super::super::metastore::AddSourceRequest,
                    > for AddSourceSvc<T> {
                        type Response = super::super::metastore::EmptyResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<
                                super::super::metastore::AddSourceRequest,
                            >,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as ControlPlaneServiceGrpc>::add_source(&inner, request)
                                    .await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = AddSourceSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/quickwit.control_plane.ControlPlaneService/UpdateSource" => {
                    #[allow(non_camel_case_types)]
                    struct UpdateSourceSvc<T: ControlPlaneServiceGrpc>(pub Arc<T>);
                    impl<
                        T: ControlPlaneServiceGrpc,
                    > tonic::server::UnaryService<
                        super::super::metastore::UpdateSourceRequest,
                    > for UpdateSourceSvc<T> {
                        type Response = super::super::metastore::EmptyResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<
                                super::super::metastore::UpdateSourceRequest,
                            >,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as ControlPlaneServiceGrpc>::update_source(
                                        &inner,
                                        request,
                                    )
                                    .await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = UpdateSourceSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/quickwit.control_plane.ControlPlaneService/ToggleSource" => {
                    #[allow(non_camel_case_types)]
                    struct ToggleSourceSvc<T: ControlPlaneServiceGrpc>(pub Arc<T>);
                    impl<
                        T: ControlPlaneServiceGrpc,
                    > tonic::server::UnaryService<
                        super::super::metastore::ToggleSourceRequest,
                    > for ToggleSourceSvc<T> {
                        type Response = super::super::metastore::EmptyResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<
                                super::super::metastore::ToggleSourceRequest,
                            >,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as ControlPlaneServiceGrpc>::toggle_source(
                                        &inner,
                                        request,
                                    )
                                    .await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = ToggleSourceSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/quickwit.control_plane.ControlPlaneService/DeleteSource" => {
                    #[allow(non_camel_case_types)]
                    struct DeleteSourceSvc<T: ControlPlaneServiceGrpc>(pub Arc<T>);
                    impl<
                        T: ControlPlaneServiceGrpc,
                    > tonic::server::UnaryService<
                        super::super::metastore::DeleteSourceRequest,
                    > for DeleteSourceSvc<T> {
                        type Response = super::super::metastore::EmptyResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<
                                super::super::metastore::DeleteSourceRequest,
                            >,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as ControlPlaneServiceGrpc>::delete_source(
                                        &inner,
                                        request,
                                    )
                                    .await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = DeleteSourceSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/quickwit.control_plane.ControlPlaneService/GetOrCreateOpenShards" => {
                    #[allow(non_camel_case_types)]
                    struct GetOrCreateOpenShardsSvc<T: ControlPlaneServiceGrpc>(
                        pub Arc<T>,
                    );
                    impl<
                        T: ControlPlaneServiceGrpc,
                    > tonic::server::UnaryService<super::GetOrCreateOpenShardsRequest>
                    for GetOrCreateOpenShardsSvc<T> {
                        type Response = super::GetOrCreateOpenShardsResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::GetOrCreateOpenShardsRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as ControlPlaneServiceGrpc>::get_or_create_open_shards(
                                        &inner,
                                        request,
                                    )
                                    .await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = GetOrCreateOpenShardsSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/quickwit.control_plane.ControlPlaneService/AdviseResetShards" => {
                    #[allow(non_camel_case_types)]
                    struct AdviseResetShardsSvc<T: ControlPlaneServiceGrpc>(pub Arc<T>);
                    impl<
                        T: ControlPlaneServiceGrpc,
                    > tonic::server::UnaryService<super::AdviseResetShardsRequest>
                    for AdviseResetShardsSvc<T> {
                        type Response = super::AdviseResetShardsResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::AdviseResetShardsRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as ControlPlaneServiceGrpc>::advise_reset_shards(
                                        &inner,
                                        request,
                                    )
                                    .await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = AdviseResetShardsSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/quickwit.control_plane.ControlPlaneService/PruneShards" => {
                    #[allow(non_camel_case_types)]
                    struct PruneShardsSvc<T: ControlPlaneServiceGrpc>(pub Arc<T>);
                    impl<
                        T: ControlPlaneServiceGrpc,
                    > tonic::server::UnaryService<
                        super::super::metastore::PruneShardsRequest,
                    > for PruneShardsSvc<T> {
                        type Response = super::super::metastore::EmptyResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<
                                super::super::metastore::PruneShardsRequest,
                            >,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as ControlPlaneServiceGrpc>::prune_shards(
                                        &inner,
                                        request,
                                    )
                                    .await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = PruneShardsSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                _ => {
                    Box::pin(async move {
                        let mut response = http::Response::new(
                            tonic::body::Body::default(),
                        );
                        let headers = response.headers_mut();
                        headers
                            .insert(
                                tonic::Status::GRPC_STATUS,
                                (tonic::Code::Unimplemented as i32).into(),
                            );
                        headers
                            .insert(
                                http::header::CONTENT_TYPE,
                                tonic::metadata::GRPC_CONTENT_TYPE,
                            );
                        Ok(response)
                    })
                }
            }
        }
    }
    impl<T> Clone for ControlPlaneServiceGrpcServer<T> {
        fn clone(&self) -> Self {
            let inner = self.inner.clone();
            Self {
                inner,
                accept_compression_encodings: self.accept_compression_encodings,
                send_compression_encodings: self.send_compression_encodings,
                max_decoding_message_size: self.max_decoding_message_size,
                max_encoding_message_size: self.max_encoding_message_size,
            }
        }
    }
    /// Generated gRPC service name
    pub const SERVICE_NAME: &str = "quickwit.control_plane.ControlPlaneService";
    impl<T> tonic::server::NamedService for ControlPlaneServiceGrpcServer<T> {
        const NAME: &'static str = SERVICE_NAME;
    }
}


================================================
FILE: quickwit/quickwit-proto/src/codegen/quickwit/quickwit.developer.rs
================================================
// This file is @generated by prost-build.
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct GetDebugInfoRequest {
    /// Restricts the debug info to the given roles.
    #[prost(string, repeated, tag = "1")]
    pub roles: ::prost::alloc::vec::Vec<::prost::alloc::string::String>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct GetDebugInfoResponse {
    #[prost(bytes = "bytes", tag = "1")]
    pub debug_info_json: ::prost::bytes::Bytes,
}
/// BEGIN quickwit-codegen
#[allow(unused_imports)]
use std::str::FromStr;
use tower::{Layer, Service, ServiceExt};
use quickwit_common::tower::RpcName;
impl RpcName for GetDebugInfoRequest {
    fn rpc_name() -> &'static str {
        "get_debug_info"
    }
}
#[cfg_attr(any(test, feature = "testsuite"), mockall::automock)]
#[async_trait::async_trait]
pub trait DeveloperService: std::fmt::Debug + Send + Sync + 'static {
    async fn get_debug_info(
        &self,
        request: GetDebugInfoRequest,
    ) -> crate::developer::DeveloperResult<GetDebugInfoResponse>;
}
#[derive(Debug, Clone)]
pub struct DeveloperServiceClient {
    inner: InnerDeveloperServiceClient,
}
#[derive(Debug, Clone)]
struct InnerDeveloperServiceClient(std::sync::Arc<dyn DeveloperService>);
impl DeveloperServiceClient {
    pub fn new<T>(instance: T) -> Self
    where
        T: DeveloperService,
    {
        #[cfg(any(test, feature = "testsuite"))]
        assert!(
            std::any::TypeId::of:: < T > () != std::any::TypeId::of:: <
            MockDeveloperService > (),
            "`MockDeveloperService` must be wrapped in a `MockDeveloperServiceWrapper`: use `DeveloperServiceClient::from_mock(mock)` to instantiate the client"
        );
        Self {
            inner: InnerDeveloperServiceClient(std::sync::Arc::new(instance)),
        }
    }
    pub fn as_grpc_service(
        &self,
        max_message_size: bytesize::ByteSize,
    ) -> developer_service_grpc_server::DeveloperServiceGrpcServer<
        DeveloperServiceGrpcServerAdapter,
    > {
        let adapter = DeveloperServiceGrpcServerAdapter::new(self.clone());
        developer_service_grpc_server::DeveloperServiceGrpcServer::new(adapter)
            .accept_compressed(tonic::codec::CompressionEncoding::Gzip)
            .accept_compressed(tonic::codec::CompressionEncoding::Zstd)
            .send_compressed(tonic::codec::CompressionEncoding::Gzip)
            .send_compressed(tonic::codec::CompressionEncoding::Zstd)
            .max_decoding_message_size(max_message_size.0 as usize)
            .max_encoding_message_size(max_message_size.0 as usize)
    }
    pub fn from_channel(
        addr: std::net::SocketAddr,
        channel: tonic::transport::Channel,
        max_message_size: bytesize::ByteSize,
        compression_encoding_opt: Option<tonic::codec::CompressionEncoding>,
    ) -> Self {
        let (_, connection_keys_watcher) = tokio::sync::watch::channel(
            std::collections::HashSet::from_iter([addr]),
        );
        let mut client = developer_service_grpc_client::DeveloperServiceGrpcClient::new(
                channel,
            )
            .max_decoding_message_size(max_message_size.0 as usize)
            .max_encoding_message_size(max_message_size.0 as usize);
        if let Some(compression_encoding) = compression_encoding_opt {
            client = client
                .accept_compressed(compression_encoding)
                .send_compressed(compression_encoding);
        }
        let adapter = DeveloperServiceGrpcClientAdapter::new(
            client,
            connection_keys_watcher,
        );
        Self::new(adapter)
    }
    pub fn from_balance_channel(
        balance_channel: quickwit_common::tower::BalanceChannel<std::net::SocketAddr>,
        max_message_size: bytesize::ByteSize,
        compression_encoding_opt: Option<tonic::codec::CompressionEncoding>,
    ) -> DeveloperServiceClient {
        let connection_keys_watcher = balance_channel.connection_keys_watcher();
        let mut client = developer_service_grpc_client::DeveloperServiceGrpcClient::new(
                balance_channel,
            )
            .max_decoding_message_size(max_message_size.0 as usize)
            .max_encoding_message_size(max_message_size.0 as usize);
        if let Some(compression_encoding) = compression_encoding_opt {
            client = client
                .accept_compressed(compression_encoding)
                .send_compressed(compression_encoding);
        }
        let adapter = DeveloperServiceGrpcClientAdapter::new(
            client,
            connection_keys_watcher,
        );
        Self::new(adapter)
    }
    pub fn from_mailbox<A>(mailbox: quickwit_actors::Mailbox<A>) -> Self
    where
        A: quickwit_actors::Actor + std::fmt::Debug + Send + 'static,
        DeveloperServiceMailbox<A>: DeveloperService,
    {
        DeveloperServiceClient::new(DeveloperServiceMailbox::new(mailbox))
    }
    pub fn tower() -> DeveloperServiceTowerLayerStack {
        DeveloperServiceTowerLayerStack::default()
    }
    #[cfg(any(test, feature = "testsuite"))]
    pub fn from_mock(mock: MockDeveloperService) -> Self {
        let mock_wrapper = mock_developer_service::MockDeveloperServiceWrapper {
            inner: tokio::sync::Mutex::new(mock),
        };
        Self::new(mock_wrapper)
    }
    #[cfg(any(test, feature = "testsuite"))]
    pub fn mocked() -> Self {
        Self::from_mock(MockDeveloperService::new())
    }
}
#[async_trait::async_trait]
impl DeveloperService for DeveloperServiceClient {
    async fn get_debug_info(
        &self,
        request: GetDebugInfoRequest,
    ) -> crate::developer::DeveloperResult<GetDebugInfoResponse> {
        self.inner.0.get_debug_info(request).await
    }
}
#[cfg(any(test, feature = "testsuite"))]
pub mod mock_developer_service {
    use super::*;
    #[derive(Debug)]
    pub struct MockDeveloperServiceWrapper {
        pub(super) inner: tokio::sync::Mutex<MockDeveloperService>,
    }
    #[async_trait::async_trait]
    impl DeveloperService for MockDeveloperServiceWrapper {
        async fn get_debug_info(
            &self,
            request: super::GetDebugInfoRequest,
        ) -> crate::developer::DeveloperResult<super::GetDebugInfoResponse> {
            self.inner.lock().await.get_debug_info(request).await
        }
    }
}
pub type BoxFuture<T, E> = std::pin::Pin<
    Box<dyn std::future::Future<Output = Result<T, E>> + Send + 'static>,
>;
impl tower::Service<GetDebugInfoRequest> for InnerDeveloperServiceClient {
    type Response = GetDebugInfoResponse;
    type Error = crate::developer::DeveloperError;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, request: GetDebugInfoRequest) -> Self::Future {
        let svc = self.clone();
        let fut = async move { svc.0.get_debug_info(request).await };
        Box::pin(fut)
    }
}
/// A tower service stack is a set of tower services.
#[derive(Debug)]
struct DeveloperServiceTowerServiceStack {
    #[allow(dead_code)]
    inner: InnerDeveloperServiceClient,
    get_debug_info_svc: quickwit_common::tower::BoxService<
        GetDebugInfoRequest,
        GetDebugInfoResponse,
        crate::developer::DeveloperError,
    >,
}
#[async_trait::async_trait]
impl DeveloperService for DeveloperServiceTowerServiceStack {
    async fn get_debug_info(
        &self,
        request: GetDebugInfoRequest,
    ) -> crate::developer::DeveloperResult<GetDebugInfoResponse> {
        self.get_debug_info_svc.clone().ready().await?.call(request).await
    }
}
type GetDebugInfoLayer = quickwit_common::tower::BoxLayer<
    quickwit_common::tower::BoxService<
        GetDebugInfoRequest,
        GetDebugInfoResponse,
        crate::developer::DeveloperError,
    >,
    GetDebugInfoRequest,
    GetDebugInfoResponse,
    crate::developer::DeveloperError,
>;
#[derive(Debug, Default)]
pub struct DeveloperServiceTowerLayerStack {
    get_debug_info_layers: Vec<GetDebugInfoLayer>,
}
impl DeveloperServiceTowerLayerStack {
    pub fn stack_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    GetDebugInfoRequest,
                    GetDebugInfoResponse,
                    crate::developer::DeveloperError,
                >,
            > + Clone + Send + Sync + 'static,
        <L as tower::Layer<
            quickwit_common::tower::BoxService<
                GetDebugInfoRequest,
                GetDebugInfoResponse,
                crate::developer::DeveloperError,
            >,
        >>::Service: tower::Service<
                GetDebugInfoRequest,
                Response = GetDebugInfoResponse,
                Error = crate::developer::DeveloperError,
            > + Clone + Send + Sync + 'static,
        <<L as tower::Layer<
            quickwit_common::tower::BoxService<
                GetDebugInfoRequest,
                GetDebugInfoResponse,
                crate::developer::DeveloperError,
            >,
        >>::Service as tower::Service<GetDebugInfoRequest>>::Future: Send + 'static,
    {
        self.get_debug_info_layers
            .push(quickwit_common::tower::BoxLayer::new(layer.clone()));
        self
    }
    pub fn stack_get_debug_info_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    GetDebugInfoRequest,
                    GetDebugInfoResponse,
                    crate::developer::DeveloperError,
                >,
            > + Send + Sync + 'static,
        L::Service: tower::Service<
                GetDebugInfoRequest,
                Response = GetDebugInfoResponse,
                Error = crate::developer::DeveloperError,
            > + Clone + Send + Sync + 'static,
        <L::Service as tower::Service<GetDebugInfoRequest>>::Future: Send + 'static,
    {
        self.get_debug_info_layers.push(quickwit_common::tower::BoxLayer::new(layer));
        self
    }
    pub fn build<T>(self, instance: T) -> DeveloperServiceClient
    where
        T: DeveloperService,
    {
        let inner_client = InnerDeveloperServiceClient(std::sync::Arc::new(instance));
        self.build_from_inner_client(inner_client)
    }
    pub fn build_from_channel(
        self,
        addr: std::net::SocketAddr,
        channel: tonic::transport::Channel,
        max_message_size: bytesize::ByteSize,
        compression_encoding_opt: Option<tonic::codec::CompressionEncoding>,
    ) -> DeveloperServiceClient {
        let client = DeveloperServiceClient::from_channel(
            addr,
            channel,
            max_message_size,
            compression_encoding_opt,
        );
        let inner_client = client.inner;
        self.build_from_inner_client(inner_client)
    }
    pub fn build_from_balance_channel(
        self,
        balance_channel: quickwit_common::tower::BalanceChannel<std::net::SocketAddr>,
        max_message_size: bytesize::ByteSize,
        compression_encoding_opt: Option<tonic::codec::CompressionEncoding>,
    ) -> DeveloperServiceClient {
        let client = DeveloperServiceClient::from_balance_channel(
            balance_channel,
            max_message_size,
            compression_encoding_opt,
        );
        let inner_client = client.inner;
        self.build_from_inner_client(inner_client)
    }
    pub fn build_from_mailbox<A>(
        self,
        mailbox: quickwit_actors::Mailbox<A>,
    ) -> DeveloperServiceClient
    where
        A: quickwit_actors::Actor + std::fmt::Debug + Send + 'static,
        DeveloperServiceMailbox<A>: DeveloperService,
    {
        let inner_client = InnerDeveloperServiceClient(
            std::sync::Arc::new(DeveloperServiceMailbox::new(mailbox)),
        );
        self.build_from_inner_client(inner_client)
    }
    #[cfg(any(test, feature = "testsuite"))]
    pub fn build_from_mock(self, mock: MockDeveloperService) -> DeveloperServiceClient {
        let client = DeveloperServiceClient::from_mock(mock);
        let inner_client = client.inner;
        self.build_from_inner_client(inner_client)
    }
    fn build_from_inner_client(
        self,
        inner_client: InnerDeveloperServiceClient,
    ) -> DeveloperServiceClient {
        let get_debug_info_svc = self
            .get_debug_info_layers
            .into_iter()
            .rev()
            .fold(
                quickwit_common::tower::BoxService::new(inner_client.clone()),
                |svc, layer| layer.layer(svc),
            );
        let tower_svc_stack = DeveloperServiceTowerServiceStack {
            inner: inner_client,
            get_debug_info_svc,
        };
        DeveloperServiceClient::new(tower_svc_stack)
    }
}
#[derive(Debug, Clone)]
struct MailboxAdapter<A: quickwit_actors::Actor, E> {
    inner: quickwit_actors::Mailbox<A>,
    phantom: std::marker::PhantomData<E>,
}
impl<A, E> std::ops::Deref for MailboxAdapter<A, E>
where
    A: quickwit_actors::Actor,
{
    type Target = quickwit_actors::Mailbox<A>;
    fn deref(&self) -> &Self::Target {
        &self.inner
    }
}
#[derive(Debug)]
pub struct DeveloperServiceMailbox<A: quickwit_actors::Actor> {
    inner: MailboxAdapter<A, crate::developer::DeveloperError>,
}
impl<A: quickwit_actors::Actor> DeveloperServiceMailbox<A> {
    pub fn new(instance: quickwit_actors::Mailbox<A>) -> Self {
        let inner = MailboxAdapter {
            inner: instance,
            phantom: std::marker::PhantomData,
        };
        Self { inner }
    }
}
impl<A: quickwit_actors::Actor> Clone for DeveloperServiceMailbox<A> {
    fn clone(&self) -> Self {
        let inner = MailboxAdapter {
            inner: self.inner.clone(),
            phantom: std::marker::PhantomData,
        };
        Self { inner }
    }
}
impl<A, M, T, E> tower::Service<M> for DeveloperServiceMailbox<A>
where
    A: quickwit_actors::Actor
        + quickwit_actors::DeferableReplyHandler<M, Reply = Result<T, E>> + Send
        + 'static,
    M: std::fmt::Debug + Send + 'static,
    T: Send + 'static,
    E: std::fmt::Debug + Send + 'static,
    crate::developer::DeveloperError: From<quickwit_actors::AskError<E>>,
{
    type Response = T;
    type Error = crate::developer::DeveloperError;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        //! This does not work with balance middlewares such as `tower::balance::pool::Pool` because
        //! this always returns `Poll::Ready`. The fix is to acquire a permit from the
        //! mailbox in `poll_ready` and consume it in `call`.
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, message: M) -> Self::Future {
        let mailbox = self.inner.clone();
        let fut = async move {
            mailbox.ask_for_res(message).await.map_err(|error| error.into())
        };
        Box::pin(fut)
    }
}
#[async_trait::async_trait]
impl<A> DeveloperService for DeveloperServiceMailbox<A>
where
    A: quickwit_actors::Actor + std::fmt::Debug,
    DeveloperServiceMailbox<
        A,
    >: tower::Service<
        GetDebugInfoRequest,
        Response = GetDebugInfoResponse,
        Error = crate::developer::DeveloperError,
        Future = BoxFuture<GetDebugInfoResponse, crate::developer::DeveloperError>,
    >,
{
    async fn get_debug_info(
        &self,
        request: GetDebugInfoRequest,
    ) -> crate::developer::DeveloperResult<GetDebugInfoResponse> {
        self.clone().call(request).await
    }
}
#[derive(Debug, Clone)]
pub struct DeveloperServiceGrpcClientAdapter<T> {
    inner: T,
    #[allow(dead_code)]
    connection_addrs_rx: tokio::sync::watch::Receiver<
        std::collections::HashSet<std::net::SocketAddr>,
    >,
}
impl<T> DeveloperServiceGrpcClientAdapter<T> {
    pub fn new(
        instance: T,
        connection_addrs_rx: tokio::sync::watch::Receiver<
            std::collections::HashSet<std::net::SocketAddr>,
        >,
    ) -> Self {
        Self {
            inner: instance,
            connection_addrs_rx,
        }
    }
}
#[async_trait::async_trait]
impl<T> DeveloperService
for DeveloperServiceGrpcClientAdapter<
    developer_service_grpc_client::DeveloperServiceGrpcClient<T>,
>
where
    T: tonic::client::GrpcService<tonic::body::Body> + std::fmt::Debug + Clone + Send
        + Sync + 'static,
    T::ResponseBody: tonic::codegen::Body<Data = tonic::codegen::Bytes> + Send + 'static,
    <T::ResponseBody as tonic::codegen::Body>::Error: Into<tonic::codegen::StdError>
        + Send,
    T::Future: Send,
{
    async fn get_debug_info(
        &self,
        request: GetDebugInfoRequest,
    ) -> crate::developer::DeveloperResult<GetDebugInfoResponse> {
        self.inner
            .clone()
            .get_debug_info(request)
            .await
            .map(|response| response.into_inner())
            .map_err(|status| crate::error::grpc_status_to_service_error(
                status,
                GetDebugInfoRequest::rpc_name(),
            ))
    }
}
#[derive(Debug)]
pub struct DeveloperServiceGrpcServerAdapter {
    inner: InnerDeveloperServiceClient,
}
impl DeveloperServiceGrpcServerAdapter {
    pub fn new<T>(instance: T) -> Self
    where
        T: DeveloperService,
    {
        Self {
            inner: InnerDeveloperServiceClient(std::sync::Arc::new(instance)),
        }
    }
}
#[async_trait::async_trait]
impl developer_service_grpc_server::DeveloperServiceGrpc
for DeveloperServiceGrpcServerAdapter {
    async fn get_debug_info(
        &self,
        request: tonic::Request<GetDebugInfoRequest>,
    ) -> Result<tonic::Response<GetDebugInfoResponse>, tonic::Status> {
        self.inner
            .0
            .get_debug_info(request.into_inner())
            .await
            .map(tonic::Response::new)
            .map_err(crate::error::grpc_error_to_grpc_status)
    }
}
/// Generated client implementations.
pub mod developer_service_grpc_client {
    #![allow(
        unused_variables,
        dead_code,
        missing_docs,
        clippy::wildcard_imports,
        clippy::let_unit_value,
    )]
    use tonic::codegen::*;
    use tonic::codegen::http::Uri;
    #[derive(Debug, Clone)]
    pub struct DeveloperServiceGrpcClient<T> {
        inner: tonic::client::Grpc<T>,
    }
    impl DeveloperServiceGrpcClient<tonic::transport::Channel> {
        /// Attempt to create a new client by connecting to a given endpoint.
        pub async fn connect<D>(dst: D) -> Result<Self, tonic::transport::Error>
        where
            D: TryInto<tonic::transport::Endpoint>,
            D::Error: Into<StdError>,
        {
            let conn = tonic::transport::Endpoint::new(dst)?.connect().await?;
            Ok(Self::new(conn))
        }
    }
    impl<T> DeveloperServiceGrpcClient<T>
    where
        T: tonic::client::GrpcService<tonic::body::Body>,
        T::Error: Into<StdError>,
        T::ResponseBody: Body<Data = Bytes> + std::marker::Send + 'static,
        <T::ResponseBody as Body>::Error: Into<StdError> + std::marker::Send,
    {
        pub fn new(inner: T) -> Self {
            let inner = tonic::client::Grpc::new(inner);
            Self { inner }
        }
        pub fn with_origin(inner: T, origin: Uri) -> Self {
            let inner = tonic::client::Grpc::with_origin(inner, origin);
            Self { inner }
        }
        pub fn with_interceptor<F>(
            inner: T,
            interceptor: F,
        ) -> DeveloperServiceGrpcClient<InterceptedService<T, F>>
        where
            F: tonic::service::Interceptor,
            T::ResponseBody: Default,
            T: tonic::codegen::Service<
                http::Request<tonic::body::Body>,
                Response = http::Response<
                    <T as tonic::client::GrpcService<tonic::body::Body>>::ResponseBody,
                >,
            >,
            <T as tonic::codegen::Service<
                http::Request<tonic::body::Body>,
            >>::Error: Into<StdError> + std::marker::Send + std::marker::Sync,
        {
            DeveloperServiceGrpcClient::new(InterceptedService::new(inner, interceptor))
        }
        /// Compress requests with the given encoding.
        ///
        /// This requires the server to support it otherwise it might respond with an
        /// error.
        #[must_use]
        pub fn send_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.inner = self.inner.send_compressed(encoding);
            self
        }
        /// Enable decompressing responses.
        #[must_use]
        pub fn accept_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.inner = self.inner.accept_compressed(encoding);
            self
        }
        /// Limits the maximum size of a decoded message.
        ///
        /// Default: `4MB`
        #[must_use]
        pub fn max_decoding_message_size(mut self, limit: usize) -> Self {
            self.inner = self.inner.max_decoding_message_size(limit);
            self
        }
        /// Limits the maximum size of an encoded message.
        ///
        /// Default: `usize::MAX`
        #[must_use]
        pub fn max_encoding_message_size(mut self, limit: usize) -> Self {
            self.inner = self.inner.max_encoding_message_size(limit);
            self
        }
        pub async fn get_debug_info(
            &mut self,
            request: impl tonic::IntoRequest<super::GetDebugInfoRequest>,
        ) -> std::result::Result<
            tonic::Response<super::GetDebugInfoResponse>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/quickwit.developer.DeveloperService/GetDebugInfo",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new(
                        "quickwit.developer.DeveloperService",
                        "GetDebugInfo",
                    ),
                );
            self.inner.unary(req, path, codec).await
        }
    }
}
/// Generated server implementations.
pub mod developer_service_grpc_server {
    #![allow(
        unused_variables,
        dead_code,
        missing_docs,
        clippy::wildcard_imports,
        clippy::let_unit_value,
    )]
    use tonic::codegen::*;
    /// Generated trait containing gRPC methods that should be implemented for use with DeveloperServiceGrpcServer.
    #[async_trait]
    pub trait DeveloperServiceGrpc: std::marker::Send + std::marker::Sync + 'static {
        async fn get_debug_info(
            &self,
            request: tonic::Request<super::GetDebugInfoRequest>,
        ) -> std::result::Result<
            tonic::Response<super::GetDebugInfoResponse>,
            tonic::Status,
        >;
    }
    #[derive(Debug)]
    pub struct DeveloperServiceGrpcServer<T> {
        inner: Arc<T>,
        accept_compression_encodings: EnabledCompressionEncodings,
        send_compression_encodings: EnabledCompressionEncodings,
        max_decoding_message_size: Option<usize>,
        max_encoding_message_size: Option<usize>,
    }
    impl<T> DeveloperServiceGrpcServer<T> {
        pub fn new(inner: T) -> Self {
            Self::from_arc(Arc::new(inner))
        }
        pub fn from_arc(inner: Arc<T>) -> Self {
            Self {
                inner,
                accept_compression_encodings: Default::default(),
                send_compression_encodings: Default::default(),
                max_decoding_message_size: None,
                max_encoding_message_size: None,
            }
        }
        pub fn with_interceptor<F>(
            inner: T,
            interceptor: F,
        ) -> InterceptedService<Self, F>
        where
            F: tonic::service::Interceptor,
        {
            InterceptedService::new(Self::new(inner), interceptor)
        }
        /// Enable decompressing requests with the given encoding.
        #[must_use]
        pub fn accept_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.accept_compression_encodings.enable(encoding);
            self
        }
        /// Compress responses with the given encoding, if the client supports it.
        #[must_use]
        pub fn send_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.send_compression_encodings.enable(encoding);
            self
        }
        /// Limits the maximum size of a decoded message.
        ///
        /// Default: `4MB`
        #[must_use]
        pub fn max_decoding_message_size(mut self, limit: usize) -> Self {
            self.max_decoding_message_size = Some(limit);
            self
        }
        /// Limits the maximum size of an encoded message.
        ///
        /// Default: `usize::MAX`
        #[must_use]
        pub fn max_encoding_message_size(mut self, limit: usize) -> Self {
            self.max_encoding_message_size = Some(limit);
            self
        }
    }
    impl<T, B> tonic::codegen::Service<http::Request<B>>
    for DeveloperServiceGrpcServer<T>
    where
        T: DeveloperServiceGrpc,
        B: Body + std::marker::Send + 'static,
        B::Error: Into<StdError> + std::marker::Send + 'static,
    {
        type Response = http::Response<tonic::body::Body>;
        type Error = std::convert::Infallible;
        type Future = BoxFuture<Self::Response, Self::Error>;
        fn poll_ready(
            &mut self,
            _cx: &mut Context<'_>,
        ) -> Poll<std::result::Result<(), Self::Error>> {
            Poll::Ready(Ok(()))
        }
        fn call(&mut self, req: http::Request<B>) -> Self::Future {
            match req.uri().path() {
                "/quickwit.developer.DeveloperService/GetDebugInfo" => {
                    #[allow(non_camel_case_types)]
                    struct GetDebugInfoSvc<T: DeveloperServiceGrpc>(pub Arc<T>);
                    impl<
                        T: DeveloperServiceGrpc,
                    > tonic::server::UnaryService<super::GetDebugInfoRequest>
                    for GetDebugInfoSvc<T> {
                        type Response = super::GetDebugInfoResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::GetDebugInfoRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as DeveloperServiceGrpc>::get_debug_info(&inner, request)
                                    .await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = GetDebugInfoSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                _ => {
                    Box::pin(async move {
                        let mut response = http::Response::new(
                            tonic::body::Body::default(),
                        );
                        let headers = response.headers_mut();
                        headers
                            .insert(
                                tonic::Status::GRPC_STATUS,
                                (tonic::Code::Unimplemented as i32).into(),
                            );
                        headers
                            .insert(
                                http::header::CONTENT_TYPE,
                                tonic::metadata::GRPC_CONTENT_TYPE,
                            );
                        Ok(response)
                    })
                }
            }
        }
    }
    impl<T> Clone for DeveloperServiceGrpcServer<T> {
        fn clone(&self) -> Self {
            let inner = self.inner.clone();
            Self {
                inner,
                accept_compression_encodings: self.accept_compression_encodings,
                send_compression_encodings: self.send_compression_encodings,
                max_decoding_message_size: self.max_decoding_message_size,
                max_encoding_message_size: self.max_encoding_message_size,
            }
        }
    }
    /// Generated gRPC service name
    pub const SERVICE_NAME: &str = "quickwit.developer.DeveloperService";
    impl<T> tonic::server::NamedService for DeveloperServiceGrpcServer<T> {
        const NAME: &'static str = SERVICE_NAME;
    }
}


================================================
FILE: quickwit/quickwit-proto/src/codegen/quickwit/quickwit.indexing.rs
================================================
// This file is @generated by prost-build.
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct ApplyIndexingPlanRequest {
    #[prost(message, repeated, tag = "1")]
    pub indexing_tasks: ::prost::alloc::vec::Vec<IndexingTask>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct IndexingTask {
    /// The tasks's index UID.
    #[prost(message, optional, tag = "1")]
    pub index_uid: ::core::option::Option<crate::types::IndexUid>,
    /// The task's source ID.
    #[prost(string, tag = "2")]
    pub source_id: ::prost::alloc::string::String,
    /// pipeline id
    #[prost(message, optional, tag = "4")]
    pub pipeline_uid: ::core::option::Option<crate::types::PipelineUid>,
    /// The shards assigned to the indexer.
    #[prost(message, repeated, tag = "3")]
    pub shard_ids: ::prost::alloc::vec::Vec<crate::types::ShardId>,
    /// Fingerprint of the pipeline parameters. Anything that should cause a pipeline restart (such
    /// as updating indexing settings, the doc mapping or the source) should influence this value.
    #[prost(uint64, tag = "6")]
    pub params_fingerprint: u64,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, Copy, PartialEq, Eq, Hash, ::prost::Message)]
pub struct ApplyIndexingPlanResponse {}
/// BEGIN quickwit-codegen
#[allow(unused_imports)]
use std::str::FromStr;
use tower::{Layer, Service, ServiceExt};
#[cfg_attr(any(test, feature = "testsuite"), mockall::automock)]
#[async_trait::async_trait]
pub trait IndexingService: std::fmt::Debug + Send + Sync + 'static {
    ///Apply an indexing plan on the node.
    async fn apply_indexing_plan(
        &self,
        request: ApplyIndexingPlanRequest,
    ) -> crate::indexing::IndexingResult<ApplyIndexingPlanResponse>;
}
#[derive(Debug, Clone)]
pub struct IndexingServiceClient {
    inner: InnerIndexingServiceClient,
}
#[derive(Debug, Clone)]
struct InnerIndexingServiceClient(std::sync::Arc<dyn IndexingService>);
impl IndexingServiceClient {
    pub fn new<T>(instance: T) -> Self
    where
        T: IndexingService,
    {
        #[cfg(any(test, feature = "testsuite"))]
        assert!(
            std::any::TypeId::of:: < T > () != std::any::TypeId::of:: <
            MockIndexingService > (),
            "`MockIndexingService` must be wrapped in a `MockIndexingServiceWrapper`: use `IndexingServiceClient::from_mock(mock)` to instantiate the client"
        );
        Self {
            inner: InnerIndexingServiceClient(std::sync::Arc::new(instance)),
        }
    }
    pub fn as_grpc_service(
        &self,
        max_message_size: bytesize::ByteSize,
    ) -> indexing_service_grpc_server::IndexingServiceGrpcServer<
        IndexingServiceGrpcServerAdapter,
    > {
        let adapter = IndexingServiceGrpcServerAdapter::new(self.clone());
        indexing_service_grpc_server::IndexingServiceGrpcServer::new(adapter)
            .accept_compressed(tonic::codec::CompressionEncoding::Gzip)
            .accept_compressed(tonic::codec::CompressionEncoding::Zstd)
            .send_compressed(tonic::codec::CompressionEncoding::Gzip)
            .send_compressed(tonic::codec::CompressionEncoding::Zstd)
            .max_decoding_message_size(max_message_size.0 as usize)
            .max_encoding_message_size(max_message_size.0 as usize)
    }
    pub fn from_channel(
        addr: std::net::SocketAddr,
        channel: tonic::transport::Channel,
        max_message_size: bytesize::ByteSize,
        compression_encoding_opt: Option<tonic::codec::CompressionEncoding>,
    ) -> Self {
        let (_, connection_keys_watcher) = tokio::sync::watch::channel(
            std::collections::HashSet::from_iter([addr]),
        );
        let mut client = indexing_service_grpc_client::IndexingServiceGrpcClient::new(
                channel,
            )
            .max_decoding_message_size(max_message_size.0 as usize)
            .max_encoding_message_size(max_message_size.0 as usize);
        if let Some(compression_encoding) = compression_encoding_opt {
            client = client
                .accept_compressed(compression_encoding)
                .send_compressed(compression_encoding);
        }
        let adapter = IndexingServiceGrpcClientAdapter::new(
            client,
            connection_keys_watcher,
        );
        Self::new(adapter)
    }
    pub fn from_balance_channel(
        balance_channel: quickwit_common::tower::BalanceChannel<std::net::SocketAddr>,
        max_message_size: bytesize::ByteSize,
        compression_encoding_opt: Option<tonic::codec::CompressionEncoding>,
    ) -> IndexingServiceClient {
        let connection_keys_watcher = balance_channel.connection_keys_watcher();
        let mut client = indexing_service_grpc_client::IndexingServiceGrpcClient::new(
                balance_channel,
            )
            .max_decoding_message_size(max_message_size.0 as usize)
            .max_encoding_message_size(max_message_size.0 as usize);
        if let Some(compression_encoding) = compression_encoding_opt {
            client = client
                .accept_compressed(compression_encoding)
                .send_compressed(compression_encoding);
        }
        let adapter = IndexingServiceGrpcClientAdapter::new(
            client,
            connection_keys_watcher,
        );
        Self::new(adapter)
    }
    pub fn from_mailbox<A>(mailbox: quickwit_actors::Mailbox<A>) -> Self
    where
        A: quickwit_actors::Actor + std::fmt::Debug + Send + 'static,
        IndexingServiceMailbox<A>: IndexingService,
    {
        IndexingServiceClient::new(IndexingServiceMailbox::new(mailbox))
    }
    pub fn tower() -> IndexingServiceTowerLayerStack {
        IndexingServiceTowerLayerStack::default()
    }
    #[cfg(any(test, feature = "testsuite"))]
    pub fn from_mock(mock: MockIndexingService) -> Self {
        let mock_wrapper = mock_indexing_service::MockIndexingServiceWrapper {
            inner: tokio::sync::Mutex::new(mock),
        };
        Self::new(mock_wrapper)
    }
    #[cfg(any(test, feature = "testsuite"))]
    pub fn mocked() -> Self {
        Self::from_mock(MockIndexingService::new())
    }
}
#[async_trait::async_trait]
impl IndexingService for IndexingServiceClient {
    async fn apply_indexing_plan(
        &self,
        request: ApplyIndexingPlanRequest,
    ) -> crate::indexing::IndexingResult<ApplyIndexingPlanResponse> {
        self.inner.0.apply_indexing_plan(request).await
    }
}
#[cfg(any(test, feature = "testsuite"))]
pub mod mock_indexing_service {
    use super::*;
    #[derive(Debug)]
    pub struct MockIndexingServiceWrapper {
        pub(super) inner: tokio::sync::Mutex<MockIndexingService>,
    }
    #[async_trait::async_trait]
    impl IndexingService for MockIndexingServiceWrapper {
        async fn apply_indexing_plan(
            &self,
            request: super::ApplyIndexingPlanRequest,
        ) -> crate::indexing::IndexingResult<super::ApplyIndexingPlanResponse> {
            self.inner.lock().await.apply_indexing_plan(request).await
        }
    }
}
pub type BoxFuture<T, E> = std::pin::Pin<
    Box<dyn std::future::Future<Output = Result<T, E>> + Send + 'static>,
>;
impl tower::Service<ApplyIndexingPlanRequest> for InnerIndexingServiceClient {
    type Response = ApplyIndexingPlanResponse;
    type Error = crate::indexing::IndexingError;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, request: ApplyIndexingPlanRequest) -> Self::Future {
        let svc = self.clone();
        let fut = async move { svc.0.apply_indexing_plan(request).await };
        Box::pin(fut)
    }
}
/// A tower service stack is a set of tower services.
#[derive(Debug)]
struct IndexingServiceTowerServiceStack {
    #[allow(dead_code)]
    inner: InnerIndexingServiceClient,
    apply_indexing_plan_svc: quickwit_common::tower::BoxService<
        ApplyIndexingPlanRequest,
        ApplyIndexingPlanResponse,
        crate::indexing::IndexingError,
    >,
}
#[async_trait::async_trait]
impl IndexingService for IndexingServiceTowerServiceStack {
    async fn apply_indexing_plan(
        &self,
        request: ApplyIndexingPlanRequest,
    ) -> crate::indexing::IndexingResult<ApplyIndexingPlanResponse> {
        self.apply_indexing_plan_svc.clone().ready().await?.call(request).await
    }
}
type ApplyIndexingPlanLayer = quickwit_common::tower::BoxLayer<
    quickwit_common::tower::BoxService<
        ApplyIndexingPlanRequest,
        ApplyIndexingPlanResponse,
        crate::indexing::IndexingError,
    >,
    ApplyIndexingPlanRequest,
    ApplyIndexingPlanResponse,
    crate::indexing::IndexingError,
>;
#[derive(Debug, Default)]
pub struct IndexingServiceTowerLayerStack {
    apply_indexing_plan_layers: Vec<ApplyIndexingPlanLayer>,
}
impl IndexingServiceTowerLayerStack {
    pub fn stack_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    ApplyIndexingPlanRequest,
                    ApplyIndexingPlanResponse,
                    crate::indexing::IndexingError,
                >,
            > + Clone + Send + Sync + 'static,
        <L as tower::Layer<
            quickwit_common::tower::BoxService<
                ApplyIndexingPlanRequest,
                ApplyIndexingPlanResponse,
                crate::indexing::IndexingError,
            >,
        >>::Service: tower::Service<
                ApplyIndexingPlanRequest,
                Response = ApplyIndexingPlanResponse,
                Error = crate::indexing::IndexingError,
            > + Clone + Send + Sync + 'static,
        <<L as tower::Layer<
            quickwit_common::tower::BoxService<
                ApplyIndexingPlanRequest,
                ApplyIndexingPlanResponse,
                crate::indexing::IndexingError,
            >,
        >>::Service as tower::Service<ApplyIndexingPlanRequest>>::Future: Send + 'static,
    {
        self.apply_indexing_plan_layers
            .push(quickwit_common::tower::BoxLayer::new(layer.clone()));
        self
    }
    pub fn stack_apply_indexing_plan_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    ApplyIndexingPlanRequest,
                    ApplyIndexingPlanResponse,
                    crate::indexing::IndexingError,
                >,
            > + Send + Sync + 'static,
        L::Service: tower::Service<
                ApplyIndexingPlanRequest,
                Response = ApplyIndexingPlanResponse,
                Error = crate::indexing::IndexingError,
            > + Clone + Send + Sync + 'static,
        <L::Service as tower::Service<ApplyIndexingPlanRequest>>::Future: Send + 'static,
    {
        self.apply_indexing_plan_layers
            .push(quickwit_common::tower::BoxLayer::new(layer));
        self
    }
    pub fn build<T>(self, instance: T) -> IndexingServiceClient
    where
        T: IndexingService,
    {
        let inner_client = InnerIndexingServiceClient(std::sync::Arc::new(instance));
        self.build_from_inner_client(inner_client)
    }
    pub fn build_from_channel(
        self,
        addr: std::net::SocketAddr,
        channel: tonic::transport::Channel,
        max_message_size: bytesize::ByteSize,
        compression_encoding_opt: Option<tonic::codec::CompressionEncoding>,
    ) -> IndexingServiceClient {
        let client = IndexingServiceClient::from_channel(
            addr,
            channel,
            max_message_size,
            compression_encoding_opt,
        );
        let inner_client = client.inner;
        self.build_from_inner_client(inner_client)
    }
    pub fn build_from_balance_channel(
        self,
        balance_channel: quickwit_common::tower::BalanceChannel<std::net::SocketAddr>,
        max_message_size: bytesize::ByteSize,
        compression_encoding_opt: Option<tonic::codec::CompressionEncoding>,
    ) -> IndexingServiceClient {
        let client = IndexingServiceClient::from_balance_channel(
            balance_channel,
            max_message_size,
            compression_encoding_opt,
        );
        let inner_client = client.inner;
        self.build_from_inner_client(inner_client)
    }
    pub fn build_from_mailbox<A>(
        self,
        mailbox: quickwit_actors::Mailbox<A>,
    ) -> IndexingServiceClient
    where
        A: quickwit_actors::Actor + std::fmt::Debug + Send + 'static,
        IndexingServiceMailbox<A>: IndexingService,
    {
        let inner_client = InnerIndexingServiceClient(
            std::sync::Arc::new(IndexingServiceMailbox::new(mailbox)),
        );
        self.build_from_inner_client(inner_client)
    }
    #[cfg(any(test, feature = "testsuite"))]
    pub fn build_from_mock(self, mock: MockIndexingService) -> IndexingServiceClient {
        let client = IndexingServiceClient::from_mock(mock);
        let inner_client = client.inner;
        self.build_from_inner_client(inner_client)
    }
    fn build_from_inner_client(
        self,
        inner_client: InnerIndexingServiceClient,
    ) -> IndexingServiceClient {
        let apply_indexing_plan_svc = self
            .apply_indexing_plan_layers
            .into_iter()
            .rev()
            .fold(
                quickwit_common::tower::BoxService::new(inner_client.clone()),
                |svc, layer| layer.layer(svc),
            );
        let tower_svc_stack = IndexingServiceTowerServiceStack {
            inner: inner_client,
            apply_indexing_plan_svc,
        };
        IndexingServiceClient::new(tower_svc_stack)
    }
}
#[derive(Debug, Clone)]
struct MailboxAdapter<A: quickwit_actors::Actor, E> {
    inner: quickwit_actors::Mailbox<A>,
    phantom: std::marker::PhantomData<E>,
}
impl<A, E> std::ops::Deref for MailboxAdapter<A, E>
where
    A: quickwit_actors::Actor,
{
    type Target = quickwit_actors::Mailbox<A>;
    fn deref(&self) -> &Self::Target {
        &self.inner
    }
}
#[derive(Debug)]
pub struct IndexingServiceMailbox<A: quickwit_actors::Actor> {
    inner: MailboxAdapter<A, crate::indexing::IndexingError>,
}
impl<A: quickwit_actors::Actor> IndexingServiceMailbox<A> {
    pub fn new(instance: quickwit_actors::Mailbox<A>) -> Self {
        let inner = MailboxAdapter {
            inner: instance,
            phantom: std::marker::PhantomData,
        };
        Self { inner }
    }
}
impl<A: quickwit_actors::Actor> Clone for IndexingServiceMailbox<A> {
    fn clone(&self) -> Self {
        let inner = MailboxAdapter {
            inner: self.inner.clone(),
            phantom: std::marker::PhantomData,
        };
        Self { inner }
    }
}
impl<A, M, T, E> tower::Service<M> for IndexingServiceMailbox<A>
where
    A: quickwit_actors::Actor
        + quickwit_actors::DeferableReplyHandler<M, Reply = Result<T, E>> + Send
        + 'static,
    M: std::fmt::Debug + Send + 'static,
    T: Send + 'static,
    E: std::fmt::Debug + Send + 'static,
    crate::indexing::IndexingError: From<quickwit_actors::AskError<E>>,
{
    type Response = T;
    type Error = crate::indexing::IndexingError;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        //! This does not work with balance middlewares such as `tower::balance::pool::Pool` because
        //! this always returns `Poll::Ready`. The fix is to acquire a permit from the
        //! mailbox in `poll_ready` and consume it in `call`.
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, message: M) -> Self::Future {
        let mailbox = self.inner.clone();
        let fut = async move {
            mailbox.ask_for_res(message).await.map_err(|error| error.into())
        };
        Box::pin(fut)
    }
}
#[async_trait::async_trait]
impl<A> IndexingService for IndexingServiceMailbox<A>
where
    A: quickwit_actors::Actor + std::fmt::Debug,
    IndexingServiceMailbox<
        A,
    >: tower::Service<
        ApplyIndexingPlanRequest,
        Response = ApplyIndexingPlanResponse,
        Error = crate::indexing::IndexingError,
        Future = BoxFuture<ApplyIndexingPlanResponse, crate::indexing::IndexingError>,
    >,
{
    async fn apply_indexing_plan(
        &self,
        request: ApplyIndexingPlanRequest,
    ) -> crate::indexing::IndexingResult<ApplyIndexingPlanResponse> {
        self.clone().call(request).await
    }
}
#[derive(Debug, Clone)]
pub struct IndexingServiceGrpcClientAdapter<T> {
    inner: T,
    #[allow(dead_code)]
    connection_addrs_rx: tokio::sync::watch::Receiver<
        std::collections::HashSet<std::net::SocketAddr>,
    >,
}
impl<T> IndexingServiceGrpcClientAdapter<T> {
    pub fn new(
        instance: T,
        connection_addrs_rx: tokio::sync::watch::Receiver<
            std::collections::HashSet<std::net::SocketAddr>,
        >,
    ) -> Self {
        Self {
            inner: instance,
            connection_addrs_rx,
        }
    }
}
#[async_trait::async_trait]
impl<T> IndexingService
for IndexingServiceGrpcClientAdapter<
    indexing_service_grpc_client::IndexingServiceGrpcClient<T>,
>
where
    T: tonic::client::GrpcService<tonic::body::Body> + std::fmt::Debug + Clone + Send
        + Sync + 'static,
    T::ResponseBody: tonic::codegen::Body<Data = tonic::codegen::Bytes> + Send + 'static,
    <T::ResponseBody as tonic::codegen::Body>::Error: Into<tonic::codegen::StdError>
        + Send,
    T::Future: Send,
{
    async fn apply_indexing_plan(
        &self,
        request: ApplyIndexingPlanRequest,
    ) -> crate::indexing::IndexingResult<ApplyIndexingPlanResponse> {
        self.inner
            .clone()
            .apply_indexing_plan(request)
            .await
            .map(|response| response.into_inner())
            .map_err(|status| crate::error::grpc_status_to_service_error(
                status,
                ApplyIndexingPlanRequest::rpc_name(),
            ))
    }
}
#[derive(Debug)]
pub struct IndexingServiceGrpcServerAdapter {
    inner: InnerIndexingServiceClient,
}
impl IndexingServiceGrpcServerAdapter {
    pub fn new<T>(instance: T) -> Self
    where
        T: IndexingService,
    {
        Self {
            inner: InnerIndexingServiceClient(std::sync::Arc::new(instance)),
        }
    }
}
#[async_trait::async_trait]
impl indexing_service_grpc_server::IndexingServiceGrpc
for IndexingServiceGrpcServerAdapter {
    async fn apply_indexing_plan(
        &self,
        request: tonic::Request<ApplyIndexingPlanRequest>,
    ) -> Result<tonic::Response<ApplyIndexingPlanResponse>, tonic::Status> {
        self.inner
            .0
            .apply_indexing_plan(request.into_inner())
            .await
            .map(tonic::Response::new)
            .map_err(crate::error::grpc_error_to_grpc_status)
    }
}
/// Generated client implementations.
pub mod indexing_service_grpc_client {
    #![allow(
        unused_variables,
        dead_code,
        missing_docs,
        clippy::wildcard_imports,
        clippy::let_unit_value,
    )]
    use tonic::codegen::*;
    use tonic::codegen::http::Uri;
    #[derive(Debug, Clone)]
    pub struct IndexingServiceGrpcClient<T> {
        inner: tonic::client::Grpc<T>,
    }
    impl IndexingServiceGrpcClient<tonic::transport::Channel> {
        /// Attempt to create a new client by connecting to a given endpoint.
        pub async fn connect<D>(dst: D) -> Result<Self, tonic::transport::Error>
        where
            D: TryInto<tonic::transport::Endpoint>,
            D::Error: Into<StdError>,
        {
            let conn = tonic::transport::Endpoint::new(dst)?.connect().await?;
            Ok(Self::new(conn))
        }
    }
    impl<T> IndexingServiceGrpcClient<T>
    where
        T: tonic::client::GrpcService<tonic::body::Body>,
        T::Error: Into<StdError>,
        T::ResponseBody: Body<Data = Bytes> + std::marker::Send + 'static,
        <T::ResponseBody as Body>::Error: Into<StdError> + std::marker::Send,
    {
        pub fn new(inner: T) -> Self {
            let inner = tonic::client::Grpc::new(inner);
            Self { inner }
        }
        pub fn with_origin(inner: T, origin: Uri) -> Self {
            let inner = tonic::client::Grpc::with_origin(inner, origin);
            Self { inner }
        }
        pub fn with_interceptor<F>(
            inner: T,
            interceptor: F,
        ) -> IndexingServiceGrpcClient<InterceptedService<T, F>>
        where
            F: tonic::service::Interceptor,
            T::ResponseBody: Default,
            T: tonic::codegen::Service<
                http::Request<tonic::body::Body>,
                Response = http::Response<
                    <T as tonic::client::GrpcService<tonic::body::Body>>::ResponseBody,
                >,
            >,
            <T as tonic::codegen::Service<
                http::Request<tonic::body::Body>,
            >>::Error: Into<StdError> + std::marker::Send + std::marker::Sync,
        {
            IndexingServiceGrpcClient::new(InterceptedService::new(inner, interceptor))
        }
        /// Compress requests with the given encoding.
        ///
        /// This requires the server to support it otherwise it might respond with an
        /// error.
        #[must_use]
        pub fn send_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.inner = self.inner.send_compressed(encoding);
            self
        }
        /// Enable decompressing responses.
        #[must_use]
        pub fn accept_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.inner = self.inner.accept_compressed(encoding);
            self
        }
        /// Limits the maximum size of a decoded message.
        ///
        /// Default: `4MB`
        #[must_use]
        pub fn max_decoding_message_size(mut self, limit: usize) -> Self {
            self.inner = self.inner.max_decoding_message_size(limit);
            self
        }
        /// Limits the maximum size of an encoded message.
        ///
        /// Default: `usize::MAX`
        #[must_use]
        pub fn max_encoding_message_size(mut self, limit: usize) -> Self {
            self.inner = self.inner.max_encoding_message_size(limit);
            self
        }
        /// Apply an indexing plan on the node.
        pub async fn apply_indexing_plan(
            &mut self,
            request: impl tonic::IntoRequest<super::ApplyIndexingPlanRequest>,
        ) -> std::result::Result<
            tonic::Response<super::ApplyIndexingPlanResponse>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/quickwit.indexing.IndexingService/ApplyIndexingPlan",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new(
                        "quickwit.indexing.IndexingService",
                        "ApplyIndexingPlan",
                    ),
                );
            self.inner.unary(req, path, codec).await
        }
    }
}
/// Generated server implementations.
pub mod indexing_service_grpc_server {
    #![allow(
        unused_variables,
        dead_code,
        missing_docs,
        clippy::wildcard_imports,
        clippy::let_unit_value,
    )]
    use tonic::codegen::*;
    /// Generated trait containing gRPC methods that should be implemented for use with IndexingServiceGrpcServer.
    #[async_trait]
    pub trait IndexingServiceGrpc: std::marker::Send + std::marker::Sync + 'static {
        /// Apply an indexing plan on the node.
        async fn apply_indexing_plan(
            &self,
            request: tonic::Request<super::ApplyIndexingPlanRequest>,
        ) -> std::result::Result<
            tonic::Response<super::ApplyIndexingPlanResponse>,
            tonic::Status,
        >;
    }
    #[derive(Debug)]
    pub struct IndexingServiceGrpcServer<T> {
        inner: Arc<T>,
        accept_compression_encodings: EnabledCompressionEncodings,
        send_compression_encodings: EnabledCompressionEncodings,
        max_decoding_message_size: Option<usize>,
        max_encoding_message_size: Option<usize>,
    }
    impl<T> IndexingServiceGrpcServer<T> {
        pub fn new(inner: T) -> Self {
            Self::from_arc(Arc::new(inner))
        }
        pub fn from_arc(inner: Arc<T>) -> Self {
            Self {
                inner,
                accept_compression_encodings: Default::default(),
                send_compression_encodings: Default::default(),
                max_decoding_message_size: None,
                max_encoding_message_size: None,
            }
        }
        pub fn with_interceptor<F>(
            inner: T,
            interceptor: F,
        ) -> InterceptedService<Self, F>
        where
            F: tonic::service::Interceptor,
        {
            InterceptedService::new(Self::new(inner), interceptor)
        }
        /// Enable decompressing requests with the given encoding.
        #[must_use]
        pub fn accept_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.accept_compression_encodings.enable(encoding);
            self
        }
        /// Compress responses with the given encoding, if the client supports it.
        #[must_use]
        pub fn send_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.send_compression_encodings.enable(encoding);
            self
        }
        /// Limits the maximum size of a decoded message.
        ///
        /// Default: `4MB`
        #[must_use]
        pub fn max_decoding_message_size(mut self, limit: usize) -> Self {
            self.max_decoding_message_size = Some(limit);
            self
        }
        /// Limits the maximum size of an encoded message.
        ///
        /// Default: `usize::MAX`
        #[must_use]
        pub fn max_encoding_message_size(mut self, limit: usize) -> Self {
            self.max_encoding_message_size = Some(limit);
            self
        }
    }
    impl<T, B> tonic::codegen::Service<http::Request<B>> for IndexingServiceGrpcServer<T>
    where
        T: IndexingServiceGrpc,
        B: Body + std::marker::Send + 'static,
        B::Error: Into<StdError> + std::marker::Send + 'static,
    {
        type Response = http::Response<tonic::body::Body>;
        type Error = std::convert::Infallible;
        type Future = BoxFuture<Self::Response, Self::Error>;
        fn poll_ready(
            &mut self,
            _cx: &mut Context<'_>,
        ) -> Poll<std::result::Result<(), Self::Error>> {
            Poll::Ready(Ok(()))
        }
        fn call(&mut self, req: http::Request<B>) -> Self::Future {
            match req.uri().path() {
                "/quickwit.indexing.IndexingService/ApplyIndexingPlan" => {
                    #[allow(non_camel_case_types)]
                    struct ApplyIndexingPlanSvc<T: IndexingServiceGrpc>(pub Arc<T>);
                    impl<
                        T: IndexingServiceGrpc,
                    > tonic::server::UnaryService<super::ApplyIndexingPlanRequest>
                    for ApplyIndexingPlanSvc<T> {
                        type Response = super::ApplyIndexingPlanResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::ApplyIndexingPlanRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as IndexingServiceGrpc>::apply_indexing_plan(
                                        &inner,
                                        request,
                                    )
                                    .await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = ApplyIndexingPlanSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                _ => {
                    Box::pin(async move {
                        let mut response = http::Response::new(
                            tonic::body::Body::default(),
                        );
                        let headers = response.headers_mut();
                        headers
                            .insert(
                                tonic::Status::GRPC_STATUS,
                                (tonic::Code::Unimplemented as i32).into(),
                            );
                        headers
                            .insert(
                                http::header::CONTENT_TYPE,
                                tonic::metadata::GRPC_CONTENT_TYPE,
                            );
                        Ok(response)
                    })
                }
            }
        }
    }
    impl<T> Clone for IndexingServiceGrpcServer<T> {
        fn clone(&self) -> Self {
            let inner = self.inner.clone();
            Self {
                inner,
                accept_compression_encodings: self.accept_compression_encodings,
                send_compression_encodings: self.send_compression_encodings,
                max_decoding_message_size: self.max_decoding_message_size,
                max_encoding_message_size: self.max_encoding_message_size,
            }
        }
    }
    /// Generated gRPC service name
    pub const SERVICE_NAME: &str = "quickwit.indexing.IndexingService";
    impl<T> tonic::server::NamedService for IndexingServiceGrpcServer<T> {
        const NAME: &'static str = SERVICE_NAME;
    }
}


================================================
FILE: quickwit/quickwit-proto/src/codegen/quickwit/quickwit.ingest.ingester.rs
================================================
// This file is @generated by prost-build.
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct RetainShardsForSource {
    #[prost(message, optional, tag = "1")]
    pub index_uid: ::core::option::Option<crate::types::IndexUid>,
    #[prost(string, tag = "2")]
    pub source_id: ::prost::alloc::string::String,
    #[prost(message, repeated, tag = "3")]
    pub shard_ids: ::prost::alloc::vec::Vec<crate::types::ShardId>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct RetainShardsRequest {
    #[prost(message, repeated, tag = "1")]
    pub retain_shards_for_sources: ::prost::alloc::vec::Vec<RetainShardsForSource>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, Copy, PartialEq, Eq, Hash, ::prost::Message)]
pub struct RetainShardsResponse {}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct PersistRequest {
    #[prost(string, tag = "1")]
    pub leader_id: ::prost::alloc::string::String,
    #[prost(enumeration = "super::CommitTypeV2", tag = "3")]
    pub commit_type: i32,
    #[prost(message, repeated, tag = "4")]
    pub subrequests: ::prost::alloc::vec::Vec<PersistSubrequest>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct PersistSubrequest {
    #[prost(uint32, tag = "1")]
    pub subrequest_id: u32,
    #[prost(message, optional, tag = "2")]
    pub index_uid: ::core::option::Option<crate::types::IndexUid>,
    #[prost(string, tag = "3")]
    pub source_id: ::prost::alloc::string::String,
    #[prost(message, optional, tag = "5")]
    pub doc_batch: ::core::option::Option<super::DocBatchV2>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct PersistResponse {
    #[prost(string, tag = "1")]
    pub leader_id: ::prost::alloc::string::String,
    #[prost(message, repeated, tag = "2")]
    pub successes: ::prost::alloc::vec::Vec<PersistSuccess>,
    #[prost(message, repeated, tag = "3")]
    pub failures: ::prost::alloc::vec::Vec<PersistFailure>,
    #[prost(message, optional, tag = "4")]
    pub routing_update: ::core::option::Option<RoutingUpdate>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct RoutingUpdate {
    #[prost(uint32, tag = "1")]
    pub capacity_score: u32,
    #[prost(message, repeated, tag = "2")]
    pub source_shard_updates: ::prost::alloc::vec::Vec<SourceShardUpdate>,
    #[prost(message, repeated, tag = "3")]
    pub closed_shards: ::prost::alloc::vec::Vec<super::ShardIds>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct SourceShardUpdate {
    #[prost(message, optional, tag = "1")]
    pub index_uid: ::core::option::Option<crate::types::IndexUid>,
    #[prost(string, tag = "2")]
    pub source_id: ::prost::alloc::string::String,
    #[prost(uint32, tag = "3")]
    pub open_shard_count: u32,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct PersistSuccess {
    #[prost(uint32, tag = "1")]
    pub subrequest_id: u32,
    #[prost(message, optional, tag = "2")]
    pub index_uid: ::core::option::Option<crate::types::IndexUid>,
    #[prost(string, tag = "3")]
    pub source_id: ::prost::alloc::string::String,
    #[prost(message, optional, tag = "4")]
    pub shard_id: ::core::option::Option<crate::types::ShardId>,
    #[prost(message, optional, tag = "5")]
    pub replication_position_inclusive: ::core::option::Option<crate::types::Position>,
    #[prost(uint32, tag = "6")]
    pub num_persisted_docs: u32,
    #[prost(message, repeated, tag = "7")]
    pub parse_failures: ::prost::alloc::vec::Vec<super::ParseFailure>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct PersistFailure {
    #[prost(uint32, tag = "1")]
    pub subrequest_id: u32,
    #[prost(message, optional, tag = "2")]
    pub index_uid: ::core::option::Option<crate::types::IndexUid>,
    #[prost(string, tag = "3")]
    pub source_id: ::prost::alloc::string::String,
    #[prost(enumeration = "PersistFailureReason", tag = "5")]
    pub reason: i32,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct SynReplicationMessage {
    #[prost(oneof = "syn_replication_message::Message", tags = "1, 2, 3")]
    pub message: ::core::option::Option<syn_replication_message::Message>,
}
/// Nested message and enum types in `SynReplicationMessage`.
pub mod syn_replication_message {
    #[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
    #[serde(rename_all = "snake_case")]
    #[derive(Clone, PartialEq, ::prost::Oneof)]
    pub enum Message {
        #[prost(message, tag = "1")]
        OpenRequest(super::OpenReplicationStreamRequest),
        #[prost(message, tag = "2")]
        InitRequest(super::InitReplicaRequest),
        #[prost(message, tag = "3")]
        ReplicateRequest(super::ReplicateRequest),
    }
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct AckReplicationMessage {
    #[prost(oneof = "ack_replication_message::Message", tags = "1, 2, 3")]
    pub message: ::core::option::Option<ack_replication_message::Message>,
}
/// Nested message and enum types in `AckReplicationMessage`.
pub mod ack_replication_message {
    #[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
    #[serde(rename_all = "snake_case")]
    #[derive(Clone, PartialEq, ::prost::Oneof)]
    pub enum Message {
        #[prost(message, tag = "1")]
        OpenResponse(super::OpenReplicationStreamResponse),
        #[prost(message, tag = "2")]
        InitResponse(super::InitReplicaResponse),
        #[prost(message, tag = "3")]
        ReplicateResponse(super::ReplicateResponse),
    }
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct OpenReplicationStreamRequest {
    #[prost(string, tag = "1")]
    pub leader_id: ::prost::alloc::string::String,
    #[prost(string, tag = "2")]
    pub follower_id: ::prost::alloc::string::String,
    /// Position of the request in the replication stream.
    #[prost(uint64, tag = "3")]
    pub replication_seqno: u64,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, Copy, PartialEq, Eq, Hash, ::prost::Message)]
pub struct OpenReplicationStreamResponse {
    /// Position of the response in the replication stream. It should match the position of the request.
    #[prost(uint64, tag = "1")]
    pub replication_seqno: u64,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct InitReplicaRequest {
    #[prost(message, optional, tag = "1")]
    pub replica_shard: ::core::option::Option<super::Shard>,
    #[prost(uint64, tag = "2")]
    pub replication_seqno: u64,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, Copy, PartialEq, Eq, Hash, ::prost::Message)]
pub struct InitReplicaResponse {
    #[prost(uint64, tag = "1")]
    pub replication_seqno: u64,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct ReplicateRequest {
    #[prost(string, tag = "1")]
    pub leader_id: ::prost::alloc::string::String,
    #[prost(string, tag = "2")]
    pub follower_id: ::prost::alloc::string::String,
    #[prost(enumeration = "super::CommitTypeV2", tag = "3")]
    pub commit_type: i32,
    #[prost(message, repeated, tag = "4")]
    pub subrequests: ::prost::alloc::vec::Vec<ReplicateSubrequest>,
    /// Position of the request in the replication stream.
    #[prost(uint64, tag = "5")]
    pub replication_seqno: u64,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct ReplicateSubrequest {
    #[prost(uint32, tag = "1")]
    pub subrequest_id: u32,
    #[prost(message, optional, tag = "2")]
    pub index_uid: ::core::option::Option<crate::types::IndexUid>,
    #[prost(string, tag = "3")]
    pub source_id: ::prost::alloc::string::String,
    #[prost(message, optional, tag = "4")]
    pub shard_id: ::core::option::Option<crate::types::ShardId>,
    #[prost(message, optional, tag = "5")]
    pub from_position_exclusive: ::core::option::Option<crate::types::Position>,
    #[prost(message, optional, tag = "6")]
    pub doc_batch: ::core::option::Option<super::DocBatchV2>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct ReplicateResponse {
    #[prost(string, tag = "1")]
    pub follower_id: ::prost::alloc::string::String,
    #[prost(message, repeated, tag = "2")]
    pub successes: ::prost::alloc::vec::Vec<ReplicateSuccess>,
    #[prost(message, repeated, tag = "3")]
    pub failures: ::prost::alloc::vec::Vec<ReplicateFailure>,
    /// Position of the response in the replication stream. It should match the position of the request.
    #[prost(uint64, tag = "4")]
    pub replication_seqno: u64,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct ReplicateSuccess {
    #[prost(uint32, tag = "1")]
    pub subrequest_id: u32,
    #[prost(message, optional, tag = "2")]
    pub index_uid: ::core::option::Option<crate::types::IndexUid>,
    #[prost(string, tag = "3")]
    pub source_id: ::prost::alloc::string::String,
    #[prost(message, optional, tag = "4")]
    pub shard_id: ::core::option::Option<crate::types::ShardId>,
    #[prost(message, optional, tag = "5")]
    pub replication_position_inclusive: ::core::option::Option<crate::types::Position>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct ReplicateFailure {
    #[prost(uint32, tag = "1")]
    pub subrequest_id: u32,
    #[prost(message, optional, tag = "2")]
    pub index_uid: ::core::option::Option<crate::types::IndexUid>,
    #[prost(string, tag = "3")]
    pub source_id: ::prost::alloc::string::String,
    #[prost(message, optional, tag = "4")]
    pub shard_id: ::core::option::Option<crate::types::ShardId>,
    #[prost(enumeration = "ReplicateFailureReason", tag = "5")]
    pub reason: i32,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct TruncateShardsRequest {
    #[prost(string, tag = "1")]
    pub ingester_id: ::prost::alloc::string::String,
    #[prost(message, repeated, tag = "2")]
    pub subrequests: ::prost::alloc::vec::Vec<TruncateShardsSubrequest>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct TruncateShardsSubrequest {
    #[prost(message, optional, tag = "1")]
    pub index_uid: ::core::option::Option<crate::types::IndexUid>,
    #[prost(string, tag = "2")]
    pub source_id: ::prost::alloc::string::String,
    #[prost(message, optional, tag = "3")]
    pub shard_id: ::core::option::Option<crate::types::ShardId>,
    /// The position up to which the shard should be truncated (inclusive).
    #[prost(message, optional, tag = "4")]
    pub truncate_up_to_position_inclusive: ::core::option::Option<
        crate::types::Position,
    >,
}
/// TODO
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, Copy, PartialEq, Eq, Hash, ::prost::Message)]
pub struct TruncateShardsResponse {}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct OpenFetchStreamRequest {
    #[prost(string, tag = "1")]
    pub client_id: ::prost::alloc::string::String,
    #[prost(message, optional, tag = "2")]
    pub index_uid: ::core::option::Option<crate::types::IndexUid>,
    #[prost(string, tag = "3")]
    pub source_id: ::prost::alloc::string::String,
    #[prost(message, optional, tag = "4")]
    pub shard_id: ::core::option::Option<crate::types::ShardId>,
    #[prost(message, optional, tag = "5")]
    pub from_position_exclusive: ::core::option::Option<crate::types::Position>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct FetchMessage {
    #[prost(oneof = "fetch_message::Message", tags = "1, 2")]
    pub message: ::core::option::Option<fetch_message::Message>,
}
/// Nested message and enum types in `FetchMessage`.
pub mod fetch_message {
    #[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
    #[serde(rename_all = "snake_case")]
    #[derive(Clone, PartialEq, Eq, Hash, ::prost::Oneof)]
    pub enum Message {
        #[prost(message, tag = "1")]
        Payload(super::FetchPayload),
        #[prost(message, tag = "2")]
        Eof(super::FetchEof),
    }
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct FetchPayload {
    #[prost(message, optional, tag = "1")]
    pub index_uid: ::core::option::Option<crate::types::IndexUid>,
    #[prost(string, tag = "2")]
    pub source_id: ::prost::alloc::string::String,
    #[prost(message, optional, tag = "3")]
    pub shard_id: ::core::option::Option<crate::types::ShardId>,
    #[prost(message, optional, tag = "4")]
    pub mrecord_batch: ::core::option::Option<super::MRecordBatch>,
    #[prost(message, optional, tag = "5")]
    pub from_position_exclusive: ::core::option::Option<crate::types::Position>,
    #[prost(message, optional, tag = "6")]
    pub to_position_inclusive: ::core::option::Option<crate::types::Position>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct FetchEof {
    #[prost(message, optional, tag = "1")]
    pub index_uid: ::core::option::Option<crate::types::IndexUid>,
    #[prost(string, tag = "2")]
    pub source_id: ::prost::alloc::string::String,
    #[prost(message, optional, tag = "3")]
    pub shard_id: ::core::option::Option<crate::types::ShardId>,
    #[prost(message, optional, tag = "4")]
    pub eof_position: ::core::option::Option<crate::types::Position>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct InitShardsRequest {
    #[prost(message, repeated, tag = "2")]
    pub subrequests: ::prost::alloc::vec::Vec<InitShardSubrequest>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct InitShardSubrequest {
    #[prost(uint32, tag = "1")]
    pub subrequest_id: u32,
    #[prost(message, optional, tag = "2")]
    pub shard: ::core::option::Option<super::Shard>,
    #[prost(string, tag = "3")]
    pub doc_mapping_json: ::prost::alloc::string::String,
    #[prost(bool, tag = "4")]
    pub validate_docs: bool,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct InitShardsResponse {
    #[prost(message, repeated, tag = "1")]
    pub successes: ::prost::alloc::vec::Vec<InitShardSuccess>,
    #[prost(message, repeated, tag = "2")]
    pub failures: ::prost::alloc::vec::Vec<InitShardFailure>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct InitShardSuccess {
    #[prost(uint32, tag = "1")]
    pub subrequest_id: u32,
    #[prost(message, optional, tag = "2")]
    pub shard: ::core::option::Option<super::Shard>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct InitShardFailure {
    #[prost(uint32, tag = "1")]
    pub subrequest_id: u32,
    #[prost(message, optional, tag = "2")]
    pub index_uid: ::core::option::Option<crate::types::IndexUid>,
    #[prost(string, tag = "3")]
    pub source_id: ::prost::alloc::string::String,
    /// InitShardFailureReason reason = 5;
    #[prost(message, optional, tag = "4")]
    pub shard_id: ::core::option::Option<crate::types::ShardId>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct CloseShardsRequest {
    #[prost(message, repeated, tag = "2")]
    pub shard_pkeys: ::prost::alloc::vec::Vec<super::ShardPKey>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct CloseShardsResponse {
    #[prost(message, repeated, tag = "1")]
    pub successes: ::prost::alloc::vec::Vec<super::ShardPKey>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, Copy, PartialEq, Eq, Hash, ::prost::Message)]
pub struct DecommissionRequest {}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, Copy, PartialEq, Eq, Hash, ::prost::Message)]
pub struct DecommissionResponse {}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, Copy, PartialEq, Eq, Hash, ::prost::Message)]
pub struct OpenObservationStreamRequest {}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct ObservationMessage {
    #[prost(string, tag = "1")]
    pub node_id: ::prost::alloc::string::String,
    #[prost(enumeration = "IngesterStatus", tag = "2")]
    pub status: i32,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[serde(rename_all = "snake_case")]
#[derive(Clone, Copy, Debug, PartialEq, Eq, Hash, PartialOrd, Ord, ::prost::Enumeration)]
#[repr(i32)]
pub enum PersistFailureReason {
    Unspecified = 0,
    WalFull = 4,
    Timeout = 5,
    NoShardsAvailable = 6,
    NodeUnavailable = 7,
}
impl PersistFailureReason {
    /// String value of the enum field names used in the ProtoBuf definition.
    ///
    /// The values are not transformed in any way and thus are considered stable
    /// (if the ProtoBuf definition does not change) and safe for programmatic use.
    pub fn as_str_name(&self) -> &'static str {
        match self {
            Self::Unspecified => "PERSIST_FAILURE_REASON_UNSPECIFIED",
            Self::WalFull => "PERSIST_FAILURE_REASON_WAL_FULL",
            Self::Timeout => "PERSIST_FAILURE_REASON_TIMEOUT",
            Self::NoShardsAvailable => "PERSIST_FAILURE_REASON_NO_SHARDS_AVAILABLE",
            Self::NodeUnavailable => "PERSIST_FAILURE_REASON_NODE_UNAVAILABLE",
        }
    }
    /// Creates an enum from field names used in the ProtoBuf definition.
    pub fn from_str_name(value: &str) -> ::core::option::Option<Self> {
        match value {
            "PERSIST_FAILURE_REASON_UNSPECIFIED" => Some(Self::Unspecified),
            "PERSIST_FAILURE_REASON_WAL_FULL" => Some(Self::WalFull),
            "PERSIST_FAILURE_REASON_TIMEOUT" => Some(Self::Timeout),
            "PERSIST_FAILURE_REASON_NO_SHARDS_AVAILABLE" => Some(Self::NoShardsAvailable),
            "PERSIST_FAILURE_REASON_NODE_UNAVAILABLE" => Some(Self::NodeUnavailable),
            _ => None,
        }
    }
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[serde(rename_all = "snake_case")]
#[derive(Clone, Copy, Debug, PartialEq, Eq, Hash, PartialOrd, Ord, ::prost::Enumeration)]
#[repr(i32)]
pub enum ReplicateFailureReason {
    Unspecified = 0,
    ShardNotFound = 1,
    ShardClosed = 2,
    WalFull = 4,
}
impl ReplicateFailureReason {
    /// String value of the enum field names used in the ProtoBuf definition.
    ///
    /// The values are not transformed in any way and thus are considered stable
    /// (if the ProtoBuf definition does not change) and safe for programmatic use.
    pub fn as_str_name(&self) -> &'static str {
        match self {
            Self::Unspecified => "REPLICATE_FAILURE_REASON_UNSPECIFIED",
            Self::ShardNotFound => "REPLICATE_FAILURE_REASON_SHARD_NOT_FOUND",
            Self::ShardClosed => "REPLICATE_FAILURE_REASON_SHARD_CLOSED",
            Self::WalFull => "REPLICATE_FAILURE_REASON_WAL_FULL",
        }
    }
    /// Creates an enum from field names used in the ProtoBuf definition.
    pub fn from_str_name(value: &str) -> ::core::option::Option<Self> {
        match value {
            "REPLICATE_FAILURE_REASON_UNSPECIFIED" => Some(Self::Unspecified),
            "REPLICATE_FAILURE_REASON_SHARD_NOT_FOUND" => Some(Self::ShardNotFound),
            "REPLICATE_FAILURE_REASON_SHARD_CLOSED" => Some(Self::ShardClosed),
            "REPLICATE_FAILURE_REASON_WAL_FULL" => Some(Self::WalFull),
            _ => None,
        }
    }
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[serde(rename_all = "snake_case")]
#[derive(Clone, Copy, Debug, PartialEq, Eq, Hash, PartialOrd, Ord, ::prost::Enumeration)]
#[repr(i32)]
pub enum IngesterStatus {
    Unspecified = 0,
    /// The ingester is live but not ready yet to accept requests.
    Initializing = 1,
    /// The ingester is ready and accepts read and write requests.
    Ready = 2,
    /// The ingester is about to be decommissioned. It still accepts read and write requests, but will not accept write requests in a few seconds and should be avoided by future write requests.
    Retiring = 6,
    /// The ingester is being decommissioned. It accepts read requests but rejects write requests
    /// (open shards, persist, and replicate requests). It will transition to `Decommissioned` once
    /// all shards are fully indexed.
    Decommissioning = 3,
    /// The ingester no longer accepts read and write requests. It does not hold any data and can
    /// be safely removed from the cluster.
    Decommissioned = 4,
    /// The ingester failed to initialize and is not ready to accept requests.
    Failed = 5,
}
impl IngesterStatus {
    /// String value of the enum field names used in the ProtoBuf definition.
    ///
    /// The values are not transformed in any way and thus are considered stable
    /// (if the ProtoBuf definition does not change) and safe for programmatic use.
    pub fn as_str_name(&self) -> &'static str {
        match self {
            Self::Unspecified => "INGESTER_STATUS_UNSPECIFIED",
            Self::Initializing => "INGESTER_STATUS_INITIALIZING",
            Self::Ready => "INGESTER_STATUS_READY",
            Self::Retiring => "INGESTER_STATUS_RETIRING",
            Self::Decommissioning => "INGESTER_STATUS_DECOMMISSIONING",
            Self::Decommissioned => "INGESTER_STATUS_DECOMMISSIONED",
            Self::Failed => "INGESTER_STATUS_FAILED",
        }
    }
    /// Creates an enum from field names used in the ProtoBuf definition.
    pub fn from_str_name(value: &str) -> ::core::option::Option<Self> {
        match value {
            "INGESTER_STATUS_UNSPECIFIED" => Some(Self::Unspecified),
            "INGESTER_STATUS_INITIALIZING" => Some(Self::Initializing),
            "INGESTER_STATUS_READY" => Some(Self::Ready),
            "INGESTER_STATUS_RETIRING" => Some(Self::Retiring),
            "INGESTER_STATUS_DECOMMISSIONING" => Some(Self::Decommissioning),
            "INGESTER_STATUS_DECOMMISSIONED" => Some(Self::Decommissioned),
            "INGESTER_STATUS_FAILED" => Some(Self::Failed),
            _ => None,
        }
    }
}
/// BEGIN quickwit-codegen
#[allow(unused_imports)]
use std::str::FromStr;
use tower::{Layer, Service, ServiceExt};
use quickwit_common::tower::RpcName;
impl RpcName for PersistRequest {
    fn rpc_name() -> &'static str {
        "persist"
    }
}
impl RpcName for SynReplicationMessage {
    fn rpc_name() -> &'static str {
        "open_replication_stream"
    }
}
impl RpcName for OpenFetchStreamRequest {
    fn rpc_name() -> &'static str {
        "open_fetch_stream"
    }
}
impl RpcName for OpenObservationStreamRequest {
    fn rpc_name() -> &'static str {
        "open_observation_stream"
    }
}
impl RpcName for InitShardsRequest {
    fn rpc_name() -> &'static str {
        "init_shards"
    }
}
impl RpcName for RetainShardsRequest {
    fn rpc_name() -> &'static str {
        "retain_shards"
    }
}
impl RpcName for TruncateShardsRequest {
    fn rpc_name() -> &'static str {
        "truncate_shards"
    }
}
impl RpcName for CloseShardsRequest {
    fn rpc_name() -> &'static str {
        "close_shards"
    }
}
impl RpcName for DecommissionRequest {
    fn rpc_name() -> &'static str {
        "decommission"
    }
}
pub type IngesterServiceStream<T> = quickwit_common::ServiceStream<
    crate::ingest::IngestV2Result<T>,
>;
#[cfg_attr(any(test, feature = "testsuite"), mockall::automock)]
#[async_trait::async_trait]
pub trait IngesterService: std::fmt::Debug + Send + Sync + 'static {
    ///Persists batches of documents to primary shards hosted on a leader.
    async fn persist(
        &self,
        request: PersistRequest,
    ) -> crate::ingest::IngestV2Result<PersistResponse>;
    ///Opens a replication stream from a leader to a follower.
    async fn open_replication_stream(
        &self,
        request: quickwit_common::ServiceStream<SynReplicationMessage>,
    ) -> crate::ingest::IngestV2Result<IngesterServiceStream<AckReplicationMessage>>;
    ///Streams records from a leader or a follower. The client can optionally specify a range of positions to fetch,
    ///otherwise the stream will go indefinitely or until the shard is closed.
    async fn open_fetch_stream(
        &self,
        request: OpenFetchStreamRequest,
    ) -> crate::ingest::IngestV2Result<IngesterServiceStream<FetchMessage>>;
    ///Streams status updates, called "observations", from an ingester.
    async fn open_observation_stream(
        &self,
        request: OpenObservationStreamRequest,
    ) -> crate::ingest::IngestV2Result<IngesterServiceStream<ObservationMessage>>;
    ///Creates and initializes a set of newly opened shards. This RPC is called by the control plane on leaders.
    async fn init_shards(
        &self,
        request: InitShardsRequest,
    ) -> crate::ingest::IngestV2Result<InitShardsResponse>;
    ///Only retain the shards that are listed in the request.
    ///Other shards are deleted.
    async fn retain_shards(
        &self,
        request: RetainShardsRequest,
    ) -> crate::ingest::IngestV2Result<RetainShardsResponse>;
    ///Truncates a set of shards at the given positions. This RPC is called by indexers on leaders AND followers.
    async fn truncate_shards(
        &self,
        request: TruncateShardsRequest,
    ) -> crate::ingest::IngestV2Result<TruncateShardsResponse>;
    ///Closes a set of shards. This RPC is called by the control plane.
    async fn close_shards(
        &self,
        request: CloseShardsRequest,
    ) -> crate::ingest::IngestV2Result<CloseShardsResponse>;
    ///Decommissions the ingester.
    async fn decommission(
        &self,
        request: DecommissionRequest,
    ) -> crate::ingest::IngestV2Result<DecommissionResponse>;
}
#[derive(Debug, Clone)]
pub struct IngesterServiceClient {
    inner: InnerIngesterServiceClient,
}
#[derive(Debug, Clone)]
struct InnerIngesterServiceClient(std::sync::Arc<dyn IngesterService>);
impl IngesterServiceClient {
    pub fn new<T>(instance: T) -> Self
    where
        T: IngesterService,
    {
        #[cfg(any(test, feature = "testsuite"))]
        assert!(
            std::any::TypeId::of:: < T > () != std::any::TypeId::of:: <
            MockIngesterService > (),
            "`MockIngesterService` must be wrapped in a `MockIngesterServiceWrapper`: use `IngesterServiceClient::from_mock(mock)` to instantiate the client"
        );
        Self {
            inner: InnerIngesterServiceClient(std::sync::Arc::new(instance)),
        }
    }
    pub fn as_grpc_service(
        &self,
        max_message_size: bytesize::ByteSize,
    ) -> ingester_service_grpc_server::IngesterServiceGrpcServer<
        IngesterServiceGrpcServerAdapter,
    > {
        let adapter = IngesterServiceGrpcServerAdapter::new(self.clone());
        ingester_service_grpc_server::IngesterServiceGrpcServer::new(adapter)
            .accept_compressed(tonic::codec::CompressionEncoding::Gzip)
            .accept_compressed(tonic::codec::CompressionEncoding::Zstd)
            .send_compressed(tonic::codec::CompressionEncoding::Gzip)
            .send_compressed(tonic::codec::CompressionEncoding::Zstd)
            .max_decoding_message_size(max_message_size.0 as usize)
            .max_encoding_message_size(max_message_size.0 as usize)
    }
    pub fn from_channel(
        addr: std::net::SocketAddr,
        channel: tonic::transport::Channel,
        max_message_size: bytesize::ByteSize,
        compression_encoding_opt: Option<tonic::codec::CompressionEncoding>,
    ) -> Self {
        let (_, connection_keys_watcher) = tokio::sync::watch::channel(
            std::collections::HashSet::from_iter([addr]),
        );
        let mut client = ingester_service_grpc_client::IngesterServiceGrpcClient::new(
                channel,
            )
            .max_decoding_message_size(max_message_size.0 as usize)
            .max_encoding_message_size(max_message_size.0 as usize);
        if let Some(compression_encoding) = compression_encoding_opt {
            client = client
                .accept_compressed(compression_encoding)
                .send_compressed(compression_encoding);
        }
        let adapter = IngesterServiceGrpcClientAdapter::new(
            client,
            connection_keys_watcher,
        );
        Self::new(adapter)
    }
    pub fn from_balance_channel(
        balance_channel: quickwit_common::tower::BalanceChannel<std::net::SocketAddr>,
        max_message_size: bytesize::ByteSize,
        compression_encoding_opt: Option<tonic::codec::CompressionEncoding>,
    ) -> IngesterServiceClient {
        let connection_keys_watcher = balance_channel.connection_keys_watcher();
        let mut client = ingester_service_grpc_client::IngesterServiceGrpcClient::new(
                balance_channel,
            )
            .max_decoding_message_size(max_message_size.0 as usize)
            .max_encoding_message_size(max_message_size.0 as usize);
        if let Some(compression_encoding) = compression_encoding_opt {
            client = client
                .accept_compressed(compression_encoding)
                .send_compressed(compression_encoding);
        }
        let adapter = IngesterServiceGrpcClientAdapter::new(
            client,
            connection_keys_watcher,
        );
        Self::new(adapter)
    }
    pub fn from_mailbox<A>(mailbox: quickwit_actors::Mailbox<A>) -> Self
    where
        A: quickwit_actors::Actor + std::fmt::Debug + Send + 'static,
        IngesterServiceMailbox<A>: IngesterService,
    {
        IngesterServiceClient::new(IngesterServiceMailbox::new(mailbox))
    }
    pub fn tower() -> IngesterServiceTowerLayerStack {
        IngesterServiceTowerLayerStack::default()
    }
    #[cfg(any(test, feature = "testsuite"))]
    pub fn from_mock(mock: MockIngesterService) -> Self {
        let mock_wrapper = mock_ingester_service::MockIngesterServiceWrapper {
            inner: tokio::sync::Mutex::new(mock),
        };
        Self::new(mock_wrapper)
    }
    #[cfg(any(test, feature = "testsuite"))]
    pub fn mocked() -> Self {
        Self::from_mock(MockIngesterService::new())
    }
}
#[async_trait::async_trait]
impl IngesterService for IngesterServiceClient {
    async fn persist(
        &self,
        request: PersistRequest,
    ) -> crate::ingest::IngestV2Result<PersistResponse> {
        self.inner.0.persist(request).await
    }
    async fn open_replication_stream(
        &self,
        request: quickwit_common::ServiceStream<SynReplicationMessage>,
    ) -> crate::ingest::IngestV2Result<IngesterServiceStream<AckReplicationMessage>> {
        self.inner.0.open_replication_stream(request).await
    }
    async fn open_fetch_stream(
        &self,
        request: OpenFetchStreamRequest,
    ) -> crate::ingest::IngestV2Result<IngesterServiceStream<FetchMessage>> {
        self.inner.0.open_fetch_stream(request).await
    }
    async fn open_observation_stream(
        &self,
        request: OpenObservationStreamRequest,
    ) -> crate::ingest::IngestV2Result<IngesterServiceStream<ObservationMessage>> {
        self.inner.0.open_observation_stream(request).await
    }
    async fn init_shards(
        &self,
        request: InitShardsRequest,
    ) -> crate::ingest::IngestV2Result<InitShardsResponse> {
        self.inner.0.init_shards(request).await
    }
    async fn retain_shards(
        &self,
        request: RetainShardsRequest,
    ) -> crate::ingest::IngestV2Result<RetainShardsResponse> {
        self.inner.0.retain_shards(request).await
    }
    async fn truncate_shards(
        &self,
        request: TruncateShardsRequest,
    ) -> crate::ingest::IngestV2Result<TruncateShardsResponse> {
        self.inner.0.truncate_shards(request).await
    }
    async fn close_shards(
        &self,
        request: CloseShardsRequest,
    ) -> crate::ingest::IngestV2Result<CloseShardsResponse> {
        self.inner.0.close_shards(request).await
    }
    async fn decommission(
        &self,
        request: DecommissionRequest,
    ) -> crate::ingest::IngestV2Result<DecommissionResponse> {
        self.inner.0.decommission(request).await
    }
}
#[cfg(any(test, feature = "testsuite"))]
pub mod mock_ingester_service {
    use super::*;
    #[derive(Debug)]
    pub struct MockIngesterServiceWrapper {
        pub(super) inner: tokio::sync::Mutex<MockIngesterService>,
    }
    #[async_trait::async_trait]
    impl IngesterService for MockIngesterServiceWrapper {
        async fn persist(
            &self,
            request: super::PersistRequest,
        ) -> crate::ingest::IngestV2Result<super::PersistResponse> {
            self.inner.lock().await.persist(request).await
        }
        async fn open_replication_stream(
            &self,
            request: quickwit_common::ServiceStream<super::SynReplicationMessage>,
        ) -> crate::ingest::IngestV2Result<
            IngesterServiceStream<super::AckReplicationMessage>,
        > {
            self.inner.lock().await.open_replication_stream(request).await
        }
        async fn open_fetch_stream(
            &self,
            request: super::OpenFetchStreamRequest,
        ) -> crate::ingest::IngestV2Result<IngesterServiceStream<super::FetchMessage>> {
            self.inner.lock().await.open_fetch_stream(request).await
        }
        async fn open_observation_stream(
            &self,
            request: super::OpenObservationStreamRequest,
        ) -> crate::ingest::IngestV2Result<
            IngesterServiceStream<super::ObservationMessage>,
        > {
            self.inner.lock().await.open_observation_stream(request).await
        }
        async fn init_shards(
            &self,
            request: super::InitShardsRequest,
        ) -> crate::ingest::IngestV2Result<super::InitShardsResponse> {
            self.inner.lock().await.init_shards(request).await
        }
        async fn retain_shards(
            &self,
            request: super::RetainShardsRequest,
        ) -> crate::ingest::IngestV2Result<super::RetainShardsResponse> {
            self.inner.lock().await.retain_shards(request).await
        }
        async fn truncate_shards(
            &self,
            request: super::TruncateShardsRequest,
        ) -> crate::ingest::IngestV2Result<super::TruncateShardsResponse> {
            self.inner.lock().await.truncate_shards(request).await
        }
        async fn close_shards(
            &self,
            request: super::CloseShardsRequest,
        ) -> crate::ingest::IngestV2Result<super::CloseShardsResponse> {
            self.inner.lock().await.close_shards(request).await
        }
        async fn decommission(
            &self,
            request: super::DecommissionRequest,
        ) -> crate::ingest::IngestV2Result<super::DecommissionResponse> {
            self.inner.lock().await.decommission(request).await
        }
    }
}
pub type BoxFuture<T, E> = std::pin::Pin<
    Box<dyn std::future::Future<Output = Result<T, E>> + Send + 'static>,
>;
impl tower::Service<PersistRequest> for InnerIngesterServiceClient {
    type Response = PersistResponse;
    type Error = crate::ingest::IngestV2Error;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, request: PersistRequest) -> Self::Future {
        let svc = self.clone();
        let fut = async move { svc.0.persist(request).await };
        Box::pin(fut)
    }
}
impl tower::Service<quickwit_common::ServiceStream<SynReplicationMessage>>
for InnerIngesterServiceClient {
    type Response = IngesterServiceStream<AckReplicationMessage>;
    type Error = crate::ingest::IngestV2Error;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        std::task::Poll::Ready(Ok(()))
    }
    fn call(
        &mut self,
        request: quickwit_common::ServiceStream<SynReplicationMessage>,
    ) -> Self::Future {
        let svc = self.clone();
        let fut = async move { svc.0.open_replication_stream(request).await };
        Box::pin(fut)
    }
}
impl tower::Service<OpenFetchStreamRequest> for InnerIngesterServiceClient {
    type Response = IngesterServiceStream<FetchMessage>;
    type Error = crate::ingest::IngestV2Error;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, request: OpenFetchStreamRequest) -> Self::Future {
        let svc = self.clone();
        let fut = async move { svc.0.open_fetch_stream(request).await };
        Box::pin(fut)
    }
}
impl tower::Service<OpenObservationStreamRequest> for InnerIngesterServiceClient {
    type Response = IngesterServiceStream<ObservationMessage>;
    type Error = crate::ingest::IngestV2Error;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, request: OpenObservationStreamRequest) -> Self::Future {
        let svc = self.clone();
        let fut = async move { svc.0.open_observation_stream(request).await };
        Box::pin(fut)
    }
}
impl tower::Service<InitShardsRequest> for InnerIngesterServiceClient {
    type Response = InitShardsResponse;
    type Error = crate::ingest::IngestV2Error;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, request: InitShardsRequest) -> Self::Future {
        let svc = self.clone();
        let fut = async move { svc.0.init_shards(request).await };
        Box::pin(fut)
    }
}
impl tower::Service<RetainShardsRequest> for InnerIngesterServiceClient {
    type Response = RetainShardsResponse;
    type Error = crate::ingest::IngestV2Error;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, request: RetainShardsRequest) -> Self::Future {
        let svc = self.clone();
        let fut = async move { svc.0.retain_shards(request).await };
        Box::pin(fut)
    }
}
impl tower::Service<TruncateShardsRequest> for InnerIngesterServiceClient {
    type Response = TruncateShardsResponse;
    type Error = crate::ingest::IngestV2Error;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, request: TruncateShardsRequest) -> Self::Future {
        let svc = self.clone();
        let fut = async move { svc.0.truncate_shards(request).await };
        Box::pin(fut)
    }
}
impl tower::Service<CloseShardsRequest> for InnerIngesterServiceClient {
    type Response = CloseShardsResponse;
    type Error = crate::ingest::IngestV2Error;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, request: CloseShardsRequest) -> Self::Future {
        let svc = self.clone();
        let fut = async move { svc.0.close_shards(request).await };
        Box::pin(fut)
    }
}
impl tower::Service<DecommissionRequest> for InnerIngesterServiceClient {
    type Response = DecommissionResponse;
    type Error = crate::ingest::IngestV2Error;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, request: DecommissionRequest) -> Self::Future {
        let svc = self.clone();
        let fut = async move { svc.0.decommission(request).await };
        Box::pin(fut)
    }
}
/// A tower service stack is a set of tower services.
#[derive(Debug)]
struct IngesterServiceTowerServiceStack {
    #[allow(dead_code)]
    inner: InnerIngesterServiceClient,
    persist_svc: quickwit_common::tower::BoxService<
        PersistRequest,
        PersistResponse,
        crate::ingest::IngestV2Error,
    >,
    open_replication_stream_svc: quickwit_common::tower::BoxService<
        quickwit_common::ServiceStream<SynReplicationMessage>,
        IngesterServiceStream<AckReplicationMessage>,
        crate::ingest::IngestV2Error,
    >,
    open_fetch_stream_svc: quickwit_common::tower::BoxService<
        OpenFetchStreamRequest,
        IngesterServiceStream<FetchMessage>,
        crate::ingest::IngestV2Error,
    >,
    open_observation_stream_svc: quickwit_common::tower::BoxService<
        OpenObservationStreamRequest,
        IngesterServiceStream<ObservationMessage>,
        crate::ingest::IngestV2Error,
    >,
    init_shards_svc: quickwit_common::tower::BoxService<
        InitShardsRequest,
        InitShardsResponse,
        crate::ingest::IngestV2Error,
    >,
    retain_shards_svc: quickwit_common::tower::BoxService<
        RetainShardsRequest,
        RetainShardsResponse,
        crate::ingest::IngestV2Error,
    >,
    truncate_shards_svc: quickwit_common::tower::BoxService<
        TruncateShardsRequest,
        TruncateShardsResponse,
        crate::ingest::IngestV2Error,
    >,
    close_shards_svc: quickwit_common::tower::BoxService<
        CloseShardsRequest,
        CloseShardsResponse,
        crate::ingest::IngestV2Error,
    >,
    decommission_svc: quickwit_common::tower::BoxService<
        DecommissionRequest,
        DecommissionResponse,
        crate::ingest::IngestV2Error,
    >,
}
#[async_trait::async_trait]
impl IngesterService for IngesterServiceTowerServiceStack {
    async fn persist(
        &self,
        request: PersistRequest,
    ) -> crate::ingest::IngestV2Result<PersistResponse> {
        self.persist_svc.clone().ready().await?.call(request).await
    }
    async fn open_replication_stream(
        &self,
        request: quickwit_common::ServiceStream<SynReplicationMessage>,
    ) -> crate::ingest::IngestV2Result<IngesterServiceStream<AckReplicationMessage>> {
        self.open_replication_stream_svc.clone().ready().await?.call(request).await
    }
    async fn open_fetch_stream(
        &self,
        request: OpenFetchStreamRequest,
    ) -> crate::ingest::IngestV2Result<IngesterServiceStream<FetchMessage>> {
        self.open_fetch_stream_svc.clone().ready().await?.call(request).await
    }
    async fn open_observation_stream(
        &self,
        request: OpenObservationStreamRequest,
    ) -> crate::ingest::IngestV2Result<IngesterServiceStream<ObservationMessage>> {
        self.open_observation_stream_svc.clone().ready().await?.call(request).await
    }
    async fn init_shards(
        &self,
        request: InitShardsRequest,
    ) -> crate::ingest::IngestV2Result<InitShardsResponse> {
        self.init_shards_svc.clone().ready().await?.call(request).await
    }
    async fn retain_shards(
        &self,
        request: RetainShardsRequest,
    ) -> crate::ingest::IngestV2Result<RetainShardsResponse> {
        self.retain_shards_svc.clone().ready().await?.call(request).await
    }
    async fn truncate_shards(
        &self,
        request: TruncateShardsRequest,
    ) -> crate::ingest::IngestV2Result<TruncateShardsResponse> {
        self.truncate_shards_svc.clone().ready().await?.call(request).await
    }
    async fn close_shards(
        &self,
        request: CloseShardsRequest,
    ) -> crate::ingest::IngestV2Result<CloseShardsResponse> {
        self.close_shards_svc.clone().ready().await?.call(request).await
    }
    async fn decommission(
        &self,
        request: DecommissionRequest,
    ) -> crate::ingest::IngestV2Result<DecommissionResponse> {
        self.decommission_svc.clone().ready().await?.call(request).await
    }
}
type PersistLayer = quickwit_common::tower::BoxLayer<
    quickwit_common::tower::BoxService<
        PersistRequest,
        PersistResponse,
        crate::ingest::IngestV2Error,
    >,
    PersistRequest,
    PersistResponse,
    crate::ingest::IngestV2Error,
>;
type OpenReplicationStreamLayer = quickwit_common::tower::BoxLayer<
    quickwit_common::tower::BoxService<
        quickwit_common::ServiceStream<SynReplicationMessage>,
        IngesterServiceStream<AckReplicationMessage>,
        crate::ingest::IngestV2Error,
    >,
    quickwit_common::ServiceStream<SynReplicationMessage>,
    IngesterServiceStream<AckReplicationMessage>,
    crate::ingest::IngestV2Error,
>;
type OpenFetchStreamLayer = quickwit_common::tower::BoxLayer<
    quickwit_common::tower::BoxService<
        OpenFetchStreamRequest,
        IngesterServiceStream<FetchMessage>,
        crate::ingest::IngestV2Error,
    >,
    OpenFetchStreamRequest,
    IngesterServiceStream<FetchMessage>,
    crate::ingest::IngestV2Error,
>;
type OpenObservationStreamLayer = quickwit_common::tower::BoxLayer<
    quickwit_common::tower::BoxService<
        OpenObservationStreamRequest,
        IngesterServiceStream<ObservationMessage>,
        crate::ingest::IngestV2Error,
    >,
    OpenObservationStreamRequest,
    IngesterServiceStream<ObservationMessage>,
    crate::ingest::IngestV2Error,
>;
type InitShardsLayer = quickwit_common::tower::BoxLayer<
    quickwit_common::tower::BoxService<
        InitShardsRequest,
        InitShardsResponse,
        crate::ingest::IngestV2Error,
    >,
    InitShardsRequest,
    InitShardsResponse,
    crate::ingest::IngestV2Error,
>;
type RetainShardsLayer = quickwit_common::tower::BoxLayer<
    quickwit_common::tower::BoxService<
        RetainShardsRequest,
        RetainShardsResponse,
        crate::ingest::IngestV2Error,
    >,
    RetainShardsRequest,
    RetainShardsResponse,
    crate::ingest::IngestV2Error,
>;
type TruncateShardsLayer = quickwit_common::tower::BoxLayer<
    quickwit_common::tower::BoxService<
        TruncateShardsRequest,
        TruncateShardsResponse,
        crate::ingest::IngestV2Error,
    >,
    TruncateShardsRequest,
    TruncateShardsResponse,
    crate::ingest::IngestV2Error,
>;
type CloseShardsLayer = quickwit_common::tower::BoxLayer<
    quickwit_common::tower::BoxService<
        CloseShardsRequest,
        CloseShardsResponse,
        crate::ingest::IngestV2Error,
    >,
    CloseShardsRequest,
    CloseShardsResponse,
    crate::ingest::IngestV2Error,
>;
type DecommissionLayer = quickwit_common::tower::BoxLayer<
    quickwit_common::tower::BoxService<
        DecommissionRequest,
        DecommissionResponse,
        crate::ingest::IngestV2Error,
    >,
    DecommissionRequest,
    DecommissionResponse,
    crate::ingest::IngestV2Error,
>;
#[derive(Debug, Default)]
pub struct IngesterServiceTowerLayerStack {
    persist_layers: Vec<PersistLayer>,
    open_replication_stream_layers: Vec<OpenReplicationStreamLayer>,
    open_fetch_stream_layers: Vec<OpenFetchStreamLayer>,
    open_observation_stream_layers: Vec<OpenObservationStreamLayer>,
    init_shards_layers: Vec<InitShardsLayer>,
    retain_shards_layers: Vec<RetainShardsLayer>,
    truncate_shards_layers: Vec<TruncateShardsLayer>,
    close_shards_layers: Vec<CloseShardsLayer>,
    decommission_layers: Vec<DecommissionLayer>,
}
impl IngesterServiceTowerLayerStack {
    pub fn stack_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    PersistRequest,
                    PersistResponse,
                    crate::ingest::IngestV2Error,
                >,
            > + Clone + Send + Sync + 'static,
        <L as tower::Layer<
            quickwit_common::tower::BoxService<
                PersistRequest,
                PersistResponse,
                crate::ingest::IngestV2Error,
            >,
        >>::Service: tower::Service<
                PersistRequest,
                Response = PersistResponse,
                Error = crate::ingest::IngestV2Error,
            > + Clone + Send + Sync + 'static,
        <<L as tower::Layer<
            quickwit_common::tower::BoxService<
                PersistRequest,
                PersistResponse,
                crate::ingest::IngestV2Error,
            >,
        >>::Service as tower::Service<PersistRequest>>::Future: Send + 'static,
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    quickwit_common::ServiceStream<SynReplicationMessage>,
                    IngesterServiceStream<AckReplicationMessage>,
                    crate::ingest::IngestV2Error,
                >,
            > + Clone + Send + Sync + 'static,
        <L as tower::Layer<
            quickwit_common::tower::BoxService<
                quickwit_common::ServiceStream<SynReplicationMessage>,
                IngesterServiceStream<AckReplicationMessage>,
                crate::ingest::IngestV2Error,
            >,
        >>::Service: tower::Service<
                quickwit_common::ServiceStream<SynReplicationMessage>,
                Response = IngesterServiceStream<AckReplicationMessage>,
                Error = crate::ingest::IngestV2Error,
            > + Clone + Send + Sync + 'static,
        <<L as tower::Layer<
            quickwit_common::tower::BoxService<
                quickwit_common::ServiceStream<SynReplicationMessage>,
                IngesterServiceStream<AckReplicationMessage>,
                crate::ingest::IngestV2Error,
            >,
        >>::Service as tower::Service<
            quickwit_common::ServiceStream<SynReplicationMessage>,
        >>::Future: Send + 'static,
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    OpenFetchStreamRequest,
                    IngesterServiceStream<FetchMessage>,
                    crate::ingest::IngestV2Error,
                >,
            > + Clone + Send + Sync + 'static,
        <L as tower::Layer<
            quickwit_common::tower::BoxService<
                OpenFetchStreamRequest,
                IngesterServiceStream<FetchMessage>,
                crate::ingest::IngestV2Error,
            >,
        >>::Service: tower::Service<
                OpenFetchStreamRequest,
                Response = IngesterServiceStream<FetchMessage>,
                Error = crate::ingest::IngestV2Error,
            > + Clone + Send + Sync + 'static,
        <<L as tower::Layer<
            quickwit_common::tower::BoxService<
                OpenFetchStreamRequest,
                IngesterServiceStream<FetchMessage>,
                crate::ingest::IngestV2Error,
            >,
        >>::Service as tower::Service<OpenFetchStreamRequest>>::Future: Send + 'static,
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    OpenObservationStreamRequest,
                    IngesterServiceStream<ObservationMessage>,
                    crate::ingest::IngestV2Error,
                >,
            > + Clone + Send + Sync + 'static,
        <L as tower::Layer<
            quickwit_common::tower::BoxService<
                OpenObservationStreamRequest,
                IngesterServiceStream<ObservationMessage>,
                crate::ingest::IngestV2Error,
            >,
        >>::Service: tower::Service<
                OpenObservationStreamRequest,
                Response = IngesterServiceStream<ObservationMessage>,
                Error = crate::ingest::IngestV2Error,
            > + Clone + Send + Sync + 'static,
        <<L as tower::Layer<
            quickwit_common::tower::BoxService<
                OpenObservationStreamRequest,
                IngesterServiceStream<ObservationMessage>,
                crate::ingest::IngestV2Error,
            >,
        >>::Service as tower::Service<
            OpenObservationStreamRequest,
        >>::Future: Send + 'static,
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    InitShardsRequest,
                    InitShardsResponse,
                    crate::ingest::IngestV2Error,
                >,
            > + Clone + Send + Sync + 'static,
        <L as tower::Layer<
            quickwit_common::tower::BoxService<
                InitShardsRequest,
                InitShardsResponse,
                crate::ingest::IngestV2Error,
            >,
        >>::Service: tower::Service<
                InitShardsRequest,
                Response = InitShardsResponse,
                Error = crate::ingest::IngestV2Error,
            > + Clone + Send + Sync + 'static,
        <<L as tower::Layer<
            quickwit_common::tower::BoxService<
                InitShardsRequest,
                InitShardsResponse,
                crate::ingest::IngestV2Error,
            >,
        >>::Service as tower::Service<InitShardsRequest>>::Future: Send + 'static,
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    RetainShardsRequest,
                    RetainShardsResponse,
                    crate::ingest::IngestV2Error,
                >,
            > + Clone + Send + Sync + 'static,
        <L as tower::Layer<
            quickwit_common::tower::BoxService<
                RetainShardsRequest,
                RetainShardsResponse,
                crate::ingest::IngestV2Error,
            >,
        >>::Service: tower::Service<
                RetainShardsRequest,
                Response = RetainShardsResponse,
                Error = crate::ingest::IngestV2Error,
            > + Clone + Send + Sync + 'static,
        <<L as tower::Layer<
            quickwit_common::tower::BoxService<
                RetainShardsRequest,
                RetainShardsResponse,
                crate::ingest::IngestV2Error,
            >,
        >>::Service as tower::Service<RetainShardsRequest>>::Future: Send + 'static,
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    TruncateShardsRequest,
                    TruncateShardsResponse,
                    crate::ingest::IngestV2Error,
                >,
            > + Clone + Send + Sync + 'static,
        <L as tower::Layer<
            quickwit_common::tower::BoxService<
                TruncateShardsRequest,
                TruncateShardsResponse,
                crate::ingest::IngestV2Error,
            >,
        >>::Service: tower::Service<
                TruncateShardsRequest,
                Response = TruncateShardsResponse,
                Error = crate::ingest::IngestV2Error,
            > + Clone + Send + Sync + 'static,
        <<L as tower::Layer<
            quickwit_common::tower::BoxService<
                TruncateShardsRequest,
                TruncateShardsResponse,
                crate::ingest::IngestV2Error,
            >,
        >>::Service as tower::Service<TruncateShardsRequest>>::Future: Send + 'static,
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    CloseShardsRequest,
                    CloseShardsResponse,
                    crate::ingest::IngestV2Error,
                >,
            > + Clone + Send + Sync + 'static,
        <L as tower::Layer<
            quickwit_common::tower::BoxService<
                CloseShardsRequest,
                CloseShardsResponse,
                crate::ingest::IngestV2Error,
            >,
        >>::Service: tower::Service<
                CloseShardsRequest,
                Response = CloseShardsResponse,
                Error = crate::ingest::IngestV2Error,
            > + Clone + Send + Sync + 'static,
        <<L as tower::Layer<
            quickwit_common::tower::BoxService<
                CloseShardsRequest,
                CloseShardsResponse,
                crate::ingest::IngestV2Error,
            >,
        >>::Service as tower::Service<CloseShardsRequest>>::Future: Send + 'static,
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    DecommissionRequest,
                    DecommissionResponse,
                    crate::ingest::IngestV2Error,
                >,
            > + Clone + Send + Sync + 'static,
        <L as tower::Layer<
            quickwit_common::tower::BoxService<
                DecommissionRequest,
                DecommissionResponse,
                crate::ingest::IngestV2Error,
            >,
        >>::Service: tower::Service<
                DecommissionRequest,
                Response = DecommissionResponse,
                Error = crate::ingest::IngestV2Error,
            > + Clone + Send + Sync + 'static,
        <<L as tower::Layer<
            quickwit_common::tower::BoxService<
                DecommissionRequest,
                DecommissionResponse,
                crate::ingest::IngestV2Error,
            >,
        >>::Service as tower::Service<DecommissionRequest>>::Future: Send + 'static,
    {
        self.persist_layers.push(quickwit_common::tower::BoxLayer::new(layer.clone()));
        self.open_replication_stream_layers
            .push(quickwit_common::tower::BoxLayer::new(layer.clone()));
        self.open_fetch_stream_layers
            .push(quickwit_common::tower::BoxLayer::new(layer.clone()));
        self.open_observation_stream_layers
            .push(quickwit_common::tower::BoxLayer::new(layer.clone()));
        self.init_shards_layers
            .push(quickwit_common::tower::BoxLayer::new(layer.clone()));
        self.retain_shards_layers
            .push(quickwit_common::tower::BoxLayer::new(layer.clone()));
        self.truncate_shards_layers
            .push(quickwit_common::tower::BoxLayer::new(layer.clone()));
        self.close_shards_layers
            .push(quickwit_common::tower::BoxLayer::new(layer.clone()));
        self.decommission_layers
            .push(quickwit_common::tower::BoxLayer::new(layer.clone()));
        self
    }
    pub fn stack_persist_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    PersistRequest,
                    PersistResponse,
                    crate::ingest::IngestV2Error,
                >,
            > + Send + Sync + 'static,
        L::Service: tower::Service<
                PersistRequest,
                Response = PersistResponse,
                Error = crate::ingest::IngestV2Error,
            > + Clone + Send + Sync + 'static,
        <L::Service as tower::Service<PersistRequest>>::Future: Send + 'static,
    {
        self.persist_layers.push(quickwit_common::tower::BoxLayer::new(layer));
        self
    }
    pub fn stack_open_replication_stream_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    quickwit_common::ServiceStream<SynReplicationMessage>,
                    IngesterServiceStream<AckReplicationMessage>,
                    crate::ingest::IngestV2Error,
                >,
            > + Send + Sync + 'static,
        L::Service: tower::Service<
                quickwit_common::ServiceStream<SynReplicationMessage>,
                Response = IngesterServiceStream<AckReplicationMessage>,
                Error = crate::ingest::IngestV2Error,
            > + Clone + Send + Sync + 'static,
        <L::Service as tower::Service<
            quickwit_common::ServiceStream<SynReplicationMessage>,
        >>::Future: Send + 'static,
    {
        self.open_replication_stream_layers
            .push(quickwit_common::tower::BoxLayer::new(layer));
        self
    }
    pub fn stack_open_fetch_stream_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    OpenFetchStreamRequest,
                    IngesterServiceStream<FetchMessage>,
                    crate::ingest::IngestV2Error,
                >,
            > + Send + Sync + 'static,
        L::Service: tower::Service<
                OpenFetchStreamRequest,
                Response = IngesterServiceStream<FetchMessage>,
                Error = crate::ingest::IngestV2Error,
            > + Clone + Send + Sync + 'static,
        <L::Service as tower::Service<OpenFetchStreamRequest>>::Future: Send + 'static,
    {
        self.open_fetch_stream_layers.push(quickwit_common::tower::BoxLayer::new(layer));
        self
    }
    pub fn stack_open_observation_stream_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    OpenObservationStreamRequest,
                    IngesterServiceStream<ObservationMessage>,
                    crate::ingest::IngestV2Error,
                >,
            > + Send + Sync + 'static,
        L::Service: tower::Service<
                OpenObservationStreamRequest,
                Response = IngesterServiceStream<ObservationMessage>,
                Error = crate::ingest::IngestV2Error,
            > + Clone + Send + Sync + 'static,
        <L::Service as tower::Service<
            OpenObservationStreamRequest,
        >>::Future: Send + 'static,
    {
        self.open_observation_stream_layers
            .push(quickwit_common::tower::BoxLayer::new(layer));
        self
    }
    pub fn stack_init_shards_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    InitShardsRequest,
                    InitShardsResponse,
                    crate::ingest::IngestV2Error,
                >,
            > + Send + Sync + 'static,
        L::Service: tower::Service<
                InitShardsRequest,
                Response = InitShardsResponse,
                Error = crate::ingest::IngestV2Error,
            > + Clone + Send + Sync + 'static,
        <L::Service as tower::Service<InitShardsRequest>>::Future: Send + 'static,
    {
        self.init_shards_layers.push(quickwit_common::tower::BoxLayer::new(layer));
        self
    }
    pub fn stack_retain_shards_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    RetainShardsRequest,
                    RetainShardsResponse,
                    crate::ingest::IngestV2Error,
                >,
            > + Send + Sync + 'static,
        L::Service: tower::Service<
                RetainShardsRequest,
                Response = RetainShardsResponse,
                Error = crate::ingest::IngestV2Error,
            > + Clone + Send + Sync + 'static,
        <L::Service as tower::Service<RetainShardsRequest>>::Future: Send + 'static,
    {
        self.retain_shards_layers.push(quickwit_common::tower::BoxLayer::new(layer));
        self
    }
    pub fn stack_truncate_shards_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    TruncateShardsRequest,
                    TruncateShardsResponse,
                    crate::ingest::IngestV2Error,
                >,
            > + Send + Sync + 'static,
        L::Service: tower::Service<
                TruncateShardsRequest,
                Response = TruncateShardsResponse,
                Error = crate::ingest::IngestV2Error,
            > + Clone + Send + Sync + 'static,
        <L::Service as tower::Service<TruncateShardsRequest>>::Future: Send + 'static,
    {
        self.truncate_shards_layers.push(quickwit_common::tower::BoxLayer::new(layer));
        self
    }
    pub fn stack_close_shards_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    CloseShardsRequest,
                    CloseShardsResponse,
                    crate::ingest::IngestV2Error,
                >,
            > + Send + Sync + 'static,
        L::Service: tower::Service<
                CloseShardsRequest,
                Response = CloseShardsResponse,
                Error = crate::ingest::IngestV2Error,
            > + Clone + Send + Sync + 'static,
        <L::Service as tower::Service<CloseShardsRequest>>::Future: Send + 'static,
    {
        self.close_shards_layers.push(quickwit_common::tower::BoxLayer::new(layer));
        self
    }
    pub fn stack_decommission_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    DecommissionRequest,
                    DecommissionResponse,
                    crate::ingest::IngestV2Error,
                >,
            > + Send + Sync + 'static,
        L::Service: tower::Service<
                DecommissionRequest,
                Response = DecommissionResponse,
                Error = crate::ingest::IngestV2Error,
            > + Clone + Send + Sync + 'static,
        <L::Service as tower::Service<DecommissionRequest>>::Future: Send + 'static,
    {
        self.decommission_layers.push(quickwit_common::tower::BoxLayer::new(layer));
        self
    }
    pub fn build<T>(self, instance: T) -> IngesterServiceClient
    where
        T: IngesterService,
    {
        let inner_client = InnerIngesterServiceClient(std::sync::Arc::new(instance));
        self.build_from_inner_client(inner_client)
    }
    pub fn build_from_channel(
        self,
        addr: std::net::SocketAddr,
        channel: tonic::transport::Channel,
        max_message_size: bytesize::ByteSize,
        compression_encoding_opt: Option<tonic::codec::CompressionEncoding>,
    ) -> IngesterServiceClient {
        let client = IngesterServiceClient::from_channel(
            addr,
            channel,
            max_message_size,
            compression_encoding_opt,
        );
        let inner_client = client.inner;
        self.build_from_inner_client(inner_client)
    }
    pub fn build_from_balance_channel(
        self,
        balance_channel: quickwit_common::tower::BalanceChannel<std::net::SocketAddr>,
        max_message_size: bytesize::ByteSize,
        compression_encoding_opt: Option<tonic::codec::CompressionEncoding>,
    ) -> IngesterServiceClient {
        let client = IngesterServiceClient::from_balance_channel(
            balance_channel,
            max_message_size,
            compression_encoding_opt,
        );
        let inner_client = client.inner;
        self.build_from_inner_client(inner_client)
    }
    pub fn build_from_mailbox<A>(
        self,
        mailbox: quickwit_actors::Mailbox<A>,
    ) -> IngesterServiceClient
    where
        A: quickwit_actors::Actor + std::fmt::Debug + Send + 'static,
        IngesterServiceMailbox<A>: IngesterService,
    {
        let inner_client = InnerIngesterServiceClient(
            std::sync::Arc::new(IngesterServiceMailbox::new(mailbox)),
        );
        self.build_from_inner_client(inner_client)
    }
    #[cfg(any(test, feature = "testsuite"))]
    pub fn build_from_mock(self, mock: MockIngesterService) -> IngesterServiceClient {
        let client = IngesterServiceClient::from_mock(mock);
        let inner_client = client.inner;
        self.build_from_inner_client(inner_client)
    }
    fn build_from_inner_client(
        self,
        inner_client: InnerIngesterServiceClient,
    ) -> IngesterServiceClient {
        let persist_svc = self
            .persist_layers
            .into_iter()
            .rev()
            .fold(
                quickwit_common::tower::BoxService::new(inner_client.clone()),
                |svc, layer| layer.layer(svc),
            );
        let open_replication_stream_svc = self
            .open_replication_stream_layers
            .into_iter()
            .rev()
            .fold(
                quickwit_common::tower::BoxService::new(inner_client.clone()),
                |svc, layer| layer.layer(svc),
            );
        let open_fetch_stream_svc = self
            .open_fetch_stream_layers
            .into_iter()
            .rev()
            .fold(
                quickwit_common::tower::BoxService::new(inner_client.clone()),
                |svc, layer| layer.layer(svc),
            );
        let open_observation_stream_svc = self
            .open_observation_stream_layers
            .into_iter()
            .rev()
            .fold(
                quickwit_common::tower::BoxService::new(inner_client.clone()),
                |svc, layer| layer.layer(svc),
            );
        let init_shards_svc = self
            .init_shards_layers
            .into_iter()
            .rev()
            .fold(
                quickwit_common::tower::BoxService::new(inner_client.clone()),
                |svc, layer| layer.layer(svc),
            );
        let retain_shards_svc = self
            .retain_shards_layers
            .into_iter()
            .rev()
            .fold(
                quickwit_common::tower::BoxService::new(inner_client.clone()),
                |svc, layer| layer.layer(svc),
            );
        let truncate_shards_svc = self
            .truncate_shards_layers
            .into_iter()
            .rev()
            .fold(
                quickwit_common::tower::BoxService::new(inner_client.clone()),
                |svc, layer| layer.layer(svc),
            );
        let close_shards_svc = self
            .close_shards_layers
            .into_iter()
            .rev()
            .fold(
                quickwit_common::tower::BoxService::new(inner_client.clone()),
                |svc, layer| layer.layer(svc),
            );
        let decommission_svc = self
            .decommission_layers
            .into_iter()
            .rev()
            .fold(
                quickwit_common::tower::BoxService::new(inner_client.clone()),
                |svc, layer| layer.layer(svc),
            );
        let tower_svc_stack = IngesterServiceTowerServiceStack {
            inner: inner_client,
            persist_svc,
            open_replication_stream_svc,
            open_fetch_stream_svc,
            open_observation_stream_svc,
            init_shards_svc,
            retain_shards_svc,
            truncate_shards_svc,
            close_shards_svc,
            decommission_svc,
        };
        IngesterServiceClient::new(tower_svc_stack)
    }
}
#[derive(Debug, Clone)]
struct MailboxAdapter<A: quickwit_actors::Actor, E> {
    inner: quickwit_actors::Mailbox<A>,
    phantom: std::marker::PhantomData<E>,
}
impl<A, E> std::ops::Deref for MailboxAdapter<A, E>
where
    A: quickwit_actors::Actor,
{
    type Target = quickwit_actors::Mailbox<A>;
    fn deref(&self) -> &Self::Target {
        &self.inner
    }
}
#[derive(Debug)]
pub struct IngesterServiceMailbox<A: quickwit_actors::Actor> {
    inner: MailboxAdapter<A, crate::ingest::IngestV2Error>,
}
impl<A: quickwit_actors::Actor> IngesterServiceMailbox<A> {
    pub fn new(instance: quickwit_actors::Mailbox<A>) -> Self {
        let inner = MailboxAdapter {
            inner: instance,
            phantom: std::marker::PhantomData,
        };
        Self { inner }
    }
}
impl<A: quickwit_actors::Actor> Clone for IngesterServiceMailbox<A> {
    fn clone(&self) -> Self {
        let inner = MailboxAdapter {
            inner: self.inner.clone(),
            phantom: std::marker::PhantomData,
        };
        Self { inner }
    }
}
impl<A, M, T, E> tower::Service<M> for IngesterServiceMailbox<A>
where
    A: quickwit_actors::Actor
        + quickwit_actors::DeferableReplyHandler<M, Reply = Result<T, E>> + Send
        + 'static,
    M: std::fmt::Debug + Send + 'static,
    T: Send + 'static,
    E: std::fmt::Debug + Send + 'static,
    crate::ingest::IngestV2Error: From<quickwit_actors::AskError<E>>,
{
    type Response = T;
    type Error = crate::ingest::IngestV2Error;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        //! This does not work with balance middlewares such as `tower::balance::pool::Pool` because
        //! this always returns `Poll::Ready`. The fix is to acquire a permit from the
        //! mailbox in `poll_ready` and consume it in `call`.
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, message: M) -> Self::Future {
        let mailbox = self.inner.clone();
        let fut = async move {
            mailbox.ask_for_res(message).await.map_err(|error| error.into())
        };
        Box::pin(fut)
    }
}
#[async_trait::async_trait]
impl<A> IngesterService for IngesterServiceMailbox<A>
where
    A: quickwit_actors::Actor + std::fmt::Debug,
    IngesterServiceMailbox<
        A,
    >: tower::Service<
            PersistRequest,
            Response = PersistResponse,
            Error = crate::ingest::IngestV2Error,
            Future = BoxFuture<PersistResponse, crate::ingest::IngestV2Error>,
        >
        + tower::Service<
            quickwit_common::ServiceStream<SynReplicationMessage>,
            Response = IngesterServiceStream<AckReplicationMessage>,
            Error = crate::ingest::IngestV2Error,
            Future = BoxFuture<
                IngesterServiceStream<AckReplicationMessage>,
                crate::ingest::IngestV2Error,
            >,
        >
        + tower::Service<
            OpenFetchStreamRequest,
            Response = IngesterServiceStream<FetchMessage>,
            Error = crate::ingest::IngestV2Error,
            Future = BoxFuture<
                IngesterServiceStream<FetchMessage>,
                crate::ingest::IngestV2Error,
            >,
        >
        + tower::Service<
            OpenObservationStreamRequest,
            Response = IngesterServiceStream<ObservationMessage>,
            Error = crate::ingest::IngestV2Error,
            Future = BoxFuture<
                IngesterServiceStream<ObservationMessage>,
                crate::ingest::IngestV2Error,
            >,
        >
        + tower::Service<
            InitShardsRequest,
            Response = InitShardsResponse,
            Error = crate::ingest::IngestV2Error,
            Future = BoxFuture<InitShardsResponse, crate::ingest::IngestV2Error>,
        >
        + tower::Service<
            RetainShardsRequest,
            Response = RetainShardsResponse,
            Error = crate::ingest::IngestV2Error,
            Future = BoxFuture<RetainShardsResponse, crate::ingest::IngestV2Error>,
        >
        + tower::Service<
            TruncateShardsRequest,
            Response = TruncateShardsResponse,
            Error = crate::ingest::IngestV2Error,
            Future = BoxFuture<TruncateShardsResponse, crate::ingest::IngestV2Error>,
        >
        + tower::Service<
            CloseShardsRequest,
            Response = CloseShardsResponse,
            Error = crate::ingest::IngestV2Error,
            Future = BoxFuture<CloseShardsResponse, crate::ingest::IngestV2Error>,
        >
        + tower::Service<
            DecommissionRequest,
            Response = DecommissionResponse,
            Error = crate::ingest::IngestV2Error,
            Future = BoxFuture<DecommissionResponse, crate::ingest::IngestV2Error>,
        >,
{
    async fn persist(
        &self,
        request: PersistRequest,
    ) -> crate::ingest::IngestV2Result<PersistResponse> {
        self.clone().call(request).await
    }
    async fn open_replication_stream(
        &self,
        request: quickwit_common::ServiceStream<SynReplicationMessage>,
    ) -> crate::ingest::IngestV2Result<IngesterServiceStream<AckReplicationMessage>> {
        self.clone().call(request).await
    }
    async fn open_fetch_stream(
        &self,
        request: OpenFetchStreamRequest,
    ) -> crate::ingest::IngestV2Result<IngesterServiceStream<FetchMessage>> {
        self.clone().call(request).await
    }
    async fn open_observation_stream(
        &self,
        request: OpenObservationStreamRequest,
    ) -> crate::ingest::IngestV2Result<IngesterServiceStream<ObservationMessage>> {
        self.clone().call(request).await
    }
    async fn init_shards(
        &self,
        request: InitShardsRequest,
    ) -> crate::ingest::IngestV2Result<InitShardsResponse> {
        self.clone().call(request).await
    }
    async fn retain_shards(
        &self,
        request: RetainShardsRequest,
    ) -> crate::ingest::IngestV2Result<RetainShardsResponse> {
        self.clone().call(request).await
    }
    async fn truncate_shards(
        &self,
        request: TruncateShardsRequest,
    ) -> crate::ingest::IngestV2Result<TruncateShardsResponse> {
        self.clone().call(request).await
    }
    async fn close_shards(
        &self,
        request: CloseShardsRequest,
    ) -> crate::ingest::IngestV2Result<CloseShardsResponse> {
        self.clone().call(request).await
    }
    async fn decommission(
        &self,
        request: DecommissionRequest,
    ) -> crate::ingest::IngestV2Result<DecommissionResponse> {
        self.clone().call(request).await
    }
}
#[derive(Debug, Clone)]
pub struct IngesterServiceGrpcClientAdapter<T> {
    inner: T,
    #[allow(dead_code)]
    connection_addrs_rx: tokio::sync::watch::Receiver<
        std::collections::HashSet<std::net::SocketAddr>,
    >,
}
impl<T> IngesterServiceGrpcClientAdapter<T> {
    pub fn new(
        instance: T,
        connection_addrs_rx: tokio::sync::watch::Receiver<
            std::collections::HashSet<std::net::SocketAddr>,
        >,
    ) -> Self {
        Self {
            inner: instance,
            connection_addrs_rx,
        }
    }
}
#[async_trait::async_trait]
impl<T> IngesterService
for IngesterServiceGrpcClientAdapter<
    ingester_service_grpc_client::IngesterServiceGrpcClient<T>,
>
where
    T: tonic::client::GrpcService<tonic::body::Body> + std::fmt::Debug + Clone + Send
        + Sync + 'static,
    T::ResponseBody: tonic::codegen::Body<Data = tonic::codegen::Bytes> + Send + 'static,
    <T::ResponseBody as tonic::codegen::Body>::Error: Into<tonic::codegen::StdError>
        + Send,
    T::Future: Send,
{
    async fn persist(
        &self,
        request: PersistRequest,
    ) -> crate::ingest::IngestV2Result<PersistResponse> {
        self.inner
            .clone()
            .persist(request)
            .await
            .map(|response| response.into_inner())
            .map_err(|status| crate::error::grpc_status_to_service_error(
                status,
                PersistRequest::rpc_name(),
            ))
    }
    async fn open_replication_stream(
        &self,
        request: quickwit_common::ServiceStream<SynReplicationMessage>,
    ) -> crate::ingest::IngestV2Result<IngesterServiceStream<AckReplicationMessage>> {
        self.inner
            .clone()
            .open_replication_stream(request)
            .await
            .map(|response| {
                let streaming: tonic::Streaming<_> = response.into_inner();
                let stream = quickwit_common::ServiceStream::from(streaming);
                stream
                    .map_err(|status| crate::error::grpc_status_to_service_error(
                        status,
                        SynReplicationMessage::rpc_name(),
                    ))
            })
            .map_err(|status| crate::error::grpc_status_to_service_error(
                status,
                SynReplicationMessage::rpc_name(),
            ))
    }
    async fn open_fetch_stream(
        &self,
        request: OpenFetchStreamRequest,
    ) -> crate::ingest::IngestV2Result<IngesterServiceStream<FetchMessage>> {
        self.inner
            .clone()
            .open_fetch_stream(request)
            .await
            .map(|response| {
                let streaming: tonic::Streaming<_> = response.into_inner();
                let stream = quickwit_common::ServiceStream::from(streaming);
                stream
                    .map_err(|status| crate::error::grpc_status_to_service_error(
                        status,
                        OpenFetchStreamRequest::rpc_name(),
                    ))
            })
            .map_err(|status| crate::error::grpc_status_to_service_error(
                status,
                OpenFetchStreamRequest::rpc_name(),
            ))
    }
    async fn open_observation_stream(
        &self,
        request: OpenObservationStreamRequest,
    ) -> crate::ingest::IngestV2Result<IngesterServiceStream<ObservationMessage>> {
        self.inner
            .clone()
            .open_observation_stream(request)
            .await
            .map(|response| {
                let streaming: tonic::Streaming<_> = response.into_inner();
                let stream = quickwit_common::ServiceStream::from(streaming);
                stream
                    .map_err(|status| crate::error::grpc_status_to_service_error(
                        status,
                        OpenObservationStreamRequest::rpc_name(),
                    ))
            })
            .map_err(|status| crate::error::grpc_status_to_service_error(
                status,
                OpenObservationStreamRequest::rpc_name(),
            ))
    }
    async fn init_shards(
        &self,
        request: InitShardsRequest,
    ) -> crate::ingest::IngestV2Result<InitShardsResponse> {
        self.inner
            .clone()
            .init_shards(request)
            .await
            .map(|response| response.into_inner())
            .map_err(|status| crate::error::grpc_status_to_service_error(
                status,
                InitShardsRequest::rpc_name(),
            ))
    }
    async fn retain_shards(
        &self,
        request: RetainShardsRequest,
    ) -> crate::ingest::IngestV2Result<RetainShardsResponse> {
        self.inner
            .clone()
            .retain_shards(request)
            .await
            .map(|response| response.into_inner())
            .map_err(|status| crate::error::grpc_status_to_service_error(
                status,
                RetainShardsRequest::rpc_name(),
            ))
    }
    async fn truncate_shards(
        &self,
        request: TruncateShardsRequest,
    ) -> crate::ingest::IngestV2Result<TruncateShardsResponse> {
        self.inner
            .clone()
            .truncate_shards(request)
            .await
            .map(|response| response.into_inner())
            .map_err(|status| crate::error::grpc_status_to_service_error(
                status,
                TruncateShardsRequest::rpc_name(),
            ))
    }
    async fn close_shards(
        &self,
        request: CloseShardsRequest,
    ) -> crate::ingest::IngestV2Result<CloseShardsResponse> {
        self.inner
            .clone()
            .close_shards(request)
            .await
            .map(|response| response.into_inner())
            .map_err(|status| crate::error::grpc_status_to_service_error(
                status,
                CloseShardsRequest::rpc_name(),
            ))
    }
    async fn decommission(
        &self,
        request: DecommissionRequest,
    ) -> crate::ingest::IngestV2Result<DecommissionResponse> {
        self.inner
            .clone()
            .decommission(request)
            .await
            .map(|response| response.into_inner())
            .map_err(|status| crate::error::grpc_status_to_service_error(
                status,
                DecommissionRequest::rpc_name(),
            ))
    }
}
#[derive(Debug)]
pub struct IngesterServiceGrpcServerAdapter {
    inner: InnerIngesterServiceClient,
}
impl IngesterServiceGrpcServerAdapter {
    pub fn new<T>(instance: T) -> Self
    where
        T: IngesterService,
    {
        Self {
            inner: InnerIngesterServiceClient(std::sync::Arc::new(instance)),
        }
    }
}
#[async_trait::async_trait]
impl ingester_service_grpc_server::IngesterServiceGrpc
for IngesterServiceGrpcServerAdapter {
    async fn persist(
        &self,
        request: tonic::Request<PersistRequest>,
    ) -> Result<tonic::Response<PersistResponse>, tonic::Status> {
        self.inner
            .0
            .persist(request.into_inner())
            .await
            .map(tonic::Response::new)
            .map_err(crate::error::grpc_error_to_grpc_status)
    }
    type OpenReplicationStreamStream = quickwit_common::ServiceStream<
        tonic::Result<AckReplicationMessage>,
    >;
    async fn open_replication_stream(
        &self,
        request: tonic::Request<tonic::Streaming<SynReplicationMessage>>,
    ) -> Result<tonic::Response<Self::OpenReplicationStreamStream>, tonic::Status> {
        self.inner
            .0
            .open_replication_stream({
                let streaming: tonic::Streaming<_> = request.into_inner();
                quickwit_common::ServiceStream::from(streaming)
            })
            .await
            .map(|stream| tonic::Response::new(
                stream.map_err(crate::error::grpc_error_to_grpc_status),
            ))
            .map_err(crate::error::grpc_error_to_grpc_status)
    }
    type OpenFetchStreamStream = quickwit_common::ServiceStream<
        tonic::Result<FetchMessage>,
    >;
    async fn open_fetch_stream(
        &self,
        request: tonic::Request<OpenFetchStreamRequest>,
    ) -> Result<tonic::Response<Self::OpenFetchStreamStream>, tonic::Status> {
        self.inner
            .0
            .open_fetch_stream(request.into_inner())
            .await
            .map(|stream| tonic::Response::new(
                stream.map_err(crate::error::grpc_error_to_grpc_status),
            ))
            .map_err(crate::error::grpc_error_to_grpc_status)
    }
    type OpenObservationStreamStream = quickwit_common::ServiceStream<
        tonic::Result<ObservationMessage>,
    >;
    async fn open_observation_stream(
        &self,
        request: tonic::Request<OpenObservationStreamRequest>,
    ) -> Result<tonic::Response<Self::OpenObservationStreamStream>, tonic::Status> {
        self.inner
            .0
            .open_observation_stream(request.into_inner())
            .await
            .map(|stream| tonic::Response::new(
                stream.map_err(crate::error::grpc_error_to_grpc_status),
            ))
            .map_err(crate::error::grpc_error_to_grpc_status)
    }
    async fn init_shards(
        &self,
        request: tonic::Request<InitShardsRequest>,
    ) -> Result<tonic::Response<InitShardsResponse>, tonic::Status> {
        self.inner
            .0
            .init_shards(request.into_inner())
            .await
            .map(tonic::Response::new)
            .map_err(crate::error::grpc_error_to_grpc_status)
    }
    async fn retain_shards(
        &self,
        request: tonic::Request<RetainShardsRequest>,
    ) -> Result<tonic::Response<RetainShardsResponse>, tonic::Status> {
        self.inner
            .0
            .retain_shards(request.into_inner())
            .await
            .map(tonic::Response::new)
            .map_err(crate::error::grpc_error_to_grpc_status)
    }
    async fn truncate_shards(
        &self,
        request: tonic::Request<TruncateShardsRequest>,
    ) -> Result<tonic::Response<TruncateShardsResponse>, tonic::Status> {
        self.inner
            .0
            .truncate_shards(request.into_inner())
            .await
            .map(tonic::Response::new)
            .map_err(crate::error::grpc_error_to_grpc_status)
    }
    async fn close_shards(
        &self,
        request: tonic::Request<CloseShardsRequest>,
    ) -> Result<tonic::Response<CloseShardsResponse>, tonic::Status> {
        self.inner
            .0
            .close_shards(request.into_inner())
            .await
            .map(tonic::Response::new)
            .map_err(crate::error::grpc_error_to_grpc_status)
    }
    async fn decommission(
        &self,
        request: tonic::Request<DecommissionRequest>,
    ) -> Result<tonic::Response<DecommissionResponse>, tonic::Status> {
        self.inner
            .0
            .decommission(request.into_inner())
            .await
            .map(tonic::Response::new)
            .map_err(crate::error::grpc_error_to_grpc_status)
    }
}
/// Generated client implementations.
pub mod ingester_service_grpc_client {
    #![allow(
        unused_variables,
        dead_code,
        missing_docs,
        clippy::wildcard_imports,
        clippy::let_unit_value,
    )]
    use tonic::codegen::*;
    use tonic::codegen::http::Uri;
    #[derive(Debug, Clone)]
    pub struct IngesterServiceGrpcClient<T> {
        inner: tonic::client::Grpc<T>,
    }
    impl IngesterServiceGrpcClient<tonic::transport::Channel> {
        /// Attempt to create a new client by connecting to a given endpoint.
        pub async fn connect<D>(dst: D) -> Result<Self, tonic::transport::Error>
        where
            D: TryInto<tonic::transport::Endpoint>,
            D::Error: Into<StdError>,
        {
            let conn = tonic::transport::Endpoint::new(dst)?.connect().await?;
            Ok(Self::new(conn))
        }
    }
    impl<T> IngesterServiceGrpcClient<T>
    where
        T: tonic::client::GrpcService<tonic::body::Body>,
        T::Error: Into<StdError>,
        T::ResponseBody: Body<Data = Bytes> + std::marker::Send + 'static,
        <T::ResponseBody as Body>::Error: Into<StdError> + std::marker::Send,
    {
        pub fn new(inner: T) -> Self {
            let inner = tonic::client::Grpc::new(inner);
            Self { inner }
        }
        pub fn with_origin(inner: T, origin: Uri) -> Self {
            let inner = tonic::client::Grpc::with_origin(inner, origin);
            Self { inner }
        }
        pub fn with_interceptor<F>(
            inner: T,
            interceptor: F,
        ) -> IngesterServiceGrpcClient<InterceptedService<T, F>>
        where
            F: tonic::service::Interceptor,
            T::ResponseBody: Default,
            T: tonic::codegen::Service<
                http::Request<tonic::body::Body>,
                Response = http::Response<
                    <T as tonic::client::GrpcService<tonic::body::Body>>::ResponseBody,
                >,
            >,
            <T as tonic::codegen::Service<
                http::Request<tonic::body::Body>,
            >>::Error: Into<StdError> + std::marker::Send + std::marker::Sync,
        {
            IngesterServiceGrpcClient::new(InterceptedService::new(inner, interceptor))
        }
        /// Compress requests with the given encoding.
        ///
        /// This requires the server to support it otherwise it might respond with an
        /// error.
        #[must_use]
        pub fn send_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.inner = self.inner.send_compressed(encoding);
            self
        }
        /// Enable decompressing responses.
        #[must_use]
        pub fn accept_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.inner = self.inner.accept_compressed(encoding);
            self
        }
        /// Limits the maximum size of a decoded message.
        ///
        /// Default: `4MB`
        #[must_use]
        pub fn max_decoding_message_size(mut self, limit: usize) -> Self {
            self.inner = self.inner.max_decoding_message_size(limit);
            self
        }
        /// Limits the maximum size of an encoded message.
        ///
        /// Default: `usize::MAX`
        #[must_use]
        pub fn max_encoding_message_size(mut self, limit: usize) -> Self {
            self.inner = self.inner.max_encoding_message_size(limit);
            self
        }
        /// Persists batches of documents to primary shards hosted on a leader.
        pub async fn persist(
            &mut self,
            request: impl tonic::IntoRequest<super::PersistRequest>,
        ) -> std::result::Result<
            tonic::Response<super::PersistResponse>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/quickwit.ingest.ingester.IngesterService/Persist",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new(
                        "quickwit.ingest.ingester.IngesterService",
                        "Persist",
                    ),
                );
            self.inner.unary(req, path, codec).await
        }
        /// Opens a replication stream from a leader to a follower.
        pub async fn open_replication_stream(
            &mut self,
            request: impl tonic::IntoStreamingRequest<
                Message = super::SynReplicationMessage,
            >,
        ) -> std::result::Result<
            tonic::Response<tonic::codec::Streaming<super::AckReplicationMessage>>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/quickwit.ingest.ingester.IngesterService/OpenReplicationStream",
            );
            let mut req = request.into_streaming_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new(
                        "quickwit.ingest.ingester.IngesterService",
                        "OpenReplicationStream",
                    ),
                );
            self.inner.streaming(req, path, codec).await
        }
        /// Streams records from a leader or a follower. The client can optionally specify a range of positions to fetch,
        /// otherwise the stream will go indefinitely or until the shard is closed.
        pub async fn open_fetch_stream(
            &mut self,
            request: impl tonic::IntoRequest<super::OpenFetchStreamRequest>,
        ) -> std::result::Result<
            tonic::Response<tonic::codec::Streaming<super::FetchMessage>>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/quickwit.ingest.ingester.IngesterService/OpenFetchStream",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new(
                        "quickwit.ingest.ingester.IngesterService",
                        "OpenFetchStream",
                    ),
                );
            self.inner.server_streaming(req, path, codec).await
        }
        /// Streams status updates, called "observations", from an ingester.
        pub async fn open_observation_stream(
            &mut self,
            request: impl tonic::IntoRequest<super::OpenObservationStreamRequest>,
        ) -> std::result::Result<
            tonic::Response<tonic::codec::Streaming<super::ObservationMessage>>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/quickwit.ingest.ingester.IngesterService/OpenObservationStream",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new(
                        "quickwit.ingest.ingester.IngesterService",
                        "OpenObservationStream",
                    ),
                );
            self.inner.server_streaming(req, path, codec).await
        }
        /// Creates and initializes a set of newly opened shards. This RPC is called by the control plane on leaders.
        pub async fn init_shards(
            &mut self,
            request: impl tonic::IntoRequest<super::InitShardsRequest>,
        ) -> std::result::Result<
            tonic::Response<super::InitShardsResponse>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/quickwit.ingest.ingester.IngesterService/InitShards",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new(
                        "quickwit.ingest.ingester.IngesterService",
                        "InitShards",
                    ),
                );
            self.inner.unary(req, path, codec).await
        }
        /// Only retain the shards that are listed in the request.
        /// Other shards are deleted.
        pub async fn retain_shards(
            &mut self,
            request: impl tonic::IntoRequest<super::RetainShardsRequest>,
        ) -> std::result::Result<
            tonic::Response<super::RetainShardsResponse>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/quickwit.ingest.ingester.IngesterService/RetainShards",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new(
                        "quickwit.ingest.ingester.IngesterService",
                        "RetainShards",
                    ),
                );
            self.inner.unary(req, path, codec).await
        }
        /// Truncates a set of shards at the given positions. This RPC is called by indexers on leaders AND followers.
        pub async fn truncate_shards(
            &mut self,
            request: impl tonic::IntoRequest<super::TruncateShardsRequest>,
        ) -> std::result::Result<
            tonic::Response<super::TruncateShardsResponse>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/quickwit.ingest.ingester.IngesterService/TruncateShards",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new(
                        "quickwit.ingest.ingester.IngesterService",
                        "TruncateShards",
                    ),
                );
            self.inner.unary(req, path, codec).await
        }
        /// Closes a set of shards. This RPC is called by the control plane.
        pub async fn close_shards(
            &mut self,
            request: impl tonic::IntoRequest<super::CloseShardsRequest>,
        ) -> std::result::Result<
            tonic::Response<super::CloseShardsResponse>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/quickwit.ingest.ingester.IngesterService/CloseShards",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new(
                        "quickwit.ingest.ingester.IngesterService",
                        "CloseShards",
                    ),
                );
            self.inner.unary(req, path, codec).await
        }
        /// Decommissions the ingester.
        pub async fn decommission(
            &mut self,
            request: impl tonic::IntoRequest<super::DecommissionRequest>,
        ) -> std::result::Result<
            tonic::Response<super::DecommissionResponse>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/quickwit.ingest.ingester.IngesterService/Decommission",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new(
                        "quickwit.ingest.ingester.IngesterService",
                        "Decommission",
                    ),
                );
            self.inner.unary(req, path, codec).await
        }
    }
}
/// Generated server implementations.
pub mod ingester_service_grpc_server {
    #![allow(
        unused_variables,
        dead_code,
        missing_docs,
        clippy::wildcard_imports,
        clippy::let_unit_value,
    )]
    use tonic::codegen::*;
    /// Generated trait containing gRPC methods that should be implemented for use with IngesterServiceGrpcServer.
    #[async_trait]
    pub trait IngesterServiceGrpc: std::marker::Send + std::marker::Sync + 'static {
        /// Persists batches of documents to primary shards hosted on a leader.
        async fn persist(
            &self,
            request: tonic::Request<super::PersistRequest>,
        ) -> std::result::Result<tonic::Response<super::PersistResponse>, tonic::Status>;
        /// Server streaming response type for the OpenReplicationStream method.
        type OpenReplicationStreamStream: tonic::codegen::tokio_stream::Stream<
                Item = std::result::Result<super::AckReplicationMessage, tonic::Status>,
            >
            + std::marker::Send
            + 'static;
        /// Opens a replication stream from a leader to a follower.
        async fn open_replication_stream(
            &self,
            request: tonic::Request<tonic::Streaming<super::SynReplicationMessage>>,
        ) -> std::result::Result<
            tonic::Response<Self::OpenReplicationStreamStream>,
            tonic::Status,
        >;
        /// Server streaming response type for the OpenFetchStream method.
        type OpenFetchStreamStream: tonic::codegen::tokio_stream::Stream<
                Item = std::result::Result<super::FetchMessage, tonic::Status>,
            >
            + std::marker::Send
            + 'static;
        /// Streams records from a leader or a follower. The client can optionally specify a range of positions to fetch,
        /// otherwise the stream will go indefinitely or until the shard is closed.
        async fn open_fetch_stream(
            &self,
            request: tonic::Request<super::OpenFetchStreamRequest>,
        ) -> std::result::Result<
            tonic::Response<Self::OpenFetchStreamStream>,
            tonic::Status,
        >;
        /// Server streaming response type for the OpenObservationStream method.
        type OpenObservationStreamStream: tonic::codegen::tokio_stream::Stream<
                Item = std::result::Result<super::ObservationMessage, tonic::Status>,
            >
            + std::marker::Send
            + 'static;
        /// Streams status updates, called "observations", from an ingester.
        async fn open_observation_stream(
            &self,
            request: tonic::Request<super::OpenObservationStreamRequest>,
        ) -> std::result::Result<
            tonic::Response<Self::OpenObservationStreamStream>,
            tonic::Status,
        >;
        /// Creates and initializes a set of newly opened shards. This RPC is called by the control plane on leaders.
        async fn init_shards(
            &self,
            request: tonic::Request<super::InitShardsRequest>,
        ) -> std::result::Result<
            tonic::Response<super::InitShardsResponse>,
            tonic::Status,
        >;
        /// Only retain the shards that are listed in the request.
        /// Other shards are deleted.
        async fn retain_shards(
            &self,
            request: tonic::Request<super::RetainShardsRequest>,
        ) -> std::result::Result<
            tonic::Response<super::RetainShardsResponse>,
            tonic::Status,
        >;
        /// Truncates a set of shards at the given positions. This RPC is called by indexers on leaders AND followers.
        async fn truncate_shards(
            &self,
            request: tonic::Request<super::TruncateShardsRequest>,
        ) -> std::result::Result<
            tonic::Response<super::TruncateShardsResponse>,
            tonic::Status,
        >;
        /// Closes a set of shards. This RPC is called by the control plane.
        async fn close_shards(
            &self,
            request: tonic::Request<super::CloseShardsRequest>,
        ) -> std::result::Result<
            tonic::Response<super::CloseShardsResponse>,
            tonic::Status,
        >;
        /// Decommissions the ingester.
        async fn decommission(
            &self,
            request: tonic::Request<super::DecommissionRequest>,
        ) -> std::result::Result<
            tonic::Response<super::DecommissionResponse>,
            tonic::Status,
        >;
    }
    #[derive(Debug)]
    pub struct IngesterServiceGrpcServer<T> {
        inner: Arc<T>,
        accept_compression_encodings: EnabledCompressionEncodings,
        send_compression_encodings: EnabledCompressionEncodings,
        max_decoding_message_size: Option<usize>,
        max_encoding_message_size: Option<usize>,
    }
    impl<T> IngesterServiceGrpcServer<T> {
        pub fn new(inner: T) -> Self {
            Self::from_arc(Arc::new(inner))
        }
        pub fn from_arc(inner: Arc<T>) -> Self {
            Self {
                inner,
                accept_compression_encodings: Default::default(),
                send_compression_encodings: Default::default(),
                max_decoding_message_size: None,
                max_encoding_message_size: None,
            }
        }
        pub fn with_interceptor<F>(
            inner: T,
            interceptor: F,
        ) -> InterceptedService<Self, F>
        where
            F: tonic::service::Interceptor,
        {
            InterceptedService::new(Self::new(inner), interceptor)
        }
        /// Enable decompressing requests with the given encoding.
        #[must_use]
        pub fn accept_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.accept_compression_encodings.enable(encoding);
            self
        }
        /// Compress responses with the given encoding, if the client supports it.
        #[must_use]
        pub fn send_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.send_compression_encodings.enable(encoding);
            self
        }
        /// Limits the maximum size of a decoded message.
        ///
        /// Default: `4MB`
        #[must_use]
        pub fn max_decoding_message_size(mut self, limit: usize) -> Self {
            self.max_decoding_message_size = Some(limit);
            self
        }
        /// Limits the maximum size of an encoded message.
        ///
        /// Default: `usize::MAX`
        #[must_use]
        pub fn max_encoding_message_size(mut self, limit: usize) -> Self {
            self.max_encoding_message_size = Some(limit);
            self
        }
    }
    impl<T, B> tonic::codegen::Service<http::Request<B>> for IngesterServiceGrpcServer<T>
    where
        T: IngesterServiceGrpc,
        B: Body + std::marker::Send + 'static,
        B::Error: Into<StdError> + std::marker::Send + 'static,
    {
        type Response = http::Response<tonic::body::Body>;
        type Error = std::convert::Infallible;
        type Future = BoxFuture<Self::Response, Self::Error>;
        fn poll_ready(
            &mut self,
            _cx: &mut Context<'_>,
        ) -> Poll<std::result::Result<(), Self::Error>> {
            Poll::Ready(Ok(()))
        }
        fn call(&mut self, req: http::Request<B>) -> Self::Future {
            match req.uri().path() {
                "/quickwit.ingest.ingester.IngesterService/Persist" => {
                    #[allow(non_camel_case_types)]
                    struct PersistSvc<T: IngesterServiceGrpc>(pub Arc<T>);
                    impl<
                        T: IngesterServiceGrpc,
                    > tonic::server::UnaryService<super::PersistRequest>
                    for PersistSvc<T> {
                        type Response = super::PersistResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::PersistRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as IngesterServiceGrpc>::persist(&inner, request).await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = PersistSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/quickwit.ingest.ingester.IngesterService/OpenReplicationStream" => {
                    #[allow(non_camel_case_types)]
                    struct OpenReplicationStreamSvc<T: IngesterServiceGrpc>(pub Arc<T>);
                    impl<
                        T: IngesterServiceGrpc,
                    > tonic::server::StreamingService<super::SynReplicationMessage>
                    for OpenReplicationStreamSvc<T> {
                        type Response = super::AckReplicationMessage;
                        type ResponseStream = T::OpenReplicationStreamStream;
                        type Future = BoxFuture<
                            tonic::Response<Self::ResponseStream>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<
                                tonic::Streaming<super::SynReplicationMessage>,
                            >,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as IngesterServiceGrpc>::open_replication_stream(
                                        &inner,
                                        request,
                                    )
                                    .await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = OpenReplicationStreamSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.streaming(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/quickwit.ingest.ingester.IngesterService/OpenFetchStream" => {
                    #[allow(non_camel_case_types)]
                    struct OpenFetchStreamSvc<T: IngesterServiceGrpc>(pub Arc<T>);
                    impl<
                        T: IngesterServiceGrpc,
                    > tonic::server::ServerStreamingService<
                        super::OpenFetchStreamRequest,
                    > for OpenFetchStreamSvc<T> {
                        type Response = super::FetchMessage;
                        type ResponseStream = T::OpenFetchStreamStream;
                        type Future = BoxFuture<
                            tonic::Response<Self::ResponseStream>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::OpenFetchStreamRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as IngesterServiceGrpc>::open_fetch_stream(
                                        &inner,
                                        request,
                                    )
                                    .await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = OpenFetchStreamSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.server_streaming(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/quickwit.ingest.ingester.IngesterService/OpenObservationStream" => {
                    #[allow(non_camel_case_types)]
                    struct OpenObservationStreamSvc<T: IngesterServiceGrpc>(pub Arc<T>);
                    impl<
                        T: IngesterServiceGrpc,
                    > tonic::server::ServerStreamingService<
                        super::OpenObservationStreamRequest,
                    > for OpenObservationStreamSvc<T> {
                        type Response = super::ObservationMessage;
                        type ResponseStream = T::OpenObservationStreamStream;
                        type Future = BoxFuture<
                            tonic::Response<Self::ResponseStream>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::OpenObservationStreamRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as IngesterServiceGrpc>::open_observation_stream(
                                        &inner,
                                        request,
                                    )
                                    .await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = OpenObservationStreamSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.server_streaming(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/quickwit.ingest.ingester.IngesterService/InitShards" => {
                    #[allow(non_camel_case_types)]
                    struct InitShardsSvc<T: IngesterServiceGrpc>(pub Arc<T>);
                    impl<
                        T: IngesterServiceGrpc,
                    > tonic::server::UnaryService<super::InitShardsRequest>
                    for InitShardsSvc<T> {
                        type Response = super::InitShardsResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::InitShardsRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as IngesterServiceGrpc>::init_shards(&inner, request)
                                    .await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = InitShardsSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/quickwit.ingest.ingester.IngesterService/RetainShards" => {
                    #[allow(non_camel_case_types)]
                    struct RetainShardsSvc<T: IngesterServiceGrpc>(pub Arc<T>);
                    impl<
                        T: IngesterServiceGrpc,
                    > tonic::server::UnaryService<super::RetainShardsRequest>
                    for RetainShardsSvc<T> {
                        type Response = super::RetainShardsResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::RetainShardsRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as IngesterServiceGrpc>::retain_shards(&inner, request)
                                    .await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = RetainShardsSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/quickwit.ingest.ingester.IngesterService/TruncateShards" => {
                    #[allow(non_camel_case_types)]
                    struct TruncateShardsSvc<T: IngesterServiceGrpc>(pub Arc<T>);
                    impl<
                        T: IngesterServiceGrpc,
                    > tonic::server::UnaryService<super::TruncateShardsRequest>
                    for TruncateShardsSvc<T> {
                        type Response = super::TruncateShardsResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::TruncateShardsRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as IngesterServiceGrpc>::truncate_shards(&inner, request)
                                    .await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = TruncateShardsSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/quickwit.ingest.ingester.IngesterService/CloseShards" => {
                    #[allow(non_camel_case_types)]
                    struct CloseShardsSvc<T: IngesterServiceGrpc>(pub Arc<T>);
                    impl<
                        T: IngesterServiceGrpc,
                    > tonic::server::UnaryService<super::CloseShardsRequest>
                    for CloseShardsSvc<T> {
                        type Response = super::CloseShardsResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::CloseShardsRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as IngesterServiceGrpc>::close_shards(&inner, request)
                                    .await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = CloseShardsSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/quickwit.ingest.ingester.IngesterService/Decommission" => {
                    #[allow(non_camel_case_types)]
                    struct DecommissionSvc<T: IngesterServiceGrpc>(pub Arc<T>);
                    impl<
                        T: IngesterServiceGrpc,
                    > tonic::server::UnaryService<super::DecommissionRequest>
                    for DecommissionSvc<T> {
                        type Response = super::DecommissionResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::DecommissionRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as IngesterServiceGrpc>::decommission(&inner, request)
                                    .await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = DecommissionSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                _ => {
                    Box::pin(async move {
                        let mut response = http::Response::new(
                            tonic::body::Body::default(),
                        );
                        let headers = response.headers_mut();
                        headers
                            .insert(
                                tonic::Status::GRPC_STATUS,
                                (tonic::Code::Unimplemented as i32).into(),
                            );
                        headers
                            .insert(
                                http::header::CONTENT_TYPE,
                                tonic::metadata::GRPC_CONTENT_TYPE,
                            );
                        Ok(response)
                    })
                }
            }
        }
    }
    impl<T> Clone for IngesterServiceGrpcServer<T> {
        fn clone(&self) -> Self {
            let inner = self.inner.clone();
            Self {
                inner,
                accept_compression_encodings: self.accept_compression_encodings,
                send_compression_encodings: self.send_compression_encodings,
                max_decoding_message_size: self.max_decoding_message_size,
                max_encoding_message_size: self.max_encoding_message_size,
            }
        }
    }
    /// Generated gRPC service name
    pub const SERVICE_NAME: &str = "quickwit.ingest.ingester.IngesterService";
    impl<T> tonic::server::NamedService for IngesterServiceGrpcServer<T> {
        const NAME: &'static str = SERVICE_NAME;
    }
}


================================================
FILE: quickwit/quickwit-proto/src/codegen/quickwit/quickwit.ingest.router.rs
================================================
// This file is @generated by prost-build.
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct IngestRequestV2 {
    /// There should be at most one subrequest per index per request.
    #[prost(message, repeated, tag = "1")]
    pub subrequests: ::prost::alloc::vec::Vec<IngestSubrequest>,
    #[prost(enumeration = "super::CommitTypeV2", tag = "2")]
    pub commit_type: i32,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct IngestSubrequest {
    /// The subrequest ID is used to identify the various subrequests and responses
    /// (ingest, persist, replicate) at play during the ingest and replication
    /// process.
    #[prost(uint32, tag = "1")]
    pub subrequest_id: u32,
    #[prost(string, tag = "2")]
    pub index_id: ::prost::alloc::string::String,
    #[prost(string, tag = "3")]
    pub source_id: ::prost::alloc::string::String,
    #[prost(message, optional, tag = "4")]
    pub doc_batch: ::core::option::Option<super::DocBatchV2>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct IngestResponseV2 {
    #[prost(message, repeated, tag = "1")]
    pub successes: ::prost::alloc::vec::Vec<IngestSuccess>,
    #[prost(message, repeated, tag = "2")]
    pub failures: ::prost::alloc::vec::Vec<IngestFailure>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct IngestSuccess {
    #[prost(uint32, tag = "1")]
    pub subrequest_id: u32,
    #[prost(message, optional, tag = "2")]
    pub index_uid: ::core::option::Option<crate::types::IndexUid>,
    #[prost(string, tag = "3")]
    pub source_id: ::prost::alloc::string::String,
    #[prost(message, optional, tag = "4")]
    pub shard_id: ::core::option::Option<crate::types::ShardId>,
    /// Replication position inclusive.
    #[prost(message, optional, tag = "5")]
    pub replication_position_inclusive: ::core::option::Option<crate::types::Position>,
    #[prost(uint32, tag = "6")]
    pub num_ingested_docs: u32,
    #[prost(message, repeated, tag = "7")]
    pub parse_failures: ::prost::alloc::vec::Vec<super::ParseFailure>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct IngestFailure {
    #[prost(uint32, tag = "1")]
    pub subrequest_id: u32,
    #[prost(string, tag = "2")]
    pub index_id: ::prost::alloc::string::String,
    #[prost(string, tag = "3")]
    pub source_id: ::prost::alloc::string::String,
    #[prost(enumeration = "IngestFailureReason", tag = "5")]
    pub reason: i32,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[serde(rename_all = "snake_case")]
#[derive(Clone, Copy, Debug, PartialEq, Eq, Hash, PartialOrd, Ord, ::prost::Enumeration)]
#[repr(i32)]
pub enum IngestFailureReason {
    Unspecified = 0,
    IndexNotFound = 1,
    SourceNotFound = 2,
    Internal = 3,
    NoShardsAvailable = 4,
    ShardRateLimited = 5,
    WalFull = 6,
    Timeout = 7,
    RouterLoadShedding = 8,
    LoadShedding = 9,
    CircuitBreaker = 10,
}
impl IngestFailureReason {
    /// String value of the enum field names used in the ProtoBuf definition.
    ///
    /// The values are not transformed in any way and thus are considered stable
    /// (if the ProtoBuf definition does not change) and safe for programmatic use.
    pub fn as_str_name(&self) -> &'static str {
        match self {
            Self::Unspecified => "INGEST_FAILURE_REASON_UNSPECIFIED",
            Self::IndexNotFound => "INGEST_FAILURE_REASON_INDEX_NOT_FOUND",
            Self::SourceNotFound => "INGEST_FAILURE_REASON_SOURCE_NOT_FOUND",
            Self::Internal => "INGEST_FAILURE_REASON_INTERNAL",
            Self::NoShardsAvailable => "INGEST_FAILURE_REASON_NO_SHARDS_AVAILABLE",
            Self::ShardRateLimited => "INGEST_FAILURE_REASON_SHARD_RATE_LIMITED",
            Self::WalFull => "INGEST_FAILURE_REASON_WAL_FULL",
            Self::Timeout => "INGEST_FAILURE_REASON_TIMEOUT",
            Self::RouterLoadShedding => "INGEST_FAILURE_REASON_ROUTER_LOAD_SHEDDING",
            Self::LoadShedding => "INGEST_FAILURE_REASON_LOAD_SHEDDING",
            Self::CircuitBreaker => "INGEST_FAILURE_REASON_CIRCUIT_BREAKER",
        }
    }
    /// Creates an enum from field names used in the ProtoBuf definition.
    pub fn from_str_name(value: &str) -> ::core::option::Option<Self> {
        match value {
            "INGEST_FAILURE_REASON_UNSPECIFIED" => Some(Self::Unspecified),
            "INGEST_FAILURE_REASON_INDEX_NOT_FOUND" => Some(Self::IndexNotFound),
            "INGEST_FAILURE_REASON_SOURCE_NOT_FOUND" => Some(Self::SourceNotFound),
            "INGEST_FAILURE_REASON_INTERNAL" => Some(Self::Internal),
            "INGEST_FAILURE_REASON_NO_SHARDS_AVAILABLE" => Some(Self::NoShardsAvailable),
            "INGEST_FAILURE_REASON_SHARD_RATE_LIMITED" => Some(Self::ShardRateLimited),
            "INGEST_FAILURE_REASON_WAL_FULL" => Some(Self::WalFull),
            "INGEST_FAILURE_REASON_TIMEOUT" => Some(Self::Timeout),
            "INGEST_FAILURE_REASON_ROUTER_LOAD_SHEDDING" => {
                Some(Self::RouterLoadShedding)
            }
            "INGEST_FAILURE_REASON_LOAD_SHEDDING" => Some(Self::LoadShedding),
            "INGEST_FAILURE_REASON_CIRCUIT_BREAKER" => Some(Self::CircuitBreaker),
            _ => None,
        }
    }
}
/// BEGIN quickwit-codegen
#[allow(unused_imports)]
use std::str::FromStr;
use tower::{Layer, Service, ServiceExt};
use quickwit_common::tower::RpcName;
impl RpcName for IngestRequestV2 {
    fn rpc_name() -> &'static str {
        "ingest"
    }
}
#[cfg_attr(any(test, feature = "testsuite"), mockall::automock)]
#[async_trait::async_trait]
pub trait IngestRouterService: std::fmt::Debug + Send + Sync + 'static {
    ///Ingests batches of documents for one or multiple indexes.
    ///TODO: Describe error cases and how to handle them.
    async fn ingest(
        &self,
        request: IngestRequestV2,
    ) -> crate::ingest::IngestV2Result<IngestResponseV2>;
}
#[derive(Debug, Clone)]
pub struct IngestRouterServiceClient {
    inner: InnerIngestRouterServiceClient,
}
#[derive(Debug, Clone)]
struct InnerIngestRouterServiceClient(std::sync::Arc<dyn IngestRouterService>);
impl IngestRouterServiceClient {
    pub fn new<T>(instance: T) -> Self
    where
        T: IngestRouterService,
    {
        #[cfg(any(test, feature = "testsuite"))]
        assert!(
            std::any::TypeId::of:: < T > () != std::any::TypeId::of:: <
            MockIngestRouterService > (),
            "`MockIngestRouterService` must be wrapped in a `MockIngestRouterServiceWrapper`: use `IngestRouterServiceClient::from_mock(mock)` to instantiate the client"
        );
        Self {
            inner: InnerIngestRouterServiceClient(std::sync::Arc::new(instance)),
        }
    }
    pub fn as_grpc_service(
        &self,
        max_message_size: bytesize::ByteSize,
    ) -> ingest_router_service_grpc_server::IngestRouterServiceGrpcServer<
        IngestRouterServiceGrpcServerAdapter,
    > {
        let adapter = IngestRouterServiceGrpcServerAdapter::new(self.clone());
        ingest_router_service_grpc_server::IngestRouterServiceGrpcServer::new(adapter)
            .accept_compressed(tonic::codec::CompressionEncoding::Gzip)
            .accept_compressed(tonic::codec::CompressionEncoding::Zstd)
            .send_compressed(tonic::codec::CompressionEncoding::Gzip)
            .send_compressed(tonic::codec::CompressionEncoding::Zstd)
            .max_decoding_message_size(max_message_size.0 as usize)
            .max_encoding_message_size(max_message_size.0 as usize)
    }
    pub fn from_channel(
        addr: std::net::SocketAddr,
        channel: tonic::transport::Channel,
        max_message_size: bytesize::ByteSize,
        compression_encoding_opt: Option<tonic::codec::CompressionEncoding>,
    ) -> Self {
        let (_, connection_keys_watcher) = tokio::sync::watch::channel(
            std::collections::HashSet::from_iter([addr]),
        );
        let mut client = ingest_router_service_grpc_client::IngestRouterServiceGrpcClient::new(
                channel,
            )
            .max_decoding_message_size(max_message_size.0 as usize)
            .max_encoding_message_size(max_message_size.0 as usize);
        if let Some(compression_encoding) = compression_encoding_opt {
            client = client
                .accept_compressed(compression_encoding)
                .send_compressed(compression_encoding);
        }
        let adapter = IngestRouterServiceGrpcClientAdapter::new(
            client,
            connection_keys_watcher,
        );
        Self::new(adapter)
    }
    pub fn from_balance_channel(
        balance_channel: quickwit_common::tower::BalanceChannel<std::net::SocketAddr>,
        max_message_size: bytesize::ByteSize,
        compression_encoding_opt: Option<tonic::codec::CompressionEncoding>,
    ) -> IngestRouterServiceClient {
        let connection_keys_watcher = balance_channel.connection_keys_watcher();
        let mut client = ingest_router_service_grpc_client::IngestRouterServiceGrpcClient::new(
                balance_channel,
            )
            .max_decoding_message_size(max_message_size.0 as usize)
            .max_encoding_message_size(max_message_size.0 as usize);
        if let Some(compression_encoding) = compression_encoding_opt {
            client = client
                .accept_compressed(compression_encoding)
                .send_compressed(compression_encoding);
        }
        let adapter = IngestRouterServiceGrpcClientAdapter::new(
            client,
            connection_keys_watcher,
        );
        Self::new(adapter)
    }
    pub fn from_mailbox<A>(mailbox: quickwit_actors::Mailbox<A>) -> Self
    where
        A: quickwit_actors::Actor + std::fmt::Debug + Send + 'static,
        IngestRouterServiceMailbox<A>: IngestRouterService,
    {
        IngestRouterServiceClient::new(IngestRouterServiceMailbox::new(mailbox))
    }
    pub fn tower() -> IngestRouterServiceTowerLayerStack {
        IngestRouterServiceTowerLayerStack::default()
    }
    #[cfg(any(test, feature = "testsuite"))]
    pub fn from_mock(mock: MockIngestRouterService) -> Self {
        let mock_wrapper = mock_ingest_router_service::MockIngestRouterServiceWrapper {
            inner: tokio::sync::Mutex::new(mock),
        };
        Self::new(mock_wrapper)
    }
    #[cfg(any(test, feature = "testsuite"))]
    pub fn mocked() -> Self {
        Self::from_mock(MockIngestRouterService::new())
    }
}
#[async_trait::async_trait]
impl IngestRouterService for IngestRouterServiceClient {
    async fn ingest(
        &self,
        request: IngestRequestV2,
    ) -> crate::ingest::IngestV2Result<IngestResponseV2> {
        self.inner.0.ingest(request).await
    }
}
#[cfg(any(test, feature = "testsuite"))]
pub mod mock_ingest_router_service {
    use super::*;
    #[derive(Debug)]
    pub struct MockIngestRouterServiceWrapper {
        pub(super) inner: tokio::sync::Mutex<MockIngestRouterService>,
    }
    #[async_trait::async_trait]
    impl IngestRouterService for MockIngestRouterServiceWrapper {
        async fn ingest(
            &self,
            request: super::IngestRequestV2,
        ) -> crate::ingest::IngestV2Result<super::IngestResponseV2> {
            self.inner.lock().await.ingest(request).await
        }
    }
}
pub type BoxFuture<T, E> = std::pin::Pin<
    Box<dyn std::future::Future<Output = Result<T, E>> + Send + 'static>,
>;
impl tower::Service<IngestRequestV2> for InnerIngestRouterServiceClient {
    type Response = IngestResponseV2;
    type Error = crate::ingest::IngestV2Error;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, request: IngestRequestV2) -> Self::Future {
        let svc = self.clone();
        let fut = async move { svc.0.ingest(request).await };
        Box::pin(fut)
    }
}
/// A tower service stack is a set of tower services.
#[derive(Debug)]
struct IngestRouterServiceTowerServiceStack {
    #[allow(dead_code)]
    inner: InnerIngestRouterServiceClient,
    ingest_svc: quickwit_common::tower::BoxService<
        IngestRequestV2,
        IngestResponseV2,
        crate::ingest::IngestV2Error,
    >,
}
#[async_trait::async_trait]
impl IngestRouterService for IngestRouterServiceTowerServiceStack {
    async fn ingest(
        &self,
        request: IngestRequestV2,
    ) -> crate::ingest::IngestV2Result<IngestResponseV2> {
        self.ingest_svc.clone().ready().await?.call(request).await
    }
}
type IngestLayer = quickwit_common::tower::BoxLayer<
    quickwit_common::tower::BoxService<
        IngestRequestV2,
        IngestResponseV2,
        crate::ingest::IngestV2Error,
    >,
    IngestRequestV2,
    IngestResponseV2,
    crate::ingest::IngestV2Error,
>;
#[derive(Debug, Default)]
pub struct IngestRouterServiceTowerLayerStack {
    ingest_layers: Vec<IngestLayer>,
}
impl IngestRouterServiceTowerLayerStack {
    pub fn stack_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    IngestRequestV2,
                    IngestResponseV2,
                    crate::ingest::IngestV2Error,
                >,
            > + Clone + Send + Sync + 'static,
        <L as tower::Layer<
            quickwit_common::tower::BoxService<
                IngestRequestV2,
                IngestResponseV2,
                crate::ingest::IngestV2Error,
            >,
        >>::Service: tower::Service<
                IngestRequestV2,
                Response = IngestResponseV2,
                Error = crate::ingest::IngestV2Error,
            > + Clone + Send + Sync + 'static,
        <<L as tower::Layer<
            quickwit_common::tower::BoxService<
                IngestRequestV2,
                IngestResponseV2,
                crate::ingest::IngestV2Error,
            >,
        >>::Service as tower::Service<IngestRequestV2>>::Future: Send + 'static,
    {
        self.ingest_layers.push(quickwit_common::tower::BoxLayer::new(layer.clone()));
        self
    }
    pub fn stack_ingest_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    IngestRequestV2,
                    IngestResponseV2,
                    crate::ingest::IngestV2Error,
                >,
            > + Send + Sync + 'static,
        L::Service: tower::Service<
                IngestRequestV2,
                Response = IngestResponseV2,
                Error = crate::ingest::IngestV2Error,
            > + Clone + Send + Sync + 'static,
        <L::Service as tower::Service<IngestRequestV2>>::Future: Send + 'static,
    {
        self.ingest_layers.push(quickwit_common::tower::BoxLayer::new(layer));
        self
    }
    pub fn build<T>(self, instance: T) -> IngestRouterServiceClient
    where
        T: IngestRouterService,
    {
        let inner_client = InnerIngestRouterServiceClient(std::sync::Arc::new(instance));
        self.build_from_inner_client(inner_client)
    }
    pub fn build_from_channel(
        self,
        addr: std::net::SocketAddr,
        channel: tonic::transport::Channel,
        max_message_size: bytesize::ByteSize,
        compression_encoding_opt: Option<tonic::codec::CompressionEncoding>,
    ) -> IngestRouterServiceClient {
        let client = IngestRouterServiceClient::from_channel(
            addr,
            channel,
            max_message_size,
            compression_encoding_opt,
        );
        let inner_client = client.inner;
        self.build_from_inner_client(inner_client)
    }
    pub fn build_from_balance_channel(
        self,
        balance_channel: quickwit_common::tower::BalanceChannel<std::net::SocketAddr>,
        max_message_size: bytesize::ByteSize,
        compression_encoding_opt: Option<tonic::codec::CompressionEncoding>,
    ) -> IngestRouterServiceClient {
        let client = IngestRouterServiceClient::from_balance_channel(
            balance_channel,
            max_message_size,
            compression_encoding_opt,
        );
        let inner_client = client.inner;
        self.build_from_inner_client(inner_client)
    }
    pub fn build_from_mailbox<A>(
        self,
        mailbox: quickwit_actors::Mailbox<A>,
    ) -> IngestRouterServiceClient
    where
        A: quickwit_actors::Actor + std::fmt::Debug + Send + 'static,
        IngestRouterServiceMailbox<A>: IngestRouterService,
    {
        let inner_client = InnerIngestRouterServiceClient(
            std::sync::Arc::new(IngestRouterServiceMailbox::new(mailbox)),
        );
        self.build_from_inner_client(inner_client)
    }
    #[cfg(any(test, feature = "testsuite"))]
    pub fn build_from_mock(
        self,
        mock: MockIngestRouterService,
    ) -> IngestRouterServiceClient {
        let client = IngestRouterServiceClient::from_mock(mock);
        let inner_client = client.inner;
        self.build_from_inner_client(inner_client)
    }
    fn build_from_inner_client(
        self,
        inner_client: InnerIngestRouterServiceClient,
    ) -> IngestRouterServiceClient {
        let ingest_svc = self
            .ingest_layers
            .into_iter()
            .rev()
            .fold(
                quickwit_common::tower::BoxService::new(inner_client.clone()),
                |svc, layer| layer.layer(svc),
            );
        let tower_svc_stack = IngestRouterServiceTowerServiceStack {
            inner: inner_client,
            ingest_svc,
        };
        IngestRouterServiceClient::new(tower_svc_stack)
    }
}
#[derive(Debug, Clone)]
struct MailboxAdapter<A: quickwit_actors::Actor, E> {
    inner: quickwit_actors::Mailbox<A>,
    phantom: std::marker::PhantomData<E>,
}
impl<A, E> std::ops::Deref for MailboxAdapter<A, E>
where
    A: quickwit_actors::Actor,
{
    type Target = quickwit_actors::Mailbox<A>;
    fn deref(&self) -> &Self::Target {
        &self.inner
    }
}
#[derive(Debug)]
pub struct IngestRouterServiceMailbox<A: quickwit_actors::Actor> {
    inner: MailboxAdapter<A, crate::ingest::IngestV2Error>,
}
impl<A: quickwit_actors::Actor> IngestRouterServiceMailbox<A> {
    pub fn new(instance: quickwit_actors::Mailbox<A>) -> Self {
        let inner = MailboxAdapter {
            inner: instance,
            phantom: std::marker::PhantomData,
        };
        Self { inner }
    }
}
impl<A: quickwit_actors::Actor> Clone for IngestRouterServiceMailbox<A> {
    fn clone(&self) -> Self {
        let inner = MailboxAdapter {
            inner: self.inner.clone(),
            phantom: std::marker::PhantomData,
        };
        Self { inner }
    }
}
impl<A, M, T, E> tower::Service<M> for IngestRouterServiceMailbox<A>
where
    A: quickwit_actors::Actor
        + quickwit_actors::DeferableReplyHandler<M, Reply = Result<T, E>> + Send
        + 'static,
    M: std::fmt::Debug + Send + 'static,
    T: Send + 'static,
    E: std::fmt::Debug + Send + 'static,
    crate::ingest::IngestV2Error: From<quickwit_actors::AskError<E>>,
{
    type Response = T;
    type Error = crate::ingest::IngestV2Error;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        //! This does not work with balance middlewares such as `tower::balance::pool::Pool` because
        //! this always returns `Poll::Ready`. The fix is to acquire a permit from the
        //! mailbox in `poll_ready` and consume it in `call`.
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, message: M) -> Self::Future {
        let mailbox = self.inner.clone();
        let fut = async move {
            mailbox.ask_for_res(message).await.map_err(|error| error.into())
        };
        Box::pin(fut)
    }
}
#[async_trait::async_trait]
impl<A> IngestRouterService for IngestRouterServiceMailbox<A>
where
    A: quickwit_actors::Actor + std::fmt::Debug,
    IngestRouterServiceMailbox<
        A,
    >: tower::Service<
        IngestRequestV2,
        Response = IngestResponseV2,
        Error = crate::ingest::IngestV2Error,
        Future = BoxFuture<IngestResponseV2, crate::ingest::IngestV2Error>,
    >,
{
    async fn ingest(
        &self,
        request: IngestRequestV2,
    ) -> crate::ingest::IngestV2Result<IngestResponseV2> {
        self.clone().call(request).await
    }
}
#[derive(Debug, Clone)]
pub struct IngestRouterServiceGrpcClientAdapter<T> {
    inner: T,
    #[allow(dead_code)]
    connection_addrs_rx: tokio::sync::watch::Receiver<
        std::collections::HashSet<std::net::SocketAddr>,
    >,
}
impl<T> IngestRouterServiceGrpcClientAdapter<T> {
    pub fn new(
        instance: T,
        connection_addrs_rx: tokio::sync::watch::Receiver<
            std::collections::HashSet<std::net::SocketAddr>,
        >,
    ) -> Self {
        Self {
            inner: instance,
            connection_addrs_rx,
        }
    }
}
#[async_trait::async_trait]
impl<T> IngestRouterService
for IngestRouterServiceGrpcClientAdapter<
    ingest_router_service_grpc_client::IngestRouterServiceGrpcClient<T>,
>
where
    T: tonic::client::GrpcService<tonic::body::Body> + std::fmt::Debug + Clone + Send
        + Sync + 'static,
    T::ResponseBody: tonic::codegen::Body<Data = tonic::codegen::Bytes> + Send + 'static,
    <T::ResponseBody as tonic::codegen::Body>::Error: Into<tonic::codegen::StdError>
        + Send,
    T::Future: Send,
{
    async fn ingest(
        &self,
        request: IngestRequestV2,
    ) -> crate::ingest::IngestV2Result<IngestResponseV2> {
        self.inner
            .clone()
            .ingest(request)
            .await
            .map(|response| response.into_inner())
            .map_err(|status| crate::error::grpc_status_to_service_error(
                status,
                IngestRequestV2::rpc_name(),
            ))
    }
}
#[derive(Debug)]
pub struct IngestRouterServiceGrpcServerAdapter {
    inner: InnerIngestRouterServiceClient,
}
impl IngestRouterServiceGrpcServerAdapter {
    pub fn new<T>(instance: T) -> Self
    where
        T: IngestRouterService,
    {
        Self {
            inner: InnerIngestRouterServiceClient(std::sync::Arc::new(instance)),
        }
    }
}
#[async_trait::async_trait]
impl ingest_router_service_grpc_server::IngestRouterServiceGrpc
for IngestRouterServiceGrpcServerAdapter {
    async fn ingest(
        &self,
        request: tonic::Request<IngestRequestV2>,
    ) -> Result<tonic::Response<IngestResponseV2>, tonic::Status> {
        self.inner
            .0
            .ingest(request.into_inner())
            .await
            .map(tonic::Response::new)
            .map_err(crate::error::grpc_error_to_grpc_status)
    }
}
/// Generated client implementations.
pub mod ingest_router_service_grpc_client {
    #![allow(
        unused_variables,
        dead_code,
        missing_docs,
        clippy::wildcard_imports,
        clippy::let_unit_value,
    )]
    use tonic::codegen::*;
    use tonic::codegen::http::Uri;
    #[derive(Debug, Clone)]
    pub struct IngestRouterServiceGrpcClient<T> {
        inner: tonic::client::Grpc<T>,
    }
    impl IngestRouterServiceGrpcClient<tonic::transport::Channel> {
        /// Attempt to create a new client by connecting to a given endpoint.
        pub async fn connect<D>(dst: D) -> Result<Self, tonic::transport::Error>
        where
            D: TryInto<tonic::transport::Endpoint>,
            D::Error: Into<StdError>,
        {
            let conn = tonic::transport::Endpoint::new(dst)?.connect().await?;
            Ok(Self::new(conn))
        }
    }
    impl<T> IngestRouterServiceGrpcClient<T>
    where
        T: tonic::client::GrpcService<tonic::body::Body>,
        T::Error: Into<StdError>,
        T::ResponseBody: Body<Data = Bytes> + std::marker::Send + 'static,
        <T::ResponseBody as Body>::Error: Into<StdError> + std::marker::Send,
    {
        pub fn new(inner: T) -> Self {
            let inner = tonic::client::Grpc::new(inner);
            Self { inner }
        }
        pub fn with_origin(inner: T, origin: Uri) -> Self {
            let inner = tonic::client::Grpc::with_origin(inner, origin);
            Self { inner }
        }
        pub fn with_interceptor<F>(
            inner: T,
            interceptor: F,
        ) -> IngestRouterServiceGrpcClient<InterceptedService<T, F>>
        where
            F: tonic::service::Interceptor,
            T::ResponseBody: Default,
            T: tonic::codegen::Service<
                http::Request<tonic::body::Body>,
                Response = http::Response<
                    <T as tonic::client::GrpcService<tonic::body::Body>>::ResponseBody,
                >,
            >,
            <T as tonic::codegen::Service<
                http::Request<tonic::body::Body>,
            >>::Error: Into<StdError> + std::marker::Send + std::marker::Sync,
        {
            IngestRouterServiceGrpcClient::new(
                InterceptedService::new(inner, interceptor),
            )
        }
        /// Compress requests with the given encoding.
        ///
        /// This requires the server to support it otherwise it might respond with an
        /// error.
        #[must_use]
        pub fn send_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.inner = self.inner.send_compressed(encoding);
            self
        }
        /// Enable decompressing responses.
        #[must_use]
        pub fn accept_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.inner = self.inner.accept_compressed(encoding);
            self
        }
        /// Limits the maximum size of a decoded message.
        ///
        /// Default: `4MB`
        #[must_use]
        pub fn max_decoding_message_size(mut self, limit: usize) -> Self {
            self.inner = self.inner.max_decoding_message_size(limit);
            self
        }
        /// Limits the maximum size of an encoded message.
        ///
        /// Default: `usize::MAX`
        #[must_use]
        pub fn max_encoding_message_size(mut self, limit: usize) -> Self {
            self.inner = self.inner.max_encoding_message_size(limit);
            self
        }
        /// Ingests batches of documents for one or multiple indexes.
        /// TODO: Describe error cases and how to handle them.
        pub async fn ingest(
            &mut self,
            request: impl tonic::IntoRequest<super::IngestRequestV2>,
        ) -> std::result::Result<
            tonic::Response<super::IngestResponseV2>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/quickwit.ingest.router.IngestRouterService/Ingest",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new(
                        "quickwit.ingest.router.IngestRouterService",
                        "Ingest",
                    ),
                );
            self.inner.unary(req, path, codec).await
        }
    }
}
/// Generated server implementations.
pub mod ingest_router_service_grpc_server {
    #![allow(
        unused_variables,
        dead_code,
        missing_docs,
        clippy::wildcard_imports,
        clippy::let_unit_value,
    )]
    use tonic::codegen::*;
    /// Generated trait containing gRPC methods that should be implemented for use with IngestRouterServiceGrpcServer.
    #[async_trait]
    pub trait IngestRouterServiceGrpc: std::marker::Send + std::marker::Sync + 'static {
        /// Ingests batches of documents for one or multiple indexes.
        /// TODO: Describe error cases and how to handle them.
        async fn ingest(
            &self,
            request: tonic::Request<super::IngestRequestV2>,
        ) -> std::result::Result<
            tonic::Response<super::IngestResponseV2>,
            tonic::Status,
        >;
    }
    #[derive(Debug)]
    pub struct IngestRouterServiceGrpcServer<T> {
        inner: Arc<T>,
        accept_compression_encodings: EnabledCompressionEncodings,
        send_compression_encodings: EnabledCompressionEncodings,
        max_decoding_message_size: Option<usize>,
        max_encoding_message_size: Option<usize>,
    }
    impl<T> IngestRouterServiceGrpcServer<T> {
        pub fn new(inner: T) -> Self {
            Self::from_arc(Arc::new(inner))
        }
        pub fn from_arc(inner: Arc<T>) -> Self {
            Self {
                inner,
                accept_compression_encodings: Default::default(),
                send_compression_encodings: Default::default(),
                max_decoding_message_size: None,
                max_encoding_message_size: None,
            }
        }
        pub fn with_interceptor<F>(
            inner: T,
            interceptor: F,
        ) -> InterceptedService<Self, F>
        where
            F: tonic::service::Interceptor,
        {
            InterceptedService::new(Self::new(inner), interceptor)
        }
        /// Enable decompressing requests with the given encoding.
        #[must_use]
        pub fn accept_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.accept_compression_encodings.enable(encoding);
            self
        }
        /// Compress responses with the given encoding, if the client supports it.
        #[must_use]
        pub fn send_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.send_compression_encodings.enable(encoding);
            self
        }
        /// Limits the maximum size of a decoded message.
        ///
        /// Default: `4MB`
        #[must_use]
        pub fn max_decoding_message_size(mut self, limit: usize) -> Self {
            self.max_decoding_message_size = Some(limit);
            self
        }
        /// Limits the maximum size of an encoded message.
        ///
        /// Default: `usize::MAX`
        #[must_use]
        pub fn max_encoding_message_size(mut self, limit: usize) -> Self {
            self.max_encoding_message_size = Some(limit);
            self
        }
    }
    impl<T, B> tonic::codegen::Service<http::Request<B>>
    for IngestRouterServiceGrpcServer<T>
    where
        T: IngestRouterServiceGrpc,
        B: Body + std::marker::Send + 'static,
        B::Error: Into<StdError> + std::marker::Send + 'static,
    {
        type Response = http::Response<tonic::body::Body>;
        type Error = std::convert::Infallible;
        type Future = BoxFuture<Self::Response, Self::Error>;
        fn poll_ready(
            &mut self,
            _cx: &mut Context<'_>,
        ) -> Poll<std::result::Result<(), Self::Error>> {
            Poll::Ready(Ok(()))
        }
        fn call(&mut self, req: http::Request<B>) -> Self::Future {
            match req.uri().path() {
                "/quickwit.ingest.router.IngestRouterService/Ingest" => {
                    #[allow(non_camel_case_types)]
                    struct IngestSvc<T: IngestRouterServiceGrpc>(pub Arc<T>);
                    impl<
                        T: IngestRouterServiceGrpc,
                    > tonic::server::UnaryService<super::IngestRequestV2>
                    for IngestSvc<T> {
                        type Response = super::IngestResponseV2;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::IngestRequestV2>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as IngestRouterServiceGrpc>::ingest(&inner, request)
                                    .await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = IngestSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                _ => {
                    Box::pin(async move {
                        let mut response = http::Response::new(
                            tonic::body::Body::default(),
                        );
                        let headers = response.headers_mut();
                        headers
                            .insert(
                                tonic::Status::GRPC_STATUS,
                                (tonic::Code::Unimplemented as i32).into(),
                            );
                        headers
                            .insert(
                                http::header::CONTENT_TYPE,
                                tonic::metadata::GRPC_CONTENT_TYPE,
                            );
                        Ok(response)
                    })
                }
            }
        }
    }
    impl<T> Clone for IngestRouterServiceGrpcServer<T> {
        fn clone(&self) -> Self {
            let inner = self.inner.clone();
            Self {
                inner,
                accept_compression_encodings: self.accept_compression_encodings,
                send_compression_encodings: self.send_compression_encodings,
                max_decoding_message_size: self.max_decoding_message_size,
                max_encoding_message_size: self.max_encoding_message_size,
            }
        }
    }
    /// Generated gRPC service name
    pub const SERVICE_NAME: &str = "quickwit.ingest.router.IngestRouterService";
    impl<T> tonic::server::NamedService for IngestRouterServiceGrpcServer<T> {
        const NAME: &'static str = SERVICE_NAME;
    }
}


================================================
FILE: quickwit/quickwit-proto/src/codegen/quickwit/quickwit.ingest.rs
================================================
// This file is @generated by prost-build.
/// Shard primary key.
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct ShardPKey {
    #[prost(message, optional, tag = "1")]
    pub index_uid: ::core::option::Option<crate::types::IndexUid>,
    #[prost(string, tag = "2")]
    pub source_id: ::prost::alloc::string::String,
    #[prost(message, optional, tag = "3")]
    pub shard_id: ::core::option::Option<crate::types::ShardId>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct DocBatchV2 {
    #[prost(bytes = "bytes", tag = "1")]
    pub doc_buffer: ::prost::bytes::Bytes,
    #[prost(uint32, repeated, tag = "2")]
    pub doc_lengths: ::prost::alloc::vec::Vec<u32>,
    #[prost(message, repeated, tag = "3")]
    pub doc_uids: ::prost::alloc::vec::Vec<crate::types::DocUid>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct MRecordBatch {
    /// Buffer of encoded and then concatenated mrecords.
    #[prost(bytes = "bytes", tag = "1")]
    pub mrecord_buffer: ::prost::bytes::Bytes,
    /// Lengths of the mrecords in the buffer.
    #[prost(uint32, repeated, tag = "2")]
    pub mrecord_lengths: ::prost::alloc::vec::Vec<u32>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct Shard {
    /// Immutable fields
    #[prost(message, optional, tag = "1")]
    pub index_uid: ::core::option::Option<crate::types::IndexUid>,
    #[prost(string, tag = "2")]
    pub source_id: ::prost::alloc::string::String,
    #[prost(message, optional, tag = "3")]
    pub shard_id: ::core::option::Option<crate::types::ShardId>,
    /// The node ID of the ingester to which all the write requests for this shard should be sent to.
    #[prost(string, tag = "4")]
    pub leader_id: ::prost::alloc::string::String,
    /// The node ID of the ingester holding a copy of the data.
    #[prost(string, optional, tag = "5")]
    #[serde(default, skip_serializing_if = "Option::is_none")]
    pub follower_id: ::core::option::Option<::prost::alloc::string::String>,
    /// Mutable fields
    #[prost(enumeration = "ShardState", tag = "8")]
    pub shard_state: i32,
    /// Position up to which indexers have indexed and published the records stored in the shard.
    /// It is updated asynchronously in a best effort manner by the indexers and indicates the position up to which the log can be safely truncated.
    #[prost(message, optional, tag = "9")]
    #[serde(default, skip_serializing_if = "Option::is_none")]
    pub publish_position_inclusive: ::core::option::Option<crate::types::Position>,
    /// A publish token that ensures only one indexer works on a given shard at a time.
    /// For instance, if an indexer goes rogue, eventually the control plane will detect it and assign the shard to another indexer, which will override the publish token.
    #[prost(string, optional, tag = "10")]
    #[serde(default, skip_serializing_if = "Option::is_none")]
    pub publish_token: ::core::option::Option<::prost::alloc::string::String>,
    /// The UID of the index doc mapping when the shard was created.
    #[prost(message, optional, tag = "11")]
    pub doc_mapping_uid: ::core::option::Option<crate::types::DocMappingUid>,
    /// Time when the shard was last updated
    #[prost(int64, tag = "12")]
    #[serde(default = "super::compatibility_shard_update_timestamp")]
    pub update_timestamp: i64,
}
/// A group of shards belonging to the same index and source.
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct ShardIds {
    #[prost(message, optional, tag = "1")]
    pub index_uid: ::core::option::Option<crate::types::IndexUid>,
    #[prost(string, tag = "2")]
    pub source_id: ::prost::alloc::string::String,
    #[prost(message, repeated, tag = "3")]
    pub shard_ids: ::prost::alloc::vec::Vec<crate::types::ShardId>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct ShardIdPositions {
    #[prost(message, optional, tag = "1")]
    pub index_uid: ::core::option::Option<crate::types::IndexUid>,
    #[prost(string, tag = "2")]
    pub source_id: ::prost::alloc::string::String,
    #[prost(message, repeated, tag = "3")]
    pub shard_positions: ::prost::alloc::vec::Vec<ShardIdPosition>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct ShardIdPosition {
    #[prost(message, optional, tag = "1")]
    pub shard_id: ::core::option::Option<crate::types::ShardId>,
    #[prost(message, optional, tag = "2")]
    pub publish_position_inclusive: ::core::option::Option<crate::types::Position>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct ParseFailure {
    #[prost(message, optional, tag = "1")]
    pub doc_uid: ::core::option::Option<crate::types::DocUid>,
    #[prost(enumeration = "ParseFailureReason", tag = "2")]
    pub reason: i32,
    #[prost(string, tag = "3")]
    pub message: ::prost::alloc::string::String,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[serde(rename_all = "snake_case")]
#[derive(Clone, Copy, Debug, PartialEq, Eq, Hash, PartialOrd, Ord, ::prost::Enumeration)]
#[repr(i32)]
pub enum CommitTypeV2 {
    Unspecified = 0,
    Auto = 1,
    WaitFor = 2,
    Force = 3,
}
impl CommitTypeV2 {
    /// String value of the enum field names used in the ProtoBuf definition.
    ///
    /// The values are not transformed in any way and thus are considered stable
    /// (if the ProtoBuf definition does not change) and safe for programmatic use.
    pub fn as_str_name(&self) -> &'static str {
        match self {
            Self::Unspecified => "COMMIT_TYPE_V2_UNSPECIFIED",
            Self::Auto => "COMMIT_TYPE_V2_AUTO",
            Self::WaitFor => "COMMIT_TYPE_V2_WAIT_FOR",
            Self::Force => "COMMIT_TYPE_V2_FORCE",
        }
    }
    /// Creates an enum from field names used in the ProtoBuf definition.
    pub fn from_str_name(value: &str) -> ::core::option::Option<Self> {
        match value {
            "COMMIT_TYPE_V2_UNSPECIFIED" => Some(Self::Unspecified),
            "COMMIT_TYPE_V2_AUTO" => Some(Self::Auto),
            "COMMIT_TYPE_V2_WAIT_FOR" => Some(Self::WaitFor),
            "COMMIT_TYPE_V2_FORCE" => Some(Self::Force),
            _ => None,
        }
    }
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[serde(rename_all = "snake_case")]
#[derive(Clone, Copy, Debug, PartialEq, Eq, Hash, PartialOrd, Ord, ::prost::Enumeration)]
#[repr(i32)]
pub enum ShardState {
    Unspecified = 0,
    /// The shard is open and accepts write requests.
    Open = 1,
    /// The ingester hosting the shard is unavailable.
    Unavailable = 2,
    /// The shard is closed and cannot be written to.
    /// It can be safely deleted if the publish position is superior or equal to `~eof`.
    Closed = 3,
}
impl ShardState {
    /// String value of the enum field names used in the ProtoBuf definition.
    ///
    /// The values are not transformed in any way and thus are considered stable
    /// (if the ProtoBuf definition does not change) and safe for programmatic use.
    pub fn as_str_name(&self) -> &'static str {
        match self {
            Self::Unspecified => "SHARD_STATE_UNSPECIFIED",
            Self::Open => "SHARD_STATE_OPEN",
            Self::Unavailable => "SHARD_STATE_UNAVAILABLE",
            Self::Closed => "SHARD_STATE_CLOSED",
        }
    }
    /// Creates an enum from field names used in the ProtoBuf definition.
    pub fn from_str_name(value: &str) -> ::core::option::Option<Self> {
        match value {
            "SHARD_STATE_UNSPECIFIED" => Some(Self::Unspecified),
            "SHARD_STATE_OPEN" => Some(Self::Open),
            "SHARD_STATE_UNAVAILABLE" => Some(Self::Unavailable),
            "SHARD_STATE_CLOSED" => Some(Self::Closed),
            _ => None,
        }
    }
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[serde(rename_all = "snake_case")]
#[derive(Clone, Copy, Debug, PartialEq, Eq, Hash, PartialOrd, Ord, ::prost::Enumeration)]
#[repr(i32)]
pub enum ParseFailureReason {
    Unspecified = 0,
    InvalidJson = 1,
    InvalidSchema = 2,
}
impl ParseFailureReason {
    /// String value of the enum field names used in the ProtoBuf definition.
    ///
    /// The values are not transformed in any way and thus are considered stable
    /// (if the ProtoBuf definition does not change) and safe for programmatic use.
    pub fn as_str_name(&self) -> &'static str {
        match self {
            Self::Unspecified => "PARSE_FAILURE_REASON_UNSPECIFIED",
            Self::InvalidJson => "PARSE_FAILURE_REASON_INVALID_JSON",
            Self::InvalidSchema => "PARSE_FAILURE_REASON_INVALID_SCHEMA",
        }
    }
    /// Creates an enum from field names used in the ProtoBuf definition.
    pub fn from_str_name(value: &str) -> ::core::option::Option<Self> {
        match value {
            "PARSE_FAILURE_REASON_UNSPECIFIED" => Some(Self::Unspecified),
            "PARSE_FAILURE_REASON_INVALID_JSON" => Some(Self::InvalidJson),
            "PARSE_FAILURE_REASON_INVALID_SCHEMA" => Some(Self::InvalidSchema),
            _ => None,
        }
    }
}


================================================
FILE: quickwit/quickwit-proto/src/codegen/quickwit/quickwit.metastore.rs
================================================
// This file is @generated by prost-build.
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, Copy, PartialEq, Eq, Hash, ::prost::Message)]
pub struct EmptyResponse {}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct CreateIndexRequest {
    #[prost(string, tag = "2")]
    pub index_config_json: ::prost::alloc::string::String,
    #[prost(string, repeated, tag = "3")]
    pub source_configs_json: ::prost::alloc::vec::Vec<::prost::alloc::string::String>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct CreateIndexResponse {
    #[prost(message, optional, tag = "1")]
    pub index_uid: ::core::option::Option<crate::types::IndexUid>,
    #[prost(string, tag = "2")]
    pub index_metadata_json: ::prost::alloc::string::String,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct UpdateIndexRequest {
    #[prost(message, optional, tag = "1")]
    pub index_uid: ::core::option::Option<crate::types::IndexUid>,
    #[prost(string, tag = "5")]
    pub doc_mapping_json: ::prost::alloc::string::String,
    #[prost(string, tag = "4")]
    pub indexing_settings_json: ::prost::alloc::string::String,
    #[prost(string, tag = "6")]
    pub ingest_settings_json: ::prost::alloc::string::String,
    #[prost(string, tag = "2")]
    pub search_settings_json: ::prost::alloc::string::String,
    #[prost(string, optional, tag = "3")]
    pub retention_policy_json_opt: ::core::option::Option<
        ::prost::alloc::string::String,
    >,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct ListIndexesMetadataRequest {
    /// List of patterns an index should match or not match to get considered
    /// An index must match at least one positive pattern (a pattern not starting
    /// with a '-'), and no negative pattern (a pattern starting with a '-').
    #[prost(string, repeated, tag = "2")]
    pub index_id_patterns: ::prost::alloc::vec::Vec<::prost::alloc::string::String>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct ListIndexesMetadataResponse {
    /// Deprecated (v0.9.0), use `indexes_metadata_json_zstd` instead.
    #[prost(string, optional, tag = "1")]
    pub indexes_metadata_json_opt: ::core::option::Option<
        ::prost::alloc::string::String,
    >,
    /// A JSON serialized then ZSTD compressed list of `IndexMetadata`: `Vec<IndexMetadata> | JSON | ZSTD`.
    /// We don't use `repeated` here to increase the compression rate and ratio.
    #[prost(bytes = "bytes", tag = "2")]
    pub indexes_metadata_json_zstd: ::prost::bytes::Bytes,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct DeleteIndexRequest {
    #[prost(message, optional, tag = "1")]
    pub index_uid: ::core::option::Option<crate::types::IndexUid>,
}
/// Request the metadata of an index.
/// Either `index_uid` or `index_id` must be specified.
///
/// If both are supplied, `index_uid` is used.
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct IndexMetadataRequest {
    #[prost(string, optional, tag = "1")]
    pub index_id: ::core::option::Option<::prost::alloc::string::String>,
    #[prost(message, optional, tag = "2")]
    pub index_uid: ::core::option::Option<crate::types::IndexUid>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct IndexMetadataResponse {
    #[prost(string, tag = "1")]
    pub index_metadata_serialized_json: ::prost::alloc::string::String,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct IndexesMetadataRequest {
    #[prost(message, repeated, tag = "1")]
    pub subrequests: ::prost::alloc::vec::Vec<IndexMetadataSubrequest>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct IndexMetadataSubrequest {
    #[prost(string, optional, tag = "1")]
    pub index_id: ::core::option::Option<::prost::alloc::string::String>,
    #[prost(message, optional, tag = "2")]
    pub index_uid: ::core::option::Option<crate::types::IndexUid>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct IndexesMetadataResponse {
    /// A JSON serialized then ZSTD compressed list of `IndexMetadata`: `Vec<IndexMetadata> | JSON | ZSTD`.
    /// We don't use `repeated` here to increase the compression rate and ratio.
    #[prost(bytes = "bytes", tag = "1")]
    pub indexes_metadata_json_zstd: ::prost::bytes::Bytes,
    #[prost(message, repeated, tag = "2")]
    pub failures: ::prost::alloc::vec::Vec<IndexMetadataFailure>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct IndexMetadataFailure {
    #[prost(string, optional, tag = "1")]
    pub index_id: ::core::option::Option<::prost::alloc::string::String>,
    #[prost(message, optional, tag = "2")]
    pub index_uid: ::core::option::Option<crate::types::IndexUid>,
    #[prost(enumeration = "IndexMetadataFailureReason", tag = "3")]
    pub reason: i32,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct ListIndexStatsRequest {
    /// List of patterns an index should match or not match to get considered
    /// An index must match at least one positive pattern (a pattern not starting
    /// with a '-'), and no negative pattern (a pattern starting with a '-').
    #[prost(string, repeated, tag = "1")]
    pub index_id_patterns: ::prost::alloc::vec::Vec<::prost::alloc::string::String>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct ListIndexStatsResponse {
    /// list of IndexStats. each one has the index id, the number of splits and the total size.
    #[prost(message, repeated, tag = "1")]
    pub index_stats: ::prost::alloc::vec::Vec<IndexStats>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct IndexStats {
    #[prost(message, optional, tag = "1")]
    pub index_uid: ::core::option::Option<crate::types::IndexUid>,
    #[prost(message, optional, tag = "2")]
    pub staged: ::core::option::Option<SplitStats>,
    #[prost(message, optional, tag = "3")]
    pub published: ::core::option::Option<SplitStats>,
    #[prost(message, optional, tag = "4")]
    pub marked_for_deletion: ::core::option::Option<SplitStats>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, Copy, PartialEq, Eq, Hash, ::prost::Message)]
pub struct SplitStats {
    #[prost(uint64, tag = "1")]
    pub num_splits: u64,
    #[prost(uint64, tag = "2")]
    pub total_size_bytes: u64,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct ListSplitsRequest {
    /// Predicate used to filter splits.
    /// The predicate is expressed as a JSON serialized
    /// `ListSplitsQuery`.
    #[prost(string, tag = "1")]
    pub query_json: ::prost::alloc::string::String,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct ListSplitsResponse {
    /// TODO use repeated and encode splits json individually.
    #[prost(string, tag = "1")]
    pub splits_serialized_json: ::prost::alloc::string::String,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct StageSplitsRequest {
    #[prost(message, optional, tag = "1")]
    pub index_uid: ::core::option::Option<crate::types::IndexUid>,
    #[prost(string, tag = "2")]
    pub split_metadata_list_serialized_json: ::prost::alloc::string::String,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct PublishSplitsRequest {
    #[prost(message, optional, tag = "1")]
    pub index_uid: ::core::option::Option<crate::types::IndexUid>,
    #[prost(string, repeated, tag = "2")]
    pub staged_split_ids: ::prost::alloc::vec::Vec<::prost::alloc::string::String>,
    #[prost(string, repeated, tag = "3")]
    pub replaced_split_ids: ::prost::alloc::vec::Vec<::prost::alloc::string::String>,
    #[prost(string, optional, tag = "4")]
    pub index_checkpoint_delta_json_opt: ::core::option::Option<
        ::prost::alloc::string::String,
    >,
    #[prost(string, optional, tag = "5")]
    pub publish_token_opt: ::core::option::Option<::prost::alloc::string::String>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct MarkSplitsForDeletionRequest {
    #[prost(message, optional, tag = "2")]
    pub index_uid: ::core::option::Option<crate::types::IndexUid>,
    #[prost(string, repeated, tag = "3")]
    pub split_ids: ::prost::alloc::vec::Vec<::prost::alloc::string::String>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct DeleteSplitsRequest {
    #[prost(message, optional, tag = "2")]
    pub index_uid: ::core::option::Option<crate::types::IndexUid>,
    #[prost(string, repeated, tag = "3")]
    pub split_ids: ::prost::alloc::vec::Vec<::prost::alloc::string::String>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct AddSourceRequest {
    #[prost(message, optional, tag = "1")]
    pub index_uid: ::core::option::Option<crate::types::IndexUid>,
    #[prost(string, tag = "2")]
    pub source_config_json: ::prost::alloc::string::String,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct UpdateSourceRequest {
    #[prost(message, optional, tag = "1")]
    pub index_uid: ::core::option::Option<crate::types::IndexUid>,
    #[prost(string, tag = "2")]
    pub source_config_json: ::prost::alloc::string::String,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct ToggleSourceRequest {
    #[prost(message, optional, tag = "1")]
    pub index_uid: ::core::option::Option<crate::types::IndexUid>,
    #[prost(string, tag = "2")]
    pub source_id: ::prost::alloc::string::String,
    #[prost(bool, tag = "3")]
    pub enable: bool,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct DeleteSourceRequest {
    #[prost(message, optional, tag = "1")]
    pub index_uid: ::core::option::Option<crate::types::IndexUid>,
    #[prost(string, tag = "2")]
    pub source_id: ::prost::alloc::string::String,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct ResetSourceCheckpointRequest {
    #[prost(message, optional, tag = "1")]
    pub index_uid: ::core::option::Option<crate::types::IndexUid>,
    #[prost(string, tag = "2")]
    pub source_id: ::prost::alloc::string::String,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct DeleteTask {
    #[prost(int64, tag = "1")]
    pub create_timestamp: i64,
    #[prost(uint64, tag = "2")]
    pub opstamp: u64,
    #[prost(message, optional, tag = "3")]
    pub delete_query: ::core::option::Option<DeleteQuery>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct DeleteQuery {
    /// Index UID.
    #[prost(message, optional, tag = "1")]
    #[schema(value_type = String)]
    #[serde(alias = "index_id")]
    pub index_uid: ::core::option::Option<crate::types::IndexUid>,
    /// If set, restrict search to documents with a `timestamp >= start_timestamp`.
    #[prost(int64, optional, tag = "2")]
    #[serde(skip_serializing_if = "Option::is_none")]
    pub start_timestamp: ::core::option::Option<i64>,
    /// If set, restrict search to documents with a \`timestamp \< end_timestamp\``.
    #[prost(int64, optional, tag = "3")]
    #[serde(skip_serializing_if = "Option::is_none")]
    pub end_timestamp: ::core::option::Option<i64>,
    /// Query AST serialized in JSON
    #[prost(string, tag = "6")]
    #[serde(alias = "query")]
    pub query_ast: ::prost::alloc::string::String,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct UpdateSplitsDeleteOpstampRequest {
    #[prost(message, optional, tag = "1")]
    pub index_uid: ::core::option::Option<crate::types::IndexUid>,
    #[prost(string, repeated, tag = "2")]
    pub split_ids: ::prost::alloc::vec::Vec<::prost::alloc::string::String>,
    #[prost(uint64, tag = "3")]
    pub delete_opstamp: u64,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, Copy, PartialEq, Eq, Hash, ::prost::Message)]
pub struct UpdateSplitsDeleteOpstampResponse {}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct LastDeleteOpstampRequest {
    #[prost(message, optional, tag = "1")]
    pub index_uid: ::core::option::Option<crate::types::IndexUid>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, Copy, PartialEq, Eq, Hash, ::prost::Message)]
pub struct LastDeleteOpstampResponse {
    #[prost(uint64, tag = "1")]
    pub last_delete_opstamp: u64,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct ListStaleSplitsRequest {
    #[prost(message, optional, tag = "1")]
    pub index_uid: ::core::option::Option<crate::types::IndexUid>,
    #[prost(uint64, tag = "2")]
    pub delete_opstamp: u64,
    #[prost(uint64, tag = "3")]
    pub num_splits: u64,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct ListDeleteTasksRequest {
    #[prost(message, optional, tag = "1")]
    pub index_uid: ::core::option::Option<crate::types::IndexUid>,
    #[prost(uint64, tag = "2")]
    pub opstamp_start: u64,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct ListDeleteTasksResponse {
    #[prost(message, repeated, tag = "1")]
    pub delete_tasks: ::prost::alloc::vec::Vec<DeleteTask>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct OpenShardsRequest {
    #[prost(message, repeated, tag = "1")]
    pub subrequests: ::prost::alloc::vec::Vec<OpenShardSubrequest>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct OpenShardSubrequest {
    #[prost(uint32, tag = "1")]
    pub subrequest_id: u32,
    #[prost(message, optional, tag = "2")]
    pub index_uid: ::core::option::Option<crate::types::IndexUid>,
    #[prost(string, tag = "3")]
    pub source_id: ::prost::alloc::string::String,
    #[prost(message, optional, tag = "4")]
    pub shard_id: ::core::option::Option<crate::types::ShardId>,
    #[prost(string, tag = "5")]
    pub leader_id: ::prost::alloc::string::String,
    #[prost(string, optional, tag = "6")]
    pub follower_id: ::core::option::Option<::prost::alloc::string::String>,
    #[prost(message, optional, tag = "7")]
    pub doc_mapping_uid: ::core::option::Option<crate::types::DocMappingUid>,
    #[prost(string, optional, tag = "8")]
    pub publish_token: ::core::option::Option<::prost::alloc::string::String>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct OpenShardsResponse {
    #[prost(message, repeated, tag = "1")]
    pub subresponses: ::prost::alloc::vec::Vec<OpenShardSubresponse>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct OpenShardSubresponse {
    #[prost(uint32, tag = "1")]
    pub subrequest_id: u32,
    #[prost(message, optional, tag = "4")]
    pub open_shard: ::core::option::Option<super::ingest::Shard>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct AcquireShardsRequest {
    #[prost(message, optional, tag = "1")]
    pub index_uid: ::core::option::Option<crate::types::IndexUid>,
    #[prost(string, tag = "2")]
    pub source_id: ::prost::alloc::string::String,
    #[prost(message, repeated, tag = "3")]
    pub shard_ids: ::prost::alloc::vec::Vec<crate::types::ShardId>,
    #[prost(string, tag = "4")]
    pub publish_token: ::prost::alloc::string::String,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct AcquireShardsResponse {
    /// List of acquired shards, in no specific order.
    #[prost(message, repeated, tag = "3")]
    pub acquired_shards: ::prost::alloc::vec::Vec<super::ingest::Shard>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct DeleteShardsRequest {
    #[prost(message, optional, tag = "1")]
    pub index_uid: ::core::option::Option<crate::types::IndexUid>,
    #[prost(string, tag = "2")]
    pub source_id: ::prost::alloc::string::String,
    #[prost(message, repeated, tag = "3")]
    pub shard_ids: ::prost::alloc::vec::Vec<crate::types::ShardId>,
    /// If false, only shards at EOF positions will be deleted.
    #[prost(bool, tag = "4")]
    pub force: bool,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct DeleteShardsResponse {
    #[prost(message, optional, tag = "1")]
    pub index_uid: ::core::option::Option<crate::types::IndexUid>,
    #[prost(string, tag = "2")]
    pub source_id: ::prost::alloc::string::String,
    /// List of shard IDs that were successfully deleted.
    #[prost(message, repeated, tag = "3")]
    pub successes: ::prost::alloc::vec::Vec<crate::types::ShardId>,
    /// List of shard IDs that could not be deleted because `force` was set to `false` in the request,
    /// and the shards are not at EOF, i.e., not fully indexed.
    #[prost(message, repeated, tag = "4")]
    pub failures: ::prost::alloc::vec::Vec<crate::types::ShardId>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct PruneShardsRequest {
    #[prost(message, optional, tag = "1")]
    pub index_uid: ::core::option::Option<crate::types::IndexUid>,
    #[prost(string, tag = "2")]
    pub source_id: ::prost::alloc::string::String,
    /// The maximum age of the shards to keep, in seconds.
    #[prost(uint32, optional, tag = "5")]
    pub max_age_secs: ::core::option::Option<u32>,
    /// The maximum number of the shards to keep. Delete older shards first.
    #[prost(uint32, optional, tag = "6")]
    pub max_count: ::core::option::Option<u32>,
    /// The interval between two pruning operations, in seconds.
    #[prost(uint32, optional, tag = "7")]
    pub interval_secs: ::core::option::Option<u32>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct ListShardsRequest {
    #[prost(message, repeated, tag = "1")]
    pub subrequests: ::prost::alloc::vec::Vec<ListShardsSubrequest>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct ListShardsSubrequest {
    #[prost(message, optional, tag = "1")]
    pub index_uid: ::core::option::Option<crate::types::IndexUid>,
    #[prost(string, tag = "2")]
    pub source_id: ::prost::alloc::string::String,
    #[prost(enumeration = "super::ingest::ShardState", optional, tag = "3")]
    pub shard_state: ::core::option::Option<i32>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct ListShardsResponse {
    #[prost(message, repeated, tag = "1")]
    pub subresponses: ::prost::alloc::vec::Vec<ListShardsSubresponse>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct ListShardsSubresponse {
    #[prost(message, optional, tag = "1")]
    pub index_uid: ::core::option::Option<crate::types::IndexUid>,
    #[prost(string, tag = "2")]
    pub source_id: ::prost::alloc::string::String,
    #[prost(message, repeated, tag = "3")]
    pub shards: ::prost::alloc::vec::Vec<super::ingest::Shard>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct CreateIndexTemplateRequest {
    #[prost(string, tag = "1")]
    pub index_template_json: ::prost::alloc::string::String,
    #[prost(bool, tag = "2")]
    pub overwrite: bool,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct GetIndexTemplateRequest {
    #[prost(string, tag = "1")]
    pub template_id: ::prost::alloc::string::String,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct GetIndexTemplateResponse {
    #[prost(string, tag = "1")]
    pub index_template_json: ::prost::alloc::string::String,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct FindIndexTemplateMatchesRequest {
    #[prost(string, repeated, tag = "1")]
    pub index_ids: ::prost::alloc::vec::Vec<::prost::alloc::string::String>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct FindIndexTemplateMatchesResponse {
    #[prost(message, repeated, tag = "1")]
    pub matches: ::prost::alloc::vec::Vec<IndexTemplateMatch>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct IndexTemplateMatch {
    #[prost(string, tag = "1")]
    pub index_id: ::prost::alloc::string::String,
    #[prost(string, tag = "2")]
    pub template_id: ::prost::alloc::string::String,
    #[prost(string, tag = "3")]
    pub index_template_json: ::prost::alloc::string::String,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, Copy, PartialEq, Eq, Hash, ::prost::Message)]
pub struct ListIndexTemplatesRequest {}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct ListIndexTemplatesResponse {
    #[prost(string, repeated, tag = "1")]
    pub index_templates_json: ::prost::alloc::vec::Vec<::prost::alloc::string::String>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct DeleteIndexTemplatesRequest {
    #[prost(string, repeated, tag = "1")]
    pub template_ids: ::prost::alloc::vec::Vec<::prost::alloc::string::String>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, Copy, PartialEq, Eq, Hash, ::prost::Message)]
pub struct GetClusterIdentityRequest {}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct GetClusterIdentityResponse {
    #[prost(string, tag = "1")]
    pub uuid: ::prost::alloc::string::String,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[serde(rename_all = "snake_case")]
#[derive(Clone, Copy, Debug, PartialEq, Eq, Hash, PartialOrd, Ord, ::prost::Enumeration)]
#[repr(i32)]
pub enum SourceType {
    Unspecified = 0,
    Cli = 1,
    File = 2,
    IngestV1 = 4,
    IngestV2 = 5,
    /// Apache Kafka
    Kafka = 6,
    /// Amazon Kinesis
    Kinesis = 7,
    Nats = 8,
    /// Google Cloud Pub/Sub
    PubSub = 3,
    /// Apache Pulsar
    Pulsar = 9,
    Vec = 10,
    Void = 11,
    Stdin = 13,
}
impl SourceType {
    /// String value of the enum field names used in the ProtoBuf definition.
    ///
    /// The values are not transformed in any way and thus are considered stable
    /// (if the ProtoBuf definition does not change) and safe for programmatic use.
    pub fn as_str_name(&self) -> &'static str {
        match self {
            Self::Unspecified => "SOURCE_TYPE_UNSPECIFIED",
            Self::Cli => "SOURCE_TYPE_CLI",
            Self::File => "SOURCE_TYPE_FILE",
            Self::IngestV1 => "SOURCE_TYPE_INGEST_V1",
            Self::IngestV2 => "SOURCE_TYPE_INGEST_V2",
            Self::Kafka => "SOURCE_TYPE_KAFKA",
            Self::Kinesis => "SOURCE_TYPE_KINESIS",
            Self::Nats => "SOURCE_TYPE_NATS",
            Self::PubSub => "SOURCE_TYPE_PUB_SUB",
            Self::Pulsar => "SOURCE_TYPE_PULSAR",
            Self::Vec => "SOURCE_TYPE_VEC",
            Self::Void => "SOURCE_TYPE_VOID",
            Self::Stdin => "SOURCE_TYPE_STDIN",
        }
    }
    /// Creates an enum from field names used in the ProtoBuf definition.
    pub fn from_str_name(value: &str) -> ::core::option::Option<Self> {
        match value {
            "SOURCE_TYPE_UNSPECIFIED" => Some(Self::Unspecified),
            "SOURCE_TYPE_CLI" => Some(Self::Cli),
            "SOURCE_TYPE_FILE" => Some(Self::File),
            "SOURCE_TYPE_INGEST_V1" => Some(Self::IngestV1),
            "SOURCE_TYPE_INGEST_V2" => Some(Self::IngestV2),
            "SOURCE_TYPE_KAFKA" => Some(Self::Kafka),
            "SOURCE_TYPE_KINESIS" => Some(Self::Kinesis),
            "SOURCE_TYPE_NATS" => Some(Self::Nats),
            "SOURCE_TYPE_PUB_SUB" => Some(Self::PubSub),
            "SOURCE_TYPE_PULSAR" => Some(Self::Pulsar),
            "SOURCE_TYPE_VEC" => Some(Self::Vec),
            "SOURCE_TYPE_VOID" => Some(Self::Void),
            "SOURCE_TYPE_STDIN" => Some(Self::Stdin),
            _ => None,
        }
    }
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[serde(rename_all = "snake_case")]
#[derive(Clone, Copy, Debug, PartialEq, Eq, Hash, PartialOrd, Ord, ::prost::Enumeration)]
#[repr(i32)]
pub enum IndexMetadataFailureReason {
    Unspecified = 0,
    NotFound = 1,
    Internal = 2,
}
impl IndexMetadataFailureReason {
    /// String value of the enum field names used in the ProtoBuf definition.
    ///
    /// The values are not transformed in any way and thus are considered stable
    /// (if the ProtoBuf definition does not change) and safe for programmatic use.
    pub fn as_str_name(&self) -> &'static str {
        match self {
            Self::Unspecified => "INDEX_METADATA_FAILURE_REASON_UNSPECIFIED",
            Self::NotFound => "INDEX_METADATA_FAILURE_REASON_NOT_FOUND",
            Self::Internal => "INDEX_METADATA_FAILURE_REASON_INTERNAL",
        }
    }
    /// Creates an enum from field names used in the ProtoBuf definition.
    pub fn from_str_name(value: &str) -> ::core::option::Option<Self> {
        match value {
            "INDEX_METADATA_FAILURE_REASON_UNSPECIFIED" => Some(Self::Unspecified),
            "INDEX_METADATA_FAILURE_REASON_NOT_FOUND" => Some(Self::NotFound),
            "INDEX_METADATA_FAILURE_REASON_INTERNAL" => Some(Self::Internal),
            _ => None,
        }
    }
}
/// BEGIN quickwit-codegen
#[allow(unused_imports)]
use std::str::FromStr;
use tower::{Layer, Service, ServiceExt};
use quickwit_common::tower::RpcName;
impl RpcName for CreateIndexRequest {
    fn rpc_name() -> &'static str {
        "create_index"
    }
}
impl RpcName for UpdateIndexRequest {
    fn rpc_name() -> &'static str {
        "update_index"
    }
}
impl RpcName for IndexMetadataRequest {
    fn rpc_name() -> &'static str {
        "index_metadata"
    }
}
impl RpcName for IndexesMetadataRequest {
    fn rpc_name() -> &'static str {
        "indexes_metadata"
    }
}
impl RpcName for ListIndexesMetadataRequest {
    fn rpc_name() -> &'static str {
        "list_indexes_metadata"
    }
}
impl RpcName for DeleteIndexRequest {
    fn rpc_name() -> &'static str {
        "delete_index"
    }
}
impl RpcName for ListIndexStatsRequest {
    fn rpc_name() -> &'static str {
        "list_index_stats"
    }
}
impl RpcName for ListSplitsRequest {
    fn rpc_name() -> &'static str {
        "list_splits"
    }
}
impl RpcName for StageSplitsRequest {
    fn rpc_name() -> &'static str {
        "stage_splits"
    }
}
impl RpcName for PublishSplitsRequest {
    fn rpc_name() -> &'static str {
        "publish_splits"
    }
}
impl RpcName for MarkSplitsForDeletionRequest {
    fn rpc_name() -> &'static str {
        "mark_splits_for_deletion"
    }
}
impl RpcName for DeleteSplitsRequest {
    fn rpc_name() -> &'static str {
        "delete_splits"
    }
}
impl RpcName for AddSourceRequest {
    fn rpc_name() -> &'static str {
        "add_source"
    }
}
impl RpcName for UpdateSourceRequest {
    fn rpc_name() -> &'static str {
        "update_source"
    }
}
impl RpcName for ToggleSourceRequest {
    fn rpc_name() -> &'static str {
        "toggle_source"
    }
}
impl RpcName for DeleteSourceRequest {
    fn rpc_name() -> &'static str {
        "delete_source"
    }
}
impl RpcName for ResetSourceCheckpointRequest {
    fn rpc_name() -> &'static str {
        "reset_source_checkpoint"
    }
}
impl RpcName for LastDeleteOpstampRequest {
    fn rpc_name() -> &'static str {
        "last_delete_opstamp"
    }
}
impl RpcName for DeleteQuery {
    fn rpc_name() -> &'static str {
        "create_delete_task"
    }
}
impl RpcName for UpdateSplitsDeleteOpstampRequest {
    fn rpc_name() -> &'static str {
        "update_splits_delete_opstamp"
    }
}
impl RpcName for ListDeleteTasksRequest {
    fn rpc_name() -> &'static str {
        "list_delete_tasks"
    }
}
impl RpcName for ListStaleSplitsRequest {
    fn rpc_name() -> &'static str {
        "list_stale_splits"
    }
}
impl RpcName for OpenShardsRequest {
    fn rpc_name() -> &'static str {
        "open_shards"
    }
}
impl RpcName for AcquireShardsRequest {
    fn rpc_name() -> &'static str {
        "acquire_shards"
    }
}
impl RpcName for DeleteShardsRequest {
    fn rpc_name() -> &'static str {
        "delete_shards"
    }
}
impl RpcName for PruneShardsRequest {
    fn rpc_name() -> &'static str {
        "prune_shards"
    }
}
impl RpcName for ListShardsRequest {
    fn rpc_name() -> &'static str {
        "list_shards"
    }
}
impl RpcName for CreateIndexTemplateRequest {
    fn rpc_name() -> &'static str {
        "create_index_template"
    }
}
impl RpcName for GetIndexTemplateRequest {
    fn rpc_name() -> &'static str {
        "get_index_template"
    }
}
impl RpcName for FindIndexTemplateMatchesRequest {
    fn rpc_name() -> &'static str {
        "find_index_template_matches"
    }
}
impl RpcName for ListIndexTemplatesRequest {
    fn rpc_name() -> &'static str {
        "list_index_templates"
    }
}
impl RpcName for DeleteIndexTemplatesRequest {
    fn rpc_name() -> &'static str {
        "delete_index_templates"
    }
}
impl RpcName for GetClusterIdentityRequest {
    fn rpc_name() -> &'static str {
        "get_cluster_identity"
    }
}
pub type MetastoreServiceStream<T> = quickwit_common::ServiceStream<
    crate::metastore::MetastoreResult<T>,
>;
#[cfg_attr(any(test, feature = "testsuite"), mockall::automock)]
#[async_trait::async_trait]
pub trait MetastoreService: std::fmt::Debug + Send + Sync + 'static {
    ///Creates an index.
    ///
    ///This API creates a new index in the metastore.
    ///An error will occur if an index that already exists in the storage is specified.
    async fn create_index(
        &self,
        request: CreateIndexRequest,
    ) -> crate::metastore::MetastoreResult<CreateIndexResponse>;
    ///Update an index.
    async fn update_index(
        &self,
        request: UpdateIndexRequest,
    ) -> crate::metastore::MetastoreResult<IndexMetadataResponse>;
    ///Returns the `IndexMetadata` of an index identified by its IndexID or its IndexUID.
    async fn index_metadata(
        &self,
        request: IndexMetadataRequest,
    ) -> crate::metastore::MetastoreResult<IndexMetadataResponse>;
    ///Fetches the metadata of a list of indexes identified by their Index IDs or UIDs.
    async fn indexes_metadata(
        &self,
        request: IndexesMetadataRequest,
    ) -> crate::metastore::MetastoreResult<IndexesMetadataResponse>;
    ///Gets an indexes metadatas.
    async fn list_indexes_metadata(
        &self,
        request: ListIndexesMetadataRequest,
    ) -> crate::metastore::MetastoreResult<ListIndexesMetadataResponse>;
    ///Deletes an index
    async fn delete_index(
        &self,
        request: DeleteIndexRequest,
    ) -> crate::metastore::MetastoreResult<EmptyResponse>;
    ///Returns a list of size info for each index.
    async fn list_index_stats(
        &self,
        request: ListIndexStatsRequest,
    ) -> crate::metastore::MetastoreResult<ListIndexStatsResponse>;
    ///Streams splits from index.
    async fn list_splits(
        &self,
        request: ListSplitsRequest,
    ) -> crate::metastore::MetastoreResult<MetastoreServiceStream<ListSplitsResponse>>;
    ///Stages several splits.
    async fn stage_splits(
        &self,
        request: StageSplitsRequest,
    ) -> crate::metastore::MetastoreResult<EmptyResponse>;
    ///Publishes split.
    async fn publish_splits(
        &self,
        request: PublishSplitsRequest,
    ) -> crate::metastore::MetastoreResult<EmptyResponse>;
    ///Marks splits for deletion.
    async fn mark_splits_for_deletion(
        &self,
        request: MarkSplitsForDeletionRequest,
    ) -> crate::metastore::MetastoreResult<EmptyResponse>;
    ///Deletes splits.
    async fn delete_splits(
        &self,
        request: DeleteSplitsRequest,
    ) -> crate::metastore::MetastoreResult<EmptyResponse>;
    ///Adds a source.
    async fn add_source(
        &self,
        request: AddSourceRequest,
    ) -> crate::metastore::MetastoreResult<EmptyResponse>;
    ///Updates a source.
    async fn update_source(
        &self,
        request: UpdateSourceRequest,
    ) -> crate::metastore::MetastoreResult<EmptyResponse>;
    ///Toggles (turns on or off) source.
    async fn toggle_source(
        &self,
        request: ToggleSourceRequest,
    ) -> crate::metastore::MetastoreResult<EmptyResponse>;
    ///Removes source.
    async fn delete_source(
        &self,
        request: DeleteSourceRequest,
    ) -> crate::metastore::MetastoreResult<EmptyResponse>;
    ///Resets source checkpoint.
    async fn reset_source_checkpoint(
        &self,
        request: ResetSourceCheckpointRequest,
    ) -> crate::metastore::MetastoreResult<EmptyResponse>;
    ///Gets last opstamp for a given `index_id`.
    async fn last_delete_opstamp(
        &self,
        request: LastDeleteOpstampRequest,
    ) -> crate::metastore::MetastoreResult<LastDeleteOpstampResponse>;
    ///Creates a delete task.
    async fn create_delete_task(
        &self,
        request: DeleteQuery,
    ) -> crate::metastore::MetastoreResult<DeleteTask>;
    ///Updates splits `delete_opstamp`.
    async fn update_splits_delete_opstamp(
        &self,
        request: UpdateSplitsDeleteOpstampRequest,
    ) -> crate::metastore::MetastoreResult<UpdateSplitsDeleteOpstampResponse>;
    ///Lists delete tasks with `delete_task.opstamp` > `opstamp_start` for a given `index_id`.
    async fn list_delete_tasks(
        &self,
        request: ListDeleteTasksRequest,
    ) -> crate::metastore::MetastoreResult<ListDeleteTasksResponse>;
    ///Lists splits with `split.delete_opstamp` \< `delete_opstamp` for a given `index_id`.
    async fn list_stale_splits(
        &self,
        request: ListStaleSplitsRequest,
    ) -> crate::metastore::MetastoreResult<ListSplitsResponse>;
    ///Shard API
    ///
    ///Note that for the file-backed metastore implementation, the requests are not processed atomically.
    ///Indeed, each request comprises one or more subrequests that target different indexes and sources processed
    ///independently. Responses list the requests that succeeded or failed in the fields `successes` and
    ///`failures`.
    async fn open_shards(
        &self,
        request: OpenShardsRequest,
    ) -> crate::metastore::MetastoreResult<OpenShardsResponse>;
    ///Acquires a set of shards for indexing. This RPC locks the shards for publishing thanks to a publish token and only
    ///the last indexer that has acquired the shards is allowed to publish. The response returns for each subrequest the
    ///list of acquired shards along with the positions to index from.
    ///
    ///If a requested shard is missing, this method does not return an error. It should simply return the list of
    ///shards that were actually acquired.
    ///
    ///For this reason, AcquireShards.acquire_shards may return less subresponse than there was in the request.
    ///Also they may be returned in any order.
    async fn acquire_shards(
        &self,
        request: AcquireShardsRequest,
    ) -> crate::metastore::MetastoreResult<AcquireShardsResponse>;
    ///Deletes a set of shards. This RPC deletes the shards from the metastore.
    ///If the shard did not exist to begin with, the operation is successful and does not return any error.
    async fn delete_shards(
        &self,
        request: DeleteShardsRequest,
    ) -> crate::metastore::MetastoreResult<DeleteShardsResponse>;
    ///Deletes outdated shards. This RPC deletes the shards from the metastore.
    async fn prune_shards(
        &self,
        request: PruneShardsRequest,
    ) -> crate::metastore::MetastoreResult<EmptyResponse>;
    async fn list_shards(
        &self,
        request: ListShardsRequest,
    ) -> crate::metastore::MetastoreResult<ListShardsResponse>;
    ///Creates an index template.
    async fn create_index_template(
        &self,
        request: CreateIndexTemplateRequest,
    ) -> crate::metastore::MetastoreResult<EmptyResponse>;
    ///Fetches an index template.
    async fn get_index_template(
        &self,
        request: GetIndexTemplateRequest,
    ) -> crate::metastore::MetastoreResult<GetIndexTemplateResponse>;
    ///Finds matching index templates.
    async fn find_index_template_matches(
        &self,
        request: FindIndexTemplateMatchesRequest,
    ) -> crate::metastore::MetastoreResult<FindIndexTemplateMatchesResponse>;
    ///Returns all the index templates.
    async fn list_index_templates(
        &self,
        request: ListIndexTemplatesRequest,
    ) -> crate::metastore::MetastoreResult<ListIndexTemplatesResponse>;
    ///Deletes index templates.
    async fn delete_index_templates(
        &self,
        request: DeleteIndexTemplatesRequest,
    ) -> crate::metastore::MetastoreResult<EmptyResponse>;
    ///Get cluster identity
    async fn get_cluster_identity(
        &self,
        request: GetClusterIdentityRequest,
    ) -> crate::metastore::MetastoreResult<GetClusterIdentityResponse>;
    async fn check_connectivity(&self) -> anyhow::Result<()>;
    fn endpoints(&self) -> Vec<quickwit_common::uri::Uri>;
}
#[derive(Debug, Clone)]
pub struct MetastoreServiceClient {
    inner: InnerMetastoreServiceClient,
}
#[derive(Debug, Clone)]
struct InnerMetastoreServiceClient(std::sync::Arc<dyn MetastoreService>);
impl MetastoreServiceClient {
    pub fn new<T>(instance: T) -> Self
    where
        T: MetastoreService,
    {
        #[cfg(any(test, feature = "testsuite"))]
        assert!(
            std::any::TypeId::of:: < T > () != std::any::TypeId::of:: <
            MockMetastoreService > (),
            "`MockMetastoreService` must be wrapped in a `MockMetastoreServiceWrapper`: use `MetastoreServiceClient::from_mock(mock)` to instantiate the client"
        );
        Self {
            inner: InnerMetastoreServiceClient(std::sync::Arc::new(instance)),
        }
    }
    pub fn as_grpc_service(
        &self,
        max_message_size: bytesize::ByteSize,
    ) -> metastore_service_grpc_server::MetastoreServiceGrpcServer<
        MetastoreServiceGrpcServerAdapter,
    > {
        let adapter = MetastoreServiceGrpcServerAdapter::new(self.clone());
        metastore_service_grpc_server::MetastoreServiceGrpcServer::new(adapter)
            .accept_compressed(tonic::codec::CompressionEncoding::Gzip)
            .accept_compressed(tonic::codec::CompressionEncoding::Zstd)
            .send_compressed(tonic::codec::CompressionEncoding::Gzip)
            .send_compressed(tonic::codec::CompressionEncoding::Zstd)
            .max_decoding_message_size(max_message_size.0 as usize)
            .max_encoding_message_size(max_message_size.0 as usize)
    }
    pub fn from_channel(
        addr: std::net::SocketAddr,
        channel: tonic::transport::Channel,
        max_message_size: bytesize::ByteSize,
        compression_encoding_opt: Option<tonic::codec::CompressionEncoding>,
    ) -> Self {
        let (_, connection_keys_watcher) = tokio::sync::watch::channel(
            std::collections::HashSet::from_iter([addr]),
        );
        let mut client = metastore_service_grpc_client::MetastoreServiceGrpcClient::new(
                channel,
            )
            .max_decoding_message_size(max_message_size.0 as usize)
            .max_encoding_message_size(max_message_size.0 as usize);
        if let Some(compression_encoding) = compression_encoding_opt {
            client = client
                .accept_compressed(compression_encoding)
                .send_compressed(compression_encoding);
        }
        let adapter = MetastoreServiceGrpcClientAdapter::new(
            client,
            connection_keys_watcher,
        );
        Self::new(adapter)
    }
    pub fn from_balance_channel(
        balance_channel: quickwit_common::tower::BalanceChannel<std::net::SocketAddr>,
        max_message_size: bytesize::ByteSize,
        compression_encoding_opt: Option<tonic::codec::CompressionEncoding>,
    ) -> MetastoreServiceClient {
        let connection_keys_watcher = balance_channel.connection_keys_watcher();
        let mut client = metastore_service_grpc_client::MetastoreServiceGrpcClient::new(
                balance_channel,
            )
            .max_decoding_message_size(max_message_size.0 as usize)
            .max_encoding_message_size(max_message_size.0 as usize);
        if let Some(compression_encoding) = compression_encoding_opt {
            client = client
                .accept_compressed(compression_encoding)
                .send_compressed(compression_encoding);
        }
        let adapter = MetastoreServiceGrpcClientAdapter::new(
            client,
            connection_keys_watcher,
        );
        Self::new(adapter)
    }
    pub fn from_mailbox<A>(mailbox: quickwit_actors::Mailbox<A>) -> Self
    where
        A: quickwit_actors::Actor + std::fmt::Debug + Send + 'static,
        MetastoreServiceMailbox<A>: MetastoreService,
    {
        MetastoreServiceClient::new(MetastoreServiceMailbox::new(mailbox))
    }
    pub fn tower() -> MetastoreServiceTowerLayerStack {
        MetastoreServiceTowerLayerStack::default()
    }
    #[cfg(any(test, feature = "testsuite"))]
    pub fn from_mock(mock: MockMetastoreService) -> Self {
        let mock_wrapper = mock_metastore_service::MockMetastoreServiceWrapper {
            inner: tokio::sync::Mutex::new(mock),
        };
        Self::new(mock_wrapper)
    }
    #[cfg(any(test, feature = "testsuite"))]
    pub fn mocked() -> Self {
        Self::from_mock(MockMetastoreService::new())
    }
}
#[async_trait::async_trait]
impl MetastoreService for MetastoreServiceClient {
    async fn create_index(
        &self,
        request: CreateIndexRequest,
    ) -> crate::metastore::MetastoreResult<CreateIndexResponse> {
        self.inner.0.create_index(request).await
    }
    async fn update_index(
        &self,
        request: UpdateIndexRequest,
    ) -> crate::metastore::MetastoreResult<IndexMetadataResponse> {
        self.inner.0.update_index(request).await
    }
    async fn index_metadata(
        &self,
        request: IndexMetadataRequest,
    ) -> crate::metastore::MetastoreResult<IndexMetadataResponse> {
        self.inner.0.index_metadata(request).await
    }
    async fn indexes_metadata(
        &self,
        request: IndexesMetadataRequest,
    ) -> crate::metastore::MetastoreResult<IndexesMetadataResponse> {
        self.inner.0.indexes_metadata(request).await
    }
    async fn list_indexes_metadata(
        &self,
        request: ListIndexesMetadataRequest,
    ) -> crate::metastore::MetastoreResult<ListIndexesMetadataResponse> {
        self.inner.0.list_indexes_metadata(request).await
    }
    async fn delete_index(
        &self,
        request: DeleteIndexRequest,
    ) -> crate::metastore::MetastoreResult<EmptyResponse> {
        self.inner.0.delete_index(request).await
    }
    async fn list_index_stats(
        &self,
        request: ListIndexStatsRequest,
    ) -> crate::metastore::MetastoreResult<ListIndexStatsResponse> {
        self.inner.0.list_index_stats(request).await
    }
    async fn list_splits(
        &self,
        request: ListSplitsRequest,
    ) -> crate::metastore::MetastoreResult<MetastoreServiceStream<ListSplitsResponse>> {
        self.inner.0.list_splits(request).await
    }
    async fn stage_splits(
        &self,
        request: StageSplitsRequest,
    ) -> crate::metastore::MetastoreResult<EmptyResponse> {
        self.inner.0.stage_splits(request).await
    }
    async fn publish_splits(
        &self,
        request: PublishSplitsRequest,
    ) -> crate::metastore::MetastoreResult<EmptyResponse> {
        self.inner.0.publish_splits(request).await
    }
    async fn mark_splits_for_deletion(
        &self,
        request: MarkSplitsForDeletionRequest,
    ) -> crate::metastore::MetastoreResult<EmptyResponse> {
        self.inner.0.mark_splits_for_deletion(request).await
    }
    async fn delete_splits(
        &self,
        request: DeleteSplitsRequest,
    ) -> crate::metastore::MetastoreResult<EmptyResponse> {
        self.inner.0.delete_splits(request).await
    }
    async fn add_source(
        &self,
        request: AddSourceRequest,
    ) -> crate::metastore::MetastoreResult<EmptyResponse> {
        self.inner.0.add_source(request).await
    }
    async fn update_source(
        &self,
        request: UpdateSourceRequest,
    ) -> crate::metastore::MetastoreResult<EmptyResponse> {
        self.inner.0.update_source(request).await
    }
    async fn toggle_source(
        &self,
        request: ToggleSourceRequest,
    ) -> crate::metastore::MetastoreResult<EmptyResponse> {
        self.inner.0.toggle_source(request).await
    }
    async fn delete_source(
        &self,
        request: DeleteSourceRequest,
    ) -> crate::metastore::MetastoreResult<EmptyResponse> {
        self.inner.0.delete_source(request).await
    }
    async fn reset_source_checkpoint(
        &self,
        request: ResetSourceCheckpointRequest,
    ) -> crate::metastore::MetastoreResult<EmptyResponse> {
        self.inner.0.reset_source_checkpoint(request).await
    }
    async fn last_delete_opstamp(
        &self,
        request: LastDeleteOpstampRequest,
    ) -> crate::metastore::MetastoreResult<LastDeleteOpstampResponse> {
        self.inner.0.last_delete_opstamp(request).await
    }
    async fn create_delete_task(
        &self,
        request: DeleteQuery,
    ) -> crate::metastore::MetastoreResult<DeleteTask> {
        self.inner.0.create_delete_task(request).await
    }
    async fn update_splits_delete_opstamp(
        &self,
        request: UpdateSplitsDeleteOpstampRequest,
    ) -> crate::metastore::MetastoreResult<UpdateSplitsDeleteOpstampResponse> {
        self.inner.0.update_splits_delete_opstamp(request).await
    }
    async fn list_delete_tasks(
        &self,
        request: ListDeleteTasksRequest,
    ) -> crate::metastore::MetastoreResult<ListDeleteTasksResponse> {
        self.inner.0.list_delete_tasks(request).await
    }
    async fn list_stale_splits(
        &self,
        request: ListStaleSplitsRequest,
    ) -> crate::metastore::MetastoreResult<ListSplitsResponse> {
        self.inner.0.list_stale_splits(request).await
    }
    async fn open_shards(
        &self,
        request: OpenShardsRequest,
    ) -> crate::metastore::MetastoreResult<OpenShardsResponse> {
        self.inner.0.open_shards(request).await
    }
    async fn acquire_shards(
        &self,
        request: AcquireShardsRequest,
    ) -> crate::metastore::MetastoreResult<AcquireShardsResponse> {
        self.inner.0.acquire_shards(request).await
    }
    async fn delete_shards(
        &self,
        request: DeleteShardsRequest,
    ) -> crate::metastore::MetastoreResult<DeleteShardsResponse> {
        self.inner.0.delete_shards(request).await
    }
    async fn prune_shards(
        &self,
        request: PruneShardsRequest,
    ) -> crate::metastore::MetastoreResult<EmptyResponse> {
        self.inner.0.prune_shards(request).await
    }
    async fn list_shards(
        &self,
        request: ListShardsRequest,
    ) -> crate::metastore::MetastoreResult<ListShardsResponse> {
        self.inner.0.list_shards(request).await
    }
    async fn create_index_template(
        &self,
        request: CreateIndexTemplateRequest,
    ) -> crate::metastore::MetastoreResult<EmptyResponse> {
        self.inner.0.create_index_template(request).await
    }
    async fn get_index_template(
        &self,
        request: GetIndexTemplateRequest,
    ) -> crate::metastore::MetastoreResult<GetIndexTemplateResponse> {
        self.inner.0.get_index_template(request).await
    }
    async fn find_index_template_matches(
        &self,
        request: FindIndexTemplateMatchesRequest,
    ) -> crate::metastore::MetastoreResult<FindIndexTemplateMatchesResponse> {
        self.inner.0.find_index_template_matches(request).await
    }
    async fn list_index_templates(
        &self,
        request: ListIndexTemplatesRequest,
    ) -> crate::metastore::MetastoreResult<ListIndexTemplatesResponse> {
        self.inner.0.list_index_templates(request).await
    }
    async fn delete_index_templates(
        &self,
        request: DeleteIndexTemplatesRequest,
    ) -> crate::metastore::MetastoreResult<EmptyResponse> {
        self.inner.0.delete_index_templates(request).await
    }
    async fn get_cluster_identity(
        &self,
        request: GetClusterIdentityRequest,
    ) -> crate::metastore::MetastoreResult<GetClusterIdentityResponse> {
        self.inner.0.get_cluster_identity(request).await
    }
    async fn check_connectivity(&self) -> anyhow::Result<()> {
        self.inner.0.check_connectivity().await
    }
    fn endpoints(&self) -> Vec<quickwit_common::uri::Uri> {
        self.inner.0.endpoints()
    }
}
#[cfg(any(test, feature = "testsuite"))]
pub mod mock_metastore_service {
    use super::*;
    #[derive(Debug)]
    pub struct MockMetastoreServiceWrapper {
        pub(super) inner: tokio::sync::Mutex<MockMetastoreService>,
    }
    #[async_trait::async_trait]
    impl MetastoreService for MockMetastoreServiceWrapper {
        async fn create_index(
            &self,
            request: super::CreateIndexRequest,
        ) -> crate::metastore::MetastoreResult<super::CreateIndexResponse> {
            self.inner.lock().await.create_index(request).await
        }
        async fn update_index(
            &self,
            request: super::UpdateIndexRequest,
        ) -> crate::metastore::MetastoreResult<super::IndexMetadataResponse> {
            self.inner.lock().await.update_index(request).await
        }
        async fn index_metadata(
            &self,
            request: super::IndexMetadataRequest,
        ) -> crate::metastore::MetastoreResult<super::IndexMetadataResponse> {
            self.inner.lock().await.index_metadata(request).await
        }
        async fn indexes_metadata(
            &self,
            request: super::IndexesMetadataRequest,
        ) -> crate::metastore::MetastoreResult<super::IndexesMetadataResponse> {
            self.inner.lock().await.indexes_metadata(request).await
        }
        async fn list_indexes_metadata(
            &self,
            request: super::ListIndexesMetadataRequest,
        ) -> crate::metastore::MetastoreResult<super::ListIndexesMetadataResponse> {
            self.inner.lock().await.list_indexes_metadata(request).await
        }
        async fn delete_index(
            &self,
            request: super::DeleteIndexRequest,
        ) -> crate::metastore::MetastoreResult<super::EmptyResponse> {
            self.inner.lock().await.delete_index(request).await
        }
        async fn list_index_stats(
            &self,
            request: super::ListIndexStatsRequest,
        ) -> crate::metastore::MetastoreResult<super::ListIndexStatsResponse> {
            self.inner.lock().await.list_index_stats(request).await
        }
        async fn list_splits(
            &self,
            request: super::ListSplitsRequest,
        ) -> crate::metastore::MetastoreResult<
            MetastoreServiceStream<super::ListSplitsResponse>,
        > {
            self.inner.lock().await.list_splits(request).await
        }
        async fn stage_splits(
            &self,
            request: super::StageSplitsRequest,
        ) -> crate::metastore::MetastoreResult<super::EmptyResponse> {
            self.inner.lock().await.stage_splits(request).await
        }
        async fn publish_splits(
            &self,
            request: super::PublishSplitsRequest,
        ) -> crate::metastore::MetastoreResult<super::EmptyResponse> {
            self.inner.lock().await.publish_splits(request).await
        }
        async fn mark_splits_for_deletion(
            &self,
            request: super::MarkSplitsForDeletionRequest,
        ) -> crate::metastore::MetastoreResult<super::EmptyResponse> {
            self.inner.lock().await.mark_splits_for_deletion(request).await
        }
        async fn delete_splits(
            &self,
            request: super::DeleteSplitsRequest,
        ) -> crate::metastore::MetastoreResult<super::EmptyResponse> {
            self.inner.lock().await.delete_splits(request).await
        }
        async fn add_source(
            &self,
            request: super::AddSourceRequest,
        ) -> crate::metastore::MetastoreResult<super::EmptyResponse> {
            self.inner.lock().await.add_source(request).await
        }
        async fn update_source(
            &self,
            request: super::UpdateSourceRequest,
        ) -> crate::metastore::MetastoreResult<super::EmptyResponse> {
            self.inner.lock().await.update_source(request).await
        }
        async fn toggle_source(
            &self,
            request: super::ToggleSourceRequest,
        ) -> crate::metastore::MetastoreResult<super::EmptyResponse> {
            self.inner.lock().await.toggle_source(request).await
        }
        async fn delete_source(
            &self,
            request: super::DeleteSourceRequest,
        ) -> crate::metastore::MetastoreResult<super::EmptyResponse> {
            self.inner.lock().await.delete_source(request).await
        }
        async fn reset_source_checkpoint(
            &self,
            request: super::ResetSourceCheckpointRequest,
        ) -> crate::metastore::MetastoreResult<super::EmptyResponse> {
            self.inner.lock().await.reset_source_checkpoint(request).await
        }
        async fn last_delete_opstamp(
            &self,
            request: super::LastDeleteOpstampRequest,
        ) -> crate::metastore::MetastoreResult<super::LastDeleteOpstampResponse> {
            self.inner.lock().await.last_delete_opstamp(request).await
        }
        async fn create_delete_task(
            &self,
            request: super::DeleteQuery,
        ) -> crate::metastore::MetastoreResult<super::DeleteTask> {
            self.inner.lock().await.create_delete_task(request).await
        }
        async fn update_splits_delete_opstamp(
            &self,
            request: super::UpdateSplitsDeleteOpstampRequest,
        ) -> crate::metastore::MetastoreResult<
            super::UpdateSplitsDeleteOpstampResponse,
        > {
            self.inner.lock().await.update_splits_delete_opstamp(request).await
        }
        async fn list_delete_tasks(
            &self,
            request: super::ListDeleteTasksRequest,
        ) -> crate::metastore::MetastoreResult<super::ListDeleteTasksResponse> {
            self.inner.lock().await.list_delete_tasks(request).await
        }
        async fn list_stale_splits(
            &self,
            request: super::ListStaleSplitsRequest,
        ) -> crate::metastore::MetastoreResult<super::ListSplitsResponse> {
            self.inner.lock().await.list_stale_splits(request).await
        }
        async fn open_shards(
            &self,
            request: super::OpenShardsRequest,
        ) -> crate::metastore::MetastoreResult<super::OpenShardsResponse> {
            self.inner.lock().await.open_shards(request).await
        }
        async fn acquire_shards(
            &self,
            request: super::AcquireShardsRequest,
        ) -> crate::metastore::MetastoreResult<super::AcquireShardsResponse> {
            self.inner.lock().await.acquire_shards(request).await
        }
        async fn delete_shards(
            &self,
            request: super::DeleteShardsRequest,
        ) -> crate::metastore::MetastoreResult<super::DeleteShardsResponse> {
            self.inner.lock().await.delete_shards(request).await
        }
        async fn prune_shards(
            &self,
            request: super::PruneShardsRequest,
        ) -> crate::metastore::MetastoreResult<super::EmptyResponse> {
            self.inner.lock().await.prune_shards(request).await
        }
        async fn list_shards(
            &self,
            request: super::ListShardsRequest,
        ) -> crate::metastore::MetastoreResult<super::ListShardsResponse> {
            self.inner.lock().await.list_shards(request).await
        }
        async fn create_index_template(
            &self,
            request: super::CreateIndexTemplateRequest,
        ) -> crate::metastore::MetastoreResult<super::EmptyResponse> {
            self.inner.lock().await.create_index_template(request).await
        }
        async fn get_index_template(
            &self,
            request: super::GetIndexTemplateRequest,
        ) -> crate::metastore::MetastoreResult<super::GetIndexTemplateResponse> {
            self.inner.lock().await.get_index_template(request).await
        }
        async fn find_index_template_matches(
            &self,
            request: super::FindIndexTemplateMatchesRequest,
        ) -> crate::metastore::MetastoreResult<super::FindIndexTemplateMatchesResponse> {
            self.inner.lock().await.find_index_template_matches(request).await
        }
        async fn list_index_templates(
            &self,
            request: super::ListIndexTemplatesRequest,
        ) -> crate::metastore::MetastoreResult<super::ListIndexTemplatesResponse> {
            self.inner.lock().await.list_index_templates(request).await
        }
        async fn delete_index_templates(
            &self,
            request: super::DeleteIndexTemplatesRequest,
        ) -> crate::metastore::MetastoreResult<super::EmptyResponse> {
            self.inner.lock().await.delete_index_templates(request).await
        }
        async fn get_cluster_identity(
            &self,
            request: super::GetClusterIdentityRequest,
        ) -> crate::metastore::MetastoreResult<super::GetClusterIdentityResponse> {
            self.inner.lock().await.get_cluster_identity(request).await
        }
        async fn check_connectivity(&self) -> anyhow::Result<()> {
            self.inner.lock().await.check_connectivity().await
        }
        fn endpoints(&self) -> Vec<quickwit_common::uri::Uri> {
            futures::executor::block_on(self.inner.lock()).endpoints()
        }
    }
}
pub type BoxFuture<T, E> = std::pin::Pin<
    Box<dyn std::future::Future<Output = Result<T, E>> + Send + 'static>,
>;
impl tower::Service<CreateIndexRequest> for InnerMetastoreServiceClient {
    type Response = CreateIndexResponse;
    type Error = crate::metastore::MetastoreError;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, request: CreateIndexRequest) -> Self::Future {
        let svc = self.clone();
        let fut = async move { svc.0.create_index(request).await };
        Box::pin(fut)
    }
}
impl tower::Service<UpdateIndexRequest> for InnerMetastoreServiceClient {
    type Response = IndexMetadataResponse;
    type Error = crate::metastore::MetastoreError;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, request: UpdateIndexRequest) -> Self::Future {
        let svc = self.clone();
        let fut = async move { svc.0.update_index(request).await };
        Box::pin(fut)
    }
}
impl tower::Service<IndexMetadataRequest> for InnerMetastoreServiceClient {
    type Response = IndexMetadataResponse;
    type Error = crate::metastore::MetastoreError;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, request: IndexMetadataRequest) -> Self::Future {
        let svc = self.clone();
        let fut = async move { svc.0.index_metadata(request).await };
        Box::pin(fut)
    }
}
impl tower::Service<IndexesMetadataRequest> for InnerMetastoreServiceClient {
    type Response = IndexesMetadataResponse;
    type Error = crate::metastore::MetastoreError;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, request: IndexesMetadataRequest) -> Self::Future {
        let svc = self.clone();
        let fut = async move { svc.0.indexes_metadata(request).await };
        Box::pin(fut)
    }
}
impl tower::Service<ListIndexesMetadataRequest> for InnerMetastoreServiceClient {
    type Response = ListIndexesMetadataResponse;
    type Error = crate::metastore::MetastoreError;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, request: ListIndexesMetadataRequest) -> Self::Future {
        let svc = self.clone();
        let fut = async move { svc.0.list_indexes_metadata(request).await };
        Box::pin(fut)
    }
}
impl tower::Service<DeleteIndexRequest> for InnerMetastoreServiceClient {
    type Response = EmptyResponse;
    type Error = crate::metastore::MetastoreError;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, request: DeleteIndexRequest) -> Self::Future {
        let svc = self.clone();
        let fut = async move { svc.0.delete_index(request).await };
        Box::pin(fut)
    }
}
impl tower::Service<ListIndexStatsRequest> for InnerMetastoreServiceClient {
    type Response = ListIndexStatsResponse;
    type Error = crate::metastore::MetastoreError;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, request: ListIndexStatsRequest) -> Self::Future {
        let svc = self.clone();
        let fut = async move { svc.0.list_index_stats(request).await };
        Box::pin(fut)
    }
}
impl tower::Service<ListSplitsRequest> for InnerMetastoreServiceClient {
    type Response = MetastoreServiceStream<ListSplitsResponse>;
    type Error = crate::metastore::MetastoreError;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, request: ListSplitsRequest) -> Self::Future {
        let svc = self.clone();
        let fut = async move { svc.0.list_splits(request).await };
        Box::pin(fut)
    }
}
impl tower::Service<StageSplitsRequest> for InnerMetastoreServiceClient {
    type Response = EmptyResponse;
    type Error = crate::metastore::MetastoreError;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, request: StageSplitsRequest) -> Self::Future {
        let svc = self.clone();
        let fut = async move { svc.0.stage_splits(request).await };
        Box::pin(fut)
    }
}
impl tower::Service<PublishSplitsRequest> for InnerMetastoreServiceClient {
    type Response = EmptyResponse;
    type Error = crate::metastore::MetastoreError;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, request: PublishSplitsRequest) -> Self::Future {
        let svc = self.clone();
        let fut = async move { svc.0.publish_splits(request).await };
        Box::pin(fut)
    }
}
impl tower::Service<MarkSplitsForDeletionRequest> for InnerMetastoreServiceClient {
    type Response = EmptyResponse;
    type Error = crate::metastore::MetastoreError;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, request: MarkSplitsForDeletionRequest) -> Self::Future {
        let svc = self.clone();
        let fut = async move { svc.0.mark_splits_for_deletion(request).await };
        Box::pin(fut)
    }
}
impl tower::Service<DeleteSplitsRequest> for InnerMetastoreServiceClient {
    type Response = EmptyResponse;
    type Error = crate::metastore::MetastoreError;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, request: DeleteSplitsRequest) -> Self::Future {
        let svc = self.clone();
        let fut = async move { svc.0.delete_splits(request).await };
        Box::pin(fut)
    }
}
impl tower::Service<AddSourceRequest> for InnerMetastoreServiceClient {
    type Response = EmptyResponse;
    type Error = crate::metastore::MetastoreError;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, request: AddSourceRequest) -> Self::Future {
        let svc = self.clone();
        let fut = async move { svc.0.add_source(request).await };
        Box::pin(fut)
    }
}
impl tower::Service<UpdateSourceRequest> for InnerMetastoreServiceClient {
    type Response = EmptyResponse;
    type Error = crate::metastore::MetastoreError;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, request: UpdateSourceRequest) -> Self::Future {
        let svc = self.clone();
        let fut = async move { svc.0.update_source(request).await };
        Box::pin(fut)
    }
}
impl tower::Service<ToggleSourceRequest> for InnerMetastoreServiceClient {
    type Response = EmptyResponse;
    type Error = crate::metastore::MetastoreError;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, request: ToggleSourceRequest) -> Self::Future {
        let svc = self.clone();
        let fut = async move { svc.0.toggle_source(request).await };
        Box::pin(fut)
    }
}
impl tower::Service<DeleteSourceRequest> for InnerMetastoreServiceClient {
    type Response = EmptyResponse;
    type Error = crate::metastore::MetastoreError;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, request: DeleteSourceRequest) -> Self::Future {
        let svc = self.clone();
        let fut = async move { svc.0.delete_source(request).await };
        Box::pin(fut)
    }
}
impl tower::Service<ResetSourceCheckpointRequest> for InnerMetastoreServiceClient {
    type Response = EmptyResponse;
    type Error = crate::metastore::MetastoreError;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, request: ResetSourceCheckpointRequest) -> Self::Future {
        let svc = self.clone();
        let fut = async move { svc.0.reset_source_checkpoint(request).await };
        Box::pin(fut)
    }
}
impl tower::Service<LastDeleteOpstampRequest> for InnerMetastoreServiceClient {
    type Response = LastDeleteOpstampResponse;
    type Error = crate::metastore::MetastoreError;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, request: LastDeleteOpstampRequest) -> Self::Future {
        let svc = self.clone();
        let fut = async move { svc.0.last_delete_opstamp(request).await };
        Box::pin(fut)
    }
}
impl tower::Service<DeleteQuery> for InnerMetastoreServiceClient {
    type Response = DeleteTask;
    type Error = crate::metastore::MetastoreError;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, request: DeleteQuery) -> Self::Future {
        let svc = self.clone();
        let fut = async move { svc.0.create_delete_task(request).await };
        Box::pin(fut)
    }
}
impl tower::Service<UpdateSplitsDeleteOpstampRequest> for InnerMetastoreServiceClient {
    type Response = UpdateSplitsDeleteOpstampResponse;
    type Error = crate::metastore::MetastoreError;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, request: UpdateSplitsDeleteOpstampRequest) -> Self::Future {
        let svc = self.clone();
        let fut = async move { svc.0.update_splits_delete_opstamp(request).await };
        Box::pin(fut)
    }
}
impl tower::Service<ListDeleteTasksRequest> for InnerMetastoreServiceClient {
    type Response = ListDeleteTasksResponse;
    type Error = crate::metastore::MetastoreError;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, request: ListDeleteTasksRequest) -> Self::Future {
        let svc = self.clone();
        let fut = async move { svc.0.list_delete_tasks(request).await };
        Box::pin(fut)
    }
}
impl tower::Service<ListStaleSplitsRequest> for InnerMetastoreServiceClient {
    type Response = ListSplitsResponse;
    type Error = crate::metastore::MetastoreError;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, request: ListStaleSplitsRequest) -> Self::Future {
        let svc = self.clone();
        let fut = async move { svc.0.list_stale_splits(request).await };
        Box::pin(fut)
    }
}
impl tower::Service<OpenShardsRequest> for InnerMetastoreServiceClient {
    type Response = OpenShardsResponse;
    type Error = crate::metastore::MetastoreError;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, request: OpenShardsRequest) -> Self::Future {
        let svc = self.clone();
        let fut = async move { svc.0.open_shards(request).await };
        Box::pin(fut)
    }
}
impl tower::Service<AcquireShardsRequest> for InnerMetastoreServiceClient {
    type Response = AcquireShardsResponse;
    type Error = crate::metastore::MetastoreError;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, request: AcquireShardsRequest) -> Self::Future {
        let svc = self.clone();
        let fut = async move { svc.0.acquire_shards(request).await };
        Box::pin(fut)
    }
}
impl tower::Service<DeleteShardsRequest> for InnerMetastoreServiceClient {
    type Response = DeleteShardsResponse;
    type Error = crate::metastore::MetastoreError;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, request: DeleteShardsRequest) -> Self::Future {
        let svc = self.clone();
        let fut = async move { svc.0.delete_shards(request).await };
        Box::pin(fut)
    }
}
impl tower::Service<PruneShardsRequest> for InnerMetastoreServiceClient {
    type Response = EmptyResponse;
    type Error = crate::metastore::MetastoreError;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, request: PruneShardsRequest) -> Self::Future {
        let svc = self.clone();
        let fut = async move { svc.0.prune_shards(request).await };
        Box::pin(fut)
    }
}
impl tower::Service<ListShardsRequest> for InnerMetastoreServiceClient {
    type Response = ListShardsResponse;
    type Error = crate::metastore::MetastoreError;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, request: ListShardsRequest) -> Self::Future {
        let svc = self.clone();
        let fut = async move { svc.0.list_shards(request).await };
        Box::pin(fut)
    }
}
impl tower::Service<CreateIndexTemplateRequest> for InnerMetastoreServiceClient {
    type Response = EmptyResponse;
    type Error = crate::metastore::MetastoreError;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, request: CreateIndexTemplateRequest) -> Self::Future {
        let svc = self.clone();
        let fut = async move { svc.0.create_index_template(request).await };
        Box::pin(fut)
    }
}
impl tower::Service<GetIndexTemplateRequest> for InnerMetastoreServiceClient {
    type Response = GetIndexTemplateResponse;
    type Error = crate::metastore::MetastoreError;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, request: GetIndexTemplateRequest) -> Self::Future {
        let svc = self.clone();
        let fut = async move { svc.0.get_index_template(request).await };
        Box::pin(fut)
    }
}
impl tower::Service<FindIndexTemplateMatchesRequest> for InnerMetastoreServiceClient {
    type Response = FindIndexTemplateMatchesResponse;
    type Error = crate::metastore::MetastoreError;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, request: FindIndexTemplateMatchesRequest) -> Self::Future {
        let svc = self.clone();
        let fut = async move { svc.0.find_index_template_matches(request).await };
        Box::pin(fut)
    }
}
impl tower::Service<ListIndexTemplatesRequest> for InnerMetastoreServiceClient {
    type Response = ListIndexTemplatesResponse;
    type Error = crate::metastore::MetastoreError;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, request: ListIndexTemplatesRequest) -> Self::Future {
        let svc = self.clone();
        let fut = async move { svc.0.list_index_templates(request).await };
        Box::pin(fut)
    }
}
impl tower::Service<DeleteIndexTemplatesRequest> for InnerMetastoreServiceClient {
    type Response = EmptyResponse;
    type Error = crate::metastore::MetastoreError;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, request: DeleteIndexTemplatesRequest) -> Self::Future {
        let svc = self.clone();
        let fut = async move { svc.0.delete_index_templates(request).await };
        Box::pin(fut)
    }
}
impl tower::Service<GetClusterIdentityRequest> for InnerMetastoreServiceClient {
    type Response = GetClusterIdentityResponse;
    type Error = crate::metastore::MetastoreError;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, request: GetClusterIdentityRequest) -> Self::Future {
        let svc = self.clone();
        let fut = async move { svc.0.get_cluster_identity(request).await };
        Box::pin(fut)
    }
}
/// A tower service stack is a set of tower services.
#[derive(Debug)]
struct MetastoreServiceTowerServiceStack {
    #[allow(dead_code)]
    inner: InnerMetastoreServiceClient,
    create_index_svc: quickwit_common::tower::BoxService<
        CreateIndexRequest,
        CreateIndexResponse,
        crate::metastore::MetastoreError,
    >,
    update_index_svc: quickwit_common::tower::BoxService<
        UpdateIndexRequest,
        IndexMetadataResponse,
        crate::metastore::MetastoreError,
    >,
    index_metadata_svc: quickwit_common::tower::BoxService<
        IndexMetadataRequest,
        IndexMetadataResponse,
        crate::metastore::MetastoreError,
    >,
    indexes_metadata_svc: quickwit_common::tower::BoxService<
        IndexesMetadataRequest,
        IndexesMetadataResponse,
        crate::metastore::MetastoreError,
    >,
    list_indexes_metadata_svc: quickwit_common::tower::BoxService<
        ListIndexesMetadataRequest,
        ListIndexesMetadataResponse,
        crate::metastore::MetastoreError,
    >,
    delete_index_svc: quickwit_common::tower::BoxService<
        DeleteIndexRequest,
        EmptyResponse,
        crate::metastore::MetastoreError,
    >,
    list_index_stats_svc: quickwit_common::tower::BoxService<
        ListIndexStatsRequest,
        ListIndexStatsResponse,
        crate::metastore::MetastoreError,
    >,
    list_splits_svc: quickwit_common::tower::BoxService<
        ListSplitsRequest,
        MetastoreServiceStream<ListSplitsResponse>,
        crate::metastore::MetastoreError,
    >,
    stage_splits_svc: quickwit_common::tower::BoxService<
        StageSplitsRequest,
        EmptyResponse,
        crate::metastore::MetastoreError,
    >,
    publish_splits_svc: quickwit_common::tower::BoxService<
        PublishSplitsRequest,
        EmptyResponse,
        crate::metastore::MetastoreError,
    >,
    mark_splits_for_deletion_svc: quickwit_common::tower::BoxService<
        MarkSplitsForDeletionRequest,
        EmptyResponse,
        crate::metastore::MetastoreError,
    >,
    delete_splits_svc: quickwit_common::tower::BoxService<
        DeleteSplitsRequest,
        EmptyResponse,
        crate::metastore::MetastoreError,
    >,
    add_source_svc: quickwit_common::tower::BoxService<
        AddSourceRequest,
        EmptyResponse,
        crate::metastore::MetastoreError,
    >,
    update_source_svc: quickwit_common::tower::BoxService<
        UpdateSourceRequest,
        EmptyResponse,
        crate::metastore::MetastoreError,
    >,
    toggle_source_svc: quickwit_common::tower::BoxService<
        ToggleSourceRequest,
        EmptyResponse,
        crate::metastore::MetastoreError,
    >,
    delete_source_svc: quickwit_common::tower::BoxService<
        DeleteSourceRequest,
        EmptyResponse,
        crate::metastore::MetastoreError,
    >,
    reset_source_checkpoint_svc: quickwit_common::tower::BoxService<
        ResetSourceCheckpointRequest,
        EmptyResponse,
        crate::metastore::MetastoreError,
    >,
    last_delete_opstamp_svc: quickwit_common::tower::BoxService<
        LastDeleteOpstampRequest,
        LastDeleteOpstampResponse,
        crate::metastore::MetastoreError,
    >,
    create_delete_task_svc: quickwit_common::tower::BoxService<
        DeleteQuery,
        DeleteTask,
        crate::metastore::MetastoreError,
    >,
    update_splits_delete_opstamp_svc: quickwit_common::tower::BoxService<
        UpdateSplitsDeleteOpstampRequest,
        UpdateSplitsDeleteOpstampResponse,
        crate::metastore::MetastoreError,
    >,
    list_delete_tasks_svc: quickwit_common::tower::BoxService<
        ListDeleteTasksRequest,
        ListDeleteTasksResponse,
        crate::metastore::MetastoreError,
    >,
    list_stale_splits_svc: quickwit_common::tower::BoxService<
        ListStaleSplitsRequest,
        ListSplitsResponse,
        crate::metastore::MetastoreError,
    >,
    open_shards_svc: quickwit_common::tower::BoxService<
        OpenShardsRequest,
        OpenShardsResponse,
        crate::metastore::MetastoreError,
    >,
    acquire_shards_svc: quickwit_common::tower::BoxService<
        AcquireShardsRequest,
        AcquireShardsResponse,
        crate::metastore::MetastoreError,
    >,
    delete_shards_svc: quickwit_common::tower::BoxService<
        DeleteShardsRequest,
        DeleteShardsResponse,
        crate::metastore::MetastoreError,
    >,
    prune_shards_svc: quickwit_common::tower::BoxService<
        PruneShardsRequest,
        EmptyResponse,
        crate::metastore::MetastoreError,
    >,
    list_shards_svc: quickwit_common::tower::BoxService<
        ListShardsRequest,
        ListShardsResponse,
        crate::metastore::MetastoreError,
    >,
    create_index_template_svc: quickwit_common::tower::BoxService<
        CreateIndexTemplateRequest,
        EmptyResponse,
        crate::metastore::MetastoreError,
    >,
    get_index_template_svc: quickwit_common::tower::BoxService<
        GetIndexTemplateRequest,
        GetIndexTemplateResponse,
        crate::metastore::MetastoreError,
    >,
    find_index_template_matches_svc: quickwit_common::tower::BoxService<
        FindIndexTemplateMatchesRequest,
        FindIndexTemplateMatchesResponse,
        crate::metastore::MetastoreError,
    >,
    list_index_templates_svc: quickwit_common::tower::BoxService<
        ListIndexTemplatesRequest,
        ListIndexTemplatesResponse,
        crate::metastore::MetastoreError,
    >,
    delete_index_templates_svc: quickwit_common::tower::BoxService<
        DeleteIndexTemplatesRequest,
        EmptyResponse,
        crate::metastore::MetastoreError,
    >,
    get_cluster_identity_svc: quickwit_common::tower::BoxService<
        GetClusterIdentityRequest,
        GetClusterIdentityResponse,
        crate::metastore::MetastoreError,
    >,
}
#[async_trait::async_trait]
impl MetastoreService for MetastoreServiceTowerServiceStack {
    async fn create_index(
        &self,
        request: CreateIndexRequest,
    ) -> crate::metastore::MetastoreResult<CreateIndexResponse> {
        self.create_index_svc.clone().ready().await?.call(request).await
    }
    async fn update_index(
        &self,
        request: UpdateIndexRequest,
    ) -> crate::metastore::MetastoreResult<IndexMetadataResponse> {
        self.update_index_svc.clone().ready().await?.call(request).await
    }
    async fn index_metadata(
        &self,
        request: IndexMetadataRequest,
    ) -> crate::metastore::MetastoreResult<IndexMetadataResponse> {
        self.index_metadata_svc.clone().ready().await?.call(request).await
    }
    async fn indexes_metadata(
        &self,
        request: IndexesMetadataRequest,
    ) -> crate::metastore::MetastoreResult<IndexesMetadataResponse> {
        self.indexes_metadata_svc.clone().ready().await?.call(request).await
    }
    async fn list_indexes_metadata(
        &self,
        request: ListIndexesMetadataRequest,
    ) -> crate::metastore::MetastoreResult<ListIndexesMetadataResponse> {
        self.list_indexes_metadata_svc.clone().ready().await?.call(request).await
    }
    async fn delete_index(
        &self,
        request: DeleteIndexRequest,
    ) -> crate::metastore::MetastoreResult<EmptyResponse> {
        self.delete_index_svc.clone().ready().await?.call(request).await
    }
    async fn list_index_stats(
        &self,
        request: ListIndexStatsRequest,
    ) -> crate::metastore::MetastoreResult<ListIndexStatsResponse> {
        self.list_index_stats_svc.clone().ready().await?.call(request).await
    }
    async fn list_splits(
        &self,
        request: ListSplitsRequest,
    ) -> crate::metastore::MetastoreResult<MetastoreServiceStream<ListSplitsResponse>> {
        self.list_splits_svc.clone().ready().await?.call(request).await
    }
    async fn stage_splits(
        &self,
        request: StageSplitsRequest,
    ) -> crate::metastore::MetastoreResult<EmptyResponse> {
        self.stage_splits_svc.clone().ready().await?.call(request).await
    }
    async fn publish_splits(
        &self,
        request: PublishSplitsRequest,
    ) -> crate::metastore::MetastoreResult<EmptyResponse> {
        self.publish_splits_svc.clone().ready().await?.call(request).await
    }
    async fn mark_splits_for_deletion(
        &self,
        request: MarkSplitsForDeletionRequest,
    ) -> crate::metastore::MetastoreResult<EmptyResponse> {
        self.mark_splits_for_deletion_svc.clone().ready().await?.call(request).await
    }
    async fn delete_splits(
        &self,
        request: DeleteSplitsRequest,
    ) -> crate::metastore::MetastoreResult<EmptyResponse> {
        self.delete_splits_svc.clone().ready().await?.call(request).await
    }
    async fn add_source(
        &self,
        request: AddSourceRequest,
    ) -> crate::metastore::MetastoreResult<EmptyResponse> {
        self.add_source_svc.clone().ready().await?.call(request).await
    }
    async fn update_source(
        &self,
        request: UpdateSourceRequest,
    ) -> crate::metastore::MetastoreResult<EmptyResponse> {
        self.update_source_svc.clone().ready().await?.call(request).await
    }
    async fn toggle_source(
        &self,
        request: ToggleSourceRequest,
    ) -> crate::metastore::MetastoreResult<EmptyResponse> {
        self.toggle_source_svc.clone().ready().await?.call(request).await
    }
    async fn delete_source(
        &self,
        request: DeleteSourceRequest,
    ) -> crate::metastore::MetastoreResult<EmptyResponse> {
        self.delete_source_svc.clone().ready().await?.call(request).await
    }
    async fn reset_source_checkpoint(
        &self,
        request: ResetSourceCheckpointRequest,
    ) -> crate::metastore::MetastoreResult<EmptyResponse> {
        self.reset_source_checkpoint_svc.clone().ready().await?.call(request).await
    }
    async fn last_delete_opstamp(
        &self,
        request: LastDeleteOpstampRequest,
    ) -> crate::metastore::MetastoreResult<LastDeleteOpstampResponse> {
        self.last_delete_opstamp_svc.clone().ready().await?.call(request).await
    }
    async fn create_delete_task(
        &self,
        request: DeleteQuery,
    ) -> crate::metastore::MetastoreResult<DeleteTask> {
        self.create_delete_task_svc.clone().ready().await?.call(request).await
    }
    async fn update_splits_delete_opstamp(
        &self,
        request: UpdateSplitsDeleteOpstampRequest,
    ) -> crate::metastore::MetastoreResult<UpdateSplitsDeleteOpstampResponse> {
        self.update_splits_delete_opstamp_svc.clone().ready().await?.call(request).await
    }
    async fn list_delete_tasks(
        &self,
        request: ListDeleteTasksRequest,
    ) -> crate::metastore::MetastoreResult<ListDeleteTasksResponse> {
        self.list_delete_tasks_svc.clone().ready().await?.call(request).await
    }
    async fn list_stale_splits(
        &self,
        request: ListStaleSplitsRequest,
    ) -> crate::metastore::MetastoreResult<ListSplitsResponse> {
        self.list_stale_splits_svc.clone().ready().await?.call(request).await
    }
    async fn open_shards(
        &self,
        request: OpenShardsRequest,
    ) -> crate::metastore::MetastoreResult<OpenShardsResponse> {
        self.open_shards_svc.clone().ready().await?.call(request).await
    }
    async fn acquire_shards(
        &self,
        request: AcquireShardsRequest,
    ) -> crate::metastore::MetastoreResult<AcquireShardsResponse> {
        self.acquire_shards_svc.clone().ready().await?.call(request).await
    }
    async fn delete_shards(
        &self,
        request: DeleteShardsRequest,
    ) -> crate::metastore::MetastoreResult<DeleteShardsResponse> {
        self.delete_shards_svc.clone().ready().await?.call(request).await
    }
    async fn prune_shards(
        &self,
        request: PruneShardsRequest,
    ) -> crate::metastore::MetastoreResult<EmptyResponse> {
        self.prune_shards_svc.clone().ready().await?.call(request).await
    }
    async fn list_shards(
        &self,
        request: ListShardsRequest,
    ) -> crate::metastore::MetastoreResult<ListShardsResponse> {
        self.list_shards_svc.clone().ready().await?.call(request).await
    }
    async fn create_index_template(
        &self,
        request: CreateIndexTemplateRequest,
    ) -> crate::metastore::MetastoreResult<EmptyResponse> {
        self.create_index_template_svc.clone().ready().await?.call(request).await
    }
    async fn get_index_template(
        &self,
        request: GetIndexTemplateRequest,
    ) -> crate::metastore::MetastoreResult<GetIndexTemplateResponse> {
        self.get_index_template_svc.clone().ready().await?.call(request).await
    }
    async fn find_index_template_matches(
        &self,
        request: FindIndexTemplateMatchesRequest,
    ) -> crate::metastore::MetastoreResult<FindIndexTemplateMatchesResponse> {
        self.find_index_template_matches_svc.clone().ready().await?.call(request).await
    }
    async fn list_index_templates(
        &self,
        request: ListIndexTemplatesRequest,
    ) -> crate::metastore::MetastoreResult<ListIndexTemplatesResponse> {
        self.list_index_templates_svc.clone().ready().await?.call(request).await
    }
    async fn delete_index_templates(
        &self,
        request: DeleteIndexTemplatesRequest,
    ) -> crate::metastore::MetastoreResult<EmptyResponse> {
        self.delete_index_templates_svc.clone().ready().await?.call(request).await
    }
    async fn get_cluster_identity(
        &self,
        request: GetClusterIdentityRequest,
    ) -> crate::metastore::MetastoreResult<GetClusterIdentityResponse> {
        self.get_cluster_identity_svc.clone().ready().await?.call(request).await
    }
    async fn check_connectivity(&self) -> anyhow::Result<()> {
        self.inner.0.check_connectivity().await
    }
    fn endpoints(&self) -> Vec<quickwit_common::uri::Uri> {
        self.inner.0.endpoints()
    }
}
type CreateIndexLayer = quickwit_common::tower::BoxLayer<
    quickwit_common::tower::BoxService<
        CreateIndexRequest,
        CreateIndexResponse,
        crate::metastore::MetastoreError,
    >,
    CreateIndexRequest,
    CreateIndexResponse,
    crate::metastore::MetastoreError,
>;
type UpdateIndexLayer = quickwit_common::tower::BoxLayer<
    quickwit_common::tower::BoxService<
        UpdateIndexRequest,
        IndexMetadataResponse,
        crate::metastore::MetastoreError,
    >,
    UpdateIndexRequest,
    IndexMetadataResponse,
    crate::metastore::MetastoreError,
>;
type IndexMetadataLayer = quickwit_common::tower::BoxLayer<
    quickwit_common::tower::BoxService<
        IndexMetadataRequest,
        IndexMetadataResponse,
        crate::metastore::MetastoreError,
    >,
    IndexMetadataRequest,
    IndexMetadataResponse,
    crate::metastore::MetastoreError,
>;
type IndexesMetadataLayer = quickwit_common::tower::BoxLayer<
    quickwit_common::tower::BoxService<
        IndexesMetadataRequest,
        IndexesMetadataResponse,
        crate::metastore::MetastoreError,
    >,
    IndexesMetadataRequest,
    IndexesMetadataResponse,
    crate::metastore::MetastoreError,
>;
type ListIndexesMetadataLayer = quickwit_common::tower::BoxLayer<
    quickwit_common::tower::BoxService<
        ListIndexesMetadataRequest,
        ListIndexesMetadataResponse,
        crate::metastore::MetastoreError,
    >,
    ListIndexesMetadataRequest,
    ListIndexesMetadataResponse,
    crate::metastore::MetastoreError,
>;
type DeleteIndexLayer = quickwit_common::tower::BoxLayer<
    quickwit_common::tower::BoxService<
        DeleteIndexRequest,
        EmptyResponse,
        crate::metastore::MetastoreError,
    >,
    DeleteIndexRequest,
    EmptyResponse,
    crate::metastore::MetastoreError,
>;
type ListIndexStatsLayer = quickwit_common::tower::BoxLayer<
    quickwit_common::tower::BoxService<
        ListIndexStatsRequest,
        ListIndexStatsResponse,
        crate::metastore::MetastoreError,
    >,
    ListIndexStatsRequest,
    ListIndexStatsResponse,
    crate::metastore::MetastoreError,
>;
type ListSplitsLayer = quickwit_common::tower::BoxLayer<
    quickwit_common::tower::BoxService<
        ListSplitsRequest,
        MetastoreServiceStream<ListSplitsResponse>,
        crate::metastore::MetastoreError,
    >,
    ListSplitsRequest,
    MetastoreServiceStream<ListSplitsResponse>,
    crate::metastore::MetastoreError,
>;
type StageSplitsLayer = quickwit_common::tower::BoxLayer<
    quickwit_common::tower::BoxService<
        StageSplitsRequest,
        EmptyResponse,
        crate::metastore::MetastoreError,
    >,
    StageSplitsRequest,
    EmptyResponse,
    crate::metastore::MetastoreError,
>;
type PublishSplitsLayer = quickwit_common::tower::BoxLayer<
    quickwit_common::tower::BoxService<
        PublishSplitsRequest,
        EmptyResponse,
        crate::metastore::MetastoreError,
    >,
    PublishSplitsRequest,
    EmptyResponse,
    crate::metastore::MetastoreError,
>;
type MarkSplitsForDeletionLayer = quickwit_common::tower::BoxLayer<
    quickwit_common::tower::BoxService<
        MarkSplitsForDeletionRequest,
        EmptyResponse,
        crate::metastore::MetastoreError,
    >,
    MarkSplitsForDeletionRequest,
    EmptyResponse,
    crate::metastore::MetastoreError,
>;
type DeleteSplitsLayer = quickwit_common::tower::BoxLayer<
    quickwit_common::tower::BoxService<
        DeleteSplitsRequest,
        EmptyResponse,
        crate::metastore::MetastoreError,
    >,
    DeleteSplitsRequest,
    EmptyResponse,
    crate::metastore::MetastoreError,
>;
type AddSourceLayer = quickwit_common::tower::BoxLayer<
    quickwit_common::tower::BoxService<
        AddSourceRequest,
        EmptyResponse,
        crate::metastore::MetastoreError,
    >,
    AddSourceRequest,
    EmptyResponse,
    crate::metastore::MetastoreError,
>;
type UpdateSourceLayer = quickwit_common::tower::BoxLayer<
    quickwit_common::tower::BoxService<
        UpdateSourceRequest,
        EmptyResponse,
        crate::metastore::MetastoreError,
    >,
    UpdateSourceRequest,
    EmptyResponse,
    crate::metastore::MetastoreError,
>;
type ToggleSourceLayer = quickwit_common::tower::BoxLayer<
    quickwit_common::tower::BoxService<
        ToggleSourceRequest,
        EmptyResponse,
        crate::metastore::MetastoreError,
    >,
    ToggleSourceRequest,
    EmptyResponse,
    crate::metastore::MetastoreError,
>;
type DeleteSourceLayer = quickwit_common::tower::BoxLayer<
    quickwit_common::tower::BoxService<
        DeleteSourceRequest,
        EmptyResponse,
        crate::metastore::MetastoreError,
    >,
    DeleteSourceRequest,
    EmptyResponse,
    crate::metastore::MetastoreError,
>;
type ResetSourceCheckpointLayer = quickwit_common::tower::BoxLayer<
    quickwit_common::tower::BoxService<
        ResetSourceCheckpointRequest,
        EmptyResponse,
        crate::metastore::MetastoreError,
    >,
    ResetSourceCheckpointRequest,
    EmptyResponse,
    crate::metastore::MetastoreError,
>;
type LastDeleteOpstampLayer = quickwit_common::tower::BoxLayer<
    quickwit_common::tower::BoxService<
        LastDeleteOpstampRequest,
        LastDeleteOpstampResponse,
        crate::metastore::MetastoreError,
    >,
    LastDeleteOpstampRequest,
    LastDeleteOpstampResponse,
    crate::metastore::MetastoreError,
>;
type CreateDeleteTaskLayer = quickwit_common::tower::BoxLayer<
    quickwit_common::tower::BoxService<
        DeleteQuery,
        DeleteTask,
        crate::metastore::MetastoreError,
    >,
    DeleteQuery,
    DeleteTask,
    crate::metastore::MetastoreError,
>;
type UpdateSplitsDeleteOpstampLayer = quickwit_common::tower::BoxLayer<
    quickwit_common::tower::BoxService<
        UpdateSplitsDeleteOpstampRequest,
        UpdateSplitsDeleteOpstampResponse,
        crate::metastore::MetastoreError,
    >,
    UpdateSplitsDeleteOpstampRequest,
    UpdateSplitsDeleteOpstampResponse,
    crate::metastore::MetastoreError,
>;
type ListDeleteTasksLayer = quickwit_common::tower::BoxLayer<
    quickwit_common::tower::BoxService<
        ListDeleteTasksRequest,
        ListDeleteTasksResponse,
        crate::metastore::MetastoreError,
    >,
    ListDeleteTasksRequest,
    ListDeleteTasksResponse,
    crate::metastore::MetastoreError,
>;
type ListStaleSplitsLayer = quickwit_common::tower::BoxLayer<
    quickwit_common::tower::BoxService<
        ListStaleSplitsRequest,
        ListSplitsResponse,
        crate::metastore::MetastoreError,
    >,
    ListStaleSplitsRequest,
    ListSplitsResponse,
    crate::metastore::MetastoreError,
>;
type OpenShardsLayer = quickwit_common::tower::BoxLayer<
    quickwit_common::tower::BoxService<
        OpenShardsRequest,
        OpenShardsResponse,
        crate::metastore::MetastoreError,
    >,
    OpenShardsRequest,
    OpenShardsResponse,
    crate::metastore::MetastoreError,
>;
type AcquireShardsLayer = quickwit_common::tower::BoxLayer<
    quickwit_common::tower::BoxService<
        AcquireShardsRequest,
        AcquireShardsResponse,
        crate::metastore::MetastoreError,
    >,
    AcquireShardsRequest,
    AcquireShardsResponse,
    crate::metastore::MetastoreError,
>;
type DeleteShardsLayer = quickwit_common::tower::BoxLayer<
    quickwit_common::tower::BoxService<
        DeleteShardsRequest,
        DeleteShardsResponse,
        crate::metastore::MetastoreError,
    >,
    DeleteShardsRequest,
    DeleteShardsResponse,
    crate::metastore::MetastoreError,
>;
type PruneShardsLayer = quickwit_common::tower::BoxLayer<
    quickwit_common::tower::BoxService<
        PruneShardsRequest,
        EmptyResponse,
        crate::metastore::MetastoreError,
    >,
    PruneShardsRequest,
    EmptyResponse,
    crate::metastore::MetastoreError,
>;
type ListShardsLayer = quickwit_common::tower::BoxLayer<
    quickwit_common::tower::BoxService<
        ListShardsRequest,
        ListShardsResponse,
        crate::metastore::MetastoreError,
    >,
    ListShardsRequest,
    ListShardsResponse,
    crate::metastore::MetastoreError,
>;
type CreateIndexTemplateLayer = quickwit_common::tower::BoxLayer<
    quickwit_common::tower::BoxService<
        CreateIndexTemplateRequest,
        EmptyResponse,
        crate::metastore::MetastoreError,
    >,
    CreateIndexTemplateRequest,
    EmptyResponse,
    crate::metastore::MetastoreError,
>;
type GetIndexTemplateLayer = quickwit_common::tower::BoxLayer<
    quickwit_common::tower::BoxService<
        GetIndexTemplateRequest,
        GetIndexTemplateResponse,
        crate::metastore::MetastoreError,
    >,
    GetIndexTemplateRequest,
    GetIndexTemplateResponse,
    crate::metastore::MetastoreError,
>;
type FindIndexTemplateMatchesLayer = quickwit_common::tower::BoxLayer<
    quickwit_common::tower::BoxService<
        FindIndexTemplateMatchesRequest,
        FindIndexTemplateMatchesResponse,
        crate::metastore::MetastoreError,
    >,
    FindIndexTemplateMatchesRequest,
    FindIndexTemplateMatchesResponse,
    crate::metastore::MetastoreError,
>;
type ListIndexTemplatesLayer = quickwit_common::tower::BoxLayer<
    quickwit_common::tower::BoxService<
        ListIndexTemplatesRequest,
        ListIndexTemplatesResponse,
        crate::metastore::MetastoreError,
    >,
    ListIndexTemplatesRequest,
    ListIndexTemplatesResponse,
    crate::metastore::MetastoreError,
>;
type DeleteIndexTemplatesLayer = quickwit_common::tower::BoxLayer<
    quickwit_common::tower::BoxService<
        DeleteIndexTemplatesRequest,
        EmptyResponse,
        crate::metastore::MetastoreError,
    >,
    DeleteIndexTemplatesRequest,
    EmptyResponse,
    crate::metastore::MetastoreError,
>;
type GetClusterIdentityLayer = quickwit_common::tower::BoxLayer<
    quickwit_common::tower::BoxService<
        GetClusterIdentityRequest,
        GetClusterIdentityResponse,
        crate::metastore::MetastoreError,
    >,
    GetClusterIdentityRequest,
    GetClusterIdentityResponse,
    crate::metastore::MetastoreError,
>;
#[derive(Debug, Default)]
pub struct MetastoreServiceTowerLayerStack {
    create_index_layers: Vec<CreateIndexLayer>,
    update_index_layers: Vec<UpdateIndexLayer>,
    index_metadata_layers: Vec<IndexMetadataLayer>,
    indexes_metadata_layers: Vec<IndexesMetadataLayer>,
    list_indexes_metadata_layers: Vec<ListIndexesMetadataLayer>,
    delete_index_layers: Vec<DeleteIndexLayer>,
    list_index_stats_layers: Vec<ListIndexStatsLayer>,
    list_splits_layers: Vec<ListSplitsLayer>,
    stage_splits_layers: Vec<StageSplitsLayer>,
    publish_splits_layers: Vec<PublishSplitsLayer>,
    mark_splits_for_deletion_layers: Vec<MarkSplitsForDeletionLayer>,
    delete_splits_layers: Vec<DeleteSplitsLayer>,
    add_source_layers: Vec<AddSourceLayer>,
    update_source_layers: Vec<UpdateSourceLayer>,
    toggle_source_layers: Vec<ToggleSourceLayer>,
    delete_source_layers: Vec<DeleteSourceLayer>,
    reset_source_checkpoint_layers: Vec<ResetSourceCheckpointLayer>,
    last_delete_opstamp_layers: Vec<LastDeleteOpstampLayer>,
    create_delete_task_layers: Vec<CreateDeleteTaskLayer>,
    update_splits_delete_opstamp_layers: Vec<UpdateSplitsDeleteOpstampLayer>,
    list_delete_tasks_layers: Vec<ListDeleteTasksLayer>,
    list_stale_splits_layers: Vec<ListStaleSplitsLayer>,
    open_shards_layers: Vec<OpenShardsLayer>,
    acquire_shards_layers: Vec<AcquireShardsLayer>,
    delete_shards_layers: Vec<DeleteShardsLayer>,
    prune_shards_layers: Vec<PruneShardsLayer>,
    list_shards_layers: Vec<ListShardsLayer>,
    create_index_template_layers: Vec<CreateIndexTemplateLayer>,
    get_index_template_layers: Vec<GetIndexTemplateLayer>,
    find_index_template_matches_layers: Vec<FindIndexTemplateMatchesLayer>,
    list_index_templates_layers: Vec<ListIndexTemplatesLayer>,
    delete_index_templates_layers: Vec<DeleteIndexTemplatesLayer>,
    get_cluster_identity_layers: Vec<GetClusterIdentityLayer>,
}
impl MetastoreServiceTowerLayerStack {
    pub fn stack_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    CreateIndexRequest,
                    CreateIndexResponse,
                    crate::metastore::MetastoreError,
                >,
            > + Clone + Send + Sync + 'static,
        <L as tower::Layer<
            quickwit_common::tower::BoxService<
                CreateIndexRequest,
                CreateIndexResponse,
                crate::metastore::MetastoreError,
            >,
        >>::Service: tower::Service<
                CreateIndexRequest,
                Response = CreateIndexResponse,
                Error = crate::metastore::MetastoreError,
            > + Clone + Send + Sync + 'static,
        <<L as tower::Layer<
            quickwit_common::tower::BoxService<
                CreateIndexRequest,
                CreateIndexResponse,
                crate::metastore::MetastoreError,
            >,
        >>::Service as tower::Service<CreateIndexRequest>>::Future: Send + 'static,
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    UpdateIndexRequest,
                    IndexMetadataResponse,
                    crate::metastore::MetastoreError,
                >,
            > + Clone + Send + Sync + 'static,
        <L as tower::Layer<
            quickwit_common::tower::BoxService<
                UpdateIndexRequest,
                IndexMetadataResponse,
                crate::metastore::MetastoreError,
            >,
        >>::Service: tower::Service<
                UpdateIndexRequest,
                Response = IndexMetadataResponse,
                Error = crate::metastore::MetastoreError,
            > + Clone + Send + Sync + 'static,
        <<L as tower::Layer<
            quickwit_common::tower::BoxService<
                UpdateIndexRequest,
                IndexMetadataResponse,
                crate::metastore::MetastoreError,
            >,
        >>::Service as tower::Service<UpdateIndexRequest>>::Future: Send + 'static,
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    IndexMetadataRequest,
                    IndexMetadataResponse,
                    crate::metastore::MetastoreError,
                >,
            > + Clone + Send + Sync + 'static,
        <L as tower::Layer<
            quickwit_common::tower::BoxService<
                IndexMetadataRequest,
                IndexMetadataResponse,
                crate::metastore::MetastoreError,
            >,
        >>::Service: tower::Service<
                IndexMetadataRequest,
                Response = IndexMetadataResponse,
                Error = crate::metastore::MetastoreError,
            > + Clone + Send + Sync + 'static,
        <<L as tower::Layer<
            quickwit_common::tower::BoxService<
                IndexMetadataRequest,
                IndexMetadataResponse,
                crate::metastore::MetastoreError,
            >,
        >>::Service as tower::Service<IndexMetadataRequest>>::Future: Send + 'static,
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    IndexesMetadataRequest,
                    IndexesMetadataResponse,
                    crate::metastore::MetastoreError,
                >,
            > + Clone + Send + Sync + 'static,
        <L as tower::Layer<
            quickwit_common::tower::BoxService<
                IndexesMetadataRequest,
                IndexesMetadataResponse,
                crate::metastore::MetastoreError,
            >,
        >>::Service: tower::Service<
                IndexesMetadataRequest,
                Response = IndexesMetadataResponse,
                Error = crate::metastore::MetastoreError,
            > + Clone + Send + Sync + 'static,
        <<L as tower::Layer<
            quickwit_common::tower::BoxService<
                IndexesMetadataRequest,
                IndexesMetadataResponse,
                crate::metastore::MetastoreError,
            >,
        >>::Service as tower::Service<IndexesMetadataRequest>>::Future: Send + 'static,
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    ListIndexesMetadataRequest,
                    ListIndexesMetadataResponse,
                    crate::metastore::MetastoreError,
                >,
            > + Clone + Send + Sync + 'static,
        <L as tower::Layer<
            quickwit_common::tower::BoxService<
                ListIndexesMetadataRequest,
                ListIndexesMetadataResponse,
                crate::metastore::MetastoreError,
            >,
        >>::Service: tower::Service<
                ListIndexesMetadataRequest,
                Response = ListIndexesMetadataResponse,
                Error = crate::metastore::MetastoreError,
            > + Clone + Send + Sync + 'static,
        <<L as tower::Layer<
            quickwit_common::tower::BoxService<
                ListIndexesMetadataRequest,
                ListIndexesMetadataResponse,
                crate::metastore::MetastoreError,
            >,
        >>::Service as tower::Service<
            ListIndexesMetadataRequest,
        >>::Future: Send + 'static,
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    DeleteIndexRequest,
                    EmptyResponse,
                    crate::metastore::MetastoreError,
                >,
            > + Clone + Send + Sync + 'static,
        <L as tower::Layer<
            quickwit_common::tower::BoxService<
                DeleteIndexRequest,
                EmptyResponse,
                crate::metastore::MetastoreError,
            >,
        >>::Service: tower::Service<
                DeleteIndexRequest,
                Response = EmptyResponse,
                Error = crate::metastore::MetastoreError,
            > + Clone + Send + Sync + 'static,
        <<L as tower::Layer<
            quickwit_common::tower::BoxService<
                DeleteIndexRequest,
                EmptyResponse,
                crate::metastore::MetastoreError,
            >,
        >>::Service as tower::Service<DeleteIndexRequest>>::Future: Send + 'static,
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    ListIndexStatsRequest,
                    ListIndexStatsResponse,
                    crate::metastore::MetastoreError,
                >,
            > + Clone + Send + Sync + 'static,
        <L as tower::Layer<
            quickwit_common::tower::BoxService<
                ListIndexStatsRequest,
                ListIndexStatsResponse,
                crate::metastore::MetastoreError,
            >,
        >>::Service: tower::Service<
                ListIndexStatsRequest,
                Response = ListIndexStatsResponse,
                Error = crate::metastore::MetastoreError,
            > + Clone + Send + Sync + 'static,
        <<L as tower::Layer<
            quickwit_common::tower::BoxService<
                ListIndexStatsRequest,
                ListIndexStatsResponse,
                crate::metastore::MetastoreError,
            >,
        >>::Service as tower::Service<ListIndexStatsRequest>>::Future: Send + 'static,
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    ListSplitsRequest,
                    MetastoreServiceStream<ListSplitsResponse>,
                    crate::metastore::MetastoreError,
                >,
            > + Clone + Send + Sync + 'static,
        <L as tower::Layer<
            quickwit_common::tower::BoxService<
                ListSplitsRequest,
                MetastoreServiceStream<ListSplitsResponse>,
                crate::metastore::MetastoreError,
            >,
        >>::Service: tower::Service<
                ListSplitsRequest,
                Response = MetastoreServiceStream<ListSplitsResponse>,
                Error = crate::metastore::MetastoreError,
            > + Clone + Send + Sync + 'static,
        <<L as tower::Layer<
            quickwit_common::tower::BoxService<
                ListSplitsRequest,
                MetastoreServiceStream<ListSplitsResponse>,
                crate::metastore::MetastoreError,
            >,
        >>::Service as tower::Service<ListSplitsRequest>>::Future: Send + 'static,
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    StageSplitsRequest,
                    EmptyResponse,
                    crate::metastore::MetastoreError,
                >,
            > + Clone + Send + Sync + 'static,
        <L as tower::Layer<
            quickwit_common::tower::BoxService<
                StageSplitsRequest,
                EmptyResponse,
                crate::metastore::MetastoreError,
            >,
        >>::Service: tower::Service<
                StageSplitsRequest,
                Response = EmptyResponse,
                Error = crate::metastore::MetastoreError,
            > + Clone + Send + Sync + 'static,
        <<L as tower::Layer<
            quickwit_common::tower::BoxService<
                StageSplitsRequest,
                EmptyResponse,
                crate::metastore::MetastoreError,
            >,
        >>::Service as tower::Service<StageSplitsRequest>>::Future: Send + 'static,
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    PublishSplitsRequest,
                    EmptyResponse,
                    crate::metastore::MetastoreError,
                >,
            > + Clone + Send + Sync + 'static,
        <L as tower::Layer<
            quickwit_common::tower::BoxService<
                PublishSplitsRequest,
                EmptyResponse,
                crate::metastore::MetastoreError,
            >,
        >>::Service: tower::Service<
                PublishSplitsRequest,
                Response = EmptyResponse,
                Error = crate::metastore::MetastoreError,
            > + Clone + Send + Sync + 'static,
        <<L as tower::Layer<
            quickwit_common::tower::BoxService<
                PublishSplitsRequest,
                EmptyResponse,
                crate::metastore::MetastoreError,
            >,
        >>::Service as tower::Service<PublishSplitsRequest>>::Future: Send + 'static,
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    MarkSplitsForDeletionRequest,
                    EmptyResponse,
                    crate::metastore::MetastoreError,
                >,
            > + Clone + Send + Sync + 'static,
        <L as tower::Layer<
            quickwit_common::tower::BoxService<
                MarkSplitsForDeletionRequest,
                EmptyResponse,
                crate::metastore::MetastoreError,
            >,
        >>::Service: tower::Service<
                MarkSplitsForDeletionRequest,
                Response = EmptyResponse,
                Error = crate::metastore::MetastoreError,
            > + Clone + Send + Sync + 'static,
        <<L as tower::Layer<
            quickwit_common::tower::BoxService<
                MarkSplitsForDeletionRequest,
                EmptyResponse,
                crate::metastore::MetastoreError,
            >,
        >>::Service as tower::Service<
            MarkSplitsForDeletionRequest,
        >>::Future: Send + 'static,
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    DeleteSplitsRequest,
                    EmptyResponse,
                    crate::metastore::MetastoreError,
                >,
            > + Clone + Send + Sync + 'static,
        <L as tower::Layer<
            quickwit_common::tower::BoxService<
                DeleteSplitsRequest,
                EmptyResponse,
                crate::metastore::MetastoreError,
            >,
        >>::Service: tower::Service<
                DeleteSplitsRequest,
                Response = EmptyResponse,
                Error = crate::metastore::MetastoreError,
            > + Clone + Send + Sync + 'static,
        <<L as tower::Layer<
            quickwit_common::tower::BoxService<
                DeleteSplitsRequest,
                EmptyResponse,
                crate::metastore::MetastoreError,
            >,
        >>::Service as tower::Service<DeleteSplitsRequest>>::Future: Send + 'static,
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    AddSourceRequest,
                    EmptyResponse,
                    crate::metastore::MetastoreError,
                >,
            > + Clone + Send + Sync + 'static,
        <L as tower::Layer<
            quickwit_common::tower::BoxService<
                AddSourceRequest,
                EmptyResponse,
                crate::metastore::MetastoreError,
            >,
        >>::Service: tower::Service<
                AddSourceRequest,
                Response = EmptyResponse,
                Error = crate::metastore::MetastoreError,
            > + Clone + Send + Sync + 'static,
        <<L as tower::Layer<
            quickwit_common::tower::BoxService<
                AddSourceRequest,
                EmptyResponse,
                crate::metastore::MetastoreError,
            >,
        >>::Service as tower::Service<AddSourceRequest>>::Future: Send + 'static,
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    UpdateSourceRequest,
                    EmptyResponse,
                    crate::metastore::MetastoreError,
                >,
            > + Clone + Send + Sync + 'static,
        <L as tower::Layer<
            quickwit_common::tower::BoxService<
                UpdateSourceRequest,
                EmptyResponse,
                crate::metastore::MetastoreError,
            >,
        >>::Service: tower::Service<
                UpdateSourceRequest,
                Response = EmptyResponse,
                Error = crate::metastore::MetastoreError,
            > + Clone + Send + Sync + 'static,
        <<L as tower::Layer<
            quickwit_common::tower::BoxService<
                UpdateSourceRequest,
                EmptyResponse,
                crate::metastore::MetastoreError,
            >,
        >>::Service as tower::Service<UpdateSourceRequest>>::Future: Send + 'static,
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    ToggleSourceRequest,
                    EmptyResponse,
                    crate::metastore::MetastoreError,
                >,
            > + Clone + Send + Sync + 'static,
        <L as tower::Layer<
            quickwit_common::tower::BoxService<
                ToggleSourceRequest,
                EmptyResponse,
                crate::metastore::MetastoreError,
            >,
        >>::Service: tower::Service<
                ToggleSourceRequest,
                Response = EmptyResponse,
                Error = crate::metastore::MetastoreError,
            > + Clone + Send + Sync + 'static,
        <<L as tower::Layer<
            quickwit_common::tower::BoxService<
                ToggleSourceRequest,
                EmptyResponse,
                crate::metastore::MetastoreError,
            >,
        >>::Service as tower::Service<ToggleSourceRequest>>::Future: Send + 'static,
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    DeleteSourceRequest,
                    EmptyResponse,
                    crate::metastore::MetastoreError,
                >,
            > + Clone + Send + Sync + 'static,
        <L as tower::Layer<
            quickwit_common::tower::BoxService<
                DeleteSourceRequest,
                EmptyResponse,
                crate::metastore::MetastoreError,
            >,
        >>::Service: tower::Service<
                DeleteSourceRequest,
                Response = EmptyResponse,
                Error = crate::metastore::MetastoreError,
            > + Clone + Send + Sync + 'static,
        <<L as tower::Layer<
            quickwit_common::tower::BoxService<
                DeleteSourceRequest,
                EmptyResponse,
                crate::metastore::MetastoreError,
            >,
        >>::Service as tower::Service<DeleteSourceRequest>>::Future: Send + 'static,
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    ResetSourceCheckpointRequest,
                    EmptyResponse,
                    crate::metastore::MetastoreError,
                >,
            > + Clone + Send + Sync + 'static,
        <L as tower::Layer<
            quickwit_common::tower::BoxService<
                ResetSourceCheckpointRequest,
                EmptyResponse,
                crate::metastore::MetastoreError,
            >,
        >>::Service: tower::Service<
                ResetSourceCheckpointRequest,
                Response = EmptyResponse,
                Error = crate::metastore::MetastoreError,
            > + Clone + Send + Sync + 'static,
        <<L as tower::Layer<
            quickwit_common::tower::BoxService<
                ResetSourceCheckpointRequest,
                EmptyResponse,
                crate::metastore::MetastoreError,
            >,
        >>::Service as tower::Service<
            ResetSourceCheckpointRequest,
        >>::Future: Send + 'static,
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    LastDeleteOpstampRequest,
                    LastDeleteOpstampResponse,
                    crate::metastore::MetastoreError,
                >,
            > + Clone + Send + Sync + 'static,
        <L as tower::Layer<
            quickwit_common::tower::BoxService<
                LastDeleteOpstampRequest,
                LastDeleteOpstampResponse,
                crate::metastore::MetastoreError,
            >,
        >>::Service: tower::Service<
                LastDeleteOpstampRequest,
                Response = LastDeleteOpstampResponse,
                Error = crate::metastore::MetastoreError,
            > + Clone + Send + Sync + 'static,
        <<L as tower::Layer<
            quickwit_common::tower::BoxService<
                LastDeleteOpstampRequest,
                LastDeleteOpstampResponse,
                crate::metastore::MetastoreError,
            >,
        >>::Service as tower::Service<LastDeleteOpstampRequest>>::Future: Send + 'static,
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    DeleteQuery,
                    DeleteTask,
                    crate::metastore::MetastoreError,
                >,
            > + Clone + Send + Sync + 'static,
        <L as tower::Layer<
            quickwit_common::tower::BoxService<
                DeleteQuery,
                DeleteTask,
                crate::metastore::MetastoreError,
            >,
        >>::Service: tower::Service<
                DeleteQuery,
                Response = DeleteTask,
                Error = crate::metastore::MetastoreError,
            > + Clone + Send + Sync + 'static,
        <<L as tower::Layer<
            quickwit_common::tower::BoxService<
                DeleteQuery,
                DeleteTask,
                crate::metastore::MetastoreError,
            >,
        >>::Service as tower::Service<DeleteQuery>>::Future: Send + 'static,
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    UpdateSplitsDeleteOpstampRequest,
                    UpdateSplitsDeleteOpstampResponse,
                    crate::metastore::MetastoreError,
                >,
            > + Clone + Send + Sync + 'static,
        <L as tower::Layer<
            quickwit_common::tower::BoxService<
                UpdateSplitsDeleteOpstampRequest,
                UpdateSplitsDeleteOpstampResponse,
                crate::metastore::MetastoreError,
            >,
        >>::Service: tower::Service<
                UpdateSplitsDeleteOpstampRequest,
                Response = UpdateSplitsDeleteOpstampResponse,
                Error = crate::metastore::MetastoreError,
            > + Clone + Send + Sync + 'static,
        <<L as tower::Layer<
            quickwit_common::tower::BoxService<
                UpdateSplitsDeleteOpstampRequest,
                UpdateSplitsDeleteOpstampResponse,
                crate::metastore::MetastoreError,
            >,
        >>::Service as tower::Service<
            UpdateSplitsDeleteOpstampRequest,
        >>::Future: Send + 'static,
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    ListDeleteTasksRequest,
                    ListDeleteTasksResponse,
                    crate::metastore::MetastoreError,
                >,
            > + Clone + Send + Sync + 'static,
        <L as tower::Layer<
            quickwit_common::tower::BoxService<
                ListDeleteTasksRequest,
                ListDeleteTasksResponse,
                crate::metastore::MetastoreError,
            >,
        >>::Service: tower::Service<
                ListDeleteTasksRequest,
                Response = ListDeleteTasksResponse,
                Error = crate::metastore::MetastoreError,
            > + Clone + Send + Sync + 'static,
        <<L as tower::Layer<
            quickwit_common::tower::BoxService<
                ListDeleteTasksRequest,
                ListDeleteTasksResponse,
                crate::metastore::MetastoreError,
            >,
        >>::Service as tower::Service<ListDeleteTasksRequest>>::Future: Send + 'static,
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    ListStaleSplitsRequest,
                    ListSplitsResponse,
                    crate::metastore::MetastoreError,
                >,
            > + Clone + Send + Sync + 'static,
        <L as tower::Layer<
            quickwit_common::tower::BoxService<
                ListStaleSplitsRequest,
                ListSplitsResponse,
                crate::metastore::MetastoreError,
            >,
        >>::Service: tower::Service<
                ListStaleSplitsRequest,
                Response = ListSplitsResponse,
                Error = crate::metastore::MetastoreError,
            > + Clone + Send + Sync + 'static,
        <<L as tower::Layer<
            quickwit_common::tower::BoxService<
                ListStaleSplitsRequest,
                ListSplitsResponse,
                crate::metastore::MetastoreError,
            >,
        >>::Service as tower::Service<ListStaleSplitsRequest>>::Future: Send + 'static,
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    OpenShardsRequest,
                    OpenShardsResponse,
                    crate::metastore::MetastoreError,
                >,
            > + Clone + Send + Sync + 'static,
        <L as tower::Layer<
            quickwit_common::tower::BoxService<
                OpenShardsRequest,
                OpenShardsResponse,
                crate::metastore::MetastoreError,
            >,
        >>::Service: tower::Service<
                OpenShardsRequest,
                Response = OpenShardsResponse,
                Error = crate::metastore::MetastoreError,
            > + Clone + Send + Sync + 'static,
        <<L as tower::Layer<
            quickwit_common::tower::BoxService<
                OpenShardsRequest,
                OpenShardsResponse,
                crate::metastore::MetastoreError,
            >,
        >>::Service as tower::Service<OpenShardsRequest>>::Future: Send + 'static,
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    AcquireShardsRequest,
                    AcquireShardsResponse,
                    crate::metastore::MetastoreError,
                >,
            > + Clone + Send + Sync + 'static,
        <L as tower::Layer<
            quickwit_common::tower::BoxService<
                AcquireShardsRequest,
                AcquireShardsResponse,
                crate::metastore::MetastoreError,
            >,
        >>::Service: tower::Service<
                AcquireShardsRequest,
                Response = AcquireShardsResponse,
                Error = crate::metastore::MetastoreError,
            > + Clone + Send + Sync + 'static,
        <<L as tower::Layer<
            quickwit_common::tower::BoxService<
                AcquireShardsRequest,
                AcquireShardsResponse,
                crate::metastore::MetastoreError,
            >,
        >>::Service as tower::Service<AcquireShardsRequest>>::Future: Send + 'static,
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    DeleteShardsRequest,
                    DeleteShardsResponse,
                    crate::metastore::MetastoreError,
                >,
            > + Clone + Send + Sync + 'static,
        <L as tower::Layer<
            quickwit_common::tower::BoxService<
                DeleteShardsRequest,
                DeleteShardsResponse,
                crate::metastore::MetastoreError,
            >,
        >>::Service: tower::Service<
                DeleteShardsRequest,
                Response = DeleteShardsResponse,
                Error = crate::metastore::MetastoreError,
            > + Clone + Send + Sync + 'static,
        <<L as tower::Layer<
            quickwit_common::tower::BoxService<
                DeleteShardsRequest,
                DeleteShardsResponse,
                crate::metastore::MetastoreError,
            >,
        >>::Service as tower::Service<DeleteShardsRequest>>::Future: Send + 'static,
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    PruneShardsRequest,
                    EmptyResponse,
                    crate::metastore::MetastoreError,
                >,
            > + Clone + Send + Sync + 'static,
        <L as tower::Layer<
            quickwit_common::tower::BoxService<
                PruneShardsRequest,
                EmptyResponse,
                crate::metastore::MetastoreError,
            >,
        >>::Service: tower::Service<
                PruneShardsRequest,
                Response = EmptyResponse,
                Error = crate::metastore::MetastoreError,
            > + Clone + Send + Sync + 'static,
        <<L as tower::Layer<
            quickwit_common::tower::BoxService<
                PruneShardsRequest,
                EmptyResponse,
                crate::metastore::MetastoreError,
            >,
        >>::Service as tower::Service<PruneShardsRequest>>::Future: Send + 'static,
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    ListShardsRequest,
                    ListShardsResponse,
                    crate::metastore::MetastoreError,
                >,
            > + Clone + Send + Sync + 'static,
        <L as tower::Layer<
            quickwit_common::tower::BoxService<
                ListShardsRequest,
                ListShardsResponse,
                crate::metastore::MetastoreError,
            >,
        >>::Service: tower::Service<
                ListShardsRequest,
                Response = ListShardsResponse,
                Error = crate::metastore::MetastoreError,
            > + Clone + Send + Sync + 'static,
        <<L as tower::Layer<
            quickwit_common::tower::BoxService<
                ListShardsRequest,
                ListShardsResponse,
                crate::metastore::MetastoreError,
            >,
        >>::Service as tower::Service<ListShardsRequest>>::Future: Send + 'static,
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    CreateIndexTemplateRequest,
                    EmptyResponse,
                    crate::metastore::MetastoreError,
                >,
            > + Clone + Send + Sync + 'static,
        <L as tower::Layer<
            quickwit_common::tower::BoxService<
                CreateIndexTemplateRequest,
                EmptyResponse,
                crate::metastore::MetastoreError,
            >,
        >>::Service: tower::Service<
                CreateIndexTemplateRequest,
                Response = EmptyResponse,
                Error = crate::metastore::MetastoreError,
            > + Clone + Send + Sync + 'static,
        <<L as tower::Layer<
            quickwit_common::tower::BoxService<
                CreateIndexTemplateRequest,
                EmptyResponse,
                crate::metastore::MetastoreError,
            >,
        >>::Service as tower::Service<
            CreateIndexTemplateRequest,
        >>::Future: Send + 'static,
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    GetIndexTemplateRequest,
                    GetIndexTemplateResponse,
                    crate::metastore::MetastoreError,
                >,
            > + Clone + Send + Sync + 'static,
        <L as tower::Layer<
            quickwit_common::tower::BoxService<
                GetIndexTemplateRequest,
                GetIndexTemplateResponse,
                crate::metastore::MetastoreError,
            >,
        >>::Service: tower::Service<
                GetIndexTemplateRequest,
                Response = GetIndexTemplateResponse,
                Error = crate::metastore::MetastoreError,
            > + Clone + Send + Sync + 'static,
        <<L as tower::Layer<
            quickwit_common::tower::BoxService<
                GetIndexTemplateRequest,
                GetIndexTemplateResponse,
                crate::metastore::MetastoreError,
            >,
        >>::Service as tower::Service<GetIndexTemplateRequest>>::Future: Send + 'static,
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    FindIndexTemplateMatchesRequest,
                    FindIndexTemplateMatchesResponse,
                    crate::metastore::MetastoreError,
                >,
            > + Clone + Send + Sync + 'static,
        <L as tower::Layer<
            quickwit_common::tower::BoxService<
                FindIndexTemplateMatchesRequest,
                FindIndexTemplateMatchesResponse,
                crate::metastore::MetastoreError,
            >,
        >>::Service: tower::Service<
                FindIndexTemplateMatchesRequest,
                Response = FindIndexTemplateMatchesResponse,
                Error = crate::metastore::MetastoreError,
            > + Clone + Send + Sync + 'static,
        <<L as tower::Layer<
            quickwit_common::tower::BoxService<
                FindIndexTemplateMatchesRequest,
                FindIndexTemplateMatchesResponse,
                crate::metastore::MetastoreError,
            >,
        >>::Service as tower::Service<
            FindIndexTemplateMatchesRequest,
        >>::Future: Send + 'static,
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    ListIndexTemplatesRequest,
                    ListIndexTemplatesResponse,
                    crate::metastore::MetastoreError,
                >,
            > + Clone + Send + Sync + 'static,
        <L as tower::Layer<
            quickwit_common::tower::BoxService<
                ListIndexTemplatesRequest,
                ListIndexTemplatesResponse,
                crate::metastore::MetastoreError,
            >,
        >>::Service: tower::Service<
                ListIndexTemplatesRequest,
                Response = ListIndexTemplatesResponse,
                Error = crate::metastore::MetastoreError,
            > + Clone + Send + Sync + 'static,
        <<L as tower::Layer<
            quickwit_common::tower::BoxService<
                ListIndexTemplatesRequest,
                ListIndexTemplatesResponse,
                crate::metastore::MetastoreError,
            >,
        >>::Service as tower::Service<
            ListIndexTemplatesRequest,
        >>::Future: Send + 'static,
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    DeleteIndexTemplatesRequest,
                    EmptyResponse,
                    crate::metastore::MetastoreError,
                >,
            > + Clone + Send + Sync + 'static,
        <L as tower::Layer<
            quickwit_common::tower::BoxService<
                DeleteIndexTemplatesRequest,
                EmptyResponse,
                crate::metastore::MetastoreError,
            >,
        >>::Service: tower::Service<
                DeleteIndexTemplatesRequest,
                Response = EmptyResponse,
                Error = crate::metastore::MetastoreError,
            > + Clone + Send + Sync + 'static,
        <<L as tower::Layer<
            quickwit_common::tower::BoxService<
                DeleteIndexTemplatesRequest,
                EmptyResponse,
                crate::metastore::MetastoreError,
            >,
        >>::Service as tower::Service<
            DeleteIndexTemplatesRequest,
        >>::Future: Send + 'static,
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    GetClusterIdentityRequest,
                    GetClusterIdentityResponse,
                    crate::metastore::MetastoreError,
                >,
            > + Clone + Send + Sync + 'static,
        <L as tower::Layer<
            quickwit_common::tower::BoxService<
                GetClusterIdentityRequest,
                GetClusterIdentityResponse,
                crate::metastore::MetastoreError,
            >,
        >>::Service: tower::Service<
                GetClusterIdentityRequest,
                Response = GetClusterIdentityResponse,
                Error = crate::metastore::MetastoreError,
            > + Clone + Send + Sync + 'static,
        <<L as tower::Layer<
            quickwit_common::tower::BoxService<
                GetClusterIdentityRequest,
                GetClusterIdentityResponse,
                crate::metastore::MetastoreError,
            >,
        >>::Service as tower::Service<
            GetClusterIdentityRequest,
        >>::Future: Send + 'static,
    {
        self.create_index_layers
            .push(quickwit_common::tower::BoxLayer::new(layer.clone()));
        self.update_index_layers
            .push(quickwit_common::tower::BoxLayer::new(layer.clone()));
        self.index_metadata_layers
            .push(quickwit_common::tower::BoxLayer::new(layer.clone()));
        self.indexes_metadata_layers
            .push(quickwit_common::tower::BoxLayer::new(layer.clone()));
        self.list_indexes_metadata_layers
            .push(quickwit_common::tower::BoxLayer::new(layer.clone()));
        self.delete_index_layers
            .push(quickwit_common::tower::BoxLayer::new(layer.clone()));
        self.list_index_stats_layers
            .push(quickwit_common::tower::BoxLayer::new(layer.clone()));
        self.list_splits_layers
            .push(quickwit_common::tower::BoxLayer::new(layer.clone()));
        self.stage_splits_layers
            .push(quickwit_common::tower::BoxLayer::new(layer.clone()));
        self.publish_splits_layers
            .push(quickwit_common::tower::BoxLayer::new(layer.clone()));
        self.mark_splits_for_deletion_layers
            .push(quickwit_common::tower::BoxLayer::new(layer.clone()));
        self.delete_splits_layers
            .push(quickwit_common::tower::BoxLayer::new(layer.clone()));
        self.add_source_layers
            .push(quickwit_common::tower::BoxLayer::new(layer.clone()));
        self.update_source_layers
            .push(quickwit_common::tower::BoxLayer::new(layer.clone()));
        self.toggle_source_layers
            .push(quickwit_common::tower::BoxLayer::new(layer.clone()));
        self.delete_source_layers
            .push(quickwit_common::tower::BoxLayer::new(layer.clone()));
        self.reset_source_checkpoint_layers
            .push(quickwit_common::tower::BoxLayer::new(layer.clone()));
        self.last_delete_opstamp_layers
            .push(quickwit_common::tower::BoxLayer::new(layer.clone()));
        self.create_delete_task_layers
            .push(quickwit_common::tower::BoxLayer::new(layer.clone()));
        self.update_splits_delete_opstamp_layers
            .push(quickwit_common::tower::BoxLayer::new(layer.clone()));
        self.list_delete_tasks_layers
            .push(quickwit_common::tower::BoxLayer::new(layer.clone()));
        self.list_stale_splits_layers
            .push(quickwit_common::tower::BoxLayer::new(layer.clone()));
        self.open_shards_layers
            .push(quickwit_common::tower::BoxLayer::new(layer.clone()));
        self.acquire_shards_layers
            .push(quickwit_common::tower::BoxLayer::new(layer.clone()));
        self.delete_shards_layers
            .push(quickwit_common::tower::BoxLayer::new(layer.clone()));
        self.prune_shards_layers
            .push(quickwit_common::tower::BoxLayer::new(layer.clone()));
        self.list_shards_layers
            .push(quickwit_common::tower::BoxLayer::new(layer.clone()));
        self.create_index_template_layers
            .push(quickwit_common::tower::BoxLayer::new(layer.clone()));
        self.get_index_template_layers
            .push(quickwit_common::tower::BoxLayer::new(layer.clone()));
        self.find_index_template_matches_layers
            .push(quickwit_common::tower::BoxLayer::new(layer.clone()));
        self.list_index_templates_layers
            .push(quickwit_common::tower::BoxLayer::new(layer.clone()));
        self.delete_index_templates_layers
            .push(quickwit_common::tower::BoxLayer::new(layer.clone()));
        self.get_cluster_identity_layers
            .push(quickwit_common::tower::BoxLayer::new(layer.clone()));
        self
    }
    pub fn stack_create_index_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    CreateIndexRequest,
                    CreateIndexResponse,
                    crate::metastore::MetastoreError,
                >,
            > + Send + Sync + 'static,
        L::Service: tower::Service<
                CreateIndexRequest,
                Response = CreateIndexResponse,
                Error = crate::metastore::MetastoreError,
            > + Clone + Send + Sync + 'static,
        <L::Service as tower::Service<CreateIndexRequest>>::Future: Send + 'static,
    {
        self.create_index_layers.push(quickwit_common::tower::BoxLayer::new(layer));
        self
    }
    pub fn stack_update_index_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    UpdateIndexRequest,
                    IndexMetadataResponse,
                    crate::metastore::MetastoreError,
                >,
            > + Send + Sync + 'static,
        L::Service: tower::Service<
                UpdateIndexRequest,
                Response = IndexMetadataResponse,
                Error = crate::metastore::MetastoreError,
            > + Clone + Send + Sync + 'static,
        <L::Service as tower::Service<UpdateIndexRequest>>::Future: Send + 'static,
    {
        self.update_index_layers.push(quickwit_common::tower::BoxLayer::new(layer));
        self
    }
    pub fn stack_index_metadata_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    IndexMetadataRequest,
                    IndexMetadataResponse,
                    crate::metastore::MetastoreError,
                >,
            > + Send + Sync + 'static,
        L::Service: tower::Service<
                IndexMetadataRequest,
                Response = IndexMetadataResponse,
                Error = crate::metastore::MetastoreError,
            > + Clone + Send + Sync + 'static,
        <L::Service as tower::Service<IndexMetadataRequest>>::Future: Send + 'static,
    {
        self.index_metadata_layers.push(quickwit_common::tower::BoxLayer::new(layer));
        self
    }
    pub fn stack_indexes_metadata_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    IndexesMetadataRequest,
                    IndexesMetadataResponse,
                    crate::metastore::MetastoreError,
                >,
            > + Send + Sync + 'static,
        L::Service: tower::Service<
                IndexesMetadataRequest,
                Response = IndexesMetadataResponse,
                Error = crate::metastore::MetastoreError,
            > + Clone + Send + Sync + 'static,
        <L::Service as tower::Service<IndexesMetadataRequest>>::Future: Send + 'static,
    {
        self.indexes_metadata_layers.push(quickwit_common::tower::BoxLayer::new(layer));
        self
    }
    pub fn stack_list_indexes_metadata_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    ListIndexesMetadataRequest,
                    ListIndexesMetadataResponse,
                    crate::metastore::MetastoreError,
                >,
            > + Send + Sync + 'static,
        L::Service: tower::Service<
                ListIndexesMetadataRequest,
                Response = ListIndexesMetadataResponse,
                Error = crate::metastore::MetastoreError,
            > + Clone + Send + Sync + 'static,
        <L::Service as tower::Service<
            ListIndexesMetadataRequest,
        >>::Future: Send + 'static,
    {
        self.list_indexes_metadata_layers
            .push(quickwit_common::tower::BoxLayer::new(layer));
        self
    }
    pub fn stack_delete_index_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    DeleteIndexRequest,
                    EmptyResponse,
                    crate::metastore::MetastoreError,
                >,
            > + Send + Sync + 'static,
        L::Service: tower::Service<
                DeleteIndexRequest,
                Response = EmptyResponse,
                Error = crate::metastore::MetastoreError,
            > + Clone + Send + Sync + 'static,
        <L::Service as tower::Service<DeleteIndexRequest>>::Future: Send + 'static,
    {
        self.delete_index_layers.push(quickwit_common::tower::BoxLayer::new(layer));
        self
    }
    pub fn stack_list_index_stats_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    ListIndexStatsRequest,
                    ListIndexStatsResponse,
                    crate::metastore::MetastoreError,
                >,
            > + Send + Sync + 'static,
        L::Service: tower::Service<
                ListIndexStatsRequest,
                Response = ListIndexStatsResponse,
                Error = crate::metastore::MetastoreError,
            > + Clone + Send + Sync + 'static,
        <L::Service as tower::Service<ListIndexStatsRequest>>::Future: Send + 'static,
    {
        self.list_index_stats_layers.push(quickwit_common::tower::BoxLayer::new(layer));
        self
    }
    pub fn stack_list_splits_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    ListSplitsRequest,
                    MetastoreServiceStream<ListSplitsResponse>,
                    crate::metastore::MetastoreError,
                >,
            > + Send + Sync + 'static,
        L::Service: tower::Service<
                ListSplitsRequest,
                Response = MetastoreServiceStream<ListSplitsResponse>,
                Error = crate::metastore::MetastoreError,
            > + Clone + Send + Sync + 'static,
        <L::Service as tower::Service<ListSplitsRequest>>::Future: Send + 'static,
    {
        self.list_splits_layers.push(quickwit_common::tower::BoxLayer::new(layer));
        self
    }
    pub fn stack_stage_splits_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    StageSplitsRequest,
                    EmptyResponse,
                    crate::metastore::MetastoreError,
                >,
            > + Send + Sync + 'static,
        L::Service: tower::Service<
                StageSplitsRequest,
                Response = EmptyResponse,
                Error = crate::metastore::MetastoreError,
            > + Clone + Send + Sync + 'static,
        <L::Service as tower::Service<StageSplitsRequest>>::Future: Send + 'static,
    {
        self.stage_splits_layers.push(quickwit_common::tower::BoxLayer::new(layer));
        self
    }
    pub fn stack_publish_splits_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    PublishSplitsRequest,
                    EmptyResponse,
                    crate::metastore::MetastoreError,
                >,
            > + Send + Sync + 'static,
        L::Service: tower::Service<
                PublishSplitsRequest,
                Response = EmptyResponse,
                Error = crate::metastore::MetastoreError,
            > + Clone + Send + Sync + 'static,
        <L::Service as tower::Service<PublishSplitsRequest>>::Future: Send + 'static,
    {
        self.publish_splits_layers.push(quickwit_common::tower::BoxLayer::new(layer));
        self
    }
    pub fn stack_mark_splits_for_deletion_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    MarkSplitsForDeletionRequest,
                    EmptyResponse,
                    crate::metastore::MetastoreError,
                >,
            > + Send + Sync + 'static,
        L::Service: tower::Service<
                MarkSplitsForDeletionRequest,
                Response = EmptyResponse,
                Error = crate::metastore::MetastoreError,
            > + Clone + Send + Sync + 'static,
        <L::Service as tower::Service<
            MarkSplitsForDeletionRequest,
        >>::Future: Send + 'static,
    {
        self.mark_splits_for_deletion_layers
            .push(quickwit_common::tower::BoxLayer::new(layer));
        self
    }
    pub fn stack_delete_splits_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    DeleteSplitsRequest,
                    EmptyResponse,
                    crate::metastore::MetastoreError,
                >,
            > + Send + Sync + 'static,
        L::Service: tower::Service<
                DeleteSplitsRequest,
                Response = EmptyResponse,
                Error = crate::metastore::MetastoreError,
            > + Clone + Send + Sync + 'static,
        <L::Service as tower::Service<DeleteSplitsRequest>>::Future: Send + 'static,
    {
        self.delete_splits_layers.push(quickwit_common::tower::BoxLayer::new(layer));
        self
    }
    pub fn stack_add_source_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    AddSourceRequest,
                    EmptyResponse,
                    crate::metastore::MetastoreError,
                >,
            > + Send + Sync + 'static,
        L::Service: tower::Service<
                AddSourceRequest,
                Response = EmptyResponse,
                Error = crate::metastore::MetastoreError,
            > + Clone + Send + Sync + 'static,
        <L::Service as tower::Service<AddSourceRequest>>::Future: Send + 'static,
    {
        self.add_source_layers.push(quickwit_common::tower::BoxLayer::new(layer));
        self
    }
    pub fn stack_update_source_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    UpdateSourceRequest,
                    EmptyResponse,
                    crate::metastore::MetastoreError,
                >,
            > + Send + Sync + 'static,
        L::Service: tower::Service<
                UpdateSourceRequest,
                Response = EmptyResponse,
                Error = crate::metastore::MetastoreError,
            > + Clone + Send + Sync + 'static,
        <L::Service as tower::Service<UpdateSourceRequest>>::Future: Send + 'static,
    {
        self.update_source_layers.push(quickwit_common::tower::BoxLayer::new(layer));
        self
    }
    pub fn stack_toggle_source_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    ToggleSourceRequest,
                    EmptyResponse,
                    crate::metastore::MetastoreError,
                >,
            > + Send + Sync + 'static,
        L::Service: tower::Service<
                ToggleSourceRequest,
                Response = EmptyResponse,
                Error = crate::metastore::MetastoreError,
            > + Clone + Send + Sync + 'static,
        <L::Service as tower::Service<ToggleSourceRequest>>::Future: Send + 'static,
    {
        self.toggle_source_layers.push(quickwit_common::tower::BoxLayer::new(layer));
        self
    }
    pub fn stack_delete_source_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    DeleteSourceRequest,
                    EmptyResponse,
                    crate::metastore::MetastoreError,
                >,
            > + Send + Sync + 'static,
        L::Service: tower::Service<
                DeleteSourceRequest,
                Response = EmptyResponse,
                Error = crate::metastore::MetastoreError,
            > + Clone + Send + Sync + 'static,
        <L::Service as tower::Service<DeleteSourceRequest>>::Future: Send + 'static,
    {
        self.delete_source_layers.push(quickwit_common::tower::BoxLayer::new(layer));
        self
    }
    pub fn stack_reset_source_checkpoint_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    ResetSourceCheckpointRequest,
                    EmptyResponse,
                    crate::metastore::MetastoreError,
                >,
            > + Send + Sync + 'static,
        L::Service: tower::Service<
                ResetSourceCheckpointRequest,
                Response = EmptyResponse,
                Error = crate::metastore::MetastoreError,
            > + Clone + Send + Sync + 'static,
        <L::Service as tower::Service<
            ResetSourceCheckpointRequest,
        >>::Future: Send + 'static,
    {
        self.reset_source_checkpoint_layers
            .push(quickwit_common::tower::BoxLayer::new(layer));
        self
    }
    pub fn stack_last_delete_opstamp_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    LastDeleteOpstampRequest,
                    LastDeleteOpstampResponse,
                    crate::metastore::MetastoreError,
                >,
            > + Send + Sync + 'static,
        L::Service: tower::Service<
                LastDeleteOpstampRequest,
                Response = LastDeleteOpstampResponse,
                Error = crate::metastore::MetastoreError,
            > + Clone + Send + Sync + 'static,
        <L::Service as tower::Service<LastDeleteOpstampRequest>>::Future: Send + 'static,
    {
        self.last_delete_opstamp_layers
            .push(quickwit_common::tower::BoxLayer::new(layer));
        self
    }
    pub fn stack_create_delete_task_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    DeleteQuery,
                    DeleteTask,
                    crate::metastore::MetastoreError,
                >,
            > + Send + Sync + 'static,
        L::Service: tower::Service<
                DeleteQuery,
                Response = DeleteTask,
                Error = crate::metastore::MetastoreError,
            > + Clone + Send + Sync + 'static,
        <L::Service as tower::Service<DeleteQuery>>::Future: Send + 'static,
    {
        self.create_delete_task_layers
            .push(quickwit_common::tower::BoxLayer::new(layer));
        self
    }
    pub fn stack_update_splits_delete_opstamp_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    UpdateSplitsDeleteOpstampRequest,
                    UpdateSplitsDeleteOpstampResponse,
                    crate::metastore::MetastoreError,
                >,
            > + Send + Sync + 'static,
        L::Service: tower::Service<
                UpdateSplitsDeleteOpstampRequest,
                Response = UpdateSplitsDeleteOpstampResponse,
                Error = crate::metastore::MetastoreError,
            > + Clone + Send + Sync + 'static,
        <L::Service as tower::Service<
            UpdateSplitsDeleteOpstampRequest,
        >>::Future: Send + 'static,
    {
        self.update_splits_delete_opstamp_layers
            .push(quickwit_common::tower::BoxLayer::new(layer));
        self
    }
    pub fn stack_list_delete_tasks_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    ListDeleteTasksRequest,
                    ListDeleteTasksResponse,
                    crate::metastore::MetastoreError,
                >,
            > + Send + Sync + 'static,
        L::Service: tower::Service<
                ListDeleteTasksRequest,
                Response = ListDeleteTasksResponse,
                Error = crate::metastore::MetastoreError,
            > + Clone + Send + Sync + 'static,
        <L::Service as tower::Service<ListDeleteTasksRequest>>::Future: Send + 'static,
    {
        self.list_delete_tasks_layers.push(quickwit_common::tower::BoxLayer::new(layer));
        self
    }
    pub fn stack_list_stale_splits_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    ListStaleSplitsRequest,
                    ListSplitsResponse,
                    crate::metastore::MetastoreError,
                >,
            > + Send + Sync + 'static,
        L::Service: tower::Service<
                ListStaleSplitsRequest,
                Response = ListSplitsResponse,
                Error = crate::metastore::MetastoreError,
            > + Clone + Send + Sync + 'static,
        <L::Service as tower::Service<ListStaleSplitsRequest>>::Future: Send + 'static,
    {
        self.list_stale_splits_layers.push(quickwit_common::tower::BoxLayer::new(layer));
        self
    }
    pub fn stack_open_shards_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    OpenShardsRequest,
                    OpenShardsResponse,
                    crate::metastore::MetastoreError,
                >,
            > + Send + Sync + 'static,
        L::Service: tower::Service<
                OpenShardsRequest,
                Response = OpenShardsResponse,
                Error = crate::metastore::MetastoreError,
            > + Clone + Send + Sync + 'static,
        <L::Service as tower::Service<OpenShardsRequest>>::Future: Send + 'static,
    {
        self.open_shards_layers.push(quickwit_common::tower::BoxLayer::new(layer));
        self
    }
    pub fn stack_acquire_shards_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    AcquireShardsRequest,
                    AcquireShardsResponse,
                    crate::metastore::MetastoreError,
                >,
            > + Send + Sync + 'static,
        L::Service: tower::Service<
                AcquireShardsRequest,
                Response = AcquireShardsResponse,
                Error = crate::metastore::MetastoreError,
            > + Clone + Send + Sync + 'static,
        <L::Service as tower::Service<AcquireShardsRequest>>::Future: Send + 'static,
    {
        self.acquire_shards_layers.push(quickwit_common::tower::BoxLayer::new(layer));
        self
    }
    pub fn stack_delete_shards_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    DeleteShardsRequest,
                    DeleteShardsResponse,
                    crate::metastore::MetastoreError,
                >,
            > + Send + Sync + 'static,
        L::Service: tower::Service<
                DeleteShardsRequest,
                Response = DeleteShardsResponse,
                Error = crate::metastore::MetastoreError,
            > + Clone + Send + Sync + 'static,
        <L::Service as tower::Service<DeleteShardsRequest>>::Future: Send + 'static,
    {
        self.delete_shards_layers.push(quickwit_common::tower::BoxLayer::new(layer));
        self
    }
    pub fn stack_prune_shards_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    PruneShardsRequest,
                    EmptyResponse,
                    crate::metastore::MetastoreError,
                >,
            > + Send + Sync + 'static,
        L::Service: tower::Service<
                PruneShardsRequest,
                Response = EmptyResponse,
                Error = crate::metastore::MetastoreError,
            > + Clone + Send + Sync + 'static,
        <L::Service as tower::Service<PruneShardsRequest>>::Future: Send + 'static,
    {
        self.prune_shards_layers.push(quickwit_common::tower::BoxLayer::new(layer));
        self
    }
    pub fn stack_list_shards_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    ListShardsRequest,
                    ListShardsResponse,
                    crate::metastore::MetastoreError,
                >,
            > + Send + Sync + 'static,
        L::Service: tower::Service<
                ListShardsRequest,
                Response = ListShardsResponse,
                Error = crate::metastore::MetastoreError,
            > + Clone + Send + Sync + 'static,
        <L::Service as tower::Service<ListShardsRequest>>::Future: Send + 'static,
    {
        self.list_shards_layers.push(quickwit_common::tower::BoxLayer::new(layer));
        self
    }
    pub fn stack_create_index_template_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    CreateIndexTemplateRequest,
                    EmptyResponse,
                    crate::metastore::MetastoreError,
                >,
            > + Send + Sync + 'static,
        L::Service: tower::Service<
                CreateIndexTemplateRequest,
                Response = EmptyResponse,
                Error = crate::metastore::MetastoreError,
            > + Clone + Send + Sync + 'static,
        <L::Service as tower::Service<
            CreateIndexTemplateRequest,
        >>::Future: Send + 'static,
    {
        self.create_index_template_layers
            .push(quickwit_common::tower::BoxLayer::new(layer));
        self
    }
    pub fn stack_get_index_template_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    GetIndexTemplateRequest,
                    GetIndexTemplateResponse,
                    crate::metastore::MetastoreError,
                >,
            > + Send + Sync + 'static,
        L::Service: tower::Service<
                GetIndexTemplateRequest,
                Response = GetIndexTemplateResponse,
                Error = crate::metastore::MetastoreError,
            > + Clone + Send + Sync + 'static,
        <L::Service as tower::Service<GetIndexTemplateRequest>>::Future: Send + 'static,
    {
        self.get_index_template_layers
            .push(quickwit_common::tower::BoxLayer::new(layer));
        self
    }
    pub fn stack_find_index_template_matches_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    FindIndexTemplateMatchesRequest,
                    FindIndexTemplateMatchesResponse,
                    crate::metastore::MetastoreError,
                >,
            > + Send + Sync + 'static,
        L::Service: tower::Service<
                FindIndexTemplateMatchesRequest,
                Response = FindIndexTemplateMatchesResponse,
                Error = crate::metastore::MetastoreError,
            > + Clone + Send + Sync + 'static,
        <L::Service as tower::Service<
            FindIndexTemplateMatchesRequest,
        >>::Future: Send + 'static,
    {
        self.find_index_template_matches_layers
            .push(quickwit_common::tower::BoxLayer::new(layer));
        self
    }
    pub fn stack_list_index_templates_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    ListIndexTemplatesRequest,
                    ListIndexTemplatesResponse,
                    crate::metastore::MetastoreError,
                >,
            > + Send + Sync + 'static,
        L::Service: tower::Service<
                ListIndexTemplatesRequest,
                Response = ListIndexTemplatesResponse,
                Error = crate::metastore::MetastoreError,
            > + Clone + Send + Sync + 'static,
        <L::Service as tower::Service<
            ListIndexTemplatesRequest,
        >>::Future: Send + 'static,
    {
        self.list_index_templates_layers
            .push(quickwit_common::tower::BoxLayer::new(layer));
        self
    }
    pub fn stack_delete_index_templates_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    DeleteIndexTemplatesRequest,
                    EmptyResponse,
                    crate::metastore::MetastoreError,
                >,
            > + Send + Sync + 'static,
        L::Service: tower::Service<
                DeleteIndexTemplatesRequest,
                Response = EmptyResponse,
                Error = crate::metastore::MetastoreError,
            > + Clone + Send + Sync + 'static,
        <L::Service as tower::Service<
            DeleteIndexTemplatesRequest,
        >>::Future: Send + 'static,
    {
        self.delete_index_templates_layers
            .push(quickwit_common::tower::BoxLayer::new(layer));
        self
    }
    pub fn stack_get_cluster_identity_layer<L>(mut self, layer: L) -> Self
    where
        L: tower::Layer<
                quickwit_common::tower::BoxService<
                    GetClusterIdentityRequest,
                    GetClusterIdentityResponse,
                    crate::metastore::MetastoreError,
                >,
            > + Send + Sync + 'static,
        L::Service: tower::Service<
                GetClusterIdentityRequest,
                Response = GetClusterIdentityResponse,
                Error = crate::metastore::MetastoreError,
            > + Clone + Send + Sync + 'static,
        <L::Service as tower::Service<
            GetClusterIdentityRequest,
        >>::Future: Send + 'static,
    {
        self.get_cluster_identity_layers
            .push(quickwit_common::tower::BoxLayer::new(layer));
        self
    }
    pub fn build<T>(self, instance: T) -> MetastoreServiceClient
    where
        T: MetastoreService,
    {
        let inner_client = InnerMetastoreServiceClient(std::sync::Arc::new(instance));
        self.build_from_inner_client(inner_client)
    }
    pub fn build_from_channel(
        self,
        addr: std::net::SocketAddr,
        channel: tonic::transport::Channel,
        max_message_size: bytesize::ByteSize,
        compression_encoding_opt: Option<tonic::codec::CompressionEncoding>,
    ) -> MetastoreServiceClient {
        let client = MetastoreServiceClient::from_channel(
            addr,
            channel,
            max_message_size,
            compression_encoding_opt,
        );
        let inner_client = client.inner;
        self.build_from_inner_client(inner_client)
    }
    pub fn build_from_balance_channel(
        self,
        balance_channel: quickwit_common::tower::BalanceChannel<std::net::SocketAddr>,
        max_message_size: bytesize::ByteSize,
        compression_encoding_opt: Option<tonic::codec::CompressionEncoding>,
    ) -> MetastoreServiceClient {
        let client = MetastoreServiceClient::from_balance_channel(
            balance_channel,
            max_message_size,
            compression_encoding_opt,
        );
        let inner_client = client.inner;
        self.build_from_inner_client(inner_client)
    }
    pub fn build_from_mailbox<A>(
        self,
        mailbox: quickwit_actors::Mailbox<A>,
    ) -> MetastoreServiceClient
    where
        A: quickwit_actors::Actor + std::fmt::Debug + Send + 'static,
        MetastoreServiceMailbox<A>: MetastoreService,
    {
        let inner_client = InnerMetastoreServiceClient(
            std::sync::Arc::new(MetastoreServiceMailbox::new(mailbox)),
        );
        self.build_from_inner_client(inner_client)
    }
    #[cfg(any(test, feature = "testsuite"))]
    pub fn build_from_mock(self, mock: MockMetastoreService) -> MetastoreServiceClient {
        let client = MetastoreServiceClient::from_mock(mock);
        let inner_client = client.inner;
        self.build_from_inner_client(inner_client)
    }
    fn build_from_inner_client(
        self,
        inner_client: InnerMetastoreServiceClient,
    ) -> MetastoreServiceClient {
        let create_index_svc = self
            .create_index_layers
            .into_iter()
            .rev()
            .fold(
                quickwit_common::tower::BoxService::new(inner_client.clone()),
                |svc, layer| layer.layer(svc),
            );
        let update_index_svc = self
            .update_index_layers
            .into_iter()
            .rev()
            .fold(
                quickwit_common::tower::BoxService::new(inner_client.clone()),
                |svc, layer| layer.layer(svc),
            );
        let index_metadata_svc = self
            .index_metadata_layers
            .into_iter()
            .rev()
            .fold(
                quickwit_common::tower::BoxService::new(inner_client.clone()),
                |svc, layer| layer.layer(svc),
            );
        let indexes_metadata_svc = self
            .indexes_metadata_layers
            .into_iter()
            .rev()
            .fold(
                quickwit_common::tower::BoxService::new(inner_client.clone()),
                |svc, layer| layer.layer(svc),
            );
        let list_indexes_metadata_svc = self
            .list_indexes_metadata_layers
            .into_iter()
            .rev()
            .fold(
                quickwit_common::tower::BoxService::new(inner_client.clone()),
                |svc, layer| layer.layer(svc),
            );
        let delete_index_svc = self
            .delete_index_layers
            .into_iter()
            .rev()
            .fold(
                quickwit_common::tower::BoxService::new(inner_client.clone()),
                |svc, layer| layer.layer(svc),
            );
        let list_index_stats_svc = self
            .list_index_stats_layers
            .into_iter()
            .rev()
            .fold(
                quickwit_common::tower::BoxService::new(inner_client.clone()),
                |svc, layer| layer.layer(svc),
            );
        let list_splits_svc = self
            .list_splits_layers
            .into_iter()
            .rev()
            .fold(
                quickwit_common::tower::BoxService::new(inner_client.clone()),
                |svc, layer| layer.layer(svc),
            );
        let stage_splits_svc = self
            .stage_splits_layers
            .into_iter()
            .rev()
            .fold(
                quickwit_common::tower::BoxService::new(inner_client.clone()),
                |svc, layer| layer.layer(svc),
            );
        let publish_splits_svc = self
            .publish_splits_layers
            .into_iter()
            .rev()
            .fold(
                quickwit_common::tower::BoxService::new(inner_client.clone()),
                |svc, layer| layer.layer(svc),
            );
        let mark_splits_for_deletion_svc = self
            .mark_splits_for_deletion_layers
            .into_iter()
            .rev()
            .fold(
                quickwit_common::tower::BoxService::new(inner_client.clone()),
                |svc, layer| layer.layer(svc),
            );
        let delete_splits_svc = self
            .delete_splits_layers
            .into_iter()
            .rev()
            .fold(
                quickwit_common::tower::BoxService::new(inner_client.clone()),
                |svc, layer| layer.layer(svc),
            );
        let add_source_svc = self
            .add_source_layers
            .into_iter()
            .rev()
            .fold(
                quickwit_common::tower::BoxService::new(inner_client.clone()),
                |svc, layer| layer.layer(svc),
            );
        let update_source_svc = self
            .update_source_layers
            .into_iter()
            .rev()
            .fold(
                quickwit_common::tower::BoxService::new(inner_client.clone()),
                |svc, layer| layer.layer(svc),
            );
        let toggle_source_svc = self
            .toggle_source_layers
            .into_iter()
            .rev()
            .fold(
                quickwit_common::tower::BoxService::new(inner_client.clone()),
                |svc, layer| layer.layer(svc),
            );
        let delete_source_svc = self
            .delete_source_layers
            .into_iter()
            .rev()
            .fold(
                quickwit_common::tower::BoxService::new(inner_client.clone()),
                |svc, layer| layer.layer(svc),
            );
        let reset_source_checkpoint_svc = self
            .reset_source_checkpoint_layers
            .into_iter()
            .rev()
            .fold(
                quickwit_common::tower::BoxService::new(inner_client.clone()),
                |svc, layer| layer.layer(svc),
            );
        let last_delete_opstamp_svc = self
            .last_delete_opstamp_layers
            .into_iter()
            .rev()
            .fold(
                quickwit_common::tower::BoxService::new(inner_client.clone()),
                |svc, layer| layer.layer(svc),
            );
        let create_delete_task_svc = self
            .create_delete_task_layers
            .into_iter()
            .rev()
            .fold(
                quickwit_common::tower::BoxService::new(inner_client.clone()),
                |svc, layer| layer.layer(svc),
            );
        let update_splits_delete_opstamp_svc = self
            .update_splits_delete_opstamp_layers
            .into_iter()
            .rev()
            .fold(
                quickwit_common::tower::BoxService::new(inner_client.clone()),
                |svc, layer| layer.layer(svc),
            );
        let list_delete_tasks_svc = self
            .list_delete_tasks_layers
            .into_iter()
            .rev()
            .fold(
                quickwit_common::tower::BoxService::new(inner_client.clone()),
                |svc, layer| layer.layer(svc),
            );
        let list_stale_splits_svc = self
            .list_stale_splits_layers
            .into_iter()
            .rev()
            .fold(
                quickwit_common::tower::BoxService::new(inner_client.clone()),
                |svc, layer| layer.layer(svc),
            );
        let open_shards_svc = self
            .open_shards_layers
            .into_iter()
            .rev()
            .fold(
                quickwit_common::tower::BoxService::new(inner_client.clone()),
                |svc, layer| layer.layer(svc),
            );
        let acquire_shards_svc = self
            .acquire_shards_layers
            .into_iter()
            .rev()
            .fold(
                quickwit_common::tower::BoxService::new(inner_client.clone()),
                |svc, layer| layer.layer(svc),
            );
        let delete_shards_svc = self
            .delete_shards_layers
            .into_iter()
            .rev()
            .fold(
                quickwit_common::tower::BoxService::new(inner_client.clone()),
                |svc, layer| layer.layer(svc),
            );
        let prune_shards_svc = self
            .prune_shards_layers
            .into_iter()
            .rev()
            .fold(
                quickwit_common::tower::BoxService::new(inner_client.clone()),
                |svc, layer| layer.layer(svc),
            );
        let list_shards_svc = self
            .list_shards_layers
            .into_iter()
            .rev()
            .fold(
                quickwit_common::tower::BoxService::new(inner_client.clone()),
                |svc, layer| layer.layer(svc),
            );
        let create_index_template_svc = self
            .create_index_template_layers
            .into_iter()
            .rev()
            .fold(
                quickwit_common::tower::BoxService::new(inner_client.clone()),
                |svc, layer| layer.layer(svc),
            );
        let get_index_template_svc = self
            .get_index_template_layers
            .into_iter()
            .rev()
            .fold(
                quickwit_common::tower::BoxService::new(inner_client.clone()),
                |svc, layer| layer.layer(svc),
            );
        let find_index_template_matches_svc = self
            .find_index_template_matches_layers
            .into_iter()
            .rev()
            .fold(
                quickwit_common::tower::BoxService::new(inner_client.clone()),
                |svc, layer| layer.layer(svc),
            );
        let list_index_templates_svc = self
            .list_index_templates_layers
            .into_iter()
            .rev()
            .fold(
                quickwit_common::tower::BoxService::new(inner_client.clone()),
                |svc, layer| layer.layer(svc),
            );
        let delete_index_templates_svc = self
            .delete_index_templates_layers
            .into_iter()
            .rev()
            .fold(
                quickwit_common::tower::BoxService::new(inner_client.clone()),
                |svc, layer| layer.layer(svc),
            );
        let get_cluster_identity_svc = self
            .get_cluster_identity_layers
            .into_iter()
            .rev()
            .fold(
                quickwit_common::tower::BoxService::new(inner_client.clone()),
                |svc, layer| layer.layer(svc),
            );
        let tower_svc_stack = MetastoreServiceTowerServiceStack {
            inner: inner_client,
            create_index_svc,
            update_index_svc,
            index_metadata_svc,
            indexes_metadata_svc,
            list_indexes_metadata_svc,
            delete_index_svc,
            list_index_stats_svc,
            list_splits_svc,
            stage_splits_svc,
            publish_splits_svc,
            mark_splits_for_deletion_svc,
            delete_splits_svc,
            add_source_svc,
            update_source_svc,
            toggle_source_svc,
            delete_source_svc,
            reset_source_checkpoint_svc,
            last_delete_opstamp_svc,
            create_delete_task_svc,
            update_splits_delete_opstamp_svc,
            list_delete_tasks_svc,
            list_stale_splits_svc,
            open_shards_svc,
            acquire_shards_svc,
            delete_shards_svc,
            prune_shards_svc,
            list_shards_svc,
            create_index_template_svc,
            get_index_template_svc,
            find_index_template_matches_svc,
            list_index_templates_svc,
            delete_index_templates_svc,
            get_cluster_identity_svc,
        };
        MetastoreServiceClient::new(tower_svc_stack)
    }
}
#[derive(Debug, Clone)]
struct MailboxAdapter<A: quickwit_actors::Actor, E> {
    inner: quickwit_actors::Mailbox<A>,
    phantom: std::marker::PhantomData<E>,
}
impl<A, E> std::ops::Deref for MailboxAdapter<A, E>
where
    A: quickwit_actors::Actor,
{
    type Target = quickwit_actors::Mailbox<A>;
    fn deref(&self) -> &Self::Target {
        &self.inner
    }
}
#[derive(Debug)]
pub struct MetastoreServiceMailbox<A: quickwit_actors::Actor> {
    inner: MailboxAdapter<A, crate::metastore::MetastoreError>,
}
impl<A: quickwit_actors::Actor> MetastoreServiceMailbox<A> {
    pub fn new(instance: quickwit_actors::Mailbox<A>) -> Self {
        let inner = MailboxAdapter {
            inner: instance,
            phantom: std::marker::PhantomData,
        };
        Self { inner }
    }
}
impl<A: quickwit_actors::Actor> Clone for MetastoreServiceMailbox<A> {
    fn clone(&self) -> Self {
        let inner = MailboxAdapter {
            inner: self.inner.clone(),
            phantom: std::marker::PhantomData,
        };
        Self { inner }
    }
}
impl<A, M, T, E> tower::Service<M> for MetastoreServiceMailbox<A>
where
    A: quickwit_actors::Actor
        + quickwit_actors::DeferableReplyHandler<M, Reply = Result<T, E>> + Send
        + 'static,
    M: std::fmt::Debug + Send + 'static,
    T: Send + 'static,
    E: std::fmt::Debug + Send + 'static,
    crate::metastore::MetastoreError: From<quickwit_actors::AskError<E>>,
{
    type Response = T;
    type Error = crate::metastore::MetastoreError;
    type Future = BoxFuture<Self::Response, Self::Error>;
    fn poll_ready(
        &mut self,
        _cx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Result<(), Self::Error>> {
        //! This does not work with balance middlewares such as `tower::balance::pool::Pool` because
        //! this always returns `Poll::Ready`. The fix is to acquire a permit from the
        //! mailbox in `poll_ready` and consume it in `call`.
        std::task::Poll::Ready(Ok(()))
    }
    fn call(&mut self, message: M) -> Self::Future {
        let mailbox = self.inner.clone();
        let fut = async move {
            mailbox.ask_for_res(message).await.map_err(|error| error.into())
        };
        Box::pin(fut)
    }
}
#[async_trait::async_trait]
impl<A> MetastoreService for MetastoreServiceMailbox<A>
where
    A: quickwit_actors::Actor + std::fmt::Debug,
    MetastoreServiceMailbox<
        A,
    >: tower::Service<
            CreateIndexRequest,
            Response = CreateIndexResponse,
            Error = crate::metastore::MetastoreError,
            Future = BoxFuture<CreateIndexResponse, crate::metastore::MetastoreError>,
        >
        + tower::Service<
            UpdateIndexRequest,
            Response = IndexMetadataResponse,
            Error = crate::metastore::MetastoreError,
            Future = BoxFuture<IndexMetadataResponse, crate::metastore::MetastoreError>,
        >
        + tower::Service<
            IndexMetadataRequest,
            Response = IndexMetadataResponse,
            Error = crate::metastore::MetastoreError,
            Future = BoxFuture<IndexMetadataResponse, crate::metastore::MetastoreError>,
        >
        + tower::Service<
            IndexesMetadataRequest,
            Response = IndexesMetadataResponse,
            Error = crate::metastore::MetastoreError,
            Future = BoxFuture<IndexesMetadataResponse, crate::metastore::MetastoreError>,
        >
        + tower::Service<
            ListIndexesMetadataRequest,
            Response = ListIndexesMetadataResponse,
            Error = crate::metastore::MetastoreError,
            Future = BoxFuture<
                ListIndexesMetadataResponse,
                crate::metastore::MetastoreError,
            >,
        >
        + tower::Service<
            DeleteIndexRequest,
            Response = EmptyResponse,
            Error = crate::metastore::MetastoreError,
            Future = BoxFuture<EmptyResponse, crate::metastore::MetastoreError>,
        >
        + tower::Service<
            ListIndexStatsRequest,
            Response = ListIndexStatsResponse,
            Error = crate::metastore::MetastoreError,
            Future = BoxFuture<ListIndexStatsResponse, crate::metastore::MetastoreError>,
        >
        + tower::Service<
            ListSplitsRequest,
            Response = MetastoreServiceStream<ListSplitsResponse>,
            Error = crate::metastore::MetastoreError,
            Future = BoxFuture<
                MetastoreServiceStream<ListSplitsResponse>,
                crate::metastore::MetastoreError,
            >,
        >
        + tower::Service<
            StageSplitsRequest,
            Response = EmptyResponse,
            Error = crate::metastore::MetastoreError,
            Future = BoxFuture<EmptyResponse, crate::metastore::MetastoreError>,
        >
        + tower::Service<
            PublishSplitsRequest,
            Response = EmptyResponse,
            Error = crate::metastore::MetastoreError,
            Future = BoxFuture<EmptyResponse, crate::metastore::MetastoreError>,
        >
        + tower::Service<
            MarkSplitsForDeletionRequest,
            Response = EmptyResponse,
            Error = crate::metastore::MetastoreError,
            Future = BoxFuture<EmptyResponse, crate::metastore::MetastoreError>,
        >
        + tower::Service<
            DeleteSplitsRequest,
            Response = EmptyResponse,
            Error = crate::metastore::MetastoreError,
            Future = BoxFuture<EmptyResponse, crate::metastore::MetastoreError>,
        >
        + tower::Service<
            AddSourceRequest,
            Response = EmptyResponse,
            Error = crate::metastore::MetastoreError,
            Future = BoxFuture<EmptyResponse, crate::metastore::MetastoreError>,
        >
        + tower::Service<
            UpdateSourceRequest,
            Response = EmptyResponse,
            Error = crate::metastore::MetastoreError,
            Future = BoxFuture<EmptyResponse, crate::metastore::MetastoreError>,
        >
        + tower::Service<
            ToggleSourceRequest,
            Response = EmptyResponse,
            Error = crate::metastore::MetastoreError,
            Future = BoxFuture<EmptyResponse, crate::metastore::MetastoreError>,
        >
        + tower::Service<
            DeleteSourceRequest,
            Response = EmptyResponse,
            Error = crate::metastore::MetastoreError,
            Future = BoxFuture<EmptyResponse, crate::metastore::MetastoreError>,
        >
        + tower::Service<
            ResetSourceCheckpointRequest,
            Response = EmptyResponse,
            Error = crate::metastore::MetastoreError,
            Future = BoxFuture<EmptyResponse, crate::metastore::MetastoreError>,
        >
        + tower::Service<
            LastDeleteOpstampRequest,
            Response = LastDeleteOpstampResponse,
            Error = crate::metastore::MetastoreError,
            Future = BoxFuture<
                LastDeleteOpstampResponse,
                crate::metastore::MetastoreError,
            >,
        >
        + tower::Service<
            DeleteQuery,
            Response = DeleteTask,
            Error = crate::metastore::MetastoreError,
            Future = BoxFuture<DeleteTask, crate::metastore::MetastoreError>,
        >
        + tower::Service<
            UpdateSplitsDeleteOpstampRequest,
            Response = UpdateSplitsDeleteOpstampResponse,
            Error = crate::metastore::MetastoreError,
            Future = BoxFuture<
                UpdateSplitsDeleteOpstampResponse,
                crate::metastore::MetastoreError,
            >,
        >
        + tower::Service<
            ListDeleteTasksRequest,
            Response = ListDeleteTasksResponse,
            Error = crate::metastore::MetastoreError,
            Future = BoxFuture<ListDeleteTasksResponse, crate::metastore::MetastoreError>,
        >
        + tower::Service<
            ListStaleSplitsRequest,
            Response = ListSplitsResponse,
            Error = crate::metastore::MetastoreError,
            Future = BoxFuture<ListSplitsResponse, crate::metastore::MetastoreError>,
        >
        + tower::Service<
            OpenShardsRequest,
            Response = OpenShardsResponse,
            Error = crate::metastore::MetastoreError,
            Future = BoxFuture<OpenShardsResponse, crate::metastore::MetastoreError>,
        >
        + tower::Service<
            AcquireShardsRequest,
            Response = AcquireShardsResponse,
            Error = crate::metastore::MetastoreError,
            Future = BoxFuture<AcquireShardsResponse, crate::metastore::MetastoreError>,
        >
        + tower::Service<
            DeleteShardsRequest,
            Response = DeleteShardsResponse,
            Error = crate::metastore::MetastoreError,
            Future = BoxFuture<DeleteShardsResponse, crate::metastore::MetastoreError>,
        >
        + tower::Service<
            PruneShardsRequest,
            Response = EmptyResponse,
            Error = crate::metastore::MetastoreError,
            Future = BoxFuture<EmptyResponse, crate::metastore::MetastoreError>,
        >
        + tower::Service<
            ListShardsRequest,
            Response = ListShardsResponse,
            Error = crate::metastore::MetastoreError,
            Future = BoxFuture<ListShardsResponse, crate::metastore::MetastoreError>,
        >
        + tower::Service<
            CreateIndexTemplateRequest,
            Response = EmptyResponse,
            Error = crate::metastore::MetastoreError,
            Future = BoxFuture<EmptyResponse, crate::metastore::MetastoreError>,
        >
        + tower::Service<
            GetIndexTemplateRequest,
            Response = GetIndexTemplateResponse,
            Error = crate::metastore::MetastoreError,
            Future = BoxFuture<
                GetIndexTemplateResponse,
                crate::metastore::MetastoreError,
            >,
        >
        + tower::Service<
            FindIndexTemplateMatchesRequest,
            Response = FindIndexTemplateMatchesResponse,
            Error = crate::metastore::MetastoreError,
            Future = BoxFuture<
                FindIndexTemplateMatchesResponse,
                crate::metastore::MetastoreError,
            >,
        >
        + tower::Service<
            ListIndexTemplatesRequest,
            Response = ListIndexTemplatesResponse,
            Error = crate::metastore::MetastoreError,
            Future = BoxFuture<
                ListIndexTemplatesResponse,
                crate::metastore::MetastoreError,
            >,
        >
        + tower::Service<
            DeleteIndexTemplatesRequest,
            Response = EmptyResponse,
            Error = crate::metastore::MetastoreError,
            Future = BoxFuture<EmptyResponse, crate::metastore::MetastoreError>,
        >
        + tower::Service<
            GetClusterIdentityRequest,
            Response = GetClusterIdentityResponse,
            Error = crate::metastore::MetastoreError,
            Future = BoxFuture<
                GetClusterIdentityResponse,
                crate::metastore::MetastoreError,
            >,
        >,
{
    async fn create_index(
        &self,
        request: CreateIndexRequest,
    ) -> crate::metastore::MetastoreResult<CreateIndexResponse> {
        self.clone().call(request).await
    }
    async fn update_index(
        &self,
        request: UpdateIndexRequest,
    ) -> crate::metastore::MetastoreResult<IndexMetadataResponse> {
        self.clone().call(request).await
    }
    async fn index_metadata(
        &self,
        request: IndexMetadataRequest,
    ) -> crate::metastore::MetastoreResult<IndexMetadataResponse> {
        self.clone().call(request).await
    }
    async fn indexes_metadata(
        &self,
        request: IndexesMetadataRequest,
    ) -> crate::metastore::MetastoreResult<IndexesMetadataResponse> {
        self.clone().call(request).await
    }
    async fn list_indexes_metadata(
        &self,
        request: ListIndexesMetadataRequest,
    ) -> crate::metastore::MetastoreResult<ListIndexesMetadataResponse> {
        self.clone().call(request).await
    }
    async fn delete_index(
        &self,
        request: DeleteIndexRequest,
    ) -> crate::metastore::MetastoreResult<EmptyResponse> {
        self.clone().call(request).await
    }
    async fn list_index_stats(
        &self,
        request: ListIndexStatsRequest,
    ) -> crate::metastore::MetastoreResult<ListIndexStatsResponse> {
        self.clone().call(request).await
    }
    async fn list_splits(
        &self,
        request: ListSplitsRequest,
    ) -> crate::metastore::MetastoreResult<MetastoreServiceStream<ListSplitsResponse>> {
        self.clone().call(request).await
    }
    async fn stage_splits(
        &self,
        request: StageSplitsRequest,
    ) -> crate::metastore::MetastoreResult<EmptyResponse> {
        self.clone().call(request).await
    }
    async fn publish_splits(
        &self,
        request: PublishSplitsRequest,
    ) -> crate::metastore::MetastoreResult<EmptyResponse> {
        self.clone().call(request).await
    }
    async fn mark_splits_for_deletion(
        &self,
        request: MarkSplitsForDeletionRequest,
    ) -> crate::metastore::MetastoreResult<EmptyResponse> {
        self.clone().call(request).await
    }
    async fn delete_splits(
        &self,
        request: DeleteSplitsRequest,
    ) -> crate::metastore::MetastoreResult<EmptyResponse> {
        self.clone().call(request).await
    }
    async fn add_source(
        &self,
        request: AddSourceRequest,
    ) -> crate::metastore::MetastoreResult<EmptyResponse> {
        self.clone().call(request).await
    }
    async fn update_source(
        &self,
        request: UpdateSourceRequest,
    ) -> crate::metastore::MetastoreResult<EmptyResponse> {
        self.clone().call(request).await
    }
    async fn toggle_source(
        &self,
        request: ToggleSourceRequest,
    ) -> crate::metastore::MetastoreResult<EmptyResponse> {
        self.clone().call(request).await
    }
    async fn delete_source(
        &self,
        request: DeleteSourceRequest,
    ) -> crate::metastore::MetastoreResult<EmptyResponse> {
        self.clone().call(request).await
    }
    async fn reset_source_checkpoint(
        &self,
        request: ResetSourceCheckpointRequest,
    ) -> crate::metastore::MetastoreResult<EmptyResponse> {
        self.clone().call(request).await
    }
    async fn last_delete_opstamp(
        &self,
        request: LastDeleteOpstampRequest,
    ) -> crate::metastore::MetastoreResult<LastDeleteOpstampResponse> {
        self.clone().call(request).await
    }
    async fn create_delete_task(
        &self,
        request: DeleteQuery,
    ) -> crate::metastore::MetastoreResult<DeleteTask> {
        self.clone().call(request).await
    }
    async fn update_splits_delete_opstamp(
        &self,
        request: UpdateSplitsDeleteOpstampRequest,
    ) -> crate::metastore::MetastoreResult<UpdateSplitsDeleteOpstampResponse> {
        self.clone().call(request).await
    }
    async fn list_delete_tasks(
        &self,
        request: ListDeleteTasksRequest,
    ) -> crate::metastore::MetastoreResult<ListDeleteTasksResponse> {
        self.clone().call(request).await
    }
    async fn list_stale_splits(
        &self,
        request: ListStaleSplitsRequest,
    ) -> crate::metastore::MetastoreResult<ListSplitsResponse> {
        self.clone().call(request).await
    }
    async fn open_shards(
        &self,
        request: OpenShardsRequest,
    ) -> crate::metastore::MetastoreResult<OpenShardsResponse> {
        self.clone().call(request).await
    }
    async fn acquire_shards(
        &self,
        request: AcquireShardsRequest,
    ) -> crate::metastore::MetastoreResult<AcquireShardsResponse> {
        self.clone().call(request).await
    }
    async fn delete_shards(
        &self,
        request: DeleteShardsRequest,
    ) -> crate::metastore::MetastoreResult<DeleteShardsResponse> {
        self.clone().call(request).await
    }
    async fn prune_shards(
        &self,
        request: PruneShardsRequest,
    ) -> crate::metastore::MetastoreResult<EmptyResponse> {
        self.clone().call(request).await
    }
    async fn list_shards(
        &self,
        request: ListShardsRequest,
    ) -> crate::metastore::MetastoreResult<ListShardsResponse> {
        self.clone().call(request).await
    }
    async fn create_index_template(
        &self,
        request: CreateIndexTemplateRequest,
    ) -> crate::metastore::MetastoreResult<EmptyResponse> {
        self.clone().call(request).await
    }
    async fn get_index_template(
        &self,
        request: GetIndexTemplateRequest,
    ) -> crate::metastore::MetastoreResult<GetIndexTemplateResponse> {
        self.clone().call(request).await
    }
    async fn find_index_template_matches(
        &self,
        request: FindIndexTemplateMatchesRequest,
    ) -> crate::metastore::MetastoreResult<FindIndexTemplateMatchesResponse> {
        self.clone().call(request).await
    }
    async fn list_index_templates(
        &self,
        request: ListIndexTemplatesRequest,
    ) -> crate::metastore::MetastoreResult<ListIndexTemplatesResponse> {
        self.clone().call(request).await
    }
    async fn delete_index_templates(
        &self,
        request: DeleteIndexTemplatesRequest,
    ) -> crate::metastore::MetastoreResult<EmptyResponse> {
        self.clone().call(request).await
    }
    async fn get_cluster_identity(
        &self,
        request: GetClusterIdentityRequest,
    ) -> crate::metastore::MetastoreResult<GetClusterIdentityResponse> {
        self.clone().call(request).await
    }
    async fn check_connectivity(&self) -> anyhow::Result<()> {
        if self.inner.is_disconnected() {
            anyhow::bail!("actor `{}` is disconnected", self.inner.actor_instance_id())
        }
        Ok(())
    }
    fn endpoints(&self) -> Vec<quickwit_common::uri::Uri> {
        vec![
            quickwit_common::uri::Uri::from_str(& format!("actor://localhost/{}", self
            .inner.actor_instance_id())).expect("URI should be valid")
        ]
    }
}
#[derive(Debug, Clone)]
pub struct MetastoreServiceGrpcClientAdapter<T> {
    inner: T,
    #[allow(dead_code)]
    connection_addrs_rx: tokio::sync::watch::Receiver<
        std::collections::HashSet<std::net::SocketAddr>,
    >,
}
impl<T> MetastoreServiceGrpcClientAdapter<T> {
    pub fn new(
        instance: T,
        connection_addrs_rx: tokio::sync::watch::Receiver<
            std::collections::HashSet<std::net::SocketAddr>,
        >,
    ) -> Self {
        Self {
            inner: instance,
            connection_addrs_rx,
        }
    }
}
#[async_trait::async_trait]
impl<T> MetastoreService
for MetastoreServiceGrpcClientAdapter<
    metastore_service_grpc_client::MetastoreServiceGrpcClient<T>,
>
where
    T: tonic::client::GrpcService<tonic::body::Body> + std::fmt::Debug + Clone + Send
        + Sync + 'static,
    T::ResponseBody: tonic::codegen::Body<Data = tonic::codegen::Bytes> + Send + 'static,
    <T::ResponseBody as tonic::codegen::Body>::Error: Into<tonic::codegen::StdError>
        + Send,
    T::Future: Send,
{
    async fn create_index(
        &self,
        request: CreateIndexRequest,
    ) -> crate::metastore::MetastoreResult<CreateIndexResponse> {
        self.inner
            .clone()
            .create_index(request)
            .await
            .map(|response| response.into_inner())
            .map_err(|status| crate::error::grpc_status_to_service_error(
                status,
                CreateIndexRequest::rpc_name(),
            ))
    }
    async fn update_index(
        &self,
        request: UpdateIndexRequest,
    ) -> crate::metastore::MetastoreResult<IndexMetadataResponse> {
        self.inner
            .clone()
            .update_index(request)
            .await
            .map(|response| response.into_inner())
            .map_err(|status| crate::error::grpc_status_to_service_error(
                status,
                UpdateIndexRequest::rpc_name(),
            ))
    }
    async fn index_metadata(
        &self,
        request: IndexMetadataRequest,
    ) -> crate::metastore::MetastoreResult<IndexMetadataResponse> {
        self.inner
            .clone()
            .index_metadata(request)
            .await
            .map(|response| response.into_inner())
            .map_err(|status| crate::error::grpc_status_to_service_error(
                status,
                IndexMetadataRequest::rpc_name(),
            ))
    }
    async fn indexes_metadata(
        &self,
        request: IndexesMetadataRequest,
    ) -> crate::metastore::MetastoreResult<IndexesMetadataResponse> {
        self.inner
            .clone()
            .indexes_metadata(request)
            .await
            .map(|response| response.into_inner())
            .map_err(|status| crate::error::grpc_status_to_service_error(
                status,
                IndexesMetadataRequest::rpc_name(),
            ))
    }
    async fn list_indexes_metadata(
        &self,
        request: ListIndexesMetadataRequest,
    ) -> crate::metastore::MetastoreResult<ListIndexesMetadataResponse> {
        self.inner
            .clone()
            .list_indexes_metadata(request)
            .await
            .map(|response| response.into_inner())
            .map_err(|status| crate::error::grpc_status_to_service_error(
                status,
                ListIndexesMetadataRequest::rpc_name(),
            ))
    }
    async fn delete_index(
        &self,
        request: DeleteIndexRequest,
    ) -> crate::metastore::MetastoreResult<EmptyResponse> {
        self.inner
            .clone()
            .delete_index(request)
            .await
            .map(|response| response.into_inner())
            .map_err(|status| crate::error::grpc_status_to_service_error(
                status,
                DeleteIndexRequest::rpc_name(),
            ))
    }
    async fn list_index_stats(
        &self,
        request: ListIndexStatsRequest,
    ) -> crate::metastore::MetastoreResult<ListIndexStatsResponse> {
        self.inner
            .clone()
            .list_index_stats(request)
            .await
            .map(|response| response.into_inner())
            .map_err(|status| crate::error::grpc_status_to_service_error(
                status,
                ListIndexStatsRequest::rpc_name(),
            ))
    }
    async fn list_splits(
        &self,
        request: ListSplitsRequest,
    ) -> crate::metastore::MetastoreResult<MetastoreServiceStream<ListSplitsResponse>> {
        self.inner
            .clone()
            .list_splits(request)
            .await
            .map(|response| {
                let streaming: tonic::Streaming<_> = response.into_inner();
                let stream = quickwit_common::ServiceStream::from(streaming);
                stream
                    .map_err(|status| crate::error::grpc_status_to_service_error(
                        status,
                        ListSplitsRequest::rpc_name(),
                    ))
            })
            .map_err(|status| crate::error::grpc_status_to_service_error(
                status,
                ListSplitsRequest::rpc_name(),
            ))
    }
    async fn stage_splits(
        &self,
        request: StageSplitsRequest,
    ) -> crate::metastore::MetastoreResult<EmptyResponse> {
        self.inner
            .clone()
            .stage_splits(request)
            .await
            .map(|response| response.into_inner())
            .map_err(|status| crate::error::grpc_status_to_service_error(
                status,
                StageSplitsRequest::rpc_name(),
            ))
    }
    async fn publish_splits(
        &self,
        request: PublishSplitsRequest,
    ) -> crate::metastore::MetastoreResult<EmptyResponse> {
        self.inner
            .clone()
            .publish_splits(request)
            .await
            .map(|response| response.into_inner())
            .map_err(|status| crate::error::grpc_status_to_service_error(
                status,
                PublishSplitsRequest::rpc_name(),
            ))
    }
    async fn mark_splits_for_deletion(
        &self,
        request: MarkSplitsForDeletionRequest,
    ) -> crate::metastore::MetastoreResult<EmptyResponse> {
        self.inner
            .clone()
            .mark_splits_for_deletion(request)
            .await
            .map(|response| response.into_inner())
            .map_err(|status| crate::error::grpc_status_to_service_error(
                status,
                MarkSplitsForDeletionRequest::rpc_name(),
            ))
    }
    async fn delete_splits(
        &self,
        request: DeleteSplitsRequest,
    ) -> crate::metastore::MetastoreResult<EmptyResponse> {
        self.inner
            .clone()
            .delete_splits(request)
            .await
            .map(|response| response.into_inner())
            .map_err(|status| crate::error::grpc_status_to_service_error(
                status,
                DeleteSplitsRequest::rpc_name(),
            ))
    }
    async fn add_source(
        &self,
        request: AddSourceRequest,
    ) -> crate::metastore::MetastoreResult<EmptyResponse> {
        self.inner
            .clone()
            .add_source(request)
            .await
            .map(|response| response.into_inner())
            .map_err(|status| crate::error::grpc_status_to_service_error(
                status,
                AddSourceRequest::rpc_name(),
            ))
    }
    async fn update_source(
        &self,
        request: UpdateSourceRequest,
    ) -> crate::metastore::MetastoreResult<EmptyResponse> {
        self.inner
            .clone()
            .update_source(request)
            .await
            .map(|response| response.into_inner())
            .map_err(|status| crate::error::grpc_status_to_service_error(
                status,
                UpdateSourceRequest::rpc_name(),
            ))
    }
    async fn toggle_source(
        &self,
        request: ToggleSourceRequest,
    ) -> crate::metastore::MetastoreResult<EmptyResponse> {
        self.inner
            .clone()
            .toggle_source(request)
            .await
            .map(|response| response.into_inner())
            .map_err(|status| crate::error::grpc_status_to_service_error(
                status,
                ToggleSourceRequest::rpc_name(),
            ))
    }
    async fn delete_source(
        &self,
        request: DeleteSourceRequest,
    ) -> crate::metastore::MetastoreResult<EmptyResponse> {
        self.inner
            .clone()
            .delete_source(request)
            .await
            .map(|response| response.into_inner())
            .map_err(|status| crate::error::grpc_status_to_service_error(
                status,
                DeleteSourceRequest::rpc_name(),
            ))
    }
    async fn reset_source_checkpoint(
        &self,
        request: ResetSourceCheckpointRequest,
    ) -> crate::metastore::MetastoreResult<EmptyResponse> {
        self.inner
            .clone()
            .reset_source_checkpoint(request)
            .await
            .map(|response| response.into_inner())
            .map_err(|status| crate::error::grpc_status_to_service_error(
                status,
                ResetSourceCheckpointRequest::rpc_name(),
            ))
    }
    async fn last_delete_opstamp(
        &self,
        request: LastDeleteOpstampRequest,
    ) -> crate::metastore::MetastoreResult<LastDeleteOpstampResponse> {
        self.inner
            .clone()
            .last_delete_opstamp(request)
            .await
            .map(|response| response.into_inner())
            .map_err(|status| crate::error::grpc_status_to_service_error(
                status,
                LastDeleteOpstampRequest::rpc_name(),
            ))
    }
    async fn create_delete_task(
        &self,
        request: DeleteQuery,
    ) -> crate::metastore::MetastoreResult<DeleteTask> {
        self.inner
            .clone()
            .create_delete_task(request)
            .await
            .map(|response| response.into_inner())
            .map_err(|status| crate::error::grpc_status_to_service_error(
                status,
                DeleteQuery::rpc_name(),
            ))
    }
    async fn update_splits_delete_opstamp(
        &self,
        request: UpdateSplitsDeleteOpstampRequest,
    ) -> crate::metastore::MetastoreResult<UpdateSplitsDeleteOpstampResponse> {
        self.inner
            .clone()
            .update_splits_delete_opstamp(request)
            .await
            .map(|response| response.into_inner())
            .map_err(|status| crate::error::grpc_status_to_service_error(
                status,
                UpdateSplitsDeleteOpstampRequest::rpc_name(),
            ))
    }
    async fn list_delete_tasks(
        &self,
        request: ListDeleteTasksRequest,
    ) -> crate::metastore::MetastoreResult<ListDeleteTasksResponse> {
        self.inner
            .clone()
            .list_delete_tasks(request)
            .await
            .map(|response| response.into_inner())
            .map_err(|status| crate::error::grpc_status_to_service_error(
                status,
                ListDeleteTasksRequest::rpc_name(),
            ))
    }
    async fn list_stale_splits(
        &self,
        request: ListStaleSplitsRequest,
    ) -> crate::metastore::MetastoreResult<ListSplitsResponse> {
        self.inner
            .clone()
            .list_stale_splits(request)
            .await
            .map(|response| response.into_inner())
            .map_err(|status| crate::error::grpc_status_to_service_error(
                status,
                ListStaleSplitsRequest::rpc_name(),
            ))
    }
    async fn open_shards(
        &self,
        request: OpenShardsRequest,
    ) -> crate::metastore::MetastoreResult<OpenShardsResponse> {
        self.inner
            .clone()
            .open_shards(request)
            .await
            .map(|response| response.into_inner())
            .map_err(|status| crate::error::grpc_status_to_service_error(
                status,
                OpenShardsRequest::rpc_name(),
            ))
    }
    async fn acquire_shards(
        &self,
        request: AcquireShardsRequest,
    ) -> crate::metastore::MetastoreResult<AcquireShardsResponse> {
        self.inner
            .clone()
            .acquire_shards(request)
            .await
            .map(|response| response.into_inner())
            .map_err(|status| crate::error::grpc_status_to_service_error(
                status,
                AcquireShardsRequest::rpc_name(),
            ))
    }
    async fn delete_shards(
        &self,
        request: DeleteShardsRequest,
    ) -> crate::metastore::MetastoreResult<DeleteShardsResponse> {
        self.inner
            .clone()
            .delete_shards(request)
            .await
            .map(|response| response.into_inner())
            .map_err(|status| crate::error::grpc_status_to_service_error(
                status,
                DeleteShardsRequest::rpc_name(),
            ))
    }
    async fn prune_shards(
        &self,
        request: PruneShardsRequest,
    ) -> crate::metastore::MetastoreResult<EmptyResponse> {
        self.inner
            .clone()
            .prune_shards(request)
            .await
            .map(|response| response.into_inner())
            .map_err(|status| crate::error::grpc_status_to_service_error(
                status,
                PruneShardsRequest::rpc_name(),
            ))
    }
    async fn list_shards(
        &self,
        request: ListShardsRequest,
    ) -> crate::metastore::MetastoreResult<ListShardsResponse> {
        self.inner
            .clone()
            .list_shards(request)
            .await
            .map(|response| response.into_inner())
            .map_err(|status| crate::error::grpc_status_to_service_error(
                status,
                ListShardsRequest::rpc_name(),
            ))
    }
    async fn create_index_template(
        &self,
        request: CreateIndexTemplateRequest,
    ) -> crate::metastore::MetastoreResult<EmptyResponse> {
        self.inner
            .clone()
            .create_index_template(request)
            .await
            .map(|response| response.into_inner())
            .map_err(|status| crate::error::grpc_status_to_service_error(
                status,
                CreateIndexTemplateRequest::rpc_name(),
            ))
    }
    async fn get_index_template(
        &self,
        request: GetIndexTemplateRequest,
    ) -> crate::metastore::MetastoreResult<GetIndexTemplateResponse> {
        self.inner
            .clone()
            .get_index_template(request)
            .await
            .map(|response| response.into_inner())
            .map_err(|status| crate::error::grpc_status_to_service_error(
                status,
                GetIndexTemplateRequest::rpc_name(),
            ))
    }
    async fn find_index_template_matches(
        &self,
        request: FindIndexTemplateMatchesRequest,
    ) -> crate::metastore::MetastoreResult<FindIndexTemplateMatchesResponse> {
        self.inner
            .clone()
            .find_index_template_matches(request)
            .await
            .map(|response| response.into_inner())
            .map_err(|status| crate::error::grpc_status_to_service_error(
                status,
                FindIndexTemplateMatchesRequest::rpc_name(),
            ))
    }
    async fn list_index_templates(
        &self,
        request: ListIndexTemplatesRequest,
    ) -> crate::metastore::MetastoreResult<ListIndexTemplatesResponse> {
        self.inner
            .clone()
            .list_index_templates(request)
            .await
            .map(|response| response.into_inner())
            .map_err(|status| crate::error::grpc_status_to_service_error(
                status,
                ListIndexTemplatesRequest::rpc_name(),
            ))
    }
    async fn delete_index_templates(
        &self,
        request: DeleteIndexTemplatesRequest,
    ) -> crate::metastore::MetastoreResult<EmptyResponse> {
        self.inner
            .clone()
            .delete_index_templates(request)
            .await
            .map(|response| response.into_inner())
            .map_err(|status| crate::error::grpc_status_to_service_error(
                status,
                DeleteIndexTemplatesRequest::rpc_name(),
            ))
    }
    async fn get_cluster_identity(
        &self,
        request: GetClusterIdentityRequest,
    ) -> crate::metastore::MetastoreResult<GetClusterIdentityResponse> {
        self.inner
            .clone()
            .get_cluster_identity(request)
            .await
            .map(|response| response.into_inner())
            .map_err(|status| crate::error::grpc_status_to_service_error(
                status,
                GetClusterIdentityRequest::rpc_name(),
            ))
    }
    async fn check_connectivity(&self) -> anyhow::Result<()> {
        if self.connection_addrs_rx.borrow().is_empty() {
            anyhow::bail!("no server currently available")
        }
        Ok(())
    }
    fn endpoints(&self) -> Vec<quickwit_common::uri::Uri> {
        self.connection_addrs_rx
            .borrow()
            .iter()
            .flat_map(|addr| quickwit_common::uri::Uri::from_str(
                &format!("grpc://{addr}/{}.{}", "quickwit.metastore", "MetastoreService"),
            ))
            .collect()
    }
}
#[derive(Debug)]
pub struct MetastoreServiceGrpcServerAdapter {
    inner: InnerMetastoreServiceClient,
}
impl MetastoreServiceGrpcServerAdapter {
    pub fn new<T>(instance: T) -> Self
    where
        T: MetastoreService,
    {
        Self {
            inner: InnerMetastoreServiceClient(std::sync::Arc::new(instance)),
        }
    }
}
#[async_trait::async_trait]
impl metastore_service_grpc_server::MetastoreServiceGrpc
for MetastoreServiceGrpcServerAdapter {
    async fn create_index(
        &self,
        request: tonic::Request<CreateIndexRequest>,
    ) -> Result<tonic::Response<CreateIndexResponse>, tonic::Status> {
        self.inner
            .0
            .create_index(request.into_inner())
            .await
            .map(tonic::Response::new)
            .map_err(crate::error::grpc_error_to_grpc_status)
    }
    async fn update_index(
        &self,
        request: tonic::Request<UpdateIndexRequest>,
    ) -> Result<tonic::Response<IndexMetadataResponse>, tonic::Status> {
        self.inner
            .0
            .update_index(request.into_inner())
            .await
            .map(tonic::Response::new)
            .map_err(crate::error::grpc_error_to_grpc_status)
    }
    async fn index_metadata(
        &self,
        request: tonic::Request<IndexMetadataRequest>,
    ) -> Result<tonic::Response<IndexMetadataResponse>, tonic::Status> {
        self.inner
            .0
            .index_metadata(request.into_inner())
            .await
            .map(tonic::Response::new)
            .map_err(crate::error::grpc_error_to_grpc_status)
    }
    async fn indexes_metadata(
        &self,
        request: tonic::Request<IndexesMetadataRequest>,
    ) -> Result<tonic::Response<IndexesMetadataResponse>, tonic::Status> {
        self.inner
            .0
            .indexes_metadata(request.into_inner())
            .await
            .map(tonic::Response::new)
            .map_err(crate::error::grpc_error_to_grpc_status)
    }
    async fn list_indexes_metadata(
        &self,
        request: tonic::Request<ListIndexesMetadataRequest>,
    ) -> Result<tonic::Response<ListIndexesMetadataResponse>, tonic::Status> {
        self.inner
            .0
            .list_indexes_metadata(request.into_inner())
            .await
            .map(tonic::Response::new)
            .map_err(crate::error::grpc_error_to_grpc_status)
    }
    async fn delete_index(
        &self,
        request: tonic::Request<DeleteIndexRequest>,
    ) -> Result<tonic::Response<EmptyResponse>, tonic::Status> {
        self.inner
            .0
            .delete_index(request.into_inner())
            .await
            .map(tonic::Response::new)
            .map_err(crate::error::grpc_error_to_grpc_status)
    }
    async fn list_index_stats(
        &self,
        request: tonic::Request<ListIndexStatsRequest>,
    ) -> Result<tonic::Response<ListIndexStatsResponse>, tonic::Status> {
        self.inner
            .0
            .list_index_stats(request.into_inner())
            .await
            .map(tonic::Response::new)
            .map_err(crate::error::grpc_error_to_grpc_status)
    }
    type ListSplitsStream = quickwit_common::ServiceStream<
        tonic::Result<ListSplitsResponse>,
    >;
    async fn list_splits(
        &self,
        request: tonic::Request<ListSplitsRequest>,
    ) -> Result<tonic::Response<Self::ListSplitsStream>, tonic::Status> {
        self.inner
            .0
            .list_splits(request.into_inner())
            .await
            .map(|stream| tonic::Response::new(
                stream.map_err(crate::error::grpc_error_to_grpc_status),
            ))
            .map_err(crate::error::grpc_error_to_grpc_status)
    }
    async fn stage_splits(
        &self,
        request: tonic::Request<StageSplitsRequest>,
    ) -> Result<tonic::Response<EmptyResponse>, tonic::Status> {
        self.inner
            .0
            .stage_splits(request.into_inner())
            .await
            .map(tonic::Response::new)
            .map_err(crate::error::grpc_error_to_grpc_status)
    }
    async fn publish_splits(
        &self,
        request: tonic::Request<PublishSplitsRequest>,
    ) -> Result<tonic::Response<EmptyResponse>, tonic::Status> {
        self.inner
            .0
            .publish_splits(request.into_inner())
            .await
            .map(tonic::Response::new)
            .map_err(crate::error::grpc_error_to_grpc_status)
    }
    async fn mark_splits_for_deletion(
        &self,
        request: tonic::Request<MarkSplitsForDeletionRequest>,
    ) -> Result<tonic::Response<EmptyResponse>, tonic::Status> {
        self.inner
            .0
            .mark_splits_for_deletion(request.into_inner())
            .await
            .map(tonic::Response::new)
            .map_err(crate::error::grpc_error_to_grpc_status)
    }
    async fn delete_splits(
        &self,
        request: tonic::Request<DeleteSplitsRequest>,
    ) -> Result<tonic::Response<EmptyResponse>, tonic::Status> {
        self.inner
            .0
            .delete_splits(request.into_inner())
            .await
            .map(tonic::Response::new)
            .map_err(crate::error::grpc_error_to_grpc_status)
    }
    async fn add_source(
        &self,
        request: tonic::Request<AddSourceRequest>,
    ) -> Result<tonic::Response<EmptyResponse>, tonic::Status> {
        self.inner
            .0
            .add_source(request.into_inner())
            .await
            .map(tonic::Response::new)
            .map_err(crate::error::grpc_error_to_grpc_status)
    }
    async fn update_source(
        &self,
        request: tonic::Request<UpdateSourceRequest>,
    ) -> Result<tonic::Response<EmptyResponse>, tonic::Status> {
        self.inner
            .0
            .update_source(request.into_inner())
            .await
            .map(tonic::Response::new)
            .map_err(crate::error::grpc_error_to_grpc_status)
    }
    async fn toggle_source(
        &self,
        request: tonic::Request<ToggleSourceRequest>,
    ) -> Result<tonic::Response<EmptyResponse>, tonic::Status> {
        self.inner
            .0
            .toggle_source(request.into_inner())
            .await
            .map(tonic::Response::new)
            .map_err(crate::error::grpc_error_to_grpc_status)
    }
    async fn delete_source(
        &self,
        request: tonic::Request<DeleteSourceRequest>,
    ) -> Result<tonic::Response<EmptyResponse>, tonic::Status> {
        self.inner
            .0
            .delete_source(request.into_inner())
            .await
            .map(tonic::Response::new)
            .map_err(crate::error::grpc_error_to_grpc_status)
    }
    async fn reset_source_checkpoint(
        &self,
        request: tonic::Request<ResetSourceCheckpointRequest>,
    ) -> Result<tonic::Response<EmptyResponse>, tonic::Status> {
        self.inner
            .0
            .reset_source_checkpoint(request.into_inner())
            .await
            .map(tonic::Response::new)
            .map_err(crate::error::grpc_error_to_grpc_status)
    }
    async fn last_delete_opstamp(
        &self,
        request: tonic::Request<LastDeleteOpstampRequest>,
    ) -> Result<tonic::Response<LastDeleteOpstampResponse>, tonic::Status> {
        self.inner
            .0
            .last_delete_opstamp(request.into_inner())
            .await
            .map(tonic::Response::new)
            .map_err(crate::error::grpc_error_to_grpc_status)
    }
    async fn create_delete_task(
        &self,
        request: tonic::Request<DeleteQuery>,
    ) -> Result<tonic::Response<DeleteTask>, tonic::Status> {
        self.inner
            .0
            .create_delete_task(request.into_inner())
            .await
            .map(tonic::Response::new)
            .map_err(crate::error::grpc_error_to_grpc_status)
    }
    async fn update_splits_delete_opstamp(
        &self,
        request: tonic::Request<UpdateSplitsDeleteOpstampRequest>,
    ) -> Result<tonic::Response<UpdateSplitsDeleteOpstampResponse>, tonic::Status> {
        self.inner
            .0
            .update_splits_delete_opstamp(request.into_inner())
            .await
            .map(tonic::Response::new)
            .map_err(crate::error::grpc_error_to_grpc_status)
    }
    async fn list_delete_tasks(
        &self,
        request: tonic::Request<ListDeleteTasksRequest>,
    ) -> Result<tonic::Response<ListDeleteTasksResponse>, tonic::Status> {
        self.inner
            .0
            .list_delete_tasks(request.into_inner())
            .await
            .map(tonic::Response::new)
            .map_err(crate::error::grpc_error_to_grpc_status)
    }
    async fn list_stale_splits(
        &self,
        request: tonic::Request<ListStaleSplitsRequest>,
    ) -> Result<tonic::Response<ListSplitsResponse>, tonic::Status> {
        self.inner
            .0
            .list_stale_splits(request.into_inner())
            .await
            .map(tonic::Response::new)
            .map_err(crate::error::grpc_error_to_grpc_status)
    }
    async fn open_shards(
        &self,
        request: tonic::Request<OpenShardsRequest>,
    ) -> Result<tonic::Response<OpenShardsResponse>, tonic::Status> {
        self.inner
            .0
            .open_shards(request.into_inner())
            .await
            .map(tonic::Response::new)
            .map_err(crate::error::grpc_error_to_grpc_status)
    }
    async fn acquire_shards(
        &self,
        request: tonic::Request<AcquireShardsRequest>,
    ) -> Result<tonic::Response<AcquireShardsResponse>, tonic::Status> {
        self.inner
            .0
            .acquire_shards(request.into_inner())
            .await
            .map(tonic::Response::new)
            .map_err(crate::error::grpc_error_to_grpc_status)
    }
    async fn delete_shards(
        &self,
        request: tonic::Request<DeleteShardsRequest>,
    ) -> Result<tonic::Response<DeleteShardsResponse>, tonic::Status> {
        self.inner
            .0
            .delete_shards(request.into_inner())
            .await
            .map(tonic::Response::new)
            .map_err(crate::error::grpc_error_to_grpc_status)
    }
    async fn prune_shards(
        &self,
        request: tonic::Request<PruneShardsRequest>,
    ) -> Result<tonic::Response<EmptyResponse>, tonic::Status> {
        self.inner
            .0
            .prune_shards(request.into_inner())
            .await
            .map(tonic::Response::new)
            .map_err(crate::error::grpc_error_to_grpc_status)
    }
    async fn list_shards(
        &self,
        request: tonic::Request<ListShardsRequest>,
    ) -> Result<tonic::Response<ListShardsResponse>, tonic::Status> {
        self.inner
            .0
            .list_shards(request.into_inner())
            .await
            .map(tonic::Response::new)
            .map_err(crate::error::grpc_error_to_grpc_status)
    }
    async fn create_index_template(
        &self,
        request: tonic::Request<CreateIndexTemplateRequest>,
    ) -> Result<tonic::Response<EmptyResponse>, tonic::Status> {
        self.inner
            .0
            .create_index_template(request.into_inner())
            .await
            .map(tonic::Response::new)
            .map_err(crate::error::grpc_error_to_grpc_status)
    }
    async fn get_index_template(
        &self,
        request: tonic::Request<GetIndexTemplateRequest>,
    ) -> Result<tonic::Response<GetIndexTemplateResponse>, tonic::Status> {
        self.inner
            .0
            .get_index_template(request.into_inner())
            .await
            .map(tonic::Response::new)
            .map_err(crate::error::grpc_error_to_grpc_status)
    }
    async fn find_index_template_matches(
        &self,
        request: tonic::Request<FindIndexTemplateMatchesRequest>,
    ) -> Result<tonic::Response<FindIndexTemplateMatchesResponse>, tonic::Status> {
        self.inner
            .0
            .find_index_template_matches(request.into_inner())
            .await
            .map(tonic::Response::new)
            .map_err(crate::error::grpc_error_to_grpc_status)
    }
    async fn list_index_templates(
        &self,
        request: tonic::Request<ListIndexTemplatesRequest>,
    ) -> Result<tonic::Response<ListIndexTemplatesResponse>, tonic::Status> {
        self.inner
            .0
            .list_index_templates(request.into_inner())
            .await
            .map(tonic::Response::new)
            .map_err(crate::error::grpc_error_to_grpc_status)
    }
    async fn delete_index_templates(
        &self,
        request: tonic::Request<DeleteIndexTemplatesRequest>,
    ) -> Result<tonic::Response<EmptyResponse>, tonic::Status> {
        self.inner
            .0
            .delete_index_templates(request.into_inner())
            .await
            .map(tonic::Response::new)
            .map_err(crate::error::grpc_error_to_grpc_status)
    }
    async fn get_cluster_identity(
        &self,
        request: tonic::Request<GetClusterIdentityRequest>,
    ) -> Result<tonic::Response<GetClusterIdentityResponse>, tonic::Status> {
        self.inner
            .0
            .get_cluster_identity(request.into_inner())
            .await
            .map(tonic::Response::new)
            .map_err(crate::error::grpc_error_to_grpc_status)
    }
}
/// Generated client implementations.
pub mod metastore_service_grpc_client {
    #![allow(
        unused_variables,
        dead_code,
        missing_docs,
        clippy::wildcard_imports,
        clippy::let_unit_value,
    )]
    use tonic::codegen::*;
    use tonic::codegen::http::Uri;
    /// Metastore meant to manage Quickwit's indexes, their splits and delete tasks.
    ///
    /// I. Index and splits management.
    ///
    /// Quickwit needs a way to ensure that we can cleanup unused files,
    /// and this process needs to be resilient to any fail-stop failures.
    /// We rely on atomically transitioning the status of splits.
    ///
    /// The split state goes through the following life cycle:
    ///
    /// 1. `Staged`
    ///
    /// * Start uploading the split files.
    ///
    /// 2. `Published`
    ///
    /// * Uploading the split files is complete and the split is searchable.
    ///
    /// 3. `MarkedForDeletion`
    ///
    /// * Mark the split for deletion.
    ///
    /// If a split has a file in the storage, it MUST be registered in the metastore,
    /// and its state can be as follows:
    ///
    /// * `Staged`: The split is almost ready. Some of its files may have been uploaded in the storage.
    /// * `Published`: The split is ready and published.
    /// * `MarkedForDeletion`: The split is marked for deletion.
    ///
    /// Before creating any file, we need to stage the split. If there is a failure, upon recovery, we
    /// schedule for deletion all the staged splits. A client may not necessarily remove files from
    /// storage right after marking it for deletion. A CLI client may delete files right away, but a
    /// more serious deployment should probably only delete those files after a grace period so that the
    /// running search queries can complete.
    ///
    /// II. Delete tasks management.
    ///
    /// A delete task is defined on a given index and by a search query. It can be
    /// applied to all the splits of the index.
    ///
    /// Quickwit needs a way to track that a delete task has been applied to a split. This is ensured
    /// by two mechanisms:
    ///
    /// * On creation of a delete task, we give to the task a monotically increasing opstamp (uniqueness
    ///  and monotonically increasing must be true at the index level).
    /// * When a delete task is executed on a split, that is when the documents matched by the search
    ///  query are removed from the splits, we update the split's `delete_opstamp` to the value of the
    ///  task's opstamp. This marks the split as "up-to-date" regarding this delete task. If new delete
    ///  tasks are added, we will know that we need to run these delete tasks on the splits as its
    ///  `delete_optstamp` will be inferior to the `opstamp` of the new tasks.
    ///
    /// For splits created after a given delete task, Quickwit's indexing ensures that these splits
    /// are created with a `delete_opstamp` equal the latest opstamp of the tasks of the
    /// corresponding index.
    #[derive(Debug, Clone)]
    pub struct MetastoreServiceGrpcClient<T> {
        inner: tonic::client::Grpc<T>,
    }
    impl MetastoreServiceGrpcClient<tonic::transport::Channel> {
        /// Attempt to create a new client by connecting to a given endpoint.
        pub async fn connect<D>(dst: D) -> Result<Self, tonic::transport::Error>
        where
            D: TryInto<tonic::transport::Endpoint>,
            D::Error: Into<StdError>,
        {
            let conn = tonic::transport::Endpoint::new(dst)?.connect().await?;
            Ok(Self::new(conn))
        }
    }
    impl<T> MetastoreServiceGrpcClient<T>
    where
        T: tonic::client::GrpcService<tonic::body::Body>,
        T::Error: Into<StdError>,
        T::ResponseBody: Body<Data = Bytes> + std::marker::Send + 'static,
        <T::ResponseBody as Body>::Error: Into<StdError> + std::marker::Send,
    {
        pub fn new(inner: T) -> Self {
            let inner = tonic::client::Grpc::new(inner);
            Self { inner }
        }
        pub fn with_origin(inner: T, origin: Uri) -> Self {
            let inner = tonic::client::Grpc::with_origin(inner, origin);
            Self { inner }
        }
        pub fn with_interceptor<F>(
            inner: T,
            interceptor: F,
        ) -> MetastoreServiceGrpcClient<InterceptedService<T, F>>
        where
            F: tonic::service::Interceptor,
            T::ResponseBody: Default,
            T: tonic::codegen::Service<
                http::Request<tonic::body::Body>,
                Response = http::Response<
                    <T as tonic::client::GrpcService<tonic::body::Body>>::ResponseBody,
                >,
            >,
            <T as tonic::codegen::Service<
                http::Request<tonic::body::Body>,
            >>::Error: Into<StdError> + std::marker::Send + std::marker::Sync,
        {
            MetastoreServiceGrpcClient::new(InterceptedService::new(inner, interceptor))
        }
        /// Compress requests with the given encoding.
        ///
        /// This requires the server to support it otherwise it might respond with an
        /// error.
        #[must_use]
        pub fn send_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.inner = self.inner.send_compressed(encoding);
            self
        }
        /// Enable decompressing responses.
        #[must_use]
        pub fn accept_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.inner = self.inner.accept_compressed(encoding);
            self
        }
        /// Limits the maximum size of a decoded message.
        ///
        /// Default: `4MB`
        #[must_use]
        pub fn max_decoding_message_size(mut self, limit: usize) -> Self {
            self.inner = self.inner.max_decoding_message_size(limit);
            self
        }
        /// Limits the maximum size of an encoded message.
        ///
        /// Default: `usize::MAX`
        #[must_use]
        pub fn max_encoding_message_size(mut self, limit: usize) -> Self {
            self.inner = self.inner.max_encoding_message_size(limit);
            self
        }
        /// Creates an index.
        ///
        /// This API creates a new index in the metastore.
        /// An error will occur if an index that already exists in the storage is specified.
        pub async fn create_index(
            &mut self,
            request: impl tonic::IntoRequest<super::CreateIndexRequest>,
        ) -> std::result::Result<
            tonic::Response<super::CreateIndexResponse>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/quickwit.metastore.MetastoreService/CreateIndex",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new("quickwit.metastore.MetastoreService", "CreateIndex"),
                );
            self.inner.unary(req, path, codec).await
        }
        /// Update an index.
        pub async fn update_index(
            &mut self,
            request: impl tonic::IntoRequest<super::UpdateIndexRequest>,
        ) -> std::result::Result<
            tonic::Response<super::IndexMetadataResponse>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/quickwit.metastore.MetastoreService/UpdateIndex",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new("quickwit.metastore.MetastoreService", "UpdateIndex"),
                );
            self.inner.unary(req, path, codec).await
        }
        /// Returns the `IndexMetadata` of an index identified by its IndexID or its IndexUID.
        pub async fn index_metadata(
            &mut self,
            request: impl tonic::IntoRequest<super::IndexMetadataRequest>,
        ) -> std::result::Result<
            tonic::Response<super::IndexMetadataResponse>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/quickwit.metastore.MetastoreService/IndexMetadata",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new(
                        "quickwit.metastore.MetastoreService",
                        "IndexMetadata",
                    ),
                );
            self.inner.unary(req, path, codec).await
        }
        /// Fetches the metadata of a list of indexes identified by their Index IDs or UIDs.
        pub async fn indexes_metadata(
            &mut self,
            request: impl tonic::IntoRequest<super::IndexesMetadataRequest>,
        ) -> std::result::Result<
            tonic::Response<super::IndexesMetadataResponse>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/quickwit.metastore.MetastoreService/IndexesMetadata",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new(
                        "quickwit.metastore.MetastoreService",
                        "IndexesMetadata",
                    ),
                );
            self.inner.unary(req, path, codec).await
        }
        /// Gets an indexes metadatas.
        pub async fn list_indexes_metadata(
            &mut self,
            request: impl tonic::IntoRequest<super::ListIndexesMetadataRequest>,
        ) -> std::result::Result<
            tonic::Response<super::ListIndexesMetadataResponse>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/quickwit.metastore.MetastoreService/ListIndexesMetadata",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new(
                        "quickwit.metastore.MetastoreService",
                        "ListIndexesMetadata",
                    ),
                );
            self.inner.unary(req, path, codec).await
        }
        /// Deletes an index
        pub async fn delete_index(
            &mut self,
            request: impl tonic::IntoRequest<super::DeleteIndexRequest>,
        ) -> std::result::Result<tonic::Response<super::EmptyResponse>, tonic::Status> {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/quickwit.metastore.MetastoreService/DeleteIndex",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new("quickwit.metastore.MetastoreService", "DeleteIndex"),
                );
            self.inner.unary(req, path, codec).await
        }
        /// Returns a list of size info for each index.
        pub async fn list_index_stats(
            &mut self,
            request: impl tonic::IntoRequest<super::ListIndexStatsRequest>,
        ) -> std::result::Result<
            tonic::Response<super::ListIndexStatsResponse>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/quickwit.metastore.MetastoreService/ListIndexStats",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new(
                        "quickwit.metastore.MetastoreService",
                        "ListIndexStats",
                    ),
                );
            self.inner.unary(req, path, codec).await
        }
        /// Streams splits from index.
        pub async fn list_splits(
            &mut self,
            request: impl tonic::IntoRequest<super::ListSplitsRequest>,
        ) -> std::result::Result<
            tonic::Response<tonic::codec::Streaming<super::ListSplitsResponse>>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/quickwit.metastore.MetastoreService/ListSplits",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new("quickwit.metastore.MetastoreService", "ListSplits"),
                );
            self.inner.server_streaming(req, path, codec).await
        }
        /// Stages several splits.
        pub async fn stage_splits(
            &mut self,
            request: impl tonic::IntoRequest<super::StageSplitsRequest>,
        ) -> std::result::Result<tonic::Response<super::EmptyResponse>, tonic::Status> {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/quickwit.metastore.MetastoreService/StageSplits",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new("quickwit.metastore.MetastoreService", "StageSplits"),
                );
            self.inner.unary(req, path, codec).await
        }
        /// Publishes split.
        pub async fn publish_splits(
            &mut self,
            request: impl tonic::IntoRequest<super::PublishSplitsRequest>,
        ) -> std::result::Result<tonic::Response<super::EmptyResponse>, tonic::Status> {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/quickwit.metastore.MetastoreService/PublishSplits",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new(
                        "quickwit.metastore.MetastoreService",
                        "PublishSplits",
                    ),
                );
            self.inner.unary(req, path, codec).await
        }
        /// Marks splits for deletion.
        pub async fn mark_splits_for_deletion(
            &mut self,
            request: impl tonic::IntoRequest<super::MarkSplitsForDeletionRequest>,
        ) -> std::result::Result<tonic::Response<super::EmptyResponse>, tonic::Status> {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/quickwit.metastore.MetastoreService/MarkSplitsForDeletion",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new(
                        "quickwit.metastore.MetastoreService",
                        "MarkSplitsForDeletion",
                    ),
                );
            self.inner.unary(req, path, codec).await
        }
        /// Deletes splits.
        pub async fn delete_splits(
            &mut self,
            request: impl tonic::IntoRequest<super::DeleteSplitsRequest>,
        ) -> std::result::Result<tonic::Response<super::EmptyResponse>, tonic::Status> {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/quickwit.metastore.MetastoreService/DeleteSplits",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new(
                        "quickwit.metastore.MetastoreService",
                        "DeleteSplits",
                    ),
                );
            self.inner.unary(req, path, codec).await
        }
        /// Adds a source.
        pub async fn add_source(
            &mut self,
            request: impl tonic::IntoRequest<super::AddSourceRequest>,
        ) -> std::result::Result<tonic::Response<super::EmptyResponse>, tonic::Status> {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/quickwit.metastore.MetastoreService/AddSource",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new("quickwit.metastore.MetastoreService", "AddSource"),
                );
            self.inner.unary(req, path, codec).await
        }
        /// Updates a source.
        pub async fn update_source(
            &mut self,
            request: impl tonic::IntoRequest<super::UpdateSourceRequest>,
        ) -> std::result::Result<tonic::Response<super::EmptyResponse>, tonic::Status> {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/quickwit.metastore.MetastoreService/UpdateSource",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new(
                        "quickwit.metastore.MetastoreService",
                        "UpdateSource",
                    ),
                );
            self.inner.unary(req, path, codec).await
        }
        /// Toggles (turns on or off) source.
        pub async fn toggle_source(
            &mut self,
            request: impl tonic::IntoRequest<super::ToggleSourceRequest>,
        ) -> std::result::Result<tonic::Response<super::EmptyResponse>, tonic::Status> {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/quickwit.metastore.MetastoreService/ToggleSource",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new(
                        "quickwit.metastore.MetastoreService",
                        "ToggleSource",
                    ),
                );
            self.inner.unary(req, path, codec).await
        }
        /// Removes source.
        pub async fn delete_source(
            &mut self,
            request: impl tonic::IntoRequest<super::DeleteSourceRequest>,
        ) -> std::result::Result<tonic::Response<super::EmptyResponse>, tonic::Status> {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/quickwit.metastore.MetastoreService/DeleteSource",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new(
                        "quickwit.metastore.MetastoreService",
                        "DeleteSource",
                    ),
                );
            self.inner.unary(req, path, codec).await
        }
        /// Resets source checkpoint.
        pub async fn reset_source_checkpoint(
            &mut self,
            request: impl tonic::IntoRequest<super::ResetSourceCheckpointRequest>,
        ) -> std::result::Result<tonic::Response<super::EmptyResponse>, tonic::Status> {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/quickwit.metastore.MetastoreService/ResetSourceCheckpoint",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new(
                        "quickwit.metastore.MetastoreService",
                        "ResetSourceCheckpoint",
                    ),
                );
            self.inner.unary(req, path, codec).await
        }
        /// Gets last opstamp for a given `index_id`.
        pub async fn last_delete_opstamp(
            &mut self,
            request: impl tonic::IntoRequest<super::LastDeleteOpstampRequest>,
        ) -> std::result::Result<
            tonic::Response<super::LastDeleteOpstampResponse>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/quickwit.metastore.MetastoreService/LastDeleteOpstamp",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new(
                        "quickwit.metastore.MetastoreService",
                        "LastDeleteOpstamp",
                    ),
                );
            self.inner.unary(req, path, codec).await
        }
        /// Creates a delete task.
        pub async fn create_delete_task(
            &mut self,
            request: impl tonic::IntoRequest<super::DeleteQuery>,
        ) -> std::result::Result<tonic::Response<super::DeleteTask>, tonic::Status> {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/quickwit.metastore.MetastoreService/CreateDeleteTask",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new(
                        "quickwit.metastore.MetastoreService",
                        "CreateDeleteTask",
                    ),
                );
            self.inner.unary(req, path, codec).await
        }
        /// Updates splits `delete_opstamp`.
        pub async fn update_splits_delete_opstamp(
            &mut self,
            request: impl tonic::IntoRequest<super::UpdateSplitsDeleteOpstampRequest>,
        ) -> std::result::Result<
            tonic::Response<super::UpdateSplitsDeleteOpstampResponse>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/quickwit.metastore.MetastoreService/UpdateSplitsDeleteOpstamp",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new(
                        "quickwit.metastore.MetastoreService",
                        "UpdateSplitsDeleteOpstamp",
                    ),
                );
            self.inner.unary(req, path, codec).await
        }
        /// Lists delete tasks with `delete_task.opstamp` > `opstamp_start` for a given `index_id`.
        pub async fn list_delete_tasks(
            &mut self,
            request: impl tonic::IntoRequest<super::ListDeleteTasksRequest>,
        ) -> std::result::Result<
            tonic::Response<super::ListDeleteTasksResponse>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/quickwit.metastore.MetastoreService/ListDeleteTasks",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new(
                        "quickwit.metastore.MetastoreService",
                        "ListDeleteTasks",
                    ),
                );
            self.inner.unary(req, path, codec).await
        }
        /// Lists splits with `split.delete_opstamp` \< `delete_opstamp` for a given `index_id`.
        pub async fn list_stale_splits(
            &mut self,
            request: impl tonic::IntoRequest<super::ListStaleSplitsRequest>,
        ) -> std::result::Result<
            tonic::Response<super::ListSplitsResponse>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/quickwit.metastore.MetastoreService/ListStaleSplits",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new(
                        "quickwit.metastore.MetastoreService",
                        "ListStaleSplits",
                    ),
                );
            self.inner.unary(req, path, codec).await
        }
        /// Shard API
        ///
        /// Note that for the file-backed metastore implementation, the requests are not processed atomically.
        /// Indeed, each request comprises one or more subrequests that target different indexes and sources processed
        /// independently. Responses list the requests that succeeded or failed in the fields `successes` and
        /// `failures`.
        pub async fn open_shards(
            &mut self,
            request: impl tonic::IntoRequest<super::OpenShardsRequest>,
        ) -> std::result::Result<
            tonic::Response<super::OpenShardsResponse>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/quickwit.metastore.MetastoreService/OpenShards",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new("quickwit.metastore.MetastoreService", "OpenShards"),
                );
            self.inner.unary(req, path, codec).await
        }
        /// Acquires a set of shards for indexing. This RPC locks the shards for publishing thanks to a publish token and only
        /// the last indexer that has acquired the shards is allowed to publish. The response returns for each subrequest the
        /// list of acquired shards along with the positions to index from.
        ///
        /// If a requested shard is missing, this method does not return an error. It should simply return the list of
        /// shards that were actually acquired.
        ///
        /// For this reason, AcquireShards.acquire_shards may return less subresponse than there was in the request.
        /// Also they may be returned in any order.
        pub async fn acquire_shards(
            &mut self,
            request: impl tonic::IntoRequest<super::AcquireShardsRequest>,
        ) -> std::result::Result<
            tonic::Response<super::AcquireShardsResponse>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/quickwit.metastore.MetastoreService/AcquireShards",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new(
                        "quickwit.metastore.MetastoreService",
                        "AcquireShards",
                    ),
                );
            self.inner.unary(req, path, codec).await
        }
        /// Deletes a set of shards. This RPC deletes the shards from the metastore.
        /// If the shard did not exist to begin with, the operation is successful and does not return any error.
        pub async fn delete_shards(
            &mut self,
            request: impl tonic::IntoRequest<super::DeleteShardsRequest>,
        ) -> std::result::Result<
            tonic::Response<super::DeleteShardsResponse>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/quickwit.metastore.MetastoreService/DeleteShards",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new(
                        "quickwit.metastore.MetastoreService",
                        "DeleteShards",
                    ),
                );
            self.inner.unary(req, path, codec).await
        }
        /// Deletes outdated shards. This RPC deletes the shards from the metastore.
        pub async fn prune_shards(
            &mut self,
            request: impl tonic::IntoRequest<super::PruneShardsRequest>,
        ) -> std::result::Result<tonic::Response<super::EmptyResponse>, tonic::Status> {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/quickwit.metastore.MetastoreService/PruneShards",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new("quickwit.metastore.MetastoreService", "PruneShards"),
                );
            self.inner.unary(req, path, codec).await
        }
        pub async fn list_shards(
            &mut self,
            request: impl tonic::IntoRequest<super::ListShardsRequest>,
        ) -> std::result::Result<
            tonic::Response<super::ListShardsResponse>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/quickwit.metastore.MetastoreService/ListShards",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new("quickwit.metastore.MetastoreService", "ListShards"),
                );
            self.inner.unary(req, path, codec).await
        }
        /// Creates an index template.
        pub async fn create_index_template(
            &mut self,
            request: impl tonic::IntoRequest<super::CreateIndexTemplateRequest>,
        ) -> std::result::Result<tonic::Response<super::EmptyResponse>, tonic::Status> {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/quickwit.metastore.MetastoreService/CreateIndexTemplate",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new(
                        "quickwit.metastore.MetastoreService",
                        "CreateIndexTemplate",
                    ),
                );
            self.inner.unary(req, path, codec).await
        }
        /// Fetches an index template.
        pub async fn get_index_template(
            &mut self,
            request: impl tonic::IntoRequest<super::GetIndexTemplateRequest>,
        ) -> std::result::Result<
            tonic::Response<super::GetIndexTemplateResponse>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/quickwit.metastore.MetastoreService/GetIndexTemplate",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new(
                        "quickwit.metastore.MetastoreService",
                        "GetIndexTemplate",
                    ),
                );
            self.inner.unary(req, path, codec).await
        }
        /// Finds matching index templates.
        pub async fn find_index_template_matches(
            &mut self,
            request: impl tonic::IntoRequest<super::FindIndexTemplateMatchesRequest>,
        ) -> std::result::Result<
            tonic::Response<super::FindIndexTemplateMatchesResponse>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/quickwit.metastore.MetastoreService/FindIndexTemplateMatches",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new(
                        "quickwit.metastore.MetastoreService",
                        "FindIndexTemplateMatches",
                    ),
                );
            self.inner.unary(req, path, codec).await
        }
        /// Returns all the index templates.
        pub async fn list_index_templates(
            &mut self,
            request: impl tonic::IntoRequest<super::ListIndexTemplatesRequest>,
        ) -> std::result::Result<
            tonic::Response<super::ListIndexTemplatesResponse>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/quickwit.metastore.MetastoreService/ListIndexTemplates",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new(
                        "quickwit.metastore.MetastoreService",
                        "ListIndexTemplates",
                    ),
                );
            self.inner.unary(req, path, codec).await
        }
        /// Deletes index templates.
        pub async fn delete_index_templates(
            &mut self,
            request: impl tonic::IntoRequest<super::DeleteIndexTemplatesRequest>,
        ) -> std::result::Result<tonic::Response<super::EmptyResponse>, tonic::Status> {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/quickwit.metastore.MetastoreService/DeleteIndexTemplates",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new(
                        "quickwit.metastore.MetastoreService",
                        "DeleteIndexTemplates",
                    ),
                );
            self.inner.unary(req, path, codec).await
        }
        /// Get cluster identity
        pub async fn get_cluster_identity(
            &mut self,
            request: impl tonic::IntoRequest<super::GetClusterIdentityRequest>,
        ) -> std::result::Result<
            tonic::Response<super::GetClusterIdentityResponse>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/quickwit.metastore.MetastoreService/GetClusterIdentity",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new(
                        "quickwit.metastore.MetastoreService",
                        "GetClusterIdentity",
                    ),
                );
            self.inner.unary(req, path, codec).await
        }
    }
}
/// Generated server implementations.
pub mod metastore_service_grpc_server {
    #![allow(
        unused_variables,
        dead_code,
        missing_docs,
        clippy::wildcard_imports,
        clippy::let_unit_value,
    )]
    use tonic::codegen::*;
    /// Generated trait containing gRPC methods that should be implemented for use with MetastoreServiceGrpcServer.
    #[async_trait]
    pub trait MetastoreServiceGrpc: std::marker::Send + std::marker::Sync + 'static {
        /// Creates an index.
        ///
        /// This API creates a new index in the metastore.
        /// An error will occur if an index that already exists in the storage is specified.
        async fn create_index(
            &self,
            request: tonic::Request<super::CreateIndexRequest>,
        ) -> std::result::Result<
            tonic::Response<super::CreateIndexResponse>,
            tonic::Status,
        >;
        /// Update an index.
        async fn update_index(
            &self,
            request: tonic::Request<super::UpdateIndexRequest>,
        ) -> std::result::Result<
            tonic::Response<super::IndexMetadataResponse>,
            tonic::Status,
        >;
        /// Returns the `IndexMetadata` of an index identified by its IndexID or its IndexUID.
        async fn index_metadata(
            &self,
            request: tonic::Request<super::IndexMetadataRequest>,
        ) -> std::result::Result<
            tonic::Response<super::IndexMetadataResponse>,
            tonic::Status,
        >;
        /// Fetches the metadata of a list of indexes identified by their Index IDs or UIDs.
        async fn indexes_metadata(
            &self,
            request: tonic::Request<super::IndexesMetadataRequest>,
        ) -> std::result::Result<
            tonic::Response<super::IndexesMetadataResponse>,
            tonic::Status,
        >;
        /// Gets an indexes metadatas.
        async fn list_indexes_metadata(
            &self,
            request: tonic::Request<super::ListIndexesMetadataRequest>,
        ) -> std::result::Result<
            tonic::Response<super::ListIndexesMetadataResponse>,
            tonic::Status,
        >;
        /// Deletes an index
        async fn delete_index(
            &self,
            request: tonic::Request<super::DeleteIndexRequest>,
        ) -> std::result::Result<tonic::Response<super::EmptyResponse>, tonic::Status>;
        /// Returns a list of size info for each index.
        async fn list_index_stats(
            &self,
            request: tonic::Request<super::ListIndexStatsRequest>,
        ) -> std::result::Result<
            tonic::Response<super::ListIndexStatsResponse>,
            tonic::Status,
        >;
        /// Server streaming response type for the ListSplits method.
        type ListSplitsStream: tonic::codegen::tokio_stream::Stream<
                Item = std::result::Result<super::ListSplitsResponse, tonic::Status>,
            >
            + std::marker::Send
            + 'static;
        /// Streams splits from index.
        async fn list_splits(
            &self,
            request: tonic::Request<super::ListSplitsRequest>,
        ) -> std::result::Result<tonic::Response<Self::ListSplitsStream>, tonic::Status>;
        /// Stages several splits.
        async fn stage_splits(
            &self,
            request: tonic::Request<super::StageSplitsRequest>,
        ) -> std::result::Result<tonic::Response<super::EmptyResponse>, tonic::Status>;
        /// Publishes split.
        async fn publish_splits(
            &self,
            request: tonic::Request<super::PublishSplitsRequest>,
        ) -> std::result::Result<tonic::Response<super::EmptyResponse>, tonic::Status>;
        /// Marks splits for deletion.
        async fn mark_splits_for_deletion(
            &self,
            request: tonic::Request<super::MarkSplitsForDeletionRequest>,
        ) -> std::result::Result<tonic::Response<super::EmptyResponse>, tonic::Status>;
        /// Deletes splits.
        async fn delete_splits(
            &self,
            request: tonic::Request<super::DeleteSplitsRequest>,
        ) -> std::result::Result<tonic::Response<super::EmptyResponse>, tonic::Status>;
        /// Adds a source.
        async fn add_source(
            &self,
            request: tonic::Request<super::AddSourceRequest>,
        ) -> std::result::Result<tonic::Response<super::EmptyResponse>, tonic::Status>;
        /// Updates a source.
        async fn update_source(
            &self,
            request: tonic::Request<super::UpdateSourceRequest>,
        ) -> std::result::Result<tonic::Response<super::EmptyResponse>, tonic::Status>;
        /// Toggles (turns on or off) source.
        async fn toggle_source(
            &self,
            request: tonic::Request<super::ToggleSourceRequest>,
        ) -> std::result::Result<tonic::Response<super::EmptyResponse>, tonic::Status>;
        /// Removes source.
        async fn delete_source(
            &self,
            request: tonic::Request<super::DeleteSourceRequest>,
        ) -> std::result::Result<tonic::Response<super::EmptyResponse>, tonic::Status>;
        /// Resets source checkpoint.
        async fn reset_source_checkpoint(
            &self,
            request: tonic::Request<super::ResetSourceCheckpointRequest>,
        ) -> std::result::Result<tonic::Response<super::EmptyResponse>, tonic::Status>;
        /// Gets last opstamp for a given `index_id`.
        async fn last_delete_opstamp(
            &self,
            request: tonic::Request<super::LastDeleteOpstampRequest>,
        ) -> std::result::Result<
            tonic::Response<super::LastDeleteOpstampResponse>,
            tonic::Status,
        >;
        /// Creates a delete task.
        async fn create_delete_task(
            &self,
            request: tonic::Request<super::DeleteQuery>,
        ) -> std::result::Result<tonic::Response<super::DeleteTask>, tonic::Status>;
        /// Updates splits `delete_opstamp`.
        async fn update_splits_delete_opstamp(
            &self,
            request: tonic::Request<super::UpdateSplitsDeleteOpstampRequest>,
        ) -> std::result::Result<
            tonic::Response<super::UpdateSplitsDeleteOpstampResponse>,
            tonic::Status,
        >;
        /// Lists delete tasks with `delete_task.opstamp` > `opstamp_start` for a given `index_id`.
        async fn list_delete_tasks(
            &self,
            request: tonic::Request<super::ListDeleteTasksRequest>,
        ) -> std::result::Result<
            tonic::Response<super::ListDeleteTasksResponse>,
            tonic::Status,
        >;
        /// Lists splits with `split.delete_opstamp` \< `delete_opstamp` for a given `index_id`.
        async fn list_stale_splits(
            &self,
            request: tonic::Request<super::ListStaleSplitsRequest>,
        ) -> std::result::Result<
            tonic::Response<super::ListSplitsResponse>,
            tonic::Status,
        >;
        /// Shard API
        ///
        /// Note that for the file-backed metastore implementation, the requests are not processed atomically.
        /// Indeed, each request comprises one or more subrequests that target different indexes and sources processed
        /// independently. Responses list the requests that succeeded or failed in the fields `successes` and
        /// `failures`.
        async fn open_shards(
            &self,
            request: tonic::Request<super::OpenShardsRequest>,
        ) -> std::result::Result<
            tonic::Response<super::OpenShardsResponse>,
            tonic::Status,
        >;
        /// Acquires a set of shards for indexing. This RPC locks the shards for publishing thanks to a publish token and only
        /// the last indexer that has acquired the shards is allowed to publish. The response returns for each subrequest the
        /// list of acquired shards along with the positions to index from.
        ///
        /// If a requested shard is missing, this method does not return an error. It should simply return the list of
        /// shards that were actually acquired.
        ///
        /// For this reason, AcquireShards.acquire_shards may return less subresponse than there was in the request.
        /// Also they may be returned in any order.
        async fn acquire_shards(
            &self,
            request: tonic::Request<super::AcquireShardsRequest>,
        ) -> std::result::Result<
            tonic::Response<super::AcquireShardsResponse>,
            tonic::Status,
        >;
        /// Deletes a set of shards. This RPC deletes the shards from the metastore.
        /// If the shard did not exist to begin with, the operation is successful and does not return any error.
        async fn delete_shards(
            &self,
            request: tonic::Request<super::DeleteShardsRequest>,
        ) -> std::result::Result<
            tonic::Response<super::DeleteShardsResponse>,
            tonic::Status,
        >;
        /// Deletes outdated shards. This RPC deletes the shards from the metastore.
        async fn prune_shards(
            &self,
            request: tonic::Request<super::PruneShardsRequest>,
        ) -> std::result::Result<tonic::Response<super::EmptyResponse>, tonic::Status>;
        async fn list_shards(
            &self,
            request: tonic::Request<super::ListShardsRequest>,
        ) -> std::result::Result<
            tonic::Response<super::ListShardsResponse>,
            tonic::Status,
        >;
        /// Creates an index template.
        async fn create_index_template(
            &self,
            request: tonic::Request<super::CreateIndexTemplateRequest>,
        ) -> std::result::Result<tonic::Response<super::EmptyResponse>, tonic::Status>;
        /// Fetches an index template.
        async fn get_index_template(
            &self,
            request: tonic::Request<super::GetIndexTemplateRequest>,
        ) -> std::result::Result<
            tonic::Response<super::GetIndexTemplateResponse>,
            tonic::Status,
        >;
        /// Finds matching index templates.
        async fn find_index_template_matches(
            &self,
            request: tonic::Request<super::FindIndexTemplateMatchesRequest>,
        ) -> std::result::Result<
            tonic::Response<super::FindIndexTemplateMatchesResponse>,
            tonic::Status,
        >;
        /// Returns all the index templates.
        async fn list_index_templates(
            &self,
            request: tonic::Request<super::ListIndexTemplatesRequest>,
        ) -> std::result::Result<
            tonic::Response<super::ListIndexTemplatesResponse>,
            tonic::Status,
        >;
        /// Deletes index templates.
        async fn delete_index_templates(
            &self,
            request: tonic::Request<super::DeleteIndexTemplatesRequest>,
        ) -> std::result::Result<tonic::Response<super::EmptyResponse>, tonic::Status>;
        /// Get cluster identity
        async fn get_cluster_identity(
            &self,
            request: tonic::Request<super::GetClusterIdentityRequest>,
        ) -> std::result::Result<
            tonic::Response<super::GetClusterIdentityResponse>,
            tonic::Status,
        >;
    }
    /// Metastore meant to manage Quickwit's indexes, their splits and delete tasks.
    ///
    /// I. Index and splits management.
    ///
    /// Quickwit needs a way to ensure that we can cleanup unused files,
    /// and this process needs to be resilient to any fail-stop failures.
    /// We rely on atomically transitioning the status of splits.
    ///
    /// The split state goes through the following life cycle:
    ///
    /// 1. `Staged`
    ///
    /// * Start uploading the split files.
    ///
    /// 2. `Published`
    ///
    /// * Uploading the split files is complete and the split is searchable.
    ///
    /// 3. `MarkedForDeletion`
    ///
    /// * Mark the split for deletion.
    ///
    /// If a split has a file in the storage, it MUST be registered in the metastore,
    /// and its state can be as follows:
    ///
    /// * `Staged`: The split is almost ready. Some of its files may have been uploaded in the storage.
    /// * `Published`: The split is ready and published.
    /// * `MarkedForDeletion`: The split is marked for deletion.
    ///
    /// Before creating any file, we need to stage the split. If there is a failure, upon recovery, we
    /// schedule for deletion all the staged splits. A client may not necessarily remove files from
    /// storage right after marking it for deletion. A CLI client may delete files right away, but a
    /// more serious deployment should probably only delete those files after a grace period so that the
    /// running search queries can complete.
    ///
    /// II. Delete tasks management.
    ///
    /// A delete task is defined on a given index and by a search query. It can be
    /// applied to all the splits of the index.
    ///
    /// Quickwit needs a way to track that a delete task has been applied to a split. This is ensured
    /// by two mechanisms:
    ///
    /// * On creation of a delete task, we give to the task a monotically increasing opstamp (uniqueness
    ///  and monotonically increasing must be true at the index level).
    /// * When a delete task is executed on a split, that is when the documents matched by the search
    ///  query are removed from the splits, we update the split's `delete_opstamp` to the value of the
    ///  task's opstamp. This marks the split as "up-to-date" regarding this delete task. If new delete
    ///  tasks are added, we will know that we need to run these delete tasks on the splits as its
    ///  `delete_optstamp` will be inferior to the `opstamp` of the new tasks.
    ///
    /// For splits created after a given delete task, Quickwit's indexing ensures that these splits
    /// are created with a `delete_opstamp` equal the latest opstamp of the tasks of the
    /// corresponding index.
    #[derive(Debug)]
    pub struct MetastoreServiceGrpcServer<T> {
        inner: Arc<T>,
        accept_compression_encodings: EnabledCompressionEncodings,
        send_compression_encodings: EnabledCompressionEncodings,
        max_decoding_message_size: Option<usize>,
        max_encoding_message_size: Option<usize>,
    }
    impl<T> MetastoreServiceGrpcServer<T> {
        pub fn new(inner: T) -> Self {
            Self::from_arc(Arc::new(inner))
        }
        pub fn from_arc(inner: Arc<T>) -> Self {
            Self {
                inner,
                accept_compression_encodings: Default::default(),
                send_compression_encodings: Default::default(),
                max_decoding_message_size: None,
                max_encoding_message_size: None,
            }
        }
        pub fn with_interceptor<F>(
            inner: T,
            interceptor: F,
        ) -> InterceptedService<Self, F>
        where
            F: tonic::service::Interceptor,
        {
            InterceptedService::new(Self::new(inner), interceptor)
        }
        /// Enable decompressing requests with the given encoding.
        #[must_use]
        pub fn accept_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.accept_compression_encodings.enable(encoding);
            self
        }
        /// Compress responses with the given encoding, if the client supports it.
        #[must_use]
        pub fn send_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.send_compression_encodings.enable(encoding);
            self
        }
        /// Limits the maximum size of a decoded message.
        ///
        /// Default: `4MB`
        #[must_use]
        pub fn max_decoding_message_size(mut self, limit: usize) -> Self {
            self.max_decoding_message_size = Some(limit);
            self
        }
        /// Limits the maximum size of an encoded message.
        ///
        /// Default: `usize::MAX`
        #[must_use]
        pub fn max_encoding_message_size(mut self, limit: usize) -> Self {
            self.max_encoding_message_size = Some(limit);
            self
        }
    }
    impl<T, B> tonic::codegen::Service<http::Request<B>>
    for MetastoreServiceGrpcServer<T>
    where
        T: MetastoreServiceGrpc,
        B: Body + std::marker::Send + 'static,
        B::Error: Into<StdError> + std::marker::Send + 'static,
    {
        type Response = http::Response<tonic::body::Body>;
        type Error = std::convert::Infallible;
        type Future = BoxFuture<Self::Response, Self::Error>;
        fn poll_ready(
            &mut self,
            _cx: &mut Context<'_>,
        ) -> Poll<std::result::Result<(), Self::Error>> {
            Poll::Ready(Ok(()))
        }
        fn call(&mut self, req: http::Request<B>) -> Self::Future {
            match req.uri().path() {
                "/quickwit.metastore.MetastoreService/CreateIndex" => {
                    #[allow(non_camel_case_types)]
                    struct CreateIndexSvc<T: MetastoreServiceGrpc>(pub Arc<T>);
                    impl<
                        T: MetastoreServiceGrpc,
                    > tonic::server::UnaryService<super::CreateIndexRequest>
                    for CreateIndexSvc<T> {
                        type Response = super::CreateIndexResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::CreateIndexRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as MetastoreServiceGrpc>::create_index(&inner, request)
                                    .await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = CreateIndexSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/quickwit.metastore.MetastoreService/UpdateIndex" => {
                    #[allow(non_camel_case_types)]
                    struct UpdateIndexSvc<T: MetastoreServiceGrpc>(pub Arc<T>);
                    impl<
                        T: MetastoreServiceGrpc,
                    > tonic::server::UnaryService<super::UpdateIndexRequest>
                    for UpdateIndexSvc<T> {
                        type Response = super::IndexMetadataResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::UpdateIndexRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as MetastoreServiceGrpc>::update_index(&inner, request)
                                    .await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = UpdateIndexSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/quickwit.metastore.MetastoreService/IndexMetadata" => {
                    #[allow(non_camel_case_types)]
                    struct IndexMetadataSvc<T: MetastoreServiceGrpc>(pub Arc<T>);
                    impl<
                        T: MetastoreServiceGrpc,
                    > tonic::server::UnaryService<super::IndexMetadataRequest>
                    for IndexMetadataSvc<T> {
                        type Response = super::IndexMetadataResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::IndexMetadataRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as MetastoreServiceGrpc>::index_metadata(&inner, request)
                                    .await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = IndexMetadataSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/quickwit.metastore.MetastoreService/IndexesMetadata" => {
                    #[allow(non_camel_case_types)]
                    struct IndexesMetadataSvc<T: MetastoreServiceGrpc>(pub Arc<T>);
                    impl<
                        T: MetastoreServiceGrpc,
                    > tonic::server::UnaryService<super::IndexesMetadataRequest>
                    for IndexesMetadataSvc<T> {
                        type Response = super::IndexesMetadataResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::IndexesMetadataRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as MetastoreServiceGrpc>::indexes_metadata(
                                        &inner,
                                        request,
                                    )
                                    .await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = IndexesMetadataSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/quickwit.metastore.MetastoreService/ListIndexesMetadata" => {
                    #[allow(non_camel_case_types)]
                    struct ListIndexesMetadataSvc<T: MetastoreServiceGrpc>(pub Arc<T>);
                    impl<
                        T: MetastoreServiceGrpc,
                    > tonic::server::UnaryService<super::ListIndexesMetadataRequest>
                    for ListIndexesMetadataSvc<T> {
                        type Response = super::ListIndexesMetadataResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::ListIndexesMetadataRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as MetastoreServiceGrpc>::list_indexes_metadata(
                                        &inner,
                                        request,
                                    )
                                    .await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = ListIndexesMetadataSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/quickwit.metastore.MetastoreService/DeleteIndex" => {
                    #[allow(non_camel_case_types)]
                    struct DeleteIndexSvc<T: MetastoreServiceGrpc>(pub Arc<T>);
                    impl<
                        T: MetastoreServiceGrpc,
                    > tonic::server::UnaryService<super::DeleteIndexRequest>
                    for DeleteIndexSvc<T> {
                        type Response = super::EmptyResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::DeleteIndexRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as MetastoreServiceGrpc>::delete_index(&inner, request)
                                    .await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = DeleteIndexSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/quickwit.metastore.MetastoreService/ListIndexStats" => {
                    #[allow(non_camel_case_types)]
                    struct ListIndexStatsSvc<T: MetastoreServiceGrpc>(pub Arc<T>);
                    impl<
                        T: MetastoreServiceGrpc,
                    > tonic::server::UnaryService<super::ListIndexStatsRequest>
                    for ListIndexStatsSvc<T> {
                        type Response = super::ListIndexStatsResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::ListIndexStatsRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as MetastoreServiceGrpc>::list_index_stats(
                                        &inner,
                                        request,
                                    )
                                    .await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = ListIndexStatsSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/quickwit.metastore.MetastoreService/ListSplits" => {
                    #[allow(non_camel_case_types)]
                    struct ListSplitsSvc<T: MetastoreServiceGrpc>(pub Arc<T>);
                    impl<
                        T: MetastoreServiceGrpc,
                    > tonic::server::ServerStreamingService<super::ListSplitsRequest>
                    for ListSplitsSvc<T> {
                        type Response = super::ListSplitsResponse;
                        type ResponseStream = T::ListSplitsStream;
                        type Future = BoxFuture<
                            tonic::Response<Self::ResponseStream>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::ListSplitsRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as MetastoreServiceGrpc>::list_splits(&inner, request)
                                    .await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = ListSplitsSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.server_streaming(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/quickwit.metastore.MetastoreService/StageSplits" => {
                    #[allow(non_camel_case_types)]
                    struct StageSplitsSvc<T: MetastoreServiceGrpc>(pub Arc<T>);
                    impl<
                        T: MetastoreServiceGrpc,
                    > tonic::server::UnaryService<super::StageSplitsRequest>
                    for StageSplitsSvc<T> {
                        type Response = super::EmptyResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::StageSplitsRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as MetastoreServiceGrpc>::stage_splits(&inner, request)
                                    .await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = StageSplitsSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/quickwit.metastore.MetastoreService/PublishSplits" => {
                    #[allow(non_camel_case_types)]
                    struct PublishSplitsSvc<T: MetastoreServiceGrpc>(pub Arc<T>);
                    impl<
                        T: MetastoreServiceGrpc,
                    > tonic::server::UnaryService<super::PublishSplitsRequest>
                    for PublishSplitsSvc<T> {
                        type Response = super::EmptyResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::PublishSplitsRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as MetastoreServiceGrpc>::publish_splits(&inner, request)
                                    .await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = PublishSplitsSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/quickwit.metastore.MetastoreService/MarkSplitsForDeletion" => {
                    #[allow(non_camel_case_types)]
                    struct MarkSplitsForDeletionSvc<T: MetastoreServiceGrpc>(pub Arc<T>);
                    impl<
                        T: MetastoreServiceGrpc,
                    > tonic::server::UnaryService<super::MarkSplitsForDeletionRequest>
                    for MarkSplitsForDeletionSvc<T> {
                        type Response = super::EmptyResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::MarkSplitsForDeletionRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as MetastoreServiceGrpc>::mark_splits_for_deletion(
                                        &inner,
                                        request,
                                    )
                                    .await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = MarkSplitsForDeletionSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/quickwit.metastore.MetastoreService/DeleteSplits" => {
                    #[allow(non_camel_case_types)]
                    struct DeleteSplitsSvc<T: MetastoreServiceGrpc>(pub Arc<T>);
                    impl<
                        T: MetastoreServiceGrpc,
                    > tonic::server::UnaryService<super::DeleteSplitsRequest>
                    for DeleteSplitsSvc<T> {
                        type Response = super::EmptyResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::DeleteSplitsRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as MetastoreServiceGrpc>::delete_splits(&inner, request)
                                    .await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = DeleteSplitsSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/quickwit.metastore.MetastoreService/AddSource" => {
                    #[allow(non_camel_case_types)]
                    struct AddSourceSvc<T: MetastoreServiceGrpc>(pub Arc<T>);
                    impl<
                        T: MetastoreServiceGrpc,
                    > tonic::server::UnaryService<super::AddSourceRequest>
                    for AddSourceSvc<T> {
                        type Response = super::EmptyResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::AddSourceRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as MetastoreServiceGrpc>::add_source(&inner, request)
                                    .await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = AddSourceSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/quickwit.metastore.MetastoreService/UpdateSource" => {
                    #[allow(non_camel_case_types)]
                    struct UpdateSourceSvc<T: MetastoreServiceGrpc>(pub Arc<T>);
                    impl<
                        T: MetastoreServiceGrpc,
                    > tonic::server::UnaryService<super::UpdateSourceRequest>
                    for UpdateSourceSvc<T> {
                        type Response = super::EmptyResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::UpdateSourceRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as MetastoreServiceGrpc>::update_source(&inner, request)
                                    .await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = UpdateSourceSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/quickwit.metastore.MetastoreService/ToggleSource" => {
                    #[allow(non_camel_case_types)]
                    struct ToggleSourceSvc<T: MetastoreServiceGrpc>(pub Arc<T>);
                    impl<
                        T: MetastoreServiceGrpc,
                    > tonic::server::UnaryService<super::ToggleSourceRequest>
                    for ToggleSourceSvc<T> {
                        type Response = super::EmptyResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::ToggleSourceRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as MetastoreServiceGrpc>::toggle_source(&inner, request)
                                    .await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = ToggleSourceSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/quickwit.metastore.MetastoreService/DeleteSource" => {
                    #[allow(non_camel_case_types)]
                    struct DeleteSourceSvc<T: MetastoreServiceGrpc>(pub Arc<T>);
                    impl<
                        T: MetastoreServiceGrpc,
                    > tonic::server::UnaryService<super::DeleteSourceRequest>
                    for DeleteSourceSvc<T> {
                        type Response = super::EmptyResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::DeleteSourceRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as MetastoreServiceGrpc>::delete_source(&inner, request)
                                    .await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = DeleteSourceSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/quickwit.metastore.MetastoreService/ResetSourceCheckpoint" => {
                    #[allow(non_camel_case_types)]
                    struct ResetSourceCheckpointSvc<T: MetastoreServiceGrpc>(pub Arc<T>);
                    impl<
                        T: MetastoreServiceGrpc,
                    > tonic::server::UnaryService<super::ResetSourceCheckpointRequest>
                    for ResetSourceCheckpointSvc<T> {
                        type Response = super::EmptyResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::ResetSourceCheckpointRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as MetastoreServiceGrpc>::reset_source_checkpoint(
                                        &inner,
                                        request,
                                    )
                                    .await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = ResetSourceCheckpointSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/quickwit.metastore.MetastoreService/LastDeleteOpstamp" => {
                    #[allow(non_camel_case_types)]
                    struct LastDeleteOpstampSvc<T: MetastoreServiceGrpc>(pub Arc<T>);
                    impl<
                        T: MetastoreServiceGrpc,
                    > tonic::server::UnaryService<super::LastDeleteOpstampRequest>
                    for LastDeleteOpstampSvc<T> {
                        type Response = super::LastDeleteOpstampResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::LastDeleteOpstampRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as MetastoreServiceGrpc>::last_delete_opstamp(
                                        &inner,
                                        request,
                                    )
                                    .await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = LastDeleteOpstampSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/quickwit.metastore.MetastoreService/CreateDeleteTask" => {
                    #[allow(non_camel_case_types)]
                    struct CreateDeleteTaskSvc<T: MetastoreServiceGrpc>(pub Arc<T>);
                    impl<
                        T: MetastoreServiceGrpc,
                    > tonic::server::UnaryService<super::DeleteQuery>
                    for CreateDeleteTaskSvc<T> {
                        type Response = super::DeleteTask;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::DeleteQuery>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as MetastoreServiceGrpc>::create_delete_task(
                                        &inner,
                                        request,
                                    )
                                    .await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = CreateDeleteTaskSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/quickwit.metastore.MetastoreService/UpdateSplitsDeleteOpstamp" => {
                    #[allow(non_camel_case_types)]
                    struct UpdateSplitsDeleteOpstampSvc<T: MetastoreServiceGrpc>(
                        pub Arc<T>,
                    );
                    impl<
                        T: MetastoreServiceGrpc,
                    > tonic::server::UnaryService<
                        super::UpdateSplitsDeleteOpstampRequest,
                    > for UpdateSplitsDeleteOpstampSvc<T> {
                        type Response = super::UpdateSplitsDeleteOpstampResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<
                                super::UpdateSplitsDeleteOpstampRequest,
                            >,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as MetastoreServiceGrpc>::update_splits_delete_opstamp(
                                        &inner,
                                        request,
                                    )
                                    .await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = UpdateSplitsDeleteOpstampSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/quickwit.metastore.MetastoreService/ListDeleteTasks" => {
                    #[allow(non_camel_case_types)]
                    struct ListDeleteTasksSvc<T: MetastoreServiceGrpc>(pub Arc<T>);
                    impl<
                        T: MetastoreServiceGrpc,
                    > tonic::server::UnaryService<super::ListDeleteTasksRequest>
                    for ListDeleteTasksSvc<T> {
                        type Response = super::ListDeleteTasksResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::ListDeleteTasksRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as MetastoreServiceGrpc>::list_delete_tasks(
                                        &inner,
                                        request,
                                    )
                                    .await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = ListDeleteTasksSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/quickwit.metastore.MetastoreService/ListStaleSplits" => {
                    #[allow(non_camel_case_types)]
                    struct ListStaleSplitsSvc<T: MetastoreServiceGrpc>(pub Arc<T>);
                    impl<
                        T: MetastoreServiceGrpc,
                    > tonic::server::UnaryService<super::ListStaleSplitsRequest>
                    for ListStaleSplitsSvc<T> {
                        type Response = super::ListSplitsResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::ListStaleSplitsRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as MetastoreServiceGrpc>::list_stale_splits(
                                        &inner,
                                        request,
                                    )
                                    .await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = ListStaleSplitsSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/quickwit.metastore.MetastoreService/OpenShards" => {
                    #[allow(non_camel_case_types)]
                    struct OpenShardsSvc<T: MetastoreServiceGrpc>(pub Arc<T>);
                    impl<
                        T: MetastoreServiceGrpc,
                    > tonic::server::UnaryService<super::OpenShardsRequest>
                    for OpenShardsSvc<T> {
                        type Response = super::OpenShardsResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::OpenShardsRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as MetastoreServiceGrpc>::open_shards(&inner, request)
                                    .await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = OpenShardsSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/quickwit.metastore.MetastoreService/AcquireShards" => {
                    #[allow(non_camel_case_types)]
                    struct AcquireShardsSvc<T: MetastoreServiceGrpc>(pub Arc<T>);
                    impl<
                        T: MetastoreServiceGrpc,
                    > tonic::server::UnaryService<super::AcquireShardsRequest>
                    for AcquireShardsSvc<T> {
                        type Response = super::AcquireShardsResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::AcquireShardsRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as MetastoreServiceGrpc>::acquire_shards(&inner, request)
                                    .await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = AcquireShardsSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/quickwit.metastore.MetastoreService/DeleteShards" => {
                    #[allow(non_camel_case_types)]
                    struct DeleteShardsSvc<T: MetastoreServiceGrpc>(pub Arc<T>);
                    impl<
                        T: MetastoreServiceGrpc,
                    > tonic::server::UnaryService<super::DeleteShardsRequest>
                    for DeleteShardsSvc<T> {
                        type Response = super::DeleteShardsResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::DeleteShardsRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as MetastoreServiceGrpc>::delete_shards(&inner, request)
                                    .await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = DeleteShardsSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/quickwit.metastore.MetastoreService/PruneShards" => {
                    #[allow(non_camel_case_types)]
                    struct PruneShardsSvc<T: MetastoreServiceGrpc>(pub Arc<T>);
                    impl<
                        T: MetastoreServiceGrpc,
                    > tonic::server::UnaryService<super::PruneShardsRequest>
                    for PruneShardsSvc<T> {
                        type Response = super::EmptyResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::PruneShardsRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as MetastoreServiceGrpc>::prune_shards(&inner, request)
                                    .await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = PruneShardsSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/quickwit.metastore.MetastoreService/ListShards" => {
                    #[allow(non_camel_case_types)]
                    struct ListShardsSvc<T: MetastoreServiceGrpc>(pub Arc<T>);
                    impl<
                        T: MetastoreServiceGrpc,
                    > tonic::server::UnaryService<super::ListShardsRequest>
                    for ListShardsSvc<T> {
                        type Response = super::ListShardsResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::ListShardsRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as MetastoreServiceGrpc>::list_shards(&inner, request)
                                    .await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = ListShardsSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/quickwit.metastore.MetastoreService/CreateIndexTemplate" => {
                    #[allow(non_camel_case_types)]
                    struct CreateIndexTemplateSvc<T: MetastoreServiceGrpc>(pub Arc<T>);
                    impl<
                        T: MetastoreServiceGrpc,
                    > tonic::server::UnaryService<super::CreateIndexTemplateRequest>
                    for CreateIndexTemplateSvc<T> {
                        type Response = super::EmptyResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::CreateIndexTemplateRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as MetastoreServiceGrpc>::create_index_template(
                                        &inner,
                                        request,
                                    )
                                    .await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = CreateIndexTemplateSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/quickwit.metastore.MetastoreService/GetIndexTemplate" => {
                    #[allow(non_camel_case_types)]
                    struct GetIndexTemplateSvc<T: MetastoreServiceGrpc>(pub Arc<T>);
                    impl<
                        T: MetastoreServiceGrpc,
                    > tonic::server::UnaryService<super::GetIndexTemplateRequest>
                    for GetIndexTemplateSvc<T> {
                        type Response = super::GetIndexTemplateResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::GetIndexTemplateRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as MetastoreServiceGrpc>::get_index_template(
                                        &inner,
                                        request,
                                    )
                                    .await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = GetIndexTemplateSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/quickwit.metastore.MetastoreService/FindIndexTemplateMatches" => {
                    #[allow(non_camel_case_types)]
                    struct FindIndexTemplateMatchesSvc<T: MetastoreServiceGrpc>(
                        pub Arc<T>,
                    );
                    impl<
                        T: MetastoreServiceGrpc,
                    > tonic::server::UnaryService<super::FindIndexTemplateMatchesRequest>
                    for FindIndexTemplateMatchesSvc<T> {
                        type Response = super::FindIndexTemplateMatchesResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<
                                super::FindIndexTemplateMatchesRequest,
                            >,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as MetastoreServiceGrpc>::find_index_template_matches(
                                        &inner,
                                        request,
                                    )
                                    .await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = FindIndexTemplateMatchesSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/quickwit.metastore.MetastoreService/ListIndexTemplates" => {
                    #[allow(non_camel_case_types)]
                    struct ListIndexTemplatesSvc<T: MetastoreServiceGrpc>(pub Arc<T>);
                    impl<
                        T: MetastoreServiceGrpc,
                    > tonic::server::UnaryService<super::ListIndexTemplatesRequest>
                    for ListIndexTemplatesSvc<T> {
                        type Response = super::ListIndexTemplatesResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::ListIndexTemplatesRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as MetastoreServiceGrpc>::list_index_templates(
                                        &inner,
                                        request,
                                    )
                                    .await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = ListIndexTemplatesSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/quickwit.metastore.MetastoreService/DeleteIndexTemplates" => {
                    #[allow(non_camel_case_types)]
                    struct DeleteIndexTemplatesSvc<T: MetastoreServiceGrpc>(pub Arc<T>);
                    impl<
                        T: MetastoreServiceGrpc,
                    > tonic::server::UnaryService<super::DeleteIndexTemplatesRequest>
                    for DeleteIndexTemplatesSvc<T> {
                        type Response = super::EmptyResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::DeleteIndexTemplatesRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as MetastoreServiceGrpc>::delete_index_templates(
                                        &inner,
                                        request,
                                    )
                                    .await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = DeleteIndexTemplatesSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/quickwit.metastore.MetastoreService/GetClusterIdentity" => {
                    #[allow(non_camel_case_types)]
                    struct GetClusterIdentitySvc<T: MetastoreServiceGrpc>(pub Arc<T>);
                    impl<
                        T: MetastoreServiceGrpc,
                    > tonic::server::UnaryService<super::GetClusterIdentityRequest>
                    for GetClusterIdentitySvc<T> {
                        type Response = super::GetClusterIdentityResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::GetClusterIdentityRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as MetastoreServiceGrpc>::get_cluster_identity(
                                        &inner,
                                        request,
                                    )
                                    .await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = GetClusterIdentitySvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                _ => {
                    Box::pin(async move {
                        let mut response = http::Response::new(
                            tonic::body::Body::default(),
                        );
                        let headers = response.headers_mut();
                        headers
                            .insert(
                                tonic::Status::GRPC_STATUS,
                                (tonic::Code::Unimplemented as i32).into(),
                            );
                        headers
                            .insert(
                                http::header::CONTENT_TYPE,
                                tonic::metadata::GRPC_CONTENT_TYPE,
                            );
                        Ok(response)
                    })
                }
            }
        }
    }
    impl<T> Clone for MetastoreServiceGrpcServer<T> {
        fn clone(&self) -> Self {
            let inner = self.inner.clone();
            Self {
                inner,
                accept_compression_encodings: self.accept_compression_encodings,
                send_compression_encodings: self.send_compression_encodings,
                max_decoding_message_size: self.max_decoding_message_size,
                max_encoding_message_size: self.max_encoding_message_size,
            }
        }
    }
    /// Generated gRPC service name
    pub const SERVICE_NAME: &str = "quickwit.metastore.MetastoreService";
    impl<T> tonic::server::NamedService for MetastoreServiceGrpcServer<T> {
        const NAME: &'static str = SERVICE_NAME;
    }
}


================================================
FILE: quickwit/quickwit-proto/src/codegen/quickwit/quickwit.search.rs
================================================
// This file is @generated by prost-build.
/// / Scroll Request
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct ScrollRequest {
    /// / The `scroll_id` is the given in the response of a search request including a scroll.
    #[prost(string, tag = "1")]
    pub scroll_id: ::prost::alloc::string::String,
    #[prost(uint32, optional, tag = "2")]
    pub scroll_ttl_secs: ::core::option::Option<u32>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct PutKvRequest {
    #[prost(bytes = "vec", tag = "1")]
    pub key: ::prost::alloc::vec::Vec<u8>,
    #[prost(bytes = "vec", tag = "2")]
    pub payload: ::prost::alloc::vec::Vec<u8>,
    #[prost(uint32, tag = "3")]
    pub ttl_secs: u32,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, Copy, PartialEq, Eq, Hash, ::prost::Message)]
pub struct PutKvResponse {}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct GetKvRequest {
    #[prost(bytes = "vec", tag = "1")]
    pub key: ::prost::alloc::vec::Vec<u8>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct GetKvResponse {
    #[prost(bytes = "vec", optional, tag = "1")]
    pub payload: ::core::option::Option<::prost::alloc::vec::Vec<u8>>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct ReportSplit {
    /// Split id (ULID format `01HAV29D4XY3D462FS3D8K5Q2H`)
    #[prost(string, tag = "2")]
    pub split_id: ::prost::alloc::string::String,
    /// The storage uri. This URI does NOT include the split id.
    #[prost(string, tag = "1")]
    pub storage_uri: ::prost::alloc::string::String,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct ReportSplitsRequest {
    #[prost(message, repeated, tag = "1")]
    pub report_splits: ::prost::alloc::vec::Vec<ReportSplit>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, Copy, PartialEq, Eq, Hash, ::prost::Message)]
pub struct ReportSplitsResponse {}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct ListFieldsRequest {
    /// Index ID patterns
    #[prost(string, repeated, tag = "1")]
    pub index_id_patterns: ::prost::alloc::vec::Vec<::prost::alloc::string::String>,
    /// Optional limit query to a list of fields
    /// Wildcard expressions are supported.
    #[prost(string, repeated, tag = "2")]
    pub fields: ::prost::alloc::vec::Vec<::prost::alloc::string::String>,
    /// Time filter, expressed in seconds since epoch.
    /// That filter is to be interpreted as the semi-open interval:
    /// \[start_timestamp, end_timestamp).
    #[prost(int64, optional, tag = "3")]
    pub start_timestamp: ::core::option::Option<i64>,
    #[prost(int64, optional, tag = "4")]
    pub end_timestamp: ::core::option::Option<i64>,
    /// JSON-serialized QueryAst for index_filter support.
    /// When provided, only fields from documents matching this query are returned.
    #[prost(string, optional, tag = "5")]
    pub query_ast: ::core::option::Option<::prost::alloc::string::String>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct LeafListFieldsRequest {
    /// The index id
    #[prost(string, tag = "1")]
    pub index_id: ::prost::alloc::string::String,
    /// The index uri
    #[prost(string, tag = "2")]
    pub index_uri: ::prost::alloc::string::String,
    /// Index split ids to apply the query on.
    /// This ids are resolved from the index_uri defined in the search_request.
    #[prost(message, repeated, tag = "3")]
    pub split_offsets: ::prost::alloc::vec::Vec<SplitIdAndFooterOffsets>,
    /// Optional limit query to a list of fields
    /// Wildcard expressions are supported.
    #[prost(string, repeated, tag = "4")]
    pub fields: ::prost::alloc::vec::Vec<::prost::alloc::string::String>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct ListFieldsResponse {
    #[prost(message, repeated, tag = "1")]
    pub fields: ::prost::alloc::vec::Vec<ListFieldsEntryResponse>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct ListFieldsEntryResponse {
    #[prost(string, tag = "1")]
    pub field_name: ::prost::alloc::string::String,
    #[prost(enumeration = "ListFieldType", tag = "2")]
    pub field_type: i32,
    /// The index ids the field exists
    #[prost(string, repeated, tag = "3")]
    pub index_ids: ::prost::alloc::vec::Vec<::prost::alloc::string::String>,
    /// True means the field is searchable (indexed) in at least some indices.
    /// False means the field is not searchable in any indices.
    #[prost(bool, tag = "4")]
    pub searchable: bool,
    /// True means the field is aggregatable (fast) in at least some indices.
    /// False means the field is not aggregatable in any indices.
    #[prost(bool, tag = "5")]
    pub aggregatable: bool,
    /// The index ids the field exists, but is not searchable.
    #[prost(string, repeated, tag = "6")]
    pub non_searchable_index_ids: ::prost::alloc::vec::Vec<
        ::prost::alloc::string::String,
    >,
    /// The index ids the field exists, but is not aggregatable
    #[prost(string, repeated, tag = "7")]
    pub non_aggregatable_index_ids: ::prost::alloc::vec::Vec<
        ::prost::alloc::string::String,
    >,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct ListFields {
    #[prost(message, repeated, tag = "1")]
    pub fields: ::prost::alloc::vec::Vec<ListFieldsEntryResponse>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Hash, Eq)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct SearchRequest {
    /// Index ID patterns
    #[prost(string, repeated, tag = "1")]
    pub index_id_patterns: ::prost::alloc::vec::Vec<::prost::alloc::string::String>,
    /// Json object representing Quickwit's QueryAst.
    #[prost(string, tag = "13")]
    pub query_ast: ::prost::alloc::string::String,
    /// Time filter, expressed in seconds since epoch.
    /// That filter is to be interpreted as the semi-open interval:
    /// \[start_timestamp, end_timestamp).
    /// If the query AST contains a range query over the timestamp field,
    /// then the the bounds of the range query are used directly and
    /// these two fields are ignored.
    #[prost(int64, optional, tag = "4")]
    pub start_timestamp: ::core::option::Option<i64>,
    #[prost(int64, optional, tag = "5")]
    pub end_timestamp: ::core::option::Option<i64>,
    /// Maximum number of hits to return.
    #[prost(uint64, tag = "6")]
    pub max_hits: u64,
    /// First hit to return. Together with max_hits, this parameter
    /// can be used for pagination.
    ///
    /// E.g.
    /// The results with rank \[start_offset..start_offset + max_hits) are returned.
    #[prost(uint64, tag = "7")]
    pub start_offset: u64,
    /// json serialized aggregation_request
    #[prost(string, optional, tag = "11")]
    pub aggregation_request: ::core::option::Option<::prost::alloc::string::String>,
    /// Fields to extract snippet on
    #[prost(string, repeated, tag = "12")]
    pub snippet_fields: ::prost::alloc::vec::Vec<::prost::alloc::string::String>,
    /// Optional sort by one or more fields (limited to 2 at the moment).
    #[prost(message, repeated, tag = "14")]
    pub sort_fields: ::prost::alloc::vec::Vec<SortField>,
    /// If set, the search response will include a search id
    /// that will make it possible to paginate through the results
    /// in a consistent manner.
    #[prost(uint32, optional, tag = "15")]
    pub scroll_ttl_secs: ::core::option::Option<u32>,
    /// Document with sort tuple smaller or equal to this are discarded to
    /// enable pagination.
    /// If split_id is empty, no comparison with \_shard_doc should be done
    #[prost(message, optional, tag = "16")]
    pub search_after: ::core::option::Option<PartialHit>,
    #[prost(enumeration = "CountHits", tag = "17")]
    pub count_hits: i32,
    /// When an exact index ID is provided (not a pattern), the query fails only if
    /// that index is not found and this parameter is set to `false`.
    #[prost(bool, tag = "18")]
    pub ignore_missing_indexes: bool,
    /// When true, skip finalization of aggregation results and return
    /// the raw IntermediateAggregationResults bytes instead.
    #[prost(bool, tag = "19")]
    pub skip_aggregation_finalization: bool,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct SortField {
    #[prost(string, tag = "1")]
    pub field_name: ::prost::alloc::string::String,
    #[prost(enumeration = "SortOrder", tag = "2")]
    pub sort_order: i32,
    /// Optional sort value format for datetime field only.
    /// If none, the default output format for datetime field is
    /// unix_timestamp_nanos.
    #[prost(enumeration = "SortDatetimeFormat", optional, tag = "3")]
    pub sort_datetime_format: ::core::option::Option<i32>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct SearchResponse {
    /// Number of hits matching the query.
    #[prost(uint64, tag = "1")]
    pub num_hits: u64,
    /// Matched hits
    #[prost(message, repeated, tag = "2")]
    pub hits: ::prost::alloc::vec::Vec<Hit>,
    /// Elapsed time to perform the request. This time is measured
    /// server-side and expressed in microseconds.
    #[prost(uint64, tag = "3")]
    pub elapsed_time_micros: u64,
    /// The searcherrors that occurred formatted as string.
    #[prost(string, repeated, tag = "4")]
    pub errors: ::prost::alloc::vec::Vec<::prost::alloc::string::String>,
    /// Postcard-encoded aggregation response
    #[prost(bytes = "vec", optional, tag = "9")]
    pub aggregation_postcard: ::core::option::Option<::prost::alloc::vec::Vec<u8>>,
    /// Scroll Id (only set if scroll_secs was set in the request)
    #[prost(string, optional, tag = "6")]
    pub scroll_id: ::core::option::Option<::prost::alloc::string::String>,
    /// Returns the list of splits for which search failed.
    /// For the moment, the cause is unknown.
    ///
    /// It is up to the caller to decide whether to interpret
    /// this as an overall failure or to present the partial results
    /// to the end user.
    #[prost(message, repeated, tag = "7")]
    pub failed_splits: ::prost::alloc::vec::Vec<SplitSearchError>,
    /// Total number of successful splits searched.
    #[prost(uint64, tag = "8")]
    pub num_successful_splits: u64,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct SearchPlanResponse {
    #[prost(string, tag = "1")]
    pub result: ::prost::alloc::string::String,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct SplitSearchError {
    /// The searcherror that occurred formatted as string.
    #[prost(string, tag = "1")]
    pub error: ::prost::alloc::string::String,
    /// Split id that failed.
    #[prost(string, tag = "2")]
    pub split_id: ::prost::alloc::string::String,
    /// Flag to indicate if the error can be considered a retryable error
    #[prost(bool, tag = "3")]
    pub retryable_error: bool,
}
/// A LeafSearchRequest can span multiple indices.
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct LeafSearchRequest {
    /// Search request. This is a perfect copy of the original search request
    /// that was sent to root apart from the start_offset, max_hits params and index_id_patterns.
    /// index_id_patterns contains the actual index ids queried on that leaf.
    #[prost(message, optional, tag = "1")]
    pub search_request: ::core::option::Option<SearchRequest>,
    /// List of leaf requests, one per index.
    #[prost(message, repeated, tag = "7")]
    pub leaf_requests: ::prost::alloc::vec::Vec<LeafRequestRef>,
    /// List of unique doc_mappers serialized as json.
    #[prost(string, repeated, tag = "8")]
    pub doc_mappers: ::prost::alloc::vec::Vec<::prost::alloc::string::String>,
    /// List of index uris
    /// Index URI. The index URI defines the location of the storage that contains the
    /// split files.
    #[prost(string, repeated, tag = "9")]
    pub index_uris: ::prost::alloc::vec::Vec<::prost::alloc::string::String>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, Copy, PartialEq, Eq, Hash, ::prost::Message)]
pub struct ResourceStats {
    #[prost(uint64, tag = "1")]
    pub short_lived_cache_num_bytes: u64,
    #[prost(uint64, tag = "2")]
    pub split_num_docs: u64,
    #[prost(uint64, tag = "3")]
    pub warmup_microsecs: u64,
    #[prost(uint64, tag = "4")]
    pub cpu_thread_pool_wait_microsecs: u64,
    #[prost(uint64, tag = "5")]
    pub cpu_microsecs: u64,
}
/// LeafRequestRef references data in LeafSearchRequest to deduplicate data.
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct LeafRequestRef {
    /// The ordinal of the doc_mapper in `LeafSearchRequest.doc_mappers`
    #[prost(uint32, tag = "1")]
    pub doc_mapper_ord: u32,
    /// The ordinal of the index uri in LeafSearchRequest.index_uris
    #[prost(uint32, tag = "2")]
    pub index_uri_ord: u32,
    /// Index split ids to apply the query on.
    /// This ids are resolved from the index_uri defined in the search_request.
    #[prost(message, repeated, tag = "3")]
    pub split_offsets: ::prost::alloc::vec::Vec<SplitIdAndFooterOffsets>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct SplitIdAndFooterOffsets {
    /// Index split id to apply the query on.
    /// This id is resolved from the index_uri defined in the search_request.
    #[prost(string, tag = "1")]
    pub split_id: ::prost::alloc::string::String,
    /// The offset of the start of footer in the split bundle. The footer contains the file bundle metadata and the hotcache.
    #[prost(uint64, tag = "2")]
    pub split_footer_start: u64,
    /// The offset of the end of the footer in split bundle. The footer contains the file bundle metadata and the hotcache.
    #[prost(uint64, tag = "3")]
    pub split_footer_end: u64,
    /// The lowest timestamp appearing in the split, in seconds since epoch
    #[prost(int64, optional, tag = "4")]
    pub timestamp_start: ::core::option::Option<i64>,
    /// The highest timestamp appearing in the split, in seconds since epoch
    #[prost(int64, optional, tag = "5")]
    pub timestamp_end: ::core::option::Option<i64>,
    /// The number of docs in the split
    #[prost(uint64, tag = "6")]
    pub num_docs: u64,
}
/// Hits returned by a FetchDocRequest.
///
/// The json that is joined is the raw tantivy json doc.
/// It is very different from a quickwit json doc.
///
/// For instance:
///
/// * it may contain a \_source and a \_dynamic field.
/// * since tantivy has no notion of cardinality,
///   all fields are arrays.
/// * since tantivy has no notion of object, the object is
///   flattened by concatenating the path to the root.
///
/// See  `quickwit_search::convert_leaf_hit`
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct LeafHit {
    /// The actual content of the hit/
    #[prost(string, tag = "1")]
    pub leaf_json: ::prost::alloc::string::String,
    /// The partial hit (ie: the sorting field + the document address)
    #[prost(message, optional, tag = "2")]
    pub partial_hit: ::core::option::Option<PartialHit>,
    /// A snippet of the matching content
    #[prost(string, optional, tag = "3")]
    pub leaf_snippet_json: ::core::option::Option<::prost::alloc::string::String>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct Hit {
    /// The actual content of the hit
    #[prost(string, tag = "1")]
    pub json: ::prost::alloc::string::String,
    /// The partial hit (ie: the sorting field + the document address)
    #[prost(message, optional, tag = "2")]
    pub partial_hit: ::core::option::Option<PartialHit>,
    /// A snippet of the matching content
    #[prost(string, optional, tag = "3")]
    pub snippet: ::core::option::Option<::prost::alloc::string::String>,
    /// The index id of the hit
    #[prost(string, tag = "4")]
    pub index_id: ::prost::alloc::string::String,
}
/// A partial hit, is a hit for which we have not fetch the content yet.
/// Instead, it holds a document_uri which is enough information to
/// go and fetch the actual document data, by performing a `get_doc(...)`
/// request.
///
/// Value of the sorting key for the given document.
///
/// Quickwit only computes top-K of this sorting field.
/// If the user requested for a bottom-K of a given fast field, then quickwit simply
/// emits an decreasing mapping of this fast field.
///
/// In case of a tie, quickwit uses the increasing order of
///
/// * the split_id,
/// * the segment_ord,
/// * the doc id.
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Hash, Eq)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct PartialHit {
    #[prost(message, optional, tag = "10")]
    pub sort_value: ::core::option::Option<SortByValue>,
    #[prost(message, optional, tag = "11")]
    pub sort_value2: ::core::option::Option<SortByValue>,
    #[prost(string, tag = "2")]
    pub split_id: ::prost::alloc::string::String,
    /// (segment_ord, doc) form a tantivy DocAddress, which is sufficient to identify a document
    /// within a split
    #[prost(uint32, tag = "3")]
    pub segment_ord: u32,
    /// The DocId identifies a unique document at the scale of a tantivy segment.
    #[prost(uint32, tag = "4")]
    pub doc_id: u32,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Ord, PartialOrd)]
#[derive(Clone, Copy, PartialEq, ::prost::Message)]
pub struct SortByValue {
    #[prost(oneof = "sort_by_value::SortValue", tags = "1, 2, 3, 4")]
    pub sort_value: ::core::option::Option<sort_by_value::SortValue>,
}
/// Nested message and enum types in `SortByValue`.
pub mod sort_by_value {
    #[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
    #[serde(rename_all = "snake_case")]
    #[derive(Clone, Copy, PartialEq, ::prost::Oneof)]
    pub enum SortValue {
        #[prost(uint64, tag = "1")]
        U64(u64),
        #[prost(int64, tag = "2")]
        I64(i64),
        #[prost(double, tag = "3")]
        F64(f64),
        #[prost(bool, tag = "4")]
        Boolean(bool),
    }
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct LeafSearchResponse {
    /// Total number of documents matched by the query.
    #[prost(uint64, tag = "1")]
    pub num_hits: u64,
    /// List of the best top-K candidates for the given leaf query.
    #[prost(message, repeated, tag = "2")]
    pub partial_hits: ::prost::alloc::vec::Vec<PartialHit>,
    /// The list of splits that failed. LeafSearchResponse can be an aggregation of results, so there may be multiple.
    #[prost(message, repeated, tag = "3")]
    pub failed_splits: ::prost::alloc::vec::Vec<SplitSearchError>,
    /// Total number of attempt to search into splits.
    /// We do have:
    /// `num_splits_requested == num_successful_splits + num_failed_splits.len()`
    /// But we do not necessarily have:
    /// `num_splits_requested = num_attempted_splits because of retries.`
    #[prost(uint64, tag = "4")]
    pub num_attempted_splits: u64,
    /// Total number of successful splits searched.
    #[prost(uint64, tag = "7")]
    pub num_successful_splits: u64,
    /// postcard serialized intermediate aggregation_result.
    #[prost(bytes = "vec", optional, tag = "6")]
    pub intermediate_aggregation_result: ::core::option::Option<
        ::prost::alloc::vec::Vec<u8>,
    >,
    #[prost(message, optional, tag = "8")]
    pub resource_stats: ::core::option::Option<ResourceStats>,
}
/// The result of searching a single split in a Lambda invocation.
/// Each result is tagged with its split_id so that ordering is irrelevant.
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct LambdaSingleSplitResult {
    /// The split that was searched.
    #[prost(string, tag = "1")]
    pub split_id: ::prost::alloc::string::String,
    #[prost(oneof = "lambda_single_split_result::Outcome", tags = "2, 3")]
    pub outcome: ::core::option::Option<lambda_single_split_result::Outcome>,
}
/// Nested message and enum types in `LambdaSingleSplitResult`.
pub mod lambda_single_split_result {
    #[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
    #[serde(rename_all = "snake_case")]
    #[derive(Clone, PartialEq, ::prost::Oneof)]
    pub enum Outcome {
        /// On success, the leaf search response for this split.
        #[prost(message, tag = "2")]
        Response(super::LeafSearchResponse),
        /// On failure, the error message.
        #[prost(string, tag = "3")]
        Error(::prost::alloc::string::String),
    }
}
/// Wrapper for per-split results from a Lambda invocation.
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct LambdaSearchResponses {
    #[prost(message, repeated, tag = "2")]
    pub split_results: ::prost::alloc::vec::Vec<LambdaSingleSplitResult>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct SnippetRequest {
    #[prost(string, repeated, tag = "1")]
    pub snippet_fields: ::prost::alloc::vec::Vec<::prost::alloc::string::String>,
    #[prost(string, tag = "2")]
    pub query_ast_resolved: ::prost::alloc::string::String,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct FetchDocsRequest {
    /// Request fetching the content of a given list of partial_hits.
    #[prost(message, repeated, tag = "1")]
    pub partial_hits: ::prost::alloc::vec::Vec<PartialHit>,
    /// Split footer offsets. They are required for fetch docs to
    /// fetch the document content in two reads, when the footer is not
    /// cached.
    #[prost(message, repeated, tag = "3")]
    pub split_offsets: ::prost::alloc::vec::Vec<SplitIdAndFooterOffsets>,
    /// Index URI. The index URI defines the location of the storage that contains the
    /// split files.
    #[prost(string, tag = "4")]
    pub index_uri: ::prost::alloc::string::String,
    #[prost(message, optional, tag = "7")]
    pub snippet_request: ::core::option::Option<SnippetRequest>,
    /// `DocMapper` as json serialized trait.
    #[prost(string, tag = "6")]
    pub doc_mapper: ::prost::alloc::string::String,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct FetchDocsResponse {
    /// List of complete hits.
    #[prost(message, repeated, tag = "1")]
    pub hits: ::prost::alloc::vec::Vec<LeafHit>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct ListTermsRequest {
    /// Index ID patterns
    #[prost(string, repeated, tag = "1")]
    pub index_id_patterns: ::prost::alloc::vec::Vec<::prost::alloc::string::String>,
    /// Field to search on
    #[prost(string, tag = "3")]
    pub field: ::prost::alloc::string::String,
    /// Time filter
    #[prost(int64, optional, tag = "4")]
    pub start_timestamp: ::core::option::Option<i64>,
    #[prost(int64, optional, tag = "5")]
    pub end_timestamp: ::core::option::Option<i64>,
    /// Maximum number of hits to return.
    #[prost(uint64, optional, tag = "6")]
    pub max_hits: ::core::option::Option<u64>,
    /// start_key is included, end_key is excluded
    #[prost(bytes = "vec", optional, tag = "7")]
    pub start_key: ::core::option::Option<::prost::alloc::vec::Vec<u8>>,
    #[prost(bytes = "vec", optional, tag = "8")]
    pub end_key: ::core::option::Option<::prost::alloc::vec::Vec<u8>>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, Eq, Hash, ::prost::Message)]
pub struct ListTermsResponse {
    /// Number of hits matching the query.
    #[prost(uint64, tag = "1")]
    pub num_hits: u64,
    /// Matched hits
    #[prost(bytes = "vec", repeated, tag = "2")]
    pub terms: ::prost::alloc::vec::Vec<::prost::alloc::vec::Vec<u8>>,
    /// Elapsed time to perform the request. This time is measured
    /// server-side and expressed in microseconds.
    #[prost(uint64, tag = "3")]
    pub elapsed_time_micros: u64,
    /// The searcherrors that occurred formatted as string.
    #[prost(string, repeated, tag = "4")]
    pub errors: ::prost::alloc::vec::Vec<::prost::alloc::string::String>,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct LeafListTermsRequest {
    /// Search request. This is a perfect copy of the original list request,
    #[prost(message, optional, tag = "1")]
    pub list_terms_request: ::core::option::Option<ListTermsRequest>,
    /// Index split ids to apply the query on.
    /// This ids are resolved from the index_uri defined in the search_request.
    #[prost(message, repeated, tag = "2")]
    pub split_offsets: ::prost::alloc::vec::Vec<SplitIdAndFooterOffsets>,
    /// Index URI. The index URI defines the location of the storage that contains the
    /// split files.
    #[prost(string, tag = "3")]
    pub index_uri: ::prost::alloc::string::String,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[derive(Clone, PartialEq, ::prost::Message)]
pub struct LeafListTermsResponse {
    /// Total number of documents matched by the query.
    #[prost(uint64, tag = "1")]
    pub num_hits: u64,
    /// List of the first K terms the given leaf query.
    #[prost(bytes = "vec", repeated, tag = "2")]
    pub terms: ::prost::alloc::vec::Vec<::prost::alloc::vec::Vec<u8>>,
    /// The list of splits that failed. LeafSearchResponse can be an aggregation of results, so there may be multiple.
    #[prost(message, repeated, tag = "3")]
    pub failed_splits: ::prost::alloc::vec::Vec<SplitSearchError>,
    /// Total number of single split search attempted.
    #[prost(uint64, tag = "4")]
    pub num_attempted_splits: u64,
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[serde(rename_all = "snake_case")]
#[derive(Clone, Copy, Debug, PartialEq, Eq, Hash, PartialOrd, Ord, ::prost::Enumeration)]
#[repr(i32)]
pub enum ListFieldType {
    Str = 0,
    U64 = 1,
    I64 = 2,
    F64 = 3,
    Bool = 4,
    Date = 5,
    Facet = 6,
    Bytes = 7,
    IpAddr = 8,
    Json = 9,
}
impl ListFieldType {
    /// String value of the enum field names used in the ProtoBuf definition.
    ///
    /// The values are not transformed in any way and thus are considered stable
    /// (if the ProtoBuf definition does not change) and safe for programmatic use.
    pub fn as_str_name(&self) -> &'static str {
        match self {
            Self::Str => "STR",
            Self::U64 => "U64",
            Self::I64 => "I64",
            Self::F64 => "F64",
            Self::Bool => "BOOL",
            Self::Date => "DATE",
            Self::Facet => "FACET",
            Self::Bytes => "BYTES",
            Self::IpAddr => "IP_ADDR",
            Self::Json => "JSON",
        }
    }
    /// Creates an enum from field names used in the ProtoBuf definition.
    pub fn from_str_name(value: &str) -> ::core::option::Option<Self> {
        match value {
            "STR" => Some(Self::Str),
            "U64" => Some(Self::U64),
            "I64" => Some(Self::I64),
            "F64" => Some(Self::F64),
            "BOOL" => Some(Self::Bool),
            "DATE" => Some(Self::Date),
            "FACET" => Some(Self::Facet),
            "BYTES" => Some(Self::Bytes),
            "IP_ADDR" => Some(Self::IpAddr),
            "JSON" => Some(Self::Json),
            _ => None,
        }
    }
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[serde(rename_all = "snake_case")]
#[derive(Clone, Copy, Debug, PartialEq, Eq, Hash, PartialOrd, Ord, ::prost::Enumeration)]
#[repr(i32)]
pub enum CountHits {
    /// Count all hits, querying all splits.
    CountAll = 0,
    /// Give an underestimate of the number of hits, possibly skipping entire
    /// splits if they are otherwise not needed to fulfull a query.
    Underestimate = 1,
}
impl CountHits {
    /// String value of the enum field names used in the ProtoBuf definition.
    ///
    /// The values are not transformed in any way and thus are considered stable
    /// (if the ProtoBuf definition does not change) and safe for programmatic use.
    pub fn as_str_name(&self) -> &'static str {
        match self {
            Self::CountAll => "COUNT_ALL",
            Self::Underestimate => "UNDERESTIMATE",
        }
    }
    /// Creates an enum from field names used in the ProtoBuf definition.
    pub fn from_str_name(value: &str) -> ::core::option::Option<Self> {
        match value {
            "COUNT_ALL" => Some(Self::CountAll),
            "UNDERESTIMATE" => Some(Self::Underestimate),
            _ => None,
        }
    }
}
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[serde(rename_all = "snake_case")]
#[derive(Clone, Copy, Debug, PartialEq, Eq, Hash, PartialOrd, Ord, ::prost::Enumeration)]
#[repr(i32)]
pub enum SortOrder {
    /// Ascending order.
    Asc = 0,
    /// Descending order.
    ///
    /// \< This will be the default value;
    Desc = 1,
}
impl SortOrder {
    /// String value of the enum field names used in the ProtoBuf definition.
    ///
    /// The values are not transformed in any way and thus are considered stable
    /// (if the ProtoBuf definition does not change) and safe for programmatic use.
    pub fn as_str_name(&self) -> &'static str {
        match self {
            Self::Asc => "ASC",
            Self::Desc => "DESC",
        }
    }
    /// Creates an enum from field names used in the ProtoBuf definition.
    pub fn from_str_name(value: &str) -> ::core::option::Option<Self> {
        match value {
            "ASC" => Some(Self::Asc),
            "DESC" => Some(Self::Desc),
            _ => None,
        }
    }
}
/// Sort value format for datetime field.
/// We keep an enum with only one format
/// for future extension.
#[derive(serde::Serialize, serde::Deserialize, utoipa::ToSchema)]
#[serde(rename_all = "snake_case")]
#[derive(Clone, Copy, Debug, PartialEq, Eq, Hash, PartialOrd, Ord, ::prost::Enumeration)]
#[repr(i32)]
pub enum SortDatetimeFormat {
    UnixTimestampMillis = 0,
    UnixTimestampNanos = 1,
}
impl SortDatetimeFormat {
    /// String value of the enum field names used in the ProtoBuf definition.
    ///
    /// The values are not transformed in any way and thus are considered stable
    /// (if the ProtoBuf definition does not change) and safe for programmatic use.
    pub fn as_str_name(&self) -> &'static str {
        match self {
            Self::UnixTimestampMillis => "UNIX_TIMESTAMP_MILLIS",
            Self::UnixTimestampNanos => "UNIX_TIMESTAMP_NANOS",
        }
    }
    /// Creates an enum from field names used in the ProtoBuf definition.
    pub fn from_str_name(value: &str) -> ::core::option::Option<Self> {
        match value {
            "UNIX_TIMESTAMP_MILLIS" => Some(Self::UnixTimestampMillis),
            "UNIX_TIMESTAMP_NANOS" => Some(Self::UnixTimestampNanos),
            _ => None,
        }
    }
}
/// Generated client implementations.
pub mod search_service_client {
    #![allow(
        unused_variables,
        dead_code,
        missing_docs,
        clippy::wildcard_imports,
        clippy::let_unit_value,
    )]
    use tonic::codegen::*;
    use tonic::codegen::http::Uri;
    #[derive(Debug, Clone)]
    pub struct SearchServiceClient<T> {
        inner: tonic::client::Grpc<T>,
    }
    impl SearchServiceClient<tonic::transport::Channel> {
        /// Attempt to create a new client by connecting to a given endpoint.
        pub async fn connect<D>(dst: D) -> Result<Self, tonic::transport::Error>
        where
            D: TryInto<tonic::transport::Endpoint>,
            D::Error: Into<StdError>,
        {
            let conn = tonic::transport::Endpoint::new(dst)?.connect().await?;
            Ok(Self::new(conn))
        }
    }
    impl<T> SearchServiceClient<T>
    where
        T: tonic::client::GrpcService<tonic::body::Body>,
        T::Error: Into<StdError>,
        T::ResponseBody: Body<Data = Bytes> + std::marker::Send + 'static,
        <T::ResponseBody as Body>::Error: Into<StdError> + std::marker::Send,
    {
        pub fn new(inner: T) -> Self {
            let inner = tonic::client::Grpc::new(inner);
            Self { inner }
        }
        pub fn with_origin(inner: T, origin: Uri) -> Self {
            let inner = tonic::client::Grpc::with_origin(inner, origin);
            Self { inner }
        }
        pub fn with_interceptor<F>(
            inner: T,
            interceptor: F,
        ) -> SearchServiceClient<InterceptedService<T, F>>
        where
            F: tonic::service::Interceptor,
            T::ResponseBody: Default,
            T: tonic::codegen::Service<
                http::Request<tonic::body::Body>,
                Response = http::Response<
                    <T as tonic::client::GrpcService<tonic::body::Body>>::ResponseBody,
                >,
            >,
            <T as tonic::codegen::Service<
                http::Request<tonic::body::Body>,
            >>::Error: Into<StdError> + std::marker::Send + std::marker::Sync,
        {
            SearchServiceClient::new(InterceptedService::new(inner, interceptor))
        }
        /// Compress requests with the given encoding.
        ///
        /// This requires the server to support it otherwise it might respond with an
        /// error.
        #[must_use]
        pub fn send_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.inner = self.inner.send_compressed(encoding);
            self
        }
        /// Enable decompressing responses.
        #[must_use]
        pub fn accept_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.inner = self.inner.accept_compressed(encoding);
            self
        }
        /// Limits the maximum size of a decoded message.
        ///
        /// Default: `4MB`
        #[must_use]
        pub fn max_decoding_message_size(mut self, limit: usize) -> Self {
            self.inner = self.inner.max_decoding_message_size(limit);
            self
        }
        /// Limits the maximum size of an encoded message.
        ///
        /// Default: `usize::MAX`
        #[must_use]
        pub fn max_encoding_message_size(mut self, limit: usize) -> Self {
            self.inner = self.inner.max_encoding_message_size(limit);
            self
        }
        /// Root search API.
        /// This RPC identifies the set of splits on which the query should run on,
        /// and dispatch the several calls to `LeafSearch`.
        ///
        /// It is also in charge of merging back the results.
        pub async fn root_search(
            &mut self,
            request: impl tonic::IntoRequest<super::SearchRequest>,
        ) -> std::result::Result<tonic::Response<super::SearchResponse>, tonic::Status> {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/quickwit.search.SearchService/RootSearch",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(GrpcMethod::new("quickwit.search.SearchService", "RootSearch"));
            self.inner.unary(req, path, codec).await
        }
        /// Perform a leaf search on a given set of splits.
        ///
        /// It is like a regular search except that:
        ///
        /// * the node should perform the search locally instead of dispatching
        ///  it to other nodes.
        /// * it should be applied on the given subset of splits
        /// * Hit content is not fetched, and we instead return so called `PartialHit`.
        pub async fn leaf_search(
            &mut self,
            request: impl tonic::IntoRequest<super::LeafSearchRequest>,
        ) -> std::result::Result<
            tonic::Response<super::LeafSearchResponse>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/quickwit.search.SearchService/LeafSearch",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(GrpcMethod::new("quickwit.search.SearchService", "LeafSearch"));
            self.inner.unary(req, path, codec).await
        }
        /// / Fetches the documents contents from the document store.
        /// / This methods takes `PartialHit`s and returns `Hit`s.
        pub async fn fetch_docs(
            &mut self,
            request: impl tonic::IntoRequest<super::FetchDocsRequest>,
        ) -> std::result::Result<
            tonic::Response<super::FetchDocsResponse>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/quickwit.search.SearchService/FetchDocs",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(GrpcMethod::new("quickwit.search.SearchService", "FetchDocs"));
            self.inner.unary(req, path, codec).await
        }
        /// Root list terms API.
        /// This RPC identifies the set of splits on which the query should run on,
        /// and dispatches the several calls to `LeafListTerms`.
        ///
        /// It is also in charge of merging back the results.
        pub async fn root_list_terms(
            &mut self,
            request: impl tonic::IntoRequest<super::ListTermsRequest>,
        ) -> std::result::Result<
            tonic::Response<super::ListTermsResponse>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/quickwit.search.SearchService/RootListTerms",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new("quickwit.search.SearchService", "RootListTerms"),
                );
            self.inner.unary(req, path, codec).await
        }
        /// Performs a leaf list terms on a given set of splits.
        ///
        /// It is like a regular list term except that:
        ///
        /// * the node should perform the listing locally instead of dispatching
        ///  it to other nodes.
        /// * it should be applied on the given subset of splits
        pub async fn leaf_list_terms(
            &mut self,
            request: impl tonic::IntoRequest<super::LeafListTermsRequest>,
        ) -> std::result::Result<
            tonic::Response<super::LeafListTermsResponse>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/quickwit.search.SearchService/LeafListTerms",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new("quickwit.search.SearchService", "LeafListTerms"),
                );
            self.inner.unary(req, path, codec).await
        }
        /// Performs a scroll request.
        pub async fn scroll(
            &mut self,
            request: impl tonic::IntoRequest<super::ScrollRequest>,
        ) -> std::result::Result<tonic::Response<super::SearchResponse>, tonic::Status> {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/quickwit.search.SearchService/Scroll",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(GrpcMethod::new("quickwit.search.SearchService", "Scroll"));
            self.inner.unary(req, path, codec).await
        }
        /// gRPC request used to store a key in the local storage of the targeted node.
        /// This RPC is used in the mini distributed immutable KV store embedded in quickwit.
        pub async fn put_kv(
            &mut self,
            request: impl tonic::IntoRequest<super::PutKvRequest>,
        ) -> std::result::Result<tonic::Response<super::PutKvResponse>, tonic::Status> {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/quickwit.search.SearchService/PutKV",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(GrpcMethod::new("quickwit.search.SearchService", "PutKV"));
            self.inner.unary(req, path, codec).await
        }
        /// Gets a key from the local storage of the targeted node.
        /// This RPC is used in the mini distributed immutable KV store embedded in quickwit.
        pub async fn get_kv(
            &mut self,
            request: impl tonic::IntoRequest<super::GetKvRequest>,
        ) -> std::result::Result<tonic::Response<super::GetKvResponse>, tonic::Status> {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/quickwit.search.SearchService/GetKV",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(GrpcMethod::new("quickwit.search.SearchService", "GetKV"));
            self.inner.unary(req, path, codec).await
        }
        pub async fn report_splits(
            &mut self,
            request: impl tonic::IntoRequest<super::ReportSplitsRequest>,
        ) -> std::result::Result<
            tonic::Response<super::ReportSplitsResponse>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/quickwit.search.SearchService/ReportSplits",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new("quickwit.search.SearchService", "ReportSplits"),
                );
            self.inner.unary(req, path, codec).await
        }
        pub async fn list_fields(
            &mut self,
            request: impl tonic::IntoRequest<super::ListFieldsRequest>,
        ) -> std::result::Result<
            tonic::Response<super::ListFieldsResponse>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/quickwit.search.SearchService/ListFields",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(GrpcMethod::new("quickwit.search.SearchService", "ListFields"));
            self.inner.unary(req, path, codec).await
        }
        pub async fn leaf_list_fields(
            &mut self,
            request: impl tonic::IntoRequest<super::LeafListFieldsRequest>,
        ) -> std::result::Result<
            tonic::Response<super::ListFieldsResponse>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/quickwit.search.SearchService/LeafListFields",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(
                    GrpcMethod::new("quickwit.search.SearchService", "LeafListFields"),
                );
            self.inner.unary(req, path, codec).await
        }
        /// Describe how a search would be processed.
        pub async fn search_plan(
            &mut self,
            request: impl tonic::IntoRequest<super::SearchRequest>,
        ) -> std::result::Result<
            tonic::Response<super::SearchPlanResponse>,
            tonic::Status,
        > {
            self.inner
                .ready()
                .await
                .map_err(|e| {
                    tonic::Status::unknown(
                        format!("Service was not ready: {}", e.into()),
                    )
                })?;
            let codec = tonic_prost::ProstCodec::default();
            let path = http::uri::PathAndQuery::from_static(
                "/quickwit.search.SearchService/SearchPlan",
            );
            let mut req = request.into_request();
            req.extensions_mut()
                .insert(GrpcMethod::new("quickwit.search.SearchService", "SearchPlan"));
            self.inner.unary(req, path, codec).await
        }
    }
}
/// Generated server implementations.
pub mod search_service_server {
    #![allow(
        unused_variables,
        dead_code,
        missing_docs,
        clippy::wildcard_imports,
        clippy::let_unit_value,
    )]
    use tonic::codegen::*;
    /// Generated trait containing gRPC methods that should be implemented for use with SearchServiceServer.
    #[async_trait]
    pub trait SearchService: std::marker::Send + std::marker::Sync + 'static {
        /// Root search API.
        /// This RPC identifies the set of splits on which the query should run on,
        /// and dispatch the several calls to `LeafSearch`.
        ///
        /// It is also in charge of merging back the results.
        async fn root_search(
            &self,
            request: tonic::Request<super::SearchRequest>,
        ) -> std::result::Result<tonic::Response<super::SearchResponse>, tonic::Status>;
        /// Perform a leaf search on a given set of splits.
        ///
        /// It is like a regular search except that:
        ///
        /// * the node should perform the search locally instead of dispatching
        ///  it to other nodes.
        /// * it should be applied on the given subset of splits
        /// * Hit content is not fetched, and we instead return so called `PartialHit`.
        async fn leaf_search(
            &self,
            request: tonic::Request<super::LeafSearchRequest>,
        ) -> std::result::Result<
            tonic::Response<super::LeafSearchResponse>,
            tonic::Status,
        >;
        /// / Fetches the documents contents from the document store.
        /// / This methods takes `PartialHit`s and returns `Hit`s.
        async fn fetch_docs(
            &self,
            request: tonic::Request<super::FetchDocsRequest>,
        ) -> std::result::Result<
            tonic::Response<super::FetchDocsResponse>,
            tonic::Status,
        >;
        /// Root list terms API.
        /// This RPC identifies the set of splits on which the query should run on,
        /// and dispatches the several calls to `LeafListTerms`.
        ///
        /// It is also in charge of merging back the results.
        async fn root_list_terms(
            &self,
            request: tonic::Request<super::ListTermsRequest>,
        ) -> std::result::Result<
            tonic::Response<super::ListTermsResponse>,
            tonic::Status,
        >;
        /// Performs a leaf list terms on a given set of splits.
        ///
        /// It is like a regular list term except that:
        ///
        /// * the node should perform the listing locally instead of dispatching
        ///  it to other nodes.
        /// * it should be applied on the given subset of splits
        async fn leaf_list_terms(
            &self,
            request: tonic::Request<super::LeafListTermsRequest>,
        ) -> std::result::Result<
            tonic::Response<super::LeafListTermsResponse>,
            tonic::Status,
        >;
        /// Performs a scroll request.
        async fn scroll(
            &self,
            request: tonic::Request<super::ScrollRequest>,
        ) -> std::result::Result<tonic::Response<super::SearchResponse>, tonic::Status>;
        /// gRPC request used to store a key in the local storage of the targeted node.
        /// This RPC is used in the mini distributed immutable KV store embedded in quickwit.
        async fn put_kv(
            &self,
            request: tonic::Request<super::PutKvRequest>,
        ) -> std::result::Result<tonic::Response<super::PutKvResponse>, tonic::Status>;
        /// Gets a key from the local storage of the targeted node.
        /// This RPC is used in the mini distributed immutable KV store embedded in quickwit.
        async fn get_kv(
            &self,
            request: tonic::Request<super::GetKvRequest>,
        ) -> std::result::Result<tonic::Response<super::GetKvResponse>, tonic::Status>;
        async fn report_splits(
            &self,
            request: tonic::Request<super::ReportSplitsRequest>,
        ) -> std::result::Result<
            tonic::Response<super::ReportSplitsResponse>,
            tonic::Status,
        >;
        async fn list_fields(
            &self,
            request: tonic::Request<super::ListFieldsRequest>,
        ) -> std::result::Result<
            tonic::Response<super::ListFieldsResponse>,
            tonic::Status,
        >;
        async fn leaf_list_fields(
            &self,
            request: tonic::Request<super::LeafListFieldsRequest>,
        ) -> std::result::Result<
            tonic::Response<super::ListFieldsResponse>,
            tonic::Status,
        >;
        /// Describe how a search would be processed.
        async fn search_plan(
            &self,
            request: tonic::Request<super::SearchRequest>,
        ) -> std::result::Result<
            tonic::Response<super::SearchPlanResponse>,
            tonic::Status,
        >;
    }
    #[derive(Debug)]
    pub struct SearchServiceServer<T> {
        inner: Arc<T>,
        accept_compression_encodings: EnabledCompressionEncodings,
        send_compression_encodings: EnabledCompressionEncodings,
        max_decoding_message_size: Option<usize>,
        max_encoding_message_size: Option<usize>,
    }
    impl<T> SearchServiceServer<T> {
        pub fn new(inner: T) -> Self {
            Self::from_arc(Arc::new(inner))
        }
        pub fn from_arc(inner: Arc<T>) -> Self {
            Self {
                inner,
                accept_compression_encodings: Default::default(),
                send_compression_encodings: Default::default(),
                max_decoding_message_size: None,
                max_encoding_message_size: None,
            }
        }
        pub fn with_interceptor<F>(
            inner: T,
            interceptor: F,
        ) -> InterceptedService<Self, F>
        where
            F: tonic::service::Interceptor,
        {
            InterceptedService::new(Self::new(inner), interceptor)
        }
        /// Enable decompressing requests with the given encoding.
        #[must_use]
        pub fn accept_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.accept_compression_encodings.enable(encoding);
            self
        }
        /// Compress responses with the given encoding, if the client supports it.
        #[must_use]
        pub fn send_compressed(mut self, encoding: CompressionEncoding) -> Self {
            self.send_compression_encodings.enable(encoding);
            self
        }
        /// Limits the maximum size of a decoded message.
        ///
        /// Default: `4MB`
        #[must_use]
        pub fn max_decoding_message_size(mut self, limit: usize) -> Self {
            self.max_decoding_message_size = Some(limit);
            self
        }
        /// Limits the maximum size of an encoded message.
        ///
        /// Default: `usize::MAX`
        #[must_use]
        pub fn max_encoding_message_size(mut self, limit: usize) -> Self {
            self.max_encoding_message_size = Some(limit);
            self
        }
    }
    impl<T, B> tonic::codegen::Service<http::Request<B>> for SearchServiceServer<T>
    where
        T: SearchService,
        B: Body + std::marker::Send + 'static,
        B::Error: Into<StdError> + std::marker::Send + 'static,
    {
        type Response = http::Response<tonic::body::Body>;
        type Error = std::convert::Infallible;
        type Future = BoxFuture<Self::Response, Self::Error>;
        fn poll_ready(
            &mut self,
            _cx: &mut Context<'_>,
        ) -> Poll<std::result::Result<(), Self::Error>> {
            Poll::Ready(Ok(()))
        }
        fn call(&mut self, req: http::Request<B>) -> Self::Future {
            match req.uri().path() {
                "/quickwit.search.SearchService/RootSearch" => {
                    #[allow(non_camel_case_types)]
                    struct RootSearchSvc<T: SearchService>(pub Arc<T>);
                    impl<
                        T: SearchService,
                    > tonic::server::UnaryService<super::SearchRequest>
                    for RootSearchSvc<T> {
                        type Response = super::SearchResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::SearchRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as SearchService>::root_search(&inner, request).await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = RootSearchSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/quickwit.search.SearchService/LeafSearch" => {
                    #[allow(non_camel_case_types)]
                    struct LeafSearchSvc<T: SearchService>(pub Arc<T>);
                    impl<
                        T: SearchService,
                    > tonic::server::UnaryService<super::LeafSearchRequest>
                    for LeafSearchSvc<T> {
                        type Response = super::LeafSearchResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::LeafSearchRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as SearchService>::leaf_search(&inner, request).await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = LeafSearchSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/quickwit.search.SearchService/FetchDocs" => {
                    #[allow(non_camel_case_types)]
                    struct FetchDocsSvc<T: SearchService>(pub Arc<T>);
                    impl<
                        T: SearchService,
                    > tonic::server::UnaryService<super::FetchDocsRequest>
                    for FetchDocsSvc<T> {
                        type Response = super::FetchDocsResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::FetchDocsRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as SearchService>::fetch_docs(&inner, request).await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = FetchDocsSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/quickwit.search.SearchService/RootListTerms" => {
                    #[allow(non_camel_case_types)]
                    struct RootListTermsSvc<T: SearchService>(pub Arc<T>);
                    impl<
                        T: SearchService,
                    > tonic::server::UnaryService<super::ListTermsRequest>
                    for RootListTermsSvc<T> {
                        type Response = super::ListTermsResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::ListTermsRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as SearchService>::root_list_terms(&inner, request).await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = RootListTermsSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/quickwit.search.SearchService/LeafListTerms" => {
                    #[allow(non_camel_case_types)]
                    struct LeafListTermsSvc<T: SearchService>(pub Arc<T>);
                    impl<
                        T: SearchService,
                    > tonic::server::UnaryService<super::LeafListTermsRequest>
                    for LeafListTermsSvc<T> {
                        type Response = super::LeafListTermsResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::LeafListTermsRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as SearchService>::leaf_list_terms(&inner, request).await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = LeafListTermsSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/quickwit.search.SearchService/Scroll" => {
                    #[allow(non_camel_case_types)]
                    struct ScrollSvc<T: SearchService>(pub Arc<T>);
                    impl<
                        T: SearchService,
                    > tonic::server::UnaryService<super::ScrollRequest>
                    for ScrollSvc<T> {
                        type Response = super::SearchResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::ScrollRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as SearchService>::scroll(&inner, request).await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = ScrollSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/quickwit.search.SearchService/PutKV" => {
                    #[allow(non_camel_case_types)]
                    struct PutKVSvc<T: SearchService>(pub Arc<T>);
                    impl<
                        T: SearchService,
                    > tonic::server::UnaryService<super::PutKvRequest> for PutKVSvc<T> {
                        type Response = super::PutKvResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::PutKvRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as SearchService>::put_kv(&inner, request).await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = PutKVSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/quickwit.search.SearchService/GetKV" => {
                    #[allow(non_camel_case_types)]
                    struct GetKVSvc<T: SearchService>(pub Arc<T>);
                    impl<
                        T: SearchService,
                    > tonic::server::UnaryService<super::GetKvRequest> for GetKVSvc<T> {
                        type Response = super::GetKvResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::GetKvRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as SearchService>::get_kv(&inner, request).await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = GetKVSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/quickwit.search.SearchService/ReportSplits" => {
                    #[allow(non_camel_case_types)]
                    struct ReportSplitsSvc<T: SearchService>(pub Arc<T>);
                    impl<
                        T: SearchService,
                    > tonic::server::UnaryService<super::ReportSplitsRequest>
                    for ReportSplitsSvc<T> {
                        type Response = super::ReportSplitsResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::ReportSplitsRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as SearchService>::report_splits(&inner, request).await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = ReportSplitsSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/quickwit.search.SearchService/ListFields" => {
                    #[allow(non_camel_case_types)]
                    struct ListFieldsSvc<T: SearchService>(pub Arc<T>);
                    impl<
                        T: SearchService,
                    > tonic::server::UnaryService<super::ListFieldsRequest>
                    for ListFieldsSvc<T> {
                        type Response = super::ListFieldsResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::ListFieldsRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as SearchService>::list_fields(&inner, request).await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = ListFieldsSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/quickwit.search.SearchService/LeafListFields" => {
                    #[allow(non_camel_case_types)]
                    struct LeafListFieldsSvc<T: SearchService>(pub Arc<T>);
                    impl<
                        T: SearchService,
                    > tonic::server::UnaryService<super::LeafListFieldsRequest>
                    for LeafListFieldsSvc<T> {
                        type Response = super::ListFieldsResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::LeafListFieldsRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as SearchService>::leaf_list_fields(&inner, request)
                                    .await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = LeafListFieldsSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                "/quickwit.search.SearchService/SearchPlan" => {
                    #[allow(non_camel_case_types)]
                    struct SearchPlanSvc<T: SearchService>(pub Arc<T>);
                    impl<
                        T: SearchService,
                    > tonic::server::UnaryService<super::SearchRequest>
                    for SearchPlanSvc<T> {
                        type Response = super::SearchPlanResponse;
                        type Future = BoxFuture<
                            tonic::Response<Self::Response>,
                            tonic::Status,
                        >;
                        fn call(
                            &mut self,
                            request: tonic::Request<super::SearchRequest>,
                        ) -> Self::Future {
                            let inner = Arc::clone(&self.0);
                            let fut = async move {
                                <T as SearchService>::search_plan(&inner, request).await
                            };
                            Box::pin(fut)
                        }
                    }
                    let accept_compression_encodings = self.accept_compression_encodings;
                    let send_compression_encodings = self.send_compression_encodings;
                    let max_decoding_message_size = self.max_decoding_message_size;
                    let max_encoding_message_size = self.max_encoding_message_size;
                    let inner = self.inner.clone();
                    let fut = async move {
                        let method = SearchPlanSvc(inner);
                        let codec = tonic_prost::ProstCodec::default();
                        let mut grpc = tonic::server::Grpc::new(codec)
                            .apply_compression_config(
                                accept_compression_encodings,
                                send_compression_encodings,
                            )
                            .apply_max_message_size_config(
                                max_decoding_message_size,
                                max_encoding_message_size,
                            );
                        let res = grpc.unary(method, req).await;
                        Ok(res)
                    };
                    Box::pin(fut)
                }
                _ => {
                    Box::pin(async move {
                        let mut response = http::Response::new(
                            tonic::body::Body::default(),
                        );
                        let headers = response.headers_mut();
                        headers
                            .insert(
                                tonic::Status::GRPC_STATUS,
                                (tonic::Code::Unimplemented as i32).into(),
                            );
                        headers
                            .insert(
                                http::header::CONTENT_TYPE,
                                tonic::metadata::GRPC_CONTENT_TYPE,
                            );
                        Ok(response)
                    })
                }
            }
        }
    }
    impl<T> Clone for SearchServiceServer<T> {
        fn clone(&self) -> Self {
            let inner = self.inner.clone();
            Self {
                inner,
                accept_compression_encodings: self.accept_compression_encodings,
                send_compression_encodings: self.send_compression_encodings,
                max_decoding_message_size: self.max_decoding_message_size,
                max_encoding_message_size: self.max_encoding_message_size,
            }
        }
    }
    /// Generated gRPC service name
    pub const SERVICE_NAME: &str = "quickwit.search.SearchService";
    impl<T> tonic::server::NamedService for SearchServiceServer<T> {
        const NAME: &'static str = SERVICE_NAME;
    }
}


================================================
FILE: quickwit/quickwit-proto/src/control_plane/mod.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use quickwit_actors::AskError;
use quickwit_common::rate_limited_error;
use quickwit_common::tower::{MakeLoadShedError, RpcName, TimeoutExceeded};
use serde::{Deserialize, Serialize};
use thiserror;

use crate::metastore::{MetastoreError, OpenShardSubrequest};
use crate::{GrpcServiceError, ServiceError, ServiceErrorCode};

include!("../codegen/quickwit/quickwit.control_plane.rs");

pub const CONTROL_PLANE_FILE_DESCRIPTOR_SET: &[u8] =
    include_bytes!("../codegen/quickwit/control_plane_descriptor.bin");

pub type ControlPlaneResult<T> = std::result::Result<T, ControlPlaneError>;

#[derive(Debug, thiserror::Error, Eq, PartialEq, Serialize, Deserialize)]
#[serde(rename_all = "snake_case")]
pub enum ControlPlaneError {
    #[error("internal error: {0}")]
    Internal(String),
    #[error("metastore error: {0}")]
    Metastore(#[from] MetastoreError),
    #[error("request timed out: {0}")]
    Timeout(String),
    #[error("too many requests")]
    TooManyRequests,
    #[error("service unavailable: {0}")]
    Unavailable(String),
}

impl From<TimeoutExceeded> for ControlPlaneError {
    fn from(_timeout_exceeded: TimeoutExceeded) -> Self {
        Self::Timeout("tower layer timeout".to_string())
    }
}

impl From<quickwit_common::tower::TaskCancelled> for ControlPlaneError {
    fn from(task_cancelled: quickwit_common::tower::TaskCancelled) -> Self {
        ControlPlaneError::Internal(task_cancelled.to_string())
    }
}

impl ServiceError for ControlPlaneError {
    fn error_code(&self) -> ServiceErrorCode {
        match self {
            Self::Internal(error_msg) => {
                rate_limited_error!(
                    limit_per_min = 6,
                    "control plane internal error: {error_msg}"
                );
                ServiceErrorCode::Internal
            }
            Self::Metastore(metastore_error) => metastore_error.error_code(),
            Self::Timeout(_) => ServiceErrorCode::Timeout,
            Self::TooManyRequests => ServiceErrorCode::TooManyRequests,
            Self::Unavailable(_) => ServiceErrorCode::Unavailable,
        }
    }
}

impl GrpcServiceError for ControlPlaneError {
    fn new_internal(message: String) -> Self {
        Self::Internal(message)
    }

    fn new_timeout(message: String) -> Self {
        Self::Timeout(message)
    }

    fn new_too_many_requests() -> Self {
        Self::TooManyRequests
    }

    fn new_unavailable(message: String) -> Self {
        Self::Unavailable(message)
    }
}

impl MakeLoadShedError for ControlPlaneError {
    fn make_load_shed_error() -> Self {
        Self::TooManyRequests
    }
}

impl From<ControlPlaneError> for MetastoreError {
    fn from(error: ControlPlaneError) -> Self {
        match error {
            ControlPlaneError::Internal(message) => MetastoreError::Internal {
                message: "an internal metastore error occurred".to_string(),
                cause: message,
            },
            ControlPlaneError::Metastore(error) => error,
            ControlPlaneError::Timeout(message) => MetastoreError::Timeout(message),
            ControlPlaneError::TooManyRequests => MetastoreError::TooManyRequests,
            ControlPlaneError::Unavailable(message) => MetastoreError::Unavailable(message),
        }
    }
}

impl From<AskError<ControlPlaneError>> for ControlPlaneError {
    fn from(error: AskError<ControlPlaneError>) -> Self {
        match error {
            AskError::ErrorReply(error) => error,
            AskError::MessageNotDelivered => {
                Self::new_unavailable("request could not be delivered to actor".to_string())
            }
            AskError::ProcessMessageError => {
                Self::new_internal("an error occurred while processing the request".to_string())
            }
        }
    }
}

impl RpcName for GetOrCreateOpenShardsRequest {
    fn rpc_name() -> &'static str {
        "get_or_create_open_shards"
    }
}

impl RpcName for AdviseResetShardsRequest {
    fn rpc_name() -> &'static str {
        "advise_reset_shards"
    }
}

impl GetOrCreateOpenShardsFailureReason {
    pub fn create_failure(
        &self,
        subrequest: impl Into<GetOrCreateOpenShardsSubrequest>,
    ) -> GetOrCreateOpenShardsFailure {
        let subrequest = subrequest.into();

        GetOrCreateOpenShardsFailure {
            subrequest_id: subrequest.subrequest_id,
            index_id: subrequest.index_id,
            source_id: subrequest.source_id,
            reason: *self as i32,
        }
    }
}

impl From<crate::metastore::OpenShardSubrequest> for GetOrCreateOpenShardsSubrequest {
    fn from(metastore_open_shard_subrequest: OpenShardSubrequest) -> Self {
        let index_id = metastore_open_shard_subrequest.index_uid().index_id.clone();

        Self {
            subrequest_id: metastore_open_shard_subrequest.subrequest_id,
            index_id,
            source_id: metastore_open_shard_subrequest.source_id,
        }
    }
}


================================================
FILE: quickwit/quickwit-proto/src/developer/mod.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use thiserror;

use crate::{GrpcServiceError, ServiceError, ServiceErrorCode};

include!("../codegen/quickwit/quickwit.developer.rs");

pub const DEVELOPER_FILE_DESCRIPTOR_SET: &[u8] =
    include_bytes!("../codegen/quickwit/developer_descriptor.bin");

pub type DeveloperResult<T> = std::result::Result<T, DeveloperError>;

#[derive(Debug, thiserror::Error, Eq, PartialEq, serde::Serialize, serde::Deserialize)]
#[serde(rename_all = "snake_case")]
pub enum DeveloperError {
    #[error("internal error: {0}")]
    Internal(String),
    #[error("invalid argument: {0}")]
    InvalidArgument(String),
    #[error("request timed out: {0}")]
    Timeout(String),
    #[error("too many requests")]
    TooManyRequests,
    #[error("service unavailable: {0}")]
    Unavailable(String),
}

impl ServiceError for DeveloperError {
    fn error_code(&self) -> ServiceErrorCode {
        match self {
            Self::Internal(_) => ServiceErrorCode::Internal,
            Self::InvalidArgument(_) => ServiceErrorCode::BadRequest,
            Self::Timeout(_) => ServiceErrorCode::Timeout,
            Self::TooManyRequests => ServiceErrorCode::TooManyRequests,
            Self::Unavailable(_) => ServiceErrorCode::Unavailable,
        }
    }
}

impl GrpcServiceError for DeveloperError {
    fn new_internal(message: String) -> Self {
        Self::Internal(message)
    }

    fn new_timeout(message: String) -> Self {
        Self::Timeout(message)
    }

    fn new_too_many_requests() -> Self {
        Self::TooManyRequests
    }

    fn new_unavailable(message: String) -> Self {
        Self::Unavailable(message)
    }
}


================================================
FILE: quickwit/quickwit-proto/src/error.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::convert::Infallible;
use std::error::Error;
use std::fmt::Debug;

use anyhow::Context;
use quickwit_actors::AskError;
use serde::Serialize;
use serde::de::DeserializeOwned;
use tonic::metadata::BinaryMetadataValue;
use tracing::{error, warn};

const QW_ERROR_HEADER_NAME: &str = "qw-error-bin";

/// This enum maps our internal error codes to
/// gRPC and HTTP status codes.
///
/// It is voluntarily a restricted subset of gRPC status codes. Please introduce new variants
/// thoughtfully.
#[derive(Clone, Copy)]
pub enum ServiceErrorCode {
    AlreadyExists,
    BadRequest,
    // Use `Unauthenticated` if the caller cannot be identified.
    Forbidden,
    Internal,
    NotFound,
    Timeout,
    TooManyRequests,
    Unauthenticated,
    Unavailable,
}

impl ServiceErrorCode {
    fn grpc_status_code(&self) -> tonic::Code {
        match self {
            Self::AlreadyExists => tonic::Code::AlreadyExists,
            Self::BadRequest => tonic::Code::InvalidArgument,
            Self::Forbidden => tonic::Code::PermissionDenied,
            Self::Internal => tonic::Code::Internal,
            Self::NotFound => tonic::Code::NotFound,
            Self::Timeout => tonic::Code::DeadlineExceeded,
            Self::TooManyRequests => tonic::Code::ResourceExhausted,
            Self::Unauthenticated => tonic::Code::Unauthenticated,
            Self::Unavailable => tonic::Code::Unavailable,
        }
    }

    pub fn http_status_code(&self) -> http::StatusCode {
        match self {
            Self::AlreadyExists => http::StatusCode::BAD_REQUEST,
            Self::BadRequest => http::StatusCode::BAD_REQUEST,
            Self::Forbidden => http::StatusCode::FORBIDDEN,
            Self::Internal => http::StatusCode::INTERNAL_SERVER_ERROR,
            Self::NotFound => http::StatusCode::NOT_FOUND,
            Self::Timeout => http::StatusCode::REQUEST_TIMEOUT,
            Self::TooManyRequests => http::StatusCode::TOO_MANY_REQUESTS,
            Self::Unauthenticated => http::StatusCode::UNAUTHORIZED,
            Self::Unavailable => http::StatusCode::SERVICE_UNAVAILABLE,
        }
    }
}

pub trait ServiceError: Error + Debug + 'static {
    fn error_code(&self) -> ServiceErrorCode;
}

impl ServiceError for Infallible {
    fn error_code(&self) -> ServiceErrorCode {
        unreachable!()
    }
}

impl<E> ServiceError for AskError<E>
where E: ServiceError
{
    fn error_code(&self) -> ServiceErrorCode {
        match self {
            AskError::ErrorReply(error) => error.error_code(),
            AskError::MessageNotDelivered => ServiceErrorCode::Unavailable,
            AskError::ProcessMessageError => ServiceErrorCode::Internal,
        }
    }
}

/// A trait for encoding/decoding service errors to/from gRPC statuses. Errors are stored in JSON
/// in the gRPC header `qw-error-bin`. This allows for propagating them transparently
/// between clients and servers over the network without being semantically limited to a status code
/// and a message. However, it also means that modifying the serialization format of existing errors
/// or introducing new ones is not backward compatible.
pub trait GrpcServiceError: ServiceError + Serialize + DeserializeOwned + Send + Sync {
    fn into_grpc_status(self) -> tonic::Status {
        grpc_error_to_grpc_status(self)
    }

    fn new_internal(message: String) -> Self;

    fn new_timeout(message: String) -> Self;

    fn new_too_many_requests() -> Self;

    fn new_unavailable(message: String) -> Self;
}

/// Converts a service error into a gRPC status.
pub fn grpc_error_to_grpc_status<E>(service_error: E) -> tonic::Status
where E: GrpcServiceError {
    let code = service_error.error_code().grpc_status_code();
    let message = service_error.to_string();
    let mut status = tonic::Status::new(code, message);

    match encode_error(&service_error) {
        Ok(header_value) => {
            status
                .metadata_mut()
                .insert_bin(QW_ERROR_HEADER_NAME, header_value);
        }
        Err(error) => {
            warn!(%error, "failed to encode error `{service_error:?}`");
        }
    }
    status
}

/// Converts a gRPC status into a service error.
pub fn grpc_status_to_service_error<E>(status: tonic::Status, rpc_name: &'static str) -> E
where E: GrpcServiceError {
    if let Some(header_value) = status.metadata().get_bin(QW_ERROR_HEADER_NAME) {
        let service_error = match decode_error(header_value) {
            Ok(service_error) => service_error,
            Err(error) => {
                let message = format!(
                    "failed to deserialize error returned from server (this can happen during \
                     rolling upgrades): {error}"
                );
                E::new_internal(message)
            }
        };
        return service_error;
    }
    let message = status.message().to_string();
    error!(code = ?status.code(), rpc = rpc_name, "gRPC transport error: {message}");

    match status.code() {
        // `Cancelled` is a client timeout whereas `DeadlineExceeded` is a server timeout. At this
        // stage, we don't distinguish them.
        tonic::Code::Cancelled | tonic::Code::DeadlineExceeded => E::new_timeout(message),
        tonic::Code::Unavailable => E::new_unavailable(message),
        _ => E::new_internal(message),
    }
}

/// Encodes a service error into a gRPC header value.
fn encode_error<E: Serialize>(service_error: &E) -> anyhow::Result<BinaryMetadataValue> {
    let service_error_json = serde_json::to_vec(&service_error)?;
    let header_value = BinaryMetadataValue::from_bytes(&service_error_json);
    Ok(header_value)
}

/// Decodes a service error from a gRPC header value.
fn decode_error<E: DeserializeOwned>(header_value: &BinaryMetadataValue) -> anyhow::Result<E> {
    let service_error_json = header_value.to_bytes().context("invalid header value")?;
    let service_error = serde_json::from_slice(&service_error_json).with_context(|| {
        if let Ok(service_error_json_str) = std::str::from_utf8(&service_error_json) {
            format!("invalid JSON `{service_error_json_str}`")
        } else {
            "invalid JSON".to_string()
        }
    })?;
    Ok(service_error)
}

#[allow(clippy::result_large_err)]
pub fn convert_to_grpc_result<T, E: GrpcServiceError>(
    result: Result<T, E>,
) -> tonic::Result<tonic::Response<T>> {
    result
        .map(tonic::Response::new)
        .map_err(|error| error.into_grpc_status())
}

#[cfg(test)]
mod tests {
    use serde::Deserialize;

    use super::*;

    #[test]
    fn test_grpc_service_error_roundtrip() {
        #[derive(Clone, Debug, thiserror::Error, Eq, PartialEq, Serialize, Deserialize)]
        #[serde(rename_all = "snake_case")]
        enum MyError {
            #[error("internal error: {0}")]
            Internal(String),
            #[error("request timed out: {0}")]
            Timeout(String),

            #[error("too many requests")]
            TooManyRequests,

            #[error("service unavailable: {0}")]
            Unavailable(String),
        }

        impl ServiceError for MyError {
            fn error_code(&self) -> ServiceErrorCode {
                match self {
                    Self::Internal(_) => ServiceErrorCode::Internal,
                    Self::Timeout(_) => ServiceErrorCode::Timeout,
                    Self::TooManyRequests => ServiceErrorCode::TooManyRequests,
                    Self::Unavailable(_) => ServiceErrorCode::Unavailable,
                }
            }
        }

        impl GrpcServiceError for MyError {
            fn new_internal(message: String) -> Self {
                Self::Internal(message)
            }

            fn new_timeout(message: String) -> Self {
                Self::Timeout(message)
            }

            fn new_too_many_requests() -> Self {
                Self::TooManyRequests
            }

            fn new_unavailable(message: String) -> Self {
                Self::Unavailable(message)
            }
        }

        let service_error = MyError::new_internal("test".to_string());
        let status = grpc_error_to_grpc_status(service_error.clone());
        let expected_error: MyError = grpc_status_to_service_error(status, "rpc_name");
        assert_eq!(service_error, expected_error);
    }
}


================================================
FILE: quickwit/quickwit-proto/src/getters.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use crate::control_plane::*;
use crate::indexing::*;
use crate::ingest::ingester::*;
use crate::ingest::router::*;
use crate::ingest::*;
use crate::metastore::*;
use crate::types::*;

macro_rules! generate_getters {
    (impl fn $field:ident() -> $type:ty {} for $($struct:ty),+) => {
        $(
        impl $struct {
            // we track caller so the reported line isn't the macro invocation below
            #[track_caller]
            pub fn $field(&self) -> $type {
                self.$field
                    .as_ref()
                    .expect(concat!("`",
                    stringify!($field), "` should be a required field"))
            }
        }
        )*
    }
}

macro_rules! generate_clone_getters {
    (impl fn $field:ident() -> $type:ty {} for $($struct:ty),+) => {
        $(
        impl $struct {
            // we track caller so the reported line isn't the macro invocation below
            #[track_caller]
            pub fn $field(&self) -> $type {
                self.$field
                    .clone()
                    .expect(concat!("`",
                    stringify!($field), "` should be a required field"))
            }
        }
        )*
    }
}

macro_rules! generate_copy_getters {
    (impl fn $field:ident() -> $type:ty {} for $($struct:ty),+) => {
        $(
        impl $struct {
            // we track caller so the reported line isn't the macro invocation below
            #[track_caller]
            pub fn $field(&self) -> $type {
                self.$field
                    .expect(concat!("`",
                    stringify!($field), "` should be a required field"))
            }
        }
        )*
    }
}

// [`DocMappingUid`] getters
generate_copy_getters!(
    impl fn doc_mapping_uid() -> DocMappingUid {} for

    OpenShardSubrequest,
    Shard
);

// [`DocUid`] getters
generate_copy_getters! {
    impl fn doc_uid() -> DocUid {} for

    ParseFailure
}

// [`IndexUid`] getters
generate_getters! {
    impl fn index_uid() -> &IndexUid {} for
    // Control Plane API
    GetOrCreateOpenShardsSuccess,

    // Indexing API
    IndexingTask,

    // Ingest API
    FetchEof,
    FetchPayload,
    IngestSuccess,
    OpenFetchStreamRequest,
    PersistFailure,
    PersistSubrequest,
    PersistSuccess,
    ReplicateFailure,
    ReplicateSubrequest,
    ReplicateSuccess,
    RetainShardsForSource,
    Shard,
    ShardIdPositions,
    ShardIds,
    ShardPKey,
    TruncateShardsSubrequest,
    SourceShardUpdate,

    // Metastore API
    AcquireShardsRequest,
    AddSourceRequest,
    CreateIndexResponse,
    DeleteIndexRequest,
    DeleteQuery,
    DeleteShardsRequest,
    DeleteShardsResponse,
    DeleteSourceRequest,
    DeleteSplitsRequest,
    LastDeleteOpstampRequest,
    ListDeleteTasksRequest,
    ListShardsSubrequest,
    ListShardsSubresponse,
    ListStaleSplitsRequest,
    MarkSplitsForDeletionRequest,
    OpenShardSubrequest,
    PruneShardsRequest,
    PublishSplitsRequest,
    ResetSourceCheckpointRequest,
    StageSplitsRequest,
    ToggleSourceRequest,
    UpdateIndexRequest,
    UpdateSourceRequest,
    UpdateSplitsDeleteOpstampRequest
}

// [`PipelineUid`] getters
generate_copy_getters! {
    impl fn pipeline_uid() -> PipelineUid {} for

    IndexingTask
}

// [`Position`] getters. We use `clone` because `Position` is an `Arc` under the hood.
generate_clone_getters! {
    impl fn eof_position() -> Position {} for

    FetchEof
}

generate_clone_getters! {
    impl fn from_position_exclusive() -> Position {} for

    FetchPayload,
    OpenFetchStreamRequest,
    ReplicateSubrequest
}

generate_clone_getters! {
    impl fn to_position_inclusive() -> Position {} for

    FetchPayload
}

generate_clone_getters! {
    impl fn publish_position_inclusive() -> Position {} for

    Shard,
    ShardIdPosition
}

generate_clone_getters! {
    impl fn replication_position_inclusive() -> Position {} for

    ReplicateSuccess
}

generate_clone_getters! {
    impl fn truncate_up_to_position_inclusive() -> Position {} for

    TruncateShardsSubrequest
}

// [`Shard`] getters
generate_getters! {
    impl fn open_shard() -> &Shard {} for

    OpenShardSubresponse
}

generate_getters! {
    impl fn shard() -> &Shard {} for

    InitShardSubrequest,
    InitShardSuccess
}

// [`ShardId`] getters
generate_getters! {
    impl fn shard_id() -> &ShardId {} for

    FetchEof,
    FetchPayload,
    InitShardFailure,
    OpenFetchStreamRequest,
    OpenShardSubrequest,
    PersistSuccess,
    ReplicateFailure,
    ReplicateSubrequest,
    ReplicateSuccess,
    Shard,
    ShardIdPosition,
    ShardPKey,
    TruncateShardsSubrequest
}


================================================
FILE: quickwit/quickwit-proto/src/indexing/mod.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::fmt;
use std::fmt::{Display, Formatter};
use std::hash::Hash;
use std::ops::{Add, Mul, Sub};

use bytesize::ByteSize;
use quickwit_actors::AskError;
use quickwit_common::pubsub::Event;
use quickwit_common::rate_limited_error;
use quickwit_common::tower::{MakeLoadShedError, RpcName, TimeoutExceeded};
use serde::{Deserialize, Serialize};
use thiserror;

use crate::metastore::MetastoreError;
use crate::types::{IndexUid, NodeId, PipelineUid, Position, ShardId, SourceId, SourceUid};
use crate::{GrpcServiceError, ServiceError, ServiceErrorCode};

include!("../codegen/quickwit/quickwit.indexing.rs");

pub const INDEXING_FILE_DESCRIPTOR_SET: &[u8] =
    include_bytes!("../codegen/quickwit/indexing_descriptor.bin");

pub type IndexingResult<T> = std::result::Result<T, IndexingError>;

#[derive(Debug, thiserror::Error, Eq, PartialEq, Serialize, Deserialize)]
#[serde(rename_all = "snake_case")]
pub enum IndexingError {
    #[error("internal error: {0}")]
    Internal(String),
    #[error("metastore error: {0}")]
    Metastore(#[from] MetastoreError),
    #[error("request timed out: {0}")]
    Timeout(String),
    #[error("too many requests")]
    TooManyRequests,
    #[error("service unavailable: {0}")]
    Unavailable(String),
}
impl From<TimeoutExceeded> for IndexingError {
    fn from(_timeout_exceeded: TimeoutExceeded) -> Self {
        Self::Timeout("tower layer timeout".to_string())
    }
}

impl ServiceError for IndexingError {
    fn error_code(&self) -> ServiceErrorCode {
        match self {
            Self::Internal(err_msg) => {
                rate_limited_error!(limit_per_min = 6, "indexing error: {err_msg}");
                ServiceErrorCode::Internal
            }
            Self::Metastore(metastore_error) => metastore_error.error_code(),
            Self::Timeout(_) => ServiceErrorCode::Timeout,
            Self::TooManyRequests => ServiceErrorCode::TooManyRequests,
            Self::Unavailable(_) => ServiceErrorCode::Unavailable,
        }
    }
}

impl GrpcServiceError for IndexingError {
    fn new_internal(message: String) -> Self {
        Self::Internal(message)
    }

    fn new_timeout(message: String) -> Self {
        Self::Timeout(message)
    }

    fn new_too_many_requests() -> Self {
        Self::TooManyRequests
    }

    fn new_unavailable(message: String) -> Self {
        Self::Unavailable(message)
    }
}

impl MakeLoadShedError for IndexingError {
    fn make_load_shed_error() -> Self {
        Self::TooManyRequests
    }
}

impl From<AskError<IndexingError>> for IndexingError {
    fn from(error: AskError<IndexingError>) -> Self {
        match error {
            AskError::ErrorReply(error) => error,
            AskError::MessageNotDelivered => {
                Self::new_unavailable("request could not be delivered to actor".to_string())
            }
            AskError::ProcessMessageError => {
                Self::new_internal("an error occurred while processing the request".to_string())
            }
        }
    }
}

/// Uniquely identifies an indexing pipeline. There can be multiple indexing pipelines per
/// source `(index_uid, source_id)` running simultaneously on an indexer.
#[derive(Clone, Debug, Hash, Eq, PartialEq)]
pub struct IndexingPipelineId {
    pub node_id: NodeId,
    pub index_uid: IndexUid,
    pub source_id: SourceId,
    pub pipeline_uid: PipelineUid,
}

impl IndexingPipelineId {
    pub fn merge_pipeline_id(&self) -> MergePipelineId {
        MergePipelineId {
            node_id: self.node_id.clone(),
            index_uid: self.index_uid.clone(),
            source_id: self.source_id.clone(),
        }
    }
}

impl Display for IndexingPipelineId {
    fn fmt(&self, f: &mut Formatter) -> fmt::Result {
        write!(f, "{}:{}", self.index_uid, &self.source_id)
    }
}

/// Uniquely identifies a merge pipeline. There exists at most one merge pipeline per
/// `(index_uid, source_id)` running on indexer at any given time fed by one or more indexing
/// pipelines.
#[derive(Clone, Debug, Hash, Eq, PartialEq)]
pub struct MergePipelineId {
    pub node_id: NodeId,
    pub index_uid: IndexUid,
    pub source_id: SourceId,
}

impl Display for MergePipelineId {
    fn fmt(&self, f: &mut Formatter) -> fmt::Result {
        write!(f, "merge:{}:{}", self.index_uid, &self.source_id)
    }
}

impl Display for IndexingTask {
    fn fmt(&self, f: &mut Formatter) -> fmt::Result {
        write!(f, "{}:{}", self.index_uid(), &self.source_id)
    }
}

impl Eq for IndexingTask {}

// TODO: This implementation conflicts with the default derived implementation. It would be better
// to use a wrapper over `IndexingTask` where we need to group indexing tasks by index UID and
// source ID.
impl Hash for IndexingTask {
    fn hash<H: std::hash::Hasher>(&self, state: &mut H) {
        self.index_uid.hash(state);
        self.source_id.hash(state);
    }
}
#[derive(Clone, Copy, Debug, PartialEq, Eq, Serialize, utoipa::ToSchema)]
pub struct PipelineMetrics {
    pub cpu_load: CpuCapacity,
    // Indexing throughput (when the CPU is working).
    // This measure the theoretical maximum number of MB/s a full indexing pipeline could process
    // provided enough data was being ingested.
    pub throughput_mb_per_sec: u16,
}

impl Display for PipelineMetrics {
    fn fmt(&self, f: &mut Formatter) -> fmt::Result {
        write!(f, "{},{}MB/s", self.cpu_load, self.throughput_mb_per_sec)
    }
}

/// One full pipeline (including merging) is assumed to consume 4 CPU threads.
/// The actual number somewhere between 3 and 4. Quickwit is not super sensitive to this number.
///
/// It simply impacts the point where we prefer to work on balancing the load over the different
/// indexers and the point where we prefer improving other feature of the system (shard locality,
/// grouping pipelines associated to a given index on the same node, etc.).
pub const PIPELINE_FULL_CAPACITY: CpuCapacity = CpuCapacity::from_cpu_millis(4_000u32);

/// One full pipeline (including merging) is supposed to have the capacity to index at least 20mb/s.
/// This is a defensive value: In reality, this is typically above 30mb/s.
pub const PIPELINE_THROUGHPUT: ByteSize = ByteSize::mb(20);

/// The CpuCapacity represents an amount of CPU resource available.
///
/// It is usually expressed in CPU millis (For instance, one full CPU thread is
/// displayed as `1000m`).
#[derive(
    Copy, Clone, Debug, Eq, PartialEq, Deserialize, Serialize, Ord, PartialOrd, utoipa::ToSchema,
)]
#[serde(
    into = "CpuCapacityForSerialization",
    try_from = "CpuCapacityForSerialization"
)]
pub struct CpuCapacity(u32);

/// Short helper function to build `CpuCapacity`.
#[inline(always)]
pub const fn mcpu(milli_cpus: u32) -> CpuCapacity {
    CpuCapacity::from_cpu_millis(milli_cpus)
}

impl CpuCapacity {
    #[inline(always)]
    pub const fn from_cpu_millis(cpu_millis: u32) -> CpuCapacity {
        CpuCapacity(cpu_millis)
    }

    #[inline(always)]
    pub fn cpu_millis(self) -> u32 {
        self.0
    }

    #[inline(always)]
    pub fn zero() -> CpuCapacity {
        CpuCapacity::from_cpu_millis(0u32)
    }

    #[inline(always)]
    pub fn one_cpu_thread() -> CpuCapacity {
        CpuCapacity::from_cpu_millis(1_000u32)
    }
}

impl Sub<CpuCapacity> for CpuCapacity {
    type Output = CpuCapacity;

    #[inline(always)]
    fn sub(self, rhs: CpuCapacity) -> Self::Output {
        CpuCapacity::from_cpu_millis(self.0 - rhs.0)
    }
}

impl Add<CpuCapacity> for CpuCapacity {
    type Output = CpuCapacity;

    #[inline(always)]
    fn add(self, rhs: CpuCapacity) -> Self::Output {
        CpuCapacity::from_cpu_millis(self.0 + rhs.0)
    }
}

impl Mul<u32> for CpuCapacity {
    type Output = CpuCapacity;

    #[inline(always)]
    fn mul(self, rhs: u32) -> CpuCapacity {
        CpuCapacity::from_cpu_millis(self.0 * rhs)
    }
}

impl Mul<f32> for CpuCapacity {
    type Output = CpuCapacity;

    #[inline(always)]
    fn mul(self, scale: f32) -> CpuCapacity {
        CpuCapacity::from_cpu_millis((self.0 as f32 * scale) as u32)
    }
}

impl Display for CpuCapacity {
    fn fmt(&self, f: &mut Formatter) -> std::fmt::Result {
        write!(f, "{}m", self.0)
    }
}

#[derive(Serialize, Deserialize)]
#[serde(untagged)]
enum CpuCapacityForSerialization {
    Float(f32),
    MilliCpuWithUnit(String),
}

impl TryFrom<CpuCapacityForSerialization> for CpuCapacity {
    type Error = String;

    fn try_from(
        cpu_capacity_for_serialization: CpuCapacityForSerialization,
    ) -> Result<CpuCapacity, Self::Error> {
        match cpu_capacity_for_serialization {
            CpuCapacityForSerialization::Float(cpu_capacity) => {
                Ok(CpuCapacity((cpu_capacity * 1000.0f32) as u32))
            }
            CpuCapacityForSerialization::MilliCpuWithUnit(cpu_capacity_str) => {
                Self::from_str(&cpu_capacity_str)
            }
        }
    }
}

impl FromStr for CpuCapacity {
    type Err = String;

    fn from_str(cpu_capacity_str: &str) -> Result<Self, Self::Err> {
        let Some(milli_cpus_without_unit_str) = cpu_capacity_str.strip_suffix('m') else {
            return Err(format!(
                "invalid cpu capacity: `{cpu_capacity_str}`. String format expects a trailing 'm'."
            ));
        };
        let milli_cpus: u32 = milli_cpus_without_unit_str
            .parse::<u32>()
            .map_err(|_err| format!("invalid cpu capacity: `{cpu_capacity_str}`."))?;
        Ok(CpuCapacity(milli_cpus))
    }
}

impl From<CpuCapacity> for CpuCapacityForSerialization {
    fn from(cpu_capacity: CpuCapacity) -> CpuCapacityForSerialization {
        CpuCapacityForSerialization::MilliCpuWithUnit(format!("{}m", cpu_capacity.0))
    }
}

/// Whenever a shard position update is detected (whether it is emit by an indexing pipeline local
/// to the cluster or received via chitchat), the shard positions service publishes a
/// `ShardPositionsUpdate` event through the cluster's `EventBroker`.
#[derive(Debug, Clone, PartialEq, Eq)]
pub struct ShardPositionsUpdate {
    pub source_uid: SourceUid,
    // Only shards that received an update are listed here.
    pub updated_shard_positions: Vec<(ShardId, Position)>,
}

impl Event for ShardPositionsUpdate {}

impl RpcName for ApplyIndexingPlanRequest {
    fn rpc_name() -> &'static str {
        "apply_indexing_plan"
    }
}

#[cfg(test)]
mod tests {
    use super::*;

    #[test]
    fn test_cpu_capacity_serialization() {
        assert_eq!(CpuCapacity::from_str("2000m").unwrap(), mcpu(2000));
        assert_eq!(CpuCapacity::from_cpu_millis(2500), mcpu(2500));
        assert_eq!(
            CpuCapacity::from_str("2.5").unwrap_err(),
            "invalid cpu capacity: `2.5`. String format expects a trailing 'm'."
        );
        assert_eq!(
            serde_json::from_value::<CpuCapacity>(serde_json::Value::String("1200m".to_string()))
                .unwrap(),
            mcpu(1200)
        );
        assert_eq!(
            serde_json::from_value::<CpuCapacity>(serde_json::Value::Number(
                serde_json::Number::from_f64(1.2f64).unwrap()
            ))
            .unwrap(),
            mcpu(1200)
        );
        assert_eq!(
            serde_json::from_value::<CpuCapacity>(serde_json::Value::Number(
                serde_json::Number::from(1u32)
            ))
            .unwrap(),
            mcpu(1000)
        );
        assert_eq!(CpuCapacity::from_cpu_millis(2500).to_string(), "2500m");
        assert_eq!(serde_json::to_string(&mcpu(2500)).unwrap(), "\"2500m\"");
    }
}


================================================
FILE: quickwit/quickwit-proto/src/ingest/ingester.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use bytesize::ByteSize;

use crate::types::{Position, QueueId, queue_id};

include!("../codegen/quickwit/quickwit.ingest.ingester.rs");

pub use ingester_service_grpc_server::IngesterServiceGrpcServer;

impl FetchMessage {
    pub fn new_payload(payload: FetchPayload) -> Self {
        assert!(
            matches!(&payload.mrecord_batch, Some(batch) if !batch.mrecord_lengths.is_empty()),
            "`mrecord_batch` must be set and non-empty"
        );

        Self {
            message: Some(fetch_message::Message::Payload(payload)),
        }
    }

    pub fn new_eof(eof: FetchEof) -> Self {
        assert!(
            matches!(eof.eof_position, Some(Position::Eof(_))),
            "`eof_position` must be set"
        );

        Self {
            message: Some(fetch_message::Message::Eof(eof)),
        }
    }
}

impl FetchPayload {
    pub fn queue_id(&self) -> QueueId {
        queue_id(self.index_uid(), &self.source_id, self.shard_id())
    }

    pub fn num_mrecords(&self) -> usize {
        if let Some(mrecord_batch) = &self.mrecord_batch {
            mrecord_batch.mrecord_lengths.len()
        } else {
            0
        }
    }

    pub fn estimate_size(&self) -> ByteSize {
        if let Some(mrecord_batch) = &self.mrecord_batch {
            mrecord_batch.estimate_size()
        } else {
            ByteSize(0)
        }
    }
}

impl IngesterStatus {
    pub fn as_json_str_name(&self) -> &'static str {
        match self {
            Self::Unspecified => "unspecified",
            Self::Initializing => "initializing",
            Self::Ready => "ready",
            Self::Retiring => "retiring",
            Self::Decommissioning => "decommissioning",
            Self::Decommissioned => "decommissioned",
            Self::Failed => "failed",
        }
    }

    pub fn from_json_str_name(value: &str) -> Option<Self> {
        match value {
            "unspecified" => Some(Self::Unspecified),
            "initializing" => Some(Self::Initializing),
            "ready" => Some(Self::Ready),
            "retiring" => Some(Self::Retiring),
            "decommissioning" => Some(Self::Decommissioning),
            "decommissioned" => Some(Self::Decommissioned),
            "failed" => Some(Self::Failed),
            _ => None,
        }
    }

    pub fn is_ready(&self) -> bool {
        matches!(self, Self::Ready)
    }

    pub fn accepts_write_requests(&self) -> bool {
        matches!(self, Self::Ready | Self::Retiring)
    }
}

impl std::fmt::Display for IngesterStatus {
    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
        write!(f, "{}", self.as_json_str_name())
    }
}

impl OpenFetchStreamRequest {
    pub fn queue_id(&self) -> QueueId {
        queue_id(self.index_uid(), &self.source_id, self.shard_id())
    }
}

impl PersistSuccess {
    pub fn queue_id(&self) -> QueueId {
        queue_id(self.index_uid(), &self.source_id, self.shard_id())
    }
}

impl SynReplicationMessage {
    pub fn into_open_request(self) -> Option<OpenReplicationStreamRequest> {
        match self.message {
            Some(syn_replication_message::Message::OpenRequest(open_request)) => Some(open_request),
            _ => None,
        }
    }

    pub fn new_open_request(open_request: OpenReplicationStreamRequest) -> Self {
        Self {
            message: Some(syn_replication_message::Message::OpenRequest(open_request)),
        }
    }

    pub fn new_init_replica_request(init_replica_request: InitReplicaRequest) -> Self {
        Self {
            message: Some(syn_replication_message::Message::InitRequest(
                init_replica_request,
            )),
        }
    }

    pub fn new_replicate_request(replicate_request: ReplicateRequest) -> Self {
        Self {
            message: Some(syn_replication_message::Message::ReplicateRequest(
                replicate_request,
            )),
        }
    }
}

impl AckReplicationMessage {
    pub fn into_open_response(self) -> Option<OpenReplicationStreamResponse> {
        match self.message {
            Some(ack_replication_message::Message::OpenResponse(open_response)) => {
                Some(open_response)
            }
            _ => None,
        }
    }

    pub fn new_open_response(open_response: OpenReplicationStreamResponse) -> Self {
        Self {
            message: Some(ack_replication_message::Message::OpenResponse(
                open_response,
            )),
        }
    }

    pub fn new_init_replica_response(init_replica_response: InitReplicaResponse) -> Self {
        Self {
            message: Some(ack_replication_message::Message::InitResponse(
                init_replica_response,
            )),
        }
    }

    pub fn new_replicate_response(replicate_response: ReplicateResponse) -> Self {
        Self {
            message: Some(ack_replication_message::Message::ReplicateResponse(
                replicate_response,
            )),
        }
    }
}

impl ReplicateRequest {
    pub fn num_bytes(&self) -> usize {
        self.subrequests
            .iter()
            .flat_map(|subrequest| &subrequest.doc_batch)
            .map(|doc_batch| doc_batch.num_bytes())
            .sum()
    }
}

impl ReplicateSubrequest {
    pub fn queue_id(&self) -> QueueId {
        queue_id(self.index_uid(), &self.source_id, self.shard_id())
    }
}

impl TruncateShardsSubrequest {
    pub fn queue_id(&self) -> QueueId {
        queue_id(self.index_uid(), &self.source_id, self.shard_id())
    }
}


================================================
FILE: quickwit/quickwit-proto/src/ingest/mod.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::iter::zip;

use bytes::Bytes;
use bytesize::ByteSize;
use quickwit_common::rate_limited_error;
use quickwit_common::tower::MakeLoadShedError;
use serde::{Deserialize, Serialize};

use self::ingester::{PersistFailureReason, ReplicateFailureReason};
use self::router::IngestFailureReason;
use super::GrpcServiceError;
use crate::types::{DocUid, NodeIdRef, Position, QueueId, ShardId, SourceUid, queue_id};
use crate::{ServiceError, ServiceErrorCode};

pub mod ingester;
pub mod router;

include!("../codegen/quickwit/quickwit.ingest.rs");

pub const INGEST_FILE_DESCRIPTOR_SET: &[u8] =
    include_bytes!("../codegen/quickwit/ingest_descriptor.bin");

pub type IngestV2Result<T> = std::result::Result<T, IngestV2Error>;

#[derive(Debug, Copy, Clone, thiserror::Error, Eq, PartialEq, Serialize, Deserialize)]
pub enum RateLimitingCause {
    #[error("router load shedding")]
    RouterLoadShedding,
    #[error("load shedding")]
    LoadShedding,
    #[error("wal full (memory or disk)")]
    WalFull,
    #[error("circuit breaker")]
    CircuitBreaker,
    #[error("shard rate limiting")]
    ShardRateLimiting,
    #[error("unknown")]
    Unknown,
}

#[derive(Debug, thiserror::Error, Eq, PartialEq, Serialize, Deserialize)]
#[serde(rename_all = "snake_case")]
pub enum IngestV2Error {
    #[error("internal error: {0}")]
    Internal(String),
    #[error("shard `{shard_id}` not found")]
    ShardNotFound { shard_id: ShardId },
    #[error("request timed out: {0}")]
    Timeout(String),
    #[error("too many requests")]
    TooManyRequests(RateLimitingCause),
    #[error("service unavailable: {0}")]
    Unavailable(String),
}

impl From<quickwit_common::tower::TimeoutExceeded> for IngestV2Error {
    fn from(_: quickwit_common::tower::TimeoutExceeded) -> IngestV2Error {
        IngestV2Error::Timeout("tower layer timeout".to_string())
    }
}

impl From<quickwit_common::tower::TaskCancelled> for IngestV2Error {
    fn from(task_cancelled: quickwit_common::tower::TaskCancelled) -> IngestV2Error {
        IngestV2Error::Internal(task_cancelled.to_string())
    }
}

impl ServiceError for IngestV2Error {
    fn error_code(&self) -> ServiceErrorCode {
        match self {
            Self::Internal(error_msg) => {
                rate_limited_error!(limit_per_min = 6, "ingest internal error: {error_msg}");
                ServiceErrorCode::Internal
            }
            Self::ShardNotFound { .. } => ServiceErrorCode::NotFound,
            Self::Timeout(_) => ServiceErrorCode::Timeout,
            Self::TooManyRequests(_) => ServiceErrorCode::TooManyRequests,
            Self::Unavailable(_) => ServiceErrorCode::Unavailable,
        }
    }
}

impl GrpcServiceError for IngestV2Error {
    fn new_internal(message: String) -> Self {
        Self::Internal(message)
    }

    fn new_timeout(message: String) -> Self {
        Self::Timeout(message)
    }

    fn new_too_many_requests() -> Self {
        Self::TooManyRequests(RateLimitingCause::Unknown)
    }

    fn new_unavailable(message: String) -> Self {
        Self::Unavailable(message)
    }
}

impl MakeLoadShedError for IngestV2Error {
    fn make_load_shed_error() -> Self {
        IngestV2Error::TooManyRequests(RateLimitingCause::LoadShedding)
    }
}

impl Shard {
    /// List of nodes that are storing the shard (the leader, and optionally the follower).
    pub fn ingesters(&self) -> impl Iterator<Item = &NodeIdRef> + '_ {
        [Some(&self.leader_id), self.follower_id.as_ref()]
            .into_iter()
            .flatten()
            .map(|node_id| NodeIdRef::from_str(node_id))
    }

    pub fn source_uid(&self) -> SourceUid {
        SourceUid {
            index_uid: self.index_uid().clone(),
            source_id: self.source_id.clone(),
        }
    }
}

impl ShardPKey {
    pub fn queue_id(&self) -> QueueId {
        queue_id(self.index_uid(), &self.source_id, self.shard_id())
    }
}

impl DocBatchV2 {
    pub fn docs(&self) -> impl Iterator<Item = (DocUid, Bytes)> + '_ {
        zip(&self.doc_uids, &self.doc_lengths).scan(
            self.doc_buffer.clone(),
            |doc_buffer, (doc_uid, doc_len)| {
                let doc = doc_buffer.split_to(*doc_len as usize);
                Some((*doc_uid, doc))
            },
        )
    }

    pub fn into_docs(self) -> impl Iterator<Item = (DocUid, Bytes)> {
        zip(self.doc_uids, self.doc_lengths).scan(
            self.doc_buffer,
            |doc_buffer, (doc_uid, doc_len)| {
                let doc = doc_buffer.split_to(doc_len as usize);
                Some((doc_uid, doc))
            },
        )
    }

    pub fn is_empty(&self) -> bool {
        self.doc_lengths.is_empty()
    }

    pub fn num_bytes(&self) -> usize {
        self.doc_buffer.len() + self.doc_lengths.len() * 4
    }

    pub fn num_docs(&self) -> usize {
        self.doc_lengths.len()
    }

    #[cfg(any(test, feature = "testsuite"))]
    pub fn for_test(docs: impl IntoIterator<Item = &'static str>) -> Self {
        let mut doc_uids = Vec::new();
        let mut doc_buffer = Vec::new();
        let mut doc_lengths = Vec::new();

        for (doc_uid, doc) in docs.into_iter().enumerate() {
            doc_uids.push(DocUid::for_test(doc_uid as u128));
            doc_buffer.extend(doc.as_bytes());
            doc_lengths.push(doc.len() as u32);
        }
        Self {
            doc_uids,
            doc_buffer: Bytes::from(doc_buffer),
            doc_lengths,
        }
    }
}

impl MRecordBatch {
    pub fn encoded_mrecords(&self) -> impl Iterator<Item = Bytes> + '_ {
        self.mrecord_lengths
            .iter()
            .scan(0, |start_offset, mrecord_length| {
                let start = *start_offset;
                let end = start + *mrecord_length as usize;
                *start_offset = end;
                Some(self.mrecord_buffer.slice(start..end))
            })
    }

    pub fn is_empty(&self) -> bool {
        self.mrecord_lengths.is_empty()
    }

    pub fn estimate_size(&self) -> ByteSize {
        ByteSize((self.mrecord_buffer.len() + self.mrecord_lengths.len() * 4) as u64)
    }

    pub fn num_mrecords(&self) -> usize {
        self.mrecord_lengths.len()
    }

    #[cfg(any(test, feature = "testsuite"))]
    pub fn for_test(mrecords: impl IntoIterator<Item = &'static str>) -> Option<Self> {
        let mut mrecord_buffer = Vec::new();
        let mut mrecord_lengths = Vec::new();

        for mrecord in mrecords {
            mrecord_buffer.extend(mrecord.as_bytes());
            mrecord_lengths.push(mrecord.len() as u32);
        }
        Some(Self {
            mrecord_lengths,
            mrecord_buffer: Bytes::from(mrecord_buffer),
        })
    }
}

impl Shard {
    pub fn is_open(&self) -> bool {
        self.shard_state().is_open()
    }

    pub fn is_unavailable(&self) -> bool {
        self.shard_state().is_unavailable()
    }

    pub fn is_closed(&self) -> bool {
        self.shard_state().is_closed()
    }

    pub fn queue_id(&self) -> super::types::QueueId {
        queue_id(self.index_uid(), &self.source_id, self.shard_id())
    }
}

impl ShardState {
    pub fn is_open(&self) -> bool {
        *self == ShardState::Open
    }

    pub fn is_unavailable(&self) -> bool {
        *self == ShardState::Unavailable
    }

    pub fn is_closed(&self) -> bool {
        *self == ShardState::Closed
    }

    pub fn as_json_str_name(&self) -> &'static str {
        match self {
            ShardState::Unspecified => "unspecified",
            ShardState::Open => "open",
            ShardState::Unavailable => "unavailable",
            ShardState::Closed => "closed",
        }
    }

    pub fn from_json_str_name(shard_state_json_name: &str) -> Option<Self> {
        match shard_state_json_name {
            "unspecified" => Some(Self::Unspecified),
            "open" => Some(Self::Open),
            "unavailable" => Some(Self::Unavailable),
            "closed" => Some(Self::Closed),
            _ => None,
        }
    }
}

impl ShardIds {
    pub fn queue_ids(&self) -> impl Iterator<Item = QueueId> + '_ {
        self.shard_ids
            .iter()
            .map(|shard_id| queue_id(self.index_uid(), &self.source_id, shard_id))
    }

    pub fn pkeys(&self) -> impl Iterator<Item = ShardPKey> + '_ {
        self.shard_ids.iter().map(move |shard_id| ShardPKey {
            index_uid: self.index_uid.clone(),
            source_id: self.source_id.clone(),
            shard_id: Some(shard_id.clone()),
        })
    }
}

impl ShardIdPositions {
    pub fn queue_id_positions(&self) -> impl Iterator<Item = (QueueId, Position)> + '_ {
        self.shard_positions.iter().map(|shard_position| {
            let queue_id = queue_id(self.index_uid(), &self.source_id, shard_position.shard_id());
            (queue_id, shard_position.publish_position_inclusive())
        })
    }
}

impl From<PersistFailureReason> for IngestFailureReason {
    fn from(reason: PersistFailureReason) -> Self {
        match reason {
            PersistFailureReason::Unspecified => IngestFailureReason::Unspecified,
            PersistFailureReason::NoShardsAvailable => IngestFailureReason::NoShardsAvailable,
            PersistFailureReason::WalFull => IngestFailureReason::WalFull,
            PersistFailureReason::Timeout => IngestFailureReason::Timeout,
            PersistFailureReason::NodeUnavailable => IngestFailureReason::NoShardsAvailable,
        }
    }
}

impl From<ReplicateFailureReason> for PersistFailureReason {
    fn from(reason: ReplicateFailureReason) -> Self {
        match reason {
            ReplicateFailureReason::Unspecified => PersistFailureReason::Unspecified,
            ReplicateFailureReason::ShardNotFound => PersistFailureReason::NoShardsAvailable,
            ReplicateFailureReason::ShardClosed => PersistFailureReason::NoShardsAvailable,
            ReplicateFailureReason::WalFull => PersistFailureReason::WalFull,
        }
    }
}

#[cfg(test)]
mod tests {
    use super::*;

    #[test]
    fn test_shard_state_json_str_name() {
        let shard_state_json_name = ShardState::Unspecified.as_json_str_name();
        let shard_state = ShardState::from_json_str_name(shard_state_json_name).unwrap();
        assert_eq!(shard_state, ShardState::Unspecified);

        let shard_state_json_name = ShardState::Open.as_json_str_name();
        let shard_state = ShardState::from_json_str_name(shard_state_json_name).unwrap();
        assert_eq!(shard_state, ShardState::Open);

        let shard_state_json_name = ShardState::Unavailable.as_json_str_name();
        let shard_state = ShardState::from_json_str_name(shard_state_json_name).unwrap();
        assert_eq!(shard_state, ShardState::Unavailable);

        let shard_state_json_name = ShardState::Closed.as_json_str_name();
        let shard_state = ShardState::from_json_str_name(shard_state_json_name).unwrap();
        assert_eq!(shard_state, ShardState::Closed);

        assert!(ShardState::from_json_str_name("unknown").is_none());
    }
}


================================================
FILE: quickwit/quickwit-proto/src/ingest/router.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

include!("../codegen/quickwit/quickwit.ingest.router.rs");

impl IngestRequestV2 {
    pub fn num_bytes(&self) -> usize {
        self.subrequests
            .iter()
            .map(|subrequest| subrequest.num_bytes())
            .sum()
    }
}

impl IngestSubrequest {
    pub fn num_bytes(&self) -> usize {
        self.doc_batch
            .as_ref()
            .map(|doc_batch| doc_batch.doc_buffer.len())
            .unwrap_or(0)
    }
}


================================================
FILE: quickwit/quickwit-proto/src/lib.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#![allow(clippy::derive_partial_eq_without_eq)]
#![allow(clippy::disallowed_methods)]
#![allow(clippy::doc_lazy_continuation)]
#![allow(rustdoc::invalid_html_tags)]

use std::cmp::Ordering;

use ::opentelemetry::global;
use ::opentelemetry::propagation::{Extractor, Injector};
use tonic::Status;
use tonic::service::Interceptor;
use tracing::Span;
use tracing_opentelemetry::OpenTelemetrySpanExt;

pub mod cluster;
pub mod control_plane;
pub use bytes;
pub use tonic;
pub mod developer;
pub mod error;
mod getters;
pub mod indexing;
pub mod ingest;
pub mod metastore;
pub mod search;
pub mod types;

pub use error::{GrpcServiceError, ServiceError, ServiceErrorCode};
use search::ReportSplitsRequest;

pub mod jaeger {
    pub mod api_v2 {
        include!("codegen/jaeger/jaeger.api_v2.rs");
    }
    pub mod storage {
        pub mod v1 {
            include!("codegen/jaeger/jaeger.storage.v1.rs");
        }
        pub mod v2 {
            include!("codegen/jaeger/jaeger.storage.v2.rs");
        }
    }
}

pub mod opentelemetry {
    #[cfg(not(doctest))]
    pub mod proto {

        pub mod collector {
            pub mod logs {
                pub mod v1 {
                    include!("codegen/opentelemetry/opentelemetry.proto.collector.logs.v1.rs");
                }
            }
            // One can dream.
            // pub mod metrics {
            //     pub mod v1 {
            //         include!("codegen/opentelemetry/opentelemetry.proto.collector.metrics.v1.rs"
            // );     }
            // }
            pub mod trace {
                pub mod v1 {
                    include!("codegen/opentelemetry/opentelemetry.proto.collector.trace.v1.rs");
                }
            }
        }
        pub mod common {
            pub mod v1 {
                include!("codegen/opentelemetry/opentelemetry.proto.common.v1.rs");
            }
        }
        pub mod logs {
            pub mod v1 {
                include!("codegen/opentelemetry/opentelemetry.proto.logs.v1.rs");
            }
        }
        // pub mod metrics {
        //     pub mod experimental {
        //         include!("codegen/opentelemetry/opentelemetry.proto.metrics.experimental.rs");
        //     }
        //     pub mod v1 {
        //         tonic::include_proto!("codegen/opentelemetry/opentelemetry.proto.metrics.v1");
        //     }
        // }
        pub mod resource {
            pub mod v1 {
                include!("codegen/opentelemetry/opentelemetry.proto.resource.v1.rs");
            }
        }
        pub mod trace {
            pub mod v1 {
                include!("codegen/opentelemetry/opentelemetry.proto.trace.v1.rs");
            }
        }
    }
}

impl TryFrom<metastore::DeleteQuery> for search::SearchRequest {
    type Error = anyhow::Error;

    fn try_from(delete_query: metastore::DeleteQuery) -> anyhow::Result<Self> {
        Ok(Self {
            index_id_patterns: vec![delete_query.index_uid().index_id.to_string()],
            query_ast: delete_query.query_ast,
            start_timestamp: delete_query.start_timestamp,
            end_timestamp: delete_query.end_timestamp,
            ..Default::default()
        })
    }
}

/// `MutMetadataMap` used to extract [`tonic::metadata::MetadataMap`] from a request.
pub struct MutMetadataMap<'a>(&'a mut tonic::metadata::MetadataMap);

impl Injector for MutMetadataMap<'_> {
    /// Sets a key-value pair in the [`MetadataMap`]. No-op if the key or value is invalid.
    fn set(&mut self, key: &str, value: String) {
        if let Ok(metadata_key) = tonic::metadata::MetadataKey::from_bytes(key.as_bytes())
            && let Ok(metadata_value) = tonic::metadata::MetadataValue::try_from(&value)
        {
            self.0.insert(metadata_key, metadata_value);
        }
    }
}

impl Extractor for MutMetadataMap<'_> {
    /// Gets a value for a key from the MetadataMap.  If the value can't be converted to &str,
    /// returns None.
    fn get(&self, key: &str) -> Option<&str> {
        self.0.get(key).and_then(|metadata| metadata.to_str().ok())
    }

    /// Collect all the keys from the MetadataMap.
    fn keys(&self) -> Vec<&str> {
        self.0
            .keys()
            .map(|key| match key {
                tonic::metadata::KeyRef::Ascii(v) => v.as_str(),
                tonic::metadata::KeyRef::Binary(v) => v.as_str(),
            })
            .collect::<Vec<_>>()
    }
}

/// [`tonic::service::interceptor::Interceptor`] which injects the span context into
/// [`tonic::metadata::MetadataMap`].
#[derive(Clone, Debug)]
pub struct SpanContextInterceptor;

impl Interceptor for SpanContextInterceptor {
    fn call(&mut self, mut request: tonic::Request<()>) -> Result<tonic::Request<()>, Status> {
        global::get_text_map_propagator(|propagator| {
            propagator.inject_context(
                &tracing::Span::current().context(),
                &mut MutMetadataMap(request.metadata_mut()),
            )
        });
        Ok(request)
    }
}

/// `MetadataMap` extracts OpenTelemetry
/// tracing keys from request's headers.
struct MetadataMap<'a>(&'a tonic::metadata::MetadataMap);

impl Extractor for MetadataMap<'_> {
    /// Gets a value for a key from the MetadataMap.  If the value can't be converted to &str,
    /// returns None.
    fn get(&self, key: &str) -> Option<&str> {
        self.0.get(key).and_then(|metadata| metadata.to_str().ok())
    }

    /// Collect all the keys from the MetadataMap.
    fn keys(&self) -> Vec<&str> {
        self.0
            .keys()
            .map(|key| match key {
                tonic::metadata::KeyRef::Ascii(v) => v.as_str(),
                tonic::metadata::KeyRef::Binary(v) => v.as_str(),
            })
            .collect::<Vec<_>>()
    }
}

/// Sets parent span context derived from [`tonic::metadata::MetadataMap`].
pub fn set_parent_span_from_request_metadata(request_metadata: &tonic::metadata::MetadataMap) {
    let parent_cx =
        global::get_text_map_propagator(|prop| prop.extract(&MetadataMap(request_metadata)));
    let _ = Span::current().set_parent(parent_cx);
}

impl search::SortOrder {
    #[inline(always)]
    pub fn compare_opt<T: Ord>(&self, this: &Option<T>, other: &Option<T>) -> Ordering {
        match (this, other) {
            (Some(this), Some(other)) => self.compare(this, other),
            (Some(_), None) => Ordering::Greater,
            (None, Some(_)) => Ordering::Less,
            (None, None) => Ordering::Equal,
        }
    }

    pub fn compare<T: Ord>(&self, this: &T, other: &T) -> Ordering {
        if self == &search::SortOrder::Desc {
            this.cmp(other)
        } else {
            other.cmp(this)
        }
    }
}

impl quickwit_common::pubsub::Event for ReportSplitsRequest {}

/// Shard update_timestamp to use when reading file metastores <v0.9
pub fn compatibility_shard_update_timestamp() -> i64 {
    // We prefer a fix value here because it makes backward compatibility tests
    // simpler. Very few users use the shard API in versions <0.9 anyway.
    1704067200 // 2024-00-00T00:00:00Z
}


================================================
FILE: quickwit/quickwit-proto/src/metastore/events.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

// use quickwit_common::pubsub::Event;

use quickwit_common::pubsub::Event;

use super::{
    AddSourceRequest, CreateIndexRequest, DeleteIndexRequest, DeleteSourceRequest, SourceType,
    ToggleSourceRequest,
};
use crate::types::{IndexUid, SourceId};

/// Delete index event.
#[derive(Debug, Clone, Eq, PartialEq)]
pub struct DeleteIndexEvent {
    /// Index ID of the deleted index.
    pub index_uid: IndexUid,
}

/// Add source event.
#[derive(Debug, Clone, Eq, PartialEq)]
pub struct AddSourceEvent {
    /// The ID of the index to which the source belongs.
    pub index_uid: IndexUid,
    /// The source ID.
    pub source_id: SourceId,
    /// The source type.
    pub source_type: SourceType,
}

/// Toggle source events.
#[derive(Debug, Clone, Eq, PartialEq)]
pub struct ToggleSourceEvent {
    /// Index ID of the toggled source.
    pub index_uid: IndexUid,
    /// Source ID of the toggled source.
    pub source_id: SourceId,
    /// Whether the source is enabled.
    pub enabled: bool,
}

/// Delete source event.
#[derive(Debug, Clone, Eq, PartialEq)]
pub struct DeleteSourceEvent {
    /// Index ID of the deleted source.
    pub index_uid: IndexUid,
    /// Source ID of the deleted source.
    pub source_id: SourceId,
}

impl Event for AddSourceRequest {}
impl Event for CreateIndexRequest {}
impl Event for DeleteIndexRequest {}
impl Event for DeleteSourceRequest {}
impl Event for ToggleSourceRequest {}


================================================
FILE: quickwit/quickwit-proto/src/metastore/mod.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::fmt;

use quickwit_common::rate_limited_error;
use quickwit_common::retry::Retryable;
use quickwit_common::tower::{MakeLoadShedError, TimeoutExceeded};
use serde::{Deserialize, Serialize};

use crate::types::{IndexId, IndexUid, QueueId, SourceId, SplitId};
use crate::{GrpcServiceError, ServiceError, ServiceErrorCode};

pub mod events;

include!("../codegen/quickwit/quickwit.metastore.rs");

pub const METASTORE_FILE_DESCRIPTOR_SET: &[u8] =
    include_bytes!("../codegen/quickwit/metastore_descriptor.bin");

pub type MetastoreResult<T> = Result<T, MetastoreError>;

/// Lists the object types stored and managed by the metastore.
#[derive(Debug, Clone, Eq, PartialEq, Serialize, Deserialize)]
#[serde(rename_all = "snake_case")]
pub enum EntityKind {
    /// A checkpoint delta.
    CheckpointDelta {
        /// Index ID.
        index_id: IndexId,
        /// Source ID.
        source_id: SourceId,
    },
    /// An index.
    Index {
        /// Index ID.
        index_id: IndexId,
    },
    /// A set of indexes.
    Indexes {
        /// Index IDs.
        index_ids: Vec<IndexId>,
    },
    /// A source.
    Source {
        /// Index ID.
        index_id: IndexId,
        /// Source ID.
        source_id: SourceId,
    },
    /// A shard.
    Shard {
        /// Shard queue ID: <index_uid>/<source_id>/<shard_id>
        queue_id: QueueId,
    },
    /// A split.
    Split {
        /// Split ID.
        split_id: SplitId,
    },
    /// A set of splits.
    Splits {
        /// Split IDs.
        split_ids: Vec<String>,
    },
    /// An index template.
    IndexTemplate {
        /// Index template ID.
        template_id: String,
    },
}

impl fmt::Display for EntityKind {
    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
        match self {
            EntityKind::CheckpointDelta {
                index_id,
                source_id,
            } => write!(f, "checkpoint delta `{index_id}/{source_id}`"),
            EntityKind::Index { index_id } => write!(f, "index `{index_id}`"),
            EntityKind::Indexes { index_ids } => write!(f, "indexes `{}`", index_ids.join(", ")),
            EntityKind::Shard { queue_id } => write!(f, "shard `{queue_id}`"),
            EntityKind::Source {
                index_id,
                source_id,
            } => write!(f, "source `{index_id}/{source_id}`"),
            EntityKind::Split { split_id } => write!(f, "split `{split_id}`"),
            EntityKind::Splits { split_ids } => write!(f, "splits `{}`", split_ids.join(", ")),
            EntityKind::IndexTemplate { template_id } => {
                write!(f, "index template `{template_id}`")
            }
        }
    }
}

#[derive(Debug, Clone, thiserror::Error, Eq, PartialEq, Serialize, Deserialize)]
pub enum MetastoreError {
    #[error("{0} already exist(s)")]
    AlreadyExists(EntityKind),

    #[error("connection error: {message}")]
    Connection { message: String },

    #[error("database error: {message}")]
    Db { message: String },

    #[error("precondition failed for {entity}: {message}")]
    FailedPrecondition { entity: EntityKind, message: String },

    #[error("access forbidden: {message}")]
    Forbidden { message: String },

    #[error("internal error: {message}; cause: `{cause}`")]
    Internal { message: String, cause: String },

    #[error("invalid argument: {message}")]
    InvalidArgument { message: String },

    #[error("IO error: {message}")]
    Io { message: String },

    #[error("failed to deserialize `{struct_name}` from JSON: {message}")]
    JsonDeserializeError {
        struct_name: String,
        message: String,
    },

    #[error("failed to serialize `{struct_name}` to JSON: {message}")]
    JsonSerializeError {
        struct_name: String,
        message: String,
    },

    #[error("{0} not found")]
    NotFound(EntityKind),

    #[error("request timed out: {0}")]
    Timeout(String),

    #[error("too many requests")]
    TooManyRequests,

    #[error("service unavailable: {0}")]
    Unavailable(String),
}

impl MetastoreError {
    /// Returns `true` if the transaction that emitted this error is "certainly abort".
    /// Returns `false` if we cannot know whether the transaction was successful or not.
    pub fn is_transaction_certainly_aborted(&self) -> bool {
        match self {
            MetastoreError::AlreadyExists(_)
            | MetastoreError::FailedPrecondition { .. }
            | MetastoreError::Forbidden { .. }
            | MetastoreError::InvalidArgument { .. }
            | MetastoreError::JsonDeserializeError { .. }
            | MetastoreError::JsonSerializeError { .. }
            | MetastoreError::NotFound(_)
            | MetastoreError::TooManyRequests => true,
            MetastoreError::Connection { .. }
            | MetastoreError::Db { .. }
            | MetastoreError::Internal { .. }
            | MetastoreError::Io { .. }
            | MetastoreError::Timeout { .. }
            | MetastoreError::Unavailable(_) => false,
        }
    }
}

#[cfg(feature = "postgres")]
impl From<sqlx::Error> for MetastoreError {
    fn from(error: sqlx::Error) -> Self {
        MetastoreError::Db {
            message: error.to_string(),
        }
    }
}

impl From<TimeoutExceeded> for MetastoreError {
    fn from(_: TimeoutExceeded) -> Self {
        MetastoreError::Timeout("client".to_string())
    }
}

impl ServiceError for MetastoreError {
    fn error_code(&self) -> ServiceErrorCode {
        match self {
            Self::AlreadyExists(_) => ServiceErrorCode::AlreadyExists,
            Self::Connection { message } => {
                rate_limited_error!(
                    limit_per_min = 6,
                    "metastore/connection internal error: {message}"
                );
                ServiceErrorCode::Internal
            }
            Self::Db { message } => {
                rate_limited_error!(limit_per_min = 6, "metastore/db internal error: {message}");
                ServiceErrorCode::Internal
            }
            Self::FailedPrecondition { .. } => ServiceErrorCode::BadRequest,
            Self::Forbidden { .. } => ServiceErrorCode::Forbidden,
            Self::Internal { message, cause } => {
                rate_limited_error!(
                    limit_per_min = 6,
                    "metastore internal error: {message} cause: {cause}"
                );
                ServiceErrorCode::Internal
            }
            Self::InvalidArgument { .. } => ServiceErrorCode::BadRequest,
            Self::Io { message } => {
                rate_limited_error!(limit_per_min = 6, "metastore/io internal error: {message}");
                ServiceErrorCode::Internal
            }
            Self::JsonDeserializeError {
                struct_name,
                message,
            } => {
                rate_limited_error!(
                    limit_per_min = 6,
                    "metastore/jsondeser internal error: [{struct_name}] {message}"
                );
                ServiceErrorCode::Internal
            }
            Self::JsonSerializeError {
                struct_name,
                message,
            } => {
                rate_limited_error!(
                    limit_per_min = 6,
                    "metastore/jsonser internal error: [{struct_name}]  {message}"
                );
                ServiceErrorCode::Internal
            }
            Self::NotFound(_) => ServiceErrorCode::NotFound,
            Self::Timeout(_) => ServiceErrorCode::Timeout,
            Self::TooManyRequests => ServiceErrorCode::TooManyRequests,
            Self::Unavailable(_) => ServiceErrorCode::Unavailable,
        }
    }
}

impl GrpcServiceError for MetastoreError {
    fn new_internal(message: String) -> Self {
        quickwit_common::rate_limited_error!(limit_per_min=6, message=%message.as_str(), "metastore error: internal");
        Self::Internal {
            message,
            cause: "".to_string(),
        }
    }

    fn new_timeout(message: String) -> Self {
        quickwit_common::rate_limited_error!(limit_per_min=6, message=%message.as_str(), "metastore error: timeout");
        Self::Timeout(message)
    }

    fn new_too_many_requests() -> Self {
        quickwit_common::rate_limited_error!(
            limit_per_min = 6,
            "metastore error: too many requests"
        );
        Self::TooManyRequests
    }

    fn new_unavailable(message: String) -> Self {
        quickwit_common::rate_limited_error!(limit_per_min=6, message=%message.as_str(), "metastore error: unavailable metastore");
        Self::Unavailable(message)
    }
}

impl Retryable for MetastoreError {
    fn is_retryable(&self) -> bool {
        matches!(
            self,
            Self::Connection { .. }
                | Self::Db { .. }
                | Self::Internal { .. }
                | Self::Io { .. }
                | Self::Timeout(_)
                | Self::Unavailable(_)
        )
    }
}

impl MakeLoadShedError for MetastoreError {
    fn make_load_shed_error() -> Self {
        MetastoreError::TooManyRequests
    }
}

impl SourceType {
    pub fn as_str(&self) -> &'static str {
        match self {
            SourceType::Cli => "ingest-cli",
            SourceType::File => "file",
            SourceType::IngestV1 => "ingest-api",
            SourceType::IngestV2 => "ingest",
            SourceType::Kafka => "kafka",
            SourceType::Kinesis => "kinesis",
            SourceType::Nats => "nats",
            SourceType::PubSub => "pubsub",
            SourceType::Pulsar => "pulsar",
            SourceType::Stdin => "stdin",
            SourceType::Unspecified => "unspecified",
            SourceType::Vec => "vec",
            SourceType::Void => "void",
        }
    }
}

impl fmt::Display for SourceType {
    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
        let source_type_str = match self {
            SourceType::Cli => "CLI ingest",
            SourceType::File => "file",
            SourceType::IngestV1 => "ingest API v1",
            SourceType::IngestV2 => "ingest API v2",
            SourceType::Kafka => "Apache Kafka",
            SourceType::Kinesis => "Amazon Kinesis",
            SourceType::Nats => "NATS",
            SourceType::PubSub => "Google Cloud Pub/Sub",
            SourceType::Pulsar => "Apache Pulsar",
            SourceType::Stdin => "Stdin",
            SourceType::Unspecified => "unspecified",
            SourceType::Vec => "vec",
            SourceType::Void => "void",
        };
        write!(f, "{source_type_str}")
    }
}

impl IndexMetadataRequest {
    pub fn into_index_id(self) -> Option<IndexId> {
        self.index_uid
            .map(|index_uid| index_uid.index_id)
            .or(self.index_id)
    }

    pub fn for_index_id(index_id: IndexId) -> Self {
        Self {
            index_uid: None,
            index_id: Some(index_id),
        }
    }

    pub fn for_index_uid(index_uid: IndexUid) -> Self {
        Self {
            index_uid: Some(index_uid),
            index_id: None,
        }
    }
}

impl MarkSplitsForDeletionRequest {
    pub fn new(index_uid: IndexUid, split_ids: Vec<String>) -> Self {
        Self {
            index_uid: index_uid.into(),
            split_ids,
        }
    }
}

impl LastDeleteOpstampResponse {
    pub fn new(last_delete_opstamp: u64) -> Self {
        Self {
            last_delete_opstamp,
        }
    }
}

impl ListDeleteTasksRequest {
    pub fn new(index_uid: IndexUid, opstamp_start: u64) -> Self {
        Self {
            index_uid: index_uid.into(),
            opstamp_start,
        }
    }
}

impl SplitStats {
    pub fn add_split(&mut self, size_bytes: u64) {
        self.num_splits += 1;
        self.total_size_bytes += size_bytes;
    }
}

pub mod serde_utils {
    use serde::de::DeserializeOwned;
    use serde::{Deserialize, Serialize};
    use serde_json::Value as JsonValue;

    use super::{MetastoreError, MetastoreResult};

    pub fn from_json_bytes<'de, T: Deserialize<'de>>(value_bytes: &'de [u8]) -> MetastoreResult<T> {
        serde_json::from_slice(value_bytes).map_err(|error| MetastoreError::JsonDeserializeError {
            struct_name: std::any::type_name::<T>().to_string(),
            message: error.to_string(),
        })
    }

    pub fn from_json_zstd<T: DeserializeOwned>(value_bytes: &[u8]) -> MetastoreResult<T> {
        let value_json = zstd::decode_all(value_bytes).map_err(|error| {
            MetastoreError::JsonDeserializeError {
                struct_name: std::any::type_name::<T>().to_string(),
                message: error.to_string(),
            }
        })?;
        serde_json::from_slice(&value_json).map_err(|error| MetastoreError::JsonDeserializeError {
            struct_name: std::any::type_name::<T>().to_string(),
            message: error.to_string(),
        })
    }

    pub fn from_json_str<'de, T: Deserialize<'de>>(value_str: &'de str) -> MetastoreResult<T> {
        serde_json::from_str(value_str).map_err(|error| MetastoreError::JsonDeserializeError {
            struct_name: std::any::type_name::<T>().to_string(),
            message: error.to_string(),
        })
    }

    pub fn from_json_value<T: DeserializeOwned>(value: JsonValue) -> MetastoreResult<T> {
        serde_json::from_value(value).map_err(|error| MetastoreError::JsonDeserializeError {
            struct_name: std::any::type_name::<T>().to_string(),
            message: error.to_string(),
        })
    }

    pub fn to_json_str<T: Serialize>(value: &T) -> Result<String, MetastoreError> {
        serde_json::to_string(value).map_err(|error| MetastoreError::JsonSerializeError {
            struct_name: std::any::type_name::<T>().to_string(),
            message: error.to_string(),
        })
    }

    pub fn to_json_bytes<T: Serialize>(value: &T) -> Result<Vec<u8>, MetastoreError> {
        serde_json::to_vec(value).map_err(|error| MetastoreError::JsonSerializeError {
            struct_name: std::any::type_name::<T>().to_string(),
            message: error.to_string(),
        })
    }

    pub fn to_json_zstd<T: Serialize>(
        value: &T,
        compression_level: i32,
    ) -> Result<Vec<u8>, MetastoreError> {
        let value_json =
            serde_json::to_vec(value).map_err(|error| MetastoreError::JsonSerializeError {
                struct_name: std::any::type_name::<T>().to_string(),
                message: error.to_string(),
            })?;
        zstd::encode_all(value_json.as_slice(), compression_level).map_err(|error| {
            MetastoreError::JsonSerializeError {
                struct_name: std::any::type_name::<T>().to_string(),
                message: error.to_string(),
            }
        })
    }

    pub fn to_json_bytes_pretty<T: Serialize>(value: &T) -> Result<Vec<u8>, MetastoreError> {
        serde_json::to_vec_pretty(value).map_err(|error| MetastoreError::JsonSerializeError {
            struct_name: std::any::type_name::<T>().to_string(),
            message: error.to_string(),
        })
    }
}

impl ListIndexesMetadataRequest {
    pub fn all() -> ListIndexesMetadataRequest {
        ListIndexesMetadataRequest {
            index_id_patterns: vec!["*".to_string()],
        }
    }
}


================================================
FILE: quickwit/quickwit-proto/src/search/mod.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

mod span_id;
mod trace_id;

use std::cmp::Ordering;
use std::fmt;
use std::io::{self, Read};

use prost::Message;
pub use sort_by_value::SortValue;
pub use span_id::{SpanId, TryFromSpanIdError};
pub use trace_id::{TraceId, TryFromTraceIdError};

include!("../codegen/quickwit/quickwit.search.rs");

pub const SEARCH_FILE_DESCRIPTOR_SET: &[u8] =
    include_bytes!("../codegen/quickwit/search_descriptor.bin");

impl SearchRequest {
    pub fn time_range(&self) -> impl std::ops::RangeBounds<i64> {
        use std::ops::Bound;
        (
            self.start_timestamp
                .map_or(Bound::Unbounded, Bound::Included),
            self.end_timestamp.map_or(Bound::Unbounded, Bound::Excluded),
        )
    }
}

impl SplitIdAndFooterOffsets {
    pub fn time_range(&self) -> impl std::ops::RangeBounds<i64> {
        use std::ops::Bound;
        (
            self.timestamp_start
                .map_or(Bound::Unbounded, Bound::Included),
            self.timestamp_end.map_or(Bound::Unbounded, Bound::Included),
        )
    }
}

impl fmt::Display for SplitSearchError {
    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
        write!(f, "({}, split_id: {})", self.error, self.split_id)
    }
}

impl Eq for SortByValue {}

impl From<SortValue> for SortByValue {
    fn from(sort_value: SortValue) -> Self {
        SortByValue {
            sort_value: Some(sort_value),
        }
    }
}

impl std::hash::Hash for SortByValue {
    fn hash<H: std::hash::Hasher>(&self, state: &mut H) {
        self.sort_value.hash(state);
    }
}

impl SortByValue {
    pub fn into_json(self) -> serde_json::Value {
        use serde_json::Value::*;
        match self.sort_value {
            Some(SortValue::U64(num)) => Number(num.into()),
            Some(SortValue::I64(num)) => Number(num.into()),
            Some(SortValue::F64(num)) => {
                if let Some(num) = serde_json::Number::from_f64(num) {
                    Number(num)
                } else {
                    // TODO is there a better way to handle infinite/nan?
                    Null
                }
            }
            Some(SortValue::Boolean(b)) => Bool(b),
            None => Null,
        }
    }

    pub fn try_from_json(value: serde_json::Value) -> Option<Self> {
        use serde_json::Value::*;
        let sort_value = match value {
            Null => None,
            Bool(b) => Some(SortValue::Boolean(b)),
            Number(number) => {
                if let Some(number) = number.as_u64() {
                    Some(SortValue::U64(number))
                } else if let Some(number) = number.as_i64() {
                    Some(SortValue::I64(number))
                } else if let Some(number) = number.as_f64() {
                    Some(SortValue::F64(number))
                } else {
                    // this should never happen as we don't emit such number ourselves
                    return None;
                }
            }
            // Strings that can be converted to a number are accepted.
            // Some clients (like JS clients) can't easily handle large integers
            // without losing precision, so we accept them as strings.
            String(value) => {
                if let Ok(number) = value.parse::<i64>() {
                    Some(SortValue::I64(number))
                } else if let Ok(number) = value.parse::<u64>() {
                    Some(SortValue::U64(number))
                } else {
                    return None;
                }
            }
            Array(_) | Object(_) => return None,
        };
        Some(SortByValue { sort_value })
    }
}

// !!! Disclaimer !!!
//
// Prost imposes the PartialEq derived implementation.
// This is terrible because this means Eq, PartialEq are not really in line with Ord's
// implementation. if in presence of NaN.
impl Eq for SortValue {}

impl Ord for SortValue {
    #[inline]
    fn cmp(&self, other: &Self) -> Ordering {
        // We make sure to end up with a total order.
        match (*self, *other) {
            // Same types.
            (SortValue::U64(left), SortValue::U64(right)) => left.cmp(&right),
            (SortValue::I64(left), SortValue::I64(right)) => left.cmp(&right),
            (SortValue::Boolean(left), SortValue::Boolean(right)) => left.cmp(&right),
            // We half the logic by making sure we keep
            // the "stronger" type on the left.
            (SortValue::U64(left), SortValue::I64(right)) => {
                if left > i64::MAX as u64 {
                    return Ordering::Greater;
                }
                (left as i64).cmp(&right)
            }
            (SortValue::F64(left), SortValue::F64(right)) => left.total_cmp(&right),
            (SortValue::F64(left), SortValue::U64(right)) => left.total_cmp(&(right as f64)),
            (SortValue::F64(left), SortValue::I64(right)) => left.total_cmp(&(right as f64)),
            (SortValue::Boolean(left), right) => SortValue::U64(left as u64).cmp(&right),
            (left, right) => right.cmp(&left).reverse(),
        }
    }
}

impl PartialOrd for SortValue {
    fn partial_cmp(&self, other: &Self) -> Option<Ordering> {
        Some(self.cmp(other))
    }
}

impl std::hash::Hash for SortValue {
    fn hash<H: std::hash::Hasher>(&self, state: &mut H) {
        let this = self.normalize();
        std::mem::discriminant(&this).hash(state);
        match this {
            SortValue::U64(number) => {
                number.hash(state);
            }
            SortValue::I64(number) => {
                number.hash(state);
            }
            SortValue::F64(number) => {
                number.to_bits().hash(state);
            }
            SortValue::Boolean(b) => {
                b.hash(state);
            }
        }
    }
}

impl SortValue {
    /// Where multiple variant could represent the same logical value, convert to a canonical form.
    ///
    /// For number, we prefer to represent them, in order, as i64, then as u64 and finally as f64.
    pub fn normalize(&self) -> Self {
        match self {
            SortValue::I64(_) => *self,
            SortValue::Boolean(_) => *self,
            SortValue::U64(number) => {
                if let Ok(number) = (*number).try_into() {
                    SortValue::I64(number)
                } else {
                    *self
                }
            }
            SortValue::F64(number) => {
                let number = *number;
                if number.ceil() == number {
                    // number is not NaN, and is a natural number
                    if number >= i64::MIN as f64 && number <= i64::MAX as f64 {
                        return SortValue::I64(number as i64);
                    } else if number.is_sign_positive() && number <= u64::MAX as f64 {
                        return SortValue::U64(number as u64);
                    }
                }
                *self
            }
        }
    }
}

impl PartialHit {
    /// Helper to get access to the 1st sort value
    pub fn sort_value(&self) -> Option<SortValue> {
        if let Some(sort_value) = self.sort_value {
            sort_value.sort_value
        } else {
            None
        }
    }
}

/// Serializes the Split fields.
///
/// `fields_metadata` has to be sorted.
pub fn serialize_split_fields(list_fields: ListFields) -> Vec<u8> {
    let payload = list_fields.encode_to_vec();
    let compression_level = 3;
    let payload_compressed = zstd::stream::encode_all(&mut &payload[..], compression_level)
        .expect("zstd encoding failed");
    let mut out = Vec::new();
    // Write Header -- Format Version 2
    let format_version = 2u8;
    out.push(format_version);
    // Write Payload
    out.extend_from_slice(&payload_compressed);
    out
}

/// Reads a fixed number of bytes into an array and returns the array.
fn read_exact_array<const N: usize>(reader: &mut impl Read) -> io::Result<[u8; N]> {
    let mut buffer = [0u8; N];
    reader.read_exact(&mut buffer)?;
    Ok(buffer)
}

/// Reads the Split fields from a zstd compressed stream of bytes
pub fn deserialize_split_fields<R: Read>(mut reader: R) -> io::Result<ListFields> {
    let format_version = read_exact_array::<1>(&mut reader)?[0];
    if format_version != 2 {
        return Err(io::Error::new(
            io::ErrorKind::InvalidData,
            format!("Unsupported split field format version: {format_version}"),
        ));
    }
    let reader = zstd::Decoder::new(reader)?;
    read_split_fields_from_zstd(reader)
}

/// Reads the Split fields from a stream of bytes
#[allow(clippy::unbuffered_bytes)]
fn read_split_fields_from_zstd<R: Read>(reader: R) -> io::Result<ListFields> {
    let all_bytes: Vec<_> = reader.bytes().collect::<io::Result<_>>()?;
    let serialized_list_fields: ListFields = prost::Message::decode(&all_bytes[..])?;

    Ok(serialized_list_fields)
}


================================================
FILE: quickwit/quickwit-proto/src/search/span_id.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use serde::{Deserialize, Deserializer, Serialize, Serializer, de};

#[derive(Debug, Clone, Copy, Eq, PartialEq, Ord, PartialOrd, Hash)]
pub struct SpanId([u8; 8]);

impl SpanId {
    pub const HEX_LENGTH: usize = 16;

    pub fn new(bytes: [u8; 8]) -> Self {
        Self(bytes)
    }

    pub fn as_bytes(&self) -> &[u8] {
        &self.0
    }

    pub fn to_vec(&self) -> Vec<u8> {
        self.0.to_vec()
    }
}

impl Serialize for SpanId {
    fn serialize<S: Serializer>(&self, serializer: S) -> Result<S::Ok, S::Error> {
        let hexspan_id = hex::encode(self.0);
        serializer.serialize_str(&hexspan_id)
    }
}

impl<'de> Deserialize<'de> for SpanId {
    fn deserialize<D>(deserializer: D) -> Result<Self, D::Error>
    where D: Deserializer<'de> {
        let hexspan_id = String::deserialize(deserializer)?;

        if hexspan_id.len() != SpanId::HEX_LENGTH {
            let message = format!(
                "hex span ID must be {} bytes long, got {}",
                SpanId::HEX_LENGTH,
                hexspan_id.len()
            );
            return Err(de::Error::custom(message));
        }
        let mut span_id = [0u8; 8];
        hex::decode_to_slice(hexspan_id, &mut span_id).map_err(|error| {
            let message = format!("failed to decode hex span ID: {error:?}");
            de::Error::custom(message)
        })?;
        Ok(SpanId(span_id))
    }
}

#[derive(Debug, thiserror::Error)]
#[error("span ID must be 8 bytes long, got {0}")]
pub struct TryFromSpanIdError(usize);

impl TryFrom<&[u8]> for SpanId {
    type Error = TryFromSpanIdError;

    fn try_from(slice: &[u8]) -> Result<Self, Self::Error> {
        let span_id = slice
            .try_into()
            .map_err(|_| TryFromSpanIdError(slice.len()))?;
        Ok(SpanId(span_id))
    }
}

impl TryFrom<Vec<u8>> for SpanId {
    type Error = TryFromSpanIdError;

    fn try_from(vec: Vec<u8>) -> Result<Self, Self::Error> {
        Self::try_from(&vec[..])
    }
}

#[cfg(test)]
mod tests {
    use super::*;

    #[test]
    fn test_span_id_serde() {
        let expected_span_id = SpanId::new([1; 8]);
        let span_id_json = serde_json::to_string(&expected_span_id).unwrap();
        assert_eq!(span_id_json, r#""0101010101010101""#);

        let span_id = serde_json::from_str::<SpanId>(&span_id_json).unwrap();
        assert_eq!(span_id, expected_span_id,);
    }

    #[test]
    fn test_span_id_try_from() {
        let expected_span_id = SpanId::new([1; 8]);
        let span_id = SpanId::try_from([1; 8].as_slice()).unwrap();
        assert_eq!(span_id, expected_span_id);

        let error = SpanId::try_from([1; 9].as_slice()).unwrap_err();
        assert_eq!(error.0, 9);
    }
}


================================================
FILE: quickwit/quickwit-proto/src/search/trace_id.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use serde::{Deserialize, Deserializer, Serialize, Serializer, de};

#[derive(Debug, Clone, Copy, Eq, PartialEq, Ord, PartialOrd, Hash)]
pub struct TraceId([u8; 16]);

impl TraceId {
    pub const HEX_LENGTH: usize = 32;

    pub fn new(bytes: [u8; 16]) -> Self {
        Self(bytes)
    }

    pub fn into_bytes(self) -> [u8; 16] {
        self.0
    }

    pub fn to_vec(&self) -> Vec<u8> {
        self.0.to_vec()
    }

    pub fn hex_display(&self) -> String {
        hex::encode(self.0)
    }
}

impl Serialize for TraceId {
    fn serialize<S: Serializer>(&self, serializer: S) -> Result<S::Ok, S::Error> {
        if serializer.is_human_readable() {
            let hextrace_id = hex::encode(self.0);
            serializer.serialize_str(&hextrace_id)
        } else {
            self.0.serialize(serializer)
        }
    }
}

impl<'de> Deserialize<'de> for TraceId {
    fn deserialize<D>(deserializer: D) -> Result<Self, D::Error>
    where D: Deserializer<'de> {
        if deserializer.is_human_readable() {
            let hextrace_id = String::deserialize(deserializer)?;
            if hextrace_id.len() != TraceId::HEX_LENGTH {
                let message = format!(
                    "hex trace ID must be {} bytes long, got {}",
                    TraceId::HEX_LENGTH,
                    hextrace_id.len()
                );
                return Err(de::Error::custom(message));
            }
            let mut trace_id_bytes = [0u8; 16];
            hex::decode_to_slice(hextrace_id, &mut trace_id_bytes).map_err(|error| {
                let message = format!("failed to decode hex span ID: {error:?}");
                de::Error::custom(message)
            })?;
            Ok(TraceId(trace_id_bytes))
        } else {
            let trace_id_bytes: [u8; 16] = <[u8; 16]>::deserialize(deserializer)?;
            Ok(TraceId(trace_id_bytes))
        }
    }
}

#[derive(Debug, thiserror::Error)]
#[error("trace ID must be 16 bytes long, got {0}")]
pub struct TryFromTraceIdError(usize);

impl TryFrom<&[u8]> for TraceId {
    type Error = TryFromTraceIdError;

    fn try_from(slice: &[u8]) -> Result<Self, Self::Error> {
        let trace_id = slice
            .try_into()
            .map_err(|_| TryFromTraceIdError(slice.len()))?;
        Ok(TraceId(trace_id))
    }
}

impl TryFrom<Vec<u8>> for TraceId {
    type Error = TryFromTraceIdError;

    fn try_from(vec: Vec<u8>) -> Result<Self, Self::Error> {
        Self::try_from(&vec[..])
    }
}

impl From<TryFromTraceIdError> for tonic::Status {
    fn from(error: TryFromTraceIdError) -> Self {
        tonic::Status::invalid_argument(error.to_string())
    }
}

#[cfg(test)]
mod tests {
    use super::*;

    #[test]
    fn test_trace_id_serde() {
        let expected_trace_id = TraceId::new([1; 16]);
        let trace_id_json = serde_json::to_string(&expected_trace_id).unwrap();
        assert_eq!(trace_id_json, r#""01010101010101010101010101010101""#);

        let trace_id = serde_json::from_str::<TraceId>(&trace_id_json).unwrap();
        assert_eq!(trace_id, expected_trace_id,);
    }

    #[test]
    fn test_trace_id_try_from() {
        let expected_trace_id = TraceId::new([1; 16]);
        let trace_id = TraceId::try_from([1; 16].as_slice()).unwrap();
        assert_eq!(trace_id, expected_trace_id);

        let error = TraceId::try_from([1; 17].as_slice()).unwrap_err();
        assert_eq!(error.0, 17);
    }
}


================================================
FILE: quickwit/quickwit-proto/src/types/doc_mapping_uid.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::borrow::Cow;
use std::fmt;
use std::str::FromStr;

use anyhow::Context;
use serde::de::Error;
use serde::{Deserialize, Deserializer, Serialize, Serializer};
pub use ulid::Ulid;

use super::ULID_SIZE;

/// Unique identifier for a document mapping.
#[derive(Clone, Copy, Default, Hash, Eq, PartialEq, Ord, PartialOrd, utoipa::ToSchema)]
pub struct DocMappingUid(Ulid);

impl fmt::Debug for DocMappingUid {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        write!(f, "DocMapping({})", self.0)
    }
}

impl fmt::Display for DocMappingUid {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        self.0.fmt(f)
    }
}

impl From<Ulid> for DocMappingUid {
    fn from(ulid: Ulid) -> Self {
        Self(ulid)
    }
}

impl DocMappingUid {
    /// Creates a new random doc mapping UID.
    pub fn random() -> Self {
        Self(Ulid::new())
    }

    #[cfg(any(test, feature = "testsuite"))]
    pub fn for_test(ulid_u128: u128) -> DocMappingUid {
        Self(Ulid::from(ulid_u128))
    }
}

impl<'de> Deserialize<'de> for DocMappingUid {
    fn deserialize<D>(deserializer: D) -> Result<Self, D::Error>
    where D: Deserializer<'de> {
        let doc_mapping_uid_str: Cow<'de, str> = Cow::deserialize(deserializer)?;
        doc_mapping_uid_str.parse().map_err(D::Error::custom)
    }
}

impl Serialize for DocMappingUid {
    fn serialize<S>(&self, serializer: S) -> Result<S::Ok, S::Error>
    where S: Serializer {
        serializer.collect_str(&self.0)
    }
}

impl prost::Message for DocMappingUid {
    fn encode_raw(&self, buf: &mut impl prost::bytes::BufMut) {
        // TODO: when `bytes::encode` supports `&[u8]`, we can remove this allocation.
        prost::encoding::bytes::encode(1u32, &self.0.to_bytes().to_vec(), buf);
    }

    fn merge_field(
        &mut self,
        tag: u32,
        wire_type: prost::encoding::WireType,
        buf: &mut impl prost::bytes::Buf,
        ctx: prost::encoding::DecodeContext,
    ) -> ::core::result::Result<(), prost::DecodeError> {
        const STRUCT_NAME: &str = "DocMappingUid";

        match tag {
            1u32 => {
                let mut buffer = Vec::with_capacity(ULID_SIZE);

                prost::encoding::bytes::merge(wire_type, &mut buffer, buf, ctx).map_err(
                    |mut error| {
                        error.push(STRUCT_NAME, "doc_mapping_uid");
                        error
                    },
                )?;
                let ulid_bytes: [u8; ULID_SIZE] =
                    buffer.try_into().map_err(|buffer: Vec<u8>| {
                        prost::DecodeError::new(format!(
                            "invalid length for field `doc_mapping_uid`, expected 16 bytes, got {}",
                            buffer.len()
                        ))
                    })?;
                self.0 = Ulid::from_bytes(ulid_bytes);
                Ok(())
            }
            _ => prost::encoding::skip_field(wire_type, tag, buf, ctx),
        }
    }

    #[inline]
    fn encoded_len(&self) -> usize {
        prost::encoding::key_len(1u32)
            + prost::encoding::encoded_len_varint(ULID_SIZE as u64)
            + ULID_SIZE
    }

    fn clear(&mut self) {
        self.0 = Ulid::nil();
    }
}

impl FromStr for DocMappingUid {
    type Err = anyhow::Error;

    fn from_str(doc_mapping_uid_str: &str) -> Result<Self, Self::Err> {
        Ulid::from_string(doc_mapping_uid_str)
            .map(Self)
            .with_context(|| format!("failed to parse doc mapping UID `{doc_mapping_uid_str}`"))
    }
}

#[cfg(feature = "postgres")]
impl TryFrom<String> for DocMappingUid {
    type Error = anyhow::Error;

    fn try_from(doc_mapping_uid_str: String) -> Result<Self, Self::Error> {
        doc_mapping_uid_str.parse()
    }
}

#[cfg(feature = "postgres")]
impl sqlx::Type<sqlx::Postgres> for DocMappingUid {
    fn type_info() -> sqlx::postgres::PgTypeInfo {
        sqlx::postgres::PgTypeInfo::with_name("VARCHAR(26)")
    }
}

#[cfg(feature = "postgres")]
impl sqlx::Encode<'_, sqlx::Postgres> for DocMappingUid {
    fn encode_by_ref(
        &self,
        buf: &mut sqlx::postgres::PgArgumentBuffer,
    ) -> Result<sqlx::encode::IsNull, sqlx::error::BoxDynError> {
        sqlx::Encode::<sqlx::Postgres>::encode(self.0.to_string(), buf)
    }
}

#[cfg(test)]
mod tests {
    use bytes::Bytes;
    use prost::Message;

    use super::*;

    #[test]
    fn test_doc_mapping_uid_json_serde_roundtrip() {
        let doc_mapping_uid = DocMappingUid::default();
        let serialized = serde_json::to_string(&doc_mapping_uid).unwrap();
        assert_eq!(serialized, r#""00000000000000000000000000""#);

        let deserialized: DocMappingUid = serde_json::from_str(&serialized).unwrap();
        assert_eq!(deserialized, doc_mapping_uid);
    }

    #[test]
    fn test_doc_mapping_uid_prost_serde_roundtrip() {
        let doc_mapping_uid = DocMappingUid::random();

        let encoded = doc_mapping_uid.encode_to_vec();
        assert_eq!(
            DocMappingUid::decode(Bytes::from(encoded)).unwrap(),
            doc_mapping_uid
        );

        let encoded = doc_mapping_uid.encode_length_delimited_to_vec();
        assert_eq!(
            DocMappingUid::decode_length_delimited(Bytes::from(encoded)).unwrap(),
            doc_mapping_uid
        );
    }
}


================================================
FILE: quickwit/quickwit-proto/src/types/doc_uid.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::borrow::Cow;
use std::fmt;

use serde::de::Error;
use serde::{Deserialize, Deserializer, Serialize, Serializer};
pub use ulid::Ulid;

use super::ULID_SIZE;

/// A doc UID identifies a document across segments, splits, and indexes.
#[derive(Clone, Copy, Default, Hash, Eq, PartialEq, Ord, PartialOrd)]
pub struct DocUid(Ulid);

impl fmt::Debug for DocUid {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        write!(f, "Doc({})", self.0)
    }
}

impl fmt::Display for DocUid {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        self.0.fmt(f)
    }
}

impl From<Ulid> for DocUid {
    fn from(ulid: Ulid) -> Self {
        Self(ulid)
    }
}

impl DocUid {
    /// Creates a new random doc UID.
    pub fn random() -> Self {
        Self(Ulid::new())
    }

    #[cfg(any(test, feature = "testsuite"))]
    pub fn for_test(ulid_u128: u128) -> DocUid {
        Self(Ulid::from(ulid_u128))
    }
}

impl<'de> Deserialize<'de> for DocUid {
    fn deserialize<D>(deserializer: D) -> Result<Self, D::Error>
    where D: Deserializer<'de> {
        let doc_uid_str: Cow<'de, str> = Cow::deserialize(deserializer)?;
        let doc_uid = Ulid::from_string(&doc_uid_str).map_err(D::Error::custom)?;
        Ok(Self(doc_uid))
    }
}

impl Serialize for DocUid {
    fn serialize<S>(&self, serializer: S) -> Result<S::Ok, S::Error>
    where S: Serializer {
        serializer.collect_str(&self.0)
    }
}

impl prost::Message for DocUid {
    fn encode_raw(&self, buf: &mut impl prost::bytes::BufMut) {
        // TODO: when `bytes::encode` supports `&[u8]`, we can remove this allocation.
        prost::encoding::bytes::encode(1u32, &self.0.to_bytes().to_vec(), buf);
    }

    fn merge_field(
        &mut self,
        tag: u32,
        wire_type: prost::encoding::WireType,
        buf: &mut impl prost::bytes::Buf,
        ctx: prost::encoding::DecodeContext,
    ) -> ::core::result::Result<(), prost::DecodeError> {
        const STRUCT_NAME: &str = "DocUid";

        match tag {
            1u32 => {
                let mut buffer = Vec::with_capacity(ULID_SIZE);

                prost::encoding::bytes::merge(wire_type, &mut buffer, buf, ctx).map_err(
                    |mut error| {
                        error.push(STRUCT_NAME, "doc_uid");
                        error
                    },
                )?;
                let ulid_bytes: [u8; ULID_SIZE] =
                    buffer.try_into().map_err(|buffer: Vec<u8>| {
                        prost::DecodeError::new(format!(
                            "invalid length for field `doc_uid`, expected 16 bytes, got {}",
                            buffer.len()
                        ))
                    })?;
                self.0 = Ulid::from_bytes(ulid_bytes);
                Ok(())
            }
            _ => prost::encoding::skip_field(wire_type, tag, buf, ctx),
        }
    }

    #[inline]
    fn encoded_len(&self) -> usize {
        prost::encoding::key_len(1u32)
            + prost::encoding::encoded_len_varint(ULID_SIZE as u64)
            + ULID_SIZE
    }

    fn clear(&mut self) {
        self.0 = Ulid::nil();
    }
}

/// Generates monotonically increasing doc UIDs. It is not `Clone` nor `Copy` on purpose.
#[derive(Debug)]
pub struct DocUidGenerator {
    next_ulid: Ulid,
}

impl Default for DocUidGenerator {
    fn default() -> Self {
        Self {
            next_ulid: Ulid::new(),
        }
    }
}

impl DocUidGenerator {
    /// Generates a new doc UID.
    #[allow(clippy::unwrap_or_default)]
    pub fn next_doc_uid(&mut self) -> DocUid {
        let doc_uid = DocUid(self.next_ulid);
        // Clippy insists on using `unwrap_or_default`, but that's really not what we want here:
        // https://github.com/rust-lang/rust-clippy/issues/11631
        self.next_ulid = self.next_ulid.increment().unwrap_or_else(Ulid::new);
        doc_uid
    }
}

#[cfg(test)]
mod tests {
    use bytes::Bytes;
    use prost::Message;

    use super::*;

    #[test]
    fn test_doc_uid_json_serde_roundtrip() {
        let doc_uid = DocUid::default();
        let serialized = serde_json::to_string(&doc_uid).unwrap();
        assert_eq!(serialized, r#""00000000000000000000000000""#);

        let deserialized: DocUid = serde_json::from_str(&serialized).unwrap();
        assert_eq!(deserialized, doc_uid);
    }

    #[test]
    fn test_doc_uid_prost_serde_roundtrip() {
        let doc_uid = DocUid::random();

        let encoded = doc_uid.encode_to_vec();
        assert_eq!(DocUid::decode(Bytes::from(encoded)).unwrap(), doc_uid);

        let encoded = doc_uid.encode_length_delimited_to_vec();
        assert_eq!(
            DocUid::decode_length_delimited(Bytes::from(encoded)).unwrap(),
            doc_uid
        );
    }

    #[test]
    fn test_doc_uid_generator() {
        let mut generator = DocUidGenerator::default();
        let doc_uids: Vec<DocUid> = (0..10_000).map(|_| generator.next_doc_uid()).collect();
        assert!(doc_uids.windows(2).all(|window| window[0] < window[1]));
    }
}


================================================
FILE: quickwit/quickwit-proto/src/types/index_uid.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::borrow::Cow;
use std::fmt;
use std::str::FromStr;

use serde::de::Error;
use serde::{Deserialize, Deserializer, Serialize, Serializer};
use thiserror::Error;
pub use ulid::Ulid;

use super::ULID_SIZE;
use crate::types::IndexId;

/// Index identifiers that uniquely identify not only the index, but also
/// its incarnation allowing to distinguish between deleted and recreated indexes.
/// It is represented as a string in index_id:incarnation_id format.
#[derive(Clone, Debug, Default, PartialEq, Eq, Ord, PartialOrd, Hash)]
pub struct IndexUid {
    pub index_id: IndexId,
    pub incarnation_id: Ulid,
}

impl fmt::Display for IndexUid {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        write!(f, "{}:{}", self.index_id, self.incarnation_id)
    }
}

impl IndexUid {
    /// Creates a new index UID from an index ID using a random ULID as incarnation ID.
    pub fn new_with_random_ulid(index_id: &str) -> Self {
        Self::new(index_id, Ulid::new())
    }

    fn new(index_id: &str, incarnation_id: impl Into<Ulid>) -> Self {
        assert!(!index_id.contains(':'), "index ID may not contain `:`");

        Self {
            index_id: index_id.to_string(),
            incarnation_id: incarnation_id.into(),
        }
    }

    #[cfg(any(test, feature = "testsuite"))]
    pub fn for_test(index_id: &str, incarnation_id: u128) -> Self {
        Self {
            index_id: index_id.to_string(),
            incarnation_id: incarnation_id.into(),
        }
    }
}

#[derive(Error, Debug)]
#[error("invalid index UID `{0}`")]
pub struct InvalidIndexUid(String);

impl FromStr for IndexUid {
    type Err = InvalidIndexUid;

    fn from_str(index_uid_str: &str) -> Result<Self, Self::Err> {
        let Some((index_id, incarnation_id_str)) = index_uid_str.split_once(':') else {
            return Err(InvalidIndexUid(index_uid_str.to_string()));
        };
        let incarnation_id = Ulid::from_string(incarnation_id_str)
            .map_err(|_| InvalidIndexUid(index_uid_str.to_string()))?;
        let index_uid = IndexUid {
            index_id: index_id.to_string(),
            incarnation_id,
        };
        Ok(index_uid)
    }
}

impl<'de> Deserialize<'de> for IndexUid {
    fn deserialize<D>(deserializer: D) -> Result<Self, D::Error>
    where D: Deserializer<'de> {
        let index_uid_str: Cow<'de, str> = Cow::deserialize(deserializer)?;
        let index_uid = IndexUid::from_str(&index_uid_str).map_err(D::Error::custom)?;
        Ok(index_uid)
    }
}

impl Serialize for IndexUid {
    fn serialize<S>(&self, serializer: S) -> Result<S::Ok, S::Error>
    where S: Serializer {
        serializer.collect_str(&self)
    }
}

impl prost::Message for IndexUid {
    fn encode_raw(&self, buf: &mut impl prost::bytes::BufMut) {
        if !self.index_id.is_empty() {
            prost::encoding::string::encode(1u32, &self.index_id, buf);
        }
        // TODO: when `bytes::encode` supports `&[u8]`, we can remove this allocation.
        prost::encoding::bytes::encode(2u32, &self.incarnation_id.to_bytes().to_vec(), buf);
    }

    fn merge_field(
        &mut self,
        tag: u32,
        wire_type: prost::encoding::WireType,
        buf: &mut impl prost::bytes::Buf,
        ctx: prost::encoding::DecodeContext,
    ) -> ::core::result::Result<(), prost::DecodeError> {
        const STRUCT_NAME: &str = "IndexUid";

        match tag {
            1u32 => {
                let value = &mut self.index_id;
                prost::encoding::string::merge(wire_type, value, buf, ctx).map_err(|mut error| {
                    error.push(STRUCT_NAME, "index_id");
                    error
                })
            }
            2u32 => {
                let mut buffer = Vec::with_capacity(ULID_SIZE);

                prost::encoding::bytes::merge(wire_type, &mut buffer, buf, ctx).map_err(
                    |mut error| {
                        error.push(STRUCT_NAME, "incarnation_id");
                        error
                    },
                )?;
                let ulid_bytes: [u8; ULID_SIZE] =
                    buffer.try_into().map_err(|buffer: Vec<u8>| {
                        prost::DecodeError::new(format!(
                            "invalid length for field `incarnation_id`, expected 16 bytes, got {}",
                            buffer.len()
                        ))
                    })?;
                self.incarnation_id = Ulid::from_bytes(ulid_bytes);
                Ok(())
            }
            _ => prost::encoding::skip_field(wire_type, tag, buf, ctx),
        }
    }

    #[inline]
    fn encoded_len(&self) -> usize {
        let mut len = 0;

        if !self.index_id.is_empty() {
            len += prost::encoding::string::encoded_len(1u32, &self.index_id);
        }

        len += prost::encoding::key_len(2u32)
            + prost::encoding::encoded_len_varint(ULID_SIZE as u64)
            + ULID_SIZE;
        len
    }

    fn clear(&mut self) {
        self.index_id.clear();
        self.incarnation_id = Ulid::nil();
    }
}

#[cfg(feature = "postgres")]
impl TryFrom<String> for IndexUid {
    type Error = InvalidIndexUid;

    fn try_from(value: String) -> Result<Self, Self::Error> {
        value.parse()
    }
}

#[cfg(feature = "postgres")]
impl sqlx::Type<sqlx::Postgres> for IndexUid {
    fn type_info() -> sqlx::postgres::PgTypeInfo {
        sqlx::postgres::PgTypeInfo::with_name("VARCHAR")
    }
}

#[cfg(feature = "postgres")]
impl sqlx::Encode<'_, sqlx::Postgres> for IndexUid {
    fn encode_by_ref(
        &self,
        buf: &mut sqlx::postgres::PgArgumentBuffer,
    ) -> Result<sqlx::encode::IsNull, sqlx::error::BoxDynError> {
        let _ = sqlx::Encode::<sqlx::Postgres>::encode(&self.index_id, buf)?;
        let _ = sqlx::Encode::<sqlx::Postgres>::encode(":", buf)?;
        sqlx::Encode::<sqlx::Postgres>::encode(self.incarnation_id.to_string(), buf)
    }
}

#[cfg(feature = "postgres")]
impl sqlx::postgres::PgHasArrayType for IndexUid {
    fn array_type_info() -> sqlx::postgres::PgTypeInfo {
        sqlx::postgres::PgTypeInfo::with_name("VARCHAR[]")
    }
}

impl PartialEq<(&'static str, u128)> for IndexUid {
    fn eq(&self, (index_id, incarnation_id): &(&str, u128)) -> bool {
        self.index_id == *index_id && self.incarnation_id == Ulid::from(*incarnation_id)
    }
}

#[cfg(feature = "postgres")]
impl From<IndexUid> for sea_query::Value {
    fn from(index_uid: IndexUid) -> Self {
        index_uid.to_string().into()
    }
}

#[cfg(feature = "postgres")]
impl From<&IndexUid> for sea_query::Value {
    fn from(index_uid: &IndexUid) -> Self {
        index_uid.to_string().into()
    }
}


================================================
FILE: quickwit/quickwit-proto/src/types/mod.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::borrow::Borrow;
use std::convert::Infallible;
use std::fmt;
use std::fmt::{Display, Formatter};
use std::ops::Deref;
use std::str::FromStr;

use serde::{Deserialize, Serialize};
use tracing::error;
pub use ulid::Ulid;

mod doc_mapping_uid;
mod doc_uid;
mod index_uid;
mod pipeline_uid;
mod position;
mod shard_id;

pub use doc_mapping_uid::DocMappingUid;
pub use doc_uid::{DocUid, DocUidGenerator};
pub use index_uid::IndexUid;
pub use pipeline_uid::PipelineUid;
pub use position::Position;
pub use shard_id::ShardId;

/// The size of an ULID in bytes. Use `ULID_LEN` for the length of Base32 encoded ULID strings.
pub(crate) const ULID_SIZE: usize = 16;

pub type IndexId = String;

pub type SourceId = String;

pub type SplitId = String;

pub type SubrequestId = u32;

/// See the file `ingest.proto` for more details.
pub type PublishToken = String;

/// Uniquely identifies a shard and its underlying mrecordlog queue.
pub type QueueId = String; // <index_uid>/<source_id>/<shard_id>

pub fn queue_id(index_uid: &IndexUid, source_id: &str, shard_id: &ShardId) -> QueueId {
    format!("{index_uid}/{source_id}/{shard_id}")
}

pub fn split_queue_id(queue_id: &str) -> Option<(IndexUid, SourceId, ShardId)> {
    let parts_opt = split_queue_id_inner(queue_id);

    if parts_opt.is_none() {
        error!("failed to parse queue ID `{queue_id}`: this should never happen, please report");
    }
    parts_opt
}

fn split_queue_id_inner(queue_id: &str) -> Option<(IndexUid, SourceId, ShardId)> {
    let mut parts = queue_id.split('/');
    let index_uid = parts.next()?;
    let source_id = parts.next()?;
    let shard_id = parts.next()?;
    Some((
        index_uid.parse().ok()?,
        source_id.to_string(),
        ShardId::from(shard_id),
    ))
}

/// It can however appear only once in a given index.
/// In itself, `SourceId` is not unique, but the pair `(IndexUid, SourceId)` is.
#[derive(PartialEq, Eq, Debug, PartialOrd, Ord, Hash, Clone)]
pub struct SourceUid {
    pub index_uid: IndexUid,
    pub source_id: SourceId,
}

impl Display for SourceUid {
    fn fmt(&self, f: &mut Formatter) -> fmt::Result {
        write!(f, "{}:{}", self.index_uid, self.source_id)
    }
}

#[derive(Debug, Clone, PartialEq, Eq, PartialOrd, Ord, Hash, Serialize, Deserialize)]
pub struct NodeId(String);

impl NodeId {
    /// Constructs a new [`NodeId`].
    pub const fn new(node_id: String) -> Self {
        Self(node_id)
    }

    /// Takes ownership of the underlying [`String`], consuming `self`.
    pub fn take(self) -> String {
        self.0
    }
}

impl AsRef<NodeIdRef> for NodeId {
    fn as_ref(&self) -> &NodeIdRef {
        self.deref()
    }
}

impl Borrow<str> for NodeId {
    fn borrow(&self) -> &str {
        &self.0
    }
}

impl Borrow<String> for NodeId {
    fn borrow(&self) -> &String {
        &self.0
    }
}

impl Borrow<NodeIdRef> for NodeId {
    fn borrow(&self) -> &NodeIdRef {
        self.deref()
    }
}

impl Deref for NodeId {
    type Target = NodeIdRef;

    fn deref(&self) -> &Self::Target {
        NodeIdRef::from_str(&self.0)
    }
}

impl Display for NodeId {
    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
        write!(f, "{}", self.0)
    }
}

impl From<&'_ str> for NodeId {
    fn from(node_id: &str) -> Self {
        Self::new(node_id.to_string())
    }
}

impl From<String> for NodeId {
    fn from(node_id: String) -> Self {
        Self::new(node_id)
    }
}

impl From<NodeId> for String {
    fn from(node_id: NodeId) -> Self {
        node_id.0
    }
}

impl From<&'_ NodeIdRef> for NodeId {
    fn from(node_id: &NodeIdRef) -> Self {
        node_id.to_owned()
    }
}

impl FromStr for NodeId {
    type Err = Infallible;

    fn from_str(node_id: &str) -> Result<Self, Self::Err> {
        Ok(NodeId::new(node_id.to_string()))
    }
}

impl PartialEq<&str> for NodeId {
    fn eq(&self, other: &&str) -> bool {
        self.as_str() == *other
    }
}

impl PartialEq<String> for NodeId {
    fn eq(&self, other: &String) -> bool {
        self.as_str() == *other
    }
}

#[repr(transparent)]
#[derive(Debug, PartialEq, Eq, PartialOrd, Ord, Hash)]
pub struct NodeIdRef(str);

impl NodeIdRef {
    /// Transparently reinterprets the string slice as a strongly-typed [`NodeIdRef`].
    pub const fn from_str(node_id: &str) -> &Self {
        let ptr: *const str = node_id;
        // SAFETY: `NodeIdRef` is `#[repr(transparent)]` around a single `str` field, so a `*const
        // str` can be safely reinterpreted as a `*const NodeIdRef`
        unsafe { &*(ptr as *const Self) }
    }

    /// Transparently reinterprets the static string slice as a strongly-typed [`NodeIdRef`].
    pub const fn from_static(node_id: &'static str) -> &'static Self {
        Self::from_str(node_id)
    }

    /// Provides access to the underlying value as a string slice.
    pub const fn as_str(&self) -> &str {
        &self.0
    }
}

impl AsRef<str> for NodeIdRef {
    fn as_ref(&self) -> &str {
        &self.0
    }
}

impl Borrow<str> for NodeIdRef {
    fn borrow(&self) -> &str {
        &self.0
    }
}

impl Display for NodeIdRef {
    fn fmt(&self, f: &mut Formatter) -> fmt::Result {
        write!(f, "{}", &self.0)
    }
}

impl<'a> From<&'a str> for &'a NodeIdRef {
    fn from(node_id: &'a str) -> &'a NodeIdRef {
        NodeIdRef::from_str(node_id)
    }
}

impl PartialEq<NodeIdRef> for NodeId {
    fn eq(&self, other: &NodeIdRef) -> bool {
        self.as_str() == other.as_str()
    }
}

impl PartialEq<&'_ NodeIdRef> for NodeId {
    fn eq(&self, other: &&NodeIdRef) -> bool {
        self.as_str() == other.as_str()
    }
}

impl PartialEq<NodeId> for NodeIdRef {
    fn eq(&self, other: &NodeId) -> bool {
        self.as_str() == other.as_str()
    }
}

impl PartialEq<NodeId> for &'_ NodeIdRef {
    fn eq(&self, other: &NodeId) -> bool {
        self.as_str() == other.as_str()
    }
}

impl PartialEq<NodeId> for String {
    fn eq(&self, other: &NodeId) -> bool {
        self.as_str() == other.as_str()
    }
}

impl ToOwned for NodeIdRef {
    type Owned = NodeId;

    fn to_owned(&self) -> Self::Owned {
        NodeId(self.0.to_string())
    }
}

#[cfg(feature = "postgres")]
impl From<&NodeId> for sea_query::Value {
    fn from(node_id: &NodeId) -> Self {
        node_id.to_string().into()
    }
}

#[cfg(test)]
mod tests {
    use super::*;

    #[test]
    fn test_queue_id() {
        assert_eq!(
            queue_id(
                &IndexUid::for_test("test-index", 0),
                "test-source",
                &ShardId::from(1u64)
            ),
            "test-index:00000000000000000000000000/test-source/00000000000000000001"
        );
    }

    #[test]
    fn test_split_queue_id() {
        let splits = split_queue_id("test-index:00000000000000000000000000");
        assert!(splits.is_none());

        let splits = split_queue_id("test-index:00000000000000000000000000/test-source");
        assert!(splits.is_none());

        let (index_uid, source_id, shard_id) = split_queue_id(
            "test-index:00000000000000000000000000/test-source/00000000000000000001",
        )
        .unwrap();
        assert_eq!(
            &index_uid.to_string(),
            "test-index:00000000000000000000000000"
        );
        assert_eq!(source_id, "test-source");
        assert_eq!(shard_id, ShardId::from(1u64));
    }

    #[test]
    fn test_node_id() {
        let node_id = NodeId::new("test-node".to_string());
        assert_eq!(node_id.as_str(), "test-node");
        assert_eq!(node_id, NodeIdRef::from_str("test-node"));
    }

    #[test]
    fn test_node_serde() {
        #[derive(Debug, PartialEq, Eq, Serialize, Deserialize)]
        struct Node {
            node_id: NodeId,
        }
        let node = Node {
            node_id: NodeId::from("test-node"),
        };
        let serialized = serde_json::to_string(&node).unwrap();
        assert_eq!(serialized, r#"{"node_id":"test-node"}"#);

        let deserialized = serde_json::from_str::<Node>(&serialized).unwrap();
        assert_eq!(deserialized, node);
    }
}


================================================
FILE: quickwit/quickwit-proto/src/types/pipeline_uid.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::borrow::Cow;
use std::fmt;
use std::fmt::{Display, Formatter};
use std::str::FromStr;

use serde::de::Error;
use serde::{Deserialize, Serialize};
use ulid::Ulid;

use super::ULID_SIZE;

/// A pipeline UID identifies an indexing pipeline and an indexing task.
#[derive(Clone, Copy, Default, Hash, Eq, PartialEq, Ord, PartialOrd)]
pub struct PipelineUid(Ulid);

impl fmt::Debug for PipelineUid {
    fn fmt(&self, f: &mut Formatter) -> fmt::Result {
        write!(f, "Pipeline({})", self.0)
    }
}

impl Display for PipelineUid {
    fn fmt(&self, f: &mut Formatter) -> fmt::Result {
        self.0.fmt(f)
    }
}

impl PipelineUid {
    /// Creates a new random pipeline UID.
    pub fn random() -> Self {
        Self(Ulid::new())
    }

    #[cfg(any(test, feature = "testsuite"))]
    pub fn for_test(ulid_u128: u128) -> PipelineUid {
        Self(Ulid::from(ulid_u128))
    }
}

impl FromStr for PipelineUid {
    type Err = &'static str;

    fn from_str(pipeline_uid_str: &str) -> Result<PipelineUid, Self::Err> {
        let pipeline_ulid =
            Ulid::from_string(pipeline_uid_str).map_err(|_| "invalid pipeline UID")?;
        Ok(PipelineUid(pipeline_ulid))
    }
}

impl Serialize for PipelineUid {
    fn serialize<S: serde::Serializer>(&self, serializer: S) -> Result<S::Ok, S::Error> {
        serializer.collect_str(&self.0)
    }
}

impl<'de> Deserialize<'de> for PipelineUid {
    fn deserialize<D: serde::Deserializer<'de>>(deserializer: D) -> Result<Self, D::Error> {
        let ulid_str: Cow<'de, str> = Cow::deserialize(deserializer)?;
        let ulid = Ulid::from_string(&ulid_str).map_err(D::Error::custom)?;
        Ok(Self(ulid))
    }
}

impl prost::Message for PipelineUid {
    fn encode_raw(&self, buf: &mut impl prost::bytes::BufMut) {
        // TODO: when `bytes::encode` supports `&[u8]`, we can remove this allocation.
        prost::encoding::bytes::encode(1u32, &self.0.to_bytes().to_vec(), buf);
    }

    fn merge_field(
        &mut self,
        tag: u32,
        wire_type: prost::encoding::WireType,
        buf: &mut impl prost::bytes::Buf,
        ctx: prost::encoding::DecodeContext,
    ) -> ::core::result::Result<(), prost::DecodeError> {
        const STRUCT_NAME: &str = "PipelineUid";

        match tag {
            1u32 => {
                let mut buffer = Vec::with_capacity(ULID_SIZE);

                prost::encoding::bytes::merge(wire_type, &mut buffer, buf, ctx).map_err(
                    |mut error| {
                        error.push(STRUCT_NAME, "pipeline_uid");
                        error
                    },
                )?;
                let ulid_bytes: [u8; ULID_SIZE] =
                    buffer.try_into().map_err(|buffer: Vec<u8>| {
                        prost::DecodeError::new(format!(
                            "invalid length for field `pipeline_uid`, expected 16 bytes, got {}",
                            buffer.len()
                        ))
                    })?;
                self.0 = Ulid::from_bytes(ulid_bytes);
                Ok(())
            }
            _ => prost::encoding::skip_field(wire_type, tag, buf, ctx),
        }
    }

    #[inline]
    fn encoded_len(&self) -> usize {
        prost::encoding::key_len(1u32)
            + prost::encoding::encoded_len_varint(ULID_SIZE as u64)
            + ULID_SIZE
    }

    fn clear(&mut self) {
        self.0 = Ulid::default();
    }
}

#[cfg(test)]
mod tests {
    use bytes::Bytes;
    use prost::Message;

    use super::*;

    #[test]
    fn test_pipeline_uid_json_serde_roundtrip() {
        let pipeline_uid = PipelineUid::default();
        let serialized = serde_json::to_string(&pipeline_uid).unwrap();
        assert_eq!(serialized, r#""00000000000000000000000000""#);

        let deserialized: PipelineUid = serde_json::from_str(&serialized).unwrap();
        assert_eq!(deserialized, pipeline_uid);
    }

    #[test]
    fn test_pipeline_uid_prost_serde_roundtrip() {
        let pipeline_uid = PipelineUid::random();

        let encoded = pipeline_uid.encode_to_vec();
        assert_eq!(
            PipelineUid::decode(Bytes::from(encoded)).unwrap(),
            pipeline_uid
        );

        let encoded = pipeline_uid.encode_length_delimited_to_vec();
        assert_eq!(
            PipelineUid::decode_length_delimited(Bytes::from(encoded)).unwrap(),
            pipeline_uid
        );
    }
}


================================================
FILE: quickwit/quickwit-proto/src/types/position.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::fmt::{Debug, Display};
use std::{fmt, mem};

use bytes::{Bytes, BytesMut};
use bytestring::ByteString;
use prost::{self, DecodeError};
use quickwit_common::pretty::PrettyDisplay;
use serde::{Deserialize, Serialize};

const BEGINNING: &str = "";

const EOF_PREFIX: &str = "~";

#[derive(Clone, Debug, Default, Eq, PartialEq, Hash, Ord, PartialOrd)]
pub struct Offset(ByteString);

impl Offset {
    pub fn as_str(&self) -> &str {
        &self.0
    }

    pub fn as_i64(&self) -> Option<i64> {
        self.0.parse::<i64>().ok()
    }

    pub fn as_u64(&self) -> Option<u64> {
        self.0.parse::<u64>().ok()
    }

    pub fn as_usize(&self) -> Option<usize> {
        self.0.parse::<usize>().ok()
    }
}

impl fmt::Display for Offset {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        write!(f, "{}", &self.0)
    }
}

impl From<i64> for Offset {
    fn from(offset: i64) -> Self {
        Self(ByteString::from(format!("{offset:0>20}")))
    }
}

impl From<u64> for Offset {
    fn from(offset: u64) -> Self {
        Self(ByteString::from(format!("{offset:0>20}")))
    }
}

impl From<usize> for Offset {
    fn from(offset: usize) -> Self {
        Self(ByteString::from(format!("{offset:0>20}")))
    }
}

impl From<&str> for Offset {
    fn from(offset: &str) -> Self {
        Self(ByteString::from(offset))
    }
}

/// Marks a position within a specific partition/shard of a source.
///
/// The nature of the position depends on the source.
/// Each source must encode it as a `String` in such a way that
/// the lexicographical order matches the natural order of the
/// position.
///
/// For instance, for u64, a 20-left-padded decimal representation
/// can be used. Alternatively, a base64 representation of their
/// big-endian representation can be used.
///
/// The empty string can be used to represent the beginning of the source,
/// if no position makes sense. It can be built via `Position::default()`.
#[derive(Clone, Default, Eq, PartialEq, Hash, Ord, PartialOrd)]
pub enum Position {
    #[default]
    Beginning,
    Offset(Offset),
    /// End of partition/shard at the given offset. `Eof(None)` means no records were ever written.
    Eof(Option<Offset>),
}

impl Debug for Position {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        match self {
            Self::Beginning => write!(f, "Position::Beginning"),
            // The derive implementation would show `Offset(Offset(0000001u64))` here.
            Self::Offset(offset) => write!(f, "Position::Offset({offset})"),
            Self::Eof(Some(offset)) => write!(f, "Position::Eof({offset})"),
            Self::Eof(None) => write!(f, "Position::Eof"),
        }
    }
}

// Caution: This is also the serialization format for chitchat and serde. Modify with care.
impl Display for Position {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        match self {
            Self::Beginning => write!(f, "{BEGINNING}"),
            Self::Offset(offset) => write!(f, "{offset}"),
            Self::Eof(Some(offset)) => write!(f, "{EOF_PREFIX}{offset}"),
            Self::Eof(None) => write!(f, "{EOF_PREFIX}"),
        }
    }
}

struct PositionPrettyDisplay<'a>(&'a Position);

impl fmt::Display for PositionPrettyDisplay<'_> {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        match self.0 {
            Position::Beginning => write!(f, "beginning"),
            Position::Offset(offset) => write!(f, "{offset}"),
            Position::Eof(Some(offset)) => write!(f, "eof({offset})"),
            Position::Eof(None) => write!(f, "eof"),
        }
    }
}

impl PrettyDisplay for Position {
    fn pretty_display(&self) -> impl fmt::Display {
        PositionPrettyDisplay(self)
    }
}

impl Position {
    pub fn offset(offset: impl Into<Offset>) -> Self {
        Self::Offset(offset.into())
    }

    pub fn eof(offset: impl Into<Offset>) -> Self {
        Self::Eof(Some(offset.into()))
    }

    pub fn as_eof(&self) -> Self {
        match self {
            Self::Beginning => Self::Eof(None),
            Self::Offset(offset) => Self::Eof(Some(offset.clone())),
            _ => self.clone(),
        }
    }

    pub fn to_eof(&mut self) {
        match self {
            Self::Beginning => *self = Self::Eof(None),
            Self::Offset(offset) => *self = Self::Eof(Some(mem::take(offset))),
            _ => (),
        }
    }

    pub fn as_i64(&self) -> Option<i64> {
        match self {
            Self::Offset(offset) | Self::Eof(Some(offset)) => offset.as_i64(),
            _ => None,
        }
    }

    pub fn as_u64(&self) -> Option<u64> {
        match self {
            Self::Offset(offset) | Self::Eof(Some(offset)) => offset.as_u64(),
            _ => None,
        }
    }

    pub fn as_usize(&self) -> Option<usize> {
        match self {
            Self::Offset(offset) | Self::Eof(Some(offset)) => offset.as_usize(),
            _ => None,
        }
    }

    pub fn is_beginning(&self) -> bool {
        matches!(self, Self::Beginning)
    }

    pub fn is_eof(&self) -> bool {
        matches!(self, Self::Eof(_))
    }

    fn as_bytes(&self) -> Bytes {
        match self {
            Self::Beginning => Bytes::from_static(BEGINNING.as_bytes()),
            Self::Offset(offset) => offset.0.as_bytes().clone(),
            Self::Eof(Some(offset)) => {
                let mut bytes = BytesMut::with_capacity(EOF_PREFIX.len() + offset.0.len());
                bytes.extend_from_slice(EOF_PREFIX.as_bytes());
                bytes.extend_from_slice(offset.0.as_bytes());
                bytes.freeze()
            }
            Self::Eof(None) => Bytes::from_static(EOF_PREFIX.as_bytes()),
        }
    }
}

impl From<ByteString> for Position {
    fn from(position: ByteString) -> Self {
        match &position[..] {
            BEGINNING => Self::Beginning,
            EOF_PREFIX => Self::Eof(None),
            offset if offset.starts_with(EOF_PREFIX) => {
                let offset = ByteString::from(&offset[EOF_PREFIX.len()..]);
                Self::Eof(Some(Offset(offset)))
            }
            _ => Self::Offset(Offset(position)),
        }
    }
}

impl From<String> for Position {
    fn from(position: String) -> Self {
        Self::from(ByteString::from(position))
    }
}

impl Serialize for Position {
    fn serialize<S: serde::Serializer>(&self, serializer: S) -> Result<S::Ok, S::Error> {
        serializer.collect_str(self)
    }
}

impl<'de> Deserialize<'de> for Position {
    fn deserialize<D: serde::Deserializer<'de>>(deserializer: D) -> Result<Self, D::Error> {
        let position_str = String::deserialize(deserializer)?;
        Ok(Self::from(position_str))
    }
}

impl PartialEq<Position> for &Position {
    #[inline]
    fn eq(&self, other: &Position) -> bool {
        *self == other
    }
}

impl prost::Message for Position {
    fn encode_raw(&self, buf: &mut impl prost::bytes::BufMut) {
        prost::encoding::bytes::encode(1u32, &self.as_bytes(), buf);
    }

    fn merge_field(
        &mut self,
        tag: u32,
        wire_type: prost::encoding::WireType,
        buf: &mut impl prost::bytes::Buf,
        ctx: prost::encoding::DecodeContext,
    ) -> ::core::result::Result<(), prost::DecodeError> {
        const STRUCT_NAME: &str = "Position";

        match tag {
            1u32 => {
                let mut value = Vec::new();
                prost::encoding::bytes::merge(wire_type, &mut value, buf, ctx).map_err(
                    |mut error| {
                        error.push(STRUCT_NAME, "position");
                        error
                    },
                )?;
                let byte_string = ByteString::try_from(value)
                    .map_err(|_| DecodeError::new("position is not valid UTF-8"))?;
                *self = Self::from(byte_string);
                Ok(())
            }
            _ => prost::encoding::skip_field(wire_type, tag, buf, ctx),
        }
    }

    #[inline]
    fn encoded_len(&self) -> usize {
        prost::encoding::bytes::encoded_len(1u32, &self.as_bytes())
    }

    fn clear(&mut self) {
        *self = Self::default();
    }
}

#[cfg(test)]
mod tests {
    use prost::Message;

    use super::*;

    #[test]
    #[allow(clippy::cmp_owned)]
    fn test_position_ord() {
        assert!(Position::Beginning < Position::offset(0u64));
        assert!(Position::Beginning < Position::Eof(None));
        assert!(Position::Beginning < Position::eof(0u64));

        assert!(Position::offset(0u64) < Position::offset(1u64));

        assert!(Position::Eof(None) < Position::eof(0u64));
        assert!(Position::eof(0u64) < Position::eof(1u64));
    }

    #[test]
    fn test_position_as_eof() {
        let eof_position = Position::Beginning.as_eof();

        assert!(eof_position.is_eof());
        assert!(eof_position.as_u64().is_none());

        let eof_position = Position::offset(0u64).as_eof();

        assert!(eof_position.is_eof());
        assert_eq!(eof_position.as_u64().unwrap(), 0u64);
    }

    #[test]
    fn test_position_to_eof() {
        let mut position = Position::Beginning;
        position.to_eof();
        assert!(matches!(position, Position::Eof(None)));

        let mut position = Position::offset(0u64);
        position.to_eof();
        assert!(matches!(position, Position::Eof(Some(offset)) if offset.as_u64().unwrap() == 0));
    }

    #[test]
    fn test_position_json_serde_roundtrip() {
        let serialized = serde_json::to_string(&Position::Beginning).unwrap();
        assert_eq!(serialized, r#""""#);
        let deserialized: Position = serde_json::from_str(&serialized).unwrap();
        assert_eq!(deserialized, Position::Beginning);

        let serialized = serde_json::to_string(&Position::offset(0u64)).unwrap();
        assert_eq!(serialized, r#""00000000000000000000""#);
        let deserialized: Position = serde_json::from_str(&serialized).unwrap();
        assert_eq!(deserialized, Position::offset(0u64));

        let serialized = serde_json::to_string(&Position::Eof(None)).unwrap();
        assert_eq!(serialized, r#""~""#);
        let deserialized: Position = serde_json::from_str(&serialized).unwrap();
        assert_eq!(deserialized, Position::Eof(None));

        let serialized = serde_json::to_string(&Position::eof(0u64)).unwrap();
        assert_eq!(serialized, r#""~00000000000000000000""#);
        let deserialized: Position = serde_json::from_str(&serialized).unwrap();
        assert_eq!(deserialized, Position::eof(0u64));
    }

    #[test]
    fn test_position_prost_serde_roundtrip() {
        let encoded = Position::Beginning.encode_to_vec();
        assert_eq!(
            Position::decode(Bytes::from(encoded)).unwrap(),
            Position::Beginning
        );
        let encoded = Position::Beginning.encode_length_delimited_to_vec();
        assert_eq!(
            Position::decode_length_delimited(Bytes::from(encoded)).unwrap(),
            Position::Beginning
        );

        let encoded = Position::offset(0u64).encode_to_vec();
        assert_eq!(
            Position::decode(Bytes::from(encoded)).unwrap(),
            Position::offset(0u64)
        );
        let encoded = Position::offset(0u64).encode_length_delimited_to_vec();
        assert_eq!(
            Position::decode_length_delimited(Bytes::from(encoded)).unwrap(),
            Position::offset(0u64)
        );

        let encoded = Position::Eof(None).encode_to_vec();
        assert_eq!(
            Position::decode(Bytes::from(encoded)).unwrap(),
            Position::Eof(None)
        );
        let encoded = Position::Eof(None).encode_length_delimited_to_vec();
        assert_eq!(
            Position::decode_length_delimited(Bytes::from(encoded)).unwrap(),
            Position::Eof(None)
        );

        let encoded = Position::eof(0u64).encode_to_vec();
        assert_eq!(
            Position::decode(Bytes::from(encoded)).unwrap(),
            Position::eof(0u64)
        );
        let encoded = Position::eof(0u64).encode_length_delimited_to_vec();
        assert_eq!(
            Position::decode_length_delimited(Bytes::from(encoded)).unwrap(),
            Position::eof(0u64)
        );
    }
}


================================================
FILE: quickwit/quickwit-proto/src/types/shard_id.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::fmt;
use std::fmt::Debug;

use bytestring::ByteString;
use prost::DecodeError;
use serde::{Deserialize, Serialize};
use ulid::Ulid;

/// Shard ID.
/// Shard ID are required to be globally unique.
///
/// In other words, there cannot be two shards belonging to two different sources
/// with the same shard ID.
#[derive(Clone, Debug, Default, Eq, PartialEq, Hash, Ord, PartialOrd)]
pub struct ShardId(ByteString);

impl ShardId {
    pub fn as_str(&self) -> &str {
        &self.0
    }

    pub fn as_u64(&self) -> Option<u64> {
        self.0.parse().ok()
    }
}

impl fmt::Display for ShardId {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        write!(f, "{}", &self.0)
    }
}

impl From<&str> for ShardId {
    fn from(shard_id: &str) -> Self {
        Self(ByteString::from(shard_id))
    }
}

impl From<String> for ShardId {
    fn from(shard_id: String) -> Self {
        Self(ByteString::from(shard_id))
    }
}

impl From<u64> for ShardId {
    fn from(shard_id: u64) -> Self {
        Self(ByteString::from(format!("{shard_id:0>20}")))
    }
}

impl From<Ulid> for ShardId {
    fn from(shard_id: Ulid) -> Self {
        Self(ByteString::from(shard_id.to_string()))
    }
}

impl Serialize for ShardId {
    fn serialize<S: serde::Serializer>(&self, serializer: S) -> Result<S::Ok, S::Error> {
        serializer.collect_str(self)
    }
}

impl<'de> Deserialize<'de> for ShardId {
    fn deserialize<D: serde::Deserializer<'de>>(deserializer: D) -> Result<Self, D::Error> {
        let shard_id = String::deserialize(deserializer)?;
        Ok(Self::from(shard_id))
    }
}

impl prost::Message for ShardId {
    fn encode_raw(&self, buf: &mut impl prost::bytes::BufMut) {
        prost::encoding::bytes::encode(1u32, &self.0.as_bytes().clone(), buf);
    }

    fn merge_field(
        &mut self,
        tag: u32,
        wire_type: prost::encoding::WireType,
        buf: &mut impl prost::bytes::Buf,
        ctx: prost::encoding::DecodeContext,
    ) -> ::core::result::Result<(), prost::DecodeError> {
        const STRUCT_NAME: &str = "ShardId";

        match tag {
            1u32 => {
                let mut value = Vec::new();
                prost::encoding::bytes::merge(wire_type, &mut value, buf, ctx).map_err(
                    |mut error| {
                        error.push(STRUCT_NAME, "position");
                        error
                    },
                )?;
                let byte_string = ByteString::try_from(value)
                    .map_err(|_| DecodeError::new("shard_id is not valid UTF-8"))?;
                *self = Self(byte_string);
                Ok(())
            }
            _ => prost::encoding::skip_field(wire_type, tag, buf, ctx),
        }
    }

    #[inline]
    fn encoded_len(&self) -> usize {
        prost::encoding::bytes::encoded_len(1u32, &self.0.as_bytes().clone())
    }

    fn clear(&mut self) {
        *self = Self::default();
    }
}

impl PartialEq<ShardId> for &ShardId {
    #[inline]
    fn eq(&self, other: &ShardId) -> bool {
        *self == other
    }
}

#[cfg(feature = "postgres")]
impl sqlx::Type<sqlx::Postgres> for ShardId {
    fn type_info() -> sqlx::postgres::PgTypeInfo {
        sqlx::postgres::PgTypeInfo::with_name("VARCHAR")
    }
}

#[cfg(feature = "postgres")]
impl sqlx::Encode<'_, sqlx::Postgres> for ShardId {
    fn encode_by_ref(
        &self,
        buf: &mut sqlx::postgres::PgArgumentBuffer,
    ) -> Result<sqlx::encode::IsNull, sqlx::error::BoxDynError> {
        sqlx::Encode::<sqlx::Postgres>::encode(self.as_str(), buf)
    }
}

#[cfg(feature = "postgres")]
impl sqlx::postgres::PgHasArrayType for ShardId {
    fn array_type_info() -> sqlx::postgres::PgTypeInfo {
        sqlx::postgres::PgTypeInfo::with_name("VARCHAR[]")
    }
}

#[cfg(test)]
mod tests {

    use bytes::Bytes;
    use prost::Message;

    use super::*;

    #[test]
    fn test_shard_id_json_serde_roundtrip() {
        let serialized = serde_json::to_string(&ShardId::from(0)).unwrap();
        assert_eq!(serialized, r#""00000000000000000000""#);
        let deserialized: ShardId = serde_json::from_str(&serialized).unwrap();
        assert_eq!(deserialized, ShardId::from(0));
    }

    #[test]
    fn test_shard_id_prost_serde_roundtrip() {
        let ulid = Ulid::new();
        let encoded = ShardId::from(ulid).encode_to_vec();
        assert_eq!(
            ShardId::decode(Bytes::from(encoded)).unwrap(),
            ShardId::from(ulid)
        );
        let encoded = ShardId::from(ulid).encode_length_delimited_to_vec();
        assert_eq!(
            ShardId::decode_length_delimited(Bytes::from(encoded)).unwrap(),
            ShardId::from(ulid)
        );
    }
}


================================================
FILE: quickwit/quickwit-query/Cargo.toml
================================================
[package]
name = "quickwit-query"
description = "Query DSL definition and parsing"

version.workspace = true
edition.workspace = true
homepage.workspace = true
documentation.workspace = true
repository.workspace = true
authors.workspace = true
license.workspace = true

[dependencies]
anyhow = { workspace = true }
base64 = { workspace = true }
bitpacking = { workspace = true }
hex = { workspace = true }
once_cell = { workspace = true }
regex = { workspace = true }
serde = { workspace = true }
serde_json = { workspace = true }
serde_with = { workspace = true }
tantivy = { workspace = true }
tantivy-fst = { workspace = true }
tracing = { workspace = true }
time = { workspace = true }
thiserror = { workspace = true }
rustc-hash = { workspace = true }

quickwit-common = { workspace = true }
quickwit-datetime = { workspace = true }
quickwit-proto = { workspace = true }

[dev-dependencies]
criterion = { workspace = true }
proptest = { workspace = true }
time = { workspace = true }

quickwit-common = { workspace = true, features = ["testsuite"] }

[[bench]]
name = "tokenizers_bench"
harness = false


================================================
FILE: quickwit/quickwit-query/README.md
================================================
Quickwit

```mermaid
flowchart LR
    EsApiQParam[ES q= query string param] -->|parse user query| QueryAST
    EsQueryDSL[ES query DSL in json body] -->|Parse json| QueryAST
    QuickwitAPI -->|parse user query| QueryAST
    QueryAST -->|apply query to a split| TantivyQuery

```

In quickwit and tantivy, we call XXXQuery every object representing a predicate over a document, hence selecting a subset of documents.

Such objects do not contain information about what to do with the document, for instance, how to sort them, which aggregation to run on them, etc.

The `SearchRequest` object, on the other hand, is the larger object in charge of gathering all of the information of the request, including the user query.

Quickwit uses a `QueryAST` object to represent queries internally.
Regardless of how the query has been supplied (ES-compatible API, quickwit search API,  search stream API), we convert
it to a QueryAST. Because it is schema agnostic, it can be serialized and passed around.

# root / leaf

One confusing thing about the QueryAST is that because we want its construction to not depend on
the docmapper: building the QueryAST should not require interrogating the metastore. It
is built without knowing the default fields of the index.

For this reason, the AST contains a node called `UserInputQuery` that has a bit of special status:
before usage, the AST must parse the content of these nodes and replace them by an AST.

This operation is done on the root search (on which the doc mapper, and hence the default fields are known),
and dispatched to the leaf search.
The root search checks the validity of the search against *against the current DocMapper*.

That way we are able to return an error to the user, if for instance the query includes a range query that does not target a fast field.

The leaf search is applied on splits that may have been produced with a different doc mapper.
Considering our example again, we want users to be able to run range query after they updated their schema.

Reindexing is not option in quickwit, so what will happen is generally speaking a best effort solution.
The range query node of the AST will act as if it was a match nothing node, and the recall will be affected for these
legacy splits.
Generally, this behavior decreases recall, but `MUST NOT` clauses can actually increase recall.

# Elasticsearch compatibility API

The user's request contains information in both the http body and the querystring parameters. These parameters may overlap, in which case the querystring parameter takes priority.

In the body, a user can supply the query using a rich query DSL expressed in JSON format.
```json
{
    "query": { /* ESQueryDSL */}
}
```

When the query is passed as an `ESQueryDSL`, it is simply deserialized into a `QueryAST` object. The `QueryAST is` a one-to-one representation of the user input. It is entirely schema-agnostic.


================================================
FILE: quickwit/quickwit-query/benches/tokenizers_bench.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use criterion::{Criterion, Throughput, black_box, criterion_group, criterion_main};
use quickwit_query::CodeTokenizer;
use tantivy::tokenizer::{RegexTokenizer, TextAnalyzer, Token, TokenStream};

// A random ascii string of length 100 chars.
static CODE_TEXT: &str = r#"
# Camel case variables
firstName = "John"
lastName = "Doe"
ageOfPerson = 30
isEmployed = True

# Snake case variables
first_name = "Jane"
last_name = "Smith"
age_of_person = 25
is_employed = False

# Mixed case variables
fullName = firstName + " " + lastName
isPersonEmployed = isEmployed and is_employed

# Code logic
if isEmployed and is_employed:
    print(f"{firstName} {first_name} is currently employed.")
else:
    print(f"{lastName} {last_name} is not employed at the moment.")

totalAge = ageOfPerson + age_of_person
print(f"The combined age is: {totalAge}")

# Longer word examples
longCamelCaseWord = "LongCamelCase"
longSnakeCaseWord = "long_snake_case"
mixedCaseWord = "ThisIsAMixedCaseWord"
longCamelCaseWord = "LongCamelCase"
longSnakeCaseWord = "long_snake_case"
mixedCaseWord = "ThisIsAMixedCaseWord"

# Words with consecutive uppercase letters
WORDWITHConsecutiveUppercase1 = "1"
WORDWITHCONSECUTIVEUppercase2 = "2"
WORDWITHCONSECUTIVEUPPERCASE2 = "3"
"#;

fn process_tokens(analyzer: &mut TextAnalyzer, text: &str) -> Vec<Token> {
    let mut token_stream = analyzer.token_stream(text);
    let mut tokens: Vec<Token> = Vec::new();
    token_stream.process(&mut |token: &Token| tokens.push(token.clone()));
    tokens
}

pub fn tokenizers_throughput_benchmark(c: &mut Criterion) {
    let mut group = c.benchmark_group("code_tokenizer");
    let mut regex_tokenizer = TextAnalyzer::from(
        RegexTokenizer::new("(\\p{Ll}+|\\p{Lu}\\p{Ll}+|\\p{Lu}+|\\d+)").unwrap(),
    );
    let mut code_tokenizer = TextAnalyzer::from(CodeTokenizer::default());

    group
        .throughput(Throughput::Bytes(CODE_TEXT.len() as u64))
        .bench_with_input("regex-tokenize", CODE_TEXT, |b, text| {
            b.iter(|| process_tokens(&mut regex_tokenizer, black_box(text)));
        });
    group
        .throughput(Throughput::Bytes(CODE_TEXT.len() as u64))
        .bench_with_input("code-tokenize", CODE_TEXT, |b, text| {
            b.iter(|| process_tokens(&mut code_tokenizer, black_box(text)));
        });
}

criterion_group!(
    tokenizers_throughput_benches,
    tokenizers_throughput_benchmark
);
criterion_main!(tokenizers_throughput_benches);


================================================
FILE: quickwit/quickwit-query/src/aggregations.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use rustc_hash::FxHashMap;
use serde::{Deserialize, Serialize};
use tantivy::aggregation::Key as TantivyKey;
use tantivy::aggregation::agg_result::{
    AggregationResult as TantivyAggregationResult, AggregationResults as TantivyAggregationResults,
    BucketEntries as TantivyBucketEntries, BucketEntry as TantivyBucketEntry,
    BucketResult as TantivyBucketResult, MetricResult as TantivyMetricResult,
    RangeBucketEntry as TantivyRangeBucketEntry,
};
use tantivy::aggregation::metric::{
    ExtendedStats, PercentileValues as TantivyPercentileValues, PercentileValuesVecEntry,
    PercentilesMetricResult as TantivyPercentilesMetricResult, SingleMetricResult, Stats,
    TopHitsMetricResult,
};

// hopefully all From in this module are no-ops, otherwise, this is a very sad situation

#[derive(Clone, Debug, Serialize, Deserialize)]
/// The final aggregation result.
pub struct AggregationResults(pub Vec<(String, AggregationResult)>);

impl From<TantivyAggregationResults> for AggregationResults {
    fn from(value: TantivyAggregationResults) -> AggregationResults {
        AggregationResults(value.0.into_iter().map(|(k, v)| (k, v.into())).collect())
    }
}

impl From<AggregationResults> for TantivyAggregationResults {
    fn from(value: AggregationResults) -> TantivyAggregationResults {
        TantivyAggregationResults(value.0.into_iter().map(|(k, v)| (k, v.into())).collect())
    }
}

#[derive(Clone, Debug, Serialize, Deserialize)]
/// An aggregation is either a bucket or a metric.
pub enum AggregationResult {
    /// Bucket result variant.
    BucketResult(BucketResult),
    /// Metric result variant.
    MetricResult(MetricResult),
}

impl From<TantivyAggregationResult> for AggregationResult {
    fn from(value: TantivyAggregationResult) -> AggregationResult {
        match value {
            TantivyAggregationResult::BucketResult(bucket) => {
                AggregationResult::BucketResult(bucket.into())
            }
            TantivyAggregationResult::MetricResult(metric) => {
                AggregationResult::MetricResult(metric.into())
            }
        }
    }
}

impl From<AggregationResult> for TantivyAggregationResult {
    fn from(value: AggregationResult) -> TantivyAggregationResult {
        match value {
            AggregationResult::BucketResult(bucket) => {
                TantivyAggregationResult::BucketResult(bucket.into())
            }
            AggregationResult::MetricResult(metric) => {
                TantivyAggregationResult::MetricResult(metric.into())
            }
        }
    }
}

#[derive(Clone, Debug, PartialEq, Serialize, Deserialize)]
/// MetricResult
pub enum MetricResult {
    /// Average metric result.
    Average(SingleMetricResult),
    /// Count metric result.
    Count(SingleMetricResult),
    /// Max metric result.
    Max(SingleMetricResult),
    /// Min metric result.
    Min(SingleMetricResult),
    /// Stats metric result.
    Stats(Stats),
    /// ExtendedStats metric result.
    ExtendedStats(Box<ExtendedStats>),
    /// Sum metric result.
    Sum(SingleMetricResult),
    /// Percentiles metric result.
    Percentiles(PercentilesMetricResult),
    /// Top hits metric result
    TopHits(TopHitsMetricResult),
    /// Cardinality metric result
    Cardinality(SingleMetricResult),
}

impl From<TantivyMetricResult> for MetricResult {
    fn from(value: TantivyMetricResult) -> MetricResult {
        match value {
            TantivyMetricResult::Average(val) => MetricResult::Average(val),
            TantivyMetricResult::Count(val) => MetricResult::Count(val),
            TantivyMetricResult::Max(val) => MetricResult::Max(val),
            TantivyMetricResult::Min(val) => MetricResult::Min(val),
            TantivyMetricResult::Stats(val) => MetricResult::Stats(val),
            TantivyMetricResult::ExtendedStats(val) => MetricResult::ExtendedStats(val),
            TantivyMetricResult::Sum(val) => MetricResult::Sum(val),
            TantivyMetricResult::Percentiles(val) => MetricResult::Percentiles(val.into()),
            TantivyMetricResult::TopHits(val) => MetricResult::TopHits(val),
            TantivyMetricResult::Cardinality(val) => MetricResult::Cardinality(val),
        }
    }
}

impl From<MetricResult> for TantivyMetricResult {
    fn from(value: MetricResult) -> TantivyMetricResult {
        match value {
            MetricResult::Average(val) => TantivyMetricResult::Average(val),
            MetricResult::Count(val) => TantivyMetricResult::Count(val),
            MetricResult::Max(val) => TantivyMetricResult::Max(val),
            MetricResult::Min(val) => TantivyMetricResult::Min(val),
            MetricResult::Stats(val) => TantivyMetricResult::Stats(val),
            MetricResult::ExtendedStats(val) => TantivyMetricResult::ExtendedStats(val),
            MetricResult::Sum(val) => TantivyMetricResult::Sum(val),
            MetricResult::Percentiles(val) => TantivyMetricResult::Percentiles(val.into()),
            MetricResult::TopHits(val) => TantivyMetricResult::TopHits(val),
            MetricResult::Cardinality(val) => TantivyMetricResult::Cardinality(val),
        }
    }
}

/// BucketEntry holds bucket aggregation result types.
#[derive(Clone, Debug, Serialize, Deserialize)]
pub enum BucketResult {
    /// This is the range entry for a bucket, which contains a key, count, from, to, and optionally
    /// sub-aggregations.
    Range {
        /// The range buckets sorted by range.
        buckets: BucketEntries<RangeBucketEntry>,
    },
    /// This is the histogram entry for a bucket, which contains a key, count, and optionally
    /// sub-aggregations.
    Histogram {
        /// The buckets.
        ///
        /// If there are holes depends on the request, if min_doc_count is 0, then there are no
        /// holes between the first and last bucket.
        /// See `HistogramAggregation`
        buckets: BucketEntries<BucketEntry>,
    },
    /// This is the term result
    Terms {
        /// The buckets.
        ///
        /// See `TermsAggregation`
        buckets: Vec<BucketEntry>,
        /// The number of documents that didn’t make it into to TOP N due to shard_size or size
        sum_other_doc_count: u64,
        /// The upper bound error for the doc count of each term.
        doc_count_error_upper_bound: Option<u64>,
    },
}

impl From<TantivyBucketResult> for BucketResult {
    fn from(value: TantivyBucketResult) -> BucketResult {
        match value {
            TantivyBucketResult::Range { buckets } => BucketResult::Range {
                buckets: buckets.into(),
            },
            TantivyBucketResult::Histogram { buckets } => BucketResult::Histogram {
                buckets: buckets.into(),
            },
            TantivyBucketResult::Terms {
                buckets,
                sum_other_doc_count,
                doc_count_error_upper_bound,
            } => BucketResult::Terms {
                buckets: buckets.into_iter().map(Into::into).collect(),
                sum_other_doc_count,
                doc_count_error_upper_bound,
            },
            TantivyBucketResult::Filter(_filter_bucket_result) => {
                unimplemented!("filter aggregation is not yet supported in quickwit")
            }
        }
    }
}

impl From<BucketResult> for TantivyBucketResult {
    fn from(value: BucketResult) -> TantivyBucketResult {
        match value {
            BucketResult::Range { buckets } => TantivyBucketResult::Range {
                buckets: buckets.into(),
            },
            BucketResult::Histogram { buckets } => TantivyBucketResult::Histogram {
                buckets: buckets.into(),
            },
            BucketResult::Terms {
                buckets,
                sum_other_doc_count,
                doc_count_error_upper_bound,
            } => TantivyBucketResult::Terms {
                buckets: buckets.into_iter().map(Into::into).collect(),
                sum_other_doc_count,
                doc_count_error_upper_bound,
            },
        }
    }
}

/// This is the wrapper of buckets entries, which can be vector or hashmap
/// depending on if it's keyed or not.
#[derive(Clone, Debug, PartialEq, Serialize, Deserialize)]
pub enum BucketEntries<T> {
    /// Vector format bucket entries
    Vec(Vec<T>),
    /// HashMap format bucket entries
    HashMap(Vec<(String, T)>),
}

impl<T, U> From<TantivyBucketEntries<T>> for BucketEntries<U>
where U: From<T>
{
    fn from(value: TantivyBucketEntries<T>) -> BucketEntries<U> {
        match value {
            TantivyBucketEntries::Vec(vec) => {
                BucketEntries::Vec(vec.into_iter().map(Into::into).collect())
            }
            TantivyBucketEntries::HashMap(map) => {
                BucketEntries::HashMap(map.into_iter().map(|(k, v)| (k, v.into())).collect())
            }
        }
    }
}

impl<T, U> From<BucketEntries<T>> for TantivyBucketEntries<U>
where U: From<T>
{
    fn from(value: BucketEntries<T>) -> TantivyBucketEntries<U> {
        match value {
            BucketEntries::Vec(vec) => {
                TantivyBucketEntries::Vec(vec.into_iter().map(Into::into).collect())
            }
            BucketEntries::HashMap(map) => {
                TantivyBucketEntries::HashMap(map.into_iter().map(|(k, v)| (k, v.into())).collect())
            }
        }
    }
}

#[derive(Clone, Debug, Serialize, Deserialize)]
pub struct RangeBucketEntry {
    /// The identifier of the bucket.
    pub key: Key,
    /// Number of documents in the bucket.
    pub doc_count: u64,
    /// Sub-aggregations in this bucket.
    // here we had a flatten, postcard didn't like that (unknown map size)
    pub sub_aggregation: AggregationResults,
    /// The from range of the bucket. Equals `f64::MIN` when `None`.
    pub from: Option<f64>,
    /// The to range of the bucket. Equals `f64::MAX` when `None`.
    pub to: Option<f64>,
    /// The optional string representation for the `from` range.
    pub from_as_string: Option<String>,
    /// The optional string representation for the `to` range.
    pub to_as_string: Option<String>,
}

impl From<TantivyRangeBucketEntry> for RangeBucketEntry {
    fn from(value: TantivyRangeBucketEntry) -> RangeBucketEntry {
        RangeBucketEntry {
            key: value.key.into(),
            doc_count: value.doc_count,
            from: value.from,
            to: value.to,
            from_as_string: value.from_as_string,
            to_as_string: value.to_as_string,
            sub_aggregation: value.sub_aggregation.into(),
        }
    }
}

impl From<RangeBucketEntry> for TantivyRangeBucketEntry {
    fn from(value: RangeBucketEntry) -> TantivyRangeBucketEntry {
        TantivyRangeBucketEntry {
            key: value.key.into(),
            doc_count: value.doc_count,
            from: value.from,
            to: value.to,
            from_as_string: value.from_as_string,
            to_as_string: value.to_as_string,
            sub_aggregation: value.sub_aggregation.into(),
        }
    }
}

#[derive(Clone, Debug, Serialize, Deserialize)]
pub struct BucketEntry {
    /// The string representation of the bucket.
    pub key_as_string: Option<String>,
    /// The identifier of the bucket.
    pub key: Key,
    /// Number of documents in the bucket.
    pub doc_count: u64,
    /// Sub-aggregations in this bucket.
    pub sub_aggregation: AggregationResults,
}

impl From<TantivyBucketEntry> for BucketEntry {
    fn from(value: TantivyBucketEntry) -> BucketEntry {
        BucketEntry {
            key_as_string: value.key_as_string,
            key: value.key.into(),
            doc_count: value.doc_count,
            sub_aggregation: value.sub_aggregation.into(),
        }
    }
}

impl From<BucketEntry> for TantivyBucketEntry {
    fn from(value: BucketEntry) -> TantivyBucketEntry {
        TantivyBucketEntry {
            key_as_string: value.key_as_string,
            key: value.key.into(),
            doc_count: value.doc_count,
            sub_aggregation: value.sub_aggregation.into(),
        }
    }
}

#[derive(Clone, Debug, Serialize, Deserialize)]
pub enum Key {
    /// String key
    Str(String),
    /// `i64` key
    I64(i64),
    /// `u64` key
    U64(u64),
    /// `f64` key
    F64(f64),
}

impl From<TantivyKey> for Key {
    fn from(value: TantivyKey) -> Key {
        match value {
            TantivyKey::Str(s) => Key::Str(s),
            TantivyKey::I64(i) => Key::I64(i),
            TantivyKey::U64(u) => Key::U64(u),
            TantivyKey::F64(f) => Key::F64(f),
        }
    }
}

impl From<Key> for TantivyKey {
    fn from(value: Key) -> TantivyKey {
        match value {
            Key::Str(s) => TantivyKey::Str(s),
            Key::I64(i) => TantivyKey::I64(i),
            Key::U64(u) => TantivyKey::U64(u),
            Key::F64(f) => TantivyKey::F64(f),
        }
    }
}

/// Single-metric aggregations use this common result structure.
///
/// Main reason to wrap it in value is to match elasticsearch output structure.
#[derive(Clone, Debug, PartialEq, Serialize, Deserialize)]
pub struct PercentilesMetricResult {
    /// The result of the percentile metric.
    pub values: PercentileValues,
}

/// This is the wrapper of percentile entries, which can be vector or hashmap
/// depending on if it's keyed or not.
#[derive(Clone, Debug, PartialEq, Serialize, Deserialize)]
pub enum PercentileValues {
    /// Vector format percentile entries
    Vec(Vec<PercentileValuesVecEntry>),
    /// HashMap format percentile entries. Key is the serialized percentile
    // we use a hashmap here because neither key nor value require conversion, almost
    // all usage of PercentileValues will be direct conversion to TantivyPercentilesValue
    HashMap(FxHashMap<String, f64>),
}

impl From<TantivyPercentilesMetricResult> for PercentilesMetricResult {
    fn from(value: TantivyPercentilesMetricResult) -> PercentilesMetricResult {
        let values = match value.values {
            TantivyPercentileValues::Vec(vec) => PercentileValues::Vec(vec),
            TantivyPercentileValues::HashMap(map) => PercentileValues::HashMap(map),
        };
        PercentilesMetricResult { values }
    }
}

impl From<PercentilesMetricResult> for TantivyPercentilesMetricResult {
    fn from(value: PercentilesMetricResult) -> TantivyPercentilesMetricResult {
        let values = match value.values {
            PercentileValues::Vec(vec) => TantivyPercentileValues::Vec(vec),
            PercentileValues::HashMap(map) => TantivyPercentileValues::HashMap(map),
        };
        TantivyPercentilesMetricResult { values }
    }
}


================================================
FILE: quickwit/quickwit-query/src/elastic_query_dsl/bool_query.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use serde::Deserialize;
use serde_with::formats::PreferMany;
use serde_with::{DefaultOnNull, OneOrMany, serde_as};

use crate::elastic_query_dsl::{ConvertibleToQueryAst, ElasticQueryDslInner};
use crate::not_nan_f32::NotNaNf32;
use crate::query_ast::{self, QueryAst};

/// # Unsupported features
/// - named queries
#[serde_as]
#[derive(Deserialize, Debug, PartialEq, Clone)]
#[serde(deny_unknown_fields)]
pub struct BoolQuery {
    #[serde_as(deserialize_as = "DefaultOnNull<OneOrMany<_, PreferMany>>")]
    #[serde(default)]
    must: Vec<ElasticQueryDslInner>,
    #[serde_as(deserialize_as = "DefaultOnNull<OneOrMany<_, PreferMany>>")]
    #[serde(default)]
    must_not: Vec<ElasticQueryDslInner>,
    #[serde_as(deserialize_as = "DefaultOnNull<OneOrMany<_, PreferMany>>")]
    #[serde(default)]
    should: Vec<ElasticQueryDslInner>,
    #[serde_as(deserialize_as = "DefaultOnNull<OneOrMany<_, PreferMany>>")]
    #[serde(default)]
    filter: Vec<ElasticQueryDslInner>,
    #[serde(default)]
    pub boost: Option<NotNaNf32>,
    #[serde(default)]
    pub minimum_should_match: Option<MinimumShouldMatch>,
    #[serde(alias = "adjust_pure_negative", default, skip_serializing)]
    _adjust_pure_negative: Option<serde::de::IgnoredAny>,
}

// `IgnoredAny` implements `PartialEq` but not `Eq`, so we derive `PartialEq`
// and manually assert `Eq` (safe because `IgnoredAny` is a unit struct).
impl Eq for BoolQuery {}

#[derive(Deserialize, Debug, Eq, PartialEq, Clone)]
#[serde(untagged)]
pub enum MinimumShouldMatch {
    Str(String),
    Int(isize),
}

impl MinimumShouldMatch {
    fn resolve(&self, num_should_clauses: usize) -> anyhow::Result<MinimumShouldMatchResolved> {
        match self {
            MinimumShouldMatch::Str(minimum_should_match_dsl) => {
                let Some(percentage) = parse_percentage(minimum_should_match_dsl) else {
                    anyhow::bail!(
                        "Unsupported minimum should match dsl {}. quickwit currently only \
                         supports the format '35%' and `-35%`",
                        minimum_should_match_dsl
                    );
                };
                let min_should_match = percentage * num_should_clauses as isize / 100;
                MinimumShouldMatch::Int(min_should_match).resolve(num_should_clauses)
            }
            MinimumShouldMatch::Int(neg_num_missing_should_clauses)
                if *neg_num_missing_should_clauses < 0 =>
            {
                let num_missing_should_clauses = -neg_num_missing_should_clauses as usize;
                if num_missing_should_clauses >= num_should_clauses {
                    Ok(MinimumShouldMatchResolved::Unspecified)
                } else {
                    Ok(MinimumShouldMatchResolved::Min(
                        num_should_clauses - num_missing_should_clauses,
                    ))
                }
            }
            MinimumShouldMatch::Int(num_required_should_clauses) => {
                let num_required_should_clauses: usize = *num_required_should_clauses as usize;
                if num_required_should_clauses > num_should_clauses {
                    Ok(MinimumShouldMatchResolved::NoMatch)
                } else {
                    Ok(MinimumShouldMatchResolved::Min(num_required_should_clauses))
                }
            }
        }
    }
}

#[derive(Deserialize, Debug, Copy, Clone, Eq, PartialEq)]
enum MinimumShouldMatchResolved {
    Unspecified,
    Min(usize),
    NoMatch,
}

fn parse_percentage(s: &str) -> Option<isize> {
    let percentage_str = s.strip_suffix('%')?;
    let percentage_isize = percentage_str.parse::<isize>().ok()?;
    if percentage_isize.abs() > 100 {
        return None;
    }
    Some(percentage_isize)
}

impl BoolQuery {
    fn resolve_minimum_should_match(&self) -> anyhow::Result<MinimumShouldMatchResolved> {
        let num_should_clauses = self.should.len();
        let Some(minimum_should_match) = &self.minimum_should_match else {
            return Ok(MinimumShouldMatchResolved::Unspecified);
        };
        minimum_should_match.resolve(num_should_clauses)
    }
}

impl BoolQuery {
    // Combines a list of children queries into a boolean union.
    pub(crate) fn union(children: Vec<ElasticQueryDslInner>) -> BoolQuery {
        BoolQuery {
            must: Vec::new(),
            must_not: Vec::new(),
            should: children,
            filter: Vec::new(),
            boost: None,
            minimum_should_match: None,
            _adjust_pure_negative: None,
        }
    }
}

fn convert_vec(query_dsls: Vec<ElasticQueryDslInner>) -> anyhow::Result<Vec<QueryAst>> {
    query_dsls
        .into_iter()
        .map(|query_dsl| query_dsl.convert_to_query_ast())
        .collect()
}

impl ConvertibleToQueryAst for BoolQuery {
    fn convert_to_query_ast(self) -> anyhow::Result<QueryAst> {
        let minimum_should_match_resolved = self.resolve_minimum_should_match()?;
        let must = convert_vec(self.must)?;
        let must_not = convert_vec(self.must_not)?;
        let should = convert_vec(self.should)?;
        let filter = convert_vec(self.filter)?;

        let minimum_should_match_opt = match minimum_should_match_resolved {
            MinimumShouldMatchResolved::Unspecified => None,
            MinimumShouldMatchResolved::Min(minimum_should_match) => Some(minimum_should_match),
            MinimumShouldMatchResolved::NoMatch => {
                return Ok(QueryAst::MatchNone);
            }
        };
        let bool_query_ast = query_ast::BoolQuery {
            must,
            must_not,
            should,
            filter,
            minimum_should_match: minimum_should_match_opt,
        };
        Ok(bool_query_ast.into())
    }
}

impl From<BoolQuery> for ElasticQueryDslInner {
    fn from(bool_query: BoolQuery) -> Self {
        ElasticQueryDslInner::Bool(bool_query)
    }
}

#[cfg(test)]
mod tests {
    use super::parse_percentage;
    use crate::elastic_query_dsl::ConvertibleToQueryAst;
    use crate::elastic_query_dsl::bool_query::{
        BoolQuery, MinimumShouldMatch, MinimumShouldMatchResolved,
    };
    use crate::elastic_query_dsl::term_query::term_query_from_field_value;
    use crate::query_ast::QueryAst;

    #[test]
    fn test_dsl_bool_query_deserialize_simple() {
        let bool_query_json = r#"{
            "must": [
                { "term": {"product_id": {"value": "1" }} },
                { "term": {"product_id": {"value": "2" }} }
            ]
        }"#;
        let bool_query: BoolQuery = serde_json::from_str(bool_query_json).unwrap();
        assert_eq!(
            &bool_query,
            &BoolQuery {
                must: vec![
                    term_query_from_field_value("product_id", "1").into(),
                    term_query_from_field_value("product_id", "2").into(),
                ],
                must_not: Vec::new(),
                should: Vec::new(),
                filter: Vec::new(),
                boost: None,
                minimum_should_match: None,
                _adjust_pure_negative: None,
            }
        );
    }

    #[test]
    fn test_dsl_query_single() {
        let bool_query_json = r#"{
            "must": { "term": {"product_id": {"value": "1" }} },
            "filter": { "term": {"product_id": {"value": "2" }} }
        }"#;
        let bool_query: BoolQuery = serde_json::from_str(bool_query_json).unwrap();
        assert_eq!(
            &bool_query,
            &BoolQuery {
                must: vec![term_query_from_field_value("product_id", "1").into(),],
                must_not: Vec::new(),
                should: Vec::new(),
                filter: vec![term_query_from_field_value("product_id", "2").into(),],
                boost: None,
                minimum_should_match: None,
                _adjust_pure_negative: None,
            }
        );
    }

    #[test]
    fn test_dsl_query_with_null_values() {
        let bool_query_json = r#"{
            "must": null,
            "must_not": null,
            "should": null,
            "filter": null,
            "boost": null
        }"#;
        let bool_query: BoolQuery = serde_json::from_str(bool_query_json).unwrap();
        assert_eq!(
            &bool_query,
            &BoolQuery {
                must: Vec::new(),
                must_not: Vec::new(),
                should: Vec::new(),
                filter: Vec::new(),
                boost: None,
                minimum_should_match: None,
                _adjust_pure_negative: None,
            }
        );
    }

    #[test]
    fn test_dsl_bool_query_deserialize_adjust_pure_negative() {
        let bool_query_json = r#"{
            "must": [
                { "term": {"product_id": {"value": "1" }} }
            ],
            "adjust_pure_negative": true
        }"#;
        let bool_query: BoolQuery = serde_json::from_str(bool_query_json).unwrap();
        assert!(bool_query._adjust_pure_negative.is_some());
        assert_eq!(bool_query.must.len(), 1);
        bool_query.convert_to_query_ast().unwrap();
    }

    #[test]
    fn test_dsl_bool_query_deserialize_minimum_should_match() {
        let bool_query: super::BoolQuery = serde_json::from_str(
            r#"{
            "must": [
                { "term": {"product_id": {"value": "1" }} },
                { "term": {"product_id": {"value": "2" }} }
            ],
            "minimum_should_match": -2
        }"#,
        )
        .unwrap();
        assert_eq!(
            bool_query.minimum_should_match.as_ref().unwrap(),
            &MinimumShouldMatch::Int(-2)
        );
    }

    #[test]
    fn test_dsl_query_with_minimum_should_match() {
        let bool_query_json = r#"{
                "should": [
                    { "term": {"product_id": {"value": "1" }} },
                    { "term": {"product_id": {"value": "2" }} },
                    { "term": {"product_id": {"value": "3" }} }
                ],
                "minimum_should_match": 2
            }"#;
        let bool_query: BoolQuery = serde_json::from_str(bool_query_json).unwrap();
        assert_eq!(bool_query.should.len(), 3);
        assert_eq!(
            bool_query.minimum_should_match.as_ref().unwrap(),
            &super::MinimumShouldMatch::Int(2)
        );
        let QueryAst::Bool(bool_query_ast) = bool_query.convert_to_query_ast().unwrap() else {
            panic!();
        };
        assert_eq!(bool_query_ast.should.len(), 3);
        assert_eq!(bool_query_ast.minimum_should_match, Some(2));
    }

    #[test]
    fn test_parse_percentage() {
        assert_eq!(parse_percentage("10%"), Some(10));
        assert_eq!(parse_percentage("101%"), None);
        assert_eq!(parse_percentage("0%"), Some(0));
        assert_eq!(parse_percentage("100%"), Some(100));
        assert_eq!(parse_percentage("-20%"), Some(-20));
        assert_eq!(parse_percentage("20"), None);
        assert_eq!(parse_percentage("20a%"), None);
    }

    #[test]
    fn test_resolve_minimum_should_match() {
        assert_eq!(
            MinimumShouldMatch::Str("30%".to_string())
                .resolve(10)
                .unwrap(),
            MinimumShouldMatchResolved::Min(3)
        );
        // not supported yet
        assert_eq!(
            MinimumShouldMatch::Str("-30%".to_string())
                .resolve(10)
                .unwrap(),
            MinimumShouldMatchResolved::Min(7)
        );
        assert!(
            MinimumShouldMatch::Str("-30!".to_string())
                .resolve(10)
                .is_err()
        );
        assert_eq!(
            MinimumShouldMatch::Int(10).resolve(11).unwrap(),
            MinimumShouldMatchResolved::Min(10)
        );
        assert_eq!(
            MinimumShouldMatch::Int(-10).resolve(11).unwrap(),
            MinimumShouldMatchResolved::Min(1)
        );
        assert_eq!(
            MinimumShouldMatch::Int(-12).resolve(11).unwrap(),
            MinimumShouldMatchResolved::Unspecified
        );
        assert_eq!(
            MinimumShouldMatch::Int(12).resolve(11).unwrap(),
            MinimumShouldMatchResolved::NoMatch
        );
    }
}


================================================
FILE: quickwit/quickwit-query/src/elastic_query_dsl/exists_query.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use serde::Deserialize;

use crate::elastic_query_dsl::ConvertibleToQueryAst;
use crate::query_ast::{self, QueryAst};

#[derive(Deserialize, Clone, Eq, PartialEq, Debug)]
pub struct ExistsQuery {
    field: String,
}

impl ConvertibleToQueryAst for ExistsQuery {
    fn convert_to_query_ast(self) -> anyhow::Result<QueryAst> {
        Ok(QueryAst::FieldPresence(query_ast::FieldPresenceQuery {
            field: self.field,
        }))
    }
}

#[cfg(test)]
mod tests {
    use crate::elastic_query_dsl::exists_query::ExistsQuery;

    #[test]
    fn test_dsl_exists_query_deserialize_simple() {
        let exists_query_json = r#"{
           "field": "privileged"
        }"#;
        let bool_query: ExistsQuery = serde_json::from_str(exists_query_json).unwrap();
        assert_eq!(
            &bool_query,
            &ExistsQuery {
                field: "privileged".to_string(),
            }
        );
    }
}


================================================
FILE: quickwit/quickwit-query/src/elastic_query_dsl/match_bool_prefix.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use serde::Deserialize;

use super::{ElasticQueryDslInner, StringOrStructForSerialization};
use crate::OneFieldMap;
use crate::elastic_query_dsl::match_query::MatchQueryParams;
use crate::elastic_query_dsl::{ConvertibleToQueryAst, default_max_expansions};
use crate::query_ast::{FullTextParams, FullTextQuery, QueryAst};

/// `MatchBoolPrefixQuery` as defined in
/// <https://www.elastic.co/guide/en/elasticsearch/reference/current/query-dsl-match-bool-prefix-query.html>
#[derive(Deserialize, Clone, Eq, PartialEq, Debug)]
#[serde(from = "OneFieldMap<StringOrStructForSerialization<MatchQueryParams>>")]
pub(crate) struct MatchBoolPrefixQuery {
    pub(crate) field: String,
    pub(crate) params: MatchQueryParams,
}

impl ConvertibleToQueryAst for MatchBoolPrefixQuery {
    fn convert_to_query_ast(self) -> anyhow::Result<QueryAst> {
        let full_text_params = FullTextParams {
            tokenizer: None,
            mode: crate::query_ast::FullTextMode::BoolPrefix {
                operator: self.params.operator,
                max_expansions: default_max_expansions(),
            },
            zero_terms_query: self.params.zero_terms_query,
        };
        Ok(QueryAst::FullText(FullTextQuery {
            field: self.field,
            text: self.params.query,
            params: full_text_params,
            lenient: self.params.lenient,
        }))
    }
}

impl From<MatchBoolPrefixQuery> for ElasticQueryDslInner {
    fn from(match_bool_prefix_query: MatchBoolPrefixQuery) -> Self {
        ElasticQueryDslInner::MatchBoolPrefix(match_bool_prefix_query)
    }
}

impl From<OneFieldMap<StringOrStructForSerialization<MatchQueryParams>>> for MatchBoolPrefixQuery {
    fn from(
        match_query_params: OneFieldMap<StringOrStructForSerialization<MatchQueryParams>>,
    ) -> Self {
        let OneFieldMap { field, value } = match_query_params;
        MatchBoolPrefixQuery {
            field,
            params: value.inner,
        }
    }
}


================================================
FILE: quickwit/quickwit-query/src/elastic_query_dsl/match_phrase_query.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use serde::Deserialize;

use crate::elastic_query_dsl::{
    ConvertibleToQueryAst, ElasticQueryDslInner, StringOrStructForSerialization,
};
use crate::query_ast::{FullTextMode, FullTextParams, FullTextQuery, QueryAst};
use crate::{MatchAllOrNone, OneFieldMap};

/// `MatchPhraseQuery` as defined in
/// <https://www.elastic.co/guide/en/elasticsearch/reference/current/query-dsl-match-query-phrase.html>
#[derive(Deserialize, Clone, Eq, PartialEq, Debug)]
#[serde(from = "OneFieldMap<StringOrStructForSerialization<MatchPhraseQueryParams>>")]
pub(crate) struct MatchPhraseQuery {
    pub(crate) field: String,
    pub(crate) params: MatchPhraseQueryParams,
}

#[derive(Clone, Deserialize, PartialEq, Eq, Debug)]
#[serde(deny_unknown_fields)]
pub struct MatchPhraseQueryParams {
    pub(crate) query: String,
    #[serde(default)]
    pub(crate) zero_terms_query: MatchAllOrNone,
    #[serde(default)]
    pub(crate) analyzer: Option<String>,
    #[serde(default)]
    pub(crate) slop: u32,
}

impl ConvertibleToQueryAst for MatchPhraseQuery {
    fn convert_to_query_ast(self) -> anyhow::Result<QueryAst> {
        let full_text_params = FullTextParams {
            tokenizer: self.params.analyzer,
            mode: FullTextMode::Phrase {
                slop: self.params.slop,
            },
            zero_terms_query: self.params.zero_terms_query,
        };
        Ok(QueryAst::FullText(FullTextQuery {
            field: self.field,
            text: self.params.query,
            params: full_text_params,
            lenient: false,
        }))
    }
}

impl From<MatchPhraseQuery> for ElasticQueryDslInner {
    fn from(match_phrase_query: MatchPhraseQuery) -> Self {
        ElasticQueryDslInner::MatchPhrase(match_phrase_query)
    }
}

impl From<OneFieldMap<StringOrStructForSerialization<MatchPhraseQueryParams>>>
    for MatchPhraseQuery
{
    fn from(
        match_query_params: OneFieldMap<StringOrStructForSerialization<MatchPhraseQueryParams>>,
    ) -> Self {
        let OneFieldMap { field, value } = match_query_params;
        MatchPhraseQuery {
            field,
            params: value.inner,
        }
    }
}

impl From<String> for MatchPhraseQueryParams {
    fn from(query: String) -> MatchPhraseQueryParams {
        MatchPhraseQueryParams {
            query,
            zero_terms_query: Default::default(),
            analyzer: None,
            slop: 0,
        }
    }
}

#[cfg(test)]
mod tests {
    use super::*;

    #[test]
    fn test_deserialize_match_query_string() {
        // We accept a single string
        let match_query: MatchPhraseQuery =
            serde_json::from_str(r#"{"my_field": "my_query"}"#).unwrap();
        assert_eq!(match_query.field, "my_field");
        assert_eq!(&match_query.params.query, "my_query");
        assert_eq!(match_query.params.slop, 0u32);
        assert!(match_query.params.analyzer.is_none());
        assert_eq!(
            match_query.params.zero_terms_query,
            MatchAllOrNone::MatchNone
        );
    }

    #[test]
    fn test_deserialize_match_query_struct() {
        // We accept a struct too.
        let match_query: MatchPhraseQuery = serde_json::from_str(
            r#"
            {"my_field":
                {
                    "query": "my_query",
                    "slop": 1
                }
            }
        "#,
        )
        .unwrap();
        assert_eq!(match_query.field, "my_field");
        assert_eq!(&match_query.params.query, "my_query");
        assert_eq!(match_query.params.slop, 1u32);
    }

    #[test]
    fn test_deserialize_match_query_nice_errors() {
        let deser_error = serde_json::from_str::<MatchPhraseQuery>(
            r#"{"my_field": {"query": "my_query", "wrong_param": 2}}"#,
        )
        .unwrap_err();
        assert!(
            deser_error
                .to_string()
                .contains("unknown field `wrong_param`")
        );
    }

    #[test]
    fn test_match_query() {
        let match_query = MatchPhraseQuery {
            field: "body".to_string(),
            params: MatchPhraseQueryParams {
                analyzer: Some("whitespace".to_string()),
                query: "hello".to_string(),
                slop: 2u32,
                zero_terms_query: crate::MatchAllOrNone::MatchAll,
            },
        };
        let ast = match_query.convert_to_query_ast().unwrap();
        let QueryAst::FullText(FullTextQuery {
            field,
            text,
            params,
            lenient: _,
        }) = ast
        else {
            panic!()
        };
        assert_eq!(field, "body");
        assert_eq!(text, "hello");
        assert_eq!(params.mode, FullTextMode::Phrase { slop: 2u32 });
        assert_eq!(params.zero_terms_query, MatchAllOrNone::MatchAll);
    }
}


================================================
FILE: quickwit/quickwit-query/src/elastic_query_dsl/match_query.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use serde::Deserialize;

use super::LeniencyBool;
use crate::elastic_query_dsl::{
    ConvertibleToQueryAst, ElasticQueryDslInner, StringOrStructForSerialization,
};
use crate::query_ast::{FullTextParams, FullTextQuery, QueryAst};
use crate::{BooleanOperand, MatchAllOrNone, OneFieldMap};

/// `MatchQuery` as defined in
/// <https://www.elastic.co/guide/en/elasticsearch/reference/current/query-dsl-match-query.html>
#[derive(Deserialize, Clone, Eq, PartialEq, Debug)]
#[serde(from = "OneFieldMap<StringOrStructForSerialization<MatchQueryParams>>")]
pub struct MatchQuery {
    pub(crate) field: String,
    pub(crate) params: MatchQueryParams,
}

#[derive(Clone, Deserialize, PartialEq, Eq, Debug)]
#[serde(deny_unknown_fields)]
pub(crate) struct MatchQueryParams {
    pub(crate) query: String,
    #[serde(default)]
    pub(crate) operator: BooleanOperand,
    #[serde(default)]
    pub(crate) zero_terms_query: MatchAllOrNone,
    #[serde(default)]
    pub(crate) lenient: LeniencyBool,
}

impl ConvertibleToQueryAst for MatchQuery {
    fn convert_to_query_ast(self) -> anyhow::Result<QueryAst> {
        let full_text_params = FullTextParams {
            tokenizer: None,
            mode: self.params.operator.into(),
            zero_terms_query: self.params.zero_terms_query,
        };
        Ok(QueryAst::FullText(FullTextQuery {
            field: self.field,
            text: self.params.query,
            params: full_text_params,
            lenient: self.params.lenient,
        }))
    }
}

impl From<MatchQuery> for ElasticQueryDslInner {
    fn from(match_query: MatchQuery) -> Self {
        ElasticQueryDslInner::Match(match_query)
    }
}

impl From<OneFieldMap<StringOrStructForSerialization<MatchQueryParams>>> for MatchQuery {
    fn from(
        match_query_params: OneFieldMap<StringOrStructForSerialization<MatchQueryParams>>,
    ) -> Self {
        let OneFieldMap { field, value } = match_query_params;
        MatchQuery {
            field,
            params: value.inner,
        }
    }
}

impl From<String> for MatchQueryParams {
    fn from(query: String) -> MatchQueryParams {
        MatchQueryParams {
            query,
            zero_terms_query: Default::default(),
            operator: Default::default(),
            lenient: false,
        }
    }
}

#[cfg(test)]
mod tests {
    use super::*;
    use crate::query_ast::FullTextMode;

    #[test]
    fn test_deserialize_match_query_string() {
        // We accept a single string
        let match_query: MatchQuery = serde_json::from_str(r#"{"my_field": "my_query"}"#).unwrap();
        assert_eq!(match_query.field, "my_field");
        assert_eq!(&match_query.params.query, "my_query");
        assert_eq!(match_query.params.operator, BooleanOperand::Or);
    }

    #[test]
    fn test_deserialize_match_query_struct() {
        // We accept a struct too.
        let match_query: MatchQuery =
            serde_json::from_str(r#"{"my_field": {"query": "my_query", "operator": "AND"}}"#)
                .unwrap();
        assert_eq!(match_query.field, "my_field");
        assert_eq!(&match_query.params.query, "my_query");
        assert_eq!(match_query.params.operator, BooleanOperand::And);
    }

    #[test]
    fn test_deserialize_match_query_nice_errors() {
        let deser_error = serde_json::from_str::<MatchQuery>(
            r#"{"my_field": {"query": "my_query", "wrong_param": 2}}"#,
        )
        .unwrap_err();
        assert!(
            deser_error
                .to_string()
                .contains("unknown field `wrong_param`")
        );
    }

    #[test]
    fn test_match_query() {
        let match_query = MatchQuery {
            field: "body".to_string(),
            params: MatchQueryParams {
                query: "hello".to_string(),
                operator: BooleanOperand::And,
                zero_terms_query: crate::MatchAllOrNone::MatchAll,
                lenient: false,
            },
        };
        let ast = match_query.convert_to_query_ast().unwrap();
        let QueryAst::FullText(FullTextQuery {
            field,
            text,
            params,
            lenient: _,
        }) = ast
        else {
            panic!()
        };
        assert_eq!(field, "body");
        assert_eq!(text, "hello");
        assert_eq!(
            params.mode,
            FullTextMode::Bool {
                operator: BooleanOperand::And
            }
        );
        assert_eq!(params.zero_terms_query, MatchAllOrNone::MatchAll);
    }
}


================================================
FILE: quickwit/quickwit-query/src/elastic_query_dsl/mod.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use serde::{Deserialize, Serialize};

mod bool_query;
mod exists_query;
mod match_bool_prefix;
mod match_phrase_query;
mod match_query;
mod multi_match;
mod one_field_map;
mod phrase_prefix_query;
mod prefix_query;
mod query_string_query;
mod range_query;
mod regex_query;
mod string_or_struct;
mod term_query;
mod terms_query;
mod wildcard_query;

use bool_query::BoolQuery;
pub use one_field_map::OneFieldMap;
use phrase_prefix_query::MatchPhrasePrefixQuery;
use prefix_query::PrefixQuery;
pub(crate) use query_string_query::QueryStringQuery;
use range_query::RangeQuery;
pub(crate) use string_or_struct::StringOrStructForSerialization;
use term_query::TermQuery;

use crate::elastic_query_dsl::exists_query::ExistsQuery;
use crate::elastic_query_dsl::match_bool_prefix::MatchBoolPrefixQuery;
use crate::elastic_query_dsl::match_phrase_query::MatchPhraseQuery;
use crate::elastic_query_dsl::match_query::MatchQuery;
use crate::elastic_query_dsl::multi_match::MultiMatchQuery;
use crate::elastic_query_dsl::regex_query::RegexQuery;
use crate::elastic_query_dsl::terms_query::TermsQuery;
use crate::elastic_query_dsl::wildcard_query::WildcardQuery;
use crate::not_nan_f32::NotNaNf32;
use crate::query_ast::QueryAst;

/// Quickwit and Elasticsearch have different interpretations of leniency:
/// - In Quickwit, lenient mode allows ignoring parts of the query that reference non-existing
///   columns. This is a behavior that Elasticsearch supports by default.
/// - In Elasticsearch, lenient mode primarily addresses type errors (such as searching for text in
///   an integer field). Quickwit always supports this behavior, regardless of the `lenient`
///   setting.
pub type LeniencyBool = bool;

fn default_max_expansions() -> u32 {
    50
}

#[derive(Serialize, Deserialize, Debug, Eq, PartialEq, Clone, Copy, Default)]
#[serde(deny_unknown_fields)]
pub(crate) struct MatchAllQuery {
    pub boost: Option<NotNaNf32>,
}

#[derive(Serialize, Deserialize, Debug, Eq, PartialEq, Clone, Copy)]
pub(crate) struct MatchNoneQuery;

#[derive(Deserialize, Debug, Eq, PartialEq, Clone)]
#[serde(rename_all = "snake_case", deny_unknown_fields)]
pub(crate) enum ElasticQueryDslInner {
    QueryString(QueryStringQuery),
    Bool(BoolQuery),
    Term(TermQuery),
    Terms(TermsQuery),
    MatchAll(MatchAllQuery),
    MatchNone(MatchNoneQuery),
    Match(MatchQuery),
    MatchBoolPrefix(MatchBoolPrefixQuery),
    MatchPhrase(MatchPhraseQuery),
    MatchPhrasePrefix(MatchPhrasePrefixQuery),
    MultiMatch(MultiMatchQuery),
    Range(RangeQuery),
    Exists(ExistsQuery),
    Regexp(RegexQuery),
    Wildcard(WildcardQuery),
    Prefix(PrefixQuery),
}

#[derive(Deserialize, Debug, Eq, PartialEq, Clone)]
#[serde(transparent)]
pub struct ElasticQueryDsl(ElasticQueryDslInner);

impl TryFrom<ElasticQueryDsl> for QueryAst {
    type Error = anyhow::Error;

    fn try_from(es_dsl: ElasticQueryDsl) -> anyhow::Result<Self> {
        es_dsl.0.convert_to_query_ast()
    }
}

pub(crate) trait ConvertibleToQueryAst {
    fn convert_to_query_ast(self) -> anyhow::Result<QueryAst>;
}

impl ConvertibleToQueryAst for ElasticQueryDslInner {
    fn convert_to_query_ast(self) -> anyhow::Result<QueryAst> {
        match self {
            Self::QueryString(query_string_query) => query_string_query.convert_to_query_ast(),
            Self::Bool(bool_query) => bool_query.convert_to_query_ast(),
            Self::Term(term_query) => term_query.convert_to_query_ast(),
            Self::Terms(terms_query) => terms_query.convert_to_query_ast(),
            Self::MatchAll(match_all_query) => {
                if let Some(boost) = match_all_query.boost {
                    Ok(QueryAst::Boost {
                        boost,
                        underlying: Box::new(QueryAst::MatchAll),
                    })
                } else {
                    Ok(QueryAst::MatchAll)
                }
            }
            Self::MatchNone(_) => Ok(QueryAst::MatchNone),
            Self::MatchBoolPrefix(match_bool_prefix_query) => {
                match_bool_prefix_query.convert_to_query_ast()
            }
            Self::MatchPhrase(match_phrase_query) => match_phrase_query.convert_to_query_ast(),
            Self::MatchPhrasePrefix(match_phrase_prefix) => {
                match_phrase_prefix.convert_to_query_ast()
            }
            Self::Range(range_query) => range_query.convert_to_query_ast(),
            Self::Match(match_query) => match_query.convert_to_query_ast(),
            Self::Exists(exists_query) => exists_query.convert_to_query_ast(),
            Self::MultiMatch(multi_match_query) => multi_match_query.convert_to_query_ast(),
            Self::Regexp(regex_query) => regex_query.convert_to_query_ast(),
            Self::Wildcard(wildcard_query) => wildcard_query.convert_to_query_ast(),
            Self::Prefix(prefix_query) => prefix_query.convert_to_query_ast(),
        }
    }
}

#[cfg(test)]
mod tests {
    use super::*;
    use crate::elastic_query_dsl::term_query::term_query_from_field_value;

    #[test]
    fn test_query_dsl_deserialize_simple() {
        let term_query_json = r#"{
            "term": {
                "product_id": { "value": "61809" }
            }
        }"#;
        let query_dsl = serde_json::from_str(term_query_json).unwrap();
        let ElasticQueryDsl(ElasticQueryDslInner::Term(term_query)) = query_dsl else {
            panic!()
        };
        assert_eq!(
            &term_query,
            &term_query_from_field_value("product_id", "61809")
        );
    }
}


================================================
FILE: quickwit/quickwit-query/src/elastic_query_dsl/multi_match.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use serde::Deserialize;
use serde_with::formats::PreferMany;
use serde_with::{OneOrMany, serde_as};

use super::LeniencyBool;
use crate::elastic_query_dsl::bool_query::BoolQuery;
use crate::elastic_query_dsl::match_bool_prefix::MatchBoolPrefixQuery;
use crate::elastic_query_dsl::match_phrase_query::{MatchPhraseQuery, MatchPhraseQueryParams};
use crate::elastic_query_dsl::match_query::{MatchQuery, MatchQueryParams};
use crate::elastic_query_dsl::phrase_prefix_query::{
    MatchPhrasePrefixQuery, MatchPhrasePrefixQueryParams,
};
use crate::elastic_query_dsl::{ConvertibleToQueryAst, ElasticQueryDslInner};

/// Multi match queries are a bit odd. They end up being expanded into another type of query.
/// In Quickwit, we operate this expansion in generic way at the time of deserialization.
#[derive(Deserialize, Debug, Eq, PartialEq, Clone)]
#[serde(try_from = "MultiMatchQueryForDeserialization")]
pub struct MultiMatchQuery(Box<ElasticQueryDslInner>);

#[serde_as]
#[derive(Deserialize, Debug, Eq, PartialEq, Clone)]
struct MultiMatchQueryForDeserialization {
    #[serde(rename = "type", default)]
    match_type: MatchType,
    // Other parameters is used to dynamically collect more parameters.
    // We will then expand the query at the json level, and then deserialize the right object.
    #[serde(flatten)]
    other_parameters: serde_json::Map<String, serde_json::Value>,
    #[serde_as(deserialize_as = "OneOrMany<_, PreferMany>")]
    #[serde(default)]
    fields: Vec<String>,
    #[serde(default)]
    lenient: LeniencyBool,
}

fn deserialize_match_query_for_one_field(
    match_type: MatchType,
    field: &str,
    json_object: serde_json::Map<String, serde_json::Value>,
) -> serde_json::Result<ElasticQueryDslInner> {
    let json_val = serde_json::Value::Object(json_object);
    match match_type {
        MatchType::Phrase => {
            let params: MatchPhraseQueryParams = serde_json::from_value(json_val)?;
            let phrase_query = MatchPhraseQuery {
                field: field.to_string(),
                params,
            };
            Ok(ElasticQueryDslInner::MatchPhrase(phrase_query))
        }
        MatchType::PhrasePrefix => {
            let phrase_prefix_params: MatchPhrasePrefixQueryParams =
                serde_json::from_value(json_val)?;
            let phrase_prefix = MatchPhrasePrefixQuery {
                field: field.to_string(),
                value: phrase_prefix_params,
            };
            Ok(ElasticQueryDslInner::MatchPhrasePrefix(phrase_prefix))
        }
        MatchType::BoolPrefix => {
            let bool_prefix_params: MatchQueryParams = serde_json::from_value(json_val)?;
            let bool_prefix = MatchBoolPrefixQuery {
                params: bool_prefix_params,
                field: field.to_string(),
            };
            Ok(ElasticQueryDslInner::MatchBoolPrefix(bool_prefix))
        }
        MatchType::MostFields | MatchType::BestFields | MatchType::CrossFields => {
            let match_query_params: MatchQueryParams = serde_json::from_value(json_val)?;
            let match_query = MatchQuery {
                field: field.to_string(),
                params: match_query_params,
            };
            Ok(ElasticQueryDslInner::Match(match_query))
        }
    }
}

fn validate_field_name(field_name: &str) -> Result<(), String> {
    if field_name.contains('^') {
        return Err(format!(
            "Quickwit does not support field boosting in the multi match query fields (got \
             `{field_name}`)"
        ));
    }
    if field_name.contains('*') {
        return Err(format!(
            "Quickwit does not support wildcards in the multi match query fields (got \
             `{field_name}`)"
        ));
    }
    Ok(())
}

impl TryFrom<MultiMatchQueryForDeserialization> for MultiMatchQuery {
    type Error = serde_json::Error;

    fn try_from(multi_match_query: MultiMatchQueryForDeserialization) -> Result<Self, Self::Error> {
        if multi_match_query.fields.is_empty() {
            // TODO: We can use default field from index configuration instead
            return Err(serde::de::Error::custom(
                "Quickwit does not support multi match query with 0 fields. MultiMatchQueries \
                 must have at least one field.",
            ));
        }
        for field in &multi_match_query.fields {
            validate_field_name(field).map_err(serde::de::Error::custom)?;
        }
        let mut children = Vec::new();
        for field in multi_match_query.fields {
            let child = deserialize_match_query_for_one_field(
                multi_match_query.match_type,
                &field,
                multi_match_query.other_parameters.clone(),
            )?;
            children.push(child);
        }
        let bool_query = BoolQuery::union(children);
        Ok(MultiMatchQuery(Box::new(ElasticQueryDslInner::Bool(
            bool_query,
        ))))
    }
}

#[derive(Deserialize, Debug, Default, Eq, PartialEq, Clone, Copy)]
#[serde(rename_all = "snake_case")]
pub enum MatchType {
    #[default]
    MostFields,
    BestFields,  // Not implemented will be converted to MostFields
    CrossFields, // Not implemented will be converted to MostFields
    Phrase,
    PhrasePrefix,
    BoolPrefix,
}

impl ConvertibleToQueryAst for MultiMatchQuery {
    fn convert_to_query_ast(self) -> anyhow::Result<crate::query_ast::QueryAst> {
        self.0.convert_to_query_ast()
    }
}

#[cfg(test)]
mod tests {
    use super::*;
    use crate::elastic_query_dsl::default_max_expansions;

    #[track_caller]
    fn test_multimatch_query_ok_aux<T: Into<ElasticQueryDslInner>>(json: &str, expected: T) {
        let expected: ElasticQueryDslInner = expected.into();
        let multi_match_query: MultiMatchQuery = serde_json::from_str(json).unwrap();
        let es_query = &*multi_match_query.0;
        assert_eq!(es_query, &expected);
    }

    #[track_caller]
    fn test_multimatch_query_err_aux(json: &str, expected_error_msg: &'static str) {
        let err_msg: String = serde_json::from_str::<MultiMatchQuery>(json)
            .unwrap_err()
            .to_string();
        assert!(err_msg.contains(expected_error_msg), "Got `{err_msg}`");
    }

    #[test]
    fn test_multimatch_query_deserialization() {
        test_multimatch_query_ok_aux(
            r#"{
                "query": "quick brown fox",
                "type": "most_fields",
                "fields": ["title", "body"]
            }"#,
            BoolQuery::union(vec![
                MatchQuery {
                    field: "title".to_string(),
                    params: MatchQueryParams {
                        query: "quick brown fox".to_string(),
                        operator: crate::BooleanOperand::Or,
                        zero_terms_query: Default::default(),
                        lenient: false,
                    },
                }
                .into(),
                MatchQuery {
                    field: "body".to_string(),
                    params: MatchQueryParams {
                        query: "quick brown fox".to_string(),
                        operator: crate::BooleanOperand::Or,
                        zero_terms_query: Default::default(),
                        lenient: false,
                    },
                }
                .into(),
            ]),
        );

        test_multimatch_query_ok_aux(
            r#"{
            "query": "quick brown fox",
            "type": "best_fields",
            "fields": ["title", "body"]
        }"#,
            BoolQuery::union(vec![
                MatchQuery {
                    field: "title".to_string(),
                    params: MatchQueryParams {
                        query: "quick brown fox".to_string(),
                        operator: crate::BooleanOperand::Or,
                        zero_terms_query: Default::default(),
                        lenient: false,
                    },
                }
                .into(),
                MatchQuery {
                    field: "body".to_string(),
                    params: MatchQueryParams {
                        query: "quick brown fox".to_string(),
                        operator: crate::BooleanOperand::Or,
                        zero_terms_query: Default::default(),
                        lenient: false,
                    },
                }
                .into(),
            ]),
        );

        test_multimatch_query_ok_aux(
            r#"{
            "query": "quick brown fox",
            "type": "cross_fields",
            "fields": ["title", "body"]
        }"#,
            BoolQuery::union(vec![
                MatchQuery {
                    field: "title".to_string(),
                    params: MatchQueryParams {
                        query: "quick brown fox".to_string(),
                        operator: crate::BooleanOperand::Or,
                        zero_terms_query: Default::default(),
                        lenient: false,
                    },
                }
                .into(),
                MatchQuery {
                    field: "body".to_string(),
                    params: MatchQueryParams {
                        query: "quick brown fox".to_string(),
                        operator: crate::BooleanOperand::Or,
                        zero_terms_query: Default::default(),
                        lenient: false,
                    },
                }
                .into(),
            ]),
        );

        test_multimatch_query_ok_aux(
            r#"{
            "query": "quick brown fox",
            "type": "phrase",
            "fields": ["title", "body"]
        }"#,
            BoolQuery::union(vec![
                MatchPhraseQuery {
                    field: "title".to_string(),
                    params: MatchPhraseQueryParams {
                        query: "quick brown fox".to_string(),
                        zero_terms_query: Default::default(),
                        analyzer: None,
                        slop: Default::default(),
                    },
                }
                .into(),
                MatchPhraseQuery {
                    field: "body".to_string(),
                    params: MatchPhraseQueryParams {
                        query: "quick brown fox".to_string(),
                        zero_terms_query: Default::default(),
                        analyzer: None,
                        slop: Default::default(),
                    },
                }
                .into(),
            ]),
        );

        test_multimatch_query_ok_aux(
            r#"{
            "query": "quick brown fox",
            "type": "phrase_prefix",
            "fields": ["title", "body"]
        }"#,
            BoolQuery::union(vec![
                MatchPhrasePrefixQuery {
                    field: "title".to_string(),
                    value: MatchPhrasePrefixQueryParams {
                        query: "quick brown fox".to_string(),
                        analyzer: Default::default(),
                        max_expansions: default_max_expansions(),
                        slop: Default::default(),
                        zero_terms_query: Default::default(),
                    },
                }
                .into(),
                MatchPhrasePrefixQuery {
                    field: "body".to_string(),
                    value: MatchPhrasePrefixQueryParams {
                        query: "quick brown fox".to_string(),
                        analyzer: Default::default(),
                        max_expansions: default_max_expansions(),
                        slop: Default::default(),
                        zero_terms_query: Default::default(),
                    },
                }
                .into(),
            ]),
        );

        test_multimatch_query_ok_aux(
            r#"{
            "query": "quick brown",
            "type": "bool_prefix",
            "fields": ["title", "body"]
        }"#,
            BoolQuery::union(vec![
                MatchBoolPrefixQuery {
                    field: "title".to_string(),
                    params: MatchQueryParams {
                        query: "quick brown".to_string(),
                        operator: crate::BooleanOperand::Or,
                        zero_terms_query: Default::default(),
                        lenient: false,
                    },
                }
                .into(),
                MatchBoolPrefixQuery {
                    field: "body".to_string(),
                    params: MatchQueryParams {
                        query: "quick brown".to_string(),
                        operator: crate::BooleanOperand::Or,
                        zero_terms_query: Default::default(),
                        lenient: false,
                    },
                }
                .into(),
            ]),
        );
    }

    #[test]
    fn test_multimatch_unsupported() {
        test_multimatch_query_err_aux(
            r#"{
                "query": "quick brown fox",
                "type": "most_fields",
                "fields": ["body", "body.*"]
            }"#,
            "Quickwit does not support wildcards",
        );
        test_multimatch_query_err_aux(
            r#"{
                "query": "quick brown fox",
                "type": "most_fields",
                "fields": ["body", "title^3"]
            }"#,
            "Quickwit does not support field boosting",
        );
    }
}


================================================
FILE: quickwit/quickwit-query/src/elastic_query_dsl/one_field_map.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::fmt;
use std::marker::PhantomData;

use serde::de::Visitor;
use serde::ser::SerializeMap;
use serde::{Deserialize, Serialize};

/// Helper to serialize/deserialize `{"my_field": {..}}` object
/// often present in Elasticsearch DSL.
#[derive(PartialEq, Eq, Debug, Clone)]
pub struct OneFieldMap<V> {
    pub field: String,
    pub value: V,
}

impl<V: Serialize> Serialize for OneFieldMap<V> {
    fn serialize<S: serde::Serializer>(&self, serializer: S) -> Result<S::Ok, S::Error> {
        let mut map = serializer.serialize_map(Some(1))?;
        map.serialize_entry(&self.field, &self.value)?;
        map.end()
    }
}

struct OneFieldMapVisitor<V> {
    _data: PhantomData<V>,
}

impl<'de, V: Deserialize<'de>> Visitor<'de> for OneFieldMapVisitor<V> {
    type Value = OneFieldMap<V>;

    fn expecting(&self, f: &mut fmt::Formatter) -> fmt::Result {
        write!(f, "Expected a map with a single field.")
    }

    fn visit_map<A>(self, mut map: A) -> Result<Self::Value, A::Error>
    where A: serde::de::MapAccess<'de> {
        if let Some(num_keys) = map.size_hint()
            && num_keys != 1
        {
            return Err(serde::de::Error::custom(format!(
                "expected a single field. got {num_keys}"
            )));
        }
        let Some((key, val)) = map.next_entry()? else {
            return Err(serde::de::Error::custom(
                "expected a single field. got none",
            ));
        };
        if let Some(second_key) = map.next_key::<String>()? {
            return Err(serde::de::Error::custom(format!(
                "expected a single field. got several ({key}, {second_key}, ...)"
            )));
        }
        Ok(OneFieldMap {
            field: key,
            value: val,
        })
    }
}

impl<'de, V: Deserialize<'de>> Deserialize<'de> for OneFieldMap<V> {
    fn deserialize<D>(deserializer: D) -> Result<Self, D::Error>
    where D: serde::Deserializer<'de> {
        deserializer.deserialize_map(OneFieldMapVisitor {
            _data: Default::default(),
        })
    }
}

#[cfg(test)]
mod tests {

    use serde::{Deserialize, Serialize};

    use crate::OneFieldMap;
    #[derive(Serialize, Deserialize, Debug, Clone, PartialEq, Eq)]
    struct Property {
        count: usize,
    }

    #[test]
    fn test_one_field_hash_map_simple() {
        let one_field_map = OneFieldMap {
            field: "my-field".to_string(),
            value: Property { count: 2 },
        };
        let json = serde_json::to_value(one_field_map).unwrap();
        assert_eq!(&json, &serde_json::json!({"my-field": {"count": 2}}));
        let deser_ser = serde_json::from_value::<OneFieldMap<Property>>(json).unwrap();
        assert_eq!(deser_ser.field.as_str(), "my-field");
        assert_eq!(deser_ser.value.count, 2);
    }

    #[test]
    fn test_one_field_hash_map_deserialize_error_too_many_fields() {
        let deser: serde_json::Result<OneFieldMap<Property>> =
            serde_json::from_value(serde_json::json!({
                "my-field": {"count": 2},
                "my-field2": {"count": 2}
            }));
        let deser_err = deser.unwrap_err();
        assert_eq!(deser_err.to_string(), "expected a single field. got 2");
    }

    #[test]
    fn test_one_field_hash_map_deserialize_error_no_fields() {
        let deser: serde_json::Result<OneFieldMap<Property>> =
            serde_json::from_value(serde_json::json!({}));
        let deser_err = deser.unwrap_err();
        assert_eq!(deser_err.to_string(), "expected a single field. got 0");
    }
}


================================================
FILE: quickwit/quickwit-query/src/elastic_query_dsl/phrase_prefix_query.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use serde::Deserialize;

use crate::MatchAllOrNone;
use crate::elastic_query_dsl::one_field_map::OneFieldMap;
use crate::elastic_query_dsl::{
    ConvertibleToQueryAst, ElasticQueryDslInner, default_max_expansions,
};
use crate::query_ast::{self, FullTextMode, FullTextParams, QueryAst};

pub(crate) type MatchPhrasePrefixQuery = OneFieldMap<MatchPhrasePrefixQueryParams>;

#[derive(PartialEq, Eq, Debug, Deserialize, Clone)]
#[serde(deny_unknown_fields)]
pub(crate) struct MatchPhrasePrefixQueryParams {
    pub query: String,
    #[serde(default)]
    pub analyzer: Option<String>,
    #[serde(default = "default_max_expansions")]
    pub max_expansions: u32,
    #[serde(default)]
    pub slop: u32,
    #[serde(default, skip_serializing_if = "MatchAllOrNone::is_none")]
    pub zero_terms_query: MatchAllOrNone,
}

impl From<MatchPhrasePrefixQuery> for ElasticQueryDslInner {
    fn from(term_query: MatchPhrasePrefixQuery) -> Self {
        Self::MatchPhrasePrefix(term_query)
    }
}

impl ConvertibleToQueryAst for MatchPhrasePrefixQuery {
    fn convert_to_query_ast(self) -> anyhow::Result<QueryAst> {
        let MatchPhrasePrefixQueryParams {
            query,
            analyzer,
            max_expansions,
            slop,
            zero_terms_query,
        } = self.value;
        let analyzer = FullTextParams {
            tokenizer: analyzer,
            mode: FullTextMode::Phrase { slop },
            zero_terms_query,
        };
        let phrase_prefix_query_ast = query_ast::PhrasePrefixQuery {
            field: self.field,
            phrase: query,
            params: analyzer,
            max_expansions,
            lenient: false,
        };
        Ok(phrase_prefix_query_ast.into())
    }
}

#[cfg(test)]
mod tests {
    use super::{MatchAllOrNone, MatchPhrasePrefixQuery, MatchPhrasePrefixQueryParams};

    #[test]
    fn test_term_query_simple() {
        let phrase_prefix_json = r#"{ "message": { "query": "quick brown f" } }"#;
        let phrase_prefix: MatchPhrasePrefixQuery =
            serde_json::from_str(phrase_prefix_json).unwrap();
        let expected = MatchPhrasePrefixQuery {
            field: "message".to_string(),
            value: MatchPhrasePrefixQueryParams {
                query: "quick brown f".to_string(),
                analyzer: None,
                max_expansions: 50,
                slop: 0,
                zero_terms_query: MatchAllOrNone::MatchNone,
            },
        };

        assert_eq!(&phrase_prefix, &expected);
    }
}


================================================
FILE: quickwit/quickwit-query/src/elastic_query_dsl/prefix_query.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use serde::Deserialize;

use crate::elastic_query_dsl::one_field_map::OneFieldMap;
use crate::elastic_query_dsl::{ConvertibleToQueryAst, StringOrStructForSerialization};
use crate::query_ast::{QueryAst, WildcardQuery as AstWildcardQuery};

#[derive(Deserialize, Clone, Eq, PartialEq, Debug)]
#[serde(from = "OneFieldMap<StringOrStructForSerialization<PrefixQueryParams>>")]
pub(crate) struct PrefixQuery {
    pub(crate) field: String,
    pub(crate) params: PrefixQueryParams,
}

#[derive(Deserialize, Debug, Default, Eq, PartialEq, Clone)]
#[serde(deny_unknown_fields)]
pub struct PrefixQueryParams {
    value: String,
    #[serde(default)]
    case_insensitive: bool,
}

impl ConvertibleToQueryAst for PrefixQuery {
    fn convert_to_query_ast(self) -> anyhow::Result<QueryAst> {
        let wildcard = format!(
            "{}*",
            self.params
                .value
                .replace(r"\", r"\\")
                .replace("*", r"\*")
                .replace("?", r"\?")
        );
        Ok(AstWildcardQuery {
            field: self.field,
            value: wildcard,
            lenient: true,
            case_insensitive: self.params.case_insensitive,
        }
        .into())
    }
}

impl From<OneFieldMap<StringOrStructForSerialization<PrefixQueryParams>>> for PrefixQuery {
    fn from(
        match_query_params: OneFieldMap<StringOrStructForSerialization<PrefixQueryParams>>,
    ) -> Self {
        let OneFieldMap { field, value } = match_query_params;
        PrefixQuery {
            field,
            params: value.inner,
        }
    }
}

impl From<String> for PrefixQueryParams {
    fn from(value: String) -> PrefixQueryParams {
        PrefixQueryParams {
            value,
            case_insensitive: false,
        }
    }
}

#[cfg(test)]
mod tests {
    use super::*;

    #[test]
    fn test_prefix_query_convert_to_query_ast() {
        let prefix_query_json = r#"{
            "user_name": {
                "value": "john"
            }
        }"#;
        let prefix_query: PrefixQuery = serde_json::from_str(prefix_query_json).unwrap();
        let query_ast = prefix_query.convert_to_query_ast().unwrap();

        if let QueryAst::Wildcard(prefix) = query_ast {
            assert_eq!(prefix.field, "user_name");
            assert_eq!(prefix.value, "john*");
            assert!(prefix.lenient);
        } else {
            panic!("Expected QueryAst::Prefix, got {:?}", query_ast);
        }
    }

    #[test]
    fn test_prefix_query_convert_to_query_ast_special_chars() {
        let prefix_query_json = r#"{
            "user_name": {
                "value": "a\\dm?n*"
            }
        }"#;
        let prefix_query: PrefixQuery = serde_json::from_str(prefix_query_json).unwrap();
        let query_ast = prefix_query.convert_to_query_ast().unwrap();

        if let QueryAst::Wildcard(prefix) = query_ast {
            assert_eq!(prefix.field, "user_name");
            assert_eq!(prefix.value, r"a\\dm\?n\**");
            assert!(prefix.lenient);
        } else {
            panic!("Expected QueryAst::Prefix, got {:?}", query_ast);
        }
    }
}


================================================
FILE: quickwit/quickwit-query/src/elastic_query_dsl/query_string_query.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use serde::Deserialize;

use super::LeniencyBool;
use crate::BooleanOperand;
use crate::elastic_query_dsl::ConvertibleToQueryAst;
use crate::not_nan_f32::NotNaNf32;
use crate::query_ast::UserInputQuery;

#[derive(Deserialize, Debug, Eq, PartialEq, Clone)]
#[serde(deny_unknown_fields)]
pub(crate) struct QueryStringQuery {
    query: String,
    /// Limitation. We do not support * at the moment.
    /// We do not support JSON field either.
    ///
    /// Note that following elastic, we do not support "string" and require an array here.
    #[serde(default)]
    fields: Option<Vec<String>>,
    #[serde(default)]
    default_field: Option<String>,
    #[serde(default)]
    default_operator: BooleanOperand,
    #[serde(default)]
    boost: Option<NotNaNf32>,
    #[serde(default)]
    lenient: LeniencyBool,
}

impl ConvertibleToQueryAst for QueryStringQuery {
    fn convert_to_query_ast(self) -> anyhow::Result<crate::query_ast::QueryAst> {
        if self.default_field.is_some() && self.fields.is_some() {
            anyhow::bail!("fields and default_field cannot be both set in `query_string` queries");
        }
        let default_fields: Option<Vec<String>> = self
            .default_field
            .map(|default_field| vec![default_field])
            .or(self.fields);
        let user_text_query = UserInputQuery {
            user_text: self.query,
            default_fields,
            default_operator: self.default_operator,
            lenient: self.lenient,
        };
        Ok(user_text_query.into())
    }
}

#[cfg(test)]
mod tests {
    use crate::BooleanOperand;
    use crate::elastic_query_dsl::{ConvertibleToQueryAst, QueryStringQuery};
    use crate::query_ast::{QueryAst, UserInputQuery};

    #[test]
    fn test_build_query_string_query_with_fields_non_empty() {
        let query_string_query = crate::elastic_query_dsl::QueryStringQuery {
            query: "hello world".to_string(),
            fields: Some(vec!["hello".to_string()]),
            default_operator: crate::BooleanOperand::Or,
            default_field: None,
            boost: None,
            lenient: false,
        };
        let QueryAst::UserInput(user_input_query) =
            query_string_query.convert_to_query_ast().unwrap()
        else {
            panic!();
        };
        assert_eq!(user_input_query.default_operator, BooleanOperand::Or);
        assert_eq!(
            user_input_query.default_fields.unwrap(),
            vec!["hello".to_string()]
        );
    }

    #[test]
    fn test_build_query_string_query_with_default_field_non_empty() {
        let query_string_query = crate::elastic_query_dsl::QueryStringQuery {
            query: "hello world".to_string(),
            fields: None,
            default_operator: crate::BooleanOperand::Or,
            default_field: Some("hello".to_string()),
            boost: None,
            lenient: false,
        };
        let QueryAst::UserInput(user_input_query) =
            query_string_query.convert_to_query_ast().unwrap()
        else {
            panic!();
        };
        assert_eq!(user_input_query.default_operator, BooleanOperand::Or);
        assert_eq!(
            user_input_query.default_fields.unwrap(),
            vec!["hello".to_string()]
        );
    }

    #[test]
    fn test_build_query_string_query_with_both_default_fields_and_field_yield_an_error() {
        let query_string_query = crate::elastic_query_dsl::QueryStringQuery {
            query: "hello world".to_string(),
            fields: Some(vec!["hello".to_string()]),
            default_operator: crate::BooleanOperand::Or,
            default_field: Some("hello".to_string()),
            boost: None,
            lenient: false,
        };
        let err_msg = query_string_query
            .convert_to_query_ast()
            .unwrap_err()
            .to_string();
        assert!(err_msg.contains("cannot be both set"));
    }

    #[test]
    fn test_build_query_string_query_with_default_operand_and() {
        let query_string_query = crate::elastic_query_dsl::QueryStringQuery {
            query: "hello world".to_string(),
            fields: Some(Vec::new()),
            default_field: None,
            default_operator: crate::BooleanOperand::And,
            boost: None,
            lenient: false,
        };
        let QueryAst::UserInput(user_input_query) =
            query_string_query.convert_to_query_ast().unwrap()
        else {
            panic!();
        };
        assert_eq!(user_input_query.default_operator, BooleanOperand::And);
    }

    #[test]
    fn test_build_query_string_query_with_empty_default_field() {
        let query_string_query = crate::elastic_query_dsl::QueryStringQuery {
            query: "hello world".to_string(),
            fields: Some(Vec::new()),
            default_field: None,
            default_operator: crate::BooleanOperand::Or,
            boost: None,
            lenient: false,
        };
        let QueryAst::UserInput(user_input_query) =
            query_string_query.convert_to_query_ast().unwrap()
        else {
            panic!();
        };
        assert_eq!(user_input_query.default_operator, BooleanOperand::Or);
        assert!(user_input_query.default_fields.unwrap().is_empty());
    }

    #[test]
    fn test_build_query_string_query_no_default_fields() {
        let query_string_query = crate::elastic_query_dsl::QueryStringQuery {
            query: "hello world".to_string(),
            fields: None,
            default_field: None,
            default_operator: crate::BooleanOperand::Or,
            boost: None,
            lenient: false,
        };
        let QueryAst::UserInput(user_input_query) =
            query_string_query.convert_to_query_ast().unwrap()
        else {
            panic!();
        };
        assert!(user_input_query.default_fields.is_none());
    }

    #[test]
    fn test_build_query_string_default_operator() {
        let query_string_query: QueryStringQuery =
            serde_json::from_str(r#"{ "query": "hello world", "fields": ["text"] }"#).unwrap();
        // By default the default operator is OR in elasticsearch and opensearch.
        assert_eq!(query_string_query.default_operator, BooleanOperand::Or);
        assert_eq!(query_string_query.fields, Some(vec!["text".to_string()]));
        assert_eq!(&query_string_query.query, "hello world");
        assert_eq!(query_string_query.boost, None);
        let query_ast: QueryAst = query_string_query.convert_to_query_ast().unwrap();
        assert!(matches!(query_ast, QueryAst::UserInput(UserInputQuery {
            user_text,
            default_fields,
            default_operator,
            lenient: _,
        }) if user_text == "hello world"
            && default_operator == BooleanOperand::Or
            && default_fields == Some(vec!["text".to_string()])));
    }
}


================================================
FILE: quickwit/quickwit-query/src/elastic_query_dsl/range_query.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::ops::Bound;

use quickwit_datetime::StrptimeParser;
use serde::Deserialize;
use time::format_description::well_known::Rfc3339;

use crate::JsonLiteral;
use crate::elastic_query_dsl::ConvertibleToQueryAst;
use crate::elastic_query_dsl::one_field_map::OneFieldMap;
use crate::not_nan_f32::NotNaNf32;
use crate::query_ast::QueryAst;

#[derive(Deserialize, Debug, Default, Eq, PartialEq, Clone)]
#[serde(deny_unknown_fields)]
pub struct RangeQueryParams {
    #[serde(default)]
    gt: Option<JsonLiteral>,
    #[serde(default)]
    gte: Option<JsonLiteral>,
    #[serde(default)]
    lt: Option<JsonLiteral>,
    #[serde(default)]
    lte: Option<JsonLiteral>,
    #[serde(default)]
    boost: Option<NotNaNf32>,
    #[serde(default)]
    format: Option<JsonLiteral>,
    #[serde(default)]
    from: Option<JsonLiteral>,
    #[serde(default)]
    to: Option<JsonLiteral>,
    #[serde(default)]
    include_lower: Option<bool>,
    #[serde(default)]
    include_upper: Option<bool>,
}

pub type RangeQuery = OneFieldMap<RangeQueryParams>;

impl ConvertibleToQueryAst for RangeQuery {
    fn convert_to_query_ast(self) -> anyhow::Result<QueryAst> {
        let field = self.field;
        let RangeQueryParams {
            gt,
            gte,
            lt,
            lte,
            boost,
            format,
            from,
            to,
            include_lower,
            include_upper,
        } = self.value;

        let (mut gt, mut gte, mut lt, mut lte) = (gt, gte, lt, lte);
        if let Some(from_val) = from
            && gt.is_none()
            && gte.is_none()
        {
            if include_lower.unwrap_or(true) {
                gte = Some(from_val);
            } else {
                gt = Some(from_val);
            }
        }
        if let Some(to_val) = to
            && lt.is_none()
            && lte.is_none()
        {
            if include_upper.unwrap_or(true) {
                lte = Some(to_val);
            } else {
                lt = Some(to_val);
            }
        }

        let (gt, gte, lt, lte) = if let Some(JsonLiteral::String(java_date_format)) = format {
            let parser = StrptimeParser::from_java_datetime_format(&java_date_format)
                .map_err(|err| anyhow::anyhow!("failed to parse range query date format. {err}"))?;
            (
                gt.map(|v| parse_and_convert(v, &parser)).transpose()?,
                gte.map(|v| parse_and_convert(v, &parser)).transpose()?,
                lt.map(|v| parse_and_convert(v, &parser)).transpose()?,
                lte.map(|v| parse_and_convert(v, &parser)).transpose()?,
            )
        } else {
            (gt, gte, lt, lte)
        };

        let range_query_ast = crate::query_ast::RangeQuery {
            field,
            lower_bound: match (gt, gte) {
                (Some(_gt), Some(_gte)) => {
                    anyhow::bail!("both gt and gte are set")
                }
                (Some(gt), None) => Bound::Excluded(gt),
                (None, Some(gte)) => Bound::Included(gte),
                (None, None) => Bound::Unbounded,
            },
            upper_bound: match (lt, lte) {
                (Some(_lt), Some(_lte)) => {
                    anyhow::bail!("both lt and lte are set")
                }
                (Some(lt), None) => Bound::Excluded(lt),
                (None, Some(lte)) => Bound::Included(lte),
                (None, None) => Bound::Unbounded,
            },
        };
        let ast: QueryAst = range_query_ast.into();
        Ok(ast.boost(boost))
    }
}

fn parse_and_convert(literal: JsonLiteral, parser: &StrptimeParser) -> anyhow::Result<JsonLiteral> {
    if let JsonLiteral::String(date_time_str) = literal {
        let parsed_date_time = parser
            .parse_date_time(&date_time_str)
            .map_err(|reason| anyhow::anyhow!("Failed to parse date time: {}", reason))?;
        let parsed_date_time_rfc3339 = parsed_date_time.format(&Rfc3339)?;
        Ok(JsonLiteral::String(parsed_date_time_rfc3339))
    } else {
        Ok(literal)
    }
}

#[cfg(test)]
mod tests {
    use std::ops::Bound;

    use super::{RangeQuery as ElasticRangeQuery, RangeQueryParams as ElasticRangeQueryParams};
    use crate::JsonLiteral;
    use crate::elastic_query_dsl::ConvertibleToQueryAst;
    use crate::query_ast::{QueryAst, RangeQuery};

    #[test]
    fn test_date_range_query_with_format() {
        let range_query_params = ElasticRangeQueryParams {
            gt: Some(JsonLiteral::String("2021-01-03T13:32:43".to_string())),
            gte: None,
            lt: None,
            lte: None,
            boost: None,
            format: JsonLiteral::String("yyyy-MM-dd['T'HH:mm:ss]".to_string()).into(),
            ..Default::default()
        };
        let range_query: ElasticRangeQuery = ElasticRangeQuery {
            field: "date".to_string(),
            value: range_query_params,
        };
        let range_query_ast = range_query.convert_to_query_ast().unwrap();
        assert!(matches!(
            range_query_ast,
            QueryAst::Range(RangeQuery {
                field,
                lower_bound: Bound::Excluded(lower_bound),
                upper_bound: Bound::Unbounded,
            })
            if field == "date" && lower_bound == JsonLiteral::String("2021-01-03T13:32:43Z".to_string())
        ));
    }

    fn into_json_number(n: u64) -> JsonLiteral {
        JsonLiteral::Number(serde_json::Number::from(n))
    }

    #[test]
    fn test_range_query_with_from_to_inclusive() {
        let range_json =
            r#"{"score": {"from": 50, "to": 100, "include_lower": true, "include_upper": true}}"#;
        let range_query: ElasticRangeQuery = serde_json::from_str(range_json).unwrap();
        let ast = range_query.convert_to_query_ast().unwrap();
        let QueryAst::Range(rq) = ast else {
            panic!("expected Range, got {ast:?}");
        };
        assert_eq!(rq.field, "score");
        assert_eq!(rq.lower_bound, Bound::Included(into_json_number(50)));
        assert_eq!(rq.upper_bound, Bound::Included(into_json_number(100)));
    }

    #[test]
    fn test_range_query_with_from_to_exclusive() {
        let range_json =
            r#"{"score": {"from": 50, "to": 100, "include_lower": false, "include_upper": false}}"#;
        let range_query: ElasticRangeQuery = serde_json::from_str(range_json).unwrap();
        let ast = range_query.convert_to_query_ast().unwrap();
        let QueryAst::Range(rq) = ast else {
            panic!("expected Range, got {ast:?}");
        };
        assert_eq!(rq.field, "score");
        assert_eq!(rq.lower_bound, Bound::Excluded(into_json_number(50)));
        assert_eq!(rq.upper_bound, Bound::Excluded(into_json_number(100)));
    }

    #[test]
    fn test_range_query_with_from_to_defaults() {
        let range_json = r#"{"score": {"from": 50, "to": 100}}"#;
        let range_query: ElasticRangeQuery = serde_json::from_str(range_json).unwrap();
        let ast = range_query.convert_to_query_ast().unwrap();
        let QueryAst::Range(rq) = ast else {
            panic!("expected Range, got {ast:?}");
        };
        assert_eq!(rq.field, "score");
        assert_eq!(rq.lower_bound, Bound::Included(into_json_number(50)));
        assert_eq!(rq.upper_bound, Bound::Included(into_json_number(100)));
    }

    #[test]
    fn test_date_range_query_with_strict_date_optional_time_format() {
        let range_query_params = ElasticRangeQueryParams {
            gt: None,
            gte: None,
            lt: None,
            lte: Some(JsonLiteral::String("2024-09-28T10:22:55.797Z".to_string())),
            boost: None,
            format: JsonLiteral::String("strict_date_optional_time".to_string()).into(),
            ..Default::default()
        };
        let range_query: ElasticRangeQuery = ElasticRangeQuery {
            field: "timestamp".to_string(),
            value: range_query_params,
        };
        let range_query_ast = range_query.convert_to_query_ast().unwrap();
        assert!(matches!(
            range_query_ast,
            QueryAst::Range(RangeQuery {
                field,
                lower_bound: Bound::Unbounded,
                upper_bound: Bound::Included(upper_bound),
            })
            if field == "timestamp" && upper_bound == JsonLiteral::String("2024-09-28T10:22:55.797Z".to_string())
        ));
    }
}


================================================
FILE: quickwit/quickwit-query/src/elastic_query_dsl/regex_query.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use serde::Deserialize;

use crate::elastic_query_dsl::ConvertibleToQueryAst;
use crate::elastic_query_dsl::one_field_map::OneFieldMap;
use crate::query_ast::{QueryAst, RegexQuery as AstRegexQuery};

/// Elasticsearch supports two formats for regexp queries:
/// - Shorthand: `{"regexp": {"field": "pattern"}}`
/// - Full:      `{"regexp": {"field": {"value": "pattern", "case_insensitive": true}}}`
#[derive(Deserialize, Debug, Eq, PartialEq, Clone)]
#[serde(untagged)]
pub enum RegexQueryParams {
    Full {
        #[serde(rename = "value")]
        pattern: String,
        #[serde(default)]
        case_insensitive: bool,
    },
    Shorthand(String),
}

impl RegexQueryParams {
    fn into_tuple(self) -> (String, bool) {
        match self {
            RegexQueryParams::Full {
                pattern,
                case_insensitive,
            } => (pattern, case_insensitive),
            RegexQueryParams::Shorthand(pattern) => (pattern, false),
        }
    }
}

pub type RegexQuery = OneFieldMap<RegexQueryParams>;

impl ConvertibleToQueryAst for RegexQuery {
    fn convert_to_query_ast(self) -> anyhow::Result<QueryAst> {
        let (pattern, case_insensitive) = self.value.into_tuple();

        let regex = if case_insensitive {
            format!("(?i){pattern}")
        } else {
            pattern
        };
        Ok(AstRegexQuery {
            field: self.field,
            regex,
        }
        .into())
    }
}

#[cfg(test)]
mod tests {
    use super::*;

    #[test]
    fn test_regex_query_shorthand_format() {
        let json = serde_json::json!({"service": ".*logs.*"});
        let query: RegexQuery = serde_json::from_value(json).unwrap();
        assert_eq!(query.field, "service");
        let (pattern, case_insensitive) = query.value.into_tuple();
        assert_eq!(pattern, ".*logs.*");
        assert!(!case_insensitive);
    }

    #[test]
    fn test_regex_query_full_format() {
        let json = serde_json::json!({"service": {"value": ".*logs.*", "case_insensitive": true}});
        let query: RegexQuery = serde_json::from_value(json).unwrap();
        assert_eq!(query.field, "service");
        let (pattern, case_insensitive) = query.value.into_tuple();
        assert_eq!(pattern, ".*logs.*");
        assert!(case_insensitive);
    }

    #[test]
    fn test_regex_query_full_format_default_case() {
        let json = serde_json::json!({"service": {"value": ".*logs.*"}});
        let query: RegexQuery = serde_json::from_value(json).unwrap();
        assert_eq!(query.field, "service");
        let (pattern, case_insensitive) = query.value.into_tuple();
        assert_eq!(pattern, ".*logs.*");
        assert!(!case_insensitive);
    }
}


================================================
FILE: quickwit/quickwit-query/src/elastic_query_dsl/string_or_struct.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::fmt;
use std::marker::PhantomData;

use serde::de::{MapAccess, Visitor};
use serde::{Deserialize, Deserializer, de};

/// The point of `StringOrStructForSerialization` is to support
/// the two following formats for various queries.
///
/// `{"field": {"query": "my query", "default_operator": "OR"}}`
///
/// and the shorter.
/// `{"field": "my query"}`
///
/// If a integer is passed, we cast it to string. Floats are not supported.
///
/// We don't use untagged enum to support this, in order to keep good errors.
///
/// The code below is adapted from solution described here: <https://serde.rs/string-or-struct.html>
#[derive(Deserialize)]
#[serde(transparent)]
pub(crate) struct StringOrStructForSerialization<T>
where
    T: From<String>,
    for<'de2> T: Deserialize<'de2>,
{
    #[serde(deserialize_with = "string_or_struct")]
    pub inner: T,
}

struct StringOrStructVisitor<T> {
    phantom_data: PhantomData<T>,
}

fn string_or_struct<'de, D, T>(deserializer: D) -> Result<T, D::Error>
where
    D: Deserializer<'de>,
    T: From<String> + Deserialize<'de>,
{
    deserializer.deserialize_any(StringOrStructVisitor {
        phantom_data: Default::default(),
    })
}

impl<'de, T> Visitor<'de> for StringOrStructVisitor<T>
where
    T: From<String>,
    T: Deserialize<'de>,
{
    type Value = T;

    fn expecting(&self, formatter: &mut fmt::Formatter) -> fmt::Result {
        let type_str = std::any::type_name::<T>();
        formatter.write_str(&format!("string or map to deserialize {type_str}."))
    }

    fn visit_i64<E>(self, v: i64) -> Result<Self::Value, E>
    where E: de::Error {
        self.visit_str(&v.to_string())
    }

    fn visit_u64<E>(self, v: u64) -> Result<Self::Value, E>
    where E: de::Error {
        self.visit_str(&v.to_string())
    }

    fn visit_str<E>(self, query: &str) -> Result<Self::Value, E>
    where E: serde::de::Error {
        Ok(T::from(query.to_string()))
    }

    fn visit_map<M>(self, map: M) -> Result<T, M::Error>
    where M: MapAccess<'de> {
        Deserialize::deserialize(de::value::MapAccessDeserializer::new(map))
    }
}


================================================
FILE: quickwit/quickwit-query/src/elastic_query_dsl/term_query.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use serde::{Deserialize, Deserializer, Serialize};

use super::StringOrStructForSerialization;
use crate::elastic_query_dsl::one_field_map::OneFieldMap;
use crate::elastic_query_dsl::{ConvertibleToQueryAst, ElasticQueryDslInner};
use crate::not_nan_f32::NotNaNf32;
use crate::query_ast::{self, QueryAst};

#[derive(Deserialize, Debug, PartialEq, Eq, Clone)]
#[serde(from = "OneFieldMap<StringOrStructForSerialization<TermQueryParams>>")]
pub struct TermQuery {
    pub field: String,
    pub value: TermQueryParams,
}

impl From<OneFieldMap<StringOrStructForSerialization<TermQueryParams>>> for TermQuery {
    fn from(one_field_map: OneFieldMap<StringOrStructForSerialization<TermQueryParams>>) -> Self {
        TermQuery {
            field: one_field_map.field,
            value: one_field_map.value.inner,
        }
    }
}

impl From<String> for TermQueryParams {
    fn from(query: String) -> TermQueryParams {
        TermQueryParams {
            value: query,
            boost: None,
            case_insensitive: false,
        }
    }
}

#[derive(Deserialize)]
#[serde(untagged)]
enum TermValue {
    I64(i64),
    U64(u64),
    Str(String),
}

fn deserialize_term_value<'de, D>(deserializer: D) -> Result<String, D::Error>
where D: Deserializer<'de> {
    let term_value = TermValue::deserialize(deserializer)?;
    match term_value {
        TermValue::I64(i64) => Ok(i64.to_string()),
        TermValue::U64(u64) => Ok(u64.to_string()),
        TermValue::Str(str) => Ok(str),
    }
}

#[derive(PartialEq, Eq, Debug, Serialize, Deserialize, Clone)]
#[serde(deny_unknown_fields)]
pub struct TermQueryParams {
    #[serde(deserialize_with = "deserialize_term_value")]
    pub value: String,
    #[serde(default)]
    pub boost: Option<NotNaNf32>,
    #[serde(default)]
    case_insensitive: bool,
}

#[cfg(test)]
pub fn term_query_from_field_value(field: impl ToString, value: impl ToString) -> TermQuery {
    TermQuery {
        field: field.to_string(),
        value: TermQueryParams {
            value: value.to_string(),
            boost: None,
            case_insensitive: false,
        },
    }
}

impl From<TermQuery> for ElasticQueryDslInner {
    fn from(term_query: TermQuery) -> Self {
        Self::Term(term_query)
    }
}

impl ConvertibleToQueryAst for TermQuery {
    fn convert_to_query_ast(self) -> anyhow::Result<QueryAst> {
        let TermQueryParams {
            value,
            boost,
            case_insensitive,
        } = self.value;
        if case_insensitive {
            let ci_value = format!("(?i){}", regex::escape(&value));
            let term_ast: QueryAst = query_ast::RegexQuery {
                field: self.field,
                regex: ci_value,
            }
            .into();
            return Ok(term_ast.boost(boost));
        }
        let term_ast: QueryAst = query_ast::TermQuery {
            field: self.field,
            value,
        }
        .into();
        Ok(term_ast.boost(boost))
    }
}

#[cfg(test)]
mod tests {
    use super::*;

    #[test]
    fn test_term_query_simple() {
        let term_query_json = r#"{ "product_id": { "value": "61809" } }"#;
        let term_query: TermQuery = serde_json::from_str(term_query_json).unwrap();
        assert_eq!(
            &term_query,
            &term_query_from_field_value("product_id", "61809")
        );
    }

    #[test]
    fn test_term_query_deserialization_in_short_format() {
        let term_query: TermQuery = serde_json::from_str(
            r#"{
            "product_id": "61809"
        }"#,
        )
        .unwrap();
        assert_eq!(
            &term_query,
            &term_query_from_field_value("product_id", "61809")
        );
    }
}


================================================
FILE: quickwit/quickwit-query/src/elastic_query_dsl/terms_query.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::{BTreeSet, HashMap};

use serde::Deserialize;

use crate::elastic_query_dsl::one_field_map::OneFieldMap;
use crate::elastic_query_dsl::{ConvertibleToQueryAst, ElasticQueryDslInner};
use crate::not_nan_f32::NotNaNf32;
use crate::query_ast::{QueryAst, TermSetQuery};

#[derive(PartialEq, Eq, Debug, Deserialize, Clone)]
#[serde(try_from = "TermsQueryForSerialization")]
pub struct TermsQuery {
    pub boost: Option<NotNaNf32>,
    pub field: String,
    pub values: Vec<String>,
}

#[derive(Deserialize)]
struct TermsQueryForSerialization {
    #[serde(default)]
    boost: Option<NotNaNf32>,
    #[serde(flatten)]
    capture_other: serde_json::Value,
}

#[derive(Deserialize)]
#[serde(untagged)]
enum TermValue {
    I64(i64),
    U64(u64),
    Str(String),
}

impl From<TermValue> for String {
    fn from(term_value: TermValue) -> String {
        match term_value {
            TermValue::I64(val) => val.to_string(),
            TermValue::U64(val) => val.to_string(),
            TermValue::Str(val) => val,
        }
    }
}

#[derive(Deserialize)]
#[serde(untagged)]
enum OneOrMany {
    One(TermValue),
    Many(Vec<TermValue>),
}

impl From<OneOrMany> for Vec<String> {
    fn from(one_or_many: OneOrMany) -> Vec<String> {
        match one_or_many {
            OneOrMany::One(one_value) => vec![String::from(one_value)],
            OneOrMany::Many(values) => values.into_iter().map(String::from).collect(),
        }
    }
}

impl TryFrom<TermsQueryForSerialization> for TermsQuery {
    type Error = serde_json::Error;

    fn try_from(value: TermsQueryForSerialization) -> serde_json::Result<TermsQuery> {
        let one_field: OneFieldMap<OneOrMany> = serde_json::from_value(value.capture_other)?;
        let one_field_values: Vec<String> = one_field.value.into();
        Ok(TermsQuery {
            boost: value.boost,
            field: one_field.field,
            values: one_field_values,
        })
    }
}

impl ConvertibleToQueryAst for TermsQuery {
    fn convert_to_query_ast(self) -> anyhow::Result<QueryAst> {
        let mut terms_per_field = HashMap::new();
        let values_set: BTreeSet<String> = self.values.into_iter().collect();
        terms_per_field.insert(self.field, values_set);

        let term_set_query = TermSetQuery { terms_per_field };
        let query_ast: QueryAst = term_set_query.into();

        Ok(query_ast.boost(self.boost))
    }
}

impl From<TermsQuery> for ElasticQueryDslInner {
    fn from(term_query: TermsQuery) -> Self {
        Self::Terms(term_query)
    }
}

#[cfg(test)]
mod tests {
    use super::*;

    #[test]
    fn test_terms_query_simple() {
        let terms_query_json = r#"{ "user.id": ["hello", "happy"] }"#;
        let terms_query: TermsQuery = serde_json::from_str(terms_query_json).unwrap();
        assert_eq!(&terms_query.field, "user.id");
        assert_eq!(
            &terms_query.values[..],
            &["hello".to_string(), "happy".to_string()]
        );
    }

    #[test]
    fn test_terms_query_single_term_not_array() {
        let terms_query_json = r#"{ "user.id": "hello"}"#;
        let terms_query: TermsQuery = serde_json::from_str(terms_query_json).unwrap();
        assert_eq!(&terms_query.field, "user.id");
        assert_eq!(&terms_query.values[..], &["hello".to_string()]);
    }

    #[test]
    fn test_terms_query_not_string() {
        let terms_query_json = r#"{ "user.id": [1, 2] }"#;
        let terms_query: TermsQuery = serde_json::from_str(terms_query_json).unwrap();
        assert_eq!(&terms_query.field, "user.id");
        assert_eq!(&terms_query.values[..], &["1".to_string(), "2".to_string()]);
    }

    #[test]
    fn test_terms_query_single_term_boost() {
        let terms_query_json = r#"{ "user.id": ["hello", "happy"], "boost": 2 }"#;
        let terms_query: TermsQuery = serde_json::from_str(terms_query_json).unwrap();
        assert_eq!(&terms_query.field, "user.id");
        assert_eq!(
            &terms_query.values[..],
            &["hello".to_string(), "happy".to_string()]
        );
        let boost: f32 = terms_query.boost.unwrap().into();
        assert!((boost - 2.0f32).abs() < 0.0001f32);
    }
}


================================================
FILE: quickwit/quickwit-query/src/elastic_query_dsl/visitor.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use crate::match_all::MatchAllQuery;
use crate::match_none::MatchNoneQuery;
use crate::query_string_query::QueryStringQuery;
use crate::range_query::RangeQuery;
use crate::term_query::TermQuery;
use crate::QueryDsl;

pub trait QueryDslVisitor<'a> {
    type Err;

    fn visit(&mut self, query_dsl: &'a QueryDsl) -> Result<(), Self::Err> {
        match query_dsl {
            QueryDsl::QueryString(query_string_query) => {
                self.visit_query_string(query_string_query)
            }
            QueryDsl::Bool(bool_query) => self.visit_bool_query(bool_query),
            QueryDsl::Term(term_query) => self.visit_term(term_query),
            QueryDsl::MatchAll(just_boost) => self.visit_match_all(just_boost),
            QueryDsl::MatchNone(match_none) => self.visit_match_none(match_none),
            QueryDsl::Range(range_query) => self.visit_range(range_query),
        }
    }

    fn visit_query_string(
        &mut self,
        _query_string_query: &'a QueryStringQuery,
    ) -> Result<(), Self::Err> {
        Ok(())
    }

    fn visit_bool_query(&mut self, bool_query: &'a BoolQuery) -> Result<(), Self::Err> {
        for ast in bool_query
            .must
            .iter()
            .chain(bool_query.should.iter())
            .chain(bool_query.must_not.iter())
            .chain(bool_query.filter.iter())
        {
            self.visit(ast)?;
        }
        Ok(())
    }

    fn visit_term(&mut self, _term_query: &'a TermQuery) -> Result<(), Self::Err> {
        Ok(())
    }

    fn visit_match_all(&mut self, _match_all: &'a MatchAllQuery) -> Result<(), Self::Err> {
        Ok(())
    }

    fn visit_match_none(&mut self, _match_none: &'a MatchNoneQuery) -> Result<(), Self::Err> {
        Ok(())
    }

    fn visit_range(&mut self, _range_query: &'a RangeQuery) -> Result<(), Self::Err> {
        Ok(())
    }
}


================================================
FILE: quickwit/quickwit-query/src/elastic_query_dsl/wildcard_query.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use serde::Deserialize;

use crate::NotNaNf32;
use crate::elastic_query_dsl::one_field_map::OneFieldMap;
use crate::elastic_query_dsl::{ConvertibleToQueryAst, StringOrStructForSerialization};
use crate::query_ast::{QueryAst, WildcardQuery as AstWildcardQuery};

#[derive(Deserialize, Clone, Eq, PartialEq, Debug)]
#[serde(from = "OneFieldMap<StringOrStructForSerialization<WildcardQueryParams>>")]
pub(crate) struct WildcardQuery {
    pub(crate) field: String,
    pub(crate) params: WildcardQueryParams,
}

#[derive(Deserialize, Debug, Default, Eq, PartialEq, Clone)]
#[serde(deny_unknown_fields)]
pub struct WildcardQueryParams {
    value: String,
    #[serde(default)]
    pub boost: Option<NotNaNf32>,
    #[serde(default)]
    case_insensitive: bool,
}

impl ConvertibleToQueryAst for WildcardQuery {
    fn convert_to_query_ast(self) -> anyhow::Result<QueryAst> {
        let wildcard_ast: QueryAst = AstWildcardQuery {
            field: self.field,
            value: self.params.value,
            lenient: true,
            case_insensitive: self.params.case_insensitive,
        }
        .into();
        Ok(wildcard_ast.boost(self.params.boost))
    }
}

impl From<OneFieldMap<StringOrStructForSerialization<WildcardQueryParams>>> for WildcardQuery {
    fn from(
        match_query_params: OneFieldMap<StringOrStructForSerialization<WildcardQueryParams>>,
    ) -> Self {
        let OneFieldMap { field, value } = match_query_params;
        WildcardQuery {
            field,
            params: value.inner,
        }
    }
}

impl From<String> for WildcardQueryParams {
    fn from(value: String) -> WildcardQueryParams {
        WildcardQueryParams {
            value,
            boost: None,
            case_insensitive: false,
        }
    }
}

#[cfg(test)]
mod tests {
    use super::*;

    #[test]
    fn test_wildcard_query_convert_to_query_ast() {
        let wildcard_query_json = r#"{
            "user_name": {
                "value": "john*"
            }
        }"#;
        let wildcard_query: WildcardQuery = serde_json::from_str(wildcard_query_json).unwrap();
        let query_ast = wildcard_query.convert_to_query_ast().unwrap();

        if let QueryAst::Wildcard(wildcard) = query_ast {
            assert_eq!(wildcard.field, "user_name");
            assert_eq!(wildcard.value, "john*");
            assert!(wildcard.lenient);
        } else {
            panic!("Expected QueryAst::Wildcard");
        }
    }

    #[test]
    fn test_boosted_wildcard_query_convert_to_query_ast() {
        let wildcard_query_json = r#"{
            "user_name": {
                "value": "john*",
                "boost": 2.0
            }
        }"#;
        let wildcard_query: WildcardQuery = serde_json::from_str(wildcard_query_json).unwrap();
        let query_ast = wildcard_query.convert_to_query_ast().unwrap();

        if let QueryAst::Boost { underlying, boost } = query_ast {
            if let QueryAst::Wildcard(wildcard) = *underlying {
                assert_eq!(wildcard.field, "user_name");
                assert_eq!(wildcard.value, "john*");
                assert!(wildcard.lenient);
            } else {
                panic!("Expected underlying QueryAst::Wildcard");
            }
            assert_eq!(boost, NotNaNf32::try_from(2.0).unwrap());
        } else {
            panic!("Expected QueryAst::Wildcard");
        }
    }
}


================================================
FILE: quickwit/quickwit-query/src/error.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use thiserror::Error;

#[derive(Error, Debug)]
pub enum InvalidQuery {
    #[error("query is incompatible with schema. {0})")]
    SchemaError(String),
    #[error("expected `{expected_value_type}` boundary for field `{field_name}`")]
    InvalidBoundary {
        expected_value_type: &'static str,
        field_name: String,
    },
    #[error(
        "expected a `{expected_value_type}` search value for field `{field_name}`, got `{value}`"
    )]
    InvalidSearchTerm {
        expected_value_type: &'static str,
        field_name: String,
        value: String,
    },
    #[error("range query on `{value_type}` field (`{field_name}`) forbidden")]
    RangeQueryNotSupportedForField {
        value_type: &'static str,
        field_name: String,
    },
    #[error("field does not exist: `{full_path}`")]
    FieldDoesNotExist { full_path: String },
    #[error("Json field root is not a valid search field: `{full_path}`")]
    JsonFieldRootNotSearchable { full_path: String },
    #[error("user query should have been parsed")]
    UserQueryNotParsed,
    #[error("{0}")]
    Other(#[from] anyhow::Error),
}


================================================
FILE: quickwit/quickwit-query/src/json_literal.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::net::{IpAddr, Ipv6Addr};
use std::str::FromStr;

use base64::Engine;
use once_cell::sync::OnceCell;
use quickwit_datetime::{DateTimeInputFormat, parse_date_time_str, parse_timestamp};
use serde::{Deserialize, Serialize};
use tantivy::schema::IntoIpv6Addr;

fn get_default_date_time_format() -> &'static [DateTimeInputFormat] {
    static DEFAULT_DATE_TIME_FORMATS: OnceCell<Vec<DateTimeInputFormat>> = OnceCell::new();
    DEFAULT_DATE_TIME_FORMATS
        .get_or_init(|| {
            vec![
                DateTimeInputFormat::Rfc3339,
                DateTimeInputFormat::Rfc2822,
                DateTimeInputFormat::Timestamp,
                DateTimeInputFormat::from_str("%Y-%m-%dT%H:%M:%S").unwrap(),
                DateTimeInputFormat::from_str("%Y-%m-%d %H:%M:%S.%f").unwrap(),
                DateTimeInputFormat::from_str("%Y-%m-%d %H:%M:%S").unwrap(),
                DateTimeInputFormat::from_str("%Y-%m-%d").unwrap(),
                DateTimeInputFormat::from_str("%Y/%m/%d").unwrap(),
            ]
        })
        .as_slice()
}

#[derive(Serialize, Deserialize, Eq, PartialEq, Clone, Debug)]
#[serde(untagged)]
pub enum JsonLiteral {
    Number(serde_json::Number),
    // String is a bit special.
    //
    // It can either mean it was passed as a string by the user (via the es query dsl for
    // instance), or it can mean its type is unknown as it was parsed out of tantivy's query
    // language.
    //
    // We have decided to not make a difference at the moment.
    String(String),
    Bool(bool),
}

pub trait InterpretUserInput<'a>: Sized {
    fn interpret_json(user_input: &'a JsonLiteral) -> Option<Self> {
        match user_input {
            JsonLiteral::Number(number) => Self::interpret_number(number),
            JsonLiteral::String(str_val) => Self::interpret_str(str_val),
            JsonLiteral::Bool(bool_val) => Self::interpret_bool(*bool_val),
        }
    }

    fn interpret_number(_number: &serde_json::Number) -> Option<Self> {
        None
    }

    fn interpret_bool(_bool: bool) -> Option<Self> {
        None
    }
    fn interpret_str(_text: &'a str) -> Option<Self> {
        None
    }

    fn name() -> &'static str {
        std::any::type_name::<Self>()
    }
}

impl<'a> InterpretUserInput<'a> for &'a str {
    fn interpret_str(text: &'a str) -> Option<Self> {
        Some(text)
    }
}

impl<'a> InterpretUserInput<'a> for u64 {
    fn interpret_number(number: &serde_json::Number) -> Option<Self> {
        number.as_u64()
    }

    fn interpret_str(text: &'a str) -> Option<Self> {
        text.parse().ok()
    }
}

impl<'a> InterpretUserInput<'a> for i64 {
    fn interpret_number(number: &serde_json::Number) -> Option<Self> {
        number.as_i64()
    }

    fn interpret_str(text: &'a str) -> Option<Self> {
        text.parse().ok()
    }
}

// We refuse NaN and infinity.
impl<'a> InterpretUserInput<'a> for f64 {
    fn interpret_number(number: &serde_json::Number) -> Option<Self> {
        let val = number.as_f64()?;
        if val.is_nan() || val.is_infinite() {
            return None;
        }
        Some(val)
    }

    fn interpret_str(text: &'a str) -> Option<f64> {
        let val: f64 = text.parse().ok()?;
        if val.is_nan() || val.is_infinite() {
            return None;
        }
        Some(val)
    }
}

impl InterpretUserInput<'_> for bool {
    fn interpret_bool(b: bool) -> Option<Self> {
        Some(b)
    }

    fn interpret_str(text: &str) -> Option<Self> {
        text.parse().ok()
    }
}

impl InterpretUserInput<'_> for Ipv6Addr {
    fn interpret_str(text: &str) -> Option<Self> {
        let ip_addr: IpAddr = text.parse().ok()?;
        Some(ip_addr.into_ipv6_addr())
    }
}

impl InterpretUserInput<'_> for tantivy::DateTime {
    fn interpret_str(text: &str) -> Option<Self> {
        let date_time_formats = get_default_date_time_format();
        if let Ok(datetime) = parse_date_time_str(text, date_time_formats) {
            return Some(datetime);
        }
        // Parsing the normal string formats failed.
        // Maybe it is actually a timestamp as a string?
        let possible_timestamp = text.parse::<i64>().ok()?;
        parse_timestamp(possible_timestamp).ok()
    }

    fn interpret_number(number: &serde_json::Number) -> Option<Self> {
        let possible_timestamp = number.as_i64()?;
        parse_timestamp(possible_timestamp).ok()
    }
}

/// Lenient base64 engine that allows users to use padding or not.
const LENIENT_BASE64_ENGINE: base64::engine::GeneralPurpose = base64::engine::GeneralPurpose::new(
    &base64::alphabet::STANDARD,
    base64::engine::GeneralPurposeConfig::new()
        .with_decode_padding_mode(base64::engine::DecodePaddingMode::Indifferent),
);

impl InterpretUserInput<'_> for Vec<u8> {
    fn interpret_str(mut text: &str) -> Option<Vec<u8>> {
        let Some(first_byte) = text.as_bytes().first().copied() else {
            return Some(Vec::new());
        };
        let mut buffer = Vec::with_capacity(text.len() * 3 / 4);
        if first_byte == b'!' {
            // We use ! as a marker to force base64 decoding.
            text = &text[1..];
        } else {
            buffer.resize(text.len() / 2, 0u8);
            if hex::decode_to_slice(text, &mut buffer[..]).is_ok() {
                return Some(buffer);
            }
            buffer.clear();
        }
        LENIENT_BASE64_ENGINE.decode_vec(text, &mut buffer).ok()?;
        Some(buffer)
    }
}

impl From<bool> for JsonLiteral {
    fn from(b: bool) -> JsonLiteral {
        JsonLiteral::Bool(b)
    }
}

impl From<String> for JsonLiteral {
    fn from(s: String) -> JsonLiteral {
        JsonLiteral::String(s)
    }
}

impl From<u64> for JsonLiteral {
    fn from(number: u64) -> JsonLiteral {
        JsonLiteral::Number(number.into())
    }
}

impl From<i64> for JsonLiteral {
    fn from(number: i64) -> JsonLiteral {
        JsonLiteral::Number(number.into())
    }
}

#[cfg(test)]
mod tests {
    use tantivy::DateTime;
    use time::macros::datetime;

    use crate::JsonLiteral;
    use crate::json_literal::InterpretUserInput;

    #[test]
    fn test_interpret_str_u64() {
        let val_opt = u64::interpret_str("123");
        assert_eq!(val_opt, Some(123u64));
    }

    #[test]
    fn test_interpret_datetime_simple_date() {
        let dt_opt = DateTime::interpret_json(&JsonLiteral::String("2023-05-25".to_string()));
        let expected_datetime = datetime!(2023-05-25 00:00 UTC);
        assert_eq!(dt_opt, Some(DateTime::from_utc(expected_datetime)));
    }

    #[test]
    fn test_interpret_datetime_rfc3339_with_no_timezone() {
        let dt_opt =
            DateTime::interpret_json(&JsonLiteral::String("2023-05-25T18:00:00".to_string()));
        let expected_datetime = datetime!(2023-05-25 18:00 UTC);
        assert_eq!(dt_opt, Some(DateTime::from_utc(expected_datetime)));
    }

    #[test]
    fn test_interpret_datetime_fractional_millis() {
        let dt_opt =
            DateTime::interpret_json(&JsonLiteral::String("2023-05-25 10:20:11.322".to_string()));
        let expected_datetime = datetime!(2023-05-25 10:20:11.322 UTC);
        assert_eq!(dt_opt, Some(DateTime::from_utc(expected_datetime)));
    }

    #[test]
    fn test_interpret_datetime_unix_timestamp_as_string() {
        let dt_opt = DateTime::interpret_json(&JsonLiteral::String("1685086013".to_string()));
        let expected_datetime = datetime!(2023-05-26 07:26:53 UTC);
        assert_eq!(dt_opt, Some(DateTime::from_utc(expected_datetime)));
    }

    #[test]
    fn test_interpret_datetime_unix_timestamp_as_number() {
        let dt_opt = DateTime::interpret_json(&JsonLiteral::Number(1685086013.into()));
        let expected_datetime = datetime!(2023-05-26 07:26:53 UTC);
        assert_eq!(dt_opt, Some(DateTime::from_utc(expected_datetime)));
    }

    #[test]
    fn test_interpret_bytes_base16_lowercase() {
        let bytes_opt = Vec::<u8>::interpret_str("deadbeef");
        assert_eq!(bytes_opt, Some(vec![0xde, 0xad, 0xbe, 0xef]));
    }

    #[test]
    fn test_interpret_bytes_base16_uppercase() {
        let bytes_opt = Vec::<u8>::interpret_str("DEADBEEF");
        assert_eq!(bytes_opt, Some(vec![0xde, 0xad, 0xbe, 0xef]));
    }

    #[test]
    fn test_interpret_bytes_base16_mixed_casing() {
        let bytes_opt = Vec::<u8>::interpret_str("dEadbeef");
        assert_eq!(bytes_opt, Some(vec![0xde, 0xad, 0xbe, 0xef]));
    }

    #[test]
    fn test_interpret_bytes_base64() {
        let decoded = Vec::<u8>::interpret_str("aGVsbG8=").unwrap();
        assert_eq!(decoded, b"hello");
    }

    #[test]
    fn test_interpret_force_ambiguous_base64() {
        let decoded = Vec::<u8>::interpret_str("!beef").unwrap();
        assert_eq!(decoded, &[109, 231, 159]);
    }

    #[test]
    fn test_interpret_with_and_without_padding() {
        let decoded_without_padding = Vec::<u8>::interpret_str("cQ").unwrap();
        let decoded_with_padding = Vec::<u8>::interpret_str("cQ").unwrap();
        assert_eq!(&decoded_with_padding, &decoded_without_padding);
        assert_eq!(&decoded_with_padding, b"q");
    }

    #[test]
    fn test_interpret_bytes_invalid() {
        assert!(Vec::<u8>::interpret_str("deadbeef@").is_none());
    }
}


================================================
FILE: quickwit/quickwit-query/src/lib.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

//! QueryDSL partially compatible with Elasticsearch/Opensearch QueryDSL.
//! See documentation here:
//! <https://www.elastic.co/guide/en/elasticsearch/reference/current/query-dsl.html>

// As you add queries in this file please insert it in the order of the OpenSearch 2.6
// documentation (the opensearch documentation has a nicer structure than that of ES).
// https://opensearch.org/docs/2.6/query-dsl/term/
//
// For the individual detailed API documentation however, you should refer to elastic
// documentation.

pub mod aggregations;
mod elastic_query_dsl;
mod error;
mod json_literal;
mod not_nan_f32;
pub mod query_ast;
pub mod tokenizers;

pub use elastic_query_dsl::{ElasticQueryDsl, OneFieldMap};
pub use error::InvalidQuery;
pub use json_literal::{InterpretUserInput, JsonLiteral};
pub(crate) use not_nan_f32::NotNaNf32;
pub use query_ast::utils::find_field_or_hit_dynamic;
use serde::{Deserialize, Serialize};
pub use tantivy::query::Query as TantivyQuery;
pub use tokenizers::{
    CodeTokenizer, DEFAULT_REMOVE_TOKEN_LENGTH, create_default_quickwit_tokenizer_manager,
    get_quickwit_fastfield_normalizer_manager,
};

#[derive(Serialize, Deserialize, Debug, Default, Copy, Clone, Eq, PartialEq)]
pub enum BooleanOperand {
    #[serde(alias = "AND")]
    And,
    #[default]
    #[serde(alias = "OR")]
    Or,
}

#[derive(Serialize, Deserialize, Debug, Copy, Clone, Eq, PartialEq, Default)]
pub enum MatchAllOrNone {
    #[serde(rename = "none")]
    #[default]
    MatchNone,
    #[serde(rename = "all")]
    MatchAll,
}

impl MatchAllOrNone {
    pub fn is_none(&self) -> bool {
        self == &MatchAllOrNone::MatchNone
    }
}


================================================
FILE: quickwit/quickwit-query/src/not_nan_f32.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use serde::{Deserialize, Serialize};

#[derive(Serialize, Deserialize, Debug, Copy, Clone, PartialEq)]
#[serde(into = "f32", try_from = "f32")]
pub struct NotNaNf32(f32);

impl NotNaNf32 {
    pub const ZERO: Self = NotNaNf32(0.0f32);
    pub const ONE: Self = NotNaNf32(1.0f32);
}

impl From<NotNaNf32> for f32 {
    fn from(not_nan_f32: NotNaNf32) -> f32 {
        not_nan_f32.0
    }
}

impl TryFrom<f32> for NotNaNf32 {
    type Error = &'static str;

    fn try_from(possibly_nan: f32) -> Result<NotNaNf32, &'static str> {
        if possibly_nan.is_nan() {
            return Err("NaN is not supported as a boost value");
        }
        Ok(NotNaNf32(possibly_nan))
    }
}

impl Eq for NotNaNf32 {}


================================================
FILE: quickwit/quickwit-query/src/query_ast/bool_query.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use serde::{Deserialize, Serialize};

use super::{BuildTantivyAst, BuildTantivyAstContext, TantivyQueryAst};
use crate::InvalidQuery;
use crate::query_ast::QueryAst;

/// # Unsupported features
/// - named queries
///
/// Edge cases of BooleanQuery are not obvious,
/// and different behavior could be justified.
///
/// Here we align ourselves with Elasticsearch.
/// A boolean query is to be interpreted like a filtering predicate
/// over the set of documents.
///
/// If all clauses are empty, then the full set of documents is returned.
/// Adding a match all must clause does not change the result of a boolean query.
#[derive(Serialize, Deserialize, Debug, PartialEq, Eq, Clone, Default)]
pub struct BoolQuery {
    #[serde(default, skip_serializing_if = "Vec::is_empty")]
    pub must: Vec<QueryAst>,
    #[serde(default, skip_serializing_if = "Vec::is_empty")]
    pub must_not: Vec<QueryAst>,
    #[serde(default, skip_serializing_if = "Vec::is_empty")]
    pub should: Vec<QueryAst>,
    #[serde(default, skip_serializing_if = "Vec::is_empty")]
    pub filter: Vec<QueryAst>,
    #[serde(default, skip_serializing_if = "Option::is_none")]
    pub minimum_should_match: Option<usize>,
}

impl From<BoolQuery> for QueryAst {
    fn from(bool_query: BoolQuery) -> Self {
        QueryAst::Bool(bool_query)
    }
}

impl BuildTantivyAst for BoolQuery {
    fn build_tantivy_ast_impl(
        &self,
        context: &BuildTantivyAstContext,
    ) -> Result<TantivyQueryAst, InvalidQuery> {
        let mut boolean_query = super::tantivy_query_ast::TantivyBoolQuery {
            minimum_should_match: self.minimum_should_match,
            ..Default::default()
        };
        for must in &self.must {
            let must_leaf = must.build_tantivy_ast_call(context)?;
            boolean_query.must.push(must_leaf);
        }
        for must_not in &self.must_not {
            let must_not_leaf = must_not.build_tantivy_ast_call(context)?;
            boolean_query.must_not.push(must_not_leaf);
        }
        for should in &self.should {
            let should_leaf = should.build_tantivy_ast_call(context)?;
            boolean_query.should.push(should_leaf);
        }
        for filter in &self.filter {
            let filter_leaf = filter.build_tantivy_ast_call(context)?;
            boolean_query.filter.push(filter_leaf);
        }
        Ok(TantivyQueryAst::Bool(boolean_query))
    }
}


================================================
FILE: quickwit/quickwit-query/src/query_ast/cache_node.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::sync::Arc;

use bitpacking::{BitPacker, BitPacker1x};
use quickwit_proto::types::SplitId;
use serde::{Deserialize, Serialize};

use super::{BuildTantivyAst, BuildTantivyAstContext, TantivyQueryAst};
use crate::InvalidQuery;
use crate::query_ast::QueryAst;

/// A node caching the result of an inner query.
///
/// This can be used when it's known that some sub-ast might appear in many queries,
/// or that the same query might be run, with various aggregations.
///
/// /!\ Sprinkling this everywhere can lead to performance degradations: the whole posting
/// list of the underlying query will need to be evaluated to build the cache, whereas it could
/// have been largely skipped if some other part of the query is very selective.
#[derive(Serialize, Deserialize, Debug, Clone)]
pub struct CacheNode {
    pub inner: Box<QueryAst>,
    #[serde(skip)]
    pub state: CacheState,
}

#[derive(Default, Clone)]
pub enum CacheState {
    // This is the state a CacheNode should be before
    #[default]
    Uninitialized,
    CacheHit(CacheEntry),
    CacheMiss(CacheFiller),
}

impl std::fmt::Debug for CacheState {
    fn fmt(&self, fmt: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
        match self {
            CacheState::Uninitialized => fmt.debug_tuple("Uninitialized").finish(),
            CacheState::CacheHit(_) => fmt.debug_tuple("CacheHit").finish_non_exhaustive(),
            CacheState::CacheMiss(_) => fmt.debug_tuple("CacheMiss").finish_non_exhaustive(),
        }
    }
}

// cache state shouldn't impact a CacheNode equality
impl Eq for CacheNode {}
impl PartialEq for CacheNode {
    fn eq(&self, other: &Self) -> bool {
        self.inner == other.inner
    }
}

impl From<CacheNode> for QueryAst {
    fn from(cache_node: CacheNode) -> Self {
        QueryAst::Cache(cache_node)
    }
}

impl CacheNode {
    pub fn new(ast: QueryAst) -> Self {
        CacheNode {
            inner: Box::new(ast),
            state: CacheState::Uninitialized,
        }
    }

    pub fn fill_cache_state(&mut self, cache: &Arc<dyn PredicateCache>, split_id: &str) {
        let Ok(query) = serde_json::to_string(&self.inner) else {
            return;
        };
        if let Some((segment_id, hits)) = cache.get(split_id.to_string(), query.clone()) {
            self.state = CacheState::CacheHit(CacheEntry { segment_id, hits });
        } else {
            self.state = CacheState::CacheMiss(CacheFiller {
                cache: cache.clone(),
                split_id: split_id.to_string(),
                query,
            });
        }
    }
}

impl BuildTantivyAst for CacheNode {
    fn build_tantivy_ast_impl(
        &self,
        context: &BuildTantivyAstContext,
    ) -> Result<TantivyQueryAst, InvalidQuery> {
        match &self.state {
            CacheState::Uninitialized => self.inner.build_tantivy_ast_call(context),
            CacheState::CacheHit(cache_entry) => Ok(CacheHitQuery {
                cache_entry: cache_entry.clone(),
            }
            .into()),
            CacheState::CacheMiss(cache_filler) => {
                let tantivy_query: Box<dyn Query> = self
                    .inner
                    .build_tantivy_ast_call(context)?
                    .simplify()
                    .into();
                Ok(CacheFillerQuery {
                    inner_query: Box::new(tantivy_query),
                    cache_filler: cache_filler.clone(),
                }
                .into())
            }
        }
    }
}

use tantivy::directory::OwnedBytes;
use tantivy::index::SegmentId;
use tantivy::query::{EnableScoring, Explanation, Query, Scorer, Weight};
use tantivy::{DocId, DocSet, Score, SegmentReader, TantivyError};

#[derive(Clone, Debug)]
pub struct CacheHitQuery {
    cache_entry: CacheEntry,
}

impl Query for CacheHitQuery {
    fn weight(&self, enable_scoring: EnableScoring<'_>) -> tantivy::Result<Box<dyn Weight>> {
        if enable_scoring.is_scoring_enabled() {
            Err(tantivy::TantivyError::InternalError(
                "Predicate cache doesn't support scoring yet".to_string(),
            ))
        } else {
            Ok(Box::new(CacheHitWeight {
                cache_entry: self.cache_entry.clone(),
            }))
        }
    }
}

/// Weight associated with the `AllQuery` query.
pub struct CacheHitWeight {
    cache_entry: CacheEntry,
}

impl Weight for CacheHitWeight {
    fn scorer(&self, reader: &SegmentReader, boost: Score) -> tantivy::Result<Box<dyn Scorer>> {
        // we could try to run the query if for some reason we don't actually find an entry in
        // cache, but that would have required loading stuff during warmup which we skipped.
        // An error is the best we can do
        let mut hit_set = self
            .cache_entry
            .for_segment(reader.segment_id())
            .ok_or_else(|| TantivyError::InternalError("Segment not found in cache".to_string()))?;
        hit_set.boost = boost;
        Ok(Box::new(hit_set))
    }

    fn explain(&self, reader: &SegmentReader, doc: DocId) -> tantivy::Result<Explanation> {
        let mut scorer = self.scorer(reader, 1.0)?;
        if scorer.seek(doc) == doc {
            Ok(Explanation::new("HitSet", 1.0))
        } else {
            Err(TantivyError::InvalidArgument(
                "Document does not exist".to_string(),
            ))
        }
    }
}

#[derive(Clone)]
pub struct CacheEntry {
    segment_id: SegmentId,
    hits: HitSet,
}

impl std::fmt::Debug for CacheEntry {
    fn fmt(&self, fmt: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
        fmt.debug_struct("CacheEntry")
            .field("segment_id", &self.segment_id)
            .finish_non_exhaustive()
    }
}

impl CacheEntry {
    fn for_segment(&self, segment_id: SegmentId) -> Option<HitSet> {
        if segment_id == self.segment_id {
            Some(self.hits.clone())
        } else {
            None
        }
    }
}

#[derive(Debug, Clone)]
pub struct HitSet {
    buffer: OwnedBytes,
    buffer_pos: usize,
    previous_last_val: Option<u32>,
    current_block: [u32; BitPacker1x::BLOCK_LEN],
    block_pos: usize,
    boost: Score,
}

const INCOMPLETE_BLOCK_MARKER: u8 = 0x80;

impl HitSet {
    #[cfg(test)]
    fn empty() -> Self {
        Self::from_buffer(OwnedBytes::new(vec![0, 0, 0, 0]))
    }

    /// Build a HitSet from its serialized form.
    ///
    /// The provided buffer must come from `HitSet::into_buffer`
    pub fn from_buffer(buffer: OwnedBytes) -> Self {
        let mut this = Self {
            buffer,
            // skip count
            buffer_pos: 4,
            previous_last_val: None,
            current_block: [0; BitPacker1x::BLOCK_LEN],
            // we set this to block_len minus 1 so we can call advance() once to initialize
            // everything
            block_pos: BitPacker1x::BLOCK_LEN - 1,
            boost: 1.0,
        };
        this.advance();
        this
    }

    /// Return a buffer representing the underlying data.
    ///
    /// This does not preserve where in the DocSet you are.
    pub fn into_buffer(self) -> OwnedBytes {
        self.buffer
    }

    fn load_new_block(&mut self) {
        let Some(num_bits) = self.buffer.get(self.buffer_pos) else {
            // we ended iteration: simply fill the current_block full of TERMINATED
            self.current_block = [tantivy::TERMINATED; 32];
            return;
        };
        self.buffer_pos += 1;
        if *num_bits == INCOMPLETE_BLOCK_MARKER {
            // final block, decode as many ids as possible
            let mut i = 0;
            for chunk in self.buffer[self.buffer_pos..].as_chunks().0 {
                self.current_block[i] = u32::from_ne_bytes(*chunk);
                i += 1;
            }
            // pad with TERMINATED
            while i < BitPacker1x::BLOCK_LEN {
                self.current_block[i] = tantivy::TERMINATED;
                i += 1;
            }
            self.buffer_pos = self.buffer.len();
        } else {
            self.buffer_pos += BitPacker1x.decompress_strictly_sorted(
                self.previous_last_val,
                &self.buffer[self.buffer_pos..],
                &mut self.current_block,
                *num_bits,
            );
            self.previous_last_val = self.current_block.last().copied();
        }
    }
}

impl DocSet for HitSet {
    fn advance(&mut self) -> DocId {
        self.block_pos += 1;
        if let Some(doc_id) = self.current_block.get(self.block_pos) {
            return *doc_id;
        }
        self.load_new_block();
        self.block_pos = 0;
        self.current_block[0]
    }

    // fn seek(&mut self, target: DocId) -> DocId {
    // }

    #[inline(always)]
    fn doc(&self) -> DocId {
        self.current_block[self.block_pos]
    }

    fn size_hint(&self) -> u32 {
        u32::from_ne_bytes(self.buffer[0..4].try_into().unwrap())
    }
}

impl Scorer for HitSet {
    fn score(&mut self) -> f32 {
        self.boost
    }
}

pub struct HitSetBuilder {
    count: u32,
    current_block: [u32; BitPacker1x::BLOCK_LEN],
    previous_last_val: Option<u32>,
    buffer: Vec<u8>,
}

impl HitSetBuilder {
    pub fn new() -> Self {
        HitSetBuilder {
            count: 0,
            current_block: [0; BitPacker1x::BLOCK_LEN],
            previous_last_val: None,
            buffer: vec![0; 4],
        }
    }

    fn in_block_pos(&self) -> usize {
        (self.count % BitPacker1x::BLOCK_LEN as u32) as usize
    }

    fn end_of_block(&self) -> bool {
        self.in_block_pos() == (BitPacker1x::BLOCK_LEN - 1)
    }

    fn flush_block(&mut self) {
        let num_bits =
            BitPacker1x.num_bits_strictly_sorted(self.previous_last_val, &self.current_block);
        self.buffer.push(num_bits);
        let current_buffer_pos = self.buffer.len();
        let new_end = current_buffer_pos + (BitPacker1x::BLOCK_LEN * num_bits as usize) / 8;
        self.buffer.resize(new_end, 0);
        BitPacker1x.compress_strictly_sorted(
            self.previous_last_val,
            &self.current_block,
            &mut self.buffer[current_buffer_pos..],
            num_bits,
        );
        self.previous_last_val = self.current_block.last().copied();
    }

    pub fn insert(&mut self, value: u32) {
        self.current_block[self.in_block_pos()] = value;
        if self.end_of_block() {
            self.flush_block();
        }
        self.count += 1;
    }

    pub fn build(mut self) -> HitSet {
        if self.in_block_pos() != 0 {
            self.buffer.push(INCOMPLETE_BLOCK_MARKER);
            for elem in &self.current_block[..self.in_block_pos()] {
                self.buffer.extend_from_slice(&elem.to_ne_bytes());
            }
        }
        // write back the count of items
        self.buffer[0..4].copy_from_slice(&self.count.to_ne_bytes());
        HitSet::from_buffer(OwnedBytes::new(self.buffer))
    }
}

#[derive(Clone)]
pub struct CacheFiller {
    cache: Arc<dyn PredicateCache>,
    split_id: String,
    query: String,
}

impl std::fmt::Debug for CacheFiller {
    fn fmt(&self, fmt: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
        fmt.debug_struct("CacheFiller")
            .field("split_id", &self.split_id)
            .finish_non_exhaustive()
    }
}

impl CacheFiller {
    fn fill_segment(&self, segment_id: SegmentId, value: HitSet) {
        self.cache
            .put(self.split_id.clone(), self.query.clone(), segment_id, value);
    }
}

#[derive(Debug)]
pub struct CacheFillerQuery {
    inner_query: Box<dyn Query>,
    cache_filler: CacheFiller,
}

impl Clone for CacheFillerQuery {
    fn clone(&self) -> Self {
        Self {
            inner_query: self.inner_query.box_clone(),
            cache_filler: self.cache_filler.clone(),
        }
    }
}

impl Query for CacheFillerQuery {
    fn weight(&self, enable_scoring: EnableScoring<'_>) -> tantivy::Result<Box<dyn Weight>> {
        if enable_scoring.is_scoring_enabled() {
            Err(tantivy::TantivyError::InternalError(
                "Predicate cache doesn't support scoring yet".to_string(),
            ))
        } else {
            Ok(Box::new(CacheFillerWeight {
                inner_weight: self.inner_query.weight(enable_scoring)?,
                cache_filler: self.cache_filler.clone(),
            }))
        }
    }
    fn query_terms<'a>(&'a self, visitor: &mut dyn FnMut(&'a tantivy::Term, bool)) {
        self.inner_query.query_terms(visitor)
    }
}

/// Weight associated with the `AllQuery` query.
pub struct CacheFillerWeight {
    inner_weight: Box<dyn Weight>,
    cache_filler: CacheFiller,
}

impl Weight for CacheFillerWeight {
    fn scorer(&self, reader: &SegmentReader, boost: Score) -> tantivy::Result<Box<dyn Scorer>> {
        let mut hit_set_builder = HitSetBuilder::new();
        let mut scorer = self.inner_weight.scorer(reader, 1.0)?;
        let mut doc_id = scorer.doc();
        while doc_id < tantivy::TERMINATED {
            hit_set_builder.insert(doc_id);
            doc_id = scorer.advance();
        }
        let mut hit_set = hit_set_builder.build();
        self.cache_filler
            .fill_segment(reader.segment_id(), hit_set.clone());
        hit_set.boost = boost;
        Ok(Box::new(hit_set))
    }

    fn explain(&self, reader: &SegmentReader, doc: DocId) -> tantivy::Result<Explanation> {
        self.inner_weight.explain(reader, doc)
    }
}

/// A transformer that goes through a QueryAst, and change the state of all CacheNodes
/// to Hit/Miss based on the provided cache.
///
/// This must be called for any CacheNode inside a QueryAst to do anything (though not calling
/// it isn't an error, it just means no cache will be used).
pub struct PredicateCacheInjector {
    pub cache: Arc<dyn PredicateCache>,
    pub split_id: String,
}

impl crate::query_ast::QueryAstTransformer for PredicateCacheInjector {
    type Err = std::convert::Infallible;

    fn transform_cache_node(
        &mut self,
        mut cache_node: CacheNode,
    ) -> Result<Option<QueryAst>, Self::Err> {
        cache_node.fill_cache_state(&self.cache, &self.split_id);
        self.transform(*cache_node.inner).map(|maybe_ast| {
            maybe_ast.map(|inner| {
                QueryAst::Cache(CacheNode {
                    inner: Box::new(inner),
                    state: cache_node.state,
                })
            })
        })
    }
}

// we use a trait to dodge circular dependancies with quickwit-storage
pub trait PredicateCache: Send + Sync + 'static {
    fn get(&self, split_id: SplitId, query_ast_json: String) -> Option<(SegmentId, HitSet)>;

    fn put(&self, split_id: SplitId, query_ast_json: String, segment: SegmentId, results: HitSet);
}

#[cfg(test)]
mod tests {
    use std::collections::HashMap;
    use std::sync::Mutex;

    use tantivy::DocSet;
    use tantivy::query::Query as TantivyQuery;
    use tantivy::schema::{Schema, TEXT};

    use super::*;
    use crate::query_ast::{
        BuildTantivyAstContext, QueryAstTransformer, QueryAstVisitor, TermQuery,
    };

    impl PredicateCache for Mutex<HashMap<(SplitId, String), (SegmentId, HitSet)>> {
        fn get(&self, split_id: SplitId, query_ast_json: String) -> Option<(SegmentId, HitSet)> {
            self.lock()
                .unwrap()
                .get(&(split_id, query_ast_json))
                .cloned()
        }

        fn put(
            &self,
            split_id: SplitId,
            query_ast_json: String,
            segment: SegmentId,
            results: HitSet,
        ) {
            self.lock()
                .unwrap()
                .insert((split_id, query_ast_json), (segment, results));
        }
    }

    #[track_caller]
    fn test_hit_set_roundtrip_helper<I: Iterator<Item = u32> + Clone>(iter: I) {
        let mut hitset_builder = HitSetBuilder::new();
        for i in iter.clone() {
            hitset_builder.insert(i);
        }
        let mut hitset = hitset_builder.build();

        for val in iter {
            assert_eq!(hitset.doc(), val);
            hitset.advance();
        }
        for _ in 0..96 {
            assert_eq!(hitset.doc(), tantivy::TERMINATED);
            hitset.advance();
        }
    }

    #[test]
    fn test_hit_set_roundtrip() {
        // this generate a pseurorandom strictrly increasing sequence
        let generator = std::iter::successors(Some(0u32), |x| Some(x + x.trailing_ones() + 1));

        // empty
        test_hit_set_roundtrip_helper(generator.clone().take(0));
        // one item
        test_hit_set_roundtrip_helper(generator.clone().take(1));
        test_hit_set_roundtrip_helper(generator.clone().skip(10).take(1));
        // partial block
        test_hit_set_roundtrip_helper(generator.clone().take(24));
        test_hit_set_roundtrip_helper(generator.clone().skip(10).take(24));

        // one block
        test_hit_set_roundtrip_helper(generator.clone().take(32));
        test_hit_set_roundtrip_helper(generator.clone().skip(10).take(32));
        // two blocks
        test_hit_set_roundtrip_helper(generator.clone().take(64));
        test_hit_set_roundtrip_helper(generator.clone().skip(10).take(64));

        // many blocks, partial last block
        test_hit_set_roundtrip_helper(generator.clone().take(1024 + 6));
        test_hit_set_roundtrip_helper(generator.clone().skip(10).take(1024 + 6));
    }

    #[test]
    fn test_built_tantivy_ast() {
        let mut schema_builder = Schema::builder();
        schema_builder.add_text_field("body", TEXT);
        let schema = schema_builder.build();
        let term_query: QueryAst = TermQuery {
            field: "body".to_string(),
            value: "val".to_string(),
        }
        .into();
        let tantivy_term_query: Box<dyn TantivyQuery> = term_query
            .build_tantivy_ast_impl(&BuildTantivyAstContext::for_test(&schema))
            .unwrap()
            .into();

        {
            let ast = CacheNode {
                inner: Box::new(term_query.clone()),
                state: CacheState::Uninitialized,
            };
            let uninit_cache_query: Box<dyn TantivyQuery> = ast
                .build_tantivy_ast_impl(&BuildTantivyAstContext::for_test(&schema))
                .unwrap()
                .into();
            assert_eq!(
                format!("{uninit_cache_query:?}"),
                format!("{tantivy_term_query:?}")
            );
        }

        {
            let cache_entry = CacheEntry {
                segment_id: SegmentId::from_uuid_string("1686a000d4f7a91939d0e71df1646d7a")
                    .unwrap(),
                hits: HitSet::empty(),
            };
            let ast = CacheNode {
                inner: Box::new(term_query.clone()),
                state: CacheState::CacheHit(cache_entry),
            };
            let cache_hit_query: Box<dyn TantivyQuery> = ast
                .build_tantivy_ast_impl(&BuildTantivyAstContext::for_test(&schema))
                .unwrap()
                .into();

            let debug_query = format!("{cache_hit_query:?}");
            assert!(debug_query.contains("CacheHitQuery"));
            assert!(!debug_query.contains("TermQuery"));
        }
        {
            let cache_filler = CacheFiller {
                cache: Arc::new(Mutex::new(HashMap::new())),
                split_id: "split_id".to_string(),
                query: "{}".to_string(),
            };
            let ast = CacheNode {
                inner: Box::new(term_query.clone()),
                state: CacheState::CacheMiss(cache_filler),
            };
            let cache_miss_query: Box<dyn TantivyQuery> = ast
                .build_tantivy_ast_impl(&BuildTantivyAstContext::for_test(&schema))
                .unwrap()
                .into();

            let debug_query = format!("{cache_miss_query:?}");
            assert!(debug_query.contains("CacheFillerQuery"));
            assert!(debug_query.contains(&format!("{tantivy_term_query:?}")));
        }
    }

    struct FoundATermVisitor(bool);
    impl QueryAstVisitor<'_> for FoundATermVisitor {
        type Err = std::convert::Infallible;
        fn visit_term(&mut self, _term: &TermQuery) -> Result<(), Self::Err> {
            self.0 = true;
            Ok(())
        }
    }

    impl QueryAstTransformer for FoundATermVisitor {
        type Err = std::convert::Infallible;
        fn transform_term(&mut self, term: TermQuery) -> Result<Option<QueryAst>, Self::Err> {
            self.0 = true;
            Ok(Some(term.into()))
        }
    }

    #[test]
    fn test_default_visitor_ignore_cached_node() {
        let term_query: QueryAst = TermQuery {
            field: "body".to_string(),
            value: "val".to_string(),
        }
        .into();
        {
            let ast = CacheNode {
                inner: Box::new(term_query.clone()),
                state: CacheState::Uninitialized,
            }
            .into();

            let mut visitor = FoundATermVisitor(false);
            visitor.visit(&ast).unwrap();
            assert!(visitor.0);
            let mut visitor = FoundATermVisitor(false);
            visitor.transform(ast).unwrap();
            assert!(visitor.0);
        }
        {
            let cache_entry = CacheEntry {
                segment_id: SegmentId::from_uuid_string("1686a000d4f7a91939d0e71df1646d7a")
                    .unwrap(),
                hits: HitSet::empty(),
            };
            let ast = CacheNode {
                inner: Box::new(term_query.clone()),
                state: CacheState::CacheHit(cache_entry),
            }
            .into();

            let mut visitor = FoundATermVisitor(false);
            visitor.visit(&ast).unwrap();
            assert!(!visitor.0);
            let mut visitor = FoundATermVisitor(false);
            visitor.transform(ast).unwrap();
            assert!(!visitor.0);
        }
        {
            let cache_filler = CacheFiller {
                cache: Arc::new(Mutex::new(HashMap::new())),
                split_id: "split_id".to_string(),
                query: "{}".to_string(),
            };
            let ast = CacheNode {
                inner: Box::new(term_query.clone()),
                state: CacheState::CacheMiss(cache_filler),
            }
            .into();

            let mut visitor = FoundATermVisitor(false);
            visitor.visit(&ast).unwrap();
            assert!(visitor.0);
            let mut visitor = FoundATermVisitor(false);
            visitor.transform(ast).unwrap();
            assert!(visitor.0);
        }
    }

    #[test]
    fn test_cache_preigniter_fills_cache() {
        let term_query: QueryAst = TermQuery {
            field: "body".to_string(),
            value: "val".to_string(),
        }
        .into();
        let cache_node = CacheNode {
            inner: Box::new(term_query.clone()),
            state: CacheState::Uninitialized,
        };
        let query_json = serde_json::to_string(&cache_node.inner).unwrap();
        let ast: QueryAst = cache_node.into();
        let cache = Arc::new(Mutex::new(HashMap::new()));
        cache.put(
            "split_2".to_string(),
            query_json,
            SegmentId::from_uuid_string("1686a000d4f7a91939d0e71df1646d7a").unwrap(),
            HitSet::empty(),
        );

        {
            let mut pre_igniter = PredicateCacheInjector {
                cache: cache.clone(),
                split_id: "split_1".to_string(),
            };
            let filled = pre_igniter.transform(ast.clone()).unwrap().unwrap();
            assert!(matches!(
                filled,
                QueryAst::Cache(CacheNode {
                    state: CacheState::CacheMiss(_),
                    ..
                })
            ));
        }

        {
            let mut pre_igniter = PredicateCacheInjector {
                cache: cache.clone(),
                split_id: "split_2".to_string(),
            };
            let filled = pre_igniter.transform(ast.clone()).unwrap().unwrap();
            assert!(matches!(
                filled,
                QueryAst::Cache(CacheNode {
                    state: CacheState::CacheHit(_),
                    ..
                })
            ));
        }
    }

    #[test]
    fn test_cache_hit_returns_correct_docs() {
        let mut schema_builder = Schema::builder();
        let host_field = schema_builder.add_text_field("host", TEXT);
        let schema = schema_builder.build();
        let index = tantivy::IndexBuilder::new()
            .schema(schema.clone())
            .create_in_ram()
            .unwrap();
        let mut index_writer = index.writer_with_num_threads(1, 20_000_000).unwrap();
        for count in 1..13 {
            let mut doc = tantivy::TantivyDocument::default();
            doc.add_text(host_field, format!("host_{count}"));
            for _ in 0..count {
                index_writer.add_document(doc.clone()).unwrap();
            }
        }
        index_writer.commit().unwrap();
        let searcher = index.reader().unwrap().searcher();
        let segment_id = searcher.segment_readers()[0].segment_id();

        let generator =
            std::iter::successors(Some(0u32), |x| Some(x + x.trailing_ones() + 1)).take(500);
        let mut hitset_builder = HitSetBuilder::new();
        for i in generator {
            hitset_builder.insert(i);
        }
        let hitset = hitset_builder.build();

        // this query isn't even valid for that split, but that's not relevant as it won't get run
        let term_query: QueryAst = TermQuery {
            field: "body".to_string(),
            value: "val".to_string(),
        }
        .into();
        let cache_entry = CacheEntry {
            segment_id,
            hits: hitset,
        };
        let ast = CacheNode {
            inner: Box::new(term_query.clone()),
            state: CacheState::CacheHit(cache_entry),
        };
        let cache_hit_query: Box<dyn TantivyQuery> = ast
            .build_tantivy_ast_impl(&BuildTantivyAstContext::for_test(&schema))
            .unwrap()
            .into();

        assert_eq!(cache_hit_query.count(&searcher).unwrap(), 500);
    }

    #[test]
    fn test_cache_miss_returns_correct_docs_and_fill_cache() {
        let mut schema_builder = Schema::builder();
        let host_field = schema_builder.add_text_field("host", TEXT);
        let schema = schema_builder.build();
        let index = tantivy::IndexBuilder::new()
            .schema(schema.clone())
            .create_in_ram()
            .unwrap();
        let mut index_writer = index.writer_with_num_threads(1, 20_000_000).unwrap();
        for count in 1..13 {
            let mut doc = tantivy::TantivyDocument::default();
            doc.add_text(host_field, format!("host_{count}"));
            for _ in 0..count {
                index_writer.add_document(doc.clone()).unwrap();
            }
        }
        index_writer.commit().unwrap();
        let searcher = index.reader().unwrap().searcher();
        let segment_id = searcher.segment_readers()[0].segment_id();

        let term_query: QueryAst = TermQuery {
            field: "host".to_string(),
            value: "11".to_string(),
        }
        .into();
        let cache = Arc::new(Mutex::new(HashMap::new()));
        let cache_filler = CacheFiller {
            cache: cache.clone(),
            split_id: "split_id".to_string(),
            query: "{some_query}".to_string(),
        };
        let ast = CacheNode {
            inner: Box::new(term_query.clone()),
            state: CacheState::CacheMiss(cache_filler),
        };
        let cache_hit_query: Box<dyn TantivyQuery> = ast
            .build_tantivy_ast_impl(&BuildTantivyAstContext::for_test(&schema))
            .unwrap()
            .into();

        assert_eq!(cache_hit_query.count(&searcher).unwrap(), 11);
        let mut cache_entry = cache
            .get("split_id".to_string(), "{some_query}".to_string())
            .unwrap();
        assert_eq!(cache_entry.0, segment_id);
        let expected = (10 * 11 / 2)..(11 * 12 / 2);
        for doc_id in expected {
            assert_eq!(cache_entry.1.doc(), doc_id);
            cache_entry.1.advance();
        }
    }
}


================================================
FILE: quickwit/quickwit-query/src/query_ast/field_presence.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use quickwit_common::PathHasher;
use quickwit_common::shared_consts::FIELD_PRESENCE_FIELD_NAME;
use serde::{Deserialize, Serialize};
use tantivy::Term;
use tantivy::schema::{Field, FieldEntry, IndexRecordOption, Schema as TantivySchema};

use super::tantivy_query_ast::TantivyBoolQuery;
use super::utils::{DYNAMIC_FIELD_NAME, find_subfields};
use crate::query_ast::tantivy_query_ast::TantivyQueryAst;
use crate::query_ast::{BuildTantivyAst, BuildTantivyAstContext, QueryAst};
use crate::{BooleanOperand, InvalidQuery, find_field_or_hit_dynamic};

#[derive(Serialize, Deserialize, Debug, Clone, PartialEq, Eq)]
pub struct FieldPresenceQuery {
    pub field: String,
}

impl From<FieldPresenceQuery> for QueryAst {
    fn from(field_presence_query: FieldPresenceQuery) -> Self {
        QueryAst::FieldPresence(field_presence_query)
    }
}

fn compute_field_presence_hash(field: Field, field_path: &str) -> PathHasher {
    let mut path_hasher: PathHasher = PathHasher::default();
    path_hasher.append(&field.field_id().to_le_bytes()[..]);
    let mut escaped = false;
    let mut current_segment = String::new();
    for c in field_path.chars() {
        if escaped {
            escaped = false;
            current_segment.push(c);
            continue;
        }
        match c {
            '\\' => {
                escaped = true;
            }
            '.' => {
                path_hasher.append(current_segment.as_bytes());
                current_segment.clear();
            }
            _ => {
                current_segment.push(c);
            }
        }
    }
    if !current_segment.is_empty() {
        path_hasher.append(current_segment.as_bytes());
    }
    path_hasher
}

fn build_existence_query(
    field_presence_field: Field,
    field: Field,
    field_entry: &FieldEntry,
    path: &str,
) -> TantivyQueryAst {
    if field_entry.is_fast() {
        let full_path = if path.is_empty() {
            field_entry.name().to_string()
        } else {
            format!("{}.{}", field_entry.name(), path)
        };
        let exists_query = tantivy::query::ExistsQuery::new(full_path, true);
        TantivyQueryAst::from(exists_query)
    } else {
        // fallback to the presence field
        let presence_hasher = compute_field_presence_hash(field, path);
        let leaf_term = Term::from_field_u64(field_presence_field, presence_hasher.finish_leaf());
        if field_entry.field_type().is_json() {
            let intermediate_term =
                Term::from_field_u64(field_presence_field, presence_hasher.finish_intermediate());
            let query = tantivy::query::TermSetQuery::new([leaf_term, intermediate_term]);
            TantivyQueryAst::from(query)
        } else {
            let query = tantivy::query::TermQuery::new(leaf_term, IndexRecordOption::Basic);
            TantivyQueryAst::from(query)
        }
    }
}

impl FieldPresenceQuery {
    /// Identify the field and potential subfields that are required for this query.
    ///
    /// This is only based on the schema and cannot now about dynamic fields.
    pub fn find_field_and_subfields<'a>(
        &'a self,
        schema: &'a TantivySchema,
    ) -> Vec<(Field, &'a FieldEntry, &'a str)> {
        let mut fields = Vec::new();
        if let Some((field, entry, path)) = find_field_or_hit_dynamic(&self.field, schema) {
            fields.push((field, entry, path));
        };
        // if `self.field` was not found, it might still be an `object` field
        if fields.is_empty() || fields[0].1.name() == DYNAMIC_FIELD_NAME {
            for (field, entry) in find_subfields(&self.field, schema) {
                fields.push((field, entry, ""));
            }
        }
        fields
    }
}

impl BuildTantivyAst for FieldPresenceQuery {
    fn build_tantivy_ast_impl(
        &self,
        context: &BuildTantivyAstContext,
    ) -> Result<TantivyQueryAst, InvalidQuery> {
        let field_presence_field = context
            .schema
            .get_field(FIELD_PRESENCE_FIELD_NAME)
            .map_err(|_| {
                InvalidQuery::SchemaError(
                    "field presence is not available for this split".to_string(),
                )
            })?;
        let fields = self.find_field_and_subfields(context.schema);
        if fields.is_empty() {
            // the schema is not dynamic and no subfields are defined
            return Err(InvalidQuery::FieldDoesNotExist {
                full_path: self.field.clone(),
            });
        }
        let queries = fields
            .into_iter()
            .map(|(field, entry, path)| {
                build_existence_query(field_presence_field, field, entry, path)
            })
            .collect();
        Ok(TantivyQueryAst::Bool(TantivyBoolQuery::build_clause(
            BooleanOperand::Or,
            queries,
        )))
    }
}

#[cfg(test)]
mod tests {

    use super::*;

    #[test]
    fn test_field_presence_single() {
        let field_presence_term: u64 =
            compute_field_presence_hash(Field::from_field_id(17u32), "attributes").finish_leaf();
        assert_eq!(
            field_presence_term,
            PathHasher::hash_path(&[&17u32.to_le_bytes()[..], b"attributes"])
        );
    }

    #[test]
    fn test_field_presence_hash_simple() {
        let field_presence_term: u64 =
            compute_field_presence_hash(Field::from_field_id(17u32), "attributes.color")
                .finish_leaf();
        assert_eq!(
            field_presence_term,
            PathHasher::hash_path(&[&17u32.to_le_bytes()[..], b"attributes", b"color"])
        );
    }

    #[test]
    fn test_field_presence_hash_escaped_dot() {
        let field_presence_term: u64 =
            compute_field_presence_hash(Field::from_field_id(17u32), r"attributes\.color.hello")
                .finish_leaf();
        assert_eq!(
            field_presence_term,
            PathHasher::hash_path(&[&17u32.to_le_bytes()[..], b"attributes.color", b"hello"])
        );
    }
}


================================================
FILE: quickwit/quickwit-query/src/query_ast/full_text_query.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use anyhow::Context;
use serde::{Deserialize, Serialize};
use tantivy::Term;
use tantivy::query::{
    PhrasePrefixQuery as TantivyPhrasePrefixQuery, PhraseQuery as TantivyPhraseQuery,
    TermQuery as TantivyTermQuery,
};
use tantivy::schema::{
    Field, FieldType, IndexRecordOption, JsonObjectOptions, Schema as TantivySchema,
    TextFieldIndexing,
};
use tantivy::tokenizer::{TextAnalyzer, TokenStream};

use crate::query_ast::tantivy_query_ast::{TantivyBoolQuery, TantivyQueryAst};
use crate::query_ast::utils::full_text_query;
use crate::query_ast::{BuildTantivyAst, BuildTantivyAstContext, QueryAst};
use crate::tokenizers::TokenizerManager;
use crate::{BooleanOperand, InvalidQuery, MatchAllOrNone, find_field_or_hit_dynamic};

#[derive(Serialize, Deserialize, Debug, Eq, PartialEq, Clone)]
#[serde(deny_unknown_fields)]
pub struct FullTextParams {
    #[serde(default, skip_serializing_if = "Option::is_none")]
    pub tokenizer: Option<String>,
    pub mode: FullTextMode,
    // How an empty query (no terms after tokenization) should be interpreted.
    // By default we match no documents.
    #[serde(default, skip_serializing_if = "MatchAllOrNone::is_none")]
    pub zero_terms_query: MatchAllOrNone,
}

impl FullTextParams {
    fn text_analyzer(
        &self,
        text_field_indexing: &TextFieldIndexing,
        tokenizer_manager: &TokenizerManager,
    ) -> anyhow::Result<TextAnalyzer> {
        let tokenizer_name: &str = self
            .tokenizer
            .as_deref()
            .unwrap_or(text_field_indexing.tokenizer());
        tokenizer_manager
            .get_tokenizer(tokenizer_name)
            .with_context(|| format!("no tokenizer named `{tokenizer_name}` is registered"))
    }

    pub(crate) fn tokenize_text_into_terms_json(
        &self,
        field: Field,
        json_path: &str,
        text: &str,
        json_options: &JsonObjectOptions,
        tokenizer_manager: &TokenizerManager,
    ) -> anyhow::Result<Vec<(usize, Term)>> {
        let text_indexing_options = json_options
            .get_text_indexing_options()
            .with_context(|| format!("Json field text `{json_path}` is not indexed"))?;
        let mut text_analyzer: TextAnalyzer =
            self.text_analyzer(text_indexing_options, tokenizer_manager)?;
        let mut token_stream = text_analyzer.token_stream(text);
        let mut tokens = Vec::new();
        token_stream.process(&mut |token| {
            let mut term =
                Term::from_field_json_path(field, json_path, json_options.is_expand_dots_enabled());
            term.append_type_and_str(&token.text);
            tokens.push((token.position, term));
        });
        Ok(tokens)
    }

    pub(crate) fn tokenize_text_into_terms(
        &self,
        field: Field,
        text: &str,
        text_field_indexing: &TextFieldIndexing,
        tokenizer_manager: &TokenizerManager,
    ) -> anyhow::Result<Vec<(usize, Term)>> {
        let mut text_analyzer: TextAnalyzer =
            self.text_analyzer(text_field_indexing, tokenizer_manager)?;
        let mut token_stream = text_analyzer.token_stream(text);
        let mut tokens = Vec::new();
        token_stream.process(&mut |token| {
            let term: Term = Term::from_field_text(field, &token.text);
            tokens.push((token.position, term));
        });
        Ok(tokens)
    }

    pub(crate) fn make_query(
        &self,
        mut terms: Vec<(usize, Term)>,
        index_record_option: IndexRecordOption,
    ) -> Result<TantivyQueryAst, InvalidQuery> {
        if terms.is_empty() {
            return Ok(self.zero_terms_query.into());
        }
        if terms.len() == 1 {
            let term = terms.pop().unwrap().1;
            return Ok(TantivyTermQuery::new(term, IndexRecordOption::WithFreqs).into());
        }
        match self.mode {
            FullTextMode::Bool { operator } => {
                let leaf_queries: Vec<TantivyQueryAst> = terms
                    .into_iter()
                    .map(|(_, term)| TantivyTermQuery::new(term, index_record_option).into())
                    .collect();
                Ok(TantivyBoolQuery::build_clause(operator, leaf_queries).into())
            }
            FullTextMode::BoolPrefix {
                operator,
                max_expansions,
            } => {
                let term_with_prefix = terms.pop();
                let mut leaf_queries: Vec<TantivyQueryAst> = terms
                    .into_iter()
                    .map(|(_, term)| TantivyTermQuery::new(term, index_record_option).into())
                    .collect();
                if let Some(term_with_prefix) = term_with_prefix {
                    let mut phrase_prefix_query =
                        TantivyPhrasePrefixQuery::new_with_offset(vec![term_with_prefix]);
                    phrase_prefix_query.set_max_expansions(max_expansions);
                    leaf_queries.push(phrase_prefix_query.into());
                }
                Ok(TantivyBoolQuery::build_clause(operator, leaf_queries).into())
            }
            FullTextMode::Phrase { slop } => {
                if !index_record_option.has_positions() {
                    return Err(InvalidQuery::SchemaError(
                        "Applied phrase query on field which does not have positions indexed"
                            .to_string(),
                    ));
                }
                let mut phrase_query = TantivyPhraseQuery::new_with_offset(terms);
                phrase_query.set_slop(slop);
                Ok(phrase_query.into())
            }
            FullTextMode::PhraseFallbackToIntersection => {
                if index_record_option.has_positions() {
                    Ok(TantivyPhraseQuery::new_with_offset(terms).into())
                } else {
                    let term_query: Vec<TantivyQueryAst> = terms
                        .into_iter()
                        .map(|(_, term)| TantivyTermQuery::new(term, index_record_option).into())
                        .collect();
                    Ok(TantivyBoolQuery::build_clause(BooleanOperand::And, term_query).into())
                }
            }
        }
    }
}

fn is_zero(val: &u32) -> bool {
    *val == 0u32
}

/// `FullTextMode` describe how we should derive a query from a user sequence of tokens.
#[derive(Copy, Clone, Debug, Eq, PartialEq, Serialize, Deserialize)]
#[serde(tag = "type", rename_all = "snake_case")]
pub enum FullTextMode {
    // After tokenization, the different tokens should be used to
    // create a boolean clause (conjunction or disjunction based on the operator).
    Bool {
        operator: BooleanOperand,
    },
    BoolPrefix {
        operator: BooleanOperand,
        // max_expansions correspond to the fuzzy stop of query evaluation. It's not the same as
        // the max_expansions of a PhrasePrefixQuery, where it's used for the range
        // expansion.
        max_expansions: u32,
    },
    // Act as Phrase with slop 0 if the field has positions,
    // otherwise act as an intersection.
    PhraseFallbackToIntersection,
    // After tokenization, the different tokens should be used to create
    // a phrase query.
    //
    // A non-zero slop allows the position of the terms to be slightly off.
    Phrase {
        #[serde(default, skip_serializing_if = "is_zero")]
        slop: u32,
    },
}

impl From<BooleanOperand> for FullTextMode {
    fn from(operator: BooleanOperand) -> Self {
        FullTextMode::Bool { operator }
    }
}

/// The Full Text query is tokenized into a sequence of tokens
/// that will then be searched.
///
/// The `full_text_params` defines what type of match is accepted.
/// The tokens might be transformed into a phrase queries,
/// into a disjunction, or into a conjunction.
///
/// If after tokenization, a single term is emitted, it will naturally be
/// produce a tantivy TermQuery.
///
/// If no terms is emitted, it will produce a query that match all or no documents,
/// depending on `full_text_params.zero_terms_query`.
///
/// Contrary to the user input query, the FullTextQuery does not
/// interpret a boolean query grammar and targets a specific field.
#[derive(Serialize, Deserialize, Debug, Clone, PartialEq, Eq)]
pub struct FullTextQuery {
    pub field: String,
    pub text: String,
    pub params: FullTextParams,
    /// Support missing fields
    pub lenient: bool,
}

impl From<FullTextQuery> for QueryAst {
    fn from(full_text_query: FullTextQuery) -> Self {
        QueryAst::FullText(full_text_query)
    }
}

impl BuildTantivyAst for FullTextQuery {
    fn build_tantivy_ast_impl(
        &self,
        context: &BuildTantivyAstContext,
    ) -> Result<TantivyQueryAst, InvalidQuery> {
        full_text_query(
            &self.field,
            &self.text,
            &self.params,
            context.schema,
            context.tokenizer_manager,
            self.lenient,
        )
    }
}

impl FullTextQuery {
    /// Returns the last term of the query assuming the query is targeting a string or a Json
    /// field.
    ///
    /// This strange method is used to identify which term range should be warmed up for
    /// phrase prefix queries.
    pub fn get_prefix_term(
        &self,
        schema: &TantivySchema,
        tokenizer_manager: &TokenizerManager,
    ) -> Option<Term> {
        if !matches!(self.params.mode, FullTextMode::BoolPrefix { .. }) {
            return None;
        };

        let (field, field_entry, json_path) = find_field_or_hit_dynamic(&self.field, schema)?;
        let field_type: &FieldType = field_entry.field_type();
        match field_type {
            FieldType::Str(text_options) => {
                let text_field_indexing = text_options.get_indexing_options()?;
                let mut terms = self
                    .params
                    .tokenize_text_into_terms(
                        field,
                        &self.text,
                        text_field_indexing,
                        tokenizer_manager,
                    )
                    .ok()?;
                let (_pos, term) = terms.pop()?;
                Some(term)
            }
            FieldType::JsonObject(json_options) => {
                let mut terms = self
                    .params
                    .tokenize_text_into_terms_json(
                        field,
                        json_path,
                        &self.text,
                        json_options,
                        tokenizer_manager,
                    )
                    .ok()?;
                let (_pos, term) = terms.pop()?;
                Some(term)
            }
            _ => None,
        }
    }
}

#[cfg(test)]
mod tests {
    use tantivy::schema::{DateOptions, DateTimePrecision, Schema, TEXT};

    use crate::BooleanOperand;
    use crate::query_ast::tantivy_query_ast::TantivyQueryAst;
    use crate::query_ast::{BuildTantivyAst, BuildTantivyAstContext, FullTextMode, FullTextQuery};

    #[test]
    fn test_zero_terms() {
        let full_text_query = FullTextQuery {
            field: "body".to_string(),
            text: "".to_string(),
            params: super::FullTextParams {
                tokenizer: None,
                mode: BooleanOperand::And.into(),
                zero_terms_query: crate::MatchAllOrNone::MatchAll,
            },
            lenient: false,
        };
        let mut schema_builder = Schema::builder();
        schema_builder.add_text_field("body", TEXT);
        let schema = schema_builder.build();
        let ast: TantivyQueryAst = full_text_query
            .build_tantivy_ast_call(&BuildTantivyAstContext::for_test(&schema))
            .unwrap();
        assert_eq!(ast.const_predicate(), Some(crate::MatchAllOrNone::MatchAll));
    }

    #[test]
    fn test_phrase_mode_default_tokenizer() {
        let full_text_query = FullTextQuery {
            field: "body".to_string(),
            text: "Hello World!".to_string(),
            params: super::FullTextParams {
                tokenizer: None,
                mode: FullTextMode::Phrase { slop: 1 },
                zero_terms_query: crate::MatchAllOrNone::MatchAll,
            },
            lenient: false,
        };
        let mut schema_builder = Schema::builder();
        schema_builder.add_text_field("body", TEXT);
        let schema = schema_builder.build();
        let ast: TantivyQueryAst = full_text_query
            .build_tantivy_ast_call(&BuildTantivyAstContext::for_test(&schema))
            .unwrap();
        let leaf = ast.as_leaf().unwrap();
        assert_eq!(
            &format!("{leaf:?}"),
            "PhraseQuery { field: Field(0), phrase_terms: [(0, Term(field=0, type=Str, \
             \"hello\")), (1, Term(field=0, type=Str, \"world\"))], slop: 1 }"
        );
    }

    #[test]
    fn test_full_text_specific_tokenizer() {
        let full_text_query = FullTextQuery {
            field: "body".to_string(),
            text: "Hello world".to_string(),
            params: super::FullTextParams {
                tokenizer: Some("raw".to_string()),
                mode: FullTextMode::Phrase { slop: 1 },
                zero_terms_query: crate::MatchAllOrNone::MatchAll,
            },
            lenient: false,
        };
        let mut schema_builder = Schema::builder();
        schema_builder.add_text_field("body", TEXT);
        let schema = schema_builder.build();
        let ast: TantivyQueryAst = full_text_query
            .build_tantivy_ast_call(&BuildTantivyAstContext::for_test(&schema))
            .unwrap();
        let leaf = ast.as_leaf().unwrap();
        assert_eq!(
            &format!("{leaf:?}"),
            r#"TermQuery(Term(field=0, type=Str, "Hello world"))"#
        );
    }

    #[test]
    fn test_full_text_datetime() {
        let full_text_query = FullTextQuery {
            field: "ts".to_string(),
            text: "2025-12-13T16:13:12.666777Z".to_string(),
            params: super::FullTextParams {
                tokenizer: Some("raw".to_string()),
                mode: FullTextMode::Phrase { slop: 1 },
                zero_terms_query: crate::MatchAllOrNone::MatchAll,
            },
            lenient: false,
        };
        {
            // indexed, we truncate to the second
            let mut schema_builder = Schema::builder();
            schema_builder.add_date_field(
                "ts",
                DateOptions::default()
                    .set_precision(DateTimePrecision::Milliseconds)
                    .set_fast()
                    .set_indexed(),
            );
            let schema = schema_builder.build();
            let ast: TantivyQueryAst = full_text_query
                .build_tantivy_ast_call(&BuildTantivyAstContext::for_test(&schema))
                .unwrap();
            let leaf = ast.as_leaf().unwrap();
            assert_eq!(
                &format!("{leaf:?}"),
                r#"TermQuery(Term(field=0, type=Date, 2025-12-13T16:13:12Z))"#
            );
        }
        {
            // not indexed, we truncate to fastfield precision
            let mut schema_builder = Schema::builder();
            schema_builder.add_date_field(
                "ts",
                DateOptions::default()
                    .set_precision(DateTimePrecision::Milliseconds)
                    .set_fast(),
            );
            let schema = schema_builder.build();
            let ast: TantivyQueryAst = full_text_query
                .build_tantivy_ast_call(&BuildTantivyAstContext::for_test(&schema))
                .unwrap();
            let leaf = ast.as_leaf().unwrap();
            assert_eq!(
                &format!("{leaf:?}"),
                r#"TermQuery(Term(field=0, type=Date, 2025-12-13T16:13:12.666Z))"#
            );
        }
    }

    #[test]
    fn test_full_text_bool_mode() {
        let full_text_query = FullTextQuery {
            field: "body".to_string(),
            text: "Hello world".to_string(),
            params: super::FullTextParams {
                tokenizer: None,
                mode: BooleanOperand::And.into(),
                zero_terms_query: crate::MatchAllOrNone::MatchAll,
            },
            lenient: false,
        };
        let mut schema_builder = Schema::builder();
        schema_builder.add_text_field("body", TEXT);
        let schema = schema_builder.build();
        let ast: TantivyQueryAst = full_text_query
            .build_tantivy_ast_call(&BuildTantivyAstContext::for_test(&schema))
            .unwrap();
        let bool_query = ast.as_bool_query().unwrap();
        assert_eq!(bool_query.must.len(), 2);
    }
}


================================================
FILE: quickwit/quickwit-query/src/query_ast/mod.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use serde::{Deserialize, Serialize};
use tantivy::query::BoostQuery as TantivyBoostQuery;
use tantivy::schema::Schema as TantivySchema;

use crate::tokenizers::TokenizerManager;

mod bool_query;
mod cache_node;
mod field_presence;
mod full_text_query;
mod phrase_prefix_query;
mod range_query;
mod regex_query;
mod tantivy_query_ast;
mod term_query;
mod term_set_query;
mod user_input_query;
pub(crate) mod utils;
mod visitor;
mod wildcard_query;

pub use bool_query::BoolQuery;
pub use cache_node::{CacheNode, HitSet, PredicateCache, PredicateCacheInjector};
pub use field_presence::FieldPresenceQuery;
pub use full_text_query::{FullTextMode, FullTextParams, FullTextQuery};
pub use phrase_prefix_query::PhrasePrefixQuery;
pub use range_query::RangeQuery;
pub use regex_query::{AutomatonQuery, JsonPathPrefix, RegexQuery};
use tantivy_query_ast::TantivyQueryAst;
pub use term_query::TermQuery;
pub use term_set_query::TermSetQuery;
pub use user_input_query::UserInputQuery;
pub use visitor::{QueryAstTransformer, QueryAstVisitor};
pub use wildcard_query::WildcardQuery;

use crate::{BooleanOperand, InvalidQuery, NotNaNf32};

#[derive(Serialize, Deserialize, Debug, Clone, PartialEq, Eq)]
#[serde(tag = "type")]
#[serde(rename_all = "snake_case")]
pub enum QueryAst {
    Bool(BoolQuery),
    Term(TermQuery),
    TermSet(TermSetQuery),
    FieldPresence(FieldPresenceQuery),
    FullText(FullTextQuery),
    PhrasePrefix(PhrasePrefixQuery),
    Range(RangeQuery),
    UserInput(UserInputQuery),
    Wildcard(WildcardQuery),
    Regex(RegexQuery),
    MatchAll,
    MatchNone,
    Boost {
        underlying: Box<QueryAst>,
        boost: NotNaNf32,
    },
    Cache(CacheNode),
}

impl QueryAst {
    pub fn parse_user_query(
        self: QueryAst,
        default_search_fields: &[String],
    ) -> anyhow::Result<QueryAst> {
        match self {
            QueryAst::Bool(BoolQuery {
                must,
                must_not,
                should,
                filter,
                minimum_should_match,
            }) => {
                let must = parse_user_query_in_asts(must, default_search_fields)?;
                let must_not = parse_user_query_in_asts(must_not, default_search_fields)?;
                let should = parse_user_query_in_asts(should, default_search_fields)?;
                let filter = parse_user_query_in_asts(filter, default_search_fields)?;
                Ok(BoolQuery {
                    must,
                    must_not,
                    should,
                    filter,
                    minimum_should_match,
                }
                .into())
            }
            ast @ QueryAst::Term(_)
            | ast @ QueryAst::TermSet(_)
            | ast @ QueryAst::FullText(_)
            | ast @ QueryAst::PhrasePrefix(_)
            | ast @ QueryAst::MatchAll
            | ast @ QueryAst::MatchNone
            | ast @ QueryAst::FieldPresence(_)
            | ast @ QueryAst::Range(_)
            | ast @ QueryAst::Wildcard(_)
            | ast @ QueryAst::Regex(_) => Ok(ast),
            QueryAst::UserInput(user_text_query) => {
                user_text_query.parse_user_query(default_search_fields)
            }
            QueryAst::Boost { underlying, boost } => {
                let underlying = underlying.parse_user_query(default_search_fields)?;
                Ok(QueryAst::Boost {
                    underlying: Box::new(underlying),
                    boost,
                })
            }
            QueryAst::Cache(cache_node) => {
                let inner = cache_node.inner.parse_user_query(default_search_fields)?;
                let uninitialized =
                    matches!(cache_node.state, cache_node::CacheState::Uninitialized);
                debug_assert!(
                    uninitialized,
                    "QueryAst::parse_user_query called on initialized CacheNode, this is probably \
                     a misstake"
                );
                if !uninitialized {
                    tracing::warn!(
                        "QueryAst::parse_user_query called on initialized CacheNode, cache \
                         discarded"
                    );
                }
                Ok(CacheNode {
                    inner: Box::new(inner),
                    // inner got modified, the result is supposed to be equivalent, but to be safe,
                    // lets reinitialize the cache in practice this function
                    // shouldn't ever be called after cache was resolved
                    state: cache_node::CacheState::Uninitialized,
                }
                .into())
            }
        }
    }

    pub fn boost(self, scale_boost_opt: Option<NotNaNf32>) -> Self {
        let Some(scale_boost) = scale_boost_opt else {
            return self;
        };
        match self {
            QueryAst::Boost { underlying, boost } => {
                let scale_boost_f32: f32 = scale_boost.into();
                let boost_f32: f32 = boost.into();
                let new_boost =
                    NotNaNf32::try_from(scale_boost_f32 * boost_f32).unwrap_or(NotNaNf32::ZERO);
                QueryAst::Boost {
                    underlying,
                    boost: new_boost,
                }
            }
            ast => {
                let underlying = Box::new(ast);
                QueryAst::Boost {
                    underlying,
                    boost: scale_boost,
                }
            }
        }
    }
}

/// Context used when building a tantivy ast.
pub struct BuildTantivyAstContext<'a> {
    pub schema: &'a TantivySchema,
    pub tokenizer_manager: &'a TokenizerManager,
    pub search_fields: &'a [String],
    pub with_validation: bool,
}

impl<'a> BuildTantivyAstContext<'a> {
    pub fn for_test(schema: &'a TantivySchema) -> Self {
        use once_cell::sync::Lazy;

        // we do that to have a TokenizerManager with a long enough lifetime
        static DEFAULT_TOKENIZER_MANAGER: Lazy<TokenizerManager> =
            Lazy::new(crate::create_default_quickwit_tokenizer_manager);

        BuildTantivyAstContext {
            schema,
            tokenizer_manager: &DEFAULT_TOKENIZER_MANAGER,
            search_fields: &[],
            with_validation: true,
        }
    }

    pub fn without_validation(mut self) -> Self {
        self.with_validation = false;
        self
    }
}

trait BuildTantivyAst {
    /// Transforms a query Ast node into a TantivyQueryAst.
    ///
    /// This function is supposed to return an error if it detects a problem in the schema.
    /// It can call `into_tantivy_ast_call_me` but should never call `into_tantivy_ast_impl`.
    fn build_tantivy_ast_impl(
        &self,
        context: &BuildTantivyAstContext,
    ) -> Result<TantivyQueryAst, InvalidQuery>;

    /// This method is meant to be called, but should never be overloaded.
    fn build_tantivy_ast_call(
        &self,
        context: &BuildTantivyAstContext,
    ) -> Result<TantivyQueryAst, InvalidQuery> {
        let tantivy_ast_res = self.build_tantivy_ast_impl(context);
        if !context.with_validation && tantivy_ast_res.is_err() {
            return match tantivy_ast_res {
                res @ Ok(_) | res @ Err(InvalidQuery::UserQueryNotParsed) => res,
                Err(_) => Ok(TantivyQueryAst::match_none()),
            };
        }
        tantivy_ast_res
    }
}

impl BuildTantivyAst for QueryAst {
    fn build_tantivy_ast_impl(
        &self,
        context: &BuildTantivyAstContext,
    ) -> Result<TantivyQueryAst, InvalidQuery> {
        match self {
            QueryAst::Bool(bool_query) => bool_query.build_tantivy_ast_call(context),
            QueryAst::Term(term_query) => term_query.build_tantivy_ast_call(context),
            QueryAst::Range(range_query) => range_query.build_tantivy_ast_call(context),
            QueryAst::MatchAll => Ok(TantivyQueryAst::match_all()),
            QueryAst::MatchNone => Ok(TantivyQueryAst::match_none()),
            QueryAst::Boost { boost, underlying } => {
                let underlying = underlying.build_tantivy_ast_call(context)?.simplify();
                let boost_query = TantivyBoostQuery::new(underlying.into(), (*boost).into());
                Ok(boost_query.into())
            }
            QueryAst::TermSet(term_set) => term_set.build_tantivy_ast_call(context),
            QueryAst::FullText(full_text_query) => full_text_query.build_tantivy_ast_call(context),
            QueryAst::PhrasePrefix(phrase_prefix_query) => {
                phrase_prefix_query.build_tantivy_ast_call(context)
            }
            QueryAst::UserInput(user_text_query) => user_text_query.build_tantivy_ast_call(context),
            QueryAst::FieldPresence(field_presence) => {
                field_presence.build_tantivy_ast_call(context)
            }
            QueryAst::Wildcard(wildcard) => wildcard.build_tantivy_ast_call(context),
            QueryAst::Regex(regex) => regex.build_tantivy_ast_call(context),
            QueryAst::Cache(cache_node) => cache_node.build_tantivy_ast_call(context),
        }
    }
}

impl QueryAst {
    pub fn build_tantivy_query(
        &self,
        context: &BuildTantivyAstContext,
    ) -> Result<Box<dyn crate::TantivyQuery>, InvalidQuery> {
        let tantivy_query_ast = self.build_tantivy_ast_call(context)?;
        Ok(tantivy_query_ast.simplify().into())
    }
}

fn parse_user_query_in_asts(
    asts: Vec<QueryAst>,
    default_search_fields: &[String],
) -> anyhow::Result<Vec<QueryAst>> {
    asts.into_iter()
        .map(|ast| ast.parse_user_query(default_search_fields))
        .collect::<anyhow::Result<_>>()
}

/// Parses a user query and returns a JSON query AST.
///
/// The resulting query does not include `UserInputQuery` nodes.
/// The resolution assumes that there are no default search fields
/// in the doc mapper.
///
/// # Panics
///
/// Panics if the user text is invalid.
pub fn qast_json_helper(user_text: &str, default_fields: &[&'static str]) -> String {
    let ast = qast_helper(user_text, default_fields);
    serde_json::to_string(&ast).expect("The query AST should be JSON serializable.")
}

pub fn qast_helper(user_text: &str, default_fields: &[&'static str]) -> QueryAst {
    let default_fields: Vec<String> = default_fields
        .iter()
        .map(|default_field| default_field.to_string())
        .collect();
    query_ast_from_user_text(user_text, Some(default_fields))
        .parse_user_query(&[])
        .expect("The user query should be valid.")
}

/// Creates a QueryAST with a single UserInputQuery node.
///
/// Disclaimer:
/// At this point the query has not been parsed.
///
/// The actual parsing is meant to happen on a root node,
/// `default_fields` can be passed to decide which field should be search
/// if not specified specifically in the user query (e.g. hello as opposed to "body:hello").
///
/// If it is not supplied, the docmapper search fields are meant to be used.
///
/// If no boolean operator is specified, the default is `AND` (contrary to the Elasticsearch
/// default).
pub fn query_ast_from_user_text(user_text: &str, default_fields: Option<Vec<String>>) -> QueryAst {
    UserInputQuery {
        user_text: user_text.to_string(),
        default_fields,
        default_operator: BooleanOperand::And,
        lenient: false,
    }
    .into()
}

#[cfg(test)]
mod tests {
    use crate::query_ast::tantivy_query_ast::TantivyQueryAst;
    use crate::query_ast::{
        BoolQuery, BuildTantivyAst, BuildTantivyAstContext, QueryAst, UserInputQuery,
        query_ast_from_user_text,
    };
    use crate::{BooleanOperand, InvalidQuery};

    #[test]
    fn test_user_query_not_parsed() {
        let query_ast: QueryAst = UserInputQuery {
            user_text: "*".to_string(),
            default_fields: Default::default(),
            default_operator: Default::default(),
            lenient: false,
        }
        .into();
        let schema = tantivy::schema::Schema::builder().build();
        let build_tantivy_ast_err: InvalidQuery = query_ast
            .build_tantivy_ast_call(&BuildTantivyAstContext::for_test(&schema))
            .unwrap_err();
        assert!(matches!(
            build_tantivy_ast_err,
            InvalidQuery::UserQueryNotParsed
        ));
    }

    #[test]
    fn test_user_query_parsed() {
        let query_ast: QueryAst = UserInputQuery {
            user_text: "*".to_string(),
            default_fields: Default::default(),
            default_operator: Default::default(),
            lenient: false,
        }
        .into();
        let query_ast_with_parsed_user_query: QueryAst = query_ast.parse_user_query(&[]).unwrap();
        let schema = tantivy::schema::Schema::builder().build();
        let tantivy_query_ast = query_ast_with_parsed_user_query
            .build_tantivy_ast_call(&BuildTantivyAstContext::for_test(&schema))
            .unwrap();
        assert_eq!(&tantivy_query_ast, &TantivyQueryAst::match_all(),);
    }

    #[test]
    fn test_user_query_parsed_query_ast() {
        let query_ast: QueryAst = UserInputQuery {
            user_text: "*".to_string(),
            default_fields: Default::default(),
            default_operator: Default::default(),
            lenient: false,
        }
        .into();
        let bool_query_ast: QueryAst = BoolQuery {
            filter: vec![query_ast],
            ..Default::default()
        }
        .into();
        let query_ast_with_parsed_user_query: QueryAst =
            bool_query_ast.parse_user_query(&[]).unwrap();
        let schema = tantivy::schema::Schema::builder().build();
        let tantivy_query_ast = query_ast_with_parsed_user_query
            .build_tantivy_ast_call(&BuildTantivyAstContext::for_test(&schema))
            .unwrap();
        let tantivy_query_ast_simplified = tantivy_query_ast.simplify();
        // This does not get more simplified than this, because we need the boost 0 score.
        let tantivy_bool_query = tantivy_query_ast_simplified.as_bool_query().unwrap();
        assert_eq!(tantivy_bool_query.must.len(), 0);
        assert_eq!(tantivy_bool_query.should.len(), 0);
        assert_eq!(tantivy_bool_query.must_not.len(), 0);
        assert_eq!(tantivy_bool_query.filter.len(), 1);
        assert_eq!(&tantivy_bool_query.filter[0], &TantivyQueryAst::match_all(),);
    }

    #[test]
    fn test_query_parse_default_occur_must() {
        let query_ast: QueryAst = UserInputQuery {
            user_text: "field:hello field:toto".to_string(),
            default_fields: None,
            default_operator: crate::BooleanOperand::And,
            lenient: false,
        }
        .parse_user_query(&[])
        .unwrap();
        let QueryAst::Bool(bool_query) = query_ast else {
            panic!()
        };
        assert_eq!(bool_query.must.len(), 2);
    }

    #[test]
    fn test_query_parse_default_occur_should() {
        let query_ast: QueryAst = UserInputQuery {
            user_text: "field:hello field:toto".to_string(),
            default_fields: None,
            default_operator: crate::BooleanOperand::Or,
            lenient: false,
        }
        .parse_user_query(&[])
        .unwrap();
        let QueryAst::Bool(bool_query) = query_ast else {
            panic!()
        };
        assert_eq!(bool_query.should.len(), 2);
    }

    #[test]
    fn test_query_ast_from_user_text_default_as_and() {
        let ast = query_ast_from_user_text("hello you", None);
        let QueryAst::UserInput(input_query) = ast else {
            panic!()
        };
        assert_eq!(input_query.default_operator, BooleanOperand::And);
    }
}


================================================
FILE: quickwit/quickwit-query/src/query_ast/phrase_prefix_query.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use serde::{Deserialize, Serialize};
use tantivy::Term;
use tantivy::query::PhrasePrefixQuery as TantivyPhrasePrefixQuery;
use tantivy::schema::{Field, FieldType, Schema as TantivySchema};

use crate::query_ast::tantivy_query_ast::TantivyQueryAst;
use crate::query_ast::{BuildTantivyAst, BuildTantivyAstContext, FullTextParams, QueryAst};
use crate::tokenizers::TokenizerManager;
use crate::{InvalidQuery, find_field_or_hit_dynamic};

/// The PhraseQuery node is meant to be tokenized and searched.
///
/// If after tokenization, a single term is emitted, it will naturally be
/// produce a tantivy TermQuery.
/// If not terms is emitted, it will produce a query that match no documents..
#[derive(Serialize, Deserialize, Debug, Clone, PartialEq, Eq)]
pub struct PhrasePrefixQuery {
    pub field: String,
    pub phrase: String,
    pub max_expansions: u32,
    pub params: FullTextParams,
    /// Support missing fields
    pub lenient: bool,
}

impl PhrasePrefixQuery {
    pub fn get_terms(
        &self,
        schema: &TantivySchema,
        tokenizer_manager: &TokenizerManager,
    ) -> Result<(Field, Vec<(usize, Term)>), InvalidQuery> {
        let (field, field_entry, json_path) = find_field_or_hit_dynamic(&self.field, schema)
            .ok_or_else(|| InvalidQuery::FieldDoesNotExist {
                full_path: self.field.clone(),
            })?;
        let field_type = field_entry.field_type();

        match field_type {
            FieldType::Str(text_options) => {
                let text_field_indexing = text_options.get_indexing_options().ok_or_else(|| {
                    InvalidQuery::SchemaError(format!(
                        "field {} is not full-text searchable",
                        field_entry.name()
                    ))
                })?;
                let terms = self.params.tokenize_text_into_terms(
                    field,
                    &self.phrase,
                    text_field_indexing,
                    tokenizer_manager,
                )?;
                if !text_field_indexing.index_option().has_positions() && terms.len() > 1 {
                    return Err(InvalidQuery::SchemaError(
                        "trying to run a phrase prefix query on a field which does not have \
                         positions indexed"
                            .to_string(),
                    ));
                }
                Ok((field, terms))
            }
            FieldType::JsonObject(json_options) => {
                let text_field_indexing =
                    json_options.get_text_indexing_options().ok_or_else(|| {
                        InvalidQuery::SchemaError(format!(
                            "field {} is not full-text searchable",
                            field_entry.name()
                        ))
                    })?;
                let terms = self.params.tokenize_text_into_terms_json(
                    field,
                    json_path,
                    &self.phrase,
                    json_options,
                    tokenizer_manager,
                )?;
                if !text_field_indexing.index_option().has_positions() && terms.len() > 1 {
                    return Err(InvalidQuery::SchemaError(
                        "trying to run a PhrasePrefix query on a field which does not have \
                         positions indexed"
                            .to_string(),
                    ));
                }
                Ok((field, terms))
            }
            _ => Err(InvalidQuery::SchemaError(
                "trying to run a PhrasePrefix query on a non-text field".to_string(),
            )),
        }
    }
}

impl From<PhrasePrefixQuery> for QueryAst {
    fn from(phrase_query: PhrasePrefixQuery) -> Self {
        QueryAst::PhrasePrefix(phrase_query)
    }
}

impl BuildTantivyAst for PhrasePrefixQuery {
    fn build_tantivy_ast_impl(
        &self,
        context: &BuildTantivyAstContext,
    ) -> Result<TantivyQueryAst, InvalidQuery> {
        let (_, terms) = match self.get_terms(context.schema, context.tokenizer_manager) {
            Ok(res) => res,
            Err(InvalidQuery::FieldDoesNotExist { .. }) if self.lenient => {
                return Ok(TantivyQueryAst::match_none());
            }
            Err(e) => return Err(e),
        };

        if terms.is_empty() {
            if self.params.zero_terms_query.is_none() {
                Ok(TantivyQueryAst::match_none())
            } else {
                Ok(TantivyQueryAst::match_all())
            }
        } else {
            let mut phrase_prefix_query = TantivyPhrasePrefixQuery::new_with_offset(terms);
            phrase_prefix_query.set_max_expansions(self.max_expansions);
            Ok(phrase_prefix_query.into())
        }
    }
}


================================================
FILE: quickwit/quickwit-query/src/query_ast/range_query.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::ops::Bound;

use serde::{Deserialize, Serialize};
use tantivy::fastfield::FastValue;
use tantivy::query::FastFieldRangeQuery;
use tantivy::tokenizer::TextAnalyzer;
use tantivy::{DateTime, Term};

use super::QueryAst;
use super::tantivy_query_ast::TantivyBoolQuery;
use crate::json_literal::InterpretUserInput;
use crate::query_ast::{BuildTantivyAst, BuildTantivyAstContext, TantivyQueryAst};
use crate::{InvalidQuery, JsonLiteral};

#[derive(Serialize, Deserialize, Clone, Debug, PartialEq, Eq)]
pub struct RangeQuery {
    pub field: String,
    pub lower_bound: Bound<JsonLiteral>,
    pub upper_bound: Bound<JsonLiteral>,
}

/// Converts a given bound JsonLiteral bound into a bound of type T.
fn convert_bound<'a, T>(bound: &'a Bound<JsonLiteral>) -> Option<Bound<T>>
where T: InterpretUserInput<'a> {
    match bound {
        Bound::Included(val) => {
            let val = T::interpret_json(val)?;
            Some(Bound::Included(val))
        }
        Bound::Excluded(val) => {
            let val = T::interpret_json(val)?;
            Some(Bound::Excluded(val))
        }
        Bound::Unbounded => Some(Bound::Unbounded),
    }
}

/// Converts a given bound JsonLiteral bound into a bound of type T.
fn convert_bounds<'a, T>(
    lower_bound: &'a Bound<JsonLiteral>,
    upper_bound: &'a Bound<JsonLiteral>,
    field_name: &str,
) -> Result<(Bound<T>, Bound<T>), InvalidQuery>
where
    T: InterpretUserInput<'a>,
{
    let invalid_query = || InvalidQuery::InvalidBoundary {
        expected_value_type: T::name(),
        field_name: field_name.to_string(),
    };
    let lower_bound = convert_bound(lower_bound).ok_or_else(invalid_query)?;
    let upper_bound = convert_bound(upper_bound).ok_or_else(invalid_query)?;
    Ok((lower_bound, upper_bound))
}

/// Converts a given bound JsonLiteral bound into a bound of type T.
impl From<RangeQuery> for QueryAst {
    fn from(range_query: RangeQuery) -> Self {
        QueryAst::Range(range_query)
    }
}

fn term_with_fastval<T: FastValue>(term: &Term, val: T) -> Term {
    let mut term = term.clone();
    term.append_type_and_fast_value(val);
    term
}

fn query_from_fast_val_range<T: FastValue>(
    empty_term: &Term,
    range: (Bound<T>, Bound<T>),
) -> FastFieldRangeQuery {
    let (lower_bound, upper_bound) = range;
    FastFieldRangeQuery::new(
        lower_bound.map(|val| term_with_fastval(empty_term, val)),
        upper_bound.map(|val| term_with_fastval(empty_term, val)),
    )
}

fn get_normalized_text(normalizer: &mut Option<TextAnalyzer>, text: &str) -> String {
    if let Some(normalizer) = normalizer {
        let mut token_stream = normalizer.token_stream(text);
        let mut tokens = Vec::new();
        token_stream.process(&mut |token| {
            tokens.push(token.text.clone());
        });
        tokens[0].to_string()
    } else {
        text.to_string()
    }
}

impl BuildTantivyAst for RangeQuery {
    fn build_tantivy_ast_impl(
        &self,
        context: &BuildTantivyAstContext,
    ) -> Result<TantivyQueryAst, InvalidQuery> {
        let (field, field_entry, json_path) =
            super::utils::find_field_or_hit_dynamic(&self.field, context.schema).ok_or_else(
                || InvalidQuery::FieldDoesNotExist {
                    full_path: self.field.clone(),
                },
            )?;
        if !field_entry.is_fast() {
            return Err(InvalidQuery::SchemaError(format!(
                "range queries are only supported for fast fields. (`{}` is not a fast field)",
                field_entry.name()
            )));
        }
        Ok(match field_entry.field_type() {
            tantivy::schema::FieldType::Str(options) => {
                let mut normalizer =
                    options
                        .get_fast_field_tokenizer_name()
                        .and_then(|tokenizer_name| {
                            context.tokenizer_manager.get_normalizer(tokenizer_name)
                        });

                let (lower_bound, upper_bound) =
                    convert_bounds(&self.lower_bound, &self.upper_bound, field_entry.name())?;

                FastFieldRangeQuery::new(
                    lower_bound.map(|text| {
                        Term::from_field_text(field, &get_normalized_text(&mut normalizer, text))
                    }),
                    upper_bound.map(|text| {
                        Term::from_field_text(field, &get_normalized_text(&mut normalizer, text))
                    }),
                )
                .into()
            }
            tantivy::schema::FieldType::U64(_) => {
                let (lower_bound, upper_bound) =
                    convert_bounds(&self.lower_bound, &self.upper_bound, field_entry.name())?;
                FastFieldRangeQuery::new(
                    lower_bound.map(|val| Term::from_field_u64(field, val)),
                    upper_bound.map(|val| Term::from_field_u64(field, val)),
                )
                .into()
            }
            tantivy::schema::FieldType::I64(_) => {
                let (lower_bound, upper_bound) =
                    convert_bounds(&self.lower_bound, &self.upper_bound, field_entry.name())?;
                FastFieldRangeQuery::new(
                    lower_bound.map(|val| Term::from_field_i64(field, val)),
                    upper_bound.map(|val| Term::from_field_i64(field, val)),
                )
                .into()
            }
            tantivy::schema::FieldType::F64(_) => {
                let (lower_bound, upper_bound) =
                    convert_bounds(&self.lower_bound, &self.upper_bound, field_entry.name())?;
                FastFieldRangeQuery::new(
                    lower_bound.map(|val| Term::from_field_f64(field, val)),
                    upper_bound.map(|val| Term::from_field_f64(field, val)),
                )
                .into()
            }
            tantivy::schema::FieldType::Bool(_) => {
                return Err(InvalidQuery::RangeQueryNotSupportedForField {
                    value_type: "bool",
                    field_name: field_entry.name().to_string(),
                });
            }
            tantivy::schema::FieldType::Date(date_options) => {
                let (lower_bound, upper_bound) =
                    convert_bounds(&self.lower_bound, &self.upper_bound, field_entry.name())?;
                let truncate_datetime =
                    |date: &DateTime| date.truncate(date_options.get_precision());
                let lower_bound = lower_bound.as_ref().map(truncate_datetime);
                let upper_bound = upper_bound.as_ref().map(truncate_datetime);
                FastFieldRangeQuery::new(
                    lower_bound.map(|val| Term::from_field_date(field, val)),
                    upper_bound.map(|val| Term::from_field_date(field, val)),
                )
                .into()
            }
            tantivy::schema::FieldType::Facet(_) => {
                return Err(InvalidQuery::RangeQueryNotSupportedForField {
                    value_type: "facet",
                    field_name: field_entry.name().to_string(),
                });
            }
            tantivy::schema::FieldType::Bytes(_) => todo!(),
            tantivy::schema::FieldType::JsonObject(options) => {
                let mut sub_queries: Vec<TantivyQueryAst> = Vec::new();
                let empty_term =
                    Term::from_field_json_path(field, json_path, options.is_expand_dots_enabled());
                // Try to convert the bounds into numerical values in following order i64, u64,
                // f64. Tantivy will convert to the correct numerical type of the column if it
                // doesn't match.
                let bounds_range_i64: Option<(Bound<i64>, Bound<i64>)> =
                    convert_bound(&self.lower_bound).zip(convert_bound(&self.upper_bound));
                let bounds_range_u64: Option<(Bound<u64>, Bound<u64>)> =
                    convert_bound(&self.lower_bound).zip(convert_bound(&self.upper_bound));
                let bounds_range_f64: Option<(Bound<f64>, Bound<f64>)> =
                    convert_bound(&self.lower_bound).zip(convert_bound(&self.upper_bound));
                if let Some(range) = bounds_range_i64 {
                    sub_queries.push(query_from_fast_val_range(&empty_term, range).into());
                } else if let Some(range) = bounds_range_u64 {
                    sub_queries.push(query_from_fast_val_range(&empty_term, range).into());
                } else if let Some(range) = bounds_range_f64 {
                    sub_queries.push(query_from_fast_val_range(&empty_term, range).into());
                }
                let bounds_range_date: Option<(Bound<DateTime>, Bound<DateTime>)> =
                    convert_bound(&self.lower_bound).zip(convert_bound(&self.upper_bound));
                if let Some(range) = bounds_range_date {
                    sub_queries.push(query_from_fast_val_range(&empty_term, range).into());
                }
                let mut normalizer =
                    options
                        .get_fast_field_tokenizer_name()
                        .and_then(|tokenizer_name| {
                            context.tokenizer_manager.get_normalizer(tokenizer_name)
                        });

                let bounds_range_str: Option<(Bound<&str>, Bound<&str>)> =
                    convert_bound(&self.lower_bound).zip(convert_bound(&self.upper_bound));
                if let Some(range) = bounds_range_str {
                    let str_query = FastFieldRangeQuery::new(
                        range.0.map(|val| {
                            let val = get_normalized_text(&mut normalizer, val);
                            let mut term = empty_term.clone();
                            term.append_type_and_str(&val);
                            term
                        }),
                        range.1.map(|val| {
                            let val = get_normalized_text(&mut normalizer, val);
                            let mut term = empty_term.clone();
                            term.append_type_and_str(&val);
                            term
                        }),
                    )
                    .into();
                    sub_queries.push(str_query);
                }
                if sub_queries.is_empty() {
                    return Err(InvalidQuery::InvalidBoundary {
                        expected_value_type: "i64, u64, f64, str",
                        field_name: field_entry.name().to_string(),
                    });
                }
                if sub_queries.len() == 1 {
                    return Ok(sub_queries.pop().unwrap());
                }

                let bool_query = TantivyBoolQuery {
                    should: sub_queries,
                    ..Default::default()
                };
                bool_query.into()
            }
            tantivy::schema::FieldType::IpAddr(_) => {
                let (lower_bound, upper_bound) =
                    convert_bounds(&self.lower_bound, &self.upper_bound, field_entry.name())?;
                FastFieldRangeQuery::new(
                    lower_bound.map(|val| Term::from_field_ip_addr(field, val)),
                    upper_bound.map(|val| Term::from_field_ip_addr(field, val)),
                )
                .into()
            }
        })
    }
}

#[cfg(test)]
mod tests {
    use std::ops::Bound;

    use tantivy::schema::{DateOptions, DateTimePrecision, FAST, STORED, Schema, TEXT};

    use super::RangeQuery;
    use crate::query_ast::{BuildTantivyAst, BuildTantivyAstContext};
    use crate::{InvalidQuery, JsonLiteral, MatchAllOrNone};

    fn make_schema(dynamic_mode: bool) -> Schema {
        let mut schema_builder = Schema::builder();
        schema_builder.add_i64_field("my_i64_field", FAST);
        schema_builder.add_u64_field("my_u64_field", FAST);
        schema_builder.add_f64_field("my_f64_field", FAST);
        schema_builder.add_text_field("my_str_field", FAST);
        let date_options = DateOptions::default()
            .set_fast()
            .set_precision(DateTimePrecision::Milliseconds);
        schema_builder.add_date_field("my_date_field", date_options);
        schema_builder.add_u64_field("my_u64_not_fastfield", STORED);
        if dynamic_mode {
            schema_builder.add_json_field("_dynamic", TEXT | STORED | FAST);
        }
        schema_builder.build()
    }

    fn test_range_query_typed_field_util(
        field: &str,
        lower_value: JsonLiteral,
        upper_value: JsonLiteral,
        expected: &str,
    ) {
        let schema = make_schema(false);
        let range_query = RangeQuery {
            field: field.to_string(),
            lower_bound: Bound::Included(lower_value),
            upper_bound: Bound::Included(upper_value),
        };
        let tantivy_ast = range_query
            .build_tantivy_ast_call(&BuildTantivyAstContext::for_test(&schema))
            .unwrap()
            .simplify();
        let leaf = tantivy_ast.as_leaf().unwrap();
        let leaf_str = format!("{leaf:?}");
        assert_eq!(leaf_str, expected);
    }

    #[test]
    fn test_range_query_typed_field() {
        test_range_query_typed_field_util(
            "my_i64_field",
            JsonLiteral::String("1980".to_string()),
            JsonLiteral::String("1989".to_string()),
            "FastFieldRangeQuery { bounds: BoundsRange { lower_bound: Included(Term(field=0, \
             type=I64, 1980)), upper_bound: Included(Term(field=0, type=I64, 1989)) } }",
        );
        test_range_query_typed_field_util(
            "my_u64_field",
            JsonLiteral::String("1980".to_string()),
            JsonLiteral::String("1989".to_string()),
            "FastFieldRangeQuery { bounds: BoundsRange { lower_bound: Included(Term(field=1, \
             type=U64, 1980)), upper_bound: Included(Term(field=1, type=U64, 1989)) } }",
        );
        test_range_query_typed_field_util(
            "my_f64_field",
            JsonLiteral::String("1980".to_string()),
            JsonLiteral::String("1989".to_string()),
            "FastFieldRangeQuery { bounds: BoundsRange { lower_bound: Included(Term(field=2, \
             type=F64, 1980.0)), upper_bound: Included(Term(field=2, type=F64, 1989.0)) } }",
        );
    }

    #[test]
    fn test_range_query_missing_field() {
        let schema = make_schema(false);
        let range_query = RangeQuery {
            field: "missing_field.toto".to_string(),
            lower_bound: Bound::Included(JsonLiteral::String("1980".to_string())),
            upper_bound: Bound::Included(JsonLiteral::String("1989".to_string())),
        };
        // with validation
        let invalid_query: InvalidQuery = range_query
            .build_tantivy_ast_call(&BuildTantivyAstContext::for_test(&schema))
            .unwrap_err();
        assert!(
            matches!(invalid_query, InvalidQuery::FieldDoesNotExist { full_path } if full_path == "missing_field.toto")
        );
        // without validation
        assert_eq!(
            range_query
                .build_tantivy_ast_call(
                    &BuildTantivyAstContext::for_test(&schema).without_validation()
                )
                .unwrap()
                .const_predicate(),
            Some(MatchAllOrNone::MatchNone)
        );
    }

    #[test]
    fn test_range_dynamic() {
        let range_query = RangeQuery {
            field: "hello".to_string(),
            lower_bound: Bound::Included(JsonLiteral::String("1980".to_string())),
            upper_bound: Bound::Included(JsonLiteral::String("1989".to_string())),
        };
        let schema = make_schema(true);
        let tantivy_ast = range_query
            .build_tantivy_ast_call(&BuildTantivyAstContext::for_test(&schema))
            .unwrap();
        assert_eq!(
            format!("{tantivy_ast:?}"),
            "Bool(TantivyBoolQuery { must: [], must_not: [], should: [Leaf(FastFieldRangeQuery { \
             bounds: BoundsRange { lower_bound: Included(Term(field=6, type=Json, path=hello, \
             type=I64, 1980)), upper_bound: Included(Term(field=6, type=Json, path=hello, \
             type=I64, 1989)) } }), Leaf(FastFieldRangeQuery { bounds: BoundsRange { lower_bound: \
             Included(Term(field=6, type=Json, path=hello, type=Str, \"1980\")), upper_bound: \
             Included(Term(field=6, type=Json, path=hello, type=Str, \"1989\")) } })], filter: \
             [], minimum_should_match: None })"
        );
    }

    #[test]
    fn test_range_dynamic_datetime() {
        let range_query = RangeQuery {
            field: "hello".to_string(),
            lower_bound: Bound::Included(JsonLiteral::String(
                "2020-12-09T16:09:53+00:00".to_string(),
            )),
            upper_bound: Bound::Included(JsonLiteral::String(
                "2020-12-09T16:09:53+00:00".to_string(),
            )),
        };
        let schema = make_schema(true);
        let tantivy_ast = range_query
            .build_tantivy_ast_call(&BuildTantivyAstContext::for_test(&schema))
            .unwrap();
        assert_eq!(
            format!("{tantivy_ast:?}"),
            "Bool(TantivyBoolQuery { must: [], must_not: [], should: [Leaf(FastFieldRangeQuery { \
             bounds: BoundsRange { lower_bound: Included(Term(field=6, type=Json, path=hello, \
             type=Date, 2020-12-09T16:09:53Z)), upper_bound: Included(Term(field=6, type=Json, \
             path=hello, type=Date, 2020-12-09T16:09:53Z)) } }), Leaf(FastFieldRangeQuery { \
             bounds: BoundsRange { lower_bound: Included(Term(field=6, type=Json, path=hello, \
             type=Str, \"2020-12-09T16:09:53+00:00\")), upper_bound: Included(Term(field=6, \
             type=Json, path=hello, type=Str, \"2020-12-09T16:09:53+00:00\")) } })], filter: [], \
             minimum_should_match: None })"
        );
    }

    #[test]
    fn test_range_query_not_fast_field() {
        let range_query = RangeQuery {
            field: "my_u64_not_fastfield".to_string(),
            lower_bound: Bound::Included(JsonLiteral::String("1980".to_string())),
            upper_bound: Bound::Included(JsonLiteral::String("1989".to_string())),
        };
        let schema = make_schema(false);
        let err = range_query
            .build_tantivy_ast_call(&BuildTantivyAstContext::for_test(&schema))
            .unwrap_err();
        assert!(matches!(err, InvalidQuery::SchemaError { .. }));
    }
}


================================================
FILE: quickwit/quickwit-query/src/query_ast/regex_query.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::sync::Arc;

use anyhow::Context;
pub use prefix::{AutomatonQuery, JsonPathPrefix};
use serde::{Deserialize, Serialize};
use tantivy::Term;
use tantivy::schema::{Field, FieldType, Schema as TantivySchema};

use super::{BuildTantivyAst, BuildTantivyAstContext, QueryAst};
use crate::query_ast::TantivyQueryAst;
use crate::{InvalidQuery, find_field_or_hit_dynamic};

/// A Regex query
#[derive(PartialEq, Eq, Debug, Serialize, Deserialize, Clone)]
pub struct RegexQuery {
    pub field: String,
    pub regex: String,
}

impl From<RegexQuery> for QueryAst {
    fn from(regex_query: RegexQuery) -> Self {
        Self::Regex(regex_query)
    }
}

impl RegexQuery {
    #[cfg(test)]
    pub fn from_field_value(field: impl ToString, regex: impl ToString) -> Self {
        Self {
            field: field.to_string(),
            regex: regex.to_string(),
        }
    }
}

impl RegexQuery {
    pub fn to_field_and_regex(
        &self,
        schema: &TantivySchema,
    ) -> Result<(Field, Option<Vec<u8>>, String), InvalidQuery> {
        let Some((field, field_entry, json_path)) = find_field_or_hit_dynamic(&self.field, schema)
        else {
            return Err(InvalidQuery::FieldDoesNotExist {
                full_path: self.field.clone(),
            });
        };
        let field_type = field_entry.field_type();

        match field_type {
            FieldType::Str(text_options) => {
                text_options.get_indexing_options().ok_or_else(|| {
                    InvalidQuery::SchemaError(format!(
                        "field {} is not full-text searchable",
                        field_entry.name()
                    ))
                })?;

                Ok((field, None, self.regex.to_string()))
            }
            FieldType::JsonObject(json_options) => {
                json_options.get_text_indexing_options().ok_or_else(|| {
                    InvalidQuery::SchemaError(format!(
                        "field {} is not full-text searchable",
                        field_entry.name()
                    ))
                })?;

                let mut term_for_path = Term::from_field_json_path(
                    field,
                    json_path,
                    json_options.is_expand_dots_enabled(),
                );
                term_for_path.append_type_and_str("");

                let value = term_for_path.value();
                // We skip the 1st byte which is a marker to tell this is json. This isn't present
                // in the dictionary
                let byte_path_prefix = value.as_serialized()[1..].to_owned();
                Ok((field, Some(byte_path_prefix), self.regex.to_string()))
            }
            _ => Err(InvalidQuery::SchemaError(
                "trying to run a regex query on a non-text field".to_string(),
            )),
        }
    }
}

impl BuildTantivyAst for RegexQuery {
    fn build_tantivy_ast_impl(
        &self,
        context: &BuildTantivyAstContext,
    ) -> Result<TantivyQueryAst, InvalidQuery> {
        let (field, path, regex) = self.to_field_and_regex(context.schema)?;
        let regex = tantivy_fst::Regex::new(&regex).context("failed to parse regex")?;
        let regex_automaton_with_path = JsonPathPrefix {
            prefix: path.unwrap_or_default(),
            automaton: regex.into(),
        };
        let regex_query_with_path = AutomatonQuery {
            field,
            automaton: Arc::new(regex_automaton_with_path),
        };
        Ok(regex_query_with_path.into())
    }
}

mod prefix {
    use std::sync::Arc;

    use tantivy::query::{AutomatonWeight, EnableScoring, Query, Weight};
    use tantivy::schema::Field;
    use tantivy_fst::Automaton;

    pub struct JsonPathPrefix<A> {
        pub prefix: Vec<u8>,
        pub automaton: Arc<A>,
    }

    // we need to implement manually because the std adds an unnecessary bound `A: Clone`
    impl<A> Clone for JsonPathPrefix<A> {
        fn clone(&self) -> Self {
            JsonPathPrefix {
                prefix: self.prefix.clone(),
                automaton: self.automaton.clone(),
            }
        }
    }

    #[derive(Clone, Debug, PartialEq)]
    pub enum JsonPathPrefixState<A> {
        Prefix(usize),
        Inner(A),
        PrefixFailed,
    }

    impl<A: Automaton> Automaton for JsonPathPrefix<A> {
        type State = JsonPathPrefixState<A::State>;

        fn start(&self) -> Self::State {
            if self.prefix.is_empty() {
                JsonPathPrefixState::Inner(self.automaton.start())
            } else {
                JsonPathPrefixState::Prefix(0)
            }
        }

        fn is_match(&self, state: &Self::State) -> bool {
            match state {
                JsonPathPrefixState::Prefix(_) => false,
                JsonPathPrefixState::Inner(inner_state) => self.automaton.is_match(inner_state),
                JsonPathPrefixState::PrefixFailed => false,
            }
        }

        fn accept(&self, state: &Self::State, byte: u8) -> Self::State {
            match state {
                JsonPathPrefixState::Prefix(i) => {
                    if self.prefix.get(*i) != Some(&byte) {
                        return JsonPathPrefixState::PrefixFailed;
                    }
                    let next_pos = i + 1;
                    if next_pos == self.prefix.len() {
                        JsonPathPrefixState::Inner(self.automaton.start())
                    } else {
                        JsonPathPrefixState::Prefix(next_pos)
                    }
                }
                JsonPathPrefixState::Inner(inner_state) => {
                    JsonPathPrefixState::Inner(self.automaton.accept(inner_state, byte))
                }
                JsonPathPrefixState::PrefixFailed => JsonPathPrefixState::PrefixFailed,
            }
        }

        fn can_match(&self, state: &Self::State) -> bool {
            match state {
                JsonPathPrefixState::Prefix(_) => true,
                JsonPathPrefixState::Inner(inner_state) => self.automaton.can_match(inner_state),
                JsonPathPrefixState::PrefixFailed => false,
            }
        }

        fn will_always_match(&self, state: &Self::State) -> bool {
            match state {
                JsonPathPrefixState::Prefix(_) => false,
                JsonPathPrefixState::Inner(inner_state) => {
                    self.automaton.will_always_match(inner_state)
                }
                JsonPathPrefixState::PrefixFailed => false,
            }
        }
    }

    // we don't use RegexQuery to handle our path. We could tinker with the regex to embed
    // json field path inside, but that seems not as clean, and would prevent support of
    // case-insensitive search in the future (we would also make the path insensitive,
    // which we shouldn't)
    pub struct AutomatonQuery<A> {
        pub automaton: Arc<A>,
        pub field: Field,
    }

    impl<A> std::fmt::Debug for AutomatonQuery<A> {
        fn fmt(&self, f: &mut std::fmt::Formatter) -> std::fmt::Result {
            f.debug_struct("AutomatonQuery")
                .field("field", &self.field)
                .field("automaton", &std::any::type_name::<A>())
                .finish()
        }
    }

    impl<A> Clone for AutomatonQuery<A> {
        fn clone(&self) -> Self {
            AutomatonQuery {
                automaton: self.automaton.clone(),
                field: self.field,
            }
        }
    }

    impl<A: Automaton + Send + Sync + 'static> Query for AutomatonQuery<A>
    where A::State: Clone
    {
        fn weight(&self, _enabled_scoring: EnableScoring<'_>) -> tantivy::Result<Box<dyn Weight>> {
            Ok(Box::new(AutomatonWeight::<A>::new(
                self.field,
                self.automaton.clone(),
            )))
        }
    }
}

#[cfg(test)]
mod tests {
    use std::sync::Arc;

    use tantivy::schema::{Schema as TantivySchema, TEXT};
    use tantivy_fst::{Automaton, Regex};

    use super::prefix::JsonPathPrefixState;
    use super::{JsonPathPrefix, RegexQuery};

    #[test]
    fn test_regex_query_text_field() {
        let mut schema_builder = TantivySchema::builder();
        schema_builder.add_text_field("field", TEXT);
        let schema = schema_builder.build();

        let query = RegexQuery {
            field: "field".to_string(),
            regex: "abc.*xyz".to_string(),
        };
        let (field, path, regex) = query.to_field_and_regex(&schema).unwrap();
        assert_eq!(field, schema.get_field("field").unwrap());
        assert!(path.is_none());
        assert_eq!(regex, query.regex);
    }

    #[test]
    fn test_regex_query_json_field() {
        let mut schema_builder = TantivySchema::builder();
        schema_builder.add_json_field("field", TEXT);
        let schema = schema_builder.build();

        let query = RegexQuery {
            field: "field.sub.field".to_string(),
            regex: "abc.*xyz".to_string(),
        };
        let (field, path, regex) = query.to_field_and_regex(&schema).unwrap();
        assert_eq!(field, schema.get_field("field").unwrap());
        assert_eq!(path.unwrap(), b"sub\x01field\0s");
        assert_eq!(regex, query.regex);

        // i believe this is how concatenated field behave
        let query_empty_path = RegexQuery {
            field: "field".to_string(),
            regex: "abc.*xyz".to_string(),
        };
        let (field, path, regex) = query_empty_path.to_field_and_regex(&schema).unwrap();
        assert_eq!(field, schema.get_field("field").unwrap());
        assert_eq!(path.unwrap(), b"\0s");
        assert_eq!(regex, query_empty_path.regex);
    }

    #[test]
    fn test_json_prefix_automaton_empty_path() {
        let regex = Arc::new(Regex::new("e(f|g.*)").unwrap());
        let empty_path_automaton = JsonPathPrefix {
            prefix: Vec::new(),
            automaton: regex.clone(),
        };

        let start = empty_path_automaton.start();
        assert_eq!(start, JsonPathPrefixState::Inner(regex.start()));
    }

    #[test]
    fn test_json_prefix_automaton() {
        let regex = Arc::new(Regex::new("e(f|g.*)").unwrap());
        let automaton = JsonPathPrefix {
            prefix: b"ab".to_vec(),
            automaton: regex.clone(),
        };

        let start = automaton.start();
        assert!(matches!(start, JsonPathPrefixState::Prefix(_)));
        assert!(automaton.can_match(&start));
        assert!(!automaton.is_match(&start));

        let miss = automaton.accept(&start, b'g');
        assert_eq!(miss, JsonPathPrefixState::PrefixFailed);
        // supporting this is important for optimisation
        assert!(!automaton.can_match(&miss));
        assert!(!automaton.is_match(&miss));

        let a = automaton.accept(&start, b'a');
        assert!(matches!(a, JsonPathPrefixState::Prefix(_)));
        assert!(automaton.can_match(&a));
        assert!(!automaton.is_match(&a));

        let ab = automaton.accept(&a, b'b');
        assert_eq!(ab, JsonPathPrefixState::Inner(regex.start()));
        assert!(automaton.can_match(&ab));
        assert!(!automaton.is_match(&ab));

        // starting here, we just take that we passthrough correctly,
        // and reply to can_match as well as possible
        // (we don't test will_always_match because Regex doesn't support it)
        let abc = automaton.accept(&ab, b'c');
        assert!(matches!(abc, JsonPathPrefixState::Inner(_)));
        assert!(!automaton.can_match(&abc));
        assert!(!automaton.is_match(&abc));

        let abe = automaton.accept(&ab, b'e');
        assert!(matches!(abe, JsonPathPrefixState::Inner(_)));
        assert!(automaton.can_match(&abe));
        assert!(!automaton.is_match(&abe));

        let abef = automaton.accept(&abe, b'f');
        assert!(matches!(abef, JsonPathPrefixState::Inner(_)));
        assert!(automaton.can_match(&abef));
        assert!(automaton.is_match(&abef));

        let abefg = automaton.accept(&abef, b'g');
        assert!(matches!(abefg, JsonPathPrefixState::Inner(_)));
        assert!(!automaton.can_match(&abefg));
        assert!(!automaton.is_match(&abefg));

        let abeg = automaton.accept(&abe, b'g');
        assert!(matches!(abeg, JsonPathPrefixState::Inner(_)));
        assert!(automaton.can_match(&abeg));
        assert!(automaton.is_match(&abeg));

        let abegh = automaton.accept(&abeg, b'h');
        assert!(matches!(abegh, JsonPathPrefixState::Inner(_)));
        assert!(automaton.can_match(&abegh));
        assert!(automaton.is_match(&abegh));
    }
}


================================================
FILE: quickwit/quickwit-query/src/query_ast/tantivy_query_ast.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use tantivy::query::{
    AllQuery as TantivyAllQuery, BooleanQuery, ConstScoreQuery as TantivyConstScoreQuery,
    EmptyQuery as TantivyEmptyQuery,
};
use tantivy::query_grammar::Occur;

use crate::{BooleanOperand, MatchAllOrNone, TantivyQuery};

/// This AST point, is only to make it easier to simplify the generated Tantivy query.
/// when we convert a QueryAst into a TantivyQueryAst.
///
/// Let's keep private.
#[derive(Debug)]
pub(crate) enum TantivyQueryAst {
    Bool(TantivyBoolQuery),
    Leaf(Box<dyn TantivyQuery>),
    ConstPredicate(MatchAllOrNone),
}

impl Clone for TantivyQueryAst {
    fn clone(&self) -> Self {
        match self {
            TantivyQueryAst::Bool(bool_query) => TantivyQueryAst::Bool(bool_query.clone()),
            TantivyQueryAst::ConstPredicate(predicate) => {
                TantivyQueryAst::ConstPredicate(*predicate)
            }
            TantivyQueryAst::Leaf(query) => TantivyQueryAst::Leaf(query.box_clone()),
        }
    }
}

impl From<MatchAllOrNone> for TantivyQueryAst {
    fn from(match_all_or_none: MatchAllOrNone) -> Self {
        TantivyQueryAst::ConstPredicate(match_all_or_none)
    }
}

impl PartialEq for TantivyQueryAst {
    fn eq(&self, other: &Self) -> bool {
        match (self, other) {
            (Self::Bool(left), Self::Bool(right)) => left == right,
            (Self::Leaf(left), Self::Leaf(right)) => {
                let left_str: String = format!("{left:?}");
                let right_str: String = format!("{right:?}");
                left_str == right_str
            }
            (Self::ConstPredicate(left), Self::ConstPredicate(right)) => left == right,
            _ => false,
        }
    }
}

impl Eq for TantivyQueryAst {}

impl TantivyQueryAst {
    #[cfg(test)]
    pub(crate) fn as_bool_query(&self) -> Option<&TantivyBoolQuery> {
        match self {
            TantivyQueryAst::Bool(bool) => Some(bool),
            _ => None,
        }
    }

    #[cfg(test)]
    pub(crate) fn as_leaf(&self) -> Option<&dyn TantivyQuery> {
        match self {
            TantivyQueryAst::Leaf(tantivy_query) => Some(&**tantivy_query),
            _ => None,
        }
    }

    pub(crate) fn const_predicate(&self) -> Option<MatchAllOrNone> {
        if let Self::ConstPredicate(always_or_never) = self {
            Some(*always_or_never)
        } else {
            None
        }
    }

    pub fn match_all() -> Self {
        Self::ConstPredicate(MatchAllOrNone::MatchAll)
    }

    pub fn match_none() -> Self {
        Self::ConstPredicate(MatchAllOrNone::MatchNone)
    }

    pub fn simplify(self) -> TantivyQueryAst {
        match self {
            TantivyQueryAst::Bool(bool_query) => bool_query.simplify(),
            ast => ast,
        }
    }
}

impl<Q: TantivyQuery> From<Q> for TantivyQueryAst {
    fn from(query: Q) -> TantivyQueryAst {
        TantivyQueryAst::Leaf(Box::new(query))
    }
}

impl From<TantivyQueryAst> for Box<dyn TantivyQuery> {
    fn from(boxed_tantivy_query: TantivyQueryAst) -> Box<dyn TantivyQuery> {
        match boxed_tantivy_query {
            TantivyQueryAst::Bool(boolean_query) => boolean_query.into(),
            TantivyQueryAst::Leaf(leaf) => leaf,
            TantivyQueryAst::ConstPredicate(always_or_never_match) => match always_or_never_match {
                MatchAllOrNone::MatchAll => Box::new(TantivyAllQuery),
                MatchAllOrNone::MatchNone => Box::new(TantivyEmptyQuery),
            },
        }
    }
}

// Remove the occurrence of trivial AST in the given list of asts.
//
// If `stop_before_empty` is true, then we will make sure to stop removing asts if it is
// the last element.
// This function may change the order of asts.
fn remove_with_guard(
    asts: &mut Vec<TantivyQueryAst>,
    to_remove: MatchAllOrNone,
    stop_before_empty: bool,
) {
    let mut i = 0;
    while i < asts.len() {
        if stop_before_empty && asts.len() == 1 {
            break;
        }
        if asts[i].const_predicate() == Some(to_remove) {
            asts.swap_remove(i);
        } else {
            i += 1;
        }
    }
}

#[derive(Default, Debug, Clone, Eq, PartialEq)]
pub(crate) struct TantivyBoolQuery {
    pub must: Vec<TantivyQueryAst>,
    pub must_not: Vec<TantivyQueryAst>,
    pub should: Vec<TantivyQueryAst>,
    pub filter: Vec<TantivyQueryAst>,
    pub minimum_should_match: Option<usize>,
}

fn simplify_asts(asts: Vec<TantivyQueryAst>) -> Vec<TantivyQueryAst> {
    asts.into_iter().map(|ast| ast.simplify()).collect()
}

impl TantivyBoolQuery {
    pub fn build_clause(operator: BooleanOperand, children: Vec<TantivyQueryAst>) -> Self {
        match operator {
            BooleanOperand::And => Self {
                must: children,
                ..Default::default()
            },
            BooleanOperand::Or => Self {
                should: children,
                ..Default::default()
            },
        }
    }

    pub fn simplify(mut self) -> TantivyQueryAst {
        // simplify sub branches
        self.must = simplify_asts(self.must);
        self.should = simplify_asts(self.should);
        self.must_not = simplify_asts(self.must_not);
        self.filter = simplify_asts(self.filter);

        for must_children in [&mut self.must, &mut self.filter] {
            for child in must_children {
                if child.const_predicate() == Some(MatchAllOrNone::MatchNone) {
                    return TantivyQueryAst::ConstPredicate(MatchAllOrNone::MatchNone);
                }
            }
        }
        if self.should.is_empty()
            && self.must.is_empty()
            && self.filter.is_empty()
            && self.must_not.is_empty()
            && self.minimum_should_match.unwrap_or(0) == 0
        {
            // This is just a convention mimicking Elastic/Commonsearch's behavior.
            return TantivyQueryAst::match_all();
        }

        let mut new_must = Vec::with_capacity(self.must.len());
        for must in self.must {
            let mut must_bool = match must {
                TantivyQueryAst::Bool(bool_query) => bool_query,
                _ => {
                    new_must.push(must);
                    continue;
                }
            };
            if must_bool.should.is_empty() && must_bool.minimum_should_match.is_none() {
                new_must.append(&mut must_bool.must);
                self.filter.append(&mut must_bool.filter);
                self.must_not.append(&mut must_bool.must_not);
            } else {
                new_must.push(TantivyQueryAst::Bool(must_bool));
            }
        }
        self.must = new_must;

        let mut new_filter = Vec::with_capacity(self.filter.len());
        for filter in self.filter {
            let mut filter_bool = match filter {
                TantivyQueryAst::Bool(bool_query) => bool_query,
                _ => {
                    new_filter.push(filter);
                    continue;
                }
            };
            if filter_bool.should.is_empty() && filter_bool.minimum_should_match.is_none() {
                new_filter.append(&mut filter_bool.must);
                new_filter.append(&mut filter_bool.filter);
                // must_not doesn't contribute to score, no need to move it to some filter_not kind
                // of thing
                self.must_not.append(&mut filter_bool.must_not);
            } else {
                new_filter.push(TantivyQueryAst::Bool(filter_bool));
            }
        }
        self.filter = new_filter;

        if self.minimum_should_match.is_none() {
            let mut new_should = Vec::with_capacity(self.should.len());
            for should in self.should {
                let mut should_bool = match should {
                    TantivyQueryAst::Bool(bool_query) => bool_query,
                    _ => {
                        new_should.push(should);
                        continue;
                    }
                };
                if should_bool.must.is_empty()
                    && should_bool.filter.is_empty()
                    && should_bool.must_not.is_empty()
                    && should_bool.minimum_should_match.is_none()
                {
                    new_should.append(&mut should_bool.should);
                } else {
                    new_should.push(TantivyQueryAst::Bool(should_bool));
                }
            }
            self.should = new_should;
        }

        // TODO we could turn must_not(must_not(abc, def)) into should(filter(abc), filter(def)),
        // we can't simply have should(abc, def) because of scoring, and should(filter(abc, def))
        // has a different meaning

        // remove sub-queries which don't impact the result
        remove_with_guard(&mut self.must, MatchAllOrNone::MatchAll, true);
        let mut has_no_positive_ast_so_far = self.must.is_empty();
        remove_with_guard(
            &mut self.filter,
            MatchAllOrNone::MatchAll,
            has_no_positive_ast_so_far,
        );
        has_no_positive_ast_so_far &= self.filter.is_empty();
        if !self.filter.is_empty() {
            // if filter is not empty, we can re-try cleaning must. we can't just check
            // has_no_positive_ast_so_far as it would clean must if must or filter contained
            // something
            remove_with_guard(&mut self.must, MatchAllOrNone::MatchAll, false);
        }
        remove_with_guard(
            &mut self.should,
            MatchAllOrNone::MatchNone,
            has_no_positive_ast_so_far,
        );
        has_no_positive_ast_so_far &= self.should.is_empty();
        remove_with_guard(
            &mut self.must_not,
            MatchAllOrNone::MatchNone,
            has_no_positive_ast_so_far,
        );

        for must_child in self.must.iter().chain(self.filter.iter()) {
            if must_child.const_predicate() == Some(MatchAllOrNone::MatchNone) {
                return TantivyQueryAst::ConstPredicate(MatchAllOrNone::MatchNone);
            }
        }
        for must_not_child in &self.must_not {
            if must_not_child.const_predicate() == Some(MatchAllOrNone::MatchAll) {
                return TantivyQueryAst::ConstPredicate(MatchAllOrNone::MatchNone);
            }
        }
        let has_positive_children =
            !(self.must.is_empty() && self.should.is_empty() && self.filter.is_empty());

        if !has_positive_children {
            if self.minimum_should_match.unwrap_or(0) > 0 {
                return MatchAllOrNone::MatchNone.into();
            }
            if self
                .must_not
                .iter()
                .all(|must_not| must_not.const_predicate() == Some(MatchAllOrNone::MatchNone))
            {
                return MatchAllOrNone::MatchAll.into();
            }
            self.must.push(TantivyQueryAst::match_all());
        } else {
            let num_children =
                self.must.len() + self.should.len() + self.must_not.len() + self.filter.len();
            if num_children == 1
                && self.minimum_should_match.is_none()
                && let Some(ast) = self.must.pop().or(self.should.pop())
            {
                return ast;
            }
            // We do not optimize a single filter clause for the moment.
            // We do need a mechanism to make sure we keep the boost of 0.
        }

        TantivyQueryAst::Bool(self)
    }
}

impl From<TantivyBoolQuery> for TantivyQueryAst {
    fn from(bool_query: TantivyBoolQuery) -> Self {
        TantivyQueryAst::Bool(bool_query)
    }
}

impl From<TantivyBoolQuery> for Box<dyn TantivyQuery> {
    fn from(bool_query: TantivyBoolQuery) -> Box<dyn TantivyQuery> {
        let mut clause: Vec<(Occur, Box<dyn TantivyQuery>)> = Vec::with_capacity(
            bool_query.must.len()
                + bool_query.must_not.len()
                + bool_query.should.len()
                + bool_query.filter.len(),
        );
        for (occur, child_asts) in [
            (Occur::Must, bool_query.must),
            (Occur::MustNot, bool_query.must_not),
            (Occur::Should, bool_query.should),
        ] {
            for child_ast in child_asts {
                let sub_query = child_ast.into();
                clause.push((occur, sub_query));
            }
        }
        for filter_child in bool_query.filter {
            let filter_query = filter_child.into();
            clause.push((
                Occur::Must,
                Box::new(TantivyConstScoreQuery::new(filter_query, 0.0f32)),
            ));
        }
        let tantivy_bool_query = if let Some(minimum_should_match) = bool_query.minimum_should_match
        {
            BooleanQuery::with_minimum_required_clauses(clause, minimum_should_match)
        } else {
            BooleanQuery::from(clause)
        };
        Box::new(tantivy_bool_query)
    }
}

#[cfg(test)]
mod tests {
    use proptest::prelude::*;
    use tantivy::query::{EmptyQuery, TermQuery};

    use super::TantivyBoolQuery;
    use crate::query_ast::tantivy_query_ast::{MatchAllOrNone, TantivyQueryAst, remove_with_guard};

    fn term(val: &str) -> TantivyQueryAst {
        use tantivy::schema::{Field, Term};
        TermQuery::new(
            Term::from_field_text(Field::from_field_id(0), val),
            Default::default(),
        )
        .into()
    }

    #[test]
    fn test_simplify_bool_query_with_no_clauses() {
        let bool_query = TantivyBoolQuery::default();
        assert_eq!(bool_query.simplify(), TantivyQueryAst::match_all());
    }

    #[test]
    fn test_remove_with_guard() {
        {
            let mut asts = Vec::new();
            // we are just checking for panics
            remove_with_guard(&mut asts, MatchAllOrNone::MatchAll, true);
            remove_with_guard(&mut asts, MatchAllOrNone::MatchAll, false);
        }
        {
            let mut asts = vec![
                MatchAllOrNone::MatchAll.into(),
                MatchAllOrNone::MatchAll.into(),
            ];
            remove_with_guard(&mut asts, MatchAllOrNone::MatchAll, true);
            assert_eq!(asts.len(), 1);
        }
        {
            let mut asts = vec![
                MatchAllOrNone::MatchAll.into(),
                MatchAllOrNone::MatchAll.into(),
            ];
            remove_with_guard(&mut asts, MatchAllOrNone::MatchAll, false);
            assert!(asts.is_empty());
        }
        {
            let mut asts = vec![
                MatchAllOrNone::MatchAll.into(),
                MatchAllOrNone::MatchNone.into(),
                MatchAllOrNone::MatchAll.into(),
            ];
            remove_with_guard(&mut asts, MatchAllOrNone::MatchAll, true);
            assert_eq!(asts.len(), 1);
        }
        {
            let mut asts = vec![
                MatchAllOrNone::MatchAll.into(),
                MatchAllOrNone::MatchNone.into(),
                MatchAllOrNone::MatchAll.into(),
            ];
            remove_with_guard(&mut asts, MatchAllOrNone::MatchAll, false);
            assert_eq!(asts.len(), 1);
        }
    }

    #[test]
    fn test_simplify_bool_query_with_one_clauses() {
        {
            let tantivy_query = EmptyQuery.into();
            let bool_query = TantivyBoolQuery {
                must: vec![tantivy_query],
                ..Default::default()
            };
            assert!(bool_query.simplify().as_leaf().is_some());
        }
        {
            let tantivy_query = EmptyQuery.into();
            let bool_query = TantivyBoolQuery {
                should: vec![tantivy_query],
                ..Default::default()
            };
            assert!(bool_query.simplify().as_leaf().is_some());
        }
        {
            let tantivy_query = EmptyQuery.into();
            let bool_query = TantivyBoolQuery {
                filter: vec![tantivy_query],
                ..Default::default()
            };
            // We do not simplify filter. We somehow need a mechanism to make sure we end up with a
            // const-score.
            assert!(bool_query.simplify().as_leaf().is_none());
        }
    }

    #[test]
    fn test_bool_negative_query_add_wildcard() {
        let tantivy_query = EmptyQuery.into();
        let simplified_ast = TantivyBoolQuery {
            must_not: vec![tantivy_query],
            ..Default::default()
        }
        .simplify();
        let simplified_ast_bool = simplified_ast.as_bool_query().unwrap();
        assert_eq!(simplified_ast_bool.must_not.len(), 1);
        assert_eq!(
            simplified_ast_bool.should.len() + simplified_ast_bool.filter.len(),
            0
        );
        assert_eq!(simplified_ast_bool.must.len(), 1);
        assert_eq!(
            simplified_ast_bool.must[0].const_predicate(),
            Some(MatchAllOrNone::MatchAll)
        );
    }

    #[test]
    fn test_bool_multiple_negative_query_add_wildcard() {
        let simplified_ast = TantivyBoolQuery {
            must_not: vec![EmptyQuery.into(), EmptyQuery.into()],
            ..Default::default()
        }
        .simplify();
        let simplified_ast_bool = simplified_ast.as_bool_query().unwrap();
        assert_eq!(simplified_ast_bool.must_not.len(), 2);
        assert_eq!(
            simplified_ast_bool.should.len() + simplified_ast_bool.filter.len(),
            0
        );
        assert_eq!(simplified_ast_bool.must.len(), 1);
        assert_eq!(
            simplified_ast_bool.must[0].const_predicate(),
            Some(MatchAllOrNone::MatchAll)
        );
    }

    #[test]
    fn test_bool_multiple_negative_query_with_positive() {
        let simplified_ast = TantivyBoolQuery {
            must: vec![EmptyQuery.into()],
            must_not: vec![EmptyQuery.into(), EmptyQuery.into()],
            ..Default::default()
        }
        .simplify();
        let simplified_ast_bool = simplified_ast.as_bool_query().unwrap();
        assert_eq!(simplified_ast_bool.must_not.len(), 2);
        assert_eq!(
            simplified_ast_bool.should.len() + simplified_ast_bool.filter.len(),
            0
        );
        assert_eq!(simplified_ast_bool.must.len(), 1);
        assert!(simplified_ast_bool.must[0].const_predicate().is_none(),);
    }

    #[test]
    fn test_should_lift_simplification() {
        let test_leaf = TantivyQueryAst::Leaf(Box::new(tantivy::query::AllQuery));
        let ast = TantivyQueryAst::Bool(TantivyBoolQuery {
            should: vec![
                test_leaf.clone(),
                TantivyQueryAst::Bool(TantivyBoolQuery {
                    should: vec![test_leaf.clone(), test_leaf],
                    ..Default::default()
                }),
            ],
            ..Default::default()
        });
        let simplified_ast = ast.clone().simplify();
        assert_ne!(simplified_ast, ast);
        let TantivyQueryAst::Bool(bool_query) = simplified_ast else {
            panic!();
        };
        assert_eq!(bool_query.should.len(), 3);
        assert!(bool_query.must.is_empty());
        assert!(bool_query.filter.is_empty());
        assert!(bool_query.must_not.is_empty());
        assert!(bool_query.minimum_should_match.is_none());
    }

    #[test]
    fn test_minimum_should_match_prevent_lift_simplification() {
        let test_leaf = TantivyQueryAst::Leaf(Box::new(tantivy::query::AllQuery));
        let ast = TantivyQueryAst::Bool(TantivyBoolQuery {
            should: vec![
                test_leaf.clone(),
                TantivyQueryAst::Bool(TantivyBoolQuery {
                    should: vec![test_leaf.clone(), test_leaf],
                    ..Default::default()
                }),
            ],
            minimum_should_match: Some(2),
            ..Default::default()
        });
        let simplified_ast = ast.clone().simplify();
        assert_eq!(simplified_ast, ast);
    }

    #[test]
    fn test_simplify_bool_query_with_match_all_must_not_clauses() {
        let tantivy_query = EmptyQuery.into();
        let bool_query = TantivyBoolQuery {
            must: vec![tantivy_query],
            must_not: vec![TantivyQueryAst::match_all()],
            ..Default::default()
        };
        assert_eq!(
            bool_query.simplify().const_predicate(),
            Some(MatchAllOrNone::MatchNone)
        );
    }

    #[test]
    fn test_simplify_bool_query_with_match_must_clauses() {
        let tantivy_query = EmptyQuery.into();
        let bool_query = TantivyBoolQuery {
            must: vec![tantivy_query, TantivyQueryAst::match_all()],
            ..Default::default()
        }
        .simplify();
        assert!(bool_query.as_leaf().is_some());
    }

    #[test]
    fn test_simplify_bool_query_with_match_must_and_other_positive_clauses() {
        let bool_query = TantivyBoolQuery {
            must: vec![TantivyQueryAst::match_all()],
            filter: vec![EmptyQuery.into()],
            ..Default::default()
        }
        .simplify();
        assert_eq!(
            bool_query,
            TantivyBoolQuery {
                filter: vec![EmptyQuery.into()],
                ..Default::default()
            }
            .into()
        );
    }

    #[test]
    fn test_simplify_bool_query_with_match_none_must_clauses() {
        let tantivy_query = EmptyQuery.into();
        let bool_query = TantivyBoolQuery {
            must: vec![TantivyQueryAst::match_none()],
            should: vec![tantivy_query],
            ..Default::default()
        }
        .simplify();
        assert_eq!(
            bool_query.const_predicate(),
            Some(MatchAllOrNone::MatchNone)
        );
    }

    #[test]
    fn test_simplify_bool_query_with_match_none_no_positive_clauses() {
        let bool_query = TantivyBoolQuery {
            must_not: vec![TantivyQueryAst::match_none()],
            ..Default::default()
        }
        .simplify();
        assert_eq!(bool_query.const_predicate(), Some(MatchAllOrNone::MatchAll));
    }

    #[test]
    fn test_simplify_empty_bool_query_matches_all() {
        let empty_bool_query = TantivyBoolQuery::default().simplify();
        assert_eq!(
            empty_bool_query.const_predicate(),
            Some(MatchAllOrNone::MatchAll)
        );
    }

    #[test]
    fn test_simplify_lift_bool_bool() {
        let bool_query = TantivyBoolQuery {
            must: vec![
                TantivyBoolQuery {
                    must: vec![term("abc"), term("def")],
                    ..Default::default()
                }
                .into(),
                TantivyBoolQuery {
                    must: vec![term("ghi"), term("jkl")],
                    ..Default::default()
                }
                .into(),
            ],
            ..Default::default()
        }
        .simplify();
        assert_eq!(
            bool_query,
            TantivyBoolQuery {
                must: vec![term("abc"), term("def"), term("ghi"), term("jkl"),],
                ..Default::default()
            }
            .into()
        );

        let bool_query = TantivyBoolQuery {
            should: vec![
                TantivyBoolQuery {
                    should: vec![term("abc"), term("def")],
                    ..Default::default()
                }
                .into(),
                TantivyBoolQuery {
                    should: vec![term("ghi"), term("jkl")],
                    ..Default::default()
                }
                .into(),
            ],
            ..Default::default()
        }
        .simplify();
        assert_eq!(
            bool_query,
            TantivyBoolQuery {
                should: vec![term("abc"), term("def"), term("ghi"), term("jkl"),],
                ..Default::default()
            }
            .into()
        );

        let bool_query = TantivyBoolQuery {
            must: vec![
                TantivyBoolQuery {
                    must: vec![term("abc"), term("def")],
                    ..Default::default()
                }
                .into(),
                TantivyBoolQuery {
                    should: vec![term("ghi"), term("jkl")],
                    ..Default::default()
                }
                .into(),
            ],
            ..Default::default()
        }
        .simplify();
        assert_eq!(
            bool_query,
            TantivyBoolQuery {
                must: vec![
                    term("abc"),
                    term("def"),
                    TantivyBoolQuery {
                        should: vec![term("ghi"), term("jkl")],
                        ..Default::default()
                    }
                    .into(),
                ],
                ..Default::default()
            }
            .into()
        );

        let bool_query = TantivyBoolQuery {
            should: vec![
                TantivyBoolQuery {
                    must: vec![term("abc")],
                    ..Default::default()
                }
                .into(),
                TantivyBoolQuery {
                    filter: vec![term("ghi")],
                    ..Default::default()
                }
                .into(),
            ],
            ..Default::default()
        }
        .simplify();
        assert_eq!(
            bool_query,
            TantivyBoolQuery {
                should: vec![
                    term("abc"),
                    // filter can't get optimized for scoring reasons
                    TantivyBoolQuery {
                        filter: vec![term("ghi")],
                        ..Default::default()
                    }
                    .into(),
                ],
                ..Default::default()
            }
            .into()
        );

        let bool_query = TantivyBoolQuery {
            must: vec![
                TantivyBoolQuery {
                    should: vec![term("abc")],
                    ..Default::default()
                }
                .into(),
                TantivyBoolQuery {
                    should: vec![term("def")],
                    ..Default::default()
                }
                .into(),
            ],
            ..Default::default()
        }
        .simplify();
        assert_eq!(
            bool_query,
            TantivyBoolQuery {
                must: vec![term("abc"), term("def"),],
                ..Default::default()
            }
            .into()
        );

        let bool_query = TantivyBoolQuery {
            must_not: vec![
                TantivyBoolQuery {
                    should: vec![term("abc")],
                    ..Default::default()
                }
                .into(),
                TantivyBoolQuery {
                    must: vec![term("def")],
                    ..Default::default()
                }
                .into(),
            ],
            ..Default::default()
        }
        .simplify();
        assert_eq!(
            bool_query,
            TantivyBoolQuery {
                must: vec![MatchAllOrNone::MatchAll.into()],
                must_not: vec![term("abc"), term("def"),],
                ..Default::default()
            }
            .into()
        );

        let bool_query = TantivyBoolQuery {
            must: vec![
                TantivyBoolQuery {
                    must_not: vec![term("abc"), term("def")],
                    ..Default::default()
                }
                .into(),
                TantivyBoolQuery {
                    must_not: vec![term("ghi")],
                    ..Default::default()
                }
                .into(),
            ],
            ..Default::default()
        }
        .simplify();
        assert_eq!(
            bool_query,
            TantivyBoolQuery {
                must: vec![MatchAllOrNone::MatchAll.into()],
                must_not: vec![term("abc"), term("def"), term("ghi"),],
                ..Default::default()
            }
            .into()
        );
    }

    #[derive(Debug, Clone)]
    struct ConstQuery(bool, u32);

    impl tantivy::query::Query for ConstQuery {
        fn weight(
            &self,
            _: tantivy::query::EnableScoring<'_>,
        ) -> tantivy::Result<Box<dyn tantivy::query::Weight>> {
            unimplemented!()
        }
    }

    impl TantivyQueryAst {
        fn evaluate_test(&self) -> Option<u32> {
            match self {
                TantivyQueryAst::ConstPredicate(MatchAllOrNone::MatchNone) => None,
                TantivyQueryAst::ConstPredicate(MatchAllOrNone::MatchAll) => Some(0),
                TantivyQueryAst::Bool(bool_query) => bool_query.evaluate_test(),
                TantivyQueryAst::Leaf(query) => {
                    let const_query = query
                        .downcast_ref::<ConstQuery>()
                        .expect("query wasn't a ConstQuery");
                    const_query.0.then_some(const_query.1)
                }
            }
        }
    }

    impl TantivyBoolQuery {
        fn evaluate_test(&self) -> Option<u32> {
            if self
                .must_not
                .iter()
                .any(|sub_ast| sub_ast.evaluate_test().is_some())
            {
                return None;
            }

            let mut should_score = 0u32;
            let mut matching_should_count = 0;
            for should in &self.should {
                if let Some(score) = should.evaluate_test() {
                    should_score += score;
                    matching_should_count += 1;
                }
            }

            if let Some(minimum_should_match) = self.minimum_should_match
                && minimum_should_match > matching_should_count
            {
                return None;
            }

            if self.must.len() + self.filter.len() > 0 {
                if self
                    .must
                    .iter()
                    .all(|sub_ast| sub_ast.evaluate_test().is_some())
                    && self
                        .filter
                        .iter()
                        .all(|sub_ast| sub_ast.evaluate_test().is_some())
                {
                    Some(
                        self.must
                            .iter()
                            .map(|sub_ast| sub_ast.evaluate_test().unwrap())
                            .sum::<u32>()
                            + should_score,
                    )
                } else {
                    None
                }
            } else {
                if self.should.is_empty() {
                    // by convention, an empty query returns all match.
                    return Some(0);
                }
                self.should
                    .iter()
                    .any(|sub_ast| sub_ast.evaluate_test().is_some())
                    .then_some(should_score)
            }
        }
    }

    fn ast_strategy() -> impl Strategy<Value = TantivyQueryAst> {
        let ast_leaf = proptest::prop_oneof![
            Just(TantivyQueryAst::ConstPredicate(MatchAllOrNone::MatchNone)),
            Just(TantivyQueryAst::ConstPredicate(MatchAllOrNone::MatchAll)),
            (prop::bool::ANY, 0u32..5)
                .prop_map(|(matc, score)| TantivyQueryAst::Leaf(Box::new(ConstQuery(matc, score)))),
        ];

        ast_leaf.prop_recursive(4, 32, 16, |element| {
            let must = proptest::collection::vec(element.clone(), 0..4);
            let filter = proptest::collection::vec(element.clone(), 0..4);
            let should = proptest::collection::vec(element.clone(), 0..4);
            let must_not = proptest::collection::vec(element.clone(), 0..4);
            let minimum_should_match = (0usize..=2).prop_map(|n: usize| n.checked_sub(1));
            (must, filter, should, must_not, minimum_should_match).prop_map(
                |(must, filter, should, must_not, minimum_should_match)| {
                    TantivyQueryAst::Bool(TantivyBoolQuery {
                        must,
                        filter,
                        should,
                        must_not,
                        minimum_should_match,
                    })
                },
            )
        })
    }

    #[track_caller]
    fn test_aux_simplify_never_change_result(ast: TantivyQueryAst) {
        let simplified_ast = ast.clone().simplify();
        assert_eq!(dbg!(simplified_ast).evaluate_test(), ast.evaluate_test());
    }

    proptest::proptest! {
        #![proptest_config(ProptestConfig {
          cases: 100000, .. ProptestConfig::default()
        })]
        #[test]
        fn test_proptest_simplify_never_change_result(ast in ast_strategy()) {
            test_aux_simplify_never_change_result(ast);
        }
    }

    #[test]
    fn test_simplify_never_change_result_simple_corner_case() {
        let ast = TantivyQueryAst::Bool(TantivyBoolQuery {
            minimum_should_match: Some(1),
            ..Default::default()
        });
        test_aux_simplify_never_change_result(ast);
    }
}


================================================
FILE: quickwit/quickwit-query/src/query_ast/term_query.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::HashMap;

use serde::{Deserialize, Serialize};

use super::{BuildTantivyAst, QueryAst};
use crate::query_ast::{BuildTantivyAstContext, FullTextParams, TantivyQueryAst};
use crate::{BooleanOperand, InvalidQuery};

/// The TermQuery acts exactly like a FullTextQuery with
/// a raw tokenizer.
#[derive(PartialEq, Eq, Debug, Serialize, Deserialize, Clone)]
pub struct TermQuery {
    pub field: String,
    pub value: String,
}

impl From<TermQuery> for QueryAst {
    fn from(term_query: TermQuery) -> Self {
        Self::Term(term_query)
    }
}

impl TermQuery {
    #[cfg(test)]
    pub fn from_field_value(field: impl ToString, value: impl ToString) -> Self {
        Self {
            field: field.to_string(),
            value: value.to_string(),
        }
    }
}

impl BuildTantivyAst for TermQuery {
    fn build_tantivy_ast_impl(
        &self,
        context: &BuildTantivyAstContext,
    ) -> Result<TantivyQueryAst, InvalidQuery> {
        let full_text_params = FullTextParams {
            tokenizer: Some("raw".to_string()),
            // The parameter below won't matter, since we will have only one term
            mode: BooleanOperand::Or.into(),
            zero_terms_query: Default::default(),
        };
        crate::query_ast::utils::full_text_query(
            &self.field,
            &self.value,
            &full_text_params,
            context.schema,
            context.tokenizer_manager,
            false,
        )
    }
}

// Private struct used for serialization.
// It represents the value of a term query. in the json form : `{field: <TermQueryValue>}`.
#[derive(Serialize, Deserialize)]
struct TermQueryValue {
    value: String,
}

impl From<TermQuery> for (String, TermQueryValue) {
    fn from(term_query: TermQuery) -> Self {
        (
            term_query.field,
            TermQueryValue {
                value: term_query.value,
            },
        )
    }
}

impl From<(String, TermQueryValue)> for TermQuery {
    fn from((field, term_query_value): (String, TermQueryValue)) -> Self {
        Self {
            field,
            value: term_query_value.value,
        }
    }
}

impl TryFrom<HashMap<String, TermQueryValue>> for TermQuery {
    type Error = &'static str;

    fn try_from(map: HashMap<String, TermQueryValue>) -> Result<Self, Self::Error> {
        if map.len() > 1 {
            return Err("TermQuery must have exactly one entry");
        }
        Ok(TermQuery::from(map.into_iter().next().unwrap())) // unwrap justified by the if
        // statementabove.
    }
}

impl From<TermQuery> for HashMap<String, TermQueryValue> {
    fn from(term_query: TermQuery) -> HashMap<String, TermQueryValue> {
        let (field, term_query_value) = term_query.into();
        let mut map = HashMap::with_capacity(1);
        map.insert(field, term_query_value);
        map
    }
}

#[cfg(test)]
mod tests {
    use tantivy::schema::{INDEXED, Schema};

    use crate::query_ast::{BuildTantivyAst, BuildTantivyAstContext, TermQuery};

    #[test]
    fn test_term_query_with_ipaddr_ipv4() {
        let term_query = TermQuery {
            field: "ip".to_string(),
            value: "127.0.0.1".to_string(),
        };
        let mut schema_builder = Schema::builder();
        schema_builder.add_ip_addr_field("ip", INDEXED);
        let schema = schema_builder.build();
        let tantivy_query_ast = term_query
            .build_tantivy_ast_call(&BuildTantivyAstContext::for_test(&schema))
            .unwrap();
        let leaf = tantivy_query_ast.as_leaf().unwrap();
        assert_eq!(
            &format!("{leaf:?}"),
            "TermQuery(Term(field=0, type=IpAddr, ::ffff:127.0.0.1))"
        );
    }

    #[test]
    fn test_term_query_with_ipaddr_compressed_ipv6() {
        let term_query = TermQuery {
            field: "ip".to_string(),
            value: "2001:db8:85a3::8a2e:370:7334".to_string(), //< note the ::. This is a compressed form
        };
        let mut schema_builder = Schema::builder();
        schema_builder.add_ip_addr_field("ip", INDEXED);
        let schema = schema_builder.build();
        let tantivy_query_ast = term_query
            .build_tantivy_ast_call(&BuildTantivyAstContext::for_test(&schema))
            .unwrap();
        let leaf = tantivy_query_ast.as_leaf().unwrap();
        assert_eq!(
            &format!("{leaf:?}"),
            "TermQuery(Term(field=0, type=IpAddr, 2001:db8:85a3::8a2e:370:7334))"
        );
    }

    #[test]
    fn test_term_query_bytes_with_padding() {
        let term_query = TermQuery {
            field: "bytes".to_string(),
            value: "bGlnaHQgdw==".to_string(),
        };
        let mut schema_builder = Schema::builder();
        schema_builder.add_bytes_field("bytes", INDEXED);
        let schema = schema_builder.build();
        let tantivy_query_ast = term_query
            .build_tantivy_ast_call(&BuildTantivyAstContext::for_test(&schema))
            .unwrap();
        let leaf = tantivy_query_ast.as_leaf().unwrap();
        assert_eq!(
            &format!("{leaf:?}"),
            "TermQuery(Term(field=0, type=Bytes, [108, 105, 103, 104, 116, 32, 119]))"
        );
    }

    #[test]
    fn test_term_query_bytes_without_padding() {
        let term_query = TermQuery {
            field: "bytes".to_string(),
            value: "bGlnaHQgdw".to_string(),
        };
        let mut schema_builder = Schema::builder();
        schema_builder.add_bytes_field("bytes", INDEXED);
        let schema = schema_builder.build();
        let tantivy_query_ast = term_query
            .build_tantivy_ast_call(&BuildTantivyAstContext::for_test(&schema))
            .unwrap();
        let leaf = tantivy_query_ast.as_leaf().unwrap();
        assert_eq!(
            &format!("{leaf:?}"),
            "TermQuery(Term(field=0, type=Bytes, [108, 105, 103, 104, 116, 32, 119]))"
        );
    }

    #[test]
    fn test_term_query_with_date_nanosecond() {
        let term_query = TermQuery {
            field: "timestamp".to_string(),
            value: "2025-08-07T14:49:21.831343Z".to_string(),
        };
        let mut schema_builder = Schema::builder();
        schema_builder.add_date_field("timestamp", INDEXED);
        let schema = schema_builder.build();
        let tantivy_query_ast = term_query
            .build_tantivy_ast_call(&BuildTantivyAstContext::for_test(&schema))
            .unwrap();
        let leaf = tantivy_query_ast.as_leaf().unwrap();
        // The date should have been truncated to seconds precision.
        assert_eq!(
            &format!("{leaf:?}"),
            "TermQuery(Term(field=0, type=Date, 2025-08-07T14:49:21Z))"
        );
    }
}


================================================
FILE: quickwit/quickwit-query/src/query_ast/term_set_query.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::{BTreeSet, HashMap, HashSet};

use serde::{Deserialize, Serialize};
use tantivy::Term;

use crate::InvalidQuery;
use crate::query_ast::{
    BoolQuery, BuildTantivyAst, BuildTantivyAstContext, QueryAst, TantivyQueryAst, TermQuery,
};

/// TermSetQuery matches the same document set as if it was a union of
/// the equivalent set of TermQueries.
///
/// The text will be used as is, untokenized.
#[derive(Serialize, Deserialize, Debug, Clone, PartialEq, Eq)]
pub struct TermSetQuery {
    pub terms_per_field: HashMap<String, BTreeSet<String>>,
}

impl TermSetQuery {
    fn has_fast_only_field(&self, context: &BuildTantivyAstContext) -> bool {
        for full_path in self.terms_per_field.keys() {
            if let Some((_, field_entry, _)) =
                super::utils::find_field_or_hit_dynamic(full_path, context.schema)
                && field_entry.is_fast()
                && !field_entry.is_indexed()
            {
                return true;
            }
        }
        false
    }

    fn build_bool_query(
        &self,
        context: &BuildTantivyAstContext,
    ) -> Result<TantivyQueryAst, InvalidQuery> {
        let should_clauses = self
            .terms_per_field
            .iter()
            .flat_map(|(full_path, values)| {
                values.iter().map(|value| {
                    QueryAst::Term(TermQuery {
                        field: full_path.to_string(),
                        value: value.to_string(),
                    })
                })
            })
            .collect();

        let bool_query = BoolQuery {
            should: should_clauses,
            ..Default::default()
        };

        bool_query.build_tantivy_ast_impl(context)
    }

    fn build_term_set_query(
        &self,
        context: &BuildTantivyAstContext,
    ) -> Result<TantivyQueryAst, InvalidQuery> {
        let terms_it = self.make_term_iterator(context)?;
        let term_set_query = tantivy::query::TermSetQuery::new(terms_it);
        Ok(term_set_query.into())
    }

    fn make_term_iterator(
        &self,
        context: &BuildTantivyAstContext,
    ) -> Result<HashSet<Term>, InvalidQuery> {
        let mut terms: HashSet<Term> = HashSet::default();

        for (full_path, values) in &self.terms_per_field {
            for value in values {
                // Mapping a text (field, value) is non-trivial:
                // It depends on the schema of course, and can actually result in a disjunction of
                // multiple terms if the query targets a dynamic field (due to the
                // different types).
                //
                // Here, we ensure the logic is the same as for a TermQuery, by creating the term
                // query and extracting the terms from the resulting `TermQuery`.
                let term_query = TermQuery {
                    field: full_path.to_string(),
                    value: value.to_string(),
                };
                let ast = term_query.build_tantivy_ast_call(context)?;
                let tantivy_query: Box<dyn crate::TantivyQuery> = ast.simplify().into();
                tantivy_query.query_terms(&mut |term, _| {
                    terms.insert(term.clone());
                });
            }
        }
        Ok(terms)
    }
}

impl BuildTantivyAst for TermSetQuery {
    fn build_tantivy_ast_impl(
        &self,
        context: &BuildTantivyAstContext,
    ) -> Result<TantivyQueryAst, InvalidQuery> {
        if self.has_fast_only_field(context) {
            self.build_bool_query(context)
        } else {
            self.build_term_set_query(context)
        }
    }
}

impl From<TermSetQuery> for QueryAst {
    fn from(term_set_query: TermSetQuery) -> Self {
        QueryAst::TermSet(term_set_query)
    }
}

#[cfg(test)]
mod tests {
    use std::collections::{BTreeSet, HashMap};

    use tantivy::schema::{FAST, INDEXED, Schema};

    use super::TermSetQuery;
    use crate::query_ast::{BuildTantivyAst, BuildTantivyAstContext};

    #[test]
    fn test_term_set_query_with_fast_only_field_returns_bool_query() {
        let mut schema_builder = Schema::builder();
        schema_builder.add_u64_field("fast_field", FAST);
        let schema = schema_builder.build();

        let terms_per_field = HashMap::from([(
            "fast_field".to_string(),
            BTreeSet::from(["1".to_string(), "2".to_string()]),
        )]);
        let term_set_query = TermSetQuery { terms_per_field };

        let tantivy_query_ast = term_set_query
            .build_tantivy_ast_call(&BuildTantivyAstContext::for_test(&schema))
            .unwrap();

        let bool_query = tantivy_query_ast
            .as_bool_query()
            .expect("Expected BoolQuery for fast-only field, but got a different query type");
        assert_eq!(bool_query.should.len(), 2);
        assert_eq!(bool_query.must.len(), 0);
        assert_eq!(bool_query.must_not.len(), 0);
        assert_eq!(bool_query.filter.len(), 0);
    }

    #[test]
    fn test_term_set_query_with_indexed_field_uses_term_set() {
        let mut schema_builder = Schema::builder();
        schema_builder.add_u64_field("indexed_field", FAST | INDEXED);
        let schema = schema_builder.build();

        let terms_per_field = HashMap::from([(
            "indexed_field".to_string(),
            BTreeSet::from(["1".to_string(), "2".to_string()]),
        )]);
        let term_set_query = TermSetQuery { terms_per_field };

        let tantivy_query_ast = term_set_query
            .build_tantivy_ast_call(&BuildTantivyAstContext::for_test(&schema))
            .unwrap();

        // Should return a leaf query (TermSetQuery wrapped in TantivyQueryAst)
        let leaf = tantivy_query_ast
            .as_leaf()
            .expect("Expected a leaf query (TermSetQuery), but got a complex query");

        // Verify it's a TermSetQuery by checking the debug representation
        let debug_str = format!("{leaf:?}");
        assert!(
            debug_str.contains("TermSetQuery"),
            "Expected TermSetQuery, got: {debug_str}"
        );
    }
}


================================================
FILE: quickwit/quickwit-query/src/query_ast/user_input_query.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::{BTreeSet, HashMap};
use std::ops::Bound;

use anyhow::bail;
use serde::{Deserialize, Serialize};
use tantivy::query_grammar::{
    Delimiter, Occur, UserInputAst, UserInputBound, UserInputLeaf, UserInputLiteral,
};

use crate::not_nan_f32::NotNaNf32;
use crate::query_ast::{
    self, BuildTantivyAst, BuildTantivyAstContext, FieldPresenceQuery, FullTextMode,
    FullTextParams, QueryAst, TantivyQueryAst,
};
use crate::{BooleanOperand, InvalidQuery, JsonLiteral};

const DEFAULT_PHRASE_QUERY_MAX_EXPANSION: u32 = 50;

/// A query expressed in the tantivy query grammar DSL.
#[derive(Serialize, Deserialize, Debug, Clone, PartialEq, Eq)]
pub struct UserInputQuery {
    pub user_text: String,
    // Set of search fields to search into for text not specifically
    // targeting a field.
    //
    // If None, the default search fields, as defined in the DocMapper
    // will be used.
    #[serde(default, skip_serializing_if = "Option::is_none")]
    pub default_fields: Option<Vec<String>>,
    pub default_operator: BooleanOperand,
    /// Support missing fields
    pub lenient: bool,
}

impl UserInputQuery {
    /// Parse the user query to generate a structured QueryAST, without any UserInputQuery node.
    ///
    /// The `UserInputQuery` have an optional search_fields property that takes precedence over
    /// the `default_search_fields`.
    ///
    /// In quickwit, the search fields in the `UserInputQuery` are usually supplied with the user
    /// request.
    /// The default_search_fields argument on the other hand, is the default search fields defined
    /// in the `DocMapper`.
    pub fn parse_user_query(&self, default_search_fields: &[String]) -> anyhow::Result<QueryAst> {
        let search_fields = self
            .default_fields
            .as_ref()
            .map(|search_fields| &search_fields[..])
            .unwrap_or(default_search_fields);
        let user_input_ast = tantivy::query_grammar::parse_query(&self.user_text)
            .map_err(|_| anyhow::anyhow!("failed to parse query: `{}`", &self.user_text))?;
        let default_occur = match self.default_operator {
            BooleanOperand::And => Occur::Must,
            BooleanOperand::Or => Occur::Should,
        };
        convert_user_input_ast_to_query_ast(
            user_input_ast,
            default_occur,
            search_fields,
            self.lenient,
        )
    }
}

impl From<UserInputQuery> for QueryAst {
    fn from(user_text_query: UserInputQuery) -> Self {
        QueryAst::UserInput(user_text_query)
    }
}

impl BuildTantivyAst for UserInputQuery {
    fn build_tantivy_ast_impl(
        &self,
        _context: &BuildTantivyAstContext,
    ) -> Result<TantivyQueryAst, crate::InvalidQuery> {
        Err(InvalidQuery::UserQueryNotParsed)
    }
}

/// Convert the AST of a text query to a QueryAst, filling in default field and default occur when
/// they were not present.
fn convert_user_input_ast_to_query_ast(
    user_input_ast: UserInputAst,
    default_occur: Occur,
    default_search_fields: &[String],
    lenient: bool,
) -> anyhow::Result<QueryAst> {
    match user_input_ast {
        UserInputAst::Clause(clause) => {
            let mut bool_query = query_ast::BoolQuery::default();
            for (occur_opt, sub_ast) in clause {
                let sub_ast = convert_user_input_ast_to_query_ast(
                    sub_ast,
                    default_occur,
                    default_search_fields,
                    lenient,
                )?;
                let children_ast_for_occur: &mut Vec<QueryAst> =
                    match occur_opt.unwrap_or(default_occur) {
                        Occur::Should => &mut bool_query.should,
                        Occur::Must => &mut bool_query.must,
                        Occur::MustNot => &mut bool_query.must_not,
                    };
                children_ast_for_occur.push(sub_ast);
            }
            Ok(bool_query.into())
        }
        UserInputAst::Leaf(leaf) => match *leaf {
            UserInputLeaf::Literal(literal) => {
                convert_user_input_literal(literal, default_search_fields, lenient)
            }
            UserInputLeaf::All => Ok(QueryAst::MatchAll),
            UserInputLeaf::Range {
                field,
                lower,
                upper,
            } => {
                let field = if let Some(field) = field {
                    field
                } else if default_search_fields.len() == 1 {
                    default_search_fields[0].clone()
                } else if default_search_fields.is_empty() {
                    bail!("range query without field is not supported");
                } else {
                    bail!("range query with multiple fields is not supported");
                };
                let convert_bound = |user_input_bound: UserInputBound| match user_input_bound {
                    UserInputBound::Inclusive(user_text) => {
                        Bound::Included(JsonLiteral::String(user_text))
                    }
                    UserInputBound::Exclusive(user_text) => {
                        Bound::Excluded(JsonLiteral::String(user_text))
                    }
                    UserInputBound::Unbounded => Bound::Unbounded,
                };
                let range_query = query_ast::RangeQuery {
                    field,
                    lower_bound: convert_bound(lower),
                    upper_bound: convert_bound(upper),
                };
                Ok(range_query.into())
            }
            UserInputLeaf::Set { field, elements } => {
                let field_names: Vec<String> = if let Some(field) = field.as_ref() {
                    vec![field.to_string()]
                } else {
                    default_search_fields.to_vec()
                };
                if field_names.is_empty() {
                    anyhow::bail!("set query need to target a specific field");
                }
                let mut terms_per_field: HashMap<String, BTreeSet<String>> = Default::default();
                let terms: BTreeSet<String> = elements.into_iter().collect();
                for field in field_names {
                    terms_per_field.insert(field.to_string(), terms.clone());
                }
                let term_set_query = query_ast::TermSetQuery { terms_per_field };
                Ok(term_set_query.into())
            }
            UserInputLeaf::Exists { field } => Ok(FieldPresenceQuery { field }.into()),
            UserInputLeaf::Regex { field, pattern } => {
                let field = if let Some(field) = field {
                    field
                } else if default_search_fields.len() == 1 {
                    default_search_fields[0].clone()
                } else if default_search_fields.is_empty() {
                    bail!("regex query without field is not supported");
                } else {
                    bail!("regex query with multiple fields is not supported");
                };
                let regex_query = query_ast::RegexQuery {
                    field,
                    regex: pattern,
                };
                Ok(regex_query.into())
            }
        },
        UserInputAst::Boost(underlying, boost) => {
            let query_ast = convert_user_input_ast_to_query_ast(
                *underlying,
                default_occur,
                default_search_fields,
                lenient,
            )?;
            let boost: NotNaNf32 = (boost.into_inner() as f32)
                .try_into()
                .map_err(|err_msg: &str| anyhow::anyhow!(err_msg))?;
            Ok(QueryAst::Boost {
                underlying: Box::new(query_ast),
                boost,
            })
        }
    }
}

fn is_wildcard(phrase: &str) -> bool {
    use std::ops::ControlFlow;
    enum State {
        Normal,
        Escaped,
    }

    phrase
        .chars()
        .try_fold(State::Normal, |state, c| match state {
            State::Escaped => ControlFlow::Continue(State::Normal),
            State::Normal => {
                if c == '*' || c == '?' {
                    // we are in a wildcard query
                    ControlFlow::Break(())
                } else if c == '\\' {
                    ControlFlow::Continue(State::Escaped)
                } else {
                    ControlFlow::Continue(State::Normal)
                }
            }
        })
        .is_break()
}

/// Convert a leaf of a text query AST to a QueryAst.
/// This may generate more than a single leaf if there are multiple default fields.
fn convert_user_input_literal(
    user_input_literal: UserInputLiteral,
    default_search_fields: &[String],
    lenient: bool,
) -> anyhow::Result<QueryAst> {
    let UserInputLiteral {
        field_name,
        phrase,
        prefix,
        delimiter,
        slop,
    } = user_input_literal;
    let field_names: Vec<String> = if let Some(field_name) = field_name {
        vec![field_name]
    } else {
        default_search_fields
            .iter()
            .map(|field_name| field_name.to_string())
            .collect()
    };
    if field_names.is_empty() {
        anyhow::bail!("query requires a default search field and none was supplied");
    }
    let mode = match delimiter {
        Delimiter::None => FullTextMode::PhraseFallbackToIntersection,
        Delimiter::SingleQuotes => FullTextMode::Bool {
            operator: BooleanOperand::And,
        },
        Delimiter::DoubleQuotes => FullTextMode::Phrase { slop },
    };
    let full_text_params = FullTextParams {
        tokenizer: None,
        mode,
        zero_terms_query: crate::MatchAllOrNone::MatchNone,
    };
    let wildcard = delimiter == Delimiter::None && is_wildcard(&phrase);
    let mut phrase_queries: Vec<QueryAst> = field_names
        .into_iter()
        .map(|field_name| {
            if prefix {
                query_ast::PhrasePrefixQuery {
                    field: field_name,
                    phrase: phrase.clone(),
                    params: full_text_params.clone(),
                    max_expansions: DEFAULT_PHRASE_QUERY_MAX_EXPANSION,
                    lenient,
                }
                .into()
            } else if wildcard {
                query_ast::WildcardQuery {
                    field: field_name,
                    value: phrase.clone(),
                    lenient,
                    case_insensitive: false,
                }
                .into()
            } else {
                query_ast::FullTextQuery {
                    field: field_name,
                    text: phrase.clone(),
                    params: full_text_params.clone(),
                    lenient,
                }
                .into()
            }
        })
        .collect();
    if phrase_queries.is_empty() {
        Ok(QueryAst::MatchNone)
    } else if phrase_queries.len() == 1 {
        Ok(phrase_queries.pop().unwrap())
    } else {
        Ok(query_ast::BoolQuery {
            should: phrase_queries,
            ..Default::default()
        }
        .into())
    }
}

#[cfg(test)]
mod tests {
    use crate::query_ast::{
        BoolQuery, BuildTantivyAst, BuildTantivyAstContext, FullTextMode, FullTextQuery, QueryAst,
        UserInputQuery,
    };
    use crate::{BooleanOperand, InvalidQuery};

    #[test]
    fn test_user_input_query_not_parsed_error() {
        let user_input_query = UserInputQuery {
            user_text: "hello".to_string(),
            default_fields: None,
            default_operator: BooleanOperand::And,
            lenient: false,
        };
        let schema = tantivy::schema::Schema::builder().build();
        {
            let invalid_query = user_input_query
                .build_tantivy_ast_call(&BuildTantivyAstContext::for_test(&schema))
                .unwrap_err();
            assert!(matches!(invalid_query, InvalidQuery::UserQueryNotParsed));
        }
        {
            let invalid_query = user_input_query
                .build_tantivy_ast_call(&BuildTantivyAstContext::for_test(&schema))
                .unwrap_err();
            assert!(matches!(invalid_query, InvalidQuery::UserQueryNotParsed));
        }
    }

    #[test]
    fn test_user_input_query_missing_fields() {
        {
            let invalid_err = UserInputQuery {
                user_text: "hello".to_string(),
                default_fields: None,
                default_operator: BooleanOperand::And,
                lenient: false,
            }
            .parse_user_query(&[])
            .unwrap_err();
            assert_eq!(
                &invalid_err.to_string(),
                "query requires a default search field and none was supplied"
            );
        }
        {
            let invalid_err = UserInputQuery {
                user_text: "hello".to_string(),
                default_fields: Some(Vec::new()),
                default_operator: BooleanOperand::And,
                lenient: false,
            }
            .parse_user_query(&[])
            .unwrap_err();
            assert_eq!(
                &invalid_err.to_string(),
                "query requires a default search field and none was supplied"
            );
        }
    }

    #[test]
    fn test_user_input_query_predefined_default_fields() {
        let ast = UserInputQuery {
            user_text: "hello".to_string(),
            default_fields: None,
            default_operator: BooleanOperand::And,
            lenient: false,
        }
        .parse_user_query(&["defaultfield".to_string()])
        .unwrap();
        let QueryAst::FullText(phrase_query) = ast else {
            panic!()
        };
        assert_eq!(&phrase_query.field, "defaultfield");
        assert_eq!(&phrase_query.text, "hello");
        assert_eq!(
            phrase_query.params.mode,
            FullTextMode::PhraseFallbackToIntersection
        );
    }

    #[test]
    fn test_user_input_query_phrase_with_prefix() {
        let ast = UserInputQuery {
            user_text: "field:\"hello\"*".to_string(),
            default_fields: None,
            default_operator: BooleanOperand::And,
            lenient: false,
        }
        .parse_user_query(&[])
        .unwrap();
        let QueryAst::PhrasePrefix(phrase_prefix_query) = ast else {
            panic!()
        };
        assert_eq!(&phrase_prefix_query.field, "field");
        assert_eq!(&phrase_prefix_query.phrase, "hello");
        assert_eq!(phrase_prefix_query.max_expansions, 50);
        assert_eq!(
            phrase_prefix_query.params.mode,
            FullTextMode::Phrase { slop: 0 }
        );
    }

    #[test]
    fn test_user_input_query_override_default_fields() {
        let ast = UserInputQuery {
            user_text: "hello".to_string(),
            default_fields: Some(vec!["defaultfield".to_string()]),
            default_operator: BooleanOperand::And,
            lenient: false,
        }
        .parse_user_query(&["defaultfieldweshouldignore".to_string()])
        .unwrap();
        let QueryAst::FullText(phrase_query) = ast else {
            panic!()
        };
        assert_eq!(&phrase_query.field, "defaultfield");
        assert_eq!(&phrase_query.text, "hello");
        assert_eq!(
            phrase_query.params.mode,
            FullTextMode::PhraseFallbackToIntersection
        );
    }

    #[test]
    fn test_user_input_query_several_default_fields() {
        let ast = UserInputQuery {
            user_text: "hello".to_string(),
            default_fields: Some(vec!["fielda".to_string(), "fieldb".to_string()]),
            default_operator: BooleanOperand::And,
            lenient: false,
        }
        .parse_user_query(&["defaultfieldweshouldignore".to_string()])
        .unwrap();
        let QueryAst::Bool(BoolQuery { should, .. }) = ast else {
            panic!()
        };
        assert_eq!(should.len(), 2);
    }

    #[test]
    fn test_user_input_query_field_specified_in_user_input() {
        let ast = UserInputQuery {
            user_text: "myfield:hello".to_string(),
            default_fields: Some(vec!["fieldtoignore".to_string()]),
            default_operator: BooleanOperand::And,
            lenient: false,
        }
        .parse_user_query(&["fieldtoignore".to_string()])
        .unwrap();
        let QueryAst::FullText(full_text_query) = ast else {
            panic!()
        };
        assert_eq!(&full_text_query.field, "myfield");
        assert_eq!(&full_text_query.text, "hello");
        assert_eq!(
            full_text_query.params.mode,
            FullTextMode::PhraseFallbackToIntersection
        );
    }

    #[test]
    fn test_user_input_query_different_delimiter() {
        let parse_user_query_delimiter_util = |query: &str| {
            let ast = UserInputQuery {
                user_text: query.to_string(),
                default_fields: None,
                default_operator: BooleanOperand::Or,
                lenient: false,
            }
            .parse_user_query(&[])
            .unwrap();
            let QueryAst::FullText(full_text_query) = ast else {
                panic!()
            };
            full_text_query
        };
        {
            let double_quote_query: FullTextQuery =
                parse_user_query_delimiter_util("jobtitle:\"editor-in-chief\"");
            assert_eq!(&double_quote_query.field, "jobtitle");
            assert_eq!(&double_quote_query.text, "editor-in-chief");
            assert_eq!(
                double_quote_query.params.mode,
                FullTextMode::Phrase { slop: 0 }
            );
        }
        {
            let double_quote_query: FullTextQuery =
                parse_user_query_delimiter_util("jobtitle:\"editor-in-chief\"~2");
            assert_eq!(&double_quote_query.field, "jobtitle");
            assert_eq!(&double_quote_query.text, "editor-in-chief");
            assert_eq!(
                double_quote_query.params.mode,
                FullTextMode::Phrase { slop: 2 }
            );
        }
        {
            let double_quote_query: FullTextQuery =
                parse_user_query_delimiter_util("jobtitle:'editor-in-chief'");
            assert_eq!(&double_quote_query.field, "jobtitle");
            assert_eq!(&double_quote_query.text, "editor-in-chief");
            assert_eq!(
                double_quote_query.params.mode,
                FullTextMode::Bool {
                    operator: BooleanOperand::And
                }
            );
        }
        {
            let double_quote_query: FullTextQuery =
                parse_user_query_delimiter_util("jobtitle:editor-in-chief");
            assert_eq!(&double_quote_query.field, "jobtitle");
            assert_eq!(&double_quote_query.text, "editor-in-chief");
            assert_eq!(
                double_quote_query.params.mode,
                FullTextMode::PhraseFallbackToIntersection
            );
        }
    }

    #[test]
    fn test_user_input_query_regex() {
        let ast = UserInputQuery {
            user_text: "field: /.*/".to_string(),
            default_fields: None,
            default_operator: BooleanOperand::And,
            lenient: false,
        }
        .parse_user_query(&[])
        .unwrap();
        let QueryAst::Regex(regex_query) = ast else {
            panic!()
        };
        assert_eq!(&regex_query.field, "field");
        assert_eq!(&regex_query.regex, ".*");
    }
}


================================================
FILE: quickwit/quickwit-query/src/query_ast/utils.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use tantivy::Term;
use tantivy::json_utils::convert_to_fast_value_and_append_to_json_term;
use tantivy::query::TermQuery as TantivyTermQuery;
use tantivy::schema::{
    Field, FieldEntry, FieldType, IndexRecordOption, JsonObjectOptions, Schema as TantivySchema,
    TextFieldIndexing, Type,
};

use crate::InvalidQuery;
use crate::MatchAllOrNone::MatchNone as TantivyEmptyQuery;
use crate::json_literal::InterpretUserInput;
use crate::query_ast::full_text_query::FullTextParams;
use crate::query_ast::tantivy_query_ast::{TantivyBoolQuery, TantivyQueryAst};
use crate::tokenizers::{RAW_TOKENIZER_NAME, TokenizerManager};

pub(crate) const DYNAMIC_FIELD_NAME: &str = "_dynamic";

fn make_term_query(term: Term) -> TantivyQueryAst {
    TantivyTermQuery::new(term, IndexRecordOption::WithFreqs).into()
}

/// Find the field or fallback to the dynamic field if it exists
pub fn find_field_or_hit_dynamic<'a>(
    full_path: &'a str,
    schema: &'a TantivySchema,
) -> Option<(Field, &'a FieldEntry, &'a str)> {
    let (field, path) = if let Some((field, path)) = schema.find_field(full_path) {
        (field, path)
    } else {
        let dynamic_field = schema.get_field(DYNAMIC_FIELD_NAME).ok()?;
        (dynamic_field, full_path)
    };
    let field_entry = schema.get_field_entry(field);
    let typ = field_entry.field_type().value_type();
    if !path.is_empty() && typ != Type::Json {
        return None;
    }
    Some((field, field_entry, path))
}

/// Find all the fields that are below the given path.
///
/// This will return a list of fields only when the path is that of a composite
/// type in the doc mapping.
pub fn find_subfields<'a>(
    path: &'a str,
    schema: &'a TantivySchema,
) -> Vec<(Field, &'a FieldEntry)> {
    let prefix = format!("{path}.");
    schema
        .fields()
        .filter(|(_, field_entry)| field_entry.name().starts_with(&prefix))
        .collect()
}

/// Creates a full text query.
///
/// If tokenize is set to true, the text will be tokenized.
pub(crate) fn full_text_query(
    full_path: &str,
    text_query: &str,
    full_text_params: &FullTextParams,
    schema: &TantivySchema,
    tokenizer_manager: &TokenizerManager,
    lenient: bool,
) -> Result<TantivyQueryAst, InvalidQuery> {
    let Some((field, field_entry, path)) = find_field_or_hit_dynamic(full_path, schema) else {
        if lenient {
            return Ok(TantivyEmptyQuery.into());
        } else {
            return Err(InvalidQuery::FieldDoesNotExist {
                full_path: full_path.to_string(),
            });
        }
    };
    compute_query_with_field(
        field,
        field_entry,
        path,
        text_query,
        full_text_params,
        tokenizer_manager,
    )
}

fn parse_value_from_user_text<'a, T: InterpretUserInput<'a>>(
    text: &'a str,
    field_name: &str,
) -> Result<T, InvalidQuery> {
    if let Some(parsed_value) = T::interpret_str(text) {
        return Ok(parsed_value);
    }
    Err(InvalidQuery::InvalidSearchTerm {
        expected_value_type: T::name(),
        field_name: field_name.to_string(),
        value: text.to_string(),
    })
}

fn compute_query_with_field(
    field: Field,
    field_entry: &FieldEntry,
    json_path: &str,
    value: &str,
    full_text_params: &FullTextParams,
    tokenizer_manager: &TokenizerManager,
) -> Result<TantivyQueryAst, InvalidQuery> {
    let field_type = field_entry.field_type();
    match field_type {
        FieldType::U64(_) => {
            let val = parse_value_from_user_text::<u64>(value, field_entry.name())?;
            let term = Term::from_field_u64(field, val);
            Ok(make_term_query(term))
        }
        FieldType::I64(_) => {
            let val = parse_value_from_user_text::<i64>(value, field_entry.name())?;
            let term = Term::from_field_i64(field, val);
            Ok(make_term_query(term))
        }
        FieldType::F64(_) => {
            let val = parse_value_from_user_text::<f64>(value, field_entry.name())?;
            let term = Term::from_field_f64(field, val);
            Ok(make_term_query(term))
        }
        FieldType::Bool(_) => {
            let bool_val = parse_value_from_user_text(value, field_entry.name())?;
            let term = Term::from_field_bool(field, bool_val);
            Ok(make_term_query(term))
        }
        FieldType::Date(date_options) => {
            let dt = parse_value_from_user_text(value, field_entry.name())?;
            let term = if date_options.is_indexed() {
                Term::from_field_date_for_search(field, dt)
            } else {
                Term::from_field_date(field, dt.truncate(date_options.get_precision()))
            };
            Ok(make_term_query(term))
        }
        FieldType::Str(text_options) => {
            let columnar_opt = TextFieldIndexing::default()
                .set_fieldnorms(false)
                .set_tokenizer(RAW_TOKENIZER_NAME);
            let text_field_indexing = text_options
                .get_indexing_options()
                .or_else(|| text_options.is_fast().then_some(&columnar_opt))
                .ok_or_else(|| {
                    InvalidQuery::SchemaError(format!(
                        "field {} is not full-text searchable",
                        field_entry.name()
                    ))
                })?;
            let terms = full_text_params.tokenize_text_into_terms(
                field,
                value,
                text_field_indexing,
                tokenizer_manager,
            )?;
            full_text_params.make_query(terms, text_field_indexing.index_option())
        }
        FieldType::IpAddr(_) => {
            let ip_v6 = parse_value_from_user_text(value, field_entry.name())?;
            let term = Term::from_field_ip_addr(field, ip_v6);
            Ok(make_term_query(term))
        }
        FieldType::JsonObject(json_options) => compute_tantivy_ast_query_for_json(
            field,
            json_path,
            value,
            full_text_params,
            json_options,
            tokenizer_manager,
        ),
        FieldType::Facet(_) => Err(InvalidQuery::SchemaError(
            "facets are not supported in Quickwit".to_string(),
        )),
        FieldType::Bytes(_) => {
            let buffer: Vec<u8> = parse_value_from_user_text(value, field_entry.name())?;
            let term = Term::from_field_bytes(field, &buffer[..]);
            Ok(make_term_query(term))
        }
    }
}

fn compute_tantivy_ast_query_for_json(
    field: Field,
    json_path: &str,
    text: &str,
    full_text_params: &FullTextParams,
    json_options: &JsonObjectOptions,
    tokenizer_manager: &TokenizerManager,
) -> Result<TantivyQueryAst, InvalidQuery> {
    let mut bool_query = TantivyBoolQuery::default();
    let term = Term::from_field_json_path(field, json_path, json_options.is_expand_dots_enabled());
    if let Some(term) = convert_to_fast_value_and_append_to_json_term(&term, text, true) {
        bool_query
            .should
            .push(TantivyTermQuery::new(term, IndexRecordOption::Basic).into());
    }
    let position_terms: Vec<(usize, Term)> = full_text_params.tokenize_text_into_terms_json(
        field,
        json_path,
        text,
        json_options,
        tokenizer_manager,
    )?;
    let index_record_option = json_options
        .get_text_indexing_options()
        .map(|text_indexing_options| text_indexing_options.index_option())
        .unwrap_or(IndexRecordOption::Basic);
    bool_query
        .should
        .push(full_text_params.make_query(position_terms, index_record_option)?);
    Ok(bool_query.into())
}


================================================
FILE: quickwit/quickwit-query/src/query_ast/visitor.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use crate::not_nan_f32::NotNaNf32;
use crate::query_ast::cache_node::CacheState;
use crate::query_ast::field_presence::FieldPresenceQuery;
use crate::query_ast::user_input_query::UserInputQuery;
use crate::query_ast::{
    BoolQuery, CacheNode, FullTextQuery, PhrasePrefixQuery, QueryAst, RangeQuery, RegexQuery,
    TermQuery, TermSetQuery, WildcardQuery,
};

/// Simple trait to implement a Visitor over the QueryAst.
pub trait QueryAstVisitor<'a> {
    type Err;

    fn visit(&mut self, query_ast: &'a QueryAst) -> Result<(), Self::Err> {
        match query_ast {
            QueryAst::Bool(bool_query) => self.visit_bool(bool_query),
            QueryAst::Term(term_query) => self.visit_term(term_query),
            QueryAst::TermSet(term_set_query) => self.visit_term_set(term_set_query),
            QueryAst::FullText(full_text_query) => self.visit_full_text(full_text_query),
            QueryAst::PhrasePrefix(phrase_prefix_query) => {
                self.visit_phrase_prefix(phrase_prefix_query)
            }
            QueryAst::Range(range_query) => self.visit_range(range_query),
            QueryAst::MatchAll => self.visit_match_all(),
            QueryAst::MatchNone => self.visit_match_none(),
            QueryAst::Boost { underlying, boost } => self.visit_boost(underlying, *boost),
            QueryAst::UserInput(user_text_query) => self.visit_user_text(user_text_query),
            QueryAst::FieldPresence(exists) => self.visit_exists(exists),
            QueryAst::Wildcard(wildcard) => self.visit_wildcard(wildcard),
            QueryAst::Regex(regex) => self.visit_regex(regex),
            QueryAst::Cache(cache_node) => self.visit_cache_node(cache_node),
        }
    }

    fn visit_bool(&mut self, bool_query: &'a BoolQuery) -> Result<(), Self::Err> {
        for ast in bool_query
            .must
            .iter()
            .chain(bool_query.should.iter())
            .chain(bool_query.must_not.iter())
            .chain(bool_query.filter.iter())
        {
            self.visit(ast)?;
        }
        Ok(())
    }

    fn visit_term(&mut self, _term_query: &'a TermQuery) -> Result<(), Self::Err> {
        Ok(())
    }

    fn visit_term_set(&mut self, _term_query: &'a TermSetQuery) -> Result<(), Self::Err> {
        Ok(())
    }

    fn visit_full_text(&mut self, _full_text: &'a FullTextQuery) -> Result<(), Self::Err> {
        Ok(())
    }

    fn visit_phrase_prefix(
        &mut self,
        _phrase_query: &'a PhrasePrefixQuery,
    ) -> Result<(), Self::Err> {
        Ok(())
    }

    fn visit_match_all(&mut self) -> Result<(), Self::Err> {
        Ok(())
    }

    fn visit_match_none(&mut self) -> Result<(), Self::Err> {
        Ok(())
    }

    fn visit_boost(
        &mut self,
        underlying: &'a QueryAst,
        _boost: NotNaNf32,
    ) -> Result<(), Self::Err> {
        self.visit(underlying)
    }

    fn visit_range(&mut self, _range_query: &'a RangeQuery) -> Result<(), Self::Err> {
        Ok(())
    }

    fn visit_user_text(&mut self, _user_text_query: &'a UserInputQuery) -> Result<(), Self::Err> {
        Ok(())
    }

    fn visit_exists(&mut self, _exists_query: &'a FieldPresenceQuery) -> Result<(), Self::Err> {
        Ok(())
    }

    fn visit_wildcard(&mut self, _wildcard_query: &'a WildcardQuery) -> Result<(), Self::Err> {
        Ok(())
    }

    fn visit_regex(&mut self, _regex_query: &'a RegexQuery) -> Result<(), Self::Err> {
        Ok(())
    }

    fn visit_cache_node(&mut self, cache_node: &'a CacheNode) -> Result<(), Self::Err> {
        // this goes a bit again how the rest of the default Visitor behave. The rational is that in
        // practice, on a cache hit, we don't want to do anything with that node.
        // On unitialized cache, any kind of data extract could make sense (extracing tags or
        // timestamp bounds) On cache miss, we still want to know what we need for warmup.
        // But on cache hit, it's too late to do optimisation based on tags and timestamps, and we
        // don't want to warmup anything.
        if !matches!(cache_node.state, CacheState::CacheHit(_)) {
            self.visit(&cache_node.inner)?
        }
        Ok(())
    }
}

/// Simple trait to implement a Visitor over the QueryAst.
pub trait QueryAstTransformer {
    type Err;

    fn transform(&mut self, query_ast: QueryAst) -> Result<Option<QueryAst>, Self::Err> {
        match query_ast {
            QueryAst::Bool(bool_query) => self.transform_bool(bool_query),
            QueryAst::Term(term_query) => self.transform_term(term_query),
            QueryAst::TermSet(term_set_query) => self.transform_term_set(term_set_query),
            QueryAst::FullText(full_text_query) => self.transform_full_text(full_text_query),
            QueryAst::PhrasePrefix(phrase_prefix_query) => {
                self.transform_phrase_prefix(phrase_prefix_query)
            }
            QueryAst::Range(range_query) => self.transform_range(range_query),
            QueryAst::MatchAll => self.transform_match_all(),
            QueryAst::MatchNone => self.transform_match_none(),
            QueryAst::Boost { underlying, boost } => self.transform_boost(*underlying, boost),
            QueryAst::UserInput(user_text_query) => self.transform_user_text(user_text_query),
            QueryAst::FieldPresence(exists) => self.transform_exists(exists),
            QueryAst::Wildcard(wildcard) => self.transform_wildcard(wildcard),
            QueryAst::Regex(regex) => self.transform_regex(regex),
            QueryAst::Cache(cache_node) => self.transform_cache_node(cache_node),
        }
    }

    fn transform_bool(&mut self, mut bool_query: BoolQuery) -> Result<Option<QueryAst>, Self::Err> {
        bool_query.must = bool_query
            .must
            .into_iter()
            .filter_map(|query_ast| self.transform(query_ast).transpose())
            .collect::<Result<Vec<_>, _>>()?;
        bool_query.should = bool_query
            .should
            .into_iter()
            .filter_map(|query_ast| self.transform(query_ast).transpose())
            .collect::<Result<Vec<_>, _>>()?;
        bool_query.must_not = bool_query
            .must_not
            .into_iter()
            .filter_map(|query_ast| self.transform(query_ast).transpose())
            .collect::<Result<Vec<_>, _>>()?;
        bool_query.filter = bool_query
            .filter
            .into_iter()
            .filter_map(|query_ast| self.transform(query_ast).transpose())
            .collect::<Result<Vec<_>, _>>()?;

        Ok(Some(QueryAst::Bool(bool_query)))
    }

    fn transform_term(&mut self, term_query: TermQuery) -> Result<Option<QueryAst>, Self::Err> {
        Ok(Some(QueryAst::Term(term_query)))
    }

    fn transform_term_set(
        &mut self,
        term_set: TermSetQuery,
    ) -> Result<Option<QueryAst>, Self::Err> {
        Ok(Some(QueryAst::TermSet(term_set)))
    }

    fn transform_full_text(
        &mut self,
        full_text: FullTextQuery,
    ) -> Result<Option<QueryAst>, Self::Err> {
        Ok(Some(QueryAst::FullText(full_text)))
    }

    fn transform_phrase_prefix(
        &mut self,
        phrase_query: PhrasePrefixQuery,
    ) -> Result<Option<QueryAst>, Self::Err> {
        Ok(Some(QueryAst::PhrasePrefix(phrase_query)))
    }

    fn transform_match_all(&mut self) -> Result<Option<QueryAst>, Self::Err> {
        Ok(Some(QueryAst::MatchAll))
    }

    fn transform_match_none(&mut self) -> Result<Option<QueryAst>, Self::Err> {
        Ok(Some(QueryAst::MatchNone))
    }

    fn transform_boost(
        &mut self,
        underlying: QueryAst,
        boost: NotNaNf32,
    ) -> Result<Option<QueryAst>, Self::Err> {
        self.transform(underlying).map(|maybe_ast| {
            maybe_ast.map(|underlying| QueryAst::Boost {
                underlying: Box::new(underlying),
                boost,
            })
        })
    }

    fn transform_range(&mut self, range_query: RangeQuery) -> Result<Option<QueryAst>, Self::Err> {
        Ok(Some(QueryAst::Range(range_query)))
    }

    fn transform_user_text(
        &mut self,
        user_text_query: UserInputQuery,
    ) -> Result<Option<QueryAst>, Self::Err> {
        Ok(Some(QueryAst::UserInput(user_text_query)))
    }

    fn transform_exists(
        &mut self,
        exists_query: FieldPresenceQuery,
    ) -> Result<Option<QueryAst>, Self::Err> {
        Ok(Some(QueryAst::FieldPresence(exists_query)))
    }

    fn transform_wildcard(
        &mut self,
        wildcard_query: WildcardQuery,
    ) -> Result<Option<QueryAst>, Self::Err> {
        Ok(Some(QueryAst::Wildcard(wildcard_query)))
    }

    fn transform_regex(&mut self, regex_query: RegexQuery) -> Result<Option<QueryAst>, Self::Err> {
        Ok(Some(QueryAst::Regex(regex_query)))
    }

    fn transform_cache_node(
        &mut self,
        cache_node: CacheNode,
    ) -> Result<Option<QueryAst>, Self::Err> {
        if matches!(cache_node.state, CacheState::CacheHit(_)) {
            return Ok(Some(cache_node.into()));
        }
        self.transform(*cache_node.inner).map(|maybe_ast| {
            maybe_ast.map(|inner| {
                QueryAst::Cache(CacheNode {
                    inner: Box::new(inner),
                    state: Default::default(),
                })
            })
        })
    }
}


================================================
FILE: quickwit/quickwit-query/src/query_ast/wildcard_query.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::borrow::Cow;
use std::sync::Arc;

use anyhow::{Context, bail};
use serde::{Deserialize, Serialize};
use tantivy::Term;
use tantivy::schema::{Field, FieldType, Schema as TantivySchema};

use super::{BuildTantivyAst, QueryAst};
use crate::query_ast::{AutomatonQuery, BuildTantivyAstContext, JsonPathPrefix, TantivyQueryAst};
use crate::tokenizers::TokenizerManager;
use crate::{InvalidQuery, find_field_or_hit_dynamic};

/// A Wildcard query allows to match 'bond' with a query like 'b*d'.
#[derive(PartialEq, Eq, Debug, Serialize, Deserialize, Clone)]
pub struct WildcardQuery {
    pub field: String,
    pub value: String,
    /// Support missing fields
    pub lenient: bool,
    pub case_insensitive: bool,
}

impl From<WildcardQuery> for QueryAst {
    fn from(wildcard_query: WildcardQuery) -> Self {
        Self::Wildcard(wildcard_query)
    }
}

fn parse_wildcard_query(mut query: &str) -> Vec<SubQuery> {
    let mut res = Vec::new();
    while let Some(pos) = query.find(['*', '?', '\\']) {
        if pos > 0 {
            res.push(SubQuery::Text(query[..pos].to_string()));
        }
        let chr = &query[pos..pos + 1];
        query = &query[pos + 1..];
        match chr {
            "*" => res.push(SubQuery::Wildcard),
            "?" => res.push(SubQuery::QuestionMark),
            "\\" => {
                if let Some(chr) = query.chars().next() {
                    res.push(SubQuery::Text(chr.to_string()));
                    query = &query[chr.len_utf8()..];
                } else {
                    // escaping at the end is invalid, handle it as if that escape sequence wasn't
                    // present
                    break;
                }
            }
            _ => unreachable!("find shouldn't return non-matching position"),
        }
    }
    if !query.is_empty() {
        res.push(SubQuery::Text(query.to_string()));
    }
    res
}

enum SubQuery {
    Text(String),
    Wildcard,
    QuestionMark,
}

fn sub_query_parts_to_regex(
    sub_query_parts: Vec<SubQuery>,
    tokenizer_name: &str,
    tokenizer_manager: &TokenizerManager,
) -> anyhow::Result<String> {
    let mut normalizer = tokenizer_manager
        .get_normalizer(tokenizer_name)
        .with_context(|| format!("no tokenizer named `{tokenizer_name}` is registered"))?;

    sub_query_parts
        .into_iter()
        .map(|part| match part {
            SubQuery::Text(text) => {
                let mut token_stream = normalizer.token_stream(&text);
                let expected_token = token_stream
                    .next()
                    .context("normalizer generated no content")?
                    .text
                    .clone();
                if let Some(_unexpected_token) = token_stream.next() {
                    bail!("normalizer generated multiple tokens")
                }
                Ok(Cow::Owned(regex::escape(&expected_token)))
            }
            SubQuery::Wildcard => Ok(Cow::Borrowed(".*")),
            SubQuery::QuestionMark => Ok(Cow::Borrowed(".")),
        })
        .collect::<Result<String, _>>()
}

impl WildcardQuery {
    pub fn to_regex(
        &self,
        schema: &TantivySchema,
        tokenizer_manager: &TokenizerManager,
    ) -> Result<(Field, Option<Vec<u8>>, String), InvalidQuery> {
        let Some((field, field_entry, json_path)) = find_field_or_hit_dynamic(&self.field, schema)
        else {
            return Err(InvalidQuery::FieldDoesNotExist {
                full_path: self.field.clone(),
            });
        };
        let field_type = field_entry.field_type();

        let sub_query_parts = parse_wildcard_query(&self.value);

        match field_type {
            FieldType::Str(text_options) => {
                let text_field_indexing = text_options.get_indexing_options().ok_or_else(|| {
                    InvalidQuery::SchemaError(format!(
                        "field {} is not full-text searchable",
                        field_entry.name()
                    ))
                })?;
                let tokenizer_name = text_field_indexing.tokenizer();
                let regex =
                    sub_query_parts_to_regex(sub_query_parts, tokenizer_name, tokenizer_manager)?;
                let regex = if self.case_insensitive {
                    format!("(?i){}", regex)
                } else {
                    regex
                };

                Ok((field, None, regex))
            }
            FieldType::JsonObject(json_options) => {
                let text_field_indexing =
                    json_options.get_text_indexing_options().ok_or_else(|| {
                        InvalidQuery::SchemaError(format!(
                            "field {} is not full-text searchable",
                            field_entry.name()
                        ))
                    })?;
                let tokenizer_name = text_field_indexing.tokenizer();
                let regex =
                    sub_query_parts_to_regex(sub_query_parts, tokenizer_name, tokenizer_manager)?;
                let regex = if self.case_insensitive {
                    format!("(?i){}", regex)
                } else {
                    regex
                };

                let mut term_for_path = Term::from_field_json_path(
                    field,
                    json_path,
                    json_options.is_expand_dots_enabled(),
                );
                term_for_path.append_type_and_str("");

                let value = term_for_path.value();
                // We skip the 1st byte which is a marker to tell this is json. This isn't present
                // in the dictionary
                let byte_path_prefix = value.as_serialized()[1..].to_owned();

                Ok((field, Some(byte_path_prefix), regex))
            }
            _ => Err(InvalidQuery::SchemaError(
                "trying to run a Wildcard query on a non-text field".to_string(),
            )),
        }
    }
}

impl BuildTantivyAst for WildcardQuery {
    fn build_tantivy_ast_impl(
        &self,
        context: &BuildTantivyAstContext,
    ) -> Result<TantivyQueryAst, InvalidQuery> {
        let (field, path, regex) = match self.to_regex(context.schema, context.tokenizer_manager) {
            Ok(res) => res,
            Err(InvalidQuery::FieldDoesNotExist { .. }) if self.lenient => {
                return Ok(TantivyQueryAst::match_none());
            }
            Err(e) => return Err(e),
        };
        let regex =
            tantivy_fst::Regex::new(&regex).context("failed to parse regex built from wildcard")?;
        let regex_automaton_with_path = JsonPathPrefix {
            prefix: path.unwrap_or_default(),
            automaton: regex.into(),
        };
        let regex_query_with_path = AutomatonQuery {
            field,
            automaton: Arc::new(regex_automaton_with_path),
        };
        Ok(regex_query_with_path.into())
    }
}

#[cfg(test)]
mod tests {
    use tantivy::schema::{TextFieldIndexing, TextOptions};

    use super::*;
    use crate::create_default_quickwit_tokenizer_manager;

    fn single_text_field_schema(field_name: &str, tokenizer: &str) -> TantivySchema {
        let mut schema_builder = TantivySchema::builder();
        let text_options = TextOptions::default()
            .set_indexing_options(TextFieldIndexing::default().set_tokenizer(tokenizer));
        schema_builder.add_text_field(field_name, text_options);
        schema_builder.build()
    }

    #[test]
    fn test_wildcard_query_to_regex_on_text() {
        let query = WildcardQuery {
            field: "text_field".to_string(),
            value: "MyString Wh1ch?a.nOrMal Tokenizer would*cut".to_string(),
            lenient: false,
            case_insensitive: false,
        };

        let tokenizer_manager = create_default_quickwit_tokenizer_manager();
        for tokenizer in ["raw", "whitespace"] {
            let mut schema_builder = TantivySchema::builder();
            let text_options = TextOptions::default()
                .set_indexing_options(TextFieldIndexing::default().set_tokenizer(tokenizer));
            schema_builder.add_text_field("text_field", text_options);
            let schema = schema_builder.build();

            let (_field, path, regex) = query.to_regex(&schema, &tokenizer_manager).unwrap();
            assert_eq!(regex, "MyString Wh1ch.a\\.nOrMal Tokenizer would.*cut");
            assert!(path.is_none());
        }

        for tokenizer in [
            "raw_lowercase",
            "lowercase",
            "default",
            "chinese_compatible",
            "source_code_default",
            "source_code_with_hex",
        ] {
            let mut schema_builder = TantivySchema::builder();
            let text_options = TextOptions::default()
                .set_indexing_options(TextFieldIndexing::default().set_tokenizer(tokenizer));
            schema_builder.add_text_field("text_field", text_options);
            let schema = schema_builder.build();

            let (_field, path, regex) = query.to_regex(&schema, &tokenizer_manager).unwrap();
            assert_eq!(regex, "mystring wh1ch.a\\.normal tokenizer would.*cut");
            assert!(path.is_none());
        }
    }

    #[test]
    fn test_wildcard_query_to_regex_on_escaped_text() {
        let query = WildcardQuery {
            field: "text_field".to_string(),
            value: "MyString Wh1ch\\?a.nOrMal Tokenizer would\\*cut".to_string(),
            lenient: false,
            case_insensitive: false,
        };

        let tokenizer_manager = create_default_quickwit_tokenizer_manager();
        for tokenizer in ["raw", "whitespace"] {
            let mut schema_builder = TantivySchema::builder();
            let text_options = TextOptions::default()
                .set_indexing_options(TextFieldIndexing::default().set_tokenizer(tokenizer));
            schema_builder.add_text_field("text_field", text_options);
            let schema = schema_builder.build();

            let (_field, path, regex) = query.to_regex(&schema, &tokenizer_manager).unwrap();
            assert_eq!(regex, "MyString Wh1ch\\?a\\.nOrMal Tokenizer would\\*cut");
            assert!(path.is_none());
        }

        for tokenizer in [
            "raw_lowercase",
            "lowercase",
            "default",
            "chinese_compatible",
            "source_code_default",
            "source_code_with_hex",
        ] {
            let mut schema_builder = TantivySchema::builder();
            let text_options = TextOptions::default()
                .set_indexing_options(TextFieldIndexing::default().set_tokenizer(tokenizer));
            schema_builder.add_text_field("text_field", text_options);
            let schema = schema_builder.build();

            let (_field, path, regex) = query.to_regex(&schema, &tokenizer_manager).unwrap();
            assert_eq!(regex, "mystring wh1ch\\?a\\.normal tokenizer would\\*cut");
            assert!(path.is_none());
        }
    }

    #[test]
    fn test_wildcard_query_to_regex_on_json() {
        let query = WildcardQuery {
            // this volontarily contains uppercase and regex-unsafe char to make sure we properly
            // keep the case, but sanitize special chars
            field: "json_field.Inner.Fie*ld".to_string(),
            value: "MyString Wh1ch?a.nOrMal Tokenizer would*cut".to_string(),
            lenient: false,
            case_insensitive: false,
        };

        let tokenizer_manager = create_default_quickwit_tokenizer_manager();
        for tokenizer in ["raw", "whitespace"] {
            let mut schema_builder = TantivySchema::builder();
            let text_options = TextOptions::default()
                .set_indexing_options(TextFieldIndexing::default().set_tokenizer(tokenizer));
            schema_builder.add_json_field("json_field", text_options);
            let schema = schema_builder.build();

            let (_field, path, regex) = query.to_regex(&schema, &tokenizer_manager).unwrap();
            assert_eq!(regex, "MyString Wh1ch.a\\.nOrMal Tokenizer would.*cut");
            assert_eq!(path.unwrap(), "Inner\u{1}Fie*ld\0s".as_bytes());
        }

        for tokenizer in [
            "raw_lowercase",
            "lowercase",
            "default",
            "chinese_compatible",
            "source_code_default",
            "source_code_with_hex",
        ] {
            let mut schema_builder = TantivySchema::builder();
            let text_options = TextOptions::default()
                .set_indexing_options(TextFieldIndexing::default().set_tokenizer(tokenizer));
            schema_builder.add_json_field("json_field", text_options);
            let schema = schema_builder.build();

            let (_field, path, regex) = query.to_regex(&schema, &tokenizer_manager).unwrap();
            assert_eq!(regex, "mystring wh1ch.a\\.normal tokenizer would.*cut");
            assert_eq!(path.unwrap(), "Inner\u{1}Fie*ld\0s".as_bytes());
        }
    }

    #[test]
    fn test_extract_regex_wildcard_missing_field() {
        let query = WildcardQuery {
            field: "my_missing_field".to_string(),
            value: "My query value*".to_string(),
            lenient: false,
            case_insensitive: false,
        };
        let tokenizer_manager = create_default_quickwit_tokenizer_manager();
        let schema = single_text_field_schema("my_field", "whitespace");
        let err = query.to_regex(&schema, &tokenizer_manager).unwrap_err();
        let InvalidQuery::FieldDoesNotExist {
            full_path: missing_field_full_path,
        } = err
        else {
            panic!("unexpected error: {err:?}");
        };
        assert_eq!(missing_field_full_path, "my_missing_field");
    }

    #[test]
    fn test_wildcard_query_to_regex_on_text_case_insensitive() {
        let query = WildcardQuery {
            field: "text_field".to_string(),
            value: "MyString Wh1ch?a.nOrMal Tokenizer would*cut".to_string(),
            lenient: false,
            case_insensitive: true,
        };

        let tokenizer_manager = create_default_quickwit_tokenizer_manager();
        for tokenizer in ["raw", "whitespace"] {
            let mut schema_builder = TantivySchema::builder();
            let text_options = TextOptions::default()
                .set_indexing_options(TextFieldIndexing::default().set_tokenizer(tokenizer));
            schema_builder.add_text_field("text_field", text_options);
            let schema = schema_builder.build();

            let (_field, path, regex) = query.to_regex(&schema, &tokenizer_manager).unwrap();
            assert_eq!(regex, "(?i)MyString Wh1ch.a\\.nOrMal Tokenizer would.*cut");
            assert!(path.is_none());
        }

        for tokenizer in [
            "raw_lowercase",
            "lowercase",
            "default",
            "chinese_compatible",
            "source_code_default",
            "source_code_with_hex",
        ] {
            let mut schema_builder = TantivySchema::builder();
            let text_options = TextOptions::default()
                .set_indexing_options(TextFieldIndexing::default().set_tokenizer(tokenizer));
            schema_builder.add_text_field("text_field", text_options);
            let schema = schema_builder.build();

            let (_field, path, regex) = query.to_regex(&schema, &tokenizer_manager).unwrap();
            assert_eq!(regex, "(?i)mystring wh1ch.a\\.normal tokenizer would.*cut");
            assert!(path.is_none());
        }
    }
}


================================================
FILE: quickwit/quickwit-query/src/tokenizers/chinese_compatible.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::str::CharIndices;

use tantivy::tokenizer::{Token, TokenStream, Tokenizer};

#[derive(Clone)]
pub(crate) struct ChineseTokenizer;

impl Tokenizer for ChineseTokenizer {
    type TokenStream<'a> = ChineseTokenStream<'a>;

    fn token_stream<'a>(&'a mut self, text: &'a str) -> Self::TokenStream<'a> {
        ChineseTokenStream {
            text,
            last_char: None,
            chars: text.char_indices(),
            token: Token::default(),
        }
    }
}

pub(crate) struct ChineseTokenStream<'a> {
    text: &'a str,
    last_char: Option<(usize, char)>,
    chars: CharIndices<'a>,
    token: Token,
}

fn char_is_cjk(c: char) -> bool {
    // Block                                   Range       Comment
    // CJK Unified Ideographs                  4E00-9FFF   Common
    // CJK Unified Ideographs Extension A      3400-4DBF   Rare
    // CJK Unified Ideographs Extension B      20000-2A6DF Rare, historic
    // CJK Unified Ideographs Extension C      2A700–2B73F Rare, historic
    // CJK Unified Ideographs Extension D      2B740–2B81F Uncommon, some in current use
    // CJK Unified Ideographs Extension E      2B820–2CEAF Rare, historic
    matches!(c,
        '\u{4500}'..='\u{9FFF}' |
        '\u{3400}'..='\u{4DBF}' |
        '\u{20000}'..='\u{2A6DF}' |
        '\u{2A700}'..='\u{2CEAF}' // merge of extension C,D and E.
    )
}

#[derive(Clone, Debug, Eq, PartialEq)]
enum Grouping {
    Keep,
    SplitKeep,
    SplitIgnore,
}

fn char_grouping(c: char) -> Grouping {
    if c.is_alphanumeric() {
        if char_is_cjk(c) {
            Grouping::SplitKeep
        } else {
            Grouping::Keep
        }
    } else {
        Grouping::SplitIgnore
    }
}

impl TokenStream for ChineseTokenStream<'_> {
    fn advance(&mut self) -> bool {
        self.token.text.clear();
        self.token.position = self.token.position.wrapping_add(1);

        let mut iter = self.last_char.take().into_iter().chain(&mut self.chars);

        while let Some((offset_from, c)) = iter.next() {
            match char_grouping(c) {
                Grouping::Keep => {
                    let offset_to = if let Some((next_index, next_char)) =
                        iter.find(|&(_, c)| char_grouping(c) != Grouping::Keep)
                    {
                        self.last_char = Some((next_index, next_char));
                        next_index
                    } else {
                        self.text.len()
                    };

                    self.token.offset_from = offset_from;
                    self.token.offset_to = offset_to;
                    self.token.text.push_str(&self.text[offset_from..offset_to]);
                    return true;
                }
                Grouping::SplitKeep => {
                    let num_bytes_in_char = c.len_utf8();
                    self.token.offset_from = offset_from;
                    self.token.offset_to = offset_from + num_bytes_in_char;
                    self.token
                        .text
                        .push_str(&self.text[offset_from..(self.token.offset_to)]);
                    return true;
                }
                Grouping::SplitIgnore => (),
            }
        }
        false
    }

    fn token(&self) -> &Token {
        &self.token
    }

    fn token_mut(&mut self) -> &mut Token {
        &mut self.token
    }
}

#[cfg(test)]
mod tests {
    use tantivy::tokenizer::{Token, TokenStream};

    #[test]
    fn test_chinese_tokenizer() {
        let text = "Hello world, 你好世界, bonjour monde";
        let tokenizer_manager = crate::create_default_quickwit_tokenizer_manager();
        let mut tokenizer = tokenizer_manager
            .get_tokenizer("chinese_compatible")
            .unwrap();
        let mut text_stream = tokenizer.token_stream(text);

        let mut res = Vec::new();
        while let Some(tok) = text_stream.next() {
            res.push(tok.clone());
        }

        // latin alphabet split on white spaces, Han split on each char
        let expected = [
            Token {
                offset_from: 0,
                offset_to: 5,
                position: 0,
                text: "hello".to_owned(),
                position_length: 1,
            },
            Token {
                offset_from: 6,
                offset_to: 11,
                position: 1,
                text: "world".to_owned(),
                position_length: 1,
            },
            Token {
                offset_from: 13,
                offset_to: 16,
                position: 2,
                text: "你".to_owned(),
                position_length: 1,
            },
            Token {
                offset_from: 16,
                offset_to: 19,
                position: 3,
                text: "好".to_owned(),
                position_length: 1,
            },
            Token {
                offset_from: 19,
                offset_to: 22,
                position: 4,
                text: "世".to_owned(),
                position_length: 1,
            },
            Token {
                offset_from: 22,
                offset_to: 25,
                position: 5,
                text: "界".to_owned(),
                position_length: 1,
            },
            Token {
                offset_from: 27,
                offset_to: 34,
                position: 6,
                text: "bonjour".to_owned(),
                position_length: 1,
            },
            Token {
                offset_from: 35,
                offset_to: 40,
                position: 7,
                text: "monde".to_owned(),
                position_length: 1,
            },
        ];

        assert_eq!(res, expected);
    }

    #[test]
    fn test_chinese_tokenizer_no_space() {
        let text = "Hello你好bonjour";
        let tokenizer_manager = crate::create_default_quickwit_tokenizer_manager();
        let mut tokenizer = tokenizer_manager
            .get_tokenizer("chinese_compatible")
            .unwrap();
        let mut text_stream = tokenizer.token_stream(text);

        let mut res = Vec::new();
        while let Some(tok) = text_stream.next() {
            res.push(tok.clone());
        }

        let expected = [
            Token {
                offset_from: 0,
                offset_to: 5,
                position: 0,
                text: "hello".to_owned(),
                position_length: 1,
            },
            Token {
                offset_from: 5,
                offset_to: 8,
                position: 1,
                text: "你".to_owned(),
                position_length: 1,
            },
            Token {
                offset_from: 8,
                offset_to: 11,
                position: 2,
                text: "好".to_owned(),
                position_length: 1,
            },
            Token {
                offset_from: 11,
                offset_to: 18,
                position: 3,
                text: "bonjour".to_owned(),
                position_length: 1,
            },
        ];

        assert_eq!(res, expected);
    }

    proptest::proptest! {
        #[test]
        fn test_proptest_ascii_default_chinese_equal(text in "[ -~]{0,64}") {
            let tokenizer_manager = crate::create_default_quickwit_tokenizer_manager();
            let mut cn_tok = tokenizer_manager.get_tokenizer("chinese_compatible").unwrap();
            let mut default_tok = tokenizer_manager.get_tokenizer("default").unwrap();

            let mut text_stream = cn_tok.token_stream(&text);

            let mut cn_res = Vec::new();
            while let Some(tok) = text_stream.next() {
                cn_res.push(tok.clone());
            }

            let mut text_stream = default_tok.token_stream(&text);

            let mut default_res = Vec::new();
            while let Some(tok) = text_stream.next() {
                default_res.push(tok.clone());
            }

            assert_eq!(cn_res, default_res);
        }
    }
}


================================================
FILE: quickwit/quickwit-query/src/tokenizers/code_tokenizer.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::ops::Range;
use std::str::CharIndices;

use tantivy::tokenizer::{Token, TokenStream, Tokenizer};

/// A Tokenizer splitting based on casing families often used in code such ase camelCase or
/// PascalCase.
///
/// For instance, it splits `PigCaféFactory2` as `[Pig, Café, Factory, 2]`, or `RPCResult` into
/// `[RPC, Result]`.
///
/// Optionally, it can keep sequences of hexadecimal chars together, which can be useful when
/// dealing with ids encoded in that way, such as UUIDs.
#[derive(Clone, Default)]
pub struct CodeTokenizer {
    token: Token,
    enable_hex: bool,
}

impl CodeTokenizer {
    /// When hex support is enabled, the tokenizer tries to keep group of hexadecimal digits as one
    /// token, instead of splitting them in groups of letters and numbers.
    pub fn with_hex_support() -> Self {
        CodeTokenizer {
            token: Token::default(),
            enable_hex: true,
        }
    }
}

impl Tokenizer for CodeTokenizer {
    type TokenStream<'a> = CodeTokenStream<'a>;

    fn token_stream<'a>(&'a mut self, text: &'a str) -> Self::TokenStream<'a> {
        self.token.reset();
        CodeTokenStream {
            chars: text.char_indices(),
            state: CodeTokenStreamState::Empty,
            text,
            token: &mut self.token,
            enable_hex: self.enable_hex,
        }
    }
}

pub struct CodeTokenStream<'a> {
    text: &'a str,
    chars: CharIndices<'a>,
    token: &'a mut Token,
    state: CodeTokenStreamState,
    enable_hex: bool,
}

enum AdvanceResult {
    None,
    Emit(TokenOffsets),
    Backtrack,
}

impl CodeTokenStream<'_> {
    fn advance_inner(&mut self, enable_hex: bool) -> bool {
        // this is cheap, just a copy of a few ptrs and integers
        let checkpoint = self.chars.clone();

        while let Some((next_char_offset, next_char)) = self.chars.next() {
            match self.state.advance(next_char_offset, next_char, enable_hex) {
                AdvanceResult::None => {}
                AdvanceResult::Emit(token_offsets) => {
                    self.update_token(token_offsets);
                    return true;
                }
                AdvanceResult::Backtrack => {
                    self.chars = checkpoint;
                    self.state.reset();
                    // this can't recurse more than once, Backtrack is only emitted from hex state,
                    // and calling with false prevent that state from being generated.
                    return self.advance_inner(false);
                }
            }
        }

        // No more chars.
        match self.state.finalize() {
            AdvanceResult::None => {}
            AdvanceResult::Emit(token_offsets) => {
                self.update_token(token_offsets);
                return true;
            }
            AdvanceResult::Backtrack => {
                self.chars = checkpoint;
                self.state.reset();
                return self.advance_inner(false);
            }
        }

        false
    }
}

impl TokenStream for CodeTokenStream<'_> {
    fn advance(&mut self) -> bool {
        self.token.text.clear();
        self.token.position = self.token.position.wrapping_add(1);

        self.advance_inner(self.enable_hex)
    }

    fn token(&self) -> &Token {
        self.token
    }

    fn token_mut(&mut self) -> &mut Token {
        self.token
    }
}

impl CodeTokenStream<'_> {
    fn update_token(&mut self, token_offsets: Range<usize>) {
        self.token.offset_from = token_offsets.start;
        self.token.offset_to = token_offsets.end;
        self.token
            .text
            .push_str(&self.text[token_offsets.start..token_offsets.end]);
    }
}

enum CodeTokenStreamState {
    Empty,
    ProcessingChars(ProcessingCharsState),
    ProcessingHex(ProcessingHexState),
}

struct ProcessingCharsState {
    is_first_char: bool,
    start_offset: usize,
    current_char: char,
    current_char_offset: usize,
    current_char_type: CharType,
}

type TokenOffsets = Range<usize>;

impl CodeTokenStreamState {
    fn reset(&mut self) {
        *self = CodeTokenStreamState::Empty;
    }

    fn advance(
        &mut self,
        next_char_offset: usize,
        next_char: char,
        allow_hex: bool,
    ) -> AdvanceResult {
        let next_char_type = get_char_type(next_char);
        match self {
            Self::Empty => {
                match next_char_type {
                    CharType::Delimiter => {
                        self.reset();
                    }
                    _ => {
                        let is_hex = next_char.is_ascii_digit()
                            || ('a'..='f').contains(&next_char)
                            || ('A'..='F').contains(&next_char);
                        if allow_hex && is_hex {
                            *self = CodeTokenStreamState::ProcessingHex(ProcessingHexState {
                                seen_lowercase: next_char_type == CharType::LowerCase,
                                seen_uppercase: next_char_type == CharType::UpperCase,
                                seen_number: next_char_type == CharType::Numeric,
                                start_offset: next_char_offset,
                                current_char: next_char,
                                current_char_offset: next_char_offset,
                            });
                        } else {
                            *self = CodeTokenStreamState::ProcessingChars(ProcessingCharsState {
                                is_first_char: true,
                                start_offset: next_char_offset,
                                current_char_offset: next_char_offset,
                                current_char: next_char,
                                current_char_type: next_char_type,
                            });
                        }
                    }
                }
                AdvanceResult::None
            }
            Self::ProcessingChars(state) => {
                match (state.current_char_type, next_char_type) {
                    (_, CharType::Delimiter) => {
                        let offsets = TokenOffsets {
                            start: state.start_offset,
                            end: state.current_char_offset + state.current_char.len_utf8(),
                        };
                        // this is the only case where we want to reset, otherwise we might get
                        // back to a hex-state in a place where we did not get a delimiter
                        self.reset();
                        AdvanceResult::Emit(offsets)
                    }
                    // We do not emit a token if we have only `Ac` (is_first_char = true).
                    // But we emit the token `AB` if we have `ABCa`,
                    (CharType::UpperCase, CharType::LowerCase) => {
                        if state.is_first_char {
                            state.is_first_char = false;
                            state.current_char_offset = next_char_offset;
                            state.current_char = next_char;
                            state.current_char_type = next_char_type;
                            AdvanceResult::None
                        } else {
                            let offsets = TokenOffsets {
                                start: state.start_offset,
                                end: state.current_char_offset,
                            };
                            state.is_first_char = false;
                            state.start_offset = state.current_char_offset;
                            state.current_char_offset = next_char_offset;
                            state.current_char = next_char;
                            state.current_char_type = next_char_type;
                            AdvanceResult::Emit(offsets)
                        }
                    }
                    // Don't emit tokens on identical char types.
                    (CharType::UpperCase, CharType::UpperCase)
                    | (CharType::LowerCase, CharType::LowerCase)
                    | (CharType::Numeric, CharType::Numeric) => {
                        state.is_first_char = false;
                        state.current_char_offset = next_char_offset;
                        state.current_char = next_char;
                        AdvanceResult::None
                    }
                    _ => {
                        let offsets = TokenOffsets {
                            start: state.start_offset,
                            end: state.current_char_offset + state.current_char.len_utf8(),
                        };
                        state.is_first_char = true;
                        state.start_offset = next_char_offset;
                        state.current_char_offset = next_char_offset;
                        state.current_char = next_char;
                        state.current_char_type = next_char_type;
                        AdvanceResult::Emit(offsets)
                    }
                }
            }
            Self::ProcessingHex(state) => {
                match state.consume_char(next_char_offset, next_char) {
                    HexResult::None => AdvanceResult::None,
                    HexResult::Emit(offsets) => {
                        self.reset();
                        AdvanceResult::Emit(offsets)
                    }
                    HexResult::RecoverableError(state) => {
                        *self = CodeTokenStreamState::ProcessingChars(state);
                        // the char wasn't actually consumed, we recurse once to make sure it is
                        self.advance(next_char_offset, next_char, allow_hex)
                    }
                    HexResult::IrrecoverableError => AdvanceResult::Backtrack,
                }
            }
        }
    }

    fn finalize(&mut self) -> AdvanceResult {
        match self {
            Self::Empty => AdvanceResult::None,
            Self::ProcessingChars(char_state) => {
                let offsets = TokenOffsets {
                    start: char_state.start_offset,
                    end: char_state.current_char_offset + char_state.current_char.len_utf8(),
                };
                *self = Self::Empty;
                AdvanceResult::Emit(offsets)
            }
            CodeTokenStreamState::ProcessingHex(hex_state) => match hex_state.finalize() {
                HexResult::None => unreachable!(),
                HexResult::Emit(offsets) => {
                    *self = Self::Empty;
                    AdvanceResult::Emit(offsets)
                }
                HexResult::RecoverableError(state) => {
                    *self = CodeTokenStreamState::ProcessingChars(state);
                    self.finalize()
                }
                HexResult::IrrecoverableError => AdvanceResult::Backtrack,
            },
        }
    }
}

/// Returns the type of the character:
/// - `UpperCase` for `p{Lu}`.
/// - `LowerCase` for `p{Ll}`.
/// - `Numeric` for `\d`.
/// - `Delimiter` for the remaining characters.
fn get_char_type(c: char) -> CharType {
    if c.is_alphabetic() {
        if c.is_uppercase() {
            CharType::UpperCase
        } else {
            CharType::LowerCase
        }
    } else if c.is_numeric() {
        CharType::Numeric
    } else {
        CharType::Delimiter
    }
}

#[derive(Clone, Copy, Debug, Eq, PartialEq)]
enum CharType {
    // Equivalent of regex `p{Lu}`.
    UpperCase,
    // Equivalent of regex `p{Ll}`.
    LowerCase,
    // Equivalent of regex `\d`.
    Numeric,
    // Other characters.
    Delimiter,
}

#[derive(Debug)]
struct ProcessingHexState {
    seen_uppercase: bool,
    seen_lowercase: bool,
    seen_number: bool,

    start_offset: usize,
    current_char_offset: usize,
    current_char: char,
}

enum HexResult {
    // no token emitted
    None,
    // a token is being emitted, after that the state needs to be reset.
    Emit(TokenOffsets),
    // we got an error, but where able to generate a code tokenizer state
    RecoverableError(ProcessingCharsState),
    // we got an error and can't generate a code tokenizer state, we need to backtrack
    IrrecoverableError,
}

impl ProcessingHexState {
    // if this returns an error, the char was *not* consumed
    fn consume_char(&mut self, next_char_offset: usize, next_char: char) -> HexResult {
        match next_char {
            '0'..='9' => self.seen_number = true,
            'a'..='f' => {
                if !self.seen_uppercase {
                    self.seen_lowercase = true;
                } else {
                    return self.to_processing_chars_state();
                }
            }
            'A'..='F' => {
                if !self.seen_lowercase {
                    self.seen_uppercase = true;
                } else {
                    return self.to_processing_chars_state();
                }
            }
            c => {
                if get_char_type(c) == CharType::Delimiter {
                    // end of sequence, check if size is multiple of 2, or try to generate code
                    // state. We use next_char_offset as it already takes into account the size of
                    // the last character
                    if (next_char_offset - self.start_offset).is_multiple_of(2) {
                        return HexResult::Emit(self.start_offset..next_char_offset);
                    }
                }
                // we got an invalid non-delimiter, or our sequence is an odd-length. Either way,
                // we need to go switch to the code tokenizer
                return self.to_processing_chars_state();
            }
        }
        // char was accepted, update state
        self.current_char_offset = next_char_offset;
        self.current_char = next_char;
        HexResult::None
    }

    fn to_processing_chars_state(&self) -> HexResult {
        let current_char_type = match (self.seen_uppercase, self.seen_lowercase, self.seen_number) {
            // for Aab, we actually take this branch has a hasn't been consumed just yet.
            (true, false, false) => CharType::UpperCase,
            (false, true, false) => CharType::LowerCase,
            (false, false, true) => CharType::Numeric,
            _ => return HexResult::IrrecoverableError,
        };
        HexResult::RecoverableError(ProcessingCharsState {
            current_char: self.current_char,
            current_char_offset: self.current_char_offset,
            start_offset: self.start_offset,
            is_first_char: self.current_char_offset == self.start_offset,
            current_char_type,
        })
    }

    fn finalize(&self) -> HexResult {
        let next_char_offset = self.current_char_offset + self.current_char.len_utf8();
        if (next_char_offset - self.start_offset).is_multiple_of(2) {
            return HexResult::Emit(self.start_offset..next_char_offset);
        }
        self.to_processing_chars_state()
    }
}

#[cfg(test)]
mod tests {
    use tantivy::tokenizer::{Token, TokenStream, Tokenizer};

    use super::CodeTokenizer;

    #[test]
    fn test_code_tokenizer() {
        let mut tokenizer = CodeTokenizer::default();
        {
            let mut token_stream = tokenizer.token_stream("PigCaféFactory2");
            let mut res = Vec::new();
            while let Some(tok) = token_stream.next() {
                res.push(tok.clone());
            }
            let expected_tokens = vec![
                Token {
                    offset_from: 0,
                    offset_to: 3,
                    position: 0,
                    text: "Pig".to_owned(),
                    position_length: 1,
                },
                Token {
                    offset_from: 3,
                    offset_to: 8,
                    position: 1,
                    text: "Café".to_owned(),
                    position_length: 1,
                },
                Token {
                    offset_from: 8,
                    offset_to: 15,
                    position: 2,
                    text: "Factory".to_owned(),
                    position_length: 1,
                },
                Token {
                    offset_from: 15,
                    offset_to: 16,
                    position: 3,
                    text: "2".to_owned(),
                    position_length: 1,
                },
            ];
            assert_eq!(res, expected_tokens);
        }
        {
            let mut token_stream = tokenizer.token_stream("PIG_CAFE_FACTORY");
            let mut res = Vec::new();
            while let Some(tok) = token_stream.next() {
                res.push(tok.clone());
            }
            let expected_tokens = vec![
                Token {
                    offset_from: 0,
                    offset_to: 3,
                    position: 0,
                    text: "PIG".to_owned(),
                    position_length: 1,
                },
                Token {
                    offset_from: 4,
                    offset_to: 8,
                    position: 1,
                    text: "CAFE".to_owned(),
                    position_length: 1,
                },
                Token {
                    offset_from: 9,
                    offset_to: 16,
                    position: 2,
                    text: "FACTORY".to_owned(),
                    position_length: 1,
                },
            ];
            assert_eq!(res, expected_tokens);
        }
        {
            let mut token_stream = tokenizer.token_stream("TPigCafeFactory");
            let mut res = Vec::new();
            while let Some(tok) = token_stream.next() {
                res.push(tok.clone());
            }
            let expected_tokens = vec![
                Token {
                    offset_from: 0,
                    offset_to: 1,
                    position: 0,
                    text: "T".to_owned(),
                    position_length: 1,
                },
                Token {
                    offset_from: 1,
                    offset_to: 4,
                    position: 1,
                    text: "Pig".to_owned(),
                    position_length: 1,
                },
                Token {
                    offset_from: 4,
                    offset_to: 8,
                    position: 2,
                    text: "Cafe".to_owned(),
                    position_length: 1,
                },
                Token {
                    offset_from: 8,
                    offset_to: 15,
                    position: 3,
                    text: "Factory".to_owned(),
                    position_length: 1,
                },
            ];
            assert_eq!(res, expected_tokens);
        }
        {
            let mut token_stream = tokenizer.token_stream("PIG# Cafe@FACTORY");
            let mut res = Vec::new();
            while let Some(tok) = token_stream.next() {
                res.push(tok.clone());
            }
            let expected_tokens = vec![
                Token {
                    offset_from: 0,
                    offset_to: 3,
                    position: 0,
                    text: "PIG".to_owned(),
                    position_length: 1,
                },
                Token {
                    offset_from: 5,
                    offset_to: 9,
                    position: 1,
                    text: "Cafe".to_owned(),
                    position_length: 1,
                },
                Token {
                    offset_from: 10,
                    offset_to: 17,
                    position: 2,
                    text: "FACTORY".to_owned(),
                    position_length: 1,
                },
            ];
            assert_eq!(res, expected_tokens);
        }
    }

    #[test]
    fn test_code_tokenizer_hex() {
        let mut tokenizer = CodeTokenizer::with_hex_support();
        {
            let mut token_stream = tokenizer.token_stream("PigCaféFactory2");
            let mut res = Vec::new();
            while let Some(tok) = token_stream.next() {
                res.push(tok.clone());
            }
            let expected_tokens = vec![
                Token {
                    offset_from: 0,
                    offset_to: 3,
                    position: 0,
                    text: "Pig".to_owned(),
                    position_length: 1,
                },
                Token {
                    offset_from: 3,
                    offset_to: 8,
                    position: 1,
                    text: "Café".to_owned(),
                    position_length: 1,
                },
                Token {
                    offset_from: 8,
                    offset_to: 15,
                    position: 2,
                    text: "Factory".to_owned(),
                    position_length: 1,
                },
                Token {
                    offset_from: 15,
                    offset_to: 16,
                    position: 3,
                    text: "2".to_owned(),
                    position_length: 1,
                },
            ];
            assert_eq!(res, expected_tokens);
        }
        {
            let mut token_stream = tokenizer.token_stream("PIG_CAFE_FACTORY");
            let mut res = Vec::new();
            while let Some(tok) = token_stream.next() {
                res.push(tok.clone());
            }
            let expected_tokens = vec![
                Token {
                    offset_from: 0,
                    offset_to: 3,
                    position: 0,
                    text: "PIG".to_owned(),
                    position_length: 1,
                },
                Token {
                    offset_from: 4,
                    offset_to: 8,
                    position: 1,
                    text: "CAFE".to_owned(),
                    position_length: 1,
                },
                Token {
                    offset_from: 9,
                    offset_to: 16,
                    position: 2,
                    text: "FACTORY".to_owned(),
                    position_length: 1,
                },
            ];
            assert_eq!(res, expected_tokens);
        }
        {
            let mut token_stream = tokenizer.token_stream("TPigCafeFactory");
            let mut res = Vec::new();
            while let Some(tok) = token_stream.next() {
                res.push(tok.clone());
            }
            let expected_tokens = vec![
                Token {
                    offset_from: 0,
                    offset_to: 1,
                    position: 0,
                    text: "T".to_owned(),
                    position_length: 1,
                },
                Token {
                    offset_from: 1,
                    offset_to: 4,
                    position: 1,
                    text: "Pig".to_owned(),
                    position_length: 1,
                },
                Token {
                    offset_from: 4,
                    offset_to: 8,
                    position: 2,
                    text: "Cafe".to_owned(),
                    position_length: 1,
                },
                Token {
                    offset_from: 8,
                    offset_to: 15,
                    position: 3,
                    text: "Factory".to_owned(),
                    position_length: 1,
                },
            ];
            assert_eq!(res, expected_tokens);
        }
        {
            let mut token_stream = tokenizer.token_stream("PIG# Cafe@FACTORY");
            let mut res = Vec::new();
            while let Some(tok) = token_stream.next() {
                res.push(tok.clone());
            }
            let expected_tokens = vec![
                Token {
                    offset_from: 0,
                    offset_to: 3,
                    position: 0,
                    text: "PIG".to_owned(),
                    position_length: 1,
                },
                Token {
                    offset_from: 5,
                    offset_to: 9,
                    position: 1,
                    text: "Cafe".to_owned(),
                    position_length: 1,
                },
                Token {
                    offset_from: 10,
                    offset_to: 17,
                    position: 2,
                    text: "FACTORY".to_owned(),
                    position_length: 1,
                },
            ];
            assert_eq!(res, expected_tokens);
        }
    }

    #[test]
    fn test_code_tokenizer_hex_scenaris() {
        let test_vectors = vec![
            // simple hex, separated by delimiter, or at end of string
            (
                "fa63bbbf-0fb9-5ec8-ae63-561dc0f444aa",
                vec!["fa63bbbf", "0fb9", "5ec8", "ae63", "561dc0f444aa"],
            ),
            (
                "FA63BBBF-0FB9-5EC8-AE63-561DC0F444AA",
                vec!["FA63BBBF", "0FB9", "5EC8", "AE63", "561DC0F444AA"],
            ),
            // last token has odd len
            (
                "fa63bbbf-0fb9-5ec8-ae63-561dc0f444a",
                vec![
                    "fa63bbbf", "0fb9", "5ec8", "ae63", "561", "dc", "0", "f", "444", "a",
                ],
            ),
            // a middle token has odd len
            (
                "fa63bbbf-0fb9-5ec8-ae6-561dc0f444aa",
                vec!["fa63bbbf", "0fb9", "5ec8", "ae", "6", "561dc0f444aa"],
            ),
            // token starts with upper case
            (
                "Fa63bbbf-0fb9-5ec8-ae63-561dc0f444aa",
                vec!["Fa", "63", "bbbf", "0fb9", "5ec8", "ae63", "561dc0f444aa"],
            ),
            // change in case during a token
            (
                "fa63Bbbf-0fb9-5ec8-ae63-561dc0f444aa",
                vec!["fa", "63", "Bbbf", "0fb9", "5ec8", "ae63", "561dc0f444aa"],
            ),
            (
                "fa63bbBf-0fb9-5ec8-ae63-561dc0f444aa",
                vec![
                    "fa",
                    "63",
                    "bb",
                    "Bf",
                    "0fb9",
                    "5ec8",
                    "ae63",
                    "561dc0f444aa",
                ],
            ),
            // token starts with lower case
            (
                "fA63BBBF-0FB9-5EC8-AE63-561DC0F444AA",
                vec![
                    "f",
                    "A",
                    "63",
                    "BBBF",
                    "0FB9",
                    "5EC8",
                    "AE63",
                    "561DC0F444AA",
                ],
            ),
            // token contain non hex
            (
                "fa63bgbf-0fb9-5ec8-ae63-561dc0f444aa",
                vec!["fa", "63", "bgbf", "0fb9", "5ec8", "ae63", "561dc0f444aa"],
            ),
            // non 0-9 numeric
            (
                "fa6③bbbf-0fb9-5ec8-ae63-561dc0f444aa",
                vec!["fa", "6③", "bbbf", "0fb9", "5ec8", "ae63", "561dc0f444aa"],
            ),
            ("301ms", vec!["301", "ms"]),
            ("301cd", vec!["301", "cd"]),
            ("30ms", vec!["30", "ms"]),
            // we don't know if it's candelas or hex, and assume hex in this case
            ("30cd", vec!["30cd"]),
            ("ABCDef", vec!["ABC", "Def"]),
        ];

        let mut tokenizer = CodeTokenizer::with_hex_support();
        for (text, expected) in test_vectors {
            let mut token_stream = tokenizer.token_stream(text);
            let mut res = Vec::new();
            while let Some(tok) = token_stream.next() {
                res.push(tok.text.clone());
            }
            assert_eq!(res, expected);
        }
    }
}


================================================
FILE: quickwit/quickwit-query/src/tokenizers/mod.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

mod chinese_compatible;
mod code_tokenizer;
mod tokenizer_manager;

use once_cell::sync::Lazy;
use tantivy::tokenizer::{
    AsciiFoldingFilter, LowerCaser, RawTokenizer, RemoveLongFilter, SimpleTokenizer, TextAnalyzer,
    WhitespaceTokenizer,
};

use self::chinese_compatible::ChineseTokenizer;
pub use self::code_tokenizer::CodeTokenizer;
pub use self::tokenizer_manager::{RAW_TOKENIZER_NAME, TokenizerManager};

pub const DEFAULT_REMOVE_TOKEN_LENGTH: usize = 255;

/// Quickwit's tokenizer/analyzer manager.
pub fn create_default_quickwit_tokenizer_manager() -> TokenizerManager {
    let tokenizer_manager = TokenizerManager::new();

    let raw_tokenizer = TextAnalyzer::builder(RawTokenizer::default())
        .filter(RemoveLongFilter::limit(DEFAULT_REMOVE_TOKEN_LENGTH))
        .build();
    tokenizer_manager.register("raw", raw_tokenizer, false);

    let raw_tokenizer = TextAnalyzer::builder(RawTokenizer::default())
        .filter(LowerCaser)
        .filter(RemoveLongFilter::limit(DEFAULT_REMOVE_TOKEN_LENGTH))
        .build();
    tokenizer_manager.register("raw_lowercase", raw_tokenizer, true);

    let lower_case_tokenizer = TextAnalyzer::builder(RawTokenizer::default())
        .filter(LowerCaser)
        .filter(RemoveLongFilter::limit(DEFAULT_REMOVE_TOKEN_LENGTH))
        .build();
    tokenizer_manager.register("lowercase", lower_case_tokenizer, true);

    let default_tokenizer = TextAnalyzer::builder(SimpleTokenizer::default())
        .filter(RemoveLongFilter::limit(DEFAULT_REMOVE_TOKEN_LENGTH))
        .filter(LowerCaser)
        .build();
    tokenizer_manager.register("default", default_tokenizer, true);
    tokenizer_manager.register("whitespace", WhitespaceTokenizer::default(), false);

    let chinese_tokenizer = TextAnalyzer::builder(ChineseTokenizer)
        .filter(RemoveLongFilter::limit(DEFAULT_REMOVE_TOKEN_LENGTH))
        .filter(LowerCaser)
        .build();
    tokenizer_manager.register("chinese_compatible", chinese_tokenizer, true);
    tokenizer_manager.register(
        "source_code_default",
        TextAnalyzer::builder(CodeTokenizer::default())
            .filter(RemoveLongFilter::limit(DEFAULT_REMOVE_TOKEN_LENGTH))
            .filter(LowerCaser)
            .filter(AsciiFoldingFilter)
            .build(),
        true,
    );
    tokenizer_manager.register(
        "source_code_with_hex",
        TextAnalyzer::builder(CodeTokenizer::with_hex_support())
            .filter(RemoveLongFilter::limit(DEFAULT_REMOVE_TOKEN_LENGTH))
            .filter(LowerCaser)
            .filter(AsciiFoldingFilter)
            .build(),
        true,
    );
    tokenizer_manager
}

fn create_quickwit_fastfield_normalizer_manager() -> TokenizerManager {
    let raw_tokenizer = TextAnalyzer::builder(RawTokenizer::default())
        .filter(RemoveLongFilter::limit(DEFAULT_REMOVE_TOKEN_LENGTH))
        .build();
    let lower_case_tokenizer = TextAnalyzer::builder(RawTokenizer::default())
        .filter(LowerCaser)
        .filter(RemoveLongFilter::limit(DEFAULT_REMOVE_TOKEN_LENGTH))
        .build();
    let tokenizer_manager = TokenizerManager::new();
    tokenizer_manager.register("raw", raw_tokenizer, false);
    tokenizer_manager.register("lowercase", lower_case_tokenizer, true);
    tokenizer_manager
}

pub fn get_quickwit_fastfield_normalizer_manager() -> &'static TokenizerManager {
    static QUICKWIT_FAST_FIELD_NORMALIZER_MANAGER: Lazy<TokenizerManager> =
        Lazy::new(create_quickwit_fastfield_normalizer_manager);
    &QUICKWIT_FAST_FIELD_NORMALIZER_MANAGER
}

#[cfg(test)]
mod tests {

    #[test]
    fn test_tokenizers_in_manager() {
        let tokenizer_manager = super::create_default_quickwit_tokenizer_manager();
        tokenizer_manager
            .get_tokenizer("chinese_compatible")
            .unwrap();
        tokenizer_manager.get_tokenizer("default").unwrap();
        tokenizer_manager.get_tokenizer("raw").unwrap();
    }

    #[test]
    fn test_raw_tokenizer() {
        let tokenizer_manager = super::create_default_quickwit_tokenizer_manager();
        let my_haiku = r#"
        white sandy beach
        a strong wind is coming
        sand in my face
        "#;
        let my_long_text = "a text, that is just too long, no one will type it, no one will like \
                            it, no one shall find it. I just need some more chars, now you may \
                            not pass.";

        let mut tokenizer = tokenizer_manager.get_tokenizer("raw").unwrap();
        let mut haiku_stream = tokenizer.token_stream(my_haiku);
        assert!(haiku_stream.advance());
        assert!(!haiku_stream.advance());
        let mut other_tokenizer = tokenizer_manager.get_tokenizer("raw").unwrap();
        let mut other_stream = other_tokenizer.token_stream(my_long_text);
        assert!(other_stream.advance());
        assert!(!other_stream.advance());
    }

    #[test]
    fn test_code_tokenizer_in_tokenizer_manager() {
        let mut code_tokenizer = super::create_default_quickwit_tokenizer_manager()
            .get_tokenizer("source_code_default")
            .unwrap();
        let mut token_stream = code_tokenizer.token_stream("PigCaféFactory2");
        let mut tokens = Vec::new();
        while let Some(token) = token_stream.next() {
            tokens.push(token.text.to_string());
        }
        assert_eq!(tokens, vec!["pig", "cafe", "factory", "2"])
    }

    #[test]
    fn test_raw_lowercase_tokenizer() {
        let tokenizer_manager = super::create_default_quickwit_tokenizer_manager();
        let my_long_text = "a text, that is just too long, no one will type it, no one will like \
                            it, no one shall find it. I just need some more chars, now you may \
                            not pass.";

        let mut tokenizer = tokenizer_manager.get_tokenizer("raw_lowercase").unwrap();
        let mut stream = tokenizer.token_stream(my_long_text);
        assert!(stream.advance());
        assert_eq!(stream.token().text.len(), my_long_text.len());
        // there are non letter, so we can't check for all lowercase directly
        assert!(stream.token().text.chars().all(|c| !c.is_uppercase()));
        assert!(!stream.advance());
    }
}


================================================
FILE: quickwit/quickwit-query/src/tokenizers/tokenizer_manager.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::HashMap;
use std::sync::{Arc, RwLock};

use tantivy::tokenizer::{
    LowerCaser, RawTokenizer, RemoveLongFilter, TextAnalyzer,
    TokenizerManager as TantivyTokenizerManager,
};

use crate::DEFAULT_REMOVE_TOKEN_LENGTH;

pub const RAW_TOKENIZER_NAME: &str = "raw";
const LOWERCASE_TOKENIZER_NAME: &str = "lowercase";
const RAW_LOWERCASE_TOKENIZER_NAME: &str = "raw_lowercase";

#[derive(Clone)]
pub struct TokenizerManager {
    inner: TantivyTokenizerManager,
    is_lowercaser: Arc<RwLock<HashMap<String, bool>>>,
}

impl TokenizerManager {
    /// Creates an empty tokenizer manager.
    pub fn new() -> Self {
        let this = Self {
            inner: TantivyTokenizerManager::new(),
            is_lowercaser: Arc::new(RwLock::new(HashMap::new())),
        };

        // in practice these will almost always be overridden in
        // create_default_quickwit_tokenizer_manager()
        let raw_tokenizer = TextAnalyzer::builder(RawTokenizer::default())
            .filter(RemoveLongFilter::limit(DEFAULT_REMOVE_TOKEN_LENGTH))
            .build();
        this.register(RAW_TOKENIZER_NAME, raw_tokenizer, false);
        let raw_tokenizer = TextAnalyzer::builder(RawTokenizer::default())
            .filter(LowerCaser)
            .filter(RemoveLongFilter::limit(DEFAULT_REMOVE_TOKEN_LENGTH))
            .build();
        this.register(RAW_LOWERCASE_TOKENIZER_NAME, raw_tokenizer, true);
        let lower_case_tokenizer = TextAnalyzer::builder(RawTokenizer::default())
            .filter(LowerCaser)
            .filter(RemoveLongFilter::limit(DEFAULT_REMOVE_TOKEN_LENGTH))
            .build();
        this.register(LOWERCASE_TOKENIZER_NAME, lower_case_tokenizer, true);

        this
    }

    /// Registers a new tokenizer associated with a given name.
    pub fn register<T>(&self, tokenizer_name: &str, tokenizer: T, does_lowercasing: bool)
    where TextAnalyzer: From<T> {
        self.inner.register(tokenizer_name, tokenizer);
        self.is_lowercaser
            .write()
            .unwrap()
            .insert(tokenizer_name.to_string(), does_lowercasing);
    }

    /// Accessing a tokenizer given its name.
    pub fn get_tokenizer(&self, tokenizer_name: &str) -> Option<TextAnalyzer> {
        self.inner.get(tokenizer_name)
    }

    /// Query whether a given tokenizer does lowercasing
    pub fn get_normalizer(&self, tokenizer_name: &str) -> Option<TextAnalyzer> {
        let use_lowercaser = self
            .is_lowercaser
            .read()
            .unwrap()
            .get(tokenizer_name)
            .copied()?;
        let analyzer = if use_lowercaser {
            RAW_LOWERCASE_TOKENIZER_NAME
        } else {
            RAW_TOKENIZER_NAME
        };
        self.get_tokenizer(analyzer)
    }

    /// Get the inner TokenizerManager
    pub fn tantivy_manager(&self) -> &TantivyTokenizerManager {
        &self.inner
    }
}

impl Default for TokenizerManager {
    fn default() -> Self {
        Self::new()
    }
}


================================================
FILE: quickwit/quickwit-rest-client/Cargo.toml
================================================
[package]
name = "quickwit-rest-client"
description = "Rust client for Quickwit REST API"

version.workspace = true
edition.workspace = true
homepage.workspace = true
documentation.workspace = true
repository.workspace = true
authors.workspace = true
license.workspace = true

[dependencies]
anyhow = { workspace = true }
bytes = { workspace = true }
reqwest = { workspace = true }
reqwest-middleware = { workspace = true }
reqwest-retry = { workspace = true }
serde = { workspace = true }
serde_json = { workspace = true }
thiserror = { workspace = true }
tokio = { workspace = true }
tracing = { workspace = true }

quickwit-cluster = { workspace = true }
quickwit-common = { workspace = true }
quickwit-config = { workspace = true }
quickwit-indexing = { workspace = true }
quickwit-ingest = { workspace = true }
quickwit-metastore = { workspace = true }
quickwit-proto = { workspace = true }
quickwit-serve = { workspace = true }

[dev-dependencies]
http = { workspace = true }
wiremock = { workspace = true }

quickwit-config = { workspace = true, features = ["testsuite"] }
quickwit-indexing = { workspace = true, features = ["testsuite"] }
quickwit-metastore = { workspace = true, features = ["testsuite"] }


================================================
FILE: quickwit/quickwit-rest-client/README.md
================================================
# quickwit-rest-client

This project hosts quickwit REST client.


================================================
FILE: quickwit/quickwit-rest-client/resources/tests/documents_to_ingest.json
================================================
{"user":"8","tags":["rust"]}
{"user":"7","tags":["python"]}


================================================
FILE: quickwit/quickwit-rest-client/src/error.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use reqwest::StatusCode;
use reqwest_middleware::Error as MiddlewareError;
use serde::Deserialize;
use thiserror::Error;

pub static DEFAULT_ADDRESS: &str = "http://127.0.0.1:7280";
pub static DEFAULT_CONTENT_TYPE: &str = "application/json";

#[derive(Error, Debug)]
pub enum Error {
    // Error returned by Quickwit server.
    #[error("API error: {0}")]
    Api(#[from] ApiError),
    // Error returned by reqwest lib.
    #[error("client error: {0:?}")]
    Client(#[from] reqwest::Error),
    // IO Error returned by tokio lib.
    #[error("IO error: {0}")]
    Io(#[from] tokio::io::Error),
    // Internal error returned by quickwit client lib.
    #[error("internal Quickwit client error: {0}")]
    Internal(String),
    // Error returned by reqwest middleware.
    #[error("client middleware error: {0:?}")]
    Middleware(anyhow::Error),
    // Error returned by url lib when parsing a string.
    #[error("URL parsing error: {0}")]
    UrlParse(String),
}

impl Error {
    pub fn status_code(&self) -> Option<StatusCode> {
        match &self {
            Self::Api(error) => Some(error.code),
            Self::Client(error) => error.status(),
            Self::Internal(_) => Some(StatusCode::INTERNAL_SERVER_ERROR),
            Self::Io(_) => Some(StatusCode::INTERNAL_SERVER_ERROR),
            Self::Middleware(_) => Some(StatusCode::INTERNAL_SERVER_ERROR),
            Self::UrlParse(_) => Some(StatusCode::BAD_REQUEST),
        }
    }
}

impl From<MiddlewareError> for Error {
    fn from(error: MiddlewareError) -> Self {
        match error {
            MiddlewareError::Middleware(error) => Error::Middleware(error),
            MiddlewareError::Reqwest(error) => Error::Client(error),
        }
    }
}

#[derive(Debug, Error)]
pub struct ApiError {
    pub message: Option<String>,
    pub code: StatusCode,
}

// Implement `Display` for `ApiError`.
impl std::fmt::Display for ApiError {
    fn fmt(&self, f: &mut std::fmt::Formatter) -> std::fmt::Result {
        if let Some(error) = &self.message {
            write!(f, "(code={}, message={})", self.code, error)
        } else {
            write!(f, "(code={})", self.code)
        }
    }
}

#[derive(Deserialize)]
pub(crate) struct ErrorResponsePayload {
    pub message: String,
}


================================================
FILE: quickwit/quickwit-rest-client/src/lib.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::path::Path;
use std::{io, mem};

use bytes::Bytes;
use tokio::fs::File;
use tokio::io::{AsyncBufReadExt, AsyncRead, BufReader};
use tracing::warn;

pub mod error;
pub mod models;
pub mod rest_client;

// re-exports
pub use quickwit_config::ConfigFormat;
pub use reqwest::Url;

pub(crate) struct BatchLineReader {
    buf_reader: BufReader<Box<dyn AsyncRead + Send + Sync + Unpin>>,
    buffer: Vec<u8>,
    alloc_num_bytes: usize,
    max_batch_num_bytes: usize,
    num_lines: usize,
    has_next: bool,
}

impl BatchLineReader {
    pub async fn from_file(filepath: &Path, max_batch_num_bytes: usize) -> io::Result<Self> {
        let file = File::open(&filepath).await?;
        Ok(Self::new(Box::new(file), max_batch_num_bytes))
    }

    pub fn from_stdin(max_batch_num_bytes: usize) -> Self {
        Self::new(Box::new(tokio::io::stdin()), max_batch_num_bytes)
    }

    pub fn new(
        reader: Box<dyn AsyncRead + Send + Sync + Unpin>,
        max_batch_num_bytes: usize,
    ) -> Self {
        let alloc_num_bytes = max_batch_num_bytes + 100 * 1024; // Add 100 KiB headroom to avoid reallocation.
        Self {
            buf_reader: BufReader::new(reader),
            buffer: Vec::with_capacity(alloc_num_bytes),
            alloc_num_bytes,
            max_batch_num_bytes,
            num_lines: 0,
            has_next: true,
        }
    }

    pub async fn next_batch(&mut self) -> io::Result<Option<Bytes>> {
        loop {
            let line_num_bytes = self.buf_reader.read_until(b'\n', &mut self.buffer).await?;

            if line_num_bytes > self.max_batch_num_bytes {
                warn!(
                    "Skipping line {}, which exceeds the maximum allowed content length ({} vs. \
                     {} bytes).",
                    self.num_lines + 1,
                    line_num_bytes,
                    self.max_batch_num_bytes
                );
                let new_len = self.buffer.len() - line_num_bytes;
                self.buffer.truncate(new_len);
                continue;
            }
            if self.buffer.len() > self.max_batch_num_bytes {
                let mut new_buffer = Vec::with_capacity(self.alloc_num_bytes);
                let new_len = self.buffer.len() - line_num_bytes;
                new_buffer.extend_from_slice(&self.buffer[new_len..]);
                self.buffer.truncate(new_len);
                let batch = mem::replace(&mut self.buffer, new_buffer);
                return Ok(Some(Bytes::from(batch)));
            }
            if line_num_bytes == 0 {
                self.has_next = false;
                if self.buffer.is_empty() {
                    return Ok(None);
                }
                let batch = mem::take(&mut self.buffer);
                return Ok(Some(Bytes::from(batch)));
            }
            self.num_lines += 1;
        }
    }

    /// Returns whether there is still data available
    ///
    /// This can spuriously return `true` when there was no data
    /// to send at all.
    pub fn has_next(&self) -> bool {
        self.has_next
    }

    fn from_string(payload: impl ToString, max_batch_num_bytes: usize) -> Self {
        Self::new(
            Box::new(std::io::Cursor::new(payload.to_string().into_bytes())),
            max_batch_num_bytes,
        )
    }
}

#[cfg(test)]
mod tests {
    use super::*;

    #[tokio::test]
    async fn test_batch_reader() {
        {
            let mut batch_reader = BatchLineReader::from_string("".to_string(), 10);
            assert!(batch_reader.next_batch().await.unwrap().is_none());
            assert!(batch_reader.next_batch().await.unwrap().is_none());
        }
        {
            let mut batch_reader = BatchLineReader::from_string("foo\n", 10);
            assert_eq!(
                &batch_reader.next_batch().await.unwrap().unwrap()[..],
                b"foo\n"
            );
            assert!(batch_reader.next_batch().await.unwrap().is_none());
            assert!(batch_reader.next_batch().await.unwrap().is_none());
        }
        {
            let mut batch_reader = BatchLineReader::from_string("foo\nbar\nqux\n", 10);
            assert_eq!(
                &batch_reader.next_batch().await.unwrap().unwrap()[..],
                b"foo\nbar\n"
            );
            assert_eq!(
                &batch_reader.next_batch().await.unwrap().unwrap()[..],
                b"qux\n"
            );
            assert!(batch_reader.next_batch().await.unwrap().is_none());
            assert!(batch_reader.next_batch().await.unwrap().is_none());
        }
        {
            let mut batch_reader = BatchLineReader::from_string("fooo\nbaar\nqux\n", 10);
            assert_eq!(
                &batch_reader.next_batch().await.unwrap().unwrap()[..],
                b"fooo\nbaar\n"
            );
            assert_eq!(
                &batch_reader.next_batch().await.unwrap().unwrap()[..],
                b"qux\n"
            );
            assert!(batch_reader.next_batch().await.unwrap().is_none());
            assert!(batch_reader.next_batch().await.unwrap().is_none());
        }
        {
            let mut batch_reader =
                BatchLineReader::from_string("foobarquxbaz\nfoo\nbar\nqux\n", 10);
            assert_eq!(
                &batch_reader.next_batch().await.unwrap().unwrap()[..],
                b"foo\nbar\n"
            );
            assert_eq!(
                &batch_reader.next_batch().await.unwrap().unwrap()[..],
                b"qux\n"
            );
            assert!(batch_reader.next_batch().await.unwrap().is_none());
            assert!(batch_reader.next_batch().await.unwrap().is_none());
        }
        {
            let mut batch_reader =
                BatchLineReader::from_string("foo\nbar\nfoobarquxbaz\nqux\n", 10);
            assert_eq!(
                &batch_reader.next_batch().await.unwrap().unwrap()[..],
                b"foo\nbar\n"
            );
            assert_eq!(
                &batch_reader.next_batch().await.unwrap().unwrap()[..],
                b"qux\n"
            );
            assert!(batch_reader.next_batch().await.unwrap().is_none());
            assert!(batch_reader.next_batch().await.unwrap().is_none());
        }
    }
}


================================================
FILE: quickwit/quickwit-rest-client/src/models.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::path::PathBuf;
use std::time::Duration;

use reqwest::StatusCode;
use serde::de::DeserializeOwned;
use serde::{Deserialize, Serialize};
use serde_json::Value as JsonValue;

use crate::error::{ApiError, Error, ErrorResponsePayload};

#[derive(Debug)]
pub struct ApiResponse {
    inner: reqwest::Response,
}

impl ApiResponse {
    pub fn new(inner: reqwest::Response) -> Self {
        Self { inner }
    }
    /// Get the HTTP status code of the response
    pub fn status_code(&self) -> StatusCode {
        self.inner.status()
    }

    /// Checks status and returns error if appropriate.
    pub async fn check(self) -> Result<(), Error> {
        if self.inner.status().is_client_error() || self.inner.status().is_server_error() {
            return Err(self.api_error().await);
        }
        Ok(())
    }

    async fn extract_error_message(self) -> Option<String> {
        let error_body_bytes = self.inner.bytes().await.ok()?;
        let error_body_text = std::str::from_utf8(&error_body_bytes).ok()?;
        if let Ok(error_payload) = serde_json::from_str::<ErrorResponsePayload>(error_body_text) {
            Some(error_payload.message)
        } else {
            Some(error_body_text.to_string())
        }
    }

    async fn api_error(self) -> Error {
        let code = self.inner.status();
        let error_message = self.extract_error_message().await;
        Error::from(ApiError {
            message: error_message,
            code,
        })
    }

    pub async fn deserialize<T: DeserializeOwned>(self) -> Result<T, Error> {
        if self.inner.status().is_client_error() || self.inner.status().is_server_error() {
            Err(self.api_error().await)
        } else {
            let object = self.inner.json::<T>().await?;
            Ok(object)
        }
    }
}

/// A cousin of `quickwit_search::SearchResponseRest` that implements [`Deserialize`]
///
/// This version of the response is necessary because
/// `serde_json_borrow::OwnedValue` is not deserializeable.
#[derive(Deserialize, Serialize, PartialEq, Debug)]
pub struct SearchResponseRestClient {
    pub num_hits: u64,
    pub hits: Vec<JsonValue>,
    pub snippets: Option<Vec<JsonValue>>,
    pub elapsed_time_micros: u64,
    pub errors: Vec<String>,
    pub aggregations: Option<JsonValue>,
}

#[derive(Clone)]
pub enum IngestSource {
    Str(String),
    File(PathBuf),
    Stdin,
}

/// A structure that represent a timeout. Unlike Duration it can also represent an infinite or no
/// timeout value.
#[derive(Clone, Copy, PartialEq, Eq, PartialOrd, Ord, Hash, Default, Debug)]
pub struct Timeout {
    duration: Duration,
}

const SECS_PER_MIN: u64 = 60;
const MINS_PER_HOUR: u64 = 60;
const HOURS_PER_DAY: u64 = 24;

impl Timeout {
    /// Creates a new timeout from duration
    pub const fn new(duration: Duration) -> Timeout {
        Timeout { duration }
    }

    /// Creates a new timeout from seconds
    pub const fn from_secs(secs: u64) -> Timeout {
        Timeout {
            duration: Duration::from_secs(secs),
        }
    }

    /// Creates a new timeout from minutes
    pub const fn from_mins(mins: u64) -> Timeout {
        Self::from_secs(mins * SECS_PER_MIN)
    }

    /// Creates a new timeout from hours
    pub const fn from_hours(hours: u64) -> Timeout {
        Self::from_secs(hours * SECS_PER_MIN * MINS_PER_HOUR)
    }

    /// Creates a new timeout from days
    pub const fn from_days(days: u64) -> Timeout {
        Self::from_secs(days * SECS_PER_MIN * MINS_PER_HOUR * HOURS_PER_DAY)
    }

    /// Creates a new infinite timeout
    pub const fn none() -> Timeout {
        Timeout {
            duration: Duration::MAX,
        }
    }

    /// Converts timeout into Some(Duration) or None if it is infinite.
    pub fn as_duration_opt(&self) -> Option<Duration> {
        if self.duration != Duration::MAX {
            Some(self.duration)
        } else {
            None
        }
    }
}


================================================
FILE: quickwit/quickwit-rest-client/src/rest_client.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::HashMap;
use std::time::Duration;

use bytes::Bytes;
use quickwit_cluster::ClusterSnapshot;
use quickwit_config::{ConfigFormat, SourceConfig};
use quickwit_indexing::actors::IndexingServiceCounters;
pub use quickwit_ingest::CommitType;
use quickwit_metastore::{IndexMetadata, Split, SplitInfo};
use quickwit_proto::ingest::Shard;
use quickwit_serve::{
    ListSplitsQueryParams, ListSplitsResponse, RestIngestResponse, SearchRequestQueryString,
};
use reqwest::header::{CONTENT_TYPE, HeaderMap, HeaderValue};
use reqwest::tls::Certificate;
use reqwest::{ClientBuilder as ReqwestClientBuilder, Method, StatusCode, Url};
use reqwest_middleware::{ClientBuilder as ReqwestMiddlewareClientBuilder, ClientWithMiddleware};
use reqwest_retry::RetryTransientMiddleware;
use reqwest_retry::policies::ExponentialBackoff;
use serde::Serialize;
use serde_json::json;

use crate::BatchLineReader;
use crate::error::Error;
use crate::models::{ApiResponse, IngestSource, SearchResponseRestClient, Timeout};

pub const DEFAULT_BASE_URL: &str = "http://127.0.0.1:7280";
pub const DEFAULT_CONTENT_TYPE: &str = "application/json";
pub const INGEST_CONTENT_LENGTH_LIMIT: usize = 10 * 1024 * 1024; // 10MiB
pub const DEFAULT_CLIENT_CONNECT_TIMEOUT: Timeout = Timeout::from_secs(5);
pub const DEFAULT_CLIENT_TIMEOUT: Timeout = Timeout::from_secs(10);
pub const DEFAULT_CLIENT_SEARCH_TIMEOUT: Timeout = Timeout::from_mins(1);
pub const DEFAULT_CLIENT_INGEST_TIMEOUT: Timeout = Timeout::from_mins(1);
pub const DEFAULT_CLIENT_COMMIT_TIMEOUT: Timeout = Timeout::from_mins(30);

struct Transport {
    base_url: Url,
    api_url: Url,
    client: ClientWithMiddleware,
}

impl Transport {
    fn new(
        endpoint: Url,
        connect_timeout: Timeout,
        ca_cert: Option<Certificate>,
        num_retries: u32,
    ) -> Self {
        let base_url = endpoint;
        let api_url = base_url
            .join("api/v1/")
            .expect("root url should be well-formed");
        let mut reqwest_client_builder = ReqwestClientBuilder::new();
        if let Some(duration) = connect_timeout.as_duration_opt() {
            reqwest_client_builder = reqwest_client_builder.connect_timeout(duration);
        }
        if let Some(ca_cert) = ca_cert {
            reqwest_client_builder = reqwest_client_builder
                .tls_built_in_root_certs(false)
                .add_root_certificate(ca_cert);
        }
        let retry_policy = ExponentialBackoff::builder()
            .retry_bounds(Duration::from_secs(1), Duration::from_secs(60))
            .build_with_max_retries(num_retries);
        let retry_transient_middleware = RetryTransientMiddleware::new_with_policy(retry_policy);
        let reqwest_client = reqwest_client_builder
            .build()
            .expect("`client_builder.build()` should not fail");
        let client = ReqwestMiddlewareClientBuilder::new(reqwest_client)
            .with(retry_transient_middleware)
            .build();
        Self {
            base_url,
            api_url,
            client,
        }
    }

    /// Creates an asynchronous request that can be awaited
    async fn send<Q: Serialize + ?Sized>(
        &self,
        method: Method,
        path: &str,
        header_map: Option<HeaderMap>,
        query_string: Option<&Q>,
        body: Option<Bytes>,
        timeout: Timeout,
    ) -> Result<ApiResponse, Error> {
        let url = if path.starts_with('/') {
            self.base_url.join(path)
        } else {
            self.api_url.join(path)
        }
        .map_err(|error| Error::UrlParse(error.to_string()))?;
        let mut request_builder = self.client.request(method, url);
        if let Some(duration) = timeout.as_duration_opt() {
            request_builder = request_builder.timeout(duration);
        }
        let mut request_headers = HeaderMap::new();
        request_headers.insert(CONTENT_TYPE, HeaderValue::from_static(DEFAULT_CONTENT_TYPE));
        if let Some(header_map_val) = header_map {
            request_headers.extend(header_map_val.into_iter());
        }
        request_builder = request_builder.headers(request_headers);
        if let Some(bytes) = body {
            request_builder = request_builder.body(bytes);
        };
        if let Some(qs) = query_string {
            request_builder = request_builder.query(qs);
        }
        let response = request_builder.send().await?;

        Ok(ApiResponse::new(response))
    }
}

pub struct QuickwitClientBuilder {
    /// Base url for the client
    base_url: Url,
    /// Connection timeout.
    connect_timeout: Timeout,
    /// Timeout for most operations except search and ingest.
    timeout: Timeout,
    /// Timeout for search operations.
    search_timeout: Timeout,
    /// Timeout for the ingest operations with auto commit.
    ingest_timeout: Timeout,
    /// Timeout for the ingest operations that require waiting for commit.
    commit_timeout: Timeout,
    /// Forces use of ingest v1.
    use_legacy_ingest: bool,
    /// Request detailed parse failures report from the ingest api.
    detailed_response: bool,
    /// Validate against a custom TLS certificate authority
    ca_cert: Option<Certificate>,
    /// Maximum number of retries for transient errors.
    num_retries: u32,
}

impl QuickwitClientBuilder {
    pub fn new(endpoint: Url) -> Self {
        QuickwitClientBuilder {
            base_url: endpoint,
            connect_timeout: DEFAULT_CLIENT_CONNECT_TIMEOUT,
            timeout: DEFAULT_CLIENT_TIMEOUT,
            search_timeout: DEFAULT_CLIENT_SEARCH_TIMEOUT,
            ingest_timeout: DEFAULT_CLIENT_INGEST_TIMEOUT,
            commit_timeout: DEFAULT_CLIENT_COMMIT_TIMEOUT,
            use_legacy_ingest: false,
            detailed_response: false,
            ca_cert: None,
            num_retries: 0,
        }
    }

    pub fn connect_timeout(mut self, timeout: Timeout) -> Self {
        self.connect_timeout = timeout;
        self
    }

    pub fn timeout(mut self, timeout: Timeout) -> Self {
        self.timeout = timeout;
        self
    }

    pub fn search_timeout(mut self, timeout: Timeout) -> Self {
        self.search_timeout = timeout;
        self
    }

    pub fn ingest_timeout(mut self, timeout: Timeout) -> Self {
        self.ingest_timeout = timeout;
        self
    }

    // TODO(#5604)
    pub fn use_legacy_ingest(mut self, use_legacy_ingest: bool) -> Self {
        self.use_legacy_ingest = use_legacy_ingest;
        self
    }

    pub fn detailed_response(mut self, is_detailed: bool) -> Self {
        self.detailed_response = is_detailed;
        self
    }

    pub fn commit_timeout(mut self, timeout: Timeout) -> Self {
        self.commit_timeout = timeout;
        self
    }

    pub fn set_tls_ca(mut self, ca_cert: Option<Certificate>) -> Self {
        self.ca_cert = ca_cert;
        self
    }

    pub fn num_retries(mut self, num_retries: u32) -> Self {
        self.num_retries = num_retries;
        self
    }

    pub fn build(self) -> QuickwitClient {
        let transport = Transport::new(
            self.base_url,
            self.connect_timeout,
            self.ca_cert,
            self.num_retries,
        );
        QuickwitClient {
            transport,
            timeout: self.timeout,
            search_timeout: self.search_timeout,
            ingest_timeout: self.ingest_timeout,
            commit_timeout: self.commit_timeout,
            use_legacy_ingest: self.use_legacy_ingest,
            detailed_response: self.detailed_response,
        }
    }
}

/// Root client for top level APIs.
pub struct QuickwitClient {
    transport: Transport,
    /// Timeout for all operations except search and ingest.
    timeout: Timeout,
    /// Timeout for search operations.
    search_timeout: Timeout,
    /// Timeout for the ingest operations.
    ingest_timeout: Timeout,
    /// Timeout for the ingest operations that require waiting for commit.
    commit_timeout: Timeout,
    /// Forces use of ingest v1.
    use_legacy_ingest: bool,
    /// Request detailed parse failures report from the ingest api.
    detailed_response: bool,
}

impl QuickwitClient {
    pub async fn search(
        &self,
        index_id: &str,
        search_query: SearchRequestQueryString,
    ) -> Result<SearchResponseRestClient, Error> {
        let path = format!("{index_id}/search");
        let bytes = serde_json::to_string(&search_query)
            .unwrap()
            .as_bytes()
            .to_vec();
        let body = Bytes::from(bytes);
        let response = self
            .transport
            .send::<()>(
                Method::POST,
                &path,
                None,
                None,
                Some(body),
                self.search_timeout,
            )
            .await?;
        let search_response = response.deserialize().await?;
        Ok(search_response)
    }

    pub fn indexes(&self) -> IndexClient<'_> {
        IndexClient::new(&self.transport, self.timeout)
    }

    pub fn splits<'a>(&'a self, index_id: &'a str) -> SplitClient<'a, 'a> {
        SplitClient::new(&self.transport, self.timeout, index_id)
    }

    pub fn sources<'a>(&'a self, index_id: &'a str) -> SourceClient<'a> {
        SourceClient::new(&self.transport, self.timeout, index_id)
    }

    pub fn cluster(&self) -> ClusterClient<'_> {
        ClusterClient::new(&self.transport, self.timeout)
    }

    pub fn node_stats(&self) -> NodeStatsClient<'_> {
        NodeStatsClient::new(&self.transport, self.timeout)
    }

    pub fn node_health(&self) -> NodeHealthClient<'_> {
        NodeHealthClient::new(&self.transport, self.timeout)
    }

    pub async fn ingest(
        &self,
        index_id: &str,
        ingest_source: IngestSource,
        batch_size_limit_opt: Option<usize>,
        mut on_ingest_event: Option<&mut (dyn FnMut(IngestEvent) + Sync)>,
        last_block_commit: CommitType,
    ) -> Result<RestIngestResponse, Error> {
        let ingest_path = format!("{index_id}/ingest");
        let mut query_params = HashMap::new();
        // TODO(#5604)
        if self.use_legacy_ingest {
            query_params.insert("use_legacy_ingest", "true");
        }
        if self.detailed_response {
            query_params.insert("detailed_response", "true");
        }
        let batch_size_limit = batch_size_limit_opt.unwrap_or(INGEST_CONTENT_LENGTH_LIMIT);
        let mut batch_reader = match ingest_source {
            IngestSource::File(filepath) => {
                BatchLineReader::from_file(&filepath, batch_size_limit).await?
            }
            IngestSource::Stdin => BatchLineReader::from_stdin(batch_size_limit),
            IngestSource::Str(ingest_payload) => {
                BatchLineReader::from_string(ingest_payload, batch_size_limit)
            }
        };
        let mut cumulated_resp = RestIngestResponse::default();
        while let Some(batch) = batch_reader.next_batch().await? {
            loop {
                let timeout = if !batch_reader.has_next() && last_block_commit != CommitType::Auto {
                    self.commit_timeout
                } else {
                    self.ingest_timeout
                };
                match last_block_commit {
                    CommitType::Auto => {}
                    CommitType::WaitFor => {
                        query_params.insert("commit", "wait_for");
                    }
                    CommitType::Force => {
                        query_params.insert("commit", "force");
                    }
                }
                let response = self
                    .transport
                    .send(
                        Method::POST,
                        &ingest_path,
                        None,
                        Some(&query_params),
                        Some(batch.clone()),
                        timeout,
                    )
                    .await?;
                if response.status_code() == StatusCode::TOO_MANY_REQUESTS {
                    if let Some(event_fn) = &mut on_ingest_event {
                        event_fn(IngestEvent::Sleep)
                    }
                    tokio::time::sleep(Duration::from_millis(500)).await;
                } else {
                    let current_parsed_resp = response.deserialize().await?;
                    cumulated_resp = cumulated_resp.merge(current_parsed_resp);
                    break;
                }
            }
            if let Some(event_fn) = &mut on_ingest_event {
                event_fn(IngestEvent::IngestedDocBatch(batch.len()))
            }
        }

        Ok(cumulated_resp)
    }
}

pub enum IngestEvent {
    IngestedDocBatch(usize),
    Sleep,
}

/// Client for indexes APIs.
pub struct IndexClient<'a> {
    transport: &'a Transport,
    timeout: Timeout,
}

impl<'a> IndexClient<'a> {
    fn new(transport: &'a Transport, timeout: Timeout) -> Self {
        Self { transport, timeout }
    }

    pub async fn create(
        &self,
        index_config: impl AsRef<[u8]>,
        config_format: ConfigFormat,
        overwrite: bool,
    ) -> Result<IndexMetadata, Error> {
        let header_map = header_from_config_format(config_format);
        let body = Bytes::copy_from_slice(index_config.as_ref());
        let response = self
            .transport
            .send(
                Method::POST,
                "indexes",
                Some(header_map),
                Some(&[("overwrite", overwrite)]),
                Some(body),
                self.timeout,
            )
            .await?;
        let index_metadata = response.deserialize().await?;
        Ok(index_metadata)
    }

    pub async fn update(
        &self,
        index_id: &str,
        index_config: impl AsRef<[u8]>,
        config_format: ConfigFormat,
        create: bool,
    ) -> Result<IndexMetadata, Error> {
        let header_map = header_from_config_format(config_format);
        let body = Bytes::copy_from_slice(index_config.as_ref());
        let mut query_params = HashMap::new();
        if create {
            query_params.insert("create", "true");
        }
        let path = format!("indexes/{index_id}");
        let response = self
            .transport
            .send(
                Method::PUT,
                &path,
                Some(header_map),
                Some(&query_params),
                Some(body),
                self.timeout,
            )
            .await?;
        let index_metadata = response.deserialize().await?;
        Ok(index_metadata)
    }

    pub async fn list(&self) -> Result<Vec<IndexMetadata>, Error> {
        let response = self
            .transport
            .send::<()>(Method::GET, "indexes", None, None, None, self.timeout)
            .await?;
        let indexes_metadatas = response.deserialize().await?;
        Ok(indexes_metadatas)
    }

    pub async fn get(&self, index_id: &str) -> Result<IndexMetadata, Error> {
        let path = format!("indexes/{index_id}");
        let response = self
            .transport
            .send::<()>(Method::GET, &path, None, None, None, self.timeout)
            .await?;
        let index_metadata = response.deserialize().await?;
        Ok(index_metadata)
    }

    pub async fn clear(&self, index_id: &str) -> Result<(), Error> {
        let path = format!("indexes/{index_id}/clear");
        let response = self
            .transport
            .send::<()>(Method::PUT, &path, None, None, None, self.timeout)
            .await?;
        response.check().await?;
        Ok(())
    }

    pub async fn delete(&self, index_id: &str, dry_run: bool) -> Result<Vec<SplitInfo>, Error> {
        let path = format!("indexes/{index_id}");
        let response = self
            .transport
            .send(
                Method::DELETE,
                &path,
                None,
                Some(&[("dry_run", dry_run)]),
                None,
                self.timeout,
            )
            .await?;
        let file_entries = response.deserialize().await?;
        Ok(file_entries)
    }
}

/// Client for splits APIs.
pub struct SplitClient<'a, 'b> {
    transport: &'a Transport,
    timeout: Timeout,
    index_id: &'b str,
}

impl<'a, 'b> SplitClient<'a, 'b> {
    fn new(transport: &'a Transport, timeout: Timeout, index_id: &'b str) -> Self {
        Self {
            transport,
            timeout,
            index_id,
        }
    }

    fn splits_root_url(&self) -> String {
        format!("indexes/{}/splits", self.index_id)
    }

    pub async fn list(
        &self,
        list_splits_query_params: ListSplitsQueryParams,
    ) -> Result<Vec<Split>, Error> {
        let path = self.splits_root_url();
        let response = self
            .transport
            .send(
                Method::GET,
                &path,
                None,
                Some(&list_splits_query_params),
                None,
                self.timeout,
            )
            .await?;
        let list_splits_response: ListSplitsResponse = response.deserialize().await?;
        Ok(list_splits_response.splits)
    }

    pub async fn mark_for_deletion(&self, split_ids: Vec<String>) -> Result<(), Error> {
        let path = format!("{}/mark-for-deletion", self.splits_root_url());
        let body_json = json!({ "split_ids": split_ids });
        let body_vec =
            serde_json::to_vec(&body_json).expect("serializing `body_json` should never fail");
        let body_bytes = Bytes::from(body_vec);
        let response = self
            .transport
            .send::<()>(
                Method::PUT,
                &path,
                None,
                None,
                Some(body_bytes),
                self.timeout,
            )
            .await?;
        response.check().await?;
        Ok(())
    }
}

/// Client for source APIs.
pub struct SourceClient<'a> {
    transport: &'a Transport,
    timeout: Timeout,
    index_id: &'a str,
}

impl<'a> SourceClient<'a> {
    fn new(transport: &'a Transport, timeout: Timeout, index_id: &'a str) -> Self {
        Self {
            transport,
            timeout,
            index_id,
        }
    }

    fn sources_root_url(&self) -> String {
        format!("indexes/{}/sources", self.index_id)
    }

    pub async fn create(
        &self,
        source_config_input: impl AsRef<[u8]>,
        config_format: ConfigFormat,
    ) -> Result<SourceConfig, Error> {
        let header_map = header_from_config_format(config_format);
        let source_config_bytes = Bytes::copy_from_slice(source_config_input.as_ref());
        let response = self
            .transport
            .send::<()>(
                Method::POST,
                &self.sources_root_url(),
                Some(header_map),
                None,
                Some(source_config_bytes),
                self.timeout,
            )
            .await?;
        let source_config = response.deserialize().await?;
        Ok(source_config)
    }

    pub async fn update(
        &self,
        source_id: &str,
        source_config_input: impl AsRef<[u8]>,
        config_format: ConfigFormat,
        create: bool,
    ) -> Result<SourceConfig, Error> {
        let header_map = header_from_config_format(config_format);
        let source_config_bytes = Bytes::copy_from_slice(source_config_input.as_ref());
        let mut query_params = HashMap::new();
        if create {
            query_params.insert("create", "true");
        }
        let path = format!("{}/{source_id}", self.sources_root_url());
        let response = self
            .transport
            .send(
                Method::PUT,
                &path,
                Some(header_map),
                Some(&query_params),
                Some(source_config_bytes),
                self.timeout,
            )
            .await?;
        let source_config = response.deserialize().await?;
        Ok(source_config)
    }

    pub async fn get(&self, source_id: &str) -> Result<SourceConfig, Error> {
        let path = format!("{}/{source_id}", self.sources_root_url());
        let response = self
            .transport
            .send::<()>(Method::GET, &path, None, None, None, self.timeout)
            .await?;
        let source_config = response.deserialize().await?;
        Ok(source_config)
    }

    pub async fn toggle(&self, source_id: &str, enable: bool) -> Result<(), Error> {
        let json_value = json!({ "enable": enable });
        let json_bytes = serde_json::to_vec(&json_value).expect("Serialization should never fail.");
        let path = format!("{}/{source_id}/toggle", self.sources_root_url());
        let response = self
            .transport
            .send::<()>(
                Method::PUT,
                &path,
                None,
                None,
                Some(Bytes::from(json_bytes)),
                self.timeout,
            )
            .await?;
        response.check().await?;
        Ok(())
    }

    pub async fn reset_checkpoint(&self, source_id: &str) -> Result<(), Error> {
        let path = format!("{}/{source_id}/reset-checkpoint", self.sources_root_url());
        let response = self
            .transport
            .send::<()>(Method::PUT, &path, None, None, None, self.timeout)
            .await?;
        response.check().await?;
        Ok(())
    }

    pub async fn list(&self) -> Result<Vec<SourceConfig>, Error> {
        let response = self
            .transport
            .send::<()>(
                Method::GET,
                &self.sources_root_url(),
                None,
                None,
                None,
                self.timeout,
            )
            .await?;
        let source_configs = response.deserialize().await?;
        Ok(source_configs)
    }

    pub async fn delete(&self, source_id: &str) -> Result<(), Error> {
        let path = format!("{}/{source_id}", self.sources_root_url());
        let response = self
            .transport
            .send::<()>(Method::DELETE, &path, None, None, None, self.timeout)
            .await?;
        response.check().await?;
        Ok(())
    }

    pub async fn get_shards(&self, source_id: &str) -> Result<Vec<Shard>, Error> {
        let path = format!("{}/{source_id}/shards", self.sources_root_url());
        let response = self
            .transport
            .send::<()>(Method::GET, &path, None, None, None, self.timeout)
            .await?;
        let source_config = response.deserialize().await?;
        Ok(source_config)
    }
}

/// Client for Cluster APIs.
pub struct ClusterClient<'a> {
    transport: &'a Transport,
    timeout: Timeout,
}

impl<'a> ClusterClient<'a> {
    fn new(transport: &'a Transport, timeout: Timeout) -> Self {
        Self { transport, timeout }
    }

    pub async fn snapshot(&self) -> Result<ClusterSnapshot, Error> {
        let response = self
            .transport
            .send::<()>(Method::GET, "cluster", None, None, None, self.timeout)
            .await?;
        let cluster_snapshot = response.deserialize().await?;
        Ok(cluster_snapshot)
    }
}

/// Client for Node-level Stats APIs.
pub struct NodeStatsClient<'a> {
    transport: &'a Transport,
    timeout: Timeout,
}

impl<'a> NodeStatsClient<'a> {
    fn new(transport: &'a Transport, timeout: Timeout) -> Self {
        Self { transport, timeout }
    }

    pub async fn indexing(&self) -> Result<IndexingServiceCounters, Error> {
        let response = self
            .transport
            .send::<()>(Method::GET, "indexing", None, None, None, self.timeout)
            .await?;
        let indexing_stats = response.deserialize().await?;
        Ok(indexing_stats)
    }
}

/// Client for Node-level Health APIs.
pub struct NodeHealthClient<'a> {
    transport: &'a Transport,
    timeout: Timeout,
}

impl<'a> NodeHealthClient<'a> {
    fn new(transport: &'a Transport, timeout: Timeout) -> Self {
        Self { transport, timeout }
    }

    /// Returns true if the node is healthy, returns false or an error otherwise.
    pub async fn is_live(&self) -> Result<bool, Error> {
        let response = self
            .transport
            .send::<()>(Method::GET, "/health/livez", None, None, None, self.timeout)
            .await?;
        let result: bool = response.deserialize().await?;
        Ok(result)
    }

    /// Returns true if the node is ready, returns false or an error otherwise.
    pub async fn is_ready(&self) -> Result<bool, Error> {
        let response = self
            .transport
            .send::<()>(
                Method::GET,
                "/health/readyz",
                None,
                None,
                None,
                self.timeout,
            )
            .await?;
        let result: bool = response.deserialize().await?;
        Ok(result)
    }
}

fn header_from_config_format(config_format: ConfigFormat) -> HeaderMap {
    let mut header_map = HeaderMap::new();
    let content_type_value = format!("application/{}", config_format.as_str());
    header_map.insert(
        CONTENT_TYPE,
        HeaderValue::from_str(&content_type_value).expect("Content type should always be valid."),
    );
    header_map
}

#[cfg(test)]
mod test {

    use std::path::PathBuf;
    use std::str::FromStr;

    use http::StatusCode;
    use quickwit_config::{ConfigFormat, SourceConfig};
    use quickwit_indexing::mock_split;
    use quickwit_ingest::CommitType;
    use quickwit_metastore::IndexMetadata;
    use quickwit_serve::{
        ListSplitsQueryParams, ListSplitsResponse, RestIngestResponse, SearchRequestQueryString,
    };
    use reqwest::Url;
    use reqwest::header::CONTENT_TYPE;
    use serde_json::json;
    use tokio::fs::File;
    use tokio::io::AsyncReadExt;
    use wiremock::matchers::{
        body_bytes, body_json, header, method, path, query_param, query_param_is_missing,
    };
    use wiremock::{Mock, MockServer, ResponseTemplate};

    use crate::error::Error;
    use crate::models::{IngestSource, SearchResponseRestClient};
    use crate::rest_client::QuickwitClientBuilder;
    #[tokio::test]
    async fn test_client_no_server() {
        let port = quickwit_common::net::find_available_tcp_port().unwrap();
        let server_url = Url::parse(&format!("http://127.0.0.1:{port}")).unwrap();
        let qw_client = QuickwitClientBuilder::new(server_url).build();
        let error = qw_client.indexes().list().await.unwrap_err();
        assert!(matches!(error, Error::Middleware(_)));
        assert!(error.to_string().contains("tcp connect error"));
    }

    #[tokio::test]
    async fn test_search_endpoint() {
        let mock_server = MockServer::start().await;
        let server_url = Url::parse(&mock_server.uri()).unwrap();
        let qw_client = QuickwitClientBuilder::new(server_url).build();
        // Search
        let search_query_params = SearchRequestQueryString {
            ..Default::default()
        };
        let expected_search_response = SearchResponseRestClient {
            num_hits: 0,
            hits: Vec::new(),
            snippets: None,
            aggregations: None,
            elapsed_time_micros: 100,
            errors: Vec::new(),
        };
        Mock::given(method("POST"))
            .and(path("/api/v1/my-index/search"))
            .respond_with(ResponseTemplate::new(StatusCode::OK).set_body_json(
                json!({"num_hits": 0, "hits": [], "elapsed_time_micros": 100, "errors": []}),
            ))
            .up_to_n_times(1)
            .mount(&mock_server)
            .await;
        assert_eq!(
            qw_client
                .search("my-index", search_query_params)
                .await
                .unwrap(),
            expected_search_response
        );
    }

    fn get_ndjson_filepath(ndjson_dataset_filename: &str) -> String {
        format!(
            "{}/resources/tests/{}",
            env!("CARGO_MANIFEST_DIR"),
            ndjson_dataset_filename
        )
    }

    #[tokio::test]
    async fn test_ingest_endpoint() {
        let mock_server = MockServer::start().await;
        let server_url = Url::parse(&mock_server.uri()).unwrap();
        let qw_client = QuickwitClientBuilder::new(server_url).build();
        let ndjson_filepath = get_ndjson_filepath("documents_to_ingest.json");
        let mut buffer = Vec::new();
        File::open(&ndjson_filepath)
            .await
            .unwrap()
            .read_to_end(&mut buffer)
            .await
            .unwrap();
        Mock::given(method("POST"))
            .and(path("/api/v1/my-index/ingest"))
            .and(query_param_is_missing("commit"))
            .and(body_bytes(buffer.clone()))
            .respond_with(ResponseTemplate::new(StatusCode::TOO_MANY_REQUESTS))
            .up_to_n_times(2)
            .expect(2)
            .mount(&mock_server)
            .await;
        let mock_response = RestIngestResponse {
            num_docs_for_processing: 2,
            num_ingested_docs: Some(2),
            num_rejected_docs: Some(0),
            parse_failures: Some(Vec::new()),
        };
        Mock::given(method("POST"))
            .and(path("/api/v1/my-index/ingest"))
            .and(query_param_is_missing("commit"))
            .and(body_bytes(buffer))
            .respond_with(ResponseTemplate::new(StatusCode::OK).set_body_json(&mock_response))
            .up_to_n_times(1)
            .mount(&mock_server)
            .await;
        let ingest_source = IngestSource::File(PathBuf::from_str(&ndjson_filepath).unwrap());
        let actual_response = qw_client
            .ingest("my-index", ingest_source, None, None, CommitType::Auto)
            .await
            .unwrap();
        assert_eq!(actual_response, mock_response);
    }

    #[tokio::test]
    async fn test_ingest_endpoint_with_force_commit() {
        let mock_server = MockServer::start().await;
        let server_url = Url::parse(&mock_server.uri()).unwrap();
        let qw_client = QuickwitClientBuilder::new(server_url).build();
        let ndjson_filepath = get_ndjson_filepath("documents_to_ingest.json");
        let mut buffer = Vec::new();
        File::open(&ndjson_filepath)
            .await
            .unwrap()
            .read_to_end(&mut buffer)
            .await
            .unwrap();
        let mock_response = RestIngestResponse {
            num_docs_for_processing: 2,
            num_ingested_docs: Some(2),
            num_rejected_docs: Some(0),
            parse_failures: Some(Vec::new()),
        };
        Mock::given(method("POST"))
            .and(path("/api/v1/my-index/ingest"))
            .and(query_param("commit", "force"))
            .and(body_bytes(buffer))
            .respond_with(ResponseTemplate::new(StatusCode::OK).set_body_json(&mock_response))
            .up_to_n_times(1)
            .mount(&mock_server)
            .await;
        let ingest_source = IngestSource::File(PathBuf::from_str(&ndjson_filepath).unwrap());
        let actual_response = qw_client
            .ingest("my-index", ingest_source, None, None, CommitType::Force)
            .await
            .unwrap();
        assert_eq!(actual_response, mock_response);
    }

    #[tokio::test]
    async fn test_ingest_endpoint_with_wait_for_commit() {
        let mock_server = MockServer::start().await;
        let server_url = Url::parse(&mock_server.uri()).unwrap();
        let qw_client = QuickwitClientBuilder::new(server_url).build();
        let ndjson_filepath = get_ndjson_filepath("documents_to_ingest.json");
        let mut buffer = Vec::new();
        File::open(&ndjson_filepath)
            .await
            .unwrap()
            .read_to_end(&mut buffer)
            .await
            .unwrap();
        let mock_response = RestIngestResponse {
            num_docs_for_processing: 2,
            num_ingested_docs: Some(2),
            num_rejected_docs: Some(0),
            parse_failures: Some(Vec::new()),
        };
        Mock::given(method("POST"))
            .and(path("/api/v1/my-index/ingest"))
            .and(query_param("commit", "wait_for"))
            .and(body_bytes(buffer))
            .respond_with(ResponseTemplate::new(StatusCode::OK).set_body_json(&mock_response))
            .up_to_n_times(1)
            .mount(&mock_server)
            .await;
        let ingest_source = IngestSource::File(PathBuf::from_str(&ndjson_filepath).unwrap());
        let actual_response = qw_client
            .ingest("my-index", ingest_source, None, None, CommitType::WaitFor)
            .await
            .unwrap();
        assert_eq!(actual_response, mock_response);
    }

    #[tokio::test]
    async fn test_ingest_endpoint_should_return_api_error() {
        let mock_server = MockServer::start().await;
        let server_url = Url::parse(&mock_server.uri()).unwrap();
        let qw_client = QuickwitClientBuilder::new(server_url).build();
        let ndjson_filepath = get_ndjson_filepath("documents_to_ingest.json");
        let mut buffer = Vec::new();
        File::open(&ndjson_filepath)
            .await
            .unwrap()
            .read_to_end(&mut buffer)
            .await
            .unwrap();
        Mock::given(method("POST"))
            .and(path("/api/v1/my-index/ingest"))
            .and(body_bytes(buffer.clone()))
            .respond_with(
                ResponseTemplate::new(405).set_body_json(json!({"message": "internal error"})),
            )
            .up_to_n_times(1)
            .mount(&mock_server)
            .await;
        let ingest_source = IngestSource::File(PathBuf::from_str(&ndjson_filepath).unwrap());
        let error = qw_client
            .ingest(
                "my-index",
                ingest_source,
                Some(4096),
                None,
                CommitType::Auto,
            )
            .await
            .unwrap_err();
        assert!(matches!(error, Error::Api(_)));
        assert!(error.to_string().contains("internal error"));
    }

    #[tokio::test]
    async fn test_indexes_endpoints() {
        let mock_server = MockServer::start().await;
        let server_url = Url::parse(&mock_server.uri()).unwrap();
        let qw_client = QuickwitClientBuilder::new(server_url).build();
        let index_metadata = IndexMetadata::for_test("test-index", "ram:///indexes/test-index");
        // GET indexes
        Mock::given(method("GET"))
            .and(path("/api/v1/indexes"))
            .respond_with(
                ResponseTemplate::new(StatusCode::OK).set_body_json(vec![index_metadata.clone()]),
            )
            .up_to_n_times(1)
            .mount(&mock_server)
            .await;
        assert_eq!(
            qw_client.indexes().list().await.unwrap(),
            vec![index_metadata.clone()]
        );

        // POST create index
        let index_config_to_create = index_metadata.index_config.clone();
        Mock::given(method("POST"))
            .and(path("/api/v1/indexes"))
            .and(body_json(index_config_to_create.clone()))
            .respond_with(
                ResponseTemplate::new(StatusCode::OK).set_body_json(index_metadata.clone()),
            )
            .up_to_n_times(1)
            .mount(&mock_server)
            .await;
        let post_body = serde_json::to_string(&index_config_to_create).unwrap();
        assert_eq!(
            qw_client
                .indexes()
                .create(post_body, ConfigFormat::Json, false)
                .await
                .unwrap(),
            index_metadata
        );

        // POST create index with yaml
        Mock::given(method("POST"))
            .and(path("/api/v1/indexes"))
            .and(header(CONTENT_TYPE.as_str(), "application/yaml"))
            .respond_with(
                ResponseTemplate::new(StatusCode::OK).set_body_json(index_metadata.clone()),
            )
            .up_to_n_times(1)
            .mount(&mock_server)
            .await;
        assert_eq!(
            qw_client
                .indexes()
                .create("", ConfigFormat::Yaml, false)
                .await
                .unwrap(),
            index_metadata
        );

        // PUT clear index
        Mock::given(method("PUT"))
            .and(path("/api/v1/indexes/my-index/clear"))
            .respond_with(ResponseTemplate::new(StatusCode::OK))
            .up_to_n_times(1)
            .mount(&mock_server)
            .await;
        qw_client.indexes().clear("my-index").await.unwrap();

        // PUT clear index returns an error
        Mock::given(method("PUT"))
            .and(path("/api/v1/indexes/my-index/clear"))
            .respond_with(ResponseTemplate::new(StatusCode::BAD_REQUEST))
            .up_to_n_times(1)
            .mount(&mock_server)
            .await;
        qw_client.indexes().clear("my-index").await.unwrap_err();

        // DELETE index
        Mock::given(method("DELETE"))
            .and(path("/api/v1/indexes/my-index"))
            .and(query_param("dry_run", "true"))
            .respond_with(ResponseTemplate::new(StatusCode::OK).set_body_json(json!([{
                "split_id": "my-split",
                "num_docs": 1,
                "uncompressed_docs_size_bytes": 1024,
                "file_name": "my-split.split",
                "file_size_bytes": 128,
            }])))
            .up_to_n_times(1)
            .mount(&mock_server)
            .await;
        qw_client.indexes().delete("my-index", true).await.unwrap();

        // DELETE index returns an error
        Mock::given(method("DELETE"))
            .and(path("/api/v1/indexes/my-index"))
            .respond_with(ResponseTemplate::new(StatusCode::UNSUPPORTED_MEDIA_TYPE))
            .up_to_n_times(1)
            .mount(&mock_server)
            .await;
        qw_client
            .indexes()
            .delete("my-index", true)
            .await
            .unwrap_err();
    }

    #[tokio::test]
    async fn test_splits_endpoints() {
        let mock_server = MockServer::start().await;
        let server_url = Url::parse(&mock_server.uri()).unwrap();
        let qw_client = QuickwitClientBuilder::new(server_url).build();
        let split = mock_split("split-1");
        // GET splits
        let list_splits_params = ListSplitsQueryParams {
            start_timestamp: Some(1),
            ..Default::default()
        };
        let response = ListSplitsResponse {
            offset: 0,
            size: 1,
            splits: vec![split.clone()],
        };
        Mock::given(method("GET"))
            .and(path("/api/v1/indexes/my-index/splits"))
            .and(query_param("start_timestamp", "1"))
            .respond_with(ResponseTemplate::new(StatusCode::OK).set_body_json(response))
            .up_to_n_times(1)
            .mount(&mock_server)
            .await;
        assert_eq!(
            qw_client
                .splits("my-index")
                .list(list_splits_params)
                .await
                .unwrap(),
            vec![split.clone()]
        );

        // Mark for deletion
        Mock::given(method("PUT"))
            .and(path("/api/v1/indexes/my-index/splits/mark-for-deletion"))
            .respond_with(
                ResponseTemplate::new(StatusCode::OK)
                    .set_body_json(json!({"split_ids": ["split-1"]})),
            )
            .up_to_n_times(1)
            .mount(&mock_server)
            .await;
        qw_client
            .splits("my-index")
            .mark_for_deletion(vec!["split-1".to_string()])
            .await
            .unwrap();

        // Mark for deletion returns an error
        Mock::given(method("PUT"))
            .and(path("/api/v1/indexes/my-index/splits/mark-for-deletion"))
            .respond_with(ResponseTemplate::new(StatusCode::METHOD_NOT_ALLOWED))
            .up_to_n_times(1)
            .mount(&mock_server)
            .await;
        qw_client
            .splits("my-index")
            .mark_for_deletion(vec!["split-1".to_string()])
            .await
            .unwrap_err();
    }

    #[tokio::test]
    async fn test_sources_endpoints() {
        let mock_server = MockServer::start().await;
        let server_url = Url::parse(&mock_server.uri()).unwrap();
        let qw_client = QuickwitClientBuilder::new(server_url).build();
        let source_config = SourceConfig::ingest_api_default();
        // POST create source with toml
        Mock::given(method("POST"))
            .and(path("/api/v1/indexes/my-index/sources"))
            .and(header(CONTENT_TYPE.as_str(), "application/toml"))
            .respond_with(
                ResponseTemplate::new(StatusCode::OK).set_body_json(source_config.clone()),
            )
            .up_to_n_times(1)
            .mount(&mock_server)
            .await;
        assert_eq!(
            qw_client
                .sources("my-index")
                .create("", ConfigFormat::Toml)
                .await
                .unwrap(),
            source_config
        );

        // PUT update source with yaml
        Mock::given(method("PUT"))
            .and(path("/api/v1/indexes/my-index/sources/my-source-1"))
            .and(header(CONTENT_TYPE.as_str(), "application/yaml"))
            .respond_with(
                ResponseTemplate::new(StatusCode::OK).set_body_json(source_config.clone()),
            )
            .up_to_n_times(1)
            .mount(&mock_server)
            .await;
        assert_eq!(
            qw_client
                .sources("my-index")
                .update("my-source-1", "", ConfigFormat::Yaml, false)
                .await
                .unwrap(),
            source_config
        );

        // GET sources
        Mock::given(method("GET"))
            .and(path("/api/v1/indexes/my-index/sources"))
            .respond_with(
                ResponseTemplate::new(StatusCode::OK).set_body_json(vec![source_config.clone()]),
            )
            .up_to_n_times(1)
            .mount(&mock_server)
            .await;
        assert_eq!(
            qw_client.sources("my-index").list().await.unwrap(),
            vec![source_config.clone()]
        );

        // Toggle source
        Mock::given(method("PUT"))
            .and(path("/api/v1/indexes/my-index/sources/my-source-1/toggle"))
            .respond_with(
                ResponseTemplate::new(StatusCode::OK).set_body_json(json!({"enable": true})),
            )
            .up_to_n_times(1)
            .mount(&mock_server)
            .await;
        qw_client
            .sources("my-index")
            .toggle("my-source-1", true)
            .await
            .unwrap();

        // Toggle source returns an error
        Mock::given(method("PUT"))
            .and(path("/api/v1/indexes/my-index/sources/my-source-2/toggle"))
            .respond_with(ResponseTemplate::new(StatusCode::BAD_REQUEST))
            .up_to_n_times(1)
            .mount(&mock_server)
            .await;
        qw_client
            .sources("my-index")
            .toggle("my-source-2", true)
            .await
            .unwrap_err();

        // PUT reset checkpoint
        Mock::given(method("PUT"))
            .and(path(
                "/api/v1/indexes/my-index/sources/my-source/reset-checkpoint",
            ))
            .respond_with(ResponseTemplate::new(StatusCode::OK))
            .up_to_n_times(1)
            .mount(&mock_server)
            .await;
        qw_client
            .sources("my-index")
            .reset_checkpoint("my-source")
            .await
            .unwrap();

        // PUT reset checkpoint returns an error
        Mock::given(method("PUT"))
            .and(path(
                "/api/v1/indexes/my-index/sources/my-source/reset-checkpoint",
            ))
            .respond_with(ResponseTemplate::new(StatusCode::BAD_GATEWAY))
            .up_to_n_times(1)
            .mount(&mock_server)
            .await;
        qw_client
            .sources("my-index")
            .reset_checkpoint("my-source")
            .await
            .unwrap_err();

        // DELETE source
        Mock::given(method("DELETE"))
            .and(path("/api/v1/indexes/my-index/sources/my-source"))
            .respond_with(ResponseTemplate::new(StatusCode::OK))
            .up_to_n_times(1)
            .mount(&mock_server)
            .await;
        qw_client
            .sources("my-index")
            .delete("my-source")
            .await
            .unwrap();

        // DELETE source returns an error
        Mock::given(method("DELETE"))
            .and(path("/api/v1/indexes/my-index/sources/my-source"))
            .respond_with(ResponseTemplate::new(StatusCode::BAD_GATEWAY))
            .up_to_n_times(1)
            .mount(&mock_server)
            .await;
        qw_client
            .sources("my-index")
            .delete("my-source")
            .await
            .unwrap_err();
    }

    #[tokio::test]
    async fn test_health_endpoints() {
        let mock_server = MockServer::start().await;
        let server_url = Url::parse(&mock_server.uri()).unwrap();
        let qw_client = QuickwitClientBuilder::new(server_url).build();

        assert!(qw_client.node_health().is_live().await.is_err());
        assert!(qw_client.node_health().is_ready().await.is_err());

        // GET /health/livez
        Mock::given(method("GET"))
            .and(path("/health/livez"))
            .respond_with(ResponseTemplate::new(StatusCode::OK).set_body_json(true))
            .expect(1)
            .mount(&mock_server)
            .await;
        assert!(qw_client.node_health().is_live().await.unwrap());

        // GET /health/readyz
        Mock::given(method("GET"))
            .and(path("/health/readyz"))
            .respond_with(ResponseTemplate::new(StatusCode::OK).set_body_json(true))
            .expect(1)
            .mount(&mock_server)
            .await;
        assert!(qw_client.node_health().is_ready().await.unwrap());
    }
}


================================================
FILE: quickwit/quickwit-search/Cargo.toml
================================================
[package]
name = "quickwit-search"
description = "Distributed search"

version.workspace = true
edition.workspace = true
homepage.workspace = true
documentation.workspace = true
repository.workspace = true
authors.workspace = true
license.workspace = true

[dependencies]
anyhow = { workspace = true }
async-trait = { workspace = true }
base64 = { workspace = true }
bytes = { workspace = true }
bytesize = { workspace = true }
fnv = { workspace = true }
futures = { workspace = true }
http = { workspace = true }
itertools = { workspace = true }
mockall = { workspace = true }
once_cell = { workspace = true }
pin-project = { workspace = true }
postcard = { workspace = true }
prost = { workspace = true }
serde = { workspace = true }
serde_json = { workspace = true }
tantivy = { workspace = true }
tantivy-fst = { workspace = true }
thiserror = { workspace = true }
tokio = { workspace = true }
tower = { workspace = true, features = ["timeout"] }
tracing = { workspace = true }
ttl_cache = { workspace = true }
ulid = { workspace = true }
utoipa = { workspace = true }

quickwit-common = { workspace = true }
quickwit-config = { workspace = true }
quickwit-directories = { workspace = true }
quickwit-doc-mapper = { workspace = true }
quickwit-metastore = { workspace = true }
quickwit-proto = { workspace = true }
quickwit-query = { workspace = true }
quickwit-storage = { workspace = true }

[dev-dependencies]
assert-json-diff = { workspace = true }
proptest = { workspace = true }
rand = { workspace = true }
serde_json = { workspace = true }

quickwit-indexing = { workspace = true, features = ["testsuite"] }
quickwit-metastore = { workspace = true, features = ["testsuite"] }
quickwit-proto = { workspace = true, features = ["testsuite"] }
quickwit-storage = { workspace = true, features = ["testsuite"] }

[features]
testsuite = []
ci-test = []


================================================
FILE: quickwit/quickwit-search/README.md
================================================
# Quickwit-search

This project implements quickwit's search API.

# Architecture

Quickwit relies on a pool of stateless search servers.
All search-servers are identical and are meant to be queried using a simple load balancer.

The server which receives the query acts as the *root* server for the time of the query.

The *root* role is to coordinate the work of the *leaf* servers:
- it interprets the user query
- queries the meta store to identify the list of relevant index splits
- dispatch the work to the leaf
- gathers and merge the leaf results.

The *leaf* servers are in charge of performing the actual search task on their
assigned subset of index splits.

A search request on one split typically works in phases
- downloading the hotcache and opening the directory
- download all of the data of required for the query phase on the split
- performing the query_search_phase
- if required, performing the fetch_docs_phase.


================================================
FILE: quickwit/quickwit-search/src/client.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::fmt;
use std::net::SocketAddr;
use std::sync::Arc;
use std::time::Duration;

use bytesize::ByteSize;
use http::Uri;
use quickwit_proto::search::{GetKvRequest, PutKvRequest, ReportSplitsRequest};
use quickwit_proto::tonic::Request;
use quickwit_proto::tonic::codegen::InterceptedService;
use quickwit_proto::tonic::transport::{Channel, Endpoint};
use quickwit_proto::{SpanContextInterceptor, tonic};
use tower::timeout::Timeout;
use tracing::warn;

use crate::SearchService;
use crate::error::parse_grpc_error;

/// Impl is an enumeration that meant to manage Quickwit's search service client types.
#[derive(Clone)]
enum SearchServiceClientImpl {
    Local(Arc<dyn SearchService>),
    Grpc(
        quickwit_proto::search::search_service_client::SearchServiceClient<
            InterceptedService<Timeout<Channel>, SpanContextInterceptor>,
        >,
    ),
}

/// A search service client.
/// It contains the client implementation and the gRPC address of the node to which the client
/// connects.
#[derive(Clone)]
pub struct SearchServiceClient {
    client_impl: SearchServiceClientImpl,
    grpc_addr: SocketAddr,
}

impl fmt::Debug for SearchServiceClient {
    fn fmt(&self, formatter: &mut fmt::Formatter) -> fmt::Result {
        match &self.client_impl {
            SearchServiceClientImpl::Local(_service) => {
                write!(formatter, "Local({:?})", self.grpc_addr)
            }
            SearchServiceClientImpl::Grpc(_grpc_client) => {
                write!(formatter, "Grpc({:?})", self.grpc_addr)
            }
        }
    }
}

impl SearchServiceClient {
    /// Create a search service client instance given a gRPC client and gRPC address.
    pub fn from_grpc_client(
        client: quickwit_proto::search::search_service_client::SearchServiceClient<
            InterceptedService<Timeout<Channel>, SpanContextInterceptor>,
        >,
        grpc_addr: SocketAddr,
    ) -> Self {
        SearchServiceClient {
            client_impl: SearchServiceClientImpl::Grpc(client),
            grpc_addr,
        }
    }

    /// Create a search service client instance given a search service and gRPC address.
    pub fn from_service(service: Arc<dyn SearchService>, grpc_addr: SocketAddr) -> Self {
        SearchServiceClient {
            client_impl: SearchServiceClientImpl::Local(service),
            grpc_addr,
        }
    }

    /// Return the grpc_addr the underlying client connects to.
    pub fn grpc_addr(&self) -> SocketAddr {
        self.grpc_addr
    }

    /// Returns whether the underlying client is local or remote.
    #[cfg(any(test, feature = "testsuite"))]
    pub fn is_local(&self) -> bool {
        matches!(self.client_impl, SearchServiceClientImpl::Local(_))
    }

    /// Perform root search.
    pub async fn root_search(
        &mut self,
        request: quickwit_proto::search::SearchRequest,
    ) -> crate::Result<quickwit_proto::search::SearchResponse> {
        match &mut self.client_impl {
            SearchServiceClientImpl::Grpc(grpc_client) => grpc_client
                .root_search(request)
                .await
                .map(|tonic_response| tonic_response.into_inner())
                .map_err(|tonic_error| parse_grpc_error(&tonic_error)),
            SearchServiceClientImpl::Local(service) => service.root_search(request).await,
        }
    }

    /// Perform leaf search.
    pub async fn leaf_search(
        &mut self,
        request: quickwit_proto::search::LeafSearchRequest,
    ) -> crate::Result<quickwit_proto::search::LeafSearchResponse> {
        match &mut self.client_impl {
            SearchServiceClientImpl::Grpc(grpc_client) => grpc_client
                .leaf_search(request)
                .await
                .map(|tonic_response| tonic_response.into_inner())
                .map_err(|tonic_error| parse_grpc_error(&tonic_error)),
            SearchServiceClientImpl::Local(service) => service.leaf_search(request).await,
        }
    }

    /// Perform leaf search.
    pub async fn leaf_list_fields(
        &mut self,
        request: quickwit_proto::search::LeafListFieldsRequest,
    ) -> crate::Result<quickwit_proto::search::ListFieldsResponse> {
        match &mut self.client_impl {
            SearchServiceClientImpl::Grpc(grpc_client) => {
                let tonic_request = Request::new(request);
                let tonic_response = grpc_client
                    .leaf_list_fields(tonic_request)
                    .await
                    .map_err(|tonic_error| parse_grpc_error(&tonic_error))?;
                Ok(tonic_response.into_inner())
            }
            SearchServiceClientImpl::Local(service) => service.leaf_list_fields(request).await,
        }
    }

    /// Perform fetch docs.
    pub async fn fetch_docs(
        &mut self,
        request: quickwit_proto::search::FetchDocsRequest,
    ) -> crate::Result<quickwit_proto::search::FetchDocsResponse> {
        match &mut self.client_impl {
            SearchServiceClientImpl::Grpc(grpc_client) => {
                let tonic_request = Request::new(request);
                let tonic_response = grpc_client
                    .fetch_docs(tonic_request)
                    .await
                    .map_err(|tonic_error| parse_grpc_error(&tonic_error))?;
                Ok(tonic_response.into_inner())
            }
            SearchServiceClientImpl::Local(service) => service.fetch_docs(request).await,
        }
    }

    /// Perform leaf list terms.
    pub async fn leaf_list_terms(
        &mut self,
        request: quickwit_proto::search::LeafListTermsRequest,
    ) -> crate::Result<quickwit_proto::search::LeafListTermsResponse> {
        match &mut self.client_impl {
            SearchServiceClientImpl::Grpc(grpc_client) => {
                let tonic_request = Request::new(request);
                let tonic_response = grpc_client
                    .leaf_list_terms(tonic_request)
                    .await
                    .map_err(|tonic_error| parse_grpc_error(&tonic_error))?;
                Ok(tonic_response.into_inner())
            }
            SearchServiceClientImpl::Local(service) => service.leaf_list_terms(request).await,
        }
    }

    /// Gets the value associated to a key stored locally in the targeted node.
    /// This call is not "distributed".
    /// If the key is not present on the targeted search `None` is simply returned.
    pub async fn get_kv(&mut self, get_kv_req: GetKvRequest) -> crate::Result<Option<Vec<u8>>> {
        match &mut self.client_impl {
            SearchServiceClientImpl::Local(service) => {
                let search_after_context_opt = service.get_kv(get_kv_req).await;
                Ok(search_after_context_opt)
            }
            SearchServiceClientImpl::Grpc(grpc_client) => {
                let grpc_resp: tonic::Response<quickwit_proto::search::GetKvResponse> = grpc_client
                    .get_kv(get_kv_req)
                    .await
                    .map_err(|tonic_error| parse_grpc_error(&tonic_error))?;
                let get_search_after_context_resp = grpc_resp.into_inner();
                Ok(get_search_after_context_resp.payload)
            }
        }
    }

    /// Gets the value associated to a key stored locally in the targeted node.
    /// This call is not "distributed". It is up to the client to put the K,V pair
    /// on several nodes.
    pub async fn put_kv(&mut self, put_kv_req: PutKvRequest) -> crate::Result<()> {
        match &mut self.client_impl {
            SearchServiceClientImpl::Local(service) => {
                service.put_kv(put_kv_req).await;
            }
            SearchServiceClientImpl::Grpc(grpc_client) => {
                grpc_client
                    .put_kv(put_kv_req)
                    .await
                    .map_err(|tonic_error| parse_grpc_error(&tonic_error))?;
            }
        }
        Ok(())
    }

    /// Indexers call report_splits to inform searchers node about the presence of a split, which
    /// would then be considered as a candidate for the searcher split cache.
    pub async fn report_splits(&mut self, report_splits_request: ReportSplitsRequest) {
        match &mut self.client_impl {
            SearchServiceClientImpl::Local(service) => {
                let _ = service.report_splits(report_splits_request).await;
            }
            SearchServiceClientImpl::Grpc(search_client) => {
                // Ignoring any error.
                if search_client
                    .report_splits(report_splits_request)
                    .await
                    .is_err()
                {
                    warn!(
                        "Failed to report splits. This is not critical as this message is only \
                         used to identify caching opportunities."
                    );
                }
            }
        }
    }
}

/// Creates a [`SearchServiceClient`] from a socket address.
/// The underlying channel connects lazily and is set up to time out after 5 seconds. It reconnects
/// automatically should the connection be dropped.
pub fn create_search_client_from_grpc_addr(
    grpc_addr: SocketAddr,
    max_message_size: ByteSize,
) -> SearchServiceClient {
    let uri = Uri::builder()
        .scheme("http")
        .authority(grpc_addr.to_string().as_str())
        .path_and_query("/")
        .build()
        .expect("The URI should be well-formed.");
    let channel = Endpoint::from(uri).connect_lazy();
    let timeout_channel = Timeout::new(channel, Duration::from_secs(5));
    create_search_client_from_channel(grpc_addr, timeout_channel, max_message_size)
}

/// Creates a [`SearchServiceClient`] from a pre-established connection (channel).
pub fn create_search_client_from_channel(
    grpc_addr: SocketAddr,
    channel: Timeout<Channel>,
    max_message_size: ByteSize,
) -> SearchServiceClient {
    let client =
        quickwit_proto::search::search_service_client::SearchServiceClient::with_interceptor(
            channel,
            SpanContextInterceptor,
        )
        .max_decoding_message_size(max_message_size.0 as usize)
        .max_encoding_message_size(max_message_size.0 as usize);
    SearchServiceClient::from_grpc_client(client, grpc_addr)
}


================================================
FILE: quickwit/quickwit-search/src/cluster_client.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::time::Duration;

use base64::Engine;
use futures::future::ready;
use futures::{Future, StreamExt};
use quickwit_proto::search::{
    FetchDocsRequest, FetchDocsResponse, GetKvRequest, LeafListFieldsRequest, LeafListTermsRequest,
    LeafListTermsResponse, LeafSearchRequest, LeafSearchResponse, ListFieldsResponse, PutKvRequest,
};
use tantivy::aggregation::intermediate_agg_result::IntermediateAggregationResults;
use tracing::{debug, error, info, warn};

use crate::retry::search::LeafSearchRetryPolicy;
use crate::retry::{DefaultRetryPolicy, RetryPolicy, retry_client};
use crate::{SearchJobPlacer, SearchServiceClient, merge_resource_stats_it};

/// Maximum number of put requests emitted to perform a replicated given PUT KV.
const MAX_PUT_KV_ATTEMPTS: usize = 6;

/// Maximum number of get requests emitted to perform a GET KV request.
const MAX_GET_KV_ATTEMPTS: usize = 6;

/// We attempt to store our KVs on two nodes.
const TARGET_NUM_REPLICATION: usize = 2;

/// Client that executes placed requests (Request, `SearchServiceClient`) and
/// provides retry policies for `FetchDocsRequest` and `LeafSearchRequest` to
/// retry on other `SearchServiceClient`.
#[derive(Clone)]
pub struct ClusterClient {
    pub(crate) search_job_placer: SearchJobPlacer,
}

impl ClusterClient {
    /// Instantiates [`ClusterClient`].
    pub fn new(search_job_placer: SearchJobPlacer) -> Self {
        Self { search_job_placer }
    }

    /// Fetches docs with retry on another node client.
    pub async fn fetch_docs(
        &self,
        request: FetchDocsRequest,
        mut client: SearchServiceClient,
    ) -> crate::Result<FetchDocsResponse> {
        let mut response_res = client.fetch_docs(request.clone()).await;
        let retry_policy = DefaultRetryPolicy {};
        if let Some(retry_request) = retry_policy.retry_request(request, &response_res) {
            assert!(!retry_request.split_offsets.is_empty());
            client = retry_client(
                &self.search_job_placer,
                client.grpc_addr(),
                &retry_request.split_offsets[0].split_id,
            )
            .await?;
            debug!(
                "Fetch docs response error: `{:?}`. Retry once to execute {:?} with {:?}",
                response_res, retry_request, client
            );
            response_res = client.fetch_docs(retry_request).await;
        }
        response_res
    }

    /// Leaf search with retry on another node client.
    pub async fn leaf_search(
        &self,
        request: LeafSearchRequest,
        mut client: SearchServiceClient,
    ) -> crate::Result<LeafSearchResponse> {
        let mut response_res = client.leaf_search(request.clone()).await;
        let retry_policy = LeafSearchRetryPolicy {};
        // We retry only once.
        let Some(retry_request) = retry_policy.retry_request(request, &response_res) else {
            return response_res;
        };
        let Some(first_split) = retry_request
            .leaf_requests
            .iter()
            .flat_map(|leaf_req| leaf_req.split_offsets.iter())
            .next()
        else {
            warn!(
                "the retry request did not contain any split to retry. this should never happen, \
                 please report"
            );
            return response_res;
        };
        // There could be more than one split in the retry request. We pick a single client
        // arbitrarily only considering the affinity of the first split.
        client = retry_client(
            &self.search_job_placer,
            client.grpc_addr(),
            &first_split.split_id,
        )
        .await?;
        debug!(
            "Leaf search response error: `{:?}`. Retry once to execute {:?} with {:?}",
            response_res, retry_request, client
        );
        let retry_result = client.leaf_search(retry_request).await;
        response_res = merge_original_with_retry_leaf_search_results(response_res, retry_result);
        response_res
    }

    /// Leaf search with retry on another node client.
    pub async fn leaf_list_fields(
        &self,
        request: LeafListFieldsRequest,
        mut client: SearchServiceClient,
    ) -> crate::Result<ListFieldsResponse> {
        client.leaf_list_fields(request.clone()).await
    }

    /// Leaf search with retry on another node client.
    pub async fn leaf_list_terms(
        &self,
        request: LeafListTermsRequest,
        mut client: SearchServiceClient,
    ) -> crate::Result<LeafListTermsResponse> {
        // TODO: implement retry
        client.leaf_list_terms(request.clone()).await
    }

    /// Attempts to store a given key value pair within the cluster.
    ///
    /// Tries to replicate the pair to [`TARGET_NUM_REPLICATION`] nodes, but this function may fail
    /// silently (e.g if no client was available). Even in case of success, this storage is not
    /// persistent. For instance during a rolling upgrade, all replicas will be lost as there is no
    /// mechanism to maintain the replication count.
    pub async fn put_kv(&self, key: &[u8], payload: &[u8], ttl: Duration) {
        let clients: Vec<SearchServiceClient> = self
            .search_job_placer
            .best_nodes_per_affinity(key)
            .await
            .take(MAX_PUT_KV_ATTEMPTS)
            .collect();

        if clients.is_empty() {
            // We only log a warning as it might be that we are just running in a
            // single node cluster.
            // (That's odd though, the node running this code should be in the pool too)
            warn!("no other node available to replicate scroll context");
            return;
        }

        // We run the put requests concurrently.
        // Our target is a replication over TARGET_NUM_REPLICATION nodes, we therefore try to avoid
        // replicating on more than TARGET_NUM_REPLICATION nodes at the same time. Of
        // course, this may still result in the replication over more nodes, but this is not
        // a problem.
        //
        // The requests are made in a concurrent manner, up to TARGET_NUM_REPLICATION at a time. As
        // soon as TARGET_NUM_REPLICATION requests are successful, we stop.
        let put_kv_futs = clients
            .into_iter()
            .map(|client| replicate_kv_to_one_server(client, key, payload, ttl));
        let successful_replication = futures::stream::iter(put_kv_futs)
            .buffer_unordered(TARGET_NUM_REPLICATION)
            .filter(|put_kv_successful| ready(*put_kv_successful))
            .take(TARGET_NUM_REPLICATION)
            .count()
            .await;

        if successful_replication == 0 {
            error!(successful_replication=%successful_replication,"failed-to-replicate-scroll-context");
        }
    }

    /// Returns a search_after context
    pub async fn get_kv(&self, key: &[u8]) -> Option<Vec<u8>> {
        let clients = self.search_job_placer.best_nodes_per_affinity(key).await;
        // On the read side, we attempt to contact up to 6 nodes.
        for mut client in clients.take(MAX_GET_KV_ATTEMPTS) {
            let get_request = GetKvRequest { key: key.to_vec() };
            if let Ok(Some(search_after_resp)) = client.get_kv(get_request.clone()).await {
                return Some(search_after_resp);
            } else {
                let base64_key: String = base64::prelude::BASE64_STANDARD.encode(key);
                info!(destination=?client, key=base64_key, "Failed to get KV");
            }
        }
        None
    }
}

fn replicate_kv_to_one_server(
    mut client: SearchServiceClient,
    key: &[u8],
    payload: &[u8],
    ttl: Duration,
) -> impl Future<Output = bool> {
    let put_kv_request = PutKvRequest {
        key: key.to_vec(),
        payload: payload.to_vec(),
        ttl_secs: ttl.as_secs() as u32,
    };
    let base64_key: String = base64::prelude::BASE64_STANDARD.encode(key);
    async move {
        if client.put_kv(put_kv_request).await.is_ok() {
            true
        } else {
            warn!(destination=?client, key=base64_key, "Failed to replicate KV");
            false
        }
    }
}

/// Takes two intermediate aggregation results serialized using postcard,
/// merge them and returns the merged serialized result.
fn merge_intermediate_aggregation(left: &[u8], right: &[u8]) -> crate::Result<Vec<u8>> {
    let mut intermediate_aggregation_results_left: IntermediateAggregationResults =
        postcard::from_bytes(left)?;
    let intermediate_aggregation_results_right: IntermediateAggregationResults =
        postcard::from_bytes(right)?;
    intermediate_aggregation_results_left.merge_fruits(intermediate_aggregation_results_right)?;
    let serialized = postcard::to_allocvec(&intermediate_aggregation_results_left)?;
    Ok(serialized)
}

/// Merge two leaf search response.
///
/// # Quirk
///
/// This is implemented for a retries.
/// For instance, the set of attempted splits of right is supposed to be the set of failed
/// list of the left one, so that the list of the overal failed splits is the list of splits on the
/// `right_response`.
fn merge_original_with_retry_leaf_search_response(
    mut original_response: LeafSearchResponse,
    retry_response: LeafSearchResponse,
) -> crate::Result<LeafSearchResponse> {
    original_response
        .partial_hits
        .extend(retry_response.partial_hits);
    let intermediate_aggregation_result: Option<Vec<u8>> = match (
        original_response.intermediate_aggregation_result,
        retry_response.intermediate_aggregation_result,
    ) {
        (Some(left_agg_bytes), Some(right_agg_bytes)) => {
            let intermediate_aggregation_bytes: Vec<u8> =
                merge_intermediate_aggregation(&left_agg_bytes[..], &right_agg_bytes[..])?;
            Some(intermediate_aggregation_bytes)
        }
        (None, Some(right)) => Some(right),
        (Some(left), None) => Some(left),
        (None, None) => None,
    };
    let resource_stats = merge_resource_stats_it([
        &original_response.resource_stats,
        &retry_response.resource_stats,
    ]);
    Ok(LeafSearchResponse {
        intermediate_aggregation_result,
        num_hits: original_response.num_hits + retry_response.num_hits,
        num_attempted_splits: original_response.num_attempted_splits
            + retry_response.num_attempted_splits,
        failed_splits: retry_response.failed_splits,
        partial_hits: original_response.partial_hits,
        num_successful_splits: original_response.num_successful_splits
            + retry_response.num_successful_splits,
        resource_stats,
    })
}

// Merge initial leaf search results with results obtained from a retry.
fn merge_original_with_retry_leaf_search_results(
    left_search_response_result: crate::Result<LeafSearchResponse>,
    right_search_response_result: crate::Result<LeafSearchResponse>,
) -> crate::Result<LeafSearchResponse> {
    match (left_search_response_result, right_search_response_result) {
        (Ok(left_response), Ok(right_response)) => {
            merge_original_with_retry_leaf_search_response(left_response, right_response)
        }
        (Ok(single_valid_response), Err(_)) => Ok(single_valid_response),
        (Err(_), Ok(single_valid_response)) => Ok(single_valid_response),
        (Err(error), Err(_)) => Err(error),
    }
}

#[cfg(test)]
mod tests {
    use std::collections::HashSet;
    use std::net::SocketAddr;

    use quickwit_proto::search::{
        LeafRequestRef, PartialHit, SearchRequest, SortValue, SplitIdAndFooterOffsets,
        SplitSearchError,
    };
    use quickwit_query::query_ast::qast_json_helper;

    use super::*;
    use crate::root::SearchJob;
    use crate::{MockSearchService, SearchError, searcher_pool_for_test};

    fn mock_partial_hit(split_id: &str, sort_value: u64, doc_id: u32) -> PartialHit {
        PartialHit {
            sort_value: Some(SortValue::U64(sort_value).into()),
            sort_value2: None,
            split_id: split_id.to_string(),
            segment_ord: 1,
            doc_id,
        }
    }

    fn mock_doc_request(split_id: &str) -> FetchDocsRequest {
        FetchDocsRequest {
            partial_hits: Vec::new(),
            index_uri: "uri".to_string(),
            split_offsets: vec![SplitIdAndFooterOffsets {
                split_id: split_id.to_string(),
                split_footer_end: 100,
                split_footer_start: 0,
                timestamp_start: None,
                timestamp_end: None,
                num_docs: 0,
            }],
            ..Default::default()
        }
    }

    fn mock_leaf_search_request() -> LeafSearchRequest {
        let search_request = SearchRequest {
            index_id_patterns: vec!["test-idx".to_string()],
            query_ast: qast_json_helper("test", &["body"]),
            max_hits: 10,
            ..Default::default()
        };
        LeafSearchRequest {
            search_request: Some(search_request),
            doc_mappers: vec!["doc_mapper".to_string()],
            index_uris: vec!["uri".to_string()],
            leaf_requests: vec![LeafRequestRef {
                index_uri_ord: 0,
                doc_mapper_ord: 0,
                split_offsets: vec![
                    SplitIdAndFooterOffsets {
                        split_id: "split_1".to_string(),
                        split_footer_start: 0,
                        split_footer_end: 100,
                        timestamp_start: None,
                        timestamp_end: None,
                        num_docs: 0,
                    },
                    SplitIdAndFooterOffsets {
                        split_id: "split_2".to_string(),
                        split_footer_start: 0,
                        split_footer_end: 100,
                        timestamp_start: None,
                        timestamp_end: None,
                        num_docs: 0,
                    },
                ],
            }],
        }
    }

    #[tokio::test]
    async fn test_cluster_client_fetch_docs_no_retry() {
        let request = mock_doc_request("split_1");
        let mut mock_search_service = MockSearchService::new();
        mock_search_service.expect_fetch_docs().return_once(
            |_: quickwit_proto::search::FetchDocsRequest| {
                Ok(quickwit_proto::search::FetchDocsResponse { hits: Vec::new() })
            },
        );
        let searcher_pool = searcher_pool_for_test([("127.0.0.1:1001", mock_search_service)]);
        let search_job_placer = SearchJobPlacer::new(searcher_pool);
        let first_client = search_job_placer
            .assign_job(SearchJob::for_test("split_1", 0), &HashSet::new())
            .await
            .unwrap();
        let cluster_client = ClusterClient::new(search_job_placer);
        let fetch_docs_response = cluster_client
            .fetch_docs(request, first_client)
            .await
            .unwrap();
        assert_eq!(fetch_docs_response.hits.len(), 0);
    }

    #[tokio::test]
    async fn test_cluster_client_fetch_docs_retry_with_final_success() {
        let request = mock_doc_request("split_1");
        let mut mock_search_service_1 = MockSearchService::new();
        mock_search_service_1.expect_fetch_docs().return_once(
            |_: quickwit_proto::search::FetchDocsRequest| {
                Err(SearchError::Internal("error".to_string()))
            },
        );
        let mut mock_search_service_2 = MockSearchService::new();
        mock_search_service_2.expect_fetch_docs().return_once(
            |_: quickwit_proto::search::FetchDocsRequest| {
                Ok(quickwit_proto::search::FetchDocsResponse { hits: Vec::new() })
            },
        );
        let searcher_pool = searcher_pool_for_test([
            ("127.0.0.1:1001", mock_search_service_1),
            ("127.0.0.1:1002", mock_search_service_2),
        ]);
        let first_client_addr: SocketAddr = "127.0.0.1:1001".parse().unwrap();
        let first_client = searcher_pool.get(&first_client_addr).unwrap();
        let search_job_placer = SearchJobPlacer::new(searcher_pool);
        let cluster_client = ClusterClient::new(search_job_placer);
        let fetch_docs_response = cluster_client
            .fetch_docs(request, first_client)
            .await
            .unwrap();
        assert_eq!(fetch_docs_response.hits.len(), 0);
    }

    #[tokio::test]
    async fn test_cluster_client_fetch_docs_retry_with_final_error() {
        let request = mock_doc_request("split_1");
        let mut mock_search_service = MockSearchService::new();
        mock_search_service.expect_fetch_docs().returning(
            |_: quickwit_proto::search::FetchDocsRequest| {
                Err(SearchError::Internal("error".to_string()))
            },
        );
        let searcher_pool = searcher_pool_for_test([("127.0.0.1:1001", mock_search_service)]);
        let first_client_addr: SocketAddr = "127.0.0.1:1001".parse().unwrap();
        let first_client = searcher_pool.get(&first_client_addr).unwrap();
        let search_job_placer = SearchJobPlacer::new(searcher_pool);
        let cluster_client = ClusterClient::new(search_job_placer);
        let search_error = cluster_client
            .fetch_docs(request, first_client)
            .await
            .unwrap_err();
        assert!(matches!(search_error, SearchError::Internal(_)));
    }

    #[tokio::test]
    async fn test_cluster_client_leaf_search_no_retry() {
        let request = mock_leaf_search_request();
        let mut mock_search_service = MockSearchService::new();
        mock_search_service
            .expect_leaf_search()
            .return_once(|_: LeafSearchRequest| {
                Ok(LeafSearchResponse {
                    num_attempted_splits: 1,
                    ..Default::default()
                })
            });
        let searcher_pool = searcher_pool_for_test([("127.0.0.1:1001", mock_search_service)]);
        let search_job_placer = SearchJobPlacer::new(searcher_pool);
        let first_client = search_job_placer
            .assign_job(SearchJob::for_test("split_1", 0), &HashSet::new())
            .await
            .unwrap();
        let cluster_client = ClusterClient::new(search_job_placer);
        let leaf_search_response = cluster_client
            .leaf_search(request, first_client)
            .await
            .unwrap();
        assert_eq!(leaf_search_response.num_attempted_splits, 1);
    }

    #[tokio::test]
    async fn test_cluster_client_leaf_search_retry_on_failing_splits() {
        let request = mock_leaf_search_request();
        let mut mock_search_service = MockSearchService::new();
        mock_search_service
            .expect_leaf_search()
            .withf(|request| request.leaf_requests[0].split_offsets[0].split_id == "split_1")
            .return_once(|_: LeafSearchRequest| {
                Ok(LeafSearchResponse {
                    num_hits: 1,
                    failed_splits: vec![SplitSearchError {
                        error: "mock_error".to_string(),
                        split_id: "split_2".to_string(),
                        retryable_error: true,
                    }],
                    num_attempted_splits: 1,
                    ..Default::default()
                })
            });
        mock_search_service
            .expect_leaf_search()
            .withf(|request| request.leaf_requests[0].split_offsets[0].split_id == "split_2")
            .return_once(|_: LeafSearchRequest| {
                Ok(LeafSearchResponse {
                    num_hits: 1,
                    partial_hits: Vec::new(),
                    failed_splits: vec![SplitSearchError {
                        error: "mock_error".to_string(),
                        split_id: "split_3".to_string(),
                        retryable_error: true,
                    }],
                    num_attempted_splits: 1,
                    ..Default::default()
                })
            });
        let searcher_pool = searcher_pool_for_test([("127.0.0.1:1001", mock_search_service)]);
        let search_job_placer = SearchJobPlacer::new(searcher_pool);
        let first_client = search_job_placer
            .assign_job(SearchJob::for_test("split_1", 0), &HashSet::new())
            .await
            .unwrap();
        let cluster_client = ClusterClient::new(search_job_placer);
        let result = cluster_client.leaf_search(request, first_client).await;
        assert!(result.is_ok());
        assert_eq!(result.unwrap().num_hits, 2);
    }

    #[test]
    fn test_merge_leaf_search_retry_on_partial_success() -> anyhow::Result<()> {
        let split_error = SplitSearchError {
            error: "error".to_string(),
            split_id: "split_2".to_string(),
            retryable_error: true,
        };
        let leaf_response = LeafSearchResponse {
            num_hits: 1,
            partial_hits: vec![mock_partial_hit("split_1", 3, 1)],
            failed_splits: vec![split_error],
            num_attempted_splits: 1,
            ..Default::default()
        };
        let leaf_response_retry = LeafSearchResponse {
            num_hits: 1,
            partial_hits: vec![mock_partial_hit("split_2", 3, 1)],
            failed_splits: Vec::new(),
            num_attempted_splits: 1,
            ..Default::default()
        };
        let merged_leaf_search_response = merge_original_with_retry_leaf_search_results(
            Ok(leaf_response),
            Ok(leaf_response_retry),
        )
        .unwrap();
        assert_eq!(merged_leaf_search_response.num_attempted_splits, 2);
        assert_eq!(merged_leaf_search_response.num_hits, 2);
        assert_eq!(merged_leaf_search_response.partial_hits.len(), 2);
        assert_eq!(merged_leaf_search_response.failed_splits.len(), 0);
        Ok(())
    }

    #[test]
    fn test_merge_leaf_search_retry_on_error() -> anyhow::Result<()> {
        let split_error = SplitSearchError {
            error: "error".to_string(),
            split_id: "split_2".to_string(),
            retryable_error: true,
        };
        let leaf_response = LeafSearchResponse {
            num_hits: 1,
            partial_hits: vec![mock_partial_hit("split_1", 3, 1)],
            failed_splits: vec![split_error],
            num_attempted_splits: 1,
            ..Default::default()
        };
        let merged_result = merge_original_with_retry_leaf_search_results(
            Err(SearchError::Internal("error".to_string())),
            Ok(leaf_response),
        )
        .unwrap();
        assert_eq!(merged_result.num_attempted_splits, 1);
        assert_eq!(merged_result.num_hits, 1);
        assert_eq!(merged_result.partial_hits.len(), 1);
        assert_eq!(merged_result.failed_splits.len(), 1);
        Ok(())
    }

    #[test]
    fn test_merge_leaf_search_retry_error_on_error() -> anyhow::Result<()> {
        let merge_error = merge_original_with_retry_leaf_search_results(
            Err(SearchError::Internal("error".to_string())),
            Err(SearchError::Internal("retry error".to_string())),
        )
        .unwrap_err();
        assert_eq!(merge_error.to_string(), "internal error: `error`");
        Ok(())
    }

    #[tokio::test]
    async fn test_put_kv_happy_path() {
        // 3 servers 1, 2, 3
        // Targeted key has affinity [2, 3, 1].
        //
        // Put on 2 and 3 is successful
        // Get succeeds on 2.
        let mock_search_service_1 = MockSearchService::new();
        let mut mock_search_service_2 = MockSearchService::new();
        mock_search_service_2.expect_put_kv().once().returning(
            |put_req: quickwit_proto::search::PutKvRequest| {
                assert_eq!(put_req.key, b"my_key");
                assert_eq!(put_req.payload, b"my_payload");
            },
        );
        mock_search_service_2.expect_get_kv().once().returning(
            |get_req: quickwit_proto::search::GetKvRequest| {
                assert_eq!(get_req.key, b"my_key");
                Some(b"my_payload".to_vec())
            },
        );
        let mut mock_search_service_3 = MockSearchService::new();
        // Due to the buffered call it is possible for the
        // put request to 3 to be emitted too.
        mock_search_service_3
            .expect_put_kv()
            .returning(|_put_req: quickwit_proto::search::PutKvRequest| {});
        let searcher_pool = searcher_pool_for_test([
            ("127.0.0.1:1001", mock_search_service_1),
            ("127.0.0.1:1002", mock_search_service_2),
            ("127.0.0.1:1003", mock_search_service_3),
        ]);
        let search_job_placer = SearchJobPlacer::new(searcher_pool);
        let cluster_client = ClusterClient::new(search_job_placer);
        cluster_client
            .put_kv(
                &b"my_key"[..],
                &b"my_payload"[..],
                Duration::from_secs(10 * 60),
            )
            .await;
        let result = cluster_client.get_kv(&b"my_key"[..]).await;
        assert_eq!(result, Some(b"my_payload".to_vec()))
    }

    #[tokio::test]
    async fn test_put_kv_failing_get() {
        // 3 servers 1, 2, 3
        // Targeted key has affinity [2, 3, 1].
        //
        // Put on 2 and 3 is successful
        // Get fails on 2.
        // Get succeeds on 3.
        let mock_search_service_1 = MockSearchService::new();
        let mut mock_search_service_2 = MockSearchService::new();
        mock_search_service_2.expect_put_kv().once().returning(
            |put_req: quickwit_proto::search::PutKvRequest| {
                assert_eq!(put_req.key, b"my_key");
                assert_eq!(put_req.payload, b"my_payload");
            },
        );
        mock_search_service_2.expect_get_kv().once().returning(
            |get_req: quickwit_proto::search::GetKvRequest| {
                assert_eq!(get_req.key, b"my_key");
                None
            },
        );
        let mut mock_search_service_3 = MockSearchService::new();
        mock_search_service_3.expect_put_kv().once().returning(
            |put_req: quickwit_proto::search::PutKvRequest| {
                assert_eq!(put_req.key, b"my_key");
                assert_eq!(put_req.payload, b"my_payload");
            },
        );
        mock_search_service_3.expect_get_kv().once().returning(
            |get_req: quickwit_proto::search::GetKvRequest| {
                assert_eq!(get_req.key, b"my_key");
                Some(b"my_payload".to_vec())
            },
        );
        let searcher_pool = searcher_pool_for_test([
            ("127.0.0.1:1001", mock_search_service_1),
            ("127.0.0.1:1002", mock_search_service_2),
            ("127.0.0.1:1003", mock_search_service_3),
        ]);
        let search_job_placer = SearchJobPlacer::new(searcher_pool);
        let cluster_client = ClusterClient::new(search_job_placer);
        cluster_client
            .put_kv(
                &b"my_key"[..],
                &b"my_payload"[..],
                Duration::from_secs(10 * 60),
            )
            .await;
        let result = cluster_client.get_kv(&b"my_key"[..]).await;
        assert_eq!(result, Some(b"my_payload".to_vec()))
    }
}


================================================
FILE: quickwit/quickwit-search/src/collector.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::borrow::Cow;
use std::cmp::Ordering;
use std::collections::HashSet;

use itertools::Itertools;
use quickwit_common::binary_heap::{SortKeyMapper, TopK};
use quickwit_doc_mapper::{FastFieldWarmupInfo, WarmupInfo};
use quickwit_proto::search::{
    LeafSearchResponse, PartialHit, ResourceStats, SearchRequest, SortByValue, SortOrder,
    SortValue, SplitSearchError,
};
use quickwit_proto::types::SplitId;
use serde::Deserialize;
use tantivy::aggregation::agg_req::{Aggregations, get_fast_field_names};
use tantivy::aggregation::intermediate_agg_result::IntermediateAggregationResults;
use tantivy::aggregation::{AggContextParams, AggregationLimitsGuard, AggregationSegmentCollector};
use tantivy::collector::{Collector, SegmentCollector};
use tantivy::columnar::{ColumnType, MonotonicallyMappableToU64};
use tantivy::fastfield::Column;
use tantivy::tokenizer::TokenizerManager;
use tantivy::{DateTime, DocId, Score, SegmentOrdinal, SegmentReader, TantivyError};

use crate::find_trace_ids_collector::{FindTraceIdsCollector, FindTraceIdsSegmentCollector, Span};
use crate::top_k_collector::{QuickwitSegmentTopKCollector, specialized_top_k_segment_collector};
use crate::{GlobalDocAddress, merge_resource_stats, merge_resource_stats_it};

#[derive(Clone, Debug)]
pub(crate) enum SortByComponent {
    DocId {
        order: SortOrder,
    },
    FastField {
        field_name: String,
        order: SortOrder,
    },
    Score {
        order: SortOrder,
    },
}
impl From<SortByComponent> for SortByPair {
    fn from(value: SortByComponent) -> Self {
        Self {
            first: value,
            second: None,
        }
    }
}
#[derive(Clone)]
pub(crate) struct SortByPair {
    first: SortByComponent,
    second: Option<SortByComponent>,
}
impl SortByPair {
    pub fn sort_orders(&self) -> (SortOrder, SortOrder) {
        (
            self.first.sort_order(),
            self.second
                .as_ref()
                .map(|sort_by| sort_by.sort_order())
                .unwrap_or(SortOrder::Desc),
        )
    }
}
impl SortByComponent {
    fn to_sorting_field_extractor_component(
        &self,
        segment_reader: &SegmentReader,
    ) -> tantivy::Result<SortingFieldExtractorComponent> {
        match self {
            SortByComponent::DocId { .. } => Ok(SortingFieldExtractorComponent::DocId),
            SortByComponent::FastField { field_name, .. } => {
                let sort_column_opt: Option<(Column<u64>, ColumnType)> =
                    segment_reader.fast_fields().u64_lenient(field_name)?;
                let (sort_column, column_type) = sort_column_opt.unwrap_or_else(|| {
                    (
                        Column::build_empty_column(segment_reader.max_doc()),
                        ColumnType::U64,
                    )
                });
                let sort_field_type = SortFieldType::try_from(column_type)?;
                Ok(SortingFieldExtractorComponent::FastField {
                    sort_column,
                    sort_field_type,
                })
            }
            SortByComponent::Score { .. } => Ok(SortingFieldExtractorComponent::Score),
        }
    }
    pub fn requires_scoring(&self) -> bool {
        match self {
            SortByComponent::DocId { .. } => false,
            SortByComponent::FastField { .. } => false,
            SortByComponent::Score { .. } => true,
        }
    }
    pub fn add_fast_field(&self, set: &mut HashSet<String>) {
        if let SortByComponent::FastField {
            field_name,
            order: _,
        } = self
        {
            set.insert(field_name.clone());
        }
    }
    pub fn sort_order(&self) -> SortOrder {
        match self {
            SortByComponent::DocId { order } => *order,
            SortByComponent::FastField { order, .. } => *order,
            SortByComponent::Score { order } => *order,
        }
    }
}

#[derive(Copy, Clone, Debug, Eq, PartialEq)]
pub(crate) enum SortFieldType {
    U64,
    I64,
    F64,
    DateTime,
    Bool,
}

/// The `SortingFieldExtractor` is used to extract a score, which can either be a true score,
/// a value from a fast field, or nothing (sort by DocId).
pub(crate) enum SortingFieldExtractorComponent {
    /// If undefined, we simply sort by DocIds.
    DocId,
    FastField {
        sort_column: Column<u64>,
        sort_field_type: SortFieldType,
    },
    Score,
}

impl SortingFieldExtractorComponent {
    pub fn is_score(&self) -> bool {
        matches!(self, SortingFieldExtractorComponent::Score)
    }
    pub fn is_fast_field(&self) -> bool {
        matches!(self, SortingFieldExtractorComponent::FastField { .. })
    }
    /// Loads the fast field values for the given doc_ids in its u64 representation. The returned
    /// u64 representation maintains the ordering of the original value.
    #[inline]
    pub fn extract_typed_sort_values_block(&self, doc_ids: &[DocId], values: &mut [Option<u64>]) {
        // In the collect block case we don't have scores to extract
        if let SortingFieldExtractorComponent::FastField { sort_column, .. } = self {
            let values = &mut values[..doc_ids.len()];
            sort_column.first_vals(doc_ids, values);
        }
    }

    /// Returns the sort value for the given element in its u64 representation. The returned u64
    /// representation maintains the ordering of the original value.
    ///
    /// The function returns None if the sort key is a fast field, for which we have no value
    /// for the given doc_id, or we sort by DocId.
    #[inline]
    fn extract_typed_sort_value_opt(&self, doc_id: DocId, score: Score) -> Option<u64> {
        match self {
            // Tie breaks are not handled here, but in SegmentPartialHit
            SortingFieldExtractorComponent::DocId => None,
            SortingFieldExtractorComponent::FastField { sort_column, .. } => {
                sort_column.first(doc_id)
            }
            SortingFieldExtractorComponent::Score => Some((score as f64).to_u64()),
        }
    }

    #[inline]
    /// Converts u64 fast field values to its correct type.
    /// The conversion is delayed for performance reasons.
    ///
    /// This is used to convert `search_after` sort value to a u64 representation that will respect
    /// the same order as the `SortValue` representation.
    pub fn convert_u64_ff_val_to_sort_value(&self, sort_value: u64) -> SortValue {
        let map_fast_field_to_value = |fast_field_value, field_type| match field_type {
            SortFieldType::U64 => SortValue::U64(fast_field_value),
            SortFieldType::I64 => SortValue::I64(i64::from_u64(fast_field_value)),
            SortFieldType::F64 => SortValue::F64(f64::from_u64(fast_field_value)),
            SortFieldType::DateTime => SortValue::I64(i64::from_u64(fast_field_value)),
            SortFieldType::Bool => SortValue::Boolean(fast_field_value != 0u64),
        };
        match self {
            SortingFieldExtractorComponent::DocId => SortValue::U64(sort_value),
            SortingFieldExtractorComponent::FastField {
                sort_field_type, ..
            } => map_fast_field_to_value(sort_value, *sort_field_type),
            SortingFieldExtractorComponent::Score => SortValue::F64(f64::from_u64(sort_value)),
        }
    }
    /// Converts fast field values into their u64 fast field representation.
    ///
    /// Returns None if value is out of bounds of target value.
    /// None means that the search_after will be disabled and everything matches.
    ///
    /// What's currently missing is to signal that _nothing_ matches to generate an optimized
    /// query. For now we just choose the max value of the target type.
    #[inline]
    pub fn convert_to_u64_ff_val(
        &self,
        sort_value: SortValue,
        sort_order: SortOrder,
    ) -> Option<u64> {
        match self {
            SortingFieldExtractorComponent::DocId => match sort_value {
                SortValue::U64(val) => Some(val),
                _ => panic!("Internal error: Got non-U64 sort value for DocId."),
            },
            SortingFieldExtractorComponent::FastField {
                sort_field_type, ..
            } => {
                // We need to convert a (potential user provided) value in the correct u64
                // representation of the fast field.
                // This requires this weird conversion of first casting into the target type
                // (if possible) and then to its u64 presentation.
                //
                // For the conversion into the target type it's important to know if the target
                // type does not cover the whole range of the source type. In that case we need to
                // add additional conversion checks, to see if it matches everything
                // or nothing. (Which also depends on the sort order).
                // Below are the visual representations of the value ranges of the different types.
                // Note: DateTime is equal to I64 and omitted.
                //
                //     Bool value range (0, 1):
                //                        <->
                //
                //     I64 value range (signed 64-bit integer):
                //     <------------------------------------>
                //     -2^63                             2^63-1
                //     U64 value range (unsigned 64-bit integer):
                //                        <------------------------------------>
                //                        0                                  2^64-1
                // F64 value range (64-bit floating point, conceptual, not to scale):
                // <-------------------------------------------------------------------->
                // Very negative numbers                                       Very positive numbers
                //
                // Those conversions have limited target type value space:
                // - [X] U64 -> I64
                // - [X] F64 -> I64
                // - [X] I64 -> U64
                // - [X] F64 -> U64
                //
                // - [X] F64 -> Bool
                // - [X] I64 -> Bool
                // - [X] U64 -> Bool
                //
                let val = match (sort_value, sort_field_type) {
                    // Same field type, no conversion needed.
                    (SortValue::U64(val), SortFieldType::U64) => val,
                    (SortValue::F64(val), SortFieldType::F64) => val.to_u64(),
                    (SortValue::Boolean(val), SortFieldType::Bool) => val.to_u64(),
                    (SortValue::I64(val), SortFieldType::I64) => val.to_u64(),
                    (SortValue::U64(mut val), SortFieldType::I64) => {
                        if sort_order == SortOrder::Desc && val > i64::MAX as u64 {
                            return None;
                        }
                        // Add a limit to avoid overflow.
                        val = val.min(i64::MAX as u64);
                        (val as i64).to_u64()
                    }
                    (SortValue::U64(val), SortFieldType::F64) => (val as f64).to_u64(),
                    (SortValue::U64(mut val), SortFieldType::DateTime) => {
                        // Match everything
                        if sort_order == SortOrder::Desc && val > i64::MAX as u64 {
                            return None;
                        }
                        // Add a limit to avoid overflow.
                        val = val.min(i64::MAX as u64);
                        DateTime::from_timestamp_nanos(val as i64).to_u64()
                    }
                    (SortValue::I64(val), SortFieldType::U64) => {
                        if val < 0 && sort_order == SortOrder::Asc {
                            return None;
                        }
                        if val < 0 && sort_order == SortOrder::Desc {
                            u64::MIN // matches nothing as search_after is not inclusive
                        } else {
                            val as u64
                        }
                    }
                    (SortValue::I64(val), SortFieldType::F64) => (val as f64).to_u64(),
                    (SortValue::I64(val), SortFieldType::DateTime) => {
                        DateTime::from_timestamp_nanos(val).to_u64()
                    }
                    (SortValue::F64(val), SortFieldType::U64) => {
                        let all_values_ahead1 =
                            val < u64::MIN as f64 && sort_order == SortOrder::Asc;
                        let all_values_ahead2 =
                            val > u64::MAX as f64 && sort_order == SortOrder::Desc;
                        if all_values_ahead1 || all_values_ahead2 {
                            return None;
                        }
                        // f64 cast already handles under/overflow and clamps the value
                        (val as u64).to_u64()
                    }
                    (SortValue::F64(val), SortFieldType::I64)
                    | (SortValue::F64(val), SortFieldType::DateTime) => {
                        let all_values_ahead1 =
                            val < i64::MIN as f64 && sort_order == SortOrder::Asc;
                        let all_values_ahead2 =
                            val > i64::MAX as f64 && sort_order == SortOrder::Desc;
                        if all_values_ahead1 || all_values_ahead2 {
                            return None;
                        }
                        // f64 cast already handles under/overflow and clamps the value
                        let val_i64 = val as i64;

                        if *sort_field_type == SortFieldType::DateTime {
                            DateTime::from_timestamp_nanos(val_i64).to_u64()
                        } else {
                            val_i64.to_u64()
                        }
                    }
                    // Not sure when we hit this, it's probably are very rare case.
                    (SortValue::Boolean(val), SortFieldType::U64) => val as u64,
                    (SortValue::Boolean(val), SortFieldType::F64) => (val as u64 as f64).to_u64(),
                    (SortValue::Boolean(val), SortFieldType::I64) => (val as i64).to_u64(),
                    (SortValue::Boolean(val), SortFieldType::DateTime) => {
                        DateTime::from_timestamp_nanos(val as i64).to_u64()
                    }
                    (SortValue::U64(mut val), SortFieldType::Bool) => {
                        let all_values_ahead1 = val > 1 && sort_order == SortOrder::Desc;
                        if all_values_ahead1 {
                            return None;
                        }
                        // clamp value for comparison
                        val = val.clamp(0, 1);
                        (val == 1).to_u64()
                    }
                    (SortValue::I64(mut val), SortFieldType::Bool) => {
                        let all_values_ahead1 = val > 1 && sort_order == SortOrder::Desc;
                        let all_values_ahead2 = val < 0 && sort_order == SortOrder::Asc;
                        if all_values_ahead1 || all_values_ahead2 {
                            return None;
                        }
                        // clamp value for comparison
                        val = val.clamp(0, 1);
                        (val == 1).to_u64()
                    }
                    (SortValue::F64(mut val), SortFieldType::Bool) => {
                        let all_values_ahead1 = val > 1.0 && sort_order == SortOrder::Desc;
                        let all_values_ahead2 = val < 0.0 && sort_order == SortOrder::Asc;
                        if all_values_ahead1 || all_values_ahead2 {
                            return None;
                        }
                        val = val.clamp(0.0, 1.0);
                        (val >= 0.5).to_u64() // Is this correct?
                    }
                };
                Some(val)
            }
            SortingFieldExtractorComponent::Score => match sort_value {
                SortValue::F64(val) => Some(val.to_u64()),
                _ => panic!("Internal error: Got non-F64 sort value for Score."),
            },
        }
    }
}

impl From<SortingFieldExtractorComponent> for SortingFieldExtractorPair {
    fn from(value: SortingFieldExtractorComponent) -> Self {
        Self {
            first: value,
            second: None,
        }
    }
}

pub(crate) struct SortingFieldExtractorPair {
    pub first: SortingFieldExtractorComponent,
    pub second: Option<SortingFieldExtractorComponent>,
}

impl SortingFieldExtractorPair {
    pub fn is_score(&self) -> bool {
        self.first.is_score()
            || self
                .second
                .as_ref()
                .map(|second| second.is_score())
                .unwrap_or(false)
    }
    /// Returns the list of sort values for the given element
    ///
    /// See also [`SortingFieldExtractorComponent::extract_typed_sort_values_block`] for more
    /// information.
    #[inline]
    pub(crate) fn extract_typed_sort_values(
        &self,
        doc_ids: &[DocId],
        values1: &mut [Option<u64>],
        values2: &mut [Option<u64>],
    ) {
        self.first
            .extract_typed_sort_values_block(doc_ids, &mut values1[..doc_ids.len()]);
        if let Some(second) = self.second.as_ref() {
            second.extract_typed_sort_values_block(doc_ids, &mut values2[..doc_ids.len()]);
        }
    }
    /// Returns the list of sort values for the given element
    ///
    /// See also [`SortingFieldExtractorComponent::extract_typed_sort_value_opt`] for more
    /// information.
    #[inline]
    pub(crate) fn extract_typed_sort_value(
        &self,
        doc_id: DocId,
        score: Score,
    ) -> (Option<u64>, Option<u64>) {
        let first = self.first.extract_typed_sort_value_opt(doc_id, score);
        let second = self
            .second
            .as_ref()
            .and_then(|second| second.extract_typed_sort_value_opt(doc_id, score));
        (first, second)
    }
}

impl TryFrom<ColumnType> for SortFieldType {
    type Error = tantivy::TantivyError;

    fn try_from(column_type: ColumnType) -> tantivy::Result<Self> {
        match column_type {
            ColumnType::U64 => Ok(SortFieldType::U64),
            ColumnType::I64 => Ok(SortFieldType::I64),
            ColumnType::F64 => Ok(SortFieldType::F64),
            ColumnType::DateTime => Ok(SortFieldType::DateTime),
            ColumnType::Bool => Ok(SortFieldType::Bool),
            _ => Err(TantivyError::InvalidArgument(format!(
                "Unsupported sort field type `{column_type:?}`."
            ))),
        }
    }
}

/// Takes a user-defined sorting criteria and resolves it to a
/// segment specific `SortingFieldExtractorPair`.
fn get_score_extractor(
    sort_by: &SortByPair,
    segment_reader: &SegmentReader,
) -> tantivy::Result<SortingFieldExtractorPair> {
    Ok(SortingFieldExtractorPair {
        first: sort_by
            .first
            .to_sorting_field_extractor_component(segment_reader)?,
        second: sort_by
            .second
            .as_ref()
            .map(|first| first.to_sorting_field_extractor_component(segment_reader))
            .transpose()?,
    })
}

#[allow(clippy::large_enum_variant)]
enum AggregationSegmentCollectors {
    FindTraceIdsSegmentCollector(Box<FindTraceIdsSegmentCollector>),
    TantivyAggregationSegmentCollector(AggregationSegmentCollector),
}

/// Quickwit collector working at the scale of the segment.
pub struct QuickwitSegmentCollector {
    segment_top_k_collector: Option<Box<dyn QuickwitSegmentTopKCollector>>,
    aggregation: Option<AggregationSegmentCollectors>,
    num_hits: u64,
}

#[derive(Copy, Clone, Debug)]
pub(crate) struct SegmentPartialHit {
    /// Normalized to u64, the typed value can be reconstructed with
    /// SortingFieldExtractorComponent.
    pub sort_value: Option<u64>,
    pub sort_value2: Option<u64>,
    pub doc_id: DocId,
}

impl SegmentPartialHit {
    pub fn into_partial_hit(
        self,
        split_id: SplitId,
        segment_ord: SegmentOrdinal,
        first: &SortingFieldExtractorComponent,
        second: &Option<SortingFieldExtractorComponent>,
    ) -> PartialHit {
        PartialHit {
            sort_value: self
                .sort_value
                .map(|sort_value| first.convert_u64_ff_val_to_sort_value(sort_value))
                .map(|sort_value| SortByValue {
                    sort_value: Some(sort_value),
                }),
            sort_value2: self
                .sort_value2
                .map(|sort_value| {
                    second
                        .as_ref()
                        .expect("Internal error: Got sort_value2, but no sort extractor")
                        .convert_u64_ff_val_to_sort_value(sort_value)
                })
                .map(|sort_value| SortByValue {
                    sort_value: Some(sort_value),
                }),
            doc_id: self.doc_id,
            split_id,
            segment_ord,
        }
    }
}

impl SegmentCollector for QuickwitSegmentCollector {
    type Fruit = tantivy::Result<LeafSearchResponse>;

    #[inline]
    fn collect_block(&mut self, filtered_docs: &[DocId]) {
        // Update results
        self.num_hits += filtered_docs.len() as u64;

        if let Some(segment_top_k_collector) = self.segment_top_k_collector.as_mut() {
            segment_top_k_collector.collect_top_k_block(filtered_docs);
        }

        match self.aggregation.as_mut() {
            Some(AggregationSegmentCollectors::FindTraceIdsSegmentCollector(collector)) => {
                collector.collect_block(filtered_docs)
            }
            Some(AggregationSegmentCollectors::TantivyAggregationSegmentCollector(collector)) => {
                collector.collect_block(filtered_docs)
            }
            None => (),
        }
    }

    #[inline]
    fn collect(&mut self, doc_id: DocId, score: Score) {
        self.num_hits += 1;
        if let Some(segment_top_k_collector) = self.segment_top_k_collector.as_mut() {
            segment_top_k_collector.collect_top_k(doc_id, score);
        }

        match self.aggregation.as_mut() {
            Some(AggregationSegmentCollectors::FindTraceIdsSegmentCollector(collector)) => {
                collector.collect(doc_id, score)
            }
            Some(AggregationSegmentCollectors::TantivyAggregationSegmentCollector(collector)) => {
                collector.collect(doc_id, score)
            }
            None => (),
        }
    }

    fn harvest(self) -> Self::Fruit {
        let mut partial_hits: Vec<PartialHit> = Vec::new();
        if let Some(segment_top_k_collector) = self.segment_top_k_collector {
            partial_hits = segment_top_k_collector.get_top_k();
        }

        let intermediate_aggregation_result = match self.aggregation {
            Some(AggregationSegmentCollectors::FindTraceIdsSegmentCollector(collector)) => {
                let fruit: Vec<Span> = collector.harvest();
                let serialized =
                    postcard::to_allocvec(&fruit).expect("Collector fruit should be serializable.");
                Some(serialized)
            }
            Some(AggregationSegmentCollectors::TantivyAggregationSegmentCollector(collector)) => {
                let serialized = postcard::to_allocvec(&collector.harvest()?)
                    .expect("Collector fruit should be serializable.");
                Some(serialized)
            }
            None => None,
        };

        Ok(LeafSearchResponse {
            intermediate_aggregation_result,
            num_hits: self.num_hits,
            partial_hits,
            failed_splits: Vec::new(),
            num_attempted_splits: 1,
            num_successful_splits: 1,
            resource_stats: None,
        })
    }
}

/// Available aggregation types.
#[derive(Debug, Clone, PartialEq, Deserialize)]
#[serde(untagged)]
pub enum QuickwitAggregations {
    /// Aggregation used by the Jaeger service to find trace IDs that match a
    /// [`quickwit_proto::jaeger::storage::v1::FindTraceIDsRequest`].
    FindTraceIdsAggregation(FindTraceIdsCollector),
    /// Your classic Tantivy aggregation.
    TantivyAggregations(Aggregations),
}

impl QuickwitAggregations {
    /// Returns the list of fast fields that should be loaded for the aggregation.
    pub fn fast_field_names(&self) -> HashSet<String> {
        match self {
            QuickwitAggregations::FindTraceIdsAggregation(collector) => {
                collector.fast_field_names()
            }
            QuickwitAggregations::TantivyAggregations(aggregations) => {
                get_fast_field_names(aggregations)
            }
        }
    }

    fn maybe_incremental_aggregator(&self) -> QuickwitIncrementalAggregations {
        match self {
            QuickwitAggregations::FindTraceIdsAggregation(aggreg) => {
                QuickwitIncrementalAggregations::FindTraceIdsAggregation(aggreg.clone(), Vec::new())
            }
            QuickwitAggregations::TantivyAggregations(aggreg) => {
                QuickwitIncrementalAggregations::TantivyAggregations(aggreg.clone(), Vec::new())
            }
        }
    }
}

#[derive(Clone)]
enum QuickwitIncrementalAggregations {
    FindTraceIdsAggregation(FindTraceIdsCollector, Vec<Vec<Span>>),
    TantivyAggregations(Aggregations, Vec<Vec<u8>>),
    NoAggregation,
}

impl QuickwitIncrementalAggregations {
    fn add(&mut self, intermediate_result: Vec<u8>) -> tantivy::Result<()> {
        match self {
            QuickwitIncrementalAggregations::FindTraceIdsAggregation(collector, state) => {
                let fruits: Vec<Span> =
                    postcard::from_bytes(&intermediate_result).map_err(map_error)?;
                state.push(fruits);
                if state.iter().map(Vec::len).sum::<usize>() >= collector.num_traces {
                    let new_state = collector.merge_fruits(std::mem::take(state))?;
                    state.push(new_state);
                }
            }
            QuickwitIncrementalAggregations::TantivyAggregations(_, state) => {
                state.push(intermediate_result);
            }
            QuickwitIncrementalAggregations::NoAggregation => (),
        }
        Ok(())
    }

    fn virtual_worst_hit(&self) -> Option<PartialHit> {
        match self {
            QuickwitIncrementalAggregations::FindTraceIdsAggregation(collector, state) => {
                if let Some(first) = state.first()
                    && first.len() >= collector.num_traces
                    && let Some(last_elem) = first.last()
                {
                    let timestamp = last_elem.span_timestamp.into_timestamp_nanos();
                    return Some(PartialHit {
                        sort_value: Some(SortByValue {
                            sort_value: Some(SortValue::I64(timestamp)),
                        }),
                        sort_value2: None,
                        split_id: SplitId::new(),
                        segment_ord: 0,
                        doc_id: 0,
                    });
                }
                None
            }
            QuickwitIncrementalAggregations::TantivyAggregations(_, _) => None,
            QuickwitIncrementalAggregations::NoAggregation => None,
        }
    }

    fn finalize(self) -> tantivy::Result<Option<Vec<u8>>> {
        match self {
            QuickwitIncrementalAggregations::FindTraceIdsAggregation(collector, mut state) => {
                let merged_fruit = if state.len() > 1 {
                    collector.merge_fruits(state)?
                } else {
                    state.pop().unwrap_or_default()
                };
                let serialized = postcard::to_allocvec(&merged_fruit).map_err(map_error)?;
                Ok(Some(serialized))
            }
            QuickwitIncrementalAggregations::TantivyAggregations(aggregation, state) => {
                merge_intermediate_aggregation_result(
                    &Some(QuickwitAggregations::TantivyAggregations(aggregation)),
                    state.iter().map(|vec| vec.as_slice()),
                )
            }
            QuickwitIncrementalAggregations::NoAggregation => Ok(None),
        }
    }
}

/// The quickwit collector is the tantivy Collector used in Quickwit.
///
/// It defines the data that should be accumulated about the documents matching
/// the query.
#[derive(Clone)]
pub(crate) struct QuickwitCollector {
    pub split_id: SplitId,
    pub start_offset: usize,
    pub max_hits: usize,
    pub sort_by: SortByPair,
    pub aggregation: Option<QuickwitAggregations>,
    pub agg_context_params: AggContextParams,
    search_after: Option<PartialHit>,
}

impl QuickwitCollector {
    pub fn is_count_only(&self) -> bool {
        self.max_hits == 0 && self.aggregation.is_none()
    }
    /// Updates search parameters affecting the returned documents.
    /// Does not update aggregations.
    pub fn update_search_param(&mut self, search_request: &SearchRequest) {
        let sort_by = sort_by_from_request(search_request);
        self.sort_by = sort_by;
        self.max_hits = search_request.max_hits as usize;
        self.start_offset = search_request.start_offset as usize;
        self.search_after.clone_from(&search_request.search_after);
    }
    pub fn fast_field_names(&self) -> HashSet<String> {
        let mut fast_field_names = HashSet::default();
        self.sort_by.first.add_fast_field(&mut fast_field_names);
        if let Some(sort_by_second) = &self.sort_by.second {
            sort_by_second.add_fast_field(&mut fast_field_names);
        }
        if let Some(aggregations) = &self.aggregation {
            fast_field_names.extend(aggregations.fast_field_names());
        }
        fast_field_names
    }

    pub fn warmup_info(&self) -> WarmupInfo {
        WarmupInfo {
            fast_fields: self
                .fast_field_names()
                .into_iter()
                .map(|name| FastFieldWarmupInfo {
                    name,
                    with_subfields: false,
                })
                .collect(),
            field_norms: self.requires_scoring(),
            ..WarmupInfo::default()
        }
    }
}

impl Collector for QuickwitCollector {
    type Child = QuickwitSegmentCollector;
    type Fruit = LeafSearchResponse;

    fn for_segment(
        &self,
        segment_ord: SegmentOrdinal,
        segment_reader: &SegmentReader,
    ) -> tantivy::Result<Self::Child> {
        // Regardless of the start_offset, we need to collect top-K
        // starting from 0 for every leaves.
        let leaf_max_hits = self.max_hits + self.start_offset;

        let aggregation = match &self.aggregation {
            Some(QuickwitAggregations::FindTraceIdsAggregation(collector)) => {
                Some(AggregationSegmentCollectors::FindTraceIdsSegmentCollector(
                    Box::new(collector.for_segment(0, segment_reader)?),
                ))
            }
            Some(QuickwitAggregations::TantivyAggregations(aggs)) => Some(
                AggregationSegmentCollectors::TantivyAggregationSegmentCollector(
                    AggregationSegmentCollector::from_agg_req_and_reader(
                        aggs,
                        segment_reader,
                        segment_ord,
                        &self.agg_context_params,
                    )?,
                ),
            ),
            None => None,
        };
        let score_extractor = get_score_extractor(&self.sort_by, segment_reader)?;
        let (order1, order2) = self.sort_by.sort_orders();

        let segment_top_k_collector = if leaf_max_hits == 0 {
            None
        } else {
            let coll: Box<dyn QuickwitSegmentTopKCollector> = specialized_top_k_segment_collector(
                self.split_id.clone(),
                score_extractor,
                leaf_max_hits,
                segment_ord,
                self.search_after.clone(),
                order1,
                order2,
            );
            Some(coll)
        };

        Ok(QuickwitSegmentCollector {
            num_hits: 0,
            segment_top_k_collector,
            aggregation,
        })
    }

    fn requires_scoring(&self) -> bool {
        // We do not need BM25 scoring in Quickwit if it is not opted-in.
        // By returning false, we inform tantivy that it does not need to decompress
        // term frequencies.
        self.sort_by.first.requires_scoring()
            || self
                .sort_by
                .second
                .as_ref()
                .map(|sort_by| sort_by.requires_scoring())
                .unwrap_or(false)
    }

    fn merge_fruits(
        &self,
        segment_fruits: Vec<tantivy::Result<LeafSearchResponse>>,
    ) -> tantivy::Result<Self::Fruit> {
        let segment_fruits: tantivy::Result<Vec<LeafSearchResponse>> =
            segment_fruits.into_iter().collect();
        // We want the hits in [start_offset..start_offset + max_hits).
        // All leaves will return their top [0..start_offset + max_hits) documents.
        // We compute the overall [0..start_offset + max_hits) documents ...
        let num_hits = self.start_offset + self.max_hits;
        let (sort_order1, sort_order2) = self.sort_by.sort_orders();
        let mut merged_leaf_response = merge_leaf_responses(
            &self.aggregation,
            segment_fruits?,
            sort_order1,
            sort_order2,
            num_hits,
        )?;
        // ... and drop the first [..start_offsets) hits.
        // note that self.start_offset is 0 when merging from leaf_search, and is only set when
        // merging from root_search, so as to remove the firsts elements only once.
        merged_leaf_response.partial_hits.drain(
            0..self
                .start_offset
                .min(merged_leaf_response.partial_hits.len()),
        );
        merged_leaf_response.partial_hits.truncate(self.max_hits);
        Ok(merged_leaf_response)
    }
}

fn map_error(error: postcard::Error) -> TantivyError {
    TantivyError::InternalError(format!(
        "failed to merge intermediate aggregation results: Postcard error: {error}"
    ))
}

/// Merges a set of Leaf Results.
fn merge_intermediate_aggregation_result<'a>(
    aggregations_opt: &Option<QuickwitAggregations>,
    intermediate_aggregation_results: impl Iterator<Item = &'a [u8]>,
) -> tantivy::Result<Option<Vec<u8>>> {
    let merged_intermediate_aggregation_result = match aggregations_opt {
        Some(QuickwitAggregations::FindTraceIdsAggregation(collector)) => {
            let fruits: Vec<
                <<FindTraceIdsCollector as Collector>::Child as SegmentCollector>::Fruit,
            > = intermediate_aggregation_results
                .map(|intermediate_aggregation_result| {
                    postcard::from_bytes(intermediate_aggregation_result).map_err(map_error)
                })
                .collect::<Result<_, _>>()?;
            let merged_fruit: Vec<Span> = collector.merge_fruits(fruits)?;
            let serialized = postcard::to_allocvec(&merged_fruit).map_err(map_error)?;
            Some(serialized)
        }
        Some(QuickwitAggregations::TantivyAggregations(_)) => {
            let merged_opt = intermediate_aggregation_results
                .map(|bytes| postcard::from_bytes(bytes).map_err(map_error))
                .try_fold::<_, _, Result<_, TantivyError>>(
                    None,
                    |acc: Option<IntermediateAggregationResults>, fruits_res| {
                        let fruits = fruits_res?;
                        match acc {
                            Some(mut merged_fruits) => {
                                merged_fruits.merge_fruits(fruits)?;
                                Ok(Some(merged_fruits))
                            }
                            None => Ok(Some(fruits)),
                        }
                    },
                )?;
            let serialized =
                postcard::to_allocvec(&merged_opt.unwrap_or_default()).map_err(map_error)?;
            Some(serialized)
        }
        None => None,
    };

    Ok(merged_intermediate_aggregation_result)
}

/// Merges a set of Leaf Results.
fn merge_leaf_responses(
    aggregations_opt: &Option<QuickwitAggregations>,
    mut leaf_responses: Vec<LeafSearchResponse>,
    sort_order1: SortOrder,
    sort_order2: SortOrder,
    max_hits: usize,
) -> tantivy::Result<LeafSearchResponse> {
    // Optimization: No merging needed if there is only one result.
    if leaf_responses.len() == 1 {
        return Ok(leaf_responses.pop().unwrap());
    }

    let resource_stats_it = leaf_responses
        .iter()
        .map(|leaf_response| &leaf_response.resource_stats);
    let merged_resource_stats = merge_resource_stats_it(resource_stats_it);

    let merged_intermediate_aggregation_result: Option<Vec<u8>> =
        merge_intermediate_aggregation_result(
            aggregations_opt,
            leaf_responses.iter().filter_map(|leaf_response| {
                leaf_response.intermediate_aggregation_result.as_deref()
            }),
        )?;
    let num_attempted_splits = leaf_responses
        .iter()
        .map(|leaf_response| leaf_response.num_attempted_splits)
        .sum();
    let num_successful_splits = leaf_responses
        .iter()
        .map(|leaf_response| leaf_response.num_successful_splits)
        .sum::<u64>();
    let num_hits: u64 = leaf_responses
        .iter()
        .map(|leaf_response| leaf_response.num_hits)
        .sum();
    let failed_splits = leaf_responses
        .iter()
        .flat_map(|leaf_response| leaf_response.failed_splits.iter())
        .cloned()
        .collect_vec();
    let all_partial_hits: Vec<PartialHit> = leaf_responses
        .into_iter()
        .flat_map(|leaf_response| leaf_response.partial_hits)
        .collect();
    let top_k_partial_hits: Vec<PartialHit> = top_k_partial_hits(
        all_partial_hits.into_iter(),
        sort_order1,
        sort_order2,
        max_hits,
    );
    Ok(LeafSearchResponse {
        intermediate_aggregation_result: merged_intermediate_aggregation_result,
        num_hits,
        partial_hits: top_k_partial_hits,
        failed_splits,
        num_attempted_splits,
        num_successful_splits,
        resource_stats: merged_resource_stats,
    })
}

/// Mutates partial_hits so that it contains the top-num_hitso hits,
/// and so that these elements are sorted.
///
/// TODO we could possibly optimize the sort away (but I doubt it matters).
fn top_k_partial_hits(
    partial_hits: impl Iterator<Item = PartialHit>,
    order1: SortOrder,
    order2: SortOrder,
    num_hits: usize,
) -> Vec<PartialHit> {
    let sort_key_mapper = HitSortingMapper { order1, order2 };
    let mut top_k_hits = TopK::new(num_hits, sort_key_mapper);

    partial_hits.for_each(|hit| top_k_hits.add_entry(hit));

    top_k_hits.finalize()
}

pub(crate) fn sort_by_from_request(search_request: &SearchRequest) -> SortByPair {
    let to_sort_by_component = |field_name: &str, order| {
        if field_name == "_score" {
            SortByComponent::Score { order }
        } else if field_name == "_shard_doc" || field_name == "_doc" {
            SortByComponent::DocId { order }
        } else {
            SortByComponent::FastField {
                field_name: field_name.to_string(),
                order,
            }
        }
    };

    let num_sort_fields = search_request.sort_fields.len();
    if num_sort_fields == 0 {
        SortByComponent::DocId {
            order: SortOrder::Desc,
        }
        .into()
    } else if num_sort_fields == 1 {
        let sort_field = &search_request.sort_fields[0];
        let order = SortOrder::try_from(sort_field.sort_order).unwrap_or(SortOrder::Desc);
        to_sort_by_component(&sort_field.field_name, order).into()
    } else if num_sort_fields == 2 {
        let sort_field1 = &search_request.sort_fields[0];
        let order1 = SortOrder::try_from(sort_field1.sort_order).unwrap_or(SortOrder::Desc);
        let sort_field2 = &search_request.sort_fields[1];
        let order2 = SortOrder::try_from(sort_field2.sort_order).unwrap_or(SortOrder::Desc);
        SortByPair {
            first: to_sort_by_component(&sort_field1.field_name, order1),
            second: Some(to_sort_by_component(&sort_field2.field_name, order2)),
        }
    } else {
        panic!("Sort by more than 2 fields is not supported yet.")
    }
}

/// Builds the QuickwitCollector, in function of the information that was requested by the user.
pub(crate) fn make_collector_for_split(
    split_id: SplitId,
    search_request: &SearchRequest,
    agg_context_params: AggContextParams,
) -> crate::Result<QuickwitCollector> {
    let aggregation = match &search_request.aggregation_request {
        Some(aggregation) => Some(serde_json::from_str(aggregation)?),
        None => None,
    };
    let sort_by = sort_by_from_request(search_request);
    Ok(QuickwitCollector {
        split_id,
        start_offset: search_request.start_offset as usize,
        max_hits: search_request.max_hits as usize,
        sort_by,
        aggregation,
        agg_context_params,
        search_after: search_request.search_after.clone(),
    })
}

/// Builds a QuickwitCollector that's only useful for merging fruits.
pub(crate) fn make_merge_collector(
    search_request: &SearchRequest,
    agg_limits: AggregationLimitsGuard,
) -> crate::Result<QuickwitCollector> {
    // Note: at this point the tokenizer manager is not used anymore by aggregations (filter query),
    // so we can create an empty one. So if it will ever be used, it would panic.
    let agg_context_params = AggContextParams {
        limits: agg_limits,
        tokenizers: TokenizerManager::new(),
    };

    let aggregation = match &search_request.aggregation_request {
        Some(aggregation) => Some(serde_json::from_str(aggregation)?),
        None => None,
    };
    let sort_by = sort_by_from_request(search_request);
    Ok(QuickwitCollector {
        split_id: SplitId::default(),
        start_offset: search_request.start_offset as usize,
        max_hits: search_request.max_hits as usize,
        sort_by,
        aggregation,
        agg_context_params,
        search_after: search_request.search_after.clone(),
    })
}

#[derive(Clone, Copy, Debug, PartialEq, Eq)]
pub struct SegmentPartialHitSortingKey {
    sort_value: Option<u64>,
    sort_value2: Option<u64>,
    doc_id: DocId,
    // TODO This should not be there.
    sort_order: SortOrder,
    // TODO This should not be there.
    sort_order2: SortOrder,
}

impl Ord for SegmentPartialHitSortingKey {
    fn cmp(&self, other: &SegmentPartialHitSortingKey) -> Ordering {
        debug_assert_eq!(
            self.sort_order, other.sort_order,
            "comparing two PartialHitSortingKey of different ordering"
        );
        debug_assert_eq!(
            self.sort_order2, other.sort_order2,
            "comparing two PartialHitSortingKey of different ordering"
        );
        let order = self
            .sort_order
            .compare_opt(&self.sort_value, &other.sort_value);
        let order2 = self
            .sort_order2
            .compare_opt(&self.sort_value2, &other.sort_value2);
        let order_addr = self.sort_order.compare(&self.doc_id, &other.doc_id);
        order.then(order2).then(order_addr)
    }
}

impl PartialOrd for SegmentPartialHitSortingKey {
    fn partial_cmp(&self, other: &SegmentPartialHitSortingKey) -> Option<Ordering> {
        Some(self.cmp(other))
    }
}

#[derive(Clone, Debug, PartialEq, Eq)]
pub(crate) struct PartialHitSortingKey {
    sort_value: Option<SortValue>,
    sort_value2: Option<SortValue>,
    address: GlobalDocAddress,
    // TODO remove this
    sort_order: SortOrder,
    sort_order2: SortOrder,
}

impl Ord for PartialHitSortingKey {
    fn cmp(&self, other: &PartialHitSortingKey) -> Ordering {
        assert_eq!(
            self.sort_order, other.sort_order,
            "comparing two PartialHitSortingKey of different ordering"
        );
        assert_eq!(
            self.sort_order2, other.sort_order2,
            "comparing two PartialHitSortingKey of different ordering"
        );

        let order = self
            .sort_order
            .compare_opt(&self.sort_value, &other.sort_value);

        let order2 = self
            .sort_order2
            .compare_opt(&self.sort_value2, &other.sort_value2);

        let order_addr = self.sort_order.compare(&self.address, &other.address);

        order.then(order2).then(order_addr)
    }
}

impl PartialOrd for PartialHitSortingKey {
    fn partial_cmp(&self, other: &PartialHitSortingKey) -> Option<Ordering> {
        Some(self.cmp(other))
    }
}

#[derive(Clone)]
pub(crate) struct HitSortingMapper {
    pub order1: SortOrder,
    pub order2: SortOrder,
}

impl SortKeyMapper<PartialHit> for HitSortingMapper {
    type Key = PartialHitSortingKey;
    fn get_sort_key(&self, partial_hit: &PartialHit) -> PartialHitSortingKey {
        PartialHitSortingKey {
            sort_value: partial_hit.sort_value.and_then(|v| v.sort_value),
            sort_value2: partial_hit.sort_value2.and_then(|v| v.sort_value),
            address: GlobalDocAddress::from_partial_hit(partial_hit),
            sort_order: self.order1,
            sort_order2: self.order2,
        }
    }
}

impl SortKeyMapper<SegmentPartialHit> for HitSortingMapper {
    type Key = SegmentPartialHitSortingKey;
    fn get_sort_key(&self, partial_hit: &SegmentPartialHit) -> SegmentPartialHitSortingKey {
        SegmentPartialHitSortingKey {
            sort_value: partial_hit.sort_value,
            sort_value2: partial_hit.sort_value2,
            doc_id: partial_hit.doc_id,
            sort_order: self.order1,
            sort_order2: self.order2,
        }
    }
}

/// Incrementally merge segment results.
#[derive(Clone)]
pub(crate) struct IncrementalCollector {
    top_k_hits: TopK<PartialHit, PartialHitSortingKey, HitSortingMapper>,
    incremental_aggregation: QuickwitIncrementalAggregations,
    num_hits: u64,
    failed_splits: Vec<SplitSearchError>,
    num_attempted_splits: u64,
    num_successful_splits: u64,
    start_offset: usize,
    resource_stats: Option<ResourceStats>,
}

impl IncrementalCollector {
    /// Create a new incremental collector
    pub(crate) fn new(collector: QuickwitCollector) -> Self {
        let incremental_aggregation = collector
            .aggregation
            .as_ref()
            .map(QuickwitAggregations::maybe_incremental_aggregator)
            .unwrap_or(QuickwitIncrementalAggregations::NoAggregation);
        let (order1, order2) = collector.sort_by.sort_orders();
        let sort_key_mapper = HitSortingMapper { order1, order2 };
        IncrementalCollector {
            top_k_hits: TopK::new(collector.max_hits + collector.start_offset, sort_key_mapper),
            start_offset: collector.start_offset,
            incremental_aggregation,
            num_hits: 0,
            failed_splits: Vec::new(),
            num_attempted_splits: 0,
            num_successful_splits: 0,
            resource_stats: None,
        }
    }

    /// Merge one search result with the current state
    pub(crate) fn add_result(&mut self, leaf_response: LeafSearchResponse) -> tantivy::Result<()> {
        let LeafSearchResponse {
            num_hits,
            partial_hits,
            failed_splits,
            num_attempted_splits,
            intermediate_aggregation_result,
            num_successful_splits,
            resource_stats,
        } = leaf_response;

        merge_resource_stats(&resource_stats, &mut self.resource_stats);

        self.num_hits += num_hits;
        self.top_k_hits.add_entries(partial_hits.into_iter());
        self.failed_splits.extend(failed_splits);
        self.num_attempted_splits += num_attempted_splits;
        self.num_successful_splits += num_successful_splits;
        if let Some(intermediate_aggregation_result) = intermediate_aggregation_result {
            self.incremental_aggregation
                .add(intermediate_aggregation_result)?;
        }
        Ok(())
    }

    /// Add a failed split to the state
    pub(crate) fn add_failed_split(&mut self, split_error: SplitSearchError) {
        self.failed_splits.push(split_error)
    }

    /// Get the worst top-hit. Can be used to skip splits if they can't possibly do better.
    ///
    /// Only returns a result if enough hits were recorded already.
    pub(crate) fn peek_worst_hit(&self) -> Option<Cow<'_, PartialHit>> {
        if self.top_k_hits.max_len() == 0 {
            return self
                .incremental_aggregation
                .virtual_worst_hit()
                .map(Cow::Owned);
        }

        if self.top_k_hits.at_capacity() {
            self.top_k_hits.peek_worst().map(Cow::Borrowed)
        } else {
            None
        }
    }

    /// Finalize the merge, creating a LeafSearchResponse.
    pub(crate) fn finalize(self) -> tantivy::Result<LeafSearchResponse> {
        let intermediate_aggregation_result = self.incremental_aggregation.finalize()?;
        let mut partial_hits = self.top_k_hits.finalize();
        if self.start_offset != 0 {
            partial_hits.drain(0..self.start_offset.min(partial_hits.len()));
        }
        Ok(LeafSearchResponse {
            num_hits: self.num_hits,
            partial_hits,
            failed_splits: self.failed_splits,
            num_attempted_splits: self.num_attempted_splits,
            num_successful_splits: self.num_successful_splits,
            intermediate_aggregation_result,
            resource_stats: self.resource_stats,
        })
    }
}

#[cfg(test)]
mod tests {
    use std::cmp::Ordering;

    use quickwit_proto::search::{
        LeafSearchResponse, PartialHit, ResourceStats, SearchRequest, SortByValue, SortField,
        SortOrder, SortValue, SplitSearchError,
    };
    use tantivy::TantivyDocument;
    use tantivy::aggregation::agg_req::Aggregations;
    use tantivy::aggregation::intermediate_agg_result::IntermediateAggregationResults;
    use tantivy::collector::Collector;

    use super::{IncrementalCollector, make_merge_collector};
    use crate::QuickwitAggregations;
    use crate::collector::{merge_intermediate_aggregation_result, top_k_partial_hits};

    #[test]
    fn test_merge_partial_hits_no_tie() {
        let make_doc = |sort_value: u64| PartialHit {
            sort_value: Some(SortValue::U64(sort_value).into()),
            sort_value2: None,
            split_id: "split1".to_string(),
            segment_ord: 0u32,
            doc_id: 0u32,
        };
        assert_eq!(
            top_k_partial_hits(
                vec![make_doc(1u64), make_doc(3u64), make_doc(2u64),].into_iter(),
                SortOrder::Asc,
                SortOrder::Asc,
                2
            ),
            vec![make_doc(1), make_doc(2)]
        );
    }

    #[test]
    fn test_merge_partial_hits_with_tie() {
        let make_hit_given_split_id = |split_id: u64| PartialHit {
            sort_value: Some(SortValue::U64(0u64).into()),
            sort_value2: None,
            split_id: format!("split_{split_id}"),
            segment_ord: 0u32,
            doc_id: 0u32,
        };
        assert_eq!(
            &top_k_partial_hits(
                vec![
                    make_hit_given_split_id(1u64),
                    make_hit_given_split_id(3u64),
                    make_hit_given_split_id(2u64),
                ]
                .into_iter(),
                SortOrder::Desc,
                SortOrder::Desc,
                2
            ),
            &[make_hit_given_split_id(3), make_hit_given_split_id(2)]
        );
        assert_eq!(
            &top_k_partial_hits(
                vec![
                    make_hit_given_split_id(1u64),
                    make_hit_given_split_id(3u64),
                    make_hit_given_split_id(2u64),
                ]
                .into_iter(),
                SortOrder::Asc,
                SortOrder::Asc,
                2
            ),
            &[make_hit_given_split_id(1), make_hit_given_split_id(2)]
        );
    }

    fn sort_dataset() -> Vec<(Option<u64>, Option<u64>)> {
        // every combination of 0..=2 + None, in random order.
        // (2, 1) is duplicated to allow testing for DocId sorting with two sort fields
        vec![
            (Some(2), Some(1)),
            (Some(0), Some(1)),
            (Some(1), Some(1)),
            (Some(0), Some(0)),
            (None, Some(1)),
            (None, Some(2)),
            (Some(2), Some(1)),
            (Some(1), Some(2)),
            (Some(0), None),
            (None, Some(0)),
            (Some(2), Some(0)),
            (Some(2), Some(2)),
            (Some(0), Some(2)),
            (Some(2), None),
            (None, None),
            (Some(1), Some(0)),
            (Some(1), None),
        ]
    }

    fn make_request(max_hits: u64, sort_fields: &str) -> SearchRequest {
        SearchRequest {
            max_hits,
            sort_fields: sort_fields
                .split(',')
                .filter(|field| !field.is_empty())
                .map(|field| {
                    if let Some(field) = field.strip_prefix('-') {
                        SortField {
                            field_name: field.to_string(),
                            sort_order: SortOrder::Asc.into(),
                            sort_datetime_format: None,
                        }
                    } else {
                        SortField {
                            field_name: field.to_string(),
                            sort_order: SortOrder::Desc.into(),
                            sort_datetime_format: None,
                        }
                    }
                })
                .collect(),
            ..SearchRequest::default()
        }
    }

    fn make_index() -> tantivy::Index {
        use tantivy::Index;
        use tantivy::indexer::UserOperation;
        use tantivy::schema::{NumericOptions, Schema};

        let dataset = sort_dataset();

        let mut schema_builder = Schema::builder();
        let opts = NumericOptions::default().set_fast();

        schema_builder.add_u64_field("sort1", opts.clone());
        schema_builder.add_u64_field("sort2", opts);
        let schema = schema_builder.build();

        let field1 = schema.get_field("sort1").unwrap();
        let field2 = schema.get_field("sort2").unwrap();

        let index = Index::create_in_ram(schema);
        let mut index_writer = index.writer(50_000_000).unwrap();

        index_writer
            .run(
                dataset
                    .into_iter()
                    .map(|(val1, val2)| {
                        let mut doc = TantivyDocument::new();
                        if let Some(val1) = val1 {
                            doc.add_u64(field1, val1);
                        }
                        if let Some(val2) = val2 {
                            doc.add_u64(field2, val2);
                        }
                        doc
                    })
                    .map(UserOperation::Add),
            )
            .unwrap();
        index_writer.commit().unwrap();

        index
    }

    #[test]
    fn test_single_split_sorting() {
        let index = make_index();

        let reader = index.reader().unwrap();
        let searcher = reader.searcher();

        // tuple of DocId and sort value
        type Doc = (usize, (Option<u64>, Option<u64>));

        let mut dataset: Vec<Doc> = sort_dataset().into_iter().enumerate().collect();

        let reverse_int = |val: &Option<u64>| val.as_ref().map(|val| u64::MAX - val);
        let cmp_doc_id_desc = |a: &Doc, b: &Doc| b.0.cmp(&a.0);
        let cmp_doc_id_asc = |a: &Doc, b: &Doc| a.0.cmp(&b.0);
        let cmp_1_desc = |a: &Doc, b: &Doc| b.1.0.cmp(&a.1.0);
        let cmp_1_asc = |a: &Doc, b: &Doc| reverse_int(&b.1.0).cmp(&reverse_int(&a.1.0));
        let cmp_2_desc = |a: &Doc, b: &Doc| b.1.1.cmp(&a.1.1);
        let cmp_2_asc = |a: &Doc, b: &Doc| reverse_int(&b.1.1).cmp(&reverse_int(&a.1.1));

        {
            // the logic for sorting isn't easy to wrap one's head around. These simple tests are
            // here to convince oneself they do what we want them todo
            let mut data = vec![(1, (None, None)), (0, (None, None))];
            let data_copy = data.clone();
            data.sort_by(cmp_doc_id_desc);
            assert_eq!(data, data_copy);

            let mut data = vec![(0, (None, None)), (1, (None, None))];
            let data_copy = data.clone();
            data.sort_by(cmp_doc_id_asc);
            assert_eq!(data, data_copy);

            let mut data = vec![
                (1, (Some(2), None)),
                (0, (Some(1), None)),
                (2, (None, None)),
            ];
            let data_copy = data.clone();
            data.sort_by(cmp_1_desc);
            assert_eq!(data, data_copy);

            let mut data = vec![
                (1, (Some(1), None)),
                (0, (Some(2), None)),
                (2, (None, None)),
            ];
            let data_copy = data.clone();
            data.sort_by(cmp_1_asc);
            assert_eq!(data, data_copy);

            let mut data = vec![
                (1, (None, Some(2))),
                (0, (None, Some(1))),
                (2, (None, None)),
            ];
            let data_copy = data.clone();
            data.sort_by(cmp_2_desc);
            assert_eq!(data, data_copy);

            let mut data = vec![
                (1, (None, Some(1))),
                (0, (None, Some(2))),
                (2, (None, None)),
            ];
            let data_copy = data.clone();
            data.sort_by(cmp_2_asc);
            assert_eq!(data, data_copy);
        }

        #[allow(clippy::type_complexity)]
        let sort_orders: Vec<(_, Box<dyn Fn(&Doc, &Doc) -> Ordering>)> = vec![
            ("", Box::new(cmp_doc_id_desc)),
            (
                "sort1",
                Box::new(|a, b| cmp_1_desc(a, b).then(cmp_doc_id_desc(a, b))),
            ),
            (
                "-sort1",
                Box::new(|a, b| cmp_1_asc(a, b).then(cmp_doc_id_asc(a, b))),
            ),
            (
                "sort1,sort2",
                Box::new(|a, b| {
                    cmp_1_desc(a, b).then(cmp_2_desc(a, b).then(cmp_doc_id_desc(a, b)))
                }),
            ),
            (
                "-sort1,sort2",
                Box::new(|a, b| {
                    cmp_1_asc(a, b)
                        .then(cmp_2_desc(a, b))
                        .then(cmp_doc_id_asc(a, b))
                }),
            ),
            (
                "sort1,-sort2",
                Box::new(|a, b| cmp_1_desc(a, b).then(cmp_2_asc(a, b).then(cmp_doc_id_desc(a, b)))),
            ),
            (
                "-sort1,-sort2",
                Box::new(|a, b| {
                    cmp_1_asc(a, b)
                        .then(cmp_2_asc(a, b))
                        .then(cmp_doc_id_asc(a, b))
                }),
            ),
        ];

        for (sort_str, sort_function) in sort_orders {
            dataset.sort_by(sort_function);
            // Check increasing slice sizes of the dataset
            for slice_len in 0..dataset.len() {
                let collector = super::make_collector_for_split(
                    "fake_split_id".to_string(),
                    &make_request(slice_len as u64, sort_str),
                    Default::default(),
                )
                .unwrap();
                let res = searcher
                    .search(&tantivy::query::AllQuery, &collector)
                    .unwrap();
                assert_eq!(
                    res.partial_hits.len(),
                    slice_len,
                    "mismatch slice_len for \"{sort_str}\":{slice_len}"
                );
                for (expected, got) in dataset.iter().zip(res.partial_hits.iter()) {
                    if expected.0 as u32 != got.doc_id {
                        let expected_docids = dataset
                            .iter()
                            .map(|(docid, val)| {
                                format!("{} {:?} {:?}", *docid as u32, val.0.clone(), val.1.clone())
                            })
                            .collect::<Vec<_>>();
                        let got_docids = res
                            .partial_hits
                            .iter()
                            .map(|hit| {
                                format!(
                                    "{} {:?} {:?}",
                                    hit.doc_id,
                                    hit.sort_value.and_then(|el| el.sort_value).clone(),
                                    hit.sort_value2.and_then(|el| el.sort_value).clone()
                                )
                            })
                            .collect::<Vec<_>>();
                        eprintln!("expected: {expected_docids:#?}");
                        eprintln!("got: {got_docids:#?}");
                        panic!("mismatch ordering for \"{sort_str}\":{slice_len}");
                    }
                }
            }
        }
    }

    #[test]
    fn test_search_after() {
        let index = make_index();

        let reader = index.reader().unwrap();
        let searcher = reader.searcher();

        // tuple of DocId and sort value
        type Doc = (usize, (Option<u64>, Option<u64>));

        let mut dataset: Vec<Doc> = sort_dataset().into_iter().enumerate().collect();

        let reverse_int = |val: &Option<u64>| val.as_ref().map(|val| u64::MAX - val);
        let cmp_doc_id_desc = |a: &Doc, b: &Doc| b.0.cmp(&a.0);
        let cmp_1_desc = |a: &Doc, b: &Doc| b.1.0.cmp(&a.1.0);
        let cmp_2_asc = |a: &Doc, b: &Doc| reverse_int(&b.1.1).cmp(&reverse_int(&a.1.1));

        let sort_function =
            |a: &Doc, b: &Doc| cmp_1_desc(a, b).then(cmp_2_asc(a, b).then(cmp_doc_id_desc(a, b)));
        dataset.sort_by(sort_function);
        let partial_sort_value = dataset
            .iter()
            .map(|(doc_id, (val1, val2))| PartialHit {
                split_id: "fake_split_id".to_string(),
                segment_ord: 0,
                doc_id: *doc_id as u32,
                sort_value: Some(SortByValue {
                    sort_value: val1.map(SortValue::U64),
                }),
                sort_value2: Some(SortByValue {
                    sort_value: val2.map(SortValue::U64),
                }),
            })
            .collect::<Vec<_>>();
        // we eliminate based on sort value
        for (i, search_after) in partial_sort_value.into_iter().enumerate() {
            let request = SearchRequest {
                max_hits: 1000,
                sort_fields: vec![
                    SortField {
                        field_name: "sort1".to_string(),
                        sort_order: SortOrder::Desc.into(),
                        sort_datetime_format: None,
                    },
                    SortField {
                        field_name: "sort2".to_string(),
                        sort_order: SortOrder::Asc.into(),
                        sort_datetime_format: None,
                    },
                ],
                search_after: Some(search_after),
                ..SearchRequest::default()
            };
            let collector = super::make_collector_for_split(
                "fake_split_id".to_string(),
                &request,
                Default::default(),
            )
            .unwrap();
            let res = searcher
                .search(&tantivy::query::AllQuery, &collector)
                .unwrap();
            // we count results even if they were removed due to search_after
            assert_eq!(res.num_hits, dataset.len() as u64);
            // we get as many result as expected
            assert_eq!(res.partial_hits.len(), dataset.len() - i - 1);
            for (expected, got) in dataset[i + 1..].iter().zip(res.partial_hits.iter()) {
                assert_eq!(expected.0 as u32, got.doc_id,);
            }
        }

        // we eliminate based on split id
        {
            let search_after = PartialHit {
                split_id: "fake_split_id2".to_string(),
                segment_ord: 0,
                doc_id: 5,
                sort_value: None,
                sort_value2: None,
            };
            let request = SearchRequest {
                max_hits: 1000,
                sort_fields: vec![SortField {
                    field_name: "_shard_doc".to_string(),
                    sort_order: SortOrder::Desc.into(),
                    sort_datetime_format: None,
                }],
                search_after: Some(search_after),
                ..SearchRequest::default()
            };

            let collector = super::make_collector_for_split(
                "fake_split_id1".to_string(),
                &request,
                Default::default(),
            )
            .unwrap();
            let res = searcher
                .search(&tantivy::query::AllQuery, &collector)
                .unwrap();
            assert_eq!(res.num_hits, dataset.len() as u64);
            // we are searching split id1, and we remove anything before id2 in descending order
            // (i.e. higher than id2 lexicographically), so every document matches
            assert_eq!(res.partial_hits.len(), dataset.len());

            let collector = super::make_collector_for_split(
                "fake_split_id2".to_string(),
                &request,
                Default::default(),
            )
            .unwrap();
            let res = searcher
                .search(&tantivy::query::AllQuery, &collector)
                .unwrap();
            assert_eq!(res.num_hits, dataset.len() as u64);
            // we are searching the limit split, but only doc_id in 0..5
            assert_eq!(res.partial_hits.len(), 5);

            let collector = super::make_collector_for_split(
                "fake_split_id3".to_string(),
                &request,
                Default::default(),
            )
            .unwrap();
            let res = searcher
                .search(&tantivy::query::AllQuery, &collector)
                .unwrap();
            assert_eq!(res.num_hits, dataset.len() as u64);
            // we are searching split id3, and we remove anything before id2 in descending order
            // (i.e. higher than id2 lexicographically), so everything is removed
            assert_eq!(res.partial_hits.len(), 0);
        }
    }

    fn merge_collector_equal_results(
        request: &SearchRequest,
        results: Vec<LeafSearchResponse>,
    ) -> LeafSearchResponse {
        let collector = make_merge_collector(request, Default::default()).unwrap();
        let mut incremental_collector = IncrementalCollector::new(collector.clone());

        let result = collector
            .merge_fruits(results.iter().cloned().map(Ok).collect())
            .unwrap();

        for split_result in results {
            incremental_collector.add_result(split_result).unwrap();
        }

        let incremental_result = incremental_collector.finalize().unwrap();
        assert_eq!(result, incremental_result);
        result
    }

    #[test]
    fn test_merge_collectors() {
        let result = merge_collector_equal_results(
            &SearchRequest {
                start_offset: 0,
                max_hits: 2,
                sort_fields: vec![SortField {
                    field_name: "timestamp".to_string(),
                    sort_order: SortOrder::Desc as i32,
                    sort_datetime_format: None,
                }],
                aggregation_request: None,
                ..Default::default()
            },
            vec![LeafSearchResponse {
                num_hits: 1234,
                partial_hits: vec![PartialHit {
                    split_id: "1".to_string(),
                    segment_ord: 0,
                    doc_id: 123,
                    sort_value: Some(SortValue::I64(1234).into()),
                    sort_value2: None,
                }],
                failed_splits: Vec::new(),
                num_attempted_splits: 3,
                num_successful_splits: 3,
                intermediate_aggregation_result: None,
                resource_stats: None,
            }],
        );

        assert_eq!(
            result,
            LeafSearchResponse {
                num_hits: 1234,
                partial_hits: vec![PartialHit {
                    split_id: "1".to_string(),
                    segment_ord: 0,
                    doc_id: 123,
                    sort_value: Some(SortValue::I64(1234).into()),
                    sort_value2: None,
                }],
                failed_splits: Vec::new(),
                num_attempted_splits: 3,
                num_successful_splits: 3,
                intermediate_aggregation_result: None,
                resource_stats: None,
            }
        );

        let result = merge_collector_equal_results(
            &SearchRequest {
                start_offset: 0,
                max_hits: 2,
                sort_fields: vec![SortField {
                    field_name: "timestamp".to_string(),
                    sort_order: SortOrder::Desc as i32,
                    sort_datetime_format: None,
                }],
                aggregation_request: None,
                ..Default::default()
            },
            vec![
                LeafSearchResponse {
                    num_hits: 1234,
                    partial_hits: vec![
                        PartialHit {
                            split_id: "1".to_string(),
                            segment_ord: 0,
                            doc_id: 123,
                            sort_value: Some(SortValue::I64(1234).into()),
                            sort_value2: None,
                        },
                        PartialHit {
                            split_id: "1".to_string(),
                            segment_ord: 0,
                            doc_id: 125,
                            sort_value: Some(SortValue::I64(1236).into()),
                            sort_value2: None,
                        },
                    ],
                    failed_splits: Vec::new(),
                    num_attempted_splits: 3,
                    num_successful_splits: 3,
                    intermediate_aggregation_result: None,
                    resource_stats: None,
                },
                LeafSearchResponse {
                    num_hits: 10,
                    partial_hits: vec![PartialHit {
                        split_id: "2".to_string(),
                        segment_ord: 0,
                        doc_id: 3,
                        sort_value: Some(SortValue::I64(1235).into()),
                        sort_value2: None,
                    }],
                    failed_splits: vec![SplitSearchError {
                        error: "fake error".to_string(),
                        split_id: "3".to_string(),
                        retryable_error: true,
                    }],
                    num_attempted_splits: 2,
                    num_successful_splits: 1,
                    intermediate_aggregation_result: None,
                    resource_stats: None,
                },
            ],
        );

        assert_eq!(
            result,
            LeafSearchResponse {
                num_hits: 1244,
                partial_hits: vec![
                    PartialHit {
                        split_id: "1".to_string(),
                        segment_ord: 0,
                        doc_id: 125,
                        sort_value: Some(SortValue::I64(1236).into()),
                        sort_value2: None,
                    },
                    PartialHit {
                        split_id: "2".to_string(),
                        segment_ord: 0,
                        doc_id: 3,
                        sort_value: Some(SortValue::I64(1235).into()),
                        sort_value2: None,
                    },
                ],
                failed_splits: vec![SplitSearchError {
                    error: "fake error".to_string(),
                    split_id: "3".to_string(),
                    retryable_error: true,
                }],
                num_attempted_splits: 5,
                num_successful_splits: 4,
                intermediate_aggregation_result: None,
                resource_stats: None,
            }
        );

        // same request, but we reverse sort order
        let result = merge_collector_equal_results(
            &SearchRequest {
                start_offset: 0,
                max_hits: 2,
                sort_fields: vec![SortField {
                    field_name: "timestamp".to_string(),
                    sort_order: SortOrder::Asc as i32,
                    sort_datetime_format: None,
                }],
                aggregation_request: None,
                ..Default::default()
            },
            vec![
                LeafSearchResponse {
                    num_hits: 1234,
                    partial_hits: vec![
                        PartialHit {
                            split_id: "1".to_string(),
                            segment_ord: 0,
                            doc_id: 123,
                            sort_value: Some(SortValue::I64(1234).into()),
                            sort_value2: None,
                        },
                        PartialHit {
                            split_id: "1".to_string(),
                            segment_ord: 0,
                            doc_id: 125,
                            sort_value: Some(SortValue::I64(1236).into()),
                            sort_value2: None,
                        },
                    ],
                    failed_splits: Vec::new(),
                    num_attempted_splits: 3,
                    num_successful_splits: 3,
                    intermediate_aggregation_result: None,
                    resource_stats: Some(ResourceStats {
                        cpu_microsecs: 100,
                        ..Default::default()
                    }),
                },
                LeafSearchResponse {
                    num_hits: 10,
                    partial_hits: vec![PartialHit {
                        split_id: "2".to_string(),
                        segment_ord: 0,
                        doc_id: 3,
                        sort_value: Some(SortValue::I64(1235).into()),
                        sort_value2: None,
                    }],
                    failed_splits: vec![SplitSearchError {
                        error: "fake error".to_string(),
                        split_id: "3".to_string(),
                        retryable_error: true,
                    }],
                    num_attempted_splits: 2,
                    num_successful_splits: 1,
                    intermediate_aggregation_result: None,
                    resource_stats: Some(ResourceStats {
                        cpu_microsecs: 50,
                        ..Default::default()
                    }),
                },
            ],
        );

        assert_eq!(
            result,
            LeafSearchResponse {
                num_hits: 1244,
                partial_hits: vec![
                    PartialHit {
                        split_id: "1".to_string(),
                        segment_ord: 0,
                        doc_id: 123,
                        sort_value: Some(SortValue::I64(1234).into()),
                        sort_value2: None,
                    },
                    PartialHit {
                        split_id: "2".to_string(),
                        segment_ord: 0,
                        doc_id: 3,
                        sort_value: Some(SortValue::I64(1235).into()),
                        sort_value2: None,
                    },
                ],
                failed_splits: vec![SplitSearchError {
                    error: "fake error".to_string(),
                    split_id: "3".to_string(),
                    retryable_error: true,
                }],
                num_attempted_splits: 5,
                num_successful_splits: 4,
                intermediate_aggregation_result: None,
                resource_stats: Some(ResourceStats {
                    cpu_microsecs: 150,
                    ..Default::default()
                }),
            }
        );
        // TODO would be nice to test aggregation too.
    }

    #[test]
    fn test_merge_empty_intermediate_aggregation_result() {
        let merged = merge_intermediate_aggregation_result(&None, std::iter::empty()).unwrap();
        assert!(merged.is_none());

        let aggregations_json = r#"{
            "avg_price": { "avg": { "field": "price" } }
        }"#;
        let ttv_aggregations: Aggregations = serde_json::from_str(aggregations_json).unwrap();
        let qw_aggregations = QuickwitAggregations::TantivyAggregations(ttv_aggregations);
        let serialized =
            merge_intermediate_aggregation_result(&Some(qw_aggregations), std::iter::empty())
                .unwrap()
                .unwrap();
        let _merged: IntermediateAggregationResults = postcard::from_bytes(&serialized).unwrap();
        // Hopefully `_merged` is empty but the API does not allow us to assert that.
    }
}


================================================
FILE: quickwit/quickwit-search/src/error.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use itertools::Itertools;
use quickwit_common::rate_limited_error;
use quickwit_common::retry::Retryable;
use quickwit_doc_mapper::QueryParserError;
use quickwit_proto::error::grpc_error_to_grpc_status;
use quickwit_proto::metastore::{EntityKind, MetastoreError};
use quickwit_proto::search::SplitSearchError;
use quickwit_proto::{GrpcServiceError, ServiceError, ServiceErrorCode, tonic};
use quickwit_storage::StorageResolverError;
use serde::{Deserialize, Serialize};
use tantivy::TantivyError;
use thiserror::Error;
use tokio::task::JoinError;

/// Possible SearchError
#[allow(missing_docs)]
#[derive(Error, Debug, Serialize, Deserialize, Clone)]
#[serde(rename_all = "snake_case")]
pub enum SearchError {
    #[error("could not find indexes matching the IDs `{index_ids:?}`")]
    IndexesNotFound { index_ids: Vec<String> },
    #[error("internal error: `{0}`")]
    Internal(String),
    #[error("invalid aggregation request: {0}")]
    InvalidAggregationRequest(String),
    #[error("Invalid argument: {0}")]
    InvalidArgument(String),
    #[error("{0}")]
    InvalidQuery(String),
    #[error("storage not found: `{0}`)")]
    StorageResolver(#[from] StorageResolverError),
    #[error("request timed out: {0}")]
    Timeout(String),
    #[error("too many requests")]
    TooManyRequests,
    #[error("service unavailable: {0}")]
    Unavailable(String),
}

impl SearchError {
    /// Creates an internal `SearchError` from a list of split search errors.
    pub fn from_split_errors(failed_splits: &[SplitSearchError]) -> Option<SearchError> {
        let first_failing_split = failed_splits.first()?;
        let failed_splits = failed_splits
            .iter()
            .map(|failed_split| &failed_split.split_id)
            .join(", ");
        let error_msg = format!(
            "search failed for the following splits: {failed_splits:}. For instance, split {} \
             failed with the following error message: {}",
            first_failing_split.split_id, first_failing_split.error,
        );
        Some(SearchError::Internal(error_msg))
    }
}

impl ServiceError for SearchError {
    fn error_code(&self) -> ServiceErrorCode {
        match self {
            Self::IndexesNotFound { .. } => ServiceErrorCode::NotFound,
            Self::Internal(error_msg) => {
                rate_limited_error!(limit_per_min = 6, "search internal error: {error_msg}");
                ServiceErrorCode::Internal
            }
            Self::InvalidAggregationRequest(_) => ServiceErrorCode::BadRequest,
            Self::InvalidArgument(_) => ServiceErrorCode::BadRequest,
            Self::InvalidQuery(_) => ServiceErrorCode::BadRequest,
            Self::StorageResolver(storage_err) => {
                rate_limited_error!(
                    limit_per_min = 6,
                    "search's storager resolver internal error: {storage_err}"
                );
                ServiceErrorCode::Internal
            }
            Self::Timeout(_) => ServiceErrorCode::Timeout,
            Self::TooManyRequests => ServiceErrorCode::TooManyRequests,
            Self::Unavailable(_) => ServiceErrorCode::Unavailable,
        }
    }
}

impl GrpcServiceError for SearchError {
    fn new_internal(message: String) -> Self {
        Self::Internal(message)
    }

    fn new_timeout(message: String) -> Self {
        Self::Timeout(message)
    }

    fn new_too_many_requests() -> Self {
        Self::TooManyRequests
    }

    fn new_unavailable(message: String) -> Self {
        Self::Unavailable(message)
    }
}

impl From<SearchError> for tonic::Status {
    fn from(error: SearchError) -> Self {
        grpc_error_to_grpc_status(error)
    }
}

/// Parse tonic error and returns `SearchError`.
pub fn parse_grpc_error(grpc_error: &tonic::Status) -> SearchError {
    // TODO: the serialization to JSON part is missing.
    serde_json::from_str(grpc_error.message())
        .unwrap_or_else(|_| SearchError::Internal(grpc_error.message().to_string()))
}

impl From<TantivyError> for SearchError {
    fn from(tantivy_error: TantivyError) -> Self {
        SearchError::Internal(format!("tantivy error: {tantivy_error}"))
    }
}

impl From<tokio::time::error::Elapsed> for SearchError {
    fn from(_elapsed: tokio::time::error::Elapsed) -> Self {
        SearchError::Timeout("timeout exceeded".to_string())
    }
}

impl From<postcard::Error> for SearchError {
    fn from(error: postcard::Error) -> Self {
        SearchError::Internal(format!("Postcard error: {error}"))
    }
}

impl From<serde_json::Error> for SearchError {
    fn from(serde_error: serde_json::Error) -> Self {
        SearchError::Internal(format!("serde error: {serde_error}"))
    }
}

impl From<anyhow::Error> for SearchError {
    fn from(any_error: anyhow::Error) -> Self {
        SearchError::Internal(any_error.to_string())
    }
}

impl From<QueryParserError> for SearchError {
    fn from(query_parser_error: QueryParserError) -> Self {
        SearchError::InvalidQuery(query_parser_error.to_string())
    }
}

impl From<MetastoreError> for SearchError {
    fn from(metastore_error: MetastoreError) -> SearchError {
        match metastore_error {
            MetastoreError::NotFound(EntityKind::Index { index_id }) => {
                SearchError::IndexesNotFound {
                    index_ids: vec![index_id],
                }
            }
            MetastoreError::NotFound(EntityKind::Indexes { index_ids }) => {
                SearchError::IndexesNotFound { index_ids }
            }
            _ => SearchError::Internal(metastore_error.to_string()),
        }
    }
}

impl Retryable for SearchError {
    fn is_retryable(&self) -> bool {
        matches!(self, SearchError::TooManyRequests | SearchError::Timeout(_))
    }
}

impl From<JoinError> for SearchError {
    fn from(join_error: JoinError) -> SearchError {
        SearchError::Internal(format!("spawned task in root join failed: {join_error}"))
    }
}

impl From<std::convert::Infallible> for SearchError {
    fn from(infallible: std::convert::Infallible) -> SearchError {
        match infallible {}
    }
}


================================================
FILE: quickwit/quickwit-search/src/fetch_docs.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::{BTreeMap, HashMap};
use std::sync::Arc;

use anyhow::{Context, Ok};
use futures::{StreamExt, TryStreamExt};
use itertools::Itertools;
use quickwit_doc_mapper::DocMapper;
use quickwit_proto::search::{
    FetchDocsResponse, PartialHit, SnippetRequest, SplitIdAndFooterOffsets,
};
use quickwit_storage::Storage;
use tantivy::query::Query;
use tantivy::schema::document::CompactDocValue;
use tantivy::schema::{Document as DocumentTrait, Field, TantivyDocument, Value};
use tantivy::snippet::SnippetGenerator;
use tantivy::{ReloadPolicy, Score, Searcher, Term};
use tracing::{Instrument, error};

use crate::leaf::open_index_with_caches;
use crate::service::SearcherContext;
use crate::{GlobalDocAddress, convert_document_to_json_string};

const SNIPPET_MAX_NUM_CHARS: usize = 150;

/// Given a list of global doc address, fetches all the documents and
/// returns them as a hashmap.
async fn fetch_docs_to_map(
    searcher_context: Arc<SearcherContext>,
    mut global_doc_addrs: Vec<GlobalDocAddress>,
    index_storage: Arc<dyn Storage>,
    splits: &[SplitIdAndFooterOffsets],
    doc_mapper: Arc<DocMapper>,
    snippet_request_opt: Option<&SnippetRequest>,
) -> anyhow::Result<HashMap<GlobalDocAddress, Document>> {
    let mut split_fetch_docs_futures = Vec::new();

    let split_offsets_map: HashMap<&str, &SplitIdAndFooterOffsets> = splits
        .iter()
        .map(|split| (split.split_id.as_str(), split))
        .collect();

    // We sort global hit addrs in order to allow for the grouby.
    global_doc_addrs.sort_by(|a, b| a.split.cmp(&b.split));
    for (split_id, global_doc_addrs) in global_doc_addrs
        .iter()
        .chunk_by(|global_doc_addr| global_doc_addr.split.as_str())
        .into_iter()
    {
        let global_doc_addrs: Vec<GlobalDocAddress> =
            global_doc_addrs.into_iter().cloned().collect();
        let split_and_offset = split_offsets_map
            .get(split_id)
            .ok_or_else(|| anyhow::anyhow!("failed to find offset for split {}", split_id))?;
        split_fetch_docs_futures.push(fetch_docs_in_split(
            searcher_context.clone(),
            global_doc_addrs,
            index_storage.clone(),
            split_and_offset,
            doc_mapper.clone(),
            snippet_request_opt,
        ));
    }

    let split_fetch_docs: Vec<Vec<(GlobalDocAddress, Document)>> = futures::future::try_join_all(
        split_fetch_docs_futures,
    )
    .await
    .map_err(|error| {
        let split_ids = splits
            .iter()
            .map(|split| split.split_id.clone())
            .collect_vec();
        error!(split_ids = ?split_ids, error = ?error, "error when fetching docs in splits");
        anyhow::anyhow!(
            "error when fetching docs for splits {:?}: {:?}",
            split_ids,
            error
        )
    })?;

    let global_doc_addr_to_doc_json: HashMap<GlobalDocAddress, Document> = split_fetch_docs
        .into_iter()
        .flat_map(|docs| docs.into_iter())
        .collect();

    Ok(global_doc_addr_to_doc_json)
}

/// `fetch_docs` step of search.
///
/// This function takes a list of partial hits (possibly from different splits)
/// and the storage associated to an index, fetches the document from
/// the split document stores, and returns the full hits.
pub async fn fetch_docs(
    searcher_context: Arc<SearcherContext>,
    partial_hits: Vec<PartialHit>,
    index_storage: Arc<dyn Storage>,
    splits: &[SplitIdAndFooterOffsets],
    doc_mapper: Arc<DocMapper>,
    snippet_request_opt: Option<&SnippetRequest>,
) -> anyhow::Result<FetchDocsResponse> {
    let global_doc_addrs: Vec<GlobalDocAddress> = partial_hits
        .iter()
        .map(GlobalDocAddress::from_partial_hit)
        .collect();

    let mut global_doc_addr_to_doc_json = fetch_docs_to_map(
        searcher_context,
        global_doc_addrs,
        index_storage,
        splits,
        doc_mapper,
        snippet_request_opt,
    )
    .await?;

    let hits: Vec<quickwit_proto::search::LeafHit> = partial_hits
        .into_iter()
        .flat_map(|partial_hit| {
            let global_doc_addr = GlobalDocAddress::from_partial_hit(&partial_hit);
            if let Some((_, document)) = global_doc_addr_to_doc_json.remove_entry(&global_doc_addr)
            {
                Some(quickwit_proto::search::LeafHit {
                    leaf_json: document.content_json,
                    partial_hit: Some(partial_hit),
                    leaf_snippet_json: document.snippet_json,
                })
            } else {
                None
            }
        })
        .collect();
    Ok(FetchDocsResponse { hits })
}

// number of concurrent fetch allowed for a single split.
const NUM_CONCURRENT_REQUESTS: usize = 30;

/// A struct for holding a fetched document's content and snippet.
#[derive(Debug)]
struct Document {
    content_json: String,
    snippet_json: Option<String>,
}

/// Fetching docs from a specific split.
async fn fetch_docs_in_split(
    searcher_context: Arc<SearcherContext>,
    mut global_doc_addrs: Vec<GlobalDocAddress>,
    index_storage: Arc<dyn Storage>,
    split: &SplitIdAndFooterOffsets,
    doc_mapper: Arc<DocMapper>,
    snippet_request_opt: Option<&SnippetRequest>,
) -> anyhow::Result<Vec<(GlobalDocAddress, Document)>> {
    global_doc_addrs.sort_by_key(|doc| doc.doc_addr);
    // Opens the index without the ephemeral unbounded cache, this cache is indeed not useful
    // when fetching docs as we will fetch them only once.
    let (mut index, _) = open_index_with_caches(
        &searcher_context,
        index_storage,
        split,
        Some(doc_mapper.tokenizer_manager()),
        None,
    )
    .await
    .context("open-index-for-split")?;
    // we add an executor here, we could add it in open_index_with_caches, though we should verify
    // the side-effect before
    let tantivy_executor = crate::search_thread_pool()
        .get_underlying_rayon_thread_pool()
        .into();
    index.set_executor(tantivy_executor);
    let index_reader = index
        .reader_builder()
        // the docs are presorted so a cache size of NUM_CONCURRENT_REQUESTS is fine
        .doc_store_cache_num_blocks(NUM_CONCURRENT_REQUESTS)
        .reload_policy(ReloadPolicy::Manual)
        .try_into()?;
    let searcher = Arc::new(index_reader.searcher());
    let fields_snippet_generator_opt = if let Some(snippet_request) = snippet_request_opt {
        Some(create_fields_snippet_generator(&searcher, doc_mapper.clone(), snippet_request).await?)
    } else {
        None
    };

    let doc_futures = global_doc_addrs.into_iter().map(|global_doc_addr| {
        let moved_searcher = searcher.clone();
        let moved_doc_mapper = doc_mapper.clone();
        let fields_snippet_generator_opt_clone = fields_snippet_generator_opt.clone();
        async move {
            let doc: TantivyDocument = moved_searcher
                .doc_async(global_doc_addr.doc_addr)
                .await
                .context("searcher-doc-async")?;

            let named_field_doc = doc.to_named_doc(moved_searcher.schema());
            let content_json = convert_document_to_json_string(named_field_doc, &moved_doc_mapper)?;
            if fields_snippet_generator_opt_clone.is_none() {
                return Ok((
                    global_doc_addr,
                    Document {
                        content_json,
                        snippet_json: None,
                    },
                ));
            }

            let fields_snippet_generator_clone = fields_snippet_generator_opt_clone.unwrap();
            if fields_snippet_generator_clone.is_empty() {
                return Ok((
                    global_doc_addr,
                    Document {
                        content_json,
                        snippet_json: None,
                    },
                ));
            }

            let mut snippets = HashMap::new();
            for (field, field_values) in doc.get_sorted_field_values() {
                let field_name = moved_searcher.schema().get_field_name(field);
                if let Some(values) = fields_snippet_generator_clone
                    .snippets_from_field_values(field_name, field_values)
                {
                    snippets.insert(field_name, values);
                }
            }
            let snippet_json = serde_json::to_string(&snippets)?;
            Ok((
                global_doc_addr,
                Document {
                    content_json,
                    snippet_json: Some(snippet_json),
                },
            ))
        }
        .in_current_span()
    });

    futures::stream::iter(doc_futures)
        .buffer_unordered(NUM_CONCURRENT_REQUESTS)
        .try_collect::<Vec<_>>()
        .await
}

// A struct to hold the snippet generators associated to
// the snippet fields from a search request.
#[derive(Clone)]
struct FieldsSnippetGenerator {
    field_generators: Arc<HashMap<String, SnippetGenerator>>,
}

impl FieldsSnippetGenerator {
    // Returns the  snippets from fields values.
    fn snippets_from_field_values(
        &self,
        field_name: &str,
        field_values: Vec<CompactDocValue<'_>>,
    ) -> Option<Vec<String>> {
        if let Some(snippet_generator) = self.field_generators.get(field_name) {
            let values = field_values
                .into_iter()
                .filter_map(|value| {
                    value.as_str().and_then(|text| {
                        let snippet = snippet_generator.snippet(text);
                        match snippet.is_empty() {
                            false => Some(snippet.to_html()),
                            _ => None,
                        }
                    })
                })
                .collect();
            Some(values)
        } else {
            None
        }
    }

    fn is_empty(&self) -> bool {
        self.field_generators.is_empty()
    }
}

// Creates FieldsSnippetGenerator.
async fn create_fields_snippet_generator(
    searcher: &Searcher,
    doc_mapper: Arc<DocMapper>,
    snippet_request: &SnippetRequest,
) -> anyhow::Result<FieldsSnippetGenerator> {
    let schema = searcher.schema();
    let query_ast_resolved = serde_json::from_str(&snippet_request.query_ast_resolved)
        .context("failed to deserialize QueryAst")?;
    let (query, _) = doc_mapper.query(schema.clone(), query_ast_resolved, false, None)?;
    let mut snippet_generators = HashMap::new();
    for field_name in &snippet_request.snippet_fields {
        let field = schema.get_field(field_name)?;
        let snippet_generator = create_snippet_generator(searcher, &query, field).await?;
        snippet_generators.insert(field_name.clone(), snippet_generator);
    }

    Ok(FieldsSnippetGenerator {
        field_generators: Arc::new(snippet_generators),
    })
}

// Creates a snippet generator associated to a field.
async fn create_snippet_generator(
    searcher: &Searcher,
    query: &dyn Query,
    field: Field,
) -> anyhow::Result<SnippetGenerator> {
    let mut terms: Vec<&Term> = Vec::new();
    // TODO ok with termset?
    query.query_terms(&mut |term, _need_position| {
        if term.field() == field {
            terms.push(term);
        }
    });
    let mut terms_text: BTreeMap<String, f32> = BTreeMap::default();
    for term in terms {
        let value = term.value();
        let Some(term_str) = value.as_str() else {
            continue;
        };
        let doc_freq = searcher.doc_freq_async(term).await?;
        if doc_freq > 0 {
            let score = 1.0 / (1.0 + doc_freq as Score);
            terms_text.insert(term_str.to_string(), score);
        }
    }
    let tokenizer = searcher.index().tokenizer_for_field(field)?;
    Ok(SnippetGenerator::new(
        terms_text,
        tokenizer,
        field,
        SNIPPET_MAX_NUM_CHARS,
    ))
}


================================================
FILE: quickwit/quickwit-search/src/find_trace_ids_collector.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::cmp::{Ord, Ordering};
use std::collections::HashSet;

use fnv::{FnvHashMap, FnvHashSet};
use itertools::Itertools;
use quickwit_proto::search::TraceId;
use serde::{Deserialize, Serialize};
use tantivy::collector::{Collector, SegmentCollector};
use tantivy::columnar::BytesColumn;
use tantivy::fastfield::Column;
use tantivy::{DateTime, DocId, Score, SegmentReader};

type TermOrd = u64;

#[derive(Debug, Clone, Serialize, Deserialize)]
/// Metadata about a single span
pub struct Span {
    /// The trace id this span is part of
    pub trace_id: TraceId,
    /// The start timestamp of the span
    #[serde(with = "serde_datetime")]
    pub span_timestamp: DateTime,
}

impl Span {
    fn new(trace_id: TraceId, span_timestamp: DateTime) -> Self {
        Self {
            trace_id,
            span_timestamp,
        }
    }
}

impl Ord for Span {
    fn cmp(&self, other: &Self) -> Ordering {
        self.span_timestamp
            .cmp(&other.span_timestamp)
            .reverse()
            .then(self.trace_id.cmp(&other.trace_id))
    }
}

impl PartialOrd for Span {
    fn partial_cmp(&self, other: &Self) -> Option<Ordering> {
        Some(self.cmp(other))
    }
}

impl PartialEq for Span {
    fn eq(&self, other: &Self) -> bool {
        self.cmp(other) == Ordering::Equal
    }
}

impl Eq for Span {}

#[derive(Debug)]
pub struct TraceIdTermOrd {
    pub term_ord: TermOrd,
    pub span_timestamp: DateTime,
}

impl TraceIdTermOrd {
    pub fn new(term_ord: TermOrd, span_timestamp: DateTime) -> Self {
        Self {
            term_ord,
            span_timestamp,
        }
    }
}

impl Ord for TraceIdTermOrd {
    fn cmp(&self, other: &Self) -> Ordering {
        self.span_timestamp
            .cmp(&other.span_timestamp)
            .reverse()
            .then(self.term_ord.cmp(&other.term_ord))
    }
}

impl PartialOrd for TraceIdTermOrd {
    fn partial_cmp(&self, other: &Self) -> Option<Ordering> {
        Some(self.cmp(other))
    }
}

impl PartialEq for TraceIdTermOrd {
    fn eq(&self, other: &Self) -> bool {
        self.cmp(other) == Ordering::Equal
    }
}

impl Eq for TraceIdTermOrd {}

/// Finds the most recent trace ids among a set of matching spans. Multiple spans belonging to the
/// same trace can be found in the document set. As a result, this problem is akin to finding the
/// top k elements with duplicates
#[derive(Debug, Clone, PartialEq, Serialize, Deserialize)]
pub struct FindTraceIdsCollector {
    /// The number of traces to select.
    pub num_traces: usize,
    /// The name of the fast field storing the trace IDs.
    pub trace_id_field_name: String,
    /// The name of the fast field recording the spans' start timestamp.
    pub span_timestamp_field_name: String,
}

impl FindTraceIdsCollector {
    /// The names of the fast fields accessed by this collector.
    pub fn fast_field_names(&self) -> HashSet<String> {
        HashSet::from_iter([
            self.trace_id_field_name.clone(),
            self.span_timestamp_field_name.clone(),
        ])
    }

    /// The field names of the term dictionaries accessed by this collector.
    pub fn term_dict_field_names(&self) -> HashSet<String> {
        HashSet::from_iter([self.trace_id_field_name.clone()])
    }
}

impl Collector for FindTraceIdsCollector {
    type Fruit = Vec<Span>;
    type Child = FindTraceIdsSegmentCollector;

    fn for_segment(
        &self,
        _segment_local_id: u32,
        segment_reader: &SegmentReader,
    ) -> tantivy::Result<Self::Child> {
        let trace_id_column = segment_reader
            .fast_fields()
            .bytes(&self.trace_id_field_name)?
            .ok_or_else(|| {
                let err_msg = format!(
                    "failed to find column for trace_id field `{}`",
                    self.trace_id_field_name
                );
                tantivy::TantivyError::InternalError(err_msg)
            })?;
        let span_timestamp_column: Column<DateTime> = segment_reader
            .fast_fields()
            .date(&self.span_timestamp_field_name)?;
        Ok(FindTraceIdsSegmentCollector {
            trace_id_column,
            span_timestamp_column,
            select_trace_ids: SelectTraceIds::new(self.num_traces),
        })
    }

    fn merge_fruits(
        &self,
        segment_fruits: Vec<<Self::Child as SegmentCollector>::Fruit>,
    ) -> tantivy::Result<Self::Fruit> {
        Ok(merge_segment_fruits(segment_fruits, self.num_traces))
    }

    fn requires_scoring(&self) -> bool {
        false
    }
}

fn merge_segment_fruits(mut segment_fruits: Vec<Vec<Span>>, num_traces: usize) -> Vec<Span> {
    // Spans are ordered in reverse order of their timestamp.
    for segment_fruit in &mut segment_fruits {
        segment_fruit.sort_unstable()
    }
    let mut spans: Vec<Span> = Vec::with_capacity(num_traces);
    let mut seen_trace_ids: FnvHashSet<TraceId> = FnvHashSet::default();

    for span in segment_fruits.into_iter().kmerge() {
        if seen_trace_ids.insert(span.trace_id) {
            spans.push(span);

            if spans.len() == num_traces {
                break;
            }
        }
    }
    spans
}

pub struct FindTraceIdsSegmentCollector {
    trace_id_column: BytesColumn,
    span_timestamp_column: Column<DateTime>,
    select_trace_ids: SelectTraceIds,
}

impl FindTraceIdsSegmentCollector {
    fn trace_id_term_ord(&self, doc: DocId) -> TermOrd {
        self.trace_id_column
            .term_ords(doc)
            .next()
            .unwrap_or_default()
    }

    fn span_timestamp(&self, doc: DocId) -> DateTime {
        self.span_timestamp_column.first(doc).unwrap_or_default()
    }
}

impl SegmentCollector for FindTraceIdsSegmentCollector {
    type Fruit = Vec<Span>;

    fn collect(&mut self, doc: DocId, _score: Score) {
        let term_ord = self.trace_id_term_ord(doc);
        let span_timestamp = self.span_timestamp(doc);
        self.select_trace_ids.collect(term_ord, span_timestamp);
    }

    fn harvest(self) -> Self::Fruit {
        let mut buffer = Vec::with_capacity(TraceId::HEX_LENGTH);
        self.select_trace_ids
            .harvest()
            .into_iter()
            .map(|trace_id_term_ord| {
                let span_timestamp = trace_id_term_ord.span_timestamp;
                let found_term = self
                    .trace_id_column
                    .ord_to_bytes(trace_id_term_ord.term_ord, &mut buffer)
                    .expect("Failed to lookup trace ID in the column term dictionary");
                debug_assert!(found_term);
                let trace_id = TraceId::try_from(buffer.as_slice())
                    .expect("The term dict should store valid trace IDs.");
                Span::new(trace_id, span_timestamp)
            })
            .collect()
    }
}

struct SelectTraceIds {
    num_traces: usize,
    dedup_workbench: FnvHashMap<TermOrd, DateTime>,
    select_workbench: Vec<TraceIdTermOrd>,
    running_term_ord: Option<TermOrd>,
    running_span_timestamp: DateTime,
    // This is the lowest timestamp required to enter our top K.
    span_timestamp_sentinel: DateTime,
}

impl SelectTraceIds {
    fn new(num_traces: usize) -> Self {
        Self {
            num_traces,
            dedup_workbench: FnvHashMap::with_capacity_and_hasher(
                2 * num_traces,
                Default::default(),
            ),
            select_workbench: Vec::with_capacity(2 * num_traces),
            running_term_ord: None,
            running_span_timestamp: DateTime::default(),
            span_timestamp_sentinel: DateTime::from_timestamp_nanos(i64::MIN),
        }
    }

    fn collect(&mut self, term_ord: TermOrd, span_timestamp: DateTime) {
        if self.running_term_ord.is_none() {
            self.running_term_ord = Some(term_ord);
            self.running_span_timestamp = span_timestamp;
            return;
        }
        if self.span_timestamp_sentinel >= span_timestamp {
            return;
        }
        let running_term_ord = self
            .running_term_ord
            .expect("The running trace ID should be set.");

        if running_term_ord == term_ord {
            self.running_span_timestamp = self.running_span_timestamp.max(span_timestamp);
        } else {
            self.dedup(running_term_ord, self.running_span_timestamp);
            self.truncate();
            self.running_term_ord = Some(term_ord);
            self.running_span_timestamp = span_timestamp;
        }
    }

    fn dedup(&mut self, term_ord: TermOrd, span_timestamp: DateTime) {
        self.dedup_workbench
            .entry(term_ord)
            .and_modify(|entry| {
                if *entry < span_timestamp {
                    *entry = span_timestamp
                }
            })
            .or_insert(span_timestamp);
    }

    fn select(&mut self) {
        if self.num_traces == 0 || self.dedup_workbench.is_empty() {
            return;
        }
        self.select_workbench.clear();

        for (term_ord, span_timestamp) in self.dedup_workbench.drain() {
            let trace_id = TraceIdTermOrd::new(term_ord, span_timestamp);
            self.select_workbench.push(trace_id);
        }
        let select_len = self.num_traces.min(self.select_workbench.len());
        let select_index = select_len - 1;
        self.select_workbench.select_nth_unstable(select_index);
        self.select_workbench.truncate(select_len);
        self.span_timestamp_sentinel = self.select_workbench[select_index].span_timestamp;
    }

    fn truncate(&mut self) {
        if self.dedup_workbench.len() < 2 * self.num_traces {
            return;
        }
        self.select();
        for trace_id in self.select_workbench.drain(..self.num_traces) {
            self.dedup_workbench
                .insert(trace_id.term_ord, trace_id.span_timestamp);
        }
    }

    fn harvest(mut self) -> Vec<TraceIdTermOrd> {
        if let Some(running_term_ord) = self.running_term_ord.take() {
            self.dedup(running_term_ord, self.running_span_timestamp);
        }
        self.select();
        self.select_workbench
    }
}

mod serde_datetime {
    use serde::{Deserialize, Deserializer, Serializer};
    use tantivy::DateTime;

    pub(crate) fn serialize<S>(datetime: &DateTime, serializer: S) -> Result<S::Ok, S::Error>
    where S: Serializer {
        serializer.serialize_i64(datetime.into_timestamp_nanos())
    }

    pub(crate) fn deserialize<'de, D>(deserializer: D) -> Result<DateTime, D::Error>
    where D: Deserializer<'de> {
        let datetime_i64: i64 = Deserialize::deserialize(deserializer)?;
        Ok(DateTime::from_timestamp_nanos(datetime_i64))
    }
}

#[cfg(test)]
mod tests {
    use tantivy::DateTime;
    use tantivy::time::OffsetDateTime;

    use super::*;
    use crate::collector::QuickwitAggregations;

    impl Span {
        fn for_test(bytes: &[u8], span_timestamp_nanos: i64) -> Self {
            let mut trace_id = [0u8; 16];
            trace_id[..bytes.len()].copy_from_slice(bytes);
            let span_timestamp = DateTime::from_timestamp_nanos(span_timestamp_nanos);
            Self::new(TraceId::new(trace_id), span_timestamp)
        }
    }

    impl TraceIdTermOrd {
        fn for_test(term_ord: TermOrd, span_timestamp_nanos: i64) -> Self {
            Self {
                term_ord,
                span_timestamp: DateTime::from_timestamp_nanos(span_timestamp_nanos),
            }
        }
    }

    impl SelectTraceIds {
        fn collect_for_test(&mut self, term_ord: TermOrd, span_timestamp_nanos: i64) {
            let span_timestamp = DateTime::from_timestamp_nanos(span_timestamp_nanos);
            self.collect(term_ord, span_timestamp)
        }
    }

    #[test]
    fn test_find_trace_ids_collector_serde() {
        let collector_json = serde_json::to_string(&FindTraceIdsCollector {
            num_traces: 10,
            trace_id_field_name: "trace_id".to_string(),
            span_timestamp_field_name: "span_timestamp".to_string(),
        })
        .unwrap();
        let aggregation: QuickwitAggregations = serde_json::from_str(&collector_json).unwrap();
        let QuickwitAggregations::FindTraceIdsAggregation(collector) = aggregation else {
            panic!("Expected FindTraceIdsAggregation");
        };
        assert_eq!(collector.num_traces, 10);
        assert_eq!(collector.trace_id_field_name, "trace_id");
        assert_eq!(collector.span_timestamp_field_name, "span_timestamp");
    }

    #[test]
    fn test_span_serde() {
        let span_timestamp_nanos = OffsetDateTime::now_utc().unix_timestamp_nanos() as i64;
        let expected_span = Span::for_test(b"trace_id", span_timestamp_nanos);
        let span_json = serde_json::to_string(&expected_span).unwrap();
        let span = serde_json::from_str::<Span>(&span_json).unwrap();
        assert_eq!(span, expected_span);
    }

    #[test]
    fn test_select_trace_ids() {
        {
            let select_trace_ids = SelectTraceIds::new(0);
            let mut trace_ids = select_trace_ids.harvest();
            trace_ids.sort();
            assert_eq!(trace_ids, &[]);
        }
        {
            let select_trace_ids = SelectTraceIds::new(3);

            let mut trace_ids = select_trace_ids.harvest();
            trace_ids.sort();

            assert_eq!(trace_ids, &[]);
        }
        {
            let mut select_trace_ids = SelectTraceIds::new(0);
            select_trace_ids.collect_for_test(0, 0);

            let mut trace_ids = select_trace_ids.harvest();
            trace_ids.sort();

            assert_eq!(trace_ids, &[]);
        }
        {
            let mut select_trace_ids = SelectTraceIds::new(3);
            select_trace_ids.collect_for_test(0, 0);

            let mut trace_ids = select_trace_ids.harvest();
            trace_ids.sort();

            assert_eq!(trace_ids, &[TraceIdTermOrd::for_test(0, 0)]);
        }
        {
            let mut select_trace_ids = SelectTraceIds::new(3);
            select_trace_ids.collect_for_test(0, 1);
            select_trace_ids.collect_for_test(0, 0);

            let mut trace_ids = select_trace_ids.harvest();
            trace_ids.sort();

            assert_eq!(trace_ids, &[TraceIdTermOrd::for_test(0, 1)]);
        }
        {
            let mut select_trace_ids = SelectTraceIds::new(3);
            select_trace_ids.collect_for_test(0, 2);
            select_trace_ids.collect_for_test(1, 1);
            select_trace_ids.collect_for_test(2, 0);

            let mut trace_ids = select_trace_ids.harvest();
            trace_ids.sort();

            assert_eq!(
                trace_ids,
                &[
                    TraceIdTermOrd::for_test(0, 2),
                    TraceIdTermOrd::for_test(1, 1),
                    TraceIdTermOrd::for_test(2, 0),
                ]
            );
        }
        {
            let mut select_trace_ids = SelectTraceIds::new(3);
            select_trace_ids.collect_for_test(0, 7);
            select_trace_ids.collect_for_test(1, 6);
            select_trace_ids.collect_for_test(2, 5);
            select_trace_ids.collect_for_test(3, 4);
            select_trace_ids.collect_for_test(4, 3);
            select_trace_ids.collect_for_test(5, 2);
            select_trace_ids.collect_for_test(6, 1);
            select_trace_ids.collect_for_test(7, 0);

            assert_eq!(select_trace_ids.select_workbench.capacity(), 6);

            let mut trace_ids = select_trace_ids.harvest();
            trace_ids.sort();

            assert_eq!(
                trace_ids,
                &[
                    TraceIdTermOrd::for_test(0, 7),
                    TraceIdTermOrd::for_test(1, 6),
                    TraceIdTermOrd::for_test(2, 5),
                ]
            );
        }
    }

    #[test]
    fn test_merge_segment_fruits() {
        {
            let segment_fruits = Vec::new();
            let merged_fruit = merge_segment_fruits(segment_fruits, 0);
            assert_eq!(merged_fruit, &[]);
        }
        {
            let segment_fruits = vec![vec![Span::for_test(b"foo", 0), Span::for_test(b"foo", 1)]];
            let merged_fruit = merge_segment_fruits(segment_fruits, 3);
            assert_eq!(merged_fruit, &[Span::for_test(b"foo", 1)]);
        }
        {
            let segment_fruits = vec![
                vec![Span::for_test(b"foo", 0), Span::for_test(b"foo", 1)],
                vec![Span::for_test(b"foo", 1), Span::for_test(b"foo", 2)],
            ];
            let merged_fruit = merge_segment_fruits(segment_fruits, 3);
            assert_eq!(merged_fruit, &[Span::for_test(b"foo", 2)]);
        }
        {
            let segment_fruits = vec![
                vec![
                    Span::for_test(b"foo", 0),
                    Span::for_test(b"foo", 1),
                    Span::for_test(b"foo", 2),
                ],
                vec![Span::for_test(b"foo", 2), Span::for_test(b"bar", 2)],
                vec![Span::for_test(b"foo", 2), Span::for_test(b"bar", 3)],
            ];
            let merged_fruit = merge_segment_fruits(segment_fruits, 3);
            assert_eq!(
                merged_fruit,
                &[Span::for_test(b"bar", 3), Span::for_test(b"foo", 2)]
            );
        }
        {
            let segment_fruits = vec![
                vec![
                    Span::for_test(b"foo", 0),
                    Span::for_test(b"foo", 1),
                    Span::for_test(b"foo", 2),
                ],
                vec![Span::for_test(b"foo", 2), Span::for_test(b"bar", 2)],
                vec![Span::for_test(b"foo", 2), Span::for_test(b"bar", 3)],
                vec![Span::for_test(b"qux", 4)],
            ];
            let merged_fruit = merge_segment_fruits(segment_fruits, 3);
            assert_eq!(
                merged_fruit,
                &[
                    Span::for_test(b"qux", 4),
                    Span::for_test(b"bar", 3),
                    Span::for_test(b"foo", 2)
                ]
            );
        }
    }

    use proptest::prelude::*;

    fn span_strategy() -> impl Strategy<Value = Span> {
        let trace_id_strat = proptest::array::uniform16(any::<u8>());
        let span_timestamp_strat = any::<i64>();
        (trace_id_strat, span_timestamp_strat).prop_map(|(trace_id, span_timestamp)| {
            Span::new(
                TraceId::new(trace_id),
                tantivy::DateTime::from_timestamp_nanos(span_timestamp),
            )
        })
    }

    fn test_postcard_aux<I: Serialize + std::fmt::Debug + for<'a> Deserialize<'a> + Eq>(item: &I) {
        let payload = postcard::to_allocvec(item).unwrap();
        let deserialized_item: I = postcard::from_bytes(&payload).unwrap();
        assert_eq!(item, &deserialized_item);
    }

    #[test]
    fn test_proptest_spans_postcard_empty_vec() {
        test_postcard_aux(&Vec::<Span>::new());
    }

    #[test]
    fn test_proptest_spans_postcard_extreme_values() {
        test_postcard_aux(&vec![Span {
            trace_id: TraceId::new([255u8; 16]),
            span_timestamp: tantivy::DateTime::from_timestamp_nanos(i64::MIN),
        }]);
    }

    proptest::proptest! {

        #[test]
        fn test_proptest_spans_postcard_serdeser(span in span_strategy()) {
            test_postcard_aux(&span);
        }

        #[test]
        fn test_proptest_spans_vec_postcard_serdeser(spans in proptest::collection::vec(span_strategy(), 0..100)) {
            test_postcard_aux(&spans);
        }
    }
}


================================================
FILE: quickwit/quickwit-search/src/invoker.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

//! Trait for invoking remote serverless functions for leaf search.

use async_trait::async_trait;
use quickwit_proto::search::{LambdaSingleSplitResult, LeafSearchRequest};

use crate::SearchError;

/// Trait for invoking remote serverless functions (e.g., AWS Lambda) for leaf search.
///
/// This abstraction allows different cloud providers to be supported.
/// Implementations are provided by the `quickwit-lambda` crate.
#[async_trait]
pub trait LambdaLeafSearchInvoker: Send + Sync + 'static {
    /// Invoke the remote function with a LeafSearchRequest.
    ///
    /// Returns one `LambdaSingleSplitResult` per split in the request.
    /// Each result is tagged with its split_id so ordering is irrelevant.
    /// Individual split failures are reported per-split; the outer `Result`
    /// only represents transport-level errors.
    async fn invoke_leaf_search(
        &self,
        request: LeafSearchRequest,
    ) -> Result<Vec<LambdaSingleSplitResult>, SearchError>;
}

#[async_trait]
impl<T> LambdaLeafSearchInvoker for Box<T>
where T: LambdaLeafSearchInvoker + ?Sized
{
    async fn invoke_leaf_search(
        &self,
        request: LeafSearchRequest,
    ) -> Result<Vec<LambdaSingleSplitResult>, SearchError> {
        (**self).invoke_leaf_search(request).await
    }
}

#[async_trait]
impl<T> LambdaLeafSearchInvoker for std::sync::Arc<T>
where T: LambdaLeafSearchInvoker + ?Sized
{
    async fn invoke_leaf_search(
        &self,
        request: LeafSearchRequest,
    ) -> Result<Vec<LambdaSingleSplitResult>, SearchError> {
        (**self).invoke_leaf_search(request).await
    }
}


================================================
FILE: quickwit/quickwit-search/src/leaf.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::cmp::Reverse;
use std::collections::binary_heap::PeekMut;
use std::collections::{BinaryHeap, HashMap, HashSet};
use std::num::NonZeroUsize;
use std::ops::Bound;
use std::path::PathBuf;
use std::str::FromStr;
use std::sync::{Arc, Mutex, RwLock};
use std::time::{Duration, Instant};

use anyhow::Context;
use bytesize::ByteSize;
use futures::future::try_join_all;
use quickwit_common::pretty::PrettySample;
use quickwit_common::uri::Uri;
use quickwit_directories::{CachingDirectory, HotDirectory, StorageDirectory};
use quickwit_doc_mapper::{Automaton, DocMapper, FastFieldWarmupInfo, TermRange, WarmupInfo};
use quickwit_proto::search::lambda_single_split_result::Outcome;
use quickwit_proto::search::{
    CountHits, LeafSearchRequest, LeafSearchResponse, PartialHit, ResourceStats, SearchRequest,
    SortOrder, SortValue, SplitIdAndFooterOffsets, SplitSearchError,
};
use quickwit_query::query_ast::{
    BoolQuery, CacheNode, QueryAst, QueryAstTransformer, RangeQuery, TermQuery,
};
use quickwit_query::tokenizers::TokenizerManager;
use quickwit_storage::{
    BundleStorage, ByteRangeCache, MemorySizedCache, OwnedBytes, SplitCache, Storage,
    StorageResolver, TimeoutAndRetryStorage, wrap_storage_with_cache,
};
use tantivy::aggregation::AggContextParams;
use tantivy::aggregation::agg_req::{AggregationVariants, Aggregations};
use tantivy::collector::Collector;
use tantivy::directory::FileSlice;
use tantivy::fastfield::FastFieldReaders;
use tantivy::schema::Field;
use tantivy::{DateTime, Index, ReloadPolicy, Searcher, TantivyError, Term};
use tokio::task::{JoinError, JoinSet};
use tracing::*;

use crate::collector::{IncrementalCollector, make_collector_for_split, make_merge_collector};
use crate::leaf_cache::LeafSearchCache;
use crate::metrics::SplitSearchOutcomeCounters;
use crate::root::is_metadata_count_request_with_ast;
use crate::search_permit_provider::{
    SearchPermit, SearchPermitFuture, compute_initial_memory_allocation,
};
use crate::service::{SearcherContext, deserialize_doc_mapper};
use crate::{QuickwitAggregations, SearchError};

/// Distributes items across batches using a greedy LPT (Longest Processing Time)
/// algorithm to balance total weight across batches.
///
/// Items are sorted by weight descending, then each item is assigned to the
/// batch with the smallest current total weight. This produces a good
/// approximation of balanced batches.
fn greedy_batch_split<T>(
    items: Vec<T>,
    weight_fn: impl Fn(&T) -> u64,
    max_items_per_batch: NonZeroUsize,
) -> Vec<Vec<T>> {
    if items.is_empty() {
        return Vec::new();
    }

    let num_items = items.len();
    let max_items_per_batch: usize = max_items_per_batch.get();
    let num_batches = num_items.div_ceil(max_items_per_batch);

    // Compute weights, then sort descending by weight
    let mut weighted_items: Vec<(u64, T)> = Vec::with_capacity(num_items);
    for item in items {
        let weight = weight_fn(&item);
        weighted_items.push((weight, item));
    }
    weighted_items.sort_unstable_by_key(|(weight, _)| std::cmp::Reverse(*weight));

    let mut batches: Vec<Vec<T>> = std::iter::repeat_with(Vec::new).take(num_batches).collect();

    // Min-heap of (weight, item_count, batch_index).
    // Reverse turns BinaryHeap into a min-heap.
    // Ties break naturally: lighter weight → fewer items → lower index.
    let mut heap: BinaryHeap<Reverse<(u64, usize, usize)>> = BinaryHeap::with_capacity(num_batches);
    for batch_idx in 0..num_batches {
        heap.push(Reverse((0, 0, batch_idx)));
    }

    // Greedily assign each item to the lightest batch.
    // Full batches are removed via PeekMut::pop().
    for (weight, item) in weighted_items {
        let mut top = heap.peek_mut().unwrap();
        let Reverse((ref mut batch_weight, ref mut batch_count, batch_idx)) = *top;
        batches[batch_idx].push(item);
        *batch_weight += weight;
        *batch_count += 1;
        if *batch_count >= max_items_per_batch {
            PeekMut::pop(top);
        }
    }

    batches
}

async fn get_split_footer_from_cache_or_fetch(
    index_storage: Arc<dyn Storage>,
    split_and_footer_offsets: &SplitIdAndFooterOffsets,
    footer_cache: &MemorySizedCache<String>,
) -> anyhow::Result<OwnedBytes> {
    {
        let possible_val = footer_cache.get(&split_and_footer_offsets.split_id);
        if let Some(footer_data) = possible_val {
            return Ok(footer_data);
        }
    }
    let split_file = PathBuf::from(format!("{}.split", split_and_footer_offsets.split_id));
    let footer_data_opt = index_storage
        .get_slice(
            &split_file,
            split_and_footer_offsets.split_footer_start as usize
                ..split_and_footer_offsets.split_footer_end as usize,
        )
        .await
        .with_context(|| {
            format!(
                "failed to fetch hotcache and footer from {} for split `{}`",
                index_storage.uri(),
                split_and_footer_offsets.split_id
            )
        })?;

    footer_cache.put(
        split_and_footer_offsets.split_id.to_owned(),
        footer_data_opt.clone(),
    );

    Ok(footer_data_opt)
}

/// Returns hotcache_bytes and the split directory (`BundleStorage`) with cache layer:
/// - A split footer cache given by `SearcherContext.split_footer_cache`.
pub(crate) async fn open_split_bundle(
    searcher_context: &SearcherContext,
    index_storage: Arc<dyn Storage>,
    split_and_footer_offsets: &SplitIdAndFooterOffsets,
) -> anyhow::Result<(FileSlice, BundleStorage)> {
    let split_file = PathBuf::from(format!("{}.split", split_and_footer_offsets.split_id));
    let footer_data = get_split_footer_from_cache_or_fetch(
        index_storage.clone(),
        split_and_footer_offsets,
        &searcher_context.split_footer_cache,
    )
    .await?;

    // We wrap the top-level storage with the split cache.
    // This is before the bundle storage: at this point, this storage is reading `.split` files.
    let index_storage_with_split_cache =
        if let Some(split_cache) = searcher_context.split_cache_opt.as_ref() {
            SplitCache::wrap_storage(split_cache.clone(), index_storage.clone())
        } else {
            index_storage.clone()
        };

    let (hotcache_bytes, bundle_storage) = BundleStorage::open_from_split_data(
        index_storage_with_split_cache,
        split_file,
        FileSlice::new(Arc::new(footer_data)),
    )?;

    Ok((hotcache_bytes, bundle_storage))
}

/// Add a storage proxy to retry `get_slice` requests if they are taking too long,
/// if configured in the searcher config.
///
/// The goal here is too ensure a low latency.
fn configure_storage_retries(
    searcher_context: &SearcherContext,
    index_storage: Arc<dyn Storage>,
) -> Arc<dyn Storage> {
    if let Some(storage_timeout_policy) = &searcher_context.searcher_config.storage_timeout_policy {
        Arc::new(TimeoutAndRetryStorage::new(
            index_storage,
            storage_timeout_policy.clone(),
        ))
    } else {
        index_storage
    }
}

/// Opens a `tantivy::Index` for the given split with several cache layers:
/// - A split footer cache given by `SearcherContext.split_footer_cache`.
/// - A fast fields cache given by `SearcherContext.storage_long_term_cache`.
/// - An ephemeral unbounded cache directory (whose lifetime is tied to the returned `Index` if no
///   `ByteRangeCache` is provided).
pub(crate) async fn open_index_with_caches(
    searcher_context: &SearcherContext,
    index_storage: Arc<dyn Storage>,
    split_and_footer_offsets: &SplitIdAndFooterOffsets,
    tokenizer_manager: Option<&TokenizerManager>,
    ephemeral_unbounded_cache: Option<ByteRangeCache>,
) -> anyhow::Result<(Index, HotDirectory)> {
    let index_storage_with_retry_on_timeout =
        configure_storage_retries(searcher_context, index_storage);

    let (hotcache_bytes, bundle_storage) = open_split_bundle(
        searcher_context,
        index_storage_with_retry_on_timeout,
        split_and_footer_offsets,
    )
    .await?;

    let bundle_storage_with_cache = wrap_storage_with_cache(
        searcher_context.fast_fields_cache.clone(),
        Arc::new(bundle_storage),
    );

    let directory = StorageDirectory::new(bundle_storage_with_cache);

    let hot_directory = if let Some(cache) = ephemeral_unbounded_cache {
        let caching_directory = CachingDirectory::new(Arc::new(directory), cache);
        HotDirectory::open(caching_directory, hotcache_bytes.read_bytes()?)?
    } else {
        HotDirectory::open(directory, hotcache_bytes.read_bytes()?)?
    };

    let mut index = Index::open(hot_directory.clone())?;
    if let Some(tokenizer_manager) = tokenizer_manager {
        index.set_tokenizers(tokenizer_manager.tantivy_manager().clone());
    }
    index.set_fast_field_tokenizers(
        quickwit_query::get_quickwit_fastfield_normalizer_manager()
            .tantivy_manager()
            .clone(),
    );
    Ok((index, hot_directory))
}

/// Tantivy search does not make it possible to fetch data asynchronously during
/// search.
///
/// It is required to download all required information in advance.
/// This is the role of the `warmup` function.
///
/// The downloaded data depends on the query (which term's posting list is required,
/// are position required too), and the collector.
///
/// * `query` - query is used to extract the terms and their fields which will be loaded from the
/// inverted_index.
///
/// * `term_dict_field_names` - A list of fields, where the whole dictionary needs to be loaded.
/// This is e.g. required for term aggregation, since we don't know in advance which terms are going
/// to be hit.
#[instrument(skip_all)]
pub(crate) async fn warmup(searcher: &Searcher, warmup_info: &WarmupInfo) -> anyhow::Result<()> {
    debug!(warmup_info=?warmup_info);
    let warm_up_terms_future = warm_up_terms(searcher, &warmup_info.terms_grouped_by_field)
        .instrument(debug_span!("warm_up_terms"));
    let warm_up_term_ranges_future =
        warm_up_term_ranges(searcher, &warmup_info.term_ranges_grouped_by_field)
            .instrument(debug_span!("warm_up_term_ranges"));
    let warm_up_term_dict_future =
        warm_up_term_dict_fields(searcher, &warmup_info.term_dict_fields)
            .instrument(debug_span!("warm_up_term_dicts"));
    let warm_up_fastfields_future = warm_up_fastfields(searcher, &warmup_info.fast_fields)
        .instrument(debug_span!("warm_up_fastfields"));
    let warm_up_fieldnorms_future = warm_up_fieldnorms(searcher, warmup_info.field_norms)
        .instrument(debug_span!("warm_up_fieldnorms"));
    // TODO merge warm_up_postings into warm_up_term_dict_fields
    let warm_up_postings_future = warm_up_postings(searcher, &warmup_info.term_dict_fields)
        .instrument(debug_span!("warm_up_postings"));
    let warm_up_automatons_future =
        warm_up_automatons(searcher, &warmup_info.automatons_grouped_by_field)
            .instrument(debug_span!("warm_up_automatons"));

    tokio::try_join!(
        warm_up_terms_future,
        warm_up_term_ranges_future,
        warm_up_fastfields_future,
        warm_up_term_dict_future,
        warm_up_fieldnorms_future,
        warm_up_postings_future,
        warm_up_automatons_future,
    )?;

    Ok(())
}

async fn warm_up_term_dict_fields(
    searcher: &Searcher,
    term_dict_fields: &HashSet<Field>,
) -> anyhow::Result<()> {
    let mut warm_up_futures = Vec::new();
    for field in term_dict_fields {
        for segment_reader in searcher.segment_readers() {
            let inverted_index = segment_reader.inverted_index(*field)?.clone();
            warm_up_futures.push(async move {
                let dict = inverted_index.terms();
                dict.warm_up_dictionary().await
            });
        }
    }
    try_join_all(warm_up_futures).await?;
    Ok(())
}

async fn warm_up_postings(searcher: &Searcher, fields: &HashSet<Field>) -> anyhow::Result<()> {
    let mut warm_up_futures = Vec::new();
    for field in fields {
        for segment_reader in searcher.segment_readers() {
            let inverted_index = segment_reader.inverted_index(*field)?.clone();
            warm_up_futures.push(async move { inverted_index.warm_postings_full(false).await });
        }
    }
    try_join_all(warm_up_futures).await?;
    Ok(())
}

async fn warm_up_fastfield(
    fast_field_reader: &FastFieldReaders,
    fast_field: &FastFieldWarmupInfo,
) -> anyhow::Result<()> {
    let mut columns = fast_field_reader
        .list_dynamic_column_handles(&fast_field.name)
        .await?;
    if fast_field.with_subfields {
        let subpath_columns = fast_field_reader
            .list_subpath_dynamic_column_handles(&fast_field.name)
            .await?;
        columns.extend(subpath_columns);
    }
    futures::future::try_join_all(
        columns
            .into_iter()
            .map(|col| async move { col.file_slice().read_bytes_async().await }),
    )
    .await?;
    Ok(())
}

/// Populates the short-lived cache with the data for
/// all of the fast fields passed as argument.
async fn warm_up_fastfields(
    searcher: &Searcher,
    fast_fields: &HashSet<FastFieldWarmupInfo>,
) -> anyhow::Result<()> {
    let mut warm_up_futures = Vec::new();
    for segment_reader in searcher.segment_readers() {
        let fast_field_reader = segment_reader.fast_fields();
        for fast_field in fast_fields {
            let warm_up_fut = warm_up_fastfield(fast_field_reader, fast_field);
            warm_up_futures.push(Box::pin(warm_up_fut));
        }
    }
    futures::future::try_join_all(warm_up_futures).await?;
    Ok(())
}

async fn warm_up_terms(
    searcher: &Searcher,
    terms_grouped_by_field: &HashMap<Field, HashMap<Term, bool>>,
) -> anyhow::Result<()> {
    let mut warm_up_futures = Vec::new();
    for (field, terms) in terms_grouped_by_field {
        for segment_reader in searcher.segment_readers() {
            let inv_idx = segment_reader.inverted_index(*field)?;
            for (term, position_needed) in terms.iter() {
                let inv_idx_clone = inv_idx.clone();
                warm_up_futures
                    .push(async move { inv_idx_clone.warm_postings(term, *position_needed).await });
            }
        }
    }
    try_join_all(warm_up_futures).await?;
    Ok(())
}

async fn warm_up_term_ranges(
    searcher: &Searcher,
    terms_grouped_by_field: &HashMap<Field, HashMap<TermRange, bool>>,
) -> anyhow::Result<()> {
    let mut warm_up_futures = Vec::new();
    for (field, terms) in terms_grouped_by_field {
        for segment_reader in searcher.segment_readers() {
            let inv_idx = segment_reader.inverted_index(*field)?;
            for (term_range, position_needed) in terms.iter() {
                let inv_idx_clone = inv_idx.clone();
                let range = (term_range.start.as_ref(), term_range.end.as_ref());
                warm_up_futures.push(async move {
                    inv_idx_clone
                        .warm_postings_range(range, term_range.limit, *position_needed)
                        .await
                });
            }
        }
    }
    try_join_all(warm_up_futures).await?;
    Ok(())
}

async fn warm_up_automatons(
    searcher: &Searcher,
    terms_grouped_by_field: &HashMap<Field, HashSet<Automaton>>,
) -> anyhow::Result<()> {
    let mut warm_up_futures = Vec::new();
    let cpu_intensive_executor = |task| async {
        crate::search_thread_pool()
            .run_cpu_intensive(task)
            .await
            .map_err(|_| std::io::Error::other("task panicked"))?
    };
    for (field, automatons) in terms_grouped_by_field {
        for segment_reader in searcher.segment_readers() {
            let inv_idx = segment_reader.inverted_index(*field)?;
            for automaton in automatons {
                let inv_idx_clone = inv_idx.clone();
                warm_up_futures.push(async move {
                    match automaton {
                        Automaton::Regex(path, regex_str) => {
                            let regex = tantivy_fst::Regex::new(regex_str)
                                .context("failed to parse regex during warmup")?;
                            inv_idx_clone
                                .warm_postings_automaton(
                                    quickwit_query::query_ast::JsonPathPrefix {
                                        automaton: regex.into(),
                                        prefix: path.clone().unwrap_or_default(),
                                    },
                                    cpu_intensive_executor,
                                )
                                .await
                                .context("failed to load automaton")
                        }
                    }
                });
            }
        }
    }
    try_join_all(warm_up_futures).await?;
    Ok(())
}

async fn warm_up_fieldnorms(searcher: &Searcher, requires_scoring: bool) -> anyhow::Result<()> {
    if !requires_scoring {
        return Ok(());
    }
    let mut warm_up_futures = Vec::new();
    for field in searcher.schema().fields() {
        for segment_reader in searcher.segment_readers() {
            let fieldnorm_readers = segment_reader.fieldnorms_readers();
            let file_handle_opt = fieldnorm_readers.get_inner_file().open_read(field.0);
            if let Some(file_handle) = file_handle_opt {
                warm_up_futures.push(async move { file_handle.read_bytes_async().await })
            }
        }
    }
    try_join_all(warm_up_futures).await?;
    Ok(())
}

fn get_leaf_resp_from_count(count: u64) -> LeafSearchResponse {
    LeafSearchResponse {
        num_hits: count,
        partial_hits: Vec::new(),
        failed_splits: Vec::new(),
        num_attempted_splits: 1,
        num_successful_splits: 1,
        intermediate_aggregation_result: None,
        resource_stats: None,
    }
}

/// Compute the size of the index, store excluded.
fn compute_index_size(hot_directory: &HotDirectory) -> ByteSize {
    let size_bytes = hot_directory
        .get_file_lengths()
        .iter()
        .filter(|(path, _)| !path.to_string_lossy().ends_with("store"))
        .map(|(_, size)| *size)
        .sum();
    ByteSize(size_bytes)
}

/// Apply a leaf search on a single split.
#[allow(clippy::too_many_arguments)]
async fn leaf_search_single_split(
    search_request: SearchRequest,
    ctx: Arc<LeafSearchContext>,
    storage: Arc<dyn Storage>,
    split: SplitIdAndFooterOffsets,
    search_permit: &mut SearchPermit,
) -> crate::Result<Option<LeafSearchResponse>> {
    let mut leaf_search_state_guard =
        SplitSearchStateGuard::new(ctx.split_outcome_counters.clone());

    // We already checked if the result was already in the partial result cache,
    // but it's not a bad idea to check again.
    if let Some(cached_answer) = ctx
        .searcher_context
        .leaf_search_cache
        .get(split.clone(), search_request.clone())
    {
        leaf_search_state_guard.set_state(SplitSearchState::CacheHit);
        return Ok(Some(cached_answer));
    }

    let query_ast: QueryAst = serde_json::from_str(search_request.query_ast.as_str())
        .map_err(|err| SearchError::InvalidQuery(err.to_string()))?;

    // CanSplitDoBetter or rewrite_request may have changed the request to be a count only request
    // This may be the case for AllQuery with a sort by date and time filter, where the current
    // split can't have better results.
    if is_metadata_count_request_with_ast(&query_ast, &search_request) {
        leaf_search_state_guard.set_state(SplitSearchState::PrunedBeforeWarmup);
        return Ok(Some(get_leaf_resp_from_count(split.num_docs)));
    }

    let split_id = split.split_id.to_string();
    let byte_range_cache =
        ByteRangeCache::with_infinite_capacity(&quickwit_storage::STORAGE_METRICS.shortlived_cache);
    let (index, hot_directory) = open_index_with_caches(
        &ctx.searcher_context,
        storage,
        &split,
        Some(ctx.doc_mapper.tokenizer_manager()),
        Some(byte_range_cache.clone()),
    )
    .await?;

    let index_size = compute_index_size(&hot_directory);
    if index_size < search_permit.memory_allocation() {
        search_permit.update_memory_usage(index_size);
    }

    let searcher = index
        .reader_builder()
        .reload_policy(ReloadPolicy::Manual)
        .try_into()?
        .searcher();

    let agg_context_params = AggContextParams {
        limits: ctx.searcher_context.get_aggregation_limits(),
        tokenizers: ctx.doc_mapper.tokenizer_manager().tantivy_manager().clone(),
    };
    let mut collector =
        make_collector_for_split(split_id.clone(), &search_request, agg_context_params)?;

    let predicate_cache = if collector.requires_scoring() {
        // at the moment the predicate cache doesn't support scoring
        None
    } else {
        Some((
            ctx.searcher_context.predicate_cache.clone() as _,
            split.split_id.clone(),
        ))
    };
    let split_schema = index.schema();
    let (query, mut warmup_info) = ctx.doc_mapper.query(
        split_schema.clone(),
        query_ast.clone(),
        false,
        predicate_cache,
    )?;

    let collector_warmup_info = collector.warmup_info();
    warmup_info.merge(collector_warmup_info);
    warmup_info.simplify();

    let warmup_start = Instant::now();
    leaf_search_state_guard.set_state(SplitSearchState::WarmUp);
    warmup(&searcher, &warmup_info).await?;
    let warmup_end = Instant::now();
    let warmup_duration: Duration = warmup_end.duration_since(warmup_start);
    let warmup_size = ByteSize(byte_range_cache.get_num_bytes());
    if warmup_size > search_permit.memory_allocation() {
        warn!(
            memory_usage = ?warmup_size,
            memory_allocation = ?search_permit.memory_allocation(),
            "current leaf search is consuming more memory than the initial allocation"
        );
    }
    crate::SEARCH_METRICS
        .leaf_search_single_split_warmup_num_bytes
        .observe(warmup_size.as_u64() as f64);
    search_permit.update_memory_usage(warmup_size);
    search_permit.free_warmup_slot();

    let split_num_docs = split.num_docs;

    let span = info_span!("tantivy_search");

    let split_clone = split.clone();

    let ctx_clone = ctx.clone();
    leaf_search_state_guard.set_state(SplitSearchState::CpuQueue);
    let search_request_and_result: Option<(SearchRequest, LeafSearchResponse)> =
        crate::search_thread_pool()
            .run_cpu_intensive(move || {
                leaf_search_state_guard.set_state(SplitSearchState::Cpu);
                let cpu_start = Instant::now();
                let cpu_thread_pool_wait_microsecs = cpu_start.duration_since(warmup_end);
                let _span_guard = span.enter();
                // Our search execution has been scheduled, let's check if we can improve the
                // request based on the results of the preceding searches
                let Some(simplified_search_request) =
                    simplify_search_request(search_request, &split_clone, &ctx_clone.split_filter)
                else {
                    leaf_search_state_guard.set_state(SplitSearchState::PrunedAfterWarmup);
                    return Ok(None);
                };
                collector.update_search_param(&simplified_search_request);
                let mut leaf_search_response: LeafSearchResponse =
                    if is_metadata_count_request_with_ast(&query_ast, &simplified_search_request) {
                        get_leaf_resp_from_count(searcher.num_docs())
                    } else if collector.is_count_only() {
                        let count = query.count(&searcher)? as u64;
                        get_leaf_resp_from_count(count)
                    } else {
                        searcher.search(&query, &collector)?
                    };
                leaf_search_response.resource_stats = Some(ResourceStats {
                    cpu_microsecs: cpu_start.elapsed().as_micros() as u64,
                    short_lived_cache_num_bytes: warmup_size.as_u64(),
                    split_num_docs,
                    warmup_microsecs: warmup_duration.as_micros() as u64,
                    cpu_thread_pool_wait_microsecs: cpu_thread_pool_wait_microsecs.as_micros()
                        as u64,
                });
                leaf_search_state_guard.set_state(SplitSearchState::Success);
                Result::<_, TantivyError>::Ok(Some((
                    simplified_search_request,
                    leaf_search_response,
                )))
            })
            .await
            .map_err(|_| {
                crate::SearchError::Internal(format!("leaf search panicked. split={split_id}"))
            })??;

    // Let's cache this result in the partial result cache.
    let Some((leaf_search_req, leaf_search_resp)) = search_request_and_result else {
        return Ok(None);
    };
    // We save our result in the cache.
    ctx.searcher_context
        .leaf_search_cache
        .put(split, leaf_search_req, leaf_search_resp.clone());
    Ok(Some(leaf_search_resp))
}

/// Rewrite a request removing parts which incur additional download or computation with no
/// effect.
///
/// This include things such as sorting result by a field or _score when no document is requested,
/// or applying date range when the range covers the entire split.
fn rewrite_request(
    search_request: &mut SearchRequest,
    split: &SplitIdAndFooterOffsets,
    timestamp_field: Option<&str>,
) {
    if search_request.max_hits == 0 {
        search_request.sort_fields = Vec::new();
    }
    if let Some(timestamp_field) = timestamp_field {
        remove_redundant_timestamp_range(search_request, split, timestamp_field);
    }
    rewrite_aggregation(search_request);
    // we add a top level cache node when search_after is set, this won't help for this query (which
    // is the 2nd in its series), but should speedup every other request that comes after
    if search_request.search_after.is_some() {
        add_top_cache_node(search_request)
    }
}

fn add_top_cache_node(search_request: &mut SearchRequest) {
    let Ok(query_ast) = serde_json::from_str(search_request.query_ast.as_str()) else {
        // an error will get raised a bit after anyway
        return;
    };
    let new_ast: QueryAst = CacheNode::new(query_ast).into();
    search_request.query_ast = serde_json::to_string(&new_ast).unwrap();
}

/// Rewrite aggregation to make them easier to cache
///
/// This is only valid for options which are handled while merging results, which is
/// mostly `extended_bounds`.
fn rewrite_aggregation(search_request: &mut SearchRequest) {
    if let Some(aggregation) = &search_request.aggregation_request {
        let Ok(QuickwitAggregations::TantivyAggregations(mut aggregations)) =
            serde_json::from_str(aggregation)
        else {
            return;
        };
        let modified_something = visit_aggregation_mut(&mut aggregations, &|aggregation_variant| {
            match aggregation_variant {
                // we take() away the extended bounds, and record we did something
                AggregationVariants::Histogram(histogram) => {
                    histogram.extended_bounds.take().is_some()
                }
                AggregationVariants::DateHistogram(histogram) => {
                    histogram.extended_bounds.take().is_some()
                }
                _ => false,
            }
        });
        if modified_something {
            // it's fine to put a (Tantivy)Aggregations and not a QuickwitAggregations because
            // the former is an serde-untagged variant of the later
            search_request.aggregation_request =
                Some(serde_json::to_string(&aggregations).expect("serializing should never fail"));
        }
    }
}

// this is a rather limited visitor, but enough to do the job
fn visit_aggregation_mut(
    aggregations: &mut Aggregations,
    callback: &impl Fn(&mut AggregationVariants) -> bool,
) -> bool {
    let mut modified_something = false;
    for aggregation in aggregations.values_mut() {
        modified_something |= callback(&mut aggregation.agg);
        modified_something |= visit_aggregation_mut(&mut aggregation.sub_aggregation, callback);
    }
    modified_something
}

// returns the max of left and right, that isn't unbounded. Useful for making
// the intersection of lower bound of ranges
fn max_bound<T: Ord + Copy>(left: Bound<T>, right: Bound<T>) -> Bound<T> {
    use Bound::*;
    match (left, right) {
        (Unbounded, right) => right,
        (left, Unbounded) => left,
        (Included(left), Included(right)) => Included(left.max(right)),
        (Excluded(left), Excluded(right)) => Excluded(left.max(right)),
        (excluded_total @ Excluded(excluded), included_total @ Included(included)) => {
            if included > excluded {
                included_total
            } else {
                excluded_total
            }
        }
        (included_total @ Included(included), excluded_total @ Excluded(excluded)) => {
            if included > excluded {
                included_total
            } else {
                excluded_total
            }
        }
    }
}

// returns the min of left and right, that isn't unbounded. Useful for making
// the intersection of upper bound of ranges
fn min_bound<T: Ord + Copy>(left: Bound<T>, right: Bound<T>) -> Bound<T> {
    use Bound::*;
    match (left, right) {
        (Unbounded, right) => right,
        (left, Unbounded) => left,
        (Included(left), Included(right)) => Included(left.min(right)),
        (Excluded(left), Excluded(right)) => Excluded(left.min(right)),
        (excluded_total @ Excluded(excluded), included_total @ Included(included)) => {
            if included < excluded {
                included_total
            } else {
                excluded_total
            }
        }
        (included_total @ Included(included), excluded_total @ Excluded(excluded)) => {
            if included < excluded {
                included_total
            } else {
                excluded_total
            }
        }
    }
}

/// remove timestamp range that would be present both in QueryAst and SearchRequest
///
/// this can save us from doing double the work in some cases, and help with the partial request
/// cache.
fn remove_redundant_timestamp_range(
    search_request: &mut SearchRequest,
    split: &SplitIdAndFooterOffsets,
    timestamp_field: &str,
) {
    let Ok(query_ast) = serde_json::from_str(search_request.query_ast.as_str()) else {
        // an error will get raised a bit after anyway
        return;
    };

    let start_timestamp = search_request
        .start_timestamp
        .map(DateTime::from_timestamp_secs)
        .map(Bound::Included)
        .unwrap_or(Bound::Unbounded);
    let end_timestamp = search_request
        .end_timestamp
        .map(DateTime::from_timestamp_secs)
        .map(Bound::Excluded)
        .unwrap_or(Bound::Unbounded);

    let mut visitor = RemoveTimestampRange {
        timestamp_field,
        start_timestamp,
        end_timestamp,
    };
    let mut new_ast = visitor
        .transform(query_ast)
        .expect("can't fail unwrapping Infallible")
        .unwrap_or(QueryAst::MatchAll);

    let final_start_timestamp = match (
        visitor.start_timestamp,
        split.timestamp_start.map(DateTime::from_timestamp_secs),
    ) {
        (Bound::Included(query_ts), Some(split_ts)) => {
            if query_ts > split_ts {
                Bound::Included(query_ts)
            } else {
                Bound::Unbounded
            }
        }
        (Bound::Excluded(query_ts), Some(split_ts)) => {
            if query_ts >= split_ts {
                Bound::Excluded(query_ts)
            } else {
                Bound::Unbounded
            }
        }
        (Bound::Unbounded, Some(_)) => Bound::Unbounded,
        (timestamp, None) => timestamp,
    };
    let final_end_timestamp = match (
        visitor.end_timestamp,
        split.timestamp_end.map(DateTime::from_timestamp_secs),
    ) {
        (Bound::Included(query_ts), Some(split_ts)) => {
            if query_ts < split_ts {
                Bound::Included(query_ts)
            } else {
                Bound::Unbounded
            }
        }
        (Bound::Excluded(query_ts), Some(split_ts)) => {
            if query_ts <= split_ts {
                Bound::Excluded(query_ts)
            } else {
                Bound::Unbounded
            }
        }
        (Bound::Unbounded, Some(_)) => Bound::Unbounded,
        (timestamp, None) => timestamp,
    };
    if final_start_timestamp != Bound::Unbounded || final_end_timestamp != Bound::Unbounded {
        let range = RangeQuery {
            field: timestamp_field.to_string(),
            lower_bound: final_start_timestamp.map(|bound| bound.into_timestamp_nanos().into()),
            upper_bound: final_end_timestamp.map(|bound| bound.into_timestamp_nanos().into()),
        };
        new_ast = if let QueryAst::Bool(mut bool_query) = new_ast {
            if bool_query.must.is_empty()
                && bool_query.filter.is_empty()
                && !bool_query.should.is_empty()
            {
                // we can't simply add a filter if we have some should but no must/filter. We must
                // add a new layer of bool query
                BoolQuery {
                    must: vec![bool_query.into()],
                    filter: vec![range.into()],
                    ..Default::default()
                }
                .into()
            } else {
                bool_query.filter.push(range.into());
                QueryAst::Bool(bool_query)
            }
        } else {
            BoolQuery {
                must: vec![new_ast],
                filter: vec![range.into()],
                ..Default::default()
            }
            .into()
        }
    }

    search_request.query_ast = serde_json::to_string(&new_ast).unwrap();
    search_request.start_timestamp = None;
    search_request.end_timestamp = None;
}

/// Remove all `must` and `filter timestamp ranges, and summarize them
#[derive(Debug, Clone)]
struct RemoveTimestampRange<'a> {
    timestamp_field: &'a str,
    start_timestamp: Bound<DateTime>,
    end_timestamp: Bound<DateTime>,
}

impl RemoveTimestampRange<'_> {
    fn update_start_timestamp(
        &mut self,
        lower_bound: &quickwit_query::JsonLiteral,
        included: bool,
    ) {
        use quickwit_query::InterpretUserInput;
        let Some(lower_bound) = DateTime::interpret_json(lower_bound) else {
            // we shouldn't be able to get here, we would have errored much earlier in root search
            warn!("unparsable time bound in leaf search: {lower_bound:?}");
            return;
        };
        let bound = if included {
            Bound::Included(lower_bound)
        } else {
            Bound::Excluded(lower_bound)
        };

        self.start_timestamp = max_bound(self.start_timestamp, bound);
    }

    fn update_end_timestamp(&mut self, upper_bound: &quickwit_query::JsonLiteral, included: bool) {
        use quickwit_query::InterpretUserInput;
        let Some(upper_bound) = DateTime::interpret_json(upper_bound) else {
            // we shouldn't be able to get here, we would have errored much earlier in root search
            warn!("unparsable time bound in leaf search: {upper_bound:?}");
            return;
        };
        let bound = if included {
            Bound::Included(upper_bound)
        } else {
            Bound::Excluded(upper_bound)
        };

        self.end_timestamp = min_bound(self.end_timestamp, bound);
    }
}

impl QueryAstTransformer for RemoveTimestampRange<'_> {
    type Err = std::convert::Infallible;

    fn transform_bool(&mut self, mut bool_query: BoolQuery) -> Result<Option<QueryAst>, Self::Err> {
        // we only want to visit sub-queries which are strict (positive) requirements
        bool_query.must = bool_query
            .must
            .into_iter()
            .filter_map(|query_ast| self.transform(query_ast).transpose())
            .collect::<Result<Vec<_>, _>>()?;
        bool_query.filter = bool_query
            .filter
            .into_iter()
            .filter_map(|query_ast| self.transform(query_ast).transpose())
            .collect::<Result<Vec<_>, _>>()?;

        Ok(Some(QueryAst::Bool(bool_query)))
    }

    fn transform_range(&mut self, range_query: RangeQuery) -> Result<Option<QueryAst>, Self::Err> {
        if range_query.field == self.timestamp_field {
            match range_query.lower_bound {
                Bound::Included(lower_bound) => {
                    self.update_start_timestamp(&lower_bound, true);
                }
                Bound::Excluded(lower_bound) => {
                    self.update_start_timestamp(&lower_bound, false);
                }
                Bound::Unbounded => (),
            };

            match range_query.upper_bound {
                Bound::Included(upper_bound) => {
                    self.update_end_timestamp(&upper_bound, true);
                }
                Bound::Excluded(upper_bound) => {
                    self.update_end_timestamp(&upper_bound, false);
                }
                Bound::Unbounded => (),
            };

            Ok(Some(QueryAst::MatchAll))
        } else {
            Ok(Some(range_query.into()))
        }
    }

    fn transform_term(&mut self, term_query: TermQuery) -> Result<Option<QueryAst>, Self::Err> {
        // TODO we could remove query bounds, this point query surely is more precise, and it
        // doesn't require loading a fastfield
        Ok(Some(QueryAst::Term(term_query)))
    }
}

/// Checks if request is a simple all query.
/// Simple in this case would still including sorting
fn is_simple_all_query(search_request: &SearchRequest) -> bool {
    if search_request.aggregation_request.is_some() {
        return false;
    }

    if search_request.search_after.is_some() {
        return false;
    }

    // TODO: Update the logic to handle start_timestamp end_timestamp ranges
    if search_request.start_timestamp.is_some() || search_request.end_timestamp.is_some() {
        return false;
    }

    let Ok(query_ast) = serde_json::from_str(&search_request.query_ast) else {
        return false;
    };

    matches!(query_ast, QueryAst::MatchAll)
}

#[derive(Debug, Clone)]
enum CanSplitDoBetter {
    Uninformative,
    SplitIdHigher(Option<String>),
    SplitTimestampHigher(Option<i64>),
    SplitTimestampLower(Option<i64>),
    FindTraceIdsAggregation(Option<i64>),
}

impl CanSplitDoBetter {
    /// Create a CanSplitDoBetter from a SearchRequest
    fn from_request(request: &SearchRequest, timestamp_field_name: Option<&str>) -> Self {
        if request.max_hits == 0
            && let Some(aggregation) = &request.aggregation_request
            && let Ok(crate::QuickwitAggregations::FindTraceIdsAggregation(find_trace_aggregation)) =
                serde_json::from_str(aggregation)
            && Some(find_trace_aggregation.span_timestamp_field_name.as_str())
                == timestamp_field_name
        {
            return CanSplitDoBetter::FindTraceIdsAggregation(None);
        }

        if request.sort_fields.is_empty() {
            CanSplitDoBetter::SplitIdHigher(None)
        } else if let Some((sort_by, timestamp_field)) =
            request.sort_fields.first().zip(timestamp_field_name)
        {
            if sort_by.field_name == timestamp_field {
                if sort_by.sort_order() == SortOrder::Desc {
                    CanSplitDoBetter::SplitTimestampHigher(None)
                } else {
                    CanSplitDoBetter::SplitTimestampLower(None)
                }
            } else {
                CanSplitDoBetter::Uninformative
            }
        } else {
            CanSplitDoBetter::Uninformative
        }
    }

    /// Optimize the order in which splits will get processed based on how it can skip the most
    /// splits.
    ///
    /// The leaf search code contains some logic that makes it possible to skip entire splits
    /// when we are confident they won't make it into top K.
    /// To make this optimization as potent as possible, we sort the splits so that the first splits
    /// are the most likely to fill our Top K.
    /// In the future, as split get more metadata per column, we may be able to do this more than
    /// just for timestamp and "unsorted" request.
    fn optimize_split_order(&self, splits: &mut [SplitIdAndFooterOffsets]) {
        match self {
            CanSplitDoBetter::SplitIdHigher(_) => {
                splits.sort_unstable_by(|a, b| b.split_id.cmp(&a.split_id))
            }
            CanSplitDoBetter::SplitTimestampHigher(_)
            | CanSplitDoBetter::FindTraceIdsAggregation(_) => {
                splits.sort_unstable_by_key(|split| std::cmp::Reverse(split.timestamp_end()))
            }
            CanSplitDoBetter::SplitTimestampLower(_) => {
                splits.sort_unstable_by_key(|split| split.timestamp_start())
            }
            CanSplitDoBetter::Uninformative => (),
        }
    }

    /// This function tries to detect upfront which splits contain the top n hits and convert other
    /// split searches to count only searches. It also optimizes split order.
    ///
    /// Returns the search_requests with their split.
    fn optimize(
        &self,
        request: &SearchRequest,
        mut splits: Vec<SplitIdAndFooterOffsets>,
    ) -> Result<Vec<(SplitIdAndFooterOffsets, SearchRequest)>, SearchError> {
        self.optimize_split_order(&mut splits);

        if !is_simple_all_query(request) {
            // no optimization opportunity here.
            return Ok(splits
                .into_iter()
                .map(|split| (split, (*request).clone()))
                .collect::<Vec<_>>());
        }

        let num_requested_docs = request.start_offset + request.max_hits;

        // Calculate the number of splits which are guaranteed to deliver enough documents.
        let min_required_splits = splits
            .iter()
            .map(|split| split.num_docs)
            // computing the partial sum
            .scan(0u64, |partial_sum: &mut u64, num_docs_in_split: u64| {
                *partial_sum += num_docs_in_split;
                Some(*partial_sum)
            })
            .take_while(|partial_sum| *partial_sum < num_requested_docs)
            .count()
            + 1;

        // TODO: we maybe want here some deduplication + Cow logic
        let mut split_with_req = splits
            .into_iter()
            .map(|split| (split, (*request).clone()))
            .collect::<Vec<_>>();

        // reuse the detected sort order in split_filter
        // we want to detect cases where we can convert some split queries to count only queries
        match self {
            CanSplitDoBetter::SplitIdHigher(_) => {
                // In this case there is no sort order, we order by split id.
                // If the first split has enough documents, we can convert the other queries to
                // count only queries
                for (_split, request) in split_with_req.iter_mut().skip(min_required_splits) {
                    disable_search_request_hits(request);
                }
            }
            CanSplitDoBetter::Uninformative => {}
            CanSplitDoBetter::SplitTimestampLower(_) => {
                // We order by timestamp asc. split_with_req is sorted by timestamp_start.
                //
                // If we know that some splits will deliver enough documents, we can convert the
                // others to count only queries.
                // Since we only have start and end ranges and don't know the distribution we make
                // sure the splits dont' overlap, since the distribution of two
                // splits could be like this (dot is a timestamp doc on a x axis), for top 2
                // queries.
                // ```
                // [.          .] Split1 has enough docs, but last doc is not in top 2
                //           [..         .] Split2 first doc is in top2
                // ```
                // Let's get the biggest timestamp_end of the first num_splits splits
                let biggest_end_timestamp = split_with_req
                    .iter()
                    .take(min_required_splits)
                    .map(|(split, _)| split.timestamp_end())
                    .max()
                    // if min_required_splits is 0, we choose a value that disables all splits
                    .unwrap_or(i64::MIN);
                for (split, request) in split_with_req.iter_mut().skip(min_required_splits) {
                    if split.timestamp_start() > biggest_end_timestamp {
                        disable_search_request_hits(request);
                    }
                }
            }
            CanSplitDoBetter::SplitTimestampHigher(_) => {
                // We order by timestamp desc. split_with_req is sorted by timestamp_end desc.
                //
                // We have the number of splits we need to search to get enough docs, now we need to
                // find the splits that don't overlap.
                //
                // Let's get the smallest timestamp_start of the first num_splits splits
                let smallest_start_timestamp = split_with_req
                    .iter()
                    .take(min_required_splits)
                    .map(|(split, _)| split.timestamp_start())
                    .min()
                    // if min_required_splits is 0, we choose a value that disables all splits
                    .unwrap_or(i64::MAX);
                for (split, request) in split_with_req.iter_mut().skip(min_required_splits) {
                    if split.timestamp_end() < smallest_start_timestamp {
                        disable_search_request_hits(request);
                    }
                }
            }
            CanSplitDoBetter::FindTraceIdsAggregation(_) => {}
        }

        Ok(split_with_req)
    }

    /// Returns whether the given split can possibly give documents better than the one already
    /// known to match.
    fn can_be_better(&self, split: &SplitIdAndFooterOffsets) -> bool {
        match self {
            CanSplitDoBetter::SplitIdHigher(Some(split_id)) => split.split_id >= *split_id,
            CanSplitDoBetter::SplitTimestampHigher(Some(timestamp))
            | CanSplitDoBetter::FindTraceIdsAggregation(Some(timestamp)) => {
                split.timestamp_end() >= *timestamp
            }
            CanSplitDoBetter::SplitTimestampLower(Some(timestamp)) => {
                split.timestamp_start() <= *timestamp
            }
            _ => true,
        }
    }

    /// Record the new worst-of-the-top document, that is, the document which would first be
    /// evicted from the list of best documents, if a better document was found. Only call this
    /// function if you have at least max_hits documents already.
    fn record_new_worst_hit(&mut self, hit: &PartialHit) {
        match self {
            CanSplitDoBetter::Uninformative => (),
            CanSplitDoBetter::SplitIdHigher(split_id) => *split_id = Some(hit.split_id.clone()),
            CanSplitDoBetter::SplitTimestampHigher(timestamp)
            | CanSplitDoBetter::FindTraceIdsAggregation(timestamp) => {
                if let Some(SortValue::I64(timestamp_ns)) = hit.sort_value() {
                    // if we get a timestamp of, says 1.5s, we need to check up to 2s to make
                    // sure we don't throw away something like 1.2s, so we should round up while
                    // dividing.
                    *timestamp = Some(quickwit_common::div_ceil(timestamp_ns, 1_000_000_000));
                }
            }
            CanSplitDoBetter::SplitTimestampLower(timestamp) => {
                if let Some(SortValue::I64(timestamp_ns)) = hit.sort_value() {
                    // if we get a timestamp of, says 1.5s, we need to check down to 1s to make
                    // sure we don't throw away something like 1.7s, so we should truncate,
                    // which is the default behavior of division
                    let timestamp_s = timestamp_ns / 1_000_000_000;
                    *timestamp = Some(timestamp_s);
                }
            }
        }
    }
}

/// Searches multiple splits, potentially in multiple indexes, sitting on different storages and
/// having different doc mappings.
#[instrument(skip_all, fields(index = ?leaf_search_request.search_request.as_ref().unwrap().index_id_patterns))]
pub async fn multi_index_leaf_search(
    searcher_context: Arc<SearcherContext>,
    leaf_search_request: LeafSearchRequest,
    storage_resolver: StorageResolver,
) -> Result<LeafSearchResponse, SearchError> {
    let search_request: Arc<SearchRequest> = leaf_search_request
        .search_request
        .ok_or_else(|| SearchError::Internal("no search request".to_string()))?
        .into();

    let doc_mappers: Vec<Arc<DocMapper>> = leaf_search_request
        .doc_mappers
        .iter()
        .map(|doc_mapper| deserialize_doc_mapper(doc_mapper))
        .collect::<crate::Result<_>>()?;

    // TODO: to avoid lockstep, we should pull up the future creation over the list of split ids
    // and have the semaphore on this level.
    // This will lower resource consumption due to less in-flight futures and avoid contention.
    // It also allows passing early exit conditions between indices.
    //
    // It is a little bit tricky how to handle which is now the incremental_merge_collector, one
    // per index, e.g. when to merge results and how to avoid lock contention.
    let mut leaf_request_futures = JoinSet::new();
    for leaf_search_request_ref in leaf_search_request.leaf_requests.into_iter() {
        let index_uri = quickwit_common::uri::Uri::from_str(
            leaf_search_request
                .index_uris
                .get(leaf_search_request_ref.index_uri_ord as usize)
                .ok_or_else(|| {
                    SearchError::Internal(format!(
                        "Received incorrect request, index_uri_ord out of bounds: {}",
                        leaf_search_request_ref.index_uri_ord
                    ))
                })?,
        )?;
        let doc_mapper = doc_mappers
            .get(leaf_search_request_ref.doc_mapper_ord as usize)
            .ok_or_else(|| {
                SearchError::Internal(format!(
                    "Received incorrect request, doc_mapper_ord out of bounds: {}",
                    leaf_search_request_ref.doc_mapper_ord
                ))
            })?
            .clone();

        let storage_resolver = storage_resolver.clone();
        let searcher_context = searcher_context.clone();
        let search_request = search_request.clone();

        leaf_request_futures.spawn({
            async move {
                let storage = storage_resolver.resolve(&index_uri).await?;
                single_doc_mapping_leaf_search(
                    searcher_context,
                    search_request,
                    storage,
                    leaf_search_request_ref.split_offsets,
                    doc_mapper,
                )
                .in_current_span()
                .await
            }
        });
    }

    // Creates a collector which merges responses into one
    let merge_collector =
        make_merge_collector(&search_request, searcher_context.get_aggregation_limits())?;
    let mut incremental_merge_collector = IncrementalCollector::new(merge_collector);

    while let Some(leaf_response_join_result) = leaf_request_futures.join_next().await {
        // abort the search on join errors
        let leaf_response_result = leaf_response_join_result?;
        match leaf_response_result {
            Ok(leaf_response) => {
                incremental_merge_collector.add_result(leaf_response)?;
            }
            Err(err) => {
                incremental_merge_collector.add_failed_split(SplitSearchError {
                    split_id: "unknown".to_string(),
                    error: format!("{err}"),
                    retryable_error: true,
                });
            }
        }
    }

    crate::search_thread_pool()
        .run_cpu_intensive(|| incremental_merge_collector.finalize().map_err(Into::into))
        .instrument(info_span!("incremental_merge_finalize"))
        .await
        .context("failed to merge split search responses")?
}

/// Optimizes the search_request based on CanSplitDoBetter
/// Returns None if the search request does nothing can be skipped.
#[must_use]
fn simplify_search_request(
    mut search_request: SearchRequest,
    split: &SplitIdAndFooterOffsets,
    split_filter_lock: &Arc<RwLock<CanSplitDoBetter>>,
) -> Option<SearchRequest> {
    let can_be_better: bool;
    let is_trace_req: bool;
    {
        let split_filter_guard = split_filter_lock.read().unwrap();
        can_be_better = split_filter_guard.can_be_better(split);
        // The info is originally from the search_request.aggregation as a string (yes we need to
        // clean this eventually). We don't want to parse it again, so we use the
        // split_filter variant to get that info.
        is_trace_req = matches!(
            &*split_filter_guard,
            &CanSplitDoBetter::FindTraceIdsAggregation(_)
        );
    }
    if !can_be_better {
        disable_search_request_hits(&mut search_request);
    }
    if is_trace_req {
        return Some(search_request);
    }
    if search_request.max_hits > 0 {
        return Some(search_request);
    }
    if search_request.aggregation_request.is_some() {
        return Some(search_request);
    }
    if search_request.count_hits() == CountHits::CountAll {
        return Some(search_request);
    }
    None
}

/// Alter the search request so it does not return any docs.
///
/// This is usually done since it cannot provide better hits results than existing fetched results.
fn disable_search_request_hits(search_request: &mut SearchRequest) {
    search_request.max_hits = 0;
    search_request.start_offset = 0;
    search_request.sort_fields.clear();
    search_request.search_after = None;
}

/// Searches multiple splits for a specific index and a single doc mapping
/// Offloads splits to Lambda invocations, distributing them across batches
/// balanced by document count. Each batch is invoked independently; a failure
/// in one batch does not affect others.
async fn run_offloaded_search_tasks(
    searcher_context: &SearcherContext,
    search_request: &SearchRequest,
    doc_mapper: &DocMapper,
    index_uri: Uri,
    splits_with_requests: Vec<(SplitIdAndFooterOffsets, SearchRequest)>,
    incremental_merge_collector: &Mutex<IncrementalCollector>,
) -> Result<(), SearchError> {
    if splits_with_requests.is_empty() {
        return Ok(());
    }

    info!(
        num_offloaded_splits = splits_with_requests.len(),
        "offloading to lambda"
    );

    let lambda_invoker = searcher_context.lambda_invoker.as_ref().expect(
        "did not receive enough permit futures despite not having any lambda invoker to offload to",
    );
    let lambda_config = searcher_context.searcher_config.lambda.as_ref().unwrap();

    let doc_mapper_str = serde_json::to_string(doc_mapper)
        .map_err(|err| SearchError::Internal(format!("failed to serialize doc mapper: {err}")))?;

    // Build a lookup so we can match lambda results (tagged by split_id) back to the
    // split metadata and per-split SearchRequest needed for caching.
    let mut split_lookup: HashMap<String, (SplitIdAndFooterOffsets, SearchRequest)> =
        HashMap::with_capacity(splits_with_requests.len());
    let splits: Vec<SplitIdAndFooterOffsets> = splits_with_requests
        .into_iter()
        .map(|(split, search_req)| {
            split_lookup.insert(split.split_id.clone(), (split.clone(), search_req));
            split
        })
        .collect();

    let batches: Vec<Vec<SplitIdAndFooterOffsets>> = greedy_batch_split(
        splits,
        |split| split.num_docs,
        lambda_config.max_splits_per_invocation,
    );

    let mut lambda_tasks_joinset = JoinSet::new();
    for batch in batches {
        let batch_split_ids: Vec<String> =
            batch.iter().map(|split| split.split_id.clone()).collect();
        let leaf_request = LeafSearchRequest {
            // Note this is not the split-specific rewritten request, we ship the main request,
            // and the leaf will apply the split specific rewrite on its own.
            search_request: Some(search_request.clone()),
            doc_mappers: vec![doc_mapper_str.clone()],
            index_uris: vec![index_uri.as_str().to_string()], //< careful here. Calling to_string() directly would return a redacted uri.
            leaf_requests: vec![quickwit_proto::search::LeafRequestRef {
                index_uri_ord: 0,
                doc_mapper_ord: 0,
                split_offsets: batch,
            }],
        };
        let invoker = lambda_invoker.clone();
        lambda_tasks_joinset.spawn(async move {
            (
                batch_split_ids,
                invoker.invoke_leaf_search(leaf_request).await,
            )
        });
    }

    while let Some(join_res) = lambda_tasks_joinset.join_next().await {
        let Ok((batch_split_ids, result)) = join_res else {
            error!("lambda join error");
            return Err(SearchError::Internal("lambda join error".to_string()));
        };
        match result {
            Ok(split_results) => {
                let mut locked = incremental_merge_collector.lock().unwrap();
                for split_result in split_results {
                    match split_result.outcome {
                        Some(Outcome::Response(response)) => {
                            if let Some((split_info, single_split_search_req)) =
                                split_lookup.remove(&split_result.split_id)
                            {
                                // We use the single_split_search_req to perform the search
                                searcher_context.leaf_search_cache.put(
                                    split_info,
                                    single_split_search_req,
                                    response.clone(),
                                );
                            }
                            if let Err(err) = locked.add_result(response) {
                                error!(error = %err, "failed to add lambda result to collector");
                            }
                        }
                        Some(Outcome::Error(error_msg)) => {
                            locked.add_failed_split(SplitSearchError {
                                split_id: split_result.split_id,
                                error: format!("lambda split error: {error_msg}"),
                                retryable_error: true,
                            });
                        }
                        None => {
                            locked.add_failed_split(SplitSearchError {
                                split_id: split_result.split_id,
                                error: "lambda returned empty outcome".to_string(),
                                retryable_error: true,
                            });
                        }
                    }
                }
            }
            Err(err) => {
                // Transport-level failure: the Lambda invocation itself failed.
                // Mark all splits in this batch as failed.
                error!(
                    error = %err,
                    num_splits = batch_split_ids.len(),
                    "lambda invocation failed for batch"
                );
                let mut locked = incremental_merge_collector.lock().unwrap();
                for split_id in batch_split_ids {
                    locked.add_failed_split(SplitSearchError {
                        split_id,
                        error: format!("lambda invocation error: {err}"),
                        retryable_error: true,
                    });
                }
            }
        }
    }

    Ok(())
}

struct LocalSearchTask {
    split: SplitIdAndFooterOffsets,
    search_request: SearchRequest,
    search_permit_future: SearchPermitFuture,
}

struct ScheduleSearchTaskResult {
    // The search permit futures associated to each local_search_task are
    // guaranteed to resolve in order.
    local_search_tasks: Vec<LocalSearchTask>,
    // The per-split SearchRequest (already rewritten by `rewrite_request()`) is preserved
    // so that lambda results can be cached with the correct cache key in `leaf_search_cache`.
    offloaded_search_tasks: Vec<(SplitIdAndFooterOffsets, SearchRequest)>,
}

/// Schedule search tasks, either:
/// - locally
/// - remotely on lambdas, if lambda are configured, and the number of tasks scheduled exceed the
///   offload threshold.
async fn schedule_search_tasks(
    mut splits: Vec<(SplitIdAndFooterOffsets, SearchRequest)>,
    searcher_context: &SearcherContext,
) -> ScheduleSearchTaskResult {
    let permit_sizes: Vec<ByteSize> = splits
        .iter()
        .map(|(split, _)| {
            compute_initial_memory_allocation(
                split,
                searcher_context
                    .searcher_config
                    .warmup_single_split_initial_allocation,
            )
        })
        .collect();

    let offload_threshold: usize = if searcher_context.lambda_invoker.is_some()
        && let Some(lambda_config) = &searcher_context.searcher_config.lambda
    {
        lambda_config.offload_threshold
    } else {
        usize::MAX
    };

    let search_permit_futures = searcher_context
        .search_permit_provider
        .get_permits_with_offload(permit_sizes, offload_threshold)
        .await;

    let splits_to_run_on_lambda: Vec<(SplitIdAndFooterOffsets, SearchRequest)> =
        splits.drain(search_permit_futures.len()..).collect();

    let splits_to_run_locally: Vec<LocalSearchTask> = splits
        .into_iter()
        .zip(search_permit_futures)
        .map(
            |((split, search_request), search_permit_future)| LocalSearchTask {
                split,
                search_request,
                search_permit_future,
            },
        )
        .collect();

    ScheduleSearchTaskResult {
        local_search_tasks: splits_to_run_locally,
        offloaded_search_tasks: splits_to_run_on_lambda,
    }
}

/// The leaf search collects all kind of information, and returns a set of
/// [PartialHit] candidates. The root will be in
/// charge to consolidate, identify the actual final top hits to display, and
/// fetch the actual documents to convert the partial hits into actual Hits.
pub async fn single_doc_mapping_leaf_search(
    searcher_context: Arc<SearcherContext>,
    request: Arc<SearchRequest>,
    index_storage: Arc<dyn Storage>,
    splits: Vec<SplitIdAndFooterOffsets>,
    doc_mapper: Arc<DocMapper>,
) -> Result<LeafSearchResponse, SearchError> {
    let num_docs: u64 = splits.iter().map(|split| split.num_docs).sum();
    let num_splits = splits.len();
    info!(num_docs, num_splits, split_offsets = ?PrettySample::new(&splits, 5));

    // We simplify the request as much as possible.
    let split_filter: CanSplitDoBetter =
        CanSplitDoBetter::from_request(&request, doc_mapper.timestamp_field_name());
    let mut split_with_req: Vec<(SplitIdAndFooterOffsets, SearchRequest)> =
        split_filter.optimize(&request, splits)?;
    for (split, single_split_search_request) in &mut split_with_req {
        rewrite_request(
            single_split_search_request,
            split,
            doc_mapper.timestamp_field_name(),
        );
    }
    let split_filter_arc: Arc<RwLock<CanSplitDoBetter>> = Arc::new(RwLock::new(split_filter));

    let merge_collector =
        make_merge_collector(&request, searcher_context.get_aggregation_limits())?;
    let mut incremental_merge_collector = IncrementalCollector::new(merge_collector);

    let split_outcome_counters = Arc::new(SplitSearchOutcomeCounters::new_unregistered());

    // Sort out the splits that are already in the partial result cache.
    let uncached_splits: Vec<(SplitIdAndFooterOffsets, SearchRequest)> =
        process_partial_result_cache(
            &searcher_context.leaf_search_cache,
            split_with_req,
            split_outcome_counters.clone(),
            &mut incremental_merge_collector,
        )?;
    let incremental_merge_collector_arc: Arc<Mutex<IncrementalCollector>> =
        Arc::new(Mutex::new(incremental_merge_collector));

    // Determine which uncached splits to process locally vs offload.
    let ScheduleSearchTaskResult {
        local_search_tasks,
        offloaded_search_tasks,
    } = schedule_search_tasks(uncached_splits, &searcher_context).await;

    // Offload splits to Lambda.
    let run_offloaded_search_tasks_fut = run_offloaded_search_tasks(
        &searcher_context,
        &request,
        &doc_mapper,
        index_storage.uri().clone(),
        offloaded_search_tasks,
        &incremental_merge_collector_arc,
    );

    // Spawn local split search tasks.
    let leaf_search_context = Arc::new(LeafSearchContext {
        searcher_context: searcher_context.clone(),
        split_outcome_counters,
        incremental_merge_collector: incremental_merge_collector_arc.clone(),
        doc_mapper: doc_mapper.clone(),
        split_filter: split_filter_arc.clone(),
    });
    let run_local_search_tasks_fut = run_local_search_tasks(
        local_search_tasks,
        index_storage,
        split_filter_arc,
        leaf_search_context,
    );

    let (offloaded_res, _) =
        tokio::join!(run_offloaded_search_tasks_fut, run_local_search_tasks_fut);
    offloaded_res?;

    // we can't use unwrap_or_clone because mutexes aren't Clone
    let incremental_merge_collector = match Arc::try_unwrap(incremental_merge_collector_arc) {
        Ok(filter_merger) => filter_merger.into_inner().unwrap(),
        Err(filter_merger) => filter_merger.lock().unwrap().clone(),
    };

    let leaf_search_response_result: tantivy::Result<LeafSearchResponse> =
        crate::search_thread_pool()
            .run_cpu_intensive(|| incremental_merge_collector.finalize())
            .instrument(info_span!("incremental_merge_intermediate"))
            .await
            .context("failed to merge split search responses: thread panicked")?;

    Ok(leaf_search_response_result?)
}

async fn run_local_search_tasks(
    local_search_tasks: Vec<LocalSearchTask>,
    index_storage: Arc<dyn Storage + 'static>,
    split_filter_arc: Arc<RwLock<CanSplitDoBetter>>,
    leaf_search_context: Arc<LeafSearchContext>,
) {
    let mut split_search_joinset = JoinSet::new();
    let mut task_id_to_split_id_map = HashMap::with_capacity(local_search_tasks.len());

    for LocalSearchTask {
        split,
        search_request,
        search_permit_future,
    } in local_search_tasks
    {
        let leaf_split_search_permit = search_permit_future
            .instrument(info_span!("waiting_for_leaf_search_split_semaphore"))
            .await;

        // We run simplify search request again: as we push split into the merge collector,
        // we may have discovered that we won't find any better candidates for top hits in this
        // split, in which case we can remove top hits collection.
        let Some(simplified_search_request) =
            simplify_search_request(search_request, &split, &split_filter_arc)
        else {
            let mut leaf_search_state_guard =
                SplitSearchStateGuard::new(leaf_search_context.split_outcome_counters.clone());
            leaf_search_state_guard.set_state(SplitSearchState::PrunedBeforeWarmup);
            continue;
        };
        let split_id = split.split_id.clone();
        let handle = split_search_joinset.spawn(
            leaf_search_single_split_wrapper(
                simplified_search_request,
                leaf_search_context.clone(),
                index_storage.clone(),
                split.clone(),
                leaf_split_search_permit,
            )
            .in_current_span(),
        );
        task_id_to_split_id_map.insert(handle.id(), split_id);
    }

    // Await all local tasks.
    let mut split_search_join_errors: Vec<(String, JoinError)> = Vec::new();

    while let Some(leaf_search_join_result) = split_search_joinset.join_next().await {
        if let Err(join_error) = leaf_search_join_result {
            if join_error.is_cancelled() {
                continue;
            }
            let split_id = task_id_to_split_id_map.get(&join_error.id()).unwrap();
            if join_error.is_panic() {
                error!(split=%split_id, "leaf search task panicked");
            } else {
                error!(split=%split_id, "please report: leaf search was not cancelled, and could not extract panic. this should never happen");
            }
            split_search_join_errors.push((split_id.clone(), join_error));
        }
    }

    let mut incremental_merge_collector_lock = leaf_search_context
        .incremental_merge_collector
        .lock()
        .unwrap();
    for (split_id, split_search_join_error) in split_search_join_errors {
        incremental_merge_collector_lock.add_failed_split(SplitSearchError {
            split_id,
            error: SearchError::from(split_search_join_error).to_string(),
            retryable_error: true,
        });
    }

    info!(split_outcome_counters=%leaf_search_context.split_outcome_counters, "leaf split search finished");
}

/// We identify the splits that are in the cache and append them to the incremental merge collector.
/// The (split, request) that are yet to be processed are returned.
fn process_partial_result_cache(
    leaf_search_cache: &LeafSearchCache,
    split_with_req: Vec<(SplitIdAndFooterOffsets, SearchRequest)>,
    split_outcome_counters: Arc<SplitSearchOutcomeCounters>,
    incremental_merge_collector: &mut IncrementalCollector,
) -> Result<Vec<(SplitIdAndFooterOffsets, SearchRequest)>, SearchError> {
    let mut uncached_splits: Vec<(SplitIdAndFooterOffsets, SearchRequest)> =
        Vec::with_capacity(split_with_req.len());
    for (split, search_request) in split_with_req {
        if let Some(cached_response) = leaf_search_cache
            // TODO remove the clone here.
            .get(split.clone(), search_request.clone())
        {
            let mut split_search_guard = SplitSearchStateGuard::new(split_outcome_counters.clone());
            split_search_guard.set_state(SplitSearchState::CacheHit);
            incremental_merge_collector.add_result(cached_response)?;
        } else {
            uncached_splits.push((split, search_request));
        }
    }
    Ok(uncached_splits)
}

#[derive(Copy, Clone)]
enum SplitSearchState {
    Start,
    CacheHit,
    PrunedBeforeWarmup,
    WarmUp,
    PrunedAfterWarmup,
    CpuQueue,
    Cpu,
    Success,
}

impl SplitSearchState {
    pub fn inc(self, counters: &SplitSearchOutcomeCounters) {
        match self {
            SplitSearchState::Start => counters.cancel_before_warmup.inc(),
            SplitSearchState::CacheHit => counters.cache_hit.inc(),
            SplitSearchState::PrunedBeforeWarmup => counters.pruned_before_warmup.inc(),
            SplitSearchState::WarmUp => counters.cancel_warmup.inc(),
            SplitSearchState::PrunedAfterWarmup => counters.pruned_after_warmup.inc(),
            SplitSearchState::CpuQueue => counters.cancel_cpu_queue.inc(),
            SplitSearchState::Cpu => counters.cancel_cpu.inc(),
            SplitSearchState::Success => counters.success.inc(),
        }
    }
}

impl Drop for SplitSearchStateGuard {
    fn drop(&mut self) {
        self.state
            .inc(&crate::metrics::SEARCH_METRICS.split_search_outcome_total);
        self.state.inc(&self.local_split_search_outcome_counters);
    }
}

struct SplitSearchStateGuard {
    state: SplitSearchState,
    local_split_search_outcome_counters: Arc<SplitSearchOutcomeCounters>,
}

impl SplitSearchStateGuard {
    pub fn new(local_split_search_outcome_counters: Arc<SplitSearchOutcomeCounters>) -> Self {
        SplitSearchStateGuard {
            state: SplitSearchState::Start,
            local_split_search_outcome_counters: local_split_search_outcome_counters.clone(),
        }
    }

    pub fn set_state(&mut self, state: SplitSearchState) {
        self.state = state;
    }
}

struct LeafSearchContext {
    searcher_context: Arc<SearcherContext>,
    split_outcome_counters: Arc<SplitSearchOutcomeCounters>,
    incremental_merge_collector: Arc<Mutex<IncrementalCollector>>,
    doc_mapper: Arc<DocMapper>,
    split_filter: Arc<RwLock<CanSplitDoBetter>>,
}

#[allow(clippy::too_many_arguments)]
#[instrument(skip_all, fields(split_id = split.split_id, num_docs = split.num_docs))]
async fn leaf_search_single_split_wrapper(
    request: SearchRequest,
    ctx: Arc<LeafSearchContext>,
    index_storage: Arc<dyn Storage>,
    split: SplitIdAndFooterOffsets,
    mut search_permit: SearchPermit,
) {
    let timer = crate::SEARCH_METRICS
        .leaf_search_split_duration_secs
        .start_timer();
    let leaf_search_single_split_opt_res: crate::Result<Option<LeafSearchResponse>> =
        leaf_search_single_split(
            request,
            ctx.clone(),
            index_storage,
            split.clone(),
            &mut search_permit,
        )
        .await;

    // Explicitly drop the permit for readability.
    // This should always happen after the ephemeral search cache is dropped.
    std::mem::drop(search_permit);

    if leaf_search_single_split_opt_res.is_ok() {
        timer.observe_duration();
    }

    let mut locked_incremental_merge_collector = ctx.incremental_merge_collector.lock().unwrap();
    match leaf_search_single_split_opt_res {
        Ok(Some(split_search_res)) => {
            if let Err(err) = locked_incremental_merge_collector.add_result(split_search_res) {
                locked_incremental_merge_collector.add_failed_split(SplitSearchError {
                    split_id: split.split_id.clone(),
                    error: format!("Error parsing aggregation result: {err}"),
                    retryable_error: true,
                });
            }
        }
        Ok(None) => {}
        Err(err) => locked_incremental_merge_collector.add_failed_split(SplitSearchError {
            split_id: split.split_id.clone(),
            error: format!("{err}"),
            retryable_error: true,
        }),
    }
    if let Some(last_hit) = locked_incremental_merge_collector.peek_worst_hit() {
        // TODO: we could use the RWLock instead and read the value instead of updating it
        // unconditionally.
        ctx.split_filter
            .write()
            .unwrap()
            .record_new_worst_hit(last_hit.as_ref());
    }
}

#[cfg(test)]
mod tests {
    use std::ops::Bound;

    use async_trait::async_trait;
    use bytes::BufMut;
    use quickwit_config::{LambdaConfig, SearcherConfig};
    use quickwit_directories::write_hotcache;
    use quickwit_proto::search::LambdaSingleSplitResult;
    use rand::Rng;
    use tantivy::TantivyDocument;
    use tantivy::directory::RamDirectory;
    use tantivy::schema::{
        BytesOptions, FieldEntry, Schema, TextFieldIndexing, TextOptions, Value,
    };

    use super::*;
    use crate::LambdaLeafSearchInvoker;

    fn bool_filter(ast: impl Into<QueryAst>) -> QueryAst {
        BoolQuery {
            must: vec![QueryAst::MatchAll],
            filter: vec![ast.into()],
            ..Default::default()
        }
        .into()
    }

    #[track_caller]
    fn assert_ast_eq(got: &SearchRequest, expected: &QueryAst) {
        let got_ast: QueryAst = serde_json::from_str(&got.query_ast).unwrap();
        assert_eq!(&got_ast, expected);
        assert!(got.start_timestamp.is_none());
        assert!(got.end_timestamp.is_none());
    }

    #[track_caller]
    fn remove_timestamp_test_case(
        request: &SearchRequest,
        split: &SplitIdAndFooterOffsets,
        expected: Option<RangeQuery>,
    ) {
        let timestamp_field = "timestamp";

        // test the query directly
        let mut request_direct = request.clone();
        remove_redundant_timestamp_range(&mut request_direct, split, timestamp_field);
        let expected_direct = expected
            .clone()
            .map(bool_filter)
            .unwrap_or(QueryAst::MatchAll);
        assert_ast_eq(&request_direct, &expected_direct);
    }

    #[test]
    fn test_remove_timestamp_range() {
        const S_TO_NS: i64 = 1_000_000_000;
        let time1 = 1700001000;
        let time2 = 1700002000;
        let time3 = 1700003000;
        let time4 = 1700004000;

        let timestamp_field = "timestamp".to_string();

        // cases where the bounds are larger than the split: no bound is emitted
        let split = SplitIdAndFooterOffsets {
            timestamp_start: Some(time2),
            timestamp_end: Some(time3),
            ..SplitIdAndFooterOffsets::default()
        };

        let search_request = SearchRequest {
            query_ast: serde_json::to_string(&QueryAst::Range(RangeQuery {
                field: timestamp_field.to_string(),
                lower_bound: Bound::Included(time1.into()),
                // *1000 has no impact, we detect timestamp in ms instead of s
                upper_bound: Bound::Included((time4 * 1000).into()),
            }))
            .unwrap(),
            ..SearchRequest::default()
        };
        remove_timestamp_test_case(&search_request, &split, None);

        let search_request = SearchRequest {
            query_ast: serde_json::to_string(&QueryAst::Range(RangeQuery {
                field: timestamp_field.to_string(),
                lower_bound: Bound::Included(time1.into()),
                upper_bound: Bound::Included(time3.into()),
            }))
            .unwrap(),
            ..SearchRequest::default()
        };
        remove_timestamp_test_case(&search_request, &split, None);

        let search_request = SearchRequest {
            query_ast: serde_json::to_string(&QueryAst::MatchAll).unwrap(),
            start_timestamp: Some(time1),
            end_timestamp: Some(time4),
            ..SearchRequest::default()
        };
        remove_timestamp_test_case(&search_request, &split, None);

        // request bound that are exclusive are treated properly
        let expected_upper_exclusive = RangeQuery {
            field: timestamp_field.to_string(),
            lower_bound: Bound::Unbounded,
            upper_bound: Bound::Excluded((time3 * S_TO_NS).into()),
        };
        let search_request = SearchRequest {
            query_ast: serde_json::to_string(&QueryAst::Range(RangeQuery {
                field: timestamp_field.to_string(),
                lower_bound: Bound::Included(time1.into()),
                upper_bound: Bound::Excluded(time3.into()),
            }))
            .unwrap(),
            ..SearchRequest::default()
        };
        remove_timestamp_test_case(
            &search_request,
            &split,
            Some(expected_upper_exclusive.clone()),
        );

        let search_request = SearchRequest {
            query_ast: serde_json::to_string(&QueryAst::MatchAll).unwrap(),
            start_timestamp: Some(time1),
            end_timestamp: Some(time3),
            ..SearchRequest::default()
        };
        remove_timestamp_test_case(
            &search_request,
            &split,
            Some(expected_upper_exclusive.clone()),
        );

        let expected_lower_exclusive = RangeQuery {
            field: timestamp_field.to_string(),
            lower_bound: Bound::Excluded((time2 * S_TO_NS).into()),
            upper_bound: Bound::Unbounded,
        };
        let search_request = SearchRequest {
            query_ast: serde_json::to_string(&QueryAst::Range(RangeQuery {
                field: timestamp_field.to_string(),
                lower_bound: Bound::Excluded(time2.into()),
                upper_bound: Bound::Included(time3.into()),
            }))
            .unwrap(),
            ..SearchRequest::default()
        };
        remove_timestamp_test_case(
            &search_request,
            &split,
            Some(expected_lower_exclusive.clone()),
        );

        // we take the most restrictive bounds
        let split = SplitIdAndFooterOffsets {
            timestamp_start: Some(time1),
            timestamp_end: Some(time4),
            ..SplitIdAndFooterOffsets::default()
        };

        let expected_upper_2_ex = RangeQuery {
            field: timestamp_field.to_string(),
            lower_bound: Bound::Unbounded,
            upper_bound: Bound::Excluded((time2 * S_TO_NS).into()),
        };
        let search_request = SearchRequest {
            query_ast: serde_json::to_string(&QueryAst::Range(RangeQuery {
                field: timestamp_field.to_string(),
                lower_bound: Bound::Included(time1.into()),
                upper_bound: Bound::Included(time3.into()),
            }))
            .unwrap(),
            start_timestamp: Some(time1),
            end_timestamp: Some(time2),
            ..SearchRequest::default()
        };
        remove_timestamp_test_case(&search_request, &split, Some(expected_upper_2_ex));

        let expected_upper_2_inc = RangeQuery {
            field: timestamp_field.to_string(),
            lower_bound: Bound::Unbounded,
            upper_bound: Bound::Included((time2 * S_TO_NS).into()),
        };
        let search_request = SearchRequest {
            query_ast: serde_json::to_string(&QueryAst::Range(RangeQuery {
                field: timestamp_field.to_string(),
                lower_bound: Bound::Included(time1.into()),
                upper_bound: Bound::Included(time2.into()),
            }))
            .unwrap(),
            start_timestamp: Some(time1),
            end_timestamp: Some(time3),
            ..SearchRequest::default()
        };
        remove_timestamp_test_case(&search_request, &split, Some(expected_upper_2_inc));

        let expected_lower_3 = RangeQuery {
            field: timestamp_field.to_string(),
            lower_bound: Bound::Included((time3 * S_TO_NS).into()),
            upper_bound: Bound::Unbounded,
        };

        let search_request = SearchRequest {
            query_ast: serde_json::to_string(&QueryAst::Range(RangeQuery {
                field: timestamp_field.to_string(),
                lower_bound: Bound::Included(time2.into()),
                upper_bound: Bound::Included(time4.into()),
            }))
            .unwrap(),
            start_timestamp: Some(time3),
            end_timestamp: Some(time4 + 1),
            ..SearchRequest::default()
        };
        remove_timestamp_test_case(&search_request, &split, Some(expected_lower_3.clone()));

        let search_request = SearchRequest {
            query_ast: serde_json::to_string(&QueryAst::Range(RangeQuery {
                field: timestamp_field.to_string(),
                lower_bound: Bound::Included(time3.into()),
                upper_bound: Bound::Included(time4.into()),
            }))
            .unwrap(),
            start_timestamp: Some(time2),
            end_timestamp: Some(time4 + 1),
            ..SearchRequest::default()
        };
        remove_timestamp_test_case(&search_request, &split, Some(expected_lower_3));

        let mut search_request = SearchRequest {
            query_ast: serde_json::to_string(&QueryAst::MatchAll).unwrap(),
            start_timestamp: Some(time1),
            end_timestamp: Some(time4),
            ..SearchRequest::default()
        };
        let split = SplitIdAndFooterOffsets {
            timestamp_start: Some(time2),
            timestamp_end: Some(time3),
            ..SplitIdAndFooterOffsets::default()
        };
        remove_redundant_timestamp_range(&mut search_request, &split, &timestamp_field);
        assert_ast_eq(&search_request, &QueryAst::MatchAll);
    }

    // regression test for #4935
    #[test]
    fn test_remove_timestamp_range_keep_should() {
        let time1 = 1700001000;
        let time2 = 1700002000;
        let time3 = 1700003000;

        let timestamp_field = "timestamp".to_string();

        // cases where the bounds are larger than the split: no bound is emitted
        let split = SplitIdAndFooterOffsets {
            timestamp_start: Some(time1),
            timestamp_end: Some(time3),
            ..SplitIdAndFooterOffsets::default()
        };

        let mut search_request = SearchRequest {
            query_ast: serde_json::to_string(&QueryAst::Bool(BoolQuery {
                should: vec![QueryAst::MatchAll],
                ..BoolQuery::default()
            }))
            .unwrap(),
            start_timestamp: Some(time2),
            end_timestamp: None,
            ..SearchRequest::default()
        };
        remove_redundant_timestamp_range(&mut search_request, &split, &timestamp_field);
        assert_ast_eq(
            &search_request,
            &QueryAst::Bool(BoolQuery {
                // original request
                must: vec![QueryAst::Bool(BoolQuery {
                    should: vec![QueryAst::MatchAll],
                    ..BoolQuery::default()
                })],
                // time bound
                filter: vec![
                    RangeQuery {
                        field: "timestamp".to_string(),
                        lower_bound: Bound::Included(1_700_002_000_000_000_000u64.into()),
                        upper_bound: Bound::Unbounded,
                    }
                    .into(),
                ],
                ..BoolQuery::default()
            }),
        );
    }

    #[test]
    fn test_remove_extended_bounds_from_histogram() {
        let histo_at_root = r#"
{
  "date_histo": {
    "date_histogram": {
      "extended_bounds": {
        "max": 1425254400000,
        "min": 1420070400000
      },
      "field": "date",
      "fixed_interval": "30d",
      "offset": "-4d"
    }
  }
}
"#;

        let histo_at_root_no_bounds = r#"
{
  "date_histo": {
    "date_histogram": {
      "field": "date",
      "fixed_interval": "30d",
      "offset": "-4d"
    }
  }
}
"#;

        let histo_at_root_with_sibling = r#"
{
  "metrics": {
    "aggs": {
      "response": {
        "percentiles": {
          "field": "response",
          "keyed": false,
          "percents": [
            85
          ]
        }
      }
    },
    "date_histogram": {
      "extended_bounds": {
        "max": 1425254400000,
        "min": 1420070400000
      },
      "field": "date",
      "fixed_interval": "30d",
      "offset": "-4d"
    }
  }
}
"#;

        let histo_at_root_with_sibling_no_bounds = r#"
{
  "metrics": {
    "aggs": {
      "response": {
        "percentiles": {
          "field": "response",
          "keyed": false,
          "percents": [
            85
          ]
        }
      }
    },
    "date_histogram": {
      "field": "date",
      "fixed_interval": "30d",
      "offset": "-4d"
    }
  }
}
"#;
        let histo_at_leaf = r#"
{
  "metrics": {
    "aggs": {
      "response": {
        "date_histogram": {
          "extended_bounds": {
            "max": 1425254400000,
            "min": 1420070400000
          },
          "field": "date",
          "fixed_interval": "30d",
          "offset": "-4d"
        }
      }
    },
    "percentiles": {
      "field": "response",
      "keyed": false,
      "percents": [
        85
      ]
    }
  }
}
"#;

        let histo_at_leaf_no_bounds = r#"
{
  "metrics": {
    "aggs": {
      "response": {
        "date_histogram": {
          "field": "date",
          "fixed_interval": "30d",
          "offset": "-4d"
        }
      }
    },
    "percentiles": {
      "field": "response",
      "keyed": false,
      "percents": [
        85
      ]
    }
  }
}
"#;
        for (bounds, no_bounds) in [
            (histo_at_root, histo_at_root_no_bounds),
            (
                histo_at_root_with_sibling,
                histo_at_root_with_sibling_no_bounds,
            ),
            (histo_at_leaf, histo_at_leaf_no_bounds),
        ] {
            // first assert we do nothing when there are no bounds
            let request_no_bounds = SearchRequest {
                aggregation_request: Some(no_bounds.to_string()),
                ..SearchRequest::default()
            };
            let mut request_no_bounds_clone = request_no_bounds.clone();
            rewrite_aggregation(&mut request_no_bounds_clone);
            assert_eq!(request_no_bounds, request_no_bounds_clone);

            let mut request_bounds = SearchRequest {
                aggregation_request: Some(bounds.to_string()),
                ..SearchRequest::default()
            };
            rewrite_aggregation(&mut request_bounds);
            // we can't just compare bounds and no_bounds, they must be structuraly equal, but not
            // necessarily identical (field order, null vs absent...). So we parse both and verify
            // the results are equal instead
            let no_bounds_agg: QuickwitAggregations =
                serde_json::from_str(&request_no_bounds.aggregation_request.unwrap()).unwrap();
            let rewrote_bounds_agg: QuickwitAggregations =
                serde_json::from_str(&request_bounds.aggregation_request.unwrap()).unwrap();
            assert_eq!(rewrote_bounds_agg, no_bounds_agg);
        }
    }

    fn create_tantivy_dir_with_hotcache<'a, V>(
        field_entry: FieldEntry,
        field_value: V,
    ) -> (HotDirectory, usize)
    where
        V: Value<'a>,
    {
        let field_name = field_entry.name().to_string();
        let mut schema_builder = Schema::builder();
        schema_builder.add_field(field_entry);
        let schema = schema_builder.build();

        let ram_directory = RamDirectory::create();
        let index = Index::open_or_create(ram_directory.clone(), schema.clone()).unwrap();

        let mut index_writer = index.writer(15_000_000).unwrap();
        let field = schema.get_field(&field_name).unwrap();
        let mut new_doc = TantivyDocument::default();
        new_doc.add_field_value(field, field_value);
        index_writer.add_document(new_doc).unwrap();
        index_writer.commit().unwrap();

        let mut hotcache_bytes_writer = Vec::new().writer();
        write_hotcache(ram_directory.clone(), &mut hotcache_bytes_writer).unwrap();
        let hotcache_bytes = OwnedBytes::new(hotcache_bytes_writer.into_inner());
        let hot_directory = HotDirectory::open(ram_directory.clone(), hotcache_bytes).unwrap();
        (hot_directory, ram_directory.total_mem_usage())
    }

    #[test]
    fn test_compute_index_size_without_store() {
        // We don't want to make assertions on absolute index sizes (it might
        // change in future Tantivy versions), but rather verify that the store
        // is properly excluded from the computed size.

        // We use random bytes so that the store can't compress them
        let mut payload = vec![0u8; 1024];
        rand::rng().fill(&mut payload[..]);

        let (hotcache_directory_stored_payload, directory_size_stored_payload) =
            create_tantivy_dir_with_hotcache(
                FieldEntry::new_bytes("payload".to_string(), BytesOptions::default().set_stored()),
                &payload,
            );
        let size_with_stored_payload =
            compute_index_size(&hotcache_directory_stored_payload).as_u64();

        let (hotcache_directory_index_only, directory_size_index_only) =
            create_tantivy_dir_with_hotcache(
                FieldEntry::new_bytes("payload".to_string(), BytesOptions::default()),
                &payload,
            );
        let size_index_only = compute_index_size(&hotcache_directory_index_only).as_u64();

        assert!(directory_size_stored_payload > directory_size_index_only + 1000);
        assert!(size_with_stored_payload.abs_diff(size_index_only) < 10);
    }

    #[test]
    fn test_compute_index_size_varies_with_data() {
        // We don't want to make assertions on absolute index sizes (it might
        // change in future Tantivy versions), but rather verify that an index
        // with more data is indeed bigger.

        let indexing_options =
            TextOptions::default().set_indexing_options(TextFieldIndexing::default());

        let (hotcache_directory_larger, directory_size_larger) = create_tantivy_dir_with_hotcache(
            FieldEntry::new_text("text".to_string(), indexing_options.clone()),
            "Sed ut perspiciatis unde omnis iste natus error sit voluptatem accusantium \
             doloremque laudantium, totam rem aperiam, eaque ipsa quae ab illo inventore \
             veritatis et quasi architecto beatae vitae dicta sunt explicabo. Nemo enim ipsam \
             voluptatem quia voluptas sit aspernatur aut odit aut fugit, sed quia consequuntur \
             magni dolores eos qui ratione voluptatem sequi nesciunt. Neque porro quisquam est, \
             qui dolorem ipsum quia dolor sit amet, consectetur, adipisci velit, sed quia non \
             numquam eius modi tempora incidunt ut labore et dolore magnam aliquam quaerat \
             voluptatem. Ut enim ad minima veniam, quis nostrum exercitationem ullam corporis \
             suscipit laboriosam, nisi ut aliquid ex ea commodi consequatur? Quis autem vel eum \
             iure reprehenderit qui in ea voluptate velit esse quam nihil molestiae consequatur, \
             vel illum qui dolorem eum fugiat quo voluptas nulla pariatur?",
        );
        let larger_size = compute_index_size(&hotcache_directory_larger).as_u64();

        let (hotcache_directory_smaller, directory_size_smaller) = create_tantivy_dir_with_hotcache(
            FieldEntry::new_text("text".to_string(), indexing_options),
            "hi",
        );
        let smaller_size = compute_index_size(&hotcache_directory_smaller).as_u64();

        assert!(directory_size_larger > directory_size_smaller + 100);
        assert!(larger_size > smaller_size + 100);
    }

    fn nz(n: usize) -> std::num::NonZeroUsize {
        std::num::NonZeroUsize::new(n).unwrap()
    }

    #[test]
    fn test_greedy_batch_split_empty() {
        let items: Vec<u64> = vec![];
        let batches = super::greedy_batch_split(items, |&x| x, nz(5));
        assert!(batches.is_empty());
    }

    #[test]
    fn test_greedy_batch_split_single_batch() {
        let items = vec![10u64, 20, 30];
        let batches = super::greedy_batch_split(items, |&x| x, nz(10));
        assert_eq!(batches.len(), 1);
        assert_eq!(batches[0].len(), 3);
    }

    #[test]
    fn test_greedy_batch_split_balances_weights() {
        // 7 items with weights, max 3 per batch -> 3 batches
        let items = vec![100u64, 80, 60, 50, 40, 30, 20];
        let batches = super::greedy_batch_split(items, |&x| x, nz(3));

        assert_eq!(batches.len(), 3);

        // All items should be present
        let mut all_items: Vec<u64> = batches.iter().flatten().copied().collect();
        all_items.sort_unstable();
        assert_eq!(all_items, vec![20, 30, 40, 50, 60, 80, 100]);

        // Check weights are reasonably balanced
        let weights: Vec<u64> = batches.iter().map(|b| b.iter().sum()).collect();
        let max_weight = *weights.iter().max().unwrap();
        let min_weight = *weights.iter().min().unwrap();
        // With greedy LPT, the imbalance should be bounded
        assert!(
            max_weight <= min_weight * 2,
            "weights should be reasonably balanced: {:?}",
            weights
        );
    }

    #[test]
    fn test_greedy_batch_split_count_balance() {
        // 10 items, max 3 per batch -> 4 batches
        // counts should be either 2 or 3 per batch
        let items: Vec<u64> = (0..10).collect();
        let batches = super::greedy_batch_split(items, |&x| x, nz(3));

        assert_eq!(batches.len(), 4);
        let counts: Vec<usize> = batches.iter().map(|b| b.len()).collect();
        for count in &counts {
            assert!(
                *count >= 2 && *count <= 3,
                "count should be 2 or 3, got {}",
                count
            );
        }
        assert_eq!(counts.iter().sum::<usize>(), 10);
    }

    fn make_splits_with_requests(
        num_splits: usize,
    ) -> Vec<(SplitIdAndFooterOffsets, SearchRequest)> {
        (0..num_splits)
            .map(|idx| {
                let split = SplitIdAndFooterOffsets {
                    split_id: format!("split_{idx}"),
                    num_docs: 100,
                    ..Default::default()
                };
                (split, SearchRequest::default())
            })
            .collect()
    }

    #[tokio::test]
    async fn test_schedule_search_tasks_no_lambda_all_local() {
        let searcher_context = SearcherContext::for_test();
        let splits = make_splits_with_requests(5);
        let result = super::schedule_search_tasks(splits, &searcher_context).await;
        assert_eq!(result.local_search_tasks.len(), 5);
        assert!(result.offloaded_search_tasks.is_empty());
        for (idx, task) in result.local_search_tasks.iter().enumerate() {
            assert_eq!(task.split.split_id, format!("split_{idx}"));
        }
    }

    struct DummyInvoker;
    #[async_trait]
    impl LambdaLeafSearchInvoker for DummyInvoker {
        async fn invoke_leaf_search(
            &self,
            _req: LeafSearchRequest,
        ) -> Result<Vec<LambdaSingleSplitResult>, SearchError> {
            todo!()
        }
    }

    #[tokio::test]
    async fn test_schedule_search_tasks_lambda_offloads_excess() {
        let mut config = SearcherConfig::default();
        config.lambda = Some(LambdaConfig {
            offload_threshold: 3,
            ..LambdaConfig::for_test()
        });
        let searcher_context = SearcherContext::new(config, None, Some(Arc::new(DummyInvoker)));
        let splits = make_splits_with_requests(7);
        let result = super::schedule_search_tasks(splits, &searcher_context).await;
        assert_eq!(result.local_search_tasks.len(), 3);
        assert_eq!(result.offloaded_search_tasks.len(), 4);
        for (idx, task) in result.local_search_tasks.iter().enumerate() {
            assert_eq!(task.split.split_id, format!("split_{idx}"));
        }
        for (idx, (split, _req)) in result.offloaded_search_tasks.iter().enumerate() {
            assert_eq!(split.split_id, format!("split_{}", idx + 3));
        }
    }

    #[tokio::test]
    async fn test_schedule_search_tasks_lambda_threshold_zero_offloads_all() {
        let mut config = SearcherConfig::default();
        config.lambda = Some(LambdaConfig {
            offload_threshold: 0,
            ..LambdaConfig::for_test()
        });
        let searcher_context = SearcherContext::new(config, None, Some(Arc::new(DummyInvoker)));
        let splits = make_splits_with_requests(5);
        let result = super::schedule_search_tasks(splits, &searcher_context).await;
        assert!(result.local_search_tasks.is_empty());
        assert_eq!(result.offloaded_search_tasks.len(), 5);
    }

    #[tokio::test]
    async fn test_schedule_search_tasks_lambda_threshold_above_split_count() {
        let mut config = SearcherConfig::default();
        config.lambda = Some(LambdaConfig {
            offload_threshold: 100,
            ..LambdaConfig::for_test()
        });
        let searcher_context = SearcherContext::new(config, None, Some(Arc::new(DummyInvoker)));
        let splits = make_splits_with_requests(5);
        let result = super::schedule_search_tasks(splits, &searcher_context).await;
        assert_eq!(result.local_search_tasks.len(), 5);
        assert!(result.offloaded_search_tasks.is_empty());
    }

    #[tokio::test]
    async fn test_schedule_search_tasks_empty() {
        let searcher_context = SearcherContext::for_test();
        let result = super::schedule_search_tasks(Vec::new(), &searcher_context).await;
        assert!(result.local_search_tasks.is_empty());
        assert!(result.offloaded_search_tasks.is_empty());
    }

    mod proptest_greedy_batch {
        use std::num::NonZeroUsize;

        use proptest::prelude::*;

        proptest! {
            #[test]
            fn all_items_preserved(
                items in prop::collection::vec(0u64..1000, 0..100),
                max_per_batch in 1usize..20
            ) {
                let original: Vec<u64> = items.clone();
                let max_per_batch = NonZeroUsize::new(max_per_batch).unwrap();
                let batches = super::super::greedy_batch_split(items, |&x| x, max_per_batch);

                // All items should be present exactly once
                let mut result: Vec<u64> = batches.into_iter().flatten().collect();
                result.sort_unstable();
                let mut expected = original;
                expected.sort_unstable();
                prop_assert_eq!(result, expected);
            }

            #[test]
            fn batch_count_correct(
                items in prop::collection::vec(0u64..1000, 1..100),
                max_per_batch in 1usize..20
            ) {
                let n = items.len();
                let max_per_batch_nz = NonZeroUsize::new(max_per_batch).unwrap();
                let batches = super::super::greedy_batch_split(items, |&x| x, max_per_batch_nz);

                let expected_batches = n.div_ceil(max_per_batch);
                prop_assert_eq!(batches.len(), expected_batches);
            }

            #[test]
            fn total_items_matches(
                items in prop::collection::vec(0u64..1000, 1..100),
                max_per_batch in 1usize..20
            ) {
                let n = items.len();
                let max_per_batch = NonZeroUsize::new(max_per_batch).unwrap();
                let batches = super::super::greedy_batch_split(items, |&x| x, max_per_batch);

                // Total items across all batches equals input
                let total: usize = batches.iter().map(|b| b.len()).sum();
                prop_assert_eq!(total, n);
            }

            #[test]
            fn greedy_balances_by_weight_not_count(
                // Use items with significant weights to test weight balancing
                items in prop::collection::vec(100u64..1000, 4..30),
                max_per_batch in 2usize..10
            ) {
                let max_per_batch = NonZeroUsize::new(max_per_batch).unwrap();
                let batches = super::super::greedy_batch_split(items, |&x| x, max_per_batch);

                if batches.len() >= 2 {
                    let weights: Vec<u64> = batches.iter().map(|b| b.iter().sum()).collect();
                    let total_weight: u64 = weights.iter().sum();
                    let avg_weight = total_weight / batches.len() as u64;

                    // LPT guarantees max makespan <= (4/3) * optimal
                    // With balanced input, max should be close to average
                    let max_weight = *weights.iter().max().unwrap();

                    // Max weight should be at most 2x average (generous bound)
                    prop_assert!(
                        max_weight <= avg_weight * 2 + 1000, // +1000 for rounding slack
                        "max weight {} too far from average {}",
                        max_weight,
                        avg_weight
                    );
                }
            }
        }
    }
}


================================================
FILE: quickwit/quickwit-search/src/leaf_cache.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::ops::{Bound, RangeBounds};

use prost::Message;
use quickwit_config::CacheConfig;
use quickwit_proto::search::{
    CountHits, LeafSearchResponse, SearchRequest, SplitIdAndFooterOffsets,
};
use quickwit_proto::types::SplitId;
use quickwit_storage::{MemorySizedCache, OwnedBytes};
use tantivy::index::SegmentId;

/// A cache to memoize `leaf_search_single_split` results.
pub struct LeafSearchCache {
    content: MemorySizedCache<CacheKey>,
}

// TODO we could be smarter about search_after. If we have a cached request with a search_after
// (possibly equal to None) A, and a corresponding response with the 1st element having the value
// B, and we receive a 2nd request with a search_after such that A <= C < B, we can serve from
// cache directly. Only the case A = C < B is currently handled.
// TODO if we don't request counting all results, have no aggregation, and we get a request we can
// match, the merged_time_range is strictly smaller, and every hit we had fits in the new
// timebound, we can reply from cache, saying we hit only result.partial_hits.len() res. It always
// undercount, and necessarily returns the right hits.
// TODO if we stored a result for X hits, but a subsequent request asks for Y < X hits, we can
// modify the answer and serve from cache.
// TODO mix of 1 and 3.
// TODO this means given a request for X documents, we could search for k*X docs in each split,
// truncate to X while merging, and get free results from cache for at least the next k subsequent
// queries which vary only by search_after.

impl LeafSearchCache {
    pub fn new(config: &CacheConfig) -> LeafSearchCache {
        LeafSearchCache {
            content: MemorySizedCache::from_config(
                config,
                &quickwit_storage::STORAGE_METRICS.partial_request_cache,
            ),
        }
    }
    pub fn get(
        &self,
        split_info: SplitIdAndFooterOffsets,
        search_request: SearchRequest,
    ) -> Option<LeafSearchResponse> {
        let key = CacheKey::from_split_meta_and_request(split_info, search_request);
        let encoded_result = self.content.get(&key)?;
        // this should never fail
        LeafSearchResponse::decode(&*encoded_result).ok()
    }

    pub fn put(
        &self,
        split_info: SplitIdAndFooterOffsets,
        search_request: SearchRequest,
        result: LeafSearchResponse,
    ) {
        let key = CacheKey::from_split_meta_and_request(split_info, search_request);
        let encoded_result = result.encode_to_vec();
        self.content.put(key, OwnedBytes::new(encoded_result));
    }
}

/// A key inside a [`LeafSearchCache`].
#[derive(Debug, Hash, Clone, PartialEq, Eq)]
struct CacheKey {
    /// The split this entry refers to
    split_id: SplitId,
    /// The request this matches. The timerange of the request was removed.
    request: SearchRequest,
    /// The effective time range of the request, that is, the intersection of the timerange
    /// requested, and the timerange covered by the split.
    merged_time_range: HalfOpenRange,
}

impl CacheKey {
    fn from_split_meta_and_request(
        split_info: SplitIdAndFooterOffsets,
        mut search_request: SearchRequest,
    ) -> Self {
        let split_time_range = HalfOpenRange::from_bounds(split_info.time_range());
        let request_time_range = HalfOpenRange::from_bounds(search_request.time_range());
        let merged_time_range = request_time_range.intersect(&split_time_range);

        search_request.start_timestamp = None;
        search_request.end_timestamp = None;
        // it doesn't matter whether or not we count all hits at the scale of a
        // single split: either we did process it and got everything, or we didn't.
        search_request.count_hits = CountHits::CountAll.into();

        CacheKey {
            split_id: split_info.split_id,
            request: search_request,
            merged_time_range,
        }
    }
}

/// A (half-open) range bounded inclusively below and exclusively above [start..end).
#[derive(Debug, Copy, Clone, PartialEq, Eq, Hash)]
struct HalfOpenRange {
    start: i64,
    end: Option<i64>,
}

impl HalfOpenRange {
    fn empty_range() -> HalfOpenRange {
        HalfOpenRange {
            start: 0,
            end: Some(0),
        }
    }

    /// Create a Range from bounds.
    fn from_bounds(range: impl RangeBounds<i64>) -> Self {
        let start = match range.start_bound() {
            Bound::Included(start) => *start,
            Bound::Excluded(start) => {
                // if we exclude i64::MAX from the start bound, the range is necessarily empty
                if let Some(start) = start.checked_add(1) {
                    start
                } else {
                    return Self::empty_range();
                }
            }
            Bound::Unbounded => i64::MIN,
        };
        let end = match range.end_bound() {
            // if we include i64::MAX at the end bound, this is essentially boundless
            Bound::Included(end) => end.checked_add(1),
            Bound::Excluded(end) => Some(*end),
            Bound::Unbounded => None,
        };

        HalfOpenRange { start, end }.normalize()
    }

    fn is_empty(self) -> bool {
        !self.contains(&self.start)
    }

    /// Normalize empty ranges to be 0..0
    fn normalize(self) -> HalfOpenRange {
        if self.is_empty() {
            Self::empty_range()
        } else {
            self
        }
    }

    /// Return the intersection of self and other.
    fn intersect(&self, other: &HalfOpenRange) -> HalfOpenRange {
        let start = self.start.max(other.start);
        let end = match (self.end, other.end) {
            (Some(this), Some(other)) => Some(this.min(other)),
            (Some(this), None) => Some(this),
            (None, other) => other,
        };
        HalfOpenRange { start, end }.normalize()
    }
}

impl RangeBounds<i64> for HalfOpenRange {
    fn start_bound(&self) -> Bound<&i64> {
        Bound::Included(&self.start)
    }

    fn end_bound(&self) -> Bound<&i64> {
        if let Some(end_bound) = &self.end {
            Bound::Excluded(end_bound)
        } else {
            Bound::Unbounded
        }
    }
}

pub struct PredicateCacheImpl {
    content: MemorySizedCache<(SplitId, String)>,
}

impl PredicateCacheImpl {
    pub fn new(config: &CacheConfig) -> Self {
        PredicateCacheImpl {
            content: MemorySizedCache::from_config(
                config,
                &quickwit_storage::STORAGE_METRICS.predicate_cache,
            ),
        }
    }
}

impl quickwit_query::query_ast::PredicateCache for PredicateCacheImpl {
    fn get(
        &self,
        split_id: SplitId,
        query_ast_json: String,
    ) -> Option<(SegmentId, quickwit_query::query_ast::HitSet)> {
        let encoded_result = self.content.get(&(split_id, query_ast_json))?;
        let (segment_id_bytes, hits_buffer) = encoded_result.split(32);
        let segment_id =
            SegmentId::from_uuid_string(str::from_utf8(&segment_id_bytes).ok()?).ok()?;
        let hits = quickwit_query::query_ast::HitSet::from_buffer(hits_buffer);
        Some((segment_id, hits))
    }

    fn put(
        &self,
        split_id: SplitId,
        query_ast_json: String,
        segment: SegmentId,
        hits: quickwit_query::query_ast::HitSet,
    ) {
        let hits_buffer = hits.into_buffer();
        let mut buffer = Vec::with_capacity(32 + hits_buffer.len());
        buffer.extend_from_slice(segment.uuid_string().as_bytes());
        buffer.extend_from_slice(&hits_buffer);
        self.content
            .put((split_id, query_ast_json), OwnedBytes::new(buffer));
    }
}

#[cfg(test)]
mod tests {
    use bytesize::ByteSize;
    use quickwit_proto::search::{
        LeafSearchResponse, PartialHit, ResourceStats, SearchRequest, SortValue,
        SplitIdAndFooterOffsets,
    };

    use super::LeafSearchCache;

    #[test]
    fn test_leaf_search_cache_no_timestamp() {
        let cache = LeafSearchCache::new(&ByteSize::mb(64).into());

        let split_1 = SplitIdAndFooterOffsets {
            split_id: "split_1".to_string(),
            split_footer_start: 0,
            split_footer_end: 100,
            timestamp_start: None,
            timestamp_end: None,
            num_docs: 0,
        };

        let split_2 = SplitIdAndFooterOffsets {
            split_id: "split_2".to_string(),
            split_footer_start: 0,
            split_footer_end: 100,
            timestamp_start: None,
            timestamp_end: None,
            num_docs: 0,
        };

        let query_1 = SearchRequest {
            index_id_patterns: vec!["test-idx".to_string()],
            query_ast: "test".to_string(),
            start_timestamp: None,
            end_timestamp: None,
            max_hits: 10,
            start_offset: 0,
            ..Default::default()
        };

        let query_2 = SearchRequest {
            index_id_patterns: vec!["test-idx".to_string()],
            query_ast: "test2".to_string(),
            start_timestamp: None,
            end_timestamp: None,
            max_hits: 10,
            start_offset: 0,
            ..Default::default()
        };

        let result = LeafSearchResponse {
            failed_splits: Vec::new(),
            intermediate_aggregation_result: None,
            num_attempted_splits: 1,
            num_successful_splits: 1,
            num_hits: 1234,
            partial_hits: vec![PartialHit {
                doc_id: 1,
                segment_ord: 0,
                sort_value: Some(SortValue::U64(0u64).into()),
                sort_value2: None,
                split_id: "split_1".to_string(),
            }],
            resource_stats: None,
        };

        assert!(cache.get(split_1.clone(), query_1.clone()).is_none());

        cache.put(split_1.clone(), query_1.clone(), result.clone());
        assert_eq!(cache.get(split_1.clone(), query_1.clone()).unwrap(), result);
        assert!(cache.get(split_2, query_1).is_none());
        assert!(cache.get(split_1, query_2).is_none());
    }

    #[test]
    fn test_leaf_search_cache_timestamp() {
        let cache = LeafSearchCache::new(&ByteSize::mb(64).into());

        let split_1 = SplitIdAndFooterOffsets {
            split_id: "split_1".to_string(),
            split_footer_start: 0,
            split_footer_end: 100,
            timestamp_start: Some(100),
            timestamp_end: Some(199),
            num_docs: 0,
        };
        let split_2 = SplitIdAndFooterOffsets {
            split_id: "split_2".to_string(),
            split_footer_start: 0,
            split_footer_end: 100,
            timestamp_start: Some(150),
            timestamp_end: Some(249),
            num_docs: 0,
        };
        let split_3 = SplitIdAndFooterOffsets {
            split_id: "split_3".to_string(),
            split_footer_start: 0,
            split_footer_end: 100,
            timestamp_start: Some(150),
            timestamp_end: Some(249),
            num_docs: 0,
        };

        let query_1 = SearchRequest {
            index_id_patterns: vec!["test-idx".to_string()],
            query_ast: "test".to_string(),
            start_timestamp: Some(100),
            end_timestamp: Some(250),
            max_hits: 10,
            start_offset: 0,
            ..Default::default()
        };
        let query_1bis = SearchRequest {
            index_id_patterns: vec!["test-idx".to_string()],
            query_ast: "test".to_string(),
            start_timestamp: Some(150),
            end_timestamp: Some(300),
            max_hits: 10,
            start_offset: 0,
            ..Default::default()
        };

        let query_2 = SearchRequest {
            index_id_patterns: vec!["test-idx".to_string()],
            query_ast: "test2".to_string(),
            start_timestamp: None,
            end_timestamp: None,
            max_hits: 10,
            start_offset: 0,
            ..Default::default()
        };
        let query_2bis = SearchRequest {
            index_id_patterns: vec!["test-idx".to_string()],
            query_ast: "test2".to_string(),
            start_timestamp: Some(50),
            end_timestamp: Some(200),
            max_hits: 10,
            start_offset: 0,
            ..Default::default()
        };

        let result = LeafSearchResponse {
            failed_splits: Vec::new(),
            intermediate_aggregation_result: None,
            num_attempted_splits: 1,
            num_successful_splits: 1,
            num_hits: 1234,
            partial_hits: vec![PartialHit {
                doc_id: 1,
                segment_ord: 0,
                sort_value: Some(SortValue::U64(0).into()),
                sort_value2: None,
                split_id: "split_1".to_string(),
            }],
            resource_stats: Some(ResourceStats::default()),
        };

        // for split_1, 1 and 1bis cover different timestamp ranges
        cache.put(split_1.clone(), query_1.clone(), result.clone());
        assert!(cache.get(split_1.clone(), query_1.clone()).is_some());
        assert!(cache.get(split_1.clone(), query_1bis.clone()).is_none());

        // for split_2, both 1 and 1bis cover everything, so it should cache-hit
        cache.put(split_2.clone(), query_1.clone(), result.clone());
        assert!(cache.get(split_2.clone(), query_1).is_some());
        assert!(cache.get(split_2.clone(), query_1bis).is_some());

        // for split_1, both 1 and 1bis cover everything, so it should cache-hit
        cache.put(split_1.clone(), query_2.clone(), result.clone());
        assert!(cache.get(split_1.clone(), query_2.clone()).is_some());
        assert!(cache.get(split_1, query_2bis.clone()).is_some());

        // for split_2, 2 covers everything, but 2bis cover only a subrange
        cache.put(split_2.clone(), query_2.clone(), result.clone());
        assert!(cache.get(split_2.clone(), query_2.clone()).is_some());
        assert!(cache.get(split_2, query_2bis.clone()).is_none());

        // same for split_3, but we try caching the bounded request and query for the unbounded one
        cache.put(split_3.clone(), query_2bis.clone(), result);
        assert!(cache.get(split_3.clone(), query_2).is_none());
        assert!(cache.get(split_3, query_2bis).is_some());
    }
}


================================================
FILE: quickwit/quickwit-search/src/lib.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

//! This projects implements quickwit's search API.
#![warn(missing_docs)]
#![allow(clippy::bool_assert_comparison)]
#![deny(clippy::disallowed_methods)]

mod client;
mod cluster_client;
mod collector;
mod error;
mod fetch_docs;
mod find_trace_ids_collector;

mod invoker;
/// Leaf search operations.
pub mod leaf;
mod leaf_cache;
mod list_fields;
mod list_fields_cache;
mod list_terms;
mod metrics_trackers;
mod retry;
mod root;
mod scroll_context;
mod search_job_placer;
mod search_response_rest;
mod service;
pub(crate) mod top_k_collector;

mod metrics;
mod search_permit_provider;

#[cfg(test)]
mod tests;

pub use collector::QuickwitAggregations;
use metrics::SEARCH_METRICS;
use quickwit_common::thread_pool::ThreadPool;
use quickwit_common::tower::Pool;
use quickwit_doc_mapper::DocMapper;
use quickwit_proto::metastore::{
    ListIndexesMetadataRequest, ListSplitsRequest, MetastoreService, MetastoreServiceClient,
};
use tantivy::schema::NamedFieldDocument;

/// Refer to this as `crate::Result<T>`.
pub type Result<T> = std::result::Result<T, SearchError>;

use std::net::{Ipv4Addr, SocketAddr};
use std::sync::{Arc, OnceLock};

pub use find_trace_ids_collector::{FindTraceIdsCollector, Span};
use quickwit_config::SearcherConfig;
use quickwit_doc_mapper::tag_pruning::TagFilterAst;
use quickwit_metastore::{
    IndexMetadata, ListIndexesMetadataResponseExt, ListSplitsQuery, ListSplitsRequestExt,
    MetastoreServiceStreamSplitsExt, SplitMetadata, SplitState,
};
use quickwit_proto::search::{
    PartialHit, ResourceStats, SearchRequest, SearchResponse, SplitIdAndFooterOffsets,
};
use quickwit_proto::types::IndexUid;
use quickwit_storage::StorageResolver;
pub use service::SearcherContext;
use tantivy::DocAddress;

pub use crate::client::{
    SearchServiceClient, create_search_client_from_channel, create_search_client_from_grpc_addr,
};
pub use crate::cluster_client::ClusterClient;
pub use crate::error::{SearchError, parse_grpc_error};
use crate::fetch_docs::fetch_docs;
pub use crate::invoker::LambdaLeafSearchInvoker;
pub use crate::root::{
    IndexMetasForLeafSearch, SearchJob, ensure_all_indexes_found, jobs_to_leaf_request,
    root_search, search_plan,
};
pub use crate::search_job_placer::{Job, SearchJobPlacer};
pub use crate::search_response_rest::{
    AggregationResults, SearchPlanResponseRest, SearchResponseRest,
};
pub use crate::service::{MockSearchService, SearchService, SearchServiceImpl};

/// A pool of searcher clients identified by their gRPC socket address.
pub type SearcherPool = Pool<SocketAddr, SearchServiceClient>;

fn search_thread_pool() -> &'static ThreadPool {
    static SEARCH_THREAD_POOL: OnceLock<ThreadPool> = OnceLock::new();
    SEARCH_THREAD_POOL.get_or_init(|| ThreadPool::new("search", None))
}

/// GlobalDocAddress serves as a hit address.
#[derive(Clone, Eq, Debug, PartialEq, Hash, Ord, PartialOrd)]
pub struct GlobalDocAddress {
    /// Split containing the document
    pub split: String,
    /// Document address inside the split
    pub doc_addr: DocAddress,
}

/// An error happened converting a string to a GLobalDocAddress
#[derive(Debug, Clone, Copy)]
pub struct GlobalDocAddressParseError;

impl GlobalDocAddress {
    /// Extract a GlobalDocAddress from a PartialHit
    pub fn from_partial_hit(partial_hit: &PartialHit) -> Self {
        Self {
            split: partial_hit.split_id.to_string(),
            doc_addr: DocAddress {
                segment_ord: partial_hit.segment_ord,
                doc_id: partial_hit.doc_id,
            },
        }
    }
}

impl std::fmt::Display for GlobalDocAddress {
    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
        f.write_str(&self.split)?;
        write!(
            f,
            ":{:08x}:{:08x}",
            self.doc_addr.segment_ord, self.doc_addr.doc_id
        )
    }
}

impl std::str::FromStr for GlobalDocAddress {
    type Err = GlobalDocAddressParseError;

    fn from_str(s: &str) -> std::result::Result<Self, Self::Err> {
        let mut s_iter = s.splitn(3, ':');
        let split = s_iter.next().ok_or(GlobalDocAddressParseError)?.to_string();
        let segment = s_iter.next().ok_or(GlobalDocAddressParseError)?;
        let doc_id = s_iter.next().ok_or(GlobalDocAddressParseError)?;

        let segment_ord =
            u32::from_str_radix(segment, 16).map_err(|_| GlobalDocAddressParseError)?;
        let doc_id = u32::from_str_radix(doc_id, 16).map_err(|_| GlobalDocAddressParseError)?;

        Ok(GlobalDocAddress {
            split,
            doc_addr: DocAddress {
                segment_ord,
                doc_id,
            },
        })
    }
}

fn extract_split_and_footer_offsets(split_metadata: &SplitMetadata) -> SplitIdAndFooterOffsets {
    SplitIdAndFooterOffsets {
        split_id: split_metadata.split_id.clone(),
        split_footer_start: split_metadata.footer_offsets.start,
        split_footer_end: split_metadata.footer_offsets.end,
        timestamp_start: split_metadata
            .time_range
            .as_ref()
            .map(|time_range| *time_range.start()),
        timestamp_end: split_metadata
            .time_range
            .as_ref()
            .map(|time_range| *time_range.end()),
        num_docs: split_metadata.num_docs as u64,
    }
}

/// Get all splits of given index ids
pub async fn list_all_splits(
    index_uids: Vec<IndexUid>,
    metastore: &mut MetastoreServiceClient,
) -> crate::Result<Vec<SplitMetadata>> {
    list_relevant_splits(index_uids, None, None, None, metastore).await
}

/// Extract the list of relevant splits for a given request.
pub async fn list_relevant_splits(
    index_uids: Vec<IndexUid>,
    start_timestamp: Option<i64>,
    end_timestamp: Option<i64>,
    tags_filter_opt: Option<TagFilterAst>,
    metastore: &mut MetastoreServiceClient,
) -> crate::Result<Vec<SplitMetadata>> {
    let Some(mut query) = ListSplitsQuery::try_from_index_uids(index_uids) else {
        return Ok(Vec::new());
    };
    query = query.with_split_state(SplitState::Published);

    if let Some(start_ts) = start_timestamp {
        query = query.with_time_range_start_gte(start_ts);
    }
    if let Some(end_ts) = end_timestamp {
        query = query.with_time_range_end_lt(end_ts);
    }
    if let Some(tags_filter) = tags_filter_opt {
        query = query.with_tags_filter(tags_filter);
    }
    let list_splits_request = ListSplitsRequest::try_from_list_splits_query(&query)?;
    let splits_metadata: Vec<SplitMetadata> = metastore
        .list_splits(list_splits_request)
        .await?
        .collect_splits_metadata()
        .await?;
    Ok(splits_metadata)
}

/// Resolve index patterns and returns IndexMetadata for found indices.
/// Patterns follow the elastic search patterns.
pub async fn resolve_index_patterns(
    index_id_patterns: &[String],
    metastore: &mut MetastoreServiceClient,
) -> crate::Result<Vec<IndexMetadata>> {
    let list_indexes_metadata_request = if index_id_patterns.is_empty() {
        ListIndexesMetadataRequest::all()
    } else {
        ListIndexesMetadataRequest {
            index_id_patterns: index_id_patterns.to_vec(),
        }
    };

    // Get the index ids from the request
    let indexes_metadata = metastore
        .list_indexes_metadata(list_indexes_metadata_request)
        .await?
        .deserialize_indexes_metadata()
        .await?;
    ensure_all_indexes_found(&indexes_metadata, index_id_patterns)?;
    Ok(indexes_metadata)
}

/// Converts a Tantivy `NamedFieldDocument` into a json string using the
/// schema defined by the DocMapper.
///
/// We perform this conversion at leaf level only to avoid having
/// another intermediate json format between the leaves and the root.
fn convert_document_to_json_string(
    named_field_doc: NamedFieldDocument,
    doc_mapper: &DocMapper,
) -> anyhow::Result<String> {
    let NamedFieldDocument(named_field_doc_map) = named_field_doc;
    let doc_json_map = doc_mapper.doc_to_json(named_field_doc_map)?;
    let content_json =
        serde_json::to_string(&doc_json_map).expect("Json serialization should never fail.");
    Ok(content_json)
}

/// Starts a search node, aka a `searcher`.
pub async fn start_searcher_service(
    metastore: MetastoreServiceClient,
    storage_resolver: StorageResolver,
    search_job_placer: SearchJobPlacer,
    searcher_context: Arc<SearcherContext>,
) -> anyhow::Result<Arc<dyn SearchService>> {
    let cluster_client = ClusterClient::new(search_job_placer);
    let search_service = Arc::new(SearchServiceImpl::new(
        metastore,
        storage_resolver,
        cluster_client,
        searcher_context,
    ));
    Ok(search_service)
}

/// Performs a search on the current node.
/// See also `[distributed_search]`.
pub async fn single_node_search(
    search_request: SearchRequest,
    metastore: MetastoreServiceClient,
    storage_resolver: StorageResolver,
) -> crate::Result<SearchResponse> {
    let socket_addr = SocketAddr::new(Ipv4Addr::new(127, 0, 0, 1).into(), 7280u16);
    let searcher_pool = SearcherPool::default();
    let search_job_placer = SearchJobPlacer::new(searcher_pool.clone());
    let cluster_client = ClusterClient::new(search_job_placer);
    let searcher_config = SearcherConfig::default();
    let searcher_context = Arc::new(SearcherContext::new_without_invoker(searcher_config, None));
    let search_service = Arc::new(SearchServiceImpl::new(
        metastore.clone(),
        storage_resolver,
        cluster_client.clone(),
        searcher_context.clone(),
    ));
    let search_service_client =
        SearchServiceClient::from_service(search_service.clone(), socket_addr);
    searcher_pool.insert(socket_addr, search_service_client);
    root_search(
        &searcher_context,
        search_request,
        metastore,
        &cluster_client,
    )
    .await
}

/// Creates a tantivy Term from a &str.
#[cfg(any(test, feature = "testsuite"))]
#[macro_export]
macro_rules! encode_term_for_test {
    ($field:expr, $value:expr) => {{
        #[allow(deprecated)]
        {
            ::tantivy::schema::Term::from_field_text(
                ::tantivy::schema::Field::from_field_id($field),
                $value,
            )
            .serialized_term()
            .to_vec()
        }
    }};
    ($value:expr) => {
        encode_term_for_test!(0, $value)
    };
}

/// Creates a `SearcherPool` for tests from an iterator of socket addresses and mock search
/// services.
#[cfg(any(test, feature = "testsuite"))]
pub fn searcher_pool_for_test(
    iter: impl IntoIterator<Item = (&'static str, MockSearchService)>,
) -> SearcherPool {
    SearcherPool::from_iter(
        iter.into_iter()
            .map(|(grpc_addr_str, mock_search_service)| {
                let grpc_addr: SocketAddr = grpc_addr_str
                    .parse()
                    .expect("The gRPC address should be valid socket address.");
                let client =
                    SearchServiceClient::from_service(Arc::new(mock_search_service), grpc_addr);
                (grpc_addr, client)
            }),
    )
}

pub(crate) fn merge_resource_stats_it<'a>(
    stats_it: impl IntoIterator<Item = &'a Option<ResourceStats>>,
) -> Option<ResourceStats> {
    let mut acc_stats: Option<ResourceStats> = None;
    for new_stats in stats_it {
        merge_resource_stats(new_stats, &mut acc_stats);
    }
    acc_stats
}

fn merge_resource_stats(
    new_stats_opt: &Option<ResourceStats>,
    stat_accs_opt: &mut Option<ResourceStats>,
) {
    if let Some(new_stats) = new_stats_opt {
        if let Some(stat_accs) = stat_accs_opt {
            stat_accs.short_lived_cache_num_bytes += new_stats.short_lived_cache_num_bytes;
            stat_accs.split_num_docs += new_stats.split_num_docs;
            stat_accs.warmup_microsecs += new_stats.warmup_microsecs;
            stat_accs.cpu_thread_pool_wait_microsecs += new_stats.cpu_thread_pool_wait_microsecs;
            stat_accs.cpu_microsecs += new_stats.cpu_microsecs;
        } else {
            *stat_accs_opt = Some(*new_stats);
        }
    }
}
#[cfg(test)]
mod stats_merge_tests {
    use super::*;

    #[test]
    fn test_merge_resource_stats() {
        let mut acc_stats = None;

        merge_resource_stats(&None, &mut acc_stats);

        assert_eq!(acc_stats, None);

        let stats = Some(ResourceStats {
            short_lived_cache_num_bytes: 100,
            split_num_docs: 200,
            warmup_microsecs: 300,
            cpu_thread_pool_wait_microsecs: 400,
            cpu_microsecs: 500,
        });

        merge_resource_stats(&stats, &mut acc_stats);

        assert_eq!(acc_stats, stats);

        let new_stats = Some(ResourceStats {
            short_lived_cache_num_bytes: 50,
            split_num_docs: 100,
            warmup_microsecs: 150,
            cpu_thread_pool_wait_microsecs: 200,
            cpu_microsecs: 250,
        });

        merge_resource_stats(&new_stats, &mut acc_stats);

        let stats_plus_new_stats = Some(ResourceStats {
            short_lived_cache_num_bytes: 150,
            split_num_docs: 300,
            warmup_microsecs: 450,
            cpu_thread_pool_wait_microsecs: 600,
            cpu_microsecs: 750,
        });

        assert_eq!(acc_stats, stats_plus_new_stats);

        merge_resource_stats(&None, &mut acc_stats);

        assert_eq!(acc_stats, stats_plus_new_stats);
    }

    #[test]
    fn test_merge_resource_stats_it() {
        let merged_stats = merge_resource_stats_it(Vec::<&Option<ResourceStats>>::new());
        assert_eq!(merged_stats, None);

        let stats1 = Some(ResourceStats {
            short_lived_cache_num_bytes: 100,
            split_num_docs: 200,
            warmup_microsecs: 300,
            cpu_thread_pool_wait_microsecs: 400,
            cpu_microsecs: 500,
        });

        let merged_stats = merge_resource_stats_it(vec![&None, &stats1, &None]);

        assert_eq!(merged_stats, stats1);

        let stats2 = Some(ResourceStats {
            short_lived_cache_num_bytes: 50,
            split_num_docs: 100,
            warmup_microsecs: 150,
            cpu_thread_pool_wait_microsecs: 200,
            cpu_microsecs: 250,
        });

        let stats3 = Some(ResourceStats {
            short_lived_cache_num_bytes: 25,
            split_num_docs: 50,
            warmup_microsecs: 75,
            cpu_thread_pool_wait_microsecs: 100,
            cpu_microsecs: 125,
        });

        let merged_stats = merge_resource_stats_it(vec![&stats1, &stats2, &stats3]);

        assert_eq!(
            merged_stats,
            Some(ResourceStats {
                short_lived_cache_num_bytes: 175,
                split_num_docs: 350,
                warmup_microsecs: 525,
                cpu_thread_pool_wait_microsecs: 700,
                cpu_microsecs: 875,
            })
        );
    }
}


================================================
FILE: quickwit/quickwit-search/src/list_fields.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::{HashMap, HashSet};
use std::path::Path;
use std::str::FromStr;
use std::sync::{Arc, LazyLock};

use anyhow::Context;
use futures::future;
use futures::future::try_join_all;
use itertools::Itertools;
use quickwit_common::rate_limited_warn;
use quickwit_common::shared_consts::{FIELD_PRESENCE_FIELD_NAME, SPLIT_FIELDS_FILE_NAME};
use quickwit_common::uri::Uri;
use quickwit_config::build_doc_mapper;
use quickwit_doc_mapper::tag_pruning::extract_tags_from_query;
use quickwit_metastore::SplitMetadata;
use quickwit_proto::metastore::MetastoreServiceClient;
use quickwit_proto::search::{
    LeafListFieldsRequest, ListFields, ListFieldsEntryResponse, ListFieldsRequest,
    ListFieldsResponse, SplitIdAndFooterOffsets, deserialize_split_fields,
};
use quickwit_proto::types::{IndexId, IndexUid};
use quickwit_query::query_ast::QueryAst;
use quickwit_storage::Storage;

use crate::leaf::open_split_bundle;
use crate::search_job_placer::group_jobs_by_index_id;
use crate::service::SearcherContext;
use crate::{
    ClusterClient, SearchError, SearchJob, list_relevant_splits, resolve_index_patterns,
    search_thread_pool,
};

/// QW_FIELD_LIST_SIZE_LIMIT defines a hard limit on the number of fields that
/// can be returned (error otherwise).
///
/// Having many fields can happen when a user is creating fields dynamically in
/// a JSON type with random field names. This leads to huge memory consumption
/// when building the response. This is a workaround until a way is found to
/// prune the long tail of rare fields.
static FIELD_LIST_SIZE_LIMIT: LazyLock<usize> =
    LazyLock::new(|| quickwit_common::get_from_env("QW_FIELD_LIST_SIZE_LIMIT", 100_000, false));

const DYNAMIC_FIELD_PREFIX: &str = "_dynamic.";

/// Get the list of fields in the given split.
/// The returned list is guaranteed to be strictly sorted by (field_name, field_type).
async fn get_fields_from_split(
    searcher_context: &SearcherContext,
    index_id: IndexId,
    split_and_footer_offsets: &SplitIdAndFooterOffsets,
    index_storage: Arc<dyn Storage>,
) -> anyhow::Result<Vec<ListFieldsEntryResponse>> {
    if let Some(list_fields) = searcher_context
        .list_fields_cache
        .get(split_and_footer_offsets.clone())
    {
        return Ok(list_fields.fields);
    }
    let (_, split_bundle) =
        open_split_bundle(searcher_context, index_storage, split_and_footer_offsets).await?;

    let serialized_split_fields = split_bundle
        .get_all(Path::new(SPLIT_FIELDS_FILE_NAME))
        .await?;
    let serialized_split_fields_len = serialized_split_fields.len();
    let list_fields_proto =
        deserialize_split_fields(serialized_split_fields).with_context(|| {
            format!("could not read split fields (serialized len: {serialized_split_fields_len})",)
        })?;

    let mut list_fields = list_fields_proto.fields;
    list_fields.retain(|list_field_entry| list_field_entry.field_name != FIELD_PRESENCE_FIELD_NAME);

    for list_field_entry in list_fields.iter_mut() {
        list_field_entry.index_ids = vec![index_id.to_string()];

        if list_field_entry
            .field_name
            .starts_with(DYNAMIC_FIELD_PREFIX)
        {
            list_field_entry
                .field_name
                .replace_range(..DYNAMIC_FIELD_PREFIX.len(), "");
        }
    }

    // We sort our fields, as the removal of dynamic_field prefix could have caused them to be out
    // of order. We also defensively make sure there are no duplicates here.
    make_sorted_and_dedup(&mut list_fields);

    // Put result into cache
    searcher_context.list_fields_cache.put(
        split_and_footer_offsets.clone(),
        ListFields {
            fields: list_fields.clone(),
        },
    );

    Ok(list_fields)
}

fn field_order(
    left: &ListFieldsEntryResponse,
    right: &ListFieldsEntryResponse,
) -> std::cmp::Ordering {
    left.field_name
        .cmp(&right.field_name)
        .then_with(|| left.field_type.cmp(&right.field_type))
}

// Sorts and deduplicates the list of fields.
//
// If somehow we end up with duplicate fields, only the first one is kept,
// and we log a warning.
fn make_sorted_and_dedup(list_fields: &mut Vec<ListFieldsEntryResponse>) {
    list_fields.sort_unstable_by(field_order);

    // We defensively make sure there are no duplicates here.
    list_fields.dedup_by(|left, right| {
        if left.field_name == right.field_name && left.field_type == right.field_type {
            rate_limited_warn!(
                limit_per_min = 1,
                left.field_name,
                "duplicate fields found, please report"
            );
            true
        } else {
            false
        }
    });
}

/// `current_group` needs to contain at least one element.
/// The group needs to be of the same field name and type.
fn merge_same_field_group(
    current_group: &mut Vec<ListFieldsEntryResponse>,
) -> ListFieldsEntryResponse {
    // Make sure all fields have the same name and type in current_group
    assert!(!current_group.is_empty());
    assert!(
        current_group
            .windows(2)
            .all(|window| window[0].field_name == window[1].field_name
                && window[0].field_type == window[1].field_type)
    );

    if current_group.len() == 1 {
        return current_group
            .pop()
            .expect("`current_group` should not be empty");
    }
    let metadata = current_group
        .last()
        .expect("`current_group` should not be empty");
    let searchable = current_group.iter().any(|entry| entry.searchable);
    let aggregatable = current_group.iter().any(|entry| entry.aggregatable);
    let field_name = metadata.field_name.to_string();
    let field_type = metadata.field_type;
    let mut non_searchable_index_ids = if searchable {
        // We need to combine the non_searchable_index_ids + index_ids where searchable is set to
        // false (as they are all non_searchable)
        current_group
            .iter()
            .flat_map(|entry| {
                if !entry.searchable {
                    entry.index_ids.iter().cloned()
                } else {
                    entry.non_searchable_index_ids.iter().cloned()
                }
            })
            .collect()
    } else {
        // Not searchable => no need to list all the indices
        Vec::new()
    };
    non_searchable_index_ids.sort_unstable();
    non_searchable_index_ids.dedup();

    let mut non_aggregatable_index_ids = if aggregatable {
        // We need to combine the non_aggregatable_index_ids + index_ids where aggregatable is set
        // to false (as they are all non_aggregatable)
        current_group
            .iter()
            .flat_map(|entry| {
                if !entry.aggregatable {
                    entry.index_ids.iter().cloned()
                } else {
                    entry.non_aggregatable_index_ids.iter().cloned()
                }
            })
            .collect()
    } else {
        // Not aggregatable => no need to list all the indices
        Vec::new()
    };
    non_aggregatable_index_ids.sort_unstable();
    non_aggregatable_index_ids.dedup();
    let mut index_ids: Vec<String> = current_group
        .drain(..)
        .flat_map(|entry| entry.index_ids.into_iter())
        .collect();
    index_ids.sort_unstable();
    index_ids.dedup();

    ListFieldsEntryResponse {
        field_name,
        field_type,
        searchable,
        aggregatable,
        non_searchable_index_ids,
        non_aggregatable_index_ids,
        index_ids,
    }
}

/// Merge iterators of ListFieldsEntryResponse into a `Vec<ListFieldsEntryResponse>`.
///
/// The iterators need to be sorted by (field_name, fieldtype)
fn merge_leaf_list_fields(
    iterators: Vec<impl Iterator<Item = ListFieldsEntryResponse>>,
) -> crate::Result<Vec<ListFieldsEntryResponse>> {
    let merged = iterators
        .into_iter()
        .kmerge_by(|a, b| (&a.field_name, a.field_type) <= (&b.field_name, b.field_type));
    let mut responses = Vec::new();

    let mut current_group: Vec<ListFieldsEntryResponse> = Vec::new();
    // Build ListFieldsEntryResponse from current group
    let flush_group = |responses: &mut Vec<_>, current_group: &mut Vec<ListFieldsEntryResponse>| {
        let entry = merge_same_field_group(current_group);
        responses.push(entry);
        current_group.clear();
    };

    for entry in merged {
        if let Some(last) = current_group.last()
            && (last.field_name != entry.field_name || last.field_type != entry.field_type)
        {
            flush_group(&mut responses, &mut current_group);
        }
        if responses.len() >= *FIELD_LIST_SIZE_LIMIT {
            return Err(SearchError::Internal(format!(
                "list fields response exceeded {} fields",
                *FIELD_LIST_SIZE_LIMIT
            )));
        }
        current_group.push(entry);
    }
    if !current_group.is_empty() {
        flush_group(&mut responses, &mut current_group);
    }

    Ok(responses)
}

// Returns true if any of the patterns match the field name.
fn matches_any_pattern(field_name: &str, field_patterns: &[FieldPattern]) -> bool {
    field_patterns
        .iter()
        .any(|pattern| pattern.matches(field_name))
}

enum FieldPattern {
    Match { field: String },
    Wildcard { prefix: String, suffix: String },
}

impl FromStr for FieldPattern {
    type Err = crate::SearchError;

    fn from_str(field_pattern: &str) -> crate::Result<Self> {
        match field_pattern.find('*') {
            None => Ok(FieldPattern::Match {
                field: field_pattern.to_string(),
            }),
            Some(pos) => {
                let prefix = field_pattern[..pos].to_string();
                let suffix = field_pattern[pos + 1..].to_string();
                if suffix.contains("*") {
                    return Err(crate::SearchError::InvalidArgument(format!(
                        "invalid field pattern `{field_pattern}`: we only support one wildcard"
                    )));
                }
                Ok(FieldPattern::Wildcard { prefix, suffix })
            }
        }
    }
}

impl FieldPattern {
    pub fn matches(&self, field_name: &str) -> bool {
        match self {
            FieldPattern::Match { field } => field == field_name,
            FieldPattern::Wildcard { prefix, suffix } => {
                field_name.starts_with(prefix) && field_name.ends_with(suffix)
            }
        }
    }
}

/// `leaf` step of list fields.
///
/// Returns field metadata from the assigned splits.
pub async fn leaf_list_fields(
    index_id: IndexId,
    index_storage: Arc<dyn Storage>,
    searcher_context: &SearcherContext,
    split_ids: &[SplitIdAndFooterOffsets],
    field_patterns_str: &[String],
) -> crate::Result<ListFieldsResponse> {
    let field_patterns: Vec<FieldPattern> = field_patterns_str
        .iter()
        .map(|pattern_str| FieldPattern::from_str(pattern_str))
        .collect::<crate::Result<_>>()?;

    // If no splits, return empty response
    if split_ids.is_empty() {
        return Ok(ListFieldsResponse { fields: Vec::new() });
    }

    // Get fields from all splits
    let single_split_list_fields_futures: Vec<_> = split_ids
        .iter()
        .map(|split_id| {
            get_fields_from_split(
                searcher_context,
                index_id.to_string(),
                split_id,
                index_storage.clone(),
            )
        })
        .collect();

    let mut single_split_list_fields_vec: Vec<Vec<ListFieldsEntryResponse>> =
        future::try_join_all(single_split_list_fields_futures).await?;

    let fields = search_thread_pool()
        .run_cpu_intensive(move || {
            for single_split_list_fields in &mut single_split_list_fields_vec {
                // This contract is enforced on a different node, etc. so we defensively check that
                // the fields are sorted and deduplicated.
                if !single_split_list_fields.is_sorted_by(|left, right| {
                    // Checking on less ensure that this is both sorted AND that there are no
                    // duplicates
                    field_order(left, right) == std::cmp::Ordering::Less
                }) {
                    rate_limited_warn!(
                        limit_per_min = 1,
                        "contract breach: fields returned by a leaf are not strictly sorted! \
                         please report"
                    );
                    make_sorted_and_dedup(single_split_list_fields);
                }
            }

            let filtered_list_fields_sorted_iters: Vec<_> = single_split_list_fields_vec
                .into_iter()
                .map(|list_fields_sorted| {
                    list_fields_sorted.into_iter().filter(|field| {
                        if field_patterns.is_empty() {
                            true
                        } else {
                            matches_any_pattern(&field.field_name, &field_patterns)
                        }
                    })
                })
                .collect();
            merge_leaf_list_fields(filtered_list_fields_sorted_iters)
        })
        .await
        .context("failed to merge single split list fields")??;
    Ok(ListFieldsResponse { fields })
}

/// Index metas needed for executing a leaf list fields request.
#[derive(Clone, Debug)]
pub struct IndexMetasForLeafSearch {
    /// Index id.
    pub index_id: IndexId,
    /// Index URI.
    pub index_uri: Uri,
}

/// Performs a distributed list fields request.
/// 1. Sends leaf requests over gRPC to multiple leaf nodes.
/// 2. Merges the search results.
/// 3. Builds the response and returns.
pub async fn root_list_fields(
    list_fields_req: ListFieldsRequest,
    cluster_client: &ClusterClient,
    mut metastore: MetastoreServiceClient,
) -> crate::Result<ListFieldsResponse> {
    let indexes_metadata =
        resolve_index_patterns(&list_fields_req.index_id_patterns[..], &mut metastore).await?;
    // The request contains a wildcard, but couldn't find any index.
    if indexes_metadata.is_empty() {
        return Ok(ListFieldsResponse { fields: Vec::new() });
    }

    // Build index metadata map and extract timestamp field for time range refinement
    let mut index_uid_to_index_meta: HashMap<IndexUid, IndexMetasForLeafSearch> = HashMap::new();
    let mut index_uids: Vec<IndexUid> = Vec::new();
    let mut timestamp_field_opt: Option<String> = None;

    for index_metadata in indexes_metadata {
        // Extract timestamp field for time range refinement (use first index's field)
        if timestamp_field_opt.is_none()
            && list_fields_req.query_ast.is_some()
            && let Ok(doc_mapper) = build_doc_mapper(
                &index_metadata.index_config.doc_mapping,
                &index_metadata.index_config.search_settings,
            )
        {
            timestamp_field_opt = doc_mapper.timestamp_field_name().map(|s| s.to_string());
        }

        let index_metadata_for_leaf_search = IndexMetasForLeafSearch {
            index_uri: index_metadata.index_uri().clone(),
            index_id: index_metadata.index_config.index_id.to_string(),
        };

        index_uids.push(index_metadata.index_uid.clone());
        index_uid_to_index_meta.insert(
            index_metadata.index_uid.clone(),
            index_metadata_for_leaf_search,
        );
    }

    // Extract tags and refine time range from query_ast for split pruning
    let mut start_timestamp = list_fields_req.start_timestamp;
    let mut end_timestamp = list_fields_req.end_timestamp;
    let tags_filter_opt = if let Some(ref query_ast_json) = list_fields_req.query_ast {
        let query_ast: QueryAst = serde_json::from_str(query_ast_json)
            .map_err(|err| SearchError::InvalidQuery(err.to_string()))?;

        // Refine time range from query AST if timestamp field is available
        if let Some(ref timestamp_field) = timestamp_field_opt {
            crate::root::refine_start_end_timestamp_from_ast(
                &query_ast,
                timestamp_field,
                &mut start_timestamp,
                &mut end_timestamp,
            );
        }

        extract_tags_from_query(query_ast)
    } else {
        None
    };

    let split_metadatas: Vec<SplitMetadata> = list_relevant_splits(
        index_uids,
        start_timestamp,
        end_timestamp,
        tags_filter_opt,
        &mut metastore,
    )
    .await?;

    // Build requests for each index id
    let jobs: Vec<SearchJob> = split_metadatas.iter().map(SearchJob::from).collect();
    let assigned_leaf_search_jobs = cluster_client
        .search_job_placer
        .assign_jobs(jobs, &HashSet::default())
        .await?;
    let mut leaf_request_tasks = Vec::new();
    // For each node, forward to a node with an affinity for that index id.
    for (client, client_jobs) in assigned_leaf_search_jobs {
        let leaf_requests =
            jobs_to_leaf_requests(&list_fields_req, &index_uid_to_index_meta, client_jobs)?;
        for leaf_request in leaf_requests {
            leaf_request_tasks.push(cluster_client.leaf_list_fields(leaf_request, client.clone()));
        }
    }
    let leaf_list_fields_protos: Vec<ListFieldsResponse> = try_join_all(leaf_request_tasks).await?;
    let fields = search_thread_pool()
        .run_cpu_intensive(move || {
            let leaf_list_fields = leaf_list_fields_protos
                .into_iter()
                .map(|leaf_list_fields_proto| leaf_list_fields_proto.fields.into_iter())
                .collect();
            merge_leaf_list_fields(leaf_list_fields)
        })
        .await
        .context("failed to merge leaf list fields responses")??;

    Ok(ListFieldsResponse { fields })
}

/// Builds a list of [`LeafListFieldsRequest`], one per index, from a list of [`SearchJob`].
pub fn jobs_to_leaf_requests(
    request: &ListFieldsRequest,
    index_uid_to_id: &HashMap<IndexUid, IndexMetasForLeafSearch>,
    jobs: Vec<SearchJob>,
) -> crate::Result<Vec<LeafListFieldsRequest>> {
    let search_request_for_leaf = request.clone();
    let mut leaf_search_requests = Vec::new();
    // Group jobs by index uid.
    group_jobs_by_index_id(jobs, |job_group| {
        let index_uid = &job_group[0].index_uid;
        let index_meta = index_uid_to_id.get(index_uid).ok_or_else(|| {
            SearchError::Internal(format!(
                "received list fields job for an unknown index {index_uid}. it should never happen"
            ))
        })?;

        let leaf_search_request = LeafListFieldsRequest {
            index_id: index_meta.index_id.to_string(),
            index_uri: index_meta.index_uri.to_string(),
            fields: search_request_for_leaf.fields.clone(),
            split_offsets: job_group.into_iter().map(|job| job.offsets).collect(),
        };
        leaf_search_requests.push(leaf_search_request);
        Ok(())
    })?;

    Ok(leaf_search_requests)
}

#[cfg(test)]
mod tests {
    use quickwit_proto::search::{ListFieldType, ListFieldsEntryResponse};

    use super::*;

    #[test]
    fn merge_leaf_list_fields_identical_test() {
        let entry1 = ListFieldsEntryResponse {
            field_name: "field1".to_string(),
            field_type: ListFieldType::Str as i32,
            searchable: true,
            aggregatable: true,
            non_searchable_index_ids: Vec::new(),
            non_aggregatable_index_ids: Vec::new(),
            index_ids: vec!["index1".to_string()],
        };
        let entry2 = ListFieldsEntryResponse {
            field_name: "field1".to_string(),
            field_type: ListFieldType::Str as i32,
            searchable: true,
            aggregatable: true,
            non_searchable_index_ids: Vec::new(),
            non_aggregatable_index_ids: Vec::new(),
            index_ids: vec!["index1".to_string()],
        };
        let resp = merge_leaf_list_fields(vec![
            vec![entry1.clone()].into_iter(),
            vec![entry2.clone()].into_iter(),
        ])
        .unwrap();
        assert_eq!(resp, vec![entry1]);
    }
    #[test]
    fn merge_leaf_list_fields_different_test() {
        let entry1 = ListFieldsEntryResponse {
            field_name: "field1".to_string(),
            field_type: ListFieldType::Str as i32,
            searchable: true,
            aggregatable: true,
            non_searchable_index_ids: Vec::new(),
            non_aggregatable_index_ids: Vec::new(),
            index_ids: vec!["index1".to_string()],
        };
        let entry2 = ListFieldsEntryResponse {
            field_name: "field2".to_string(),
            field_type: ListFieldType::Str as i32,
            searchable: true,
            aggregatable: true,
            non_searchable_index_ids: Vec::new(),
            non_aggregatable_index_ids: Vec::new(),
            index_ids: vec!["index1".to_string()],
        };
        let resp = merge_leaf_list_fields(vec![
            vec![entry1.clone()].into_iter(),
            vec![entry2.clone()].into_iter(),
        ])
        .unwrap();
        assert_eq!(resp, vec![entry1, entry2]);
    }
    #[test]
    fn merge_leaf_list_fields_non_searchable_test() {
        let entry1 = ListFieldsEntryResponse {
            field_name: "field1".to_string(),
            field_type: ListFieldType::Str as i32,
            searchable: true,
            aggregatable: true,
            non_searchable_index_ids: Vec::new(),
            non_aggregatable_index_ids: Vec::new(),
            index_ids: vec!["index1".to_string()],
        };
        let entry2 = ListFieldsEntryResponse {
            field_name: "field1".to_string(),
            field_type: ListFieldType::Str as i32,
            searchable: false,
            aggregatable: true,
            non_searchable_index_ids: Vec::new(),
            non_aggregatable_index_ids: Vec::new(),
            index_ids: vec!["index2".to_string()],
        };
        let resp = merge_leaf_list_fields(vec![
            vec![entry1.clone()].into_iter(),
            vec![entry2.clone()].into_iter(),
        ])
        .unwrap();
        let expected = ListFieldsEntryResponse {
            field_name: "field1".to_string(),
            field_type: ListFieldType::Str as i32,
            searchable: true,
            aggregatable: true,
            non_searchable_index_ids: vec!["index2".to_string()],
            non_aggregatable_index_ids: Vec::new(),
            index_ids: vec!["index1".to_string(), "index2".to_string()],
        };
        assert_eq!(resp, vec![expected]);
    }
    #[test]
    fn merge_leaf_list_fields_non_aggregatable_test() {
        let entry1 = ListFieldsEntryResponse {
            field_name: "field1".to_string(),
            field_type: ListFieldType::Str as i32,
            searchable: true,
            aggregatable: true,
            non_searchable_index_ids: Vec::new(),
            non_aggregatable_index_ids: Vec::new(),
            index_ids: vec!["index1".to_string()],
        };
        let entry2 = ListFieldsEntryResponse {
            field_name: "field1".to_string(),
            field_type: ListFieldType::Str as i32,
            searchable: true,
            aggregatable: false,
            non_searchable_index_ids: Vec::new(),
            non_aggregatable_index_ids: Vec::new(),
            index_ids: vec!["index2".to_string()],
        };
        let resp = merge_leaf_list_fields(vec![
            vec![entry1.clone()].into_iter(),
            vec![entry2.clone()].into_iter(),
        ])
        .unwrap();
        let expected = ListFieldsEntryResponse {
            field_name: "field1".to_string(),
            field_type: ListFieldType::Str as i32,
            searchable: true,
            aggregatable: true,
            non_searchable_index_ids: Vec::new(),
            non_aggregatable_index_ids: vec!["index2".to_string()],
            index_ids: vec!["index1".to_string(), "index2".to_string()],
        };
        assert_eq!(resp, vec![expected]);
    }
    #[test]
    fn merge_leaf_list_fields_mixed_types1() {
        let entry1 = ListFieldsEntryResponse {
            field_name: "field1".to_string(),
            field_type: ListFieldType::Str as i32,
            searchable: true,
            aggregatable: true,
            non_searchable_index_ids: Vec::new(),
            non_aggregatable_index_ids: Vec::new(),
            index_ids: vec!["index1".to_string()],
        };
        let entry2 = ListFieldsEntryResponse {
            field_name: "field1".to_string(),
            field_type: ListFieldType::Str as i32,
            searchable: true,
            aggregatable: true,
            non_searchable_index_ids: Vec::new(),
            non_aggregatable_index_ids: Vec::new(),
            index_ids: vec!["index1".to_string()],
        };
        let entry3 = ListFieldsEntryResponse {
            field_name: "field1".to_string(),
            field_type: ListFieldType::U64 as i32,
            searchable: true,
            aggregatable: true,
            non_searchable_index_ids: Vec::new(),
            non_aggregatable_index_ids: Vec::new(),
            index_ids: vec!["index1".to_string()],
        };
        let resp = merge_leaf_list_fields(vec![
            vec![entry1.clone(), entry2.clone()].into_iter(),
            vec![entry3.clone()].into_iter(),
        ])
        .unwrap();
        assert_eq!(resp, vec![entry1.clone(), entry3.clone()]);
    }
    #[test]
    fn merge_leaf_list_fields_mixed_types2() {
        let entry1 = ListFieldsEntryResponse {
            field_name: "field1".to_string(),
            field_type: ListFieldType::Str as i32,
            searchable: true,
            aggregatable: true,
            non_searchable_index_ids: Vec::new(),
            non_aggregatable_index_ids: Vec::new(),
            index_ids: vec!["index1".to_string()],
        };
        let entry2 = ListFieldsEntryResponse {
            field_name: "field1".to_string(),
            field_type: ListFieldType::Str as i32,
            searchable: true,
            aggregatable: true,
            non_searchable_index_ids: Vec::new(),
            non_aggregatable_index_ids: Vec::new(),
            index_ids: vec!["index1".to_string()],
        };
        let entry3 = ListFieldsEntryResponse {
            field_name: "field1".to_string(),
            field_type: ListFieldType::U64 as i32,
            searchable: true,
            aggregatable: true,
            non_searchable_index_ids: Vec::new(),
            non_aggregatable_index_ids: Vec::new(),
            index_ids: vec!["index1".to_string()],
        };
        let resp = merge_leaf_list_fields(vec![
            vec![entry1.clone(), entry3.clone()].into_iter(),
            vec![entry2.clone()].into_iter(),
        ])
        .unwrap();
        assert_eq!(resp, vec![entry1.clone(), entry3.clone()]);
    }
    #[test]
    fn merge_leaf_list_fields_multiple_field_names() {
        let entry1 = ListFieldsEntryResponse {
            field_name: "field1".to_string(),
            field_type: ListFieldType::Str as i32,
            searchable: true,
            aggregatable: true,
            non_searchable_index_ids: Vec::new(),
            non_aggregatable_index_ids: Vec::new(),
            index_ids: vec!["index1".to_string()],
        };
        let entry2 = ListFieldsEntryResponse {
            field_name: "field1".to_string(),
            field_type: ListFieldType::Str as i32,
            searchable: true,
            aggregatable: true,
            non_searchable_index_ids: Vec::new(),
            non_aggregatable_index_ids: Vec::new(),
            index_ids: vec!["index1".to_string()],
        };
        let entry3 = ListFieldsEntryResponse {
            field_name: "field2".to_string(),
            field_type: ListFieldType::Str as i32,
            searchable: true,
            aggregatable: true,
            non_searchable_index_ids: Vec::new(),
            non_aggregatable_index_ids: Vec::new(),
            index_ids: vec!["index1".to_string()],
        };
        let resp = merge_leaf_list_fields(vec![
            vec![entry1.clone(), entry3.clone()].into_iter(),
            vec![entry2.clone()].into_iter(),
        ])
        .unwrap();
        assert_eq!(resp, vec![entry1.clone(), entry3.clone()]);
    }
    #[test]
    fn merge_leaf_list_fields_non_aggregatable_list_test() {
        let entry1 = ListFieldsEntryResponse {
            field_name: "field1".to_string(),
            field_type: ListFieldType::Str as i32,
            searchable: true,
            aggregatable: true,
            non_searchable_index_ids: vec!["index1".to_string()],
            non_aggregatable_index_ids: Vec::new(),
            index_ids: vec![
                "index1".to_string(),
                "index2".to_string(),
                "index3".to_string(),
            ],
        };
        let entry2 = ListFieldsEntryResponse {
            field_name: "field1".to_string(),
            field_type: ListFieldType::Str as i32,
            searchable: false,
            aggregatable: true,
            non_searchable_index_ids: Vec::new(),
            non_aggregatable_index_ids: Vec::new(),
            index_ids: vec!["index4".to_string()],
        };
        let resp = merge_leaf_list_fields(vec![
            vec![entry1.clone()].into_iter(),
            vec![entry2.clone()].into_iter(),
        ])
        .unwrap();
        let expected = ListFieldsEntryResponse {
            field_name: "field1".to_string(),
            field_type: ListFieldType::Str as i32,
            searchable: true,
            aggregatable: true,
            non_searchable_index_ids: vec!["index1".to_string(), "index4".to_string()],
            non_aggregatable_index_ids: Vec::new(),
            index_ids: vec![
                "index1".to_string(),
                "index2".to_string(),
                "index3".to_string(),
                "index4".to_string(),
            ],
        };
        assert_eq!(resp, vec![expected]);
    }

    #[test]
    fn test_field_pattern() {
        let prefix_pattern = FieldPattern::from_str("toto*").unwrap();
        assert!(!prefix_pattern.matches(""));
        assert!(!prefix_pattern.matches("tot3"));
        assert!(!prefix_pattern.matches("atoto"));
        assert!(prefix_pattern.matches("toto"));
        assert!(prefix_pattern.matches("totowhatever"));

        let suffix_pattern = FieldPattern::from_str("*toto").unwrap();
        assert!(!suffix_pattern.matches(""));
        assert!(!suffix_pattern.matches("3tot"));
        assert!(!suffix_pattern.matches("totoa"));
        assert!(suffix_pattern.matches("toto"));
        assert!(suffix_pattern.matches("whatevertoto"));

        let inner_pattern = FieldPattern::from_str("to*ti").unwrap();
        assert!(!inner_pattern.matches(""));
        assert!(!inner_pattern.matches("tot"));
        assert!(!inner_pattern.matches("totia"));
        assert!(!inner_pattern.matches("atoti"));
        assert!(inner_pattern.matches("toti"));
        assert!(!inner_pattern.matches("tito"));
        assert!(inner_pattern.matches("towhateverti"));

        assert!(FieldPattern::from_str("to**").is_err());
    }
}


================================================
FILE: quickwit/quickwit-search/src/list_fields_cache.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use quickwit_config::CacheConfig;
use quickwit_proto::search::{
    ListFields, SplitIdAndFooterOffsets, deserialize_split_fields, serialize_split_fields,
};
use quickwit_proto::types::SplitId;
use quickwit_storage::{MemorySizedCache, OwnedBytes};

/// A cache to memoize `leaf_search_single_split` results.
pub struct ListFieldsCache {
    content: MemorySizedCache<CacheKey>,
}

// TODO For now this simply caches the whole ListFieldsEntryResponse. We could
// be more clever and cache aggregates instead.
impl ListFieldsCache {
    pub fn new(config: &CacheConfig) -> ListFieldsCache {
        ListFieldsCache {
            content: MemorySizedCache::from_config(
                config,
                &quickwit_storage::STORAGE_METRICS.partial_request_cache,
            ),
        }
    }
    pub fn get(&self, split_info: SplitIdAndFooterOffsets) -> Option<ListFields> {
        let key = CacheKey::from_split_meta(split_info);
        let encoded_result = self.content.get(&key)?;
        // this should never fail
        deserialize_split_fields(encoded_result).ok()
    }

    pub fn put(&self, split_info: SplitIdAndFooterOffsets, list_fields: ListFields) {
        let key = CacheKey::from_split_meta(split_info);

        let encoded_result = serialize_split_fields(list_fields);
        self.content.put(key, OwnedBytes::new(encoded_result));
    }
}

/// A key inside a [`ListFieldsCache`].
#[derive(Debug, Hash, Clone, PartialEq, Eq)]
struct CacheKey {
    /// The split this entry refers to
    split_id: SplitId,
}

impl CacheKey {
    fn from_split_meta(split_info: SplitIdAndFooterOffsets) -> Self {
        CacheKey {
            split_id: split_info.split_id,
        }
    }
}

#[cfg(test)]
mod tests {
    use bytesize::ByteSize;
    use quickwit_proto::search::{
        ListFieldType, ListFields, ListFieldsEntryResponse, SplitIdAndFooterOffsets,
    };

    use super::ListFieldsCache;

    #[test]
    fn test_list_fields_cache() {
        let cache = ListFieldsCache::new(&ByteSize::mb(64).into());

        let split_1 = SplitIdAndFooterOffsets {
            split_id: "split_1".to_string(),
            split_footer_start: 0,
            split_footer_end: 100,
            timestamp_start: None,
            timestamp_end: None,
            num_docs: 0,
        };

        let split_2 = SplitIdAndFooterOffsets {
            split_id: "split_2".to_string(),
            split_footer_start: 0,
            split_footer_end: 100,
            timestamp_start: None,
            timestamp_end: None,
            num_docs: 0,
        };

        let result = ListFieldsEntryResponse {
            field_name: "field1".to_string(),
            field_type: ListFieldType::Str as i32,
            searchable: false,
            aggregatable: true,
            non_searchable_index_ids: Vec::new(),
            non_aggregatable_index_ids: Vec::new(),
            index_ids: vec!["index4".to_string()],
        };

        assert!(cache.get(split_1.clone()).is_none());

        let list_fields = ListFields {
            fields: vec![result.clone()],
        };

        cache.put(split_1.clone(), list_fields.clone());
        assert_eq!(cache.get(split_1.clone()).unwrap(), list_fields);
        assert!(cache.get(split_2).is_none());
    }
}


================================================
FILE: quickwit/quickwit-search/src/list_terms.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::{HashMap, HashSet};
use std::ops::Bound;
use std::sync::Arc;

use anyhow::Context;
use bytesize::ByteSize;
use futures::future::try_join_all;
use itertools::{Either, Itertools};
use quickwit_common::pretty::PrettySample;
use quickwit_config::build_doc_mapper;
use quickwit_metastore::{ListSplitsRequestExt, MetastoreServiceStreamSplitsExt, SplitMetadata};
use quickwit_proto::metastore::{ListSplitsRequest, MetastoreService, MetastoreServiceClient};
use quickwit_proto::search::{
    LeafListTermsRequest, LeafListTermsResponse, ListTermsRequest, ListTermsResponse,
    SplitIdAndFooterOffsets, SplitSearchError,
};
use quickwit_proto::types::IndexUid;
use quickwit_storage::{ByteRangeCache, Storage};
use tantivy::schema::{Field, FieldType};
use tantivy::{ReloadPolicy, Term};
use tracing::{debug, error, info, instrument};

use crate::leaf::open_index_with_caches;
use crate::search_job_placer::group_jobs_by_index_id;
use crate::search_permit_provider::compute_initial_memory_allocation;
use crate::{ClusterClient, SearchError, SearchJob, SearcherContext, resolve_index_patterns};

/// Performs a distributed list terms.
/// 1. Sends leaf requests over gRPC to multiple leaf nodes.
/// 2. Merges the search results.
/// 3. Builds the response and returns.
/// this is much simpler than `root_search` as it doesn't need to get actual docs.
#[instrument(skip(list_terms_request, cluster_client, metastore))]
pub async fn root_list_terms(
    list_terms_request: &ListTermsRequest,
    mut metastore: MetastoreServiceClient,
    cluster_client: &ClusterClient,
) -> crate::Result<ListTermsResponse> {
    let start_instant = tokio::time::Instant::now();
    let indexes_metadata =
        resolve_index_patterns(&list_terms_request.index_id_patterns, &mut metastore).await?;
    // The request contains a wildcard, but couldn't find any index.
    if indexes_metadata.is_empty() {
        return Ok(ListTermsResponse {
            num_hits: 0,
            terms: Vec::new(),
            elapsed_time_micros: 0,
            errors: Vec::new(),
        });
    }

    for index_metadata in indexes_metadata.iter() {
        let index_config = &index_metadata.index_config;
        let doc_mapper = build_doc_mapper(&index_config.doc_mapping, &index_config.search_settings)
            .map_err(|err| {
                SearchError::Internal(format!("failed to build doc mapper. cause: {err}"))
            })?;
        let schema = doc_mapper.schema();
        let field = schema.get_field(&list_terms_request.field).map_err(|_| {
            SearchError::InvalidQuery(format!(
                "failed to list terms in `{}`, field doesn't exist",
                list_terms_request.field
            ))
        })?;
        let field_entry = schema.get_field_entry(field);
        if !field_entry.is_indexed() {
            return Err(SearchError::InvalidQuery(
                "trying to list terms on field which isn't indexed".to_string(),
            ));
        }
    }
    let index_uids: Vec<IndexUid> = indexes_metadata
        .iter()
        .map(|index_metadata| index_metadata.index_uid.clone())
        .collect();

    let Some(mut query) = quickwit_metastore::ListSplitsQuery::try_from_index_uids(index_uids)
    else {
        return Ok(ListTermsResponse::default());
    };
    query = query.with_split_state(quickwit_metastore::SplitState::Published);

    if let Some(start_ts) = list_terms_request.start_timestamp {
        query = query.with_time_range_start_gte(start_ts);
    }

    if let Some(end_ts) = list_terms_request.end_timestamp {
        query = query.with_time_range_end_lt(end_ts);
    }
    let index_uid_to_index_uri: HashMap<IndexUid, String> = indexes_metadata
        .iter()
        .map(|index_metadata| {
            (
                index_metadata.index_uid.clone(),
                index_metadata.index_uri().to_string(),
            )
        })
        .collect();
    let list_splits_request = ListSplitsRequest::try_from_list_splits_query(&query)?;
    let split_metadatas: Vec<SplitMetadata> = metastore
        .clone()
        .list_splits(list_splits_request)
        .await?
        .collect_splits_metadata()
        .await?;

    let jobs: Vec<SearchJob> = split_metadatas.iter().map(SearchJob::from).collect();
    let assigned_leaf_search_jobs = cluster_client
        .search_job_placer
        .assign_jobs(jobs, &HashSet::default())
        .await?;
    let mut leaf_request_tasks = Vec::new();
    // For each node, forward to a node with an affinity for that index id.
    for (client, client_jobs) in assigned_leaf_search_jobs {
        let leaf_requests =
            jobs_to_leaf_requests(list_terms_request, &index_uid_to_index_uri, client_jobs)?;
        for leaf_request in leaf_requests {
            leaf_request_tasks.push(cluster_client.leaf_list_terms(leaf_request, client.clone()));
        }
    }
    let leaf_search_responses: Vec<LeafListTermsResponse> =
        try_join_all(leaf_request_tasks).await?;

    let failed_splits: Vec<_> = leaf_search_responses
        .iter()
        .flat_map(|leaf_search_response| &leaf_search_response.failed_splits)
        .collect();

    if !failed_splits.is_empty() {
        error!(failed_splits = ?failed_splits, "leaf search response contains at least one failed split");
        let errors: String = failed_splits
            .iter()
            .map(|splits| splits.to_string())
            .collect::<Vec<_>>()
            .join(", ");
        return Err(SearchError::Internal(errors));
    }

    // Merging is a cpu-bound task, but probably fast enough to not require
    // spawning it on a blocking thread.
    let merged_iter = leaf_search_responses
        .into_iter()
        .map(|leaf_search_response| leaf_search_response.terms)
        .kmerge()
        .dedup();
    let leaf_list_terms_response: Vec<Vec<u8>> = if let Some(limit) = list_terms_request.max_hits {
        merged_iter.take(limit as usize).collect()
    } else {
        merged_iter.collect()
    };

    debug!(
        leaf_list_terms_response_count = leaf_list_terms_response.len(),
        "Merged leaf search response."
    );

    let elapsed = start_instant.elapsed();

    Ok(ListTermsResponse {
        num_hits: leaf_list_terms_response.len() as u64,
        terms: leaf_list_terms_response,
        elapsed_time_micros: elapsed.as_micros() as u64,
        errors: Vec::new(),
    })
}

/// Builds a list of [`LeafListTermsRequest`], one per index, from a list of [`SearchJob`].
pub fn jobs_to_leaf_requests(
    request: &ListTermsRequest,
    index_uid_to_uri: &HashMap<IndexUid, String>,
    jobs: Vec<SearchJob>,
) -> crate::Result<Vec<LeafListTermsRequest>> {
    let search_request_for_leaf = request.clone();
    let mut leaf_search_requests = Vec::new();
    group_jobs_by_index_id(jobs, |job_group| {
        let index_uid = &job_group[0].index_uid;
        let index_uri = index_uid_to_uri.get(index_uid).ok_or_else(|| {
            SearchError::Internal(format!(
                "received list fields job for an unknown index {index_uid}. it should never happen"
            ))
        })?;

        let leaf_search_request = LeafListTermsRequest {
            list_terms_request: Some(search_request_for_leaf.clone()),
            index_uri: index_uri.to_string(),
            split_offsets: job_group.into_iter().map(|job| job.offsets).collect(),
        };
        leaf_search_requests.push(leaf_search_request);
        Ok(())
    })?;
    Ok(leaf_search_requests)
}

/// Apply a leaf list terms on a single split.
#[instrument(skip_all, fields(split_id = split.split_id))]
#[allow(deprecated)]
async fn leaf_list_terms_single_split(
    searcher_context: &SearcherContext,
    search_request: &ListTermsRequest,
    storage: Arc<dyn Storage>,
    split: SplitIdAndFooterOffsets,
) -> crate::Result<LeafListTermsResponse> {
    let cache =
        ByteRangeCache::with_infinite_capacity(&quickwit_storage::STORAGE_METRICS.shortlived_cache);
    let (index, _) =
        open_index_with_caches(searcher_context, storage, &split, None, Some(cache)).await?;
    let split_schema = index.schema();
    let reader = index
        .reader_builder()
        .reload_policy(ReloadPolicy::Manual)
        .try_into()?;
    let searcher = reader.searcher();

    let field = split_schema
        .get_field(&search_request.field)
        .with_context(|| {
            format!(
                "couldn't get field named {:?} from schema to list terms",
                search_request.field
            )
        })?;

    let field_type = split_schema.get_field_entry(field).field_type();
    let start_term: Option<Term> = search_request
        .start_key
        .as_ref()
        .map(|data| term_from_data(field, field_type, data));
    let end_term: Option<Term> = search_request
        .end_key
        .as_ref()
        .map(|data| term_from_data(field, field_type, data));

    let mut segment_results = Vec::new();
    for segment_reader in searcher.segment_readers() {
        let inverted_index = segment_reader.inverted_index(field)?.clone();
        let dict = inverted_index.terms();
        dict.file_slice_for_range(
            (
                start_term
                    .as_ref()
                    .map(Term::serialized_value_bytes)
                    .map(Bound::Included)
                    .unwrap_or(Bound::Unbounded),
                end_term
                    .as_ref()
                    .map(Term::serialized_value_bytes)
                    .map(Bound::Excluded)
                    .unwrap_or(Bound::Unbounded),
            ),
            search_request.max_hits,
        )
        .read_bytes_async()
        .await
        .with_context(|| "failed to load sstable range")?;

        let mut range = dict.range();
        if let Some(limit) = search_request.max_hits {
            range = range.limit(limit);
        }
        if let Some(start_term) = &start_term {
            range = range.ge(start_term.serialized_value_bytes())
        }
        if let Some(end_term) = &end_term {
            range = range.lt(end_term.serialized_value_bytes())
        }
        let mut stream = range
            .into_stream()
            .with_context(|| "failed to create stream over sstable")?;
        let mut segment_result: Vec<Vec<u8>> =
            Vec::with_capacity(search_request.max_hits.unwrap_or(0) as usize);
        while stream.advance() {
            segment_result.push(term_to_data(field, field_type, stream.key()));
        }
        segment_results.push(segment_result);
    }

    let merged_iter = segment_results.into_iter().kmerge().dedup();
    let merged_results: Vec<Vec<u8>> = if let Some(limit) = search_request.max_hits {
        merged_iter.take(limit as usize).collect()
    } else {
        merged_iter.collect()
    };

    Ok(LeafListTermsResponse {
        num_hits: merged_results.len() as u64,
        terms: merged_results,
        num_attempted_splits: 1,
        failed_splits: Vec::new(),
    })
}

fn term_from_data(field: Field, field_type: &FieldType, data: &[u8]) -> Term {
    let mut term = Term::from_field_bool(field, false);
    term.clear_with_type(field_type.value_type());
    term.append_bytes(data);
    term
}

#[allow(deprecated)]
fn term_to_data(field: Field, field_type: &FieldType, field_value: &[u8]) -> Vec<u8> {
    let mut term = Term::from_field_bool(field, false);
    term.clear_with_type(field_type.value_type());
    term.append_bytes(field_value);
    term.serialized_term().to_vec()
}

/// `leaf` step of list terms.
#[instrument(skip_all)]
pub async fn leaf_list_terms(
    searcher_context: Arc<SearcherContext>,
    request: &ListTermsRequest,
    index_storage: Arc<dyn Storage>,
    splits: &[SplitIdAndFooterOffsets],
) -> Result<LeafListTermsResponse, SearchError> {
    info!(split_offsets = ?PrettySample::new(splits, 5));
    let permit_sizes: Vec<ByteSize> = splits
        .iter()
        .map(|split| {
            compute_initial_memory_allocation(
                split,
                searcher_context
                    .searcher_config
                    .warmup_single_split_initial_allocation,
            )
        })
        .collect();
    // We have added offloading leaf search to lambdas, but not for list_terms yet.
    // TODO (Add it)
    // https://github.com/quickwit-oss/quickwit/issues/6150
    let permits = searcher_context
        .search_permit_provider
        .get_permits(permit_sizes)
        .await;
    let leaf_search_single_split_futures: Vec<_> = splits
        .iter()
        .zip(permits.into_iter())
        .map(|(split, search_permit_recv)| {
            let index_storage_clone = index_storage.clone();
            let searcher_context_clone = searcher_context.clone();
            async move {
                let leaf_split_search_permit = search_permit_recv.await;
                // TODO dedicated counter and timer?
                crate::SEARCH_METRICS.leaf_list_terms_splits_total.inc();
                let timer = crate::SEARCH_METRICS
                    .leaf_search_split_duration_secs
                    .start_timer();
                let leaf_search_single_split_res = leaf_list_terms_single_split(
                    &searcher_context_clone,
                    request,
                    index_storage_clone,
                    split.clone(),
                )
                .await;
                timer.observe_duration();

                // Explicitly drop the permit for readability.
                // This should always happen after the ephemeral search cache is dropped.
                std::mem::drop(leaf_split_search_permit);

                leaf_search_single_split_res.map_err(|err| (split.split_id.clone(), err))
            }
        })
        .collect();

    let split_search_results = futures::future::join_all(leaf_search_single_split_futures).await;

    let (split_search_responses, errors): (Vec<LeafListTermsResponse>, Vec<(String, SearchError)>) =
        split_search_results
            .into_iter()
            .partition_map(|split_search_res| match split_search_res {
                Ok(split_search_resp) => Either::Left(split_search_resp),
                Err(err) => Either::Right(err),
            });

    let merged_iter = split_search_responses
        .into_iter()
        .map(|leaf_search_response| leaf_search_response.terms)
        .kmerge()
        .dedup();
    let terms: Vec<Vec<u8>> = if let Some(limit) = request.max_hits {
        merged_iter.take(limit as usize).collect()
    } else {
        merged_iter.collect()
    };

    let failed_splits = errors
        .into_iter()
        .map(|(split_id, err)| SplitSearchError {
            split_id,
            error: err.to_string(),
            retryable_error: true,
        })
        .collect();
    let merged_search_response = LeafListTermsResponse {
        num_hits: terms.len() as u64,
        terms,
        num_attempted_splits: splits.len() as u64,
        failed_splits,
    };

    Ok(merged_search_response)
}


================================================
FILE: quickwit/quickwit-search/src/metrics.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

// See https://prometheus.io/docs/practices/naming/

use std::fmt;

use bytesize::ByteSize;
use once_cell::sync::Lazy;
use quickwit_common::metrics::{
    Histogram, HistogramVec, IntCounter, IntCounterVec, IntGauge, exponential_buckets,
    linear_buckets, new_counter, new_counter_vec, new_gauge, new_gauge_vec, new_histogram,
    new_histogram_vec,
};

fn print_if_not_null(
    field_name: &'static str,
    counter: &IntCounter,
    f: &mut fmt::Formatter,
) -> fmt::Result {
    let val = counter.get();
    if val > 0 {
        write!(f, "{}={} ", field_name, val)?;
    }
    Ok(())
}

pub struct SplitSearchOutcomeCounters {
    pub cancel_before_warmup: IntCounter,
    pub cache_hit: IntCounter,
    pub pruned_before_warmup: IntCounter,
    pub cancel_warmup: IntCounter,
    pub pruned_after_warmup: IntCounter,
    pub cancel_cpu_queue: IntCounter,
    pub cancel_cpu: IntCounter,
    pub success: IntCounter,
}

impl fmt::Display for SplitSearchOutcomeCounters {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        print_if_not_null("cancel_before_warmup", &self.cancel_before_warmup, f)?;
        print_if_not_null("cache_hit", &self.cache_hit, f)?;
        print_if_not_null("pruned_before_warmup", &self.pruned_before_warmup, f)?;
        print_if_not_null("cancel_warmup", &self.cancel_warmup, f)?;
        print_if_not_null("pruned_after_warmup", &self.pruned_after_warmup, f)?;
        print_if_not_null("cancel_cpu_queue", &self.cancel_cpu_queue, f)?;
        print_if_not_null("cancel_cpu", &self.cancel_cpu, f)?;
        print_if_not_null("success", &self.success, f)?;
        Ok(())
    }
}

impl SplitSearchOutcomeCounters {
    /// Create a new SplitSearchOutcomeCounters instance, registered in prometheus.
    pub fn new_registered() -> Self {
        let search_split_outcome_vec = new_counter_vec(
            "split_search_outcome",
            "Count the state in which each leaf search split ended",
            "search",
            &[],
            ["category"],
        );
        Self::new_from_counter_vec(search_split_outcome_vec)
    }

    /// Create a new SplitSearchOutcomeCounters instance, but this one won't be reported to
    /// prometheus.
    pub fn new_unregistered() -> Self {
        let search_split_outcome_vec = IntCounterVec::new(
            "split_search_outcome",
            "Count the state in which each leaf search split ended",
            "search",
            &[],
            ["category"],
        );
        Self::new_from_counter_vec(search_split_outcome_vec)
    }

    pub fn new_from_counter_vec(search_split_outcome_vec: IntCounterVec<1>) -> Self {
        SplitSearchOutcomeCounters {
            cancel_before_warmup: search_split_outcome_vec
                .with_label_values(["cancel_before_warmup"]),
            cache_hit: search_split_outcome_vec.with_label_values(["cache_hit"]),
            pruned_before_warmup: search_split_outcome_vec
                .with_label_values(["pruned_before_warmup"]),
            cancel_warmup: search_split_outcome_vec.with_label_values(["cancel_warmup"]),
            pruned_after_warmup: search_split_outcome_vec
                .with_label_values(["pruned_after_warmup"]),
            cancel_cpu_queue: search_split_outcome_vec.with_label_values(["cancel_cpu_queue"]),
            cancel_cpu: search_split_outcome_vec.with_label_values(["cancel_cpu"]),
            success: search_split_outcome_vec.with_label_values(["success"]),
        }
    }
}

pub struct SearchMetrics {
    pub root_search_requests_total: IntCounterVec<1>,
    pub root_search_request_duration_seconds: HistogramVec<1>,
    pub root_search_targeted_splits: HistogramVec<1>,
    pub leaf_search_requests_total: IntCounterVec<1>,
    pub leaf_search_request_duration_seconds: HistogramVec<1>,
    pub leaf_search_targeted_splits: HistogramVec<1>,
    pub leaf_list_terms_splits_total: IntCounter,
    pub split_search_outcome_total: SplitSearchOutcomeCounters,
    pub leaf_search_split_duration_secs: Histogram,
    pub job_assigned_total: IntCounterVec<1>,
    pub leaf_search_single_split_tasks_pending: IntGauge,
    pub leaf_search_single_split_tasks_ongoing: IntGauge,
    pub leaf_search_single_split_warmup_num_bytes: Histogram,
    pub searcher_local_kv_store_size_bytes: IntGauge,
}

/// From 0.008s to 131.072s
fn duration_buckets() -> Vec<f64> {
    exponential_buckets(0.008, 2.0, 15).unwrap()
}

impl Default for SearchMetrics {
    fn default() -> Self {
        let targeted_splits_buckets: Vec<f64> = [
            linear_buckets(0.0, 10.0, 10).unwrap(),
            linear_buckets(100.0, 100.0, 9).unwrap(),
            linear_buckets(1000.0, 1000.0, 9).unwrap(),
            linear_buckets(10000.0, 10000.0, 10).unwrap(),
        ]
        .iter()
        .flatten()
        .copied()
        .collect();

        let pseudo_exponential_bytes_buckets = vec![
            ByteSize::mb(10).as_u64() as f64,
            ByteSize::mb(20).as_u64() as f64,
            ByteSize::mb(50).as_u64() as f64,
            ByteSize::mb(100).as_u64() as f64,
            ByteSize::mb(200).as_u64() as f64,
            ByteSize::mb(500).as_u64() as f64,
            ByteSize::gb(1).as_u64() as f64,
            ByteSize::gb(2).as_u64() as f64,
            ByteSize::gb(5).as_u64() as f64,
        ];

        let leaf_search_single_split_tasks = new_gauge_vec::<1>(
            "leaf_search_single_split_tasks",
            "Number of single split search tasks pending or ongoing",
            "search",
            &[],
            ["status"], // takes values "ongoing" or "pending"
        );

        SearchMetrics {
            root_search_requests_total: new_counter_vec(
                "root_search_requests_total",
                "Total number of root search gRPC requests processed.",
                "search",
                &[("kind", "server")],
                ["status"],
            ),
            root_search_request_duration_seconds: new_histogram_vec(
                "root_search_request_duration_seconds",
                "Duration of root search gRPC requests in seconds.",
                "search",
                &[("kind", "server")],
                ["status"],
                duration_buckets(),
            ),
            root_search_targeted_splits: new_histogram_vec(
                "root_search_targeted_splits",
                "Number of splits targeted per root search GRPC request.",
                "search",
                &[],
                ["status"],
                targeted_splits_buckets.clone(),
            ),
            leaf_search_requests_total: new_counter_vec(
                "leaf_search_requests_total",
                "Total number of leaf search gRPC requests processed.",
                "search",
                &[("kind", "server")],
                ["status"],
            ),
            leaf_search_request_duration_seconds: new_histogram_vec(
                "leaf_search_request_duration_seconds",
                "Duration of leaf search gRPC requests in seconds.",
                "search",
                &[("kind", "server")],
                ["status"],
                duration_buckets(),
            ),
            leaf_search_targeted_splits: new_histogram_vec(
                "leaf_search_targeted_splits",
                "Number of splits targeted per leaf search GRPC request.",
                "search",
                &[],
                ["status"],
                targeted_splits_buckets,
            ),

            leaf_list_terms_splits_total: new_counter(
                "leaf_list_terms_splits_total",
                "Number of list terms splits total",
                "search",
                &[],
            ),
            split_search_outcome_total: SplitSearchOutcomeCounters::new_registered(),

            leaf_search_split_duration_secs: new_histogram(
                "leaf_search_split_duration_secs",
                "Number of seconds required to run a leaf search over a single split. The timer \
                 starts after the semaphore is obtained.",
                "search",
                duration_buckets(),
            ),
            leaf_search_single_split_tasks_ongoing: leaf_search_single_split_tasks
                .with_label_values(["ongoing"]),
            leaf_search_single_split_tasks_pending: leaf_search_single_split_tasks
                .with_label_values(["pending"]),
            leaf_search_single_split_warmup_num_bytes: new_histogram(
                "leaf_search_single_split_warmup_num_bytes",
                "Size of the short lived cache for a single split once the warmup is done.",
                "search",
                pseudo_exponential_bytes_buckets,
            ),
            job_assigned_total: new_counter_vec(
                "job_assigned_total",
                "Number of job assigned to searchers, per affinity rank.",
                "search",
                &[],
                ["affinity"],
            ),
            searcher_local_kv_store_size_bytes: new_gauge(
                "searcher_local_kv_store_size_bytes",
                "Size of the searcher kv store in bytes. This store is used to cache scroll \
                 contexts.",
                "search",
                &[],
            ),
        }
    }
}

/// `SEARCH_METRICS` exposes a bunch a set of storage/cache related metrics through a prometheus
/// endpoint.
pub static SEARCH_METRICS: Lazy<SearchMetrics> = Lazy::new(SearchMetrics::default);


================================================
FILE: quickwit/quickwit-search/src/metrics_trackers.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

// See https://prometheus.io/docs/practices/naming/

use std::pin::Pin;
use std::task::{Context, Poll, ready};
use std::time::Instant;

use pin_project::{pin_project, pinned_drop};
use quickwit_proto::search::LeafSearchResponse;

use crate::SearchError;
use crate::metrics::SEARCH_METRICS;

// root

pub enum RootSearchMetricsStep {
    Plan,
    Exec { num_targeted_splits: usize },
}

/// Wrapper around the plan and search futures to track metrics.
#[pin_project(PinnedDrop)]
pub struct RootSearchMetricsFuture<F> {
    #[pin]
    pub tracked: F,
    pub start: Instant,
    pub step: RootSearchMetricsStep,
    pub is_success: Option<bool>,
}

#[pinned_drop]
impl<F> PinnedDrop for RootSearchMetricsFuture<F> {
    fn drop(self: Pin<&mut Self>) {
        let (num_targeted_splits, status) = match (&self.step, self.is_success) {
            // is is a partial success, actual success is recorded during the search step
            (RootSearchMetricsStep::Plan, Some(true)) => return,
            (RootSearchMetricsStep::Plan, Some(false)) => (0, "plan-error"),
            (RootSearchMetricsStep::Plan, None) => (0, "plan-cancelled"),
            (
                RootSearchMetricsStep::Exec {
                    num_targeted_splits,
                },
                Some(true),
            ) => (*num_targeted_splits, "success"),
            (
                RootSearchMetricsStep::Exec {
                    num_targeted_splits,
                },
                Some(false),
            ) => (*num_targeted_splits, "error"),
            (
                RootSearchMetricsStep::Exec {
                    num_targeted_splits,
                },
                None,
            ) => (*num_targeted_splits, "cancelled"),
        };

        let label_values = [status];
        SEARCH_METRICS
            .root_search_requests_total
            .with_label_values(label_values)
            .inc();
        SEARCH_METRICS
            .root_search_request_duration_seconds
            .with_label_values(label_values)
            .observe(self.start.elapsed().as_secs_f64());
        SEARCH_METRICS
            .root_search_targeted_splits
            .with_label_values(label_values)
            .observe(num_targeted_splits as f64);
    }
}

impl<F, R, E> Future for RootSearchMetricsFuture<F>
where F: Future<Output = Result<R, E>>
{
    type Output = Result<R, E>;

    fn poll(self: Pin<&mut Self>, cx: &mut Context<'_>) -> Poll<Self::Output> {
        let this = self.project();
        let response = ready!(this.tracked.poll(cx));
        *this.is_success = Some(response.is_ok());
        Poll::Ready(Ok(response?))
    }
}

// leaf

/// Wrapper around the search future to track metrics.
#[pin_project(PinnedDrop)]
pub struct LeafSearchMetricsFuture<F>
where F: Future<Output = Result<LeafSearchResponse, SearchError>>
{
    #[pin]
    pub tracked: F,
    pub start: Instant,
    pub targeted_splits: usize,
    pub status: Option<&'static str>,
}

#[pinned_drop]
impl<F> PinnedDrop for LeafSearchMetricsFuture<F>
where F: Future<Output = Result<LeafSearchResponse, SearchError>>
{
    fn drop(self: Pin<&mut Self>) {
        let label_values = [self.status.unwrap_or("cancelled")];
        SEARCH_METRICS
            .leaf_search_requests_total
            .with_label_values(label_values)
            .inc();
        SEARCH_METRICS
            .leaf_search_request_duration_seconds
            .with_label_values(label_values)
            .observe(self.start.elapsed().as_secs_f64());
        SEARCH_METRICS
            .leaf_search_targeted_splits
            .with_label_values(label_values)
            .observe(self.targeted_splits as f64);
    }
}

impl<F> Future for LeafSearchMetricsFuture<F>
where F: Future<Output = Result<LeafSearchResponse, SearchError>>
{
    type Output = Result<LeafSearchResponse, SearchError>;

    fn poll(self: Pin<&mut Self>, cx: &mut Context<'_>) -> Poll<Self::Output> {
        let this = self.project();
        let response = ready!(this.tracked.poll(cx));
        *this.status = if response.is_ok() {
            Some("success")
        } else {
            Some("error")
        };
        Poll::Ready(Ok(response?))
    }
}


================================================
FILE: quickwit/quickwit-search/src/retry/mod.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

pub mod search;

use std::collections::HashSet;
use std::net::SocketAddr;

use crate::search_job_placer::Job;
use crate::{SearchJobPlacer, SearchServiceClient};

/// A retry policy to evaluate if a request should be retried.
/// A retry can be made either on an error or on a partial success.
pub trait RetryPolicy<Request, Response, Error>: Sized {
    /// Returns a retry request in case of retry.
    fn retry_request(
        &self,
        request: Request,
        response_res: &Result<Response, Error>,
    ) -> Option<Request>;
}

/// Default retry policy:
/// - All responses are treated as success.
/// - All errors are retryable and the retry request is the same as the original one.
pub struct DefaultRetryPolicy {}

impl<Request, Response, Error> RetryPolicy<Request, Response, Error> for DefaultRetryPolicy {
    fn retry_request(
        &self,
        request: Request,
        response_res: &Result<Response, Error>,
    ) -> Option<Request> {
        match response_res {
            Ok(_) => None,
            Err(_) => Some(request),
        }
    }
}

impl Job for &str {
    fn split_id(&self) -> &str {
        self
    }

    fn cost(&self) -> usize {
        1
    }
}

// Select a new client from the client pool by the following oversimplified policy:
// 1. Take the first split_id of the request
// 2. Ask for a relevant client for that split while excluding the failing identified by its socket
// addr.
pub async fn retry_client(
    search_job_placer: &SearchJobPlacer,
    excluded_addr: SocketAddr,
    split_id: &str,
) -> anyhow::Result<SearchServiceClient> {
    let excluded_addrs = HashSet::from_iter([excluded_addr]);
    search_job_placer
        .assign_job(split_id, &excluded_addrs)
        .await
}

#[cfg(test)]
mod tests {
    use std::net::SocketAddr;
    use std::sync::Arc;

    use quickwit_proto::search::{FetchDocsResponse, SplitIdAndFooterOffsets};

    use crate::retry::{DefaultRetryPolicy, RetryPolicy, retry_client};
    use crate::{
        MockSearchService, SearchError, SearchJobPlacer, SearchServiceClient, SearcherPool,
    };

    #[test]
    fn test_should_retry_on_error() {
        let retry_policy = DefaultRetryPolicy {};
        let response_res = crate::Result::<()>::Err(SearchError::Internal("test".to_string()));
        retry_policy.retry_request((), &response_res).unwrap()
    }

    #[test]
    fn test_should_not_retry_if_result_is_ok() {
        let retry_policy = DefaultRetryPolicy {};
        let response_res =
            crate::Result::<FetchDocsResponse>::Ok(FetchDocsResponse { hits: Vec::new() });
        assert!(retry_policy.retry_request((), &response_res).is_none());
    }

    #[tokio::test]
    async fn test_retry_client_should_return_another_client() -> anyhow::Result<()> {
        let searcher_grpc_addr_1 = ([127, 0, 0, 1], 1000).into();
        let mock_search_service_1 = MockSearchService::new();
        let searcher_client_1 = SearchServiceClient::from_service(
            Arc::new(mock_search_service_1),
            searcher_grpc_addr_1,
        );
        let searcher_grpc_addr_2 = ([127, 0, 0, 1], 1001).into();
        let mock_search_service_2 = MockSearchService::new();
        let searcher_client_2 = SearchServiceClient::from_service(
            Arc::new(mock_search_service_2),
            searcher_grpc_addr_2,
        );
        let searcher_pool = SearcherPool::from_iter([
            (searcher_grpc_addr_1, searcher_client_1),
            (searcher_grpc_addr_2, searcher_client_2),
        ]);
        let search_job_placer = SearchJobPlacer::new(searcher_pool);
        let _first_grpc_addr: SocketAddr = "127.0.0.1:1000".parse()?;
        let split_id_and_footer_offsets = SplitIdAndFooterOffsets {
            split_id: "split_1".to_string(),
            split_footer_end: 100,
            split_footer_start: 0,
            timestamp_start: None,
            timestamp_end: None,
            num_docs: 0,
        };
        let client_for_retry = retry_client(
            &search_job_placer,
            searcher_grpc_addr_1,
            &split_id_and_footer_offsets.split_id,
        )
        .await
        .unwrap();
        assert_eq!(client_for_retry.grpc_addr().to_string(), "127.0.0.1:1001");
        Ok(())
    }
}


================================================
FILE: quickwit/quickwit-search/src/retry/search.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::HashSet;

use quickwit_proto::search::{LeafSearchRequest, LeafSearchResponse};

use super::RetryPolicy;
use crate::SearchError;

/// Retry policy for LeafSearchRequest.
/// A retry is made either on an error or if there are some failing splits.
/// In the last case, a retry request is built on failing splits only.
pub struct LeafSearchRetryPolicy {}

impl RetryPolicy<LeafSearchRequest, LeafSearchResponse, SearchError> for LeafSearchRetryPolicy {
    // Build a retry request on failing split ids only.
    fn retry_request(
        &self,
        mut request: LeafSearchRequest,
        response_res: &Result<LeafSearchResponse, SearchError>,
    ) -> Option<LeafSearchRequest> {
        match response_res {
            Ok(response) => {
                if response.failed_splits.is_empty() {
                    return None;
                }
                let failed_splits_hash_set: HashSet<&str> = response
                    .failed_splits
                    .iter()
                    .map(|failed_split| failed_split.split_id.as_str())
                    .collect();
                for request in request.leaf_requests.iter_mut() {
                    // Keep only failed splits
                    request.split_offsets.retain(|split_metadata| {
                        failed_splits_hash_set.contains(split_metadata.split_id.as_str())
                    });
                }
                // Remove requests with empty split_offsets
                request
                    .leaf_requests
                    .retain(|request| !request.split_offsets.is_empty());
                Some(request)
            }
            Err(SearchError::Timeout(_)) => None, // Don't retry on timeout
            Err(_) => Some(request),
        }
    }
}

#[cfg(test)]
mod tests {
    use quickwit_proto::search::{
        LeafRequestRef, LeafSearchRequest, LeafSearchResponse, SearchRequest,
        SplitIdAndFooterOffsets, SplitSearchError,
    };
    use quickwit_query::query_ast::qast_json_helper;

    use crate::SearchError;
    use crate::retry::RetryPolicy;
    use crate::retry::search::LeafSearchRetryPolicy;

    fn mock_leaf_search_request() -> LeafSearchRequest {
        let search_request = SearchRequest {
            index_id_patterns: vec!["test-idx".to_string()],
            query_ast: qast_json_helper("test", &["body"]),
            max_hits: 10,
            ..Default::default()
        };
        LeafSearchRequest {
            search_request: Some(search_request),
            doc_mappers: vec!["doc_mapper".to_string()],
            index_uris: vec!["uri".to_string()],
            leaf_requests: vec![LeafRequestRef {
                index_uri_ord: 0,
                doc_mapper_ord: 0,
                split_offsets: vec![
                    SplitIdAndFooterOffsets {
                        split_id: "split_1".to_string(),
                        split_footer_start: 0,
                        split_footer_end: 100,
                        timestamp_start: None,
                        timestamp_end: None,
                        num_docs: 0,
                    },
                    SplitIdAndFooterOffsets {
                        split_id: "split_2".to_string(),
                        split_footer_start: 0,
                        split_footer_end: 100,
                        timestamp_start: None,
                        timestamp_end: None,
                        num_docs: 0,
                    },
                ],
            }],
        }
    }

    #[test]
    fn test_should_retry_on_error() {
        let retry_policy = LeafSearchRetryPolicy {};
        let request = mock_leaf_search_request();
        let response_res = Result::<LeafSearchResponse, SearchError>::Err(SearchError::Internal(
            "test".to_string(),
        ));
        retry_policy.retry_request(request, &response_res).unwrap();
    }

    #[test]
    fn test_should_not_retry_if_result_is_ok_and_no_failing_splits() {
        let retry_policy = LeafSearchRetryPolicy {};
        let request = mock_leaf_search_request();
        let response_res = Ok(LeafSearchResponse {
            num_hits: 0,
            partial_hits: Vec::new(),
            failed_splits: Vec::new(),
            num_attempted_splits: 1,
            ..Default::default()
        });
        assert!(retry_policy.retry_request(request, &response_res).is_none())
    }

    #[test]
    fn test_should_retry_on_failed_splits() {
        let retry_policy = LeafSearchRetryPolicy {};
        let request = mock_leaf_search_request();
        let mut expected_retry_request = request.clone();
        expected_retry_request.leaf_requests[0]
            .split_offsets
            .remove(0);
        let split_error = SplitSearchError {
            error: "error".to_string(),
            split_id: "split_2".to_string(),
            retryable_error: true,
        };
        let response_res = Ok(LeafSearchResponse {
            num_hits: 0,
            partial_hits: Vec::new(),
            failed_splits: vec![split_error],
            num_attempted_splits: 1,
            ..Default::default()
        });
        let retry_request = retry_policy.retry_request(request, &response_res).unwrap();
        assert_eq!(retry_request, expected_retry_request);
    }
}


================================================
FILE: quickwit/quickwit-search/src/root.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::{HashMap, HashSet};
use std::sync::OnceLock;
use std::sync::atomic::{AtomicU64, Ordering};
use std::time::{Duration, Instant};

use anyhow::Context;
use futures::future::try_join_all;
use itertools::Itertools;
use quickwit_common::pretty::PrettySample;
use quickwit_common::shared_consts;
use quickwit_common::uri::Uri;
use quickwit_config::build_doc_mapper;
use quickwit_doc_mapper::DYNAMIC_FIELD_NAME;
use quickwit_doc_mapper::tag_pruning::extract_tags_from_query;
use quickwit_metastore::{IndexMetadata, ListIndexesMetadataResponseExt, SplitMetadata};
use quickwit_proto::metastore::{
    ListIndexesMetadataRequest, MetastoreService, MetastoreServiceClient,
};
use quickwit_proto::search::{
    FetchDocsRequest, FetchDocsResponse, Hit, LeafHit, LeafRequestRef, LeafSearchRequest,
    LeafSearchResponse, PartialHit, SearchPlanResponse, SearchRequest, SearchResponse,
    SnippetRequest, SortDatetimeFormat, SortField, SortValue, SplitIdAndFooterOffsets,
};
use quickwit_proto::types::{IndexUid, SplitId};
use quickwit_query::query_ast::{
    BoolQuery, QueryAst, QueryAstVisitor, RangeQuery, TermQuery, TermSetQuery,
};
use serde::{Deserialize, Serialize};
use tantivy::TantivyError;
use tantivy::aggregation::agg_result::AggregationResults;
use tantivy::aggregation::intermediate_agg_result::IntermediateAggregationResults;
use tantivy::collector::Collector;
use tantivy::schema::{Field, FieldEntry, FieldType, Schema};
use tracing::{debug, error, info, info_span, instrument};

use crate::cluster_client::ClusterClient;
use crate::collector::{QuickwitAggregations, make_merge_collector};
use crate::metrics_trackers::{RootSearchMetricsFuture, RootSearchMetricsStep};
use crate::scroll_context::{ScrollContext, ScrollKeyAndStartOffset};
use crate::search_job_placer::{Job, group_by, group_jobs_by_index_id};
use crate::search_response_rest::StorageRequestCount;
use crate::service::SearcherContext;
use crate::{
    SearchError, SearchJobPlacer, SearchPlanResponseRest, SearchServiceClient,
    extract_split_and_footer_offsets, list_relevant_splits,
};

/// Maximum accepted scroll TTL.
fn max_scroll_ttl() -> Duration {
    static MAX_SCROLL_TTL_LOCK: OnceLock<Duration> = OnceLock::new();
    *MAX_SCROLL_TTL_LOCK.get_or_init(|| {
        let split_deletion_grace_period = shared_consts::split_deletion_grace_period();
        assert!(
            split_deletion_grace_period >= shared_consts::MINIMUM_DELETION_GRACE_PERIOD,
            "The split deletion grace period is too short ({split_deletion_grace_period:?}). This \
             should not happen."
        );
        // We remove an extra margin of 2minutes from the split deletion grace period.
        split_deletion_grace_period - Duration::from_secs(60 * 2)
    })
}

const SORT_DOC_FIELD_NAMES: &[&str] = &["_shard_doc", "_doc"];

/// SearchJob to be assigned to search clients by the [`SearchJobPlacer`].
#[derive(Debug, Clone, PartialEq)]
pub struct SearchJob {
    /// The index UID.
    pub index_uid: IndexUid,
    cost: usize,
    /// The split ID and footer offsets of the split.
    pub offsets: SplitIdAndFooterOffsets,
}

impl SearchJob {
    /// Create a fake job from a split_id (used for hashing), and a cost.
    #[cfg(test)]
    pub fn for_test(split_id: &str, cost: usize) -> SearchJob {
        use std::str::FromStr;
        SearchJob {
            index_uid: IndexUid::from_str("test-index:00000000000000000000000000").unwrap(),
            cost,
            offsets: SplitIdAndFooterOffsets {
                split_id: split_id.to_string(),
                ..Default::default()
            },
        }
    }
}

impl From<SearchJob> for SplitIdAndFooterOffsets {
    fn from(search_job: SearchJob) -> Self {
        search_job.offsets
    }
}

impl<'a> From<&'a SplitMetadata> for SearchJob {
    fn from(split_metadata: &'a SplitMetadata) -> Self {
        SearchJob {
            index_uid: split_metadata.index_uid.clone(),
            cost: compute_split_cost(split_metadata),
            offsets: extract_split_and_footer_offsets(split_metadata),
        }
    }
}

impl Job for SearchJob {
    fn split_id(&self) -> &str {
        &self.offsets.split_id
    }

    fn cost(&self) -> usize {
        self.cost
    }
}

pub struct FetchDocsJob {
    index_uid: IndexUid,
    offsets: SplitIdAndFooterOffsets,
    pub partial_hits: Vec<PartialHit>,
}

impl Job for FetchDocsJob {
    fn split_id(&self) -> &str {
        &self.offsets.split_id
    }

    fn cost(&self) -> usize {
        self.partial_hits.len()
    }
}

impl From<FetchDocsJob> for SplitIdAndFooterOffsets {
    fn from(fetch_docs_job: FetchDocsJob) -> SplitIdAndFooterOffsets {
        fetch_docs_job.offsets
    }
}

/// Index metas needed for executing a leaf search request.
#[derive(Serialize, Deserialize, Clone, Debug)]
pub struct IndexMetasForLeafSearch {
    /// Index URI.
    pub index_uri: Uri,
    /// Doc mapper json string.
    pub doc_mapper_str: String,
}

pub(crate) type IndexesMetasForLeafSearch = HashMap<IndexUid, IndexMetasForLeafSearch>;

#[derive(Debug)]
struct RequestMetadata {
    timestamp_field_opt: Option<String>,
    query_ast_resolved: QueryAst,
    indexes_meta_for_leaf_search: IndexesMetasForLeafSearch,
    sort_fields_is_datetime: HashMap<String, bool>,
}

/// Validates request against each index's doc mapper and ensures that:
/// - timestamp fields (if any) are equal across indexes.
/// - resolved query ASTs are the same across indexes.
/// - if a sort field is of type datetime, it must be a datetime field on all indexes. This
///   constraint come from the need to support datetime formatting on sort values.
///
/// Returns the timestamp field, the resolved query AST and the indexes metadatas
/// needed for leaf search requests.
/// Note: the requirements on timestamp fields and resolved query ASTs can be lifted
/// but it adds complexity that does not seem needed right now.
fn validate_request_and_build_metadata(
    indexes_metadata: &[IndexMetadata],
    search_request: &SearchRequest,
) -> crate::Result<RequestMetadata> {
    validate_sort_by_fields_and_search_after(
        &search_request.sort_fields,
        &search_request.search_after,
    )?;
    let query_ast: QueryAst = serde_json::from_str(&search_request.query_ast)
        .map_err(|err| SearchError::InvalidQuery(err.to_string()))?;
    let mut indexes_meta_for_leaf_search: HashMap<IndexUid, IndexMetasForLeafSearch> =
        HashMap::new();
    let mut query_ast_resolved_opt: Option<QueryAst> = None;
    let mut timestamp_field_opt: Option<String> = None;
    let mut sort_fields_is_datetime: HashMap<String, bool> = HashMap::new();

    for index_metadata in indexes_metadata {
        let doc_mapper = build_doc_mapper(
            &index_metadata.index_config.doc_mapping,
            &index_metadata.index_config.search_settings,
        )
        .map_err(|err| {
            SearchError::Internal(format!("failed to build doc mapper. cause: {err}"))
        })?;
        let query_ast_resolved_for_index = query_ast
            .clone()
            .parse_user_query(doc_mapper.default_search_fields())
            // We convert the error to return a 400 to the user (and not a 500).
            .map_err(|err| SearchError::InvalidQuery(err.to_string()))?;

        // Validate uniqueness of resolved query AST.
        if let Some(query_ast_resolved) = &query_ast_resolved_opt {
            if query_ast_resolved != &query_ast_resolved_for_index {
                return Err(SearchError::InvalidQuery(
                    "resolved query ASTs must be the same across indexes. resolving queries with \
                     different default fields are different between indexes is not supported"
                        .to_string(),
                ));
            }
        } else {
            query_ast_resolved_opt = Some(query_ast_resolved_for_index.clone());
        }

        // Validate uniqueness of timestamp field if any.
        if let Some(timestamp_field_for_index) = doc_mapper.timestamp_field_name() {
            match timestamp_field_opt {
                Some(timestamp_field) if timestamp_field != timestamp_field_for_index => {
                    return Err(SearchError::InvalidQuery(
                        "the timestamp field (if present) must be the same for all indexes"
                            .to_string(),
                    ));
                }
                None => {
                    timestamp_field_opt = Some(timestamp_field_for_index.to_string());
                }
                _ => {}
            }
        }

        // Validate request against the current index schema.
        let schema = doc_mapper.schema();
        validate_request(&schema, &doc_mapper.timestamp_field_name(), search_request)?;

        validate_sort_field_types(
            &schema,
            &search_request.sort_fields,
            &mut sort_fields_is_datetime,
        )?;

        // Validates the query by effectively building it against the current schema.
        doc_mapper.query(
            doc_mapper.schema(),
            query_ast_resolved_for_index,
            true,
            None,
        )?;

        let index_metadata_for_leaf_search = IndexMetasForLeafSearch {
            index_uri: index_metadata.index_uri().clone(),
            doc_mapper_str: serde_json::to_string(&doc_mapper).map_err(|err| {
                SearchError::Internal(format!("failed to serialize doc mapper. cause: {err}"))
            })?,
        };
        indexes_meta_for_leaf_search.insert(
            index_metadata.index_uid.clone(),
            index_metadata_for_leaf_search,
        );
    }

    let query_ast_resolved = query_ast_resolved_opt.ok_or_else(|| {
        SearchError::Internal(
            "resolved query AST must be present. this should never happen".to_string(),
        )
    })?;

    Ok(RequestMetadata {
        timestamp_field_opt,
        query_ast_resolved,
        indexes_meta_for_leaf_search,
        sort_fields_is_datetime,
    })
}

/// Validate sort field types.
fn validate_sort_field_types(
    schema: &Schema,
    sort_fields: &[SortField],
    sort_field_is_datetime: &mut HashMap<String, bool>,
) -> crate::Result<()> {
    for sort_field in sort_fields.iter() {
        if let Some(sort_field_entry) = get_sort_by_field_entry(&sort_field.field_name, schema)? {
            validate_sort_by_field_type(
                sort_field_entry,
                sort_field.sort_datetime_format.is_some(),
            )?;
            // If sort field type is a date, ensure it's true for all indexes.
            if let Some(is_datetime) = sort_field_is_datetime.get(&sort_field.field_name) {
                if *is_datetime != sort_field_entry.field_type().is_date() {
                    return Err(SearchError::InvalidQuery(format!(
                        "sort datetime field `{}` must be of type datetime on all indexes",
                        sort_field_entry.name(),
                    )));
                }
            } else {
                sort_field_is_datetime.insert(
                    sort_field.field_name.to_string(),
                    sort_field_entry.field_type().is_date(),
                );
            }
        } else {
            sort_field_is_datetime.insert(sort_field.field_name.to_string(), false);
        }
    }
    Ok(())
}

fn validate_requested_snippet_fields(
    schema: &Schema,
    snippet_fields: &[String],
) -> anyhow::Result<()> {
    for field_name in snippet_fields {
        let field_entry = schema
            .get_field(field_name)
            .map(|field| schema.get_field_entry(field))?;
        match field_entry.field_type() {
            FieldType::Str(text_options) => {
                if !text_options.is_stored() {
                    return Err(anyhow::anyhow!(
                        "the snippet field `{}` must be stored",
                        field_name
                    ));
                }
            }
            other => {
                return Err(anyhow::anyhow!(
                    "the snippet field `{}` must be of type `Str`, got `{}`",
                    field_name,
                    other.value_type().name()
                ));
            }
        }
    }
    Ok(())
}

fn simplify_search_request_for_scroll_api(req: &SearchRequest) -> crate::Result<SearchRequest> {
    if req.search_after.is_some() {
        return Err(SearchError::InvalidArgument(
            "search_after cannot be used in a scroll context".to_string(),
        ));
    }

    // We do not mutate
    Ok(SearchRequest {
        index_id_patterns: req.index_id_patterns.clone(),
        query_ast: req.query_ast.clone(),
        start_timestamp: req.start_timestamp,
        end_timestamp: req.end_timestamp,
        max_hits: req.max_hits,
        start_offset: req.start_offset,
        sort_fields: req.sort_fields.clone(),
        // We remove all aggregation request.
        // The aggregation will not be computed for each scroll request.
        aggregation_request: None,
        // We remove the snippet fields. This feature is not supported for scroll requests.
        snippet_fields: Vec::new(),
        // We remove the scroll ttl parameter. It is irrelevant to process later request
        scroll_ttl_secs: None,
        search_after: None,
        // request is simplified after initial query, and we cache the hit count, so we don't need
        // to recompute it afterward.
        count_hits: quickwit_proto::search::CountHits::Underestimate as i32,
        ignore_missing_indexes: req.ignore_missing_indexes,
        skip_aggregation_finalization: false,
    })
}

/// Validates sort fields and search after values.
/// - validate sort fields length.
/// - search after values must be set for all sort fields.
fn validate_sort_by_fields_and_search_after(
    sort_fields: &[SortField],
    search_after: &Option<PartialHit>,
) -> crate::Result<()> {
    if sort_fields.is_empty() {
        return Ok(());
    }
    if sort_fields.len() > 2 {
        return Err(SearchError::InvalidArgument(format!(
            "sort by field must be up to 2 fields, got {}",
            sort_fields.len()
        )));
    }
    let Some(search_after_partial_hit) = search_after.as_ref() else {
        return Ok(());
    };

    let sort_fields_without_doc_count = sort_fields
        .iter()
        .filter(|sort_field| !SORT_DOC_FIELD_NAMES.contains(&sort_field.field_name.as_str()))
        .count();
    let has_doc_sort_field = sort_fields_without_doc_count != sort_fields.len();
    if has_doc_sort_field && search_after_partial_hit.split_id.is_empty() {
        return Err(SearchError::InvalidArgument(
            "search_after with a sort field `_doc` must define a split ID, segment ID and doc ID \
             values"
                .to_string(),
        ));
    }

    let mut search_after_sort_value_count = 0;
    // TODO: we could validate if the search after sort value types of consistent with the sort
    // field types.
    if let Some(sort_by_value) = search_after_partial_hit.sort_value.as_ref() {
        sort_by_value.sort_value.context("sort value must be set")?;
        search_after_sort_value_count += 1;
    }
    if let Some(sort_by_value_2) = search_after_partial_hit.sort_value2.as_ref() {
        sort_by_value_2
            .sort_value
            .context("sort value must be set")?;
        search_after_sort_value_count += 1;
    }
    if search_after_sort_value_count != sort_fields_without_doc_count {
        return Err(SearchError::InvalidArgument(format!(
            "`search_after` must have the same number of sort values as sort by fields {:?}",
            sort_fields
                .iter()
                .map(|sort_field| &sort_field.field_name)
                .collect_vec()
        )));
    }
    Ok(())
}

fn get_sort_by_field_entry<'a>(
    field_name: &str,
    schema: &'a Schema,
) -> crate::Result<Option<&'a FieldEntry>> {
    if "_score" == field_name || SORT_DOC_FIELD_NAMES.contains(&field_name) {
        return Ok(None);
    }
    let dynamic_field_opt = schema.get_field(DYNAMIC_FIELD_NAME).ok();
    let (sort_by_field, _json_path) = schema
        .find_field_with_default(field_name, dynamic_field_opt)
        .ok_or_else(|| {
            SearchError::InvalidArgument(format!("unknown field used in `sort by`: {field_name}"))
        })?;
    let sort_by_field_entry = schema.get_field_entry(sort_by_field);
    Ok(Some(sort_by_field_entry))
}

/// Validates sort field type.
fn validate_sort_by_field_type(
    sort_by_field_entry: &FieldEntry,
    has_timestamp_format: bool,
) -> crate::Result<()> {
    let field_name = sort_by_field_entry.name();
    if matches!(sort_by_field_entry.field_type(), FieldType::Str(_)) {
        return Err(SearchError::InvalidArgument(format!(
            "sort by field on type text is currently not supported `{field_name}`"
        )));
    }
    if !sort_by_field_entry.is_fast() {
        return Err(SearchError::InvalidArgument(format!(
            "sort by field must be a fast field, please add the fast property to your field \
             `{field_name}`",
        )));
    }
    if has_timestamp_format && !sort_by_field_entry.field_type().is_date() {
        return Err(SearchError::InvalidArgument(format!(
            "sort by field with a timestamp format must be a datetime field and the field \
             `{field_name}` is not",
        )));
    }
    Ok(())
}

fn check_is_fast_field(
    schema: &Schema,
    fast_field_name: &str,
    dynamic_fast_field: Option<Field>,
) -> crate::Result<()> {
    let Some((field, _path)): Option<(Field, &str)> =
        schema.find_field_with_default(fast_field_name, dynamic_fast_field)
    else {
        return Err(SearchError::InvalidArgument(format!(
            "Field \"{fast_field_name}\" does not exist"
        )));
    };
    let field_entry: &FieldEntry = schema.get_field_entry(field);
    if !field_entry.is_fast() {
        return Err(SearchError::InvalidArgument(format!(
            "Field \"{fast_field_name}\" is not configured as a fast field"
        )));
    }
    Ok(())
}

fn validate_request(
    schema: &Schema,
    timestamp_field_name: &Option<&str>,
    search_request: &SearchRequest,
) -> crate::Result<()> {
    if timestamp_field_name.is_none()
        && (search_request.start_timestamp.is_some() || search_request.end_timestamp.is_some())
    {
        return Err(SearchError::InvalidQuery(format!(
            "the timestamp field is not set in index: {:?} definition but start-timestamp or \
             end-timestamp are set in the query",
            search_request.index_id_patterns
        )));
    }

    validate_requested_snippet_fields(schema, &search_request.snippet_fields)?;

    if let Some(agg) = search_request.aggregation_request.as_ref() {
        let aggs: QuickwitAggregations = serde_json::from_str(agg).map_err(|_err| {
            let err = serde_json::from_str::<tantivy::aggregation::agg_req::Aggregations>(agg)
                .unwrap_err();
            SearchError::InvalidAggregationRequest(err.to_string())
        })?;

        // ensure that the required fast fields are indeed configured as fast fields.
        let fast_field_names = aggs.fast_field_names();
        let dynamic_field = schema.get_field(DYNAMIC_FIELD_NAME).ok();
        for fast_field_name in &fast_field_names {
            check_is_fast_field(schema, fast_field_name, dynamic_field)?;
        }
    };

    if search_request.start_offset > 10_000 {
        return Err(SearchError::InvalidArgument(format!(
            "max value for start_offset is 10_000, but got {}",
            search_request.start_offset
        )));
    }

    if search_request.max_hits > 10_000 {
        return Err(SearchError::InvalidArgument(format!(
            "max value for max_hits is 10_000, but got {}",
            search_request.max_hits
        )));
    }

    Ok(())
}

fn get_scroll_ttl_duration(search_request: &SearchRequest) -> crate::Result<Option<Duration>> {
    let Some(scroll_ttl_secs) = search_request.scroll_ttl_secs else {
        return Ok(None);
    };
    let scroll_ttl: Duration = Duration::from_secs(scroll_ttl_secs as u64);
    let max_scroll_ttl = max_scroll_ttl();
    if scroll_ttl > max_scroll_ttl {
        return Err(SearchError::InvalidArgument(format!(
            "Quickwit only supports scroll TTL period up to {} secs",
            max_scroll_ttl.as_secs()
        )));
    }
    Ok(Some(scroll_ttl))
}

#[instrument(level = "debug", skip_all)]
async fn search_partial_hits_phase_with_scroll(
    searcher_context: &SearcherContext,
    indexes_metas_for_leaf_search: &IndexesMetasForLeafSearch,
    mut search_request: SearchRequest,
    split_metadatas: &[SplitMetadata],
    cluster_client: &ClusterClient,
) -> crate::Result<(LeafSearchResponse, Option<ScrollKeyAndStartOffset>)> {
    let scroll_ttl_opt = get_scroll_ttl_duration(&search_request)?;

    if let Some(scroll_ttl) = scroll_ttl_opt {
        let max_hits = search_request.max_hits;
        // This is a scroll request.
        //
        // We increase max hits to add populate the scroll cache.
        search_request.max_hits = search_request
            .max_hits
            .max(shared_consts::SCROLL_BATCH_LEN as u64);
        search_request.scroll_ttl_secs = None;
        let mut leaf_search_resp = search_partial_hits_phase(
            searcher_context,
            indexes_metas_for_leaf_search,
            &search_request,
            split_metadatas,
            cluster_client,
        )
        .await?;
        let cached_partial_hits = leaf_search_resp.partial_hits.clone();
        leaf_search_resp.partial_hits.truncate(max_hits as usize);
        let last_hit = leaf_search_resp
            .partial_hits
            .last()
            .cloned()
            .unwrap_or_default();

        let scroll_context_search_request =
            simplify_search_request_for_scroll_api(&search_request)?;
        let mut scroll_ctx = ScrollContext {
            indexes_metas_for_leaf_search: indexes_metas_for_leaf_search.clone(),
            split_metadatas: split_metadatas.to_vec(),
            search_request: scroll_context_search_request,
            total_num_hits: leaf_search_resp.num_hits,
            max_hits_per_page: max_hits,
            cached_partial_hits_start_offset: search_request.start_offset,
            cached_partial_hits,
            failed_splits: leaf_search_resp.failed_splits.clone(),
            num_successful_splits: leaf_search_resp.num_successful_splits,
        };
        let scroll_key_and_start_offset: ScrollKeyAndStartOffset =
            ScrollKeyAndStartOffset::new_with_start_offset(
                scroll_ctx.search_request.start_offset,
                max_hits as u32,
                last_hit.clone(),
            )
            .next_page(leaf_search_resp.partial_hits.len() as u64, last_hit);

        scroll_ctx.clear_cache_if_unneeded();
        let payload: Vec<u8> = scroll_ctx.serialize();
        let scroll_key = scroll_key_and_start_offset.scroll_key();
        cluster_client
            .put_kv(&scroll_key, &payload, scroll_ttl)
            .await;
        Ok((leaf_search_resp, Some(scroll_key_and_start_offset)))
    } else {
        let leaf_search_resp = search_partial_hits_phase(
            searcher_context,
            indexes_metas_for_leaf_search,
            &search_request,
            split_metadatas,
            cluster_client,
        )
        .await?;
        Ok((leaf_search_resp, None))
    }
}

/// Check if the request is a count request without any filters, so we can just return the split
/// metadata count.
///
/// This is done by exclusion, so we will need to keep it up to date if fields are added.
pub fn is_metadata_count_request(request: &SearchRequest) -> bool {
    let query_ast: QueryAst = serde_json::from_str(&request.query_ast).unwrap();
    is_metadata_count_request_with_ast(&query_ast, request)
}

/// Check if the request is a count request without any filters, so we can just return the split
/// metadata count.
///
/// This is done by exclusion, so we will need to keep it up to date if fields are added.
///
/// The passed query_ast should match the serialized on in request.
pub fn is_metadata_count_request_with_ast(query_ast: &QueryAst, request: &SearchRequest) -> bool {
    // TODO detect Cache(MatchAll), Boost(MatchAll) and Bool{must/should:MatchAll}
    if query_ast != &QueryAst::MatchAll {
        return false;
    }
    if request.max_hits != 0 {
        return false;
    }

    // If the start and end timestamp encompass the whole split, it is still a count query.
    // We remove this currently on the leaf level, but not yet on the root level.
    // There's a small advantage when we would do this on the root level, since we have the
    // counts available on the split. On the leaf it is currently required to open the split
    // to get the count.
    if request.start_timestamp.is_some() || request.end_timestamp.is_some() {
        return false;
    }
    if request.aggregation_request.is_some() || !request.snippet_fields.is_empty() {
        return false;
    }
    true
}

/// Get a leaf search response that returns the num_docs of the split
pub fn get_count_from_metadata(split_metadatas: &[SplitMetadata]) -> Vec<LeafSearchResponse> {
    split_metadatas
        .iter()
        .map(|metadata| LeafSearchResponse {
            num_hits: metadata.num_docs as u64,
            partial_hits: Vec::new(),
            failed_splits: Vec::new(),
            num_attempted_splits: 1,
            num_successful_splits: 1,
            intermediate_aggregation_result: None,
            resource_stats: None,
        })
        .collect()
}

/// Returns true if the query is particularly memory intensive.
///
/// This function only considers the memory usage associated to the input data
/// and does not take in account aggregations (intermediary or not) results for instance.
///
/// Since its point is to log memory intensive queries, it focuses on the metric of the number of
/// bytes per document.
///
/// The threshold is computed dynamically using gradient descent.
fn is_top_5pct_memory_intensive(num_bytes: u64, split_num_docs: u64) -> bool {
    // It is not worth considering small splits for this.
    if split_num_docs < 100_000 {
        return false;
    }
    // We multiply those figure by 1_000 for accuracy.
    const PERCENTILE: u64 = 95;
    const PRIOR_NUM_BYTES_PER_DOC: u64 = 3 * 1_000;
    static NUM_BYTES_PER_DOC_95_PERCENTILE_ESTIMATOR: AtomicU64 =
        AtomicU64::new(PRIOR_NUM_BYTES_PER_DOC);
    let num_bits_per_docs = num_bytes * 1_000 / split_num_docs;
    let current_estimator = NUM_BYTES_PER_DOC_95_PERCENTILE_ESTIMATOR.load(Ordering::Relaxed);
    let is_memory_intensive = num_bits_per_docs > current_estimator;
    let new_estimator: u64 = if is_memory_intensive {
        current_estimator.saturating_add(PRIOR_NUM_BYTES_PER_DOC * PERCENTILE / 100)
    } else {
        current_estimator.saturating_sub(PRIOR_NUM_BYTES_PER_DOC * (100 - PERCENTILE) / 100)
    };
    // We do not use fetch_add / fetch_sub directly as they wrap around.
    // Concurrency could lead to different results here, but really we don't care.
    //
    // This is just ignoring some gradient updates.
    NUM_BYTES_PER_DOC_95_PERCENTILE_ESTIMATOR.store(new_estimator, Ordering::Relaxed);
    is_memory_intensive
}

/// If this method fails for some splits, a partial search response is returned, with the list of
/// faulty splits in the failed_splits field.
#[instrument(level = "debug", skip_all)]
pub(crate) async fn search_partial_hits_phase(
    searcher_context: &SearcherContext,
    indexes_metas_for_leaf_search: &IndexesMetasForLeafSearch,
    search_request: &SearchRequest,
    split_metadatas: &[SplitMetadata],
    cluster_client: &ClusterClient,
) -> crate::Result<LeafSearchResponse> {
    let leaf_search_responses: Vec<LeafSearchResponse> =
        if is_metadata_count_request(search_request) {
            get_count_from_metadata(split_metadatas)
        } else {
            let jobs: Vec<SearchJob> = split_metadatas.iter().map(SearchJob::from).collect();
            let assigned_leaf_search_jobs = cluster_client
                .search_job_placer
                .assign_jobs(jobs, &HashSet::default())
                .await?;
            let mut leaf_request_tasks = Vec::new();
            for (client, client_jobs) in assigned_leaf_search_jobs {
                let leaf_request = jobs_to_leaf_request(
                    search_request,
                    indexes_metas_for_leaf_search,
                    client_jobs,
                )?;
                leaf_request_tasks.push(cluster_client.leaf_search(leaf_request, client.clone()));
            }
            try_join_all(leaf_request_tasks).await?
        };

    let merge_collector =
        make_merge_collector(search_request, searcher_context.get_aggregation_limits())?;

    // Merging is a cpu-bound task.
    // It should be executed by Tokio's blocking threads.

    // Wrap into result for merge_fruits
    let leaf_search_results: Vec<tantivy::Result<LeafSearchResponse>> =
        leaf_search_responses.into_iter().map(Ok).collect_vec();
    let span = info_span!("merge_fruits");
    let leaf_search_response = crate::search_thread_pool()
        .run_cpu_intensive(move || {
            let _span_guard = span.enter();
            merge_collector.merge_fruits(leaf_search_results)
        })
        .await
        .context("failed to merge leaf search responses")?
        .map_err(|error: TantivyError| crate::SearchError::Internal(error.to_string()))?;
    debug!(
        num_hits = leaf_search_response.num_hits,
        failed_splits = ?leaf_search_response.failed_splits,
        num_attempted_splits = leaf_search_response.num_attempted_splits,
        has_intermediate_aggregation_result = leaf_search_response.intermediate_aggregation_result.is_some(),
        "Merged leaf search response."
    );

    if let Some(resource_stats) = &leaf_search_response.resource_stats
        && is_top_5pct_memory_intensive(
            resource_stats.short_lived_cache_num_bytes,
            resource_stats.split_num_docs,
        )
    {
        // We log at most 5 times per minute.
        quickwit_common::rate_limited_info!(
            limit_per_min = 5,
            split_num_docs = resource_stats.split_num_docs,
            short_lived_cached_num_bytes = resource_stats.short_lived_cache_num_bytes,
            "memory intensive query"
        );
    }

    if !leaf_search_response.failed_splits.is_empty() {
        quickwit_common::rate_limited_error!(limit_per_min=6, failed_splits = ?leaf_search_response.failed_splits, "leaf search response contains at least one failed split");
    }

    Ok(leaf_search_response)
}

pub(crate) fn get_snippet_request(search_request: &SearchRequest) -> Option<SnippetRequest> {
    if search_request.snippet_fields.is_empty() {
        return None;
    }
    Some(SnippetRequest {
        snippet_fields: search_request.snippet_fields.clone(),
        query_ast_resolved: search_request.query_ast.clone(),
    })
}

#[instrument(skip_all, fields(partial_hits_num=partial_hits.len()))]
pub(crate) async fn fetch_docs_phase(
    indexes_metas_for_leaf_search: &IndexesMetasForLeafSearch,
    partial_hits: &[PartialHit],
    split_metadatas: &[SplitMetadata],
    search_request: &SearchRequest,
    cluster_client: &ClusterClient,
) -> crate::Result<Vec<Hit>> {
    let snippet_request: Option<SnippetRequest> = get_snippet_request(search_request);
    let hit_order: HashMap<(String, u32, u32), usize> = partial_hits
        .iter()
        .enumerate()
        .map(|(position, partial_hit)| {
            let key = (
                partial_hit.split_id.clone(),
                partial_hit.segment_ord,
                partial_hit.doc_id,
            );
            (key, position)
        })
        .collect();

    let assigned_fetch_docs_jobs = assign_client_fetch_docs_jobs(
        partial_hits,
        split_metadatas,
        &cluster_client.search_job_placer,
    )
    .await?;

    let mut fetch_docs_tasks = Vec::new();
    for (client, client_jobs) in assigned_fetch_docs_jobs {
        let fetch_jobs_requests = jobs_to_fetch_docs_requests(
            snippet_request.clone(),
            indexes_metas_for_leaf_search,
            client_jobs,
        )?;
        for fetch_docs_request in fetch_jobs_requests {
            fetch_docs_tasks.push(cluster_client.fetch_docs(fetch_docs_request, client.clone()));
        }
    }
    let fetch_docs_responses: Vec<FetchDocsResponse> = try_join_all(fetch_docs_tasks).await?;

    // Merge the fetched docs.
    let leaf_hits = fetch_docs_responses
        .into_iter()
        .flat_map(|response| response.hits.into_iter());

    // Build map of Split ID > index ID to add the index ID to the hits.
    // Used for ES compatibility.
    let split_id_to_index_id_map: HashMap<&SplitId, &str> = split_metadatas
        .iter()
        .map(|split_metadata| {
            (
                &split_metadata.split_id,
                split_metadata.index_uid.index_id.as_str(),
            )
        })
        .collect();
    let mut sort_field_iter = search_request.sort_fields.iter();
    let sort_field_1_datetime_format_opt: Option<SortDatetimeFormat> =
        get_sort_field_datetime_format(sort_field_iter.next())?;
    let sort_field_2_datetime_format_opt: Option<SortDatetimeFormat> =
        get_sort_field_datetime_format(sort_field_iter.next())?;
    let mut hits_with_position: Vec<(usize, Hit)> = leaf_hits
        .map(|leaf_hit| {
            build_hit_with_position(
                leaf_hit,
                &split_id_to_index_id_map,
                &hit_order,
                &sort_field_1_datetime_format_opt,
                &sort_field_2_datetime_format_opt,
            )
        })
        .try_collect()?;

    hits_with_position.sort_by_key(|(position, _)| *position);
    let hits: Vec<Hit> = hits_with_position
        .into_iter()
        .map(|(_position, hit)| hit)
        .collect();

    Ok(hits)
}

fn build_hit_with_position(
    mut leaf_hit: LeafHit,
    split_id_to_index_id_map: &HashMap<&SplitId, &str>,
    hit_order: &HashMap<(String, u32, u32), usize>,
    sort_field_1_datetime_format_opt: &Option<SortDatetimeFormat>,
    sort_field_2_datetime_format_opt: &Option<SortDatetimeFormat>,
) -> crate::Result<(usize, Hit)> {
    let partial_hit_ref = leaf_hit
        .partial_hit
        .as_mut()
        .expect("partial hit must be present");
    let key = (
        partial_hit_ref.split_id.clone(),
        partial_hit_ref.segment_ord,
        partial_hit_ref.doc_id,
    );
    let sort_value_opt = partial_hit_ref
        .sort_value
        .as_mut()
        .and_then(|sort_field| sort_field.sort_value.as_mut());
    if let Some(sort_by_value) = sort_value_opt
        && let Some(output_datetime_format) = &sort_field_1_datetime_format_opt
    {
        convert_sort_datetime_value(sort_by_value, *output_datetime_format)?;
    }
    let sort_value_2_opt = partial_hit_ref
        .sort_value2
        .as_mut()
        .and_then(|sort_field| sort_field.sort_value.as_mut());
    if let Some(sort_by_value) = sort_value_2_opt
        && let Some(output_datetime_format) = &sort_field_2_datetime_format_opt
    {
        convert_sort_datetime_value(sort_by_value, *output_datetime_format)?;
    }
    let position = *hit_order.get(&key).expect("hit order must be present");
    let index_id = split_id_to_index_id_map
        .get(&partial_hit_ref.split_id)
        .map(|split_id| split_id.to_string())
        .unwrap_or_default();

    Result::<(usize, Hit), SearchError>::Ok((
        position,
        Hit {
            json: leaf_hit.leaf_json,
            partial_hit: leaf_hit.partial_hit,
            snippet: leaf_hit.leaf_snippet_json,
            index_id,
        },
    ))
}

fn get_sort_field_datetime_format(
    sort_field: Option<&SortField>,
) -> crate::Result<Option<SortDatetimeFormat>> {
    if let Some(sort_field) = sort_field
        && let Some(sort_field_datetime_format_int) = &sort_field.sort_datetime_format
    {
        let sort_field_datetime_format =
            SortDatetimeFormat::try_from(*sort_field_datetime_format_int)
                .context("invalid sort datetime format")?;
        return Ok(Some(sort_field_datetime_format));
    }
    Ok(None)
}

/// Performs a distributed search.
/// 1. Sends leaf requests over gRPC to multiple leaf nodes.
/// 2. Merges the search results.
/// 3. Sends fetch docs requests to multiple leaf nodes.
/// 4. Builds the response with docs and returns.
async fn root_search_aux(
    searcher_context: &SearcherContext,
    indexes_metas_for_leaf_search: &IndexesMetasForLeafSearch,
    search_request: SearchRequest,
    split_metadatas: Vec<SplitMetadata>,
    cluster_client: &ClusterClient,
) -> crate::Result<SearchResponse> {
    debug!(split_metadatas = ?PrettySample::new(&split_metadatas, 5));
    let (first_phase_result, scroll_key_and_start_offset_opt): (
        LeafSearchResponse,
        Option<ScrollKeyAndStartOffset>,
    ) = search_partial_hits_phase_with_scroll(
        searcher_context,
        indexes_metas_for_leaf_search,
        search_request.clone(),
        &split_metadatas[..],
        cluster_client,
    )
    .await?;

    let hits = fetch_docs_phase(
        indexes_metas_for_leaf_search,
        &first_phase_result.partial_hits,
        &split_metadatas[..],
        &search_request,
        cluster_client,
    )
    .await?;

    let mut aggregation_result_postcard_opt = finalize_aggregation_if_any(
        &search_request,
        first_phase_result.intermediate_aggregation_result,
        searcher_context,
    )?;
    // In case there is no index, we don't want the response to contain any aggregation structure
    if indexes_metas_for_leaf_search.is_empty() {
        aggregation_result_postcard_opt = None;
    }

    Ok(SearchResponse {
        aggregation_postcard: aggregation_result_postcard_opt,
        num_hits: first_phase_result.num_hits,
        hits,
        elapsed_time_micros: 0u64,
        errors: Vec::new(),
        scroll_id: scroll_key_and_start_offset_opt
            .as_ref()
            .map(ToString::to_string),
        failed_splits: first_phase_result.failed_splits,
        num_successful_splits: first_phase_result.num_successful_splits,
    })
}

fn finalize_aggregation(
    intermediate_aggregation_result_bytes_opt: Option<Vec<u8>>,
    aggregations: QuickwitAggregations,
    searcher_context: &SearcherContext,
) -> crate::Result<Option<Vec<u8>>> {
    let merge_aggregation_result = match aggregations {
        QuickwitAggregations::FindTraceIdsAggregation(_) => {
            // The merge collector has already merged the intermediate results.
            return Ok(intermediate_aggregation_result_bytes_opt);
        }
        QuickwitAggregations::TantivyAggregations(aggregations) => {
            let intermediate_aggregation_results =
                if let Some(intermediate_aggregation_result_bytes) =
                    intermediate_aggregation_result_bytes_opt
                {
                    let intermediate_aggregation_results: IntermediateAggregationResults =
                        postcard::from_bytes(&intermediate_aggregation_result_bytes)?;
                    intermediate_aggregation_results
                } else {
                    // Default, to return correct structure
                    Default::default()
                };
            let final_aggregation_results: AggregationResults = intermediate_aggregation_results
                .into_final_result(aggregations, searcher_context.get_aggregation_limits())?;
            let final_aggregation_proxy: quickwit_query::aggregations::AggregationResults =
                final_aggregation_results.into();
            postcard::to_stdvec(&final_aggregation_proxy)?
        }
    };
    Ok(Some(merge_aggregation_result))
}

fn finalize_aggregation_if_any(
    search_request: &SearchRequest,
    intermediate_aggregation_result_bytes_opt: Option<Vec<u8>>,
    searcher_context: &SearcherContext,
) -> crate::Result<Option<Vec<u8>>> {
    let Some(aggregations_json) = search_request.aggregation_request.as_ref() else {
        return Ok(None);
    };
    if search_request.skip_aggregation_finalization {
        return Ok(intermediate_aggregation_result_bytes_opt);
    }
    let aggregations: QuickwitAggregations = serde_json::from_str(aggregations_json)?;
    let aggregation_result_postcard = finalize_aggregation(
        intermediate_aggregation_result_bytes_opt,
        aggregations,
        searcher_context,
    )?;
    Ok(aggregation_result_postcard)
}

/// Checks that all of the index researched as found.
///
/// An index pattern (= containing a wildcard) not matching is not an error.
/// A specific index id however must be found.
///
/// We put this check here and not in the metastore to make sure the logic is independent
/// of the metastore implementation, and some different use cases could require different
/// behaviors. This specification was principally motivated by #4042.
pub fn ensure_all_indexes_found(
    indexes_metadata: &[IndexMetadata],
    index_id_patterns: &[String],
) -> crate::Result<()> {
    let mut index_ids: HashSet<&str> = index_id_patterns
        .iter()
        .filter(|pattern| !pattern.contains('*') && !pattern.starts_with('-'))
        .map(|pattern| pattern.as_str())
        .collect();

    if index_ids.is_empty() {
        // All the patterns are wildcard or negative patterns.
        return Ok(());
    }
    for index_metadata in indexes_metadata {
        index_ids.remove(index_metadata.index_id());
    }
    if index_ids.is_empty() {
        return Ok(());
    }
    let not_found_index_ids = index_ids
        .into_iter()
        .map(|index_id| index_id.to_string())
        .collect();

    Err(SearchError::IndexesNotFound {
        index_ids: not_found_index_ids,
    })
}

async fn refine_and_list_matches(
    metastore: &mut MetastoreServiceClient,
    search_request: &mut SearchRequest,
    indexes_metadata: Vec<IndexMetadata>,
    query_ast_resolved: QueryAst,
    sort_fields_is_datetime: HashMap<String, bool>,
    timestamp_field_opt: Option<String>,
) -> crate::Result<Vec<SplitMetadata>> {
    let index_uids = indexes_metadata
        .iter()
        .map(|index_metadata| index_metadata.index_uid.clone())
        .collect_vec();
    search_request.query_ast = serde_json::to_string(&query_ast_resolved)?;

    // convert search_after datetime values from input datetime format to nanos.
    convert_search_after_datetime_values(search_request, &sort_fields_is_datetime)?;

    // update_search_after_datetime_in_nanos(&mut search_request)?;
    if let Some(timestamp_field) = &timestamp_field_opt {
        refine_start_end_timestamp_from_ast(
            &query_ast_resolved,
            timestamp_field,
            &mut search_request.start_timestamp,
            &mut search_request.end_timestamp,
        );
    }
    let tag_filter_ast = extract_tags_from_query(query_ast_resolved);

    // TODO if search after is set, we sort by timestamp and we don't want to count all results,
    // we can refine more here. Same if we sort by _shard_doc
    let split_metadatas: Vec<SplitMetadata> = list_relevant_splits(
        index_uids,
        search_request.start_timestamp,
        search_request.end_timestamp,
        tag_filter_ast,
        metastore,
    )
    .await?;
    Ok(split_metadatas)
}

/// Fetches the list of splits and their metadata from the metastore
async fn plan_splits_for_root_search(
    search_request: &mut SearchRequest,
    metastore: &mut MetastoreServiceClient,
) -> crate::Result<(Vec<SplitMetadata>, IndexesMetasForLeafSearch)> {
    let list_indexes_metadatas_request = ListIndexesMetadataRequest {
        index_id_patterns: search_request.index_id_patterns.clone(),
    };
    let indexes_metadata: Vec<IndexMetadata> = metastore
        .list_indexes_metadata(list_indexes_metadatas_request)
        .await?
        .deserialize_indexes_metadata()
        .await?;

    if !search_request.ignore_missing_indexes {
        ensure_all_indexes_found(&indexes_metadata[..], &search_request.index_id_patterns[..])?;
    }

    if indexes_metadata.is_empty() {
        return Ok((Vec::new(), HashMap::default()));
    }

    let request_metadata = validate_request_and_build_metadata(&indexes_metadata, search_request)?;
    let split_metadatas = refine_and_list_matches(
        metastore,
        search_request,
        indexes_metadata,
        request_metadata.query_ast_resolved,
        request_metadata.sort_fields_is_datetime,
        request_metadata.timestamp_field_opt,
    )
    .await?;
    Ok((
        split_metadatas,
        request_metadata.indexes_meta_for_leaf_search,
    ))
}

/// Performs a distributed search.
/// 1. Sends leaf requests over gRPC to multiple leaf nodes.
/// 2. Merges the search results.
/// 3. Sends fetch docs requests to multiple leaf nodes.
/// 4. Builds the response with docs and returns.
#[instrument(skip_all)]
pub async fn root_search(
    searcher_context: &SearcherContext,
    mut search_request: SearchRequest,
    mut metastore: MetastoreServiceClient,
    cluster_client: &ClusterClient,
) -> crate::Result<SearchResponse> {
    let start_instant = Instant::now();

    let (split_metadatas, indexes_meta_for_leaf_search) = RootSearchMetricsFuture {
        start: start_instant,
        tracked: plan_splits_for_root_search(&mut search_request, &mut metastore),
        is_success: None,
        step: RootSearchMetricsStep::Plan,
    }
    .await?;

    let num_docs: usize = split_metadatas.iter().map(|split| split.num_docs).sum();
    let num_splits = split_metadatas.len();

    // It would have been nice to add those in the context of the trace span,
    // but with our current logging setting, it makes logs too verbose.
    info!(
        query_ast = search_request.query_ast.as_str(),
        agg = search_request.aggregation_request(),
        start_ts = ?(search_request.start_timestamp()..search_request.end_timestamp()),
        count_required = search_request.count_hits().as_str_name(),
        num_docs = num_docs,
        num_splits = num_splits,
        "root_search"
    );

    if let Some(max_total_split_searches) = searcher_context.searcher_config.max_splits_per_search
        && max_total_split_searches < num_splits
    {
        error!(
            num_splits,
            max_total_split_searches,
            index=?search_request.index_id_patterns,
            query=%search_request.query_ast,
            "max total splits exceeded"
        );
        return Err(SearchError::InvalidArgument(format!(
            "Number of targeted splits {num_splits} exceeds the limit {max_total_split_searches}"
        )));
    }

    let mut search_response_result = RootSearchMetricsFuture {
        start: start_instant,
        tracked: root_search_aux(
            searcher_context,
            &indexes_meta_for_leaf_search,
            search_request,
            split_metadatas,
            cluster_client,
        ),
        is_success: None,
        step: RootSearchMetricsStep::Exec {
            num_targeted_splits: num_splits,
        },
    }
    .await;

    if let Ok(search_response) = &mut search_response_result {
        search_response.elapsed_time_micros = start_instant.elapsed().as_micros() as u64;
    }

    search_response_result
}

/// Returns details on how a query would be executed
pub async fn search_plan(
    mut search_request: SearchRequest,
    mut metastore: MetastoreServiceClient,
) -> crate::Result<SearchPlanResponse> {
    let list_indexes_metadatas_request = ListIndexesMetadataRequest {
        index_id_patterns: search_request.index_id_patterns.clone(),
    };
    let indexes_metadata: Vec<IndexMetadata> = metastore
        .list_indexes_metadata(list_indexes_metadatas_request)
        .await?
        .deserialize_indexes_metadata()
        .await?;

    if !search_request.ignore_missing_indexes {
        ensure_all_indexes_found(&indexes_metadata[..], &search_request.index_id_patterns[..])?;
    }
    if indexes_metadata.is_empty() {
        return Ok(SearchPlanResponse {
            result: serde_json::to_string(&SearchPlanResponseRest {
                quickwit_ast: QueryAst::MatchAll,
                tantivy_ast: String::new(),
                searched_splits: Vec::new(),
                storage_requests: StorageRequestCount::default(),
            })?,
        });
    }
    let doc_mapper = build_doc_mapper(
        &indexes_metadata[0].index_config.doc_mapping,
        &indexes_metadata[0].index_config.search_settings,
    )
    .map_err(|err| SearchError::Internal(format!("failed to build doc mapper. cause: {err}")))?;

    let request_metadata = validate_request_and_build_metadata(&indexes_metadata, &search_request)?;
    let split_metadatas = refine_and_list_matches(
        &mut metastore,
        &mut search_request,
        indexes_metadata,
        request_metadata.query_ast_resolved.clone(),
        request_metadata.sort_fields_is_datetime,
        request_metadata.timestamp_field_opt,
    )
    .await?;

    let (query, mut warmup_info) = doc_mapper.query(
        doc_mapper.schema(),
        request_metadata.query_ast_resolved.clone(),
        true,
        None,
    )?;
    let merge_collector = make_merge_collector(&search_request, Default::default())?;
    warmup_info.merge(merge_collector.warmup_info());
    warmup_info.simplify();

    let split_ids = split_metadatas
        .into_iter()
        .map(|split| format!("{}/{}", split.index_uid.index_id, split.split_id))
        .collect();
    // this is an upper bound, we'd need access to a hotdir for more precise results
    let fieldnorm_query_count = if warmup_info.field_norms {
        doc_mapper
            .schema()
            .fields()
            .filter(|(_, entry)| entry.has_fieldnorms())
            .count()
    } else {
        0
    };
    let sstable_query_count = warmup_info.term_dict_fields.len()
        + warmup_info
            .terms_grouped_by_field
            .values()
            .map(|terms: &HashMap<tantivy::Term, bool>| terms.len())
            .sum::<usize>()
        + warmup_info
            .term_ranges_grouped_by_field
            .values()
            .map(|terms: &HashMap<_, bool>| terms.len())
            .sum::<usize>();
    let position_query_count = warmup_info
        .terms_grouped_by_field
        .values()
        .map(|terms: &HashMap<tantivy::Term, bool>| {
            terms
                .values()
                .filter(|load_position| **load_position)
                .count()
        })
        .sum::<usize>()
        + warmup_info
            .term_ranges_grouped_by_field
            .values()
            .map(|terms: &HashMap<_, bool>| {
                terms
                    .values()
                    .filter(|load_position| **load_position)
                    .count()
            })
            .sum::<usize>();
    Ok(SearchPlanResponse {
        result: serde_json::to_string(&SearchPlanResponseRest {
            quickwit_ast: request_metadata.query_ast_resolved,
            tantivy_ast: format!("{query:#?}"),
            searched_splits: split_ids,
            storage_requests: StorageRequestCount {
                footer: 1,
                fastfield: warmup_info.fast_fields.len(),
                fieldnorm: fieldnorm_query_count,
                sstable: sstable_query_count,
                posting: sstable_query_count,
                position: position_query_count,
            },
        })?,
    })
}

/// Converts search after with datetime format to nanoseconds (representation in tantivy).
/// If the sort field is a datetime field and no datetime format is set, the default format is
/// milliseconds.
/// `sort_fields_are_datetime_opt` must be of the same length as `search_request.sort_fields`.
fn convert_search_after_datetime_values(
    search_request: &mut SearchRequest,
    sort_fields_is_datetime: &HashMap<String, bool>,
) -> crate::Result<()> {
    for sort_field in search_request.sort_fields.iter_mut() {
        if *sort_fields_is_datetime
            .get(&sort_field.field_name)
            .unwrap_or(&false)
            && sort_field.sort_datetime_format.is_none()
        {
            sort_field.sort_datetime_format = Some(SortDatetimeFormat::UnixTimestampMillis as i32);
        }
    }
    if let Some(partial_hit) = search_request.search_after.as_mut() {
        let search_after_values = [
            partial_hit.sort_value.as_mut(),
            partial_hit.sort_value2.as_mut(),
        ];
        for (sort_field, search_after_value_opt) in
            search_request.sort_fields.iter().zip(search_after_values)
        {
            let Some(search_after_sort_by_value) = search_after_value_opt else {
                continue;
            };
            let Some(search_after_sort_value) = search_after_sort_by_value.sort_value.as_mut()
            else {
                continue;
            };
            let Some(datetime_format_int) = sort_field.sort_datetime_format else {
                continue;
            };
            let input_datetime_format = SortDatetimeFormat::try_from(datetime_format_int)
                .context("invalid sort datetime format")?;
            convert_sort_datetime_value_into_nanos(search_after_sort_value, input_datetime_format)?;
        }
    }
    Ok(())
}

/// Convert sort values from input datetime format into nanoseconds.
/// The conversion is done only for U64 and I64 sort values, an error is returned for other types.
fn convert_sort_datetime_value_into_nanos(
    sort_value: &mut SortValue,
    input_format: SortDatetimeFormat,
) -> crate::Result<()> {
    match sort_value {
        SortValue::U64(value) => match input_format {
            SortDatetimeFormat::UnixTimestampMillis => {
                *value = value.checked_mul(1_000_000).ok_or_else(|| {
                    SearchError::Internal(format!(
                        "sort value defined in milliseconds is too large and cannot be converted \
                         into nanoseconds: {value}"
                    ))
                })?;
            }
            SortDatetimeFormat::UnixTimestampNanos => {
                // Nothing to do as the internal format is nanos.
            }
        },
        SortValue::I64(value) => match input_format {
            SortDatetimeFormat::UnixTimestampMillis => {
                *value = value.checked_mul(1_000_000).ok_or_else(|| {
                    SearchError::Internal(format!(
                        "sort value defined in milliseconds is too large and cannot be converted \
                         into nanoseconds: {value}"
                    ))
                })?;
            }
            SortDatetimeFormat::UnixTimestampNanos => {
                // Nothing to do as the internal format is nanos.
            }
        },
        _ => {
            return Err(SearchError::Internal(format!(
                "datetime conversion are only support for u64 and i64 sort values, not \
                 `{sort_value:?}`"
            )));
        }
    }
    Ok(())
}

/// Convert sort values from nanoseconds to the requested output format.
/// The conversion is done only for U64 and I64 sort values, an error is returned for other types.
fn convert_sort_datetime_value(
    sort_value: &mut SortValue,
    output_format: SortDatetimeFormat,
) -> crate::Result<()> {
    match sort_value {
        SortValue::U64(value) => match output_format {
            SortDatetimeFormat::UnixTimestampMillis => {
                *value /= 1_000_000;
            }
            SortDatetimeFormat::UnixTimestampNanos => {
                // Nothing todo as the internal format is in nanos.
            }
        },
        SortValue::I64(value) => match output_format {
            SortDatetimeFormat::UnixTimestampMillis => {
                *value /= 1_000_000;
            }
            SortDatetimeFormat::UnixTimestampNanos => {
                // Nothing todo as the internal format is in nanos.
            }
        },
        _ => {
            return Err(SearchError::Internal(format!(
                "datetime conversion are only support for u64 and i64 sort values, not \
                 `{sort_value:?}`"
            )));
        }
    }
    Ok(())
}

pub(crate) fn refine_start_end_timestamp_from_ast(
    query_ast: &QueryAst,
    timestamp_field: &str,
    start_timestamp: &mut Option<i64>,
    end_timestamp: &mut Option<i64>,
) {
    let mut timestamp_range_extractor = ExtractTimestampRange {
        timestamp_field,
        start_timestamp: *start_timestamp,
        end_timestamp: *end_timestamp,
    };
    timestamp_range_extractor
        .visit(query_ast)
        .expect("can't fail unwrapping Infallible");
    *start_timestamp = timestamp_range_extractor.start_timestamp;
    *end_timestamp = timestamp_range_extractor.end_timestamp;
}

/// Boundaries identified as being implied by the QueryAst.
///
/// `start_timestamp` is to be interpreted as Inclusive (or Unbounded)
/// `end_timestamp` is to be interpreted as Exclusive (or Unbounded)
/// In other word, this is a `[start_timestamp..end_timestamp)` interval.
struct ExtractTimestampRange<'a> {
    timestamp_field: &'a str,
    start_timestamp: Option<i64>,
    end_timestamp: Option<i64>,
}

impl ExtractTimestampRange<'_> {
    fn update_start_timestamp(
        &mut self,
        lower_bound: &quickwit_query::JsonLiteral,
        included: bool,
    ) {
        use quickwit_query::InterpretUserInput;
        let Some(lower_bound) = tantivy::DateTime::interpret_json(lower_bound) else {
            return;
        };
        let mut lower_bound = lower_bound.into_timestamp_secs();
        if !included {
            // TODO saturating isn't exactly right, we should replace the RangeQuery with
            // a match_none, but the visitor doesn't allow mutation.
            lower_bound = lower_bound.saturating_add(1);
        }

        self.start_timestamp = self.start_timestamp.max(Some(lower_bound));
    }

    fn update_end_timestamp(&mut self, upper_bound: &quickwit_query::JsonLiteral, included: bool) {
        use quickwit_query::InterpretUserInput;
        let Some(upper_bound_timestamp) = tantivy::DateTime::interpret_json(upper_bound) else {
            return;
        };
        let mut upper_bound = upper_bound_timestamp.into_timestamp_secs();
        let round_up = (upper_bound_timestamp.into_timestamp_nanos() % 1_000_000_000) != 0;
        if included || round_up {
            // TODO saturating isn't exactly right, we should replace the RangeQuery with
            // a match_none, but the visitor doesn't allow mutation.
            upper_bound = upper_bound.saturating_add(1);
        }

        let new_end_timestamp = self.end_timestamp.unwrap_or(upper_bound).min(upper_bound);
        self.end_timestamp = Some(new_end_timestamp);
    }
}

impl<'b> QueryAstVisitor<'b> for ExtractTimestampRange<'_> {
    type Err = std::convert::Infallible;

    fn visit_bool(&mut self, bool_query: &'b BoolQuery) -> Result<(), Self::Err> {
        // we only want to visit sub-queries which are strict (positive) requirements
        for ast in bool_query.must.iter().chain(bool_query.filter.iter()) {
            self.visit(ast)?;
        }
        Ok(())
    }

    fn visit_range(&mut self, range_query: &'b RangeQuery) -> Result<(), Self::Err> {
        use std::ops::Bound;

        if range_query.field == self.timestamp_field {
            match &range_query.lower_bound {
                Bound::Included(lower_bound) => self.update_start_timestamp(lower_bound, true),
                Bound::Excluded(lower_bound) => self.update_start_timestamp(lower_bound, false),
                Bound::Unbounded => (),
            }
            match &range_query.upper_bound {
                Bound::Included(upper_bound) => self.update_end_timestamp(upper_bound, true),
                Bound::Excluded(upper_bound) => self.update_end_timestamp(upper_bound, false),
                Bound::Unbounded => (),
            }
        }
        Ok(())
    }

    // if we visit a term, limit the range to DATE..=DATE
    fn visit_term(&mut self, term_query: &'b TermQuery) -> Result<(), Self::Err> {
        if term_query.field == self.timestamp_field {
            // TODO when fixing #3323, this may need to be modified to support numbers too
            let json_term = quickwit_query::JsonLiteral::String(term_query.value.clone());
            self.update_start_timestamp(&json_term, true);
            self.update_end_timestamp(&json_term, true);
        }
        Ok(())
    }

    // if we visit a termset, limit the range to LOWEST..=HIGHEST
    fn visit_term_set(&mut self, term_query: &'b TermSetQuery) -> Result<(), Self::Err> {
        if let Some(term_set) = term_query.terms_per_field.get(self.timestamp_field) {
            // rfc3339 is lexicographically ordered if YEAR <= 9999, so we can use string
            // ordering to get the start and end quickly.
            if let Some(first) = term_set.first() {
                let json_term = quickwit_query::JsonLiteral::String(first.clone());
                self.update_start_timestamp(&json_term, true);
            }
            if let Some(last) = term_set.last() {
                let json_term = quickwit_query::JsonLiteral::String(last.clone());
                self.update_end_timestamp(&json_term, true);
            }
        }
        Ok(())
    }
}

async fn assign_client_fetch_docs_jobs(
    partial_hits: &[PartialHit],
    split_metadatas: &[SplitMetadata],
    client_pool: &SearchJobPlacer,
) -> crate::Result<impl Iterator<Item = (SearchServiceClient, Vec<FetchDocsJob>)>> {
    let index_uids_and_split_offsets_map: HashMap<String, (IndexUid, SplitIdAndFooterOffsets)> =
        split_metadatas
            .iter()
            .map(|metadata| {
                (
                    metadata.split_id().to_string(),
                    (
                        metadata.index_uid.clone(),
                        extract_split_and_footer_offsets(metadata),
                    ),
                )
            })
            .collect();

    // Group the partial hits per split
    let mut partial_hits_map: HashMap<String, Vec<PartialHit>> = HashMap::new();
    for partial_hit in partial_hits.iter() {
        partial_hits_map
            .entry(partial_hit.split_id.clone())
            .or_default()
            .push(partial_hit.clone());
    }

    let mut fetch_docs_req_jobs: Vec<FetchDocsJob> = Vec::new();
    for (split_id, partial_hits) in partial_hits_map {
        let (index_uid, offsets) = index_uids_and_split_offsets_map
            .get(&split_id)
            .ok_or_else(|| {
                crate::SearchError::Internal(format!(
                    "received partial hit from an unknown split {split_id}"
                ))
            })?
            .clone();
        let fetch_docs_job = FetchDocsJob {
            index_uid: index_uid.clone(),
            offsets,
            partial_hits,
        };
        fetch_docs_req_jobs.push(fetch_docs_job);
    }

    let assigned_jobs = client_pool
        .assign_jobs(fetch_docs_req_jobs, &HashSet::new())
        .await?;

    Ok(assigned_jobs)
}

// Measure the cost associated to searching in a given split metadata.
fn compute_split_cost(split_metadata: &SplitMetadata) -> usize {
    // TODO this formula could be tuned a lot more. The general idea is that there is a fixed
    // cost to searching a split, plus a somewhat-linear cost depending on the size of the split
    5 + split_metadata.num_docs / 100_000
}

/// Builds a LeafSearchRequest to one node, from a list of [`SearchJob`].
pub fn jobs_to_leaf_request(
    request: &SearchRequest,
    search_indexes_metadatas: &IndexesMetasForLeafSearch,
    jobs: Vec<SearchJob>,
) -> crate::Result<LeafSearchRequest> {
    let mut search_request_for_leaf = request.clone();
    search_request_for_leaf.start_offset = 0;
    search_request_for_leaf.max_hits += request.start_offset;
    search_request_for_leaf.index_id_patterns = Vec::new();

    let mut leaf_search_request = LeafSearchRequest {
        search_request: Some(search_request_for_leaf),
        leaf_requests: Vec::new(),
        doc_mappers: Vec::new(),
        index_uris: Vec::new(),
    };

    let mut added_doc_mappers: HashMap<&str, u32> = HashMap::new();
    // Group jobs by index uid, as the split offsets are relative to the index.
    group_jobs_by_index_id(jobs, |job_group| {
        let index_uid = &job_group[0].index_uid;
        leaf_search_request
            .search_request
            .as_mut()
            .unwrap()
            .index_id_patterns
            .push(index_uid.index_id.to_string());
        let search_index_meta = search_indexes_metadatas.get(index_uid).ok_or_else(|| {
            SearchError::Internal(format!(
                "received job for an unknown index {index_uid}. it should never happen"
            ))
        })?;
        let doc_mapper_ord = *added_doc_mappers
            .entry(&search_index_meta.doc_mapper_str)
            .or_insert_with(|| {
                let ord = leaf_search_request.doc_mappers.len();
                leaf_search_request
                    .doc_mappers
                    .push(search_index_meta.doc_mapper_str.to_string());
                ord as u32
            });
        let index_uri_ord = leaf_search_request.index_uris.len() as u32;
        leaf_search_request
            .index_uris
            .push(search_index_meta.index_uri.to_string());

        let leaf_search_request_ref = LeafRequestRef {
            split_offsets: job_group.into_iter().map(|job| job.offsets).collect(),
            doc_mapper_ord,
            index_uri_ord,
        };
        leaf_search_request
            .leaf_requests
            .push(leaf_search_request_ref);
        Ok(())
    })?;
    Ok(leaf_search_request)
}

/// Builds a list of [`FetchDocsRequest`], one per index, from a list of [`FetchDocsJob`].
pub fn jobs_to_fetch_docs_requests(
    snippet_request_opt: Option<SnippetRequest>,
    indexes_metas_for_leaf_search: &IndexesMetasForLeafSearch,
    jobs: Vec<FetchDocsJob>,
) -> crate::Result<Vec<FetchDocsRequest>> {
    let mut fetch_docs_requests = Vec::new();
    // Group jobs by index uid.
    group_by(
        jobs,
        |job| &job.index_uid,
        |fetch_docs_jobs| {
            let index_uid = &fetch_docs_jobs[0].index_uid;

            let index_meta = indexes_metas_for_leaf_search
                .get(index_uid)
                .ok_or_else(|| {
                    SearchError::Internal(format!(
                        "received search job for an unknown index {index_uid}"
                    ))
                })?;
            let partial_hits: Vec<PartialHit> = fetch_docs_jobs
                .iter()
                .flat_map(|fetch_doc_job| fetch_doc_job.partial_hits.iter().cloned())
                .collect();
            let split_offsets: Vec<SplitIdAndFooterOffsets> = fetch_docs_jobs
                .into_iter()
                .map(|fetch_doc_job| fetch_doc_job.into())
                .collect();
            let fetch_docs_req = FetchDocsRequest {
                partial_hits,
                split_offsets,
                index_uri: index_meta.index_uri.to_string(),
                snippet_request: snippet_request_opt.clone(),
                doc_mapper: index_meta.doc_mapper_str.clone(),
            };
            fetch_docs_requests.push(fetch_docs_req);

            Ok(())
        },
    )?;
    Ok(fetch_docs_requests)
}

#[cfg(test)]
mod tests {
    use std::ops::Range;
    use std::str::FromStr;
    use std::sync::{Arc, RwLock};

    use quickwit_common::ServiceStream;
    use quickwit_common::shared_consts::SCROLL_BATCH_LEN;
    use quickwit_config::{
        DocMapping, IndexConfig, IndexingSettings, IngestSettings, SearchSettings,
    };
    use quickwit_indexing::MockSplitBuilder;
    use quickwit_metastore::{IndexMetadata, ListSplitsRequestExt, ListSplitsResponseExt};
    use quickwit_proto::metastore::{
        ListIndexesMetadataResponse, ListSplitsResponse, MockMetastoreService,
    };
    use quickwit_proto::search::{
        ScrollRequest, SortByValue, SortOrder, SortValue, SplitSearchError,
    };
    use quickwit_query::query_ast::{qast_helper, qast_json_helper, query_ast_from_user_text};
    use tantivy::schema::{FAST, STORED, TEXT};

    use super::*;
    use crate::{MockSearchService, searcher_pool_for_test};

    #[track_caller]
    fn check_snippet_fields_validation(snippet_fields: &[String]) -> anyhow::Result<()> {
        let mut schema_builder = Schema::builder();
        schema_builder.add_text_field("title", TEXT);
        schema_builder.add_text_field("desc", TEXT | STORED);
        schema_builder.add_ip_addr_field("ip", FAST | STORED);
        let schema = schema_builder.build();
        validate_requested_snippet_fields(&schema, snippet_fields)
    }

    #[test]
    fn test_validate_requested_snippet_fields() {
        check_snippet_fields_validation(&["desc".to_string()]).unwrap();
        let field_not_stored_err =
            check_snippet_fields_validation(&["title".to_string()]).unwrap_err();
        assert_eq!(
            field_not_stored_err.to_string(),
            "the snippet field `title` must be stored"
        );
        let field_doesnotexist_err =
            check_snippet_fields_validation(&["doesnotexist".to_string()]).unwrap_err();
        assert_eq!(
            field_doesnotexist_err.to_string(),
            "The field does not exist: 'doesnotexist'"
        );
        let field_is_not_text_err =
            check_snippet_fields_validation(&["ip".to_string()]).unwrap_err();
        assert_eq!(
            field_is_not_text_err.to_string(),
            "the snippet field `ip` must be of type `Str`, got `IpAddr`"
        );
    }

    #[test]
    fn test_get_sort_by_field_entry() {
        let mut schema_builder = Schema::builder();
        schema_builder.add_text_field("title", TEXT);
        schema_builder.add_text_field("desc", TEXT | STORED);
        schema_builder.add_u64_field("timestamp", FAST | STORED);
        let schema = schema_builder.build();
        get_sort_by_field_entry("timestamp", &schema)
            .unwrap()
            .unwrap();
        let sort_by_field_entry_err = get_sort_by_field_entry("doesnotexist", &schema).unwrap_err();
        assert_eq!(
            sort_by_field_entry_err.to_string(),
            "Invalid argument: unknown field used in `sort by`: doesnotexist"
        );
        for sort_field_name in &["_doc", "_score", "_shard_doc"] {
            assert!(
                get_sort_by_field_entry(sort_field_name, &schema)
                    .unwrap()
                    .is_none()
            );
        }
    }

    fn index_metadata_for_multi_indexes_test(index_id: &str, index_uri: &str) -> IndexMetadata {
        let index_uri = Uri::from_str(index_uri).unwrap();
        let doc_mapping_json = r#"{
            "mode": "lenient",
            "field_mappings": [
                {
                    "name": "timestamp",
                    "type": "datetime",
                    "fast": true
                },
                {
                    "name": "body",
                    "type": "text",
                    "stored": true
                }
            ],
            "timestamp_field": "timestamp",
            "store_source": true
        }"#;
        let doc_mapping = serde_json::from_str(doc_mapping_json).unwrap();
        let indexing_settings = IndexingSettings::default();
        let ingest_settings = IngestSettings::default();
        let search_settings = SearchSettings {
            default_search_fields: vec!["body".to_string()],
        };
        IndexMetadata::new(IndexConfig {
            index_id: index_id.to_string(),
            index_uri,
            doc_mapping,
            indexing_settings,
            ingest_settings,
            search_settings,
            retention_policy_opt: None,
        })
    }

    #[test]
    fn test_validate_request_and_build_metadatas_ok() {
        let request_query_ast = qast_helper("body:test", &[]);
        let search_request = quickwit_proto::search::SearchRequest {
            index_id_patterns: vec!["test-index".to_string()],
            query_ast: serde_json::to_string(&request_query_ast).unwrap(),
            max_hits: 10,
            start_offset: 10,
            sort_fields: vec![
                SortField {
                    field_name: "timestamp".to_string(),
                    sort_order: SortOrder::Desc as i32,
                    sort_datetime_format: Some(SortDatetimeFormat::UnixTimestampMillis as i32),
                },
                SortField {
                    field_name: "_doc".to_string(),
                    sort_order: SortOrder::Asc as i32,
                    sort_datetime_format: None,
                },
            ],
            ..Default::default()
        };
        let index_metadata = IndexMetadata::for_test("test-index-1", "ram:///test-index-1");
        let index_metadata_with_other_config =
            index_metadata_for_multi_indexes_test("test-index-2", "ram:///test-index-2");
        let mut index_metadata_no_timestamp =
            IndexMetadata::for_test("test-index-3", "ram:///test-index-3");
        index_metadata_no_timestamp
            .index_config
            .doc_mapping
            .timestamp_field = None;
        let request_metadata = validate_request_and_build_metadata(
            &[
                index_metadata,
                index_metadata_with_other_config,
                index_metadata_no_timestamp,
            ],
            &search_request,
        )
        .unwrap();
        assert_eq!(
            request_metadata.timestamp_field_opt,
            Some("timestamp".to_string())
        );
        assert_eq!(request_metadata.query_ast_resolved, request_query_ast);
        assert_eq!(request_metadata.indexes_meta_for_leaf_search.len(), 3);
        assert_eq!(request_metadata.sort_fields_is_datetime.len(), 2);
        assert_eq!(
            request_metadata.sort_fields_is_datetime.get("timestamp"),
            Some(&true)
        );
        assert_eq!(
            request_metadata.sort_fields_is_datetime.get("_doc"),
            Some(&false)
        );
    }

    #[test]
    fn test_validate_request_and_build_metadatas_fail_with_different_timestamps() {
        let search_request = quickwit_proto::search::SearchRequest {
            index_id_patterns: vec!["test-index".to_string()],
            query_ast: qast_json_helper("test", &["body"]),
            max_hits: 10,
            start_offset: 10,
            ..Default::default()
        };
        let index_metadata_1 = IndexMetadata::for_test("test-index-1", "ram:///test-index-1");
        let mut index_metadata_2 = IndexMetadata::for_test("test-index-2", "ram:///test-index-2");
        let doc_mapping_json_2 = r#"{
            "mode": "lenient",
            "field_mappings": [
                {
                    "name": "timestamp-2",
                    "type": "datetime",
                    "fast": true
                },
                {
                    "name": "body",
                    "type": "text"
                }
            ],
            "timestamp_field": "timestamp-2",
            "store_source": true
        }"#;
        let doc_mapping_2: DocMapping = serde_json::from_str(doc_mapping_json_2).unwrap();
        index_metadata_2.index_config.doc_mapping = doc_mapping_2;
        index_metadata_2
            .index_config
            .search_settings
            .default_search_fields = Vec::new();
        let timestamp_field_different = validate_request_and_build_metadata(
            &[index_metadata_1, index_metadata_2],
            &search_request,
        )
        .unwrap_err();
        assert_eq!(
            timestamp_field_different.to_string(),
            "the timestamp field (if present) must be the same for all indexes"
        );
    }

    #[test]
    fn test_validate_request_and_build_metadatas_fail_with_different_resolved_qast() {
        let qast = query_ast_from_user_text("test", None);
        let search_request = quickwit_proto::search::SearchRequest {
            index_id_patterns: vec!["test-index".to_string()],
            query_ast: serde_json::to_string(&qast).unwrap(),
            max_hits: 10,
            start_offset: 10,
            ..Default::default()
        };
        let index_metadata_1 = IndexMetadata::for_test("test-index-1", "ram:///test-index-1");
        let mut index_metadata_2 = IndexMetadata::for_test("test-index-2", "ram:///test-index-2");
        index_metadata_2
            .index_config
            .search_settings
            .default_search_fields = vec!["owner".to_string()];
        let timestamp_field_different = validate_request_and_build_metadata(
            &[index_metadata_1, index_metadata_2],
            &search_request,
        )
        .unwrap_err();
        assert_eq!(
            timestamp_field_different.to_string(),
            "resolved query ASTs must be the same across indexes. resolving queries with \
             different default fields are different between indexes is not supported"
        );
    }

    fn index_metadata_for_multi_indexes_test_with_incompatible_sort_type(
        index_id: &str,
        index_uri: &str,
    ) -> IndexMetadata {
        let index_uri = Uri::from_str(index_uri).unwrap();
        let doc_mapping_json = r#"{
            "mode": "lenient",
            "field_mappings": [
                {
                    "name": "timestamp",
                    "type": "datetime",
                    "fast": true
                },
                {
                    "name": "body",
                    "type": "text",
                    "stored": true
                },
                {
                    "name": "response_date",
                    "type": "i64",
                    "stored": true,
                    "fast": true
                }
            ],
            "timestamp_field": "timestamp",
            "store_source": true
        }"#;
        let doc_mapping = serde_json::from_str(doc_mapping_json).unwrap();
        let ingest_settings = IngestSettings::default();
        let indexing_settings = IndexingSettings::default();
        let search_settings = SearchSettings {
            default_search_fields: vec!["body".to_string()],
        };
        IndexMetadata::new(IndexConfig {
            index_id: index_id.to_string(),
            index_uri,
            doc_mapping,
            ingest_settings,
            indexing_settings,
            search_settings,
            retention_policy_opt: None,
        })
    }

    #[test]
    fn test_validate_request_and_build_metadatas_fail_with_incompatible_sort_field_types() {
        let request_query_ast = qast_helper("body:test", &[]);
        let search_request = quickwit_proto::search::SearchRequest {
            index_id_patterns: vec!["test-index".to_string()],
            query_ast: serde_json::to_string(&request_query_ast).unwrap(),
            max_hits: 10,
            start_offset: 10,
            sort_fields: vec![SortField {
                field_name: "response_date".to_string(),
                sort_order: SortOrder::Desc as i32,
                sort_datetime_format: None,
            }],
            ..Default::default()
        };
        let index_metadata = IndexMetadata::for_test("test-index-1", "ram:///test-index-1");
        let index_metadata_with_other_config =
            index_metadata_for_multi_indexes_test_with_incompatible_sort_type(
                "test-index-2",
                "ram:///test-index-2",
            );
        let search_error = validate_request_and_build_metadata(
            &[index_metadata, index_metadata_with_other_config],
            &search_request,
        )
        .unwrap_err();
        assert_eq!(
            search_error.to_string(),
            "sort datetime field `response_date` must be of type datetime on all indexes"
        );
    }

    #[test]
    fn test_convert_sort_datetime_value() {
        let mut sort_value = SortValue::U64(1617000000000000000);
        convert_sort_datetime_value(&mut sort_value, SortDatetimeFormat::UnixTimestampMillis)
            .unwrap();
        assert_eq!(sort_value, SortValue::U64(1617000000000));
        let mut sort_value = SortValue::I64(1617000000000000000);
        convert_sort_datetime_value(&mut sort_value, SortDatetimeFormat::UnixTimestampMillis)
            .unwrap();
        assert_eq!(sort_value, SortValue::I64(1617000000000));

        // conversion with float values should fail.
        let mut sort_value = SortValue::F64(1617000000000000000.0);
        let error =
            convert_sort_datetime_value(&mut sort_value, SortDatetimeFormat::UnixTimestampMillis)
                .unwrap_err();
        assert_eq!(
            error.to_string(),
            "internal error: `datetime conversion are only support for u64 and i64 sort values, \
             not `F64(1.617e18)``"
        );
    }

    #[test]
    fn test_convert_sort_datetime_value_into_nanos() {
        let mut sort_value = SortValue::U64(1617000000000);
        convert_sort_datetime_value_into_nanos(
            &mut sort_value,
            SortDatetimeFormat::UnixTimestampMillis,
        )
        .unwrap();
        assert_eq!(sort_value, SortValue::U64(1617000000000000000));
        let mut sort_value = SortValue::I64(1617000000000);
        convert_sort_datetime_value_into_nanos(
            &mut sort_value,
            SortDatetimeFormat::UnixTimestampMillis,
        )
        .unwrap();
        assert_eq!(sort_value, SortValue::I64(1617000000000000000));

        // conversion with a too large millisecond value should fail.
        let mut sort_value = SortValue::I64(1617000000000000);
        let error = convert_sort_datetime_value_into_nanos(
            &mut sort_value,
            SortDatetimeFormat::UnixTimestampMillis,
        )
        .unwrap_err();
        assert_eq!(
            error.to_string(),
            "internal error: `sort value defined in milliseconds is too large and cannot be \
             converted into nanoseconds: 1617000000000000`"
        );
        // conversion with float values should fail.
        let mut sort_value = SortValue::F64(1617000000000000.0);
        let error = convert_sort_datetime_value_into_nanos(
            &mut sort_value,
            SortDatetimeFormat::UnixTimestampMillis,
        )
        .unwrap_err();
        assert_eq!(
            error.to_string(),
            "internal error: `datetime conversion are only support for u64 and i64 sort values, \
             not `F64(1617000000000000.0)``"
        );
    }

    #[test]
    fn test_validate_sort_field_types_with_doc_and_shard_doc() {
        let sort_fields = vec![
            SortField {
                field_name: "_doc".to_string(),
                sort_order: 0,
                sort_datetime_format: None,
            },
            SortField {
                field_name: "_shard_doc".to_string(),
                sort_order: 0,
                sort_datetime_format: None,
            },
        ];
        let mut schema_builder = Schema::builder();
        schema_builder.add_date_field("timestamp", FAST);
        schema_builder.add_u64_field("id", FAST);
        let schema = schema_builder.build();
        let mut sort_field_are_datetime = HashMap::new();
        validate_sort_field_types(&schema, &sort_fields, &mut sort_field_are_datetime).unwrap();
        assert_eq!(sort_field_are_datetime.get("_doc"), Some(&false));
        assert_eq!(sort_field_are_datetime.get("_shard_doc"), Some(&false));
    }

    #[test]
    fn test_validate_sort_field_types_valid() {
        let sort_fields = vec![
            SortField {
                field_name: "timestamp".to_string(),
                sort_order: 0,
                sort_datetime_format: None,
            },
            SortField {
                field_name: "id".to_string(),
                sort_order: 0,
                sort_datetime_format: None,
            },
        ];
        let mut schema_builder = Schema::builder();
        schema_builder.add_date_field("timestamp", FAST);
        schema_builder.add_u64_field("id", FAST);
        let schema = schema_builder.build();
        let mut sort_field_are_datetime = HashMap::new();
        validate_sort_field_types(&schema, &sort_fields, &mut sort_field_are_datetime).unwrap();
        assert_eq!(sort_field_are_datetime.get("timestamp"), Some(&true));
        assert_eq!(sort_field_are_datetime.get("id"), Some(&false));
    }

    #[test]
    fn test_validate_sort_field_types_with_inconsistent_datetime_type() {
        let sort_fields = vec![
            SortField {
                field_name: "timestamp".to_string(),
                sort_order: 0,
                sort_datetime_format: None,
            },
            SortField {
                field_name: "id".to_string(),
                sort_order: 0,
                sort_datetime_format: None,
            },
        ];
        let mut schema_builder = Schema::builder();
        schema_builder.add_date_field("timestamp", FAST);
        schema_builder.add_u64_field("id", FAST);
        let schema = schema_builder.build();
        {
            let mut sort_field_are_datetime = HashMap::new();
            sort_field_are_datetime.insert("timestamp".to_string(), false);
            sort_field_are_datetime.insert("id".to_string(), false);
            let error =
                validate_sort_field_types(&schema, &sort_fields, &mut sort_field_are_datetime)
                    .unwrap_err();
            assert_eq!(
                error.to_string(),
                "sort datetime field `timestamp` must be of type datetime on all indexes"
            );
        }
        {
            let mut sort_field_are_datetime = HashMap::new();
            sort_field_are_datetime.insert("id".to_string(), true);
            let error =
                validate_sort_field_types(&schema, &sort_fields, &mut sort_field_are_datetime)
                    .unwrap_err();
            assert_eq!(
                error.to_string(),
                "sort datetime field `id` must be of type datetime on all indexes"
            );
        }
    }

    #[test]
    fn test_validate_sort_by_fields_with_datetime_format_ok() {
        let sort_fields = vec![
            SortField {
                field_name: "timestamp".to_string(),
                sort_order: 0,
                sort_datetime_format: Some(SortDatetimeFormat::UnixTimestampMillis as i32),
            },
            SortField {
                field_name: "id".to_string(),
                sort_order: 0,
                sort_datetime_format: None,
            },
        ];
        validate_sort_by_fields_and_search_after(&sort_fields, &None).unwrap();
    }

    #[test]
    fn test_validate_sort_by_fields_and_search_after_ok() {
        let sort_fields = vec![
            SortField {
                field_name: "timestamp".to_string(),
                sort_order: 0,
                sort_datetime_format: Some(SortDatetimeFormat::UnixTimestampMillis as i32),
            },
            SortField {
                field_name: "id".to_string(),
                sort_order: 0,
                sort_datetime_format: None,
            },
        ];
        let partial_hit = PartialHit {
            sort_value: Some(SortByValue {
                sort_value: Some(SortValue::U64(1)),
            }),
            sort_value2: Some(SortByValue {
                sort_value: Some(SortValue::U64(2)),
            }),
            split_id: "".to_string(),
            segment_ord: 0,
            doc_id: 0,
        };
        validate_sort_by_fields_and_search_after(&sort_fields, &Some(partial_hit)).unwrap();
    }

    #[test]
    fn test_validate_sort_by_fields_and_search_after_ok_with_doc_sort_field() {
        let sort_fields = vec![
            SortField {
                field_name: "timestamp".to_string(),
                sort_order: 0,
                sort_datetime_format: Some(SortDatetimeFormat::UnixTimestampMillis as i32),
            },
            SortField {
                field_name: "_doc".to_string(),
                sort_order: 0,
                sort_datetime_format: None,
            },
        ];
        let partial_hit = PartialHit {
            sort_value: Some(SortByValue {
                sort_value: Some(SortValue::U64(1)),
            }),
            sort_value2: None,
            split_id: "split1".to_string(),
            segment_ord: 1,
            doc_id: 1,
        };
        validate_sort_by_fields_and_search_after(&sort_fields, &Some(partial_hit)).unwrap();
    }

    #[test]
    fn test_validate_sort_by_field_type() {
        let mut schema_builder = Schema::builder();
        let timestamp_field = schema_builder.add_date_field("timestamp", FAST);
        let id_field = schema_builder.add_u64_field("id", FAST);
        let no_fast_field = schema_builder.add_u64_field("no_fast", STORED);
        let text_field = schema_builder.add_text_field("text", STORED);
        let schema = schema_builder.build();
        {
            let sort_by_field_entry = schema.get_field_entry(timestamp_field);
            validate_sort_by_field_type(sort_by_field_entry, false).unwrap();
            validate_sort_by_field_type(sort_by_field_entry, true).unwrap();
        }
        {
            let sort_by_field_entry = schema.get_field_entry(id_field);
            validate_sort_by_field_type(sort_by_field_entry, false).unwrap();
            let error = validate_sort_by_field_type(sort_by_field_entry, true).unwrap_err();
            assert_eq!(
                error.to_string(),
                "Invalid argument: sort by field with a timestamp format must be a datetime field \
                 and the field `id` is not"
            );
        }
        {
            let sort_by_field_entry = schema.get_field_entry(no_fast_field);
            let error = validate_sort_by_field_type(sort_by_field_entry, true).unwrap_err();
            assert_eq!(
                error.to_string(),
                "Invalid argument: sort by field must be a fast field, please add the fast \
                 property to your field `no_fast`"
            );
        }
        {
            let sort_by_field_entry = schema.get_field_entry(text_field);
            let error = validate_sort_by_field_type(sort_by_field_entry, true).unwrap_err();
            assert_eq!(
                error.to_string(),
                "Invalid argument: sort by field on type text is currently not supported `text`"
            );
        }
    }

    #[test]
    fn test_validate_sort_by_fields_and_search_after_invalid_1() {
        // 2 sort fields + search after with only one sort value is invalid.
        let sort_fields = vec![
            SortField {
                field_name: "timestamp".to_string(),
                sort_order: 0,
                sort_datetime_format: Some(SortDatetimeFormat::UnixTimestampMillis as i32),
            },
            SortField {
                field_name: "id".to_string(),
                sort_order: 0,
                sort_datetime_format: None,
            },
        ];
        let partial_hit = PartialHit {
            sort_value: Some(SortByValue {
                sort_value: Some(SortValue::U64(1)),
            }),
            sort_value2: None,
            split_id: "split1".to_string(),
            segment_ord: 1,
            doc_id: 1,
        };
        let error =
            validate_sort_by_fields_and_search_after(&sort_fields, &Some(partial_hit)).unwrap_err();
        assert_eq!(
            error.to_string(),
            "Invalid argument: `search_after` must have the same number of sort values as sort by \
             fields [\"timestamp\", \"id\"]"
        );
    }

    #[test]
    fn test_validate_sort_by_fields_and_search_after_invalid_with_missing_split_id() {
        // 2 sort fields + search after with only one sort value is invalid.
        let sort_fields = vec![
            SortField {
                field_name: "timestamp".to_string(),
                sort_order: 0,
                sort_datetime_format: Some(SortDatetimeFormat::UnixTimestampMillis as i32),
            },
            SortField {
                field_name: "_doc".to_string(),
                sort_order: 0,
                sort_datetime_format: None,
            },
        ];
        let partial_hit = PartialHit {
            sort_value: Some(SortByValue {
                sort_value: Some(SortValue::U64(1)),
            }),
            sort_value2: None,
            split_id: "".to_string(),
            segment_ord: 1,
            doc_id: 1,
        };
        let error =
            validate_sort_by_fields_and_search_after(&sort_fields, &Some(partial_hit)).unwrap_err();
        assert_eq!(
            error.to_string(),
            "Invalid argument: search_after with a sort field `_doc` must define a split ID, \
             segment ID and doc ID values"
        );
    }

    #[test]
    fn test_validate_sort_by_fields_and_search_valid_1() {
        // 2 sort fields + search after with only one sort value is invalid.
        let sort_fields = vec![
            SortField {
                field_name: "timestamp".to_string(),
                sort_order: 0,
                sort_datetime_format: Some(SortDatetimeFormat::UnixTimestampMillis as i32),
            },
            SortField {
                field_name: "id".to_string(),
                sort_order: 0,
                sort_datetime_format: None,
            },
        ];
        let partial_hit = PartialHit {
            sort_value: Some(SortByValue {
                sort_value: Some(SortValue::U64(1)),
            }),
            sort_value2: None,
            split_id: "split1".to_string(),
            segment_ord: 1,
            doc_id: 1,
        };
        let error =
            validate_sort_by_fields_and_search_after(&sort_fields, &Some(partial_hit)).unwrap_err();
        assert_eq!(
            error.to_string(),
            "Invalid argument: `search_after` must have the same number of sort values as sort by \
             fields [\"timestamp\", \"id\"]"
        );
    }

    #[test]
    fn test_validate_sort_by_field_type_invalid() {
        // sort non-datetime field with a datetime format is invalid.
        let mut schema_builder = Schema::builder();
        let field = schema_builder.add_u64_field("timestamp", FAST);
        let schema = schema_builder.build();
        let field_entry = schema.get_field_entry(field);
        let error = validate_sort_by_field_type(field_entry, true).unwrap_err();
        assert_eq!(
            error.to_string(),
            "Invalid argument: sort by field with a timestamp format must be a datetime field and \
             the field `timestamp` is not"
        );
    }

    #[test]
    fn test_validate_sort_by_fields_and_search_after_invalid_3() {
        // 3 sort fields is not possible.
        let sort_fields = vec![
            SortField {
                field_name: "timestamp".to_string(),
                sort_order: 0,
                sort_datetime_format: Some(SortDatetimeFormat::UnixTimestampMillis as i32),
            },
            SortField {
                field_name: "timestamp".to_string(),
                sort_order: 0,
                sort_datetime_format: Some(SortDatetimeFormat::UnixTimestampMillis as i32),
            },
            SortField {
                field_name: "timestamp".to_string(),
                sort_order: 0,
                sort_datetime_format: Some(SortDatetimeFormat::UnixTimestampMillis as i32),
            },
        ];
        let error = validate_sort_by_fields_and_search_after(&sort_fields, &None).unwrap_err();
        assert_eq!(
            error.to_string(),
            "Invalid argument: sort by field must be up to 2 fields, got 3"
        );
    }

    fn mock_partial_hit(
        split_id: &str,
        sort_value: u64,
        doc_id: u32,
    ) -> quickwit_proto::search::PartialHit {
        quickwit_proto::search::PartialHit {
            sort_value: Some(SortValue::U64(sort_value).into()),
            sort_value2: None,
            split_id: split_id.to_string(),
            segment_ord: 1,
            doc_id,
        }
    }

    fn mock_partial_hit_opt_sort_value(
        split_id: &str,
        sort_value: Option<u64>,
        doc_id: u32,
    ) -> quickwit_proto::search::PartialHit {
        quickwit_proto::search::PartialHit {
            sort_value: sort_value.map(|sort_value| SortValue::U64(sort_value).into()),
            sort_value2: None,
            split_id: split_id.to_string(),
            segment_ord: 1,
            doc_id,
        }
    }

    fn get_doc_for_fetch_req(
        fetch_docs_req: quickwit_proto::search::FetchDocsRequest,
    ) -> Vec<quickwit_proto::search::LeafHit> {
        fetch_docs_req
            .partial_hits
            .into_iter()
            .map(|req| quickwit_proto::search::LeafHit {
                leaf_json: serde_json::to_string_pretty(&serde_json::json!({
                    "title": [req.doc_id.to_string()],
                    "body": ["test 1"],
                    "url": ["http://127.0.0.1/1"]
                }))
                .expect("Json serialization should not fail"),
                partial_hit: Some(req),
                leaf_snippet_json: None,
            })
            .collect()
    }

    #[tokio::test]
    async fn test_root_search_offset_out_of_bounds_1085() -> anyhow::Result<()> {
        let search_request = quickwit_proto::search::SearchRequest {
            index_id_patterns: vec!["test-index".to_string()],
            query_ast: qast_json_helper("test", &["body"]),
            max_hits: 10,
            start_offset: 10,
            ..Default::default()
        };
        let mut mock_metastore = MockMetastoreService::new();
        let index_metadata = IndexMetadata::for_test("test-index", "ram:///test-index");
        let index_uid = index_metadata.index_uid.clone();
        mock_metastore
            .expect_list_indexes_metadata()
            .returning(move |_indexes_metadata_request| {
                Ok(ListIndexesMetadataResponse::for_test(vec![
                    index_metadata.clone(),
                ]))
            });
        mock_metastore
            .expect_list_splits()
            .returning(move |_filter| {
                let splits = vec![
                    MockSplitBuilder::new("split1")
                        .with_index_uid(&index_uid)
                        .build(),
                    MockSplitBuilder::new("split2")
                        .with_index_uid(&index_uid)
                        .build(),
                ];
                let splits_response = ListSplitsResponse::try_from_splits(splits).unwrap();
                Ok(ServiceStream::from(vec![Ok(splits_response)]))
            });
        let mut mock_search_service_2 = MockSearchService::new();
        mock_search_service_2.expect_leaf_search().returning(
            |_leaf_search_req: quickwit_proto::search::LeafSearchRequest| {
                Ok(quickwit_proto::search::LeafSearchResponse {
                    num_hits: 3,
                    partial_hits: vec![
                        mock_partial_hit("split1", 3, 1),
                        mock_partial_hit("split1", 2, 2),
                        mock_partial_hit("split1", 1, 3),
                    ],
                    failed_splits: Vec::new(),
                    num_attempted_splits: 1,
                    ..Default::default()
                })
            },
        );
        mock_search_service_2.expect_fetch_docs().returning(
            |fetch_docs_req: quickwit_proto::search::FetchDocsRequest| {
                Ok(quickwit_proto::search::FetchDocsResponse {
                    hits: get_doc_for_fetch_req(fetch_docs_req),
                })
            },
        );
        let mut mock_search_service_1 = MockSearchService::new();
        mock_search_service_1.expect_leaf_search().returning(
            |_leaf_search_req: quickwit_proto::search::LeafSearchRequest| {
                Ok(quickwit_proto::search::LeafSearchResponse {
                    num_hits: 2,
                    partial_hits: vec![
                        mock_partial_hit("split2", 3, 1),
                        mock_partial_hit("split2", 1, 3),
                    ],
                    failed_splits: Vec::new(),
                    num_attempted_splits: 1,
                    ..Default::default()
                })
            },
        );
        mock_search_service_1.expect_fetch_docs().returning(
            |fetch_docs_req: quickwit_proto::search::FetchDocsRequest| {
                Ok(quickwit_proto::search::FetchDocsResponse {
                    hits: get_doc_for_fetch_req(fetch_docs_req),
                })
            },
        );
        let searcher_pool = searcher_pool_for_test([
            ("127.0.0.1:1001", mock_search_service_1),
            ("127.0.0.1:1002", mock_search_service_2),
        ]);
        let search_job_placer = SearchJobPlacer::new(searcher_pool);
        let cluster_client = ClusterClient::new(search_job_placer.clone());

        let search_response = root_search(
            &SearcherContext::for_test(),
            search_request,
            MetastoreServiceClient::from_mock(mock_metastore),
            &cluster_client,
        )
        .await
        .unwrap();
        assert_eq!(search_response.num_hits, 5);
        assert_eq!(search_response.hits.len(), 0);
        Ok(())
    }

    #[tokio::test]
    async fn test_root_search_single_split() -> anyhow::Result<()> {
        let search_request = quickwit_proto::search::SearchRequest {
            index_id_patterns: vec!["test-index".to_string()],
            query_ast: qast_json_helper("test", &["body"]),
            max_hits: 10,
            ..Default::default()
        };
        let mut mock_metastore = MockMetastoreService::new();
        let index_metadata = IndexMetadata::for_test("test-index", "ram:///test-index");
        let index_uid = index_metadata.index_uid.clone();
        mock_metastore
            .expect_list_indexes_metadata()
            .returning(move |_index_ids_query| {
                Ok(ListIndexesMetadataResponse::for_test(vec![
                    index_metadata.clone(),
                ]))
            });
        mock_metastore
            .expect_list_splits()
            .returning(move |_list_splits_request| {
                let splits = vec![
                    MockSplitBuilder::new("split1")
                        .with_index_uid(&index_uid)
                        .build(),
                ];
                let splits_response = ListSplitsResponse::try_from_splits(splits).unwrap();
                Ok(ServiceStream::from(vec![Ok(splits_response)]))
            });
        let mut mock_search_service = MockSearchService::new();
        mock_search_service.expect_leaf_search().returning(
            |_leaf_search_req: quickwit_proto::search::LeafSearchRequest| {
                Ok(quickwit_proto::search::LeafSearchResponse {
                    num_hits: 3,
                    partial_hits: vec![
                        mock_partial_hit("split1", 3, 1),
                        mock_partial_hit("split1", 2, 2),
                        mock_partial_hit("split1", 1, 3),
                    ],
                    failed_splits: Vec::new(),
                    num_attempted_splits: 1,
                    ..Default::default()
                })
            },
        );
        mock_search_service.expect_fetch_docs().returning(
            |fetch_docs_req: quickwit_proto::search::FetchDocsRequest| {
                Ok(quickwit_proto::search::FetchDocsResponse {
                    hits: get_doc_for_fetch_req(fetch_docs_req),
                })
            },
        );
        let searcher_pool = searcher_pool_for_test([("127.0.0.1:1001", mock_search_service)]);
        let search_job_placer = SearchJobPlacer::new(searcher_pool);
        let cluster_client = ClusterClient::new(search_job_placer.clone());

        let searcher_context = SearcherContext::for_test();
        let search_response = root_search(
            &searcher_context,
            search_request,
            MetastoreServiceClient::from_mock(mock_metastore),
            &cluster_client,
        )
        .await
        .unwrap();
        assert_eq!(search_response.num_hits, 3);
        assert_eq!(search_response.hits.len(), 3);
        Ok(())
    }

    #[tokio::test]
    async fn test_root_search_multiple_splits() -> anyhow::Result<()> {
        let search_request = quickwit_proto::search::SearchRequest {
            index_id_patterns: vec!["test-index".to_string()],
            query_ast: qast_json_helper("test", &["body"]),
            max_hits: 10,
            ..Default::default()
        };
        let mut mock_metastore = MockMetastoreService::new();
        let index_metadata = IndexMetadata::for_test("test-index", "ram:///test-index");
        let index_uid = index_metadata.index_uid.clone();
        mock_metastore
            .expect_list_indexes_metadata()
            .returning(move |_index_ids_query| {
                Ok(ListIndexesMetadataResponse::for_test(vec![
                    index_metadata.clone(),
                ]))
            });
        mock_metastore
            .expect_list_splits()
            .returning(move |_filter| {
                let splits = vec![
                    MockSplitBuilder::new("split1")
                        .with_index_uid(&index_uid)
                        .build(),
                    MockSplitBuilder::new("split2")
                        .with_index_uid(&index_uid)
                        .build(),
                ];
                let splits_response = ListSplitsResponse::try_from_splits(splits).unwrap();
                Ok(ServiceStream::from(vec![Ok(splits_response)]))
            });
        let mut mock_search_service_1 = MockSearchService::new();
        mock_search_service_1.expect_leaf_search().returning(
            |_leaf_search_req: quickwit_proto::search::LeafSearchRequest| {
                Ok(quickwit_proto::search::LeafSearchResponse {
                    num_hits: 2,
                    partial_hits: vec![
                        mock_partial_hit("split1", 3, 1),
                        mock_partial_hit("split1", 1, 3),
                    ],
                    failed_splits: Vec::new(),
                    num_attempted_splits: 1,
                    ..Default::default()
                })
            },
        );
        mock_search_service_1.expect_fetch_docs().returning(
            |fetch_docs_req: quickwit_proto::search::FetchDocsRequest| {
                Ok(quickwit_proto::search::FetchDocsResponse {
                    hits: get_doc_for_fetch_req(fetch_docs_req),
                })
            },
        );
        let mut mock_search_service_2 = MockSearchService::new();
        mock_search_service_2.expect_leaf_search().returning(
            |_leaf_search_req: quickwit_proto::search::LeafSearchRequest| {
                Ok(quickwit_proto::search::LeafSearchResponse {
                    num_hits: 1,
                    partial_hits: vec![mock_partial_hit("split2", 2, 2)],
                    failed_splits: Vec::new(),
                    num_attempted_splits: 1,
                    ..Default::default()
                })
            },
        );
        mock_search_service_2.expect_fetch_docs().returning(
            |fetch_docs_req: quickwit_proto::search::FetchDocsRequest| {
                Ok(quickwit_proto::search::FetchDocsResponse {
                    hits: get_doc_for_fetch_req(fetch_docs_req),
                })
            },
        );
        let searcher_pool = searcher_pool_for_test([
            ("127.0.0.1:1001", mock_search_service_1),
            ("127.0.0.1:1002", mock_search_service_2),
        ]);
        let search_job_placer = SearchJobPlacer::new(searcher_pool);
        let cluster_client = ClusterClient::new(search_job_placer.clone());
        let search_response = root_search(
            &SearcherContext::for_test(),
            search_request,
            MetastoreServiceClient::from_mock(mock_metastore),
            &cluster_client,
        )
        .await
        .unwrap();
        assert_eq!(search_response.num_hits, 3);
        assert_eq!(search_response.hits.len(), 3);
        Ok(())
    }

    #[tokio::test]
    async fn test_root_search_multiple_splits_with_failure() -> anyhow::Result<()> {
        let search_request = quickwit_proto::search::SearchRequest {
            index_id_patterns: vec!["test-index".to_string()],
            query_ast: qast_json_helper("test", &["body"]),
            max_hits: 2,
            ..Default::default()
        };
        let mut mock_metastore = MockMetastoreService::new();
        let index_metadata = IndexMetadata::for_test("test-index", "ram:///test-index");
        let index_uid = index_metadata.index_uid.clone();
        mock_metastore
            .expect_list_indexes_metadata()
            .returning(move |_index_ids_query| {
                Ok(ListIndexesMetadataResponse::for_test(vec![
                    index_metadata.clone(),
                ]))
            });
        mock_metastore
            .expect_list_splits()
            .returning(move |_filter| {
                let splits = vec![
                    MockSplitBuilder::new("split1")
                        .with_index_uid(&index_uid)
                        .build(),
                    MockSplitBuilder::new("split2")
                        .with_index_uid(&index_uid)
                        .build(),
                ];
                let splits_response = ListSplitsResponse::try_from_splits(splits).unwrap();
                Ok(ServiceStream::from(vec![Ok(splits_response)]))
            });
        let mut mock_search_service_1 = MockSearchService::new();
        mock_search_service_1.expect_leaf_search().returning(
            |leaf_search_req: quickwit_proto::search::LeafSearchRequest| {
                if leaf_search_req.leaf_requests[0].split_offsets.len() == 2 {
                    Ok(quickwit_proto::search::LeafSearchResponse {
                        num_hits: 2,
                        partial_hits: vec![
                            mock_partial_hit("split1", 3, 1),
                            mock_partial_hit("split1", 1, 3),
                        ],
                        failed_splits: vec![SplitSearchError {
                            error: "some error".to_string(),
                            split_id: "split2".to_string(),
                            retryable_error: true,
                        }],
                        num_attempted_splits: 2,
                        ..Default::default()
                    })
                } else {
                    Ok(quickwit_proto::search::LeafSearchResponse {
                        num_hits: 1,
                        partial_hits: vec![mock_partial_hit("split2", 2, 2)],
                        failed_splits: Vec::new(),
                        num_attempted_splits: 1,
                        ..Default::default()
                    })
                }
            },
        );
        mock_search_service_1.expect_fetch_docs().returning(
            |fetch_docs_req: quickwit_proto::search::FetchDocsRequest| {
                Ok(quickwit_proto::search::FetchDocsResponse {
                    hits: get_doc_for_fetch_req(fetch_docs_req),
                })
            },
        );
        let searcher_pool = searcher_pool_for_test([("127.0.0.1:1001", mock_search_service_1)]);
        let search_job_placer = SearchJobPlacer::new(searcher_pool);
        let cluster_client = ClusterClient::new(search_job_placer.clone());
        let search_response = root_search(
            &SearcherContext::for_test(),
            search_request,
            MetastoreServiceClient::from_mock(mock_metastore),
            &cluster_client,
        )
        .await
        .unwrap();
        assert_eq!(search_response.num_hits, 3);
        assert_eq!(search_response.hits.len(), 2);
        Ok(())
    }

    #[tokio::test]
    async fn test_root_search_multiple_splits_sort_heteregeneous_field_ascending()
    -> anyhow::Result<()> {
        let search_request = quickwit_proto::search::SearchRequest {
            index_id_patterns: vec!["test-index".to_string()],
            query_ast: qast_json_helper("test", &["body"]),
            max_hits: 10,
            sort_fields: vec![SortField {
                field_name: "response_date".to_string(),
                sort_order: SortOrder::Asc.into(),
                sort_datetime_format: Some(SortDatetimeFormat::UnixTimestampNanos as i32),
            }],
            ..Default::default()
        };
        let mut mock_metastore = MockMetastoreService::new();
        let index_metadata = IndexMetadata::for_test("test-index", "ram:///test-index");
        let index_uid = index_metadata.index_uid.clone();
        mock_metastore
            .expect_list_indexes_metadata()
            .returning(move |_index_ids_query| {
                Ok(ListIndexesMetadataResponse::for_test(vec![
                    index_metadata.clone(),
                ]))
            });
        mock_metastore
            .expect_list_splits()
            .returning(move |_filter| {
                let splits = vec![
                    MockSplitBuilder::new("split1")
                        .with_index_uid(&index_uid)
                        .build(),
                    MockSplitBuilder::new("split2")
                        .with_index_uid(&index_uid)
                        .build(),
                ];
                let splits_response = ListSplitsResponse::try_from_splits(splits).unwrap();
                Ok(ServiceStream::from(vec![Ok(splits_response)]))
            });
        let mut mock_search_service_1 = MockSearchService::new();
        mock_search_service_1.expect_leaf_search().returning(
            |_leaf_search_req: quickwit_proto::search::LeafSearchRequest| {
                Ok(quickwit_proto::search::LeafSearchResponse {
                    num_hits: 2,
                    partial_hits: vec![
                        quickwit_proto::search::PartialHit {
                            sort_value: Some(SortValue::U64(2u64).into()),
                            sort_value2: None,
                            split_id: "split1".to_string(),
                            segment_ord: 0,
                            doc_id: 0,
                        },
                        quickwit_proto::search::PartialHit {
                            sort_value: None,
                            sort_value2: None,
                            split_id: "split1".to_string(),
                            segment_ord: 0,
                            doc_id: 1,
                        },
                    ],
                    failed_splits: Vec::new(),
                    num_attempted_splits: 1,
                    ..Default::default()
                })
            },
        );
        mock_search_service_1.expect_fetch_docs().returning(
            |fetch_docs_req: quickwit_proto::search::FetchDocsRequest| {
                Ok(quickwit_proto::search::FetchDocsResponse {
                    hits: get_doc_for_fetch_req(fetch_docs_req),
                })
            },
        );
        let mut mock_search_service_2 = MockSearchService::new();
        mock_search_service_2.expect_leaf_search().returning(
            |_leaf_search_req: quickwit_proto::search::LeafSearchRequest| {
                Ok(quickwit_proto::search::LeafSearchResponse {
                    num_hits: 3,
                    partial_hits: vec![
                        quickwit_proto::search::PartialHit {
                            sort_value: Some(SortValue::I64(-1i64).into()),
                            sort_value2: None,
                            split_id: "split2".to_string(),
                            segment_ord: 0,
                            doc_id: 1,
                        },
                        quickwit_proto::search::PartialHit {
                            sort_value: Some(SortValue::I64(1i64).into()),
                            sort_value2: None,
                            split_id: "split2".to_string(),
                            segment_ord: 0,
                            doc_id: 0,
                        },
                        quickwit_proto::search::PartialHit {
                            sort_value: None,
                            sort_value2: None,
                            split_id: "split2".to_string(),
                            segment_ord: 0,
                            doc_id: 2,
                        },
                    ],
                    failed_splits: Vec::new(),
                    num_attempted_splits: 1,
                    ..Default::default()
                })
            },
        );
        mock_search_service_2.expect_fetch_docs().returning(
            |fetch_docs_req: quickwit_proto::search::FetchDocsRequest| {
                Ok(quickwit_proto::search::FetchDocsResponse {
                    hits: get_doc_for_fetch_req(fetch_docs_req),
                })
            },
        );
        let searcher_pool = searcher_pool_for_test([
            ("127.0.0.1:1001", mock_search_service_1),
            ("127.0.0.1:1002", mock_search_service_2),
        ]);
        let search_job_placer = SearchJobPlacer::new(searcher_pool);
        let cluster_client = ClusterClient::new(search_job_placer.clone());
        let search_response = root_search(
            &SearcherContext::for_test(),
            search_request.clone(),
            MetastoreServiceClient::from_mock(mock_metastore),
            &cluster_client,
        )
        .await?;

        assert_eq!(search_response.num_hits, 5);
        assert_eq!(search_response.hits.len(), 5);
        assert_eq!(
            search_response.hits[0].partial_hit.as_ref().unwrap(),
            &PartialHit {
                split_id: "split2".to_string(),
                segment_ord: 0,
                doc_id: 1,
                sort_value: Some(SortValue::I64(-1i64).into()),
                sort_value2: None,
            }
        );
        assert_eq!(
            search_response.hits[1].partial_hit.as_ref().unwrap(),
            &PartialHit {
                split_id: "split2".to_string(),
                segment_ord: 0,
                doc_id: 0,
                sort_value: Some(SortValue::I64(1i64).into()),
                sort_value2: None,
            }
        );
        assert_eq!(
            search_response.hits[2].partial_hit.as_ref().unwrap(),
            &PartialHit {
                split_id: "split1".to_string(),
                segment_ord: 0,
                doc_id: 0,
                sort_value: Some(SortValue::U64(2u64).into()),
                sort_value2: None,
            }
        );
        assert_eq!(
            search_response.hits[3].partial_hit.as_ref().unwrap(),
            &PartialHit {
                split_id: "split1".to_string(),
                segment_ord: 0,
                doc_id: 1,
                sort_value: None,
                sort_value2: None,
            }
        );
        assert_eq!(
            search_response.hits[4].partial_hit.as_ref().unwrap(),
            &PartialHit {
                split_id: "split2".to_string(),
                segment_ord: 0,
                doc_id: 2,
                sort_value: None,
                sort_value2: None,
            }
        );
        Ok(())
    }

    #[tokio::test]
    async fn test_root_search_multiple_splits_sort_heteregeneous_field_descending()
    -> anyhow::Result<()> {
        let search_request = quickwit_proto::search::SearchRequest {
            index_id_patterns: vec!["test-index".to_string()],
            query_ast: qast_json_helper("test", &["body"]),
            max_hits: 10,
            sort_fields: vec![SortField {
                field_name: "response_date".to_string(),
                sort_order: SortOrder::Desc.into(),
                sort_datetime_format: Some(SortDatetimeFormat::UnixTimestampNanos as i32),
            }],
            ..Default::default()
        };
        let mut mock_metastore = MockMetastoreService::new();
        let index_metadata = IndexMetadata::for_test("test-index", "ram:///test-index");
        let index_uid = index_metadata.index_uid.clone();
        mock_metastore
            .expect_list_indexes_metadata()
            .returning(move |_index_ids_query| {
                Ok(ListIndexesMetadataResponse::for_test(vec![
                    index_metadata.clone(),
                ]))
            });
        mock_metastore
            .expect_list_splits()
            .returning(move |_filter| {
                let splits = vec![
                    MockSplitBuilder::new("split1")
                        .with_index_uid(&index_uid)
                        .build(),
                    MockSplitBuilder::new("split2")
                        .with_index_uid(&index_uid)
                        .build(),
                ];
                let splits_response = ListSplitsResponse::try_from_splits(splits).unwrap();
                Ok(ServiceStream::from(vec![Ok(splits_response)]))
            });
        let mut mock_search_service_1 = MockSearchService::new();
        mock_search_service_1.expect_leaf_search().returning(
            |_leaf_search_req: quickwit_proto::search::LeafSearchRequest| {
                Ok(quickwit_proto::search::LeafSearchResponse {
                    num_hits: 2,
                    partial_hits: vec![
                        quickwit_proto::search::PartialHit {
                            sort_value: Some(SortValue::U64(2u64).into()),
                            sort_value2: None,
                            split_id: "split1".to_string(),
                            segment_ord: 0,
                            doc_id: 0,
                        },
                        quickwit_proto::search::PartialHit {
                            sort_value: None,
                            sort_value2: None,
                            split_id: "split1".to_string(),
                            segment_ord: 0,
                            doc_id: 1,
                        },
                    ],
                    failed_splits: Vec::new(),
                    num_attempted_splits: 1,
                    ..Default::default()
                })
            },
        );
        mock_search_service_1.expect_fetch_docs().returning(
            |fetch_docs_req: quickwit_proto::search::FetchDocsRequest| {
                Ok(quickwit_proto::search::FetchDocsResponse {
                    hits: get_doc_for_fetch_req(fetch_docs_req),
                })
            },
        );
        let mut mock_search_service_2 = MockSearchService::new();
        mock_search_service_2.expect_leaf_search().returning(
            |_leaf_search_req: quickwit_proto::search::LeafSearchRequest| {
                Ok(quickwit_proto::search::LeafSearchResponse {
                    num_hits: 3,
                    partial_hits: vec![
                        quickwit_proto::search::PartialHit {
                            sort_value: Some(SortValue::I64(1i64).into()),
                            sort_value2: None,
                            split_id: "split2".to_string(),
                            segment_ord: 0,
                            doc_id: 0,
                        },
                        quickwit_proto::search::PartialHit {
                            sort_value: Some(SortValue::I64(-1i64).into()),
                            sort_value2: None,
                            split_id: "split2".to_string(),
                            segment_ord: 0,
                            doc_id: 1,
                        },
                        quickwit_proto::search::PartialHit {
                            sort_value: None,
                            sort_value2: None,
                            split_id: "split2".to_string(),
                            segment_ord: 0,
                            doc_id: 2,
                        },
                    ],
                    failed_splits: Vec::new(),
                    num_attempted_splits: 1,
                    ..Default::default()
                })
            },
        );
        mock_search_service_2.expect_fetch_docs().returning(
            |fetch_docs_req: quickwit_proto::search::FetchDocsRequest| {
                Ok(quickwit_proto::search::FetchDocsResponse {
                    hits: get_doc_for_fetch_req(fetch_docs_req),
                })
            },
        );
        let searcher_pool = searcher_pool_for_test([
            ("127.0.0.1:1001", mock_search_service_1),
            ("127.0.0.1:1002", mock_search_service_2),
        ]);
        let search_job_placer = SearchJobPlacer::new(searcher_pool);
        let cluster_client = ClusterClient::new(search_job_placer.clone());
        let search_response = root_search(
            &SearcherContext::for_test(),
            search_request.clone(),
            MetastoreServiceClient::from_mock(mock_metastore),
            &cluster_client,
        )
        .await?;

        assert_eq!(search_response.num_hits, 5);
        assert_eq!(search_response.hits.len(), 5);
        assert_eq!(
            search_response.hits[0].partial_hit.as_ref().unwrap(),
            &PartialHit {
                split_id: "split1".to_string(),
                segment_ord: 0,
                doc_id: 0,
                sort_value: Some(SortValue::U64(2u64).into()),
                sort_value2: None,
            }
        );
        assert_eq!(
            search_response.hits[1].partial_hit.as_ref().unwrap(),
            &PartialHit {
                split_id: "split2".to_string(),
                segment_ord: 0,
                doc_id: 0,
                sort_value: Some(SortValue::I64(1i64).into()),
                sort_value2: None,
            }
        );
        assert_eq!(
            search_response.hits[2].partial_hit.as_ref().unwrap(),
            &PartialHit {
                split_id: "split2".to_string(),
                segment_ord: 0,
                doc_id: 1,
                sort_value: Some(SortValue::I64(-1i64).into()),
                sort_value2: None,
            }
        );
        assert_eq!(
            search_response.hits[3].partial_hit.as_ref().unwrap(),
            &PartialHit {
                split_id: "split2".to_string(),
                segment_ord: 0,
                doc_id: 2,
                sort_value: None,
                sort_value2: None,
            }
        );
        assert_eq!(
            search_response.hits[4].partial_hit.as_ref().unwrap(),
            &PartialHit {
                split_id: "split1".to_string(),
                segment_ord: 0,
                doc_id: 1,
                sort_value: None,
                sort_value2: None,
            }
        );
        Ok(())
    }

    #[tokio::test]
    async fn test_root_search_missing_index() -> anyhow::Result<()> {
        let mut mock_metastore = MockMetastoreService::new();
        let index_metadata = IndexMetadata::for_test("test-index1", "ram:///test-index");
        let index_uid = index_metadata.index_uid.clone();
        mock_metastore
            .expect_list_indexes_metadata()
            .returning(move |_index_ids_query| {
                Ok(ListIndexesMetadataResponse::for_test(vec![
                    index_metadata.clone(),
                ]))
            });
        mock_metastore
            .expect_list_splits()
            .returning(move |_list_splits_request| {
                let splits = vec![
                    MockSplitBuilder::new("split1")
                        .with_index_uid(&index_uid)
                        .build(),
                ];
                let splits_response = ListSplitsResponse::try_from_splits(splits).unwrap();
                Ok(ServiceStream::from(vec![Ok(splits_response)]))
            });
        let mock_metastore_client = MetastoreServiceClient::from_mock(mock_metastore);
        let mut mock_search_service = MockSearchService::new();
        mock_search_service.expect_leaf_search().returning(
            |_leaf_search_req: quickwit_proto::search::LeafSearchRequest| {
                Ok(quickwit_proto::search::LeafSearchResponse {
                    num_hits: 3,
                    partial_hits: vec![
                        mock_partial_hit("split1", 3, 1),
                        mock_partial_hit("split1", 2, 2),
                        mock_partial_hit("split1", 1, 3),
                    ],
                    failed_splits: Vec::new(),
                    num_attempted_splits: 1,
                    ..Default::default()
                })
            },
        );
        mock_search_service.expect_fetch_docs().returning(
            |fetch_docs_req: quickwit_proto::search::FetchDocsRequest| {
                Ok(quickwit_proto::search::FetchDocsResponse {
                    hits: get_doc_for_fetch_req(fetch_docs_req),
                })
            },
        );
        let searcher_pool = searcher_pool_for_test([("127.0.0.1:1001", mock_search_service)]);
        let search_job_placer = SearchJobPlacer::new(searcher_pool);
        let cluster_client = ClusterClient::new(search_job_placer.clone());

        let searcher_context = SearcherContext::for_test();

        // search with ignore_missing_indexes=true succeeds
        let search_request = quickwit_proto::search::SearchRequest {
            index_id_patterns: vec!["test-index1".to_string(), "test-index2".to_string()],
            query_ast: qast_json_helper("test", &["body"]),
            max_hits: 10,
            ignore_missing_indexes: true,
            ..Default::default()
        };
        let search_response = root_search(
            &searcher_context,
            search_request,
            mock_metastore_client.clone(),
            &cluster_client,
        )
        .await
        .unwrap();
        assert_eq!(search_response.num_hits, 3);
        assert_eq!(search_response.hits.len(), 3);

        // search with ignore_missing_indexes=false fails
        let search_request = quickwit_proto::search::SearchRequest {
            index_id_patterns: vec!["test-index1".to_string(), "test-index2".to_string()],
            query_ast: qast_json_helper("test", &["body"]),
            max_hits: 10,
            ignore_missing_indexes: false,
            ..Default::default()
        };
        let search_error = root_search(
            &searcher_context,
            search_request,
            mock_metastore_client,
            &cluster_client,
        )
        .await
        .unwrap_err();
        if let SearchError::IndexesNotFound { index_ids } = search_error {
            assert_eq!(index_ids, vec!["test-index2".to_string()]);
        } else {
            panic!("unexpected error type: {search_error}");
        }
        Ok(())
    }

    #[tokio::test]
    async fn test_root_search_multiple_splits_retry_on_other_node() -> anyhow::Result<()> {
        let search_request = quickwit_proto::search::SearchRequest {
            index_id_patterns: vec!["test-index".to_string()],
            query_ast: qast_json_helper("test", &["body"]),
            max_hits: 10,
            ..Default::default()
        };
        let mut mock_metastore = MockMetastoreService::new();
        let index_metadata = IndexMetadata::for_test("test-index", "ram:///test-index");
        let index_uid = index_metadata.index_uid.clone();
        mock_metastore
            .expect_list_indexes_metadata()
            .returning(move |_index_ids_query| {
                Ok(ListIndexesMetadataResponse::for_test(vec![
                    index_metadata.clone(),
                ]))
            });
        mock_metastore
            .expect_list_splits()
            .returning(move |_filter| {
                let splits = vec![
                    MockSplitBuilder::new("split1")
                        .with_index_uid(&index_uid)
                        .build(),
                    MockSplitBuilder::new("split2")
                        .with_index_uid(&index_uid)
                        .build(),
                ];
                let splits_response = ListSplitsResponse::try_from_splits(splits).unwrap();
                Ok(ServiceStream::from(vec![Ok(splits_response)]))
            });

        let mut mock_search_service_1 = MockSearchService::new();
        mock_search_service_1
            .expect_leaf_search()
            .times(2)
            .returning(
                |leaf_search_req: quickwit_proto::search::LeafSearchRequest| {
                    let split_ids: Vec<&str> = leaf_search_req.leaf_requests[0]
                        .split_offsets
                        .iter()
                        .map(|metadata| metadata.split_id.as_str())
                        .collect();
                    if split_ids == ["split1"] {
                        Ok(quickwit_proto::search::LeafSearchResponse {
                            num_hits: 2,
                            partial_hits: vec![
                                mock_partial_hit("split1", 3, 1),
                                mock_partial_hit("split1", 1, 3),
                            ],
                            failed_splits: Vec::new(),
                            num_attempted_splits: 1,
                            ..Default::default()
                        })
                    } else if split_ids == ["split2"] {
                        // RETRY REQUEST!
                        Ok(quickwit_proto::search::LeafSearchResponse {
                            num_hits: 1,
                            partial_hits: vec![mock_partial_hit("split2", 2, 2)],
                            failed_splits: Vec::new(),
                            num_attempted_splits: 1,
                            ..Default::default()
                        })
                    } else {
                        panic!("unexpected request in test {split_ids:?}");
                    }
                },
            );
        mock_search_service_1.expect_fetch_docs().returning(
            |fetch_docs_req: quickwit_proto::search::FetchDocsRequest| {
                Ok(quickwit_proto::search::FetchDocsResponse {
                    hits: get_doc_for_fetch_req(fetch_docs_req),
                })
            },
        );
        let mut mock_search_service_2 = MockSearchService::new();
        mock_search_service_2
            .expect_leaf_search()
            .times(1)
            .returning(
                |_leaf_search_req: quickwit_proto::search::LeafSearchRequest| {
                    Ok(quickwit_proto::search::LeafSearchResponse {
                        // requests from split 2 arrive here - simulate failure
                        num_hits: 0,
                        partial_hits: Vec::new(),
                        failed_splits: vec![SplitSearchError {
                            error: "mock_error".to_string(),
                            split_id: "split2".to_string(),
                            retryable_error: true,
                        }],
                        num_attempted_splits: 1,
                        ..Default::default()
                    })
                },
            );
        mock_search_service_2.expect_fetch_docs().returning(
            |fetch_docs_req: quickwit_proto::search::FetchDocsRequest| {
                Ok(quickwit_proto::search::FetchDocsResponse {
                    hits: get_doc_for_fetch_req(fetch_docs_req),
                })
            },
        );
        let searcher_pool = searcher_pool_for_test([
            ("127.0.0.1:1001", mock_search_service_1),
            ("127.0.0.1:1002", mock_search_service_2),
        ]);
        let search_job_placer = SearchJobPlacer::new(searcher_pool);
        let cluster_client = ClusterClient::new(search_job_placer.clone());
        let search_response = root_search(
            &SearcherContext::for_test(),
            search_request,
            MetastoreServiceClient::from_mock(mock_metastore),
            &cluster_client,
        )
        .await
        .unwrap();
        assert_eq!(search_response.num_hits, 3);
        assert_eq!(search_response.hits.len(), 3);
        Ok(())
    }

    #[tokio::test]
    async fn test_root_search_multiple_splits_retry_on_all_nodes() -> anyhow::Result<()> {
        let search_request = quickwit_proto::search::SearchRequest {
            index_id_patterns: vec!["test-index".to_string()],
            query_ast: qast_json_helper("test", &["body"]),
            max_hits: 10,
            ..Default::default()
        };
        let mut mock_metastore = MockMetastoreService::new();
        let index_metadata = IndexMetadata::for_test("test-index", "ram:///test-index");
        let index_uid = index_metadata.index_uid.clone();
        mock_metastore
            .expect_list_indexes_metadata()
            .returning(move |_indexes_metadata_request| {
                Ok(ListIndexesMetadataResponse::for_test(vec![
                    index_metadata.clone(),
                ]))
            });
        mock_metastore
            .expect_list_splits()
            .returning(move |_filter| {
                let splits = vec![
                    MockSplitBuilder::new("split1")
                        .with_index_uid(&index_uid)
                        .build(),
                    MockSplitBuilder::new("split2")
                        .with_index_uid(&index_uid)
                        .build(),
                ];
                let splits_response = ListSplitsResponse::try_from_splits(splits).unwrap();
                Ok(ServiceStream::from(vec![Ok(splits_response)]))
            });
        let mut mock_search_service_1 = MockSearchService::new();
        mock_search_service_1
            .expect_leaf_search()
            .withf(|leaf_search_req| {
                leaf_search_req.leaf_requests[0].split_offsets[0].split_id == "split2"
            })
            .return_once(|_| {
                // requests from split 2 arrive here - simulate failure.
                // a retry will be made on the second service.
                Ok(quickwit_proto::search::LeafSearchResponse {
                    num_hits: 0,
                    partial_hits: Vec::new(),
                    failed_splits: vec![SplitSearchError {
                        error: "mock_error".to_string(),
                        split_id: "split2".to_string(),
                        retryable_error: true,
                    }],
                    num_attempted_splits: 1,
                    ..Default::default()
                })
            });
        mock_search_service_1
            .expect_leaf_search()
            .withf(|leaf_search_req| {
                leaf_search_req.leaf_requests[0].split_offsets[0].split_id == "split1"
            })
            .return_once(|_| {
                // RETRY REQUEST from split1
                Ok(quickwit_proto::search::LeafSearchResponse {
                    num_hits: 2,
                    partial_hits: vec![
                        mock_partial_hit("split1", 3, 1),
                        mock_partial_hit("split1", 1, 3),
                    ],
                    failed_splits: Vec::new(),
                    num_attempted_splits: 1,
                    ..Default::default()
                })
            });
        mock_search_service_1.expect_fetch_docs().returning(
            |fetch_docs_req: quickwit_proto::search::FetchDocsRequest| {
                Ok(quickwit_proto::search::FetchDocsResponse {
                    hits: get_doc_for_fetch_req(fetch_docs_req),
                })
            },
        );
        let mut mock_search_service_2 = MockSearchService::new();
        mock_search_service_2
            .expect_leaf_search()
            .withf(|leaf_search_req| {
                leaf_search_req.leaf_requests[0].split_offsets[0].split_id == "split2"
            })
            .return_once(|_| {
                // retry for split 2 arrive here, simulate success.
                Ok(quickwit_proto::search::LeafSearchResponse {
                    num_hits: 1,
                    partial_hits: vec![mock_partial_hit("split2", 2, 2)],
                    failed_splits: Vec::new(),
                    num_attempted_splits: 1,
                    ..Default::default()
                })
            });
        mock_search_service_2
            .expect_leaf_search()
            .withf(|leaf_search_req| {
                leaf_search_req.leaf_requests[0].split_offsets[0].split_id == "split1"
            })
            .return_once(|_| {
                // requests from split 1 arrive here - simulate failure, then success.
                Ok(quickwit_proto::search::LeafSearchResponse {
                    // requests from split 2 arrive here - simulate failure
                    num_hits: 0,
                    partial_hits: Vec::new(),
                    failed_splits: vec![SplitSearchError {
                        error: "mock_error".to_string(),
                        split_id: "split1".to_string(),
                        retryable_error: true,
                    }],
                    num_attempted_splits: 1,
                    ..Default::default()
                })
            });
        mock_search_service_2.expect_fetch_docs().returning(
            |fetch_docs_req: quickwit_proto::search::FetchDocsRequest| {
                Ok(quickwit_proto::search::FetchDocsResponse {
                    hits: get_doc_for_fetch_req(fetch_docs_req),
                })
            },
        );
        let searcher_pool = searcher_pool_for_test([
            ("127.0.0.1:1001", mock_search_service_1),
            ("127.0.0.1:1002", mock_search_service_2),
        ]);
        let search_job_placer = SearchJobPlacer::new(searcher_pool);
        let cluster_client = ClusterClient::new(search_job_placer.clone());
        let search_response = root_search(
            &SearcherContext::for_test(),
            search_request,
            MetastoreServiceClient::from_mock(mock_metastore),
            &cluster_client,
        )
        .await
        .unwrap();
        assert_eq!(search_response.num_hits, 3);
        assert_eq!(search_response.hits.len(), 3);
        Ok(())
    }

    #[tokio::test]
    async fn test_root_search_single_split_retry_single_node() -> anyhow::Result<()> {
        let search_request = quickwit_proto::search::SearchRequest {
            index_id_patterns: vec!["test-index".to_string()],
            query_ast: qast_json_helper("test", &["body"]),
            max_hits: 10,
            ..Default::default()
        };
        let mut mock_metastore = MockMetastoreService::new();
        let index_metadata = IndexMetadata::for_test("test-index", "ram:///test-index");
        let index_uid = index_metadata.index_uid.clone();
        mock_metastore
            .expect_list_indexes_metadata()
            .returning(move |_index_ids_query| {
                Ok(ListIndexesMetadataResponse::for_test(vec![
                    index_metadata.clone(),
                ]))
            });
        mock_metastore
            .expect_list_splits()
            .returning(move |_list_splits_request| {
                let splits = vec![
                    MockSplitBuilder::new("split1")
                        .with_index_uid(&index_uid)
                        .build(),
                ];
                let splits_response = ListSplitsResponse::try_from_splits(splits).unwrap();
                Ok(ServiceStream::from(vec![Ok(splits_response)]))
            });
        let mut first_call = true;
        let mut mock_search_service = MockSearchService::new();
        mock_search_service.expect_leaf_search().times(2).returning(
            move |_leaf_search_req: quickwit_proto::search::LeafSearchRequest| {
                // requests from split 2 arrive here - simulate failure, then success
                if first_call {
                    first_call = false;
                    Ok(quickwit_proto::search::LeafSearchResponse {
                        num_hits: 0,
                        partial_hits: Vec::new(),
                        failed_splits: vec![SplitSearchError {
                            error: "mock_error".to_string(),
                            split_id: "split1".to_string(),
                            retryable_error: true,
                        }],
                        num_attempted_splits: 1,
                        ..Default::default()
                    })
                } else {
                    Ok(quickwit_proto::search::LeafSearchResponse {
                        num_hits: 1,
                        partial_hits: vec![mock_partial_hit("split1", 2, 2)],
                        failed_splits: Vec::new(),
                        num_attempted_splits: 1,
                        ..Default::default()
                    })
                }
            },
        );
        mock_search_service.expect_fetch_docs().returning(
            |fetch_docs_req: quickwit_proto::search::FetchDocsRequest| {
                Ok(quickwit_proto::search::FetchDocsResponse {
                    hits: get_doc_for_fetch_req(fetch_docs_req),
                })
            },
        );
        let searcher_pool = searcher_pool_for_test([("127.0.0.1:1001", mock_search_service)]);
        let search_job_placer = SearchJobPlacer::new(searcher_pool);
        let cluster_client = ClusterClient::new(search_job_placer.clone());
        let search_response = root_search(
            &SearcherContext::for_test(),
            search_request,
            MetastoreServiceClient::from_mock(mock_metastore),
            &cluster_client,
        )
        .await
        .unwrap();
        assert_eq!(search_response.num_hits, 1);
        assert_eq!(search_response.hits.len(), 1);
        Ok(())
    }

    #[tokio::test]
    async fn test_root_search_single_split_retry_single_node_fails() {
        let search_request = quickwit_proto::search::SearchRequest {
            index_id_patterns: vec!["test-index".to_string()],
            query_ast: qast_json_helper("test", &["body"]),
            max_hits: 10,
            ..Default::default()
        };
        let mut mock_metastore = MockMetastoreService::new();
        let index_metadata = IndexMetadata::for_test("test-index", "ram:///test-index");
        let index_uid = index_metadata.index_uid.clone();
        mock_metastore
            .expect_list_indexes_metadata()
            .returning(move |_index_ids_query| {
                Ok(ListIndexesMetadataResponse::for_test(vec![
                    index_metadata.clone(),
                ]))
            });
        mock_metastore
            .expect_list_splits()
            .returning(move |_filter| {
                let splits = vec![
                    MockSplitBuilder::new("split1")
                        .with_index_uid(&index_uid)
                        .build(),
                ];
                let splits_response = ListSplitsResponse::try_from_splits(splits).unwrap();
                Ok(ServiceStream::from(vec![Ok(splits_response)]))
            });

        let mut mock_search_service = MockSearchService::new();
        mock_search_service.expect_leaf_search().times(2).returning(
            move |_leaf_search_req: quickwit_proto::search::LeafSearchRequest| {
                Ok(quickwit_proto::search::LeafSearchResponse {
                    num_hits: 0,
                    partial_hits: Vec::new(),
                    failed_splits: vec![SplitSearchError {
                        error: "mock_error".to_string(),
                        split_id: "split1".to_string(),
                        retryable_error: true,
                    }],
                    num_attempted_splits: 1,
                    ..Default::default()
                })
            },
        );
        mock_search_service.expect_fetch_docs().returning(
            |_fetch_docs_req: quickwit_proto::search::FetchDocsRequest| {
                Err(SearchError::Internal("mockerr docs".to_string()))
            },
        );
        let searcher_pool = searcher_pool_for_test([("127.0.0.1:1001", mock_search_service)]);
        let search_job_placer = SearchJobPlacer::new(searcher_pool);
        let cluster_client = ClusterClient::new(search_job_placer.clone());
        let search_response = root_search(
            &SearcherContext::for_test(),
            search_request,
            MetastoreServiceClient::from_mock(mock_metastore),
            &cluster_client,
        )
        .await
        .unwrap();
        assert_eq!(search_response.failed_splits.len(), 1);
    }

    #[tokio::test]
    async fn test_root_search_one_splits_two_nodes_but_one_is_failing_for_split()
    -> anyhow::Result<()> {
        let search_request = quickwit_proto::search::SearchRequest {
            index_id_patterns: vec!["test-index".to_string()],
            query_ast: qast_json_helper("test", &["body"]),
            max_hits: 10,
            ..Default::default()
        };
        let mut mock_metastore = MockMetastoreService::new();
        let index_metadata = IndexMetadata::for_test("test-index", "ram:///test-index");
        let index_uid = index_metadata.index_uid.clone();
        mock_metastore
            .expect_list_indexes_metadata()
            .returning(move |_index_ids_query| {
                Ok(ListIndexesMetadataResponse::for_test(vec![
                    index_metadata.clone(),
                ]))
            });
        mock_metastore
            .expect_list_splits()
            .returning(move |_filter| {
                let splits = vec![
                    MockSplitBuilder::new("split1")
                        .with_index_uid(&index_uid)
                        .build(),
                ];
                let splits_response = ListSplitsResponse::try_from_splits(splits).unwrap();
                Ok(ServiceStream::from(vec![Ok(splits_response)]))
            });
        // Service1 - broken node.
        let mut mock_search_service_1 = MockSearchService::new();
        mock_search_service_1.expect_leaf_search().returning(
            move |_leaf_search_req: quickwit_proto::search::LeafSearchRequest| {
                // retry requests from split 1 arrive here
                Ok(quickwit_proto::search::LeafSearchResponse {
                    num_hits: 1,
                    partial_hits: vec![mock_partial_hit("split1", 2, 2)],
                    failed_splits: Vec::new(),
                    num_attempted_splits: 1,
                    ..Default::default()
                })
            },
        );
        mock_search_service_1.expect_fetch_docs().returning(
            |fetch_docs_req: quickwit_proto::search::FetchDocsRequest| {
                Ok(quickwit_proto::search::FetchDocsResponse {
                    hits: get_doc_for_fetch_req(fetch_docs_req),
                })
            },
        );
        // Service2 - working node.
        let mut mock_search_service_2 = MockSearchService::new();
        mock_search_service_2.expect_leaf_search().returning(
            move |_leaf_search_req: quickwit_proto::search::LeafSearchRequest| {
                Ok(quickwit_proto::search::LeafSearchResponse {
                    num_hits: 0,
                    partial_hits: Vec::new(),
                    failed_splits: vec![SplitSearchError {
                        error: "mock_error".to_string(),
                        split_id: "split1".to_string(),
                        retryable_error: true,
                    }],
                    num_attempted_splits: 1,
                    ..Default::default()
                })
            },
        );
        mock_search_service_2.expect_fetch_docs().returning(
            |_fetch_docs_req: quickwit_proto::search::FetchDocsRequest| {
                Err(SearchError::Internal("mockerr docs".to_string()))
            },
        );
        let searcher_pool = searcher_pool_for_test([
            ("127.0.0.1:1001", mock_search_service_1),
            ("127.0.0.1:1002", mock_search_service_2),
        ]);
        let search_job_placer = SearchJobPlacer::new(searcher_pool);
        let cluster_client = ClusterClient::new(search_job_placer.clone());
        let search_response = root_search(
            &SearcherContext::for_test(),
            search_request,
            MetastoreServiceClient::from_mock(mock_metastore),
            &cluster_client,
        )
        .await
        .unwrap();
        assert_eq!(search_response.num_hits, 1);
        assert_eq!(search_response.hits.len(), 1);
        Ok(())
    }

    #[tokio::test]
    async fn test_root_search_one_splits_two_nodes_but_one_is_failing_completely()
    -> anyhow::Result<()> {
        let search_request = quickwit_proto::search::SearchRequest {
            index_id_patterns: vec!["test-index".to_string()],
            query_ast: qast_json_helper("test", &["body"]),
            max_hits: 10,
            ..Default::default()
        };
        let mut mock_metastore = MockMetastoreService::new();
        let index_metadata = IndexMetadata::for_test("test-index", "ram:///test-index");
        let index_uid = index_metadata.index_uid.clone();
        mock_metastore
            .expect_list_indexes_metadata()
            .returning(move |_index_ids_query| {
                Ok(ListIndexesMetadataResponse::for_test(vec![
                    index_metadata.clone(),
                ]))
            });
        mock_metastore
            .expect_list_splits()
            .returning(move |_filter| {
                let splits = vec![
                    MockSplitBuilder::new("split1")
                        .with_index_uid(&index_uid)
                        .build(),
                ];
                let splits_response = ListSplitsResponse::try_from_splits(splits).unwrap();
                Ok(ServiceStream::from(vec![Ok(splits_response)]))
            });

        // Service1 - working node.
        let mut mock_search_service_1 = MockSearchService::new();
        mock_search_service_1.expect_leaf_search().returning(
            move |_leaf_search_req: quickwit_proto::search::LeafSearchRequest| {
                Ok(quickwit_proto::search::LeafSearchResponse {
                    num_hits: 1,
                    partial_hits: vec![mock_partial_hit("split1", 2, 2)],
                    failed_splits: Vec::new(),
                    num_attempted_splits: 1,
                    ..Default::default()
                })
            },
        );
        mock_search_service_1.expect_fetch_docs().returning(
            |fetch_docs_req: quickwit_proto::search::FetchDocsRequest| {
                Ok(quickwit_proto::search::FetchDocsResponse {
                    hits: get_doc_for_fetch_req(fetch_docs_req),
                })
            },
        );
        // Service2 - broken node.
        let mut mock_search_service_2 = MockSearchService::new();
        mock_search_service_2.expect_leaf_search().returning(
            move |_leaf_search_req: quickwit_proto::search::LeafSearchRequest| {
                Err(SearchError::Internal("mockerr search".to_string()))
            },
        );
        mock_search_service_2.expect_fetch_docs().returning(
            |_fetch_docs_req: quickwit_proto::search::FetchDocsRequest| {
                Err(SearchError::Internal("mockerr docs".to_string()))
            },
        );
        let searcher_pool = searcher_pool_for_test([
            ("127.0.0.1:1001", mock_search_service_1),
            ("127.0.0.1:1002", mock_search_service_2),
        ]);
        let search_job_placer = SearchJobPlacer::new(searcher_pool);
        let cluster_client = ClusterClient::new(search_job_placer.clone());
        let search_response = root_search(
            &SearcherContext::for_test(),
            search_request,
            MetastoreServiceClient::from_mock(mock_metastore),
            &cluster_client,
        )
        .await
        .unwrap();
        assert_eq!(search_response.num_hits, 1);
        assert_eq!(search_response.hits.len(), 1);
        Ok(())
    }

    #[tokio::test]
    async fn test_root_search_invalid_queries() -> anyhow::Result<()> {
        let mut mock_metastore = MockMetastoreService::new();
        let index_metadata = IndexMetadata::for_test("test-index", "ram:///test-index");
        let index_uid = index_metadata.index_uid.clone();
        mock_metastore
            .expect_list_indexes_metadata()
            .returning(move |_index_ids_query| {
                Ok(ListIndexesMetadataResponse::for_test(vec![
                    index_metadata.clone(),
                ]))
            });
        mock_metastore
            .expect_list_splits()
            .returning(move |_filter| {
                let splits = vec![
                    MockSplitBuilder::new("split")
                        .with_index_uid(&index_uid)
                        .build(),
                ];
                let splits_response = ListSplitsResponse::try_from_splits(splits).unwrap();
                Ok(ServiceStream::from(vec![Ok(splits_response)]))
            });

        let searcher_pool = searcher_pool_for_test([("127.0.0.1:1001", MockSearchService::new())]);
        let search_job_placer = SearchJobPlacer::new(searcher_pool);
        let cluster_client = ClusterClient::new(search_job_placer.clone());
        let searcher_context = SearcherContext::for_test();
        let metastore = MetastoreServiceClient::from_mock(mock_metastore);

        assert!(
            root_search(
                &searcher_context,
                quickwit_proto::search::SearchRequest {
                    index_id_patterns: vec!["test-index".to_string()],
                    query_ast: qast_json_helper("invalid_field:\"test\"", &["body"]),
                    max_hits: 10,
                    ..Default::default()
                },
                metastore.clone(),
                &cluster_client,
            )
            .await
            .is_err()
        );

        assert!(
            root_search(
                &searcher_context,
                quickwit_proto::search::SearchRequest {
                    index_id_patterns: vec!["test-index".to_string()],
                    query_ast: qast_json_helper("test", &["invalid_field"]),
                    max_hits: 10,
                    ..Default::default()
                },
                metastore,
                &cluster_client,
            )
            .await
            .is_err()
        );

        Ok(())
    }

    #[tokio::test]
    async fn test_root_search_invalid_aggregation() -> anyhow::Result<()> {
        let agg_req = r#"
            {
                "expensive_colors": {
                    "termss": {
                        "field": "color",
                        "order": {
                            "price_stats.max": "desc"
                        }
                    },
                    "aggs": {
                        "price_stats" : {
                            "stats": {
                                "field": "price"
                            }
                        }
                    }
                }
            }"#;

        let search_request = quickwit_proto::search::SearchRequest {
            index_id_patterns: vec!["test-index".to_string()],
            query_ast: qast_json_helper("test", &["body"]),
            max_hits: 10,
            aggregation_request: Some(agg_req.to_string()),
            ..Default::default()
        };
        let mut mock_metastore = MockMetastoreService::new();
        let index_metadata = IndexMetadata::for_test("test-index", "ram:///test-index");
        let index_uid = index_metadata.index_uid.clone();
        mock_metastore
            .expect_list_indexes_metadata()
            .returning(move |_index_ids_query| {
                Ok(ListIndexesMetadataResponse::for_test(vec![
                    index_metadata.clone(),
                ]))
            });
        mock_metastore
            .expect_list_splits()
            .returning(move |_filter| {
                let splits = vec![
                    MockSplitBuilder::new("split1")
                        .with_index_uid(&index_uid)
                        .build(),
                ];
                let splits_response = ListSplitsResponse::try_from_splits(splits).unwrap();
                Ok(ServiceStream::from(vec![Ok(splits_response)]))
            });
        let searcher_pool = searcher_pool_for_test([("127.0.0.1:1001", MockSearchService::new())]);
        let search_job_placer = SearchJobPlacer::new(searcher_pool);
        let cluster_client = ClusterClient::new(search_job_placer.clone());
        let search_response = root_search(
            &SearcherContext::for_test(),
            search_request,
            MetastoreServiceClient::from_mock(mock_metastore),
            &cluster_client,
        )
        .await;
        assert!(search_response.is_err());
        assert!(
            search_response.unwrap_err().to_string().starts_with(
                "invalid aggregation request: unknown variant `termss`, expected one of"
            )
        );
        Ok(())
    }

    #[tokio::test]
    async fn test_root_search_invalid_request() -> anyhow::Result<()> {
        let search_request = quickwit_proto::search::SearchRequest {
            index_id_patterns: vec!["test-index".to_string()],
            query_ast: qast_json_helper("test", &["body"]),
            max_hits: 10,
            start_offset: 20_000,
            ..Default::default()
        };
        let mut mock_metastore = MockMetastoreService::new();
        let index_metadata = IndexMetadata::for_test("test-index", "ram:///test-index");
        let index_uid = index_metadata.index_uid.clone();
        mock_metastore
            .expect_list_indexes_metadata()
            .returning(move |_index_ids_query| {
                Ok(ListIndexesMetadataResponse::for_test(vec![
                    index_metadata.clone(),
                ]))
            });
        mock_metastore
            .expect_list_splits()
            .returning(move |_filter| {
                let splits = vec![
                    MockSplitBuilder::new("split1")
                        .with_index_uid(&index_uid)
                        .build(),
                ];
                let splits_response = ListSplitsResponse::try_from_splits(splits).unwrap();
                Ok(ServiceStream::from(vec![Ok(splits_response)]))
            });
        let searcher_pool = searcher_pool_for_test([("127.0.0.1:1001", MockSearchService::new())]);
        let search_job_placer = SearchJobPlacer::new(searcher_pool);
        let cluster_client = ClusterClient::new(search_job_placer.clone());
        let metastore = MetastoreServiceClient::from_mock(mock_metastore);
        let search_response = root_search(
            &SearcherContext::for_test(),
            search_request,
            metastore.clone(),
            &cluster_client,
        )
        .await;
        assert!(search_response.is_err());
        assert_eq!(
            search_response.unwrap_err().to_string(),
            "Invalid argument: max value for start_offset is 10_000, but got 20000",
        );

        let search_request = quickwit_proto::search::SearchRequest {
            index_id_patterns: vec!["test-index".to_string()],
            query_ast: qast_json_helper("test", &["body"]),
            max_hits: 20_000,
            ..Default::default()
        };

        let search_response = root_search(
            &SearcherContext::for_test(),
            search_request,
            metastore,
            &cluster_client,
        )
        .await;
        assert!(search_response.is_err());
        assert_eq!(
            search_response.unwrap_err().to_string(),
            "Invalid argument: max value for max_hits is 10_000, but got 20000",
        );

        Ok(())
    }

    #[tokio::test]
    async fn test_search_plan_multiple_splits() -> anyhow::Result<()> {
        use quickwit_query::MatchAllOrNone;
        use quickwit_query::query_ast::{FullTextMode, FullTextParams, FullTextQuery};

        let search_request = quickwit_proto::search::SearchRequest {
            index_id_patterns: vec!["test-index".to_string()],
            query_ast: qast_json_helper("test-query", &["body"]),
            max_hits: 10,
            ..Default::default()
        };
        let mut mock_metastore = MockMetastoreService::new();
        let index_metadata = IndexMetadata::for_test("test-index", "ram:///test-index");
        let index_uid = index_metadata.index_uid.clone();
        mock_metastore
            .expect_list_indexes_metadata()
            .returning(move |_index_ids_query| {
                Ok(ListIndexesMetadataResponse::for_test(vec![
                    index_metadata.clone(),
                ]))
            });
        mock_metastore
            .expect_list_splits()
            .returning(move |_filter| {
                let splits = vec![
                    MockSplitBuilder::new("split1")
                        .with_index_uid(&index_uid)
                        .build(),
                    MockSplitBuilder::new("split2")
                        .with_index_uid(&index_uid)
                        .build(),
                ];
                let splits_response = ListSplitsResponse::try_from_splits(splits).unwrap();
                Ok(ServiceStream::from(vec![Ok(splits_response)]))
            });
        let search_response = search_plan(
            search_request,
            MetastoreServiceClient::from_mock(mock_metastore),
        )
        .await
        .unwrap();
        let response: SearchPlanResponseRest =
            serde_json::from_str(&search_response.result).unwrap();
        assert_eq!(
            response,
            SearchPlanResponseRest {
                quickwit_ast: QueryAst::FullText(FullTextQuery {
                    field: "body".to_string(),
                    text: "test-query".to_string(),
                    params: FullTextParams {
                        tokenizer: None,
                        mode: FullTextMode::PhraseFallbackToIntersection,
                        zero_terms_query: MatchAllOrNone::MatchNone,
                    },
                    lenient: false,
                },),
                tantivy_ast: r#"BooleanQuery {
    subqueries: [
        (
            Must,
            TermQuery(Term(field=3, type=Str, "test")),
        ),
        (
            Must,
            TermQuery(Term(field=3, type=Str, "query")),
        ),
    ],
    minimum_number_should_match: 0,
}"#
                .to_string(),
                searched_splits: vec![
                    "test-index/split1".to_string(),
                    "test-index/split2".to_string()
                ],
                storage_requests: StorageRequestCount {
                    footer: 1,
                    fastfield: 0,
                    fieldnorm: 0,
                    sstable: 2,
                    posting: 2,
                    position: 0,
                },
            }
        );
        Ok(())
    }

    #[tokio::test]
    async fn test_search_plan_missing_index() -> anyhow::Result<()> {
        let mut mock_metastore = MockMetastoreService::new();
        let index_metadata = IndexMetadata::for_test("test-index1", "ram:///test-index");
        let index_uid = index_metadata.index_uid.clone();
        mock_metastore
            .expect_list_indexes_metadata()
            .returning(move |_index_ids_query| {
                Ok(ListIndexesMetadataResponse::for_test(vec![
                    index_metadata.clone(),
                ]))
            });
        mock_metastore
            .expect_list_splits()
            .returning(move |_filter| {
                let splits = vec![
                    MockSplitBuilder::new("split1")
                        .with_index_uid(&index_uid)
                        .build(),
                    MockSplitBuilder::new("split2")
                        .with_index_uid(&index_uid)
                        .build(),
                ];
                let splits_response = ListSplitsResponse::try_from_splits(splits).unwrap();
                Ok(ServiceStream::from(vec![Ok(splits_response)]))
            });
        let mock_metastore_service = MetastoreServiceClient::from_mock(mock_metastore);

        // plan with ignore_missing_indexes=true succeeds
        search_plan(
            quickwit_proto::search::SearchRequest {
                index_id_patterns: vec!["test-index1".to_string(), "test-index2".to_string()],
                query_ast: qast_json_helper("test-query", &["body"]),
                max_hits: 10,
                ignore_missing_indexes: true,
                ..Default::default()
            },
            mock_metastore_service.clone(),
        )
        .await
        .unwrap();

        // plan with ignore_missing_indexes=false fails
        let search_error = search_plan(
            quickwit_proto::search::SearchRequest {
                index_id_patterns: vec!["test-index1".to_string(), "test-index2".to_string()],
                query_ast: qast_json_helper("test-query", &["body"]),
                max_hits: 10,
                ignore_missing_indexes: false,
                ..Default::default()
            },
            mock_metastore_service.clone(),
        )
        .await
        .unwrap_err();
        if let SearchError::IndexesNotFound { index_ids } = search_error {
            assert_eq!(index_ids, vec!["test-index2".to_string()]);
        } else {
            panic!("unexpected error type: {search_error}");
        }
        Ok(())
    }

    #[test]
    fn test_extract_timestamp_range_from_ast() {
        use std::ops::Bound;

        use quickwit_query::JsonLiteral;

        let timestamp_field = "timestamp";

        let simple_range = quickwit_query::query_ast::RangeQuery {
            field: timestamp_field.to_string(),
            lower_bound: Bound::Included(JsonLiteral::String("2021-04-13T22:45:41Z".to_owned())),
            upper_bound: Bound::Excluded(JsonLiteral::String("2021-05-06T06:51:19Z".to_owned())),
        }
        .into();

        // direct range
        let mut timestamp_range_extractor = ExtractTimestampRange {
            timestamp_field,
            start_timestamp: None,
            end_timestamp: None,
        };
        timestamp_range_extractor.visit(&simple_range).unwrap();
        assert_eq!(timestamp_range_extractor.start_timestamp, Some(1618353941));
        assert_eq!(timestamp_range_extractor.end_timestamp, Some(1620283879));

        // range inside a must bool query
        let bool_query_must = quickwit_query::query_ast::BoolQuery {
            must: vec![simple_range.clone()],
            ..Default::default()
        };
        timestamp_range_extractor.start_timestamp = None;
        timestamp_range_extractor.end_timestamp = None;
        timestamp_range_extractor
            .visit(&bool_query_must.into())
            .unwrap();
        assert_eq!(timestamp_range_extractor.start_timestamp, Some(1618353941));
        assert_eq!(timestamp_range_extractor.end_timestamp, Some(1620283879));

        // range inside a should bool query
        let bool_query_should = quickwit_query::query_ast::BoolQuery {
            should: vec![simple_range.clone()],
            ..Default::default()
        };
        timestamp_range_extractor.start_timestamp = Some(123);
        timestamp_range_extractor.end_timestamp = None;
        timestamp_range_extractor
            .visit(&bool_query_should.into())
            .unwrap();
        assert_eq!(timestamp_range_extractor.start_timestamp, Some(123));
        assert_eq!(timestamp_range_extractor.end_timestamp, None);

        // start bound was already more restrictive
        timestamp_range_extractor.start_timestamp = Some(1618601297);
        timestamp_range_extractor.end_timestamp = Some(i64::MAX);
        timestamp_range_extractor.visit(&simple_range).unwrap();
        assert_eq!(timestamp_range_extractor.start_timestamp, Some(1618601297));
        assert_eq!(timestamp_range_extractor.end_timestamp, Some(1620283879));

        // end bound was already more restrictive
        timestamp_range_extractor.start_timestamp = Some(1);
        timestamp_range_extractor.end_timestamp = Some(1618601297);
        timestamp_range_extractor.visit(&simple_range).unwrap();
        assert_eq!(timestamp_range_extractor.start_timestamp, Some(1618353941));
        assert_eq!(timestamp_range_extractor.end_timestamp, Some(1618601297));

        // bounds are (start..end] instead of [start..end)
        let unusual_bounds = quickwit_query::query_ast::RangeQuery {
            field: timestamp_field.to_string(),
            lower_bound: Bound::Excluded(JsonLiteral::String("2021-04-13T22:45:41Z".to_owned())),
            upper_bound: Bound::Included(JsonLiteral::String("2021-05-06T06:51:19Z".to_owned())),
        }
        .into();
        timestamp_range_extractor.start_timestamp = None;
        timestamp_range_extractor.end_timestamp = None;
        timestamp_range_extractor.visit(&unusual_bounds).unwrap();
        assert_eq!(timestamp_range_extractor.start_timestamp, Some(1618353942));
        assert_eq!(timestamp_range_extractor.end_timestamp, Some(1620283880));

        let wrong_field = quickwit_query::query_ast::RangeQuery {
            field: "other_field".to_string(),
            lower_bound: Bound::Included(JsonLiteral::String("2021-04-13T22:45:41Z".to_owned())),
            upper_bound: Bound::Excluded(JsonLiteral::String("2021-05-06T06:51:19Z".to_owned())),
        }
        .into();
        timestamp_range_extractor.start_timestamp = None;
        timestamp_range_extractor.end_timestamp = None;
        timestamp_range_extractor.visit(&wrong_field).unwrap();
        assert_eq!(timestamp_range_extractor.start_timestamp, None);
        assert_eq!(timestamp_range_extractor.end_timestamp, None);

        let high_precision = quickwit_query::query_ast::RangeQuery {
            field: timestamp_field.to_string(),
            lower_bound: Bound::Included(JsonLiteral::String(
                "2021-04-13T22:45:41.001Z".to_owned(),
            )),
            upper_bound: Bound::Excluded(JsonLiteral::String(
                "2021-05-06T06:51:19.001Z".to_owned(),
            )),
        }
        .into();

        // the upper bound should be rounded up as to includes documents from X.000 to X.001
        let mut timestamp_range_extractor = ExtractTimestampRange {
            timestamp_field,
            start_timestamp: None,
            end_timestamp: None,
        };
        timestamp_range_extractor.visit(&high_precision).unwrap();
        assert_eq!(timestamp_range_extractor.start_timestamp, Some(1618353941));
        assert_eq!(timestamp_range_extractor.end_timestamp, Some(1620283880));
    }

    fn create_search_resp(
        index_uri: &str,
        hit_range: Range<usize>,
        search_after: Option<PartialHit>,
    ) -> LeafSearchResponse {
        let (num_total_hits, split_id) = match index_uri {
            "ram:///test-index-1" => (TOTAL_NUM_HITS_INDEX_1, "split1"),
            "ram:///test-index-2" => (TOTAL_NUM_HITS_INDEX_2, "split2"),
            _ => panic!("unexpected index uri"),
        };

        let doc_ids = (0..num_total_hits)
            .rev()
            .filter(|elem| {
                if let Some(search_after) = &search_after {
                    if split_id == search_after.split_id {
                        *elem < (search_after.doc_id as usize)
                    } else {
                        split_id < search_after.split_id.as_str()
                    }
                } else {
                    true
                }
            })
            .skip(hit_range.start)
            .take(hit_range.end - hit_range.start);
        quickwit_proto::search::LeafSearchResponse {
            num_hits: num_total_hits as u64,
            partial_hits: doc_ids
                .map(|doc_id| mock_partial_hit_opt_sort_value(split_id, None, doc_id as u32))
                .collect(),
            num_attempted_splits: 1,
            ..Default::default()
        }
    }

    const TOTAL_NUM_HITS_INDEX_1: usize = 2_005;
    const TOTAL_NUM_HITS_INDEX_2: usize = 10;
    const MAX_HITS_PER_PAGE: usize = 93;
    const MAX_HITS_PER_PAGE_LARGE: usize = 1_005;

    #[tokio::test]
    async fn test_root_search_with_scroll() {
        let mut mock_metastore = MockMetastoreService::new();
        let index_metadata = IndexMetadata::for_test("test-index-1", "ram:///test-index-1");
        let index_uid = index_metadata.index_uid.clone();
        let index_metadata_2 = IndexMetadata::for_test("test-index-2", "ram:///test-index-2");
        let index_uid_2 = index_metadata_2.index_uid.clone();
        mock_metastore
            .expect_list_indexes_metadata()
            .returning(move |_index_ids_query| {
                let indexes_metadata = vec![index_metadata.clone(), index_metadata_2.clone()];
                Ok(ListIndexesMetadataResponse::for_test(indexes_metadata))
            });
        mock_metastore
            .expect_list_splits()
            .returning(move |_filter| {
                let splits = vec![
                    MockSplitBuilder::new("split1")
                        .with_index_uid(&index_uid)
                        .build(),
                    MockSplitBuilder::new("split2")
                        .with_index_uid(&index_uid_2)
                        .build(),
                ];
                let splits_response = ListSplitsResponse::try_from_splits(splits).unwrap();
                Ok(ServiceStream::from(vec![Ok(splits_response)]))
            });
        // We add two mock_search_service to simulate a multi node environment, where the requests
        // are forwarded two node.
        let mut mock_search_service1 = MockSearchService::new();
        mock_search_service1
            .expect_leaf_search()
            .times(1)
            .returning(|req: quickwit_proto::search::LeafSearchRequest| {
                let search_req = req.search_request.unwrap();
                // the leaf request does not need to know about the scroll_ttl.
                assert_eq!(search_req.start_offset, 0u64);
                assert!(search_req.scroll_ttl_secs.is_none());
                assert_eq!(search_req.max_hits as usize, SCROLL_BATCH_LEN);
                assert!(search_req.search_after.is_none());
                Ok(create_search_resp(
                    &req.index_uris[0],
                    search_req.start_offset as usize
                        ..(search_req.start_offset + search_req.max_hits) as usize,
                    search_req.search_after,
                ))
            });
        mock_search_service1
            .expect_leaf_search()
            .times(1)
            .returning(|req: quickwit_proto::search::LeafSearchRequest| {
                let search_req = req.search_request.unwrap();
                // the leaf request does not need to know about the scroll_ttl.
                assert_eq!(search_req.start_offset, 0u64);
                assert!(search_req.scroll_ttl_secs.is_none());
                assert_eq!(search_req.max_hits as usize, SCROLL_BATCH_LEN);
                assert!(search_req.search_after.is_some());
                Ok(create_search_resp(
                    &req.index_uris[0],
                    search_req.start_offset as usize
                        ..(search_req.start_offset + search_req.max_hits) as usize,
                    search_req.search_after,
                ))
            });
        mock_search_service1
            .expect_leaf_search()
            .times(1)
            .returning(|req: quickwit_proto::search::LeafSearchRequest| {
                let search_req = req.search_request.unwrap();
                // the leaf request does not need to know about the scroll_ttl.
                assert_eq!(search_req.start_offset, 0u64);
                assert!(search_req.scroll_ttl_secs.is_none());
                assert_eq!(search_req.max_hits as usize, SCROLL_BATCH_LEN);
                assert!(search_req.search_after.is_some());
                Ok(create_search_resp(
                    &req.index_uris[0],
                    search_req.start_offset as usize
                        ..(search_req.start_offset + search_req.max_hits) as usize,
                    search_req.search_after,
                ))
            });

        let mut mock_search_service2 = MockSearchService::new();
        mock_search_service2
            .expect_leaf_search()
            .times(1)
            .returning(|req: quickwit_proto::search::LeafSearchRequest| {
                let search_req = req.search_request.unwrap();
                // the leaf request does not need to know about the scroll_ttl.
                assert_eq!(search_req.start_offset, 0u64);
                assert!(search_req.scroll_ttl_secs.is_none());
                assert_eq!(search_req.max_hits as usize, SCROLL_BATCH_LEN);
                assert!(search_req.search_after.is_none());
                Ok(create_search_resp(
                    &req.index_uris[0],
                    search_req.start_offset as usize
                        ..(search_req.start_offset + search_req.max_hits) as usize,
                    search_req.search_after,
                ))
            });
        mock_search_service2
            .expect_leaf_search()
            .times(1)
            .returning(|req: quickwit_proto::search::LeafSearchRequest| {
                let search_req = req.search_request.unwrap();
                // the leaf request does not need to know about the scroll_ttl.
                assert_eq!(search_req.start_offset, 0u64);
                assert!(search_req.scroll_ttl_secs.is_none());
                assert_eq!(search_req.max_hits as usize, SCROLL_BATCH_LEN);
                assert!(search_req.search_after.is_some());
                Ok(create_search_resp(
                    &req.index_uris[0],
                    search_req.start_offset as usize
                        ..(search_req.start_offset + search_req.max_hits) as usize,
                    search_req.search_after,
                ))
            });
        mock_search_service2
            .expect_leaf_search()
            .times(1)
            .returning(|req: quickwit_proto::search::LeafSearchRequest| {
                let search_req = req.search_request.unwrap();
                // the leaf request does not need to know about the scroll_ttl.
                assert_eq!(search_req.start_offset, 0u64);
                assert!(search_req.scroll_ttl_secs.is_none());
                assert_eq!(search_req.max_hits as usize, SCROLL_BATCH_LEN);
                assert!(search_req.search_after.is_some());
                Ok(create_search_resp(
                    &req.index_uris[0],
                    search_req.start_offset as usize
                        ..(search_req.start_offset + search_req.max_hits) as usize,
                    search_req.search_after,
                ))
            });

        let kv: Arc<RwLock<HashMap<Vec<u8>, Vec<u8>>>> = Default::default();
        let kv_clone = kv.clone();
        mock_search_service1
            .expect_put_kv()
            .returning(move |put_kv_req| {
                kv_clone
                    .write()
                    .unwrap()
                    .insert(put_kv_req.key, put_kv_req.payload);
            });
        mock_search_service1
            .expect_get_kv()
            .returning(move |get_kv_req| kv.read().unwrap().get(&get_kv_req.key).cloned());

        let kv: Arc<RwLock<HashMap<Vec<u8>, Vec<u8>>>> = Default::default();
        let kv_clone = kv.clone();
        mock_search_service2
            .expect_put_kv()
            .returning(move |put_kv_req| {
                kv_clone
                    .write()
                    .unwrap()
                    .insert(put_kv_req.key, put_kv_req.payload);
            });
        mock_search_service2
            .expect_get_kv()
            .returning(move |get_kv_req| kv.read().unwrap().get(&get_kv_req.key).cloned());

        mock_search_service1.expect_fetch_docs().returning(
            |fetch_docs_req: quickwit_proto::search::FetchDocsRequest| {
                assert!(fetch_docs_req.partial_hits.len() <= MAX_HITS_PER_PAGE);
                Ok(quickwit_proto::search::FetchDocsResponse {
                    hits: get_doc_for_fetch_req(fetch_docs_req),
                })
            },
        );

        mock_search_service2.expect_fetch_docs().returning(
            |fetch_docs_req: quickwit_proto::search::FetchDocsRequest| {
                assert!(fetch_docs_req.partial_hits.len() <= MAX_HITS_PER_PAGE);
                Ok(quickwit_proto::search::FetchDocsResponse {
                    hits: get_doc_for_fetch_req(fetch_docs_req),
                })
            },
        );

        let searcher_pool = searcher_pool_for_test([
            ("127.0.0.1:1001", mock_search_service1),
            ("127.0.0.1:1002", mock_search_service2),
        ]);
        let search_job_placer = SearchJobPlacer::new(searcher_pool);
        let searcher_context = SearcherContext::for_test();
        let cluster_client = ClusterClient::new(search_job_placer.clone());

        let mut count_seen_hits = 0;

        let mut scroll_id: String = {
            let search_request = quickwit_proto::search::SearchRequest {
                index_id_patterns: vec!["test-index-*".to_string()],
                query_ast: qast_json_helper("test", &["body"]),
                max_hits: MAX_HITS_PER_PAGE as u64,
                scroll_ttl_secs: Some(60),
                ..Default::default()
            };
            let search_response = root_search(
                &searcher_context,
                search_request,
                MetastoreServiceClient::from_mock(mock_metastore),
                &cluster_client,
            )
            .await
            .unwrap();
            assert_eq!(
                search_response.num_hits,
                (TOTAL_NUM_HITS_INDEX_1 + TOTAL_NUM_HITS_INDEX_2) as u64
            );
            assert_eq!(search_response.hits.len(), MAX_HITS_PER_PAGE);
            let expected = (0..TOTAL_NUM_HITS_INDEX_2)
                .rev()
                .zip(std::iter::repeat("split2"))
                .chain(
                    (0..TOTAL_NUM_HITS_INDEX_1)
                        .rev()
                        .zip(std::iter::repeat("split1")),
                );
            for (hit, (doc_id, split)) in search_response.hits.iter().zip(expected) {
                assert_eq!(
                    hit.partial_hit.as_ref().unwrap(),
                    &mock_partial_hit_opt_sort_value(split, None, doc_id as u32)
                );
            }
            count_seen_hits += search_response.hits.len();
            search_response.scroll_id.unwrap()
        };
        for page in 1.. {
            let scroll_req = ScrollRequest {
                scroll_id,
                scroll_ttl_secs: Some(60),
            };
            let scroll_resp =
                crate::service::scroll(scroll_req, &cluster_client, &searcher_context)
                    .await
                    .unwrap();
            assert_eq!(
                scroll_resp.num_hits,
                (TOTAL_NUM_HITS_INDEX_1 + TOTAL_NUM_HITS_INDEX_2) as u64
            );
            let expected = (0..TOTAL_NUM_HITS_INDEX_2)
                .rev()
                .zip(std::iter::repeat("split2"))
                .chain(
                    (0..TOTAL_NUM_HITS_INDEX_1)
                        .rev()
                        .zip(std::iter::repeat("split1")),
                )
                .skip(page * MAX_HITS_PER_PAGE);
            for (hit, (doc_id, split)) in scroll_resp.hits.iter().zip(expected) {
                assert_eq!(
                    hit.partial_hit.as_ref().unwrap(),
                    &mock_partial_hit_opt_sort_value(split, None, doc_id as u32)
                );
            }
            scroll_id = scroll_resp.scroll_id.unwrap();
            count_seen_hits += scroll_resp.hits.len();
            if scroll_resp.hits.is_empty() {
                break;
            }
        }

        assert_eq!(
            count_seen_hits,
            TOTAL_NUM_HITS_INDEX_1 + TOTAL_NUM_HITS_INDEX_2
        );
    }

    #[tokio::test]
    async fn test_root_search_with_scroll_large_page() {
        let mut mock_metastore = MockMetastoreService::new();
        let index_metadata = IndexMetadata::for_test("test-index-1", "ram:///test-index-1");
        let index_uid = index_metadata.index_uid.clone();
        let index_metadata_2 = IndexMetadata::for_test("test-index-2", "ram:///test-index-2");
        let index_uid_2 = index_metadata_2.index_uid.clone();
        mock_metastore
            .expect_list_indexes_metadata()
            .returning(move |_index_ids_query| {
                let indexes_metadata = vec![index_metadata.clone(), index_metadata_2.clone()];
                Ok(ListIndexesMetadataResponse::for_test(indexes_metadata))
            });
        mock_metastore
            .expect_list_splits()
            .returning(move |_filter| {
                let splits = vec![
                    MockSplitBuilder::new("split1")
                        .with_index_uid(&index_uid)
                        .build(),
                    MockSplitBuilder::new("split2")
                        .with_index_uid(&index_uid_2)
                        .build(),
                ];
                let splits_response = ListSplitsResponse::try_from_splits(splits).unwrap();
                Ok(ServiceStream::from(vec![Ok(splits_response)]))
            });
        // We add two mock_search_service to simulate a multi node environment, where the requests
        // are forwarded two nodes.
        let mut mock_search_service1 = MockSearchService::new();
        mock_search_service1
            .expect_leaf_search()
            .times(1)
            .returning(|req: quickwit_proto::search::LeafSearchRequest| {
                let search_req = req.search_request.unwrap();
                // the leaf request does not need to know about the scroll_ttl.
                assert_eq!(search_req.start_offset, 0u64);
                assert!(search_req.scroll_ttl_secs.is_none());
                assert_eq!(search_req.max_hits as usize, MAX_HITS_PER_PAGE_LARGE);
                assert!(search_req.search_after.is_none());
                Ok(create_search_resp(
                    &req.index_uris[0],
                    search_req.start_offset as usize
                        ..(search_req.start_offset + search_req.max_hits) as usize,
                    search_req.search_after,
                ))
            });
        mock_search_service1
            .expect_leaf_search()
            .times(1)
            .returning(|req: quickwit_proto::search::LeafSearchRequest| {
                let search_req = req.search_request.unwrap();
                // the leaf request does not need to know about the scroll_ttl.
                assert_eq!(search_req.start_offset, 0u64);
                assert!(search_req.scroll_ttl_secs.is_none());
                assert_eq!(search_req.max_hits as usize, MAX_HITS_PER_PAGE_LARGE);
                assert!(search_req.search_after.is_some());
                Ok(create_search_resp(
                    &req.index_uris[0],
                    search_req.start_offset as usize
                        ..(search_req.start_offset + search_req.max_hits) as usize,
                    search_req.search_after,
                ))
            });
        mock_search_service1
            .expect_leaf_search()
            .times(1)
            .returning(|req: quickwit_proto::search::LeafSearchRequest| {
                let search_req = req.search_request.unwrap();
                // the leaf request does not need to know about the scroll_ttl.
                assert_eq!(search_req.start_offset, 0u64);
                assert!(search_req.scroll_ttl_secs.is_none());
                assert_eq!(search_req.max_hits as usize, MAX_HITS_PER_PAGE_LARGE);
                assert!(search_req.search_after.is_some());
                Ok(create_search_resp(
                    &req.index_uris[0],
                    search_req.start_offset as usize
                        ..(search_req.start_offset + search_req.max_hits) as usize,
                    search_req.search_after,
                ))
            });
        let kv: Arc<RwLock<HashMap<Vec<u8>, Vec<u8>>>> = Default::default();
        let kv_clone = kv.clone();
        mock_search_service1
            .expect_put_kv()
            .returning(move |put_kv_req| {
                kv_clone
                    .write()
                    .unwrap()
                    .insert(put_kv_req.key, put_kv_req.payload);
            });
        mock_search_service1
            .expect_get_kv()
            .returning(move |get_kv_req| kv.read().unwrap().get(&get_kv_req.key).cloned());
        mock_search_service1.expect_fetch_docs().returning(
            |fetch_docs_req: quickwit_proto::search::FetchDocsRequest| {
                assert!(fetch_docs_req.partial_hits.len() <= MAX_HITS_PER_PAGE_LARGE);
                Ok(quickwit_proto::search::FetchDocsResponse {
                    hits: get_doc_for_fetch_req(fetch_docs_req),
                })
            },
        );

        let mut mock_search_service2 = MockSearchService::new();
        mock_search_service2
            .expect_leaf_search()
            .times(1)
            .returning(|req: quickwit_proto::search::LeafSearchRequest| {
                let search_req = req.search_request.unwrap();
                // the leaf request does not need to know about the scroll_ttl.
                assert_eq!(search_req.start_offset, 0u64);
                assert!(search_req.scroll_ttl_secs.is_none());
                assert_eq!(search_req.max_hits as usize, MAX_HITS_PER_PAGE_LARGE);
                assert!(search_req.search_after.is_none());
                Ok(create_search_resp(
                    &req.index_uris[0],
                    search_req.start_offset as usize
                        ..(search_req.start_offset + search_req.max_hits) as usize,
                    search_req.search_after,
                ))
            });
        mock_search_service2
            .expect_leaf_search()
            .times(1)
            .returning(|req: quickwit_proto::search::LeafSearchRequest| {
                let search_req = req.search_request.unwrap();
                // the leaf request does not need to know about the scroll_ttl.
                assert_eq!(search_req.start_offset, 0u64);
                assert!(search_req.scroll_ttl_secs.is_none());
                assert_eq!(search_req.max_hits as usize, MAX_HITS_PER_PAGE_LARGE);
                assert!(search_req.search_after.is_some());
                Ok(create_search_resp(
                    &req.index_uris[0],
                    search_req.start_offset as usize
                        ..(search_req.start_offset + search_req.max_hits) as usize,
                    search_req.search_after,
                ))
            });
        mock_search_service2
            .expect_leaf_search()
            .times(1)
            .returning(|req: quickwit_proto::search::LeafSearchRequest| {
                let search_req = req.search_request.unwrap();
                // the leaf request does not need to know about the scroll_ttl.
                assert_eq!(search_req.start_offset, 0u64);
                assert!(search_req.scroll_ttl_secs.is_none());
                assert_eq!(search_req.max_hits as usize, MAX_HITS_PER_PAGE_LARGE);
                assert!(search_req.search_after.is_some());
                Ok(create_search_resp(
                    &req.index_uris[0],
                    search_req.start_offset as usize
                        ..(search_req.start_offset + search_req.max_hits) as usize,
                    search_req.search_after,
                ))
            });
        let kv: Arc<RwLock<HashMap<Vec<u8>, Vec<u8>>>> = Default::default();
        let kv_clone = kv.clone();
        mock_search_service2
            .expect_put_kv()
            .returning(move |put_kv_req| {
                kv_clone
                    .write()
                    .unwrap()
                    .insert(put_kv_req.key, put_kv_req.payload);
            });
        mock_search_service2
            .expect_get_kv()
            .returning(move |get_kv_req| kv.read().unwrap().get(&get_kv_req.key).cloned());
        mock_search_service2.expect_fetch_docs().returning(
            |fetch_docs_req: quickwit_proto::search::FetchDocsRequest| {
                assert!(fetch_docs_req.partial_hits.len() <= MAX_HITS_PER_PAGE_LARGE);
                Ok(quickwit_proto::search::FetchDocsResponse {
                    hits: get_doc_for_fetch_req(fetch_docs_req),
                })
            },
        );

        let searcher_pool = searcher_pool_for_test([
            ("127.0.0.1:1001", mock_search_service1),
            ("127.0.0.1:1002", mock_search_service2),
        ]);
        let search_job_placer = SearchJobPlacer::new(searcher_pool);
        let searcher_context = SearcherContext::for_test();
        let cluster_client = ClusterClient::new(search_job_placer.clone());

        let mut count_seen_hits = 0;

        let mut scroll_id: String = {
            let search_request = quickwit_proto::search::SearchRequest {
                index_id_patterns: vec!["test-index-*".to_string()],
                query_ast: qast_json_helper("test", &["body"]),
                max_hits: MAX_HITS_PER_PAGE_LARGE as u64,
                scroll_ttl_secs: Some(60),
                ..Default::default()
            };
            let search_response = root_search(
                &searcher_context,
                search_request,
                MetastoreServiceClient::from_mock(mock_metastore),
                &cluster_client,
            )
            .await
            .unwrap();
            assert_eq!(
                search_response.num_hits,
                (TOTAL_NUM_HITS_INDEX_1 + TOTAL_NUM_HITS_INDEX_2) as u64
            );
            assert_eq!(search_response.hits.len(), MAX_HITS_PER_PAGE_LARGE);
            let expected = (0..TOTAL_NUM_HITS_INDEX_2)
                .rev()
                .zip(std::iter::repeat("split2"))
                .chain(
                    (0..TOTAL_NUM_HITS_INDEX_1)
                        .rev()
                        .zip(std::iter::repeat("split1")),
                );
            for (hit, (doc_id, split)) in search_response.hits.iter().zip(expected) {
                assert_eq!(
                    hit.partial_hit.as_ref().unwrap(),
                    &mock_partial_hit_opt_sort_value(split, None, doc_id as u32)
                );
            }
            count_seen_hits += search_response.hits.len();
            search_response.scroll_id.unwrap()
        };
        for page in 1.. {
            let scroll_req = ScrollRequest {
                scroll_id,
                scroll_ttl_secs: Some(60),
            };
            let scroll_resp =
                crate::service::scroll(scroll_req, &cluster_client, &searcher_context)
                    .await
                    .unwrap();
            assert_eq!(
                scroll_resp.num_hits,
                (TOTAL_NUM_HITS_INDEX_1 + TOTAL_NUM_HITS_INDEX_2) as u64
            );
            let expected = (0..TOTAL_NUM_HITS_INDEX_2)
                .rev()
                .zip(std::iter::repeat("split2"))
                .chain(
                    (0..TOTAL_NUM_HITS_INDEX_1)
                        .rev()
                        .zip(std::iter::repeat("split1")),
                )
                .skip(page * MAX_HITS_PER_PAGE_LARGE);
            for (hit, (doc_id, split)) in scroll_resp.hits.iter().zip(expected) {
                assert_eq!(
                    hit.partial_hit.as_ref().unwrap(),
                    &mock_partial_hit_opt_sort_value(split, None, doc_id as u32)
                );
            }
            scroll_id = scroll_resp.scroll_id.unwrap();
            count_seen_hits += scroll_resp.hits.len();
            if scroll_resp.hits.is_empty() {
                break;
            }
        }

        assert_eq!(
            count_seen_hits,
            TOTAL_NUM_HITS_INDEX_1 + TOTAL_NUM_HITS_INDEX_2
        );
    }

    #[tokio::test]
    async fn test_root_search_multi_indices() -> anyhow::Result<()> {
        let search_request = quickwit_proto::search::SearchRequest {
            index_id_patterns: vec!["test-index-*".to_string()],
            query_ast: qast_json_helper("test", &["body"]),
            max_hits: 10,
            ..Default::default()
        };
        let mut mock_metastore = MockMetastoreService::new();
        let index_metadata_1 = IndexMetadata::for_test("test-index-1", "ram:///test-index-1");
        let index_uid_1 = index_metadata_1.index_uid.clone();
        let index_metadata_2 =
            index_metadata_for_multi_indexes_test("test-index-2", "ram:///test-index-2");
        let index_uid_2 = index_metadata_2.index_uid.clone();
        let index_metadata_3 =
            index_metadata_for_multi_indexes_test("test-index-3", "ram:///test-index-3");
        let index_uid_3 = index_metadata_3.index_uid.clone();
        mock_metastore.expect_list_indexes_metadata().return_once(
            move |list_indexes_metadata_request: ListIndexesMetadataRequest| {
                let index_id_patterns = list_indexes_metadata_request.index_id_patterns;
                assert_eq!(&index_id_patterns, &["test-index-*".to_string()]);
                Ok(ListIndexesMetadataResponse::for_test(vec![
                    index_metadata_1,
                    index_metadata_2,
                    index_metadata_3,
                ]))
            },
        );
        mock_metastore
            .expect_list_splits()
            .return_once(move |list_splits_request| {
                let list_splits_query =
                    list_splits_request.deserialize_list_splits_query().unwrap();
                assert!(
                    list_splits_query.index_uids
                        == Some(vec![
                            index_uid_1.clone(),
                            index_uid_2.clone(),
                            index_uid_3.clone()
                        ])
                );
                let splits = vec![
                    MockSplitBuilder::new("index-1-split-1")
                        .with_index_uid(&index_uid_1)
                        .build(),
                    MockSplitBuilder::new("index-1-split-2")
                        .with_index_uid(&index_uid_1)
                        .build(),
                    MockSplitBuilder::new("index-2-split-1")
                        .with_index_uid(&index_uid_2)
                        .build(),
                ];
                let splits_response = ListSplitsResponse::try_from_splits(splits).unwrap();
                Ok(ServiceStream::from(vec![Ok(splits_response)]))
            });
        let mut mock_search_service_1 = MockSearchService::new();
        mock_search_service_1
            .expect_leaf_search()
            .times(1)
            .withf(|leaf_search_req| {
                (&leaf_search_req.index_uris[0] == "ram:///test-index-1"
                    && leaf_search_req.leaf_requests[0].split_offsets.len() == 2)
                    || (leaf_search_req.index_uris[0] == "ram:///test-index-2"
                        && leaf_search_req.leaf_requests[0].split_offsets[0].split_id
                            == "index-2-split-1")
            })
            .returning(
                |leaf_search_req: quickwit_proto::search::LeafSearchRequest| {
                    let mut partial_hits = leaf_search_req.leaf_requests[0]
                        .split_offsets
                        .iter()
                        .map(|split_offset| mock_partial_hit(&split_offset.split_id, 3, 1))
                        .collect_vec();
                    let partial_hits2 = leaf_search_req.leaf_requests[1]
                        .split_offsets
                        .iter()
                        .map(|split_offset| mock_partial_hit(&split_offset.split_id, 3, 1))
                        .collect_vec();
                    partial_hits.extend_from_slice(&partial_hits2);
                    let num_attempted_splits: u64 = leaf_search_req
                        .leaf_requests
                        .iter()
                        .map(|leaf_req| leaf_req.split_offsets.len() as u64)
                        .sum::<u64>();
                    Ok(quickwit_proto::search::LeafSearchResponse {
                        num_hits: leaf_search_req.leaf_requests[0].split_offsets.len() as u64
                            + leaf_search_req.leaf_requests[1].split_offsets.len() as u64,
                        partial_hits,
                        failed_splits: Vec::new(),
                        num_attempted_splits,
                        ..Default::default()
                    })
                },
            );
        mock_search_service_1
            .expect_fetch_docs()
            .times(2)
            .withf(|fetch_docs_req: &FetchDocsRequest| {
                (fetch_docs_req.index_uri == "ram:///test-index-1"
                    && fetch_docs_req.partial_hits.len() == 2)
                    || (fetch_docs_req.index_uri == "ram:///test-index-2"
                        && fetch_docs_req.partial_hits[0].split_id == "index-2-split-1")
            })
            .returning(|fetch_docs_req| {
                Ok(quickwit_proto::search::FetchDocsResponse {
                    hits: get_doc_for_fetch_req(fetch_docs_req),
                })
            });
        let searcher_pool = searcher_pool_for_test([("127.0.0.1:1001", mock_search_service_1)]);
        let search_job_placer = SearchJobPlacer::new(searcher_pool);
        let cluster_client = ClusterClient::new(search_job_placer.clone());
        let search_response = root_search(
            &SearcherContext::for_test(),
            search_request,
            MetastoreServiceClient::from_mock(mock_metastore),
            &cluster_client,
        )
        .await
        .unwrap();
        assert_eq!(search_response.num_hits, 3);
        assert_eq!(search_response.hits.len(), 3);
        assert_eq!(
            search_response
                .hits
                .iter()
                .map(|hit| &hit.index_id)
                .collect_vec(),
            vec!["test-index-1", "test-index-1", "test-index-2"]
        );
        Ok(())
    }

    #[tokio::test]
    async fn test_root_search_split_failures() -> anyhow::Result<()> {
        let search_request = quickwit_proto::search::SearchRequest {
            index_id_patterns: vec!["test-index-1".to_string()],
            query_ast: qast_json_helper("test", &["body"]),
            max_hits: 10,
            ..Default::default()
        };
        let mut mock_metastore = MockMetastoreService::new();
        let index_metadata_1 = IndexMetadata::for_test("test-index-1", "ram:///test-index-1");
        let index_uid_1 = index_metadata_1.index_uid.clone();
        mock_metastore.expect_list_indexes_metadata().return_once(
            move |_list_indexes_metadata_request: ListIndexesMetadataRequest| {
                Ok(ListIndexesMetadataResponse::for_test(vec![
                    index_metadata_1,
                ]))
            },
        );
        mock_metastore
            .expect_list_splits()
            .return_once(move |list_splits_request| {
                let list_splits_query =
                    list_splits_request.deserialize_list_splits_query().unwrap();
                assert!(list_splits_query.index_uids == Some(vec![index_uid_1.clone()]));
                let splits = vec![
                    MockSplitBuilder::new("index-1-split-1")
                        .with_index_uid(&index_uid_1)
                        .build(),
                    MockSplitBuilder::new("index-1-split-2")
                        .with_index_uid(&index_uid_1)
                        .build(),
                ];
                let splits_response = ListSplitsResponse::try_from_splits(splits).unwrap();
                Ok(ServiceStream::from(vec![Ok(splits_response)]))
            });
        let mut mock_search_service_1 = MockSearchService::new();
        mock_search_service_1
            .expect_leaf_search()
            .withf(
                |leaf_search_req: &quickwit_proto::search::LeafSearchRequest| {
                    leaf_search_req.leaf_requests.len() == 1
                        && leaf_search_req.leaf_requests[0].split_offsets.len() == 2
                },
            )
            .times(1)
            .returning(
                |_leaf_search_req: quickwit_proto::search::LeafSearchRequest| {
                    let partial_hits = vec![mock_partial_hit("index-1-split-1", 0u64, 1u32)];
                    Ok(quickwit_proto::search::LeafSearchResponse {
                        num_hits: 1,
                        partial_hits,
                        failed_splits: vec![{
                            SplitSearchError {
                                error: "some error".to_string(),
                                split_id: "index-1-split-1".to_string(),
                                retryable_error: true,
                            }
                        }],
                        num_attempted_splits: 3,
                        ..Default::default()
                    })
                },
            );
        mock_search_service_1
            .expect_leaf_search()
            .withf(
                |leaf_search_req: &quickwit_proto::search::LeafSearchRequest| {
                    leaf_search_req.leaf_requests.len() == 1
                        && leaf_search_req.leaf_requests[0].split_offsets.len() == 1
                },
            )
            .times(1)
            .returning(
                |_leaf_search_req: quickwit_proto::search::LeafSearchRequest| {
                    Ok(quickwit_proto::search::LeafSearchResponse {
                        num_hits: 0,
                        partial_hits: Vec::new(),
                        failed_splits: vec![{
                            SplitSearchError {
                                error: "some error".to_string(),
                                split_id: "index-1-split-1".to_string(),
                                retryable_error: true,
                            }
                        }],
                        num_attempted_splits: 1,
                        ..Default::default()
                    })
                },
            );
        mock_search_service_1
            .expect_fetch_docs()
            .times(1)
            .returning(|fetch_docs_req| {
                Ok(quickwit_proto::search::FetchDocsResponse {
                    hits: get_doc_for_fetch_req(fetch_docs_req),
                })
            });
        let searcher_pool = searcher_pool_for_test([("127.0.0.1:1001", mock_search_service_1)]);
        let search_job_placer = SearchJobPlacer::new(searcher_pool);
        let cluster_client = ClusterClient::new(search_job_placer.clone());
        let search_response = root_search(
            &SearcherContext::for_test(),
            search_request,
            MetastoreServiceClient::from_mock(mock_metastore),
            &cluster_client,
        )
        .await
        .unwrap();
        assert_eq!(search_response.num_hits, 1);
        assert_eq!(search_response.hits.len(), 1);
        assert_eq!(search_response.failed_splits.len(), 1);
        Ok(())
    }

    #[tokio::test]
    async fn test_root_search_too_many_splits() -> anyhow::Result<()> {
        let search_request = quickwit_proto::search::SearchRequest {
            index_id_patterns: vec!["test-index".to_string()],
            query_ast: qast_json_helper("test", &["body"]),
            max_hits: 10,
            ..Default::default()
        };
        let mut mock_metastore = MockMetastoreService::new();
        let index_metadata = IndexMetadata::for_test("test-index", "ram:///test-index");
        let index_uid = index_metadata.index_uid.clone();
        mock_metastore
            .expect_list_indexes_metadata()
            .returning(move |_index_ids_query| {
                Ok(ListIndexesMetadataResponse::for_test(vec![
                    index_metadata.clone(),
                ]))
            });
        mock_metastore
            .expect_list_splits()
            .returning(move |_filter| {
                let splits = vec![
                    MockSplitBuilder::new("split1")
                        .with_index_uid(&index_uid)
                        .build(),
                    MockSplitBuilder::new("split2")
                        .with_index_uid(&index_uid)
                        .build(),
                ];
                let splits_response = ListSplitsResponse::try_from_splits(splits).unwrap();
                Ok(ServiceStream::from(vec![Ok(splits_response)]))
            });
        let mock_search_service = MockSearchService::new();
        let searcher_pool = searcher_pool_for_test([("127.0.0.1:1001", mock_search_service)]);
        let search_job_placer = SearchJobPlacer::new(searcher_pool);
        let cluster_client = ClusterClient::new(search_job_placer.clone());

        let mut searcher_context = SearcherContext::for_test();
        searcher_context.searcher_config.max_splits_per_search = Some(1);
        let search_error = root_search(
            &searcher_context,
            search_request,
            MetastoreServiceClient::from_mock(mock_metastore),
            &cluster_client,
        )
        .await
        .unwrap_err();
        assert!(matches!(search_error, SearchError::InvalidArgument { .. }));
        Ok(())
    }

    #[tokio::test]
    async fn test_finalize_aggregation_if_any_no_aggregation_request() {
        let search_request = SearchRequest {
            aggregation_request: None,
            skip_aggregation_finalization: false,
            ..Default::default()
        };
        let searcher_context = SearcherContext::for_test();
        let result =
            finalize_aggregation_if_any(&search_request, Some(vec![1, 2, 3]), &searcher_context)
                .unwrap();
        assert!(result.is_none());
    }

    #[tokio::test]
    async fn test_finalize_aggregation_if_any_skip_finalization_returns_intermediate_bytes() {
        let agg_req = r#"{"avg_price": {"avg": {"field": "price"}}}"#;
        let intermediate_bytes = vec![42, 43, 44];
        let search_request = SearchRequest {
            aggregation_request: Some(agg_req.to_string()),
            skip_aggregation_finalization: true,
            ..Default::default()
        };
        let searcher_context = SearcherContext::for_test();
        let result = finalize_aggregation_if_any(
            &search_request,
            Some(intermediate_bytes.clone()),
            &searcher_context,
        )
        .unwrap();
        assert_eq!(result, Some(intermediate_bytes));
    }

    #[tokio::test]
    async fn test_finalize_aggregation_if_any_skip_finalization_none_bytes() {
        let agg_req = r#"{"avg_price": {"avg": {"field": "price"}}}"#;
        let search_request = SearchRequest {
            aggregation_request: Some(agg_req.to_string()),
            skip_aggregation_finalization: true,
            ..Default::default()
        };
        let searcher_context = SearcherContext::for_test();
        let result = finalize_aggregation_if_any(&search_request, None, &searcher_context).unwrap();
        assert!(result.is_none());
    }

    #[tokio::test]
    async fn test_finalize_aggregation_if_any_default_finalizes() {
        let agg_req = r#"{"avg_price": {"avg": {"field": "price"}}}"#;
        let intermediate_results = IntermediateAggregationResults::default();
        let intermediate_bytes = postcard::to_stdvec(&intermediate_results).unwrap();
        let search_request = SearchRequest {
            aggregation_request: Some(agg_req.to_string()),
            skip_aggregation_finalization: false,
            ..Default::default()
        };
        let searcher_context = SearcherContext::for_test();
        let result = finalize_aggregation_if_any(
            &search_request,
            Some(intermediate_bytes.clone()),
            &searcher_context,
        )
        .unwrap();
        // Result should be Some (finalized), but different from intermediate bytes
        assert!(result.is_some());
        assert_ne!(result.unwrap(), intermediate_bytes);
    }

    #[tokio::test]
    async fn test_finalize_aggregation_if_any_false_flag_finalizes() {
        let agg_req = r#"{"avg_price": {"avg": {"field": "price"}}}"#;
        let intermediate_results = IntermediateAggregationResults::default();
        let intermediate_bytes = postcard::to_stdvec(&intermediate_results).unwrap();
        let search_request = SearchRequest {
            aggregation_request: Some(agg_req.to_string()),
            skip_aggregation_finalization: false,
            ..Default::default()
        };
        let searcher_context = SearcherContext::for_test();
        let result = finalize_aggregation_if_any(
            &search_request,
            Some(intermediate_bytes.clone()),
            &searcher_context,
        )
        .unwrap();
        assert!(result.is_some());
        assert_ne!(result.unwrap(), intermediate_bytes);
    }
}


================================================
FILE: quickwit/quickwit-search/src/scroll_context.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::HashMap;
use std::fmt;
use std::ops::Range;
use std::str::FromStr;
use std::sync::Arc;
use std::time::Duration;

use anyhow::Context;
use base64::Engine;
use base64::prelude::BASE64_STANDARD;
use quickwit_common::metrics::GaugeGuard;
use quickwit_common::shared_consts::SCROLL_BATCH_LEN;
use quickwit_metastore::SplitMetadata;
use quickwit_proto::search::{LeafSearchResponse, PartialHit, SearchRequest, SplitSearchError};
use quickwit_proto::types::IndexUid;
use serde::{Deserialize, Serialize};
use tokio::sync::RwLock;
use ttl_cache::TtlCache;
use ulid::Ulid;

use crate::ClusterClient;
use crate::root::IndexMetasForLeafSearch;
use crate::service::SearcherContext;

/// Maximum number of values in the local search KV store.
///
/// TODO make configurable.
///
/// Assuming a search context of 1MB, this can
/// amount to up to 1GB.
const LOCAL_KV_CACHE_SIZE: usize = 1_000;

#[derive(Serialize, Deserialize)]
pub(crate) struct ScrollContext {
    pub split_metadatas: Vec<SplitMetadata>,
    pub search_request: SearchRequest,
    pub indexes_metas_for_leaf_search: HashMap<IndexUid, IndexMetasForLeafSearch>,
    pub total_num_hits: u64,
    pub max_hits_per_page: u64,
    pub cached_partial_hits_start_offset: u64,
    pub cached_partial_hits: Vec<PartialHit>,
    pub failed_splits: Vec<SplitSearchError>,
    pub num_successful_splits: u64,
}

impl ScrollContext {
    /// Returns as many results in cache.
    pub fn get_cached_partial_hits(&self, doc_range: Range<u64>) -> &[PartialHit] {
        if doc_range.end <= doc_range.start {
            return &[];
        }
        if doc_range.start < self.cached_partial_hits_start_offset {
            return &[];
        }
        if doc_range.start
            >= self.cached_partial_hits_start_offset + self.cached_partial_hits.len() as u64
        {
            return &[];
        }
        let truncated_partial_hits = &self.cached_partial_hits
            [(doc_range.start - self.cached_partial_hits_start_offset) as usize..];
        let num_partial_hits = truncated_partial_hits
            .len()
            .min((doc_range.end - doc_range.start) as usize);
        &truncated_partial_hits[..num_partial_hits]
    }

    /// Clear cache if it wouldn't be useful, i.e. if page size is greater than SCROLL_BATCH_LEN
    pub fn clear_cache_if_unneeded(&mut self) {
        if self.search_request.max_hits > SCROLL_BATCH_LEN as u64 {
            self.cached_partial_hits.clear();
        }
    }

    pub fn serialize(&self) -> Vec<u8> {
        let uncompressed_payload = serde_json::to_string(self).unwrap();
        uncompressed_payload.as_bytes().to_vec()
    }

    pub fn load(payload: &[u8]) -> anyhow::Result<Self> {
        let scroll_context =
            serde_json::from_slice(payload).context("failed to deserialize context")?;
        Ok(scroll_context)
    }

    /// Loads in the `ScrollContext` cache all the
    /// hits in range [start_offset..start_offset + SCROLL_BATCH_LEN).
    pub async fn load_batch_starting_at(
        &mut self,
        start_offset: u64,
        previous_last_hit: PartialHit,
        cluster_client: &ClusterClient,
        searcher_context: &SearcherContext,
    ) -> crate::Result<bool> {
        self.search_request.search_after = Some(previous_last_hit);
        let leaf_search_response: LeafSearchResponse = crate::root::search_partial_hits_phase(
            searcher_context,
            &self.indexes_metas_for_leaf_search,
            &self.search_request,
            &self.split_metadatas[..],
            cluster_client,
        )
        .await?;
        self.cached_partial_hits_start_offset = start_offset;
        self.cached_partial_hits = leaf_search_response.partial_hits;
        Ok(true)
    }
}

struct TrackedValue {
    content: Vec<u8>,
    _total_size_metric_guard: GaugeGuard<'static>,
}

/// In memory key value store with TTL and limited size.
///
/// Once the capacity [LOCAL_KV_CACHE_SIZE] is reached, the oldest entries are
/// removed.
///
/// Currently this store is only used for caching scroll contexts. Using it for
/// other purposes is risky as use cases would compete for its capacity.
#[derive(Clone)]
pub(crate) struct MiniKV {
    ttl_with_cache: Arc<RwLock<TtlCache<Vec<u8>, TrackedValue>>>,
}

impl Default for MiniKV {
    fn default() -> MiniKV {
        MiniKV {
            ttl_with_cache: Arc::new(RwLock::new(TtlCache::new(LOCAL_KV_CACHE_SIZE))),
        }
    }
}

impl MiniKV {
    pub async fn put(&self, key: Vec<u8>, payload: Vec<u8>, ttl: Duration) {
        let mut metric_guard =
            GaugeGuard::from_gauge(&crate::SEARCH_METRICS.searcher_local_kv_store_size_bytes);
        metric_guard.add(payload.len() as i64);
        let mut cache_lock = self.ttl_with_cache.write().await;
        cache_lock.insert(
            key,
            TrackedValue {
                content: payload,
                _total_size_metric_guard: metric_guard,
            },
            ttl,
        );
    }

    pub async fn get(&self, key: &[u8]) -> Option<Vec<u8>> {
        let cache_lock = self.ttl_with_cache.read().await;
        let tracked_value = cache_lock.get(key)?;
        Some(tracked_value.content.clone())
    }
}

#[derive(Serialize, Deserialize, Clone, Eq, PartialEq, Debug)]
pub(crate) struct ScrollKeyAndStartOffset {
    scroll_ulid: Ulid,
    pub(crate) start_offset: u64,
    // this is set to zero if there are no more documents
    pub(crate) max_hits_per_page: u32,
    pub(crate) search_after: PartialHit,
}

impl ScrollKeyAndStartOffset {
    pub fn new_with_start_offset(
        start_offset: u64,
        max_hits_per_page: u32,
        search_after: PartialHit,
    ) -> ScrollKeyAndStartOffset {
        let scroll_ulid: Ulid = Ulid::new();
        // technically we could only initialize search_after on first call to next_page, and use
        // default() before, but that feels like partial initialization.
        ScrollKeyAndStartOffset {
            scroll_ulid,
            start_offset,
            max_hits_per_page,
            search_after,
        }
    }

    pub fn next_page(
        mut self,
        found_hits_in_current_page: u64,
        last_hit: PartialHit,
    ) -> ScrollKeyAndStartOffset {
        self.start_offset += found_hits_in_current_page;
        if found_hits_in_current_page < self.max_hits_per_page as u64 {
            self.max_hits_per_page = 0;
        }
        self.search_after = last_hit;
        self
    }

    pub fn scroll_key(&self) -> [u8; 16] {
        u128::from(self.scroll_ulid).to_le_bytes()
    }
}

impl fmt::Display for ScrollKeyAndStartOffset {
    fn fmt(&self, formatter: &mut fmt::Formatter) -> fmt::Result {
        let mut payload = vec![0u8; 28];
        payload[..16].copy_from_slice(&u128::from(self.scroll_ulid).to_le_bytes());
        payload[16..24].copy_from_slice(&self.start_offset.to_le_bytes());
        payload[24..28].copy_from_slice(&self.max_hits_per_page.to_le_bytes());
        serde_json::to_writer(&mut payload, &self.search_after)
            .expect("serializing PartialHit should never fail");
        let b64_payload = BASE64_STANDARD.encode(payload);
        write!(formatter, "{b64_payload}")
    }
}

impl FromStr for ScrollKeyAndStartOffset {
    type Err = &'static str;

    fn from_str(scroll_id_str: &str) -> Result<Self, Self::Err> {
        let base64_decoded: Vec<u8> = BASE64_STANDARD
            .decode(scroll_id_str)
            .map_err(|_| "scroll id is invalid base64.")?;
        if base64_decoded.len() <= 16 + 8 + 4 {
            return Err("scroll id payload is truncated");
        }
        let (scroll_ulid_bytes, from_bytes, max_hits_bytes) = (
            &base64_decoded[..16],
            &base64_decoded[16..24],
            &base64_decoded[24..28],
        );
        let scroll_ulid = u128::from_le_bytes(scroll_ulid_bytes.try_into().unwrap()).into();
        let from = u64::from_le_bytes(from_bytes.try_into().unwrap());
        let max_hits = u32::from_le_bytes(max_hits_bytes.try_into().unwrap());
        if max_hits > 10_000 {
            return Err("scroll id is malformed");
        }
        let search_after =
            serde_json::from_slice(&base64_decoded[28..]).map_err(|_| "scroll id is malformed")?;
        Ok(ScrollKeyAndStartOffset {
            scroll_ulid,
            start_offset: from,
            max_hits_per_page: max_hits,
            search_after,
        })
    }
}

#[cfg(test)]
mod tests {
    use std::str::FromStr;

    use quickwit_proto::search::PartialHit;

    use crate::scroll_context::ScrollKeyAndStartOffset;

    #[test]
    fn test_scroll_id() {
        let partial_hit = PartialHit {
            sort_value: None,
            sort_value2: None,
            split_id: "split".to_string(),
            segment_ord: 1,
            doc_id: 2,
        };
        let scroll = ScrollKeyAndStartOffset::new_with_start_offset(10, 100, partial_hit);
        let scroll_str = scroll.to_string();
        let ser_deser_scroll = ScrollKeyAndStartOffset::from_str(&scroll_str).unwrap();
        assert_eq!(scroll, ser_deser_scroll);
    }
}


================================================
FILE: quickwit/quickwit-search/src/search_job_placer.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::cmp::Ordering;
use std::collections::{HashMap, HashSet};
use std::fmt;
use std::hash::{Hash, Hasher};
use std::net::SocketAddr;

use anyhow::bail;
use async_trait::async_trait;
use quickwit_common::SocketAddrLegacyHash;
use quickwit_common::pubsub::EventSubscriber;
use quickwit_common::rendezvous_hasher::{node_affinity, sort_by_rendez_vous_hash};
use quickwit_proto::search::{ReportSplit, ReportSplitsRequest};
use tracing::{info, warn};

use crate::{SEARCH_METRICS, SearchJob, SearchServiceClient, SearcherPool};

/// Job.
/// The unit in which distributed search is performed.
///
/// The `split_id` is used to define an affinity between a leaf nodes and a job.
/// The `cost` is used to spread the work evenly amongst nodes.
pub trait Job {
    /// Split ID of the targeted split.
    fn split_id(&self) -> &str;

    /// Estimation of the load associated with running a given job.
    ///
    /// A list of jobs will be assigned to leaf nodes in a way that spread
    /// the sum of cost evenly.
    fn cost(&self) -> usize;

    /// Compares the cost of two jobs in reverse order, breaking ties by split ID.
    fn compare_cost(&self, other: &Self) -> Ordering {
        self.cost()
            .cmp(&other.cost())
            .reverse()
            .then_with(|| self.split_id().cmp(other.split_id()))
    }
}

/// Search job placer.
/// It assigns jobs to search clients.
#[derive(Clone, Default)]
pub struct SearchJobPlacer {
    /// Search clients pool.
    searcher_pool: SearcherPool,
}

#[async_trait]
impl EventSubscriber<ReportSplitsRequest> for SearchJobPlacer {
    async fn handle_event(&mut self, evt: ReportSplitsRequest) {
        let mut nodes: HashMap<SocketAddr, SearchServiceClient> =
            self.searcher_pool.pairs().into_iter().collect();
        if nodes.is_empty() {
            return;
        }
        let mut splits_per_node: HashMap<SocketAddr, Vec<ReportSplit>> =
            HashMap::with_capacity(nodes.len().min(evt.report_splits.len()));
        for report_split in evt.report_splits {
            let node_addr = nodes
                .keys()
                .max_by_key(|node_addr| {
                    node_affinity(SocketAddrLegacyHash(node_addr), &report_split.split_id)
                })
                // This actually never happens thanks to the if-condition at the
                // top of this function.
                .expect("`nodes` should not be empty");
            splits_per_node
                .entry(*node_addr)
                .or_default()
                .push(report_split);
        }
        for (node_addr, report_splits) in splits_per_node {
            if let Some(search_client) = nodes.get_mut(&node_addr) {
                let report_splits_req = ReportSplitsRequest { report_splits };
                let _ = search_client.report_splits(report_splits_req).await;
            }
        }
    }
}

impl fmt::Debug for SearchJobPlacer {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        f.debug_struct("SearchJobPlacer").finish()
    }
}

impl SearchJobPlacer {
    /// Returns an [`SearchJobPlacer`] from a search service client pool.
    pub fn new(searcher_pool: SearcherPool) -> Self {
        Self { searcher_pool }
    }
}

struct SocketAddrAndClient {
    socket_addr: SocketAddr,
    client: SearchServiceClient,
}

impl Hash for SocketAddrAndClient {
    fn hash<H: Hasher>(&self, hasher: &mut H) {
        SocketAddrLegacyHash(&self.socket_addr).hash(hasher);
    }
}

impl SearchJobPlacer {
    /// Returns an iterator over the search nodes, ordered by their affinity
    /// with the `affinity_key`, as defined by rendez-vous hashing.
    pub async fn best_nodes_per_affinity(
        &self,
        affinity_key: &[u8],
    ) -> impl Iterator<Item = SearchServiceClient> {
        let mut nodes: Vec<SocketAddrAndClient> = self
            .searcher_pool
            .pairs()
            .into_iter()
            .map(|(socket_addr, client)| SocketAddrAndClient {
                socket_addr,
                client,
            })
            .collect();
        sort_by_rendez_vous_hash(&mut nodes[..], affinity_key);
        nodes
            .into_iter()
            .map(|socket_addr_and_client| socket_addr_and_client.client)
    }

    /// Assign the given job to the clients
    /// Returns a list of pair (SocketAddr, `Vec<Job>`)
    ///
    /// When exclude_addresses filters all clients it is ignored.
    pub async fn assign_jobs<J: Job>(
        &self,
        mut jobs: Vec<J>,
        excluded_addrs: &HashSet<SocketAddr>,
    ) -> anyhow::Result<impl Iterator<Item = (SearchServiceClient, Vec<J>)> + use<J>> {
        let mut all_nodes = self.searcher_pool.pairs();

        if all_nodes.is_empty() {
            bail!(
                "failed to assign search jobs: there are no available searcher nodes in the \
                 cluster"
            );
        }
        if !excluded_addrs.is_empty() && excluded_addrs.len() < all_nodes.len() {
            all_nodes.retain(|(grpc_addr, _)| !excluded_addrs.contains(grpc_addr));

            // This should never happen, but... belt and suspenders policy.
            if all_nodes.is_empty() {
                bail!(
                    "failed to assign search jobs: there are no searcher nodes candidates for \
                     these jobs"
                );
            }
            info!(
                "excluded {} nodes from search job placement, {} remaining",
                excluded_addrs.len(),
                all_nodes.len()
            );
        }
        let mut candidate_nodes: Vec<CandidateNode> = all_nodes
            .into_iter()
            .map(|(grpc_addr, client)| CandidateNode {
                grpc_addr,
                client,
                load: 0,
            })
            .collect();

        jobs.sort_unstable_by(Job::compare_cost);

        let num_nodes = candidate_nodes.len();

        let mut job_assignments: HashMap<SocketAddr, (SearchServiceClient, Vec<J>)> =
            HashMap::with_capacity(num_nodes);

        let total_load: usize = jobs.iter().map(|job| job.cost()).sum();

        // allow around 5% disparity. Round up so we never end up in a case where
        // target_load * num_nodes < total_load
        // some of our tests needs 2 splits to be put on 2 different searchers. It makes sense for
        // these tests to keep doing so (testing root merge). Either we can make the allowed
        // difference stricter, find the right split names ("split6" instead of "split2" works).
        // or modify mock_split_meta() so that not all splits have the same job cost
        // for now i went with the mock_split_meta() changes.
        const ALLOWED_DIFFERENCE: usize = 105;
        let target_load = (total_load * ALLOWED_DIFFERENCE).div_ceil(num_nodes * 100);
        for job in jobs {
            sort_by_rendez_vous_hash(&mut candidate_nodes, job.split_id());

            let (chosen_node_idx, chosen_node) = if let Some((idx, node)) = candidate_nodes
                .iter_mut()
                .enumerate()
                .find(|(_pos, node)| node.load < target_load)
            {
                (idx, node)
            } else {
                warn!("found no lightly loaded searcher for split, this should never happen");
                (0, &mut candidate_nodes[0])
            };
            let metric_node_idx = match chosen_node_idx {
                0 => "0",
                1 => "1",
                _ => "> 1",
            };
            SEARCH_METRICS
                .job_assigned_total
                .with_label_values([metric_node_idx])
                .inc();
            chosen_node.load += job.cost();

            job_assignments
                .entry(chosen_node.grpc_addr)
                .or_insert_with(|| (chosen_node.client.clone(), Vec::new()))
                .1
                .push(job);
        }
        Ok(job_assignments.into_values())
    }

    /// Assigns a single job to a client.
    pub async fn assign_job<J: Job>(
        &self,
        job: J,
        excluded_addrs: &HashSet<SocketAddr>,
    ) -> anyhow::Result<SearchServiceClient> {
        let client = self
            .assign_jobs(vec![job], excluded_addrs)
            .await?
            .next()
            .map(|(client, _jobs)| client)
            .expect("`assign_jobs` should return at least one client or fail.");
        Ok(client)
    }
}

#[derive(Debug, Clone)]
struct CandidateNode {
    pub grpc_addr: SocketAddr,
    pub client: SearchServiceClient,
    pub load: usize,
}

impl Hash for CandidateNode {
    fn hash<H: Hasher>(&self, state: &mut H) {
        SocketAddrLegacyHash(&self.grpc_addr).hash(state);
    }
}

impl PartialEq for CandidateNode {
    fn eq(&self, other: &Self) -> bool {
        self.grpc_addr == other.grpc_addr
    }
}

impl Eq for CandidateNode {}

/// Groups jobs by index id and returns a list of `SearchJob` per index
pub fn group_jobs_by_index_id(
    jobs: Vec<SearchJob>,
    cb: impl FnMut(Vec<SearchJob>) -> crate::Result<()>,
) -> crate::Result<()> {
    // Group jobs by index uid.
    group_by(jobs, |job| &job.index_uid, cb)?;
    Ok(())
}

/// Note: The data will be sorted.
///
/// Returns slices of the input data grouped by passed closure.
pub fn group_by<T, K: Ord, F>(
    mut data: Vec<T>,
    compare_by: impl Fn(&T) -> &K,
    mut callback: F,
) -> crate::Result<()>
where
    F: FnMut(Vec<T>) -> crate::Result<()>,
{
    data.sort_by(|job1, job2| compare_by(job2).cmp(compare_by(job1)));
    while !data.is_empty() {
        let last_element = data.last().unwrap();
        let count = data
            .iter()
            .rev()
            .take_while(|&x| compare_by(x) == compare_by(last_element))
            .count();

        let group = data.split_off(data.len() - count);
        callback(group)?;
    }

    Ok(())
}

#[cfg(test)]
mod tests {
    use super::*;
    use crate::{MockSearchService, SearchJob, searcher_pool_for_test};

    #[test]
    fn test_group_by_1() {
        let data = vec![1, 1, 2, 2, 2, 3, 4, 4, 5, 5, 5];
        let mut outputs: Vec<Vec<i32>> = Vec::new();
        group_by(
            data,
            |el| el,
            |group| {
                outputs.push(group);
                Ok(())
            },
        )
        .unwrap();
        assert_eq!(outputs.len(), 5);
        assert_eq!(outputs[0], vec![1, 1]);
        assert_eq!(outputs[1], vec![2, 2, 2]);
        assert_eq!(outputs[2], vec![3]);
        assert_eq!(outputs[3], vec![4, 4]);
        assert_eq!(outputs[4], vec![5, 5, 5]);
    }
    #[test]
    fn test_group_by_all_same() {
        let data = vec![1, 1];
        let mut outputs: Vec<Vec<i32>> = Vec::new();
        group_by(
            data,
            |el| el,
            |group| {
                outputs.push(group);
                Ok(())
            },
        )
        .unwrap();
        assert_eq!(outputs.len(), 1);
        assert_eq!(outputs[0], vec![1, 1]);
    }
    #[test]
    fn test_group_by_empty() {
        let data = vec![];
        let mut outputs: Vec<Vec<i32>> = Vec::new();
        group_by(
            data,
            |el| el,
            |group| {
                outputs.push(group);
                Ok(())
            },
        )
        .unwrap();
        assert_eq!(outputs.len(), 0);
    }

    #[tokio::test]
    async fn test_search_job_placer() {
        {
            let searcher_pool = SearcherPool::default();
            let search_job_placer = SearchJobPlacer::new(searcher_pool);
            assert!(
                search_job_placer
                    .assign_jobs::<SearchJob>(Vec::new(), &HashSet::new())
                    .await
                    .is_err()
            );
        }
        {
            let searcher_pool =
                searcher_pool_for_test([("127.0.0.1:1001", MockSearchService::new())]);
            let search_job_placer = SearchJobPlacer::new(searcher_pool);
            let jobs = vec![
                SearchJob::for_test("split1", 1),
                SearchJob::for_test("split2", 2),
                SearchJob::for_test("split3", 3),
                SearchJob::for_test("split4", 4),
            ];
            let assigned_jobs: Vec<(SocketAddr, Vec<SearchJob>)> = search_job_placer
                .assign_jobs(jobs, &HashSet::default())
                .await
                .unwrap()
                .map(|(client, jobs)| (client.grpc_addr(), jobs))
                .collect();
            let expected_searcher_addr: SocketAddr = ([127, 0, 0, 1], 1001).into();
            let expected_assigned_jobs = vec![(
                expected_searcher_addr,
                vec![
                    SearchJob::for_test("split4", 4),
                    SearchJob::for_test("split3", 3),
                    SearchJob::for_test("split2", 2),
                    SearchJob::for_test("split1", 1),
                ],
            )];
            assert_eq!(assigned_jobs, expected_assigned_jobs);
        }
        {
            let searcher_pool = searcher_pool_for_test([
                ("127.0.0.1:1001", MockSearchService::new()),
                ("127.0.0.1:1002", MockSearchService::new()),
            ]);
            let search_job_placer = SearchJobPlacer::new(searcher_pool);
            let jobs = vec![
                SearchJob::for_test("split1", 1),
                SearchJob::for_test("split2", 2),
                SearchJob::for_test("split3", 3),
                SearchJob::for_test("split4", 4),
                SearchJob::for_test("split5", 5),
                SearchJob::for_test("split6", 6),
            ];
            let mut assigned_jobs: Vec<(SocketAddr, Vec<SearchJob>)> = search_job_placer
                .assign_jobs(jobs, &HashSet::default())
                .await
                .unwrap()
                .map(|(client, jobs)| (client.grpc_addr(), jobs))
                .collect();
            assigned_jobs.sort_unstable_by_key(|(node_uid, _)| *node_uid);

            let expected_searcher_addr_1: SocketAddr = ([127, 0, 0, 1], 1001).into();
            let expected_searcher_addr_2: SocketAddr = ([127, 0, 0, 1], 1002).into();
            // on a small number of splits, we may be unbalanced
            let expected_assigned_jobs = vec![
                (
                    expected_searcher_addr_1,
                    vec![
                        SearchJob::for_test("split5", 5),
                        SearchJob::for_test("split4", 4),
                        SearchJob::for_test("split3", 3),
                    ],
                ),
                (
                    expected_searcher_addr_2,
                    vec![
                        SearchJob::for_test("split6", 6),
                        SearchJob::for_test("split2", 2),
                        SearchJob::for_test("split1", 1),
                    ],
                ),
            ];
            assert_eq!(assigned_jobs, expected_assigned_jobs);
        }
        {
            let searcher_pool = searcher_pool_for_test([
                ("127.0.0.1:1001", MockSearchService::new()),
                ("127.0.0.1:1002", MockSearchService::new()),
            ]);
            let search_job_placer = SearchJobPlacer::new(searcher_pool);
            let jobs = vec![
                SearchJob::for_test("split1", 1000),
                SearchJob::for_test("split2", 1),
            ];
            let mut assigned_jobs: Vec<(SocketAddr, Vec<SearchJob>)> = search_job_placer
                .assign_jobs(jobs, &HashSet::default())
                .await
                .unwrap()
                .map(|(client, jobs)| (client.grpc_addr(), jobs))
                .collect();
            assigned_jobs.sort_unstable_by_key(|(node_uid, _)| *node_uid);

            let expected_searcher_addr_1: SocketAddr = ([127, 0, 0, 1], 1001).into();
            let expected_searcher_addr_2: SocketAddr = ([127, 0, 0, 1], 1002).into();
            let expected_assigned_jobs = vec![
                (
                    expected_searcher_addr_1,
                    vec![SearchJob::for_test("split1", 1000)],
                ),
                (
                    expected_searcher_addr_2,
                    vec![SearchJob::for_test("split2", 1)],
                ),
            ];
            assert_eq!(assigned_jobs, expected_assigned_jobs);
        }
    }

    #[tokio::test]
    async fn test_search_job_placer_many_splits() {
        let searcher_pool = searcher_pool_for_test([
            ("127.0.0.1:1001", MockSearchService::new()),
            ("127.0.0.1:1002", MockSearchService::new()),
            ("127.0.0.1:1003", MockSearchService::new()),
            ("127.0.0.1:1004", MockSearchService::new()),
            ("127.0.0.1:1005", MockSearchService::new()),
        ]);
        let search_job_placer = SearchJobPlacer::new(searcher_pool);
        let jobs = (0..1000)
            .map(|id| SearchJob::for_test(&format!("split{id}"), 1))
            .collect();
        let jobs_len: Vec<usize> = search_job_placer
            .assign_jobs(jobs, &HashSet::default())
            .await
            .unwrap()
            .map(|(_, jobs)| jobs.len())
            .collect();
        for job_len in jobs_len {
            assert!(job_len <= 1050 / 5);
        }
    }
}


================================================
FILE: quickwit/quickwit-search/src/search_permit_provider.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::BinaryHeap;
use std::collections::binary_heap::PeekMut;
use std::future::Future;
use std::pin::Pin;
use std::sync::Arc;
use std::task::{Context, Poll};

use bytesize::ByteSize;
use quickwit_common::metrics::GaugeGuard;
use quickwit_proto::search::SplitIdAndFooterOffsets;
use tokio::sync::{mpsc, oneshot};

/// Distributor of permits to perform split search operation.
///
/// Requests are served in order. Each permit initially reserves a slot for the
/// warmup (limit concurrent downloads) and a pessimistic amount of memory. Once
/// the warmup is completed, the actual memory usage is set and the warmup slot
/// is released. Once the search is completed and the permit is dropped, the
/// remaining memory is also released.
#[derive(Clone)]
pub struct SearchPermitProvider {
    message_sender: mpsc::UnboundedSender<SearchPermitMessage>,
    #[allow(dead_code)]
    actor_join_handle: Arc<tokio::task::JoinHandle<SearchPermitActor>>,
}

pub enum SearchPermitMessage {
    RequestWithOffload {
        permit_sizes: Vec<u64>,
        /// Maximum number of pending requests. If granting all
        /// requested permits would cause the number of pending requests to exceed this threshold,
        /// some permits will be offloaded to Lambda.
        offload_threshold: usize,
        /// Channel to return the result message from the actor.
        /// When offloading permits, the number of futures can be < to the number of requested
        /// permits.
        permit_resp_tx: oneshot::Sender<Vec<SearchPermitFuture>>,
    },
    UpdateMemory {
        memory_delta: i64,
    },
    FreeWarmupSlot,
    Drop {
        memory_size: u64,
        warmup_slot_freed: bool,
    },
}

/// Makes very pessimistic estimate of the memory allocation required for a split search
///
/// This is refined later on when more data is available about the split.
pub fn compute_initial_memory_allocation(
    split: &SplitIdAndFooterOffsets,
    warmup_single_split_initial_allocation: ByteSize,
) -> ByteSize {
    let split_size = split.split_footer_start;
    // we consider the configured initial allocation to be set for a large split with 10M docs
    const LARGE_SPLIT_NUM_DOCS: u64 = 10_000_000;
    let proportional_allocation =
        warmup_single_split_initial_allocation.as_u64() * split.num_docs / LARGE_SPLIT_NUM_DOCS;
    let size_bytes = [
        split_size,
        proportional_allocation,
        warmup_single_split_initial_allocation.as_u64(),
    ]
    .into_iter()
    .min()
    .unwrap();
    const MINIMUM_ALLOCATION_BYTES: u64 = 10_000_000;
    ByteSize(size_bytes.max(MINIMUM_ALLOCATION_BYTES))
}

impl SearchPermitProvider {
    pub fn new(num_download_slots: usize, memory_budget: ByteSize) -> Self {
        let (message_sender, message_receiver) = mpsc::unbounded_channel();
        let actor = SearchPermitActor {
            msg_receiver: message_receiver,
            msg_sender: message_sender.downgrade(),
            num_warmup_slots_available: num_download_slots,
            total_memory_budget: memory_budget.as_u64(),
            permits_requests: BinaryHeap::new(),
            total_memory_allocated: 0u64,
        };
        let actor_join_handle = Arc::new(tokio::spawn(actor.run()));
        Self {
            message_sender,
            actor_join_handle,
        }
    }

    #[cfg(test)]
    async fn stop_and_unwrap(self) -> SearchPermitActor {
        let SearchPermitProvider {
            message_sender,
            actor_join_handle,
            ..
        } = self;
        drop(message_sender);
        Arc::into_inner(actor_join_handle).unwrap().await.unwrap()
    }

    /// Returns permits for local splits
    ///
    /// The returned futures are guaranteed to resolve in order.
    pub async fn get_permits(&self, splits: Vec<ByteSize>) -> Vec<SearchPermitFuture> {
        self.get_permits_with_offload(splits, usize::MAX).await
    }

    /// Returns permits for local splits and a list of split indices to offload.
    ///
    /// The actor checks the current pending queue depth. If adding all splits
    /// would exceed `offload_threshold` pending requests, only enough splits
    /// to fill up to the threshold are processed locally; the rest are offloaded.
    ///
    /// The returned futures are guaranteed to resolve in order.
    ///
    /// If `offload_threshold` is 0, all splits are offloaded.
    /// If `offload_threshold` is usize::MAX, all splits are processed locally.
    pub async fn get_permits_with_offload(
        &self,
        splits: Vec<ByteSize>,
        offload_threshold: usize,
    ) -> Vec<SearchPermitFuture> {
        if splits.is_empty() {
            return Vec::new();
        }
        let (permit_sender, permit_receiver) = oneshot::channel();
        let permit_sizes = splits.into_iter().map(|size| size.as_u64()).collect();
        self.message_sender
            .send(SearchPermitMessage::RequestWithOffload {
                permit_resp_tx: permit_sender,
                permit_sizes,
                offload_threshold,
            })
            .expect("Receiver lives longer than sender");
        permit_receiver
            .await
            .expect("Receiver lives longer than sender")
    }
}

struct SearchPermitActor {
    msg_receiver: mpsc::UnboundedReceiver<SearchPermitMessage>,
    msg_sender: mpsc::WeakUnboundedSender<SearchPermitMessage>,
    num_warmup_slots_available: usize,
    /// Note it is possible for memory_allocated to exceed memory_budget temporarily,
    /// if and only if a split leaf search task ended up using more than `initial_allocation`.
    /// When it happens, new permits will not be assigned until the memory is freed.
    total_memory_budget: u64,
    total_memory_allocated: u64,
    permits_requests: BinaryHeap<LeafPermitRequest>,
}

struct SingleSplitPermitRequest {
    permit_sender: oneshot::Sender<SearchPermit>,
    permit_size: u64,
}

struct LeafPermitRequest {
    /// Single split permit requests for this leaf search.
    single_split_permit_requests: std::vec::IntoIter<SingleSplitPermitRequest>,
}

impl Ord for LeafPermitRequest {
    fn cmp(&self, other: &Self) -> std::cmp::Ordering {
        // we compare other with self and not the other way arround because we want a min-heap and
        // Rust's is a max-heap
        other
            .single_split_permit_requests
            .as_slice()
            .len()
            .cmp(&self.single_split_permit_requests.as_slice().len())
    }
}

impl PartialOrd for LeafPermitRequest {
    fn partial_cmp(&self, other: &Self) -> Option<std::cmp::Ordering> {
        Some(self.cmp(other))
    }
}

impl PartialEq for LeafPermitRequest {
    fn eq(&self, other: &Self) -> bool {
        self.cmp(other).is_eq()
    }
}

impl Eq for LeafPermitRequest {}

impl LeafPermitRequest {
    // `permit_sizes` must not be empty.
    fn from_estimated_costs(permit_sizes: Vec<u64>) -> (Self, Vec<SearchPermitFuture>) {
        assert!(!permit_sizes.is_empty(), "permit_sizes must not be empty");
        let mut permits = Vec::with_capacity(permit_sizes.len());
        let mut single_split_permit_requests = Vec::with_capacity(permit_sizes.len());
        for permit_size in permit_sizes {
            let (tx, rx) = oneshot::channel();
            // we keep our internal list of permits and the returned wait handles in the
            // same order to make sure we emit each permit in the right order. Doing otherwise
            // may cause deadlocks
            single_split_permit_requests.push(SingleSplitPermitRequest {
                permit_sender: tx,
                permit_size,
            });
            permits.push(SearchPermitFuture(rx));
        }
        (
            LeafPermitRequest {
                single_split_permit_requests: single_split_permit_requests.into_iter(),
            },
            permits,
        )
    }

    fn pop_if_smaller_than(&mut self, max_size: u64) -> Option<SingleSplitPermitRequest> {
        let peeked_single_split_req = self.single_split_permit_requests.as_slice().first()?;
        if peeked_single_split_req.permit_size > max_size {
            return None;
        }
        self.single_split_permit_requests.next()
    }

    fn is_empty(&self) -> bool {
        self.single_split_permit_requests.as_slice().is_empty()
    }
}

impl SearchPermitActor {
    async fn run(mut self) -> Self {
        // Stops when the last clone of SearchPermitProvider is dropped.
        while let Some(msg) = self.msg_receiver.recv().await {
            self.handle_message(msg);
        }
        self
    }

    fn handle_message(&mut self, msg: SearchPermitMessage) {
        match msg {
            SearchPermitMessage::RequestWithOffload {
                mut permit_sizes,
                permit_resp_tx: permit_sender,
                offload_threshold,
            } => {
                let current_pending = self
                    .permits_requests
                    .iter()
                    .map(|req| req.single_split_permit_requests.as_slice().len())
                    .sum();
                // How many new splits can we accept locally before hitting the threshold.
                let local_capacity = offload_threshold.saturating_sub(current_pending);

                // If this indeed truncates the permit_sizes vector, other splits will be offloaded
                // to lambdas.
                permit_sizes.truncate(local_capacity);

                // We special case here in order to avoid pushing empty request in the queue.
                // (they would never be removed)
                if permit_sizes.is_empty() {
                    let _ = permit_sender.send(Vec::new());
                    return;
                }

                let (leaf_permit_request, permit_futures) =
                    LeafPermitRequest::from_estimated_costs(permit_sizes);
                self.permits_requests.push(leaf_permit_request);
                self.assign_available_permits();
                let _ = permit_sender.send(permit_futures);
            }
            SearchPermitMessage::UpdateMemory { memory_delta } => {
                if self.total_memory_allocated as i64 + memory_delta < 0 {
                    panic!("More memory released than allocated, should never happen.")
                }
                self.total_memory_allocated =
                    (self.total_memory_allocated as i64 + memory_delta) as u64;
                self.assign_available_permits();
            }
            SearchPermitMessage::FreeWarmupSlot => {
                self.num_warmup_slots_available += 1;
                self.assign_available_permits();
            }
            SearchPermitMessage::Drop {
                memory_size,
                warmup_slot_freed,
            } => {
                if !warmup_slot_freed {
                    self.num_warmup_slots_available += 1;
                }
                self.total_memory_allocated = self
                    .total_memory_allocated
                    .checked_sub(memory_size)
                    .expect("More memory released than allocated, should never happen.");
                self.assign_available_permits();
            }
        }
    }

    fn pop_next_request_if_serviceable(&mut self) -> Option<SingleSplitPermitRequest> {
        if self.num_warmup_slots_available == 0 {
            return None;
        }
        let available_memory = self
            .total_memory_budget
            .checked_sub(self.total_memory_allocated)?;
        let mut peeked = self.permits_requests.peek_mut()?;

        assert!(
            !peeked.is_empty(),
            "unexpected empty permits_requests present in the search permit provider queue"
        );
        if let Some(permit_request) = peeked.pop_if_smaller_than(available_memory) {
            if peeked.is_empty() {
                PeekMut::pop(peeked);
            }
            return Some(permit_request);
        }
        None
    }

    fn assign_available_permits(&mut self) {
        while let Some(permit_request) = self.pop_next_request_if_serviceable() {
            let mut ongoing_gauge_guard = GaugeGuard::from_gauge(
                &crate::SEARCH_METRICS.leaf_search_single_split_tasks_ongoing,
            );
            ongoing_gauge_guard.add(1);
            self.total_memory_allocated += permit_request.permit_size;
            self.num_warmup_slots_available -= 1;
            permit_request
                .permit_sender
                .send(SearchPermit {
                    _ongoing_gauge_guard: ongoing_gauge_guard,
                    msg_sender: self.msg_sender.clone(),
                    memory_allocation: permit_request.permit_size,
                    warmup_slot_freed: false,
                })
                // if the requester dropped its receiver, we drop the newly
                // created SearchPermit which releases the resources
                .ok();
        }
        crate::SEARCH_METRICS
            .leaf_search_single_split_tasks_pending
            .set(self.permits_requests.len() as i64);
    }
}

pub struct SearchPermit {
    _ongoing_gauge_guard: GaugeGuard<'static>,
    msg_sender: mpsc::WeakUnboundedSender<SearchPermitMessage>,
    memory_allocation: u64,
    warmup_slot_freed: bool,
}

impl SearchPermit {
    /// Update the memory usage attached to this permit.
    ///
    /// This will increase or decrease the available memory in the [`SearchPermitProvider`].
    pub fn update_memory_usage(&mut self, new_memory_usage: ByteSize) {
        let new_usage_bytes = new_memory_usage.as_u64();
        let memory_delta = new_usage_bytes as i64 - self.memory_allocation as i64;
        self.memory_allocation = new_usage_bytes;
        self.send_if_still_running(SearchPermitMessage::UpdateMemory { memory_delta });
    }

    /// Drop the warmup permit, allowing more downloads to be started. Only one
    /// slot is attached to each permit so calling this again has no effect.
    pub fn free_warmup_slot(&mut self) {
        if self.warmup_slot_freed {
            return;
        }
        self.warmup_slot_freed = true;
        self.send_if_still_running(SearchPermitMessage::FreeWarmupSlot);
    }

    pub fn memory_allocation(&self) -> ByteSize {
        ByteSize(self.memory_allocation)
    }

    fn send_if_still_running(&self, msg: SearchPermitMessage) {
        if let Some(sender) = self.msg_sender.upgrade() {
            sender
                .send(msg)
                // Receiver instance in the event loop is never dropped or
                // closed as long as there is a strong sender reference.
                .expect("Receiver should live longer than sender");
        }
    }
}

impl Drop for SearchPermit {
    fn drop(&mut self) {
        self.send_if_still_running(SearchPermitMessage::Drop {
            memory_size: self.memory_allocation,
            warmup_slot_freed: self.warmup_slot_freed,
        });
    }
}

pub struct SearchPermitFuture(oneshot::Receiver<SearchPermit>);

impl Future for SearchPermitFuture {
    type Output = SearchPermit;

    fn poll(self: Pin<&mut Self>, cx: &mut Context<'_>) -> Poll<Self::Output> {
        let receiver = Pin::new(&mut self.get_mut().0);
        match receiver.poll(cx) {
            Poll::Ready(Ok(search_permit)) => Poll::Ready(search_permit),
            Poll::Ready(Err(_)) => panic!("Failed to acquire permit. This should never happen! Please, report on https://github.com/quickwit-oss/quickwit/issues."),
            Poll::Pending => Poll::Pending,
        }
    }
}

#[cfg(test)]
mod tests {
    use std::time::Duration;

    use futures::StreamExt;
    use rand::seq::SliceRandom;
    use tokio::task::JoinSet;

    use super::*;

    #[tokio::test]
    async fn test_search_permit_order() {
        let permit_provider = SearchPermitProvider::new(1, ByteSize::mb(100));
        let mut all_futures = Vec::new();
        let first_batch_of_permits = permit_provider
            .get_permits(vec![ByteSize::mb(10); 10])
            .await;
        assert_eq!(first_batch_of_permits.len(), 10);
        all_futures.extend(
            first_batch_of_permits
                .into_iter()
                .enumerate()
                .map(move |(i, fut)| ((1, i), fut)),
        );

        let second_batch_of_permits = permit_provider
            .get_permits(vec![ByteSize::mb(10); 10])
            .await;
        assert_eq!(second_batch_of_permits.len(), 10);
        all_futures.extend(
            second_batch_of_permits
                .into_iter()
                .enumerate()
                .map(move |(i, fut)| ((2, i), fut)),
        );

        // not super useful, considering what join set does, but still a tiny bit more sound.
        all_futures.shuffle(&mut rand::rng());

        let mut join_set = JoinSet::new();
        for (res, fut) in all_futures {
            join_set.spawn(async move {
                let permit = fut.await;
                (res, permit)
            });
        }
        let mut ordered_result: Vec<(usize, usize)> = Vec::with_capacity(20);
        while let Some(Ok(((batch_id, order), _permit))) = join_set.join_next().await {
            ordered_result.push((batch_id, order));
        }

        assert_eq!(ordered_result.len(), 20);
        for (i, res) in ordered_result[0..10].iter().enumerate() {
            assert_eq!(res, &(1, i));
        }
        for (i, res) in ordered_result[10..20].iter().enumerate() {
            assert_eq!(res, &(2, i));
        }
    }

    #[tokio::test]
    async fn test_search_permit_order_with_concurrent_search() {
        let permit_provider = SearchPermitProvider::new(4, ByteSize::mb(100));
        let mut all_futures = Vec::new();
        let first_batch_of_permits = permit_provider.get_permits(vec![ByteSize::mb(10); 8]).await;
        assert_eq!(first_batch_of_permits.len(), 8);
        all_futures.extend(
            first_batch_of_permits
                .into_iter()
                .enumerate()
                .map(move |(i, fut)| ((1, i), fut)),
        );

        let second_batch_of_permits = permit_provider.get_permits(vec![ByteSize::mb(10); 2]).await;
        all_futures.extend(
            second_batch_of_permits
                .into_iter()
                .enumerate()
                .map(move |(i, fut)| ((2, i), fut)),
        );

        let third_batch_of_permits = permit_provider.get_permits(vec![ByteSize::mb(10); 6]).await;
        all_futures.extend(
            third_batch_of_permits
                .into_iter()
                .enumerate()
                .map(move |(i, fut)| ((3, i), fut)),
        );

        // not super useful, considering what join set does, but still a tiny bit more sound.
        all_futures.shuffle(&mut rand::rng());

        let mut join_set = JoinSet::new();
        for (res, fut) in all_futures {
            join_set.spawn(async move {
                let permit = fut.await;
                (res, permit)
            });
        }
        let mut ordered_result: Vec<(usize, usize)> = Vec::with_capacity(20);
        while let Some(Ok(((batch_id, order), _permit))) = join_set.join_next().await {
            ordered_result.push((batch_id, order));
        }

        let mut counters = [0; 4];
        let expected_result: Vec<(usize, usize)> = [
            1, 1, 1, 1, // initial 4 permits
            2, 2, 1, 1, 1, 1, 3, 3, 3, 3, 3, 3,
        ]
        .into_iter()
        .map(|batch_id| {
            let order = counters[batch_id];
            counters[batch_id] += 1;
            (batch_id, order)
        })
        .collect();

        // for the first 4 permits, the order is not well defined as they are all granted at once,
        // and we poll futures in a random order. We sort them to fix that artifact
        ordered_result[..4].sort();
        assert_eq!(ordered_result, expected_result);
    }

    #[tokio::test]
    async fn test_search_permit_early_drops() {
        let permit_provider = SearchPermitProvider::new(1, ByteSize::mb(100));
        let permit_fut1 = permit_provider
            .get_permits(vec![ByteSize::mb(10)])
            .await
            .into_iter()
            .next()
            .unwrap();
        let permit_fut2 = permit_provider
            .get_permits(vec![ByteSize::mb(10)])
            .await
            .into_iter()
            .next()
            .unwrap();
        drop(permit_fut1);
        let permit = permit_fut2.await;
        assert_eq!(permit.memory_allocation, ByteSize::mb(10).as_u64());
        assert!(!permit_provider.actor_join_handle.is_finished());

        let _permit_fut3 = permit_provider
            .get_permits(vec![ByteSize::mb(10)])
            .await
            .into_iter()
            .next()
            .unwrap();
        let SearchPermitProvider {
            message_sender,
            actor_join_handle,
        } = permit_provider;
        drop(message_sender);
        Arc::into_inner(actor_join_handle).unwrap().await.unwrap();
    }

    /// Tries to wait for a permit
    async fn try_get(permit_fut: SearchPermitFuture) -> anyhow::Result<SearchPermit> {
        // using a short timeout is a bit flaky, but it should be enough for these tests
        let permit = tokio::time::timeout(Duration::from_millis(20), permit_fut).await?;
        Ok(permit)
    }

    #[tokio::test]
    async fn test_memory_budget() {
        let permit_provider = SearchPermitProvider::new(100, ByteSize::mb(100));
        let mut permit_futs = permit_provider
            .get_permits(vec![ByteSize::mb(10); 14])
            .await;
        let mut remaining_permit_futs = permit_futs.split_off(10).into_iter();
        assert_eq!(remaining_permit_futs.len(), 4);
        // we should be able to obtain 10 permits right away (100MB / 10MB)
        let mut permits: Vec<SearchPermit> = futures::stream::iter(permit_futs.into_iter())
            .buffered(1)
            .collect()
            .await;
        // the next permit is blocked by the memory budget
        let next_blocked_permit_fut = remaining_permit_futs.next().unwrap();
        try_get(next_blocked_permit_fut).await.err().unwrap();
        // if we drop one of the permits, we can get a new one
        permits.drain(0..1);
        let next_permit_fut = remaining_permit_futs.next().unwrap();
        let _new_permit = try_get(next_permit_fut).await.unwrap();
        // the next permit is blocked again by the memory budget
        let next_blocked_permit_fut = remaining_permit_futs.next().unwrap();
        try_get(next_blocked_permit_fut).await.err().unwrap();
        // by setting a more accurate memory usage after a completed warmup, we can get more permits
        permits[0].update_memory_usage(ByteSize::mb(4));
        permits[1].update_memory_usage(ByteSize::mb(6));
        let next_permit_fut = remaining_permit_futs.next().unwrap();
        try_get(next_permit_fut).await.unwrap();
    }

    #[tokio::test]
    async fn test_get_permits_with_offload_threshold_max_returns_all() {
        let permit_provider = SearchPermitProvider::new(100, ByteSize::mb(100));
        let permits = permit_provider
            .get_permits_with_offload(vec![ByteSize::mb(1); 8], usize::MAX)
            .await;
        assert_eq!(permits.len(), 8);
    }

    #[tokio::test]
    async fn test_get_permits_with_offload_threshold_zero_returns_none() {
        let permit_provider = SearchPermitProvider::new(100, ByteSize::mb(100));
        let permits = permit_provider
            .get_permits_with_offload(vec![ByteSize::mb(1); 5], 0)
            .await;
        assert!(permits.is_empty());
        let permit_actor = permit_provider.stop_and_unwrap().await;
        assert!(permit_actor.permits_requests.is_empty());
    }

    #[tokio::test]
    async fn test_get_permits_with_offload_truncates_to_threshold() {
        let permit_provider = SearchPermitProvider::new(100, ByteSize::mb(100));
        let permits = permit_provider
            .get_permits_with_offload(vec![ByteSize::mb(1); 10], 4)
            .await;
        assert_eq!(permits.len(), 4);
    }

    #[tokio::test]
    async fn test_get_permits_with_offload_futures_resolve_in_order() {
        // We use a search permit provider with a capacity of 1 to make sure that the permits are
        // resolved in order.
        let permit_provider = SearchPermitProvider::new(1, ByteSize::mb(100));
        let permits = permit_provider
            .get_permits_with_offload(vec![ByteSize::mb(1); 4], 10)
            .await;
        assert_eq!(permits.len(), 4);
        let mut futs: Vec<_> = permits
            .into_iter()
            .enumerate()
            .map(|(i, permit_fut)| async move {
                permit_fut.await;
                i
            })
            .collect();
        futs.shuffle(&mut rand::rng());
        let mut join_set = JoinSet::new();
        for fut in futs {
            join_set.spawn(fut);
        }
        let mut results = Vec::new();
        while let Some(result) = join_set.join_next().await {
            results.push(result.unwrap());
        }
        assert_eq!(results, vec![0, 1, 2, 3]);
    }

    #[tokio::test]
    async fn test_get_permits_with_offload_pending_consumed_frees_capacity() {
        let permit_provider = SearchPermitProvider::new(100, ByteSize::mb(100));
        // First call: 4 splits, threshold 6.
        let first_permits = permit_provider
            .get_permits_with_offload(vec![ByteSize::mb(1); 4], 6)
            .await;
        assert_eq!(first_permits.len(), 4);
        // Consume all permits from the first batch (they resolve and get dropped).
        for permit_fut in first_permits {
            let _permit = permit_fut.await;
        }
        // Second call: the consumed permits no longer count as pending.
        let second_permits = permit_provider
            .get_permits_with_offload(vec![ByteSize::mb(1); 5], 6)
            .await;
        assert_eq!(second_permits.len(), 5);
    }

    #[tokio::test]
    async fn test_warmup_slot() {
        let permit_provider = SearchPermitProvider::new(10, ByteSize::mb(100));
        let mut permit_futs = permit_provider.get_permits(vec![ByteSize::mb(1); 16]).await;
        let mut remaining_permit_futs = permit_futs.split_off(10).into_iter();
        assert_eq!(remaining_permit_futs.len(), 6);
        // we should be able to obtain 10 permits right away
        let mut permits: Vec<SearchPermit> = futures::stream::iter(permit_futs.into_iter())
            .buffered(1)
            .collect()
            .await;
        // the next permit is blocked by the warmup slots
        let next_blocked_permit_fut = remaining_permit_futs.next().unwrap();
        try_get(next_blocked_permit_fut).await.err().unwrap();
        // if we drop one of the permits, we can get a new one
        permits.drain(0..1);
        let next_permit_fut = remaining_permit_futs.next().unwrap();
        permits.push(try_get(next_permit_fut).await.unwrap());
        // the next permit is blocked again by the warmup slots
        let next_blocked_permit_fut = remaining_permit_futs.next().unwrap();
        try_get(next_blocked_permit_fut).await.err().unwrap();
        // we can explicitly free the warmup slot on a permit
        permits[0].free_warmup_slot();
        let next_permit_fut = remaining_permit_futs.next().unwrap();
        permits.push(try_get(next_permit_fut).await.unwrap());
        // dropping that same permit does not free up another slot
        permits.drain(0..1);
        let next_blocked_permit_fut = remaining_permit_futs.next().unwrap();
        try_get(next_blocked_permit_fut).await.err().unwrap();
        // but dropping a permit for which the slot wasn't explicitly free does free up a slot
        permits.drain(0..1);
        let next_blocked_permit_fut = remaining_permit_futs.next().unwrap();
        permits.push(try_get(next_blocked_permit_fut).await.unwrap());
    }
}


================================================
FILE: quickwit/quickwit-search/src/search_response_rest.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::convert::TryFrom;

use quickwit_common::truncate_str;
use quickwit_proto::search::SearchResponse;
use quickwit_query::aggregations::AggregationResults as AggregationResultsProxy;
use quickwit_query::query_ast::QueryAst;
use serde::{Deserialize, Serialize};
use serde_json::Value as JsonValue;

use crate::error::SearchError;

/// A classic ES aggregation result ast
// TODO previously, we were using zero-copy when possible, which we are no longer doing:
// is that problematic? How can we return to zero/low-copy without it being painful?
#[derive(Serialize, PartialEq, Debug)]
pub struct AggregationResults(tantivy::aggregation::agg_result::AggregationResults);

impl AggregationResults {
    /// Parse an ES aggregation result ast from our non-ambiguous postcard format
    pub fn from_postcard(postcard_bytes: &[u8]) -> anyhow::Result<Self> {
        let aggregation_result: AggregationResultsProxy = postcard::from_bytes(postcard_bytes)?;
        Ok(AggregationResults(aggregation_result.into()))
    }
}

/// SearchResponseRest represents the response returned by the REST search API
/// and is meant to be serialized into JSON.
#[derive(Serialize, PartialEq, Debug, utoipa::ToSchema)]
pub struct SearchResponseRest {
    /// Overall number of documents matching the query.
    pub num_hits: u64,
    #[schema(value_type = Vec<Object>)]
    /// List of hits returned.
    pub hits: Vec<JsonValue>,
    /// List of snippets
    #[schema(value_type = Vec<Object>)]
    #[serde(skip_serializing_if = "Option::is_none")]
    pub snippets: Option<Vec<JsonValue>>,
    /// Elapsed time.
    pub elapsed_time_micros: u64,
    /// Search errors.
    pub errors: Vec<String>,
    /// Aggregations.
    #[schema(value_type = Object)]
    #[serde(skip_serializing_if = "Option::is_none")]
    pub aggregations: Option<AggregationResults>,
}

impl TryFrom<SearchResponse> for SearchResponseRest {
    type Error = SearchError;

    fn try_from(search_response: SearchResponse) -> Result<Self, Self::Error> {
        let mut documents = Vec::with_capacity(search_response.hits.len());
        let mut snippets = Vec::new();
        for hit in search_response.hits {
            let document: JsonValue = serde_json::from_str(&hit.json).map_err(|err| {
                SearchError::Internal(format!(
                    "failed to serialize document `{}` to JSON: `{}`",
                    truncate_str(&hit.json, 100),
                    err
                ))
            })?;
            documents.push(document);

            if let Some(snippet_json) = hit.snippet {
                let snippet_opt: JsonValue =
                    serde_json::from_str(&snippet_json).map_err(|err| {
                        SearchError::Internal(format!(
                            "failed to serialize snippet `{snippet_json}` to JSON: `{err}`"
                        ))
                    })?;
                snippets.push(snippet_opt);
            }
        }

        let snippet_opt = if !snippets.is_empty() {
            Some(snippets)
        } else {
            None
        };

        let aggregations_opt =
            if let Some(aggregation_postcard) = search_response.aggregation_postcard {
                let aggregation = AggregationResults::from_postcard(&aggregation_postcard)
                    .map_err(|err| SearchError::Internal(err.to_string()))?;
                Some(aggregation)
            } else {
                None
            };

        Ok(SearchResponseRest {
            num_hits: search_response.num_hits,
            hits: documents,
            snippets: snippet_opt,
            elapsed_time_micros: search_response.elapsed_time_micros,
            errors: search_response.errors,
            aggregations: aggregations_opt,
        })
    }
}

/// Details on how a query would be executed.
#[derive(Serialize, Deserialize, PartialEq, Debug, utoipa::ToSchema)]
pub struct SearchPlanResponseRest {
    /// Quickwit AST of the query.
    #[schema(value_type = Object)]
    pub quickwit_ast: QueryAst,
    /// Resolved Tantivy AST of the query, according to the latest docmapping.
    ///
    /// It's possible older splits actually resolve to a different ast.
    pub tantivy_ast: String,
    /// List of splits that would be searched by this query
    pub searched_splits: Vec<String>,
    /// Requests expected for each split
    #[schema(value_type = Object)]
    pub storage_requests: StorageRequestCount,
}

/// Number of expected storage requests, per request kind.
///
/// These figures do not take in account whether the data is already cached or not.
#[derive(Serialize, Deserialize, PartialEq, Debug, Default)]
pub struct StorageRequestCount {
    /// Number of split footer downloaded, always 1
    pub footer: usize,
    /// Number of fastfields downloaded
    pub fastfield: usize,
    /// Number of fieldnorm downloaded
    pub fieldnorm: usize,
    /// Number of sstable downloaded
    pub sstable: usize,
    /// Number of posting list downloaded
    pub posting: usize,
    /// Number of position list downloaded
    pub position: usize,
}


================================================
FILE: quickwit/quickwit-search/src/service.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::str::FromStr;
use std::sync::Arc;
use std::time::{Duration, Instant};

use async_trait::async_trait;
use quickwit_common::uri::Uri;
use quickwit_config::SearcherConfig;
use quickwit_doc_mapper::DocMapper;
use quickwit_proto::metastore::MetastoreServiceClient;
use quickwit_proto::search::{
    FetchDocsRequest, FetchDocsResponse, GetKvRequest, Hit, LeafListFieldsRequest,
    LeafListTermsRequest, LeafListTermsResponse, LeafSearchRequest, LeafSearchResponse,
    ListFieldsRequest, ListFieldsResponse, ListTermsRequest, ListTermsResponse, PutKvRequest,
    ReportSplitsRequest, ReportSplitsResponse, ScrollRequest, SearchPlanResponse, SearchRequest,
    SearchResponse, SnippetRequest,
};
use quickwit_storage::{
    MemorySizedCache, QuickwitCache, SplitCache, StorageCache, StorageResolver,
};
use tantivy::aggregation::AggregationLimitsGuard;

use crate::invoker::LambdaLeafSearchInvoker;
use crate::leaf::multi_index_leaf_search;
use crate::leaf_cache::{LeafSearchCache, PredicateCacheImpl};
use crate::list_fields::{leaf_list_fields, root_list_fields};
use crate::list_fields_cache::ListFieldsCache;
use crate::list_terms::{leaf_list_terms, root_list_terms};
use crate::metrics_trackers::LeafSearchMetricsFuture;
use crate::root::fetch_docs_phase;
use crate::scroll_context::{MiniKV, ScrollContext, ScrollKeyAndStartOffset};
use crate::search_permit_provider::SearchPermitProvider;
use crate::{ClusterClient, SearchError, fetch_docs, root_search, search_plan};

#[derive(Clone)]
/// The search service implementation.
pub struct SearchServiceImpl {
    metastore: MetastoreServiceClient,
    storage_resolver: StorageResolver,
    cluster_client: ClusterClient,
    searcher_context: Arc<SearcherContext>,
    local_kv_store: MiniKV,
}

/// Trait representing a search service.
///
/// It mirrors the gRPC service `SearchService`, but with a more concrete
/// error type that can be converted into an API Error.
/// The REST API relies directly on the `SearchService`.
/// Also, it is mockable.
#[mockall::automock]
#[async_trait]
pub trait SearchService: 'static + Send + Sync {
    /// Root search API.
    /// This RPC identifies the set of splits on which the query should run on,
    /// and dispatches the multiple calls to `LeafSearch`.
    ///
    /// It is also in charge of merging back the responses.
    async fn root_search(&self, request: SearchRequest) -> crate::Result<SearchResponse>;

    /// Performs a leaf search on a given set of splits.
    ///
    /// It is like a regular search except that:
    /// - the node should perform the search locally instead of dispatching
    /// it to other nodes.
    /// - it should be applied on the given subset of splits
    /// - hit content is not fetched, and we instead return a so-called `PartialHit`.
    async fn leaf_search(&self, request: LeafSearchRequest) -> crate::Result<LeafSearchResponse>;

    /// Fetches the documents contents from the document store.
    /// This methods takes `PartialHit`s and returns `Hit`s.
    async fn fetch_docs(&self, request: FetchDocsRequest) -> crate::Result<FetchDocsResponse>;

    /// Root search API.
    /// This RPC identifies the set of splits on which the query should run on,
    /// and dispatches the multiple calls to `LeafSearch`.
    ///
    /// It is also in charge of merging back the responses.
    async fn root_list_terms(&self, request: ListTermsRequest) -> crate::Result<ListTermsResponse>;

    /// Performs a leaf search on a given set of splits.
    ///
    /// It is like a regular search except that:
    /// - the node should perform the search locally instead of dispatching
    /// it to other nodes.
    /// - it should be applied on the given subset of splits
    /// - hit content is not fetched, and we instead return a so-called `PartialHit`.
    async fn leaf_list_terms(
        &self,
        request: LeafListTermsRequest,
    ) -> crate::Result<LeafListTermsResponse>;

    /// Performs a scroll request.
    async fn scroll(&self, scroll_request: ScrollRequest) -> crate::Result<SearchResponse>;

    /// Stores a Key value in the local cache.
    /// This operation is not distributed. The distribution logic lives in
    /// the `ClusterClient`.
    async fn put_kv(&self, put_kv: PutKvRequest);

    /// Gets the payload associated to a key in the local cache.
    /// See also `put_kv(..)`.
    async fn get_kv(&self, get_kv: GetKvRequest) -> Option<Vec<u8>>;

    /// Indexers call report_splits to inform searchers node about the presence of a split, which
    /// would then be considered as a candidate for the searcher split cache.
    async fn report_splits(&self, report_splits: ReportSplitsRequest) -> ReportSplitsResponse;

    /// Return the list of fields for a given or multiple indices.
    async fn root_list_fields(
        &self,
        list_fields: ListFieldsRequest,
    ) -> crate::Result<ListFieldsResponse>;

    /// Return the list of fields for one index.
    async fn leaf_list_fields(
        &self,
        list_fields: LeafListFieldsRequest,
    ) -> crate::Result<ListFieldsResponse>;

    /// Describe how a search would be processed.
    async fn search_plan(&self, request: SearchRequest) -> crate::Result<SearchPlanResponse>;
}

impl SearchServiceImpl {
    /// Creates a new search service.
    pub fn new(
        metastore: MetastoreServiceClient,
        storage_resolver: StorageResolver,
        cluster_client: ClusterClient,
        searcher_context: Arc<SearcherContext>,
    ) -> Self {
        SearchServiceImpl {
            metastore,
            storage_resolver,
            cluster_client,
            searcher_context,
            local_kv_store: MiniKV::default(),
        }
    }
}

/// Deserializes a JSON-encoded doc mapper string into an `Arc<DocMapper>`.
pub(crate) fn deserialize_doc_mapper(doc_mapper_str: &str) -> crate::Result<Arc<DocMapper>> {
    let doc_mapper = serde_json::from_str::<Arc<DocMapper>>(doc_mapper_str).map_err(|err| {
        SearchError::Internal(format!("failed to deserialize doc mapper: `{err}`"))
    })?;
    Ok(doc_mapper)
}

#[async_trait]
impl SearchService for SearchServiceImpl {
    async fn root_search(&self, search_request: SearchRequest) -> crate::Result<SearchResponse> {
        let search_result = root_search(
            &self.searcher_context,
            search_request,
            self.metastore.clone(),
            &self.cluster_client,
        )
        .await?;
        Ok(search_result)
    }

    async fn leaf_search(
        &self,
        leaf_search_request: LeafSearchRequest,
    ) -> crate::Result<LeafSearchResponse> {
        // Check leaf_search_request existence before tracing with `instrument` call.
        if leaf_search_request.search_request.is_none() {
            return Err(SearchError::Internal("no search request".to_string()));
        }
        let num_splits = leaf_search_request
            .leaf_requests
            .iter()
            .map(|req| req.split_offsets.len())
            .sum::<usize>();

        let tracked_future = LeafSearchMetricsFuture {
            tracked: multi_index_leaf_search(
                self.searcher_context.clone(),
                leaf_search_request,
                self.storage_resolver.clone(),
            ),
            start: Instant::now(),
            targeted_splits: num_splits,
            status: None,
        };
        let timeout = self.searcher_context.searcher_config.request_timeout();
        tokio::time::timeout(timeout, tracked_future).await?
    }

    async fn fetch_docs(
        &self,
        fetch_docs_request: FetchDocsRequest,
    ) -> crate::Result<FetchDocsResponse> {
        let index_uri = Uri::from_str(&fetch_docs_request.index_uri)?;
        let storage = self.storage_resolver.resolve(&index_uri).await?;
        let snippet_request_opt: Option<&SnippetRequest> =
            fetch_docs_request.snippet_request.as_ref();
        let doc_mapper = deserialize_doc_mapper(&fetch_docs_request.doc_mapper)?;
        let fetch_docs_response = fetch_docs(
            self.searcher_context.clone(),
            fetch_docs_request.partial_hits,
            storage,
            &fetch_docs_request.split_offsets,
            doc_mapper,
            snippet_request_opt,
        )
        .await?;

        Ok(fetch_docs_response)
    }

    async fn root_list_terms(
        &self,
        list_terms_request: ListTermsRequest,
    ) -> crate::Result<ListTermsResponse> {
        let search_result = root_list_terms(
            &list_terms_request,
            self.metastore.clone(),
            &self.cluster_client,
        )
        .await?;

        Ok(search_result)
    }

    async fn leaf_list_terms(
        &self,
        leaf_search_request: LeafListTermsRequest,
    ) -> crate::Result<LeafListTermsResponse> {
        let search_request = leaf_search_request
            .list_terms_request
            .ok_or_else(|| SearchError::Internal("no search request".to_string()))?;
        let index_uri = Uri::from_str(&leaf_search_request.index_uri)?;
        let storage = self.storage_resolver.resolve(&index_uri).await?;
        let split_ids = leaf_search_request.split_offsets;

        let leaf_search_response = leaf_list_terms(
            self.searcher_context.clone(),
            &search_request,
            storage.clone(),
            &split_ids[..],
        )
        .await?;

        Ok(leaf_search_response)
    }

    async fn scroll(&self, scroll_request: ScrollRequest) -> crate::Result<SearchResponse> {
        scroll(scroll_request, &self.cluster_client, &self.searcher_context).await
    }

    async fn put_kv(&self, put_request: PutKvRequest) {
        let ttl = Duration::from_secs(put_request.ttl_secs as u64);
        self.local_kv_store
            .put(put_request.key, put_request.payload, ttl)
            .await;
    }

    async fn get_kv(&self, get_request: GetKvRequest) -> Option<Vec<u8>> {
        let payload: Vec<u8> = self.local_kv_store.get(&get_request.key).await?;
        Some(payload)
    }

    async fn report_splits(&self, report_splits: ReportSplitsRequest) -> ReportSplitsResponse {
        if let Some(split_cache) = self.searcher_context.split_cache_opt.as_ref() {
            split_cache.report_splits(report_splits.report_splits);
        }
        ReportSplitsResponse {}
    }

    async fn root_list_fields(
        &self,
        list_fields_req: ListFieldsRequest,
    ) -> crate::Result<ListFieldsResponse> {
        root_list_fields(
            list_fields_req,
            &self.cluster_client,
            self.metastore.clone(),
        )
        .await
    }

    async fn leaf_list_fields(
        &self,
        list_fields_req: LeafListFieldsRequest,
    ) -> crate::Result<ListFieldsResponse> {
        let index_uri = Uri::from_str(&list_fields_req.index_uri)?;
        let storage = self.storage_resolver.resolve(&index_uri).await?;
        let index_id = list_fields_req.index_id;
        let split_ids = list_fields_req.split_offsets;
        leaf_list_fields(
            index_id,
            storage,
            &self.searcher_context,
            &split_ids[..],
            &list_fields_req.fields,
        )
        .await
    }

    async fn search_plan(
        &self,
        search_request: SearchRequest,
    ) -> crate::Result<SearchPlanResponse> {
        let search_plan = search_plan(search_request, self.metastore.clone()).await?;
        Ok(search_plan)
    }
}

pub(crate) async fn scroll(
    scroll_request: ScrollRequest,
    cluster_client: &ClusterClient,
    searcher_context: &SearcherContext,
) -> crate::Result<SearchResponse> {
    let start = Instant::now();
    let current_scroll = ScrollKeyAndStartOffset::from_str(&scroll_request.scroll_id)
        .map_err(|msg| SearchError::InvalidArgument(msg.to_string()))?;
    let start_doc = current_scroll.start_offset;
    let scroll_key: [u8; 16] = current_scroll.scroll_key();
    let payload = cluster_client.get_kv(&scroll_key[..]).await;
    let payload =
        payload.ok_or_else(|| SearchError::Internal("scroll key not found".to_string()))?;

    let mut scroll_context = ScrollContext::load(&payload)
        .map_err(|_| SearchError::Internal("corrupted Scroll context".to_string()))?;

    let end_doc: u64 = start_doc + scroll_context.max_hits_per_page;

    let mut partial_hits = Vec::new();
    let mut scroll_context_modified = false;

    let cached_results = scroll_context.get_cached_partial_hits(start_doc..end_doc);
    partial_hits.extend_from_slice(cached_results);
    if (partial_hits.len() as u64) < current_scroll.max_hits_per_page as u64 {
        let search_after = partial_hits
            .last()
            .cloned()
            .unwrap_or_else(|| current_scroll.search_after.clone());
        let cursor = start_doc + partial_hits.len() as u64;
        scroll_context
            .load_batch_starting_at(cursor, search_after, cluster_client, searcher_context)
            .await?;
        partial_hits.extend_from_slice(scroll_context.get_cached_partial_hits(cursor..end_doc));
        scroll_context_modified = true;
    }

    // Fetch the actual documents.
    let hits: Vec<Hit> = fetch_docs_phase(
        &scroll_context.indexes_metas_for_leaf_search,
        &partial_hits[..],
        &scroll_context.split_metadatas[..],
        &scroll_context.search_request,
        cluster_client,
    )
    .await?;

    let next_scroll_id = current_scroll.next_page(
        hits.len() as u64,
        partial_hits.last().cloned().unwrap_or_default(),
    );

    if let Some(scroll_ttl_secs) = scroll_request.scroll_ttl_secs
        && scroll_context_modified
    {
        scroll_context.clear_cache_if_unneeded();
        let payload = scroll_context.serialize();
        let scroll_ttl = Duration::from_secs(scroll_ttl_secs as u64);
        cluster_client
            .put_kv(&scroll_key, &payload, scroll_ttl)
            .await;
    }

    Ok(SearchResponse {
        hits,
        num_hits: scroll_context.total_num_hits,
        elapsed_time_micros: start.elapsed().as_micros() as u64,
        scroll_id: Some(next_scroll_id.to_string()),
        errors: Vec::new(),
        aggregation_postcard: None,
        failed_splits: scroll_context.failed_splits,
        num_successful_splits: scroll_context.num_successful_splits,
    })
}
/// [`SearcherContext`] provides a common set of variables
/// shared by a searcher instance (which instantiates a
/// [`SearchServiceImpl`]).
pub struct SearcherContext {
    /// Searcher config.
    pub searcher_config: SearcherConfig,
    /// Fast fields cache.
    pub fast_fields_cache: Arc<dyn StorageCache>,
    /// Counting semaphore to limit concurrent leaf search split requests.
    pub search_permit_provider: SearchPermitProvider,
    /// Split footer cache.
    pub split_footer_cache: MemorySizedCache<String>,
    /// Per-split and per-query cache.
    pub leaf_search_cache: LeafSearchCache,
    /// Per-split and per-predicate cache.
    pub predicate_cache: Arc<PredicateCacheImpl>,
    /// Search split cache. `None` if no split cache is configured.
    pub split_cache_opt: Option<Arc<SplitCache>>,
    /// List fields cache. Caches the list fields response for a given split.
    pub list_fields_cache: ListFieldsCache,
    /// The aggregation limits are passed to limit the memory usage.
    /// This object is shared across all request.
    pub aggregation_limit: AggregationLimitsGuard,
    /// Optional Lambda invoker for offloading leaf search to serverless functions.
    pub lambda_invoker: Option<Arc<dyn LambdaLeafSearchInvoker>>,
}

impl std::fmt::Debug for SearcherContext {
    fn fmt(&self, f: &mut std::fmt::Formatter) -> std::fmt::Result {
        f.debug_struct("SearcherContext")
            .field("searcher_config", &self.searcher_config)
            .finish()
    }
}

impl SearcherContext {
    /// Create a default SearcherContext
    #[cfg(test)]
    pub fn for_test() -> SearcherContext {
        let searcher_config = SearcherConfig::default();
        SearcherContext::new_without_invoker(searcher_config, None)
    }

    /// Creates a new searcher context without a lambda invoker.
    pub fn new_without_invoker(
        searcher_config: SearcherConfig,
        split_cache_opt: Option<Arc<SplitCache>>,
    ) -> Self {
        Self::new(
            searcher_config,
            split_cache_opt,
            None::<Box<dyn LambdaLeafSearchInvoker>>,
        )
    }

    /// Creates a new searcher context, given a searcher config, and an optional `SplitCache`.
    pub fn new(
        searcher_config: SearcherConfig,
        split_cache_opt: Option<Arc<SplitCache>>,
        lambda_invoker: Option<impl LambdaLeafSearchInvoker + 'static>,
    ) -> Self {
        let global_split_footer_cache = MemorySizedCache::from_config(
            &searcher_config.split_footer_cache,
            &quickwit_storage::STORAGE_METRICS.split_footer_cache,
        );
        let leaf_search_split_semaphore = SearchPermitProvider::new(
            searcher_config.max_num_concurrent_split_searches,
            searcher_config.warmup_memory_budget,
        );
        let storage_long_term_cache =
            Arc::new(QuickwitCache::new(&searcher_config.fast_field_cache));
        let leaf_search_cache = LeafSearchCache::new(&searcher_config.partial_request_cache);
        let predicate_cache = PredicateCacheImpl::new(&searcher_config.predicate_cache);
        let list_fields_cache = ListFieldsCache::new(&searcher_config.partial_request_cache);
        let aggregation_limit = AggregationLimitsGuard::new(
            Some(searcher_config.aggregation_memory_limit.as_u64()),
            Some(searcher_config.aggregation_bucket_limit),
        );

        let lambda_invoker =
            lambda_invoker.map(|invoker| Arc::new(invoker) as Arc<dyn LambdaLeafSearchInvoker>);

        Self {
            searcher_config,
            fast_fields_cache: storage_long_term_cache,
            predicate_cache: predicate_cache.into(),
            search_permit_provider: leaf_search_split_semaphore,
            split_footer_cache: global_split_footer_cache,
            leaf_search_cache,
            list_fields_cache,
            split_cache_opt,
            aggregation_limit,
            lambda_invoker,
        }
    }

    /// Returns the shared instance to track the aggregation memory usage.
    pub fn get_aggregation_limits(&self) -> AggregationLimitsGuard {
        self.aggregation_limit.clone()
    }
}


================================================
FILE: quickwit/quickwit-search/src/tests.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::cmp::Ordering;
use std::collections::{BTreeMap, BTreeSet};

use assert_json_diff::{assert_json_eq, assert_json_include};
use quickwit_config::SearcherConfig;
use quickwit_doc_mapper::DocMapper;
use quickwit_doc_mapper::tag_pruning::extract_tags_from_query;
use quickwit_indexing::TestSandbox;
use quickwit_proto::search::{
    LeafListTermsResponse, ListTermsRequest, SearchRequest, SortByValue, SortField, SortOrder,
    SortValue, TraceId,
};
use quickwit_query::query_ast::{
    QueryAst, qast_helper, qast_json_helper, query_ast_from_user_text,
};
use serde_json::{Value as JsonValue, json};
use tantivy::Term;
use tantivy::schema::OwnedValue as TantivyValue;
use tantivy::time::OffsetDateTime;

use self::leaf::single_doc_mapping_leaf_search;
use super::*;
use crate::find_trace_ids_collector::Span;
use crate::list_terms::leaf_list_terms;
use crate::service::SearcherContext;
use crate::single_node_search;

#[tokio::test]
async fn test_single_node_simple() -> anyhow::Result<()> {
    let index_id = "single-node-simple-1";
    let doc_mapping_yaml = r#"
            field_mappings:
              - name: title
                type: text
              - name: body
                type: text
              - name: url
                type: text
              - name: binary
                type: bytes
        "#;
    let test_sandbox = TestSandbox::create(index_id, doc_mapping_yaml, "{}", &["body"]).await?;
    let docs = vec![
        json!({"title": "snoopy", "body": "Snoopy is an anthropomorphic beagle[5] in the comic strip...", "url": "http://snoopy", "binary": "dGhpcyBpcyBhIHRlc3Qu"}),
        json!({"title": "beagle", "body": "The beagle is a breed of small scent hound, similar in appearance to the much larger foxhound.", "url": "http://beagle", "binary": "bWFkZSB5b3UgbG9vay4="}),
    ];
    test_sandbox.add_documents(docs.clone()).await?;
    let search_request = SearchRequest {
        index_id_patterns: vec![index_id.to_string()],
        query_ast: qast_json_helper("anthropomorphic", &["body"]),
        max_hits: 2,
        ..Default::default()
    };
    let single_node_result = single_node_search(
        search_request,
        test_sandbox.metastore(),
        test_sandbox.storage_resolver(),
    )
    .await?;
    assert_eq!(single_node_result.num_hits, 1);
    assert_eq!(single_node_result.hits.len(), 1);
    let hit_json: JsonValue = serde_json::from_str(&single_node_result.hits[0].json)?;
    let expected_json: JsonValue = json!({"title": "snoopy", "body": "Snoopy is an anthropomorphic beagle[5] in the comic strip...", "url": "http://snoopy", "binary": "dGhpcyBpcyBhIHRlc3Qu"});
    assert_json_include!(actual: hit_json, expected: expected_json);
    assert!(single_node_result.elapsed_time_micros > 10);
    assert!(single_node_result.elapsed_time_micros < 1_000_000);
    test_sandbox.assert_quit().await;
    Ok(())
}

#[tokio::test]
async fn test_single_node_termset() -> anyhow::Result<()> {
    let index_id = "single-node-termset-1";
    let doc_mapping_yaml = r#"
            field_mappings:
              - name: title
                type: text
              - name: body
                type: text
              - name: url
                type: text
              - name: binary
                type: bytes
        "#;
    let test_sandbox = TestSandbox::create(index_id, doc_mapping_yaml, "{}", &["body"]).await?;
    let docs = vec![
        json!({"title": "snoopy", "body": "Snoopy is an anthropomorphic beagle[5] in the comic strip...", "url": "http://snoopy", "binary": "dGhpcyBpcyBhIHRlc3Qu"}),
        json!({"title": "beagle", "body": "The beagle is a breed of small scent hound, similar in appearance to the much larger foxhound.", "url": "http://beagle", "binary": "bWFkZSB5b3UgbG9vay4="}),
    ];
    test_sandbox.add_documents(docs.clone()).await?;
    let search_request = SearchRequest {
        index_id_patterns: vec![index_id.to_string()],
        query_ast: qast_json_helper("title: IN [beagle]", &[]),
        start_timestamp: None,
        end_timestamp: None,
        max_hits: 2,
        start_offset: 0,
        ..Default::default()
    };
    let single_node_result = single_node_search(
        search_request,
        test_sandbox.metastore(),
        test_sandbox.storage_resolver(),
    )
    .await?;
    assert_eq!(single_node_result.num_hits, 1);
    assert_eq!(single_node_result.hits.len(), 1);
    let hit_json: JsonValue = serde_json::from_str(&single_node_result.hits[0].json)?;
    let expected_json: JsonValue = json!({"title": "beagle", "body": "The beagle is a breed of small scent hound, similar in appearance to the much larger foxhound.", "url": "http://beagle", "binary": "bWFkZSB5b3UgbG9vay4="});
    assert_json_include!(actual: hit_json, expected: expected_json);
    assert!(single_node_result.elapsed_time_micros > 10);
    assert!(single_node_result.elapsed_time_micros < 1_000_000);
    test_sandbox.assert_quit().await;
    Ok(())
}

#[tokio::test]
async fn test_single_search_with_snippet() -> anyhow::Result<()> {
    let index_id = "single-node-with-snippet";
    let doc_mapping_yaml = r#"
            field_mappings:
              - name: title
                type: text
              - name: body
                type: text
        "#;
    let test_sandbox = TestSandbox::create(index_id, doc_mapping_yaml, "{}", &["body"]).await?;
    let docs = vec![
        json!({"title": "snoopy", "body": "Snoopy is an anthropomorphic beagle in the comic strip."}),
        json!({"title": "beagle", "body": "The beagle is a breed of small scent hound."}),
        json!({"title": "lisa", "body": "Lisa is a character in `The Simpsons` animated tv series."}),
    ];
    test_sandbox.add_documents(docs.clone()).await?;
    let search_request = SearchRequest {
        index_id_patterns: vec![index_id.to_string()],
        query_ast: qast_json_helper("beagle", &["title", "body"]),
        snippet_fields: vec!["title".to_string(), "body".to_string()],
        max_hits: 2,
        ..Default::default()
    };
    let single_node_result = single_node_search(
        search_request,
        test_sandbox.metastore(),
        test_sandbox.storage_resolver(),
    )
    .await?;
    assert_eq!(single_node_result.num_hits, 2);
    assert_eq!(single_node_result.hits.len(), 2);

    let highlight_json: JsonValue =
        serde_json::from_str(single_node_result.hits[0].snippet.as_ref().unwrap())?;
    let expected_json: JsonValue = json!({
        "title": ["<b>beagle</b>"],
        "body": ["The <b>beagle</b> is a breed of small scent hound"]
    });

    assert_json_eq!(highlight_json, expected_json);
    let highlight_json: JsonValue =
        serde_json::from_str(single_node_result.hits[1].snippet.as_ref().unwrap())?;
    let expected_json: JsonValue = json!({"title": [], "body": ["Snoopy is an anthropomorphic <b>beagle</b> in the comic strip"]});
    assert_json_eq!(highlight_json, expected_json);

    test_sandbox.assert_quit().await;
    Ok(())
}

async fn slop_search_and_check(
    test_sandbox: &TestSandbox,
    index_id: &str,
    query: &str,
    expected_num_match: u64,
) -> anyhow::Result<()> {
    let query_ast = qast_json_helper(query, &["body"]);
    let search_request = SearchRequest {
        index_id_patterns: vec![index_id.to_string()],
        query_ast,
        max_hits: 5,
        ..Default::default()
    };
    let single_node_result = single_node_search(
        search_request,
        test_sandbox.metastore(),
        test_sandbox.storage_resolver(),
    )
    .await?;
    assert_eq!(
        single_node_result.num_hits, expected_num_match,
        "query: {query}"
    );
    assert_eq!(
        single_node_result.hits.len(),
        expected_num_match as usize,
        "query: {query}"
    );
    Ok(())
}

#[tokio::test]
async fn test_slop_queries() {
    let index_id = "slop-query";
    let doc_mapping_yaml = r#"
            field_mappings:
              - name: title
                type: text
              - name: body
                type: text
                record: position
        "#;

    let test_sandbox = TestSandbox::create(index_id, doc_mapping_yaml, "{}", &["body"])
        .await
        .unwrap();
    let docs = vec![
        json!({"title": "one", "body": "a red bike"}),
        json!({"title": "two", "body": "a small blue bike"}),
        json!({"title": "three", "body": "a small, rusty, and yellow bike"}),
        json!({"title": "four", "body": "fred's small bike"}),
        json!({"title": "five", "body": "a tiny shelter"}),
    ];
    test_sandbox.add_documents(docs.clone()).await.unwrap();

    slop_search_and_check(&test_sandbox, index_id, "\"small bird\"~2", 0)
        .await
        .unwrap();
    slop_search_and_check(&test_sandbox, index_id, "\"red bike\"~2", 1)
        .await
        .unwrap();
    slop_search_and_check(&test_sandbox, index_id, "\"small blue bike\"~3", 1)
        .await
        .unwrap();
    slop_search_and_check(&test_sandbox, index_id, "\"small bike\"", 1)
        .await
        .unwrap();
    slop_search_and_check(&test_sandbox, index_id, "\"small bike\"~1", 2)
        .await
        .unwrap();
    slop_search_and_check(&test_sandbox, index_id, "\"small bike\"~2", 2)
        .await
        .unwrap();
    slop_search_and_check(&test_sandbox, index_id, "\"small bike\"~3", 3)
        .await
        .unwrap();
    slop_search_and_check(&test_sandbox, index_id, "\"tiny shelter\"~3", 1)
        .await
        .unwrap();
    test_sandbox.assert_quit().await;
}

#[tokio::test]
async fn test_single_node_several_splits() -> anyhow::Result<()> {
    let index_id = "single-node-several-splits";
    let doc_mapping_yaml = r#"
            tag_fields:
              - "owner"
            field_mappings:
              - name: title
                type: text
              - name: body
                type: text
              - name: url
                type: text
              - name: owner
                type: text
                tokenizer: 'raw'
        "#;
    let test_sandbox = TestSandbox::create(index_id, doc_mapping_yaml, "{}", &["body"]).await?;
    for _ in 0..10u32 {
        test_sandbox.add_documents(vec![
                json!({"title": "snoopy", "body": "Snoopy is an anthropomorphic beagle[5] in the comic strip...", "url": "http://snoopy"}),
                json!({"title": "beagle", "body": "The beagle is a breed of small scent hound, similar in appearance to the much larger foxhound.", "url": "http://beagle"}),
            ]).await?;
    }
    let query_ast = query_ast_from_user_text("beagle", None);
    let query_ast_json = serde_json::to_string(&query_ast).unwrap();
    let search_request = SearchRequest {
        index_id_patterns: vec![index_id.to_string()],
        query_ast: query_ast_json,
        max_hits: 6,
        ..Default::default()
    };
    let single_node_result = single_node_search(
        search_request,
        test_sandbox.metastore(),
        test_sandbox.storage_resolver(),
    )
    .await?;
    assert_eq!(single_node_result.num_hits, 20);
    assert_eq!(single_node_result.hits.len(), 6);
    assert!(&single_node_result.hits[0].json.contains("breed"));
    assert!(&single_node_result.hits[1].json.contains("Snoopy"));
    let hit_keys = single_node_result.hits.iter().flat_map(|hit| {
        hit.partial_hit
            .as_ref()
            .map(|partial_hit| (partial_hit.split_id.as_str(), partial_hit.doc_id as i32))
    });
    assert!(hit_keys.is_sorted_by(|left, right| left.cmp(right) == Ordering::Greater));
    assert!(single_node_result.elapsed_time_micros > 10);
    assert!(single_node_result.elapsed_time_micros < 1_000_000);
    test_sandbox.assert_quit().await;
    Ok(())
}

#[tokio::test]
async fn test_single_node_filtering() -> anyhow::Result<()> {
    let index_id = "single-node-filtering";
    let doc_mapping_yaml = r#"
            tag_fields:
              - owner
            field_mappings:
              - name: body
                type: text
              - name: ts
                type: datetime
                input_formats:
                    - "rfc3339"
                    - "unix_timestamp"
                fast: true
              - name: owner
                type: text
                tokenizer: raw
            timestamp_field: ts
            mode: lenient
        "#;
    let indexing_settings_json = r#"{}"#;
    let test_sandbox = TestSandbox::create(
        index_id,
        doc_mapping_yaml,
        indexing_settings_json,
        &["body"],
    )
    .await?;

    let mut docs = Vec::new();
    let start_timestamp = OffsetDateTime::now_utc().unix_timestamp();
    for i in 0..30 {
        let body = format!("info @ t:{}", i + 1);
        docs.push(json!({"body": body, "ts": start_timestamp + i + 1}));
    }
    test_sandbox.add_documents(docs).await?;

    let search_request = SearchRequest {
        index_id_patterns: vec![index_id.to_string()],
        query_ast: qast_json_helper("info", &["body"]),
        start_timestamp: Some(start_timestamp + 10),
        end_timestamp: Some(start_timestamp + 20),
        max_hits: 15,
        sort_fields: vec![SortField {
            field_name: "ts".to_string(),
            sort_order: SortOrder::Desc as i32,
            sort_datetime_format: None,
        }],
        ..Default::default()
    };
    let single_node_response = single_node_search(
        search_request,
        test_sandbox.metastore(),
        test_sandbox.storage_resolver(),
    )
    .await?;
    assert_eq!(single_node_response.num_hits, 10);
    assert_eq!(single_node_response.hits.len(), 10);
    assert!(&single_node_response.hits[0].json.contains("t:19"));
    assert!(&single_node_response.hits[9].json.contains("t:10"));

    // filter on time range [i64::MIN 20[ should only hit first 19 docs because of filtering
    let search_request = SearchRequest {
        index_id_patterns: vec![index_id.to_string()],
        query_ast: qast_json_helper("info", &["body"]),
        end_timestamp: Some(start_timestamp + 20),
        max_hits: 25,
        sort_fields: vec![SortField {
            field_name: "ts".to_string(),
            sort_order: SortOrder::Desc as i32,
            sort_datetime_format: None,
        }],
        ..Default::default()
    };
    let single_node_response = single_node_search(
        search_request,
        test_sandbox.metastore(),
        test_sandbox.storage_resolver(),
    )
    .await?;
    assert_eq!(single_node_response.num_hits, 19);
    assert_eq!(single_node_response.hits.len(), 19);
    assert!(&single_node_response.hits[0].json.contains("t:19"));
    assert!(&single_node_response.hits[18].json.contains("t:1"));

    // filter on tag, should return an error since no split is tagged
    let search_request = SearchRequest {
        index_id_patterns: vec![index_id.to_string()],
        query_ast: qast_json_helper("tag:foo AND info", &["body"]),
        max_hits: 25,
        sort_fields: vec![SortField {
            field_name: "ts".to_string(),
            sort_order: SortOrder::Desc as i32,
            sort_datetime_format: None,
        }],
        ..Default::default()
    };
    let single_node_response = single_node_search(
        search_request,
        test_sandbox.metastore(),
        test_sandbox.storage_resolver(),
    )
    .await;
    assert!(single_node_response.is_err());
    assert_eq!(
        single_node_response.err().map(|err| err.to_string()),
        Some("invalid query: field does not exist: `tag`".to_string())
    );
    test_sandbox.assert_quit().await;
    Ok(())
}

#[tokio::test]
async fn test_single_node_without_timestamp_with_query_start_timestamp_enabled()
-> anyhow::Result<()> {
    let index_id = "single-node-no-timestamp";
    let doc_mapping_yaml = r#"
            tag_fields:
              - owner
            field_mappings:
              - name: body
                type: text
              - name: owner
                type: text
                tokenizer: raw
        "#;
    let indexing_settings_json = r#"{}"#;
    let test_sandbox = TestSandbox::create(
        index_id,
        doc_mapping_yaml,
        indexing_settings_json,
        &["body"],
    )
    .await?;

    let mut docs = Vec::new();
    let start_timestamp = OffsetDateTime::now_utc().unix_timestamp();
    for i in 0..30 {
        let body = format!("info @ t:{}", i + 1);
        docs.push(json!({ "body": body }));
    }
    test_sandbox.add_documents(docs).await?;

    let search_request = SearchRequest {
        index_id_patterns: vec![index_id.to_string()],
        query_ast: qast_json_helper("info", &["body"]),
        start_timestamp: Some(start_timestamp + 10),
        end_timestamp: Some(start_timestamp + 20),
        max_hits: 15,
        ..Default::default()
    };
    let single_node_response = single_node_search(
        search_request,
        test_sandbox.metastore(),
        test_sandbox.storage_resolver(),
    )
    .await;

    assert!(single_node_response.is_err());
    assert_eq!(
        single_node_response.err().map(|err| err.to_string()),
        Some(
            "the timestamp field is not set in index: [\"single-node-no-timestamp\"] definition \
             but start-timestamp or end-timestamp are set in the query"
                .to_string()
        )
    );
    test_sandbox.assert_quit().await;
    Ok(())
}

async fn single_node_search_sort_by_field(
    sort_by_field: &str,
    fieldnorms_enabled: bool,
) -> anyhow::Result<()> {
    let index_id = "single-node-sorting-sort-by-".to_string()
        + sort_by_field
        + "fieldnorms-"
        + &fieldnorms_enabled.to_string();

    let doc_mapping_with_fieldnorms = r#"
            field_mappings:
              - name: description
                type: text
                fieldnorms: true
              - name: ts
                type: datetime
                fast: true
              - name: temperature
                type: i64
                fast: true
            timestamp_field: ts
            "#;

    let doc_mapping_without_fieldnorms = r#"
            field_mappings:
              - name: description
                type: text
              - name: ts
                type: datetime
                fast: true
              - name: temperature
                type: i64
                fast: true
            timestamp_field: ts
            "#;

    let doc_mapping_yaml = if fieldnorms_enabled {
        doc_mapping_with_fieldnorms
    } else {
        doc_mapping_without_fieldnorms
    };

    let indexing_settings_json = r#"{}"#;
    let test_sandbox = TestSandbox::create(
        &index_id,
        doc_mapping_yaml,
        indexing_settings_json,
        &["description"],
    )
    .await?;

    let mut docs = Vec::new();
    let start_timestamp = 72057595;
    for i in 0..30 {
        let timestamp = start_timestamp + (i + 1) as i64;
        let description = format!("city info-{timestamp}");
        docs.push(json!({"description": description, "ts": timestamp, "temperature": i+32}));
    }
    test_sandbox.add_documents(docs).await?;

    let search_request = SearchRequest {
        index_id_patterns: vec![index_id.to_string()],
        query_ast: qast_json_helper("city", &["description"]),
        max_hits: 15,
        sort_fields: vec![SortField {
            field_name: sort_by_field.to_string(),
            sort_order: SortOrder::Desc as i32,
            sort_datetime_format: None,
        }],
        ..Default::default()
    };

    match single_node_search(
        search_request,
        test_sandbox.metastore(),
        test_sandbox.storage_resolver(),
    )
    .await
    {
        Ok(single_node_response) => {
            assert_eq!(single_node_response.num_hits, 30);
            assert_eq!(single_node_response.hits.len(), 15);
            assert!(
                single_node_response.hits.windows(2).all(|hits| hits[0]
                    .partial_hit
                    .as_ref()
                    .unwrap()
                    .sort_value
                    >= hits[1].partial_hit.as_ref().unwrap().sort_value)
            );
            test_sandbox.assert_quit().await;
            Ok(())
        }
        Err(err) => {
            test_sandbox.assert_quit().await;
            Err(anyhow::Error::from(err))
        }
    }
}

#[tokio::test]
async fn test_single_node_sorting_with_query_fieldnorms_enabled() -> anyhow::Result<()> {
    single_node_search_sort_by_field("_score", true).await
}

#[tokio::test]
async fn test_single_node_sorting_with_query_fieldnorms_disabled() -> anyhow::Result<()> {
    single_node_search_sort_by_field("temperature", false).await
}

#[tokio::test]
async fn test_sort_bm25() {
    let index_id = "sort_by_bm25".to_string();
    let doc_mapping_yaml = r#"
            field_mappings:
              - name: title
                type: text
                record: freq
                fieldnorms: true
              - name: body
                type: text
                record: freq
                fieldnorms: true
              - name: nofreq
                type: text
                record: basic
                fieldnorms: true
              - name: nofreq_nofieldnorms
                type: text
                fieldnorms: false
            "#;
    let default_search_fields = &["title", "body", "nofreq", "nofreq_nofieldnorms"];
    let test_sandbox = TestSandbox::create(
        &index_id,
        doc_mapping_yaml,
        "{}",
        &default_search_fields[..],
    )
    .await
    .unwrap();
    let docs = vec![
        json!({"title": "one pad", "nofreq": "two pad"}), // 0
        json!({"title": "one", "nofreq": "two"}),         // 1
        json!({"title": "one one", "nofreq": "two two"}), // 2
    ];
    test_sandbox.add_documents(docs).await.unwrap();
    let search_hits = |query: &str| {
        let query_ast_json = serde_json::to_string(&query_ast_from_user_text(query, None)).unwrap();
        let search_request = SearchRequest {
            index_id_patterns: vec![index_id.to_string()],
            query_ast: query_ast_json,
            max_hits: 1_000,
            sort_fields: vec![SortField {
                field_name: "_score".to_string(),
                sort_order: SortOrder::Desc as i32,
                sort_datetime_format: None,
            }],
            ..Default::default()
        };
        let metastore = test_sandbox.metastore();
        let storage_resolver = test_sandbox.storage_resolver();
        async move {
            single_node_search(search_request, metastore, storage_resolver)
                .await
                .unwrap()
                .hits
                .into_iter()
                .map(|hit| {
                    let partial_hit = hit.partial_hit.unwrap();
                    let Some(SortByValue {
                        sort_value: Some(SortValue::F64(score)),
                    }) = partial_hit.sort_value
                    else {
                        panic!()
                    };
                    (score as f32, partial_hit.doc_id)
                })
                .collect()
        }
    };
    {
        let hits: Vec<(f32, u32)> = search_hits("title:one").await;
        assert_eq!(
            &hits[..],
            &[(0.1738279, 2), (0.15965714, 1), (0.12343242, 0)]
        );
    }
    {
        let hits: Vec<(f32, u32)> = search_hits("nofreq:two").await;
        assert_eq!(
            &hits[..],
            &[(0.15965714, 1), (0.12343242, 2), (0.12343242, 0)]
        );
    }
    {
        let hits: Vec<(f32, u32)> = search_hits("title:one nofreq:two").await;
        assert_eq!(
            &hits[..],
            &[(0.31931427, 1), (0.2972603, 2), (0.24686484, 0)]
        );
    }
    test_sandbox.assert_quit().await;
}

#[tokio::test]
async fn test_sort_by_static_and_dynamic_field() {
    let index_id = "sort_by_dynamic_field".to_string();
    // In this test, we will try sorting docs by several fields.
    // - static_i64
    // - static_u64
    // - dynamic_i64
    // - dynamic_u64
    let doc_mapping_yaml = r#"
            mode: dynamic
            field_mappings:
              - name: static_u64
                type: u64
                fast: true
              - name: static_i64
                type: i64
                fast: true
            dynamic_mapping:
                fast: true
                stored: true
            "#;
    let test_sandbox = TestSandbox::create(&index_id, doc_mapping_yaml, "{}", &[])
        .await
        .unwrap();
    let docs = vec![
        // 0
        json!({"static_u64": 3u64, "dynamic_u64": 3u64, "static_i64": 0i64, "dynamic_i64": 0i64}),
        // 1
        json!({"static_u64": 2u64, "dynamic_u64": 2u64, "static_i64": -1i64, "dynamic_i64": -1i64}),
        // 2
        json!({}),
        // 3
        json!({"static_u64": 4u64, "dynamic_u64": (i64::MAX as u64) + 1, "static_i64": 1i64, "dynamic_i64": 1i64}),
    ];
    test_sandbox.add_documents(docs).await.unwrap();
    let search_hits = |sort_field: &str, order: SortOrder| {
        let query_ast_json = serde_json::to_string(&QueryAst::MatchAll).unwrap();
        let search_request = SearchRequest {
            index_id_patterns: vec![index_id.to_string()],
            query_ast: query_ast_json,
            max_hits: 1_000,
            sort_fields: vec![SortField {
                field_name: sort_field.to_string(),
                sort_order: order as i32,
                sort_datetime_format: None,
            }],
            ..Default::default()
        };
        let metastore = test_sandbox.metastore();
        let storage_resolver = test_sandbox.storage_resolver();
        async move {
            let search_resp = single_node_search(search_request, metastore, storage_resolver)
                .await
                .unwrap();
            assert_eq!(search_resp.num_hits, 4);
            search_resp
                .hits
                .into_iter()
                .map(|hit| {
                    let partial_hit = hit.partial_hit.unwrap();
                    partial_hit.doc_id
                })
                .collect::<Vec<u32>>()
        }
    };
    {
        let ordered_docs: Vec<u32> = search_hits("static_u64", SortOrder::Desc).await;
        assert_eq!(&ordered_docs[..], &[3, 0, 1, 2]);
    }
    {
        let ordered_docs: Vec<u32> = search_hits("static_u64", SortOrder::Asc).await;
        assert_eq!(&ordered_docs[..], &[1, 0, 3, 2]);
    }
    {
        let ordered_docs: Vec<u32> = search_hits("static_i64", SortOrder::Desc).await;
        assert_eq!(&ordered_docs[..], &[3, 0, 1, 2]);
    }
    {
        let ordered_docs: Vec<u32> = search_hits("static_i64", SortOrder::Asc).await;
        assert_eq!(&ordered_docs[..], &[1, 0, 3, 2]);
    }
    {
        let ordered_docs: Vec<u32> = search_hits("dynamic_u64", SortOrder::Desc).await;
        assert_eq!(&ordered_docs[..], &[3, 0, 1, 2]);
    }
    {
        let ordered_docs: Vec<u32> = search_hits("dynamic_u64", SortOrder::Asc).await;
        assert_eq!(&ordered_docs[..], &[1, 0, 3, 2]);
    }
    {
        let ordered_docs: Vec<u32> = search_hits("dynamic_i64", SortOrder::Desc).await;
        assert_eq!(&ordered_docs[..], &[3, 0, 1, 2]);
    }
    {
        let ordered_docs: Vec<u32> = search_hits("dynamic_i64", SortOrder::Asc).await;
        assert_eq!(&ordered_docs[..], &[1, 0, 3, 2]);
    }
    test_sandbox.assert_quit().await;
}

#[tokio::test]
async fn test_sort_by_2_field() {
    let index_id = "sort_by_dynamic_field".to_string();
    // In this test, we will try sorting docs by several fields.
    // - static_u64
    // - dynamic_u64
    let doc_mapping_yaml = r#"
            mode: dynamic
            field_mappings:
              - name: static_u64
                type: u64
                fast: true
            dynamic_mapping:
                fast: true
                stored: true
            "#;
    let test_sandbox = TestSandbox::create(&index_id, doc_mapping_yaml, "{}", &[])
        .await
        .unwrap();
    let docs = vec![
        // 0
        json!({"static_u64": 3u64, "dynamic_u64": 3u64}),
        // 1
        json!({"static_u64": 3u64, "dynamic_u64": 2u64}),
        // 2
        json!({}),
        // 3
        json!({"dynamic_u64": 2u64}),
        // 4
        json!({"static_u64": 4u64, "dynamic_u64": (i64::MAX as u64) + 1}),
    ];
    test_sandbox.add_documents(docs).await.unwrap();
    let search_hits =
        |sort_field1: &str, order1: SortOrder, sort_field2: &str, order2: SortOrder| {
            let query_ast_json = serde_json::to_string(&QueryAst::MatchAll).unwrap();
            let search_request = SearchRequest {
                index_id_patterns: vec![index_id.to_string()],
                query_ast: query_ast_json,
                max_hits: 1_000,
                sort_fields: vec![
                    SortField {
                        field_name: sort_field1.to_string(),
                        sort_order: order1 as i32,
                        sort_datetime_format: None,
                    },
                    SortField {
                        field_name: sort_field2.to_string(),
                        sort_order: order2 as i32,
                        sort_datetime_format: None,
                    },
                ],
                ..Default::default()
            };
            let metastore = test_sandbox.metastore();
            let storage_resolver = test_sandbox.storage_resolver();
            async move {
                let search_resp = single_node_search(search_request, metastore, storage_resolver)
                    .await
                    .unwrap();
                assert_eq!(search_resp.num_hits, 5);
                search_resp
                    .hits
                    .into_iter()
                    .map(|hit| {
                        let partial_hit = hit.partial_hit.unwrap();
                        partial_hit.doc_id
                    })
                    .collect::<Vec<u32>>()
            }
        };
    {
        let ordered_docs: Vec<u32> = search_hits(
            "static_u64",
            SortOrder::Desc,
            "dynamic_u64",
            SortOrder::Desc,
        )
        .await;
        assert_eq!(&ordered_docs[..], &[4, 0, 1, 3, 2]);
    }
    {
        let ordered_docs: Vec<u32> =
            search_hits("static_u64", SortOrder::Desc, "dynamic_u64", SortOrder::Asc).await;
        assert_eq!(&ordered_docs[..], &[4, 1, 0, 3, 2]);
    }
    {
        let ordered_docs: Vec<u32> =
            search_hits("static_u64", SortOrder::Asc, "dynamic_u64", SortOrder::Desc).await;
        assert_eq!(&ordered_docs[..], &[0, 1, 4, 3, 2]);
    }
    {
        let ordered_docs: Vec<u32> =
            search_hits("static_u64", SortOrder::Asc, "dynamic_u64", SortOrder::Asc).await;
        assert_eq!(&ordered_docs[..], &[1, 0, 4, 3, 2]);
    }
    test_sandbox.assert_quit().await;
}

#[tokio::test]
async fn test_single_node_invalid_sorting_with_query() {
    let index_id = "single-node-invalid-sorting";
    let doc_mapping_yaml = r#"
            field_mappings:
              - name: description
                type: text
                fast: true
              - name: temperature
                type: i64
        "#;
    let test_sandbox = TestSandbox::create(index_id, doc_mapping_yaml, "{}", &["description"])
        .await
        .unwrap();

    let mut docs = Vec::new();
    for i in 0..30 {
        let description = format!("city info-{}", i + 1);
        docs.push(json!({"description": description, "ts": i+1, "temperature": i+32}));
    }
    test_sandbox.add_documents(docs).await.unwrap();

    let search_request = SearchRequest {
        index_id_patterns: vec![index_id.to_string()],
        query_ast: qast_json_helper("city", &["description"]),
        max_hits: 15,
        sort_fields: vec![SortField {
            field_name: "description".to_string(),
            sort_order: SortOrder::Desc as i32,
            sort_datetime_format: None,
        }],
        ..Default::default()
    };
    let single_node_response = single_node_search(
        search_request,
        test_sandbox.metastore(),
        test_sandbox.storage_resolver(),
    )
    .await;
    assert!(single_node_response.is_err());
    let error_msg = single_node_response.unwrap_err().to_string();
    assert_eq!(
        error_msg,
        "Invalid argument: sort by field on type text is currently not supported `description`"
    );
    test_sandbox.assert_quit().await;
}

#[tokio::test]
async fn test_single_node_split_pruning_by_tags() -> anyhow::Result<()> {
    let doc_mapping_yaml = r#"
            tag_fields:
              - owner
            field_mappings:
              - name: owner
                type: text
                tokenizer: raw
        "#;
    let index_id = "single-node-pruning-by-tags";
    let test_sandbox = TestSandbox::create(index_id, doc_mapping_yaml, "{}", &[]).await?;
    let index_uid = test_sandbox.index_uid();

    let owners = ["paul", "adrien"];
    for owner in owners {
        let mut docs = Vec::new();
        for i in 0..10 {
            docs.push(json!({"body": format!("content num #{}", i + 1), "owner": owner}));
        }
        test_sandbox.add_documents(docs).await?;
    }

    let query_ast: QueryAst = qast_helper("owner:francois", &[]);

    let selected_splits = list_relevant_splits(
        vec![index_uid.clone()],
        None,
        None,
        extract_tags_from_query(query_ast),
        &mut test_sandbox.metastore(),
    )
    .await?;
    assert!(selected_splits.is_empty());

    let query_ast: QueryAst = qast_helper("", &[]);

    let selected_splits = list_relevant_splits(
        vec![index_uid.clone()],
        None,
        None,
        extract_tags_from_query(query_ast),
        &mut test_sandbox.metastore(),
    )
    .await?;
    assert_eq!(selected_splits.len(), 2);

    let query_ast: QueryAst = qast_helper("owner:francois OR owner:paul OR owner:adrien", &[]);

    let selected_splits = list_relevant_splits(
        vec![index_uid.clone()],
        None,
        None,
        extract_tags_from_query(query_ast),
        &mut test_sandbox.metastore(),
    )
    .await?;
    assert_eq!(selected_splits.len(), 2);
    let split_tags: BTreeSet<String> = selected_splits
        .iter()
        .flat_map(|split| split.tags.clone())
        .collect();
    assert_eq!(
        split_tags
            .iter()
            .map(|tag| tag.as_str())
            .collect::<Vec<&str>>(),
        vec!["owner!", "owner:adrien", "owner:paul"]
    );
    test_sandbox.assert_quit().await;
    Ok(())
}

async fn test_search_util(test_sandbox: &TestSandbox, query: &str) -> Vec<u32> {
    let splits = test_sandbox
        .metastore()
        .list_splits(ListSplitsRequest::try_from_index_uid(test_sandbox.index_uid()).unwrap())
        .await
        .unwrap()
        .collect_splits()
        .await
        .unwrap();
    let splits_offsets: Vec<_> = splits
        .into_iter()
        .map(|split| extract_split_and_footer_offsets(&split.split_metadata))
        .collect();
    let request = Arc::new(SearchRequest {
        index_id_patterns: vec![test_sandbox.index_uid().index_id.to_string()],
        query_ast: qast_json_helper(query, &[]),
        max_hits: 100,
        ..Default::default()
    });
    let searcher_context: Arc<SearcherContext> = Arc::new(SearcherContext::new_without_invoker(
        SearcherConfig::default(),
        None,
    ));

    let search_response = single_doc_mapping_leaf_search(
        searcher_context,
        request,
        test_sandbox.storage(),
        splits_offsets,
        test_sandbox.doc_mapper(),
    )
    .await
    .unwrap();

    search_response
        .partial_hits
        .into_iter()
        .map(|partial_hit| partial_hit.doc_id)
        .collect::<Vec<u32>>()
}

#[tokio::test]
async fn test_search_dynamic_mode() -> anyhow::Result<()> {
    let doc_mapping_yaml = r#"
            field_mappings:
              - name: body
                type: text
                tokenizer: default
                indexed: true
            mode: dynamic
            dynamic_mapping:
                tokenizer: raw
        "#;
    let test_sandbox = TestSandbox::create("search_dynamic_mode", doc_mapping_yaml, "{}", &[])
        .await
        .unwrap();
    let docs = vec![
        json!({"body": "hello happy tax payer"}),
        json!({"body": "hello"}),
        json!({"body_dynamic": "hello happy tax payer"}),
        json!({"body_dynamic": "hello"}),
    ];
    test_sandbox.add_documents(docs).await.unwrap();
    {
        let docs = test_search_util(&test_sandbox, "body:hello").await;
        assert_eq!(&docs[..], &[1u32, 0u32]);
    }
    {
        let docs = test_search_util(&test_sandbox, "body_dynamic:hello").await;
        assert_eq!(&docs[..], &[3u32]); // 1 is not matched due to the raw tokenizer
    }
    test_sandbox.assert_quit().await;
    Ok(())
}

#[tokio::test]
async fn test_search_dynamic_mode_expand_dots() -> anyhow::Result<()> {
    let doc_mapping_yaml = r#"
            field_mappings: []
            mode: dynamic
            #dynamic_mapping:
            #  expand_dots: true -- that's the default value.
        "#;
    let test_sandbox = TestSandbox::create(
        "search_dynamic_mode_expand_dots",
        doc_mapping_yaml,
        "{}",
        &[],
    )
    .await
    .unwrap();
    let docs = vec![json!({"k8s.component.name": "quickwit"})];
    test_sandbox.add_documents(docs).await.unwrap();
    {
        let docs = test_search_util(&test_sandbox, "k8s.component.name:quickwit").await;
        assert_eq!(&docs[..], &[0u32]);
    }
    {
        let docs = test_search_util(&test_sandbox, r"k8s\.component\.name:quickwit").await;
        assert_eq!(&docs[..], &[0u32]);
    }
    test_sandbox.assert_quit().await;
    Ok(())
}

#[tokio::test]
async fn test_search_dynamic_mode_do_not_expand_dots() -> anyhow::Result<()> {
    let doc_mapping_yaml = r#"
            field_mappings: []
            mode: dynamic
            dynamic_mapping:
                expand_dots: false
        "#;
    let test_sandbox = TestSandbox::create(
        "search_dynamic_mode_not_expand_dots",
        doc_mapping_yaml,
        "{}",
        &[],
    )
    .await
    .unwrap();
    let docs = vec![json!({"k8s.component.name": "quickwit"})];
    test_sandbox.add_documents(docs).await.unwrap();
    {
        let docs = test_search_util(&test_sandbox, r"k8s\.component\.name:quickwit").await;
        assert_eq!(&docs[..], &[0u32]);
    }
    {
        let docs = test_search_util(&test_sandbox, r#"k8s.component.name:quickwit"#).await;
        assert!(docs.is_empty());
    }
    test_sandbox.assert_quit().await;
    Ok(())
}

fn json_to_named_field_doc(doc_json: JsonValue) -> NamedFieldDocument {
    assert!(doc_json.is_object());
    let mut doc_map: BTreeMap<String, Vec<TantivyValue>> = BTreeMap::new();
    for (key, value) in doc_json.as_object().unwrap().clone() {
        doc_map.insert(key, json_value_to_tantivy_value(value));
    }
    NamedFieldDocument(doc_map)
}

fn json_value_to_tantivy_value(value: JsonValue) -> Vec<TantivyValue> {
    match value {
        JsonValue::Bool(val) => vec![TantivyValue::Bool(val)],
        JsonValue::String(val) => vec![TantivyValue::Str(val)],
        JsonValue::Array(values) => values
            .into_iter()
            .flat_map(json_value_to_tantivy_value)
            .collect(),
        JsonValue::Object(object) => {
            vec![TantivyValue::Object(
                object
                    .into_iter()
                    .map(|(key, val)| (key, TantivyValue::from(val)))
                    .collect(),
            )]
        }
        JsonValue::Null => Vec::new(),
        value => vec![value.into()],
    }
}

#[track_caller]
fn test_convert_leaf_hit_aux(
    default_doc_mapper_json: JsonValue,
    document_json: JsonValue,
    expected_hit_json: JsonValue,
) {
    let default_doc_mapper: DocMapper = serde_json::from_value(default_doc_mapper_json).unwrap();
    let named_field_doc = json_to_named_field_doc(document_json);
    let hit_json_str =
        convert_document_to_json_string(named_field_doc, &default_doc_mapper).unwrap();
    let hit_json: JsonValue = serde_json::from_str(&hit_json_str).unwrap();
    assert_eq!(hit_json, expected_hit_json);
}

#[test]
fn test_convert_leaf_hit_multiple_cardinality() {
    test_convert_leaf_hit_aux(
        json!({
            "field_mappings": [
                { "name": "body", "type": "array<text>" }
            ],
            "mode": "lenient"
        }),
        json!({ "body": ["hello", "happy"] }),
        json!({ "body": ["hello", "happy"] }),
    );
}

#[test]
fn test_convert_leaf_hit_simple_cardinality() {
    test_convert_leaf_hit_aux(
        json!({
            "field_mappings": [
                { "name": "body", "type": "text" }
            ],
            "mode": "lenient"
        }),
        json!({ "body": ["hello", "happy"] }),
        json!({ "body": "hello" }),
    );
}

#[test]
fn test_convert_dynamic() {
    test_convert_leaf_hit_aux(
        json!({
            "field_mappings": [
                { "name": "body", "type": "text" }
            ],
            "mode": "dynamic"
        }),
        json!({ "body": ["hello", "happy"], "_dynamic": [{"title": "hello"}] }),
        json!({ "body": "hello", "title": "hello" }),
    );
}

#[test]
fn test_convert_leaf_object() {
    test_convert_leaf_hit_aux(
        json!({
            "field_mappings": [
                {
                    "name": "user",
                    "type": "object",
                    "field_mappings": [
                        {"name": "username", "type": "text"},
                        {"name": "email", "type": "text"}
                    ]
                }
            ],
            "mode": "lenient"
        }),
        json!({ "user.username": ["fulmicoton"], "user.email": ["werwe33@quickwit.io"]}),
        json!({ "user": {"username": "fulmicoton", "email": "werwe33@quickwit.io"}}),
    );
}

#[test]
fn test_convert_leaf_object_used_to_be_dynamic() {
    test_convert_leaf_hit_aux(
        json!({
            "field_mappings": [
                {
                    "name": "user",
                    "type": "object",
                    "field_mappings": [
                        {"name": "username", "type": "text"},
                    ]
                }
            ],
            "mode": "dynamic"
        }),
        json!({ "_dynamic": [{ "user": {"username": "fulmicoton", "email": "werwe33@quickwit.io"}}]}),
        json!({ "user": {"username": "fulmicoton", "email": "werwe33@quickwit.io"}}),
    );
    test_convert_leaf_hit_aux(
        json!({
            "field_mappings": [
                {
                    "name": "user",
                    "type": "object",
                    "field_mappings": [
                        {"name": "username", "type": "text"},
                    ]
                }
            ],
            "mode": "dynamic"
        }),
        json!({ "_dynamic": [{ "user": {"email": "werwe33@quickwit.io"}}], "user.username": ["fulmicoton"] }),
        json!({ "user": {"username": "fulmicoton", "email": "werwe33@quickwit.io"}}),
    );
}

// This spec might change in the future. The mode has no impact on the
// output of convert_document_to_json_string. In particular, it does not ignore
// the previously gathered dynamic field.
#[test]
fn test_convert_leaf_object_arguable_mode_does_not_affect_format() {
    test_convert_leaf_hit_aux(
        json!({ "mode": "strict" }),
        json!({ "_dynamic": [{ "user": {"username": "fulmicoton", "email": "werwe33@quickwit.io"}}]}),
        json!({ "user": {"username": "fulmicoton", "email": "werwe33@quickwit.io"}}),
    );
}

#[test]
fn test_convert_leaf_hit_with_source() {
    test_convert_leaf_hit_aux(
        json!({
            "field_mappings": [ {"name": "username", "type": "text"} ],
            "mode": "strict"
        }),
        json!({ "_source": [{"username": "fulmicoton"}], "username": ["fulmicoton"] }),
        json!({ "username": "fulmicoton", "_source": {"username": "fulmicoton"}}),
    );
}

#[tokio::test]
async fn test_single_node_aggregation() -> anyhow::Result<()> {
    let index_id = "single-node-agg-1";
    let doc_mapping_yaml = r#"
            field_mappings:
              - name: color
                type: text
                fast: true
              - name: price
                type: f64
                fast: true
        "#;
    let test_sandbox = TestSandbox::create(index_id, doc_mapping_yaml, "{}", &["color"]).await?;
    let docs = vec![
        json!({"color": "blue", "price": 10.0}),
        json!({"color": "blue", "price": 15.0}),
        json!({"color": "green", "price": 10.0}),
        json!({"color": "white", "price": 100.0}),
        json!({"color": "white", "price": 1.0}),
    ];
    let agg_req = r#"
 {
   "expensive_colors": {
     "terms": {
       "field": "color",
       "order": {
            "price_stats.max": "desc"
       }
     },
     "aggs": {
       "price_stats" : {
          "stats": {
              "field": "price"
          }
       }
     }
   }
 }"#;

    test_sandbox.add_documents(docs.clone()).await?;
    let search_request = SearchRequest {
        index_id_patterns: vec![index_id.to_string()],
        query_ast: qast_json_helper("*", &[]),
        max_hits: 2,
        aggregation_request: Some(agg_req.to_string()),
        ..Default::default()
    };
    let single_node_result = single_node_search(
        search_request,
        test_sandbox.metastore(),
        test_sandbox.storage_resolver(),
    )
    .await?;
    let agg_res_struct =
        AggregationResults::from_postcard(&single_node_result.aggregation_postcard.unwrap())?;
    let agg_res_json = serde_json::to_string(&agg_res_struct)?;
    let agg_res_parsed_json: JsonValue = serde_json::from_str(&agg_res_json)?;
    assert_eq!(
        agg_res_parsed_json["expensive_colors"]["buckets"][0]["key"],
        "white"
    );
    assert_eq!(
        agg_res_parsed_json["expensive_colors"]["buckets"][1]["key"],
        "blue"
    );
    assert_eq!(
        agg_res_parsed_json["expensive_colors"]["buckets"][2]["key"],
        "green"
    );
    assert!(single_node_result.elapsed_time_micros > 10);
    assert!(single_node_result.elapsed_time_micros < 1_000_000);
    test_sandbox.assert_quit().await;
    Ok(())
}

#[tokio::test]
async fn test_single_node_aggregation_missing_fast_field() {
    let index_id = "single-node-agg-2";
    let doc_mapping_yaml = r#"
            field_mappings:
              - name: color
                type: text
              - name: price
                type: f64
                fast: true
        "#;
    let test_sandbox = TestSandbox::create(index_id, doc_mapping_yaml, "{}", &["color"])
        .await
        .unwrap();
    let docs = vec![
        json!({"color": "blue", "price": 10.0}),
        json!({"color": "blue", "price": 15.0}),
        json!({"color": "green", "price": 10.0}),
        json!({"color": "white", "price": 100.0}),
        json!({"color": "white", "price": 1.0}),
    ];
    let agg_req = r#"
 {
   "expensive_colors": {
     "terms": {
       "field": "color",
       "order": {
            "price_stats.max": "desc"
       }
     },
     "aggs": {
       "price_stats" : {
          "stats": {
              "field": "price"
          }
       }
     }
   }
 }"#;

    test_sandbox.add_documents(docs.clone()).await.unwrap();
    let search_request = SearchRequest {
        index_id_patterns: vec![index_id.to_string()],
        query_ast: qast_json_helper("*", &[]),
        max_hits: 2,
        aggregation_request: Some(agg_req.to_string()),
        ..Default::default()
    };
    let single_node_error = single_node_search(
        search_request,
        test_sandbox.metastore(),
        test_sandbox.storage_resolver(),
    )
    .await
    .unwrap_err();
    let SearchError::InvalidArgument(error_msg) = single_node_error else {
        panic!();
    };
    assert!(error_msg.contains("Field \"color\" is not configured as a fast field"));
    test_sandbox.assert_quit().await;
}

#[tokio::test]
async fn test_single_node_with_ip_field() -> anyhow::Result<()> {
    let index_id = "single-node-with-ip-field";
    let doc_mapping_yaml = r#"
            field_mappings:
              - name: log
                type: text
              - name: host
                type: ip
        "#;
    let test_sandbox = TestSandbox::create(index_id, doc_mapping_yaml, "{}", &["log"]).await?;
    let docs = vec![
        json!({"log": "User not found", "host": "192.168.0.1"}),
        json!({"log": "Request failed", "host": "10.10.12.123"}),
        json!({"log": "Request successful", "host": "10.10.11.125"}),
        json!({"log": "Auth service error", "host": "2001:db8::1:0:0:1"}),
        json!({"log": "Settings saved", "host": "::afff:4567:890a"}),
        json!({"log": "Request failed", "host": "10.10.12.123"}),
    ];
    test_sandbox.add_documents(docs.clone()).await?;
    {
        let search_request = SearchRequest {
            index_id_patterns: vec![index_id.to_string()],
            query_ast: qast_json_helper("*", &[]),
            max_hits: 10,
            ..Default::default()
        };
        let single_node_result = single_node_search(
            search_request,
            test_sandbox.metastore(),
            test_sandbox.storage_resolver(),
        )
        .await?;
        assert_eq!(single_node_result.num_hits, 6);
        assert_eq!(single_node_result.hits.len(), 6);
    }
    {
        let search_request = SearchRequest {
            index_id_patterns: vec![index_id.to_string()],
            query_ast: qast_json_helper("10.10.11.125", &["host"]),
            max_hits: 10,
            ..Default::default()
        };
        let single_node_result = single_node_search(
            search_request,
            test_sandbox.metastore(),
            test_sandbox.storage_resolver(),
        )
        .await?;
        assert_eq!(single_node_result.num_hits, 1);
        assert_eq!(single_node_result.hits.len(), 1);
        let hit_json: JsonValue = serde_json::from_str(&single_node_result.hits[0].json)?;
        let expected_json: JsonValue = json!({"log": "Request successful", "host": "10.10.11.125"});
        assert_json_include!(actual: hit_json, expected: expected_json);
    }
    test_sandbox.assert_quit().await;
    Ok(())
}

#[tokio::test]
async fn test_single_node_range_queries() -> anyhow::Result<()> {
    let index_id = "single-node-range-queries";
    let doc_mapping_yaml = r#"
            field_mappings:
              - name: datetime
                type: datetime
                fast: true
              - name: log
                type: text
              - name: status_code
                type: u64
                fast: true
              - name: host
                type: ip
                fast: true
              - name: latency
                type: f64
                fast: true
              - name: error_code
                type: i64
                fast: true
        "#;
    let docs = vec![
        json!({"datetime": "2023-01-10T15:13:35Z", "log": "User not found", "status_code": 404, "host": "192.168.0.1", "latency": 12.34, "error_code": 4}),
        json!({"datetime": "2023-01-10T15:13:36Z", "log": "Request failed", "status_code": 400, "host": "10.10.12.123", "latency": 56.78, "error_code": 1}),
        json!({"datetime": "2023-01-10T15:13:37Z", "log": "Request successful", "status_code": 200, "host": "10.10.11.125", "latency": 91.10, "error_code": -1}),
        json!({"datetime": "2023-01-10T15:13:38Z", "log": "Auth service error", "status_code": 401, "host": "2001:db8::1:0:0:1", "latency": 111.12, "error_code": 2}),
        json!({"datetime": "2023-01-10T15:13:39Z", "log": "Settings saved", "status_code": 200, "host": "::afff:4567:890a", "latency": 112.13, "error_code": -1}),
        json!({"datetime": "2023-01-10T15:13:40Z", "log": "Request failed", "status_code": 400, "host": "10.10.12.123", "latency": 114.15, "error_code": 1}),
    ];
    let test_sandbox = TestSandbox::create(index_id, doc_mapping_yaml, "{}", &["log"]).await?;
    test_sandbox.add_documents(docs).await?;
    {
        let search_request = SearchRequest {
            index_id_patterns: vec![index_id.to_string()],
            query_ast: qast_json_helper(
                "datetime:[2023-01-10T15:13:36Z TO 2023-01-10T15:13:38Z}",
                &[],
            ),
            max_hits: 10,
            ..Default::default()
        };
        let single_node_result = single_node_search(
            search_request,
            test_sandbox.metastore(),
            test_sandbox.storage_resolver(),
        )
        .await?;
        assert_eq!(single_node_result.num_hits, 2);
        assert_eq!(single_node_result.hits.len(), 2);
    }
    {
        let search_request = SearchRequest {
            index_id_patterns: vec![index_id.to_string()],
            query_ast: qast_json_helper("status_code:[400 TO 401]", &[]),
            max_hits: 10,
            ..Default::default()
        };
        let single_node_result = single_node_search(
            search_request,
            test_sandbox.metastore(),
            test_sandbox.storage_resolver(),
        )
        .await?;
        assert_eq!(single_node_result.num_hits, 3);
        assert_eq!(single_node_result.hits.len(), 3);
    }
    {
        let search_request = SearchRequest {
            index_id_patterns: vec![index_id.to_string()],
            query_ast: qast_json_helper("host:[10.0.0.0 TO 10.255.255.255]", &[]),
            max_hits: 10,
            ..Default::default()
        };
        let single_node_result = single_node_search(
            search_request,
            test_sandbox.metastore(),
            test_sandbox.storage_resolver(),
        )
        .await?;
        assert_eq!(single_node_result.num_hits, 3);
        assert_eq!(single_node_result.hits.len(), 3);
    }
    {
        let search_request = SearchRequest {
            index_id_patterns: vec![index_id.to_string()],
            query_ast: qast_json_helper("latency:[100 TO *]", &[]),
            max_hits: 10,
            ..Default::default()
        };
        let single_node_result = single_node_search(
            search_request,
            test_sandbox.metastore(),
            test_sandbox.storage_resolver(),
        )
        .await?;
        assert_eq!(single_node_result.num_hits, 3);
        assert_eq!(single_node_result.hits.len(), 3);
    }
    {
        let search_request = SearchRequest {
            index_id_patterns: vec![index_id.to_string()],
            query_ast: qast_json_helper("error_code:[-1 TO 1]", &[]),
            max_hits: 10,
            ..Default::default()
        };
        let single_node_result = single_node_search(
            search_request,
            test_sandbox.metastore(),
            test_sandbox.storage_resolver(),
        )
        .await?;
        assert_eq!(single_node_result.num_hits, 4);
        assert_eq!(single_node_result.hits.len(), 4);
    }
    test_sandbox.assert_quit().await;
    Ok(())
}

#[allow(deprecated)]
fn collect_str_terms(response: LeafListTermsResponse) -> Vec<String> {
    response
        .terms
        .into_iter()
        .map(|term| Term::wrap(&term).value().as_str().unwrap().to_string())
        .collect()
}

#[tokio::test]
async fn test_single_node_list_terms() -> anyhow::Result<()> {
    let doc_mapping_yaml = r#"
            field_mappings:
              - name: title
                type: text
              - name: body
                type: text
              - name: url
                type: text
              - name: binary
                type: bytes
        "#;
    let test_sandbox =
        TestSandbox::create("single-node-list-terms", doc_mapping_yaml, "{}", &["body"]).await?;
    let docs = vec![
        json!({"title": "snoopy", "body": "Snoopy is an anthropomorphic beagle[5] in the comic strip...", "url": "http://snoopy", "binary": "dGhpcyBpcyBhIHRlc3Qu"}),
        json!({"title": "beagle", "body": "The beagle is a breed of small scent hound, similar in appearance to the much larger foxhound.", "url": "http://beagle", "binary": "bWFkZSB5b3UgbG9vay4="}),
    ];
    test_sandbox.add_documents(docs).await.unwrap();

    let splits = test_sandbox
        .metastore()
        .list_splits(ListSplitsRequest::try_from_index_uid(test_sandbox.index_uid()).unwrap())
        .await?
        .collect_splits()
        .await
        .unwrap();
    let splits_offsets: Vec<_> = splits
        .into_iter()
        .map(|split| extract_split_and_footer_offsets(&split.split_metadata))
        .collect();
    let searcher_context = Arc::new(SearcherContext::new_without_invoker(
        SearcherConfig::default(),
        None,
    ));

    {
        let request = ListTermsRequest {
            index_id_patterns: vec![test_sandbox.index_uid().index_id.to_string()],
            field: "title".to_string(),
            start_key: None,
            end_key: None,
            start_timestamp: None,
            end_timestamp: None,
            max_hits: Some(100),
        };
        let search_response = leaf_list_terms(
            searcher_context.clone(),
            &request,
            test_sandbox.storage(),
            &splits_offsets,
        )
        .await
        .unwrap();
        let terms = collect_str_terms(search_response);
        assert_eq!(terms, &["beagle", "snoopy",]);
    }
    {
        let request = ListTermsRequest {
            index_id_patterns: vec![test_sandbox.index_uid().index_id.to_string()],
            field: "title".to_string(),
            start_key: None,
            end_key: None,
            start_timestamp: None,
            end_timestamp: None,
            max_hits: Some(1),
        };
        let search_response = leaf_list_terms(
            searcher_context.clone(),
            &request,
            test_sandbox.storage(),
            &splits_offsets,
        )
        .await
        .unwrap();
        let terms = collect_str_terms(search_response);
        assert_eq!(terms, &["beagle"]);
    }
    {
        let request = ListTermsRequest {
            index_id_patterns: vec![test_sandbox.index_uid().index_id.to_string()],
            field: "title".to_string(),
            start_key: Some("casper".as_bytes().to_vec()),
            end_key: None,
            start_timestamp: None,
            end_timestamp: None,
            max_hits: Some(100),
        };
        let search_response = leaf_list_terms(
            searcher_context.clone(),
            &request,
            test_sandbox.storage(),
            &splits_offsets,
        )
        .await
        .unwrap();
        let terms = collect_str_terms(search_response);
        assert_eq!(terms, &["snoopy"]);
    }
    {
        let request = ListTermsRequest {
            index_id_patterns: vec![test_sandbox.index_uid().index_id.to_string()],
            field: "title".to_string(),
            start_key: None,
            end_key: Some("casper".as_bytes().to_vec()),
            start_timestamp: None,
            end_timestamp: None,
            max_hits: Some(100),
        };
        let search_response = leaf_list_terms(
            searcher_context.clone(),
            &request,
            test_sandbox.storage(),
            &splits_offsets,
        )
        .await
        .unwrap();
        let terms = collect_str_terms(search_response);
        assert_eq!(terms, &["beagle"]);
    }
    test_sandbox.assert_quit().await;
    Ok(())
}

#[tokio::test]
async fn test_single_node_find_trace_ids_collector() {
    let index_id = "single-node-find-trace-ids-collector";
    let doc_mapping_yaml = r#"
            field_mappings:
              - name: trace_id
                type: bytes
                fast: true
                input_format: hex
                output_format: hex
              - name: span_timestamp_secs
                type: datetime
                fast: true
                fast_precision: seconds
        "#;
    let foo_trace_id = TraceId::new([1u8; 16]);
    let bar_trace_id = TraceId::new([2u8; 16]);
    let qux_trace_id = TraceId::new([3u8; 16]);
    let baz_trace_id = TraceId::new([4u8; 16]);

    let docs = vec![
        json!({"trace_id": foo_trace_id, "span_timestamp_secs": "2023-01-10T15:13:35Z"}),
        json!({"trace_id": foo_trace_id, "span_timestamp_secs": "2023-01-10T15:13:36Z"}),
        json!({"trace_id": foo_trace_id, "span_timestamp_secs": "2023-01-10T15:13:37Z"}),
        json!({"trace_id": foo_trace_id, "span_timestamp_secs": "2023-01-10T15:13:38Z"}),
        json!({"trace_id": foo_trace_id, "span_timestamp_secs": "2023-01-10T15:13:39Z"}),
        json!({"trace_id": foo_trace_id, "span_timestamp_secs": "2023-01-10T15:13:40Z"}),
        json!({"trace_id": bar_trace_id, "span_timestamp_secs": "2024-01-10T15:13:35Z"}),
        json!({"trace_id": bar_trace_id, "span_timestamp_secs": "2024-01-10T15:13:40Z"}),
        json!({"trace_id": qux_trace_id, "span_timestamp_secs": "2025-01-10T15:13:40Z"}),
        json!({"trace_id": qux_trace_id, "span_timestamp_secs": "2025-01-10T15:13:35Z"}),
        json!({"trace_id": baz_trace_id, "span_timestamp_secs": "2022-01-10T15:13:35Z"}),
    ];
    let test_sandbox = TestSandbox::create(index_id, doc_mapping_yaml, "{}", &[])
        .await
        .unwrap();
    test_sandbox.add_documents(docs).await.unwrap();
    {
        let aggregations = r#"{
            "num_traces": 3,
            "trace_id_field_name": "trace_id",
            "span_timestamp_field_name": "span_timestamp_secs"
        }"#
        .to_string();

        let search_request = SearchRequest {
            index_id_patterns: vec![index_id.to_string()],
            query_ast: qast_json_helper("*", &[]),
            aggregation_request: Some(aggregations),
            ..Default::default()
        };
        let single_node_result = single_node_search(
            search_request,
            test_sandbox.metastore(),
            test_sandbox.storage_resolver(),
        )
        .await
        .unwrap();
        let aggregation_postcard = single_node_result.aggregation_postcard.unwrap();
        let trace_ids: Vec<Span> = postcard::from_bytes(&aggregation_postcard).unwrap();
        assert_eq!(trace_ids.len(), 3);

        assert_eq!(trace_ids[0].trace_id, qux_trace_id);
        assert_eq!(
            trace_ids[0].span_timestamp.into_timestamp_secs(),
            1736522020
        );
        assert_eq!(trace_ids[1].trace_id, bar_trace_id);
        assert_eq!(
            trace_ids[1].span_timestamp.into_timestamp_secs(),
            1704899620
        );
        assert_eq!(trace_ids[2].trace_id, foo_trace_id);
        assert_eq!(
            trace_ids[2].span_timestamp.into_timestamp_secs(),
            1673363620
        );
    }
    test_sandbox.assert_quit().await;
}

#[tokio::test]
async fn test_search_in_text_field_with_custom_tokenizer() -> anyhow::Result<()> {
    let doc_mapping_yaml = r#"
            tokenizers:
              - name: custom_tokenizer
                type: ngram
                min_gram: 3
                max_gram: 5
                prefix_only: true
            field_mappings:
              - name: body
                type: text
                tokenizer: custom_tokenizer
                indexed: true
        "#;
    let test_sandbox = TestSandbox::create("search_custom_tokenizer", doc_mapping_yaml, "{}", &[])
        .await
        .unwrap();
    let docs = vec![json!({"body": "hellohappy"})];
    test_sandbox.add_documents(docs).await.unwrap();
    {
        let docs = test_search_util(&test_sandbox, "body:happy").await;
        assert!(&docs.is_empty());
    }
    {
        let docs = test_search_util(&test_sandbox, "body:hel").await;
        assert_eq!(&docs[..], &[0u32]);
    }
    test_sandbox.assert_quit().await;
    Ok(())
}

#[test]
fn test_global_doc_address_ser_deser() {
    let doc_address = GlobalDocAddress {
        split: "split_id".to_string(),
        doc_addr: DocAddress {
            segment_ord: 0,
            doc_id: 123456,
        },
    };
    let doc_address_string = doc_address.to_string();
    let doc_address_deser: GlobalDocAddress = doc_address_string.parse().unwrap();
    assert_eq!(doc_address_deser, doc_address);
}


================================================
FILE: quickwit/quickwit-search/src/top_k_collector.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::cmp::{Ordering, Reverse};
use std::fmt::Debug;
use std::marker::PhantomData;

use quickwit_common::binary_heap::TopK;
use quickwit_proto::search::{PartialHit, SortOrder};
use quickwit_proto::types::SplitId;
use tantivy::{DocId, Score};

use crate::collector::{
    HitSortingMapper, SegmentPartialHit, SegmentPartialHitSortingKey,
    SortingFieldExtractorComponent, SortingFieldExtractorPair,
};

pub trait QuickwitSegmentTopKCollector {
    fn collect_top_k_block(&mut self, docs: &[DocId]);
    fn collect_top_k(&mut self, doc_id: DocId, score: Score);
    fn get_top_k(&self) -> Vec<PartialHit>;
}

trait IntoOptionU64 {
    #[inline]
    fn is_unit_type() -> bool {
        false
    }
    fn into_option_u64(self) -> Option<u64>;
    fn from_option_u64(value: Option<u64>) -> Self;
}
trait MinValue {
    fn min_value() -> Self;
}

impl IntoOptionU64 for Option<u64> {
    #[inline]
    fn into_option_u64(self) -> Option<u64> {
        self
    }
    #[inline]
    fn from_option_u64(value: Option<u64>) -> Self {
        value
    }
}

impl MinValue for Option<u64> {
    #[inline]
    fn min_value() -> Self {
        None
    }
}

impl IntoOptionU64 for Option<Reverse<u64>> {
    #[inline]
    fn into_option_u64(self) -> Option<u64> {
        self.map(|el| el.0)
    }
    #[inline]
    fn from_option_u64(value: Option<u64>) -> Self {
        value.map(Reverse)
    }
}
impl MinValue for Option<Reverse<u64>> {
    #[inline]
    fn min_value() -> Self {
        None
    }
}

impl IntoOptionU64 for () {
    #[inline]
    fn is_unit_type() -> bool {
        true
    }
    #[inline]
    fn into_option_u64(self) -> Option<u64> {
        None
    }
    #[inline]
    fn from_option_u64(_: Option<u64>) -> Self {}
}
impl MinValue for () {
    #[inline]
    fn min_value() -> Self {}
}

/// Generic hit struct for top k collector.
/// V1 and V2 are the types of the two values to sort by.
/// They are either Option<u64> or _statically_ disabled via unit type.
#[derive(Debug, Copy, Clone, PartialEq, Eq)]
struct Hit<V1, V2, const REVERSE_DOCID: bool> {
    doc_id: DocId,
    value1: V1,
    value2: V2,
}

impl<V1, V2, const REVERSE_DOCID: bool> MinValue for Hit<V1, V2, REVERSE_DOCID>
where
    V1: MinValue,
    V2: MinValue,
{
    #[inline]
    fn min_value() -> Self {
        let doc_id = if REVERSE_DOCID {
            DocId::MAX
        } else {
            DocId::MIN
        };
        Hit {
            doc_id,
            value1: V1::min_value(),
            value2: V2::min_value(),
        }
    }
}

impl<V1, V2, const REVERSE_DOCID: bool> std::fmt::Display for Hit<V1, V2, REVERSE_DOCID>
where
    V1: Copy + PartialEq + Eq + PartialOrd + Ord + Debug,
    V2: Copy + PartialEq + Eq + PartialOrd + Ord + Debug,
{
    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
        write!(
            f,
            "Hit(doc_id: {}, value1: {:?}, value2: {:?})",
            self.doc_id, self.value1, self.value2
        )
    }
}

impl<V1, V2, const REVERSE_DOCID: bool> Ord for Hit<V1, V2, REVERSE_DOCID>
where
    V1: Copy + PartialEq + Eq + PartialOrd + Ord + Debug + MinValue,
    V2: Copy + PartialEq + Eq + PartialOrd + Ord + Debug + MinValue,
{
    #[inline]
    fn cmp(&self, other: &Self) -> Ordering {
        let order = self.value1.cmp(&other.value1);
        order
            .then_with(|| self.value2.cmp(&other.value2))
            .then_with(|| {
                if REVERSE_DOCID {
                    other.doc_id.cmp(&self.doc_id)
                } else {
                    self.doc_id.cmp(&other.doc_id)
                }
            })
    }
}

impl<V1, V2, const REVERSE_DOCID: bool> PartialOrd for Hit<V1, V2, REVERSE_DOCID>
where
    V1: Copy + PartialEq + Eq + PartialOrd + Ord + Debug + MinValue,
    V2: Copy + PartialEq + Eq + PartialOrd + Ord + Debug + MinValue,
{
    #[inline]
    fn partial_cmp(&self, other: &Self) -> Option<Ordering> {
        Some(self.cmp(other))
    }
}

impl<
    V1: Copy + PartialEq + Eq + PartialOrd + Ord + IntoOptionU64 + Debug + MinValue,
    V2: Copy + PartialEq + Eq + PartialOrd + Ord + IntoOptionU64 + Debug + MinValue,
    const REVERSE_DOCID: bool,
> Hit<V1, V2, REVERSE_DOCID>
{
    #[inline]
    fn into_segment_partial_hit(self) -> SegmentPartialHit {
        SegmentPartialHit {
            sort_value: self.value1.into_option_u64(),
            sort_value2: self.value2.into_option_u64(),
            doc_id: self.doc_id,
        }
    }
}

pub fn specialized_top_k_segment_collector(
    split_id: SplitId,
    score_extractor: SortingFieldExtractorPair,
    leaf_max_hits: usize,
    segment_ord: u32,
    search_after_option: Option<PartialHit>,
    order1: SortOrder,
    order2: SortOrder,
) -> Box<dyn QuickwitSegmentTopKCollector> {
    // TODO: Add support for search_after to the specialized collector.
    // Eventually we may want to remove the generic collector to reduce complexity.
    if search_after_option.is_some() || score_extractor.is_score() {
        return Box::new(GenericQuickwitSegmentTopKCollector::new(
            split_id,
            score_extractor,
            leaf_max_hits,
            segment_ord,
            search_after_option,
            order1,
            order2,
        ));
    }

    let sort_first_by_ff = score_extractor.first.is_fast_field();
    let sort_second_by_ff = score_extractor
        .second
        .as_ref()
        .map(|extr| extr.is_fast_field())
        .unwrap_or(false);

    #[derive(Debug)]
    enum SortType {
        DocId,
        OneFFSort,
        TwoFFSorts,
    }
    let sort_type = match (sort_first_by_ff, sort_second_by_ff) {
        (false, false) => SortType::DocId,
        (true, false) => SortType::OneFFSort,
        (true, true) => SortType::TwoFFSorts,
        (false, true) => panic!("Internal error: Got second sort, but no first sort"),
    };
    // only check order1 for OneFFSort and DocId, as it's the only sort
    //
    // REVERSE_DOCID is only used for SortType::DocId and SortType::OneFFSort
    match (sort_type, order1, order2) {
        (SortType::DocId, SortOrder::Desc, _) => {
            Box::new(SpecializedSegmentTopKCollector::<(), (), false>::new(
                split_id,
                score_extractor,
                leaf_max_hits,
                segment_ord,
            ))
        }
        (SortType::DocId, SortOrder::Asc, _) => {
            Box::new(SpecializedSegmentTopKCollector::<(), (), true>::new(
                split_id,
                score_extractor,
                leaf_max_hits,
                segment_ord,
            ))
        }
        (SortType::OneFFSort, SortOrder::Asc, SortOrder::Asc) => {
            Box::new(SpecializedSegmentTopKCollector::<
                Option<Reverse<u64>>,
                (),
                true,
            >::new(
                split_id, score_extractor, leaf_max_hits, segment_ord
            ))
        }
        (SortType::OneFFSort, SortOrder::Desc, SortOrder::Asc) => Box::new(
            SpecializedSegmentTopKCollector::<Option<u64>, (), false>::new(
                split_id,
                score_extractor,
                leaf_max_hits,
                segment_ord,
            ),
        ),
        (SortType::OneFFSort, SortOrder::Asc, SortOrder::Desc) => {
            Box::new(SpecializedSegmentTopKCollector::<
                Option<Reverse<u64>>,
                (),
                true,
            >::new(
                split_id, score_extractor, leaf_max_hits, segment_ord
            ))
        }
        (SortType::OneFFSort, SortOrder::Desc, SortOrder::Desc) => Box::new(
            SpecializedSegmentTopKCollector::<Option<u64>, (), false>::new(
                split_id,
                score_extractor,
                leaf_max_hits,
                segment_ord,
            ),
        ),
        (SortType::TwoFFSorts, SortOrder::Asc, SortOrder::Asc) => {
            Box::new(SpecializedSegmentTopKCollector::<
                Option<Reverse<u64>>,
                Option<Reverse<u64>>,
                true,
            >::new(
                split_id, score_extractor, leaf_max_hits, segment_ord
            ))
        }
        (SortType::TwoFFSorts, SortOrder::Asc, SortOrder::Desc) => {
            Box::new(SpecializedSegmentTopKCollector::<
                Option<Reverse<u64>>,
                Option<u64>,
                true,
            >::new(
                split_id, score_extractor, leaf_max_hits, segment_ord
            ))
        }
        (SortType::TwoFFSorts, SortOrder::Desc, SortOrder::Asc) => {
            Box::new(SpecializedSegmentTopKCollector::<
                Option<u64>,
                Option<Reverse<u64>>,
                false,
            >::new(
                split_id, score_extractor, leaf_max_hits, segment_ord
            ))
        }
        (SortType::TwoFFSorts, SortOrder::Desc, SortOrder::Desc) => {
            Box::new(SpecializedSegmentTopKCollector::<
                Option<u64>,
                Option<u64>,
                false,
            >::new(
                split_id, score_extractor, leaf_max_hits, segment_ord
            ))
        }
    }
}

/// Fast Top K Computation
///
/// The buffer is truncated to the top_n elements when it reaches the capacity of the Vec.
/// That means capacity has special meaning and should be carried over when cloning or serializing.
///
/// For TopK == 0, it will be relative expensive.
struct TopKComputer<D> {
    /// Reverses sort order to get top-semantics instead of bottom-semantics
    buffer: Vec<Reverse<D>>,
    top_n: usize,
    pub(crate) threshold: D,
}

// Custom clone to keep capacity
impl<D: Clone> Clone for TopKComputer<D> {
    fn clone(&self) -> Self {
        let mut buffer_clone = Vec::with_capacity(self.buffer.capacity());
        buffer_clone.extend(self.buffer.iter().cloned());

        TopKComputer {
            buffer: buffer_clone,
            top_n: self.top_n,
            threshold: self.threshold.clone(),
        }
    }
}

impl<D> TopKComputer<D>
where D: Ord + Copy + Debug + MinValue
{
    /// Create a new `TopKComputer`.
    pub fn new(top_n: usize) -> Self {
        // Vec cap can't be 0, since it would panic in push
        let vec_cap = top_n.max(1) * 10;
        TopKComputer {
            buffer: Vec::with_capacity(vec_cap),
            top_n,
            threshold: D::min_value(),
        }
    }

    /// Push a new document to the top n.
    /// If the document is below the current threshold, it will be ignored.
    #[inline]
    pub fn push(&mut self, doc: D) {
        if doc < self.threshold {
            return;
        }
        if self.buffer.len() == self.buffer.capacity() {
            let median = self.truncate_top_n();
            self.threshold = median;
        }

        // This is faster since it avoids the buffer resizing to be inlined from vec.push()
        // (this is in the hot path)
        // TODO: Replace with `push_within_capacity` when it's stabilized
        let uninit = self.buffer.spare_capacity_mut();
        // This cannot panic, because we truncate_median will at least remove one element, since
        // the min capacity is larger than 2.
        uninit[0].write(Reverse(doc));
        // This is safe because it would panic in the line above
        unsafe {
            self.buffer.set_len(self.buffer.len() + 1);
        }
    }

    #[inline(never)]
    fn truncate_top_n(&mut self) -> D {
        // Use select_nth_unstable to find the top nth score
        let (_, median_el, _) = self.buffer.select_nth_unstable(self.top_n);

        let median_score = *median_el;
        // Remove all elements below the top_n
        self.buffer.truncate(self.top_n);

        median_score.0
    }

    /// Returns the top n elements in sorted order.
    pub fn into_sorted_vec(mut self) -> Vec<D> {
        if self.buffer.len() > self.top_n {
            self.truncate_top_n();
        }
        self.buffer.sort_unstable();
        self.buffer.into_iter().map(|el| el.0).collect()
    }

    /// Returns the top n elements in stored order.
    /// Useful if you do not need the elements in sorted order,
    /// for example when merging the results of multiple segments.
    #[allow(dead_code)]
    pub fn into_vec(mut self) -> Vec<D> {
        if self.buffer.len() > self.top_n {
            self.truncate_top_n();
        }
        self.buffer.into_iter().map(|el| el.0).collect()
    }
}

pub use tantivy::COLLECT_BLOCK_BUFFER_LEN;
struct SpecSortingFieldExtractor<V1, V2> {
    _phantom: std::marker::PhantomData<(V1, V2)>,
    sort_values1: Box<[Option<u64>; COLLECT_BLOCK_BUFFER_LEN]>,
    sort_values2: Box<[Option<u64>; COLLECT_BLOCK_BUFFER_LEN]>,

    pub first: SortingFieldExtractorComponent,
    pub second: Option<SortingFieldExtractorComponent>,
}

impl<
    V1: Copy + PartialEq + PartialOrd + Ord + IntoOptionU64 + Debug,
    V2: Copy + PartialEq + PartialOrd + Ord + IntoOptionU64 + Debug,
> SpecSortingFieldExtractor<V1, V2>
{
    fn new(
        first: SortingFieldExtractorComponent,
        second: Option<SortingFieldExtractorComponent>,
    ) -> Self {
        Self {
            _phantom: PhantomData,
            sort_values1: vec![None; COLLECT_BLOCK_BUFFER_LEN]
                .into_boxed_slice()
                .try_into()
                .unwrap(),
            sort_values2: vec![None; COLLECT_BLOCK_BUFFER_LEN]
                .into_boxed_slice()
                .try_into()
                .unwrap(),
            first,
            second,
        }
    }
    /// Fetches the sort values for the given docs.
    /// Does noting when sorting by docid.
    fn fetch_data(&mut self, docs: &[DocId]) {
        self.first
            .extract_typed_sort_values_block(docs, &mut self.sort_values1[..docs.len()]);
        if let Some(second) = self.second.as_ref() {
            second.extract_typed_sort_values_block(docs, &mut self.sort_values2[..docs.len()]);
        }
    }
    #[inline]
    fn iter_hits<'a, const REVERSE_DOCID: bool>(
        &'a self,
        docs: &'a [DocId],
    ) -> impl Iterator<Item = Hit<V1, V2, REVERSE_DOCID>> + 'a {
        SpecSortingFieldIter::<V1, V2, REVERSE_DOCID>::new(
            docs,
            &self.sort_values1,
            &self.sort_values2,
        )
    }
}

struct SpecSortingFieldIter<'a, V1, V2, const REVERSE_DOCID: bool> {
    docs: std::slice::Iter<'a, DocId>,
    sort_values1: std::slice::Iter<'a, Option<u64>>,
    sort_values2: std::slice::Iter<'a, Option<u64>>,
    _phantom: PhantomData<(V1, V2)>,
}

impl<'a, V1, V2, const REVERSE_DOCID: bool> SpecSortingFieldIter<'a, V1, V2, REVERSE_DOCID>
where
    V1: Copy + PartialEq + PartialOrd + Ord + IntoOptionU64,
    V2: Copy + PartialEq + PartialOrd + Ord + IntoOptionU64,
{
    #[inline]
    pub fn new(
        docs: &'a [DocId],
        sort_values1: &'a [Option<u64>; COLLECT_BLOCK_BUFFER_LEN],
        sort_values2: &'a [Option<u64>; COLLECT_BLOCK_BUFFER_LEN],
    ) -> Self {
        Self {
            docs: docs.iter(),
            sort_values1: sort_values1.iter(),
            sort_values2: sort_values2.iter(),
            _phantom: PhantomData,
        }
    }
}

impl<V1, V2, const REVERSE_DOCID: bool> Iterator for SpecSortingFieldIter<'_, V1, V2, REVERSE_DOCID>
where
    V1: Copy + PartialEq + Eq + PartialOrd + Ord + IntoOptionU64 + Debug,
    V2: Copy + PartialEq + Eq + PartialOrd + Ord + IntoOptionU64 + Debug,
{
    type Item = Hit<V1, V2, REVERSE_DOCID>;

    #[inline]
    fn next(&mut self) -> Option<Self::Item> {
        let doc_id = *self.docs.next()?;

        let value1 = if !V1::is_unit_type() {
            V1::from_option_u64(*self.sort_values1.next()?)
        } else {
            V1::from_option_u64(None)
        };

        let value2 = if !V2::is_unit_type() {
            V2::from_option_u64(*self.sort_values2.next()?)
        } else {
            V2::from_option_u64(None)
        };

        Some(Hit {
            doc_id,
            value1,
            value2,
        })
    }
}

/// No search after handling
/// Quickwit collector working at the scale of the segment.
struct SpecializedSegmentTopKCollector<
    V1: Copy + PartialEq + Eq + PartialOrd + Ord + IntoOptionU64 + Debug + MinValue,
    V2: Copy + PartialEq + Eq + PartialOrd + Ord + IntoOptionU64 + Debug + MinValue,
    const REVERSE_DOCID: bool,
> {
    split_id: SplitId,
    hit_fetcher: SpecSortingFieldExtractor<V1, V2>,
    top_k_hits: TopKComputer<Hit<V1, V2, REVERSE_DOCID>>,
    segment_ord: u32,
}

impl<
    V1: Copy + PartialEq + Eq + PartialOrd + Ord + IntoOptionU64 + Debug + MinValue + 'static,
    V2: Copy + PartialEq + Eq + PartialOrd + Ord + IntoOptionU64 + Debug + MinValue + 'static,
    const REVERSE_DOCID: bool,
> SpecializedSegmentTopKCollector<V1, V2, REVERSE_DOCID>
{
    pub fn new(
        split_id: SplitId,
        score_extractor: SortingFieldExtractorPair,
        leaf_max_hits: usize,
        segment_ord: u32,
    ) -> Self {
        let hit_fetcher =
            SpecSortingFieldExtractor::new(score_extractor.first, score_extractor.second);
        let top_k_hits = TopKComputer::new(leaf_max_hits);
        Self {
            split_id,
            hit_fetcher,
            top_k_hits,
            segment_ord,
        }
    }
}
impl<
    V1: Copy + PartialEq + Eq + PartialOrd + Ord + IntoOptionU64 + Debug + MinValue,
    V2: Copy + PartialEq + Eq + PartialOrd + Ord + IntoOptionU64 + Debug + MinValue,
    const REVERSE_DOCID: bool,
> QuickwitSegmentTopKCollector for SpecializedSegmentTopKCollector<V1, V2, REVERSE_DOCID>
{
    fn collect_top_k_block(&mut self, docs: &[DocId]) {
        self.hit_fetcher.fetch_data(docs);
        let iter = self.hit_fetcher.iter_hits::<REVERSE_DOCID>(docs);
        for doc_id in iter {
            self.top_k_hits.push(doc_id);
        }
    }

    #[inline]
    fn collect_top_k(&mut self, _doc_id: DocId, _score: Score) {
        panic!("Internal Error: This collector does not support collect_top_k");
    }

    fn get_top_k(&self) -> Vec<PartialHit> {
        self.top_k_hits
            .clone()
            .into_sorted_vec()
            .into_iter()
            .map(|el| el.into_segment_partial_hit())
            .map(|segment_partial_hit: SegmentPartialHit| {
                segment_partial_hit.into_partial_hit(
                    self.split_id.clone(),
                    self.segment_ord,
                    &self.hit_fetcher.first,
                    &self.hit_fetcher.second,
                )
            })
            .collect()
    }
}

/// Quickwit collector working at the scale of the segment.
pub(crate) struct GenericQuickwitSegmentTopKCollector {
    split_id: SplitId,
    score_extractor: SortingFieldExtractorPair,
    // PartialHits in this heap don't contain a split_id yet.
    top_k_hits: TopK<SegmentPartialHit, SegmentPartialHitSortingKey, HitSortingMapper>,
    segment_ord: u32,
    search_after: Option<SearchAfterSegment>,
    // Precomputed order for search_after for split_id and segment_ord
    precomp_search_after_order: Ordering,
    sort_values1: Box<[Option<u64>; COLLECT_BLOCK_BUFFER_LEN]>,
    sort_values2: Box<[Option<u64>; COLLECT_BLOCK_BUFFER_LEN]>,
}

impl GenericQuickwitSegmentTopKCollector {
    pub fn new(
        split_id: SplitId,
        score_extractor: SortingFieldExtractorPair,
        leaf_max_hits: usize,
        segment_ord: u32,
        search_after_option: Option<PartialHit>,
        order1: SortOrder,
        order2: SortOrder,
    ) -> Self {
        let sort_key_mapper = HitSortingMapper { order1, order2 };
        let precomp_search_after_order = match &search_after_option {
            Some(search_after) if !search_after.split_id.is_empty() => order1
                .compare(&split_id, &search_after.split_id)
                .then_with(|| order1.compare(&segment_ord, &search_after.segment_ord)),
            // This value isn't actually used.
            _ => Ordering::Equal,
        };
        let search_after =
            SearchAfterSegment::new(search_after_option, order1, order2, &score_extractor);

        GenericQuickwitSegmentTopKCollector {
            split_id,
            score_extractor,
            top_k_hits: TopK::new(leaf_max_hits, sort_key_mapper), // Adjusted for context
            segment_ord,
            search_after,
            precomp_search_after_order,
            sort_values1: vec![None; COLLECT_BLOCK_BUFFER_LEN]
                .into_boxed_slice()
                .try_into()
                .unwrap(),
            sort_values2: vec![None; COLLECT_BLOCK_BUFFER_LEN]
                .into_boxed_slice()
                .try_into()
                .unwrap(),
        }
    }
    #[inline]
    /// Generic top k collection, that includes search_after handling
    ///
    /// Outside of the collector to circumvent lifetime issues.
    fn collect_top_k_vals(
        doc_id: DocId,
        sort_value: Option<u64>,
        sort_value2: Option<u64>,
        search_after: &Option<SearchAfterSegment>,
        precomp_search_after_order: Ordering,
        top_k_hits: &mut TopK<SegmentPartialHit, SegmentPartialHitSortingKey, HitSortingMapper>,
    ) {
        if let Some(search_after) = &search_after {
            let search_after_value1 = search_after.sort_value;
            let search_after_value2 = search_after.sort_value2;
            let orders = &top_k_hits.sort_key_mapper;
            let mut cmp_result = orders
                .order1
                .compare_opt(&sort_value, &search_after_value1)
                .then_with(|| {
                    orders
                        .order2
                        .compare_opt(&sort_value2, &search_after_value2)
                });
            if search_after.compare_on_equal {
                // TODO actually it's not first, it should be what's in _shard_doc then first then
                // default
                let order = orders.order1;
                cmp_result = cmp_result
                    .then(precomp_search_after_order)
                    // We compare doc_id only if sort_value1, sort_value2, split_id and segment_ord
                    // are equal.
                    .then_with(|| order.compare(&doc_id, &search_after.doc_id))
            }

            if cmp_result != Ordering::Less {
                return;
            }
        }

        let hit = SegmentPartialHit {
            sort_value,
            sort_value2,
            doc_id,
        };
        top_k_hits.add_entry(hit);
    }
}
impl QuickwitSegmentTopKCollector for GenericQuickwitSegmentTopKCollector {
    fn collect_top_k_block(&mut self, docs: &[DocId]) {
        self.score_extractor.extract_typed_sort_values(
            docs,
            &mut self.sort_values1[..],
            &mut self.sort_values2[..],
        );
        if self.search_after.is_some() {
            // Search after not optimized for block collection yet
            for ((doc_id, sort_value), sort_value2) in docs
                .iter()
                .cloned()
                .zip(self.sort_values1.iter().cloned())
                .zip(self.sort_values2.iter().cloned())
            {
                Self::collect_top_k_vals(
                    doc_id,
                    sort_value,
                    sort_value2,
                    &self.search_after,
                    self.precomp_search_after_order,
                    &mut self.top_k_hits,
                );
            }
        } else {
            // Probably would make sense to check the fence against e.g. sort_values1 earlier,
            // before creating the SegmentPartialHit.
            //
            // Below are different versions to avoid iterating the caches if they are unused.
            //
            // No sort values loaded. Sort only by doc_id.
            if !self.score_extractor.first.is_fast_field() {
                for doc_id in docs.iter().cloned() {
                    let hit = SegmentPartialHit {
                        sort_value: None,
                        sort_value2: None,
                        doc_id,
                    };
                    self.top_k_hits.add_entry(hit);
                }
                return;
            }
            let has_no_second_sort = !self
                .score_extractor
                .second
                .as_ref()
                .map(|extr| extr.is_fast_field())
                .unwrap_or(false);
            // No second sort values => We can skip iterating the second sort values cache.
            if has_no_second_sort {
                for (doc_id, sort_value) in
                    docs.iter().cloned().zip(self.sort_values1.iter().cloned())
                {
                    let hit = SegmentPartialHit {
                        sort_value,
                        sort_value2: None,
                        doc_id,
                    };
                    self.top_k_hits.add_entry(hit);
                }
                return;
            }

            for ((doc_id, sort_value), sort_value2) in docs
                .iter()
                .cloned()
                .zip(self.sort_values1.iter().cloned())
                .zip(self.sort_values2.iter().cloned())
            {
                let hit = SegmentPartialHit {
                    sort_value,
                    sort_value2,
                    doc_id,
                };
                self.top_k_hits.add_entry(hit);
            }
        }
    }

    #[inline]
    fn collect_top_k(&mut self, doc_id: DocId, score: Score) {
        let (sort_value, sort_value2): (Option<u64>, Option<u64>) =
            self.score_extractor.extract_typed_sort_value(doc_id, score);
        Self::collect_top_k_vals(
            doc_id,
            sort_value,
            sort_value2,
            &self.search_after,
            self.precomp_search_after_order,
            &mut self.top_k_hits,
        );
    }

    fn get_top_k(&self) -> Vec<PartialHit> {
        self.top_k_hits
            .clone()
            .finalize()
            .into_iter()
            .map(|segment_partial_hit: SegmentPartialHit| {
                segment_partial_hit.into_partial_hit(
                    self.split_id.clone(),
                    self.segment_ord,
                    &self.score_extractor.first,
                    &self.score_extractor.second,
                )
            })
            .collect()
    }
}

/// Search After, but the sort values are converted to the u64 fast field representation.
pub(crate) struct SearchAfterSegment {
    sort_value: Option<u64>,
    sort_value2: Option<u64>,
    compare_on_equal: bool,
    doc_id: DocId,
}
impl SearchAfterSegment {
    pub fn new(
        search_after_opt: Option<PartialHit>,
        sort_order1: SortOrder,
        sort_order2: SortOrder,
        score_extractor: &SortingFieldExtractorPair,
    ) -> Option<Self> {
        let search_after = search_after_opt?;
        let mut sort_value = None;
        if let Some(search_after_sort_value) = search_after
            .sort_value
            .and_then(|sort_value| sort_value.sort_value)
        {
            if let Some(new_value) = score_extractor
                .first
                .convert_to_u64_ff_val(search_after_sort_value, sort_order1)
            {
                sort_value = Some(new_value);
            } else {
                // Value is out of bounds, we ignore sort_value2 and disable the whole
                // search_after
                return None;
            }
        }
        let mut sort_value2 = None;
        if let Some(search_after_sort_value) = search_after
            .sort_value2
            .and_then(|sort_value2| sort_value2.sort_value)
        {
            let extractor = score_extractor
                .second
                .as_ref()
                .expect("Internal error: Got sort_value2, but no sort extractor");
            if let Some(new_value) =
                extractor.convert_to_u64_ff_val(search_after_sort_value, sort_order2)
            {
                sort_value2 = Some(new_value);
            }
        }
        Some(Self {
            sort_value,
            sort_value2,
            compare_on_equal: !search_after.split_id.is_empty(),
            doc_id: search_after.doc_id,
        })
    }
}


================================================
FILE: quickwit/quickwit-serve/Cargo.toml
================================================
[package]
name = "quickwit-serve"
description = "REST API server"

version.workspace = true
edition.workspace = true
homepage.workspace = true
documentation.workspace = true
repository.workspace = true
authors.workspace = true
license.workspace = true

[dependencies]
anyhow = { workspace = true }
async-trait = { workspace = true }
base64 = { workspace = true }
bytes = { workspace = true }
bytesize = { workspace = true }
elasticsearch-dsl = "0.4"
flate2 = { workspace = true }
futures = { workspace = true }
futures-util = { workspace = true }
glob = { workspace = true }
hex = { workspace = true }
http = { workspace = true }
http-body = { workspace = true }
http-serde = { workspace = true }
humantime = { workspace = true }
hyper-util = {workspace = true}
itertools = { workspace = true }
mime_guess = { workspace = true }
once_cell = { workspace = true }
percent-encoding = { workspace = true }
pprof = { workspace = true, optional = true }
prost = { workspace = true }
prost-types = { workspace = true }
regex = { workspace = true }
rust-embed = { workspace = true }
rustls = { workspace = true }
rustls-pemfile = { workspace = true }
serde = { workspace = true }
serde_json = { workspace = true }
serde_qs = { workspace = true }
serde_with = { workspace = true }
thiserror = { workspace = true }
tokio = { workspace = true }
tokio-rustls = { workspace = true }
tokio-stream = { workspace = true }
tokio-util = { workspace = true }
tonic = { workspace = true }
tonic-health = { workspace = true }
tonic-reflection = { workspace = true }
tower = { workspace = true, features = ["limit"] }
tower-http = { workspace = true }
tracing = { workspace = true }
utoipa = { workspace = true }
warp = { workspace = true, features = ["server"] }
zstd = { workspace = true }

quickwit-actors = { workspace = true }
quickwit-cluster = { workspace = true }
quickwit-common = { workspace = true }
quickwit-config = { workspace = true }
quickwit-control-plane = { workspace = true }
quickwit-doc-mapper = { workspace = true }
quickwit-index-management = { workspace = true }
quickwit-indexing = { workspace = true }
quickwit-ingest = { workspace = true }
quickwit-jaeger = { workspace = true }
quickwit-janitor = { workspace = true }
quickwit-metastore = { workspace = true }
quickwit-opentelemetry = { workspace = true }
quickwit-proto = { workspace = true }
quickwit-query = { workspace = true }
quickwit-search = { workspace = true }
quickwit-lambda-client = { workspace = true, optional = true }
quickwit-storage = { workspace = true }
quickwit-telemetry = { workspace = true }

[build-dependencies]
time = { workspace = true }

[dev-dependencies]
assert-json-diff = { workspace = true }
http = { workspace = true }
itertools = { workspace = true }
mockall = { workspace = true }
tempfile = { workspace = true }
tokio = { workspace = true }
tokio-stream = { workspace = true }
tonic = { workspace = true }

quickwit-actors = { workspace = true, features = ["testsuite"] }
quickwit-cluster = { workspace = true, features = ["testsuite"] }
quickwit-common = { workspace = true, features = ["testsuite"] }
quickwit-config = { workspace = true, features = ["testsuite"] }
quickwit-control-plane = { workspace = true, features = ["testsuite"] }
quickwit-indexing = { workspace = true, features = ["testsuite"] }
quickwit-ingest = { workspace = true, features = ["testsuite"] }
quickwit-janitor = { workspace = true, features = ["testsuite"] }
quickwit-metastore = { workspace = true, features = ["testsuite"] }
quickwit-opentelemetry = { workspace = true, features = ["testsuite"] }
quickwit-proto = { workspace = true, features = ["testsuite"] }
quickwit-search = { workspace = true, features = ["testsuite"] }
quickwit-storage = { workspace = true, features = ["testsuite"] }

[features]
pprof = [
  "dep:pprof"
]
jemalloc-profiled = [
  "quickwit-common/jemalloc-profiled"
]
testsuite = []
sqs-for-tests = [
  "quickwit-indexing/sqs",
  "quickwit-indexing/sqs-test-helpers"
]
lambda = [
  "quickwit-lambda-client"
]


================================================
FILE: quickwit/quickwit-serve/README.md
================================================
# quickwit-serve

This project hosts the REST, the gRPC API associated with quickwit and the react UI.

## REST and gRPC API

The API is split into:
- the search API: the normal and the stream search api;
- the index management API: create, delete, list indexes and list splits of an index;
- the ingest API;
- the cluster API: expose information about the cluster, its members etc;
- the health check API: the health check of the current node. This API is rest only at the moment.

The APIs are usually accessible both via gRPC and REST.
This is done consistently using the following pattern.

A service async trait mimics the tonic service api, but without the `tonic`
wrapping of the request and with a rich and specific error type instead of tonic::Status.
The argument and the response on the other hand are typically using protobuf object
directly whenever sensible.

This service only has one implementation but is a trait for mocking purpose.
This service is typically exposed by another crate, specific to the API considered.
For instance, the search api has a `SearchService` trait, using the `SearchError`
response in the `quickwit-search` crate.

An adapter then wraps this service to implement the grpc::Service
(It simply does the wrapping of the request / results and converts errors to the tonic status.).

The rest API then relies on calling this service.

```mermaid
graph TD
    grpc_service[grpc::BlopService] --> |wraps| service(Go shopping)
    rest[blop_handler] --> |calls| service(Go shopping)
    service[BlopService]
```

## UI

The server also exposes at `/ui` all static files located in `quickwit-ui/build` directory. These static files are
produced by the react app build in `quickwit-ui`.
During development, the server will serve the local files. When building the binary, these static files will be embedded in it.


================================================
FILE: quickwit/quickwit-serve/build.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::env;
use std::process::Command;

use time::OffsetDateTime;
use time::macros::format_description;

fn main() {
    println!(
        "cargo:rustc-env=BUILD_DATE={}",
        OffsetDateTime::now_utc()
            .format(format_description!(
                "[year]-[month]-[day]T[hour]:[minute]:[second]Z"
            ))
            .unwrap()
    );
    println!(
        "cargo:rustc-env=BUILD_PROFILE={}",
        env::var("PROFILE").unwrap()
    );
    println!(
        "cargo:rustc-env=BUILD_TARGET={}",
        env::var("TARGET").unwrap()
    );
    commit_info();
}

/// Extracts commit date, hash, and tags
fn commit_info() {
    // Extract commit date and hash.
    let output_bytes = match Command::new("git")
        .arg("log")
        .arg("-1")
        .arg("--format=%cd %H")
        .arg("--date=format-local:%Y-%m-%dT%H:%M:%SZ")
        .env("TZ", "UTC0")
        .output()
    {
        Ok(output) if output.status.success() => output.stdout,
        _ => Vec::new(),
    };
    let output = String::from_utf8(output_bytes).unwrap();
    let mut parts = output.split_whitespace();

    if let Some(commit_date) = parts.next() {
        println!("cargo:rustc-env=QW_COMMIT_DATE={commit_date}");
    }
    if let Some(commit_hash) = parts.next() {
        println!("cargo:rustc-env=QW_COMMIT_HASH={commit_hash}");
    }

    // Extract commit tags.
    let output_bytes = match Command::new("git")
        .arg("tag")
        .arg("--points-at")
        .arg("HEAD")
        .output()
    {
        Ok(output) if output.status.success() => output.stdout,
        _ => Vec::new(),
    };
    let output = String::from_utf8(output_bytes).unwrap();
    let tags = output.lines().collect::<Vec<_>>();
    if !tags.is_empty() {
        println!("cargo:rustc-env=QW_COMMIT_TAGS={}", tags.join(","));
    }
}


================================================
FILE: quickwit/quickwit-serve/resources/tests/jaeger_ui_trace.json
================================================
{
    "traceID": "0000000000000001",
    "spans": [
      {
        "traceID": "0000000000000001",
        "spanID": "0000000000000001",
        "operationName": "test-general-conversion",
        "references": [],
        "startTime": 1485467191639875,
        "duration": 5,
        "flags": 0,
        "tags": [],
        "logs": [
          {
            "timestamp": 1485467191639875,
            "fields": [
              {
                "key": "event",
                "type": "string",
                "value": "some-event"
              }
            ]
          },
          {
            "timestamp": 1485467191639875,
            "fields": [
              {
                "key": "x",
                "type": "string",
                "value": "y"
              }
            ]
          }
        ],
        "processID": "p1",
        "warnings": []
      },
      {
        "traceID": "0000000000000001",
        "spanID": "0000000000000002",
        "operationName": "some-operation",
        "references": [],
        "flags": 0,
        "startTime": 1485467191639875,
        "duration": 5,
        "tags": [
          {
            "key": "peer.service",
            "type": "string",
            "value": "service-y"
          },
          {
            "key": "peer.ipv4",
            "type": "int64",
            "value": 23456
          },
          {
            "key": "error",
            "type": "bool",
            "value": true
          },
          {
            "key": "temperature",
            "type": "float64",
            "value": 72.5
          },
          {
            "key": "javascript_limit",
            "type": "int64",
            "value": "9223372036854775222"
          },
          {
            "key": "blob",
            "type": "binary",
            "value": "AAAwOQ=="
          }
        ],
        "logs": [],
        "processID": "p1",
        "warnings": []
      },
      {
        "traceID": "0000000000000001",
        "spanID": "0000000000000003",
        "operationName": "some-operation",
        "flags": 0,
        "references": [
          {
            "refType": "CHILD_OF",
            "traceID": "0000000000000001",
            "spanID": "0000000000000002"
          }
        ],
        "startTime": 1485467191639875,
        "duration": 5,
        "tags": [],
        "logs": [],
        "processID": "p2",
        "warnings": []
      },
      {
        "traceID": "0000000000000001",
        "spanID": "0000000000000004",
        "operationName": "reference-test",
        "flags": 0,
        "references": [
          {
            "refType": "CHILD_OF",
            "traceID": "00000000000000ff",
            "spanID": "00000000000000ff"
          },
          {
            "refType": "CHILD_OF",
            "traceID": "0000000000000001",
            "spanID": "0000000000000002"
          },
          {
            "refType": "FOLLOWS_FROM",
            "traceID": "0000000000000001",
            "spanID": "0000000000000002"
          }
        ],
        "startTime": 1485467191639875,
        "duration": 5,
        "tags": [],
        "logs": [],
        "processID": "p2",
        "warnings": [
          "some span warning"
        ]
      },
      {
        "traceID": "0000000000000001",
        "spanID": "0000000000000005",
        "operationName": "preserveParentID-test",
        "flags": 0,
        "references": [
          {
            "refType": "CHILD_OF",
            "traceID": "0000000000000001",
            "spanID": "0000000000000004"
          }
        ],
        "startTime": 1485467191639875,
        "duration": 4,
        "tags": [],
        "logs": [],
        "processID": "p2",
        "warnings": [
          "some span warning"
        ]
      }
    ],
    "processes": {
      "p1": {
        "serviceName": "service-x",
        "key": "p1",
        "tags": []
      },
      "p2": {
        "serviceName": "service-y",
        "key": "p2",
        "tags": []
      }
    },
    "warnings": [
    ]
  }


================================================
FILE: quickwit/quickwit-serve/src/build_info.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use once_cell::sync::OnceCell;
use quickwit_common::runtimes::RuntimesConfig;
use serde::Serialize;

#[derive(Debug, Eq, PartialEq, Serialize, utoipa::ToSchema)]
pub struct BuildInfo {
    pub build_date: &'static str,
    pub build_profile: &'static str,
    pub build_target: &'static str,
    pub cargo_pkg_version: &'static str,
    pub commit_date: &'static str,
    pub commit_hash: &'static str,
    pub commit_short_hash: &'static str,
    pub commit_tags: Vec<String>,
    pub version: String,
}

impl BuildInfo {
    /// Returns the properties of the binary.
    pub fn get() -> &'static Self {
        const UNKNOWN: &str = "unknown";

        static INSTANCE: OnceCell<BuildInfo> = OnceCell::new();

        INSTANCE.get_or_init(|| {
            let commit_date = option_env!("QW_COMMIT_DATE")
                .filter(|commit_date| !commit_date.is_empty())
                .unwrap_or(UNKNOWN);
            let commit_hash = option_env!("QW_COMMIT_HASH")
                .filter(|commit_hash| !commit_hash.is_empty())
                .unwrap_or(UNKNOWN);
            let commit_short_hash = option_env!("QW_COMMIT_HASH")
                .filter(|commit_hash| commit_hash.len() >= 7)
                .map(|commit_hash| &commit_hash[..7])
                .unwrap_or(UNKNOWN);
            let mut commit_tags: Vec<String> = option_env!("QW_COMMIT_TAGS")
                .map(|tags| {
                    tags.split(',')
                        .map(|tag| tag.trim().to_string())
                        .filter(|tag| !tag.is_empty())
                        .collect()
                })
                .unwrap_or_default();
            commit_tags.sort();

            let version = commit_tags
                .iter()
                .find(|tag| tag.starts_with('v'))
                .cloned()
                .unwrap_or_else(|| concat!(env!("CARGO_PKG_VERSION"), "-nightly").to_string());

            Self {
                build_date: env!("BUILD_DATE"),
                build_profile: env!("BUILD_PROFILE"),
                build_target: env!("BUILD_TARGET"),
                cargo_pkg_version: env!("CARGO_PKG_VERSION"),
                commit_date,
                commit_hash,
                commit_short_hash,
                commit_tags,
                version,
            }
        })
    }

    pub fn get_version_text() -> String {
        let build_info = Self::get();
        format!(
            "{} ({} {} {})",
            build_info.cargo_pkg_version,
            build_info.build_target,
            build_info.commit_date,
            build_info.commit_short_hash
        )
    }
}

#[derive(Debug, Eq, PartialEq, Serialize, utoipa::ToSchema)]
pub struct RuntimeInfo {
    // This is a number of logical cpus: vCPU or hyperthread depending on where you are running.
    // This is usually NOT necessarily the number of cores.
    pub num_cpus: usize,
    pub num_threads_blocking: usize,
    pub num_threads_non_blocking: usize,
}

impl RuntimeInfo {
    /// Returns the properties of the node.
    pub fn get() -> &'static Self {
        static INSTANCE: OnceCell<RuntimeInfo> = OnceCell::new();

        INSTANCE.get_or_init(|| {
            let num_cpus = quickwit_common::num_cpus();
            let runtimes_config = RuntimesConfig::with_num_cpus(num_cpus);
            Self {
                num_cpus,
                num_threads_blocking: runtimes_config.num_threads_blocking,
                num_threads_non_blocking: runtimes_config.num_threads_non_blocking,
            }
        })
    }
}


================================================
FILE: quickwit/quickwit-serve/src/cluster_api/mod.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

mod rest_handler;

pub use rest_handler::{ClusterApi, cluster_handler};


================================================
FILE: quickwit/quickwit-serve/src/cluster_api/rest_handler.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::convert::Infallible;

use quickwit_cluster::{Cluster, ClusterSnapshot, NodeIdSchema};
use warp::{Filter, Rejection};

use crate::format::extract_format_from_qs;
use crate::rest::recover_fn;
use crate::rest_api_response::into_rest_api_response;

#[derive(utoipa::OpenApi)]
#[openapi(
    paths(get_cluster),
    components(schemas(ClusterSnapshot, NodeIdSchema,))
)]
pub struct ClusterApi;

/// Cluster handler.
pub fn cluster_handler(
    cluster: Cluster,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    warp::path!("cluster")
        .and(warp::path::end())
        .and(warp::get())
        .and(warp::path::end().map(move || cluster.clone()))
        .then(get_cluster)
        .and(extract_format_from_qs())
        .map(into_rest_api_response)
        .recover(recover_fn)
        .boxed()
}

#[utoipa::path(
    get,
    tag = "Cluster Info",
    path = "/cluster",
    responses(
        (status = 200, description = "Successfully fetched cluster information.", body = ClusterSnapshot)
    )
)]

/// Get cluster information.
async fn get_cluster(cluster: Cluster) -> Result<ClusterSnapshot, Infallible> {
    let snapshot = cluster.snapshot().await;
    Ok(snapshot)
}


================================================
FILE: quickwit/quickwit-serve/src/decompression.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::io::Read;
use std::sync::OnceLock;

use bytes::Bytes;
use flate2::read::{MultiGzDecoder, ZlibDecoder};
use quickwit_common::metrics::{GaugeGuard, MEMORY_METRICS};
use quickwit_common::thread_pool::run_cpu_intensive;
use thiserror::Error;
use warp::Filter;
use warp::reject::Reject;

use crate::load_shield::{LoadShield, LoadShieldPermit};

fn get_ingest_load_shield() -> &'static LoadShield {
    static LOAD_SHIELD: OnceLock<LoadShield> = OnceLock::new();
    LOAD_SHIELD.get_or_init(|| LoadShield::new("ingest"))
}

/// There are two ways to decompress the body:
/// - Stream the body through an async decompressor
/// - Fetch the body and then decompress the bytes
///
/// The first approach lowers the latency, while the second approach is more CPU efficient.
/// Ingesting data is usually CPU bound and there is considerable latency until the data is
/// searchable, so the second approach is more suitable for this use case.
async fn decompress_body(encoding: Option<String>, body: Bytes) -> Result<Bytes, warp::Rejection> {
    match encoding.as_deref() {
        Some("identity") => Ok(body),
        Some("gzip" | "x-gzip") => {
            let decompressed = run_cpu_intensive(move || {
                let mut decompressed = Vec::new();
                let mut decoder = MultiGzDecoder::new(body.as_ref());
                decoder
                    .read_to_end(&mut decompressed)
                    .map_err(|_| warp::reject::custom(CorruptedData))?;
                Result::<_, warp::Rejection>::Ok(Bytes::from(decompressed))
            })
            .await
            .map_err(|_| warp::reject::custom(CorruptedData))??;
            Ok(decompressed)
        }
        Some("zstd") => {
            let decompressed = run_cpu_intensive(move || {
                zstd::decode_all(body.as_ref())
                    .map(Bytes::from)
                    .map_err(|_| warp::reject::custom(CorruptedData))
            })
            .await
            .map_err(|_| warp::reject::custom(CorruptedData))??;
            Ok(decompressed)
        }
        Some("deflate" | "x-deflate") => {
            let decompressed = run_cpu_intensive(move || {
                let mut decompressed = Vec::new();
                ZlibDecoder::new(body.as_ref())
                    .read_to_end(&mut decompressed)
                    .map_err(|_| warp::reject::custom(CorruptedData))?;
                Result::<_, warp::Rejection>::Ok(Bytes::from(decompressed))
            })
            .await
            .map_err(|_| warp::reject::custom(CorruptedData))??;
            Ok(decompressed)
        }
        Some(encoding) => Err(warp::reject::custom(UnsupportedEncoding(
            encoding.to_string(),
        ))),
        _ => Ok(body),
    }
}

#[derive(Debug, Error)]
#[error("Error while decompressing the data")]
pub(crate) struct CorruptedData;

impl Reject for CorruptedData {}

#[derive(Debug, Error)]
#[error("Unsupported Content-Encoding {}. Supported encodings are 'gzip' and 'zstd'", self.0)]
pub(crate) struct UnsupportedEncoding(String);

impl Reject for UnsupportedEncoding {}

/// Custom filter for optional decompression
pub(crate) fn get_body_bytes() -> impl Filter<Extract = (Body,), Error = warp::Rejection> + Clone {
    warp::header::optional("content-encoding")
        .and(warp::body::bytes())
        .and_then(|encoding: Option<String>, body: Bytes| async move {
            let permit = get_ingest_load_shield().acquire_permit().await?;
            decompress_body(encoding, body)
                .await
                .map(|content| Body::new(content, permit))
        })
}

pub(crate) struct Body {
    pub content: Bytes,
    _gauge_guard: GaugeGuard<'static>,
    _permit: LoadShieldPermit,
}

impl Body {
    pub fn new(content: Bytes, load_shield_permit: LoadShieldPermit) -> Body {
        let mut gauge_guard = GaugeGuard::from_gauge(&MEMORY_METRICS.in_flight.rest_server);
        gauge_guard.add(content.len() as i64);
        Body {
            content,
            _gauge_guard: gauge_guard,
            _permit: load_shield_permit,
        }
    }
}


================================================
FILE: quickwit/quickwit-serve/src/delete_task_api/handler.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use quickwit_config::build_doc_mapper;
use quickwit_janitor::error::JanitorError;
use quickwit_metastore::IndexMetadataResponseExt;
use quickwit_proto::metastore::{
    DeleteQuery, DeleteTask, IndexMetadataRequest, ListDeleteTasksRequest, MetastoreResult,
    MetastoreService, MetastoreServiceClient,
};
use quickwit_proto::search::SearchRequest;
use quickwit_proto::types::{IndexId, IndexUid};
use quickwit_query::query_ast::{QueryAst, query_ast_from_user_text};
use serde::Deserialize;
use warp::{Filter, Rejection};

use crate::format::extract_format_from_qs;
use crate::rest::recover_fn;
use crate::rest_api_response::into_rest_api_response;
use crate::with_arg;

#[derive(utoipa::OpenApi)]
#[openapi(
    paths(get_delete_tasks, post_delete_request),
    components(schemas(DeleteQueryRequest, DeleteTask, DeleteQuery))
)]
pub struct DeleteTaskApi;

/// This struct represents the delete query passed to
/// the rest API.
#[derive(Deserialize, Debug, Eq, PartialEq, Default, utoipa::ToSchema)]
#[serde(deny_unknown_fields)]
pub struct DeleteQueryRequest {
    /// Query text. The query language is that of tantivy.
    pub query: String,
    // Fields to search on
    #[serde(rename(deserialize = "search_field"))]
    #[serde(default)]
    pub search_fields: Option<Vec<String>>,
    /// If set, restrict delete to documents with a `timestamp >= start_timestamp`.
    pub start_timestamp: Option<i64>,
    /// If set, restrict delete to documents with a `timestamp < end_timestamp``.
    pub end_timestamp: Option<i64>,
}

/// Delete query API handlers.
pub fn delete_task_api_handlers(
    metastore: MetastoreServiceClient,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    get_delete_tasks_handler(metastore.clone())
        .or(post_delete_tasks_handler(metastore.clone()))
        .recover(recover_fn)
        .boxed()
}

pub fn get_delete_tasks_handler(
    metastore: MetastoreServiceClient,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    warp::path!(String / "delete-tasks")
        .and(warp::get())
        .and(with_arg(metastore))
        .then(get_delete_tasks)
        .and(extract_format_from_qs())
        .map(into_rest_api_response)
}

#[utoipa::path(
    get,
    tag = "Delete Tasks",
    path = "/{index_id}/delete-tasks",
    responses(
        (status = 200, description = "Successfully fetched delete tasks.", body = [DeleteTask])
    ),
    params(
        ("index_id" = String, Path, description = "The index ID to retrieve delete tasks for."),
    )
)]
/// Get Delete Tasks
///
/// Returns delete tasks in json format for a given `index_id`.
// Note that `_delete_task_service_mailbox` is not used...
// Explanation: we don't want to expose any delete tasks endpoints without a running
// `DeleteTaskService`. This is ensured by requiring a `Mailbox<DeleteTaskService>` in
// `get_delete_tasks_handler` and consequently we get the mailbox in `get_delete_tasks` signature.
pub async fn get_delete_tasks(
    index_id: IndexId,
    metastore: MetastoreServiceClient,
) -> MetastoreResult<Vec<DeleteTask>> {
    let index_metadata_request = IndexMetadataRequest::for_index_id(index_id.to_string());
    let index_uid: IndexUid = metastore
        .index_metadata(index_metadata_request)
        .await?
        .deserialize_index_metadata()?
        .index_uid;
    let list_delete_tasks_request = ListDeleteTasksRequest::new(index_uid, 0);
    let delete_tasks = metastore
        .list_delete_tasks(list_delete_tasks_request)
        .await?
        .delete_tasks;
    Ok(delete_tasks)
}

pub fn post_delete_tasks_handler(
    metastore: MetastoreServiceClient,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    warp::path!(String / "delete-tasks")
        .and(warp::body::json())
        .and(warp::post())
        .and(with_arg(metastore))
        .then(post_delete_request)
        .and(extract_format_from_qs())
        .map(into_rest_api_response)
}

#[utoipa::path(
    post,
    tag = "Delete Tasks",
    path = "/{index_id}/delete-tasks",
    request_body = DeleteQueryRequest,
    responses(
        (status = 200, description = "Successfully added a new delete task.", body = DeleteTask)
    ),
    params(
        ("index_id" = String, Path, description = "The index ID to add the delete task to."),
    )
)]
/// Create Delete Task
///
/// This operation will not be immediately executed, instead it will be added to a queue
/// and cleaned up in the near future.
pub async fn post_delete_request(
    index_id: IndexId,
    delete_request: DeleteQueryRequest,
    metastore: MetastoreServiceClient,
) -> Result<DeleteTask, JanitorError> {
    let index_metadata_request = IndexMetadataRequest::for_index_id(index_id.to_string());
    let metadata = metastore
        .index_metadata(index_metadata_request)
        .await?
        .deserialize_index_metadata()?;
    let index_uid: IndexUid = metadata.index_uid.clone();
    let query_ast = query_ast_from_user_text(&delete_request.query, delete_request.search_fields)
        .parse_user_query(&metadata.index_config.search_settings.default_search_fields)
        .map_err(|err| JanitorError::InvalidDeleteQuery(err.to_string()))?;
    let query_ast_json = serde_json::to_string(&query_ast).map_err(|_err| {
        JanitorError::Internal("failed to serialized delete query ast".to_string())
    })?;
    let delete_query = DeleteQuery {
        index_uid: Some(index_uid),
        start_timestamp: delete_request.start_timestamp,
        end_timestamp: delete_request.end_timestamp,
        query_ast: query_ast_json,
    };
    let index_config = metadata.into_index_config();
    // TODO should it be something else than a JanitorError?
    let doc_mapper = build_doc_mapper(&index_config.doc_mapping, &index_config.search_settings)
        .map_err(|error| JanitorError::Internal(error.to_string()))?;
    let delete_search_request = SearchRequest::try_from(delete_query.clone())
        .map_err(|error| JanitorError::InvalidDeleteQuery(error.to_string()))?;

    // Validate the delete query against the current doc mapping configuration.
    let query_ast: QueryAst = serde_json::from_str(&delete_search_request.query_ast)
        .map_err(|err| JanitorError::InvalidDeleteQuery(err.to_string()))?;
    doc_mapper
        .query(doc_mapper.schema(), query_ast, true, None)
        .map_err(|error| JanitorError::InvalidDeleteQuery(error.to_string()))?;
    let delete_task = metastore.create_delete_task(delete_query).await?;
    Ok(delete_task)
}

#[cfg(test)]
mod tests {
    use quickwit_indexing::TestSandbox;
    use quickwit_proto::metastore::DeleteTask;
    use warp::Filter;

    use crate::rest::recover_fn;

    #[tokio::test]
    async fn test_delete_task_api() {
        let index_id = "test-delete-task-rest";
        let doc_mapping_yaml = r#"
            field_mappings:
              - name: title
                type: text
              - name: body
                type: text
              - name: ts
                type: i64
                fast: true
            mode: lenient
        "#;
        let test_sandbox = TestSandbox::create(index_id, doc_mapping_yaml, "", &["title"])
            .await
            .unwrap();
        let metastore = test_sandbox.metastore();
        let delete_query_api_handlers =
            super::delete_task_api_handlers(metastore).recover(recover_fn);

        // POST a delete query with explicit field name in query
        let resp = warp::test::request()
            .path("/test-delete-task-rest/delete-tasks")
            .method("POST")
            .json(&true)
            .body(r#"{"query": "body:myterm", "start_timestamp": 1, "end_timestamp": 10}"#)
            .reply(&delete_query_api_handlers)
            .await;
        assert_eq!(resp.status(), 200);
        let created_delete_task: DeleteTask = serde_json::from_slice(resp.body()).unwrap();
        assert_eq!(created_delete_task.opstamp, 1);
        let created_delete_query = created_delete_task.delete_query.unwrap();
        assert_eq!(created_delete_query.index_uid(), &test_sandbox.index_uid());
        assert_eq!(
            created_delete_query.query_ast,
            r#"{"type":"full_text","field":"body","text":"myterm","params":{"mode":{"type":"phrase_fallback_to_intersection"}},"lenient":false}"#
        );
        assert_eq!(created_delete_query.start_timestamp, Some(1));
        assert_eq!(created_delete_query.end_timestamp, Some(10));

        // POST a delete query with specified default field
        let resp = warp::test::request()
            .path("/test-delete-task-rest/delete-tasks")
            .method("POST")
            .json(&true)
            .body(r#"{"query": "myterm", "start_timestamp": 1, "end_timestamp": 10, "search_field": ["body"]}"#)
            .reply(&delete_query_api_handlers)
            .await;
        assert_eq!(resp.status(), 200);
        let created_delete_task: DeleteTask = serde_json::from_slice(resp.body()).unwrap();
        assert_eq!(created_delete_task.opstamp, 2);
        let created_delete_query = created_delete_task.delete_query.unwrap();
        assert_eq!(created_delete_query.index_uid(), &test_sandbox.index_uid());
        assert_eq!(
            created_delete_query.query_ast,
            r#"{"type":"full_text","field":"body","text":"myterm","params":{"mode":{"type":"phrase_fallback_to_intersection"}},"lenient":false}"#
        );
        assert_eq!(created_delete_query.start_timestamp, Some(1));
        assert_eq!(created_delete_query.end_timestamp, Some(10));

        // POST a delete query using the config default field
        let resp = warp::test::request()
            .path("/test-delete-task-rest/delete-tasks")
            .method("POST")
            .json(&true)
            .body(r#"{"query": "myterm", "start_timestamp": 1, "end_timestamp": 10}"#)
            .reply(&delete_query_api_handlers)
            .await;
        assert_eq!(resp.status(), 200);
        let created_delete_task: DeleteTask = serde_json::from_slice(resp.body()).unwrap();
        assert_eq!(created_delete_task.opstamp, 3);
        let created_delete_query = created_delete_task.delete_query.unwrap();
        assert_eq!(created_delete_query.index_uid(), &test_sandbox.index_uid());
        assert_eq!(
            created_delete_query.query_ast,
            r#"{"type":"full_text","field":"title","text":"myterm","params":{"mode":{"type":"phrase_fallback_to_intersection"}},"lenient":false}"#
        );
        assert_eq!(created_delete_query.start_timestamp, Some(1));
        assert_eq!(created_delete_query.end_timestamp, Some(10));

        // POST an invalid delete query.
        let resp = warp::test::request()
            .path("/test-delete-task-rest/delete-tasks")
            .method("POST")
            .json(&true)
            .body(r#"{"query": "unknown_field:test", "start_timestamp": 1, "end_timestamp": 10}"#)
            .reply(&delete_query_api_handlers)
            .await;
        assert_eq!(resp.status(), 400);
        assert!(String::from_utf8_lossy(resp.body()).contains("invalid delete query"));

        // GET delete tasks.
        let resp = warp::test::request()
            .path("/test-delete-task-rest/delete-tasks")
            .reply(&delete_query_api_handlers)
            .await;
        assert_eq!(resp.status(), 200);
        let delete_tasks: Vec<DeleteTask> = serde_json::from_slice(resp.body()).unwrap();
        assert_eq!(delete_tasks.len(), 3);

        test_sandbox.assert_quit().await;
    }
}


================================================
FILE: quickwit/quickwit-serve/src/delete_task_api/mod.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

mod handler;

pub use handler::{DeleteTaskApi, delete_task_api_handlers};


================================================
FILE: quickwit/quickwit-serve/src/developer_api/debug.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::{HashMap, HashSet};
use std::time::Duration;

use futures::StreamExt;
use futures::stream::FuturesUnordered;
use glob::{MatchOptions, Pattern as GlobPattern};
use quickwit_cluster::Cluster;
use quickwit_config::service::QuickwitService;
use quickwit_proto::developer::{DeveloperService, DeveloperServiceClient, GetDebugInfoRequest};
use quickwit_proto::tonic::codec::CompressionEncoding;
use quickwit_proto::types::{NodeId, NodeIdRef};
use serde::Deserialize;
use serde_json::Value as JsonValue;
use tokio::time::timeout;
use tracing::error;
use warp::hyper::StatusCode;
use warp::{Filter, Rejection, Reply};

use super::DeveloperApiServer;
use crate::with_arg;

#[derive(Deserialize)]
struct DebugInfoQueryParams {
    // Comma-separated list of case insensitive node ID glob patterns to restrict the debug
    // information to.
    node_ids: Option<String>,
    // Comma-separated list of roles to restrict the debug information to.
    roles: Option<String>,
}

#[utoipa::path(
    get,
    tag = "Debug",
    path = "/debug",
    responses(
        (status = 200, description = "Successfully fetched debug info."),
    ),
)]
/// Get debug information for the nodes in the cluster.
pub(super) fn debug_handler(
    cluster: Cluster,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    warp::path("debug")
        .and(warp::path::end())
        .and(with_arg(cluster))
        .and(warp::query::<DebugInfoQueryParams>())
        .then(get_node_debug_infos)
}

async fn get_node_debug_infos(
    cluster: Cluster,
    query_params: DebugInfoQueryParams,
) -> warp::reply::Response {
    let node_id_patterns = if let Some(node_ids) = &query_params.node_ids {
        match NodeIdGlobPatterns::try_from_comma_separated_patterns(node_ids) {
            Ok(node_id_patterns) => node_id_patterns,
            Err(error) => {
                return warp::reply::with_status(
                    format!(
                        "failed to parse node ID glob patterns `{}`: {error}",
                        query_params.node_ids.as_deref().unwrap_or("")
                    ),
                    StatusCode::BAD_REQUEST,
                )
                .into_response();
            }
        }
    } else {
        NodeIdGlobPatterns::default()
    };
    let target_roles: HashSet<QuickwitService> = if let Some(roles) = query_params.roles {
        let target_roles_res = roles.split(',').map(|role| role.parse()).collect();

        match target_roles_res {
            Ok(target_roles) => target_roles,
            Err(error) => {
                return warp::reply::with_status(
                    format!("failed to parse roles `{roles}`: {error}"),
                    StatusCode::BAD_REQUEST,
                )
                .into_response();
            }
        }
    } else {
        HashSet::new()
    };
    let ready_nodes = cluster.ready_nodes().await;
    let mut debug_infos: HashMap<NodeId, JsonValue> = HashMap::with_capacity(ready_nodes.len());

    let mut get_debug_info_futures = FuturesUnordered::new();

    for ready_node in ready_nodes {
        if node_id_patterns.matches(ready_node.node_id()) {
            let node_id = ready_node.node_id().to_owned();
            let client = DeveloperServiceClient::from_channel(
                ready_node.grpc_advertise_addr(),
                ready_node.channel(),
                DeveloperApiServer::MAX_GRPC_MESSAGE_SIZE,
                Some(CompressionEncoding::Zstd),
            );
            let roles = target_roles.iter().map(|role| role.to_string()).collect();
            let request = GetDebugInfoRequest { roles };
            let get_debug_info_future = async move {
                let get_debug_info_res =
                    timeout(Duration::from_secs(5), client.get_debug_info(request)).await;
                (node_id, get_debug_info_res)
            };
            get_debug_info_futures.push(get_debug_info_future);
        }
    }
    while let Some(get_debug_info_res) = get_debug_info_futures.next().await {
        match get_debug_info_res {
            (node_id, Ok(Ok(debug_info_response))) => {
                match serde_json::from_slice(&debug_info_response.debug_info_json) {
                    Ok(debug_info) => {
                        debug_infos.insert(node_id, debug_info);
                    }
                    Err(error) => {
                        error!(%node_id, %error, "failed to parse JSON debug info from node");
                    }
                };
            }
            (node_id, Ok(Err(error))) => {
                error!(%node_id, %error, "failed to get debug info from node");
            }
            (node_id, Err(_elpased)) => {
                error!(%node_id, "get debug info request timed out");
            }
        }
    }
    warp::reply::json(&debug_infos).into_response()
}

#[derive(Debug)]
struct NodeIdGlobPatterns(HashSet<GlobPattern>, MatchOptions);

impl Default for NodeIdGlobPatterns {
    fn default() -> Self {
        let glob_patterns = HashSet::new();
        let match_options = MatchOptions {
            case_sensitive: false,
            ..Default::default()
        };
        Self(glob_patterns, match_options)
    }
}

impl NodeIdGlobPatterns {
    fn try_from_comma_separated_patterns(comma_separated_patterns: &str) -> anyhow::Result<Self> {
        let glob_patterns: HashSet<GlobPattern> = comma_separated_patterns
            .split(',')
            .filter(|pattern| !pattern.is_empty())
            .map(GlobPattern::new)
            .collect::<Result<_, _>>()?;
        let match_options = MatchOptions {
            case_sensitive: false,
            ..Default::default()
        };
        Ok(Self(glob_patterns, match_options))
    }

    fn matches(&self, node_id: &NodeIdRef) -> bool {
        if self.0.is_empty() {
            return true;
        }
        self.0
            .iter()
            .any(|pattern| pattern.matches_with(node_id.as_str(), self.1))
    }
}

#[cfg(test)]
mod tests {
    use quickwit_cluster::{ChannelTransport, create_cluster_for_test};

    use super::*;

    #[tokio::test]
    async fn test_developer_api_debug_handler() {
        let peer_seeds = Vec::new();
        let transport = ChannelTransport::default();
        let self_node_readiness = true;
        let cluster = create_cluster_for_test(
            peer_seeds,
            &["control-plane"],
            &transport,
            self_node_readiness,
        )
        .await
        .unwrap();

        let debug_handler = debug_handler(cluster);

        let response = warp::test::request()
            .path("/debug?roles=foo")
            .method("GET")
            .reply(&debug_handler)
            .await;
        assert_eq!(response.status(), 400);

        let response = warp::test::request()
            .path("/debug?node_ids=[")
            .method("GET")
            .reply(&debug_handler)
            .await;
        assert_eq!(response.status(), 400);

        let response = warp::test::request()
            .path("/debug")
            .method("GET")
            .reply(&debug_handler)
            .await;
        assert_eq!(response.status(), 200);

        // TODO: Refactor handler and test against mock developer service servers.
    }

    #[test]
    fn test_node_id_glob_patterns() {
        let node_id_patterns = NodeIdGlobPatterns::try_from_comma_separated_patterns("").unwrap();
        let node_id = NodeIdRef::from_str("node-1");
        assert!(node_id_patterns.matches(node_id));

        let node_id_patterns = NodeIdGlobPatterns::try_from_comma_separated_patterns(",").unwrap();
        let node_id = NodeIdRef::from_str("node-1");
        assert!(node_id_patterns.matches(node_id));

        let node_id_patterns = NodeIdGlobPatterns::try_from_comma_separated_patterns(
            "control-plane,,indexer-[1-2],searcher*",
        )
        .unwrap();

        let node_id = NodeIdRef::from_str("control-plane");
        assert!(node_id_patterns.matches(node_id));

        let node_id = NodeIdRef::from_str("indexer-1");
        assert!(node_id_patterns.matches(node_id));

        let node_id = NodeIdRef::from_str("Indexer-2");
        assert!(node_id_patterns.matches(node_id));

        let node_id = NodeIdRef::from_str("indexer-3");
        assert!(!node_id_patterns.matches(node_id));

        let node_id = NodeIdRef::from_str("searcher-1");
        assert!(node_id_patterns.matches(node_id));

        let node_id = NodeIdRef::from_str("janitor");
        assert!(!node_id_patterns.matches(node_id));
    }
}


================================================
FILE: quickwit/quickwit-serve/src/developer_api/heap_prof.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use quickwit_common::jemalloc_profiled::{start_profiling, stop_profiling};
use serde::Deserialize;
use warp::Filter;
use warp::reply::Reply;

pub fn heap_prof_handlers()
-> impl Filter<Extract = impl warp::Reply, Error = warp::Rejection> + Clone {
    #[derive(Deserialize)]
    struct ProfilerQueryParams {
        min_alloc_size: Option<u64>,
        backtrace_every: Option<u64>,
    }

    let start_profiler = {
        warp::path!("heap-prof" / "start")
            .and(warp::query::<ProfilerQueryParams>())
            .and_then(move |params: ProfilerQueryParams| start_profiler_handler(params))
    };

    let stop_profiler = { warp::path!("heap-prof" / "stop").and_then(stop_profiler_handler) };

    async fn start_profiler_handler(
        params: ProfilerQueryParams,
    ) -> Result<warp::reply::Response, warp::Rejection> {
        start_profiling(params.min_alloc_size, params.backtrace_every);
        let response =
            warp::reply::with_status("Heap profiling started", warp::http::StatusCode::OK)
                .into_response();
        Ok(response)
    }

    async fn stop_profiler_handler() -> Result<warp::reply::Response, warp::Rejection> {
        stop_profiling();
        let response =
            warp::reply::with_status("Heap profiling stopped", warp::http::StatusCode::OK)
                .into_response();
        Ok(response)
    }

    start_profiler.or(stop_profiler)
}


================================================
FILE: quickwit/quickwit-serve/src/developer_api/heap_prof_disabled.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use warp::Filter;

fn not_implemented_handler() -> impl warp::Reply {
    warp::reply::with_status(
        "Quickwit was compiled without the `jemalloc-profiled` feature",
        warp::http::StatusCode::NOT_IMPLEMENTED,
    )
}

pub fn heap_prof_handlers()
-> impl Filter<Extract = impl warp::Reply, Error = warp::Rejection> + Clone {
    let start_profiler = { warp::path!("heap-prof" / "start").map(not_implemented_handler) };
    let stop_profiler = { warp::path!("heap-prof" / "stop").map(not_implemented_handler) };
    start_profiler.or(stop_profiler)
}


================================================
FILE: quickwit/quickwit-serve/src/developer_api/log_level.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use serde::Deserialize;
use tracing::{error, info};
use warp::hyper::StatusCode;
use warp::{Filter, Rejection};

use crate::{EnvFilterReloadFn, with_arg};

#[derive(Deserialize)]
struct EnvFilter {
    filter: String,
}

/// Dynamically Quickwit's log level
#[utoipa::path(get, tag = "Debug", path = "/log-level")]
pub fn log_level_handler(
    env_filter_reload_fn: EnvFilterReloadFn,
) -> impl warp::Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    warp::path("log-level")
        .and(warp::get().or(warp::post()).unify())
        .and(warp::path::end())
        .and(with_arg(env_filter_reload_fn))
        .and(warp::query::<EnvFilter>())
        .then(
            |env_filter_reload_fn: EnvFilterReloadFn, env_filter: EnvFilter| async move {
                match env_filter_reload_fn(&env_filter.filter) {
                    Ok(_) => {
                        info!(filter = env_filter.filter, "setting log level");
                        warp::reply::with_status(
                            format!("set log level to: [{}]", env_filter.filter),
                            StatusCode::OK,
                        )
                    }
                    Err(err) => {
                        error!(filter = env_filter.filter, %err, "failed to set log level");
                        warp::reply::with_status(
                            format!(
                                "failed to set log level to: [{}], {}",
                                env_filter.filter, err
                            ),
                            StatusCode::BAD_REQUEST,
                        )
                    }
                }
            },
        )
}


================================================
FILE: quickwit/quickwit-serve/src/developer_api/mod.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

mod debug;

#[cfg_attr(not(feature = "jemalloc-profiled"), path = "heap_prof_disabled.rs")]
mod heap_prof;
mod log_level;
#[cfg_attr(not(feature = "pprof"), path = "pprof_disabled.rs")]
mod pprof;
mod server;

use debug::debug_handler;
use heap_prof::heap_prof_handlers;
use log_level::log_level_handler;
use pprof::pprof_handlers;
use quickwit_cluster::Cluster;
pub(crate) use server::DeveloperApiServer;
use warp::{Filter, Rejection};

use crate::EnvFilterReloadFn;
use crate::rest::recover_fn;

#[derive(utoipa::OpenApi)]
#[openapi(paths(debug::debug_handler, log_level::log_level_handler))]
pub struct DeveloperApi;

pub(crate) fn developer_api_routes(
    cluster: Cluster,
    env_filter_reload_fn: EnvFilterReloadFn,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    warp::path!("api" / "developer" / ..)
        .and(
            debug_handler(cluster.clone())
                .or(log_level_handler(env_filter_reload_fn.clone()).boxed())
                .or(pprof_handlers())
                .or(heap_prof_handlers()),
        )
        .recover(recover_fn)
}


================================================
FILE: quickwit/quickwit-serve/src/developer_api/pprof.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::sync::OnceLock;

use regex::Regex;
use warp::Filter;

fn remove_trailing_numbers(thread_name: &mut String) {
    static REMOVE_TRAILING_NUMBER_PTN: OnceLock<Regex> = OnceLock::new();
    let captures_opt = REMOVE_TRAILING_NUMBER_PTN
        .get_or_init(|| Regex::new(r"^(.*?)[-\d]+$").unwrap())
        .captures(thread_name);
    if let Some(captures) = captures_opt {
        *thread_name = captures[1].to_string();
    }
}

fn frames_post_processor(frames: &mut pprof::Frames) {
    remove_trailing_numbers(&mut frames.thread_name);
}

/// pprof/start to start cpu profiling.
/// pprof/start?duration=5&sampling=1000 to start a short high frequency cpu profiling
/// pprof/flamegraph to stop the current cpu profiling and return a flamegraph or return the last
/// flamegraph
///
/// Query parameters:
/// - duration: duration of the profiling in seconds, default is 30 seconds. max value is 300
/// - sampling: the sampling rate, default is 100, max value is 1000
pub fn pprof_handlers() -> impl Filter<Extract = impl warp::Reply, Error = warp::Rejection> + Clone
{
    use std::sync::{Arc, Mutex};

    use pprof::ProfilerGuard;
    use serde::Deserialize;
    use tokio::time::{self, Duration};
    use warp::reply::Reply;

    struct ProfilerState {
        profiler_guard: Option<ProfilerGuard<'static>>,
        // We will keep the latest flamegraph and return it at the flamegraph endpoint
        // A new run will overwrite the flamegraph_data
        flamegraph_data: Option<Vec<u8>>,
    }

    let profiler_state = Arc::new(Mutex::new(ProfilerState {
        profiler_guard: None,
        flamegraph_data: None,
    }));

    #[derive(Deserialize)]
    struct ProfilerQueryParams {
        duration: Option<u64>, // max allowed value is 300 seconds, default is 30 seconds
        sampling: Option<i32>, // max value is 1000, default is 100
    }

    let start_profiler = {
        let profiler_state = Arc::clone(&profiler_state);
        warp::path!("pprof" / "start")
            .and(warp::query::<ProfilerQueryParams>())
            .and_then(move |params: ProfilerQueryParams| {
                start_profiler_handler(profiler_state.clone(), params)
            })
    };

    let stop_profiler = {
        let profiler_state = Arc::clone(&profiler_state);
        warp::path!("pprof" / "flamegraph")
            .and_then(move || get_flamegraph_handler(Arc::clone(&profiler_state)))
    };

    async fn start_profiler_handler(
        profiler_state: Arc<Mutex<ProfilerState>>,
        params: ProfilerQueryParams,
    ) -> Result<impl warp::Reply, warp::Rejection> {
        let mut state = profiler_state.lock().unwrap();

        if state.profiler_guard.is_none() {
            let duration = params.duration.unwrap_or(30).min(300);
            let sampling = params.sampling.unwrap_or(100).min(1000);
            state.profiler_guard = Some(pprof::ProfilerGuard::new(sampling).unwrap());
            let profiler_state = Arc::clone(&profiler_state);
            tokio::spawn(async move {
                time::sleep(Duration::from_secs(duration)).await;
                save_flamegraph(profiler_state).await;
            });
            Ok(warp::reply::with_status(
                "CPU profiling started",
                warp::http::StatusCode::OK,
            ))
        } else {
            Ok(warp::reply::with_status(
                "CPU profiling is already running",
                warp::http::StatusCode::BAD_REQUEST,
            ))
        }
    }

    async fn get_flamegraph_handler(
        profiler_state: Arc<Mutex<ProfilerState>>,
    ) -> Result<impl warp::Reply, warp::Rejection> {
        let state = profiler_state.lock().unwrap();

        if let Some(data) = state.flamegraph_data.clone() {
            Ok(warp::reply::with_header(data, "Content-Type", "image/svg+xml").into_response())
        } else {
            Ok(warp::reply::with_status(
                "flamegraph is not available",
                warp::http::StatusCode::BAD_REQUEST,
            )
            .into_response())
        }
    }

    async fn save_flamegraph(profiler_state: Arc<Mutex<ProfilerState>>) {
        let handle = quickwit_common::thread_pool::run_cpu_intensive(move || {
            let mut state = profiler_state.lock().unwrap();
            if let Some(profiler) = state.profiler_guard.take()
                && let Ok(report) = profiler
                    .report()
                    .frames_post_processor(frames_post_processor)
                    .build()
            {
                let mut buffer = Vec::new();
                if report.flamegraph(&mut buffer).is_ok() {
                    state.flamegraph_data = Some(buffer);
                }
            }
        });
        let _ = handle.await;
    }

    start_profiler.or(stop_profiler)
}

#[cfg(test)]
mod tests {
    use super::remove_trailing_numbers;

    #[track_caller]
    fn test_remove_trailing_numbers_aux(thread_name: &str, expected: &str) {
        let mut thread_name = thread_name.to_string();
        remove_trailing_numbers(&mut thread_name);
        assert_eq!(&thread_name, expected);
    }

    #[test]
    fn test_remove_trailing_numbers() {
        test_remove_trailing_numbers_aux("thread-12", "thread");
        test_remove_trailing_numbers_aux("thread12", "thread");
        test_remove_trailing_numbers_aux("thread-", "thread");
        test_remove_trailing_numbers_aux("thread-1-2", "thread");
        test_remove_trailing_numbers_aux("thread-1-2", "thread");
        test_remove_trailing_numbers_aux("12-aa", "12-aa");
    }
}


================================================
FILE: quickwit/quickwit-serve/src/developer_api/pprof_disabled.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use warp::Filter;

fn not_implemented_handler() -> impl warp::Reply {
    warp::reply::with_status(
        "Quickwit was compiled without the `pprof` feature",
        warp::http::StatusCode::NOT_IMPLEMENTED,
    )
}

/// pprof/start disabled
/// pprof/flamegraph disabled
pub fn pprof_handlers() -> impl Filter<Extract = impl warp::Reply, Error = warp::Rejection> + Clone
{
    let start_profiler = { warp::path!("pprof" / "start").map(not_implemented_handler) };
    let stop_profiler = { warp::path!("pprof" / "flamegraph").map(not_implemented_handler) };
    start_profiler.or(stop_profiler)
}


================================================
FILE: quickwit/quickwit-serve/src/developer_api/server.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::HashSet;
use std::fmt;
use std::sync::Arc;

use async_trait::async_trait;
use bytes::Bytes;
use bytesize::ByteSize;
use quickwit_actors::Mailbox;
use quickwit_cluster::Cluster;
use quickwit_config::NodeConfig;
use quickwit_config::service::QuickwitService;
use quickwit_control_plane::control_plane::{ControlPlane, GetDebugInfo};
use quickwit_ingest::{IngestRouter, Ingester};
use quickwit_proto::developer::{
    DeveloperError, DeveloperResult, DeveloperService, GetDebugInfoRequest, GetDebugInfoResponse,
};
use serde_json::json;

use crate::{BuildInfo, QuickwitServices, RuntimeInfo};

#[derive(Clone)]
pub(crate) struct DeveloperApiServer {
    node_config: Arc<NodeConfig>,
    cluster: Cluster,
    control_plane_mailbox_opt: Option<Mailbox<ControlPlane>>,
    ingest_router_opt: Option<IngestRouter>,
    ingester_opt: Option<Ingester>,
}

impl fmt::Debug for DeveloperApiServer {
    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
        f.debug_struct("DeveloperApiServer").finish()
    }
}

impl DeveloperApiServer {
    pub const MAX_GRPC_MESSAGE_SIZE: ByteSize = ByteSize::mib(100);

    pub fn from_services(services: &QuickwitServices) -> Self {
        Self {
            node_config: services.node_config.clone(),
            cluster: services.cluster.clone(),
            control_plane_mailbox_opt: services.control_plane_server_opt.clone(),
            ingest_router_opt: services.ingest_router_opt.clone(),
            ingester_opt: services.ingester_opt.clone(),
        }
    }
}

#[async_trait]
impl DeveloperService for DeveloperApiServer {
    async fn get_debug_info(
        &self,
        request: GetDebugInfoRequest,
    ) -> DeveloperResult<GetDebugInfoResponse> {
        let roles: HashSet<QuickwitService> = request
            .roles
            .into_iter()
            .map(|role| role.parse())
            .collect::<anyhow::Result<_>>()
            .map_err(|error| DeveloperError::InvalidArgument(error.to_string()))?;

        let cluster_snapshot = self.cluster.snapshot().await;

        // We must redact sensitive information such as credentials.
        let mut node_config = (*self.node_config).clone();
        node_config.redact();

        let mut debug_info = json!({
            "build_info": BuildInfo::get(),
            "runtime_info": RuntimeInfo::get(),
            "node_config": node_config,
            "cluster_membership_info": json!({
                "ready_nodes": cluster_snapshot.ready_nodes,
                "live_nodes": cluster_snapshot.live_nodes,
                "dead_nodes": cluster_snapshot.dead_nodes,
                "chitchat_state": cluster_snapshot.chitchat_state_snapshot.node_states,
            })
        });
        if let Some(control_plane_mailbox) = &self.control_plane_mailbox_opt
            && (roles.is_empty() || roles.contains(&QuickwitService::ControlPlane))
        {
            debug_info["control_plane"] = match control_plane_mailbox.ask(GetDebugInfo).await {
                Ok(debug_info) => debug_info,
                Err(error) => {
                    json!({"error": error.to_string()})
                }
            };
        }
        if let Some(ingest_router) = &self.ingest_router_opt {
            debug_info["ingest_router"] = ingest_router.debug_info().await;
        }
        if let Some(ingester) = &self.ingester_opt
            && (roles.is_empty() || roles.contains(&QuickwitService::Indexer))
        {
            debug_info["ingester"] = ingester.debug_info().await;
        };
        let debug_info_json = serde_json::to_vec(&debug_info).map_err(|error| {
            let message = format!("failed to JSON serialize debug info: {error}");
            DeveloperError::Internal(message)
        })?;
        let response = GetDebugInfoResponse {
            debug_info_json: Bytes::from(debug_info_json),
        };
        Ok(response)
    }
}

#[cfg(test)]
mod tests {
    use quickwit_cluster::{ChannelTransport, create_cluster_for_test};
    use serde_json::Value as JsonValue;

    use super::*;

    #[tokio::test]
    async fn test_developer_api_server_get_debug_info() {
        let peer_seeds = Vec::new();
        let transport = ChannelTransport::default();
        let self_node_readiness = true;
        let cluster = create_cluster_for_test(
            peer_seeds,
            &["metastore", "control-plane", "indexer"],
            &transport,
            self_node_readiness,
        )
        .await
        .unwrap();

        let mut node_config = NodeConfig::for_test();
        node_config.metastore_uri =
            quickwit_common::uri::Uri::for_test("postgresql://username:password@db");
        let node_config = Arc::new(node_config);

        let developer_api_server = DeveloperApiServer {
            node_config,
            cluster,
            control_plane_mailbox_opt: None,
            ingest_router_opt: None,
            ingester_opt: None,
        };
        let request = GetDebugInfoRequest { roles: Vec::new() };
        let response = developer_api_server.get_debug_info(request).await.unwrap();
        let debug_info: JsonValue = serde_json::from_slice(&response.debug_info_json).unwrap();

        assert!(debug_info["build_info"].is_object());
        assert!(debug_info["runtime_info"].is_object());
        assert!(debug_info["node_config"].is_object());
        assert!(debug_info["cluster_membership_info"].is_object());

        assert_eq!(
            debug_info["node_config"]["metastore_uri"],
            "postgresql://username:***redacted***@db"
        );

        // TODO: Test control plane and ingester debug info.
    }
}


================================================
FILE: quickwit/quickwit-serve/src/elasticsearch_api/bulk.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::HashMap;
use std::time::Instant;

use bytesize::ByteSize;
use quickwit_ingest::{
    CommitType, DocBatchBuilder, IngestRequest, IngestService, IngestServiceClient,
};
use quickwit_proto::ingest::router::IngestRouterServiceClient;
use quickwit_proto::types::IndexId;
use warp::http::StatusCode;
use warp::{Filter, Rejection};

use super::bulk_v2::{ElasticBulkResponse, elastic_bulk_ingest_v2};
use crate::elasticsearch_api::filter::{elastic_bulk_filter, elastic_index_bulk_filter};
use crate::elasticsearch_api::make_elastic_api_response;
use crate::elasticsearch_api::model::{BulkAction, ElasticBulkOptions, ElasticsearchError};
use crate::format::extract_format_from_qs;
use crate::ingest_api::lines;
use crate::rest::recover_fn;
use crate::{Body, with_arg};

/// POST `_elastic/_bulk`
pub fn es_compat_bulk_handler(
    ingest_service: IngestServiceClient,
    ingest_router: IngestRouterServiceClient,
    content_length_limit: ByteSize,
    enable_ingest_v1: bool,
    enable_ingest_v2: bool,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    elastic_bulk_filter(content_length_limit)
        .and(with_arg(ingest_service))
        .and(with_arg(ingest_router))
        .then(move |body, bulk_options, ingest_service, ingest_router| {
            elastic_ingest_bulk(
                None,
                body,
                bulk_options,
                ingest_service,
                ingest_router,
                enable_ingest_v1,
                enable_ingest_v2,
            )
        })
        .and(extract_format_from_qs())
        .map(make_elastic_api_response)
        .recover(recover_fn)
}

/// POST `_elastic/<index>/_bulk`
pub fn es_compat_index_bulk_handler(
    ingest_service: IngestServiceClient,
    ingest_router: IngestRouterServiceClient,
    content_length_limit: ByteSize,
    enable_ingest_v1: bool,
    enable_ingest_v2: bool,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    elastic_index_bulk_filter(content_length_limit)
        .and(with_arg(ingest_service))
        .and(with_arg(ingest_router))
        .then(
            move |index_id, body, bulk_options, ingest_service, ingest_router| {
                elastic_ingest_bulk(
                    Some(index_id),
                    body,
                    bulk_options,
                    ingest_service,
                    ingest_router,
                    enable_ingest_v1,
                    enable_ingest_v2,
                )
            },
        )
        .and(extract_format_from_qs())
        .map(make_elastic_api_response)
        .recover(recover_fn)
        .boxed()
}

async fn elastic_ingest_bulk(
    default_index_id: Option<IndexId>,
    body: Body,
    bulk_options: ElasticBulkOptions,
    ingest_service: IngestServiceClient,
    ingest_router: IngestRouterServiceClient,
    enable_ingest_v1: bool,
    enable_ingest_v2: bool,
) -> Result<ElasticBulkResponse, ElasticsearchError> {
    if enable_ingest_v2 && !bulk_options.use_legacy_ingest {
        return elastic_bulk_ingest_v2(default_index_id, body, bulk_options, ingest_router).await;
    }
    if !enable_ingest_v1 {
        return Err(ElasticsearchError::new(
            StatusCode::INTERNAL_SERVER_ERROR,
            "ingest v1 is disabled: environment variable `QW_DISABLE_INGEST_V1` is set".to_string(),
            None,
        ));
    }
    let now = Instant::now();
    let mut doc_batch_builders = HashMap::new();
    let mut lines = lines(&body.content).enumerate();

    while let Some((line_number, line)) = lines.next() {
        let action = serde_json::from_slice::<BulkAction>(line).map_err(|error| {
            ElasticsearchError::new(
                StatusCode::BAD_REQUEST,
                format!("Malformed action/metadata line [#{line_number}]. Details: `{error}`"),
                None,
            )
        })?;
        let (_, source) = lines.next().ok_or_else(|| {
            ElasticsearchError::new(
                StatusCode::BAD_REQUEST,
                "expected source for the action".to_string(),
                None,
            )
        })?;
        // when ingesting on /my-index/_bulk, if _index: is set to something else than my-index,
        // ES honors it and create the doc in the requested index. That is, `my-index` is a default
        // value in case _index: is missing, but not a constraint on each sub-action.
        let index_id = action
            .into_index_id()
            .or_else(|| default_index_id.clone())
            .ok_or_else(|| {
                ElasticsearchError::new(
                    StatusCode::BAD_REQUEST,
                    format!("missing required field: `_index` in the line [#{line_number}]."),
                    None,
                )
            })?;
        let doc_batch_builder = doc_batch_builders
            .entry(index_id.clone())
            .or_insert(DocBatchBuilder::new(index_id));

        doc_batch_builder.ingest_doc(source);
    }
    let doc_batches = doc_batch_builders
        .into_values()
        .map(|builder| builder.build())
        .collect();
    let commit_type: CommitType = bulk_options.refresh.into();
    let ingest_request = IngestRequest {
        doc_batches,
        commit: commit_type.into(),
    };
    ingest_service.ingest(ingest_request).await?;

    let took_millis = now.elapsed().as_millis() as u64;
    let errors = false;
    let bulk_response = ElasticBulkResponse {
        took_millis,
        errors,
        actions: Vec::new(),
    };
    Ok(bulk_response)
}

#[cfg(test)]
mod tests {
    use std::sync::Arc;
    use std::time::Duration;

    use quickwit_config::{IngestApiConfig, NodeConfig};
    use quickwit_index_management::IndexService;
    use quickwit_ingest::{FetchRequest, IngestServiceClient, SuggestTruncateRequest};
    use quickwit_metastore::metastore_for_test;
    use quickwit_proto::ingest::router::IngestRouterServiceClient;
    use quickwit_proto::metastore::MetastoreServiceClient;
    use quickwit_search::MockSearchService;
    use quickwit_storage::StorageResolver;
    use warp::hyper::StatusCode;

    use crate::elasticsearch_api::bulk_v2::ElasticBulkResponse;
    use crate::elasticsearch_api::elastic_api_handlers;
    use crate::elasticsearch_api::model::ElasticsearchError;
    use crate::elasticsearch_api::tests::mock_cluster;
    use crate::ingest_api::setup_ingest_v1_service;

    #[tokio::test]
    async fn test_bulk_api_returns_404_if_index_id_does_not_exist() {
        let config = Arc::new(NodeConfig::for_test());
        let search_service = Arc::new(MockSearchService::new());
        let (universe, _temp_dir, ingest_service, _) =
            setup_ingest_v1_service(&["my-index"], &IngestApiConfig::default()).await;
        let ingest_router = IngestRouterServiceClient::mocked();
        let index_service =
            IndexService::new(metastore_for_test(), StorageResolver::unconfigured());
        let elastic_api_handlers = elastic_api_handlers(
            mock_cluster().await,
            config,
            search_service,
            ingest_service,
            ingest_router,
            MetastoreServiceClient::mocked(),
            index_service,
            true,
            false,
        );
        let payload = r#"
            { "create" : { "_index" : "my-index", "_id" : "1"} }
            {"id": 1, "message": "push"}
            { "create" : { "_index" : "index-2", "_id" : "1" } }
            {"id": 1, "message": "push"}"#;
        let resp = warp::test::request()
            .path("/_elastic/_bulk")
            .method("POST")
            .body(payload)
            .reply(&elastic_api_handlers)
            .await;
        assert_eq!(resp.status(), 404);
        universe.assert_quit().await;
    }

    #[tokio::test]
    async fn test_bulk_api_returns_200() {
        let config = Arc::new(NodeConfig::for_test());
        let search_service = Arc::new(MockSearchService::new());
        let (universe, _temp_dir, ingest_service, _) =
            setup_ingest_v1_service(&["my-index-1", "my-index-2"], &IngestApiConfig::default())
                .await;
        let ingest_router = IngestRouterServiceClient::mocked();
        let index_service =
            IndexService::new(metastore_for_test(), StorageResolver::unconfigured());
        let elastic_api_handlers = elastic_api_handlers(
            mock_cluster().await,
            config,
            search_service,
            ingest_service,
            ingest_router,
            MetastoreServiceClient::mocked(),
            index_service,
            true,
            false,
        );
        let payload = r#"
            { "create" : { "_index" : "my-index-1", "_id" : "1"} }
            {"id": 1, "message": "push"}
            { "create" : { "_index" : "my-index-2", "_id" : "1"} }
            {"id": 1, "message": "push"}
            { "create" : { "_index" : "my-index-1" } }
            {"id": 2, "message": "push"}"#;
        let resp = warp::test::request()
            .path("/_elastic/_bulk")
            .method("POST")
            .body(payload)
            .reply(&elastic_api_handlers)
            .await;
        assert_eq!(resp.status(), 200);
        let bulk_response: ElasticBulkResponse = serde_json::from_slice(resp.body()).unwrap();
        assert!(!bulk_response.errors);
        universe.assert_quit().await;
    }

    #[tokio::test]
    async fn test_bulk_api_returns_200_if_payload_has_blank_lines() {
        let config = Arc::new(NodeConfig::for_test());
        let search_service = Arc::new(MockSearchService::new());
        let (universe, _temp_dir, ingest_service, _) =
            setup_ingest_v1_service(&["my-index-1"], &IngestApiConfig::default()).await;
        let ingest_router = IngestRouterServiceClient::mocked();
        let index_service =
            IndexService::new(metastore_for_test(), StorageResolver::unconfigured());
        let elastic_api_handlers = elastic_api_handlers(
            mock_cluster().await,
            config,
            search_service,
            ingest_service,
            ingest_router,
            MetastoreServiceClient::mocked(),
            index_service,
            true,
            false,
        );
        let payload = "
            {\"create\": {\"_index\": \"my-index-1\", \"_id\": \"1674834324802805760\"}}
            \u{20}\u{20}\u{20}\u{20}\n
            {\"_line\": {\"message\": \"hello-world\"}}";
        let resp = warp::test::request()
            .path("/_elastic/_bulk")
            .method("POST")
            .body(payload)
            .reply(&elastic_api_handlers)
            .await;
        assert_eq!(resp.status(), 200);
        let bulk_response: ElasticBulkResponse = serde_json::from_slice(resp.body()).unwrap();
        assert!(!bulk_response.errors);
        universe.assert_quit().await;
    }

    #[tokio::test]
    async fn test_bulk_index_api_returns_200() {
        let config = Arc::new(NodeConfig::for_test());
        let search_service = Arc::new(MockSearchService::new());
        let (universe, _temp_dir, ingest_service, _) =
            setup_ingest_v1_service(&["my-index-1", "my-index-2"], &IngestApiConfig::default())
                .await;
        let ingest_router = IngestRouterServiceClient::mocked();
        let index_service =
            IndexService::new(metastore_for_test(), StorageResolver::unconfigured());
        let elastic_api_handlers = elastic_api_handlers(
            mock_cluster().await,
            config,
            search_service,
            ingest_service,
            ingest_router,
            MetastoreServiceClient::mocked(),
            index_service,
            true,
            false,
        );
        let payload = r#"
            { "create" : { "_index" : "my-index-1", "_id" : "1"} }
            {"id": 1, "message": "push"}
            { "create" : { "_index" : "my-index-2", "_id" : "1"} }
            {"id": 1, "message": "push"}
            { "create" : {} }
            {"id": 2, "message": "push"}"#;
        let resp = warp::test::request()
            .path("/_elastic/my-index-1/_bulk")
            .method("POST")
            .body(payload)
            .reply(&elastic_api_handlers)
            .await;
        assert_eq!(resp.status(), 200);
        let bulk_response: ElasticBulkResponse = serde_json::from_slice(resp.body()).unwrap();
        assert!(!bulk_response.errors);
        universe.assert_quit().await;
    }

    #[tokio::test]
    async fn test_bulk_api_blocks_when_refresh_wait_for_is_specified() {
        let config = Arc::new(NodeConfig::for_test());
        let search_service = Arc::new(MockSearchService::new());
        let (universe, _temp_dir, ingest_service, ingest_service_mailbox) =
            setup_ingest_v1_service(&["my-index-1", "my-index-2"], &IngestApiConfig::default())
                .await;
        let ingest_router = IngestRouterServiceClient::mocked();
        let index_service =
            IndexService::new(metastore_for_test(), StorageResolver::unconfigured());
        let elastic_api_handlers = elastic_api_handlers(
            mock_cluster().await,
            config,
            search_service,
            ingest_service,
            ingest_router,
            MetastoreServiceClient::mocked(),
            index_service,
            true,
            false,
        );
        let payload = r#"
            { "create" : { "_index" : "my-index-1", "_id" : "1"} }
            {"id": 1, "message": "push"}
            { "create" : { "_index" : "my-index-2", "_id" : "1"} }
            {"id": 1, "message": "push"}
            { "create" : { "_index" : "my-index-1" } }
            {"id": 2, "message": "push"}"#;
        let handle = tokio::spawn(async move {
            let resp = warp::test::request()
                .path("/_elastic/_bulk?refresh=wait_for")
                .method("POST")
                .body(payload)
                .reply(&elastic_api_handlers)
                .await;

            assert_eq!(resp.status(), 200);
            let bulk_response: ElasticBulkResponse = serde_json::from_slice(resp.body()).unwrap();
            assert!(!bulk_response.errors);
        });
        universe.sleep(Duration::from_secs(10)).await;
        assert!(!handle.is_finished());
        assert_eq!(
            ingest_service_mailbox
                .ask_for_res(FetchRequest {
                    index_id: "my-index-1".to_string(),
                    start_after: None,
                    num_bytes_limit: None,
                })
                .await
                .unwrap()
                .doc_batch
                .unwrap()
                .num_docs(),
            2
        );
        assert!(!handle.is_finished());
        assert_eq!(
            ingest_service_mailbox
                .ask_for_res(FetchRequest {
                    index_id: "my-index-2".to_string(),
                    start_after: None,
                    num_bytes_limit: None,
                })
                .await
                .unwrap()
                .doc_batch
                .unwrap()
                .num_docs(),
            1
        );
        ingest_service_mailbox
            .ask_for_res(SuggestTruncateRequest {
                index_id: "my-index-1".to_string(),
                up_to_position_included: 1,
            })
            .await
            .unwrap();
        universe.sleep(Duration::from_secs(10)).await;
        assert!(!handle.is_finished());
        ingest_service_mailbox
            .ask_for_res(SuggestTruncateRequest {
                index_id: "my-index-2".to_string(),
                up_to_position_included: 0,
            })
            .await
            .unwrap();
        handle.await.unwrap();
        universe.assert_quit().await;
    }

    #[tokio::test]
    async fn test_bulk_api_blocks_when_refresh_true_is_specified() {
        let config = Arc::new(NodeConfig::for_test());
        let search_service = Arc::new(MockSearchService::new());
        let (universe, _temp_dir, ingest_service, ingest_service_mailbox) =
            setup_ingest_v1_service(&["my-index-1", "my-index-2"], &IngestApiConfig::default())
                .await;
        let ingest_router = IngestRouterServiceClient::mocked();
        let index_service =
            IndexService::new(metastore_for_test(), StorageResolver::unconfigured());
        let elastic_api_handlers = elastic_api_handlers(
            mock_cluster().await,
            config,
            search_service,
            ingest_service,
            ingest_router,
            MetastoreServiceClient::mocked(),
            index_service,
            true,
            false,
        );
        let payload = r#"
            { "create" : { "_index" : "my-index-1", "_id" : "1"} }
            {"id": 1, "message": "push"}
            { "create" : { "_index" : "my-index-2", "_id" : "1"} }
            {"id": 1, "message": "push"}
            { "create" : { "_index" : "my-index-1" } }
            {"id": 2, "message": "push"}"#;
        let handle = tokio::spawn(async move {
            let resp = warp::test::request()
                .path("/_elastic/_bulk?refresh")
                .method("POST")
                .body(payload)
                .reply(&elastic_api_handlers)
                .await;

            assert_eq!(resp.status(), 200);
            let bulk_response: ElasticBulkResponse = serde_json::from_slice(resp.body()).unwrap();
            assert!(!bulk_response.errors);
        });
        universe.sleep(Duration::from_secs(10)).await;
        assert!(!handle.is_finished());
        assert_eq!(
            ingest_service_mailbox
                .ask_for_res(FetchRequest {
                    index_id: "my-index-1".to_string(),
                    start_after: None,
                    num_bytes_limit: None,
                })
                .await
                .unwrap()
                .doc_batch
                .unwrap()
                .num_docs(),
            3
        );
        assert_eq!(
            ingest_service_mailbox
                .ask_for_res(FetchRequest {
                    index_id: "my-index-2".to_string(),
                    start_after: None,
                    num_bytes_limit: None,
                })
                .await
                .unwrap()
                .doc_batch
                .unwrap()
                .num_docs(),
            2
        );
        ingest_service_mailbox
            .ask_for_res(SuggestTruncateRequest {
                index_id: "my-index-1".to_string(),
                up_to_position_included: 1,
            })
            .await
            .unwrap();
        universe.sleep(Duration::from_secs(10)).await;
        assert!(!handle.is_finished());
        ingest_service_mailbox
            .ask_for_res(SuggestTruncateRequest {
                index_id: "my-index-2".to_string(),
                up_to_position_included: 0,
            })
            .await
            .unwrap();
        handle.await.unwrap();
        universe.assert_quit().await;
    }

    #[tokio::test]
    async fn test_bulk_ingest_request_returns_400_if_action_is_malformed() {
        let config = Arc::new(NodeConfig::for_test());
        let search_service = Arc::new(MockSearchService::new());
        let ingest_service = IngestServiceClient::mocked();
        let ingest_router = IngestRouterServiceClient::mocked();
        let index_service =
            IndexService::new(metastore_for_test(), StorageResolver::unconfigured());
        let elastic_api_handlers = elastic_api_handlers(
            mock_cluster().await,
            config,
            search_service,
            ingest_service,
            ingest_router,
            MetastoreServiceClient::mocked(),
            index_service,
            true,
            false,
        );
        let payload = r#"
            {"create": {"_index": "my-index", "_id": "1"},}
            {"id": 1, "message": "my-doc"}"#;
        let resp = warp::test::request()
            .path("/_elastic/_bulk")
            .method("POST")
            .body(payload)
            .reply(&elastic_api_handlers)
            .await;
        assert_eq!(resp.status(), 400);
        let es_error: ElasticsearchError = serde_json::from_slice(resp.body()).unwrap();
        assert_eq!(es_error.status, StatusCode::BAD_REQUEST);
        assert_eq!(
            es_error.error.reason.unwrap(),
            "Malformed action/metadata line [#0]. Details: `expected value at line 1 column 57`"
        );
    }
}


================================================
FILE: quickwit/quickwit-serve/src/elasticsearch_api/bulk_v2.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::HashMap;
use std::time::Instant;

use quickwit_common::rate_limited_error;
use quickwit_config::{INGEST_V2_SOURCE_ID, validate_identifier};
use quickwit_ingest::IngestRequestV2Builder;
use quickwit_proto::ingest::CommitTypeV2;
use quickwit_proto::ingest::router::{
    IngestFailureReason, IngestResponseV2, IngestRouterService, IngestRouterServiceClient,
};
use quickwit_proto::types::{DocUid, IndexId};
use serde::{Deserialize, Serialize};
use warp::hyper::StatusCode;

use super::model::ElasticException;
use crate::Body;
use crate::elasticsearch_api::model::{BulkAction, ElasticBulkOptions, ElasticsearchError};
use crate::ingest_api::lines;

#[derive(Debug, Default, Serialize, Deserialize)]
pub(crate) struct ElasticBulkResponse {
    #[serde(rename = "took")]
    pub took_millis: u64,
    pub errors: bool,
    #[serde(rename = "items")]
    pub actions: Vec<ElasticBulkAction>,
}

#[derive(Debug, Clone, Serialize, Deserialize)]
pub(crate) enum ElasticBulkAction {
    #[serde(rename = "create")]
    Create(ElasticBulkItem),
    #[serde(rename = "index")]
    Index(ElasticBulkItem),
}

#[derive(Debug, Clone, Serialize, Deserialize)]
pub(crate) struct ElasticBulkItem {
    #[serde(rename = "_index")]
    pub index_id: IndexId,
    #[serde(rename = "_id")]
    pub es_doc_id: Option<String>,
    #[serde(with = "http_serde::status_code")]
    pub status: StatusCode,
    pub error: Option<ElasticBulkError>,
}

#[derive(Debug, Clone, Serialize, Deserialize)]
pub(crate) struct ElasticBulkError {
    #[serde(rename = "index")]
    pub index_id: Option<IndexId>,
    #[serde(rename = "type")]
    pub exception: ElasticException,
    pub reason: String,
}

type ElasticDocId = String;

#[derive(Debug)]
struct DocHandle {
    doc_position: usize,
    doc_uid: DocUid,
    es_doc_id: Option<ElasticDocId>,
    // Whether the document failed to parse. When the struct is instantiated, this value is set to
    // `false` and then mutated if the ingest response contains a parse failure for this document.
    is_parse_failure: bool,
}

pub(crate) async fn elastic_bulk_ingest_v2(
    default_index_id: Option<IndexId>,
    body: Body,
    bulk_options: ElasticBulkOptions,
    ingest_router: IngestRouterServiceClient,
) -> Result<ElasticBulkResponse, ElasticsearchError> {
    let now = Instant::now();
    let mut ingest_request_builder = IngestRequestV2Builder::default();
    let mut lines = lines(&body.content).enumerate();
    let mut per_subrequest_doc_handles: HashMap<u32, Vec<DocHandle>> = HashMap::new();
    let mut action_count = 0;
    let mut invalid_index_id_items = Vec::new();
    while let Some((line_no, line)) = lines.next() {
        let action = serde_json::from_slice::<BulkAction>(line).map_err(|error| {
            ElasticsearchError::new(
                StatusCode::BAD_REQUEST,
                format!("Malformed action/metadata line [{}]: {error}", line_no + 1),
                Some(ElasticException::IllegalArgument),
            )
        })?;
        let (_, doc) = lines.next().ok_or_else(|| {
            ElasticsearchError::new(
                StatusCode::BAD_REQUEST,
                "Validation Failed: 1: no requests added;".to_string(),
                Some(ElasticException::ActionRequestValidation),
            )
        })?;
        let meta = action.into_meta();
        // When ingesting into `/my-index/_bulk`, if `_index` is set to something other than
        // `my-index`, ES honors it and creates the doc for the requested index. That is,
        // `my-index` is a default value in case `_index`` is missing, but not a constraint on
        // each sub-action.
        let index_id = meta
            .index_id
            .or_else(|| default_index_id.clone())
            .ok_or_else(|| {
                ElasticsearchError::new(
                    StatusCode::BAD_REQUEST,
                    "Validation Failed: 1: index is missing;".to_string(),
                    Some(ElasticException::ActionRequestValidation),
                )
            })?;

        // Validate index ID early because propagating back the right error (400)
        // from deeper ingest layers is harder
        if validate_identifier("", &index_id).is_err() {
            let invalid_item = make_invalid_index_id_item(index_id.clone(), meta.es_doc_id);
            invalid_index_id_items.push((action_count, invalid_item));
            action_count += 1;
            continue;
        }

        let (subrequest_id, doc_uid) = ingest_request_builder.add_doc(index_id, doc);

        let doc_handle = DocHandle {
            doc_position: action_count,
            doc_uid,
            es_doc_id: meta.es_doc_id,
            is_parse_failure: false,
        };
        action_count += 1;
        per_subrequest_doc_handles
            .entry(subrequest_id)
            .or_default()
            .push(doc_handle);
    }
    let commit_type: CommitTypeV2 = bulk_options.refresh.into();

    let ingest_request_opt = ingest_request_builder.build(INGEST_V2_SOURCE_ID, commit_type);

    let Some(ingest_request) = ingest_request_opt else {
        return Ok(ElasticBulkResponse::default());
    };
    let ingest_response = ingest_router.ingest(ingest_request).await.map_err(|err| {
        rate_limited_error!(limit_per_min=6, err=?err, "router error");
        err
    })?;
    make_elastic_bulk_response_v2(
        ingest_response,
        per_subrequest_doc_handles,
        now,
        action_count,
        invalid_index_id_items,
    )
}

#[allow(clippy::result_large_err)]
fn make_elastic_bulk_response_v2(
    ingest_response_v2: IngestResponseV2,
    mut per_subrequest_doc_handles: HashMap<u32, Vec<DocHandle>>,
    now: Instant,
    action_count: usize,
    invalid_index_id_items: Vec<(usize, ElasticBulkItem)>,
) -> Result<ElasticBulkResponse, ElasticsearchError> {
    let mut positioned_actions: Vec<(usize, ElasticBulkAction)> = Vec::with_capacity(action_count);
    let mut errors = false;

    // Populate the items for each `IngestSuccess` subresponse. They may be partially successful and
    // contain some parse failures.
    for success in ingest_response_v2.successes {
        let index_id = success
            .index_uid
            .map(|index_uid| index_uid.index_id)
            .expect("`index_uid` should be a required field");

        // Find the doc handles for the subresponse.
        let mut doc_handles = remove_doc_handles(
            &mut per_subrequest_doc_handles,
            success.subrequest_id,
        )
        .inspect_err(|_| {
            rate_limited_error!(limit_per_min=6, index_id=%index_id, "could not find subrequest id");
        })?;
        doc_handles.sort_unstable_by(|left, right| left.doc_uid.cmp(&right.doc_uid));

        // Populate the response items with one error per parse failure.
        for parse_failure in success.parse_failures {
            errors = true;

            let failed_doc_uid = parse_failure.doc_uid();
            let doc_handle_idx = doc_handles
                .binary_search_by_key(&failed_doc_uid, |doc_handle| doc_handle.doc_uid)
                .map_err(|_| {
                    rate_limited_error!(limit_per_min=6, doc_uid=%failed_doc_uid, "could not find doc_uid from parse failure");
                    ElasticsearchError::new(
                        StatusCode::INTERNAL_SERVER_ERROR,
                        format!(
                            "could not find doc `{}` in bulk request",
                            parse_failure.doc_uid()
                        ),
                        None,
                    )
                })?;
            let doc_handle = &mut doc_handles[doc_handle_idx];
            doc_handle.is_parse_failure = true;

            let error = ElasticBulkError {
                index_id: Some(index_id.clone()),
                exception: ElasticException::DocumentParsing,
                reason: parse_failure.message,
            };
            let item = ElasticBulkItem {
                index_id: index_id.clone(),
                es_doc_id: doc_handle.es_doc_id.take(),
                status: StatusCode::BAD_REQUEST,
                error: Some(error),
            };
            let action = ElasticBulkAction::Index(item);
            positioned_actions.push((doc_handle.doc_position, action));
        }
        // Populate the remaining successful items.
        for mut doc_handle in doc_handles {
            if doc_handle.is_parse_failure {
                continue;
            }
            let item = ElasticBulkItem {
                index_id: index_id.clone(),
                es_doc_id: doc_handle.es_doc_id.take(),
                status: StatusCode::CREATED,
                error: None,
            };
            let action = ElasticBulkAction::Index(item);
            positioned_actions.push((doc_handle.doc_position, action));
        }
    }
    // Repeat the operation for each `IngestFailure` subresponse.
    for failure in ingest_response_v2.failures {
        errors = true;

        // Find the doc handles for the subrequest.
        let doc_handles =
            remove_doc_handles(&mut per_subrequest_doc_handles, failure.subrequest_id)
                .inspect_err(|_| {
                    rate_limited_error!(
                        limit_per_min = 6,
                        subrequest = failure.subrequest_id,
                        "failed to find error subrequest"
                    );
                })?;

        // Populate the response items with one error per doc handle.
        let (exception, reason, status) = match failure.reason() {
            IngestFailureReason::IndexNotFound => (
                ElasticException::IndexNotFound,
                format!("no such index [{}]", failure.index_id),
                StatusCode::NOT_FOUND,
            ),
            IngestFailureReason::SourceNotFound => (
                ElasticException::SourceNotFound,
                format!("no such source [{}]", failure.index_id),
                StatusCode::NOT_FOUND,
            ),
            IngestFailureReason::Timeout => (
                ElasticException::Timeout,
                format!("timeout [{}]", failure.index_id),
                StatusCode::REQUEST_TIMEOUT,
            ),
            IngestFailureReason::ShardRateLimited => (
                ElasticException::RateLimited,
                format!("shard rate limiting [{}]", failure.index_id),
                StatusCode::TOO_MANY_REQUESTS,
            ),
            IngestFailureReason::NoShardsAvailable => (
                ElasticException::RateLimited,
                format!("no shards available [{}]", failure.index_id),
                StatusCode::TOO_MANY_REQUESTS,
            ),
            reason => {
                let pretty_reason = reason
                    .as_str_name()
                    .strip_prefix("INGEST_FAILURE_REASON_")
                    .unwrap_or("")
                    .replace('_', " ")
                    .to_ascii_lowercase();
                (
                    ElasticException::Internal,
                    format!("{} error [{}]", pretty_reason, failure.index_id),
                    StatusCode::INTERNAL_SERVER_ERROR,
                )
            }
        };
        for mut doc_handle in doc_handles {
            let error = ElasticBulkError {
                index_id: Some(failure.index_id.clone()),
                exception,
                reason: reason.clone(),
            };
            let item = ElasticBulkItem {
                index_id: failure.index_id.clone(),
                es_doc_id: doc_handle.es_doc_id.take(),
                status,
                error: Some(error),
            };
            let action = ElasticBulkAction::Index(item);
            positioned_actions.push((doc_handle.doc_position, action));
        }
    }
    assert!(
        per_subrequest_doc_handles.is_empty(),
        "doc handles should be empty"
    );

    for (position, item) in invalid_index_id_items {
        errors = true;
        let action = ElasticBulkAction::Index(item);
        positioned_actions.push((position, action));
    }

    assert_eq!(
        positioned_actions.len(),
        action_count,
        "request and response action count should match"
    );
    positioned_actions.sort_unstable_by_key(|(idx, _)| *idx);
    let actions = positioned_actions
        .into_iter()
        .map(|(_, action)| action)
        .collect();

    let took_millis = now.elapsed().as_millis() as u64;

    let bulk_response = ElasticBulkResponse {
        took_millis,
        errors,
        actions,
    };
    Ok(bulk_response)
}

#[allow(clippy::result_large_err)]
fn remove_doc_handles(
    per_subrequest_doc_handles: &mut HashMap<u32, Vec<DocHandle>>,
    subrequest_id: u32,
) -> Result<Vec<DocHandle>, ElasticsearchError> {
    per_subrequest_doc_handles
        .remove(&subrequest_id)
        .ok_or_else(|| {
            ElasticsearchError::new(
                StatusCode::INTERNAL_SERVER_ERROR,
                format!("could not find subrequest `{subrequest_id}` in bulk request"),
                None,
            )
        })
}

fn make_invalid_index_id_item(index_id: String, es_doc_id: Option<String>) -> ElasticBulkItem {
    let error = ElasticBulkError {
        index_id: Some(index_id.clone()),
        exception: ElasticException::IllegalArgument,
        reason: format!("invalid index id [{index_id}]"),
    };
    ElasticBulkItem {
        index_id,
        es_doc_id,
        status: StatusCode::BAD_REQUEST,
        error: Some(error),
    }
}

#[cfg(test)]
mod tests {
    use bytesize::ByteSize;
    use quickwit_proto::ingest::router::{
        IngestFailure, IngestFailureReason, IngestResponseV2, IngestSuccess,
        MockIngestRouterService,
    };
    use quickwit_proto::ingest::{ParseFailure, ParseFailureReason};
    use quickwit_proto::types::{IndexUid, Position, ShardId};
    use warp::{Filter, Rejection, Reply};

    use super::*;
    use crate::elasticsearch_api::bulk_v2::ElasticBulkResponse;
    use crate::elasticsearch_api::filter::elastic_bulk_filter;
    use crate::elasticsearch_api::make_elastic_api_response;
    use crate::elasticsearch_api::model::ElasticsearchError;
    use crate::format::extract_format_from_qs;
    use crate::with_arg;

    impl ElasticBulkAction {
        fn index_id(&self) -> &IndexId {
            match self {
                ElasticBulkAction::Create(item) => &item.index_id,
                ElasticBulkAction::Index(item) => &item.index_id,
            }
        }

        fn es_doc_id(&self) -> Option<&str> {
            match self {
                ElasticBulkAction::Create(item) => item.es_doc_id.as_deref(),
                ElasticBulkAction::Index(item) => item.es_doc_id.as_deref(),
            }
        }

        fn status(&self) -> StatusCode {
            match self {
                ElasticBulkAction::Create(item) => item.status,
                ElasticBulkAction::Index(item) => item.status,
            }
        }

        fn error(&self) -> Option<&ElasticBulkError> {
            match self {
                ElasticBulkAction::Create(item) => item.error.as_ref(),
                ElasticBulkAction::Index(item) => item.error.as_ref(),
            }
        }
    }

    fn es_compat_bulk_handler_v2(
        ingest_router: IngestRouterServiceClient,
        content_length_limit: ByteSize,
    ) -> impl Filter<Extract = (impl Reply,), Error = Rejection> + Clone {
        elastic_bulk_filter(content_length_limit)
            .and(with_arg(ingest_router))
            .then(|body, bulk_options, ingest_router| {
                elastic_bulk_ingest_v2(None, body, bulk_options, ingest_router)
            })
            .and(extract_format_from_qs())
            .map(make_elastic_api_response)
    }

    #[tokio::test]
    async fn test_bulk_api_happy_path() {
        let mut mock_ingest_router = MockIngestRouterService::new();
        mock_ingest_router
            .expect_ingest()
            .once()
            .returning(|ingest_request| {
                assert_eq!(ingest_request.subrequests.len(), 2);
                assert_eq!(ingest_request.commit_type(), CommitTypeV2::Auto);

                let mut subrequests = ingest_request.subrequests;
                subrequests.sort_by(|left, right| left.index_id.cmp(&right.index_id));

                assert_eq!(subrequests[0].subrequest_id, 0);
                assert_eq!(subrequests[0].index_id, "my-index-1");
                assert_eq!(subrequests[0].source_id, INGEST_V2_SOURCE_ID);
                assert_eq!(subrequests[0].doc_batch.as_ref().unwrap().num_docs(), 2);
                assert_eq!(subrequests[0].doc_batch.as_ref().unwrap().num_bytes(), 104);

                assert_eq!(subrequests[1].subrequest_id, 1);
                assert_eq!(subrequests[1].index_id, "my-index-2");
                assert_eq!(subrequests[1].source_id, INGEST_V2_SOURCE_ID);
                assert_eq!(subrequests[1].doc_batch.as_ref().unwrap().num_docs(), 1);
                assert_eq!(subrequests[1].doc_batch.as_ref().unwrap().num_bytes(), 52);

                Ok(IngestResponseV2 {
                    successes: vec![
                        IngestSuccess {
                            subrequest_id: 0,
                            index_uid: Some(IndexUid::for_test("my-index-1", 0)),
                            source_id: INGEST_V2_SOURCE_ID.to_string(),
                            shard_id: Some(ShardId::from(1)),
                            replication_position_inclusive: Some(Position::offset(1u64)),
                            num_ingested_docs: 2,
                            parse_failures: Vec::new(),
                        },
                        IngestSuccess {
                            subrequest_id: 1,
                            index_uid: Some(IndexUid::for_test("my-index-2", 0)),
                            source_id: INGEST_V2_SOURCE_ID.to_string(),
                            shard_id: Some(ShardId::from(1)),
                            replication_position_inclusive: Some(Position::offset(0u64)),
                            num_ingested_docs: 1,
                            parse_failures: Vec::new(),
                        },
                    ],
                    failures: Vec::new(),
                })
            });
        let ingest_router = IngestRouterServiceClient::from_mock(mock_ingest_router);
        let handler = es_compat_bulk_handler_v2(ingest_router, ByteSize::mb(10));

        let payload = r#"
            {"create": {"_index": "my-index-1", "_id" : "1"}}
            {"ts": 1, "message": "my-message-1"}
            {"create": {"_index": "my-index-2", "_id" : "1"}}
            {"ts": 1, "message": "my-message-1"}
            {"create": {"_index": "my-index-1"}}
            {"ts": 2, "message": "my-message-2"}
        "#;
        let response = warp::test::request()
            .path("/_elastic/_bulk")
            .method("POST")
            .body(payload)
            .reply(&handler)
            .await;
        assert_eq!(response.status(), 200);

        let bulk_response: ElasticBulkResponse = serde_json::from_slice(response.body()).unwrap();
        assert!(!bulk_response.errors);

        let mut items = bulk_response
            .actions
            .into_iter()
            .map(|action| match action {
                ElasticBulkAction::Create(item) => item,
                ElasticBulkAction::Index(item) => item,
            })
            .collect::<Vec<_>>();
        assert_eq!(items.len(), 3);

        items.sort_by(|left, right| {
            left.index_id
                .cmp(&right.index_id)
                .then(left.es_doc_id.cmp(&right.es_doc_id))
        });
        assert_eq!(items[0].index_id, "my-index-1");
        assert!(items[0].es_doc_id.is_none());
        assert_eq!(items[0].status, StatusCode::CREATED);

        assert_eq!(items[1].index_id, "my-index-1");
        assert_eq!(items[1].es_doc_id.as_ref().unwrap(), "1");
        assert_eq!(items[1].status, StatusCode::CREATED);

        assert_eq!(items[2].index_id, "my-index-2");
        assert_eq!(items[2].es_doc_id.as_ref().unwrap(), "1");
        assert_eq!(items[2].status, StatusCode::CREATED);
    }

    #[tokio::test]
    async fn test_bulk_api_accepts_empty_requests() {
        let ingest_router = IngestRouterServiceClient::mocked();
        let handler = es_compat_bulk_handler_v2(ingest_router, ByteSize::mb(10));

        let response = warp::test::request()
            .path("/_elastic/_bulk")
            .method("POST")
            .body("")
            .reply(&handler)
            .await;
        assert_eq!(response.status(), 200);

        let bulk_response: ElasticBulkResponse = serde_json::from_slice(response.body()).unwrap();
        assert!(!bulk_response.errors)
    }

    #[tokio::test]
    async fn test_bulk_api_ignores_blank_lines() {
        let mut mock_ingest_router = MockIngestRouterService::new();
        mock_ingest_router
            .expect_ingest()
            .once()
            .returning(|ingest_request| {
                assert_eq!(ingest_request.subrequests.len(), 1);
                assert_eq!(ingest_request.commit_type(), CommitTypeV2::Auto);

                let subrequest_0 = &ingest_request.subrequests[0];

                assert_eq!(subrequest_0.index_id, "my-index-1");
                assert_eq!(subrequest_0.source_id, INGEST_V2_SOURCE_ID);
                assert_eq!(subrequest_0.doc_batch.as_ref().unwrap().num_docs(), 1);
                assert_eq!(subrequest_0.doc_batch.as_ref().unwrap().num_bytes(), 52);

                Ok(IngestResponseV2 {
                    successes: vec![IngestSuccess {
                        subrequest_id: 0,
                        index_uid: Some(IndexUid::for_test("my-index-1", 0)),
                        source_id: INGEST_V2_SOURCE_ID.to_string(),
                        shard_id: Some(ShardId::from(1)),
                        replication_position_inclusive: Some(Position::offset(0u64)),
                        num_ingested_docs: 1,
                        parse_failures: Vec::new(),
                    }],
                    failures: Vec::new(),
                })
            });
        let ingest_router = IngestRouterServiceClient::from_mock(mock_ingest_router);
        let handler = es_compat_bulk_handler_v2(ingest_router, ByteSize::mb(10));

        let payload = r#"

            {"create": {"_index": "my-index-1", "_id" : "1"}}

            {"ts": 1, "message": "my-message-1"}
        "#;
        let response = warp::test::request()
            .path("/_elastic/_bulk")
            .method("POST")
            .body(payload)
            .reply(&handler)
            .await;
        assert_eq!(response.status(), 200);

        let bulk_response: ElasticBulkResponse = serde_json::from_slice(response.body()).unwrap();
        assert!(!bulk_response.errors);
    }

    #[tokio::test]
    async fn test_bulk_api_handles_malformed_requests() {
        let ingest_router = IngestRouterServiceClient::mocked();
        let handler = es_compat_bulk_handler_v2(ingest_router, ByteSize::mb(10));

        let payload = r#"
            {"create": {"_index": "my-index-1", "_id" : "1"},}
            {"ts": 1, "message": "my-message-1"}
        "#;
        let response = warp::test::request()
            .path("/_elastic/_bulk")
            .method("POST")
            .body(payload)
            .reply(&handler)
            .await;
        assert_eq!(response.status(), 400);

        let es_error: ElasticsearchError = serde_json::from_slice(response.body()).unwrap();
        assert_eq!(es_error.status, StatusCode::BAD_REQUEST);

        let reason = es_error.error.reason.unwrap();
        assert_eq!(
            reason,
            "Malformed action/metadata line [1]: expected value at line 1 column 60"
        );

        let payload = r#"
            {"create": {"_index": "my-index-1", "_id" : "1"}}
        "#;
        let response = warp::test::request()
            .path("/_elastic/_bulk")
            .method("POST")
            .body(payload)
            .reply(&handler)
            .await;
        assert_eq!(response.status(), 400);

        let es_error: ElasticsearchError = serde_json::from_slice(response.body()).unwrap();
        assert_eq!(es_error.status, StatusCode::BAD_REQUEST);

        let reason = es_error.error.reason.unwrap();
        assert_eq!(reason, "Validation Failed: 1: no requests added;");

        let payload = r#"
            {"create": {"_id" : "1"}}
            {"ts": 1, "message": "my-message-1"}
        "#;
        let response = warp::test::request()
            .path("/_elastic/_bulk")
            .method("POST")
            .body(payload)
            .reply(&handler)
            .await;
        assert_eq!(response.status(), 400);

        let es_error: ElasticsearchError = serde_json::from_slice(response.body()).unwrap();
        assert_eq!(es_error.status, StatusCode::BAD_REQUEST);

        let reason = es_error.error.reason.unwrap();
        assert_eq!(reason, "Validation Failed: 1: index is missing;");
    }

    #[tokio::test]
    async fn test_bulk_api_index_not_found() {
        let mut mock_ingest_router = MockIngestRouterService::new();
        mock_ingest_router
            .expect_ingest()
            .once()
            .returning(|ingest_request| {
                assert_eq!(ingest_request.subrequests.len(), 2);
                assert_eq!(ingest_request.commit_type(), CommitTypeV2::Auto);

                let mut subrequests = ingest_request.subrequests;
                subrequests.sort_by(|left, right| left.index_id.cmp(&right.index_id));

                assert_eq!(subrequests[0].subrequest_id, 0);
                assert_eq!(subrequests[0].index_id, "my-index-1");
                assert_eq!(subrequests[0].source_id, INGEST_V2_SOURCE_ID);
                assert_eq!(subrequests[0].doc_batch.as_ref().unwrap().num_docs(), 2);

                assert_eq!(subrequests[1].subrequest_id, 1);
                assert_eq!(subrequests[1].index_id, "my-index-2");
                assert_eq!(subrequests[1].source_id, INGEST_V2_SOURCE_ID);
                assert_eq!(subrequests[1].doc_batch.as_ref().unwrap().num_docs(), 1);

                Ok(IngestResponseV2 {
                    successes: Vec::new(),
                    failures: vec![
                        IngestFailure {
                            subrequest_id: 0,
                            index_id: "my-index-1".to_string(),
                            source_id: INGEST_V2_SOURCE_ID.to_string(),
                            reason: IngestFailureReason::IndexNotFound as i32,
                        },
                        IngestFailure {
                            subrequest_id: 1,
                            index_id: "my-index-2".to_string(),
                            source_id: INGEST_V2_SOURCE_ID.to_string(),
                            reason: IngestFailureReason::IndexNotFound as i32,
                        },
                    ],
                })
            });
        let ingest_router = IngestRouterServiceClient::from_mock(mock_ingest_router);
        let handler = es_compat_bulk_handler_v2(ingest_router, ByteSize::mb(10));

        let payload = r#"
            {"index": {"_index": "my-index-1", "_id" : "1"}}
            {"ts": 1, "message": "my-message-1"}
            {"index": {"_index": "my-index-1"}}
            {"ts": 2, "message": "my-message-1"}
            {"index": {"_index": "my-index-2", "_id" : "1"}}
            {"ts": 3, "message": "my-message-2"}
        "#;
        let response = warp::test::request()
            .path("/_elastic/_bulk")
            .method("POST")
            .body(payload)
            .reply(&handler)
            .await;
        assert_eq!(response.status(), 200);

        let bulk_response: ElasticBulkResponse = serde_json::from_slice(response.body()).unwrap();
        assert!(bulk_response.errors);
        assert_eq!(bulk_response.actions.len(), 3);
    }

    #[test]
    fn test_bulk_api_make_elastic_bulk_response_v2() {
        let response = make_elastic_bulk_response_v2(
            IngestResponseV2::default(),
            HashMap::new(),
            Instant::now(),
            0,
            Vec::new(),
        )
        .unwrap();

        assert!(!response.errors);
        assert!(response.actions.is_empty());

        let ingest_response_v2 = IngestResponseV2 {
            successes: vec![IngestSuccess {
                subrequest_id: 0,
                index_uid: Some(IndexUid::for_test("test-index-foo", 0)),
                source_id: "test-source".to_string(),
                shard_id: Some(ShardId::from(0)),
                replication_position_inclusive: Some(Position::offset(0u64)),
                num_ingested_docs: 1,
                parse_failures: vec![ParseFailure {
                    doc_uid: Some(DocUid::for_test(1)),
                    reason: ParseFailureReason::InvalidJson as i32,
                    message: "failed to parse JSON document".to_string(),
                }],
            }],
            failures: vec![IngestFailure {
                subrequest_id: 1,
                index_id: "test-index-bar".to_string(),
                source_id: "test-source".to_string(),
                reason: IngestFailureReason::IndexNotFound as i32,
            }],
        };
        let per_request_doc_handles = HashMap::from_iter([
            (
                0,
                vec![
                    DocHandle {
                        doc_position: 0,
                        doc_uid: DocUid::for_test(0),
                        es_doc_id: Some("0".to_string()),
                        is_parse_failure: false,
                    },
                    DocHandle {
                        doc_position: 1,
                        doc_uid: DocUid::for_test(1),
                        es_doc_id: Some("1".to_string()),
                        is_parse_failure: false,
                    },
                ],
            ),
            (
                1,
                vec![DocHandle {
                    doc_position: 2,
                    doc_uid: DocUid::for_test(2),
                    es_doc_id: Some("2".to_string()),
                    is_parse_failure: false,
                }],
            ),
        ]);
        let response = make_elastic_bulk_response_v2(
            ingest_response_v2,
            per_request_doc_handles,
            Instant::now(),
            3,
            Vec::new(),
        )
        .unwrap();

        assert!(response.errors);
        assert_eq!(response.actions.len(), 3);

        assert_eq!(response.actions[0].index_id(), "test-index-foo");
        assert_eq!(response.actions[0].es_doc_id(), Some("0"));
        assert_eq!(response.actions[0].status(), StatusCode::CREATED);
        assert!(response.actions[0].error().is_none());

        assert_eq!(response.actions[1].index_id(), "test-index-foo");
        assert_eq!(response.actions[1].es_doc_id(), Some("1"));
        assert_eq!(response.actions[1].status(), StatusCode::BAD_REQUEST);

        let error = response.actions[1].error().unwrap();
        assert_eq!(error.index_id.as_ref().unwrap(), "test-index-foo");
        assert_eq!(error.exception, ElasticException::DocumentParsing);
        assert_eq!(error.reason, "failed to parse JSON document");

        assert_eq!(response.actions[2].index_id(), "test-index-bar");
        assert_eq!(response.actions[2].es_doc_id(), Some("2"));
        assert_eq!(response.actions[2].status(), StatusCode::NOT_FOUND);

        let error = response.actions[2].error().unwrap();
        assert_eq!(error.index_id.as_ref().unwrap(), "test-index-bar");
        assert_eq!(error.exception, ElasticException::IndexNotFound);
        assert_eq!(error.reason, "no such index [test-index-bar]");
    }

    #[tokio::test]
    async fn test_bulk_api_refresh_parameter() {
        let mut mock_ingest_router = MockIngestRouterService::new();
        mock_ingest_router
            .expect_ingest()
            .once()
            .returning(|ingest_request| {
                assert_eq!(ingest_request.commit_type(), CommitTypeV2::WaitFor);
                Ok(IngestResponseV2 {
                    successes: vec![IngestSuccess {
                        subrequest_id: 0,
                        index_uid: Some(IndexUid::for_test("my-index-1", 0)),
                        source_id: INGEST_V2_SOURCE_ID.to_string(),
                        shard_id: Some(ShardId::from(1)),
                        replication_position_inclusive: Some(Position::offset(1u64)),
                        num_ingested_docs: 2,
                        parse_failures: Vec::new(),
                    }],
                    failures: Vec::new(),
                })
            });
        let ingest_router = IngestRouterServiceClient::from_mock(mock_ingest_router);
        let handler = es_compat_bulk_handler_v2(ingest_router, ByteSize::mb(10));

        let payload = r#"
            {"create": {"_index": "my-index-1", "_id" : "1"}}
            {"ts": 1, "message": "my-message-1"}
        "#;
        warp::test::request()
            .path("/_elastic/_bulk?refresh=wait_for")
            .method("POST")
            .body(payload)
            .reply(&handler)
            .await;
    }

    #[tokio::test]
    async fn test_bulk_api_invalid_index_id() {
        let mut mock_ingest_router = MockIngestRouterService::new();
        mock_ingest_router
            .expect_ingest()
            .once()
            .returning(|ingest_request| {
                assert_eq!(ingest_request.subrequests.len(), 2);
                Ok(IngestResponseV2 {
                    successes: vec![
                        IngestSuccess {
                            subrequest_id: 0,
                            index_uid: Some(IndexUid::for_test("my-index-1", 0)),
                            source_id: INGEST_V2_SOURCE_ID.to_string(),
                            shard_id: Some(ShardId::from(1)),
                            replication_position_inclusive: Some(Position::offset(1u64)),
                            num_ingested_docs: 2,
                            parse_failures: Vec::new(),
                        },
                        IngestSuccess {
                            subrequest_id: 1,
                            index_uid: Some(IndexUid::for_test("my-index-2", 0)),
                            source_id: INGEST_V2_SOURCE_ID.to_string(),
                            shard_id: Some(ShardId::from(1)),
                            replication_position_inclusive: Some(Position::offset(0u64)),
                            num_ingested_docs: 1,
                            parse_failures: Vec::new(),
                        },
                    ],
                    failures: Vec::new(),
                })
            });
        let ingest_router = IngestRouterServiceClient::from_mock(mock_ingest_router);
        let handler = es_compat_bulk_handler_v2(ingest_router, ByteSize::mb(10));

        let payload = r#"
            {"create": {"_index": "my-index-1"}}
            {"ts": 1, "message": "my-message-1"}
            {"create": {"_index": "bad!"}}
            {"ts": 1, "message": "my-message-2"}
            {"create": {"_index": "my-index-2", "_id" : "1"}}
            {"ts": 1, "message": "my-message-3"}

        "#;
        let response = warp::test::request()
            .path("/_elastic/_bulk")
            .method("POST")
            .body(payload)
            .reply(&handler)
            .await;
        assert_eq!(response.status(), 200);

        let bulk_response: ElasticBulkResponse = serde_json::from_slice(response.body()).unwrap();
        assert!(bulk_response.errors);

        let items = bulk_response
            .actions
            .into_iter()
            .map(|action| match action {
                ElasticBulkAction::Create(item) => item,
                ElasticBulkAction::Index(item) => item,
            })
            .collect::<Vec<_>>();
        assert_eq!(items.len(), 3);

        assert_eq!(items[0].index_id, "my-index-1");
        assert!(items[0].es_doc_id.is_none());
        assert_eq!(items[0].status, StatusCode::CREATED);

        assert_eq!(items[1].index_id, "bad!");
        assert!(items[1].es_doc_id.is_none());
        assert_eq!(items[1].status, StatusCode::BAD_REQUEST);

        assert_eq!(items[2].index_id, "my-index-2");
        assert_eq!(items[2].es_doc_id.as_ref().unwrap(), "1");
        assert_eq!(items[2].status, StatusCode::CREATED);
    }
}


================================================
FILE: quickwit/quickwit-serve/src/elasticsearch_api/filter.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use bytes::Bytes;
use bytesize::ByteSize;
use serde::de::DeserializeOwned;
use warp::reject::LengthRequired;
use warp::{Filter, Rejection};

use super::model::{
    CatIndexQueryParams, DeleteQueryParams, FieldCapabilityQueryParams, FieldCapabilityRequestBody,
    MultiSearchQueryParams, SearchQueryParamsCount,
};
use crate::Body;
use crate::decompression::get_body_bytes;
use crate::elasticsearch_api::model::{
    ElasticBulkOptions, ScrollQueryParams, SearchBody, SearchQueryParams,
};
use crate::search_api::{extract_index_id_patterns, extract_index_id_patterns_default};

const BODY_LENGTH_LIMIT: ByteSize = ByteSize::mib(1);

// TODO: Make all elastic endpoint models `utoipa` compatible
// and register them here.
#[derive(utoipa::OpenApi)]
#[openapi(paths(elastic_cluster_info_filter,))]
pub struct ElasticCompatibleApi;

#[utoipa::path(get, tag = "Cluster Info", path = "/_elastic")]
pub(crate) fn elastic_cluster_info_filter() -> impl Filter<Extract = (), Error = Rejection> + Clone
{
    warp::path!("_elastic")
        .and(warp::get().or(warp::head()).unify())
        .and(warp::path::end())
}

#[utoipa::path(get, tag = "Search", path = "/_search")]
pub(crate) fn elasticsearch_filter()
-> impl Filter<Extract = (SearchQueryParams,), Error = Rejection> + Clone {
    warp::path!("_elastic" / "_search")
        .and(warp::get().or(warp::post()).unify())
        .and(warp::query())
}

#[utoipa::path(
    post,
    tag = "Ingest",
    path = "/_bulk",
    request_body(content = String, description = "Elasticsearch compatible bulk request body limited to 10MB", content_type = "application/json"),
    responses(
        (status = 200, description = "Successfully ingested documents.", body = IngestResponse)
    ),
    params(
        ("refresh" = Option<ElasticRefresh>, Query, description = "Force or wait for commit at the end of the indexing operation."),
    )
)]
pub(crate) fn elastic_bulk_filter(
    content_length_limit: ByteSize,
) -> impl Filter<Extract = (Body, ElasticBulkOptions), Error = Rejection> + Clone {
    warp::path!("_elastic" / "_bulk")
        .and(warp::post().or(warp::put()).unify())
        .and(warp::body::content_length_limit(
            content_length_limit.as_u64(),
        ))
        .and(get_body_bytes())
        .and(warp::query())
}

#[utoipa::path(
    post,
    tag = "Ingest",
    path = "/{index}/_bulk",
    request_body(content = String, description = "Elasticsearch compatible bulk request body limited to 10MB", content_type = "application/json"),
    responses(
        (status = 200, description = "Successfully ingested documents.", body = IngestResponse)
    ),
    params(
        ("refresh" = Option<ElasticRefresh>, Query, description = "Force or wait for commit at the end of the indexing operation."),
    )
)]
pub(crate) fn elastic_index_bulk_filter(
    content_length_limit: ByteSize,
) -> impl Filter<Extract = (String, Body, ElasticBulkOptions), Error = Rejection> + Clone {
    warp::path!("_elastic" / String / "_bulk")
        .and(warp::post().or(warp::put()).unify())
        .and(warp::body::content_length_limit(
            content_length_limit.as_u64(),
        ))
        .and(get_body_bytes())
        .and(warp::query::<ElasticBulkOptions>())
}

/// Like the warp json filter, but accepts an empty body and interprets it as `T::default`.
fn json_or_empty<T: DeserializeOwned + Send + Default>()
-> impl Filter<Extract = (T,), Error = Rejection> + Copy {
    warp::body::content_length_limit(BODY_LENGTH_LIMIT.as_u64())
        .and(warp::body::bytes().and_then(|buf: Bytes| async move {
            if buf.is_empty() {
                return Ok(T::default());
            }
            serde_json::from_slice(&buf)
                .map_err(|err| warp::reject::custom(crate::rest::InvalidJsonRequest(err)))
        }))
        .recover(|rejection: Rejection| async {
            // Not having a header with content length is not an error as long as
            // there are no body.
            if rejection.find::<LengthRequired>().is_some() {
                Ok(T::default())
            } else {
                Err(rejection)
            }
        })
        .unify()
}

#[utoipa::path(get, tag = "Metadata", path = "/{index}/_field_caps")]
pub(crate) fn elastic_index_field_capabilities_filter() -> impl Filter<
    Extract = (
        Vec<String>,
        FieldCapabilityQueryParams,
        FieldCapabilityRequestBody,
    ),
    Error = Rejection,
> + Clone {
    warp::path!("_elastic" / String / "_field_caps")
        .and_then(extract_index_id_patterns)
        .and(warp::get().or(warp::post()).unify())
        .and(warp::query())
        .and(json_or_empty())
}

#[utoipa::path(get, tag = "Metadata", path = "/_field_caps")]
pub(crate) fn elastic_field_capabilities_filter() -> impl Filter<
    Extract = (
        Vec<String>,
        FieldCapabilityQueryParams,
        FieldCapabilityRequestBody,
    ),
    Error = Rejection,
> + Clone {
    warp::path!("_elastic" / "_field_caps")
        .and_then(extract_index_id_patterns_default)
        .and(warp::get().or(warp::post()).unify())
        .and(warp::query())
        .and(json_or_empty())
}

#[utoipa::path(get, tag = "Metadata", path = "/_resolve/index/{index}")]
pub(crate) fn elastic_resolve_index_filter()
-> impl Filter<Extract = (Vec<String>,), Error = Rejection> + Clone {
    warp::path!("_elastic" / "_resolve" / "index" / String)
        .and_then(extract_index_id_patterns)
        .and(warp::get())
}

#[utoipa::path(get, tag = "Count", path = "/{index}/_count")]
pub(crate) fn elastic_index_count_filter()
-> impl Filter<Extract = (Vec<String>, SearchQueryParamsCount, SearchBody), Error = Rejection> + Clone
{
    warp::path!("_elastic" / String / "_count")
        .and_then(extract_index_id_patterns)
        .and(warp::get().or(warp::post()).unify())
        .and(warp::query())
        .and(json_or_empty())
}

#[utoipa::path(delete, tag = "Indexes", path = "/{index}")]
pub(crate) fn elastic_delete_index_filter()
-> impl Filter<Extract = (Vec<String>, DeleteQueryParams), Error = Rejection> + Clone {
    warp::path!("_elastic" / String)
        .and(warp::delete())
        .and_then(extract_index_id_patterns)
        .and(warp::query())
}

// No support for any query parameters for now.
#[utoipa::path(get, tag = "Search", path = "/{index}/_stats")]
pub(crate) fn elastic_index_stats_filter()
-> impl Filter<Extract = (Vec<String>,), Error = Rejection> + Clone {
    warp::path!("_elastic" / String / "_stats")
        .and_then(extract_index_id_patterns)
        .and(warp::get())
}

#[utoipa::path(get, tag = "Search", path = "/_stats")]
pub(crate) fn elastic_stats_filter() -> impl Filter<Extract = (), Error = Rejection> + Clone {
    warp::path!("_elastic" / "_stats").and(warp::get())
}

#[utoipa::path(get, tag = "Search", path = "/_cluster/health")]
pub(crate) fn elastic_cluster_health_filter() -> impl Filter<Extract = (), Error = Rejection> + Clone
{
    warp::path!("_elastic" / "_cluster" / "health").and(warp::get())
}

#[utoipa::path(get, tag = "Search", path = "/_cat/indices/{index}")]
pub(crate) fn elastic_index_cat_indices_filter()
-> impl Filter<Extract = (Vec<String>, CatIndexQueryParams), Error = Rejection> + Clone {
    warp::path!("_elastic" / "_cat" / "indices" / String)
        .and_then(extract_index_id_patterns)
        .and(warp::get())
        .and(warp::query())
}

#[utoipa::path(get, tag = "Search", path = "/_cat/indices")]
pub(crate) fn elastic_cat_indices_filter()
-> impl Filter<Extract = (CatIndexQueryParams,), Error = Rejection> + Clone {
    warp::path!("_elastic" / "_cat" / "indices")
        .and(warp::get())
        .and(warp::query())
}

#[utoipa::path(get, tag = "Search", path = "/{index}/_search")]
pub(crate) fn elastic_index_search_filter()
-> impl Filter<Extract = (Vec<String>, SearchQueryParams, SearchBody), Error = Rejection> + Clone {
    warp::path!("_elastic" / String / "_search")
        .and_then(extract_index_id_patterns)
        .and(warp::get().or(warp::post()).unify())
        .and(warp::query())
        .and(json_or_empty())
}

#[utoipa::path(post, tag = "Search", path = "/_msearch")]
pub(crate) fn elastic_multi_search_filter()
-> impl Filter<Extract = (Bytes, MultiSearchQueryParams), Error = Rejection> + Clone {
    warp::path!("_elastic" / "_msearch")
        .and(warp::body::content_length_limit(BODY_LENGTH_LIMIT.as_u64()))
        .and(warp::body::bytes())
        .and(warp::post())
        .and(warp::query())
}

fn merge_scroll_body_params(
    from_query_string: ScrollQueryParams,
    from_body: ScrollQueryParams,
) -> ScrollQueryParams {
    ScrollQueryParams {
        scroll: from_query_string.scroll.or(from_body.scroll),
        scroll_id: from_query_string.scroll_id.or(from_body.scroll_id),
    }
}

pub(crate) fn elastic_nodes_filter() -> impl Filter<Extract = (), Error = Rejection> + Clone {
    warp::path!("_elastic" / "_nodes" / "http").and(warp::get())
}

pub(crate) fn elastic_search_shards_filter()
-> impl Filter<Extract = (String,), Error = Rejection> + Clone {
    warp::path!("_elastic" / String / "_search_shards").and(warp::get())
}

#[utoipa::path(post, tag = "Search", path = "/_search/scroll")]
pub(crate) fn elastic_scroll_filter()
-> impl Filter<Extract = (ScrollQueryParams,), Error = Rejection> + Clone {
    warp::path!("_elastic" / "_search" / "scroll")
        .and(warp::body::content_length_limit(BODY_LENGTH_LIMIT.as_u64()))
        .and(warp::get().or(warp::post()).unify())
        .and(warp::query())
        .and(json_or_empty())
        .map(
            |scroll_query_params: ScrollQueryParams, scroll_body: ScrollQueryParams| {
                merge_scroll_body_params(scroll_query_params, scroll_body)
            },
        )
}

pub(crate) fn elastic_delete_scroll_filter() -> impl Filter<Extract = (), Error = Rejection> + Clone
{
    warp::path!("_elastic" / "_search" / "scroll").and(warp::delete())
}

pub(crate) fn elastic_aliases_filter() -> impl Filter<Extract = (), Error = Rejection> + Clone {
    warp::path!("_elastic" / "_aliases").and(warp::get())
}

pub(crate) fn elastic_index_mapping_filter()
-> impl Filter<Extract = (String,), Error = Rejection> + Clone {
    warp::path!("_elastic" / String / "_mapping")
        .or(warp::path!("_elastic" / String / "_mappings"))
        .unify()
        .and(warp::get())
}


================================================
FILE: quickwit/quickwit-serve/src/elasticsearch_api/mod.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

mod bulk;
mod bulk_v2;
mod filter;
mod model;
mod rest_handler;

use std::sync::Arc;

use bulk::{es_compat_bulk_handler, es_compat_index_bulk_handler};
pub use filter::ElasticCompatibleApi;
use quickwit_cluster::Cluster;
use quickwit_config::NodeConfig;
use quickwit_index_management::IndexService;
use quickwit_ingest::IngestServiceClient;
use quickwit_proto::ingest::router::IngestRouterServiceClient;
use quickwit_proto::metastore::MetastoreServiceClient;
use quickwit_search::SearchService;
pub use rest_handler::{
    es_compat_cat_indices_handler, es_compat_cluster_info_handler, es_compat_delete_index_handler,
    es_compat_delete_scroll_handler, es_compat_index_cat_indices_handler,
    es_compat_index_count_handler, es_compat_index_field_capabilities_handler,
    es_compat_index_multi_search_handler, es_compat_index_search_handler,
    es_compat_index_stats_handler, es_compat_resolve_index_handler, es_compat_scroll_handler,
    es_compat_search_handler, es_compat_stats_handler,
};
use rest_handler::{
    es_compat_cluster_health_handler, es_compat_nodes_handler, es_compat_search_shards_handler,
};
use serde::{Deserialize, Serialize};
use warp::hyper::StatusCode;
use warp::{Filter, Rejection};

use crate::elasticsearch_api::model::ElasticsearchError;
use crate::elasticsearch_api::rest_handler::{
    es_compat_aliases_handler, es_compat_index_mapping_handler,
};
use crate::rest::recover_fn;
use crate::rest_api_response::RestApiResponse;
use crate::{BodyFormat, BuildInfo};

/// Setup Elasticsearch API handlers
///
/// This is where all newly supported Elasticsearch handlers
/// should be registered.
#[allow(clippy::too_many_arguments)] // Will go away when we remove ingest v1.
pub fn elastic_api_handlers(
    cluster: Cluster,
    node_config: Arc<NodeConfig>,
    search_service: Arc<dyn SearchService>,
    ingest_service: IngestServiceClient,
    ingest_router: IngestRouterServiceClient,
    metastore: MetastoreServiceClient,
    index_service: IndexService,
    enable_ingest_v1: bool,
    enable_ingest_v2: bool,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    let ingest_content_length_limit = node_config.ingest_api_config.content_length_limit;
    es_compat_cluster_info_handler(node_config.clone(), BuildInfo::get())
        .or(es_compat_nodes_handler(node_config.clone()))
        .or(es_compat_search_handler(search_service.clone()))
        .or(es_compat_bulk_handler(
            ingest_service.clone(),
            ingest_router.clone(),
            ingest_content_length_limit,
            enable_ingest_v1,
            enable_ingest_v2,
        ))
        .boxed()
        .or(es_compat_index_bulk_handler(
            ingest_service,
            ingest_router,
            ingest_content_length_limit,
            enable_ingest_v1,
            enable_ingest_v2,
        ))
        .or(es_compat_index_search_handler(search_service.clone()))
        .or(es_compat_index_count_handler(search_service.clone()))
        .or(es_compat_scroll_handler(search_service.clone()))
        .or(es_compat_delete_scroll_handler())
        .or(es_compat_index_multi_search_handler(search_service.clone()))
        .or(es_compat_index_field_capabilities_handler(
            search_service.clone(),
        ))
        .boxed()
        .or(es_compat_index_stats_handler(metastore.clone()))
        .or(es_compat_delete_index_handler(index_service))
        .or(es_compat_stats_handler(metastore.clone()))
        .or(es_compat_cluster_health_handler(cluster))
        .or(es_compat_index_cat_indices_handler(metastore.clone()))
        .or(es_compat_cat_indices_handler(metastore.clone()))
        .or(es_compat_resolve_index_handler(metastore.clone()))
        .or(es_compat_aliases_handler())
        .or(es_compat_index_mapping_handler(
            metastore.clone(),
            search_service.clone(),
        ))
        .or(es_compat_search_shards_handler(node_config))
        .recover(recover_fn)
        .with(warp::reply::with::header(
            "X-Elastic-Product",
            "Elasticsearch",
        ))
        .boxed()
    // Register newly created handlers here.
}

/// Helper type needed by the Elasticsearch endpoints.
/// Control how the total number of hits should be tracked.
///
/// When set to `Track` with a value `true`, the response will always track the number of hits that
/// match the query accurately.
///
/// When set to `Count` with an integer value `n`, the response accurately tracks the total
/// hit count that match the query up to `n` documents.
#[derive(Debug, Clone, Copy, PartialEq, Serialize, Deserialize)]
#[serde(untagged)]
pub enum TrackTotalHits {
    /// Track the number of hits that match the query accurately.
    Track(bool),
    /// Track the number of hits up to the specified value.
    Count(i64),
}

impl From<bool> for TrackTotalHits {
    fn from(b: bool) -> Self {
        TrackTotalHits::Track(b)
    }
}

impl From<i64> for TrackTotalHits {
    fn from(i: i64) -> Self {
        TrackTotalHits::Count(i)
    }
}

fn make_elastic_api_response<T: serde::Serialize>(
    elasticsearch_result: Result<T, ElasticsearchError>,
    body_format: BodyFormat,
) -> RestApiResponse {
    let status_code = match &elasticsearch_result {
        Ok(_) => StatusCode::OK,
        Err(error) => error.status,
    };
    RestApiResponse::new(&elasticsearch_result, status_code, body_format)
}

#[cfg(test)]
mod tests {
    use std::sync::Arc;

    use assert_json_diff::assert_json_include;
    use mockall::predicate;
    use quickwit_cluster::{ChannelTransport, Cluster, create_cluster_for_test};
    use quickwit_config::NodeConfig;
    use quickwit_index_management::IndexService;
    use quickwit_ingest::{IngestApiService, IngestServiceClient};
    use quickwit_metastore::metastore_for_test;
    use quickwit_proto::ingest::router::IngestRouterServiceClient;
    use quickwit_proto::metastore::MetastoreServiceClient;
    use quickwit_search::MockSearchService;
    use quickwit_storage::StorageResolver;
    use serde_json::Value as JsonValue;
    use warp::Filter;

    use super::elastic_api_handlers;
    use super::model::ElasticsearchError;
    use crate::BuildInfo;
    use crate::elasticsearch_api::rest_handler::es_compat_cluster_info_handler;
    use crate::rest::recover_fn;

    fn ingest_service_client() -> IngestServiceClient {
        let universe = quickwit_actors::Universe::new();
        let (ingest_service_mailbox, _) = universe.create_test_mailbox::<IngestApiService>();
        IngestServiceClient::from_mailbox(ingest_service_mailbox)
    }

    pub async fn mock_cluster() -> Cluster {
        let transport = ChannelTransport::default();
        create_cluster_for_test(Vec::new(), &[], &transport, false)
            .await
            .unwrap()
    }

    #[tokio::test]
    async fn test_msearch_api_return_200_responses() {
        let config = Arc::new(NodeConfig::for_test());
        let mut mock_search_service = MockSearchService::new();
        mock_search_service
            .expect_root_search()
            .with(predicate::function(
                |search_request: &quickwit_proto::search::SearchRequest| {
                    (search_request.index_id_patterns == vec!["index-1".to_string()]
                        && search_request.start_offset == 5
                        && search_request.max_hits == 20)
                        || (search_request.index_id_patterns == vec!["index-2".to_string()]
                            && search_request.start_offset == 0
                            && search_request.max_hits == 10)
                },
            ))
            .returning(|_| Ok(Default::default()));
        let ingest_router = IngestRouterServiceClient::mocked();
        let index_service =
            IndexService::new(metastore_for_test(), StorageResolver::unconfigured());
        let es_search_api_handler = super::elastic_api_handlers(
            mock_cluster().await,
            config,
            Arc::new(mock_search_service),
            ingest_service_client(),
            ingest_router,
            MetastoreServiceClient::mocked(),
            index_service,
            true,
            false,
        );
        let msearch_payload = r#"
            {"index":"index-1"}
            {"query":{"query_string":{"query":"test"}}, "from": 5, "size": 20}
            {"index":"index-2"}
            {"query":{"query_string":{"query":"test"}}}
            "#;
        let resp = warp::test::request()
            .path("/_elastic/_msearch")
            .method("POST")
            .body(msearch_payload)
            .reply(&es_search_api_handler)
            .await;
        assert_eq!(resp.status(), 200);
        assert_eq!(
            resp.headers().get("x-elastic-product").unwrap(),
            "Elasticsearch"
        );
        let string_body = String::from_utf8(resp.body().to_vec()).unwrap();
        let es_msearch_response: serde_json::Value = serde_json::from_str(&string_body).unwrap();
        let responses = es_msearch_response
            .get("responses")
            .unwrap()
            .as_array()
            .unwrap();
        assert_eq!(responses.len(), 2);
        for response in responses {
            assert_eq!(response.get("status").unwrap().as_u64().unwrap(), 200);
            assert_eq!(response.get("error"), None);
            response.get("hits").unwrap();
        }
    }

    #[tokio::test]
    async fn test_msearch_api_return_one_500_and_one_200_responses() {
        let config = Arc::new(NodeConfig::for_test());
        let mut mock_search_service = MockSearchService::new();
        mock_search_service
            .expect_root_search()
            .returning(|search_request| {
                if search_request
                    .index_id_patterns
                    .contains(&"index-1".to_string())
                {
                    Ok(Default::default())
                } else {
                    Err(quickwit_search::SearchError::Internal(
                        "something bad happened".to_string(),
                    ))
                }
            });

        let ingest_router = IngestRouterServiceClient::mocked();
        let index_service =
            IndexService::new(metastore_for_test(), StorageResolver::unconfigured());
        let es_search_api_handler = super::elastic_api_handlers(
            mock_cluster().await,
            config,
            Arc::new(mock_search_service),
            ingest_service_client(),
            ingest_router,
            MetastoreServiceClient::mocked(),
            index_service,
            true,
            false,
        );
        let msearch_payload = r#"
            {"index":"index-1"}
            {"query":{"query_string":{"query":"test"}}, "from": 5, "size": 10}
            {"index":"index-2"}
            {"query":{"query_string":{"query":"test"}}}
            "#;
        let resp = warp::test::request()
            .path("/_elastic/_msearch")
            .method("POST")
            .body(msearch_payload)
            .reply(&es_search_api_handler)
            .await;
        assert_eq!(resp.status(), 200);
        let es_msearch_response: serde_json::Value = serde_json::from_slice(resp.body()).unwrap();
        let responses = es_msearch_response
            .get("responses")
            .unwrap()
            .as_array()
            .unwrap();
        assert_eq!(responses.len(), 2);
        assert_eq!(responses[0].get("status").unwrap().as_u64().unwrap(), 200);
        assert_eq!(responses[0].get("error"), None);
        assert_eq!(responses[1].get("status").unwrap().as_u64().unwrap(), 500);
        assert_eq!(responses[1].get("hits"), None);
        let error_cause = responses[1].get("error").unwrap();
        assert_eq!(
            error_cause.get("reason").unwrap().as_str().unwrap(),
            "internal error: `something bad happened`"
        );
    }

    #[tokio::test]
    async fn test_msearch_api_return_400_with_malformed_request_header() {
        let config = Arc::new(NodeConfig::for_test());
        let mock_search_service = MockSearchService::new();

        let ingest_router = IngestRouterServiceClient::mocked();
        let index_service =
            IndexService::new(metastore_for_test(), StorageResolver::unconfigured());
        let es_search_api_handler = super::elastic_api_handlers(
            mock_cluster().await,
            config,
            Arc::new(mock_search_service),
            ingest_service_client(),
            ingest_router,
            MetastoreServiceClient::mocked(),
            index_service,
            true,
            false,
        );
        let msearch_payload = r#"
            {"index":"index-1"
            {"query":{"query_string":{"query":"test"}}}
            "#;
        let resp = warp::test::request()
            .path("/_elastic/_msearch")
            .method("POST")
            .body(msearch_payload)
            .reply(&es_search_api_handler)
            .await;
        assert_eq!(resp.status(), 400);
        let es_error: ElasticsearchError = serde_json::from_slice(resp.body()).unwrap();
        assert!(
            es_error
                .error
                .reason
                .unwrap()
                .starts_with("Invalid argument: failed to parse request header")
        );
    }

    #[tokio::test]
    async fn test_msearch_api_return_400_with_malformed_request_body() {
        let config = Arc::new(NodeConfig::for_test());
        let mock_search_service = MockSearchService::new();

        let ingest_router = IngestRouterServiceClient::mocked();
        let index_service =
            IndexService::new(metastore_for_test(), StorageResolver::unconfigured());
        let es_search_api_handler = elastic_api_handlers(
            mock_cluster().await,
            config,
            Arc::new(mock_search_service),
            ingest_service_client(),
            ingest_router,
            MetastoreServiceClient::mocked(),
            index_service,
            true,
            false,
        );
        let msearch_payload = r#"
            {"index":"index-1"}
            {"query":{"query_string":{"bad":"test"}}}
            "#;
        let resp = warp::test::request()
            .path("/_elastic/_msearch")
            .method("POST")
            .body(msearch_payload)
            .reply(&es_search_api_handler)
            .await;
        assert_eq!(resp.status(), 400);
        let es_error: ElasticsearchError = serde_json::from_slice(resp.body()).unwrap();
        assert!(
            es_error
                .error
                .reason
                .unwrap()
                .starts_with("Invalid argument: failed to parse request body")
        );
    }

    #[tokio::test]
    async fn test_msearch_api_return_400_with_only_a_header_request() {
        let config = Arc::new(NodeConfig::for_test());
        let mock_search_service = MockSearchService::new();

        let ingest_router = IngestRouterServiceClient::mocked();
        let index_service =
            IndexService::new(metastore_for_test(), StorageResolver::unconfigured());
        let es_search_api_handler = super::elastic_api_handlers(
            mock_cluster().await,
            config,
            Arc::new(mock_search_service),
            ingest_service_client(),
            ingest_router,
            MetastoreServiceClient::mocked(),
            index_service,
            true,
            false,
        );
        let msearch_payload = r#"
            {"index":"index-1"}
            "#;
        let resp = warp::test::request()
            .path("/_elastic/_msearch")
            .method("POST")
            .body(msearch_payload)
            .reply(&es_search_api_handler)
            .await;
        assert_eq!(resp.status(), 400);
        let es_error: ElasticsearchError = serde_json::from_slice(resp.body()).unwrap();
        assert!(
            es_error
                .error
                .reason
                .unwrap()
                .starts_with("Invalid argument: expect request body after request header")
        );
    }

    #[tokio::test]
    async fn test_msearch_api_return_400_with_no_index() {
        let config = Arc::new(NodeConfig::for_test());
        let mock_search_service = MockSearchService::new();

        let ingest_router = IngestRouterServiceClient::mocked();
        let index_service =
            IndexService::new(metastore_for_test(), StorageResolver::unconfigured());
        let es_search_api_handler = super::elastic_api_handlers(
            mock_cluster().await,
            config,
            Arc::new(mock_search_service),
            ingest_service_client(),
            ingest_router,
            MetastoreServiceClient::mocked(),
            index_service,
            true,
            false,
        );
        let msearch_payload = r#"
            {}
            {"query":{"query_string":{"bad":"test"}}}
            "#;
        let resp = warp::test::request()
            .path("/_elastic/_msearch")
            .method("POST")
            .body(msearch_payload)
            .reply(&es_search_api_handler)
            .await;
        assert_eq!(resp.status(), 400);
        let es_error: ElasticsearchError = serde_json::from_slice(resp.body()).unwrap();
        assert_eq!(
            es_error.error.reason.unwrap(),
            "Invalid argument: `_msearch` request header must define at least one index"
        );
    }

    #[tokio::test]
    async fn test_msearch_api_return_400_with_multiple_indexes() {
        let config = Arc::new(NodeConfig::for_test());
        let mut mock_search_service = MockSearchService::new();
        mock_search_service
            .expect_root_search()
            .returning(|search_request| {
                if search_request.index_id_patterns
                    == vec!["index-1".to_string(), "index-2".to_string()]
                {
                    Ok(Default::default())
                } else {
                    Err(quickwit_search::SearchError::Internal(
                        "something bad happened".to_string(),
                    ))
                }
            });
        let ingest_router = IngestRouterServiceClient::mocked();
        let index_service =
            IndexService::new(metastore_for_test(), StorageResolver::unconfigured());
        let es_search_api_handler = super::elastic_api_handlers(
            mock_cluster().await,
            config,
            Arc::new(mock_search_service),
            ingest_service_client(),
            ingest_router,
            MetastoreServiceClient::mocked(),
            index_service,
            true,
            false,
        );
        let msearch_payload = r#"
            {"index": ["index-1", "index-2"]}
            {"query":{"query_string":{"query":"test"}}}
            "#;
        let resp = warp::test::request()
            .path("/_elastic/_msearch")
            .method("POST")
            .body(msearch_payload)
            .reply(&es_search_api_handler)
            .await;
        assert_eq!(resp.status(), 200);
    }

    #[tokio::test]
    async fn test_es_compat_cluster_info_handler() {
        let build_info = BuildInfo::get();
        let config = Arc::new(NodeConfig::for_test());
        let handler =
            es_compat_cluster_info_handler(config.clone(), build_info).recover(recover_fn);
        let resp = warp::test::request()
            .path("/_elastic")
            .reply(&handler)
            .await;
        assert_eq!(resp.status(), 200);
        let resp_json: JsonValue = serde_json::from_slice(resp.body()).unwrap();
        let expected_response_json = serde_json::json!({
            "name" : config.node_id,
            "cluster_name" : config.cluster_id,
            "version" : {
                "distribution" : "quickwit",
                "number" : "7.17.0",
                "build_hash" : build_info.commit_hash,
                "build_date" : build_info.build_date,
                "build_snapshot" : false,
                "lucene_version" : "8.11.1",
                "minimum_wire_compatibility_version" : "6.8.0",
                "minimum_index_compatibility_version" : "6.0.0-beta1",
            }
        });
        assert_json_include!(actual: resp_json, expected: expected_response_json);
    }

    #[tokio::test]
    async fn test_head_request_on_root_endpoint() {
        let build_info = BuildInfo::get();
        let config = Arc::new(NodeConfig::for_test());
        let handler =
            es_compat_cluster_info_handler(config.clone(), build_info).recover(recover_fn);
        let resp = warp::test::request()
            .path("/_elastic")
            .method("HEAD")
            .reply(&handler)
            .await;
        assert_eq!(resp.status(), 200);
    }
}


================================================
FILE: quickwit/quickwit-serve/src/elasticsearch_api/model/bulk_body.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use quickwit_proto::types::IndexId;
use serde::Deserialize;

#[derive(Clone, Debug, Deserialize, PartialEq)]
#[serde(rename_all(deserialize = "lowercase"))]
pub enum BulkAction {
    Create(BulkActionMeta),
    Index(BulkActionMeta),
}

impl BulkAction {
    pub fn into_index_id(self) -> Option<IndexId> {
        match self {
            BulkAction::Index(meta) => meta.index_id,
            BulkAction::Create(meta) => meta.index_id,
        }
    }

    pub fn into_meta(self) -> BulkActionMeta {
        match self {
            BulkAction::Create(meta) => meta,
            BulkAction::Index(meta) => meta,
        }
    }
}

#[derive(Clone, Debug, Deserialize, PartialEq)]
pub struct BulkActionMeta {
    #[serde(alias = "_index")]
    #[serde(default)]
    pub index_id: Option<IndexId>,
    #[serde(alias = "_id")]
    #[serde(default)]
    pub es_doc_id: Option<String>,
}

#[cfg(test)]
mod tests {
    use crate::elasticsearch_api::model::BulkAction;
    use crate::elasticsearch_api::model::bulk_body::BulkActionMeta;

    #[test]
    fn test_bulk_action_serde() {
        {
            let bulk_action_json = r#"{
                "create": {
                    "_index": "test",
                    "_id" : "2"
                }
            }"#;
            let bulk_action = serde_json::from_str::<BulkAction>(bulk_action_json).unwrap();
            assert_eq!(
                bulk_action,
                BulkAction::Create(BulkActionMeta {
                    index_id: Some("test".to_string()),
                    es_doc_id: Some("2".to_string()),
                })
            );
        }
        {
            let bulk_action_json = r#"{
                "create": {
                    "_index": "test"
                }
            }"#;
            let bulk_action = serde_json::from_str::<BulkAction>(bulk_action_json).unwrap();
            assert_eq!(
                bulk_action,
                BulkAction::Create(BulkActionMeta {
                    index_id: Some("test".to_string()),
                    es_doc_id: None,
                })
            );
        }
        {
            let bulk_action_json = r#"{
                "create": {
                    "_id": "3"
                }
            }"#;
            let bulk_action = serde_json::from_str::<BulkAction>(bulk_action_json).unwrap();
            assert_eq!(
                bulk_action,
                BulkAction::Create(BulkActionMeta {
                    index_id: None,
                    es_doc_id: Some("3".to_string()),
                })
            );
        }
        {
            let bulk_action_json = r#"{
                "delete": {
                    "_index": "test",
                    "_id": "2"
                }
            }"#;
            serde_json::from_str::<BulkAction>(bulk_action_json).unwrap_err();
        }
    }
}


================================================
FILE: quickwit/quickwit-serve/src/elasticsearch_api/model/bulk_query_params.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use quickwit_ingest::CommitType;
use quickwit_proto::ingest::CommitTypeV2;
use serde::Deserialize;

#[derive(Clone, Copy, Debug, Default, Deserialize, PartialEq)]
pub struct ElasticBulkOptions {
    #[serde(default)]
    pub refresh: ElasticRefresh,
    #[serde(default)]
    pub use_legacy_ingest: bool,
}

/// ?refresh parameter for elasticsearch bulk request
///
/// The syntax for this parameter is a bit confusing for backward compatibility reasons.
/// - Absence of ?refresh parameter or ?refresh=false means no refresh
/// - Presence of ?refresh parameter without any values or ?refresh=true means force refresh
/// - ?refresh=wait_for means wait for refresh
#[derive(Clone, Copy, Debug, Deserialize, PartialEq, utoipa::ToSchema)]
#[serde(rename_all(deserialize = "snake_case"))]
#[derive(Default)]
pub enum ElasticRefresh {
    // if the refresh parameter is not present it is false
    #[default]
    /// The request doesn't wait for commit
    False,
    // but if it is present without a value like this: ?refresh, it should be the same as
    // ?refresh=true
    #[serde(alias = "")]
    /// The request forces an immediate commit after the last document in the batch and waits for
    /// it to finish.
    True,
    /// The request will wait for the next scheduled commit to finish.
    WaitFor,
}

impl From<ElasticRefresh> for CommitType {
    fn from(val: ElasticRefresh) -> Self {
        match val {
            ElasticRefresh::False => Self::Auto,
            ElasticRefresh::True => Self::Force,
            ElasticRefresh::WaitFor => Self::WaitFor,
        }
    }
}

impl From<ElasticRefresh> for CommitTypeV2 {
    fn from(val: ElasticRefresh) -> Self {
        match val {
            ElasticRefresh::False => Self::Auto,
            ElasticRefresh::True => Self::Force,
            ElasticRefresh::WaitFor => Self::WaitFor,
        }
    }
}

#[cfg(test)]
mod tests {
    use crate::elasticsearch_api::model::ElasticBulkOptions;
    use crate::elasticsearch_api::model::bulk_query_params::ElasticRefresh;

    #[test]
    fn test_elastic_refresh_parsing() {
        assert_eq!(
            serde_qs::from_str::<ElasticBulkOptions>("")
                .unwrap()
                .refresh,
            ElasticRefresh::False
        );
        assert_eq!(
            serde_qs::from_str::<ElasticBulkOptions>("refresh=true")
                .unwrap()
                .refresh,
            ElasticRefresh::True
        );
        assert_eq!(
            serde_qs::from_str::<ElasticBulkOptions>("refresh=false")
                .unwrap()
                .refresh,
            ElasticRefresh::False
        );
        assert_eq!(
            serde_qs::from_str::<ElasticBulkOptions>("refresh=wait_for")
                .unwrap()
                .refresh,
            ElasticRefresh::WaitFor
        );
        assert_eq!(
            serde_qs::from_str::<ElasticBulkOptions>("refresh")
                .unwrap()
                .refresh,
            ElasticRefresh::True
        );
        assert_eq!(
            serde_qs::from_str::<ElasticBulkOptions>("refresh=wait")
                .unwrap_err()
                .to_string(),
            "unknown variant `wait`, expected one of `false`, ``, `true`, `wait_for`"
        );
    }
}


================================================
FILE: quickwit/quickwit-serve/src/elasticsearch_api/model/cat_indices.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::HashSet;
use std::ops::AddAssign;

use quickwit_metastore::{IndexMetadata, SplitMetadata};
use serde::{Deserialize, Serialize, Serializer};
use warp::hyper::StatusCode;

use super::ElasticsearchError;
use crate::simple_list::{from_simple_list, to_simple_list};

#[serde_with::skip_serializing_none]
#[derive(Default, Debug, Serialize, Deserialize)]
#[serde(deny_unknown_fields)]
pub struct CatIndexQueryParams {
    #[serde(default)]
    /// Only JSON supported for now.
    pub format: Option<String>,
    /// Comma-separated list of column names to display.
    #[serde(serialize_with = "to_simple_list")]
    #[serde(deserialize_with = "from_simple_list")]
    #[serde(default)]
    pub h: Option<Vec<String>>,
    #[serde(default)]
    /// Filter for health: green, yellow, or red
    pub health: Option<Health>,
    /// Unit used to display byte values.
    /// Unsupported for now.
    #[serde(default)]
    pub bytes: Option<String>,
    /// Comma-separated list of column names or column aliases used to sort the response.
    /// Unsupported for now.
    #[serde(serialize_with = "to_simple_list")]
    #[serde(deserialize_with = "from_simple_list")]
    #[serde(default)]
    pub s: Option<Vec<String>>,
    /// If true, the response includes column headings. Defaults to false.
    /// Unsupported for now.
    #[serde(default)]
    pub v: Option<bool>,
}
impl CatIndexQueryParams {
    #[allow(clippy::result_large_err)]
    pub fn validate(&self) -> Result<(), ElasticsearchError> {
        if let Some(format) = &self.format {
            if format.to_lowercase() != "json" {
                return Err(ElasticsearchError::new(
                    StatusCode::BAD_REQUEST,
                    format!("Format {format:?} is not supported. Only format=json is supported."),
                    None,
                ));
            }
        } else {
            return Err(ElasticsearchError::new(
                StatusCode::BAD_REQUEST,
                "Only format=json is supported.".to_string(),
                None,
            ));
        }
        let unsupported_parameter_error = |field: &str| {
            ElasticsearchError::new(
                StatusCode::BAD_REQUEST,
                format!("Parameter {field:?} is not supported."),
                None,
            )
        };
        if self.bytes.is_some() {
            return Err(unsupported_parameter_error("bytes"));
        }
        if self.v.is_some() {
            return Err(unsupported_parameter_error("v"));
        }
        if let Some(sort_by) = &self.s {
            if sort_by.len() > 1 {
                return Err(unsupported_parameter_error("s"));
            }
            if sort_by[0] != "index" && sort_by[0] != "index:asc" {
                return Err(unsupported_parameter_error("s"));
            }
        }
        Ok(())
    }
}

#[derive(Debug, Clone, Default, Serialize)]
pub struct ElasticsearchCatIndexResponse {
    pub health: Health,
    status: Status,
    pub index: String,
    uuid: String,
    pri: String,
    rep: String,
    #[serde(rename = "docs.count", serialize_with = "serialize_u64_as_string")]
    docs_count: u64,
    #[serde(rename = "docs.deleted", serialize_with = "serialize_u64_as_string")]
    docs_deleted: u64,
    #[serde(rename = "store.size", serialize_with = "ser_es_format")]
    store_size: u64,
    #[serde(rename = "pri.store.size", serialize_with = "ser_es_format")]
    pri_store_size: u64,
    #[serde(rename = "dataset.size", serialize_with = "ser_es_format")]
    dataset_size: u64,
}

impl ElasticsearchCatIndexResponse {
    pub fn serialize_filtered(
        &self,
        fields: &Option<Vec<String>>,
    ) -> serde_json::Result<serde_json::Value> {
        let mut value = serde_json::to_value(self)?;

        if let Some(fields) = fields {
            let fields: HashSet<String> = fields.iter().cloned().collect();
            // If fields are specified, retain only those fields
            if let serde_json::Value::Object(ref mut map) = value {
                map.retain(|key, _| fields.contains(key));
            }
        }

        Ok(value)
    }
}
impl AddAssign for ElasticsearchCatIndexResponse {
    fn add_assign(&mut self, rhs: Self) {
        self.health += rhs.health;
        self.status += rhs.status;
        self.docs_count += rhs.docs_count;
        self.docs_deleted += rhs.docs_deleted;
        self.store_size += rhs.store_size;
        self.pri_store_size += rhs.pri_store_size;
        self.dataset_size += rhs.dataset_size;
    }
}

impl From<IndexMetadata> for ElasticsearchCatIndexResponse {
    fn from(index_metadata: IndexMetadata) -> Self {
        ElasticsearchCatIndexResponse {
            uuid: index_metadata.index_uid.to_string(),
            index: index_metadata.index_config.index_id.to_string(),
            pri: "1".to_string(),
            rep: "1".to_string(),
            ..Default::default()
        }
    }
}

impl From<SplitMetadata> for ElasticsearchCatIndexResponse {
    fn from(split_metadata: SplitMetadata) -> Self {
        ElasticsearchCatIndexResponse {
            store_size: split_metadata.as_split_info().file_size_bytes.as_u64(),
            pri_store_size: split_metadata.as_split_info().file_size_bytes.as_u64(),
            dataset_size: split_metadata
                .as_split_info()
                .uncompressed_docs_size_bytes
                .as_u64(),
            uuid: split_metadata.index_uid.to_string(),
            pri: "1".to_string(),
            rep: "1".to_string(),
            docs_count: split_metadata.as_split_info().num_docs as u64,
            ..Default::default()
        }
    }
}

#[derive(Debug, Clone, Default, Serialize)]
pub struct ElasticsearchResolveIndexResponse {
    pub indices: Vec<ElasticsearchResolveIndexEntryResponse>,
    // Unused for the moment.
    pub aliases: Vec<serde_json::Value>,
    pub data_streams: Vec<serde_json::Value>,
}

#[derive(Debug, Clone, Default, Serialize)]
pub struct ElasticsearchResolveIndexEntryResponse {
    pub name: String,
    pub attributes: Vec<Status>,
}

impl From<IndexMetadata> for ElasticsearchResolveIndexEntryResponse {
    fn from(index_metadata: IndexMetadata) -> Self {
        ElasticsearchResolveIndexEntryResponse {
            name: index_metadata.index_config.index_id.to_string(),
            attributes: vec![Status::Open],
        }
    }
}

fn serialize_u64_as_string<S>(value: &u64, serializer: S) -> Result<S::Ok, S::Error>
where S: Serializer {
    serializer.serialize_str(&value.to_string())
}

fn ser_es_format<S>(bytes: &u64, serializer: S) -> Result<S::Ok, S::Error>
where S: Serializer {
    serializer.serialize_str(&format_byte_size(*bytes))
}

fn format_byte_size(bytes: u64) -> String {
    const KILOBYTE: u64 = 1024;
    const MEGABYTE: u64 = KILOBYTE * 1024;
    const GIGABYTE: u64 = MEGABYTE * 1024;
    const TERABYTE: u64 = GIGABYTE * 1024;
    if bytes < KILOBYTE {
        format!("{bytes}b")
    } else if bytes < MEGABYTE {
        format!("{:.1}kb", bytes as f64 / KILOBYTE as f64)
    } else if bytes < GIGABYTE {
        format!("{:.1}mb", bytes as f64 / MEGABYTE as f64)
    } else if bytes < TERABYTE {
        format!("{:.1}gb", bytes as f64 / GIGABYTE as f64)
    } else {
        format!("{:.1}tb", bytes as f64 / TERABYTE as f64)
    }
}

#[derive(Debug, Default, Clone, Copy, Serialize, Deserialize, Eq, PartialEq)]
#[serde(rename_all = "lowercase")]
pub enum Health {
    #[default]
    Green = 1,
    Yellow = 2,
    Red = 3,
}
impl AddAssign for Health {
    fn add_assign(&mut self, other: Self) {
        *self = match std::cmp::max(*self as u8, other as u8) {
            1 => Health::Green,
            2 => Health::Yellow,
            _ => Health::Red,
        };
    }
}

#[derive(Debug, Default, Clone, Copy, Serialize, Deserialize)]
#[serde(rename_all = "lowercase")]
pub enum Status {
    #[default]
    Open = 1,
}
impl AddAssign for Status {
    fn add_assign(&mut self, other: Self) {
        *self = match std::cmp::max(*self as u8, other as u8) {
            1 => Status::Open,
            _ => Status::Open,
        };
    }
}

#[cfg(test)]
mod tests {
    use serde_json::json;

    use super::*;

    #[test]
    fn test_serialize_filtered() {
        let response = ElasticsearchCatIndexResponse {
            health: Health::Green,
            status: Status::Open,
            index: "test_index".to_string(),
            uuid: "test_uuid".to_string(),
            pri: "1".to_string(),
            rep: "2".to_string(),
            docs_count: 100,
            docs_deleted: 10,
            store_size: 1000,
            pri_store_size: 500,
            dataset_size: 1500,
        };

        // Test serialization with all fields
        let all_fields = response.serialize_filtered(&None).unwrap();
        let expected_all_fields = json!({
            "health": "green",
            "status": "open",
            "index": "test_index",
            "uuid": "test_uuid",
            "pri": "1",
            "rep": "2",
            "docs.count": "100",
            "docs.deleted": "10",
            "store.size": "1000b",  // Assuming ser_es_format formats size to kb
            "pri.store.size": "500b", // Example format
            "dataset.size": "1.5kb", // Example format
        });
        assert_eq!(all_fields, expected_all_fields);

        // Test serialization with selected fields
        let selected_fields = response
            .serialize_filtered(&Some(vec!["index".to_string(), "uuid".to_string()]))
            .unwrap();
        let expected_selected_fields = json!({
            "index": "test_index",
            "uuid": "test_uuid"
        });
        assert_eq!(selected_fields, expected_selected_fields);

        // Add more test cases as needed
    }

    #[test]
    fn test_cat_index_query_params_validate_s_parameter() {
        let params = CatIndexQueryParams {
            format: Some("json".to_string()),
            s: Some(vec!["index:asc".to_string()]),
            ..Default::default()
        };
        assert!(params.validate().is_ok());

        let params = CatIndexQueryParams {
            format: Some("json".to_string()),
            s: Some(vec!["index".to_string()]),
            ..Default::default()
        };
        assert!(params.validate().is_ok());

        let params = CatIndexQueryParams {
            format: Some("json".to_string()),
            s: Some(vec!["index:desc".to_string()]),
            ..Default::default()
        };
        assert!(params.validate().is_err());

        let params = CatIndexQueryParams {
            format: Some("json".to_string()),
            s: Some(vec!["index:asc".to_string(), "docs.count".to_string()]),
            ..Default::default()
        };
        assert!(params.validate().is_err());

        let params = CatIndexQueryParams {
            format: Some("json".to_string()),
            s: None,
            ..Default::default()
        };
        assert!(params.validate().is_ok());
    }
}


================================================
FILE: quickwit/quickwit-serve/src/elasticsearch_api/model/error.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use elasticsearch_dsl::search::ErrorCause;
use quickwit_common::{rate_limited_debug, rate_limited_error};
use quickwit_index_management::IndexServiceError;
use quickwit_ingest::IngestServiceError;
use quickwit_proto::ServiceError;
use quickwit_proto::ingest::IngestV2Error;
use quickwit_search::SearchError;
use serde::{Deserialize, Serialize};
use warp::hyper::StatusCode;

#[derive(Debug, Clone, Serialize, Deserialize)]
pub struct ElasticsearchError {
    #[serde(with = "http_serde::status_code")]
    pub status: StatusCode,
    pub error: ErrorCause,
}

impl ElasticsearchError {
    pub fn new(
        status: StatusCode,
        reason: String,
        exception_opt: Option<ElasticException>,
    ) -> Self {
        if status.is_server_error() {
            rate_limited_error!(limit_per_min=10, status=%status, "http request failed with server error: {reason}");
        } else if !status.is_success() {
            rate_limited_debug!(limit_per_min=10, status=%status, "http request failed: {reason}");
        }
        ElasticsearchError {
            status,
            error: ErrorCause {
                reason: Some(reason),
                caused_by: None,
                root_cause: Vec::new(),
                stack_trace: None,
                suppressed: Vec::new(),
                ty: exception_opt.map(|exception| exception.as_str().to_string()),
                additional_details: Default::default(),
            },
        }
    }
}

impl From<SearchError> for ElasticsearchError {
    fn from(search_error: SearchError) -> Self {
        let status = search_error.error_code().http_status_code();
        // Fill only reason field to keep it simple.
        let reason = ErrorCause {
            reason: Some(search_error.to_string()),
            caused_by: None,
            root_cause: Vec::new(),
            stack_trace: None,
            suppressed: Vec::new(),
            ty: None,
            additional_details: Default::default(),
        };
        ElasticsearchError {
            status,
            error: reason,
        }
    }
}

impl From<IngestServiceError> for ElasticsearchError {
    fn from(ingest_service_error: IngestServiceError) -> Self {
        let status = ingest_service_error.error_code().http_status_code();

        let reason = ErrorCause {
            reason: Some(ingest_service_error.to_string()),
            caused_by: None,
            root_cause: Vec::new(),
            stack_trace: None,
            suppressed: Vec::new(),
            ty: None,
            additional_details: Default::default(),
        };
        ElasticsearchError {
            status,
            error: reason,
        }
    }
}

impl From<IngestV2Error> for ElasticsearchError {
    fn from(ingest_error: IngestV2Error) -> Self {
        let status = ingest_error.error_code().http_status_code();

        let reason = ErrorCause {
            reason: Some(ingest_error.to_string()),
            caused_by: None,
            root_cause: Vec::new(),
            stack_trace: None,
            suppressed: Vec::new(),
            ty: None,
            additional_details: Default::default(),
        };
        ElasticsearchError {
            status,
            error: reason,
        }
    }
}

impl From<IndexServiceError> for ElasticsearchError {
    fn from(ingest_error: IndexServiceError) -> Self {
        let status = ingest_error.error_code().http_status_code();

        let reason = ErrorCause {
            reason: Some(ingest_error.to_string()),
            caused_by: None,
            root_cause: Vec::new(),
            stack_trace: None,
            suppressed: Vec::new(),
            ty: None,
            additional_details: Default::default(),
        };
        ElasticsearchError {
            status,
            error: reason,
        }
    }
}

#[derive(Debug, Clone, Copy, Eq, PartialEq, Serialize, Deserialize)]
pub enum ElasticException {
    #[serde(rename = "action_request_validation_exception")]
    ActionRequestValidation,
    #[serde(rename = "document_parsing_exception")]
    DocumentParsing,
    // This is an exception proper to Quickwit.
    #[serde(rename = "internal_exception")]
    Internal,
    #[serde(rename = "illegal_argument_exception")]
    IllegalArgument,
    #[serde(rename = "index_not_found_exception")]
    IndexNotFound,
    // This is an exception proper to Quickwit.
    #[serde(rename = "rate_limited_exception")]
    RateLimited,
    // This is an exception proper to Quickwit.
    #[serde(rename = "source_not_found_exception")]
    SourceNotFound,
    #[serde(rename = "timeout_exception")]
    Timeout,
}

impl ElasticException {
    pub fn as_str(&self) -> &'static str {
        match self {
            Self::ActionRequestValidation => "action_request_validation_exception",
            Self::DocumentParsing => "document_parsing_exception",
            Self::Internal => "internal_exception",
            Self::RateLimited => "rate_limited_exception",
            Self::IllegalArgument => "illegal_argument_exception",
            Self::IndexNotFound => "index_not_found_exception",
            Self::SourceNotFound => "source_not_found_exception",
            Self::Timeout => "timeout_exception",
        }
    }
}


================================================
FILE: quickwit/quickwit-serve/src/elasticsearch_api/model/field_capability.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::HashMap;

use quickwit_proto::search::{ListFieldType, ListFieldsEntryResponse, ListFieldsResponse};
use quickwit_query::ElasticQueryDsl;
use quickwit_query::query_ast::QueryAst;
use serde::{Deserialize, Serialize};
use warp::hyper::StatusCode;

use super::ElasticsearchError;
use super::search_query_params::*;
use crate::simple_list::{from_simple_list, to_simple_list};

#[serde_with::skip_serializing_none]
#[derive(Default, Debug, Serialize, Deserialize)]
#[serde(deny_unknown_fields)]
pub struct FieldCapabilityQueryParams {
    #[serde(default)]
    pub allow_no_indices: Option<bool>,
    #[serde(serialize_with = "to_simple_list")]
    #[serde(deserialize_with = "from_simple_list")]
    #[serde(default)]
    pub expand_wildcards: Option<Vec<ExpandWildcards>>,
    #[serde(serialize_with = "to_simple_list")]
    #[serde(deserialize_with = "from_simple_list")]
    #[serde(default)]
    pub fields: Option<Vec<String>>,
    #[serde(default)]
    pub ignore_unavailable: Option<bool>,
    /// Non-ES Parameter. If set, restricts splits to documents with a `time_range.start >=
    /// start_timestamp`.
    pub start_timestamp: Option<i64>,
    /// Non-ES Parameter. If set, restricts splits to documents with a `time_range.end <
    /// end_timestamp``.
    pub end_timestamp: Option<i64>,
}

#[derive(Debug, Default, Clone, Deserialize, PartialEq)]
#[serde(deny_unknown_fields)]
pub struct FieldCapabilityRequestBody {
    #[serde(default)]
    // unsupported currently
    pub index_filter: serde_json::Value,
    #[serde(default)]
    // unsupported currently
    pub runtime_mappings: serde_json::Value,
}

#[derive(Serialize, Deserialize, Debug)]
pub struct FieldCapabilityResponse {
    indices: Vec<String>,
    fields: HashMap<String, FieldCapabilityFieldTypesResponse>,
}

type FieldCapabilityFieldTypesResponse =
    HashMap<FieldCapabilityEntryType, FieldCapabilityEntryResponse>;

#[derive(Serialize, Deserialize, Debug, Clone, Eq, PartialEq, Hash)]
enum FieldCapabilityEntryType {
    #[serde(rename = "long")]
    Long,
    #[serde(rename = "keyword")]
    Keyword,
    #[serde(rename = "text")]
    Text,
    #[serde(rename = "date_nanos")]
    DateNanos,
    #[serde(rename = "binary")]
    Binary,
    #[serde(rename = "double")]
    Double,
    #[serde(rename = "boolean")]
    Boolean,
    #[serde(rename = "ip")]
    Ip,
    // Unmapped currently
    #[serde(rename = "nested")]
    Nested,
    // Unmapped currently
    #[serde(rename = "object")]
    Object,
}

#[derive(Serialize, Deserialize, Debug, Clone)]
struct FieldCapabilityEntryResponse {
    metadata_field: bool, // Always false
    searchable: bool,
    aggregatable: bool,
    // Option since it is filled later
    #[serde(rename = "type")]
    typ: Option<FieldCapabilityEntryType>,
    #[serde(skip_serializing_if = "Vec::is_empty")]
    indices: Vec<String>, // [ "index1", "index2" ],
    #[serde(skip_serializing_if = "Vec::is_empty")]
    non_aggregatable_indices: Vec<String>, // [ "index1" ]
    #[serde(skip_serializing_if = "Vec::is_empty")]
    non_searchable_indices: Vec<String>, // [ "index1" ]
}
impl FieldCapabilityEntryResponse {
    fn from_list_field_entry_response(entry: ListFieldsEntryResponse) -> Self {
        Self {
            metadata_field: false,
            searchable: entry.searchable,
            aggregatable: entry.aggregatable,
            typ: None,
            indices: entry.index_ids.clone(),
            non_aggregatable_indices: entry.non_aggregatable_index_ids,
            non_searchable_indices: entry.non_searchable_index_ids,
        }
    }
}

pub fn convert_to_es_field_capabilities_response(
    resp: ListFieldsResponse,
) -> FieldCapabilityResponse {
    let mut indices = resp
        .fields
        .iter()
        .flat_map(|entry| entry.index_ids.iter().cloned())
        .collect::<Vec<_>>();
    indices.sort();
    indices.dedup();

    let mut fields: HashMap<String, FieldCapabilityFieldTypesResponse> = HashMap::new();
    for list_field_resp in resp.fields {
        let entry = fields
            .entry(list_field_resp.field_name.to_string())
            .or_default();

        let field_type = ListFieldType::try_from(list_field_resp.field_type).unwrap();
        let add_entry =
            FieldCapabilityEntryResponse::from_list_field_entry_response(list_field_resp);
        let types = match field_type {
            ListFieldType::Str => {
                vec![
                    FieldCapabilityEntryType::Keyword,
                    FieldCapabilityEntryType::Text,
                ]
            }
            ListFieldType::U64 => vec![FieldCapabilityEntryType::Long],
            ListFieldType::I64 => vec![FieldCapabilityEntryType::Long],
            ListFieldType::F64 => vec![FieldCapabilityEntryType::Double],
            ListFieldType::Bool => vec![FieldCapabilityEntryType::Boolean],
            ListFieldType::Date => vec![FieldCapabilityEntryType::DateNanos],
            ListFieldType::Facet => continue,
            ListFieldType::Json => continue,
            ListFieldType::Bytes => vec![FieldCapabilityEntryType::Binary],
            ListFieldType::IpAddr => vec![FieldCapabilityEntryType::Ip],
        };
        for field_type in types {
            let mut add_entry = add_entry.clone();
            add_entry.typ = Some(field_type.clone());

            // If the field exists in all indices, we omit field.indices in the response.
            let exists_in_all_indices = add_entry.indices.len() == indices.len();
            if exists_in_all_indices {
                add_entry.indices = Vec::new();
            }

            entry.insert(field_type, add_entry);
        }
    }
    FieldCapabilityResponse { indices, fields }
}

/// Parses an Elasticsearch index_filter JSON value into a Quickwit QueryAst.
///
/// Returns `Ok(None)` if the index_filter is null.
/// Returns `Ok(Some(QueryAst))` if the index_filter is valid.
/// Returns `Err` if the index_filter is invalid or cannot be converted (including empty object).
#[allow(clippy::result_large_err)]
pub fn parse_index_filter_to_query_ast(
    index_filter: serde_json::Value,
) -> Result<Option<QueryAst>, ElasticsearchError> {
    if index_filter.is_null() {
        return Ok(None);
    }

    // Parse ES Query DSL to internal QueryAst
    let elastic_query_dsl: ElasticQueryDsl =
        serde_json::from_value(index_filter).map_err(|err| {
            ElasticsearchError::new(
                StatusCode::BAD_REQUEST,
                format!("Invalid index_filter: {err}"),
                None,
            )
        })?;

    let query_ast: QueryAst = elastic_query_dsl.try_into().map_err(|err: anyhow::Error| {
        ElasticsearchError::new(
            StatusCode::BAD_REQUEST,
            format!("Failed to convert index_filter: {err}"),
            None,
        )
    })?;

    Ok(Some(query_ast))
}

#[allow(clippy::result_large_err)]
pub fn build_list_field_request_for_es_api(
    index_id_patterns: Vec<String>,
    search_params: FieldCapabilityQueryParams,
    search_body: FieldCapabilityRequestBody,
) -> Result<quickwit_proto::search::ListFieldsRequest, ElasticsearchError> {
    let query_ast = parse_index_filter_to_query_ast(search_body.index_filter)?;
    let query_ast_json = query_ast
        .map(|ast| serde_json::to_string(&ast).expect("QueryAst should be JSON serializable"));

    Ok(quickwit_proto::search::ListFieldsRequest {
        index_id_patterns,
        fields: search_params.fields.unwrap_or_default(),
        start_timestamp: search_params.start_timestamp,
        end_timestamp: search_params.end_timestamp,
        query_ast: query_ast_json,
    })
}

#[cfg(test)]
mod tests {
    use serde_json::json;

    use super::*;

    #[test]
    fn test_build_list_field_request_empty_index_filter() {
        let result = build_list_field_request_for_es_api(
            vec!["test_index".to_string()],
            FieldCapabilityQueryParams::default(),
            FieldCapabilityRequestBody::default(),
        )
        .unwrap();

        assert_eq!(result.index_id_patterns, vec!["test_index".to_string()]);
        assert!(result.query_ast.is_none());
    }

    #[test]
    fn test_build_list_field_request_with_term_index_filter() {
        let search_body = FieldCapabilityRequestBody {
            index_filter: json!({
                "term": {
                    "status": "active"
                }
            }),
            runtime_mappings: serde_json::Value::Null,
        };

        let result = build_list_field_request_for_es_api(
            vec!["test_index".to_string()],
            FieldCapabilityQueryParams::default(),
            search_body,
        )
        .unwrap();

        assert_eq!(result.index_id_patterns, vec!["test_index".to_string()]);
        assert!(result.query_ast.is_some());

        // Verify the query_ast is valid JSON
        let query_ast: serde_json::Value =
            serde_json::from_str(&result.query_ast.unwrap()).unwrap();
        assert!(query_ast.is_object());
    }

    #[test]
    fn test_build_list_field_request_with_bool_index_filter() {
        let search_body = FieldCapabilityRequestBody {
            index_filter: json!({
                "bool": {
                    "must": [
                        { "term": { "status": "active" } }
                    ],
                    "filter": [
                        { "range": { "age": { "gte": 18 } } }
                    ]
                }
            }),
            runtime_mappings: serde_json::Value::Null,
        };

        let result = build_list_field_request_for_es_api(
            vec!["test_index".to_string()],
            FieldCapabilityQueryParams::default(),
            search_body,
        )
        .unwrap();

        assert!(result.query_ast.is_some());
    }

    #[test]
    fn test_build_list_field_request_with_invalid_index_filter() {
        let search_body = FieldCapabilityRequestBody {
            index_filter: json!({
                "invalid_query_type": {
                    "field": "value"
                }
            }),
            runtime_mappings: serde_json::Value::Null,
        };

        let result = build_list_field_request_for_es_api(
            vec!["test_index".to_string()],
            FieldCapabilityQueryParams::default(),
            search_body,
        );

        assert!(result.is_err());
        let err = result.unwrap_err();
        assert_eq!(err.status, StatusCode::BAD_REQUEST);
    }

    #[test]
    fn test_build_list_field_request_with_null_index_filter() {
        let search_body = FieldCapabilityRequestBody {
            index_filter: serde_json::Value::Null,
            runtime_mappings: serde_json::Value::Null,
        };

        let result = build_list_field_request_for_es_api(
            vec!["test_index".to_string()],
            FieldCapabilityQueryParams::default(),
            search_body,
        )
        .unwrap();

        assert!(result.query_ast.is_none());
    }

    #[test]
    fn test_build_list_field_request_preserves_other_params() {
        let search_params = FieldCapabilityQueryParams {
            fields: Some(vec!["field1".to_string(), "field2".to_string()]),
            start_timestamp: Some(1000),
            end_timestamp: Some(2000),
            ..Default::default()
        };

        let search_body = FieldCapabilityRequestBody {
            index_filter: json!({ "match_all": {} }),
            runtime_mappings: serde_json::Value::Null,
        };

        let result = build_list_field_request_for_es_api(
            vec!["test_index".to_string()],
            search_params,
            search_body,
        )
        .unwrap();

        assert_eq!(
            result.fields,
            vec!["field1".to_string(), "field2".to_string()]
        );
        assert_eq!(result.start_timestamp, Some(1000));
        assert_eq!(result.end_timestamp, Some(2000));
        assert!(result.query_ast.is_some());
    }

    #[test]
    fn test_parse_index_filter_to_query_ast_null() {
        let result = parse_index_filter_to_query_ast(serde_json::Value::Null).unwrap();
        assert!(result.is_none());
    }

    #[test]
    fn test_parse_index_filter_to_query_ast_empty_object() {
        // Empty object {} should return error to match ES behavior
        let result = parse_index_filter_to_query_ast(json!({}));
        assert!(result.is_err());
    }

    #[test]
    fn test_parse_index_filter_to_query_ast_valid_term() {
        let result = parse_index_filter_to_query_ast(json!({
            "term": { "status": "active" }
        }))
        .unwrap();
        assert!(result.is_some());
    }

    #[test]
    fn test_parse_index_filter_to_query_ast_invalid() {
        let result = parse_index_filter_to_query_ast(json!({
            "invalid_query_type": { "field": "value" }
        }));
        assert!(result.is_err());
    }
}


================================================
FILE: quickwit/quickwit-serve/src/elasticsearch_api/model/mappings.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::HashMap;

use quickwit_doc_mapper::{FieldMappingEntry, FieldMappingType};
use quickwit_metastore::IndexMetadata;
use quickwit_proto::search::{ListFieldType, ListFieldsResponse};
use serde::ser::SerializeMap;
use serde::{Serialize, Serializer};

/// Top-level response for `GET /{index}/_mapping(s)`.
///
/// Serializes as `{ "<index_id>": { "mappings": { "properties": { ... } } } }`.
pub(crate) struct ElasticsearchMappingsResponse {
    indices: HashMap<String, IndexMappings>,
}

impl Serialize for ElasticsearchMappingsResponse {
    fn serialize<S: Serializer>(&self, serializer: S) -> Result<S::Ok, S::Error> {
        let mut map = serializer.serialize_map(Some(self.indices.len()))?;
        for (index_id, mappings) in &self.indices {
            map.serialize_entry(index_id, mappings)?;
        }
        map.end()
    }
}

#[derive(Debug, Serialize)]
struct IndexMappings {
    mappings: MappingProperties,
}

#[derive(Debug, Serialize)]
struct MappingProperties {
    properties: HashMap<String, FieldMapping>,
}

#[derive(Debug, Serialize)]
#[serde(untagged)]
enum FieldMapping {
    Leaf {
        #[serde(rename = "type")]
        typ: &'static str,
    },
    Object {
        #[serde(rename = "type")]
        typ: &'static str,
        properties: HashMap<String, FieldMapping>,
    },
}

impl ElasticsearchMappingsResponse {
    pub fn from_doc_mapping(
        indexes_metadata: Vec<IndexMetadata>,
        list_fields_response: Option<&ListFieldsResponse>,
    ) -> Self {
        let indices = indexes_metadata
            .into_iter()
            .map(|index_metadata| {
                let field_mappings = &index_metadata.index_config.doc_mapping.field_mappings;
                let mut properties = build_properties(field_mappings);
                if let Some(list_fields) = list_fields_response {
                    merge_dynamic_fields(&mut properties, list_fields);
                }
                let index_id = index_metadata.index_id().to_string();
                (
                    index_id,
                    IndexMappings {
                        mappings: MappingProperties { properties },
                    },
                )
            })
            .collect();
        Self { indices }
    }
}

fn build_properties(field_mappings: &[FieldMappingEntry]) -> HashMap<String, FieldMapping> {
    let mut properties = HashMap::with_capacity(field_mappings.len());
    for entry in field_mappings {
        if let Some(field_mapping) = field_mapping_from_entry(entry) {
            properties.insert(entry.name.clone(), field_mapping);
        }
    }
    properties
}

fn field_mapping_from_entry(entry: &FieldMappingEntry) -> Option<FieldMapping> {
    match &entry.mapping_type {
        // Quickwit text fields behave like ES keyword fields: they support exact
        // match, prefix, and regexp queries. Reporting them as "keyword" enables
        // downstream connectors (e.g. Trino ES connector) to push down filters and
        // LIKE predicates, which they only do for keyword-typed fields.
        FieldMappingType::Text(..) => Some(FieldMapping::Leaf { typ: "keyword" }),
        FieldMappingType::I64(..) => Some(FieldMapping::Leaf { typ: "long" }),
        FieldMappingType::U64(..) => Some(FieldMapping::Leaf { typ: "long" }),
        FieldMappingType::F64(..) => Some(FieldMapping::Leaf { typ: "double" }),
        FieldMappingType::Bool(..) => Some(FieldMapping::Leaf { typ: "boolean" }),
        FieldMappingType::DateTime(..) => Some(FieldMapping::Leaf { typ: "date" }),
        FieldMappingType::IpAddr(..) => Some(FieldMapping::Leaf { typ: "ip" }),
        FieldMappingType::Bytes(..) => Some(FieldMapping::Leaf { typ: "binary" }),
        FieldMappingType::Json(..) => Some(FieldMapping::Leaf { typ: "object" }),
        FieldMappingType::Object(options) => {
            let properties = build_properties(&options.field_mappings);
            Some(FieldMapping::Object {
                typ: "object",
                properties,
            })
        }
        FieldMappingType::Concatenate(_) => Some(FieldMapping::Leaf { typ: "keyword" }),
    }
}

/// Merges dynamic fields from a `ListFieldsResponse` into the properties map.
///
/// Fields already present in the map (from explicit doc mappings) are skipped,
/// as are internal fields (prefixed with `_`).
fn merge_dynamic_fields(
    properties: &mut HashMap<String, FieldMapping>,
    list_fields_response: &ListFieldsResponse,
) {
    for field_entry in &list_fields_response.fields {
        let field_name = &field_entry.field_name;
        if field_name.starts_with('_') {
            continue;
        }
        if properties.contains_key(field_name) {
            continue;
        }
        let Ok(field_type) = ListFieldType::try_from(field_entry.field_type) else {
            continue;
        };
        if let Some(es_type) = es_type_from_list_field_type(field_type) {
            properties.insert(field_name.clone(), FieldMapping::Leaf { typ: es_type });
        }
    }
}

fn es_type_from_list_field_type(field_type: ListFieldType) -> Option<&'static str> {
    match field_type {
        ListFieldType::Str => Some("keyword"),
        ListFieldType::U64 | ListFieldType::I64 => Some("long"),
        ListFieldType::F64 => Some("double"),
        ListFieldType::Bool => Some("boolean"),
        ListFieldType::Date => Some("date"),
        ListFieldType::Bytes => Some("binary"),
        ListFieldType::IpAddr => Some("ip"),
        ListFieldType::Facet | ListFieldType::Json => None,
    }
}

#[cfg(test)]
mod tests {
    use serde_json::json;

    use super::*;

    #[test]
    fn test_field_mapping_from_entry_bool() {
        let entry_json = json!({ "name": "active", "type": "bool" });
        let entry: FieldMappingEntry = serde_json::from_value(entry_json).unwrap();
        let mapping = field_mapping_from_entry(&entry).unwrap();
        let serialized = serde_json::to_value(&mapping).unwrap();
        assert_eq!(serialized, json!({ "type": "boolean" }));
    }

    #[test]
    fn test_field_mapping_from_entry_text() {
        let entry_json = json!({ "name": "message", "type": "text" });
        let entry: FieldMappingEntry = serde_json::from_value(entry_json).unwrap();
        let mapping = field_mapping_from_entry(&entry).unwrap();
        let serialized = serde_json::to_value(&mapping).unwrap();
        assert_eq!(serialized, json!({ "type": "keyword" }));
    }

    #[test]
    fn test_field_mapping_from_entry_i64() {
        let entry_json = json!({ "name": "count", "type": "i64" });
        let entry: FieldMappingEntry = serde_json::from_value(entry_json).unwrap();
        let mapping = field_mapping_from_entry(&entry).unwrap();
        let serialized = serde_json::to_value(&mapping).unwrap();
        assert_eq!(serialized, json!({ "type": "long" }));
    }

    #[test]
    fn test_field_mapping_from_entry_object() {
        let entry_json = json!({
            "name": "nested",
            "type": "object",
            "field_mappings": [
                { "name": "id", "type": "u64" },
                { "name": "label", "type": "text" }
            ]
        });
        let entry: FieldMappingEntry = serde_json::from_value(entry_json).unwrap();
        let mapping = field_mapping_from_entry(&entry).unwrap();
        let serialized = serde_json::to_value(&mapping).unwrap();
        assert_eq!(
            serialized,
            json!({
                "type": "object",
                "properties": {
                    "id": { "type": "long" },
                    "label": { "type": "keyword" }
                }
            })
        );
    }

    #[test]
    fn test_field_mapping_from_entry_concatenate_exposed_as_keyword() {
        let entry_json = json!({
            "name": "concat_field",
            "type": "concatenate",
            "concatenate_fields": ["field_a", "field_b"]
        });
        let entry: FieldMappingEntry = serde_json::from_value(entry_json).unwrap();
        let mapping = field_mapping_from_entry(&entry).unwrap();
        let serialized = serde_json::to_value(&mapping).unwrap();
        assert_eq!(serialized, json!({ "type": "keyword" }));
    }

    #[test]
    fn test_build_properties_all_leaf_types() {
        let entries: Vec<FieldMappingEntry> = serde_json::from_value(json!([
            { "name": "title", "type": "text" },
            { "name": "count", "type": "i64" },
            { "name": "unsigned", "type": "u64" },
            { "name": "score", "type": "f64" },
            { "name": "active", "type": "bool" },
            { "name": "created_at", "type": "datetime" },
            { "name": "ip_field", "type": "ip" },
            { "name": "data", "type": "bytes" },
            { "name": "payload", "type": "json" },
            {
                "name": "metadata",
                "type": "object",
                "field_mappings": [
                    { "name": "source", "type": "text" }
                ]
            }
        ]))
        .unwrap();

        let props = build_properties(&entries);
        let to_json = |fm: &FieldMapping| serde_json::to_value(fm).unwrap();

        assert_eq!(to_json(&props["title"]), json!({ "type": "keyword" }));
        assert_eq!(to_json(&props["count"]), json!({ "type": "long" }));
        assert_eq!(to_json(&props["unsigned"]), json!({ "type": "long" }));
        assert_eq!(to_json(&props["score"]), json!({ "type": "double" }));
        assert_eq!(to_json(&props["active"]), json!({ "type": "boolean" }));
        assert_eq!(to_json(&props["created_at"]), json!({ "type": "date" }));
        assert_eq!(to_json(&props["ip_field"]), json!({ "type": "ip" }));
        assert_eq!(to_json(&props["data"]), json!({ "type": "binary" }));
        assert_eq!(to_json(&props["payload"]), json!({ "type": "object" }));

        let meta = to_json(&props["metadata"]);
        assert_eq!(meta["type"], "object");
        assert_eq!(meta["properties"]["source"]["type"], "keyword");
    }

    #[test]
    fn test_merge_dynamic_fields_skips_existing_and_internal() {
        use quickwit_proto::search::ListFieldsEntryResponse;

        let mut properties = HashMap::new();
        properties.insert("title".to_string(), FieldMapping::Leaf { typ: "text" });

        let list_fields = ListFieldsResponse {
            fields: vec![
                ListFieldsEntryResponse {
                    field_name: "title".to_string(),
                    field_type: ListFieldType::Str as i32,
                    ..Default::default()
                },
                ListFieldsEntryResponse {
                    field_name: "_timestamp".to_string(),
                    field_type: ListFieldType::Date as i32,
                    ..Default::default()
                },
                ListFieldsEntryResponse {
                    field_name: "dynamic_field".to_string(),
                    field_type: ListFieldType::Str as i32,
                    ..Default::default()
                },
            ],
        };

        merge_dynamic_fields(&mut properties, &list_fields);

        assert_eq!(properties.len(), 2);
        assert!(properties.contains_key("title"));
        assert!(properties.contains_key("dynamic_field"));
        assert!(!properties.contains_key("_timestamp"));
    }
}


================================================
FILE: quickwit/quickwit-serve/src/elasticsearch_api/model/mod.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

mod bulk_body;
mod bulk_query_params;
mod cat_indices;
mod error;
mod field_capability;
mod mappings;
mod multi_search;
mod scroll;
mod search_body;
mod search_query_params;
mod search_response;
mod stats;

pub use bulk_body::BulkAction;
pub use bulk_query_params::ElasticBulkOptions;
pub use cat_indices::{
    CatIndexQueryParams, ElasticsearchCatIndexResponse, ElasticsearchResolveIndexEntryResponse,
    ElasticsearchResolveIndexResponse,
};
pub use error::{ElasticException, ElasticsearchError};
pub use field_capability::{
    FieldCapabilityQueryParams, FieldCapabilityRequestBody, FieldCapabilityResponse,
    build_list_field_request_for_es_api, convert_to_es_field_capabilities_response,
};
pub(crate) use mappings::ElasticsearchMappingsResponse;
pub use multi_search::{
    MultiSearchHeader, MultiSearchQueryParams, MultiSearchResponse, MultiSearchSingleResponse,
};
use quickwit_proto::search::{SortDatetimeFormat, SortOrder};
pub use scroll::ScrollQueryParams;
pub use search_body::SearchBody;
pub use search_query_params::{DeleteQueryParams, SearchQueryParams, SearchQueryParamsCount};
pub use search_response::ElasticsearchResponse;
use serde::{Deserialize, Serialize};
pub use stats::{ElasticsearchStatsResponse, StatsResponseEntry};

#[derive(Debug, Clone, Eq, PartialEq)]
pub struct SortField {
    pub field: String,
    pub order: SortOrder,
    pub date_format: Option<ElasticDateFormat>,
}

#[derive(Debug, Clone, PartialEq, Eq, Serialize, Deserialize)]
#[serde(rename_all = "snake_case")]
pub enum ElasticDateFormat {
    /// Sort values are in milliseconds by default to ease migration from ES.
    /// We allow the user to specify nanoseconds if needed.
    /// We add `Int` to the name to avoid confusion ES variant `EpochMillis` which,
    /// returns milliseconds as strings.
    EpochNanosInt,
}

impl From<ElasticDateFormat> for SortDatetimeFormat {
    fn from(date_format: ElasticDateFormat) -> Self {
        match date_format {
            ElasticDateFormat::EpochNanosInt => SortDatetimeFormat::UnixTimestampNanos,
        }
    }
}

pub(crate) fn default_elasticsearch_sort_order(field_name: &str) -> SortOrder {
    if field_name == "_score" {
        SortOrder::Desc
    } else {
        SortOrder::Asc
    }
}


================================================
FILE: quickwit/quickwit-serve/src/elasticsearch_api/model/multi_search.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use elasticsearch_dsl::ErrorCause;
use serde::{Deserialize, Serialize};
use serde_with::formats::PreferMany;
use serde_with::{OneOrMany, serde_as};
use warp::hyper::StatusCode;

use super::ElasticsearchError;
use super::search_query_params::ExpandWildcards;
use super::search_response::ElasticsearchResponse;
use crate::simple_list::{from_simple_list, to_simple_list};

// Multi search doc: https://www.elastic.co/guide/en/elasticsearch/reference/current/search-multi-search.html

#[serde_as]
#[serde_with::skip_serializing_none]
#[derive(Default, Debug, Serialize, Deserialize)]
#[serde(deny_unknown_fields)]
pub struct MultiSearchQueryParams {
    #[serde(default)]
    pub allow_no_indices: Option<bool>,
    #[serde(default)]
    pub ccs_minimize_roundtrips: Option<bool>,
    #[serde(serialize_with = "to_simple_list")]
    #[serde(deserialize_with = "from_simple_list")]
    #[serde(default)]
    pub expand_wildcards: Option<Vec<ExpandWildcards>>,
    #[serde(serialize_with = "to_simple_list")]
    #[serde(deserialize_with = "from_simple_list")]
    #[serde(default)]
    /// Additional filters to be applied to the query.
    /// Useful for permissions and other use cases.
    /// This is not part of the official Elasticsearch API.
    ///
    /// This will set extra_filters on the search request.
    pub extra_filters: Option<Vec<String>>,
    #[serde(default)]
    pub ignore_throttled: Option<bool>,
    #[serde(default)]
    pub ignore_unavailable: Option<bool>,
    /// List of indexes to search.
    #[serde_as(deserialize_as = "OneOrMany<_, PreferMany>")]
    #[serde(default, rename = "index")]
    pub indexes: Vec<String>,
    #[serde(default)]
    pub max_concurrent_searches: Option<u64>,
    #[serde(default)]
    pub max_concurrent_shard_requests: Option<i64>,
    #[serde(default)]
    pub pre_filter_shard_size: Option<i64>,
    #[serde(default)]
    pub rest_total_hits_as_int: Option<bool>,
    #[serde(serialize_with = "to_simple_list")]
    #[serde(deserialize_with = "from_simple_list")]
    #[serde(default)]
    pub routing: Option<Vec<String>>,
    #[serde(serialize_with = "to_simple_list")]
    #[serde(deserialize_with = "from_simple_list")]
    #[serde(default)]
    /// This is not part of the official Elasticsearch API.
    /// This will set source_excludes on the search request.
    pub _source_excludes: Option<Vec<String>>,
    #[serde(serialize_with = "to_simple_list")]
    #[serde(deserialize_with = "from_simple_list")]
    #[serde(default)]
    /// This is not part of the official Elasticsearch API.
    /// This will set source_includes on the search request.
    pub _source_includes: Option<Vec<String>>,
    #[serde(default)]
    pub typed_keys: Option<bool>,
}

#[serde_as]
#[serde_with::skip_serializing_none]
#[derive(Default, Debug, Serialize, Deserialize)]
#[serde(deny_unknown_fields)]
pub struct MultiSearchHeader {
    #[serde(default)]
    pub allow_no_indices: Option<bool>,
    #[serde(default)]
    pub expand_wildcards: Option<Vec<ExpandWildcards>>,
    #[serde(default)]
    pub ignore_unavailable: Option<bool>,
    #[serde_as(deserialize_as = "OneOrMany<_, PreferMany>")]
    #[serde(default, rename = "index")]
    pub indexes: Vec<String>,
    #[serde(default)]
    pub preference: Option<String>,
    #[serde(default)]
    pub request_cache: Option<bool>,
    #[serde(default)]
    pub routing: Option<Vec<String>>,
}

impl MultiSearchHeader {
    pub fn apply_query_param_defaults(&mut self, defaults: &MultiSearchQueryParams) {
        if self.allow_no_indices.is_none() {
            self.allow_no_indices = defaults.allow_no_indices;
        }
        if self.expand_wildcards.is_none() {
            self.expand_wildcards = defaults.expand_wildcards.clone();
        }
        if self.ignore_unavailable.is_none() {
            self.ignore_unavailable = defaults.ignore_unavailable;
        }
        if self.indexes.is_empty() {
            self.indexes = defaults.indexes.clone();
        }
        if self.routing.is_none() {
            self.routing = defaults.routing.clone();
        }
    }
}

#[derive(Serialize)]
pub struct MultiSearchResponse {
    pub responses: Vec<MultiSearchSingleResponse>,
}

#[derive(Serialize, Debug)]
pub struct MultiSearchSingleResponse {
    #[serde(with = "http_serde::status_code")]
    pub status: StatusCode,
    #[serde(default)]
    #[serde(skip_serializing_if = "Option::is_none")]
    #[serde(flatten)]
    pub response: Option<ElasticsearchResponse>,
    #[serde(default)]
    #[serde(skip_serializing_if = "Option::is_none")]
    pub error: Option<ErrorCause>,
}

impl From<ElasticsearchResponse> for MultiSearchSingleResponse {
    fn from(response: ElasticsearchResponse) -> Self {
        MultiSearchSingleResponse {
            status: StatusCode::OK,
            response: Some(response),
            error: None,
        }
    }
}

impl From<ElasticsearchError> for MultiSearchSingleResponse {
    fn from(error: ElasticsearchError) -> Self {
        MultiSearchSingleResponse {
            status: error.status,
            response: None,
            error: Some(error.error),
        }
    }
}


================================================
FILE: quickwit/quickwit-serve/src/elasticsearch_api/model/scroll.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use serde::Deserialize;

#[derive(Deserialize, Default)]
pub struct ScrollQueryParams {
    pub scroll: Option<String>,
    pub scroll_id: Option<String>,
}


================================================
FILE: quickwit/quickwit-serve/src/elasticsearch_api/model/search_body.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::BTreeSet;
use std::fmt;

use quickwit_proto::search::SortOrder;
use quickwit_query::{ElasticQueryDsl, OneFieldMap};
use serde::de::{MapAccess, Visitor};
use serde::{Deserialize, Deserializer, Serialize};

use super::ElasticDateFormat;
use crate::elasticsearch_api::TrackTotalHits;
use crate::elasticsearch_api::model::{SortField, default_elasticsearch_sort_order};

#[derive(Debug, Clone, PartialEq, Deserialize)]
#[serde(untagged)]
enum FieldSortParamsForDeser {
    // we can't just use FieldSortParams or we get infinite recursion on deser
    Object {
        order: Option<SortOrder>,
        format: Option<ElasticDateFormat>,
    },
    String(SortOrder),
}

impl From<FieldSortParamsForDeser> for FieldSortParams {
    fn from(for_deser: FieldSortParamsForDeser) -> FieldSortParams {
        match for_deser {
            FieldSortParamsForDeser::Object {
                order,
                format: date_format,
            } => FieldSortParams { order, date_format },
            FieldSortParamsForDeser::String(order) => FieldSortParams {
                order: Some(order),
                date_format: None,
            },
        }
    }
}

#[derive(Debug, Clone, PartialEq, Serialize, Deserialize)]
#[serde(from = "FieldSortParamsForDeser")]
#[serde(deny_unknown_fields)]
struct FieldSortParams {
    #[serde(default)]
    pub order: Option<SortOrder>,
    #[serde(default)]
    #[serde(rename = "format")]
    pub date_format: Option<ElasticDateFormat>,
}

#[derive(Debug, Default, Clone, Deserialize, PartialEq)]
#[serde(deny_unknown_fields)]
pub struct SearchBody {
    #[serde(default)]
    pub from: Option<u64>,
    #[serde(default)]
    pub size: Option<u64>,
    #[serde(default)]
    pub query: Option<ElasticQueryDsl>,
    #[serde(default)]
    #[serde(deserialize_with = "deserialize_field_sorts")]
    pub sort: Option<Vec<SortField>>,
    #[serde(default)]
    pub aggs: serde_json::Map<String, serde_json::Value>,
    #[serde(default)]
    pub track_total_hits: Option<TrackTotalHits>,
    #[serde(default)]
    pub stored_fields: Option<BTreeSet<String>>,
    #[serde(default)]
    pub search_after: Vec<serde_json::Value>,

    // Ignored values, only here for compatibility with OpenSearch Dashboards.
    #[serde(default)]
    pub _source: serde::de::IgnoredAny,
    #[serde(default)]
    pub docvalue_fields: serde::de::IgnoredAny,
    #[serde(default)]
    pub script_fields: serde::de::IgnoredAny,
    #[serde(default)]
    pub highlight: serde::de::IgnoredAny,
    #[serde(default)]
    pub version: serde::de::IgnoredAny,
}

struct FieldSortVecVisitor;

#[derive(Deserialize)]
#[serde(untagged)]
enum StringOrMapFieldSort {
    FieldNameOnly(String),
    Sort(OneFieldMap<FieldSortParams>),
}

impl From<StringOrMapFieldSort> for SortField {
    fn from(string_or_map_field_sort: StringOrMapFieldSort) -> Self {
        match string_or_map_field_sort {
            StringOrMapFieldSort::FieldNameOnly(field_name) => {
                let order = default_elasticsearch_sort_order(&field_name);
                SortField {
                    field: field_name,
                    order,
                    date_format: None,
                }
            }
            StringOrMapFieldSort::Sort(sort) => {
                let order = sort
                    .value
                    .order
                    .unwrap_or_else(|| default_elasticsearch_sort_order(&sort.field));
                SortField {
                    field: sort.field,
                    order,
                    date_format: sort.value.date_format,
                }
            }
        }
    }
}

impl<'de> Visitor<'de> for FieldSortVecVisitor {
    type Value = Vec<SortField>;

    fn expecting(&self, formatter: &mut fmt::Formatter) -> fmt::Result {
        formatter.write_str("A string, array, or object containing the sort fields.")
    }

    fn visit_str<E>(self, field_name: &str) -> Result<Vec<SortField>, E>
    where E: serde::de::Error {
        let order = default_elasticsearch_sort_order(field_name);
        Ok(vec![SortField {
            field: field_name.to_string(),
            order,
            date_format: None,
        }])
    }

    fn visit_seq<A>(self, mut seq: A) -> Result<Vec<SortField>, A::Error>
    where A: serde::de::SeqAccess<'de> {
        let mut sort_fields: Vec<SortField> = Vec::new();
        while let Some(field_sort) = seq.next_element::<StringOrMapFieldSort>()? {
            sort_fields.push(field_sort.into());
        }
        Ok(sort_fields)
    }

    fn visit_map<M>(self, mut map: M) -> Result<Vec<SortField>, M::Error>
    where M: MapAccess<'de> {
        let mut sort_fields: Vec<SortField> = Vec::new();
        while let Some((field_sort_key, field_sort_params)) =
            map.next_entry::<String, FieldSortParams>()?
        {
            let sort_order = field_sort_params
                .order
                .unwrap_or_else(|| default_elasticsearch_sort_order(&field_sort_key));
            sort_fields.push(SortField {
                field: field_sort_key,
                order: sort_order,
                date_format: field_sort_params.date_format,
            });
        }
        Ok(sort_fields)
    }
}

/// ES accepts structs to describe the sort field.
/// In that case the order of apparition in the JSON object matters.
fn deserialize_field_sorts<'de, D>(deserializer: D) -> Result<Option<Vec<SortField>>, D::Error>
where D: Deserializer<'de> {
    deserializer.deserialize_any(FieldSortVecVisitor).map(Some)
}

#[cfg(test)]
mod tests {
    use super::*;

    #[test]
    fn test_sort_field_array() {
        let json = r#"
        {
            "sort": [
                { "timestamp": { "order": "desc", "format": "epoch_nanos_int" } },
                { "uid": { "order": "asc" } },
                { "my_field": "asc" },
                { "hello": {}},
                { "_score": {}}
            ]
        }
        "#;
        let search_body: SearchBody = serde_json::from_str(json).unwrap();
        let sort_fields = search_body.sort.unwrap();
        assert_eq!(sort_fields.len(), 5);
        assert_eq!(sort_fields[0].field, "timestamp");
        assert_eq!(sort_fields[0].order, SortOrder::Desc);
        assert_eq!(
            sort_fields[0].date_format,
            Some(ElasticDateFormat::EpochNanosInt)
        );
        assert_eq!(sort_fields[1].field, "uid");
        assert_eq!(sort_fields[1].order, SortOrder::Asc);
        assert_eq!(sort_fields[1].date_format, None);
        assert_eq!(sort_fields[2].field, "my_field");
        assert_eq!(sort_fields[2].order, SortOrder::Asc);
        assert_eq!(sort_fields[2].date_format, None);
        assert_eq!(sort_fields[3].field, "hello");
        assert_eq!(sort_fields[3].order, SortOrder::Asc);
        assert_eq!(sort_fields[3].date_format, None);
        assert_eq!(sort_fields[4].field, "_score");
        assert_eq!(sort_fields[4].order, SortOrder::Desc);
        assert_eq!(sort_fields[4].date_format, None);
    }

    #[test]
    fn test_sort_field_obj() {
        let json = r#"
        {
            "sort": {
                "timestamp": { "order": "desc" },
                "uid": { "order": "asc" }
            }
        }
        "#;
        let search_body: SearchBody = serde_json::from_str(json).unwrap();
        let field_sorts = search_body.sort.unwrap();
        assert_eq!(field_sorts.len(), 2);
        assert_eq!(field_sorts[0].field, "timestamp");
        assert_eq!(field_sorts[0].order, SortOrder::Desc);
        assert_eq!(field_sorts[1].field, "uid");
        assert_eq!(field_sorts[1].order, SortOrder::Asc);
    }

    #[test]
    fn test_sort_field_str() {
        let json = r#"
        {
            "sort": "timestamp"
        }
        "#;
        let search_body: SearchBody = serde_json::from_str(json).unwrap();
        let field_sorts = search_body.sort.unwrap();
        assert_eq!(field_sorts.len(), 1);
        assert_eq!(field_sorts[0].field, "timestamp");
        assert_eq!(field_sorts[0].order, SortOrder::Asc);
    }

    #[test]
    fn test_sort_default_orders() {
        let json = r#"
        {
            "sort": [
                "timestamp",
                "uid",
                "_score",
                "_doc"
            ]
        }
        "#;
        let search_body: SearchBody = serde_json::from_str(json).unwrap();
        let field_sorts = search_body.sort.unwrap();
        assert_eq!(field_sorts.len(), 4);
        assert_eq!(field_sorts[0].field, "timestamp");
        assert_eq!(field_sorts[0].order, SortOrder::Asc);
        assert_eq!(field_sorts[1].field, "uid");
        assert_eq!(field_sorts[1].order, SortOrder::Asc);
        assert_eq!(field_sorts[2].field, "_score");
        assert_eq!(field_sorts[2].order, SortOrder::Desc);
        assert_eq!(field_sorts[3].field, "_doc");
        assert_eq!(field_sorts[3].order, SortOrder::Asc);
    }

    #[test]
    fn test_unknown_field_behaviour() {
        let json = r#"
            {
                "term": {
                    "actor.id": {
                        "value": "95077794"
                     }
                }
            }
        "#;

        let search_body = serde_json::from_str::<SearchBody>(json);
        let error_msg = search_body.unwrap_err().to_string();
        assert!(error_msg.contains("unknown field `term`"));
        assert!(error_msg.contains("expected one of "));
    }
}


================================================
FILE: quickwit/quickwit-serve/src/elasticsearch_api/model/search_query_params.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::fmt;
use std::str::FromStr;
use std::time::Duration;

use quickwit_query::BooleanOperand;
use quickwit_search::SearchError;
use serde::{Deserialize, Serialize};

use super::super::TrackTotalHits;
use super::MultiSearchHeader;
use crate::elasticsearch_api::model::{SortField, default_elasticsearch_sort_order};
use crate::simple_list::{from_simple_list, to_simple_list};

#[serde_with::skip_serializing_none]
#[derive(Default, Debug, Serialize, Deserialize)]
#[serde(deny_unknown_fields)]
pub struct SearchQueryParams {
    #[serde(serialize_with = "to_simple_list")]
    #[serde(deserialize_with = "from_simple_list")]
    #[serde(default)]
    pub _source: Option<Vec<String>>,
    #[serde(serialize_with = "to_simple_list")]
    #[serde(deserialize_with = "from_simple_list")]
    #[serde(default)]
    pub _source_excludes: Option<Vec<String>>,
    #[serde(serialize_with = "to_simple_list")]
    #[serde(deserialize_with = "from_simple_list")]
    #[serde(default)]
    pub _source_includes: Option<Vec<String>>,
    #[serde(default)]
    pub allow_no_indices: Option<bool>,
    #[serde(default)]
    pub allow_partial_search_results: Option<bool>,
    #[serde(default)]
    pub analyze_wildcard: Option<bool>,
    #[serde(default)]
    pub analyzer: Option<String>,
    #[serde(default)]
    pub batched_reduce_size: Option<u64>,
    #[serde(default)]
    pub ccs_minimize_roundtrips: Option<bool>,
    #[serde(default)]
    pub default_operator: Option<BooleanOperand>,
    #[serde(default)]
    pub df: Option<String>,
    #[serde(serialize_with = "to_simple_list")]
    #[serde(deserialize_with = "from_simple_list")]
    #[serde(default)]
    pub docvalue_fields: Option<Vec<String>>,
    #[serde(default)]
    pub error_trace: Option<bool>,
    #[serde(serialize_with = "to_simple_list")]
    #[serde(deserialize_with = "from_simple_list")]
    #[serde(default)]
    pub expand_wildcards: Option<Vec<ExpandWildcards>>,
    #[serde(default)]
    pub explain: Option<bool>,
    #[serde(serialize_with = "to_simple_list")]
    #[serde(deserialize_with = "from_simple_list")]
    #[serde(default)]
    /// Additional filters to be applied to the query.
    /// Useful for permissions and other use cases.
    /// This is not part of the official Elasticsearch API.
    pub extra_filters: Option<Vec<String>>,
    #[serde(serialize_with = "to_simple_list")]
    #[serde(deserialize_with = "from_simple_list")]
    #[serde(default)]
    pub filter_path: Option<Vec<String>>,
    #[serde(default)]
    pub force_synthetic_source: Option<bool>,
    #[serde(default)]
    pub from: Option<u64>,
    #[serde(default)]
    pub human: Option<bool>,
    #[serde(default)]
    pub ignore_throttled: Option<bool>,
    #[serde(default)]
    pub ignore_unavailable: Option<bool>,
    #[serde(default)]
    pub lenient: Option<bool>,
    #[serde(default)]
    pub max_concurrent_shard_requests: Option<u64>,
    #[serde(default)]
    pub min_compatible_shard_node: Option<String>,
    #[serde(default)]
    pub pre_filter_shard_size: Option<u64>,
    #[serde(default)]
    pub preference: Option<String>,
    #[serde(default)]
    pub pretty: Option<bool>,
    #[serde(default)]
    pub q: Option<String>,
    #[serde(default)]
    pub request_cache: Option<bool>,
    #[serde(default)]
    pub rest_total_hits_as_int: Option<bool>,
    #[serde(serialize_with = "to_simple_list")]
    #[serde(deserialize_with = "from_simple_list")]
    #[serde(default)]
    pub routing: Option<Vec<String>>,
    #[serde(default)]
    pub scroll: Option<String>,
    #[serde(default)]
    pub search_type: Option<String>,
    #[serde(default)]
    pub seq_no_primary_term: Option<bool>,
    #[serde(default)]
    pub size: Option<u64>,
    #[serde(serialize_with = "to_simple_list")]
    #[serde(deserialize_with = "from_simple_list")]
    #[serde(default)]
    pub sort: Option<Vec<String>>,
    #[serde(default)]
    pub stats: Option<Vec<String>>,
    #[serde(serialize_with = "to_simple_list")]
    #[serde(deserialize_with = "from_simple_list")]
    #[serde(default)]
    pub stored_fields: Option<Vec<String>>,
    #[serde(default)]
    pub suggest_field: Option<String>,
    #[serde(default)]
    pub suggest_mode: Option<SuggestMode>,
    #[serde(default)]
    pub suggest_size: Option<u64>,
    #[serde(default)]
    pub suggest_text: Option<String>,
    #[serde(default)]
    pub terminate_after: Option<u64>,
    #[serde(default)]
    pub timeout: Option<String>,
    #[serde(default)]
    pub track_scores: Option<bool>,
    #[serde(default)]
    pub track_total_hits: Option<TrackTotalHits>,
    #[serde(default)]
    pub typed_keys: Option<bool>,
    #[serde(default)]
    pub version: Option<bool>,
}

#[serde_with::skip_serializing_none]
#[derive(Default, Debug, Serialize, Deserialize)]
#[serde(deny_unknown_fields)]
pub struct SearchQueryParamsCount {
    #[serde(default)]
    pub allow_no_indices: Option<bool>,
    #[serde(default)]
    pub analyze_wildcard: Option<bool>,
    #[serde(default)]
    pub analyzer: Option<String>,
    #[serde(default)]
    pub default_operator: Option<BooleanOperand>,
    #[serde(default)]
    pub df: Option<String>,
    #[serde(serialize_with = "to_simple_list")]
    #[serde(deserialize_with = "from_simple_list")]
    #[serde(default)]
    pub expand_wildcards: Option<Vec<ExpandWildcards>>,
    #[serde(default)]
    pub ignore_throttled: Option<bool>,
    #[serde(default)]
    pub ignore_unavailable: Option<bool>,
    #[serde(default)]
    pub lenient: Option<bool>,
    #[serde(default)]
    pub max_concurrent_shard_requests: Option<u64>,
    #[serde(default)]
    pub preference: Option<String>,
    #[serde(default)]
    pub q: Option<String>,
    #[serde(default)]
    pub request_cache: Option<bool>,
    #[serde(serialize_with = "to_simple_list")]
    #[serde(deserialize_with = "from_simple_list")]
    #[serde(default)]
    pub routing: Option<Vec<String>>,
}
impl From<SearchQueryParamsCount> for SearchQueryParams {
    fn from(value: SearchQueryParamsCount) -> Self {
        SearchQueryParams {
            allow_no_indices: value.allow_no_indices,
            analyze_wildcard: value.analyze_wildcard,
            analyzer: value.analyzer,
            default_operator: value.default_operator,
            df: value.df,
            expand_wildcards: value.expand_wildcards,
            ignore_throttled: value.ignore_throttled,
            ignore_unavailable: value.ignore_unavailable,
            preference: value.preference,
            q: value.q,
            request_cache: value.request_cache,
            routing: value.routing,
            size: Some(0),
            ..Default::default()
        }
    }
}

#[serde_with::skip_serializing_none]
#[derive(Default, Debug, Serialize, Deserialize)]
#[serde(deny_unknown_fields)]
pub struct DeleteQueryParams {
    #[serde(default)]
    pub allow_no_indices: Option<bool>,
    #[serde(serialize_with = "to_simple_list")]
    #[serde(deserialize_with = "from_simple_list")]
    #[serde(default)]
    pub expand_wildcards: Option<Vec<ExpandWildcards>>,
    #[serde(default)]
    pub ignore_unavailable: Option<bool>,
    #[serde(default)]
    pub master_timeout: Option<String>,
    #[serde(default)]
    pub timeout: Option<String>,
}

/// Parses a string as if it was a json value string.
fn parse_str_like_json<T: serde::de::DeserializeOwned>(s: &str) -> Option<T> {
    let json_value = serde_json::Value::String(s.to_string());
    serde_json::from_value::<T>(json_value).ok()
}

// Parse a single sort field parameter from ES sort query string parameter.
fn parse_sort_field_str(sort_field_str: &str) -> Result<SortField, SearchError> {
    if let Some((field, order_str)) = sort_field_str.split_once(':') {
        let order = parse_str_like_json(order_str).ok_or_else(|| {
            SearchError::InvalidArgument(format!(
                "invalid sort order `{field}`. expected `asc` or `desc`"
            ))
        })?;
        Ok(SortField {
            field: field.to_string(),
            order,
            date_format: None,
        })
    } else {
        let order = default_elasticsearch_sort_order(sort_field_str);
        Ok(SortField {
            field: sort_field_str.to_string(),
            order,
            date_format: None,
        })
    }
}

impl SearchQueryParams {
    /// Accessor for the list of sort fields passed in the sort query string parameter.
    ///
    /// Returns an error if the sort query string are not in the expected format
    /// (`field:order,field2:order2,...`). Returns `Ok(None)` if the sort query string parameter
    /// is not present.
    #[allow(clippy::type_complexity)]
    pub(crate) fn sort_fields(&self) -> Result<Option<Vec<SortField>>, SearchError> {
        let Some(sort_fields_str) = self.sort.as_ref() else {
            return Ok(None);
        };
        let mut sort_fields: Vec<SortField> = Vec::with_capacity(sort_fields_str.len());
        for sort_field_str in sort_fields_str {
            sort_fields.push(parse_sort_field_str(sort_field_str)?);
        }
        Ok(Some(sort_fields))
    }

    /// Returns the scroll duration supplied by the user.
    ///
    /// This function returns an error if the scroll duration is not in the expected format. (`40s`
    /// etc.)
    pub fn parse_scroll_ttl(&self) -> Result<Option<Duration>, SearchError> {
        let Some(scroll_str) = self.scroll.as_ref() else {
            return Ok(None);
        };
        let duration: Duration = humantime::parse_duration(scroll_str).map_err(|_err| {
            SearchError::InvalidArgument(format!("invalid scroll duration: `{scroll_str}`"))
        })?;
        Ok(Some(duration))
    }

    pub fn allow_partial_search_results(&self) -> bool {
        // By default, elastic search allows partial results.
        self.allow_partial_search_results.unwrap_or(true)
    }
}

#[doc = "Whether to expand wildcard expression to concrete indices that are open, closed or both."]
#[derive(Debug, PartialEq, Deserialize, Serialize, Clone, Copy)]
#[serde(rename_all = "lowercase")]
pub enum ExpandWildcards {
    Open,
    Closed,
    Hidden,
    None,
    All,
}

impl FromStr for ExpandWildcards {
    type Err = &'static str;
    fn from_str(value_str: &str) -> Result<Self, Self::Err> {
        match value_str {
            "open" => Ok(Self::Open),
            "closed" => Ok(Self::Closed),
            "hidden" => Ok(Self::Hidden),
            "none" => Ok(Self::None),
            "all" => Ok(Self::All),
            _ => Err("unknown enum variant"),
        }
    }
}

impl fmt::Display for ExpandWildcards {
    fn fmt(&self, formatter: &mut fmt::Formatter) -> fmt::Result {
        match self {
            Self::Open => write!(formatter, "open"),
            Self::Closed => write!(formatter, "closed"),
            Self::Hidden => write!(formatter, "hidden"),
            Self::None => write!(formatter, "none"),
            Self::All => write!(formatter, "all"),
        }
    }
}

impl From<MultiSearchHeader> for SearchQueryParams {
    fn from(multi_search_header: MultiSearchHeader) -> Self {
        SearchQueryParams {
            allow_no_indices: multi_search_header.allow_no_indices,
            expand_wildcards: multi_search_header.expand_wildcards,
            ignore_unavailable: multi_search_header.ignore_unavailable,
            routing: multi_search_header.routing,
            request_cache: multi_search_header.request_cache,
            preference: multi_search_header.preference,
            ..Default::default()
        }
    }
}

/// Specify suggest mode
#[derive(Debug, PartialEq, Deserialize, Serialize, Clone, Copy)]
#[serde(rename_all = "lowercase")]
pub enum SuggestMode {
    Missing,
    Popular,
    Always,
}

impl FromStr for SuggestMode {
    type Err = &'static str;
    fn from_str(value_str: &str) -> Result<Self, Self::Err> {
        match value_str {
            "missing" => Ok(Self::Missing),
            "popular" => Ok(Self::Popular),
            "always" => Ok(Self::Always),
            _ => Err("unknown enum variant"),
        }
    }
}

impl fmt::Display for SuggestMode {
    fn fmt(&self, formatter: &mut fmt::Formatter) -> fmt::Result {
        match self {
            Self::Missing => write!(formatter, "missing"),
            Self::Popular => write!(formatter, "popular"),
            Self::Always => write!(formatter, "always"),
        }
    }
}

#[cfg(test)]
mod tests {

    use quickwit_proto::search::SortOrder;

    use super::*;

    #[derive(Deserialize, PartialEq, Eq, Debug)]
    #[serde(rename_all = "snake_case")]
    enum TestEnum {
        FirstItem,
        SecondItem,
    }

    #[test]
    fn test_parse_str_like_json() {
        assert_eq!(
            parse_str_like_json::<TestEnum>("first_item").unwrap(),
            TestEnum::FirstItem
        );
        assert!(parse_str_like_json::<TestEnum>("FirstItem").is_none());
    }

    #[test]
    fn test_sort_order_qs() {
        let sort_order_qs = parse_sort_field_str("timestamp:desc").unwrap();
        assert_eq!(
            sort_order_qs,
            SortField {
                field: "timestamp".to_string(),
                order: SortOrder::Desc,
                date_format: None
            }
        );
        let sort_order_qs = parse_sort_field_str("timestamp:asc").unwrap();
        assert_eq!(
            sort_order_qs,
            SortField {
                field: "timestamp".to_string(),
                order: SortOrder::Asc,
                date_format: None
            }
        );
    }
}


================================================
FILE: quickwit/quickwit-serve/src/elasticsearch_api/model/search_response.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use elasticsearch_dsl::{ClusterStatistics, HitsMetadata, ShardStatistics, Suggest};
use quickwit_search::AggregationResults;
use serde::Serialize;

type Map<K, V> = std::collections::BTreeMap<K, V>;

/// Search response
///
/// This is a fork of [`elasticsearch_dsl::SearchResponse`] with the
/// `aggregations` field using [`AggregationResults`] instead of
/// [`serde_json::Value`].
#[derive(Debug, Default, Serialize, PartialEq)]
pub struct ElasticsearchResponse {
    /// The time that it took Elasticsearch to process the query
    pub took: u32,

    /// The search has been cancelled and results are partial
    pub timed_out: bool,

    /// Indicates if search has been terminated early
    #[serde(default)]
    pub terminated_early: Option<bool>,

    /// Scroll Id
    #[serde(skip_serializing_if = "Option::is_none")]
    #[serde(rename = "_scroll_id")]
    pub scroll_id: Option<String>,

    /// Dynamically fetched fields
    #[serde(default)]
    pub fields: Map<String, serde_json::Value>,

    /// Point in time Id
    #[serde(skip_serializing_if = "Option::is_none")]
    pub pit_id: Option<String>,

    /// Number of reduce phases
    #[serde(skip_serializing_if = "Option::is_none")]
    pub num_reduce_phases: Option<u64>,

    /// Maximum document score. [None] when documents are implicitly sorted
    /// by a field other than `_score`
    #[serde(skip_serializing_if = "Option::is_none")]
    pub max_score: Option<f32>,

    /// Number of clusters touched with their states
    #[serde(skip_serializing_if = "Option::is_none", rename = "_clusters")]
    pub clusters: Option<ClusterStatistics>,

    /// Number of shards touched with their states
    #[serde(rename = "_shards")]
    pub shards: ShardStatistics,

    /// Search hits
    pub hits: HitsMetadata,

    /// Search aggregations
    #[serde(skip_serializing_if = "Option::is_none")]
    pub aggregations: Option<AggregationResults>,

    #[serde(skip_serializing_if = "Map::is_empty", default)]
    /// Suggest response
    pub suggest: Map<String, Vec<Suggest>>,
}


================================================
FILE: quickwit/quickwit-serve/src/elasticsearch_api/model/stats.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::HashMap;
use std::ops::AddAssign;

use quickwit_metastore::SplitMetadata;
use serde::{Deserialize, Serialize};

/// Returns JSON in the format:
///
/// {
///   "_all": {
///     "primaries": {
///       "store": {"size_in_bytes": 123456789},
///       "docs": {"count": 5000}
///     },
///     "total": {
///       "segments": {"count": 100},
///       "docs": {"count": 5000}
///     }
///   },
///   "indices": {
///     "exampleIndex": {
///       "primaries": {
///         "store": {"size_in_bytes": 123456789},
///         "docs": {"count": 5000}
///       },
///       "total": {
///         "segments": {"count": 50},
///         "docs": {"count": 5000}
///       }
///     }
///   }
/// }
#[derive(Clone, Serialize, Deserialize, Debug)]
pub struct ElasticsearchStatsResponse {
    pub _all: StatsResponseEntry,
    pub indices: HashMap<String, StatsResponseEntry>, // String is Field name
}

#[derive(Clone, Serialize, Deserialize, Debug, Default)]
pub struct StatsResponseEntry {
    primaries: StatsPrimariesResponse,
    total: StatsTotalResponse,
}

impl AddAssign for StatsResponseEntry {
    fn add_assign(&mut self, rhs: Self) {
        self.primaries.store.size_in_bytes += rhs.primaries.store.size_in_bytes;
        self.primaries.docs.count += rhs.primaries.docs.count;
        self.total.segments.count += rhs.total.segments.count;
        self.total.docs.count += rhs.total.docs.count;
    }
}

impl From<SplitMetadata> for StatsResponseEntry {
    fn from(split_metadata: SplitMetadata) -> Self {
        let mut stats_response_entry = StatsResponseEntry::default();
        stats_response_entry.primaries.store.size_in_bytes =
            split_metadata.as_split_info().file_size_bytes.as_u64();
        stats_response_entry.primaries.docs.count = split_metadata.num_docs as u64;
        stats_response_entry.total.docs.count = split_metadata.num_docs as u64;
        stats_response_entry.total.segments.count = 1;
        stats_response_entry
    }
}

#[derive(Clone, Serialize, Deserialize, Debug, Default)]
pub struct StatsPrimariesResponse {
    store: StatsStoreResponse,
    docs: StatsDocsResponse,
}

#[derive(Clone, Serialize, Deserialize, Debug, Default)]
pub struct StatsStoreResponse {
    size_in_bytes: u64,
}

#[derive(Clone, Serialize, Deserialize, Debug, Default)]
pub struct StatsDocsResponse {
    count: u64,
}

#[derive(Clone, Serialize, Deserialize, Debug, Default)]
pub struct StatsTotalResponse {
    segments: StatsTotalSegmentsResponse,
    docs: StatsDocsResponse,
}

#[derive(Clone, Serialize, Deserialize, Debug, Default)]
pub struct StatsTotalSegmentsResponse {
    count: u64,
}


================================================
FILE: quickwit/quickwit-serve/src/elasticsearch_api/rest_handler.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::HashMap;
use std::str::from_utf8;
use std::sync::Arc;
use std::time::{Duration, Instant};

use bytes::Bytes;
use elasticsearch_dsl::search::Hit as ElasticHit;
use elasticsearch_dsl::{HitsMetadata, ShardStatistics, Source, TotalHits, TotalHitsRelation};
use futures_util::StreamExt;
use itertools::Itertools;
use quickwit_cluster::Cluster;
use quickwit_common::truncate_str;
use quickwit_config::{NodeConfig, validate_index_id_pattern};
use quickwit_index_management::IndexService;
use quickwit_metastore::*;
use quickwit_proto::metastore::{IndexMetadataRequest, MetastoreService, MetastoreServiceClient};
use quickwit_proto::search::{
    CountHits, ListFieldsResponse, PartialHit, ScrollRequest, SearchResponse, SortByValue,
    SortDatetimeFormat,
};
use quickwit_proto::types::IndexUid;
use quickwit_query::BooleanOperand;
use quickwit_query::query_ast::{BoolQuery, QueryAst, UserInputQuery};
use quickwit_search::{
    AggregationResults, SearchError, SearchService, list_all_splits, resolve_index_patterns,
};
use serde::{Deserialize, Serialize};
use serde_json::{Map, Value, json};
use warp::hyper::StatusCode;
use warp::reply::with_status;
use warp::{Filter, Rejection};

use super::filter::{
    elastic_aliases_filter, elastic_cat_indices_filter, elastic_cluster_health_filter,
    elastic_cluster_info_filter, elastic_delete_index_filter, elastic_delete_scroll_filter,
    elastic_field_capabilities_filter, elastic_index_cat_indices_filter,
    elastic_index_count_filter, elastic_index_field_capabilities_filter,
    elastic_index_mapping_filter, elastic_index_search_filter, elastic_index_stats_filter,
    elastic_multi_search_filter, elastic_nodes_filter, elastic_resolve_index_filter,
    elastic_scroll_filter, elastic_search_shards_filter, elastic_stats_filter,
    elasticsearch_filter,
};
use super::model::{
    CatIndexQueryParams, DeleteQueryParams, ElasticsearchCatIndexResponse, ElasticsearchError,
    ElasticsearchResolveIndexEntryResponse, ElasticsearchResolveIndexResponse,
    ElasticsearchResponse, ElasticsearchStatsResponse, FieldCapabilityQueryParams,
    FieldCapabilityRequestBody, FieldCapabilityResponse, MultiSearchHeader, MultiSearchQueryParams,
    MultiSearchResponse, MultiSearchSingleResponse, ScrollQueryParams, SearchBody,
    SearchQueryParams, SearchQueryParamsCount, StatsResponseEntry,
    build_list_field_request_for_es_api, convert_to_es_field_capabilities_response,
};
use super::{TrackTotalHits, make_elastic_api_response};
use crate::elasticsearch_api::model::ElasticsearchMappingsResponse;
use crate::format::BodyFormat;
use crate::rest::recover_fn;
use crate::rest_api_response::{RestApiError, RestApiResponse};
use crate::{BuildInfo, with_arg};

/// Elastic compatible cluster info handler.
pub fn es_compat_cluster_info_handler(
    node_config: Arc<NodeConfig>,
    build_info: &'static BuildInfo,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    elastic_cluster_info_filter()
        .and(with_arg(node_config.clone()))
        .and(with_arg(build_info))
        .then(
            |config: Arc<NodeConfig>, build_info: &'static BuildInfo| async move {
                warp::reply::json(&json!({
                    "name" : config.node_id,
                    "cluster_name" : config.cluster_id,
                    "cluster_uuid" : config.cluster_id,
                    "tagline" : "You Know, for Search",
                    "version" : {
                        "distribution" : "quickwit",
                        "number" : "7.17.0",
                        "build_hash" : build_info.commit_hash,
                        "build_date" : build_info.build_date,
                        "build_snapshot" : false,
                        "lucene_version" : "8.11.1",
                        "minimum_wire_compatibility_version" : "6.8.0",
                        "minimum_index_compatibility_version" : "6.0.0-beta1",
                    }
                }))
            },
        )
        .boxed()
}

/// GET _elastic/_nodes/http
pub fn es_compat_nodes_handler(
    node_config: Arc<NodeConfig>,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    elastic_nodes_filter()
        .and(with_arg(node_config))
        .then(|config: Arc<NodeConfig>| async move {
            let advertise_addr = std::net::SocketAddr::new(
                config.grpc_advertise_addr.ip(),
                config.rest_config.listen_addr.port(),
            );
            warp::reply::json(&json!({
                "nodes": {
                    config.node_id.as_str(): {
                        "roles": ["data", "ingest"],
                        "http": {
                            "publish_address": advertise_addr.to_string()
                        }
                    }
                }
            }))
        })
        .boxed()
}

/// GET _elastic/{index}/_search_shards
pub fn es_compat_search_shards_handler(
    node_config: Arc<NodeConfig>,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    elastic_search_shards_filter()
        .and(with_arg(node_config))
        .then(|index_id: String, config: Arc<NodeConfig>| async move {
            warp::reply::json(&json!({
                "shards": [[{
                    "index": index_id,
                    "shard": 0,
                    "primary": true,
                    "node": config.node_id.as_str()
                }]]
            }))
        })
        .boxed()
}

/// GET _elastic/_aliases
pub fn es_compat_aliases_handler()
-> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    elastic_aliases_filter()
        .then(|| async { Ok(Value::Object(Map::new())) })
        .map(|result| make_elastic_api_response(result, BodyFormat::default()))
        .recover(recover_fn)
        .boxed()
}

/// GET _elastic/{index}/_mapping or _elastic/{index}/_mappings
pub fn es_compat_index_mapping_handler(
    metastore: MetastoreServiceClient,
    search_service: Arc<dyn SearchService>,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    elastic_index_mapping_filter()
        .and(with_arg(metastore))
        .and(with_arg(search_service))
        .then(es_compat_index_mapping)
        .map(|result| make_elastic_api_response(result, BodyFormat::default()))
        .recover(recover_fn)
}

async fn get_index_metadata(
    index_id: String,
    metastore: MetastoreServiceClient,
) -> Result<IndexMetadata, SearchError> {
    let index_metadata_request = IndexMetadataRequest::for_index_id(index_id);
    let index_metadata = metastore
        .index_metadata(index_metadata_request)
        .await?
        .deserialize_index_metadata()?;
    Ok(index_metadata)
}

async fn es_compat_index_mapping(
    index_id: String,
    mut metastore: MetastoreServiceClient,
    search_service: Arc<dyn SearchService>,
) -> Result<ElasticsearchMappingsResponse, ElasticsearchError> {
    let indexes_metadata = if index_id.contains('*') || index_id.contains(',') {
        let patterns: Vec<String> = index_id.split(',').map(|s| s.trim().to_string()).collect();
        resolve_index_patterns(&patterns, &mut metastore).await?
    } else {
        vec![get_index_metadata(index_id.clone(), metastore).await?]
    };
    let index_id_patterns: Vec<String> = indexes_metadata
        .iter()
        .map(|m| m.index_id().to_string())
        .collect();
    let list_fields_request = quickwit_proto::search::ListFieldsRequest {
        index_id_patterns,
        fields: Vec::new(),
        start_timestamp: None,
        end_timestamp: None,
        query_ast: None,
    };
    let list_fields_response = search_service
        .root_list_fields(list_fields_request)
        .await
        .ok();
    let response = ElasticsearchMappingsResponse::from_doc_mapping(
        indexes_metadata,
        list_fields_response.as_ref(),
    );
    Ok(response)
}

/// GET or POST _elastic/_search
pub fn es_compat_search_handler(
    _search_service: Arc<dyn SearchService>,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    elasticsearch_filter()
        .then(|_params: SearchQueryParams| async move {
            // TODO
            let api_error = RestApiError {
                status_code: StatusCode::NOT_IMPLEMENTED,
                message: "_elastic/_search is not supported yet. Please try the index search \
                          endpoint (_elastic/{index}/search)"
                    .to_string(),
            };
            RestApiResponse::new::<(), _>(
                &Err(api_error),
                StatusCode::NOT_IMPLEMENTED,
                BodyFormat::default(),
            )
        })
        .recover(recover_fn)
}

/// GET or POST _elastic/{index}/_field_caps
pub fn es_compat_index_field_capabilities_handler(
    search_service: Arc<dyn SearchService>,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    elastic_index_field_capabilities_filter()
        .or(elastic_field_capabilities_filter())
        .unify()
        .and(with_arg(search_service))
        .then(es_compat_index_field_capabilities)
        .map(|result| make_elastic_api_response(result, BodyFormat::default()))
        .recover(recover_fn)
}

/// DELETE _elastic/{index}
pub fn es_compat_delete_index_handler(
    index_service: IndexService,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    elastic_delete_index_filter()
        .and(with_arg(index_service))
        .then(es_compat_delete_index)
        .map(|result| make_elastic_api_response(result, BodyFormat::default()))
        .boxed()
}

/// GET _elastic/_stats
pub fn es_compat_stats_handler(
    metastore_service: MetastoreServiceClient,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    elastic_stats_filter()
        .and(with_arg(metastore_service))
        .then(es_compat_stats)
        .map(|result| make_elastic_api_response(result, BodyFormat::default()))
        .recover(recover_fn)
        .boxed()
}

/// Check if the parameter is a known query parameter to reject
fn is_unsupported_qp(param: &str) -> bool {
    ["wait_for_status", "timeout", "level"].contains(&param)
}

/// GET _elastic/_cluster/health
pub fn es_compat_cluster_health_handler(
    cluster: Cluster,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    elastic_cluster_health_filter()
        .and(warp::query::<HashMap<String, String>>())
        .and(with_arg(cluster))
        .then(es_compat_cluster_health)
        .recover(recover_fn)
}

#[utoipa::path(
    get,
    tag = "Node Health",
    path = "/_elastic/_cluster/health",
    responses(
        (status = 200, description = "The cluster is healthy.", body = bool),
        (status = 503, description = "The cluster is unhealthy.", body = bool),
    ),
)]
/// Get Node Liveliness
async fn es_compat_cluster_health(
    query_params: HashMap<String, String>,
    cluster: Cluster,
) -> impl warp::Reply {
    if let Some(invalid_param) = query_params.keys().find(|key| is_unsupported_qp(key)) {
        let error_body = warp::reply::json(&json!({
            "error": "Unsupported parameter.",
            "param": invalid_param
        }));
        return with_status(error_body, StatusCode::BAD_REQUEST);
    }
    let is_ready = cluster.is_self_node_ready().await;
    if is_ready {
        with_status(
            warp::reply::json(&json!({"status": "green"})),
            StatusCode::OK,
        )
    } else {
        with_status(
            warp::reply::json(&json!({"status": "red"})),
            StatusCode::SERVICE_UNAVAILABLE,
        )
    }
}

/// GET _elastic/{index}/_stats
pub fn es_compat_index_stats_handler(
    metastore_service: MetastoreServiceClient,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    elastic_index_stats_filter()
        .and(with_arg(metastore_service))
        .then(es_compat_index_stats)
        .map(|result| make_elastic_api_response(result, BodyFormat::default()))
        .recover(recover_fn)
        .boxed()
}

/// GET _elastic/_cat/indices
pub fn es_compat_cat_indices_handler(
    metastore_service: MetastoreServiceClient,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    elastic_cat_indices_filter()
        .and(with_arg(metastore_service))
        .then(es_compat_cat_indices)
        .map(|result| make_elastic_api_response(result, BodyFormat::default()))
        .recover(recover_fn)
        .boxed()
}

/// GET _elastic/_cat/indices/{index}
pub fn es_compat_index_cat_indices_handler(
    metastore_service: MetastoreServiceClient,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    elastic_index_cat_indices_filter()
        .and(with_arg(metastore_service))
        .then(es_compat_index_cat_indices)
        .map(|result| make_elastic_api_response(result, BodyFormat::default()))
        .recover(recover_fn)
        .boxed()
}

/// GET  _elastic/_resolve/index/{index}
pub fn es_compat_resolve_index_handler(
    metastore_service: MetastoreServiceClient,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    elastic_resolve_index_filter()
        .and(with_arg(metastore_service))
        .then(es_compat_resolve_index)
        .map(|result| make_elastic_api_response(result, BodyFormat::default()))
        .boxed()
}

/// GET or POST _elastic/{index}/_search
pub fn es_compat_index_search_handler(
    search_service: Arc<dyn SearchService>,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    elastic_index_search_filter()
        .and(with_arg(search_service))
        .then(es_compat_index_search)
        .map(|result| make_elastic_api_response(result, BodyFormat::default()))
        .recover(recover_fn)
        .boxed()
}

/// GET or POST _elastic/{index}/_count
pub fn es_compat_index_count_handler(
    search_service: Arc<dyn SearchService>,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    elastic_index_count_filter()
        .and(with_arg(search_service))
        .then(es_compat_index_count)
        .map(|result| make_elastic_api_response(result, BodyFormat::default()))
        .recover(recover_fn)
        .boxed()
}

/// POST _elastic/_msearch
pub fn es_compat_index_multi_search_handler(
    search_service: Arc<dyn SearchService>,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    elastic_multi_search_filter()
        .and(with_arg(search_service))
        .then(es_compat_index_multi_search)
        .map(|result: Result<MultiSearchResponse, ElasticsearchError>| {
            let status_code = match &result {
                Ok(_) => StatusCode::OK,
                Err(err) => err.status,
            };
            RestApiResponse::new(&result, status_code, BodyFormat::default())
        })
        .recover(recover_fn)
        .boxed()
}

/// GET or POST _elastic/_search/scroll
pub fn es_compat_scroll_handler(
    search_service: Arc<dyn SearchService>,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    elastic_scroll_filter()
        .and(with_arg(search_service))
        .then(es_scroll)
        .map(|result| make_elastic_api_response(result, BodyFormat::default()))
        .recover(recover_fn)
        .boxed()
}

/// DELETE _elastic/_search/scroll
///
/// Clears a scroll context. Quickwit manages scroll lifetime via TTL,
/// so this is a no-op that returns success.
pub fn es_compat_delete_scroll_handler()
-> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    elastic_delete_scroll_filter()
        .then(|| async {
            Ok::<_, ElasticsearchError>(json!({
                "succeeded": true,
                "num_freed": 0
            }))
        })
        .map(|result| make_elastic_api_response(result, BodyFormat::default()))
        .recover(recover_fn)
        .boxed()
}

#[allow(clippy::result_large_err)]
fn build_request_for_es_api(
    index_id_patterns: Vec<String>,
    search_params: SearchQueryParams,
    search_body: SearchBody,
) -> Result<(quickwit_proto::search::SearchRequest, bool), ElasticsearchError> {
    let default_operator = search_params.default_operator.unwrap_or(BooleanOperand::Or);
    // The query string, if present, takes priority over what can be in the request
    // body.
    let mut query_ast = if let Some(q) = &search_params.q {
        let user_text_query = UserInputQuery {
            user_text: q.to_string(),
            default_fields: None,
            default_operator,
            lenient: false,
        };
        user_text_query.into()
    } else if let Some(query_dsl) = search_body.query {
        query_dsl
            .try_into()
            .map_err(|err: anyhow::Error| SearchError::InvalidQuery(err.to_string()))?
    } else {
        QueryAst::MatchAll
    };

    if let Some(extra_filters) = &search_params.extra_filters {
        let queries: Vec<QueryAst> = extra_filters
            .iter()
            .map(|query| {
                let user_text_query = UserInputQuery {
                    user_text: query.to_string(),
                    default_fields: None,
                    default_operator,
                    lenient: false,
                };
                QueryAst::UserInput(user_text_query)
            })
            .collect();

        query_ast = QueryAst::Bool(BoolQuery {
            must: vec![query_ast],
            must_not: Vec::new(),
            should: Vec::new(),
            filter: queries,
            minimum_should_match: None,
        });
    }

    let aggregation_request: Option<String> = if search_body.aggs.is_empty() {
        None
    } else {
        serde_json::to_string(&search_body.aggs).ok()
    };

    let max_hits = search_params.size.or(search_body.size).unwrap_or(10);
    let start_offset = search_params.from.or(search_body.from).unwrap_or(0);
    let ignore_missing_indexes = search_params.ignore_unavailable.unwrap_or(false);
    let count_hits = match search_params
        .track_total_hits
        .or(search_body.track_total_hits)
    {
        None => CountHits::Underestimate,
        Some(TrackTotalHits::Track(false)) => CountHits::Underestimate,
        Some(TrackTotalHits::Count(count)) if count <= max_hits as i64 => CountHits::Underestimate,
        Some(TrackTotalHits::Track(true) | TrackTotalHits::Count(_)) => CountHits::CountAll,
    }
    .into();

    let sort_fields: Vec<quickwit_proto::search::SortField> = search_params
        .sort_fields()?
        .or_else(|| search_body.sort.clone())
        .unwrap_or_default()
        .iter()
        .map(|sort_field| quickwit_proto::search::SortField {
            field_name: sort_field.field.to_string(),
            sort_order: sort_field.order as i32,
            sort_datetime_format: sort_field
                .date_format
                .clone()
                .map(|date_format| SortDatetimeFormat::from(date_format) as i32),
        })
        .take_while_inclusive(|sort_field| !is_doc_field(sort_field))
        .collect();
    if sort_fields.len() >= 3 {
        return Err(ElasticsearchError::from(SearchError::InvalidArgument(
            format!("only up to two sort fields supported at the moment. got {sort_fields:?}"),
        )));
    }

    let scroll_duration: Option<Duration> = search_params.parse_scroll_ttl()?;
    let scroll_ttl_secs: Option<u32> = scroll_duration.map(|duration| duration.as_secs() as u32);

    let has_doc_id_field = sort_fields.iter().any(is_doc_field);
    let search_after = partial_hit_from_search_after_param(search_body.search_after, &sort_fields)?;

    Ok((
        quickwit_proto::search::SearchRequest {
            index_id_patterns,
            query_ast: serde_json::to_string(&query_ast).expect("Failed to serialize QueryAst"),
            max_hits,
            start_offset,
            aggregation_request,
            sort_fields,
            start_timestamp: None,
            end_timestamp: None,
            snippet_fields: Vec::new(),
            scroll_ttl_secs,
            search_after,
            count_hits,
            ignore_missing_indexes,
            skip_aggregation_finalization: false,
        },
        has_doc_id_field,
    ))
}

fn is_doc_field(field: &quickwit_proto::search::SortField) -> bool {
    field.field_name == "_shard_doc" || field.field_name == "_doc"
}

#[allow(clippy::result_large_err)]
fn partial_hit_from_search_after_param(
    search_after: Vec<serde_json::Value>,
    sort_order: &[quickwit_proto::search::SortField],
) -> Result<Option<PartialHit>, ElasticsearchError> {
    if search_after.is_empty() {
        return Ok(None);
    }
    if search_after.len() != sort_order.len() {
        return Err(ElasticsearchError::new(
            StatusCode::BAD_REQUEST,
            "sort and search_after are of different length".to_string(),
            None,
        ));
    }
    let mut parsed_search_after = PartialHit::default();
    for (value, field) in search_after.into_iter().zip(sort_order) {
        if is_doc_field(field) {
            if let Some(value_str) = value.as_str() {
                let address: quickwit_search::GlobalDocAddress =
                    value_str.parse().map_err(|_| {
                        ElasticsearchError::new(
                            StatusCode::BAD_REQUEST,
                            "invalid search_after doc id, must be of form \
                             `{split_id}:{segment_id: u32}:{doc_id: u32}`"
                                .to_string(),
                            None,
                        )
                    })?;
                parsed_search_after.split_id = address.split;
                parsed_search_after.segment_ord = address.doc_addr.segment_ord;
                parsed_search_after.doc_id = address.doc_addr.doc_id;
                return Ok(Some(parsed_search_after));
            } else {
                return Err(ElasticsearchError::new(
                    StatusCode::BAD_REQUEST,
                    "search_after doc id must be of string type".to_string(),
                    None,
                ));
            }
        } else {
            let value = SortByValue::try_from_json(value).ok_or_else(|| {
                ElasticsearchError::new(
                    StatusCode::BAD_REQUEST,
                    "invalid search_after field value, expect bool, number or string".to_string(),
                    None,
                )
            })?;
            // TODO make cleaner once we support Vec
            if parsed_search_after.sort_value.is_none() {
                parsed_search_after.sort_value = Some(value);
            } else {
                parsed_search_after.sort_value2 = Some(value);
            }
        }
    }
    Ok(Some(parsed_search_after))
}

#[derive(Debug, Serialize, Deserialize)]
struct ElasticsearchCountResponse {
    count: u64,
}

async fn es_compat_index_count(
    index_id_patterns: Vec<String>,
    search_params: SearchQueryParamsCount,
    search_body: SearchBody,
    search_service: Arc<dyn SearchService>,
) -> Result<ElasticsearchCountResponse, ElasticsearchError> {
    let mut search_params: SearchQueryParams = search_params.into();
    search_params.track_total_hits = Some(TrackTotalHits::Track(true));
    let (search_request, _append_shard_doc) =
        build_request_for_es_api(index_id_patterns, search_params, search_body)?;
    let search_response: SearchResponse = search_service.root_search(search_request).await?;
    let search_response_rest: ElasticsearchCountResponse = ElasticsearchCountResponse {
        count: search_response.num_hits,
    };
    Ok(search_response_rest)
}

async fn es_compat_index_search(
    index_id_patterns: Vec<String>,
    search_params: SearchQueryParams,
    search_body: SearchBody,
    search_service: Arc<dyn SearchService>,
) -> Result<ElasticsearchResponse, ElasticsearchError> {
    if search_params.scroll.is_some() && !search_params.allow_partial_search_results() {
        return Err(ElasticsearchError::from(SearchError::InvalidArgument(
            "Quickwit only supports scroll API with allow_partial_search_results set to true"
                .to_string(),
        )));
    }
    let _source_excludes = search_params._source_excludes.clone();
    let _source_includes = search_params._source_includes.clone();
    let start_instant = Instant::now();
    let allow_partial_search_results = search_params.allow_partial_search_results();
    let (search_request, append_shard_doc) =
        build_request_for_es_api(index_id_patterns, search_params, search_body)?;
    let search_response: SearchResponse = search_service.root_search(search_request).await?;
    let elapsed = start_instant.elapsed();
    let mut search_response_rest: ElasticsearchResponse = convert_to_es_search_response(
        search_response,
        append_shard_doc,
        _source_excludes,
        _source_includes,
        allow_partial_search_results,
    )?;
    search_response_rest.took = elapsed.as_millis() as u32;
    Ok(search_response_rest)
}

/// Returns JSON in the format:
///
/// {
///   "acknowledged": true
/// }
#[derive(Clone, Serialize, Deserialize, Debug)]
pub struct ElasticsearchDeleteResponse {
    pub acknowledged: bool,
}

async fn es_compat_delete_index(
    index_id_patterns: Vec<String>,
    query_params: DeleteQueryParams,
    index_service: IndexService,
) -> Result<ElasticsearchDeleteResponse, ElasticsearchError> {
    index_service
        .delete_indexes(
            index_id_patterns,
            query_params.ignore_unavailable.unwrap_or_default(),
            false,
        )
        .await?;
    Ok(ElasticsearchDeleteResponse { acknowledged: true })
}

async fn es_compat_stats(
    metastore: MetastoreServiceClient,
) -> Result<ElasticsearchStatsResponse, ElasticsearchError> {
    es_compat_index_stats(vec!["*".to_string()], metastore).await
}

async fn es_compat_index_stats(
    index_id_patterns: Vec<String>,
    mut metastore: MetastoreServiceClient,
) -> Result<ElasticsearchStatsResponse, ElasticsearchError> {
    let indexes_metadata = resolve_index_patterns(&index_id_patterns, &mut metastore).await?;

    // Index uid to index id mapping
    let index_uid_to_index_id: HashMap<IndexUid, String> = indexes_metadata
        .iter()
        .map(|metadata| (metadata.index_uid.clone(), metadata.index_id().to_owned()))
        .collect();

    let index_uids = indexes_metadata
        .into_iter()
        .map(|index_metadata| index_metadata.index_uid)
        .collect_vec();
    // calling into the search module is not necessary, but reuses established patterns
    let splits_metadata = list_all_splits(index_uids, &mut metastore).await?;

    let search_response_rest: ElasticsearchStatsResponse =
        convert_to_es_stats_response(index_uid_to_index_id, splits_metadata);

    Ok(search_response_rest)
}

async fn es_compat_cat_indices(
    query_params: CatIndexQueryParams,
    metastore: MetastoreServiceClient,
) -> Result<Vec<serde_json::Value>, ElasticsearchError> {
    es_compat_index_cat_indices(vec!["*".to_string()], query_params, metastore).await
}

async fn es_compat_index_cat_indices(
    index_id_patterns: Vec<String>,
    query_params: CatIndexQueryParams,
    mut metastore: MetastoreServiceClient,
) -> Result<Vec<serde_json::Value>, ElasticsearchError> {
    query_params.validate()?;
    let indexes_metadata = resolve_index_patterns(&index_id_patterns, &mut metastore).await?;
    let mut index_id_to_resp: HashMap<IndexUid, ElasticsearchCatIndexResponse> = indexes_metadata
        .iter()
        .map(|metadata| (metadata.index_uid.to_owned(), metadata.clone().into()))
        .collect();

    let splits_metadata = {
        let index_uids = indexes_metadata
            .into_iter()
            .map(|index_metadata| index_metadata.index_uid)
            .collect_vec();

        // calling into the search module is not necessary, but reuses established patterns
        list_all_splits(index_uids, &mut metastore).await?
    };

    let search_response_rest: Vec<ElasticsearchCatIndexResponse> =
        convert_to_es_cat_indices_response(&mut index_id_to_resp, splits_metadata);

    let search_response_rest = search_response_rest
        .into_iter()
        .filter(|resp| {
            if let Some(health) = query_params.health {
                resp.health == health
            } else {
                true
            }
        })
        .map(|cat_index| cat_index.serialize_filtered(&query_params.h))
        .collect::<Result<Vec<serde_json::Value>, serde_json::Error>>()
        .map_err(|serde_error| {
            ElasticsearchError::new(
                StatusCode::INTERNAL_SERVER_ERROR,
                format!("Failed to serialize cat indices response: {serde_error}"),
                None,
            )
        })?;

    Ok(search_response_rest)
}

async fn es_compat_resolve_index(
    index_id_patterns: Vec<String>,
    mut metastore: MetastoreServiceClient,
) -> Result<ElasticsearchResolveIndexResponse, ElasticsearchError> {
    let indexes_metadata = resolve_index_patterns(&index_id_patterns, &mut metastore).await?;
    let mut indices: Vec<ElasticsearchResolveIndexEntryResponse> = indexes_metadata
        .into_iter()
        .map(|metadata| metadata.into())
        .collect();

    indices.sort_by(|left, right| left.name.cmp(&right.name));

    Ok(ElasticsearchResolveIndexResponse {
        indices,
        ..Default::default()
    })
}

async fn es_compat_index_field_capabilities(
    index_id_patterns: Vec<String>,
    search_params: FieldCapabilityQueryParams,
    search_body: FieldCapabilityRequestBody,
    search_service: Arc<dyn SearchService>,
) -> Result<FieldCapabilityResponse, ElasticsearchError> {
    let search_request =
        build_list_field_request_for_es_api(index_id_patterns, search_params, search_body)?;
    let search_response: ListFieldsResponse =
        search_service.root_list_fields(search_request).await?;
    let search_response_rest: FieldCapabilityResponse =
        convert_to_es_field_capabilities_response(search_response);
    Ok(search_response_rest)
}

fn filter_source(
    value: &mut serde_json::Value,
    _source_excludes: &Option<Vec<String>>,
    _source_includes: &Option<Vec<String>>,
) {
    fn remove_path(value: &mut serde_json::Value, path: &str) {
        for (prefix, suffix) in generate_path_variants_with_suffix(path) {
            match value {
                serde_json::Value::Object(map) => {
                    if let Some(suffix) = suffix {
                        if let Some(sub_value) = map.get_mut(prefix) {
                            remove_path(sub_value, suffix);
                            return;
                        }
                    } else {
                        map.remove(prefix);
                    }
                }
                _ => continue,
            }
        }
    }
    fn retain_includes(
        value: &mut serde_json::Value,
        current_path: &str,
        include_paths: &Vec<String>,
    ) {
        if let Some(ref mut map) = value.as_object_mut() {
            map.retain(|key, sub_value| {
                let path = if current_path.is_empty() {
                    key.to_string()
                } else {
                    format!("{current_path}.{key}")
                };

                if include_paths.contains(&path) {
                    // Exact match keep whole node
                    return true;
                }
                // Check if the path is sub path of any allowed path
                for allowed_path in include_paths {
                    if allowed_path.starts_with(path.as_str()) {
                        retain_includes(sub_value, &path, include_paths);
                        return true;
                    }
                }
                false
            });
        }
    }

    // Remove fields that are not included
    if let Some(includes) = _source_includes {
        retain_includes(value, "", includes);
    }

    // Remove fields that are excluded
    if let Some(excludes) = _source_excludes {
        for exclude in excludes {
            remove_path(value, exclude);
        }
    }
}

/// "app.id.name" -> [("app", Some("id.name")), ("app.id", Some("name")), ("app.id.name", None)]
fn generate_path_variants_with_suffix(input: &str) -> Vec<(&str, Option<&str>)> {
    let mut variants = Vec::new();

    // Iterate over each character in the input.
    for (idx, ch) in input.char_indices() {
        if ch == '.' {
            // If a dot is found, create a variant using the current slice and the remainder of the
            // string.
            let prefix = &input[0..idx];
            let suffix = if idx + 1 < input.len() {
                Some(&input[idx + 1..])
            } else {
                None
            };
            variants.push((prefix, suffix));
        }
    }

    variants.push((&input[0..], None));

    variants
}

fn convert_hit(
    hit: quickwit_proto::search::Hit,
    append_shard_doc: bool,
    _source_excludes: &Option<Vec<String>>,
    _source_includes: &Option<Vec<String>>,
) -> ElasticHit {
    let mut json: serde_json::Value = serde_json::from_str(&hit.json).unwrap_or(json!({}));
    filter_source(&mut json, _source_excludes, _source_includes);
    let source =
        Source::from_string(serde_json::to_string(&json).unwrap_or_else(|_| "{}".to_string()))
            .unwrap_or_else(|_| Source::from_string("{}".to_string()).unwrap());

    let mut sort = Vec::new();
    if let Some(partial_hit) = hit.partial_hit {
        if let Some(sort_value) = partial_hit.sort_value {
            sort.push(sort_value.into_json());
        }
        if let Some(sort_value2) = partial_hit.sort_value2 {
            sort.push(sort_value2.into_json());
        }
        if append_shard_doc {
            sort.push(serde_json::Value::String(
                quickwit_search::GlobalDocAddress::from_partial_hit(&partial_hit).to_string(),
            ));
        }
    }

    ElasticHit {
        fields: Default::default(),
        explanation: None,
        index: hit.index_id,
        id: "".to_string(),
        score: None,
        nested: None,
        source,
        highlight: Default::default(),
        inner_hits: Default::default(),
        matched_queries: Vec::default(),
        sort,
    }
}

async fn es_compat_index_multi_search(
    payload: Bytes,
    multi_search_params: MultiSearchQueryParams,
    search_service: Arc<dyn SearchService>,
) -> Result<MultiSearchResponse, ElasticsearchError> {
    let mut search_requests = Vec::new();
    let str_payload = from_utf8(&payload)
        .map_err(|err| SearchError::InvalidQuery(format!("invalid UTF-8: {err}")))?;
    let mut payload_lines = str_lines(str_payload);

    while let Some(line) = payload_lines.next() {
        let mut request_header =
            serde_json::from_str::<MultiSearchHeader>(line).map_err(|err| {
                SearchError::InvalidArgument(format!(
                    "failed to parse request header `{}...`: {}",
                    truncate_str(line, 20),
                    err
                ))
            })?;
        request_header.apply_query_param_defaults(&multi_search_params);
        if request_header.indexes.is_empty() {
            return Err(ElasticsearchError::from(SearchError::InvalidArgument(
                "`_msearch` request header must define at least one index".to_string(),
            )));
        }
        for index in &request_header.indexes {
            validate_index_id_pattern(index, true).map_err(|err| {
                SearchError::InvalidArgument(format!(
                    "request header contains an invalid index: {err}"
                ))
            })?;
        }
        let index_ids_patterns = request_header.indexes.clone();
        let search_body = payload_lines
            .next()
            .ok_or_else(|| {
                SearchError::InvalidArgument("expect request body after request header".to_string())
            })
            .and_then(|line| {
                serde_json::from_str::<SearchBody>(line).map_err(|err| {
                    SearchError::InvalidArgument(format!(
                        "failed to parse request body `{}...`: {}",
                        truncate_str(line, 20),
                        err
                    ))
                })
            })?;
        let mut search_query_params = SearchQueryParams::from(request_header);
        if let Some(_source_excludes) = &multi_search_params._source_excludes {
            search_query_params._source_excludes = Some(_source_excludes.to_vec());
        }
        if let Some(_source_includes) = &multi_search_params._source_includes {
            search_query_params._source_includes = Some(_source_includes.to_vec());
        }
        if let Some(extra_filters) = &multi_search_params.extra_filters {
            search_query_params.extra_filters = Some(extra_filters.to_vec());
        }
        let es_request =
            build_request_for_es_api(index_ids_patterns, search_query_params, search_body)?;
        search_requests.push(es_request);
    }

    // TODO: forced to do weird referencing to work around https://github.com/rust-lang/rust/issues/100905
    // otherwise append_shard_doc is captured by ref, and we get lifetime issues
    let futures = search_requests
        .into_iter()
        .map(|(search_request, append_shard_doc)| {
            let search_service = &search_service;
            let _source_excludes = multi_search_params._source_excludes.clone();
            let _source_includes = multi_search_params._source_includes.clone();
            async move {
                let start_instant = Instant::now();
                let search_response: SearchResponse =
                    search_service.clone().root_search(search_request).await?;
                let elapsed = start_instant.elapsed();
                let mut search_response_rest: ElasticsearchResponse =
                    convert_to_es_search_response(
                        search_response,
                        append_shard_doc,
                        _source_excludes,
                        _source_includes,
                        true, //< allow_partial_results. Set to true to match ES's behavior.
                    )?;
                search_response_rest.took = elapsed.as_millis() as u32;
                Ok::<_, ElasticsearchError>(search_response_rest)
            }
        });
    let max_concurrent_searches =
        multi_search_params.max_concurrent_searches.unwrap_or(10) as usize;
    let search_responses = futures::stream::iter(futures)
        .buffered(max_concurrent_searches)
        .collect::<Vec<_>>()
        .await;
    let responses = search_responses
        .into_iter()
        .map(|search_response| match search_response {
            Ok(search_response) => MultiSearchSingleResponse::from(search_response),
            Err(error) => MultiSearchSingleResponse::from(error),
        })
        .collect_vec();
    let multi_search_response = MultiSearchResponse { responses };
    Ok(multi_search_response)
}

async fn es_scroll(
    scroll_query_params: ScrollQueryParams,
    search_service: Arc<dyn SearchService>,
) -> Result<ElasticsearchResponse, ElasticsearchError> {
    let start_instant = Instant::now();
    let Some(scroll_id) = scroll_query_params.scroll_id.clone() else {
        return Err(SearchError::InvalidArgument("missing scroll_id".to_string()).into());
    };
    let scroll_ttl_secs: Option<u32> = if let Some(scroll_ttl) = scroll_query_params.scroll {
        let scroll_ttl_duration = humantime::parse_duration(&scroll_ttl)
            .map_err(|_| SearchError::InvalidArgument(format!("Scroll invalid: {scroll_ttl}")))?;
        Some(scroll_ttl_duration.as_secs() as u32)
    } else {
        None
    };
    let scroll_request = ScrollRequest {
        scroll_id,
        scroll_ttl_secs,
    };
    let search_response: SearchResponse = search_service.scroll(scroll_request).await?;
    // TODO append_shard_doc depends on the initial request, but we don't have access to it

    // Ideally, we would have wanted to reuse the setting from the initial search request.
    // However, passing that parameter is cumbersome, so we cut some corner and forbid the
    // use of scroll requests in combination with allow_partial_results set to false.
    let allow_failed_splits = true;
    let mut search_response_rest: ElasticsearchResponse =
        convert_to_es_search_response(search_response, false, None, None, allow_failed_splits)?;
    search_response_rest.took = start_instant.elapsed().as_millis() as u32;
    Ok(search_response_rest)
}

fn convert_to_es_cat_indices_response(
    index_id_to_resp: &mut HashMap<IndexUid, ElasticsearchCatIndexResponse>,
    splits: Vec<SplitMetadata>,
) -> Vec<ElasticsearchCatIndexResponse> {
    for split_metadata in splits {
        let resp_entry = index_id_to_resp
            .get_mut(&split_metadata.index_uid)
            .unwrap_or_else(|| {
                panic!(
                    "index_id {} not found in index_id_to_resp",
                    split_metadata.index_uid
                )
            });
        let cat_index_entry: ElasticsearchCatIndexResponse = split_metadata.into();
        *resp_entry += cat_index_entry.clone();
    }
    let mut indices: Vec<ElasticsearchCatIndexResponse> =
        index_id_to_resp.values().cloned().collect();
    indices.sort_by(|a, b| a.index.cmp(&b.index));

    indices
}

fn convert_to_es_stats_response(
    index_uid_to_index_id: HashMap<IndexUid, String>,
    splits: Vec<SplitMetadata>,
) -> ElasticsearchStatsResponse {
    let mut indices: HashMap<String, StatsResponseEntry> = index_uid_to_index_id
        .values()
        .map(|index_id| (index_id.to_owned(), StatsResponseEntry::default()))
        .collect();
    let mut _all = StatsResponseEntry::default();

    for split_metadata in splits {
        let index_id = index_uid_to_index_id
            .get(&split_metadata.index_uid)
            .unwrap_or_else(|| {
                panic!(
                    "index_uid {} not found in index_uid_to_index_id",
                    split_metadata.index_uid
                )
            });
        let resp_entry = indices.get_mut(index_id).unwrap_or_else(|| {
            panic!(
                "index_id {} not found in index_id_to_resp",
                split_metadata.index_uid
            )
        });
        let stats_entry: StatsResponseEntry = split_metadata.into();
        *resp_entry += stats_entry.clone();
        _all += stats_entry.clone();
    }
    ElasticsearchStatsResponse { _all, indices }
}

#[allow(clippy::result_large_err)]
fn convert_to_es_search_response(
    resp: SearchResponse,
    append_shard_doc: bool,
    _source_excludes: Option<Vec<String>>,
    _source_includes: Option<Vec<String>>,
    allow_partial_results: bool,
) -> Result<ElasticsearchResponse, ElasticsearchError> {
    if (!allow_partial_results || resp.num_successful_splits == 0)
        && let Some(search_error) = SearchError::from_split_errors(&resp.failed_splits)
    {
        return Err(ElasticsearchError::from(search_error));
    }
    let hits: Vec<ElasticHit> = resp
        .hits
        .into_iter()
        .map(|hit| convert_hit(hit, append_shard_doc, &_source_excludes, &_source_includes))
        .collect();
    let aggregations: Option<AggregationResults> =
        if let Some(aggregation_postcard) = resp.aggregation_postcard {
            let aggregations =
                AggregationResults::from_postcard(&aggregation_postcard).map_err(|_| {
                    ElasticsearchError::new(
                        StatusCode::INTERNAL_SERVER_ERROR,
                        "Failed to parse aggregation results".to_string(),
                        None,
                    )
                })?;
            Some(aggregations)
        } else {
            None
        };
    let num_failed_splits = resp.failed_splits.len() as u32;
    let num_successful_splits = resp.num_successful_splits as u32;
    let num_total_splits = num_successful_splits + num_failed_splits;
    Ok(ElasticsearchResponse {
        timed_out: false,
        hits: HitsMetadata {
            total: Some(TotalHits {
                value: resp.num_hits,
                relation: TotalHitsRelation::Equal,
            }),
            max_score: None,
            hits,
        },
        aggregations,
        scroll_id: resp.scroll_id,
        // There is no concept of shards here, but use this to convey split search failures.
        shards: ShardStatistics {
            total: num_total_splits,
            successful: num_successful_splits,
            skipped: 0u32,
            failed: num_failed_splits,
            failures: Vec::new(),
        },
        ..Default::default()
    })
}

pub(crate) fn str_lines(body: &str) -> impl Iterator<Item = &str> {
    body.lines()
        .map(|line| line.trim())
        .filter(|line| !line.is_empty())
}

#[cfg(test)]
mod tests {
    use quickwit_proto::search::SplitSearchError;
    use warp::hyper::StatusCode;

    use super::{partial_hit_from_search_after_param, *};

    #[test]
    fn test_partial_hit_from_search_after_param_invalid_length() {
        let search_after = vec![serde_json::json!([1])];
        let sort_order = &[];
        let error = partial_hit_from_search_after_param(search_after, sort_order).unwrap_err();
        assert_eq!(error.status, StatusCode::BAD_REQUEST);
        assert_eq!(
            error.error.reason.unwrap(),
            "sort and search_after are of different length"
        );
    }

    #[test]
    fn test_partial_hit_from_search_after_param_invalid_search_after_value() {
        let search_after = vec![serde_json::json!([1])];
        let sort_order = &[quickwit_proto::search::SortField {
            field_name: "field1".to_string(),
            sort_order: 1,
            sort_datetime_format: None,
        }];
        let error = partial_hit_from_search_after_param(search_after, sort_order).unwrap_err();
        assert_eq!(error.status, StatusCode::BAD_REQUEST);
        assert_eq!(
            error.error.reason.unwrap(),
            "invalid search_after field value, expect bool, number or string"
        );
    }

    #[test]
    fn test_partial_hit_from_search_after_param_invalid_search_after_doc_id() {
        let search_after = vec![serde_json::json!("split_id:1112")];
        let sort_order = &[quickwit_proto::search::SortField {
            field_name: "_doc".to_string(),
            sort_order: 1,
            sort_datetime_format: None,
        }];
        let error = partial_hit_from_search_after_param(search_after, sort_order).unwrap_err();
        assert_eq!(error.status, StatusCode::BAD_REQUEST);
        assert_eq!(
            error.error.reason.unwrap(),
            "invalid search_after doc id, must be of form `{split_id}:{segment_id: u32}:{doc_id: \
             u32}`"
        );
    }

    #[test]
    fn test_single_element() {
        let input = "app";
        let expected = vec![("app", None)];
        assert_eq!(generate_path_variants_with_suffix(input), expected);
    }

    #[test]
    fn test_two_elements() {
        let input = "app.id";
        let expected = vec![("app", Some("id")), ("app.id", None)];
        assert_eq!(generate_path_variants_with_suffix(input), expected);
    }

    #[test]
    fn test_multiple_elements() {
        let input = "app.id.name";
        let expected = vec![
            ("app", Some("id.name")),
            ("app.id", Some("name")),
            ("app.id.name", None),
        ];
        assert_eq!(generate_path_variants_with_suffix(input), expected);
    }

    #[test]
    fn test_include_fields1() {
        let mut fields = json!({
            "app": { "id": 123, "name": "Blub" },
            "user": { "id": 456, "name": "Fred" }
        });

        let includes = Some(vec!["app.id".to_string()]);
        filter_source(&mut fields, &None, &includes);

        let expected = json!({
            "app": { "id": 123 }
        });

        assert_eq!(fields, expected);
    }
    #[test]
    fn test_include_fields2() {
        let mut fields = json!({
            "app": { "id": 123, "name": "Blub" },
            "app.id": { "id": 123, "name": "Blub" },
            "user": { "id": 456, "name": "Fred" }
        });

        let includes = Some(vec!["app".to_string(), "app.id".to_string()]);
        filter_source(&mut fields, &None, &includes);

        let expected = json!({
            "app": { "id": 123, "name": "Blub" },
            "app.id": { "id": 123, "name": "Blub" },
        });

        assert_eq!(fields, expected);
    }

    #[test]
    fn test_exclude_fields() {
        let mut fields = json!({
            "app": {
                "id": 123,
                "name": "Blub"
            },
            "user": {
                "id": 456,
                "name": "Fred"
            }
        });

        let excludes = Some(vec!["app.name".to_string(), "user.id".to_string()]);
        filter_source(&mut fields, &excludes, &None);

        let expected = json!({
            "app": {
                "id": 123
            },
            "user": {
                "name": "Fred"
            }
        });

        assert_eq!(fields, expected);
    }

    #[test]
    fn test_include_and_exclude_fields() {
        let mut fields = json!({
            "app": { "id": 123, "name": "Blub", "version": "1.0" },
            "user": { "id": 456, "name": "Fred", "email": "john@example.com" }
        });

        let includes = Some(vec![
            "app".to_string(),
            "user.name".to_string(),
            "user.email".to_string(),
        ]);
        let excludes = Some(vec!["app.version".to_string(), "user.email".to_string()]);
        filter_source(&mut fields, &excludes, &includes);

        let expected = json!({
            "app": { "id": 123, "name": "Blub" },
            "user": { "name": "Fred" }
        });

        assert_eq!(fields, expected);
    }

    #[test]
    fn test_no_includes_or_excludes() {
        let mut fields = json!({
            "app": {
                "id": 123,
                "name": "Blub"
            }
        });

        filter_source(&mut fields, &None, &None);

        let expected = json!({
            "app": {
                "id": 123,
                "name": "Blub"
            }
        });

        assert_eq!(fields, expected);
    }

    // We test that the behavior of allow partial search results.
    #[test]
    fn test_convert_to_es_search_response_allow_partial() {
        let split_error = SplitSearchError {
            error: "some-error".to_string(),
            split_id: "some-split-id".to_string(),
            retryable_error: true,
        };
        {
            let search_response = SearchResponse {
                num_successful_splits: 1,
                failed_splits: vec![split_error.clone()],
                ..Default::default()
            };
            convert_to_es_search_response(search_response, false, None, None, false).unwrap_err();
        }
        {
            let search_response = SearchResponse {
                num_successful_splits: 1,
                failed_splits: vec![split_error.clone()],
                ..Default::default()
            };
            // if we allow partial search results, this should not fail, but we report the presence
            // of failed splits in the fail shard response.
            let es_search_resp =
                convert_to_es_search_response(search_response, false, None, None, true).unwrap();
            assert_eq!(es_search_resp.shards.failed, 1);
        }
        {
            let search_response = SearchResponse {
                failed_splits: vec![split_error.clone()],
                ..Default::default()
            };
            // Event if we allow partial search results, with a fail and no success, we have a
            // failure.
            convert_to_es_search_response(search_response, false, None, None, true).unwrap_err();
        }
        {
            // Not having any splits (no failure + no success) is not considered a failure.
            for allow_partial in [true, false] {
                let search_response = SearchResponse::default();
                let es_search_resp = convert_to_es_search_response(
                    search_response,
                    false,
                    None,
                    None,
                    allow_partial,
                )
                .unwrap();
                assert_eq!(es_search_resp.shards.failed, 0);
            }
        }
    }
}


================================================
FILE: quickwit/quickwit-serve/src/format.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::fmt;

use quickwit_config::ConfigFormat;
use serde::{self, Deserialize, Serialize, Serializer};
use thiserror::Error;
use warp::hyper::header::CONTENT_TYPE;
use warp::{Filter, Rejection};

/// Body output format used for the REST API.
#[derive(Deserialize, Clone, Debug, Eq, PartialEq, Copy, utoipa::ToSchema)]
#[serde(rename_all = "snake_case")]
#[derive(Default)]
pub enum BodyFormat {
    Json,
    #[default]
    PrettyJson,
}

impl BodyFormat {
    pub(crate) fn result_to_vec<T: serde::Serialize, E: serde::Serialize>(
        &self,
        result: &Result<T, E>,
    ) -> Result<Vec<u8>, ()> {
        match result {
            Ok(value) => self.value_to_vec(value),
            Err(err) => self.value_to_vec(err),
        }
    }

    fn value_to_vec(&self, value: &impl serde::Serialize) -> Result<Vec<u8>, ()> {
        match &self {
            Self::Json => serde_json::to_vec(value),
            Self::PrettyJson => serde_json::to_vec_pretty(value),
        }
        .map_err(|_| {
            tracing::error!("response serialization failed");
        })
    }
}

impl fmt::Display for BodyFormat {
    fn fmt(&self, formatter: &mut fmt::Formatter) -> fmt::Result {
        match &self {
            Self::Json => write!(formatter, "json"),
            Self::PrettyJson => write!(formatter, "pretty_json"),
        }
    }
}

impl Serialize for BodyFormat {
    fn serialize<S>(&self, serializer: S) -> Result<S::Ok, S::Error>
    where S: Serializer {
        serializer.serialize_str(&self.to_string())
    }
}

/// This struct represents a QueryString passed to
/// the REST API.
#[derive(Deserialize, Debug, Eq, PartialEq, utoipa::IntoParams)]
#[into_params(parameter_in = Query)]
struct FormatQueryString {
    /// The output format requested.
    #[serde(default)]
    pub format: BodyFormat,
}

pub(crate) fn extract_format_from_qs()
-> impl Filter<Extract = (BodyFormat,), Error = Rejection> + Clone {
    warp::query::<FormatQueryString>().map(|format_qs: FormatQueryString| format_qs.format)
}

#[derive(Debug, Error)]
#[error(
    "request's content-type is not supported: supported media types are `application/json`, \
     `application/toml`, and `application/yaml`"
)]
pub(crate) struct UnsupportedMediaType;

impl warp::reject::Reject for UnsupportedMediaType {}

pub(crate) fn extract_config_format()
-> impl Filter<Extract = (ConfigFormat,), Error = Rejection> + Copy {
    warp::filters::header::optional::<mime_guess::Mime>(CONTENT_TYPE.as_str()).and_then(
        |mime_opt: Option<mime_guess::Mime>| {
            if let Some(mime) = mime_opt {
                let config_format = match mime.subtype().as_str() {
                    "json" => ConfigFormat::Json,
                    "toml" => ConfigFormat::Toml,
                    "yaml" => ConfigFormat::Yaml,
                    _ => {
                        return futures::future::err(warp::reject::custom(UnsupportedMediaType));
                    }
                };
                return futures::future::ok(config_format);
            }
            futures::future::ok(ConfigFormat::Json)
        },
    )
}


================================================
FILE: quickwit/quickwit-serve/src/grpc.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::BTreeSet;
use std::sync::Arc;

use anyhow::Context;
use quickwit_cluster::cluster_grpc_server;
use quickwit_common::tower::BoxFutureInfaillible;
use quickwit_config::GrpcConfig;
use quickwit_config::service::QuickwitService;
use quickwit_proto::developer::DeveloperServiceClient;
use quickwit_proto::indexing::IndexingServiceClient;
use quickwit_proto::jaeger::storage::v1::span_reader_plugin_server::SpanReaderPluginServer;
use quickwit_proto::jaeger::storage::v2::trace_reader_server::TraceReaderServer;
use quickwit_proto::opentelemetry::proto::collector::logs::v1::logs_service_server::LogsServiceServer;
use quickwit_proto::opentelemetry::proto::collector::trace::v1::trace_service_server::TraceServiceServer;
use quickwit_proto::search::search_service_server::SearchServiceServer;
use quickwit_proto::tonic::codegen::CompressionEncoding;
use quickwit_proto::tonic::transport::server::TcpIncoming;
use quickwit_proto::tonic::transport::{Certificate, Identity, Server, ServerTlsConfig};
use tokio::net::TcpListener;
use tonic_health::pb::FILE_DESCRIPTOR_SET as HEALTH_FILE_DESCRIPTOR_SET;
use tonic_health::pb::health_server::{Health, HealthServer};
use tonic_reflection::pb::v1::FILE_DESCRIPTOR_SET as REFLECTION_FILE_DESCRIPTOR_SET;
use tonic_reflection::server::v1::{ServerReflection, ServerReflectionServer};
use tracing::*;

use crate::developer_api::DeveloperApiServer;
use crate::search_api::GrpcSearchAdapter;
use crate::{INDEXING_GRPC_SERVER_METRICS_LAYER, QuickwitServices};

/// Starts and binds gRPC services to `grpc_listen_addr`.
pub(crate) async fn start_grpc_server(
    tcp_listener: TcpListener,
    grpc_config: GrpcConfig,
    services: Arc<QuickwitServices>,
    readiness_trigger: BoxFutureInfaillible<()>,
    shutdown_signal: BoxFutureInfaillible<()>,
    health_service: HealthServer<impl Health>,
) -> anyhow::Result<()> {
    let mut enabled_grpc_services = BTreeSet::new();
    let mut file_descriptor_sets = Vec::new();
    let mut server = Server::builder();

    if let Some(tls_config) = grpc_config.tls {
        let cert = std::fs::read_to_string(tls_config.cert_path)?;
        let key = std::fs::read_to_string(tls_config.key_path)?;
        let identity = Identity::from_pem(cert, key);

        let mut tls = ServerTlsConfig::new().identity(identity);

        if tls_config.validate_client {
            let ca_cert = std::fs::read_to_string(tls_config.ca_path)?;
            let ca_cert = Certificate::from_pem(ca_cert);
            tls = tls.client_ca_root(ca_cert);
        }
        // TODO using this builtin method means we have no way of hot-reloading certificates
        // (i.e. the process must be restarted every time its certificate expires)
        // to do better, we'd need to wra the TcpListener with something that does (m)TLS
        // and that we control, however it would be somewhat painful, and more error prone
        server = server.tls_config(tls)?;
    }

    let cluster_grpc_service = cluster_grpc_server(services.cluster.clone());
    file_descriptor_sets.push(quickwit_proto::cluster::CLUSTER_PLANE_FILE_DESCRIPTOR_SET);

    // Mount gRPC metastore service if `QuickwitService::Metastore` is enabled on node.
    let metastore_grpc_service = if let Some(metastore_server) = &services.metastore_server_opt {
        enabled_grpc_services.insert("metastore");
        file_descriptor_sets.push(quickwit_proto::metastore::METASTORE_FILE_DESCRIPTOR_SET);

        Some(metastore_server.as_grpc_service(grpc_config.max_message_size))
    } else {
        None
    };
    // Mount gRPC indexing service if `QuickwitService::Indexer` is enabled on node.
    let indexing_grpc_service = if services
        .node_config
        .is_service_enabled(QuickwitService::Indexer)
    {
        if let Some(indexing_service) = services.indexing_service_opt.clone() {
            enabled_grpc_services.insert("indexing");
            file_descriptor_sets.push(quickwit_proto::indexing::INDEXING_FILE_DESCRIPTOR_SET);

            let indexing_service = IndexingServiceClient::tower()
                .stack_layer(INDEXING_GRPC_SERVER_METRICS_LAYER.clone())
                .build_from_mailbox(indexing_service);
            Some(indexing_service.as_grpc_service(grpc_config.max_message_size))
        } else {
            None
        }
    } else {
        None
    };
    // Mount gRPC ingest service if `QuickwitService::Indexer` is enabled on node.
    let ingest_api_grpc_service = if services
        .node_config
        .is_service_enabled(QuickwitService::Indexer)
    {
        enabled_grpc_services.insert("ingest-api");
        Some(
            services
                .ingest_service
                .as_grpc_service(grpc_config.max_message_size),
        )
    } else {
        None
    };
    let ingest_router_grpc_service = if services
        .node_config
        .is_service_enabled(QuickwitService::Indexer)
    {
        enabled_grpc_services.insert("ingest-router");

        let ingest_router_service = services
            .ingest_router_service
            .as_grpc_service(grpc_config.max_message_size);
        Some(ingest_router_service)
    } else {
        None
    };

    let ingester_grpc_service = if let Some(ingester_service) = services.ingester_service() {
        enabled_grpc_services.insert("ingester");
        file_descriptor_sets.push(quickwit_proto::ingest::INGEST_FILE_DESCRIPTOR_SET);
        let ingester_grpc_service = ingester_service.as_grpc_service(grpc_config.max_message_size);
        Some(ingester_grpc_service)
    } else {
        None
    };

    // Mount gRPC control plane service if `QuickwitService::ControlPlane` is enabled on node.
    let control_plane_grpc_service = if services
        .node_config
        .is_service_enabled(QuickwitService::ControlPlane)
    {
        enabled_grpc_services.insert("control-plane");
        file_descriptor_sets.push(quickwit_proto::control_plane::CONTROL_PLANE_FILE_DESCRIPTOR_SET);

        Some(
            services
                .control_plane_client
                .as_grpc_service(grpc_config.max_message_size),
        )
    } else {
        None
    };
    // Mount gRPC OpenTelemetry OTLP services if present.
    let otlp_trace_grpc_service =
        if let Some(otlp_traces_service) = services.otlp_traces_service_opt.clone() {
            enabled_grpc_services.insert("otlp-traces");
            let trace_service = TraceServiceServer::new(otlp_traces_service)
                .accept_compressed(CompressionEncoding::Gzip)
                .accept_compressed(CompressionEncoding::Zstd)
                .max_decoding_message_size(grpc_config.max_message_size.0 as usize)
                .max_encoding_message_size(grpc_config.max_message_size.0 as usize);
            Some(trace_service)
        } else {
            None
        };
    let otlp_log_grpc_service =
        if let Some(otlp_logs_service) = services.otlp_logs_service_opt.clone() {
            enabled_grpc_services.insert("otlp-logs");
            let logs_service = LogsServiceServer::new(otlp_logs_service)
                .accept_compressed(CompressionEncoding::Gzip)
                .accept_compressed(CompressionEncoding::Zstd)
                .max_decoding_message_size(grpc_config.max_message_size.0 as usize)
                .max_encoding_message_size(grpc_config.max_message_size.0 as usize);
            Some(logs_service)
        } else {
            None
        };
    // Mount gRPC search service if `QuickwitService::Searcher` is enabled on node.
    let search_grpc_service = if services
        .node_config
        .is_service_enabled(QuickwitService::Searcher)
    {
        enabled_grpc_services.insert("search");
        file_descriptor_sets.push(quickwit_proto::search::SEARCH_FILE_DESCRIPTOR_SET);

        let search_service = services.search_service.clone();
        let grpc_search_service = GrpcSearchAdapter::from(search_service);
        Some(
            SearchServiceServer::new(grpc_search_service)
                .max_decoding_message_size(grpc_config.max_message_size.0 as usize)
                .max_encoding_message_size(grpc_config.max_message_size.0 as usize),
        )
    } else {
        None
    };

    // Mount gRPC jaeger service if present.
    let jaeger_grpc_service = if let Some(jaeger_service) = services.jaeger_service_opt.clone() {
        enabled_grpc_services.insert("jaeger");
        Some(SpanReaderPluginServer::new(jaeger_service))
    } else {
        None
    };

    // Mount gRPC jaeger v2 service (TraceReader) if present.
    let jaeger_v2_grpc_service = if let Some(jaeger_service) = services.jaeger_service_opt.clone() {
        enabled_grpc_services.insert("jaeger-v2");
        Some(TraceReaderServer::new(jaeger_service))
    } else {
        None
    };

    let developer_grpc_service = {
        enabled_grpc_services.insert("developer");
        file_descriptor_sets.push(quickwit_proto::developer::DEVELOPER_FILE_DESCRIPTOR_SET);

        let developer_service = DeveloperApiServer::from_services(&services);

        DeveloperServiceClient::new(developer_service)
            .as_grpc_service(DeveloperApiServer::MAX_GRPC_MESSAGE_SIZE)
    };
    enabled_grpc_services.insert("health");
    file_descriptor_sets.push(HEALTH_FILE_DESCRIPTOR_SET);

    enabled_grpc_services.insert("reflection");
    file_descriptor_sets.push(REFLECTION_FILE_DESCRIPTOR_SET);
    let reflection_service = build_reflection_service(&file_descriptor_sets)?;

    let server_router = server
        .add_service(cluster_grpc_service)
        .add_service(developer_grpc_service)
        .add_service(health_service)
        .add_service(reflection_service)
        .add_optional_service(control_plane_grpc_service)
        .add_optional_service(indexing_grpc_service)
        .add_optional_service(ingest_api_grpc_service)
        .add_optional_service(ingest_router_grpc_service)
        .add_optional_service(ingester_grpc_service)
        .add_optional_service(jaeger_grpc_service)
        .add_optional_service(jaeger_v2_grpc_service)
        .add_optional_service(metastore_grpc_service)
        .add_optional_service(otlp_log_grpc_service)
        .add_optional_service(otlp_trace_grpc_service)
        .add_optional_service(search_grpc_service);

    let grpc_listen_addr = tcp_listener.local_addr()?;
    info!(
        enabled_grpc_services=?enabled_grpc_services,
        grpc_listen_addr=?grpc_listen_addr,
        "starting gRPC server listening on {grpc_listen_addr}"
    );
    // nodelay=true and keepalive=None are the default values for Server::builder()
    let tcp_incoming = TcpIncoming::from(tcp_listener)
        .with_nodelay(Some(true))
        .with_keepalive(None);
    let serve_fut = server_router.serve_with_incoming_shutdown(tcp_incoming, shutdown_signal);
    let (serve_res, _trigger_res) = tokio::join!(serve_fut, readiness_trigger);
    serve_res?;
    Ok(())
}

fn build_reflection_service(
    file_descriptor_sets: &[&[u8]],
) -> anyhow::Result<ServerReflectionServer<impl ServerReflection>> {
    let mut builder = tonic_reflection::server::Builder::configure();

    for file_descriptor_set in file_descriptor_sets {
        builder = builder.register_encoded_file_descriptor_set(file_descriptor_set)
    }
    builder
        .build_v1()
        .context("failed to build reflection service")
}


================================================
FILE: quickwit/quickwit-serve/src/health_check_api/handler.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use quickwit_actors::{Healthz, Mailbox};
use quickwit_cluster::Cluster;
use quickwit_indexing::IndexingService;
use quickwit_janitor::JanitorService;
use tracing::error;
use warp::hyper::StatusCode;
use warp::reply::with_status;
use warp::{Filter, Rejection};

use crate::rest::recover_fn;
use crate::with_arg;

#[derive(utoipa::OpenApi)]
#[openapi(paths(get_liveness, get_readiness))]
pub struct HealthCheckApi;

/// Health check handlers.
pub(crate) fn health_check_handlers(
    cluster: Cluster,
    indexer_service_opt: Option<Mailbox<IndexingService>>,
    janitor_service_opt: Option<Mailbox<JanitorService>>,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    liveness_handler(indexer_service_opt, janitor_service_opt).or(readiness_handler(cluster))
}

fn liveness_handler(
    indexer_service_opt: Option<Mailbox<IndexingService>>,
    janitor_service_opt: Option<Mailbox<JanitorService>>,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    warp::path!("health" / "livez")
        .and(warp::get())
        .and(with_arg(indexer_service_opt))
        .and(with_arg(janitor_service_opt))
        .then(get_liveness)
        .recover(recover_fn)
}

fn readiness_handler(
    cluster: Cluster,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    warp::path!("health" / "readyz")
        .and(warp::get())
        .and(with_arg(cluster))
        .then(get_readiness)
        .recover(recover_fn)
}

#[utoipa::path(
    get,
    tag = "Node Health",
    path = "/livez",
    responses(
        (status = 200, description = "The service is live.", body = bool),
        (status = 503, description = "The service is not live.", body = bool),
    ),
)]
/// Get Node Liveliness
async fn get_liveness(
    indexer_service_opt: Option<Mailbox<IndexingService>>,
    janitor_service_opt: Option<Mailbox<JanitorService>>,
) -> impl warp::Reply {
    let mut is_live = true;

    if let Some(indexer_service) = indexer_service_opt
        && !indexer_service.ask(Healthz).await.unwrap_or(false)
    {
        error!("indexer service is unhealthy");
        is_live = false;
    }
    if let Some(janitor_service) = janitor_service_opt
        && !janitor_service.ask(Healthz).await.unwrap_or(false)
    {
        error!("janitor service is unhealthy");
        is_live = false;
    }
    let status_code = if is_live {
        StatusCode::OK
    } else {
        StatusCode::SERVICE_UNAVAILABLE
    };
    with_status(warp::reply::json(&is_live), status_code)
}

#[utoipa::path(
    get,
    tag = "Node Health",
    path = "/readyz",
    responses(
        (status = 200, description = "The service is ready.", body = bool),
        (status = 503, description = "The service is not ready.", body = bool),
    ),
)]
/// Get Node Readiness
async fn get_readiness(cluster: Cluster) -> impl warp::Reply {
    let is_ready = cluster.is_self_node_ready().await;
    let status_code = if is_ready {
        StatusCode::OK
    } else {
        StatusCode::SERVICE_UNAVAILABLE
    };
    with_status(warp::reply::json(&is_ready), status_code)
}

#[cfg(test)]
mod tests {

    use quickwit_cluster::{ChannelTransport, create_cluster_for_test};

    #[tokio::test]
    async fn test_rest_search_api_health_checks() {
        let transport = ChannelTransport::default();
        let cluster = create_cluster_for_test(Vec::new(), &[], &transport, false)
            .await
            .unwrap();
        let health_check_handler = super::health_check_handlers(cluster.clone(), None, None);
        let resp = warp::test::request()
            .path("/health/livez")
            .reply(&health_check_handler)
            .await;
        assert_eq!(resp.status(), 200);
        let resp = warp::test::request()
            .path("/health/readyz")
            .reply(&health_check_handler)
            .await;
        assert_eq!(resp.status(), 503);
        cluster.set_self_node_readiness(true).await;
        let resp = warp::test::request()
            .path("/health/readyz")
            .reply(&health_check_handler)
            .await;
        assert_eq!(resp.status(), 200);
    }
}


================================================
FILE: quickwit/quickwit-serve/src/health_check_api/mod.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

mod handler;

pub(crate) use handler::{HealthCheckApi, health_check_handlers};


================================================
FILE: quickwit/quickwit-serve/src/index_api/index_resource.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::sync::Arc;

use bytes::Bytes;
use quickwit_common::uri::Uri;
use quickwit_config::{
    ConfigFormat, NodeConfig, load_index_config_update, validate_index_id_pattern,
};
use quickwit_index_management::{IndexService, IndexServiceError};
use quickwit_metastore::{
    IndexMetadata, IndexMetadataResponseExt, ListIndexesMetadataResponseExt, ListSplitsQuery,
    ListSplitsRequestExt, MetastoreServiceStreamSplitsExt, Split, SplitInfo, SplitState,
};
use quickwit_proto::metastore::{
    IndexMetadataRequest, ListIndexesMetadataRequest, ListSplitsRequest, MetastoreError,
    MetastoreResult, MetastoreService, MetastoreServiceClient,
};
use quickwit_proto::types::IndexId;
use serde::{Deserialize, Serialize};
use tracing::info;
use warp::{Filter, Rejection};

use super::rest_handler::log_failure;
use crate::format::{extract_config_format, extract_format_from_qs};
use crate::rest_api_response::into_rest_api_response;
use crate::simple_list::from_simple_list;
use crate::with_arg;

pub fn get_index_metadata_handler(
    metastore: MetastoreServiceClient,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    warp::path!("indexes" / String)
        .and(warp::get())
        .and(with_arg(metastore))
        .then(get_index_metadata)
        .and(extract_format_from_qs())
        .map(into_rest_api_response)
        .boxed()
}

pub async fn get_index_metadata(
    index_id: IndexId,
    metastore: MetastoreServiceClient,
) -> MetastoreResult<IndexMetadata> {
    info!(index_id = %index_id, "get-index-metadata");
    let index_metadata_request = IndexMetadataRequest::for_index_id(index_id.to_string());
    let index_metadata = metastore
        .index_metadata(index_metadata_request)
        .await?
        .deserialize_index_metadata()?;
    Ok(index_metadata)
}

/// This struct represents the QueryString passed to
/// the rest API to filter indexes.
#[derive(Debug, Clone, Deserialize, Serialize, utoipa::IntoParams, utoipa::ToSchema, Default)]
#[into_params(parameter_in = Query)]
pub struct ListIndexesQueryParams {
    #[serde(deserialize_with = "from_simple_list")]
    #[serde(skip_serializing_if = "Option::is_none")]
    #[serde(default)]
    pub index_id_patterns: Option<Vec<String>>,
}

pub fn list_indexes_metadata_handler(
    metastore: MetastoreServiceClient,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    warp::path!("indexes")
        .and(warp::get())
        .and(warp::query())
        .and(with_arg(metastore))
        .then(list_indexes_metadata)
        .and(extract_format_from_qs())
        .map(into_rest_api_response)
        .boxed()
}

/// Describes an index with its main information and statistics.
#[derive(Serialize, Deserialize, utoipa::ToSchema)]
pub struct IndexStats {
    #[schema(value_type = String)]
    pub index_id: IndexId,
    #[schema(value_type = String)]
    pub index_uri: Uri,
    pub num_published_splits: usize,
    pub size_published_splits: u64,
    pub num_published_docs: u64,
    pub size_published_docs_uncompressed: u64,
    pub timestamp_field_name: Option<String>,
    pub min_timestamp: Option<i64>,
    pub max_timestamp: Option<i64>,
}

#[utoipa::path(
    get,
    tag = "Indexes",
    path = "/indexes/{index_id}/describe",
    responses(
        (status = 200, description = "Successfully fetched stats about Index.", body = IndexStats)
    ),
    params(
        ("index_id" = String, Path, description = "The index ID to describe."),
    )
)]

/// Describes an index.
pub async fn describe_index(
    index_id: IndexId,
    metastore: MetastoreServiceClient,
) -> MetastoreResult<IndexStats> {
    let index_metadata_request = IndexMetadataRequest::for_index_id(index_id.to_string());
    let index_metadata = metastore
        .index_metadata(index_metadata_request)
        .await?
        .deserialize_index_metadata()?;
    let query = ListSplitsQuery::for_index(index_metadata.index_uid.clone());
    let list_splits_request = ListSplitsRequest::try_from_list_splits_query(&query)?;
    let splits = metastore
        .list_splits(list_splits_request)
        .await?
        .collect_splits()
        .await?;
    let published_splits: Vec<Split> = splits
        .into_iter()
        .filter(|split| split.split_state == SplitState::Published)
        .collect();
    let mut total_num_docs = 0;
    let mut total_num_bytes = 0;
    let mut total_uncompressed_num_bytes = 0;
    let mut min_timestamp: Option<i64> = None;
    let mut max_timestamp: Option<i64> = None;

    for split in &published_splits {
        total_num_docs += split.split_metadata.num_docs as u64;
        total_num_bytes += split.split_metadata.footer_offsets.end;
        total_uncompressed_num_bytes += split.split_metadata.uncompressed_docs_size_in_bytes;

        if let Some(time_range) = &split.split_metadata.time_range {
            min_timestamp = min_timestamp
                .min(Some(*time_range.start()))
                .or(Some(*time_range.start()));
            max_timestamp = max_timestamp
                .max(Some(*time_range.end()))
                .or(Some(*time_range.end()));
        }
    }

    let index_config = index_metadata.into_index_config();
    let index_stats = IndexStats {
        index_id,
        index_uri: index_config.index_uri.clone(),
        num_published_splits: published_splits.len(),
        size_published_splits: total_num_bytes,
        num_published_docs: total_num_docs,
        size_published_docs_uncompressed: total_uncompressed_num_bytes,
        timestamp_field_name: index_config.doc_mapping.timestamp_field,
        min_timestamp,
        max_timestamp,
    };

    Ok(index_stats)
}

pub fn describe_index_handler(
    metastore: MetastoreServiceClient,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    warp::path!("indexes" / String / "describe")
        .and(warp::get())
        .and(with_arg(metastore))
        .then(describe_index)
        .and(extract_format_from_qs())
        .map(into_rest_api_response)
        .boxed()
}

#[utoipa::path(
    get,
    tag = "Indexes",
    path = "/indexes",
    responses(
        // We return `VersionedIndexMetadata` as it's the serialized model view.
        (status = 200, description = "Successfully fetched all indexes.", body = [VersionedIndexMetadata])
    ),
    params(
        ListIndexesQueryParams,
        ("index_id_patterns" = String, Path, description = "The index ID pattern to retrieve indexes for."),
    )
)]
/// Gets indexes metadata.
pub async fn list_indexes_metadata(
    list_indexes_params: ListIndexesQueryParams,
    metastore: MetastoreServiceClient,
) -> MetastoreResult<Vec<IndexMetadata>> {
    let list_indexes_metata_request =
        if let Some(index_id_patterns) = list_indexes_params.index_id_patterns {
            for index_id_pattern in &index_id_patterns {
                validate_index_id_pattern(index_id_pattern, true).map_err(|error| {
                    MetastoreError::InvalidArgument {
                        message: error.to_string(),
                    }
                })?;
            }
            ListIndexesMetadataRequest { index_id_patterns }
        } else {
            ListIndexesMetadataRequest::all()
        };
    metastore
        .list_indexes_metadata(list_indexes_metata_request)
        .await?
        .deserialize_indexes_metadata()
        .await
}

#[derive(Deserialize, utoipa::IntoParams, utoipa::ToSchema)]
#[into_params(parameter_in = Query)]
pub struct CreateIndexQueryParams {
    #[serde(default)]
    overwrite: bool,
}

pub fn create_index_handler(
    index_service: IndexService,
    node_config: Arc<NodeConfig>,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    warp::path!("indexes")
        .and(warp::post())
        .and(warp::query())
        .and(extract_config_format())
        .and(warp::body::content_length_limit(1024 * 1024))
        .and(warp::filters::body::bytes())
        .and(with_arg(index_service))
        .and(with_arg(node_config))
        .then(create_index)
        .map(log_failure("failed to create index"))
        .and(extract_format_from_qs())
        .map(into_rest_api_response)
        .boxed()
}

#[utoipa::path(
    post,
    tag = "Indexes",
    path = "/indexes",
    request_body = VersionedIndexConfig,
    responses(
        // We return `VersionedIndexMetadata` as it's the serialized model view.
        (status = 200, description = "Successfully created index.", body = VersionedIndexMetadata)
    ),
    params(
        CreateIndexQueryParams,
    )
)]
/// Creates index.
pub async fn create_index(
    create_index_query_params: CreateIndexQueryParams,
    config_format: ConfigFormat,
    index_config_bytes: Bytes,
    mut index_service: IndexService,
    node_config: Arc<NodeConfig>,
) -> Result<IndexMetadata, IndexServiceError> {
    let index_config = quickwit_config::load_index_config_from_user_config(
        config_format,
        &index_config_bytes,
        &node_config.default_index_root_uri,
    )
    .map_err(IndexServiceError::InvalidConfig)?;
    info!(index_id = %index_config.index_id, overwrite = create_index_query_params.overwrite, "create-index");
    index_service
        .create_index(index_config, create_index_query_params.overwrite)
        .await
}

/// Query parameters for update index queries
#[derive(Deserialize, Debug, Eq, PartialEq, utoipa::IntoParams)]
#[into_params(parameter_in = Query)]
pub struct UpdateQueryParams {
    /// Create the index if it doesn't exist yet
    #[serde(default)]
    pub create: bool,
}

fn update_index_qp() -> impl Filter<Extract = (UpdateQueryParams,), Error = Rejection> + Clone {
    warp::query::<UpdateQueryParams>()
}

pub fn update_index_handler(
    index_service: IndexService,
    node_config: Arc<NodeConfig>,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    warp::path!("indexes" / String)
        .and(warp::put())
        .and(extract_config_format())
        .and(update_index_qp())
        .and(warp::body::content_length_limit(1024 * 1024))
        .and(warp::filters::body::bytes())
        .and(with_arg(index_service))
        .and(with_arg(node_config))
        .then(update_index)
        .map(log_failure("failed to update index"))
        .and(extract_format_from_qs())
        .map(into_rest_api_response)
        .boxed()
}

#[utoipa::path(
    put,
    tag = "Indexes",
    path = "/indexes/{index_id}",
    request_body = VersionedIndexConfig,
    responses(
        (status = 200, description = "Successfully updated the index configuration.", body = VersionedIndexMetadata)
    ),
    params(
        ("index_id" = String, Path, description = "The index ID to update."),
        UpdateQueryParams,
    )
)]
/// Updates an existing index.
///
/// This endpoint follows PUT semantics, which means that all the fields of the
/// current configuration are replaced by the values specified in this request
/// or the associated defaults. In particular, if the field is optional (e.g.
/// `retention_policy`), omitting it will delete the associated configuration.
/// If the new configuration file contains updates that cannot be applied, the
/// request fails, and none of the updates are applied.
pub async fn update_index(
    target_index_id: IndexId,
    config_format: ConfigFormat,
    query_params: UpdateQueryParams,
    index_config_bytes: Bytes,
    mut index_service: IndexService,
    node_config: Arc<NodeConfig>,
) -> Result<IndexMetadata, IndexServiceError> {
    info!(index_id = %target_index_id, "update-index");

    let metastore = index_service.metastore();
    let index_metadata_request = IndexMetadataRequest::for_index_id(target_index_id.to_string());
    let current_index_metadata_res = metastore.index_metadata(index_metadata_request).await;

    let current_index_metadata_ser = match current_index_metadata_res {
        Ok(index_metadata) => index_metadata,
        Err(MetastoreError::NotFound(_)) if query_params.create => {
            let index_config = quickwit_config::load_index_config_from_user_config(
                config_format,
                &index_config_bytes,
                &node_config.default_index_root_uri,
            )
            .map_err(IndexServiceError::InvalidConfig)?;
            if index_config.index_id != target_index_id {
                return Err(IndexServiceError::InvalidConfig(anyhow::anyhow!(
                    "`index_id` in config file does not match index_id from query path"
                )));
            }
            info!(index_id = %index_config.index_id, "create-index-on-update");
            match index_service.create_index(index_config, false).await {
                Err(IndexServiceError::Metastore(MetastoreError::AlreadyExists(_))) => {
                    // If the index was created just after we tried to update it, try to update as
                    // if nothing happened. But if it gets deleted again before we update it, just
                    // error out
                    let index_metadata_request =
                        IndexMetadataRequest::for_index_id(target_index_id.to_string());
                    metastore.index_metadata(index_metadata_request).await?
                }
                other => return other,
            }
        }
        Err(e) => return Err(e.into()),
    };
    let current_index_metadata = current_index_metadata_ser.deserialize_index_metadata()?;
    let index_uid = current_index_metadata.index_uid.clone();
    let current_index_config = current_index_metadata.into_index_config();

    let new_index_config = load_index_config_update(
        config_format,
        &index_config_bytes,
        &node_config.default_index_root_uri,
        &current_index_config,
    )
    .map_err(IndexServiceError::InvalidConfig)?;

    let index_metadata = index_service
        .update_index(index_uid, new_index_config)
        .await?;
    Ok(index_metadata)
}

pub fn clear_index_handler(
    index_service: IndexService,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    warp::path!("indexes" / String / "clear")
        .and(warp::put())
        .and(with_arg(index_service))
        .then(clear_index)
        .and(extract_format_from_qs())
        .map(into_rest_api_response)
        .boxed()
}

#[utoipa::path(
    put,
    tag = "Indexes",
    path = "/indexes/{index_id}/clear",
    responses(
        (status = 200, description = "Successfully cleared index.")
    ),
    params(
        ("index_id" = String, Path, description = "The index ID to clear."),
    )
)]
/// Removes all of the data (splits, queued document) associated with the index, but keeps the index
/// configuration. (See also, `delete-index`).
pub async fn clear_index(
    index_id: IndexId,
    mut index_service: IndexService,
) -> Result<(), IndexServiceError> {
    info!(index_id = %index_id, "clear-index");
    index_service.clear_index(&index_id).await
}

#[derive(Deserialize, utoipa::IntoParams, utoipa::ToSchema)]
#[into_params(parameter_in = Query)]
pub struct DeleteIndexQueryParam {
    #[serde(default)]
    dry_run: bool,
}

pub fn delete_index_handler(
    index_service: IndexService,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    warp::path!("indexes" / String)
        .and(warp::delete())
        .and(warp::query())
        .and(with_arg(index_service))
        .then(delete_index)
        .and(extract_format_from_qs())
        .map(into_rest_api_response)
        .boxed()
}

#[utoipa::path(
    delete,
    tag = "Indexes",
    path = "/indexes/{index_id}",
    responses(
        // We return `VersionedIndexMetadata` as it's the serialized model view.
        (status = 200, description = "Successfully deleted index.", body = [FileEntry])
    ),
    params(
        DeleteIndexQueryParam,
        ("index_id" = String, Path, description = "The index ID to delete."),
    )
)]
/// Deletes index.
pub async fn delete_index(
    index_id: IndexId,
    delete_index_query_param: DeleteIndexQueryParam,
    mut index_service: IndexService,
) -> Result<Vec<SplitInfo>, IndexServiceError> {
    info!(index_id = %index_id, dry_run = delete_index_query_param.dry_run, "delete-index");
    index_service
        .delete_index(&index_id, delete_index_query_param.dry_run)
        .await
}


================================================
FILE: quickwit/quickwit-serve/src/index_api/mod.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

mod index_resource;
mod rest_handler;
mod source_resource;
mod split_resource;

pub use self::index_resource::get_index_metadata_handler;
pub use self::rest_handler::{IndexApi, index_management_handlers};
pub use self::split_resource::{ListSplitsQueryParams, ListSplitsResponse};


================================================
FILE: quickwit/quickwit-serve/src/index_api/rest_handler.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::sync::Arc;

use quickwit_config::NodeConfig;
use quickwit_doc_mapper::{TokenizerConfig, analyze_text};
use quickwit_index_management::{IndexService, IndexServiceError};
use quickwit_query::query_ast::{QueryAst, query_ast_from_user_text};
use serde::Deserialize;
use serde::de::DeserializeOwned;
use tracing::warn;
use warp::{Filter, Rejection};

use super::get_index_metadata_handler;
use super::index_resource::{
    __path_clear_index, __path_create_index, __path_delete_index, __path_describe_index,
    __path_list_indexes_metadata, __path_update_index, IndexStats, clear_index_handler,
    create_index_handler, delete_index_handler, describe_index_handler,
    list_indexes_metadata_handler, update_index_handler,
};
use super::source_resource::{
    __path_create_source, __path_delete_source, __path_reset_source_checkpoint,
    __path_toggle_source, __path_update_source, ToggleSource, create_source_handler,
    delete_source_handler, get_source_handler, get_source_shards_handler,
    reset_source_checkpoint_handler, toggle_source_handler, update_source_handler,
};
use super::split_resource::{
    __path_list_splits, __path_mark_splits_for_deletion, SplitsForDeletion, list_splits_handler,
    mark_splits_for_deletion_handler,
};
use crate::format::extract_format_from_qs;
use crate::rest::recover_fn;
use crate::rest_api_response::into_rest_api_response;
use crate::simple_list::from_simple_list;

#[derive(utoipa::OpenApi)]
#[openapi(
    paths(
        create_index,
        update_index,
        clear_index,
        delete_index,
        list_indexes_metadata,
        list_splits,
        describe_index,
        mark_splits_for_deletion,
        create_source,
        update_source,
        reset_source_checkpoint,
        toggle_source,
        delete_source,
    ),
    components(schemas(ToggleSource, SplitsForDeletion, IndexStats))
)]
pub struct IndexApi;

pub fn log_failure<T, E: std::fmt::Display>(
    message: &'static str,
) -> impl Fn(Result<T, E>) -> Result<T, E> + Clone {
    move |result| {
        if let Err(err) = &result {
            warn!("{message}: {err}");
        };
        result
    }
}

pub fn json_body<T: DeserializeOwned + Send>()
-> impl Filter<Extract = (T,), Error = warp::Rejection> + Clone {
    warp::body::content_length_limit(1024 * 1024).and(warp::body::json())
}

pub fn index_management_handlers(
    index_service: IndexService,
    node_config: Arc<NodeConfig>,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    // Indexes handlers.
    get_index_metadata_handler(index_service.metastore())
        .or(list_indexes_metadata_handler(index_service.metastore()))
        .or(create_index_handler(
            index_service.clone(),
            node_config.clone(),
        ))
        .or(update_index_handler(index_service.clone(), node_config))
        .or(clear_index_handler(index_service.clone()))
        .or(delete_index_handler(index_service.clone()))
        .boxed()
        // Splits handlers
        .or(list_splits_handler(index_service.metastore()))
        .or(describe_index_handler(index_service.metastore()))
        .or(mark_splits_for_deletion_handler(index_service.metastore()))
        .boxed()
        // Sources handlers.
        .or(reset_source_checkpoint_handler(index_service.metastore()))
        .or(toggle_source_handler(index_service.metastore()))
        .or(create_source_handler(index_service.clone()))
        .or(update_source_handler(index_service.clone()))
        .or(get_source_handler(index_service.metastore()))
        .or(delete_source_handler(index_service.metastore()))
        .or(get_source_shards_handler(index_service.metastore()))
        .boxed()
        // Tokenizer handlers.
        .or(analyze_request_handler())
        // Parse query into query AST handler.
        .or(parse_query_request_handler())
        .recover(recover_fn)
        .boxed()
}

#[derive(Debug, Deserialize, utoipa::IntoParams, utoipa::ToSchema)]
struct AnalyzeRequest {
    /// The tokenizer to use.
    #[serde(flatten)]
    pub tokenizer_config: TokenizerConfig,
    /// The text to analyze.
    pub text: String,
}

fn analyze_request_filter() -> impl Filter<Extract = (AnalyzeRequest,), Error = Rejection> + Clone {
    warp::path!("analyze")
        .and(warp::post())
        .and(warp::body::json())
}

fn analyze_request_handler() -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone
{
    analyze_request_filter()
        .then(analyze_request)
        .and(extract_format_from_qs())
        .map(into_rest_api_response)
        .boxed()
}

/// Analyzes text with given tokenizer config and returns the list of tokens.
#[utoipa::path(
    post,
    tag = "analyze",
    path = "/analyze",
    request_body = AnalyzeRequest,
    responses(
        (status = 200, description = "Successfully analyze text.")
    ),
)]
async fn analyze_request(request: AnalyzeRequest) -> Result<serde_json::Value, IndexServiceError> {
    let tokens = analyze_text(&request.text, &request.tokenizer_config)
        .map_err(|err| IndexServiceError::Internal(format!("{err:?}")))?;
    let json_value = serde_json::to_value(tokens)
        .map_err(|err| IndexServiceError::Internal(format!("cannot serialize tokens: {err}")))?;
    Ok(json_value)
}

#[derive(Debug, Deserialize, utoipa::IntoParams, utoipa::ToSchema)]
struct ParseQueryRequest {
    /// Query text. The query language is that of tantivy.
    pub query: String,
    // Fields to search on.
    #[param(rename = "search_field")]
    #[serde(default)]
    #[serde(rename(deserialize = "search_field"))]
    #[serde(deserialize_with = "from_simple_list")]
    pub search_fields: Option<Vec<String>>,
}

fn parse_query_request_filter()
-> impl Filter<Extract = (ParseQueryRequest,), Error = Rejection> + Clone {
    warp::path!("parse-query")
        .and(warp::post())
        .and(warp::body::json())
}

fn parse_query_request_handler()
-> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    parse_query_request_filter()
        .then(parse_query_request)
        .and(extract_format_from_qs())
        .map(into_rest_api_response)
        .boxed()
}

/// Analyzes text with given tokenizer config and returns the list of tokens.
#[utoipa::path(
    post,
    tag = "parse_query",
    path = "/parse_query",
    request_body = ParseQueryRequest,
    responses(
        (status = 200, description = "Successfully parsed query into AST.")
    ),
)]
async fn parse_query_request(request: ParseQueryRequest) -> Result<QueryAst, IndexServiceError> {
    let query_ast = query_ast_from_user_text(&request.query, request.search_fields)
        .parse_user_query(&[])
        .map_err(|err| IndexServiceError::Internal(err.to_string()))?;
    Ok(query_ast)
}

#[cfg(test)]
mod tests {
    use std::ops::{Bound, RangeInclusive};

    use assert_json_diff::assert_json_include;
    use quickwit_common::ServiceStream;
    use quickwit_common::uri::Uri;
    use quickwit_config::{
        CLI_SOURCE_ID, INGEST_API_SOURCE_ID, NodeConfig, SourceParams, VecSourceParams,
    };
    use quickwit_indexing::{MockSplitBuilder, mock_split};
    use quickwit_metastore::{
        IndexMetadata, IndexMetadataResponseExt, ListIndexesMetadataResponseExt,
        ListSplitsRequestExt, ListSplitsResponseExt, SplitState, metastore_for_test,
    };
    use quickwit_proto::metastore::{
        DeleteSourceRequest, EmptyResponse, EntityKind, IndexMetadataRequest,
        IndexMetadataResponse, ListIndexesMetadataRequest, ListIndexesMetadataResponse,
        ListSplitsRequest, ListSplitsResponse, MarkSplitsForDeletionRequest, MetastoreError,
        MetastoreService, MetastoreServiceClient, MockMetastoreService,
        ResetSourceCheckpointRequest, SourceType, ToggleSourceRequest,
    };
    use quickwit_proto::types::IndexUid;
    use quickwit_storage::StorageResolver;
    use serde_json::Value as JsonValue;

    use super::*;
    use crate::recover_fn;

    #[tokio::test]
    async fn test_get_index() -> anyhow::Result<()> {
        let mut mock_metastore = MockMetastoreService::new();
        mock_metastore.expect_index_metadata().return_once(|_| {
            Ok(
                IndexMetadataResponse::try_from_index_metadata(&IndexMetadata::for_test(
                    "test-index",
                    "ram:///indexes/test-index",
                ))
                .unwrap(),
            )
        });
        let index_service = IndexService::new(
            MetastoreServiceClient::from_mock(mock_metastore),
            StorageResolver::unconfigured(),
        );
        let index_management_handler =
            super::index_management_handlers(index_service, Arc::new(NodeConfig::for_test()))
                .recover(recover_fn);
        let resp = warp::test::request()
            .path("/indexes/test-index")
            .reply(&index_management_handler)
            .await;
        assert_eq!(resp.status(), 200);
        let actual_response_json: JsonValue = serde_json::from_slice(resp.body())?;
        let expected_response_json = serde_json::json!({
            "index_id": "test-index",
            "index_uri": "ram:///indexes/test-index",
        });
        assert_json_include!(
            actual: actual_response_json.get("index_config").unwrap(),
            expected: expected_response_json
        );
        Ok(())
    }

    #[tokio::test]
    async fn test_get_non_existing_index() {
        let metastore = metastore_for_test();
        let index_service = IndexService::new(metastore, StorageResolver::unconfigured());
        let index_management_handler =
            super::index_management_handlers(index_service, Arc::new(NodeConfig::for_test()))
                .recover(recover_fn);
        let resp = warp::test::request()
            .path("/indexes/test-index")
            .reply(&index_management_handler)
            .await;
        assert_eq!(resp.status(), 404);
    }

    #[tokio::test]
    async fn test_get_splits() {
        let mut mock_metastore = MockMetastoreService::new();
        let index_metadata =
            IndexMetadata::for_test("quickwit-demo-index", "ram:///indexes/quickwit-demo-index");
        let index_uid = index_metadata.index_uid.clone();
        mock_metastore
            .expect_index_metadata()
            .returning(move |_| {
                Ok(IndexMetadataResponse::try_from_index_metadata(&index_metadata).unwrap())
            })
            .times(2);
        mock_metastore
            .expect_list_splits()
            .returning(move |list_splits_request: ListSplitsRequest| {
                let list_split_query = list_splits_request.deserialize_list_splits_query().unwrap();
                if list_split_query.index_uids.unwrap().contains(&index_uid)
                    && list_split_query.split_states
                        == vec![SplitState::Published, SplitState::Staged]
                    && list_split_query.time_range.start == Bound::Included(10)
                    && list_split_query.time_range.end == Bound::Excluded(20)
                    && list_split_query.create_timestamp.end == Bound::Excluded(2)
                {
                    let splits = vec![
                        MockSplitBuilder::new("split_1")
                            .with_index_uid(&index_uid)
                            .build(),
                    ];
                    let splits = ListSplitsResponse::try_from_splits(splits).unwrap();
                    return Ok(ServiceStream::from(vec![Ok(splits)]));
                }
                Err(MetastoreError::Internal {
                    message: "".to_string(),
                    cause: "".to_string(),
                })
            })
            .times(2);
        let index_service = IndexService::new(
            MetastoreServiceClient::from_mock(mock_metastore),
            StorageResolver::unconfigured(),
        );
        let index_management_handler =
            super::index_management_handlers(index_service, Arc::new(NodeConfig::for_test()))
                .recover(recover_fn);
        {
            let resp = warp::test::request()
                .path(
                    "/indexes/quickwit-demo-index/splits?split_states=Published,Staged&\
                     start_timestamp=10&end_timestamp=20&end_create_timestamp=2",
                )
                .reply(&index_management_handler)
                .await;
            assert_eq!(resp.status(), 200);
            let actual_response_json: JsonValue = serde_json::from_slice(resp.body()).unwrap();
            let expected_response_json = serde_json::json!({
                "splits": [
                    {
                        "create_timestamp": 0,
                        "split_id": "split_1",
                    }
                ]
            });
            assert_json_include!(
                actual: actual_response_json,
                expected: expected_response_json
            );
        }
        {
            let resp = warp::test::request()
                .path(
                    "/indexes/quickwit-demo-index/splits?split_states=Published&\
                     start_timestamp=11&end_timestamp=20&end_create_timestamp=2",
                )
                .reply(&index_management_handler)
                .await;
            assert_eq!(resp.status(), 500);
        }
    }

    #[tokio::test]
    async fn test_describe_index() -> anyhow::Result<()> {
        let mut mock_metastore = MockMetastoreService::new();
        let index_metadata =
            IndexMetadata::for_test("quickwit-demo-index", "ram:///indexes/quickwit-demo-index");
        let index_uid = index_metadata.index_uid.clone();
        mock_metastore
            .expect_index_metadata()
            .return_once(move |_| {
                Ok(IndexMetadataResponse::try_from_index_metadata(&index_metadata).unwrap())
            });
        let split_1 = MockSplitBuilder::new("split_1")
            .with_index_uid(&index_uid)
            .build();
        let split_1_time_range = split_1.split_metadata.time_range.clone().unwrap();
        let mut split_2 = MockSplitBuilder::new("split_2")
            .with_index_uid(&index_uid)
            .build();
        split_2.split_metadata.time_range = Some(RangeInclusive::new(
            split_1_time_range.start() - 10,
            split_1_time_range.end() + 10,
        ));
        mock_metastore
            .expect_list_splits()
            .withf(move |list_split_request| -> bool {
                let list_split_query = list_split_request.deserialize_list_splits_query().unwrap();
                list_split_query.index_uids.unwrap().contains(&index_uid)
            })
            .return_once(move |_| {
                let splits = vec![split_1, split_2];
                let splits = ListSplitsResponse::try_from_splits(splits).unwrap();
                Ok(ServiceStream::from(vec![Ok(splits)]))
            });

        let index_service = IndexService::new(
            MetastoreServiceClient::from_mock(mock_metastore),
            StorageResolver::unconfigured(),
        );
        let index_management_handler =
            super::index_management_handlers(index_service, Arc::new(NodeConfig::for_test()))
                .recover(recover_fn);
        let resp = warp::test::request()
            .path("/indexes/quickwit-demo-index/describe")
            .reply(&index_management_handler)
            .await;
        assert_eq!(resp.status(), 200);

        let actual_response_json: JsonValue = serde_json::from_slice(resp.body()).unwrap();
        let expected_response_json = serde_json::json!({
            "index_id": "quickwit-demo-index",
            "index_uri": "ram:///indexes/quickwit-demo-index",
            "num_published_splits": 2,
            "size_published_splits": 1600,
            "num_published_docs": 20,
            "size_published_docs_uncompressed": 512,
            "timestamp_field_name": "timestamp",
            "min_timestamp": split_1_time_range.start() - 10,
            "max_timestamp": split_1_time_range.end() + 10,
        });

        assert_eq!(actual_response_json, expected_response_json);
        Ok(())
    }

    #[tokio::test]
    async fn test_get_all_splits() {
        let mut mock_metastore = MockMetastoreService::new();
        let index_metadata =
            IndexMetadata::for_test("quickwit-demo-index", "ram:///indexes/quickwit-demo-index");
        let index_uid = index_metadata.index_uid.clone();
        mock_metastore
            .expect_index_metadata()
            .return_once(move |_| {
                Ok(IndexMetadataResponse::try_from_index_metadata(&index_metadata).unwrap())
            });
        mock_metastore.expect_list_splits().return_once(
            move |list_split_request: ListSplitsRequest| {
                let list_split_query = list_split_request.deserialize_list_splits_query().unwrap();
                if list_split_query.index_uids.unwrap().contains(&index_uid)
                    && list_split_query.split_states.is_empty()
                    && list_split_query.time_range.is_unbounded()
                    && list_split_query.create_timestamp.is_unbounded()
                {
                    return Ok(ServiceStream::empty());
                }
                Err(MetastoreError::Internal {
                    message: "".to_string(),
                    cause: "".to_string(),
                })
            },
        );
        let index_service = IndexService::new(
            MetastoreServiceClient::from_mock(mock_metastore),
            StorageResolver::unconfigured(),
        );
        let index_management_handler =
            super::index_management_handlers(index_service, Arc::new(NodeConfig::for_test()))
                .recover(recover_fn);
        let resp = warp::test::request()
            .path("/indexes/quickwit-demo-index/splits")
            .reply(&index_management_handler)
            .await;
        assert_eq!(resp.status(), 200);
    }

    #[tokio::test]
    async fn test_mark_splits_for_deletion() -> anyhow::Result<()> {
        let mut mock_metastore = MockMetastoreService::new();
        mock_metastore
            .expect_index_metadata()
            .returning(|_| {
                Ok(
                    IndexMetadataResponse::try_from_index_metadata(&IndexMetadata::for_test(
                        "quickwit-demo-index",
                        "ram:///indexes/quickwit-demo-index",
                    ))
                    .unwrap(),
                )
            })
            .times(2);
        mock_metastore
            .expect_mark_splits_for_deletion()
            .returning(
                |mark_splits_for_deletion_request: MarkSplitsForDeletionRequest| {
                    let index_uid: IndexUid = mark_splits_for_deletion_request.index_uid().clone();
                    let split_ids = mark_splits_for_deletion_request.split_ids;
                    if index_uid.index_id == "quickwit-demo-index"
                        && split_ids == ["split-1", "split-2"]
                    {
                        return Ok(EmptyResponse {});
                    }
                    Err(MetastoreError::Internal {
                        message: "".to_string(),
                        cause: "".to_string(),
                    })
                },
            )
            .times(2);
        let index_service = IndexService::new(
            MetastoreServiceClient::from_mock(mock_metastore),
            StorageResolver::unconfigured(),
        );
        let index_management_handler =
            super::index_management_handlers(index_service, Arc::new(NodeConfig::for_test()))
                .recover(recover_fn);
        let resp = warp::test::request()
            .path("/indexes/quickwit-demo-index/splits/mark-for-deletion")
            .method("PUT")
            .json(&true)
            .body(r#"{"split_ids": ["split-1", "split-2"]}"#)
            .reply(&index_management_handler)
            .await;
        assert_eq!(resp.status(), 200);
        let resp = warp::test::request()
            .path("/indexes/quickwit-demo-index/splits/mark-for-deletion")
            .json(&true)
            .body(r#"{"split_ids": [""]}"#)
            .method("PUT")
            .reply(&index_management_handler)
            .await;
        assert_eq!(resp.status(), 500);
        Ok(())
    }

    #[tokio::test]
    async fn test_get_list_indexes() -> anyhow::Result<()> {
        let mut mock_metastore = MockMetastoreService::new();
        mock_metastore
            .expect_list_indexes_metadata()
            .return_once(|list_indexes_request| {
                assert_eq!(
                    list_indexes_request.index_id_patterns,
                    vec!["test-index-*".to_string()]
                );
                let index_metadata =
                    IndexMetadata::for_test("test-index", "ram:///indexes/test-index");
                Ok(ListIndexesMetadataResponse::for_test(vec![index_metadata]))
            });
        let index_service = IndexService::new(
            MetastoreServiceClient::from_mock(mock_metastore),
            StorageResolver::unconfigured(),
        );
        let index_management_handler =
            super::index_management_handlers(index_service, Arc::new(NodeConfig::for_test()))
                .recover(recover_fn);
        let resp = warp::test::request()
            .path("/indexes?index_id_patterns=test-index-*")
            .reply(&index_management_handler)
            .await;
        assert_eq!(resp.status(), 200);
        let actual_response_json: JsonValue = serde_json::from_slice(resp.body())?;
        let actual_response_arr: &Vec<JsonValue> = actual_response_json.as_array().unwrap();
        assert_eq!(actual_response_arr.len(), 1);
        let actual_index_metadata_json: &JsonValue = &actual_response_arr[0];
        let expected_response_json = serde_json::json!({
            "index_id": "test-index",
            "index_uri": "ram:///indexes/test-index",
        });
        assert_json_include!(
            actual: actual_index_metadata_json.get("index_config").unwrap(),
            expected: expected_response_json
        );
        Ok(())
    }

    #[tokio::test]
    async fn test_clear_index() -> anyhow::Result<()> {
        let mut mock_metastore = MockMetastoreService::new();
        mock_metastore.expect_index_metadata().return_once(|_| {
            Ok(
                IndexMetadataResponse::try_from_index_metadata(&IndexMetadata::for_test(
                    "quickwit-demo-index",
                    "file:///path/to/index/quickwit-demo-index",
                ))
                .unwrap(),
            )
        });
        mock_metastore.expect_list_splits().return_once(|_| {
            let splits = ListSplitsResponse::try_from_splits(vec![mock_split("split_1")]).unwrap();
            Ok(ServiceStream::from(vec![Ok(splits)]))
        });
        mock_metastore
            .expect_mark_splits_for_deletion()
            .return_once(|_| Ok(EmptyResponse {}));
        mock_metastore
            .expect_delete_splits()
            .return_once(|_| Ok(EmptyResponse {}));
        mock_metastore
            .expect_reset_source_checkpoint()
            .return_once(|_| Ok(EmptyResponse {}));
        let index_service = IndexService::new(
            MetastoreServiceClient::from_mock(mock_metastore),
            StorageResolver::unconfigured(),
        );
        let index_management_handler =
            super::index_management_handlers(index_service, Arc::new(NodeConfig::for_test()))
                .recover(recover_fn);
        let resp = warp::test::request()
            .path("/indexes/quickwit-demo-index/clear")
            .method("PUT")
            .reply(&index_management_handler)
            .await;
        assert_eq!(resp.status(), 200);
        Ok(())
    }

    #[tokio::test]
    async fn test_delete_index() {
        let mut mock_metastore = MockMetastoreService::new();
        mock_metastore
            .expect_index_metadata()
            .returning(|_| {
                Ok(
                    IndexMetadataResponse::try_from_index_metadata(&IndexMetadata::for_test(
                        "quickwit-demo-index",
                        "file:///path/to/index/quickwit-demo-index",
                    ))
                    .unwrap(),
                )
            })
            .times(2);
        mock_metastore
            .expect_list_splits()
            .returning(|_| {
                let splits =
                    ListSplitsResponse::try_from_splits(vec![mock_split("split_1")]).unwrap();
                Ok(ServiceStream::from(vec![Ok(splits)]))
            })
            .times(3);
        mock_metastore
            .expect_mark_splits_for_deletion()
            .return_once(|_| Ok(EmptyResponse {}));
        mock_metastore
            .expect_delete_splits()
            .return_once(|_| Ok(EmptyResponse {}));
        mock_metastore
            .expect_delete_index()
            .return_once(|_| Ok(EmptyResponse {}));
        let index_service = IndexService::new(
            MetastoreServiceClient::from_mock(mock_metastore),
            StorageResolver::unconfigured(),
        );
        let index_management_handler =
            super::index_management_handlers(index_service, Arc::new(NodeConfig::for_test()))
                .recover(recover_fn);
        {
            // Dry run
            let resp = warp::test::request()
                .path("/indexes/quickwit-demo-index?dry_run=true")
                .method("DELETE")
                .reply(&index_management_handler)
                .await;
            assert_eq!(resp.status(), 200);
            let resp_json: serde_json::Value = serde_json::from_slice(resp.body()).unwrap();
            let expected_response_json = serde_json::json!([{
                "file_name": "split_1.split",
                "file_size_bytes": "800 B",
            }]);
            assert_json_include!(actual: resp_json, expected: expected_response_json);
        }
        {
            let resp = warp::test::request()
                .path("/indexes/quickwit-demo-index")
                .method("DELETE")
                .reply(&index_management_handler)
                .await;
            assert_eq!(resp.status(), 200);
            let resp_json: serde_json::Value = serde_json::from_slice(resp.body()).unwrap();
            let expected_response_json = serde_json::json!([{
                "file_name": "split_1.split",
                "file_size_bytes": "800 B",
            }]);
            assert_json_include!(actual: resp_json, expected: expected_response_json);
        }
    }

    #[tokio::test]
    async fn test_delete_on_non_existing_index() {
        let metastore = metastore_for_test();
        let index_service = IndexService::new(metastore, StorageResolver::unconfigured());
        let index_management_handler =
            super::index_management_handlers(index_service, Arc::new(NodeConfig::for_test()))
                .recover(recover_fn);
        let resp = warp::test::request()
            .path("/indexes/quickwit-demo-index")
            .method("DELETE")
            .reply(&index_management_handler)
            .await;
        assert_eq!(resp.status(), 404);
    }

    #[tokio::test]
    async fn test_create_index_with_overwrite() {
        let metastore = metastore_for_test();
        let index_service = IndexService::new(metastore.clone(), StorageResolver::unconfigured());
        let mut node_config = NodeConfig::for_test();
        node_config.default_index_root_uri = Uri::for_test("file:///default-index-root-uri");
        let index_management_handler =
            super::index_management_handlers(index_service, Arc::new(node_config));
        {
            let resp = warp::test::request()
                .path("/indexes?overwrite=true")
                .method("POST")
                .json(&true)
                .body(r#"{"version": "0.7", "index_id": "hdfs-logs", "doc_mapping": {"field_mappings":[{"name": "timestamp", "type": "i64", "fast": true, "indexed": true}]}}"#)
                .reply(&index_management_handler)
                .await;
            assert_eq!(resp.status(), 200);
        }
        {
            let resp = warp::test::request()
                .path("/indexes?overwrite=true")
                .method("POST")
                .json(&true)
                .body(r#"{"version": "0.7", "index_id": "hdfs-logs", "doc_mapping": {"field_mappings":[{"name": "timestamp", "type": "i64", "fast": true, "indexed": true}]}}"#)
                .reply(&index_management_handler)
                .await;
            assert_eq!(resp.status(), 200);
        }
        {
            let resp = warp::test::request()
                .path("/indexes")
                .method("POST")
                .json(&true)
                .body(r#"{"version": "0.7", "index_id": "hdfs-logs", "doc_mapping": {"field_mappings":[{"name": "timestamp", "type": "i64", "fast": true, "indexed": true}]}}"#)
                .reply(&index_management_handler)
                .await;
            assert_eq!(resp.status(), 400);
        }
    }

    #[tokio::test]
    async fn test_create_delete_index_and_source() {
        let metastore = metastore_for_test();
        let index_service = IndexService::new(metastore.clone(), StorageResolver::unconfigured());
        let mut node_config = NodeConfig::for_test();
        node_config.default_index_root_uri = Uri::for_test("file:///default-index-root-uri");
        let index_management_handler =
            super::index_management_handlers(index_service, Arc::new(node_config));
        let resp = warp::test::request()
            .path("/indexes")
            .method("POST")
            .json(&true)
            .body(r#"{"version": "0.7", "index_id": "hdfs-logs", "doc_mapping": {"field_mappings":[{"name": "timestamp", "type": "i64", "fast": true, "indexed": true}]}}"#)
            .reply(&index_management_handler)
            .await;
        assert_eq!(resp.status(), 200);
        let resp_json: serde_json::Value = serde_json::from_slice(resp.body()).unwrap();
        let expected_response_json = serde_json::json!({
            "index_config": {
                "index_id": "hdfs-logs",
                "index_uri": "file:///default-index-root-uri/hdfs-logs",
            }
        });
        assert_json_include!(actual: resp_json, expected: expected_response_json);

        // Create source.
        let source_config_body = r#"{"version": "0.7", "source_id": "vec-source", "source_type": "vec", "params": {"docs": [], "batch_num_docs": 10}}"#;
        let resp = warp::test::request()
            .path("/indexes/hdfs-logs/sources")
            .method("POST")
            .json(&true)
            .body(source_config_body)
            .reply(&index_management_handler)
            .await;
        assert_eq!(resp.status(), 200);

        // Get source.
        let resp = warp::test::request()
            .path("/indexes/hdfs-logs/sources/vec-source")
            .method("GET")
            .reply(&index_management_handler)
            .await;
        assert_eq!(resp.status(), 200);

        // Check that the source has been added to index metadata.
        let index_metadata = metastore
            .index_metadata(IndexMetadataRequest::for_index_id("hdfs-logs".to_string()))
            .await
            .unwrap()
            .deserialize_index_metadata()
            .unwrap();
        assert!(index_metadata.sources.contains_key("vec-source"));
        let source_config = index_metadata.sources.get("vec-source").unwrap();
        assert_eq!(source_config.source_type(), SourceType::Vec);
        assert_eq!(
            source_config.source_params,
            SourceParams::Vec(VecSourceParams {
                docs: Vec::new(),
                batch_num_docs: 10,
                partition: "".to_string(),
            })
        );

        // Check delete source.
        let resp = warp::test::request()
            .path("/indexes/hdfs-logs/sources/vec-source")
            .method("DELETE")
            .body(source_config_body)
            .reply(&index_management_handler)
            .await;
        assert_eq!(resp.status(), 200);
        let index_metadata = metastore
            .index_metadata(IndexMetadataRequest::for_index_id("hdfs-logs".to_string()))
            .await
            .unwrap()
            .deserialize_index_metadata()
            .unwrap();
        assert!(!index_metadata.sources.contains_key("file-source"));

        // Check cannot delete source managed by Quickwit.
        let resp = warp::test::request()
            .path(format!("/indexes/hdfs-logs/sources/{INGEST_API_SOURCE_ID}").as_str())
            .method("DELETE")
            .body(source_config_body)
            .reply(&index_management_handler)
            .await;
        assert_eq!(resp.status(), 403);

        let resp = warp::test::request()
            .path(format!("/indexes/hdfs-logs/sources/{CLI_SOURCE_ID}").as_str())
            .method("DELETE")
            .body(source_config_body)
            .reply(&index_management_handler)
            .await;
        assert_eq!(resp.status(), 403);

        // Check get a non existing source returns 404.
        let resp = warp::test::request()
            .path("/indexes/hdfs-logs/sources/file-source")
            .method("GET")
            .body(source_config_body)
            .reply(&index_management_handler)
            .await;
        assert_eq!(resp.status(), 404);

        // Check delete index.
        let resp = warp::test::request()
            .path("/indexes/hdfs-logs")
            .method("DELETE")
            .body(source_config_body)
            .reply(&index_management_handler)
            .await;
        assert_eq!(resp.status(), 200);
        let indexes = metastore
            .list_indexes_metadata(ListIndexesMetadataRequest::all())
            .await
            .unwrap()
            .deserialize_indexes_metadata()
            .await
            .unwrap();
        assert!(indexes.is_empty());
    }

    #[tokio::test]
    async fn test_create_index_with_yaml() {
        let metastore = metastore_for_test();
        let index_service = IndexService::new(metastore.clone(), StorageResolver::unconfigured());
        let mut node_config = NodeConfig::for_test();
        node_config.default_index_root_uri = Uri::for_test("file:///default-index-root-uri");
        let index_management_handler =
            super::index_management_handlers(index_service, Arc::new(node_config))
                .recover(recover_fn);
        let resp = warp::test::request()
            .path("/indexes")
            .method("POST")
            .header("content-type", "application/yaml")
            .body(
                r#"
            version: 0.8
            index_id: hdfs-logs
            doc_mapping:
              field_mappings:
                - name: timestamp
                  type: i64
                  fast: true
                  indexed: true
            "#,
            )
            .reply(&index_management_handler)
            .await;
        assert_eq!(resp.status(), 200);
        let resp_json: serde_json::Value = serde_json::from_slice(resp.body()).unwrap();
        let expected_response_json = serde_json::json!({
            "index_config": {
                "index_id": "hdfs-logs",
                "index_uri": "file:///default-index-root-uri/hdfs-logs",
            }
        });
        assert_json_include!(actual: resp_json, expected: expected_response_json);
    }

    #[tokio::test]
    async fn test_create_index_and_source_with_toml() {
        let metastore = metastore_for_test();
        let index_service = IndexService::new(metastore.clone(), StorageResolver::unconfigured());
        let mut node_config = NodeConfig::for_test();
        node_config.default_index_root_uri = Uri::for_test("file:///default-index-root-uri");
        let index_management_handler =
            super::index_management_handlers(index_service, Arc::new(node_config))
                .recover(recover_fn);
        let resp = warp::test::request()
            .path("/indexes")
            .method("POST")
            .header("content-type", "application/toml")
            .body(
                r#"
            version = "0.7"
            index_id = "hdfs-logs"
            [doc_mapping]
            field_mappings = [
                { name = "timestamp", type = "i64", fast = true, indexed = true}
            ]
            "#,
            )
            .reply(&index_management_handler)
            .await;
        assert_eq!(resp.status(), 200);
        let resp_json: serde_json::Value = serde_json::from_slice(resp.body()).unwrap();
        let expected_response_json = serde_json::json!({
            "index_config": {
                "index_id": "hdfs-logs",
                "index_uri": "file:///default-index-root-uri/hdfs-logs",
            }
        });
        assert_json_include!(actual: resp_json, expected: expected_response_json);
    }

    #[tokio::test]
    async fn test_create_index_with_wrong_content_type() {
        let metastore = metastore_for_test();
        let index_service = IndexService::new(metastore.clone(), StorageResolver::unconfigured());
        let mut node_config = NodeConfig::for_test();
        node_config.default_index_root_uri = Uri::for_test("file:///default-index-root-uri");
        let index_management_handler =
            super::index_management_handlers(index_service, Arc::new(node_config))
                .recover(recover_fn);
        let resp = warp::test::request()
            .path("/indexes")
            .method("POST")
            .header("content-type", "application/yoml")
            .body(r#""#)
            .reply(&index_management_handler)
            .await;
        assert_eq!(resp.status(), 415);
        let body = std::str::from_utf8(resp.body()).unwrap();
        assert!(body.contains("content-type is not supported"));
    }

    #[tokio::test]
    async fn test_create_index_with_bad_config() -> anyhow::Result<()> {
        let index_service = IndexService::new(
            MetastoreServiceClient::mocked(),
            StorageResolver::unconfigured(),
        );
        let index_management_handler =
            super::index_management_handlers(index_service, Arc::new(NodeConfig::for_test()))
                .recover(recover_fn);
        let resp = warp::test::request()
            .path("/indexes")
            .method("POST")
            .json(&true)
            .body(
                r#"{"version": "0.7", "index_id": "hdfs-log", "doc_mapping":
    {"field_mappings":[{"name": "timestamp", "type": "unknown", "fast": true, "indexed":
    true}]}}"#,
            )
            .reply(&index_management_handler)
            .await;
        assert_eq!(resp.status(), 400);
        let body = std::str::from_utf8(resp.body()).unwrap();
        assert!(body.contains("field `timestamp` has an unknown type"));
        Ok(())
    }

    #[tokio::test]
    async fn test_update_index() {
        let metastore = metastore_for_test();
        let index_service = IndexService::new(metastore.clone(), StorageResolver::unconfigured());
        let mut node_config = NodeConfig::for_test();
        node_config.default_index_root_uri = Uri::for_test("file:///default-index-root-uri");
        let index_management_handler =
            super::index_management_handlers(index_service, Arc::new(node_config));
        {
            let resp = warp::test::request()
                .path("/indexes")
                .method("POST")
                .json(&true)
                .body(r#"{"version": "0.7", "index_id": "hdfs-logs", "doc_mapping": {"field_mappings":[{"name": "timestamp", "type": "i64", "fast": true, "indexed": true}]},"search_settings":{"default_search_fields":["body"]}}"#)
                .reply(&index_management_handler)
                .await;
            assert_eq!(resp.status(), 200);
            let resp_json: serde_json::Value = serde_json::from_slice(resp.body()).unwrap();
            let expected_response_json = serde_json::json!({
                "index_config": {
                    "search_settings": {
                        "default_search_fields": ["body"]
                    }
                }
            });
            assert_json_include!(actual: resp_json, expected: expected_response_json);
        }
        {
            let resp = warp::test::request()
                .path("/indexes/hdfs-logs")
                .method("PUT")
                .json(&true)
                .body(r#"{"version": "0.7", "index_id": "hdfs-logs", "doc_mapping": {"field_mappings":[{"name": "timestamp", "type": "i64", "fast": true, "indexed": true}]},"search_settings":{"default_search_fields":["severity_text", "body"]}}"#)
                .reply(&index_management_handler)
                .await;
            assert_eq!(resp.status(), 200);
            let resp_json: serde_json::Value = serde_json::from_slice(resp.body()).unwrap();
            let expected_response_json = serde_json::json!({
                "index_config": {
                    "search_settings": {
                        "default_search_fields": ["severity_text", "body"]
                    }
                }
            });
            assert_json_include!(actual: resp_json, expected: expected_response_json);
        }
        // check that the metastore was updated
        let index_metadata = metastore
            .index_metadata(IndexMetadataRequest::for_index_id("hdfs-logs".to_string()))
            .await
            .unwrap()
            .deserialize_index_metadata()
            .unwrap();
        assert_eq!(
            index_metadata
                .index_config
                .search_settings
                .default_search_fields,
            ["severity_text", "body"]
        );
        // test with index_uri at the root of a bucket
        {
            let resp = warp::test::request()
                .path("/indexes")
                .method("POST")
                .json(&true)
                .body(r#"{"version": "0.7", "index_id": "hdfs-logs2", "index_uri": "s3://my-bucket", "doc_mapping": {"field_mappings":[{"name": "timestamp", "type": "i64", "fast": true, "indexed": true}]},"search_settings":{"default_search_fields":["body"]}}"#)
                .reply(&index_management_handler)
                .await;
            let body = std::str::from_utf8(resp.body()).unwrap();
            assert_eq!(resp.status(), 200, "{body}",);
        }
        {
            let resp = warp::test::request()
                .path("/indexes/hdfs-logs2")
                .method("PUT")
                .json(&true)
                .body(r#"{"version": "0.7", "index_id": "hdfs-logs2", "index_uri": "s3://my-bucket", "doc_mapping": {"field_mappings":[{"name": "timestamp", "type": "i64", "fast": true, "indexed": true}]},"search_settings":{"default_search_fields":["severity_text", "body"]}}"#)
                .reply(&index_management_handler)
                .await;
            let body = std::str::from_utf8(resp.body()).unwrap();
            assert_eq!(resp.status(), 200, "{body}",);
        }
    }

    #[tokio::test]
    async fn test_create_source_with_bad_config() {
        let metastore = metastore_for_test();
        let index_service = IndexService::new(metastore, StorageResolver::unconfigured());
        let index_management_handler =
            super::index_management_handlers(index_service, Arc::new(NodeConfig::for_test()))
                .recover(recover_fn);
        {
            // Source config with bad version.
            let resp = warp::test::request()
                .path("/indexes/my-index/sources")
                .method("POST")
                .json(&true)
                .body(r#"{"version": 0.4, "source_id": "file-source"}"#)
                .reply(&index_management_handler)
                .await;
            assert_eq!(resp.status(), 400);
            let body = std::str::from_utf8(resp.body()).unwrap();
            assert!(body.contains("invalid type: floating point `0.4`"));
        }
        {
            // Invalid pulsar source config with number of pipelines > 1, not supported yet.
            let resp = warp::test::request()
                .path("/indexes/my-index/sources")
                .method("POST")
                .json(&true)
                .body(
                    r#"{"version": "0.8", "source_id": "pulsar-source",
    "num_pipelines": 2, "source_type": "pulsar", "params": {"topics": ["my-topic"],
    "address": "pulsar://localhost:6650" }}"#,
                )
                .reply(&index_management_handler)
                .await;
            assert_eq!(resp.status(), 400);
            let body = std::str::from_utf8(resp.body()).unwrap();
            assert!(body.contains(
                "Quickwit currently supports multiple pipelines only for GCP PubSub or Kafka \
                 sources"
            ));
        }
        {
            let resp = warp::test::request()
                .path("/indexes/hdfs-logs/sources")
                .method("POST")
                .body(
                    r#"{"version": "0.8", "source_id": "my-stdin-source", "source_type": "stdin"}"#,
                )
                .reply(&index_management_handler)
                .await;
            assert_eq!(resp.status(), 400);
            let response_body = std::str::from_utf8(resp.body()).unwrap();
            assert!(
                response_body.contains("stdin can only be used as source through the CLI command")
            )
        }
        {
            let resp = warp::test::request()
                .path("/indexes/hdfs-logs/sources")
                .method("POST")
                .body(
                    r#"{"version": "0.8", "source_id": "my-local-file-source", "source_type": "file", "params": {"filepath": "localfile"}}"#,
                )
                .reply(&index_management_handler)
                .await;
            assert_eq!(resp.status(), 400);
            let response_body = std::str::from_utf8(resp.body()).unwrap();
            assert!(response_body.contains("limited to a local usage"))
        }
    }

    #[cfg(feature = "sqs-for-tests")]
    #[tokio::test]
    async fn test_update_source() {
        use quickwit_indexing::source::sqs_queue::test_helpers::start_mock_sqs_get_queue_attributes_endpoint;

        let metastore = metastore_for_test();
        let (queue_url, _guard) = start_mock_sqs_get_queue_attributes_endpoint().await;
        let index_service = IndexService::new(metastore.clone(), StorageResolver::unconfigured());
        let mut node_config = NodeConfig::for_test();
        node_config.default_index_root_uri = Uri::for_test("file:///default-index-root-uri");
        let index_management_handler =
            super::index_management_handlers(index_service, Arc::new(node_config));
        let resp = warp::test::request()
            .path("/indexes")
            .method("POST")
            .json(&true)
            .body(r#"{"version": "0.7", "index_id": "hdfs-logs", "doc_mapping": {"field_mappings":[{"name": "timestamp", "type": "i64", "fast": true, "indexed": true}]}}"#)
            .reply(&index_management_handler)
            .await;
        assert_eq!(resp.status(), 200);
        let resp_json: serde_json::Value = serde_json::from_slice(resp.body()).unwrap();
        let expected_response_json = serde_json::json!({
            "index_config": {
                "index_id": "hdfs-logs",
                "index_uri": "file:///default-index-root-uri/hdfs-logs",
            }
        });
        assert_json_include!(actual: resp_json, expected: expected_response_json);

        // Create source.
        let source_config_body = serde_json::json!({
            "version": "0.7",
            "source_id": "sqs-source",
            "source_type": "file",
            "params": {"notifications": [{"type": "sqs", "queue_url": queue_url, "message_type": "s3_notification"}]},
        });
        let resp = warp::test::request()
            .path("/indexes/hdfs-logs/sources")
            .method("POST")
            .json(&source_config_body)
            .reply(&index_management_handler)
            .await;
        let resp_body = std::str::from_utf8(resp.body()).unwrap();
        assert_eq!(resp.status(), 200, "{resp_body}");

        {
            // Update the source.
            let update_source_config_body = serde_json::json!({
                "version": "0.7",
                "source_id": "sqs-source",
                "source_type": "file",
                "params": {"notifications": [{"type": "sqs", "queue_url": queue_url, "message_type": "s3_notification"}]},
            });
            let resp = warp::test::request()
                .path("/indexes/hdfs-logs/sources/sqs-source")
                .method("PUT")
                .json(&update_source_config_body)
                .reply(&index_management_handler)
                .await;
            let resp_body = std::str::from_utf8(resp.body()).unwrap();
            assert_eq!(resp.status(), 200, "{resp_body}");
            // Check that the source has been updated.
            let index_metadata = metastore
                .index_metadata(IndexMetadataRequest::for_index_id("hdfs-logs".to_string()))
                .await
                .unwrap()
                .deserialize_index_metadata()
                .unwrap();
            let metastore_source_config = index_metadata.sources.get("sqs-source").unwrap();
            assert_eq!(metastore_source_config.source_type(), SourceType::File);
            assert_eq!(
                metastore_source_config,
                &serde_json::from_value(update_source_config_body).unwrap(),
            );
        }
        {
            // Update the source with a different source_id (forbidden)
            let update_source_config_body = serde_json::json!({
                "version": "0.7",
                "source_id": "new-source-id",
                "source_type": "file",
                "params": {"notifications": [{"type": "sqs", "queue_url": queue_url, "message_type": "s3_notification"}]},
            });
            let resp = warp::test::request()
                .path("/indexes/hdfs-logs/sources/sqs-source")
                .method("PUT")
                .json(&update_source_config_body)
                .reply(&index_management_handler)
                .await;
            let resp_body = std::str::from_utf8(resp.body()).unwrap();
            assert_eq!(resp.status(), 400, "{resp_body}");
            // Check that the source hasn't been updated.
            let index_metadata = metastore
                .index_metadata(IndexMetadataRequest::for_index_id("hdfs-logs".to_string()))
                .await
                .unwrap()
                .deserialize_index_metadata()
                .unwrap();
            assert!(index_metadata.sources.contains_key("sqs-source"));
            assert!(!index_metadata.sources.contains_key("other-source-id"));
        }
    }

    #[tokio::test]
    async fn test_delete_non_existing_source() {
        let mut mock_metastore = MockMetastoreService::new();
        mock_metastore.expect_index_metadata().return_once(|_| {
            Ok(
                IndexMetadataResponse::try_from_index_metadata(&IndexMetadata::for_test(
                    "quickwit-demo-index",
                    "file:///path/to/index/quickwit-demo-index",
                ))
                .unwrap(),
            )
        });
        // TODO
        // metastore
        //     .expect_index_exists()
        //     .return_once(|index_id: &str| Ok(index_id == "quickwit-demo-index"));
        mock_metastore.expect_delete_source().return_once(
            |delete_source_request: DeleteSourceRequest| {
                let index_uid: IndexUid = delete_source_request.index_uid().clone();
                let source_id = delete_source_request.source_id;
                assert_eq!(index_uid.index_id, "quickwit-demo-index");
                Err(MetastoreError::NotFound(EntityKind::Source {
                    index_id: "quickwit-demo-index".to_string(),
                    source_id: source_id.to_string(),
                }))
            },
        );
        let index_service = IndexService::new(
            MetastoreServiceClient::from_mock(mock_metastore),
            StorageResolver::unconfigured(),
        );
        let index_management_handler =
            super::index_management_handlers(index_service, Arc::new(NodeConfig::for_test()))
                .recover(recover_fn);
        let resp = warp::test::request()
            .path("/indexes/quickwit-demo-index/sources/foo-source")
            .method("DELETE")
            .reply(&index_management_handler)
            .await;
        assert_eq!(resp.status(), 404);
    }

    #[tokio::test]
    async fn test_source_reset_checkpoint() -> anyhow::Result<()> {
        let mut mock_metastore = MockMetastoreService::new();
        mock_metastore
            .expect_index_metadata()
            .returning(|_| {
                Ok(
                    IndexMetadataResponse::try_from_index_metadata(&IndexMetadata::for_test(
                        "quickwit-demo-index",
                        "file:///path/to/index/quickwit-demo-index",
                    ))
                    .unwrap(),
                )
            })
            .times(2);
        mock_metastore
            .expect_reset_source_checkpoint()
            .returning(
                |reset_source_checkpoint_request: ResetSourceCheckpointRequest| {
                    let index_uid: IndexUid = reset_source_checkpoint_request.index_uid().clone();
                    let source_id = reset_source_checkpoint_request.source_id;
                    if index_uid.index_id == "quickwit-demo-index" && source_id == "source-to-reset"
                    {
                        return Ok(EmptyResponse {});
                    }
                    Err(MetastoreError::Internal {
                        message: "".to_string(),
                        cause: "".to_string(),
                    })
                },
            )
            .times(2);
        let index_service = IndexService::new(
            MetastoreServiceClient::from_mock(mock_metastore),
            StorageResolver::unconfigured(),
        );
        let index_management_handler =
            super::index_management_handlers(index_service, Arc::new(NodeConfig::for_test()))
                .recover(recover_fn);
        let resp = warp::test::request()
            .path("/indexes/quickwit-demo-index/sources/source-to-reset/reset-checkpoint")
            .method("PUT")
            .reply(&index_management_handler)
            .await;
        assert_eq!(resp.status(), 200);
        let resp = warp::test::request()
            .path("/indexes/quickwit-demo-index/sources/source-to-reset-2/reset-checkpoint")
            .method("PUT")
            .reply(&index_management_handler)
            .await;
        assert_eq!(resp.status(), 500);
        Ok(())
    }

    #[tokio::test]
    async fn test_source_toggle() -> anyhow::Result<()> {
        let mut mock_metastore = MockMetastoreService::new();
        mock_metastore
            .expect_index_metadata()
            .returning(|_| {
                Ok(
                    IndexMetadataResponse::try_from_index_metadata(&IndexMetadata::for_test(
                        "quickwit-demo-index",
                        "file:///path/to/index/quickwit-demo-index",
                    ))
                    .unwrap(),
                )
            })
            .times(3);
        mock_metastore.expect_toggle_source().return_once(
            |toggle_source_request: ToggleSourceRequest| {
                let index_uid: IndexUid = toggle_source_request.index_uid().clone();
                let source_id = toggle_source_request.source_id;
                let enable = toggle_source_request.enable;
                if index_uid.index_id == "quickwit-demo-index"
                    && source_id == "source-to-toggle"
                    && enable
                {
                    return Ok(EmptyResponse {});
                }
                Err(MetastoreError::Internal {
                    message: "".to_string(),
                    cause: "".to_string(),
                })
            },
        );
        let index_service = IndexService::new(
            MetastoreServiceClient::from_mock(mock_metastore),
            StorageResolver::unconfigured(),
        );
        let index_management_handler =
            super::index_management_handlers(index_service, Arc::new(NodeConfig::for_test()))
                .recover(recover_fn);
        let resp = warp::test::request()
            .path("/indexes/quickwit-demo-index/sources/source-to-toggle/toggle")
            .method("PUT")
            .json(&true)
            .body(r#"{"enable": true}"#)
            .reply(&index_management_handler)
            .await;
        assert_eq!(resp.status(), 200);
        let resp = warp::test::request()
            .path("/indexes/quickwit-demo-index/sources/source-to-toggle/toggle")
            .method("PUT")
            .json(&true)
            .body(r#"{"toggle": true}"#) // unknown field, should return 400.
            .reply(&index_management_handler)
            .await;
        assert_eq!(resp.status(), 400);
        // Check cannot toggle source managed by Quickwit.
        let resp = warp::test::request()
            .path(format!("/indexes/hdfs-logs/sources/{INGEST_API_SOURCE_ID}/toggle").as_str())
            .method("PUT")
            .body(r#"{"enable": true}"#)
            .reply(&index_management_handler)
            .await;
        assert_eq!(resp.status(), 403);

        let resp = warp::test::request()
            .path(format!("/indexes/hdfs-logs/sources/{CLI_SOURCE_ID}/toggle").as_str())
            .method("PUT")
            .body(r#"{"enable": true}"#)
            .reply(&index_management_handler)
            .await;
        assert_eq!(resp.status(), 403);
        Ok(())
    }

    #[tokio::test]
    async fn test_analyze_request() {
        let mut mock_metastore = MockMetastoreService::new();
        mock_metastore.expect_index_metadata().return_once(|_| {
            Ok(
                IndexMetadataResponse::try_from_index_metadata(&IndexMetadata::for_test(
                    "test-index",
                    "ram:///indexes/test-index",
                ))
                .unwrap(),
            )
        });
        let index_service = IndexService::new(
            MetastoreServiceClient::from_mock(mock_metastore),
            StorageResolver::unconfigured(),
        );
        let index_management_handler =
            super::index_management_handlers(index_service, Arc::new(NodeConfig::for_test()))
                .recover(recover_fn);
        let resp = warp::test::request()
            .path("/analyze")
            .method("POST")
            .json(&true)
            .body(
                r#"{"type": "ngram", "min_gram": 3, "max_gram": 3, "text": "Hel", "filters":
    ["lower_caser"]}"#,
            )
            .reply(&index_management_handler)
            .await;
        assert_eq!(resp.status(), 200);
        let actual_response_json: JsonValue = serde_json::from_slice(resp.body()).unwrap();
        let expected_response_json = serde_json::json!([
            {
                "offset_from": 0,
                "offset_to": 3,
                "position": 0,
                "position_length": 1,
                "text": "hel"
            }
        ]);
        assert_json_include!(
            actual: actual_response_json,
            expected: expected_response_json
        );
    }

    #[tokio::test]
    async fn test_parse_query_request() {
        let index_service = IndexService::new(
            MetastoreServiceClient::mocked(),
            StorageResolver::unconfigured(),
        );
        let index_management_handler =
            super::index_management_handlers(index_service, Arc::new(NodeConfig::for_test()))
                .recover(recover_fn);
        let resp = warp::test::request()
            .path("/parse-query")
            .method("POST")
            .json(&true)
            .body(r#"{"query": "field:this AND field:that"}"#)
            .reply(&index_management_handler)
            .await;
        assert_eq!(resp.status(), 200);
    }
}


================================================
FILE: quickwit/quickwit-serve/src/index_api/source_resource.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use bytes::Bytes;
use quickwit_config::{
    CLI_SOURCE_ID, ConfigFormat, FileSourceParams, INGEST_API_SOURCE_ID, SourceConfig,
    SourceParams, load_source_config_from_user_config, load_source_config_update,
};
use quickwit_index_management::{IndexService, IndexServiceError};
use quickwit_metastore::IndexMetadataResponseExt;
use quickwit_proto::ingest::Shard;
use quickwit_proto::metastore::{
    DeleteSourceRequest, EntityKind, IndexMetadataRequest, ListShardsRequest, ListShardsSubrequest,
    MetastoreError, MetastoreResult, MetastoreService, MetastoreServiceClient,
    ResetSourceCheckpointRequest, ToggleSourceRequest,
};
use quickwit_proto::types::{IndexId, IndexUid, SourceId};
use serde::Deserialize;
use tracing::info;
use warp::{Filter, Rejection};

use super::rest_handler::{json_body, log_failure};
use crate::format::{extract_config_format, extract_format_from_qs};
use crate::rest_api_response::into_rest_api_response;
use crate::with_arg;

pub fn create_source_handler(
    index_service: IndexService,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    warp::path!("indexes" / String / "sources")
        .and(warp::post())
        .and(extract_config_format())
        .and(warp::body::content_length_limit(1024 * 1024))
        .and(warp::filters::body::bytes())
        .and(with_arg(index_service))
        .then(create_source)
        .map(log_failure("failed to create source"))
        .and(extract_format_from_qs())
        .map(into_rest_api_response)
        .boxed()
}

#[allow(clippy::result_large_err)]
fn check_source_type(source_params: &SourceParams) -> Result<(), IndexServiceError> {
    // Note: This check is performed here instead of the source config serde
    // because many tests use the file source, and can't store that config in
    // the metastore without going through the validation.
    if let SourceParams::File(FileSourceParams::Filepath(_)) = source_params {
        return Err(IndexServiceError::InvalidConfig(anyhow::anyhow!(
            "path based file sources are limited to a local usage, please use the CLI command \
             `quickwit tool local-ingest` to ingest data from a specific file or setup a \
             notification based file source"
        )));
    }
    Ok(())
}

#[utoipa::path(
    post,
    tag = "Sources",
    path = "/indexes/{index_id}/sources",
    request_body = VersionedSourceConfig,
    responses(
        // We return `VersionedSourceConfig` as it's the serialized model view.
        (status = 200, description = "Successfully created source.", body = VersionedSourceConfig)
    ),
    params(
        ("index_id" = String, Path, description = "The index ID to create a source for."),
    )
)]
/// Creates Source.
pub async fn create_source(
    index_id: IndexId,
    config_format: ConfigFormat,
    source_config_bytes: Bytes,
    mut index_service: IndexService,
) -> Result<SourceConfig, IndexServiceError> {
    let source_config: SourceConfig =
        load_source_config_from_user_config(config_format, &source_config_bytes)
            .map_err(IndexServiceError::InvalidConfig)?;
    check_source_type(&source_config.source_params)?;
    let index_metadata_request = IndexMetadataRequest::for_index_id(index_id.to_string());
    let index_uid: IndexUid = index_service
        .metastore()
        .index_metadata(index_metadata_request)
        .await?
        .deserialize_index_metadata()?
        .index_uid;
    info!(index_id = %index_id, source_id = %source_config.source_id, "create-source");
    index_service.add_source(index_uid, source_config).await
}

/// Query parameters for update source queries
#[derive(Deserialize, Debug, Eq, PartialEq, utoipa::IntoParams)]
#[into_params(parameter_in = Query)]
pub struct UpdateQueryParams {
    /// Create the source if it doesn't exist yet
    #[serde(default)]
    pub create: bool,
}

fn update_source_qp() -> impl Filter<Extract = (UpdateQueryParams,), Error = Rejection> + Clone {
    warp::query::<UpdateQueryParams>()
}

pub fn update_source_handler(
    index_service: IndexService,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    warp::path!("indexes" / String / "sources" / String)
        .and(warp::put())
        .and(extract_config_format())
        .and(update_source_qp())
        .and(warp::body::content_length_limit(1024 * 1024))
        .and(warp::filters::body::bytes())
        .and(with_arg(index_service))
        .then(update_source)
        .map(log_failure("failed to update source"))
        .and(extract_format_from_qs())
        .map(into_rest_api_response)
        .boxed()
}

#[utoipa::path(
    put,
    tag = "Sources",
    path = "/indexes/{index_id}/sources/{source_id}",
    request_body = VersionedSourceConfig,
    responses(
        // We return `VersionedSourceConfig` as it's the serialized model view.
        (status = 200, description = "Successfully updated source.", body = VersionedSourceConfig)
    ),
    params(
        ("index_id" = String, Path, description = "The index ID to create a source for."),
        ("source_id" = String, Path, description = "The source ID to update."),
        UpdateQueryParams,
    )
)]
/// Updates Source.
pub async fn update_source(
    index_id: IndexId,
    source_id: SourceId,
    config_format: ConfigFormat,
    query_params: UpdateQueryParams,
    source_config_bytes: Bytes,
    mut index_service: IndexService,
) -> Result<SourceConfig, IndexServiceError> {
    let index_metadata_request = IndexMetadataRequest::for_index_id(index_id.to_string());
    let mut current_index_metadata = index_service
        .metastore()
        .index_metadata(index_metadata_request)
        .await?
        .deserialize_index_metadata()?;
    let current_source_config = match current_index_metadata.sources.remove(&source_id) {
        Some(source_config) => source_config,
        None if query_params.create => {
            let source_config: SourceConfig =
                load_source_config_from_user_config(config_format, &source_config_bytes)
                    .map_err(IndexServiceError::InvalidConfig)?;
            if source_config.source_id != source_id {
                return Err(IndexServiceError::InvalidConfig(anyhow::anyhow!(
                    "`source_id` in config file does not match source_id from query path"
                )));
            }
            check_source_type(&source_config.source_params)?;
            info!(index_id = %index_id, source_id = %source_config.source_id, "create-source-on-update");
            // TODO handle already exists?
            return index_service
                .add_source(current_index_metadata.index_uid, source_config)
                .await;
        }
        None => {
            return Err(MetastoreError::NotFound(EntityKind::Source {
                index_id: index_id.to_string(),
                source_id,
            })
            .into());
        }
    };

    let new_source_config: SourceConfig =
        load_source_config_update(config_format, &source_config_bytes, &current_source_config)
            .map_err(IndexServiceError::InvalidConfig)?;

    info!(index_id = %index_id, source_id = %new_source_config.source_id, "update-source");
    index_service
        .update_source(current_index_metadata.index_uid, new_source_config)
        .await
}

pub fn get_source_handler(
    metastore: MetastoreServiceClient,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    warp::path!("indexes" / String / "sources" / String)
        .and(warp::get())
        .and(with_arg(metastore))
        .then(get_source)
        .and(extract_format_from_qs())
        .map(into_rest_api_response)
        .boxed()
}

pub async fn get_source(
    index_id: IndexId,
    source_id: SourceId,
    metastore: MetastoreServiceClient,
) -> MetastoreResult<SourceConfig> {
    info!(index_id = %index_id, source_id = %source_id, "get-source");
    let index_metadata_request = IndexMetadataRequest::for_index_id(index_id.to_string());
    let source_config = metastore
        .index_metadata(index_metadata_request)
        .await?
        .deserialize_index_metadata()?
        .sources
        .remove(&source_id)
        .ok_or({
            MetastoreError::NotFound(EntityKind::Source {
                index_id,
                source_id,
            })
        })?;
    Ok(source_config)
}

pub fn reset_source_checkpoint_handler(
    metastore: MetastoreServiceClient,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    warp::path!("indexes" / String / "sources" / String / "reset-checkpoint")
        .and(warp::put())
        .and(with_arg(metastore))
        .then(reset_source_checkpoint)
        .and(extract_format_from_qs())
        .map(into_rest_api_response)
        .boxed()
}

#[utoipa::path(
    put,
    tag = "Sources",
    path = "/indexes/{index_id}/sources/{source_id}/reset-checkpoint",
    responses(
        (status = 200, description = "Successfully reset source checkpoint.")
    ),
    params(
        ("index_id" = String, Path, description = "The index ID of the source."),
        ("source_id" = String, Path, description = "The source ID whose checkpoint is reset."),
    )
)]
/// Resets source checkpoint.
pub async fn reset_source_checkpoint(
    index_id: IndexId,
    source_id: SourceId,
    metastore: MetastoreServiceClient,
) -> MetastoreResult<()> {
    let index_metadata_request = IndexMetadataRequest::for_index_id(index_id.to_string());
    let index_uid: IndexUid = metastore
        .index_metadata(index_metadata_request)
        .await?
        .deserialize_index_metadata()?
        .index_uid;
    info!(index_id = %index_id, source_id = %source_id, "reset-checkpoint");
    let reset_source_checkpoint_request = ResetSourceCheckpointRequest {
        index_uid: Some(index_uid),
        source_id: source_id.clone(),
    };
    metastore
        .reset_source_checkpoint(reset_source_checkpoint_request)
        .await?;
    Ok(())
}

pub fn toggle_source_handler(
    metastore: MetastoreServiceClient,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    warp::path!("indexes" / String / "sources" / String / "toggle")
        .and(warp::put())
        .and(json_body())
        .and(with_arg(metastore))
        .then(toggle_source)
        .and(extract_format_from_qs())
        .map(into_rest_api_response)
        .boxed()
}

#[derive(Deserialize, utoipa::ToSchema)]
#[serde(deny_unknown_fields)]
pub struct ToggleSource {
    enable: bool,
}

#[utoipa::path(
    put,
    tag = "Sources",
    path = "/indexes/{index_id}/sources/{source_id}/toggle",
    request_body = ToggleSource,
    responses(
        (status = 200, description = "Successfully toggled source.")
    ),
    params(
        ("index_id" = String, Path, description = "The index ID of the source."),
        ("source_id" = String, Path, description = "The source ID to toggle."),
    )
)]
/// Toggles source.
pub async fn toggle_source(
    index_id: IndexId,
    source_id: SourceId,
    toggle_source: ToggleSource,
    metastore: MetastoreServiceClient,
) -> Result<(), IndexServiceError> {
    info!(index_id = %index_id, source_id = %source_id, enable = toggle_source.enable, "toggle-source");
    let index_metadata_request = IndexMetadataRequest::for_index_id(index_id.to_string());
    let index_uid: IndexUid = metastore
        .index_metadata(index_metadata_request)
        .await?
        .deserialize_index_metadata()?
        .index_uid;
    if [CLI_SOURCE_ID, INGEST_API_SOURCE_ID].contains(&source_id.as_str()) {
        return Err(IndexServiceError::OperationNotAllowed(format!(
            "source `{source_id}` is managed by Quickwit, you cannot enable or disable a source \
             managed by Quickwit"
        )));
    }
    let toggle_source_request = ToggleSourceRequest {
        index_uid: Some(index_uid),
        source_id: source_id.clone(),
        enable: toggle_source.enable,
    };
    metastore.toggle_source(toggle_source_request).await?;
    Ok(())
}

pub fn delete_source_handler(
    metastore: MetastoreServiceClient,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    warp::path!("indexes" / String / "sources" / String)
        .and(warp::delete())
        .and(with_arg(metastore))
        .then(delete_source)
        .and(extract_format_from_qs())
        .map(into_rest_api_response)
        .boxed()
}

#[utoipa::path(
    delete,
    tag = "Sources",
    path = "/indexes/{index_id}/sources/{source_id}",
    responses(
        (status = 200, description = "Successfully deleted source.")
    ),
    params(
        ("index_id" = String, Path, description = "The index ID to remove the source from."),
        ("source_id" = String, Path, description = "The source ID to remove from the index."),
    )
)]
/// Deletes source.
pub async fn delete_source(
    index_id: IndexId,
    source_id: SourceId,
    metastore: MetastoreServiceClient,
) -> Result<(), IndexServiceError> {
    info!(index_id = %index_id, source_id = %source_id, "delete-source");
    let index_metadata_request = IndexMetadataRequest::for_index_id(index_id.to_string());
    let index_uid: IndexUid = metastore
        .index_metadata(index_metadata_request)
        .await?
        .deserialize_index_metadata()?
        .index_uid;
    if [INGEST_API_SOURCE_ID, CLI_SOURCE_ID].contains(&source_id.as_str()) {
        return Err(IndexServiceError::OperationNotAllowed(format!(
            "source `{source_id}` is managed by Quickwit, you cannot delete a source managed by \
             Quickwit"
        )));
    }
    let delete_source_request = DeleteSourceRequest {
        index_uid: Some(index_uid),
        source_id: source_id.clone(),
    };
    metastore.delete_source(delete_source_request).await?;
    Ok(())
}

pub fn get_source_shards_handler(
    metastore: MetastoreServiceClient,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    warp::path!("indexes" / String / "sources" / String / "shards")
        .and(warp::get())
        .and(with_arg(metastore))
        .then(get_source_shards)
        .and(extract_format_from_qs())
        .map(into_rest_api_response)
        .boxed()
}

pub async fn get_source_shards(
    index_id: IndexId,
    source_id: SourceId,
    metastore: MetastoreServiceClient,
) -> MetastoreResult<Vec<Shard>> {
    info!(index_id = %index_id, source_id = %source_id, "get-source-shards");
    let index_metadata_request = IndexMetadataRequest::for_index_id(index_id.to_string());
    let index_uid: IndexUid = metastore
        .index_metadata(index_metadata_request)
        .await?
        .deserialize_index_metadata()?
        .index_uid;
    let response = metastore
        .list_shards(ListShardsRequest {
            subrequests: vec![ListShardsSubrequest {
                index_uid: Some(index_uid),
                source_id: source_id.to_string(),
                ..Default::default()
            }],
        })
        .await?;
    let shards = response
        .subresponses
        .into_iter()
        .flat_map(|resp| resp.shards)
        .collect();
    Ok(shards)
}


================================================
FILE: quickwit/quickwit-serve/src/index_api/split_resource.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use quickwit_metastore::{
    IndexMetadataResponseExt, ListSplitsQuery, ListSplitsRequestExt,
    MetastoreServiceStreamSplitsExt, Split, SplitState,
};
use quickwit_proto::metastore::{
    IndexMetadataRequest, ListSplitsRequest, MarkSplitsForDeletionRequest, MetastoreResult,
    MetastoreService, MetastoreServiceClient,
};
use quickwit_proto::types::{IndexId, IndexUid};
use serde::{Deserialize, Serialize};
use tracing::info;
use warp::{Filter, Rejection};

use super::rest_handler::json_body;
use crate::format::extract_format_from_qs;
use crate::rest_api_response::into_rest_api_response;
use crate::simple_list::{from_simple_list, to_simple_list};
use crate::with_arg;

/// This struct represents the QueryString passed to
/// the rest API to filter splits.
#[derive(Debug, Clone, Deserialize, Serialize, utoipa::IntoParams, utoipa::ToSchema, Default)]
#[into_params(parameter_in = Query)]
pub struct ListSplitsQueryParams {
    /// If set, define the number of splits to skip
    #[serde(skip_serializing_if = "Option::is_none")]
    #[serde(default)]
    pub offset: Option<usize>,
    /// If set, restrict maximum number of splits to retrieve
    #[serde(skip_serializing_if = "Option::is_none")]
    #[serde(default)]
    pub limit: Option<usize>,
    /// A specific split state(s) to filter by.
    #[serde(deserialize_with = "from_simple_list")]
    #[serde(serialize_with = "to_simple_list")]
    #[serde(skip_serializing_if = "Option::is_none")]
    #[serde(default)]
    pub split_states: Option<Vec<SplitState>>,
    /// If set, restrict splits to documents with a `timestamp >= start_timestamp`.
    /// This timestamp is in seconds.
    #[serde(skip_serializing_if = "Option::is_none")]
    #[serde(default)]
    pub start_timestamp: Option<i64>,
    /// If set, restrict splits to documents with a `timestamp < end_timestamp`.
    /// This timestamp is in seconds.
    #[serde(skip_serializing_if = "Option::is_none")]
    #[serde(default)]
    pub end_timestamp: Option<i64>,
    /// If set, restrict splits whose creation dates are before this date.
    #[serde(skip_serializing_if = "Option::is_none")]
    #[serde(default)]
    pub end_create_timestamp: Option<i64>,
}

#[derive(Serialize, Deserialize, Debug, utoipa::ToSchema)]
pub struct ListSplitsResponse {
    #[serde(default)]
    pub offset: usize,
    #[serde(default)]
    pub size: usize,
    #[serde(default)]
    pub splits: Vec<Split>,
}

#[utoipa::path(
    get,
    tag = "Indexes",
    path = "/indexes/{index_id}/splits",
    responses(
        (status = 200, description = "Successfully fetched splits.", body = ListSplitsResponse)
    ),
    params(
        ListSplitsQueryParams,
        ("index_id" = String, Path, description = "The index ID to retrieve splits for."),
    )
)]

/// Get splits.
pub async fn list_splits(
    index_id: IndexId,
    list_split_query: ListSplitsQueryParams,
    metastore: MetastoreServiceClient,
) -> MetastoreResult<ListSplitsResponse> {
    let index_metadata_request = IndexMetadataRequest::for_index_id(index_id.to_string());
    let index_uid: IndexUid = metastore
        .index_metadata(index_metadata_request)
        .await?
        .deserialize_index_metadata()?
        .index_uid;
    info!(index_id = %index_id, list_split_query = ?list_split_query, "get-splits");
    let mut query = ListSplitsQuery::for_index(index_uid);
    let mut offset = 0;
    if let Some(offset_value) = list_split_query.offset {
        query = query.with_offset(offset_value);
        offset = offset_value;
    }
    if let Some(limit) = list_split_query.limit {
        query = query.with_limit(limit);
    }
    if let Some(split_states) = list_split_query.split_states {
        query = query.with_split_states(split_states);
    }
    if let Some(start_timestamp) = list_split_query.start_timestamp {
        query = query.with_time_range_start_gte(start_timestamp);
    }
    if let Some(end_timestamp) = list_split_query.end_timestamp {
        query = query.with_time_range_end_lt(end_timestamp);
    }
    if let Some(end_created_timestamp) = list_split_query.end_create_timestamp {
        query = query.with_create_timestamp_lt(end_created_timestamp);
    }
    let list_splits_request = ListSplitsRequest::try_from_list_splits_query(&query)?;
    let splits = metastore
        .list_splits(list_splits_request)
        .await?
        .collect_splits()
        .await?;
    Ok(ListSplitsResponse {
        offset,
        size: splits.len(),
        splits,
    })
}

pub fn list_splits_handler(
    metastore: MetastoreServiceClient,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    warp::path!("indexes" / String / "splits")
        .and(warp::get())
        .and(warp::query())
        .and(with_arg(metastore))
        .then(list_splits)
        .and(extract_format_from_qs())
        .map(into_rest_api_response)
        .boxed()
}

#[derive(Deserialize, utoipa::ToSchema)]
#[serde(deny_unknown_fields)]
pub struct SplitsForDeletion {
    pub split_ids: Vec<String>,
}

#[utoipa::path(
    put,
    tag = "Splits",
    path = "/indexes/{index_id}/splits/mark-for-deletion",
    request_body = SplitsForDeletion,
    responses(
        (status = 200, description = "Successfully marked splits for deletion.")
    ),
    params(
        ("index_id" = String, Path, description = "The index ID to mark splits for deletion for."),
    )
)]
/// Marks splits for deletion.
pub async fn mark_splits_for_deletion(
    index_id: IndexId,
    splits_for_deletion: SplitsForDeletion,
    metastore: MetastoreServiceClient,
) -> MetastoreResult<()> {
    let index_metadata_request = IndexMetadataRequest::for_index_id(index_id.to_string());
    let index_uid: IndexUid = metastore
        .index_metadata(index_metadata_request)
        .await?
        .deserialize_index_metadata()?
        .index_uid;
    info!(index_id = %index_id, splits_ids = ?splits_for_deletion.split_ids, "mark-splits-for-deletion");
    let split_ids: Vec<String> = splits_for_deletion
        .split_ids
        .iter()
        .map(|split_id| split_id.to_string())
        .collect();
    let mark_splits_for_deletion_request =
        MarkSplitsForDeletionRequest::new(index_uid, split_ids.clone());
    metastore
        .mark_splits_for_deletion(mark_splits_for_deletion_request)
        .await?;
    Ok(())
}

pub fn mark_splits_for_deletion_handler(
    metastore: MetastoreServiceClient,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    warp::path!("indexes" / String / "splits" / "mark-for-deletion")
        .and(warp::put())
        .and(json_body())
        .and(with_arg(metastore))
        .then(mark_splits_for_deletion)
        .and(extract_format_from_qs())
        .map(into_rest_api_response)
        .boxed()
}


================================================
FILE: quickwit/quickwit-serve/src/indexing_api/mod.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

mod rest_handler;

pub use rest_handler::{IndexingApi, indexing_get_handler};


================================================
FILE: quickwit/quickwit-serve/src/indexing_api/rest_handler.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::convert::Infallible;

use quickwit_actors::{AskError, Mailbox, Observe};
use quickwit_indexing::actors::{IndexingService, IndexingServiceCounters};
use warp::{Filter, Rejection};

use crate::format::extract_format_from_qs;
use crate::require;
use crate::rest::recover_fn;
use crate::rest_api_response::into_rest_api_response;

#[derive(utoipa::OpenApi)]
#[openapi(paths(indexing_endpoint))]
pub struct IndexingApi;

#[utoipa::path(
    get,
    tag = "Indexing",
    path = "/indexing",
    responses(
        (status = 200, description = "Successfully observed indexing pipelines.", body = IndexingStatistics)
    ),
)]
/// Observe Indexing Pipeline
async fn indexing_endpoint(
    indexing_service_mailbox: Mailbox<IndexingService>,
) -> Result<IndexingServiceCounters, AskError<Infallible>> {
    let counters = indexing_service_mailbox.ask(Observe).await?;
    indexing_service_mailbox.ask(Observe).await?;
    Ok(counters)
}

fn indexing_get_filter() -> impl Filter<Extract = (), Error = Rejection> + Clone {
    warp::path!("indexing").and(warp::get())
}

pub fn indexing_get_handler(
    indexing_service_mailbox_opt: Option<Mailbox<IndexingService>>,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    indexing_get_filter()
        .and(require(indexing_service_mailbox_opt))
        .then(indexing_endpoint)
        .and(extract_format_from_qs())
        .map(into_rest_api_response)
        .recover(recover_fn)
        .boxed()
}


================================================
FILE: quickwit/quickwit-serve/src/ingest_api/mod.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

mod response;
mod rest_handler;

pub use response::{RestIngestResponse, RestParseFailure};
#[cfg(test)]
pub(crate) use rest_handler::tests::setup_ingest_v1_service;
pub use rest_handler::{IngestApi, IngestApiSchemas};
pub(crate) use rest_handler::{ingest_api_handlers, lines};


================================================
FILE: quickwit/quickwit-serve/src/ingest_api/response.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::BTreeMap;

use bytes::Bytes;
use quickwit_ingest::{IngestResponse, IngestServiceError};
use quickwit_proto::ingest::router::IngestResponseV2;
use quickwit_proto::ingest::{DocBatchV2, ParseFailureReason};
use quickwit_proto::types::DocUid;
use serde::{Deserialize, Serialize};

#[derive(Serialize, Deserialize, Debug, PartialEq, utoipa::ToSchema)]
pub struct RestParseFailure {
    pub message: String,
    pub document: String,
    pub reason: ParseFailureReason,
}

#[derive(Serialize, Deserialize, Debug, PartialEq, Default, utoipa::ToSchema)]
pub struct RestIngestResponse {
    /// Number of rows in the request payload
    pub num_docs_for_processing: u64,
    /// Number of docs successfully ingested
    #[serde(skip_serializing_if = "Option::is_none")]
    pub num_ingested_docs: Option<u64>, // TODO(#5604) remove Option
    /// Number of docs rejected because of parsing errors
    #[serde(skip_serializing_if = "Option::is_none")]
    pub num_rejected_docs: Option<u64>, // TODO(#5604) remove Option
    /// Detailed description of parsing errors (available if the path param
    /// `detailed_response` is set to `true`)
    #[serde(skip_serializing_if = "Option::is_none")]
    pub parse_failures: Option<Vec<RestParseFailure>>,
}

impl RestIngestResponse {
    pub(crate) fn from_ingest_v1(ingest_response: IngestResponse) -> Self {
        Self {
            num_docs_for_processing: ingest_response.num_docs_for_processing,
            ..Default::default()
        }
    }

    /// Converts [`IngestResponseV2`] into [`RestIngestResponse`].
    ///
    /// Generates a detailed failure description (`parse_failures`) if
    /// `doc_batch_clone_opt.is_some()`
    pub(crate) fn from_ingest_v2(
        mut ingest_response: IngestResponseV2,
        doc_batch_clone_opt: Option<&DocBatchV2>,
        num_docs_for_processing: u64,
    ) -> Result<Self, IngestServiceError> {
        let num_responses = ingest_response.successes.len() + ingest_response.failures.len();
        if num_responses != 1 {
            return Err(IngestServiceError::Internal(format!(
                "expected a single failure/success, got {num_responses}",
            )));
        }
        if let Some(failure_resp) = ingest_response.failures.pop() {
            return Err(failure_resp.into());
        }
        let success_resp = ingest_response.successes.pop().unwrap();

        let mut resp = Self {
            num_docs_for_processing,
            num_ingested_docs: Some(success_resp.num_ingested_docs as u64),
            num_rejected_docs: Some(success_resp.parse_failures.len() as u64),
            parse_failures: None,
        };
        if let Some(doc_batch) = doc_batch_clone_opt {
            let docs: BTreeMap<DocUid, Bytes> = doc_batch.docs().collect();
            let mut parse_failures = Vec::with_capacity(success_resp.parse_failures.len());
            for failure in success_resp.parse_failures {
                let doc = docs.get(&failure.doc_uid()).ok_or_else(|| {
                    IngestServiceError::Internal(format!(
                        "failed doc_uid {} not found in the original doc batch",
                        failure.doc_uid()
                    ))
                })?;
                parse_failures.push(RestParseFailure {
                    reason: failure.reason(),
                    message: failure.message,
                    document: String::from_utf8(doc.to_vec()).unwrap(),
                });
            }
            resp.parse_failures = Some(parse_failures);
        }
        Ok(resp)
    }

    /// Aggregates ingest counts and errors.
    pub fn merge(self, other: Self) -> Self {
        Self {
            num_docs_for_processing: self.num_docs_for_processing + other.num_docs_for_processing,
            num_ingested_docs: apply_op(self.num_ingested_docs, other.num_ingested_docs, |a, b| {
                a + b
            }),
            num_rejected_docs: apply_op(self.num_rejected_docs, other.num_rejected_docs, |a, b| {
                a + b
            }),
            parse_failures: apply_op(self.parse_failures, other.parse_failures, |a, b| {
                a.into_iter().chain(b).collect()
            }),
        }
    }
}

fn apply_op<T>(a: Option<T>, b: Option<T>, f: impl Fn(T, T) -> T) -> Option<T> {
    match (a, b) {
        (Some(a), Some(b)) => Some(f(a, b)),
        (Some(a), None) => Some(a),
        (None, Some(b)) => Some(b),
        (None, None) => None,
    }
}
#[cfg(test)]
mod tests {
    use quickwit_proto::ingest::ParseFailure;
    use quickwit_proto::ingest::router::{IngestFailure, IngestFailureReason, IngestSuccess};
    use quickwit_proto::types::IndexUid;

    use super::*;

    #[test]
    fn test_from_ingest_v1() {
        let ingest_response = IngestResponse {
            num_docs_for_processing: 10,
        };
        let rest_response = RestIngestResponse::from_ingest_v1(ingest_response);
        assert_eq!(rest_response.num_docs_for_processing, 10);
        assert_eq!(rest_response.num_ingested_docs, None);
        assert_eq!(rest_response.num_rejected_docs, None);
        assert_eq!(rest_response.parse_failures, None);
    }

    #[test]
    fn test_from_ingest_v2_success() {
        let success_resp = IngestResponseV2 {
            successes: vec![IngestSuccess {
                subrequest_id: 0,
                index_uid: Some(IndexUid::new_with_random_ulid("myindex")),
                source_id: String::from("mysource"),
                shard_id: Some("myshard".into()),
                replication_position_inclusive: None,
                num_ingested_docs: 5,
                parse_failures: vec![],
            }],
            failures: vec![],
        };
        let rest_response = RestIngestResponse::from_ingest_v2(success_resp, None, 10).unwrap();
        assert_eq!(rest_response.num_docs_for_processing, 10);
        assert_eq!(rest_response.num_ingested_docs, Some(5));
        assert_eq!(rest_response.num_rejected_docs, Some(0));
        assert_eq!(rest_response.parse_failures, None);
    }

    #[test]
    fn test_from_ingest_v2_partial_success() {
        let success_resp = IngestResponseV2 {
            successes: vec![IngestSuccess {
                subrequest_id: 0,
                index_uid: Some(IndexUid::new_with_random_ulid("myindex")),
                source_id: String::from("mysource"),
                shard_id: Some("myshard".into()),
                replication_position_inclusive: None,
                num_ingested_docs: 5,
                parse_failures: vec![ParseFailure {
                    doc_uid: Some(DocUid::for_test(42)),
                    message: "error".to_string(),
                    reason: ParseFailureReason::InvalidJson.into(),
                }],
            }],
            failures: vec![],
        };
        let rest_response = RestIngestResponse::from_ingest_v2(success_resp, None, 10).unwrap();
        assert_eq!(rest_response.num_docs_for_processing, 10);
        assert_eq!(rest_response.num_ingested_docs, Some(5));
        assert_eq!(rest_response.num_rejected_docs, Some(1));
        assert_eq!(rest_response.parse_failures, None);
    }

    #[test]
    fn test_from_ingest_v2_failure() {
        let failure_resp = IngestResponseV2 {
            successes: vec![],
            failures: vec![IngestFailure {
                subrequest_id: 0,
                index_id: String::from("myindex"),
                source_id: String::from("mysource"),
                reason: IngestFailureReason::SourceNotFound.into(),
            }],
        };
        let result = RestIngestResponse::from_ingest_v2(failure_resp, None, 10);
        assert!(result.is_err());
    }

    #[test]
    fn test_merge_responses() {
        let response1 = RestIngestResponse {
            num_docs_for_processing: 10,
            num_ingested_docs: Some(5),
            num_rejected_docs: Some(2),
            parse_failures: Some(vec![RestParseFailure {
                message: "error1".to_string(),
                document: "doc1".to_string(),
                reason: ParseFailureReason::InvalidJson,
            }]),
        };
        let response2 = RestIngestResponse {
            num_docs_for_processing: 15,
            num_ingested_docs: Some(10),
            num_rejected_docs: Some(3),
            parse_failures: Some(vec![RestParseFailure {
                message: "error2".to_string(),
                document: "doc2".to_string(),
                reason: ParseFailureReason::InvalidJson,
            }]),
        };
        let merged_response = response1.merge(response2);
        assert_eq!(merged_response.num_docs_for_processing, 25);
        assert_eq!(merged_response.num_ingested_docs.unwrap(), 15);
        assert_eq!(merged_response.num_rejected_docs.unwrap(), 5);
        assert_eq!(
            merged_response.parse_failures.unwrap(),
            vec![
                RestParseFailure {
                    message: "error1".to_string(),
                    document: "doc1".to_string(),
                    reason: ParseFailureReason::InvalidJson,
                },
                RestParseFailure {
                    message: "error2".to_string(),
                    document: "doc2".to_string(),
                    reason: ParseFailureReason::InvalidJson,
                }
            ]
        );
    }
}


================================================
FILE: quickwit/quickwit-serve/src/ingest_api/rest_handler.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use bytes::{Buf, Bytes};
use quickwit_config::{INGEST_V2_SOURCE_ID, IngestApiConfig, validate_identifier};
use quickwit_ingest::{
    CommitType, DocBatchBuilder, DocBatchV2Builder, FetchResponse, IngestRequest, IngestService,
    IngestServiceClient, IngestServiceError, TailRequest,
};
use quickwit_proto::ingest::CommitTypeV2;
use quickwit_proto::ingest::router::{
    IngestRequestV2, IngestRouterService, IngestRouterServiceClient, IngestSubrequest,
};
use quickwit_proto::types::{DocUidGenerator, IndexId};
use serde::Deserialize;
use warp::{Filter, Rejection};

use super::RestIngestResponse;
use crate::decompression::get_body_bytes;
use crate::format::extract_format_from_qs;
use crate::rest_api_response::into_rest_api_response;
use crate::{Body, BodyFormat, with_arg};

#[derive(utoipa::OpenApi)]
#[openapi(paths(ingest, tail_endpoint,))]
pub struct IngestApi;

#[derive(utoipa::OpenApi)]
#[openapi(components(schemas(
    quickwit_ingest::DocBatch,
    quickwit_ingest::FetchResponse,
    quickwit_ingest::IngestResponse,
    quickwit_ingest::CommitType,
)))]
pub struct IngestApiSchemas;

#[derive(Clone, Debug, Deserialize, PartialEq)]
struct IngestOptions {
    #[serde(alias = "commit", default = "IngestOptions::default_commit_type")]
    commit_type: CommitTypeV2,
    #[serde(default)]
    use_legacy_ingest: bool,
    #[serde(default)]
    detailed_response: bool,
}

impl IngestOptions {
    // This default implementation is necessary because `CommitTypeV2::default()` is
    // `CommitTypeV2::Unspecified`.
    fn default_commit_type() -> CommitTypeV2 {
        CommitTypeV2::Auto
    }

    fn commit_type_v1(&self) -> CommitType {
        match self.commit_type {
            CommitTypeV2::Unspecified | CommitTypeV2::Auto => CommitType::Auto,
            CommitTypeV2::Force => CommitType::Force,
            CommitTypeV2::WaitFor => CommitType::WaitFor,
        }
    }
}

pub(crate) fn ingest_api_handlers(
    ingest_router: IngestRouterServiceClient,
    ingest_service: IngestServiceClient,
    config: IngestApiConfig,
    enable_ingest_v1: bool,
    enable_ingest_v2: bool,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    ingest_handler(
        ingest_router,
        ingest_service.clone(),
        config,
        enable_ingest_v1,
        enable_ingest_v2,
    )
    .or(tail_handler(ingest_service))
    .boxed()
}

fn ingest_filter(
    config: IngestApiConfig,
) -> impl Filter<Extract = (String, Body, IngestOptions), Error = Rejection> + Clone {
    warp::path!(String / "ingest")
        .and(warp::post())
        .and(warp::body::content_length_limit(
            config.content_length_limit.as_u64(),
        ))
        .and(get_body_bytes())
        .and(warp::query::<IngestOptions>())
}

fn ingest_handler(
    ingest_router: IngestRouterServiceClient,
    ingest_service: IngestServiceClient,
    config: IngestApiConfig,
    enable_ingest_v1: bool,
    enable_ingest_v2: bool,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    ingest_filter(config)
        .and(with_arg(ingest_router))
        .and(with_arg(ingest_service))
        .then(
            move |index_id, body, ingest_options, ingest_router, ingest_service| {
                ingest(
                    index_id,
                    body,
                    ingest_options,
                    ingest_router,
                    ingest_service,
                    enable_ingest_v1,
                    enable_ingest_v2,
                )
            },
        )
        .map(|result| into_rest_api_response(result, BodyFormat::default()))
        .boxed()
}

#[utoipa::path(
    post,
    tag = "Ingest",
    path = "/{index_id}/ingest",
    request_body(content = String, description = "Documents to ingest in NDJSON format and limited to 10MB", content_type = "application/json"),
    responses(
        (status = 200, description = "Successfully ingested documents.", body = RestIngestResponse)
    ),
    params(
        ("index_id" = String, Path, description = "The index ID to add docs to."),
        ("commit" = Option<CommitType>, Query, description = "Force or wait for commit at the end of the indexing operation."),
    )
)]
/// Ingest documents
async fn ingest(
    index_id: IndexId,
    body: Body,
    ingest_options: IngestOptions,
    ingest_router: IngestRouterServiceClient,
    ingest_service: IngestServiceClient,
    enable_ingest_v1: bool,
    enable_ingest_v2: bool,
) -> Result<RestIngestResponse, IngestServiceError> {
    if enable_ingest_v2 && !ingest_options.use_legacy_ingest {
        return ingest_v2(index_id, body, ingest_options, ingest_router).await;
    }
    if !enable_ingest_v1 {
        let message = "ingest v1 is disabled: environment variable `QW_DISABLE_INGEST_V1` is set";
        return Err(IngestServiceError::Internal(message.to_string()));
    }
    ingest_v1(index_id, body, ingest_options, ingest_service).await
}

/// Ingest documents
async fn ingest_v1(
    index_id: IndexId,
    body: Body,
    ingest_options: IngestOptions,
    ingest_service: IngestServiceClient,
) -> Result<RestIngestResponse, IngestServiceError> {
    if ingest_options.detailed_response {
        return Err(IngestServiceError::BadRequest(
            "detailed_response is not supported in ingest v1".to_string(),
        ));
    }
    // The size of the body should be an upper bound of the size of the batch. The removal of the
    // end of line character for each doc compensates the addition of the `DocCommand` header.
    let mut doc_batch_builder = DocBatchBuilder::with_capacity(index_id, body.content.remaining());
    for line in lines(&body.content) {
        doc_batch_builder.ingest_doc(line);
    }
    let ingest_req = IngestRequest {
        doc_batches: vec![doc_batch_builder.build()],
        commit: ingest_options.commit_type_v1() as i32,
    };
    let ingest_response = ingest_service.ingest(ingest_req).await?;
    Ok(RestIngestResponse::from_ingest_v1(ingest_response))
}

async fn ingest_v2(
    index_id: IndexId,
    body: Body,
    ingest_options: IngestOptions,
    ingest_router: IngestRouterServiceClient,
) -> Result<RestIngestResponse, IngestServiceError> {
    let mut doc_batch_builder = DocBatchV2Builder::default();
    let mut doc_uid_generator = DocUidGenerator::default();

    for doc in lines(&body.content) {
        doc_batch_builder.add_doc(doc_uid_generator.next_doc_uid(), doc);
    }
    drop(body);
    let doc_batch_opt = doc_batch_builder.build();

    let Some(doc_batch) = doc_batch_opt else {
        let response = RestIngestResponse::default();
        return Ok(response);
    };
    let num_docs_for_processing = doc_batch.num_docs() as u64;
    let doc_batch_clone_opt = if ingest_options.detailed_response {
        Some(doc_batch.clone())
    } else {
        None
    };

    // Validate index ID early because propagating back the right error (400)
    // from deeper ingest layers is harder
    if validate_identifier("", &index_id).is_err() {
        return Err(IngestServiceError::BadRequest(
            "invalid index ID".to_string(),
        ));
    }

    let subrequest = IngestSubrequest {
        subrequest_id: 0,
        index_id,
        source_id: INGEST_V2_SOURCE_ID.to_string(),
        doc_batch: Some(doc_batch),
    };
    let request = IngestRequestV2 {
        commit_type: ingest_options.commit_type as i32,
        subrequests: vec![subrequest],
    };
    let response = ingest_router.ingest(request).await?;
    RestIngestResponse::from_ingest_v2(
        response,
        doc_batch_clone_opt.as_ref(),
        num_docs_for_processing,
    )
}

pub fn tail_handler(
    ingest_service: IngestServiceClient,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    tail_filter()
        .and(with_arg(ingest_service))
        .then(tail_endpoint)
        .and(extract_format_from_qs())
        .map(into_rest_api_response)
        .boxed()
}

fn tail_filter() -> impl Filter<Extract = (String,), Error = Rejection> + Clone {
    warp::path!(String / "tail").and(warp::get())
}

#[utoipa::path(
    get,
    tag = "Ingest",
    path = "/{index_id}/tail",
    responses(
        (status = 200, description = "Successfully fetched documents.", body = FetchResponse)
    ),
    params(
        ("index_id" = String, Path, description = "The index ID to tail."),
    )
)]
/// Returns the last few ingested documents.
async fn tail_endpoint(
    index_id: IndexId,
    ingest_service: IngestServiceClient,
) -> Result<FetchResponse, IngestServiceError> {
    let fetch_response = ingest_service.tail(TailRequest { index_id }).await?;
    Ok(fetch_response)
}

pub(crate) fn lines(body: &Bytes) -> impl Iterator<Item = &[u8]> {
    body.split(|byte| byte == &b'\n')
        .filter(|line| !is_empty_or_blank_line(line))
}

#[inline]
fn is_empty_or_blank_line(line: &[u8]) -> bool {
    line.is_empty() || line.iter().all(|ch| ch.is_ascii_whitespace())
}

#[cfg(test)]
pub(crate) mod tests {
    use std::str;
    use std::time::Duration;

    use bytes::Bytes;
    use quickwit_actors::{Mailbox, Universe};
    use quickwit_config::IngestApiConfig;
    use quickwit_ingest::{
        CreateQueueIfNotExistsRequest, FetchRequest, FetchResponse, IngestApiService,
        IngestServiceClient, QUEUES_DIR_NAME, SuggestTruncateRequest, init_ingest_api,
    };
    use quickwit_proto::ingest::router::IngestRouterServiceClient;

    use super::{RestIngestResponse, ingest_api_handlers};
    use crate::ingest_api::lines;

    #[test]
    fn test_process_lines() {
        let test_cases = [
            // an empty line is inserted before the metadata action and the doc
            (&b"\n{ \"create\" : { \"_index\" : \"my-index-1\", \"_id\" : \"1\"} }\n{\"id\": 1, \"message\": \"push\"}"[..], 2),
            // a blank line is inserted before the metadata action and the doc
            (&b"       \n{ \"create\" : { \"_index\" : \"my-index-1\", \"_id\" : \"1\"} }\n{\"id\": 1, \"message\": \"push\"}"[..], 2),
            // an empty line is inserted after the metadata action and before the doc
            (&b"{ \"create\" : { \"_index\" : \"my-index-1\", \"_id\" : \"1\"} }\n\n{\"id\": 1, \"message\": \"push\"}"[..], 2),
            // a blank line is inserted after the metadata action and before the doc
            (&b"{ \"create\" : { \"_index\" : \"my-index-1\", \"_id\" : \"1\"} }\n     \n{\"id\": 1, \"message\": \"push\"}"[..], 2),
        ];

        for &(input, expected_count) in &test_cases {
            assert_eq!(lines(&Bytes::from(input)).count(), expected_count);
        }
    }

    pub(crate) async fn setup_ingest_v1_service(
        queues: &[&str],
        config: &IngestApiConfig,
    ) -> (
        Universe,
        tempfile::TempDir,
        IngestServiceClient,
        Mailbox<IngestApiService>,
    ) {
        let universe = Universe::with_accelerated_time();
        let temp_dir = tempfile::tempdir().unwrap();
        let queues_dir_path = temp_dir.path().join(QUEUES_DIR_NAME);
        let ingest_service_mailbox = init_ingest_api(&universe, &queues_dir_path, config)
            .await
            .unwrap();
        for queue in queues {
            let create_queue_req = CreateQueueIfNotExistsRequest {
                queue_id: queue.to_string(),
            };
            ingest_service_mailbox
                .ask_for_res(create_queue_req)
                .await
                .unwrap();
        }
        let ingest_service = IngestServiceClient::from_mailbox(ingest_service_mailbox.clone());
        (universe, temp_dir, ingest_service, ingest_service_mailbox)
    }

    #[tokio::test]
    async fn test_ingest_api_returns_200_when_ingest_json_and_fetch() {
        let (universe, _temp_dir, ingest_service, _) =
            setup_ingest_v1_service(&["my-index"], &IngestApiConfig::default()).await;
        let ingest_router = IngestRouterServiceClient::mocked();
        let ingest_api_handlers = ingest_api_handlers(
            ingest_router,
            ingest_service,
            IngestApiConfig::default(),
            true,
            false,
        );
        let resp = warp::test::request()
            .path("/my-index/ingest")
            .method("POST")
            .json(&true)
            .body(r#"{"id": 1, "message": "push"}"#)
            .reply(&ingest_api_handlers)
            .await;
        assert_eq!(resp.status(), 200);
        let ingest_response: RestIngestResponse = serde_json::from_slice(resp.body()).unwrap();
        assert_eq!(ingest_response.num_docs_for_processing, 1);

        let resp = warp::test::request()
            .path("/my-index/tail")
            .method("GET")
            .reply(&ingest_api_handlers)
            .await;
        assert_eq!(resp.status(), 200);
        let fetch_response: FetchResponse = serde_json::from_slice(resp.body()).unwrap();
        let doc_batch = fetch_response.doc_batch.unwrap();
        assert_eq!(doc_batch.index_id, "my-index");
        assert_eq!(doc_batch.num_docs(), 1);
        assert_eq!(
            doc_batch.doc_lengths.iter().sum::<u32>() as usize,
            doc_batch.doc_buffer.len()
        );

        universe.assert_quit().await;
    }

    #[tokio::test]
    async fn test_ingest_api_returns_200_when_ingest_ndjson_and_fetch() {
        let (universe, _temp_dir, ingest_service, _) =
            setup_ingest_v1_service(&["my-index"], &IngestApiConfig::default()).await;
        let ingest_router = IngestRouterServiceClient::mocked();
        let ingest_api_handlers = ingest_api_handlers(
            ingest_router,
            ingest_service,
            IngestApiConfig::default(),
            true,
            false,
        );
        let payload = r#"
            {"id": 1, "message": "push"}
            {"id": 2, "message": "push"}
            {"id": 3, "message": "push"}"#;
        let resp = warp::test::request()
            .path("/my-index/ingest")
            .method("POST")
            .body(payload)
            .reply(&ingest_api_handlers)
            .await;
        assert_eq!(resp.status(), 200);
        let ingest_response: RestIngestResponse = serde_json::from_slice(resp.body()).unwrap();
        assert_eq!(ingest_response.num_docs_for_processing, 3);

        universe.assert_quit().await;
    }

    #[tokio::test]
    async fn test_ingest_api_return_429_if_above_limits() {
        let config: IngestApiConfig =
            serde_json::from_str(r#"{ "max_queue_memory_usage": "1" }"#).unwrap();
        let (universe, _temp_dir, ingest_service, _) =
            setup_ingest_v1_service(&["my-index"], &config).await;
        let ingest_router = IngestRouterServiceClient::mocked();
        let ingest_api_handlers = ingest_api_handlers(
            ingest_router,
            ingest_service,
            IngestApiConfig::default(),
            true,
            false,
        );
        let resp = warp::test::request()
            .path("/my-index/ingest")
            .method("POST")
            .json(&true)
            .body(r#"{"id": 1, "message": "push"}"#)
            .reply(&ingest_api_handlers)
            .await;
        assert_eq!(resp.status(), 429);
        universe.assert_quit().await;
    }

    #[tokio::test]
    async fn test_ingest_api_return_413_if_above_content_limit() {
        let config: IngestApiConfig =
            serde_json::from_str(r#"{ "content_length_limit": "1" }"#).unwrap();
        let (universe, _temp_dir, ingest_service, _) =
            setup_ingest_v1_service(&["my-index"], &IngestApiConfig::default()).await;
        let ingest_router = IngestRouterServiceClient::mocked();
        let ingest_api_handlers =
            ingest_api_handlers(ingest_router, ingest_service, config.clone(), true, false);
        let resp = warp::test::request()
            .path("/my-index/ingest")
            .method("POST")
            .json(&true)
            .body(r#"{"id": 1, "message": "push"}"#)
            .reply(&ingest_api_handlers)
            .await;
        assert_eq!(resp.status(), 413);
        universe.assert_quit().await;
    }

    #[tokio::test]
    async fn test_ingest_api_blocks_when_wait_is_specified() {
        let (universe, _temp_dir, ingest_service_client, ingest_service_mailbox) =
            setup_ingest_v1_service(&["my-index"], &IngestApiConfig::default()).await;
        let ingest_router = IngestRouterServiceClient::mocked();
        let ingest_api_handlers = ingest_api_handlers(
            ingest_router,
            ingest_service_client,
            IngestApiConfig::default(),
            true,
            false,
        );
        let handle = tokio::spawn(async move {
            let resp = warp::test::request()
                .path("/my-index/ingest?commit=wait_for")
                .method("POST")
                .json(&true)
                .body(r#"{"id": 1, "message": "push"}"#)
                .reply(&ingest_api_handlers)
                .await;
            assert_eq!(resp.status(), 200);
            let ingest_response: RestIngestResponse = serde_json::from_slice(resp.body()).unwrap();
            assert_eq!(ingest_response.num_docs_for_processing, 1);
        });
        universe.sleep(Duration::from_secs(10)).await;
        assert!(!handle.is_finished());
        assert_eq!(
            ingest_service_mailbox
                .ask_for_res(FetchRequest {
                    index_id: "my-index".to_string(),
                    start_after: None,
                    num_bytes_limit: None,
                })
                .await
                .unwrap()
                .doc_batch
                .unwrap()
                .num_docs(),
            1
        );
        ingest_service_mailbox
            .ask_for_res(SuggestTruncateRequest {
                index_id: "my-index".to_string(),
                up_to_position_included: 0,
            })
            .await
            .unwrap();
        handle.await.unwrap();
        universe.assert_quit().await;
    }

    #[tokio::test]
    async fn test_ingest_api_blocks_when_force_is_specified() {
        let (universe, _temp_dir, ingest_service_client, ingest_service_mailbox) =
            setup_ingest_v1_service(&["my-index"], &IngestApiConfig::default()).await;
        let ingest_router = IngestRouterServiceClient::mocked();
        let ingest_api_handlers = ingest_api_handlers(
            ingest_router,
            ingest_service_client,
            IngestApiConfig::default(),
            true,
            false,
        );
        let handle = tokio::spawn(async move {
            let resp = warp::test::request()
                .path("/my-index/ingest?commit=force")
                .method("POST")
                .json(&true)
                .body(r#"{"id": 1, "message": "push"}"#)
                .reply(&ingest_api_handlers)
                .await;
            assert_eq!(resp.status(), 200);
            let ingest_response: RestIngestResponse = serde_json::from_slice(resp.body()).unwrap();
            assert_eq!(ingest_response.num_docs_for_processing, 1);
        });
        universe.sleep(Duration::from_secs(10)).await;
        assert!(!handle.is_finished());
        assert_eq!(
            ingest_service_mailbox
                .ask_for_res(FetchRequest {
                    index_id: "my-index".to_string(),
                    start_after: None,
                    num_bytes_limit: None,
                })
                .await
                .unwrap()
                .doc_batch
                .unwrap()
                .num_docs(),
            2
        );
        ingest_service_mailbox
            .ask_for_res(SuggestTruncateRequest {
                index_id: "my-index".to_string(),
                up_to_position_included: 0,
            })
            .await
            .unwrap();
        handle.await.unwrap();
        universe.assert_quit().await;
    }

    #[tokio::test]
    async fn test_ingest_api_unsupported_detailed_errors() {
        let (universe, _temp_dir, ingest_service, _) =
            setup_ingest_v1_service(&["my-index"], &IngestApiConfig::default()).await;
        let ingest_router = IngestRouterServiceClient::mocked();
        let ingest_api_handlers = ingest_api_handlers(
            ingest_router,
            ingest_service,
            IngestApiConfig::default(),
            true,
            false,
        );
        let resp = warp::test::request()
            .path("/my-index/ingest?detailed_response=true")
            .method("POST")
            .json(&true)
            .body(r#"{"id": 1, "message": "push"}"#)
            .reply(&ingest_api_handlers)
            .await;
        assert_eq!(resp.status(), 400);
        universe.assert_quit().await;
    }
}


================================================
FILE: quickwit/quickwit-serve/src/jaeger_api/mod.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

mod model;
mod parse_duration;
mod rest_handler;
pub(crate) use rest_handler::{JaegerApi, jaeger_api_handlers};


================================================
FILE: quickwit/quickwit-serve/src/jaeger_api/model.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::HashMap;

use base64::prelude::{BASE64_STANDARD, Engine};
use itertools::Itertools;
use prost_types::{Duration, Timestamp};
use quickwit_proto::jaeger::api_v2::{KeyValue, Log, Process, Span, SpanRef, ValueType};
use serde::{Deserialize, Serialize};
use serde_json::{Value, json};
use serde_with::serde_as;
use warp::hyper::StatusCode;

pub(super) const DEFAULT_NUMBER_OF_TRACES: i32 = 20;

pub(super) fn build_jaeger_traces(spans: Vec<JaegerSpan>) -> anyhow::Result<Vec<JaegerTrace>> {
    let jaeger_traces: Vec<JaegerTrace> = spans
        .into_iter()
        .chunk_by(|span| span.trace_id.clone())
        .into_iter()
        .map(|(span_id, group)| JaegerTrace::new(span_id, group.collect()))
        .collect();
    Ok(jaeger_traces)
}

#[derive(Debug, Default, Clone, Serialize, Deserialize, PartialEq)]
#[serde(deny_unknown_fields)]
pub struct JaegerResponseBody<T> {
    pub data: T,
}

#[serde_with::skip_serializing_none]
#[derive(Clone, Default, Debug, Serialize, Deserialize, utoipa::IntoParams)]
#[serde(rename_all = "camelCase")]
#[serde(deny_unknown_fields)]
pub struct TracesSearchQueryParams {
    #[serde(default)]
    pub service: Option<String>,
    #[serde(default)]
    pub operation: Option<String>,
    // these are microsecond precision
    pub start: Option<i64>,
    pub end: Option<i64>,
    pub tags: Option<String>,
    // these are unit-suffixed numbers. in practice we only support precision up to the ms
    pub min_duration: Option<String>,
    pub max_duration: Option<String>,
    pub lookback: Option<String>,
    pub limit: Option<i32>,
}

// Jaeger Model for UI
// Source: https://github.com/jaegertracing/jaeger/blob/main/model/json/model.go#L82

#[derive(Clone, Default, Debug, PartialEq, Serialize, utoipa::IntoParams)]
#[serde(rename_all = "camelCase")]
pub struct JaegerTrace {
    #[serde(rename = "traceID")]
    #[serde(serialize_with = "serialize_bytes_to_hex")]
    trace_id: Vec<u8>,
    spans: Vec<JaegerSpan>,
    processes: HashMap<String, JaegerProcess>,
    warnings: Vec<String>,
}

impl JaegerTrace {
    pub fn new(trace_id: Vec<u8>, mut spans: Vec<JaegerSpan>) -> Self {
        let processes = Self::build_process_map(&mut spans);
        JaegerTrace {
            trace_id,
            spans,
            processes,
            warnings: Vec::new(),
        }
    }

    /// Processes a collection of spans, updating the `process_id` field based on the unique
    /// `service_name` values. The function uses an accumulator (`acc`) to keep track of
    /// processed `JaegerProcess` objects and assigns a new key to each unique `service_name` value.
    /// The logic has been replicated from
    /// <https://github.com/jaegertracing/jaeger/blob/995231c42cadd70bce2bbbf02579e33f6e6329c8/model/converter/json/process_hashtable.go#L37>
    /// TODO: use also tags to identify processes.
    fn build_process_map(spans: &mut [JaegerSpan]) -> HashMap<String, JaegerProcess> {
        let mut service_name_to_process_id: HashMap<String, String> = HashMap::new();
        let mut process_map: HashMap<String, JaegerProcess> = HashMap::new();
        let mut process_counter: i32 = 0;
        for span in spans.iter_mut() {
            let Some(current_process) = span.process.as_mut() else {
                continue;
            };
            if let Some(process_id) = service_name_to_process_id.get(&current_process.service_name)
            {
                span.process_id = Some(process_id.clone());
            } else {
                process_counter += 1;
                current_process.key = format!("p{process_counter}");
                span.process_id = Some(current_process.key.clone());
                process_map.insert(current_process.key.clone(), current_process.clone());
                service_name_to_process_id.insert(
                    current_process.service_name.clone(),
                    current_process.key.clone(),
                );
            }
        }
        process_map
    }
}

#[serde_as]
#[derive(Debug, Clone, PartialEq, Serialize)]
#[serde(rename_all = "camelCase")]
pub struct JaegerSpan {
    #[serde(rename = "traceID")]
    #[serde(serialize_with = "serialize_bytes_to_hex")]
    pub trace_id: Vec<u8>,
    #[serde(rename = "spanID")]
    #[serde(serialize_with = "serialize_bytes_to_hex")]
    span_id: Vec<u8>,
    operation_name: String,
    references: Vec<JaegerSpanRef>,
    #[serde(default)]
    flags: u32,
    start_time: i64, // start_time since Unix epoch
    duration: i64,   // microseconds
    tags: Vec<JaegerKeyValue>,
    logs: Vec<JaegerLog>,
    #[serde(default)]
    #[serde(skip_serializing)]
    process: Option<JaegerProcess>,
    #[serde(rename = "processID")]
    pub process_id: Option<String>,
    pub warnings: Vec<String>,
}

impl TryFrom<Span> for JaegerSpan {
    type Error = anyhow::Error;
    fn try_from(span: Span) -> Result<Self, Self::Error> {
        let references: Vec<JaegerSpanRef> =
            span.references.iter().map(JaegerSpanRef::from).collect();
        let tags: Vec<JaegerKeyValue> = span.tags.iter().map(JaegerKeyValue::from).collect();
        let logs: Vec<JaegerLog> = span.logs.iter().map(JaegerLog::from).collect();
        Ok(Self {
            trace_id: span.trace_id,
            span_id: span.span_id,
            operation_name: span.operation_name.clone(),
            references,
            flags: span.flags,
            start_time: span
                .start_time
                .as_ref()
                .map(convert_timestamp_to_microsecs)
                .unwrap_or(0),
            duration: span
                .duration
                .map(convert_duration_to_microsecs)
                .unwrap_or(0),
            tags,
            logs,
            process: span.process.map(JaegerProcess::from),
            process_id: None,
            warnings: span.warnings.iter().map(|s| s.to_string()).collect(),
        })
    }
}

#[derive(Debug, Clone, PartialEq, Serialize, Deserialize)]
#[serde(rename_all = "camelCase")]
pub struct JaegerSpanRef {
    #[serde(rename = "traceID")]
    #[serde(serialize_with = "serialize_bytes_to_hex")]
    trace_id: Vec<u8>,
    #[serde(rename = "spanID")]
    #[serde(serialize_with = "serialize_bytes_to_hex")]
    span_id: Vec<u8>,
    ref_type: String,
}

impl From<&SpanRef> for JaegerSpanRef {
    fn from(sr: &SpanRef) -> Self {
        Self {
            trace_id: sr.trace_id.clone(),
            span_id: sr.span_id.clone(),
            ref_type: if sr.ref_type == 0 {
                "CHILD_OF".to_string()
            } else {
                "FOLLOWS_FROM".to_string()
            },
        }
    }
}

#[derive(Debug, Clone, PartialEq, Serialize, Deserialize)]
pub struct JaegerKeyValue {
    key: String,
    #[serde(rename = "type")]
    value_type: String,
    value: Value,
}

impl From<&KeyValue> for JaegerKeyValue {
    fn from(kv: &KeyValue) -> Self {
        match kv.v_type {
            // String = 0,
            0 => Self {
                key: kv.key.to_string(),
                value_type: ValueType::String.as_str_name().to_lowercase(),
                value: json!(kv.v_str.to_string()),
            },
            // Bool = 1,
            1 => Self {
                key: kv.key.to_string(),
                value_type: ValueType::Bool.as_str_name().to_lowercase(),
                value: json!(kv.v_bool),
            },
            // Int64 = 2,
            2 => {
                if kv.v_int64 > 9007199254740991 {
                    Self {
                        key: kv.key.to_string(),
                        value_type: ValueType::Int64.as_str_name().to_lowercase(),
                        value: json!(kv.v_int64.to_string()),
                    }
                } else {
                    Self {
                        key: kv.key.to_string(),
                        value_type: ValueType::Int64.as_str_name().to_lowercase(),
                        value: json!(kv.v_int64),
                    }
                }
            }
            // Float64 = 3,
            3 => Self {
                key: kv.key.to_string(),
                value_type: ValueType::Float64.as_str_name().to_lowercase(),
                value: json!(kv.v_float64),
            },
            // Binary = 4,
            4 => Self {
                key: kv.key.to_string(),
                value_type: ValueType::Binary.as_str_name().to_lowercase(),
                value: serde_json::Value::String(BASE64_STANDARD.encode(kv.v_binary.as_slice())),
            },
            _ => Self {
                key: "no_value".to_string(),
                value_type: "unsupported_type".to_string(),
                value: Default::default(),
            },
        }
    }
}

#[derive(Debug, Clone, PartialEq, Serialize, Deserialize)]
pub struct JaegerLog {
    timestamp: i64, // microseconds since Unix epoch
    fields: Vec<JaegerKeyValue>,
}

impl From<&Log> for JaegerLog {
    fn from(log: &Log) -> Self {
        Self {
            timestamp: log
                .timestamp
                .as_ref()
                .map(convert_timestamp_to_microsecs)
                .unwrap_or(0),
            fields: log.fields.iter().map(JaegerKeyValue::from).collect(),
        }
    }
}

#[derive(Debug, Clone, PartialEq, Serialize, Deserialize)]
#[serde(rename_all = "camelCase")]
struct JaegerProcess {
    service_name: String,
    key: String,
    tags: Vec<JaegerKeyValue>,
}

impl Default for JaegerProcess {
    fn default() -> Self {
        Self {
            service_name: "none".to_string(),
            key: "".to_string(),
            tags: Vec::new(),
        }
    }
}

impl From<Process> for JaegerProcess {
    fn from(process: Process) -> Self {
        Self {
            service_name: process.service_name.to_string(),
            key: "".to_string(),
            tags: process.tags.iter().map(JaegerKeyValue::from).collect(),
        }
    }
}

#[derive(Debug, Clone, Serialize, Deserialize)]
pub struct JaegerError {
    #[serde(with = "http_serde::status_code")]
    pub status: StatusCode,
    pub message: String,
}

impl From<anyhow::Error> for JaegerError {
    fn from(error: anyhow::Error) -> Self {
        Self {
            status: StatusCode::INTERNAL_SERVER_ERROR,
            message: error.to_string(),
        }
    }
}

fn serialize_bytes_to_hex<S>(bytes: &Vec<u8>, s: S) -> Result<S::Ok, S::Error>
where S: serde::Serializer {
    s.serialize_str(&format!("{:0>16}", hex::encode(bytes)))
}

fn convert_timestamp_to_microsecs(timestamp: &Timestamp) -> i64 {
    timestamp.seconds * 1_000_000 + i64::from(timestamp.nanos / 1000)
}

fn convert_duration_to_microsecs(duration: Duration) -> i64 {
    duration.seconds * 1_000_000 + i64::from(duration.nanos / 1000)
}

#[cfg(test)]
mod tests {
    use quickwit_proto::jaeger::api_v2::Log;

    use crate::jaeger_api::model::{JaegerSpan, build_jaeger_traces};

    #[test]
    fn test_convert_grpc_jaeger_spans_into_jaeger_ui_model() {
        let file_content = std::fs::read_to_string(get_jaeger_ui_trace_filepath()).unwrap();
        let expected_jaeger_trace: serde_json::Value = serde_json::from_str(&file_content).unwrap();
        let grpc_spans = create_grpc_spans();
        let jaeger_spans: Vec<JaegerSpan> = grpc_spans
            .iter()
            .map(|span| super::JaegerSpan::try_from(span.clone()).unwrap())
            .collect();
        let traces = build_jaeger_traces(jaeger_spans).unwrap();
        let trace_json: serde_json::Value = serde_json::to_value(traces[0].clone()).unwrap();
        assert_json_diff::assert_json_eq!(expected_jaeger_trace, trace_json);
    }

    fn get_jaeger_ui_trace_filepath() -> String {
        format!(
            "{}/resources/tests/jaeger_ui_trace.json",
            env!("CARGO_MANIFEST_DIR"),
        )
    }

    fn create_grpc_spans() -> Vec<quickwit_proto::jaeger::api_v2::Span> {
        let span_0 = quickwit_proto::jaeger::api_v2::Span {
            trace_id: vec![1],
            span_id: vec![1],
            operation_name: "test-general-conversion".to_string(),
            start_time: Some(prost_types::Timestamp {
                seconds: 1485467191,
                nanos: 639875000,
            }),
            duration: Some(prost_types::Duration {
                seconds: 0,
                nanos: 5000,
            }),
            process: Some(quickwit_proto::jaeger::api_v2::Process {
                service_name: "service-x".to_string(),
                tags: Vec::new(),
            }),
            logs: vec![
                Log {
                    timestamp: Some(prost_types::Timestamp {
                        seconds: 1485467191,
                        nanos: 639875000,
                    }),
                    fields: vec![quickwit_proto::jaeger::api_v2::KeyValue {
                        key: "event".to_string(),
                        v_type: 0,
                        v_str: "some-event".to_string(),
                        ..Default::default()
                    }],
                },
                Log {
                    timestamp: Some(prost_types::Timestamp {
                        seconds: 1485467191,
                        nanos: 639875000,
                    }),
                    fields: vec![quickwit_proto::jaeger::api_v2::KeyValue {
                        key: "x".to_string(),
                        v_type: 0,
                        v_str: "y".to_string(),
                        ..Default::default()
                    }],
                },
            ],
            ..Default::default()
        };
        let span_1 = quickwit_proto::jaeger::api_v2::Span {
            operation_name: "some-operation".to_string(),
            trace_id: vec![1],
            span_id: vec![2],
            start_time: Some(prost_types::Timestamp {
                seconds: 1485467191,
                nanos: 639875000,
            }),
            duration: Some(prost_types::Duration {
                seconds: 0,
                nanos: 5000,
            }),
            process: Some(quickwit_proto::jaeger::api_v2::Process {
                service_name: "service-x".to_string(),
                tags: Vec::new(),
            }),
            process_id: "".to_string(),
            tags: vec![
                quickwit_proto::jaeger::api_v2::KeyValue {
                    key: "peer.service".to_string(),
                    v_type: 0,
                    v_str: "service-y".to_string(),
                    ..Default::default()
                },
                quickwit_proto::jaeger::api_v2::KeyValue {
                    key: "peer.ipv4".to_string(),
                    v_type: 2,
                    v_int64: 23456,
                    ..Default::default()
                },
                quickwit_proto::jaeger::api_v2::KeyValue {
                    key: "error".to_string(),
                    v_type: 1,
                    v_bool: true,
                    ..Default::default()
                },
                quickwit_proto::jaeger::api_v2::KeyValue {
                    key: "temperature".to_string(),
                    v_type: 3,
                    v_float64: 72.5,
                    ..Default::default()
                },
                quickwit_proto::jaeger::api_v2::KeyValue {
                    key: "javascript_limit".to_string(),
                    v_type: 2,
                    v_int64: 9223372036854775222,
                    ..Default::default()
                },
                quickwit_proto::jaeger::api_v2::KeyValue {
                    key: "blob".to_string(),
                    v_type: 4,
                    v_binary: vec![0b0, 0b0, 0b00110000, 0b00111001],
                    ..Default::default()
                },
            ],
            ..Default::default()
        };
        let span_2 = quickwit_proto::jaeger::api_v2::Span {
            operation_name: "some-operation".to_string(),
            trace_id: vec![1],
            span_id: vec![3],
            references: vec![quickwit_proto::jaeger::api_v2::SpanRef {
                trace_id: vec![1],
                span_id: vec![2],
                ref_type: 0,
            }],
            start_time: Some(prost_types::Timestamp {
                seconds: 1485467191,
                nanos: 639875000,
            }),
            duration: Some(prost_types::Duration {
                seconds: 0,
                nanos: 5000,
            }),
            process: Some(quickwit_proto::jaeger::api_v2::Process {
                service_name: "service-y".to_string(),
                tags: Vec::new(),
            }),
            process_id: "".to_string(),
            ..Default::default()
        };
        let span_3 = quickwit_proto::jaeger::api_v2::Span {
            operation_name: "reference-test".to_string(),
            trace_id: vec![1],
            span_id: vec![4],
            references: vec![
                quickwit_proto::jaeger::api_v2::SpanRef {
                    trace_id: vec![255],
                    span_id: vec![255],
                    ref_type: 0,
                },
                quickwit_proto::jaeger::api_v2::SpanRef {
                    trace_id: vec![1],
                    span_id: vec![2],
                    ref_type: 0,
                },
                quickwit_proto::jaeger::api_v2::SpanRef {
                    trace_id: vec![1],
                    span_id: vec![2],
                    ref_type: 1,
                },
            ],
            start_time: Some(prost_types::Timestamp {
                seconds: 1485467191,
                nanos: 639875000,
            }),
            duration: Some(prost_types::Duration {
                seconds: 0,
                nanos: 5000,
            }),
            process: Some(quickwit_proto::jaeger::api_v2::Process {
                service_name: "service-y".to_string(),
                tags: Vec::new(),
            }),
            process_id: "".to_string(),
            warnings: vec!["some span warning".to_string()],
            ..Default::default()
        };
        let span_4 = quickwit_proto::jaeger::api_v2::Span {
            operation_name: "preserveParentID-test".to_string(),
            trace_id: vec![1],
            span_id: vec![5],
            references: vec![quickwit_proto::jaeger::api_v2::SpanRef {
                trace_id: vec![1],
                span_id: vec![4],
                ref_type: 0,
            }],
            start_time: Some(prost_types::Timestamp {
                seconds: 1485467191,
                nanos: 639875000,
            }),
            duration: Some(prost_types::Duration {
                seconds: 0,
                nanos: 4000,
            }),
            process: Some(quickwit_proto::jaeger::api_v2::Process {
                service_name: "service-y".to_string(),
                tags: Vec::new(),
            }),
            process_id: "".to_string(),
            warnings: vec!["some span warning".to_string()],
            ..Default::default()
        };
        vec![span_0, span_1, span_2, span_3, span_4]
    }
}


================================================
FILE: quickwit/quickwit-serve/src/jaeger_api/parse_duration.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use prost_types::{Duration as ProstDuration, Timestamp as ProstTimestamp};

pub(crate) fn parse_duration_with_units(duration_string: String) -> anyhow::Result<ProstDuration> {
    parse_duration_nanos(&duration_string)
        .map(to_well_known_timestamp)
        .map(|timestamp| ProstDuration {
            seconds: timestamp.seconds,
            nanos: timestamp.nanos,
        })
        .map_err(|error| anyhow::anyhow!("Failed to parse duration: {:?}", error))
}

pub(crate) fn to_well_known_timestamp(timestamp_nanos: i64) -> ProstTimestamp {
    let seconds = timestamp_nanos / 1_000_000_000;
    let nanos = (timestamp_nanos % 1_000_000_000) as i32;
    ProstTimestamp { seconds, nanos }
}

/// Parses a duration string and return duration in nanoseconds.
/// A duration string is a possibly signed sequence of decimal numbers, each
/// with optional fraction and a unit suffix, such as "300ms", "-1.5h".
///
/// Valid time units are "ns", "us" (or "µs"), "ms", "s", "m", "h".
fn parse_duration_nanos(input: &str) -> anyhow::Result<i64> {
    let mut num_str = String::new();
    for ch in input.trim().chars() {
        if ch.is_ascii_digit() || ch == '.' || ch == '-' {
            num_str.push(ch);
            continue;
        }
        if ch.is_alphabetic() {
            let unit = &input[num_str.len()..];
            let num: f64 = num_str.parse()?;
            let duration: f64 = match unit {
                "ns" => num,
                "us" | "µs" => num * 1000.0,
                "ms" => num * 1_000_000.0,
                "s" => num * 1_000_000_000.0,
                "m" => num * 60.0 * 1_000_000_000.0,
                "h" => num * 3600.0 * 1_000_000_000.0,
                _ => anyhow::bail!("Invalid time unit: {}", unit),
            };
            if num < i64::MIN as f64 || num > i64::MAX as f64 {
                anyhow::bail!("Invalid duration: {}", num_str)
            }
            return Ok(duration.round() as i64);
        } else {
            anyhow::bail!("Invalid duration string")
        }
    }
    anyhow::bail!("Invalid duration string")
}

#[cfg(test)]
mod tests {
    use crate::jaeger_api::parse_duration::parse_duration_nanos;

    #[test]
    fn test_parse_duration_nanos() {
        // Test valid duration strings
        assert_eq!(parse_duration_nanos("300ns").unwrap(), 300);
        assert_eq!(parse_duration_nanos("1us").unwrap(), 1000);
        assert_eq!(parse_duration_nanos("2.5ms").unwrap(), 2500000);
        assert_eq!(parse_duration_nanos("3s").unwrap(), 3000000000);
        assert_eq!(parse_duration_nanos("4m").unwrap(), 240000000000);
        assert_eq!(parse_duration_nanos("5h").unwrap(), 18000000000000);
        assert_eq!(parse_duration_nanos("-100ns").unwrap(), -100);
        assert_eq!(parse_duration_nanos("-2us").unwrap(), -2000);
        assert_eq!(parse_duration_nanos("-3.5ms").unwrap(), -3500000);
        assert_eq!(parse_duration_nanos("-4s").unwrap(), -4000000000);
        assert_eq!(parse_duration_nanos("-5m").unwrap(), -300000000000);
        assert_eq!(parse_duration_nanos("-6h").unwrap(), -21600000000000);

        // Test invalid duration strings
        assert!(parse_duration_nanos("abc").is_err());
        assert!(parse_duration_nanos("1.2.3s").is_err());
        assert!(parse_duration_nanos("1-.23s").is_err());
    }
}


================================================
FILE: quickwit/quickwit-serve/src/jaeger_api/rest_handler.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::HashMap;
use std::time::Instant;

use itertools::Itertools;
use quickwit_jaeger::JaegerService;
use quickwit_proto::jaeger::storage::v1::{
    FindTracesRequest, GetOperationsRequest, GetServicesRequest, GetTraceRequest,
    SpansResponseChunk, TraceQueryParameters,
};
use quickwit_proto::tonic;
use tokio_stream::StreamExt;
use tokio_stream::wrappers::ReceiverStream;
use tracing::error;
use warp::hyper::StatusCode;
use warp::{Filter, Rejection};

use super::model::build_jaeger_traces;
use super::parse_duration::{parse_duration_with_units, to_well_known_timestamp};
use crate::jaeger_api::model::{
    DEFAULT_NUMBER_OF_TRACES, JaegerError, JaegerResponseBody, JaegerSpan, JaegerTrace,
    TracesSearchQueryParams,
};
use crate::rest::recover_fn;
use crate::rest_api_response::RestApiResponse;
use crate::search_api::extract_index_id_patterns;
use crate::{BodyFormat, require};

#[derive(utoipa::OpenApi)]
#[openapi(paths(
    jaeger_services_handler,
    jaeger_service_operations_handler,
    jaeger_traces_search_handler,
    jaeger_traces_handler
))]
pub(crate) struct JaegerApi;

/// Setup Jaeger API handlers
///
/// This is where all Jaeger handlers
/// should be registered.
/// Request are executed on the `otel-traces-v0_*` indexes.
pub(crate) fn jaeger_api_handlers(
    jaeger_service_opt: Option<JaegerService>,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    jaeger_services_handler(jaeger_service_opt.clone())
        .or(jaeger_service_operations_handler(
            jaeger_service_opt.clone(),
        ))
        .or(jaeger_traces_search_handler(jaeger_service_opt.clone()))
        .or(jaeger_traces_handler(jaeger_service_opt.clone()))
        .recover(recover_fn)
        .boxed()
}

fn jaeger_api_path_filter() -> impl Filter<Extract = (Vec<String>,), Error = Rejection> + Clone {
    warp::path!(String / "jaeger" / "api" / ..)
        .and(warp::get())
        .and_then(extract_index_id_patterns)
}

#[utoipa::path(
    get,
    tag = "Jaeger",
    path = "/{otel-traces-index-id}/jaeger/api/services",
    responses(
        (status = 200, description = "Successfully fetched services names.", body = JaegerResponseBody )
    ),
    params(
        ("otel-traces-index-id" = String, Path, description = "The name of the index to get services for.")
    )
)]
pub fn jaeger_services_handler(
    jaeger_service_opt: Option<JaegerService>,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    jaeger_api_path_filter()
        .and(warp::path!("services"))
        .and(require(jaeger_service_opt))
        .then(jaeger_services)
        .map(|result| make_jaeger_api_response(result, BodyFormat::default()))
}

#[utoipa::path(
    get,
    tag = "Jaeger",
    path = "/{otel-traces-index-id}/jaeger/api/services/{service}/operations",
    responses(
        (status = 200, description = "Successfully fetched operations names the given service.", body = JaegerResponseBody )
    ),
    params(
        ("otel-traces-index-id" = String, Path, description = "The name of the index to get operations for."),
        ("service" = String, Path, description = "The name of the service to get operations for."),
    )
)]
pub fn jaeger_service_operations_handler(
    jaeger_service_opt: Option<JaegerService>,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    jaeger_api_path_filter()
        .and(warp::path!("services" / String / "operations"))
        .and(require(jaeger_service_opt))
        .then(jaeger_service_operations)
        .map(|result| make_jaeger_api_response(result, BodyFormat::default()))
}

#[utoipa::path(
    get,
    tag = "Jaeger",
    path = "/{otel-traces-index-id}/jaeger/api/traces",
    responses(
        (status = 200, description = "Successfully fetched traces information.", body = JaegerResponseBody )
    ),
    params(
        ("otel-traces-index-id" = String, Path, description = "The name of the index to get traces for."),
        ("service" = Option<String>, Query, description = "The service name."),
        ("operation" = Option<String>, Query, description = "The operation name."),
        ("start" = Option<i64>, Query, description = "The start time in nanoseconds."),
        ("end" = Option<i64>, Query, description = "The end time in nanoseconds."),
        ("tags" = Option<String>, Query, description = "Sets tags with values in the logfmt format, such as error=true status=200."),
        ("min_duration" = Option<String>, Query, description = "Filters all traces with a duration higher than the set value. Possible values are 1.2s, 100ms, 500us."),
        ("max_duration" = Option<String>, Query, description = "Filters all traces with a duration lower than the set value. Possible values are 1.2s, 100ms, 500us."),
        ("limit" = Option<i32>, Query, description = "Limits the number of traces returned."),
    )
)]
pub fn jaeger_traces_search_handler(
    jaeger_service_opt: Option<JaegerService>,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    jaeger_api_path_filter()
        .and(warp::path!("traces"))
        .and(warp::query())
        .and(require(jaeger_service_opt))
        .then(jaeger_traces_search)
        .map(|result| make_jaeger_api_response(result, BodyFormat::default()))
}

#[utoipa::path(
    get,
    tag = "Jaeger",
    path = "/{otel-traces-index-id}/jaeger/api/traces/{id}",
    responses(
        (status = 200, description = "Successfully fetched traces spans for the provided trace ID.", body = JaegerResponseBody )
    ),
    params(
        ("otel-traces-index-id" = String, Path, description = "The name of the index to get traces for."),
        ("id" = String, Path, description = "The ID of the trace to get spans for."),
    )
)]
pub fn jaeger_traces_handler(
    jaeger_service_opt: Option<JaegerService>,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    jaeger_api_path_filter()
        .and(warp::path!("traces" / String))
        .and(warp::get())
        .and(require(jaeger_service_opt))
        .then(jaeger_get_trace_by_id)
        .map(|result| make_jaeger_api_response(result, BodyFormat::default()))
}

async fn jaeger_services(
    index_id_patterns: Vec<String>,
    jaeger_service: JaegerService,
) -> Result<JaegerResponseBody<Vec<String>>, JaegerError> {
    let get_services_response = jaeger_service
        .get_services_for_indexes(GetServicesRequest {}, index_id_patterns)
        .await
        .map_err(|error| JaegerError {
            status: StatusCode::INTERNAL_SERVER_ERROR,
            message: format!("failed to fetch services: {error}"),
        })?;
    Ok(JaegerResponseBody::<Vec<String>> {
        data: get_services_response.services,
    })
}

async fn jaeger_service_operations(
    index_id_patterns: Vec<String>,
    service_name: String,
    jaeger_service: JaegerService,
) -> Result<JaegerResponseBody<Vec<String>>, JaegerError> {
    let get_operations_request = GetOperationsRequest {
        service: service_name,
        span_kind: "".to_string(),
    };
    let get_operations_response = jaeger_service
        .get_operations_for_indexes(get_operations_request, index_id_patterns)
        .await
        .map_err(|error| JaegerError {
            status: StatusCode::INTERNAL_SERVER_ERROR,
            message: format!("failed to fetch services: {error}"),
        })?;

    let operations = get_operations_response
        .operations
        .into_iter()
        .map(|op| op.name)
        .collect_vec();
    Ok(JaegerResponseBody::<Vec<String>> { data: operations })
}

async fn jaeger_traces_search(
    index_id_patterns: Vec<String>,
    search_params: TracesSearchQueryParams,
    jaeger_service: JaegerService,
) -> Result<JaegerResponseBody<Vec<JaegerTrace>>, JaegerError> {
    let duration_min = search_params
        .min_duration
        .map(parse_duration_with_units)
        .transpose()?;
    let duration_max = search_params
        .max_duration
        .map(parse_duration_with_units)
        .transpose()?;
    let tags = search_params
        .tags
        .clone()
        .map(|s| {
            serde_json::from_str::<HashMap<String, String>>(&s).map_err(|error| {
                let error_msg = format!(
                    "failed to deserialize tags `{:?}`: {:?}",
                    search_params.tags, error
                );
                error!(error_msg);
                JaegerError {
                    status: StatusCode::INTERNAL_SERVER_ERROR,
                    message: error_msg,
                }
            })
        })
        .transpose()?
        .unwrap_or(Default::default());
    let query = TraceQueryParameters {
        service_name: search_params.service.unwrap_or_default(),
        operation_name: search_params.operation.unwrap_or_default(),
        tags,
        start_time_min: search_params
            .start
            .map(|ts| to_well_known_timestamp(ts * 1000)),
        start_time_max: search_params
            .end
            .map(|ts| to_well_known_timestamp(ts * 1000)),
        duration_min,
        duration_max,
        num_traces: search_params.limit.unwrap_or(DEFAULT_NUMBER_OF_TRACES),
    };
    let find_traces_request = FindTracesRequest { query: Some(query) };
    let spans_chunk_stream = jaeger_service
        .find_traces_for_indexes(
            find_traces_request,
            "find_traces",
            Instant::now(),
            index_id_patterns,
            true,
        )
        .await
        .map_err(|error| {
            error!(error = ?error, "failed to fetch traces");
            JaegerError {
                status: StatusCode::INTERNAL_SERVER_ERROR,
                message: "failed to fetch traces".to_string(),
            }
        })?;
    let jaeger_spans = collect_and_build_jaeger_spans(spans_chunk_stream).await?;
    let jaeger_traces: Vec<JaegerTrace> = build_jaeger_traces(jaeger_spans)?;
    Ok(JaegerResponseBody {
        data: jaeger_traces,
    })
}

async fn collect_and_build_jaeger_spans(
    mut spans_chunk_stream: ReceiverStream<Result<SpansResponseChunk, tonic::Status>>,
) -> anyhow::Result<Vec<JaegerSpan>> {
    let mut all_spans = Vec::<JaegerSpan>::new();
    while let Some(Ok(SpansResponseChunk { spans })) = spans_chunk_stream.next().await {
        let jaeger_spans: Vec<JaegerSpan> =
            spans.into_iter().map(JaegerSpan::try_from).try_collect()?;
        all_spans.extend(jaeger_spans);
    }
    Ok(all_spans)
}

async fn jaeger_get_trace_by_id(
    index_id_patterns: Vec<String>,
    trace_id_string: String,
    jaeger_service: JaegerService,
) -> Result<JaegerResponseBody<Vec<JaegerTrace>>, JaegerError> {
    let trace_id = hex::decode(trace_id_string.clone()).map_err(|error| {
        error!(error = ?error, "failed to decode trace `{}`", trace_id_string.clone());
        JaegerError {
            status: StatusCode::INTERNAL_SERVER_ERROR,
            message: "failed to decode trace id".to_string(),
        }
    })?;
    let get_trace_request = GetTraceRequest { trace_id };
    let spans_chunk_stream: ReceiverStream<Result<SpansResponseChunk, tonic::Status>> =
        jaeger_service
            .get_trace_for_indexes(
                get_trace_request,
                "get_trace",
                Instant::now(),
                index_id_patterns,
            )
            .await
            .map_err(|error| {
                error!(error = ?error, "failed to fetch trace `{trace_id_string}`");
                JaegerError {
                    status: StatusCode::INTERNAL_SERVER_ERROR,
                    message: "failed to fetch trace".to_string(),
                }
            })?;
    let jaeger_spans = collect_and_build_jaeger_spans(spans_chunk_stream).await?;
    let jaeger_traces: Vec<JaegerTrace> = build_jaeger_traces(jaeger_spans)?;
    Ok(JaegerResponseBody {
        data: jaeger_traces,
    })
}

fn make_jaeger_api_response<T: serde::Serialize>(
    jaeger_result: Result<T, JaegerError>,
    body_format: BodyFormat,
) -> RestApiResponse {
    let status_code = match &jaeger_result {
        Ok(_) => StatusCode::OK,
        Err(err) => err.status,
    };
    RestApiResponse::new(&jaeger_result, status_code, body_format)
}

#[cfg(test)]
mod tests {
    use std::collections::HashMap;
    use std::sync::Arc;

    use quickwit_config::JaegerConfig;
    use quickwit_opentelemetry::otlp::OTEL_TRACES_INDEX_ID;
    use quickwit_search::MockSearchService;
    use serde_json::Value as JsonValue;

    use super::*;
    use crate::recover_fn;

    #[tokio::test]
    async fn test_when_jaeger_not_found() {
        let jaeger_api_handler = jaeger_api_handlers(None).recover(crate::rest::recover_fn_final);
        let resp = warp::test::request()
            .path("/otel-traces-v0_9/jaeger/api/services")
            .reply(&jaeger_api_handler)
            .await;
        assert_eq!(resp.status(), 404);
        let error_body = serde_json::from_slice::<HashMap<String, String>>(resp.body()).unwrap();
        assert!(error_body.contains_key("message"));
        assert_eq!(error_body.get("message").unwrap(), "Route not found");
    }

    #[tokio::test]
    async fn test_jaeger_services() -> anyhow::Result<()> {
        let mut mock_search_service = MockSearchService::new();
        mock_search_service
            .expect_root_list_terms()
            .withf(|req| {
                req.index_id_patterns == vec![OTEL_TRACES_INDEX_ID]
                    && req.field == "service_name"
                    && req.start_timestamp.is_some()
            })
            .return_once(|_| {
                Ok(quickwit_proto::search::ListTermsResponse {
                    num_hits: 0,
                    terms: Vec::new(),
                    elapsed_time_micros: 0,
                    errors: Vec::new(),
                })
            });
        let mock_search_service = Arc::new(mock_search_service);
        let jaeger = JaegerService::new(JaegerConfig::default(), mock_search_service);

        let jaeger_api_handler = jaeger_api_handlers(Some(jaeger)).recover(recover_fn);
        let resp = warp::test::request()
            .path("/otel-traces-v0_9/jaeger/api/services")
            .reply(&jaeger_api_handler)
            .await;
        assert_eq!(resp.status(), 200);
        let actual_response_json: JsonValue = serde_json::from_slice(resp.body())?;
        assert!(
            actual_response_json
                .get("data")
                .unwrap()
                .as_array()
                .unwrap()
                .is_empty()
        );
        Ok(())
    }

    #[tokio::test]
    async fn test_jaeger_service_operations() {
        let mut mock_search_service = MockSearchService::new();
        mock_search_service
            .expect_root_list_terms()
            .withf(|req| {
                req.index_id_patterns == vec![OTEL_TRACES_INDEX_ID]
                    && req.field == "span_fingerprint"
                    && req.start_timestamp.is_some()
            })
            .return_once(|_| {
                Ok(quickwit_proto::search::ListTermsResponse {
                    num_hits: 1,
                    terms: Vec::new(),
                    elapsed_time_micros: 0,
                    errors: Vec::new(),
                })
            });
        let mock_search_service = Arc::new(mock_search_service);
        let jaeger = JaegerService::new(JaegerConfig::default(), mock_search_service);
        let jaeger_api_handler = jaeger_api_handlers(Some(jaeger)).recover(recover_fn);
        let resp = warp::test::request()
            .path("/otel-traces-v0_9/jaeger/api/services/service1/operations")
            .reply(&jaeger_api_handler)
            .await;
        assert_eq!(resp.status(), 200);
        let actual_response_json: JsonValue = serde_json::from_slice(resp.body()).unwrap();
        assert!(
            actual_response_json
                .get("data")
                .unwrap()
                .as_array()
                .unwrap()
                .is_empty()
        );
    }

    #[tokio::test]
    async fn test_jaeger_traces_search() {
        let mut mock_search_service = MockSearchService::new();
        mock_search_service
            .expect_root_search()
            .withf(|req| {
                assert!(req.query_ast.contains(
                    "{\"type\":\"term\",\"field\":\"resource_attributes.tag.first\",\"value\":\"\
                     common\"}"
                ));
                assert!(req.query_ast.contains(
                    "{\"type\":\"term\",\"field\":\"resource_attributes.tag.second\",\"value\":\"\
                     true\"}"
                ));
                assert!(req.query_ast.contains(
                    "{\"type\":\"term\",\"field\":\"resource_attributes.tag.second\",\"value\":\"\
                     true\"}"
                ));
                // no lowerbound because minDuration < 1ms,
                assert!(req.query_ast.contains(
                    "{\"type\":\"range\",\"field\":\"span_duration_millis\",\"lower_bound\":\"\
                     Unbounded\",\"upper_bound\":{\"Included\":1200}}"
                ));
                assert_eq!(req.start_timestamp, Some(1702352106));
                // TODO(trinity) i think we have an off by 1 here, imo this should be rounded up
                assert_eq!(req.end_timestamp, Some(1702373706));
                assert_eq!(
                    req.index_id_patterns,
                    vec![OTEL_TRACES_INDEX_ID.to_string()]
                );
                true
            })
            .return_once(|_| {
                Ok(quickwit_proto::search::SearchResponse {
                    num_hits: 0,
                    hits: Vec::new(),
                    elapsed_time_micros: 0,
                    errors: Vec::new(),
                    aggregation_postcard: None,
                    scroll_id: None,
                    failed_splits: Vec::new(),
                    num_successful_splits: 1,
                })
            });
        let mock_search_service = Arc::new(mock_search_service);
        let jaeger = JaegerService::new(JaegerConfig::default(), mock_search_service);
        let jaeger_api_handler = jaeger_api_handlers(Some(jaeger)).recover(recover_fn);
        let resp = warp::test::request()
            .path(
                "/otel-traces-v0_9/jaeger/api/traces?service=quickwit&\
                 operation=delete_splits_marked_for_deletion&minDuration=500us&maxDuration=1.2s&\
                 tags=%7B%22tag.first%22%3A%22common%22%2C%22tag.second%22%3A%22true%22%7D&\
                 limit=1&start=1702352106016000&end=1702373706016000&lookback=custom",
            )
            .reply(&jaeger_api_handler)
            .await;
        assert_eq!(resp.status(), 200);
    }

    #[tokio::test]
    async fn test_jaeger_trace_by_id() {
        let mut mock_search_service = MockSearchService::new();
        mock_search_service
            .expect_root_search()
            .withf(|req| req.index_id_patterns == vec![OTEL_TRACES_INDEX_ID.to_string()])
            .return_once(|_| {
                Ok(quickwit_proto::search::SearchResponse {
                    num_hits: 0,
                    hits: Vec::new(),
                    elapsed_time_micros: 0,
                    errors: Vec::new(),
                    aggregation_postcard: None,
                    scroll_id: None,
                    failed_splits: Vec::new(),
                    num_successful_splits: 1,
                })
            });
        let mock_search_service = Arc::new(mock_search_service);
        let jaeger = JaegerService::new(JaegerConfig::default(), mock_search_service);

        let jaeger_api_handler = jaeger_api_handlers(Some(jaeger)).recover(recover_fn);
        let resp = warp::test::request()
            .path("/otel-traces-v0_9/jaeger/api/traces/1506026ddd216249555653218dc88a6c")
            .reply(&jaeger_api_handler)
            .await;

        assert_eq!(resp.status(), 200);
        let actual_response_json: JsonValue = serde_json::from_slice(resp.body()).unwrap();
        assert!(
            actual_response_json
                .get("data")
                .unwrap()
                .as_array()
                .unwrap()
                .is_empty()
        );
    }
}


================================================
FILE: quickwit/quickwit-serve/src/lib.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#![recursion_limit = "256"]

mod build_info;
mod cluster_api;
mod decompression;
mod delete_task_api;
mod developer_api;
mod elasticsearch_api;
mod format;
mod grpc;
mod health_check_api;
mod index_api;
mod indexing_api;
mod ingest_api;
mod jaeger_api;
mod load_shield;
mod metrics;
mod metrics_api;
mod node_info_handler;
mod openapi;
mod otlp_api;
mod rate_modulator;
mod rest;
mod rest_api_response;
mod search_api;
pub(crate) mod simple_list;
pub mod tcp_listener;
mod template_api;
mod ui_handler;

use std::collections::{HashMap, HashSet};
use std::convert::Infallible;
use std::fs;
use std::net::SocketAddr;
use std::num::NonZeroUsize;
use std::sync::Arc;
use std::time::Duration;

use anyhow::{Context, bail};
use bytesize::ByteSize;
pub(crate) use decompression::Body;
pub use format::BodyFormat;
use futures::StreamExt;
use itertools::Itertools;
use once_cell::sync::Lazy;
use quickwit_actors::{ActorExitStatus, Mailbox, SpawnContext, Universe};
use quickwit_cluster::{
    Cluster, ClusterChange, ClusterChangeStream, ClusterNode, ListenerHandle, start_cluster_service,
};
use quickwit_common::pubsub::{EventBroker, EventSubscriptionHandle};
use quickwit_common::rate_limiter::RateLimiterSettings;
use quickwit_common::retry::RetryParams;
use quickwit_common::runtimes::RuntimesConfig;
use quickwit_common::tower::{
    BalanceChannel, BoxFutureInfaillible, BufferLayer, Change, CircuitBreakerEvaluator,
    ConstantRate, EstimateRateLayer, EventListenerLayer, GrpcMetricsLayer, LoadShedLayer,
    RateLimitLayer, RetryLayer, RetryPolicy, SmaRateEstimator, TimeoutLayer,
};
use quickwit_common::uri::Uri;
use quickwit_common::{get_bool_from_env, spawn_named_task};
use quickwit_config::service::QuickwitService;
use quickwit_config::{ClusterConfig, IngestApiConfig, NodeConfig};
use quickwit_control_plane::control_plane::{ControlPlane, ControlPlaneEventSubscriber};
use quickwit_control_plane::{IndexerNodeInfo, IndexerPool};
use quickwit_index_management::{IndexService as IndexManager, IndexServiceError};
use quickwit_indexing::actors::IndexingService;
use quickwit_indexing::models::ShardPositionsService;
use quickwit_indexing::start_indexing_service;
use quickwit_ingest::{
    GetMemoryCapacity, IngestRequest, IngestRouter, IngestServiceClient, Ingester, IngesterPool,
    IngesterPoolEntry, LocalShardsUpdate, get_idle_shard_timeout,
    setup_ingester_capacity_update_listener, setup_local_shards_update_listener,
    start_ingest_api_service, try_get_ingester_status, wait_for_ingester_decommission,
    wait_for_ingester_status,
};
use quickwit_jaeger::JaegerService;
use quickwit_janitor::{JanitorService, start_janitor_service};
use quickwit_metastore::{
    ControlPlaneMetastore, ListIndexesMetadataResponseExt, MetastoreResolver,
};
use quickwit_opentelemetry::otlp::{OtlpGrpcLogsService, OtlpGrpcTracesService};
use quickwit_proto::control_plane::ControlPlaneServiceClient;
use quickwit_proto::indexing::{IndexingServiceClient, ShardPositionsUpdate};
use quickwit_proto::ingest::ingester::{
    IngesterService, IngesterServiceClient, IngesterServiceTowerLayerStack, IngesterStatus,
    PersistFailureReason, PersistResponse,
};
use quickwit_proto::ingest::router::IngestRouterServiceClient;
use quickwit_proto::ingest::{IngestV2Error, RateLimitingCause};
use quickwit_proto::metastore::{
    EntityKind, ListIndexesMetadataRequest, MetastoreError, MetastoreService,
    MetastoreServiceClient,
};
use quickwit_proto::search::ReportSplitsRequest;
use quickwit_proto::types::NodeId;
use quickwit_search::{
    SearchJobPlacer, SearchService, SearchServiceClient, SearcherContext, SearcherPool,
    create_search_client_from_channel, start_searcher_service,
};
use quickwit_storage::{SplitCache, StorageResolver};
use tcp_listener::TcpListenerResolver;
use tokio::sync::oneshot;
use tonic::codec::CompressionEncoding;
use tonic_health::ServingStatus;
use tonic_health::server::HealthReporter;
use tower::ServiceBuilder;
use tower::timeout::Timeout;
use tracing::{debug, error, info, warn};
use warp::{Filter, Rejection};

pub use crate::build_info::{BuildInfo, RuntimeInfo};
pub use crate::index_api::{ListSplitsQueryParams, ListSplitsResponse};
pub use crate::ingest_api::{RestIngestResponse, RestParseFailure};
pub use crate::metrics::SERVE_METRICS;
use crate::rate_modulator::RateModulator;
#[cfg(test)]
use crate::rest::recover_fn;
pub use crate::search_api::{SearchRequestQueryString, SortBy, search_request_from_api_request};

const READINESS_REPORTING_INTERVAL: Duration = if cfg!(any(test, feature = "testsuite")) {
    Duration::from_millis(25)
} else {
    Duration::from_secs(10)
};

const METASTORE_CLIENT_MAX_CONCURRENCY_ENV_KEY: &str = "QW_METASTORE_CLIENT_MAX_CONCURRENCY";
const DEFAULT_METASTORE_CLIENT_MAX_CONCURRENCY: usize = 6;
const DISABLE_DELETE_TASK_SERVICE_ENV_KEY: &str = "QW_DISABLE_DELETE_TASK_SERVICE";

pub type EnvFilterReloadFn = Arc<dyn Fn(&str) -> anyhow::Result<()> + Send + Sync>;

pub fn do_nothing_env_filter_reload_fn() -> EnvFilterReloadFn {
    Arc::new(|_| Ok(()))
}

fn get_metastore_client_max_concurrency() -> usize {
    quickwit_common::get_from_env(
        METASTORE_CLIENT_MAX_CONCURRENCY_ENV_KEY,
        DEFAULT_METASTORE_CLIENT_MAX_CONCURRENCY,
        false,
    )
}

static CP_GRPC_CLIENT_METRICS_LAYER: Lazy<GrpcMetricsLayer> =
    Lazy::new(|| GrpcMetricsLayer::new("control_plane", "client"));
static CP_GRPC_SERVER_METRICS_LAYER: Lazy<GrpcMetricsLayer> =
    Lazy::new(|| GrpcMetricsLayer::new("control_plane", "server"));

static INDEXING_GRPC_CLIENT_METRICS_LAYER: Lazy<GrpcMetricsLayer> =
    Lazy::new(|| GrpcMetricsLayer::new("indexing", "client"));
pub(crate) static INDEXING_GRPC_SERVER_METRICS_LAYER: Lazy<GrpcMetricsLayer> =
    Lazy::new(|| GrpcMetricsLayer::new("indexing", "server"));

static INGEST_GRPC_CLIENT_METRICS_LAYER: Lazy<GrpcMetricsLayer> =
    Lazy::new(|| GrpcMetricsLayer::new("ingest", "client"));
static INGEST_GRPC_SERVER_METRICS_LAYER: Lazy<GrpcMetricsLayer> =
    Lazy::new(|| GrpcMetricsLayer::new("ingest", "server"));

static METASTORE_GRPC_CLIENT_METRICS_LAYER: Lazy<GrpcMetricsLayer> =
    Lazy::new(|| GrpcMetricsLayer::new("metastore", "client"));
static METASTORE_GRPC_SERVER_METRICS_LAYER: Lazy<GrpcMetricsLayer> =
    Lazy::new(|| GrpcMetricsLayer::new("metastore", "server"));

static GRPC_INGESTER_SERVICE_TIMEOUT: Duration = Duration::from_secs(30);
static GRPC_INDEXING_SERVICE_TIMEOUT: Duration = Duration::from_secs(30);
static GRPC_METASTORE_SERVICE_TIMEOUT: Duration = Duration::from_secs(10);

struct QuickwitServices {
    pub node_config: Arc<NodeConfig>,
    pub cluster: Cluster,
    pub metastore_server_opt: Option<MetastoreServiceClient>,
    pub metastore_client: MetastoreServiceClient,
    pub control_plane_server_opt: Option<Mailbox<ControlPlane>>,
    pub control_plane_client: ControlPlaneServiceClient,
    pub index_manager: IndexManager,
    pub indexing_service_opt: Option<Mailbox<IndexingService>>,
    // Ingest v1
    pub ingest_service: IngestServiceClient,
    // Ingest v2
    pub ingest_router_opt: Option<IngestRouter>,
    pub ingest_router_service: IngestRouterServiceClient,
    ingester_opt: Option<Ingester>,

    pub janitor_service_opt: Option<Mailbox<JanitorService>>,
    pub jaeger_service_opt: Option<JaegerService>,
    pub otlp_logs_service_opt: Option<OtlpGrpcLogsService>,
    pub otlp_traces_service_opt: Option<OtlpGrpcTracesService>,
    /// We do have a search service even on nodes that are not running `search`.
    /// It is only used to serve the rest API calls and will only execute
    /// the root requests.
    pub search_service: Arc<dyn SearchService>,

    pub env_filter_reload_fn: EnvFilterReloadFn,

    /// The control plane listens to various events.
    /// We must maintain a reference to the subscription handles to continue receiving
    /// notifications. Otherwise, the subscriptions are dropped.
    _local_shards_update_listener_handle_opt: Option<ListenerHandle>,
    _report_splits_subscription_handle_opt: Option<EventSubscriptionHandle>,
}

impl QuickwitServices {
    /// Client in the type is a bit misleading here.
    ///
    /// The object returned is the implementation of the local ingester service,
    /// with all of the appropriate tower layers.
    pub fn ingester_service(&self) -> Option<IngesterServiceClient> {
        let ingester = self.ingester_opt.clone()?;
        Some(ingester_service_layer_stack(IngesterServiceClient::tower()).build(ingester))
    }
}

async fn balance_channel_for_service(
    cluster: &Cluster,
    service: QuickwitService,
) -> BalanceChannel<SocketAddr> {
    let cluster_change_stream = cluster.change_stream();
    let service_change_stream = cluster_change_stream.filter_map(move |cluster_change| {
        Box::pin(async move {
            match cluster_change {
                ClusterChange::Add(node) if node.enabled_services().contains(&service) => {
                    let chitchat_id = node.chitchat_id();
                    info!(
                        node_id = chitchat_id.node_id,
                        generation_id = chitchat_id.generation_id,
                        "adding node `{}` to {} pool",
                        chitchat_id.node_id,
                        service.as_str().replace('_', " "),
                    );
                    Some(Change::Insert(node.grpc_advertise_addr(), node.channel()))
                }
                ClusterChange::Remove(node) if node.enabled_services().contains(&service) => {
                    let chitchat_id = node.chitchat_id();
                    info!(
                        node_id = chitchat_id.node_id,
                        generation_id = chitchat_id.generation_id,
                        "removing node `{}` from {} pool",
                        chitchat_id.node_id,
                        service.as_str().replace('_', " "),
                    );
                    Some(Change::Remove(node.grpc_advertise_addr()))
                }
                _ => None,
            }
        })
    });
    BalanceChannel::from_stream(service_change_stream)
}

async fn start_ingest_client_if_needed(
    node_config: &NodeConfig,
    universe: &Universe,
    cluster: &Cluster,
) -> anyhow::Result<IngestServiceClient> {
    if node_config.is_service_enabled(QuickwitService::Indexer) {
        let ingest_api_service = start_ingest_api_service(
            universe,
            &node_config.data_dir_path,
            &node_config.ingest_api_config,
        )
        .await?;
        let num_buckets = NonZeroUsize::new(60).expect("60 should be non-zero");
        let rate_estimator = SmaRateEstimator::new(
            num_buckets,
            Duration::from_secs(10),
            Duration::from_millis(100),
        );
        let memory_capacity = ingest_api_service.ask(GetMemoryCapacity).await?;
        let min_rate = ConstantRate::new(ByteSize::mib(1).as_u64(), Duration::from_millis(100));
        let rate_modulator = RateModulator::new(rate_estimator.clone(), memory_capacity, min_rate);
        let ingest_service = IngestServiceClient::tower()
            .stack_ingest_layer(
                ServiceBuilder::new()
                    .layer(EstimateRateLayer::<IngestRequest, _>::new(rate_estimator))
                    .layer(BufferLayer::new(100))
                    .layer(RateLimitLayer::new(rate_modulator))
                    .into_inner(),
            )
            .build_from_mailbox(ingest_api_service);
        Ok(ingest_service)
    } else {
        let balance_channel = balance_channel_for_service(cluster, QuickwitService::Indexer).await;
        let ingest_service = IngestServiceClient::from_balance_channel(
            balance_channel,
            node_config.grpc_config.max_message_size,
            node_config.ingest_api_config.grpc_compression_encoding(),
        );
        Ok(ingest_service)
    }
}

async fn start_control_plane_if_needed(
    node_config: &NodeConfig,
    cluster: &Cluster,
    event_broker: &EventBroker,
    metastore_client: &MetastoreServiceClient,
    universe: &Universe,
    indexer_pool: &IndexerPool,
    ingester_pool: &IngesterPool,
) -> anyhow::Result<(Option<Mailbox<ControlPlane>>, ControlPlaneServiceClient)> {
    if node_config.is_service_enabled(QuickwitService::ControlPlane) {
        check_cluster_configuration(
            &node_config.enabled_services,
            &node_config.peer_seeds,
            metastore_client.clone(),
        )
        .await?;

        let self_node_id: NodeId = cluster.self_node_id().into();

        let control_plane_mailbox = setup_control_plane(
            universe,
            event_broker,
            self_node_id,
            cluster.clone(),
            indexer_pool.clone(),
            ingester_pool.clone(),
            metastore_client.clone(),
            node_config.default_index_root_uri.clone(),
            &node_config.ingest_api_config,
        )
        .await?;

        let control_plane_server_opt = Some(control_plane_mailbox.clone());
        let control_plane_client = ControlPlaneServiceClient::tower()
            .stack_layer(CP_GRPC_SERVER_METRICS_LAYER.clone())
            .stack_layer(LoadShedLayer::new(100))
            .build_from_mailbox(control_plane_mailbox);
        Ok((control_plane_server_opt, control_plane_client))
    } else {
        let balance_channel =
            balance_channel_for_service(cluster, QuickwitService::ControlPlane).await;

        // If the node is a metastore, we skip this check in order to avoid a deadlock.
        // If the node is a searcher, we skip this check because the searcher does not need to.
        if !node_config.is_service_enabled(QuickwitService::Metastore)
            && node_config.enabled_services != HashSet::from([QuickwitService::Searcher])
        {
            info!("connecting to control plane");

            if !balance_channel
                .wait_for(Duration::from_secs(300), |connections| {
                    !connections.is_empty()
                })
                .await
            {
                bail!("could not find control plane in the cluster");
            }
        }
        let control_plane_server_opt = None;
        let control_plane_client = ControlPlaneServiceClient::tower()
            .stack_layer(CP_GRPC_CLIENT_METRICS_LAYER.clone())
            .build_from_balance_channel(
                balance_channel,
                node_config.grpc_config.max_message_size,
                None,
            );
        Ok((control_plane_server_opt, control_plane_client))
    }
}

fn start_shard_positions_service(
    ingester_opt: Option<Ingester>,
    cluster: Cluster,
    event_broker: EventBroker,
    spawn_ctx: SpawnContext,
) {
    // We spawn a task here, because we need the ingester to be ready before spawning the
    // the `ShardPositionsService`. If we don't, all the events we emit too early will be dismissed.
    tokio::spawn(async move {
        if let Some(ingester) = &ingester_opt
            && wait_for_ingester_status(ingester, IngesterStatus::Ready, Duration::from_secs(300))
                .await
                .is_err()
        {
            warn!("ingester failed to reach ready status");
        }
        ShardPositionsService::spawn(&spawn_ctx, event_broker, cluster);
    });
}

/// Waits for the shutdown signal and notifies all other services when it
/// occurs.
///
/// Usually called when receiving a SIGTERM signal, e.g. k8s trying to
/// decomission a pod.
async fn shutdown_signal_handler(
    shutdown_signal: BoxFutureInfaillible<()>,
    universe: Universe,
    ingester_opt: Option<Ingester>,
    grpc_shutdown_trigger_tx: oneshot::Sender<()>,
    rest_shutdown_trigger_tx: oneshot::Sender<()>,
    cluster: Cluster,
) -> HashMap<String, ActorExitStatus> {
    shutdown_signal.await;
    // We must decommission the ingester first before terminating the indexing pipelines that
    // may consume from it. We also need to keep the gRPC server running while doing so.
    if let Some(ingester) = &ingester_opt
        && let Err(error) = wait_for_ingester_decommission(ingester, Duration::from_secs(300)).await
    {
        error!("failed to decommission ingester gracefully: {:?}", error);
    }
    let actor_exit_statuses = universe.quit().await;

    if grpc_shutdown_trigger_tx.send(()).is_err() {
        debug!("gRPC server shutdown signal receiver was dropped");
    }
    if rest_shutdown_trigger_tx.send(()).is_err() {
        debug!("REST server shutdown signal receiver was dropped");
    }
    if let Err(err) = cluster.initiate_shutdown().await {
        debug!("{err}");
    }
    actor_exit_statuses
}

pub async fn serve_quickwit(
    node_config: NodeConfig,
    runtimes_config: RuntimesConfig,
    metastore_resolver: MetastoreResolver,
    storage_resolver: StorageResolver,
    tcp_listener_resolver: impl TcpListenerResolver,
    shutdown_signal: BoxFutureInfaillible<()>,
    env_filter_reload_fn: EnvFilterReloadFn,
) -> anyhow::Result<HashMap<String, ActorExitStatus>> {
    let cluster = start_cluster_service(&node_config)
        .await
        .context("failed to start cluster service")?;

    let event_broker = EventBroker::default();
    let indexer_pool = IndexerPool::default();
    let ingester_pool = IngesterPool::default();
    let universe = Universe::new();
    let grpc_config = node_config.grpc_config.clone();

    // Instantiate a metastore "server" if the `metastore` role is enabled on the node.
    let metastore_server_opt: Option<MetastoreServiceClient> =
        if node_config.is_service_enabled(QuickwitService::Metastore) {
            let metastore: MetastoreServiceClient = metastore_resolver
                .resolve(&node_config.metastore_uri)
                .await
                .with_context(|| {
                    format!(
                        "failed to resolve metastore uri `{}`",
                        node_config.metastore_uri
                    )
                })?;
            let max_in_flight_requests = if node_config.metastore_uri.protocol().is_database() {
                node_config
                    .metastore_configs
                    .find_postgres()
                    .map(|config| config.max_connections.get() * 2)
                    .unwrap_or_default()
                    .max(100)
            } else {
                100
            };
            // These layers apply to all the RPCs of the metastore.
            let shared_layer = ServiceBuilder::new()
                .layer(METASTORE_GRPC_SERVER_METRICS_LAYER.clone())
                .layer(LoadShedLayer::new(max_in_flight_requests))
                .into_inner();
            let broker_layer = EventListenerLayer::new(event_broker.clone());
            let metastore = MetastoreServiceClient::tower()
                .stack_layer(shared_layer)
                .stack_create_index_layer(broker_layer.clone())
                .stack_delete_index_layer(broker_layer.clone())
                .stack_add_source_layer(broker_layer.clone())
                .stack_delete_source_layer(broker_layer.clone())
                .stack_toggle_source_layer(broker_layer)
                .build(metastore);
            Some(metastore)
        } else {
            None
        };
    // Instantiate a metastore client, either local if available or remote otherwise.
    let metastore_client: MetastoreServiceClient =
        if let Some(metastore_server) = &metastore_server_opt {
            metastore_server.clone()
        } else {
            info!("connecting to metastore");

            let balance_channel =
                balance_channel_for_service(&cluster, QuickwitService::Metastore).await;

            if !balance_channel
                .wait_for(Duration::from_secs(300), |connections| {
                    !connections.is_empty()
                })
                .await
            {
                bail!("could not find any metastore node in the cluster");
            }
            MetastoreServiceClient::tower()
                .stack_layer(RetryLayer::new(RetryPolicy::from(RetryParams::standard())))
                .stack_layer(TimeoutLayer::new(GRPC_METASTORE_SERVICE_TIMEOUT))
                .stack_layer(METASTORE_GRPC_CLIENT_METRICS_LAYER.clone())
                .stack_layer(tower::limit::GlobalConcurrencyLimitLayer::new(
                    get_metastore_client_max_concurrency(),
                ))
                .build_from_balance_channel(balance_channel, grpc_config.max_message_size, None)
        };
    // Instantiate a control plane server if the `control-plane` role is enabled on the node.
    // Otherwise, instantiate a control plane client.
    let (control_plane_server_opt, control_plane_client) = start_control_plane_if_needed(
        &node_config,
        &cluster,
        &event_broker,
        &metastore_client,
        &universe,
        &indexer_pool,
        &ingester_pool,
    )
    .await
    .context("failed to start control plane service")?;

    // Set up the "control plane proxy" for the metastore.
    let metastore_through_control_plane = MetastoreServiceClient::new(ControlPlaneMetastore::new(
        control_plane_client.clone(),
        metastore_client,
    ));

    // Setup ingest service v1.
    let ingest_service = start_ingest_client_if_needed(&node_config, &universe, &cluster)
        .await
        .context("failed to start ingest v1 service")?;

    let indexing_service_opt = if node_config.is_service_enabled(QuickwitService::Indexer) {
        let indexing_service = start_indexing_service(
            &universe,
            &node_config,
            runtimes_config.num_threads_blocking,
            cluster.clone(),
            metastore_through_control_plane.clone(),
            ingester_pool.clone(),
            storage_resolver.clone(),
            event_broker.clone(),
        )
        .await
        .context("failed to start indexing service")?;
        Some(indexing_service)
    } else {
        None
    };

    // Setup the indexer pool to track cluster changes.
    setup_indexer_pool(
        cluster.change_stream(),
        indexing_service_opt.clone(),
        indexer_pool,
        node_config.grpc_config.max_message_size,
    );

    // Setup ingest service v2.
    let (ingest_router, ingest_router_service, ingester_opt) = setup_ingest_v2(
        &node_config,
        &cluster,
        &event_broker,
        control_plane_client.clone(),
        ingester_pool,
    )
    .await
    .context("failed to start ingest v2 service")?;

    if node_config.is_service_enabled(QuickwitService::Indexer)
        || node_config.is_service_enabled(QuickwitService::ControlPlane)
    {
        start_shard_positions_service(
            ingester_opt.clone(),
            cluster.clone(),
            event_broker.clone(),
            universe.spawn_ctx().clone(),
        );
    }

    // Any node can serve index management requests (create/update/delete index, add/remove source,
    // etc.), so we always instantiate an index manager.
    let mut index_manager = IndexManager::new(
        metastore_through_control_plane.clone(),
        storage_resolver.clone(),
    );

    if node_config.is_service_enabled(QuickwitService::Indexer)
        && node_config.indexer_config.enable_otlp_endpoint
    {
        {
            let otel_logs_index_config =
                OtlpGrpcLogsService::index_config(&node_config.default_index_root_uri)
                    .context("failed to load OTEL logs index config")?;
            let otel_traces_index_config =
                OtlpGrpcTracesService::index_config(&node_config.default_index_root_uri)
                    .context("failed to load OTEL traces index config")?;

            for (index_name, index_config) in [
                ("OTEL logs", otel_logs_index_config),
                ("OTEL traces", otel_traces_index_config),
            ] {
                match index_manager.create_index(index_config, false).await {
                    Ok(_)
                    | Err(IndexServiceError::Metastore(MetastoreError::AlreadyExists(
                        EntityKind::Index { .. },
                    ))) => {}
                    Err(error) => bail!("failed to create {index_name} index: {error}",),
                };
            }
        }
    }

    let split_cache_opt: Option<Arc<SplitCache>> =
        if let Some(split_cache_limits) = node_config.searcher_config.split_cache {
            let split_cache = SplitCache::with_root_path(
                node_config.data_dir_path.join("searcher-split-cache"),
                storage_resolver.clone(),
                split_cache_limits,
            )
            .context("failed to load searcher split cache")?;
            Some(split_cache)
        } else {
            None
        };

    // Initialize Lambda invoker if enabled and searcher service is running
    let searcher_context = if node_config.is_service_enabled(QuickwitService::Searcher) {
        if let Some(lambda_config) = &node_config.searcher_config.lambda {
            #[cfg(feature = "lambda")]
            {
                info!("initializing AWS Lambda invoker for search");
                warn!("offloading to lambda is EXPERIMENTAL. Use at your own risk");
                let invoker =
                    quickwit_lambda_client::try_get_or_deploy_invoker(lambda_config).await?;
                Arc::new(SearcherContext::new(
                    node_config.searcher_config.clone(),
                    split_cache_opt,
                    Some(invoker),
                ))
            }
            #[cfg(not(feature = "lambda"))]
            {
                let _ = lambda_config;
                bail!("lambda support is statically disabled, but enabled in configuration");
            }
        } else {
            Arc::new(SearcherContext::new_without_invoker(
                node_config.searcher_config.clone(),
                split_cache_opt,
            ))
        }
    } else {
        Arc::new(SearcherContext::new_without_invoker(
            node_config.searcher_config.clone(),
            split_cache_opt,
        ))
    };

    let (search_job_placer, search_service) = setup_searcher(
        &node_config,
        cluster.change_stream(),
        // search remains available without a control plane because not all
        // metastore RPCs are proxied
        metastore_through_control_plane.clone(),
        storage_resolver.clone(),
        searcher_context,
    )
    .await
    .context("failed to start searcher service")?;

    // The control plane listens for local shards updates to learn about each shard's ingestion
    // throughput. Ingesters (routers) do so to update their shard table.
    let local_shards_update_listener_handle_opt = if node_config
        .is_service_enabled(QuickwitService::ControlPlane)
        || node_config.is_service_enabled(QuickwitService::Indexer)
    {
        Some(setup_local_shards_update_listener(cluster.clone(), event_broker.clone()).await)
    } else {
        None
    };

    let report_splits_subscription_handle_opt =
        // DISCLAIMER: This is quirky here: We base our decision to forward the split report depending
        // on the current searcher configuration.
        if node_config.searcher_config.split_cache.is_some() {
            // The searcher receive hints about new splits to populate their index.
            Some(event_broker.subscribe::<ReportSplitsRequest>(search_job_placer.clone()))
        } else {
            None
        };

    let janitor_service_opt = if node_config.is_service_enabled(QuickwitService::Janitor) {
        let janitor_service = start_janitor_service(
            &universe,
            &node_config,
            metastore_through_control_plane.clone(),
            search_job_placer,
            storage_resolver.clone(),
            event_broker.clone(),
            !get_bool_from_env(DISABLE_DELETE_TASK_SERVICE_ENV_KEY, false),
        )
        .await
        .context("failed to start janitor service")?;
        Some(janitor_service)
    } else {
        None
    };

    let jaeger_service_opt = if node_config.jaeger_config.enable_endpoint
        && node_config.is_service_enabled(QuickwitService::Searcher)
    {
        let search_service = search_service.clone();
        Some(JaegerService::new(
            node_config.jaeger_config.clone(),
            search_service,
        ))
    } else {
        None
    };

    let otlp_logs_service_opt = if node_config.is_service_enabled(QuickwitService::Indexer)
        && node_config.indexer_config.enable_otlp_endpoint
    {
        Some(OtlpGrpcLogsService::new(ingest_router_service.clone()))
    } else {
        None
    };

    let otlp_traces_service_opt = if node_config.is_service_enabled(QuickwitService::Indexer)
        && node_config.indexer_config.enable_otlp_endpoint
    {
        Some(OtlpGrpcTracesService::new(
            ingest_router_service.clone(),
            None,
        ))
    } else {
        None
    };

    let grpc_listen_addr = node_config.grpc_listen_addr;
    let rest_listen_addr = node_config.rest_config.listen_addr;
    let quickwit_services: Arc<QuickwitServices> = Arc::new(QuickwitServices {
        node_config: Arc::new(node_config),
        cluster: cluster.clone(),
        metastore_server_opt,
        metastore_client: metastore_through_control_plane.clone(),
        control_plane_server_opt,
        control_plane_client,
        _local_shards_update_listener_handle_opt: local_shards_update_listener_handle_opt,
        _report_splits_subscription_handle_opt: report_splits_subscription_handle_opt,
        index_manager,
        indexing_service_opt,
        ingest_router_opt: Some(ingest_router),
        ingest_router_service,
        ingest_service,
        ingester_opt: ingester_opt.clone(),
        janitor_service_opt,
        jaeger_service_opt,
        otlp_logs_service_opt,
        otlp_traces_service_opt,
        search_service,
        env_filter_reload_fn,
    });
    // Setup and start gRPC server.
    let (grpc_readiness_trigger_tx, grpc_readiness_signal_rx) = oneshot::channel::<()>();
    let grpc_readiness_trigger = Box::pin(async move {
        if grpc_readiness_trigger_tx.send(()).is_err() {
            debug!("gRPC server readiness signal receiver was dropped");
        }
    });
    let (grpc_shutdown_trigger_tx, grpc_shutdown_signal_rx) = oneshot::channel::<()>();
    let grpc_shutdown_signal = Box::pin(async move {
        if grpc_shutdown_signal_rx.await.is_err() {
            debug!("gRPC server shutdown trigger sender was dropped");
        }
    });
    let (health_reporter, health_service) = tonic_health::server::health_reporter();
    let grpc_server = grpc::start_grpc_server(
        tcp_listener_resolver.resolve(grpc_listen_addr).await?,
        grpc_config,
        quickwit_services.clone(),
        grpc_readiness_trigger,
        grpc_shutdown_signal,
        health_service,
    );
    // Setup and start REST server.
    let (rest_readiness_trigger_tx, rest_readiness_signal_rx) = oneshot::channel::<()>();
    let rest_readiness_trigger = Box::pin(async move {
        if rest_readiness_trigger_tx.send(()).is_err() {
            debug!("REST server readiness signal receiver was dropped");
        }
    });
    let (rest_shutdown_trigger_tx, rest_shutdown_signal_rx) = oneshot::channel::<()>();
    let rest_shutdown_signal = Box::pin(async move {
        if rest_shutdown_signal_rx.await.is_err() {
            debug!("REST server shutdown trigger sender was dropped");
        }
    });

    let rest_server = rest::start_rest_server(
        tcp_listener_resolver.resolve(rest_listen_addr).await?,
        quickwit_services,
        rest_readiness_trigger,
        rest_shutdown_signal,
    );

    // Node readiness indicates that the server is ready to receive requests.
    // Thus readiness task is started once gRPC and REST servers are started.
    spawn_named_task(
        node_readiness_reporting_task(
            cluster.clone(),
            metastore_through_control_plane,
            ingester_opt.clone(),
            grpc_readiness_signal_rx,
            rest_readiness_signal_rx,
            health_reporter,
        ),
        "node_readiness_reporting",
    );

    let shutdown_handle = tokio::spawn(shutdown_signal_handler(
        shutdown_signal,
        universe,
        ingester_opt,
        grpc_shutdown_trigger_tx,
        rest_shutdown_trigger_tx,
        cluster.clone(),
    ));
    let grpc_join_handle = async move {
        spawn_named_task(grpc_server, "grpc_server")
            .await
            .expect("tasks running the gRPC server should not panic or be cancelled")
            .context("gRPC server failed")
    };

    let rest_join_handle = async move {
        spawn_named_task(rest_server, "rest_server")
            .await
            .expect("tasks running the REST server should not panic or be cancelled")
            .context("REST server failed")
    };

    let chitchat_server_handle = cluster.chitchat_server_termination_watcher().await;

    if let Err(err) = tokio::try_join!(grpc_join_handle, rest_join_handle, chitchat_server_handle) {
        error!("server failed: {err:?}");
    }

    let actor_exit_statuses = shutdown_handle
        .await
        .context("failed to gracefully shutdown services")?;
    Ok(actor_exit_statuses)
}

#[derive(Clone, Copy)]
struct PersistCircuitBreakerEvaluator;

impl CircuitBreakerEvaluator for PersistCircuitBreakerEvaluator {
    type Response = PersistResponse;

    type Error = IngestV2Error;

    fn is_circuit_breaker_error(&self, output: &Result<Self::Response, IngestV2Error>) -> bool {
        let Ok(persist_response) = output.as_ref() else {
            return false;
        };
        for persist_failure in &persist_response.failures {
            // This is the error we return when the WAL is full.
            if persist_failure.reason() == PersistFailureReason::WalFull {
                return true;
            }
        }
        false
    }

    fn make_circuit_breaker_output(&self) -> IngestV2Error {
        IngestV2Error::TooManyRequests(RateLimitingCause::CircuitBreaker)
    }
}

/// Stack of layers to use on the server side of the ingester service.
fn ingester_service_layer_stack(
    layer_stack: IngesterServiceTowerLayerStack,
) -> IngesterServiceTowerLayerStack {
    layer_stack
        .stack_layer(INGEST_GRPC_SERVER_METRICS_LAYER.clone())
        .stack_persist_layer(quickwit_common::tower::OneTaskPerCallLayer)
        .stack_persist_layer(
            // "3" may seem a little bit low, but we only consider error caused by a full WAL.
            PersistCircuitBreakerEvaluator.make_layer(
                3,
                Duration::from_millis(500),
                crate::metrics::SERVE_METRICS.circuit_break_total.clone(),
            ),
        )
        .stack_open_replication_stream_layer(quickwit_common::tower::OneTaskPerCallLayer)
        .stack_init_shards_layer(quickwit_common::tower::OneTaskPerCallLayer)
        .stack_retain_shards_layer(quickwit_common::tower::OneTaskPerCallLayer)
        .stack_truncate_shards_layer(quickwit_common::tower::OneTaskPerCallLayer)
        .stack_close_shards_layer(quickwit_common::tower::OneTaskPerCallLayer)
        .stack_decommission_layer(quickwit_common::tower::OneTaskPerCallLayer)
}

async fn setup_ingest_v2(
    node_config: &NodeConfig,
    cluster: &Cluster,
    event_broker: &EventBroker,
    control_plane: ControlPlaneServiceClient,
    ingester_pool: IngesterPool,
) -> anyhow::Result<(IngestRouter, IngestRouterServiceClient, Option<Ingester>)> {
    // Instantiate ingest router.
    let self_node_id: NodeId = cluster.self_node_id().into();
    let grpc_compression_encoding_opt = node_config.ingest_api_config.grpc_compression_encoding();
    let replication_factor = node_config
        .ingest_api_config
        .replication_factor()
        .expect("replication factor should have been validated")
        .get();

    // Any node can serve ingest requests, so we always instantiate an ingest router.
    // TODO: I'm not sure that's such a good idea.
    let ingest_router = IngestRouter::new(
        self_node_id.clone(),
        control_plane.clone(),
        ingester_pool.clone(),
        replication_factor,
        event_broker.clone(),
        node_config.availability_zone.clone(),
    );
    ingest_router.subscribe();
    setup_ingester_capacity_update_listener(cluster.clone(), event_broker.clone())
        .await
        .forever();

    let ingest_router_service = IngestRouterServiceClient::tower()
        .stack_layer(INGEST_GRPC_SERVER_METRICS_LAYER.clone())
        .build(ingest_router.clone());

    let rate_limit =
        ConstantRate::bytes_per_sec(node_config.ingest_api_config.shard_throughput_limit);
    let rate_limiter_settings = RateLimiterSettings {
        burst_limit: node_config.ingest_api_config.shard_burst_limit.as_u64(),
        rate_limit,
        // Refill every 100ms.
        refill_period: Duration::from_millis(100),
    };

    // Instantiate ingester.
    let ingester_opt: Option<Ingester> = if node_config.is_service_enabled(QuickwitService::Indexer)
    {
        let wal_dir_path = node_config.data_dir_path.join("wal");
        fs::create_dir_all(&wal_dir_path)?;

        let idle_shard_timeout = get_idle_shard_timeout();
        let ingester = Ingester::try_new(
            cluster.clone(),
            control_plane,
            ingester_pool.clone(),
            &wal_dir_path,
            node_config.ingest_api_config.max_queue_disk_usage,
            node_config.ingest_api_config.max_queue_memory_usage,
            rate_limiter_settings,
            replication_factor,
            idle_shard_timeout,
        )
        .await?;
        ingester.subscribe(event_broker);
        // We will now receive all new shard positions update events, from chitchat.
        // Unfortunately at this point, chitchat is already running.
        //
        // We need to make sure the existing positions are loaded too.
        Some(ingester)
    } else {
        None
    };
    setup_ingester_pool(
        cluster.change_stream(),
        ingester_opt.clone(),
        ingester_pool,
        grpc_compression_encoding_opt,
        node_config.grpc_config.max_message_size,
    );
    Ok((ingest_router, ingest_router_service, ingester_opt))
}

fn setup_ingester_pool(
    cluster_change_stream: ClusterChangeStream,
    ingester_opt: Option<Ingester>,
    ingester_pool: IngesterPool,
    grpc_compression_encoding_opt: Option<CompressionEncoding>,
    grpc_max_message_size: ByteSize,
) {
    let ingester_change_stream = cluster_change_stream.filter_map(move |cluster_change| {
        let ingester_opt_clone = ingester_opt.clone();
        Box::pin(async move {
            match cluster_change {
                ClusterChange::Add(node) if node.is_indexer() => {
                    let change = build_ingester_insert_change(
                        &node,
                        ingester_opt_clone,
                        grpc_max_message_size,
                        grpc_compression_encoding_opt,
                    );
                    Some(change)
                }
                // only update the ingester pool when the ingester status changes, to avoid
                // unnecessary churn
                ClusterChange::Update { previous, updated }
                    if updated.is_indexer()
                        && previous.ingester_status() != updated.ingester_status() =>
                {
                    let change = build_ingester_insert_change(
                        &updated,
                        ingester_opt_clone,
                        grpc_max_message_size,
                        grpc_compression_encoding_opt,
                    );
                    Some(change)
                }
                ClusterChange::Remove(node) if node.is_indexer() => {
                    let change = build_ingester_remove_change(&node);
                    Some(change)
                }
                _ => None,
            }
        })
    });
    ingester_pool.listen_for_changes(ingester_change_stream);
}

fn build_ingester_insert_change(
    node: &ClusterNode,
    ingester_opt: Option<impl IngesterService>,
    grpc_max_message_size: ByteSize,
    grpc_compression_encoding_opt: Option<CompressionEncoding>,
) -> Change<NodeId, IngesterPoolEntry> {
    let chitchat_id = node.chitchat_id();
    info!(
        node_id = chitchat_id.node_id,
        generation_id = chitchat_id.generation_id,
        "adding/updating node `{}` with ingester status `{}` to ingester pool",
        chitchat_id.node_id,
        node.ingester_status(),
    );
    let node_id: NodeId = node.node_id().into();
    let ingester_service = build_ingester_service(
        node,
        ingester_opt,
        grpc_max_message_size,
        grpc_compression_encoding_opt,
    );
    let pool_entry = IngesterPoolEntry {
        client: ingester_service,
        status: node.ingester_status(),
        availability_zone: node.availability_zone().map(|az| az.to_string()),
    };
    Change::Insert(node_id, pool_entry)
}

fn build_ingester_remove_change(node: &ClusterNode) -> Change<NodeId, IngesterPoolEntry> {
    let chitchat_id = node.chitchat_id();
    info!(
        node_id = chitchat_id.node_id,
        generation_id = chitchat_id.generation_id,
        "removing node `{}` from ingester pool",
        chitchat_id.node_id,
    );
    let node_id: NodeId = node.node_id().into();
    Change::Remove(node_id)
}

fn build_ingester_service(
    node: &ClusterNode,
    ingester_opt: Option<impl IngesterService>,
    max_message_size: ByteSize,
    grpc_compression_encoding_opt: Option<CompressionEncoding>,
) -> IngesterServiceClient {
    if node.is_self_node() {
        // Here, since the service is available locally, we bypass the network stack
        // and use the instance directly. However, we still want client-side
        // metrics, so we use both metrics layers.
        let ingester = ingester_opt.expect("ingester service should be initialized");
        let service = ingester_service_layer_stack(
            IngesterServiceClient::tower().stack_layer(INGEST_GRPC_CLIENT_METRICS_LAYER.clone()),
        )
        .build(ingester);
        return service;
    }
    IngesterServiceClient::tower()
        .stack_layer(INGEST_GRPC_CLIENT_METRICS_LAYER.clone())
        .stack_layer(TimeoutLayer::new(GRPC_INGESTER_SERVICE_TIMEOUT))
        .build_from_channel(
            node.grpc_advertise_addr(),
            node.channel(),
            max_message_size,
            grpc_compression_encoding_opt,
        )
}

async fn setup_searcher(
    node_config: &NodeConfig,
    cluster_change_stream: ClusterChangeStream,
    metastore: MetastoreServiceClient,
    storage_resolver: StorageResolver,
    searcher_context: Arc<SearcherContext>,
) -> anyhow::Result<(SearchJobPlacer, Arc<dyn SearchService>)> {
    let searcher_pool = SearcherPool::default();
    let search_job_placer = SearchJobPlacer::new(searcher_pool.clone());

    let search_service = start_searcher_service(
        metastore,
        storage_resolver,
        search_job_placer.clone(),
        searcher_context,
    )
    .await?;
    let search_service_clone = search_service.clone();
    let max_message_size = node_config.grpc_config.max_message_size;
    let request_timeout = node_config.searcher_config.request_timeout();
    let searcher_change_stream = cluster_change_stream.filter_map(move |cluster_change| {
        let search_service_clone = search_service_clone.clone();
        Box::pin(async move {
            match cluster_change {
                ClusterChange::Add(node) if node.is_searcher() => {
                    let chitchat_id = node.chitchat_id();
                    info!(
                        node_id = chitchat_id.node_id,
                        generation_id = chitchat_id.generation_id,
                        "adding node `{}` to searcher pool",
                        chitchat_id.node_id,
                    );
                    let grpc_addr = node.grpc_advertise_addr();

                    if node.is_self_node() {
                        let search_client =
                            SearchServiceClient::from_service(search_service_clone, grpc_addr);
                        Some(Change::Insert(grpc_addr, search_client))
                    } else {
                        let timeout_channel = Timeout::new(node.channel(), request_timeout);
                        let search_client = create_search_client_from_channel(
                            grpc_addr,
                            timeout_channel,
                            max_message_size,
                        );
                        Some(Change::Insert(grpc_addr, search_client))
                    }
                }
                ClusterChange::Remove(node) if node.is_searcher() => {
                    let chitchat_id = node.chitchat_id();
                    info!(
                        node_id = chitchat_id.node_id,
                        generation_id = chitchat_id.generation_id,
                        "removing node `{}` from searcher pool",
                        chitchat_id.node_id,
                    );
                    Some(Change::Remove(node.grpc_advertise_addr()))
                }
                _ => None,
            }
        })
    });
    searcher_pool.listen_for_changes(searcher_change_stream);
    Ok((search_job_placer, search_service))
}

#[allow(clippy::too_many_arguments)]
async fn setup_control_plane(
    universe: &Universe,
    event_broker: &EventBroker,
    self_node_id: NodeId,
    cluster: Cluster,
    indexer_pool: IndexerPool,
    ingester_pool: IngesterPool,
    metastore: MetastoreServiceClient,
    default_index_root_uri: Uri,
    ingest_api_config: &IngestApiConfig,
) -> anyhow::Result<Mailbox<ControlPlane>> {
    let cluster_id = cluster.cluster_id().to_string();
    let replication_factor = ingest_api_config
        .replication_factor()
        .expect("replication factor should have been validated")
        .get();
    let cluster_config = ClusterConfig {
        cluster_id,
        auto_create_indexes: true,
        default_index_root_uri,
        replication_factor,
        shard_throughput_limit: ingest_api_config.shard_throughput_limit,
        shard_scale_up_factor: ingest_api_config.shard_scale_up_factor,
    };
    let (control_plane_mailbox, _control_plane_handle, mut readiness_rx) = ControlPlane::spawn(
        universe,
        cluster_config,
        self_node_id,
        cluster.clone(),
        indexer_pool,
        ingester_pool,
        metastore,
    );
    let subscriber = ControlPlaneEventSubscriber::new(control_plane_mailbox.downgrade());
    event_broker
        .subscribe_without_timeout::<LocalShardsUpdate>(subscriber.clone())
        .forever();
    event_broker
        .subscribe_without_timeout::<ShardPositionsUpdate>(subscriber)
        .forever();

    tokio::time::timeout(
        Duration::from_secs(300),
        readiness_rx.wait_for(|readiness| *readiness),
    )
    .await
    .context("control plane initialization timed out")?
    .context("control plane was killled or quit")?;

    info!("control plane is ready");
    Ok(control_plane_mailbox)
}

fn setup_indexer_pool(
    cluster_change_stream: ClusterChangeStream,
    indexing_service_opt: Option<Mailbox<IndexingService>>,
    indexer_pool: IndexerPool,
    grpc_max_message_size: ByteSize,
) {
    let indexer_change_stream = cluster_change_stream.filter_map(move |cluster_change| {
        let indexing_service_clone_opt = indexing_service_opt.clone();
        Box::pin(async move {
            match cluster_change {
                ClusterChange::Add(node) if node.is_indexer() => {
                    let change = build_indexer_insert_change(
                        &node,
                        indexing_service_clone_opt,
                        grpc_max_message_size,
                    );
                    Some(change)
                }
                ClusterChange::Remove(node) if node.is_indexer() => {
                    let change = build_indexer_remove_change(&node);
                    Some(change)
                }
                _ => None,
            }
        })
    });
    indexer_pool.listen_for_changes(indexer_change_stream);
}

fn build_indexer_insert_change(
    node: &ClusterNode,
    indexing_service_opt: Option<Mailbox<IndexingService>>,
    grpc_max_message_size: ByteSize,
) -> Change<NodeId, IndexerNodeInfo> {
    let chitchat_id = node.chitchat_id();
    info!(
        node_id = chitchat_id.node_id,
        generation_id = chitchat_id.generation_id,
        "adding node `{}` with ingester status `{}` to indexer pool",
        chitchat_id.node_id,
        node.ingester_status()
    );
    let node_id: NodeId = node.node_id().into();
    let client = build_indexing_service(node, indexing_service_opt, grpc_max_message_size);
    Change::Insert(
        node_id.clone(),
        IndexerNodeInfo {
            node_id,
            generation_id: chitchat_id.generation_id,
            client,
            indexing_tasks: node.indexing_tasks().to_vec(),
            indexing_capacity: node.indexing_capacity(),
        },
    )
}

fn build_indexer_remove_change(node: &ClusterNode) -> Change<NodeId, IndexerNodeInfo> {
    let chitchat_id = node.chitchat_id();
    info!(
        node_id = chitchat_id.node_id,
        generation_id = chitchat_id.generation_id,
        "removing node `{}` from indexer pool",
        chitchat_id.node_id,
    );
    let node_id: NodeId = node.node_id().into();
    Change::Remove(node_id)
}

fn build_indexing_service(
    node: &ClusterNode,
    indexing_service_opt: Option<Mailbox<IndexingService>>,
    max_message_size: ByteSize,
) -> IndexingServiceClient {
    if node.is_self_node() {
        // Here, since the service is available locally, we bypass the network stack
        // and use the mailbox directly. However, we still want client-side metrics,
        // so we use both metrics layers.
        let indexing_service_mailbox =
            indexing_service_opt.expect("indexing service should be initialized");
        let shared_layers = ServiceBuilder::new()
            .layer(INDEXING_GRPC_CLIENT_METRICS_LAYER.clone())
            .layer(INDEXING_GRPC_SERVER_METRICS_LAYER.clone())
            .into_inner();
        return IndexingServiceClient::tower()
            .stack_layer(shared_layers)
            .build_from_mailbox(indexing_service_mailbox);
    }
    IndexingServiceClient::tower()
        .stack_layer(INDEXING_GRPC_CLIENT_METRICS_LAYER.clone())
        .stack_layer(TimeoutLayer::new(GRPC_INDEXING_SERVICE_TIMEOUT))
        .build_from_channel(
            node.grpc_advertise_addr(),
            node.channel(),
            max_message_size,
            None,
        )
}

fn require<T: Clone + Send>(
    val_opt: Option<T>,
) -> impl Filter<Extract = (T,), Error = Rejection> + Clone {
    warp::any().and_then(move || {
        let val_opt_clone = val_opt.clone();
        async move {
            if let Some(val) = val_opt_clone {
                Ok(val)
            } else {
                Err(warp::reject())
            }
        }
    })
}

fn with_arg<T: Clone + Send>(arg: T) -> impl Filter<Extract = (T,), Error = Infallible> + Clone {
    warp::any().map(move || arg.clone())
}

/// Reports node readiness to chitchat cluster every 10 seconds (25 ms for tests).
async fn node_readiness_reporting_task(
    cluster: Cluster,
    metastore: MetastoreServiceClient,
    ingester_opt: Option<impl IngesterService>,
    grpc_readiness_signal_rx: oneshot::Receiver<()>,
    rest_readiness_signal_rx: oneshot::Receiver<()>,
    health_reporter: HealthReporter,
) {
    let mut node_ready = false;
    cluster.set_self_node_readiness(node_ready).await;
    // Set the initial health status to `NotServing` with "" meaning all services, as per
    // https://github.com/grpc/grpc/blob/master/doc/health-checking.md
    health_reporter
        .set_service_status("", ServingStatus::NotServing)
        .await;

    if grpc_readiness_signal_rx.await.is_err() {
        // the gRPC server failed.
        return;
    };
    info!("gRPC server is ready");

    if rest_readiness_signal_rx.await.is_err() {
        // the REST server failed.
        return;
    };
    info!("REST server is ready");

    let mut interval = tokio::time::interval(READINESS_REPORTING_INTERVAL);

    loop {
        interval.tick().await;

        let metastore_is_available = match metastore.check_connectivity().await {
            Ok(()) => {
                debug!(metastore_endpoints=?metastore.endpoints(), "metastore service is available");
                true
            }
            Err(error) => {
                warn!(metastore_endpoints=?metastore.endpoints(), error=?error, "metastore service is unavailable");
                false
            }
        };
        let ingester_is_available = if let Some(ingester) = &ingester_opt {
            match try_get_ingester_status(ingester).await {
                Ok(status) => {
                    status == IngesterStatus::Initializing || status != IngesterStatus::Failed
                }
                Err(error) => {
                    // If we couldn't get the ingester status, it's not looking good, so we set the
                    // node to not ready.
                    error!(%error, "failed to get ingester status");
                    false
                }
            }
        } else {
            true
        };
        let new_node_ready = metastore_is_available && ingester_is_available;

        if new_node_ready != node_ready {
            node_ready = new_node_ready;
            cluster.set_self_node_readiness(node_ready).await;

            let serving_status = if node_ready {
                ServingStatus::Serving
            } else {
                ServingStatus::NotServing
            };
            health_reporter.set_service_status("", serving_status).await;
        }
    }
}

/// Displays some warnings if the cluster runs a file-backed metastore or serves file-backed
/// indexes.
async fn check_cluster_configuration(
    services: &HashSet<QuickwitService>,
    peer_seeds: &[String],
    metastore: MetastoreServiceClient,
) -> anyhow::Result<()> {
    if !services.contains(&QuickwitService::Metastore) || peer_seeds.is_empty() {
        return Ok(());
    }
    if metastore
        .endpoints()
        .iter()
        .any(|uri| !uri.protocol().is_database())
    {
        warn!(
            metastore_endpoints=?metastore.endpoints(),
            "Using a file-backed metastore in cluster mode is not recommended for production use.
            Running multiple file-backed metastores simultaneously can lead to data loss.");
    }
    let file_backed_indexes = metastore
        .list_indexes_metadata(ListIndexesMetadataRequest::all())
        .await?
        .deserialize_indexes_metadata()
        .await?
        .into_iter()
        .filter(|index_metadata| index_metadata.index_uri().protocol().is_file_storage())
        .collect::<Vec<_>>();
    if !file_backed_indexes.is_empty() {
        let index_ids = file_backed_indexes
            .iter()
            .map(|index_metadata| index_metadata.index_id())
            .join(", ");
        let index_uris = file_backed_indexes
            .iter()
            .map(|index_metadata| index_metadata.index_uri())
            .join(", ");
        warn!(
            index_ids=%index_ids,
            index_uris=%index_uris,
            "Found some file-backed indexes in the metastore. Some nodes in the cluster may not have access to all index files."
        );
    }
    Ok(())
}

#[cfg(test)]
mod tests {
    use quickwit_cluster::{ChannelTransport, ClusterNode, create_cluster_for_test};
    use quickwit_common::uri::Uri;
    use quickwit_common::{ServiceStream, assert_eventually};
    use quickwit_config::SearcherConfig;
    use quickwit_metastore::{IndexMetadata, metastore_for_test};
    use quickwit_proto::ingest::ingester::{MockIngesterService, ObservationMessage};
    use quickwit_proto::metastore::{ListIndexesMetadataResponse, MockMetastoreService};
    use quickwit_search::Job;
    use tokio::sync::watch;
    use tonic::transport::{Channel, Server};
    use tonic_health::pb::HealthCheckRequest;
    use tonic_health::pb::health_client::HealthClient;
    use tonic_health::server::health_reporter;

    use super::*;

    #[tokio::test]
    async fn test_check_cluster_configuration() {
        let services = HashSet::from_iter([QuickwitService::Metastore]);
        let peer_seeds = ["192.168.0.12:7280".to_string()];
        let mut mock_metastore = MockMetastoreService::new();

        mock_metastore
            .expect_endpoints()
            .return_const(vec![Uri::for_test("file:///qwdata/indexes")]);
        mock_metastore
            .expect_list_indexes_metadata()
            .return_once(|_| {
                Ok(ListIndexesMetadataResponse::for_test(vec![
                    IndexMetadata::for_test("test-index", "file:///qwdata/indexes/test-index"),
                ]))
            });

        check_cluster_configuration(
            &services,
            &peer_seeds,
            MetastoreServiceClient::from_mock(mock_metastore),
        )
        .await
        .unwrap();
    }

    #[tokio::test]
    async fn test_readiness_updates() {
        let transport = ChannelTransport::default();
        let cluster = create_cluster_for_test(Vec::new(), &[], &transport, false)
            .await
            .unwrap();
        let (metastore_readiness_tx, metastore_readiness_rx) = watch::channel(false);
        let mut mock_metastore = MockMetastoreService::new();
        mock_metastore
            .expect_check_connectivity()
            .returning(move || {
                if *metastore_readiness_rx.borrow() {
                    Ok(())
                } else {
                    Err(anyhow::anyhow!("Metastore not ready"))
                }
            });
        let (ingester_status_tx, ingester_status_rx) = watch::channel(IngesterStatus::Initializing);
        let mut mock_ingester = MockIngesterService::new();
        mock_ingester
            .expect_open_observation_stream()
            .returning(move |_| {
                let status_stream = ServiceStream::from(ingester_status_rx.clone());
                let observation_stream = status_stream.map(|status| {
                    let message = ObservationMessage {
                        node_id: "test-node".to_string(),
                        status: status as i32,
                    };
                    Ok(message)
                });
                Ok(observation_stream)
            });
        let (grpc_readiness_trigger_tx, grpc_readiness_signal_rx) = oneshot::channel();
        let (rest_readiness_trigger_tx, rest_readiness_signal_rx) = oneshot::channel();

        let (health_reporter, health_service) = health_reporter();
        let (client, server) = tokio::io::duplex(1024);
        tokio::spawn(async move {
            Server::builder()
                .add_service(health_service)
                .serve_with_incoming(tokio_stream::once(Ok::<_, std::io::Error>(server)))
                .await
                .unwrap();
        });
        let mut client_opt = Some(client);
        let connector = tower::service_fn(move |_: http::Uri| {
            let client = client_opt.take().unwrap();
            async move { Ok::<_, Infallible>(hyper_util::rt::TokioIo::new(client)) }
        });
        let channel = Channel::builder("http://[::]:50051".parse().unwrap())
            .connect_with_connector(connector)
            .await
            .unwrap();

        let mut health_client = HealthClient::new(channel);

        tokio::spawn(node_readiness_reporting_task(
            cluster.clone(),
            MetastoreServiceClient::from_mock(mock_metastore),
            Some(mock_ingester),
            grpc_readiness_signal_rx,
            rest_readiness_signal_rx,
            health_reporter,
        ));
        assert!(!cluster.is_self_node_ready().await);

        let request = tonic::Request::new(HealthCheckRequest::default());
        let response = health_client.check(request).await.unwrap().into_inner();
        assert_eq!(response.status(), ServingStatus::NotServing.into());

        grpc_readiness_trigger_tx.send(()).unwrap();
        rest_readiness_trigger_tx.send(()).unwrap();
        assert!(!cluster.is_self_node_ready().await);

        metastore_readiness_tx.send(true).unwrap();
        ingester_status_tx.send(IngesterStatus::Ready).unwrap();
        assert_eventually!(cluster.is_self_node_ready().await);

        let request = tonic::Request::new(HealthCheckRequest::default());
        let response = health_client.check(request).await.unwrap().into_inner();
        assert_eq!(response.status(), ServingStatus::Serving.into());

        metastore_readiness_tx.send(false).unwrap();
        assert_eventually!(!cluster.is_self_node_ready().await);

        let request = tonic::Request::new(HealthCheckRequest::default());
        let response = health_client.check(request).await.unwrap().into_inner();
        assert_eq!(response.status(), ServingStatus::NotServing.into());
    }

    #[tokio::test]
    async fn test_setup_indexer_pool() {
        let universe = Universe::with_accelerated_time();
        let (indexing_service_mailbox, _indexing_service_inbox) =
            universe.create_test_mailbox::<IndexingService>();
        let node_config = NodeConfig::for_test();

        let (cluster_change_stream, cluster_change_stream_tx) =
            ClusterChangeStream::new_unbounded();
        let indexer_pool = IndexerPool::default();
        setup_indexer_pool(
            cluster_change_stream,
            Some(indexing_service_mailbox),
            indexer_pool.clone(),
            node_config.grpc_config.max_message_size,
        );

        // adding a indexer node refreshes the indexer pool
        let new_indexer_node = ClusterNode::for_test(
            "test-indexer-node",
            1,
            true,
            &["indexer"],
            &[],
            IngesterStatus::Ready,
        )
        .await;
        cluster_change_stream_tx
            .send(ClusterChange::Add(new_indexer_node.clone()))
            .unwrap();
        tokio::time::sleep(Duration::from_millis(1)).await;

        assert_eq!(indexer_pool.len(), 1);

        // removing an indexer node refreshes the indexer pool
        cluster_change_stream_tx
            .send(ClusterChange::Remove(new_indexer_node))
            .unwrap();
        tokio::time::sleep(Duration::from_millis(1)).await;

        assert!(indexer_pool.is_empty());
    }

    #[tokio::test]
    async fn test_setup_searcher() {
        let node_config = NodeConfig::for_test();
        let searcher_context = Arc::new(SearcherContext::new_without_invoker(
            SearcherConfig::default(),
            None,
        ));
        let metastore = metastore_for_test();
        let (change_stream, change_stream_tx) = ClusterChangeStream::new_unbounded();
        let storage_resolver = StorageResolver::unconfigured();
        let (search_job_placer, _searcher_service) = setup_searcher(
            &node_config,
            change_stream,
            metastore,
            storage_resolver,
            searcher_context,
        )
        .await
        .unwrap();

        struct DummyJob(String);

        impl Job for DummyJob {
            fn split_id(&self) -> &str {
                &self.0
            }

            fn cost(&self) -> usize {
                1
            }
        }
        search_job_placer
            .assign_job(DummyJob("job-1".to_string()), &HashSet::new())
            .await
            .unwrap_err();

        let self_node = ClusterNode::for_test(
            "node-1",
            1337,
            true,
            &["searcher"],
            &[],
            IngesterStatus::Ready,
        )
        .await;
        change_stream_tx
            .send(ClusterChange::Add(self_node.clone()))
            .unwrap();
        tokio::time::sleep(Duration::from_millis(1)).await;

        let searcher_client = search_job_placer
            .assign_job(DummyJob("job-1".to_string()), &HashSet::new())
            .await
            .unwrap();
        assert!(searcher_client.is_local());

        change_stream_tx
            .send(ClusterChange::Remove(self_node))
            .unwrap();

        let node = ClusterNode::for_test(
            "node-1",
            1337,
            false,
            &["searcher"],
            &[],
            IngesterStatus::Ready,
        )
        .await;
        change_stream_tx.send(ClusterChange::Add(node)).unwrap();
        tokio::time::sleep(Duration::from_millis(1)).await;

        let searcher_client = search_job_placer
            .assign_job(DummyJob("job-1".to_string()), &HashSet::new())
            .await
            .unwrap();
        assert!(!searcher_client.is_local());
    }

    #[tokio::test]
    async fn test_setup_ingester_pool() {
        let (cluster_change_stream, cluster_change_stream_tx) =
            ClusterChangeStream::new_unbounded();
        let ingester_pool = IngesterPool::default();
        setup_ingester_pool(
            cluster_change_stream,
            None::<Ingester>,
            ingester_pool.clone(),
            None,
            ByteSize::mib(20),
        );

        // Add an indexer node with IngesterStatus::Initializing.
        let new_node = ClusterNode::for_test(
            "test-ingester-node",
            1,
            false,
            &["indexer"],
            &[],
            IngesterStatus::Initializing,
        )
        .await;
        cluster_change_stream_tx
            .send(ClusterChange::Add(new_node.clone()))
            .unwrap();
        tokio::time::sleep(Duration::from_millis(1)).await;

        assert_eq!(ingester_pool.len(), 1);
        let pool_entry = ingester_pool
            .get(&NodeId::from("test-ingester-node"))
            .unwrap();
        assert_eq!(pool_entry.status, IngesterStatus::Initializing);

        // Update the node: ingester status transitions from Initializing to Ready.
        let updated_node = ClusterNode::for_test(
            "test-ingester-node",
            1,
            false,
            &["indexer"],
            &[],
            IngesterStatus::Ready,
        )
        .await;
        cluster_change_stream_tx
            .send(ClusterChange::Update {
                previous: new_node.clone(),
                updated: updated_node.clone(),
            })
            .unwrap();
        tokio::time::sleep(Duration::from_millis(1)).await;

        assert_eq!(ingester_pool.len(), 1);
        let pool_entry = ingester_pool
            .get(&NodeId::from("test-ingester-node"))
            .unwrap();
        assert_eq!(pool_entry.status, IngesterStatus::Ready);

        // Update the node: ingester status transitions from Ready to Decommissioning.
        let updated_node_2 = ClusterNode::for_test(
            "test-ingester-node",
            1,
            false,
            &["indexer"],
            &[],
            IngesterStatus::Decommissioning,
        )
        .await;
        cluster_change_stream_tx
            .send(ClusterChange::Update {
                previous: updated_node.clone(),
                updated: updated_node_2.clone(),
            })
            .unwrap();
        tokio::time::sleep(Duration::from_millis(1)).await;

        // The node should still be in the pool with updated status.
        assert_eq!(ingester_pool.len(), 1);
        let pool_entry = ingester_pool
            .get(&NodeId::from("test-ingester-node"))
            .unwrap();
        assert_eq!(pool_entry.status, IngesterStatus::Decommissioning);

        // Remove the node.
        cluster_change_stream_tx
            .send(ClusterChange::Remove(updated_node))
            .unwrap();
        tokio::time::sleep(Duration::from_millis(1)).await;

        assert!(ingester_pool.is_empty());
    }
}


================================================
FILE: quickwit/quickwit-serve/src/load_shield.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::time::Duration;

use quickwit_common::metrics::{GaugeGuard, IntGauge};
use tokio::sync::{Semaphore, SemaphorePermit};

use crate::rest::TooManyRequests;

pub struct LoadShield {
    in_flight_semaphore_opt: Option<Semaphore>, // This one is doing the load shedding.
    concurrency_semaphore_opt: Option<Semaphore>,
    ongoing_gauge: IntGauge,
    pending_gauge: IntGauge,
}

pub struct LoadShieldPermit {
    _concurrency_permit_opt: Option<SemaphorePermit<'static>>,
    _in_flight_permit_opt: Option<SemaphorePermit<'static>>,
    _ongoing_gauge_guard: GaugeGuard<'static>,
}

impl LoadShield {
    pub fn new(endpoint_group: &'static str) -> LoadShield {
        let endpoint_group_uppercase = endpoint_group.to_ascii_uppercase();
        let max_in_flight_env_key = format!("QW_{endpoint_group_uppercase}_MAX_IN_FLIGHT");
        let max_concurrency_env_key = format!("QW_{endpoint_group_uppercase}_MAX_CONCURRENCY");
        let max_in_flight_opt: Option<usize> =
            quickwit_common::get_from_env_opt(&max_in_flight_env_key, false);
        let max_concurrency_opt: Option<usize> =
            quickwit_common::get_from_env_opt(&max_concurrency_env_key, false);
        let in_flight_semaphore_opt = max_in_flight_opt.map(Semaphore::new);
        let concurrency_semaphore_opt = max_concurrency_opt.map(Semaphore::new);
        let pending_gauge = crate::metrics::SERVE_METRICS
            .pending_requests
            .with_label_values([endpoint_group]);
        let ongoing_gauge = crate::metrics::SERVE_METRICS
            .ongoing_requests
            .with_label_values([endpoint_group]);
        LoadShield {
            in_flight_semaphore_opt,
            concurrency_semaphore_opt,
            ongoing_gauge,
            pending_gauge,
        }
    }

    async fn acquire_in_flight_permit(
        &'static self,
    ) -> Result<Option<SemaphorePermit<'static>>, warp::Rejection> {
        let Some(in_flight_semaphore) = &self.in_flight_semaphore_opt else {
            return Ok(None);
        };
        let Ok(in_flight_permit) = in_flight_semaphore.try_acquire() else {
            // Wait a little to deal before load shedding. The point is to lower the load associated
            // with super aggressive clients.
            tokio::time::sleep(Duration::from_millis(100)).await;
            return Err(warp::reject::custom(TooManyRequests));
        };
        Ok(Some(in_flight_permit))
    }

    async fn acquire_concurrency_permit(&'static self) -> Option<SemaphorePermit<'static>> {
        let concurrency_semaphore = self.concurrency_semaphore_opt.as_ref()?;
        Some(concurrency_semaphore.acquire().await.unwrap())
    }

    pub async fn acquire_permit(&'static self) -> Result<LoadShieldPermit, warp::Rejection> {
        let mut pending_gauge_guard = GaugeGuard::from_gauge(&self.pending_gauge);
        pending_gauge_guard.add(1);
        let in_flight_permit_opt = self.acquire_in_flight_permit().await?;
        let concurrency_permit_opt = self.acquire_concurrency_permit().await;
        drop(pending_gauge_guard);
        let mut ongoing_gauge_guard = GaugeGuard::from_gauge(&self.ongoing_gauge);
        ongoing_gauge_guard.add(1);
        Ok(LoadShieldPermit {
            _in_flight_permit_opt: in_flight_permit_opt,
            _concurrency_permit_opt: concurrency_permit_opt,
            _ongoing_gauge_guard: ongoing_gauge_guard,
        })
    }
}


================================================
FILE: quickwit/quickwit-serve/src/metrics.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use once_cell::sync::Lazy;
use quickwit_common::metrics::{
    HistogramVec, IntCounter, IntCounterVec, IntGaugeVec, new_counter, new_counter_vec,
    new_gauge_vec, new_histogram_vec,
};

pub struct ServeMetrics {
    pub http_requests_total: IntCounterVec<2>,
    pub request_duration_secs: HistogramVec<2>,
    pub ongoing_requests: IntGaugeVec<1>,
    pub pending_requests: IntGaugeVec<1>,
    pub circuit_break_total: IntCounter,
}

impl Default for ServeMetrics {
    fn default() -> Self {
        let circuit_break_total = new_counter(
            "circuit_break_total",
            "Circuit breaker counter",
            "grpc",
            &[],
        );
        ServeMetrics {
            http_requests_total: new_counter_vec(
                "http_requests_total",
                "Total number of HTTP requests processed.",
                "",
                &[],
                ["method", "status_code"],
            ),
            request_duration_secs: new_histogram_vec(
                "request_duration_secs",
                "Response time in seconds",
                "",
                &[],
                ["method", "status_code"],
                // last bucket is 163.84s
                quickwit_common::metrics::exponential_buckets(0.02, 2.0, 14).unwrap(),
            ),
            ongoing_requests: new_gauge_vec(
                "ongoing_requests",
                "Number of ongoing requests.",
                "",
                &[],
                ["endpoint_group"],
            ),
            pending_requests: new_gauge_vec(
                "pending_requests",
                "Number of pending requests.",
                "",
                &[],
                ["endpoint_group"],
            ),
            circuit_break_total,
        }
    }
}

/// Serve counters exposes a bunch a set of metrics about the request received to quickwit.
pub static SERVE_METRICS: Lazy<ServeMetrics> = Lazy::new(ServeMetrics::default);


================================================
FILE: quickwit/quickwit-serve/src/metrics_api.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use tracing::error;
use warp::hyper::StatusCode;
use warp::reply::with_status;

#[derive(utoipa::OpenApi)]
#[openapi(paths(metrics_handler))]
/// Endpoints which are weirdly tied to another crate with no
/// other bits of information attached.
///
/// If a crate plans to encompass different schemas, handlers, etc...
/// Then it should have its own specific API group.
pub struct MetricsApi;

#[utoipa::path(
    get,
    tag = "Get Metrics",
    path = "/",
    responses(
        (status = 200, description = "Successfully fetched metrics.", body = String),
        (status = 500, description = "Metrics not available.", body = String),
    ),
)]
/// Get Node Metrics
///
/// These are in the form of prometheus metrics.
pub fn metrics_handler() -> impl warp::Reply {
    match quickwit_common::metrics::metrics_text_payload() {
        Ok(metrics) => with_status(metrics, StatusCode::OK),
        Err(e) => {
            error!("failed to encode prometheus metrics: {e}");
            with_status(String::new(), StatusCode::INTERNAL_SERVER_ERROR)
        }
    }
}


================================================
FILE: quickwit/quickwit-serve/src/node_info_handler.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::sync::Arc;

use quickwit_config::NodeConfig;
use serde_json::json;
use warp::{Filter, Rejection};

use crate::rest::recover_fn;
use crate::{BuildInfo, RuntimeInfo, with_arg};

#[derive(utoipa::OpenApi)]
#[openapi(paths(node_version_handler, node_config_handler,))]
pub struct NodeInfoApi;

pub fn node_info_handler(
    build_info: &'static BuildInfo,
    runtime_info: &'static RuntimeInfo,
    config: Arc<NodeConfig>,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    node_version_handler(build_info, runtime_info)
        .or(node_config_handler(config))
        .recover(recover_fn)
        .boxed()
}

#[utoipa::path(get, tag = "Node Info", path = "/version")]
fn node_version_handler(
    build_info: &'static BuildInfo,
    runtime_info: &'static RuntimeInfo,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    warp::path("version")
        .and(warp::path::end())
        .and(with_arg(build_info))
        .and(with_arg(runtime_info))
        .then(get_version)
}

async fn get_version(
    build_info: &'static BuildInfo,
    runtime_info: &'static RuntimeInfo,
) -> impl warp::Reply {
    warp::reply::json(&json!({
        "build": build_info,
        "runtime": runtime_info,
    }))
}

#[utoipa::path(get, tag = "Node Info", path = "/config")]
fn node_config_handler(
    config: Arc<NodeConfig>,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    warp::path("config")
        .and(warp::path::end())
        .and(with_arg(config))
        .then(get_config)
}

async fn get_config(config: Arc<NodeConfig>) -> impl warp::Reply {
    // We must redact sensitive information such as credentials.
    let mut config = (*config).clone();
    config.redact();
    warp::reply::json(&config)
}

#[cfg(test)]
mod tests {
    use assert_json_diff::assert_json_include;
    use quickwit_common::uri::Uri;
    use serde_json::Value as JsonValue;

    use super::*;
    use crate::recover_fn;

    #[tokio::test]
    async fn test_rest_node_info() {
        let build_info = BuildInfo::get();
        let runtime_info = RuntimeInfo::get();
        let mut config = NodeConfig::for_test();
        config.metastore_uri = Uri::for_test("postgresql://username:password@db");
        let handler = node_info_handler(build_info, runtime_info, Arc::new(config.clone()))
            .recover(recover_fn);
        let resp = warp::test::request().path("/version").reply(&handler).await;
        assert_eq!(resp.status(), 200);
        let info_json: JsonValue = serde_json::from_slice(resp.body()).unwrap();
        let build_info_json = info_json.get("build").unwrap();
        let expected_build_info_json = serde_json::json!({
            "commit_date": build_info.commit_date,
            "version": build_info.version,
        });
        assert_json_include!(actual: build_info_json, expected: expected_build_info_json);

        let runtime_info_json = info_json.get("runtime").unwrap();
        let expected_runtime_info_json = serde_json::json!({
            "num_cpus": runtime_info.num_cpus,
        });
        assert_json_include!(
            actual: runtime_info_json,
            expected: expected_runtime_info_json
        );

        let resp = warp::test::request().path("/config").reply(&handler).await;
        assert_eq!(resp.status(), 200);
        let resp_json: JsonValue = serde_json::from_slice(resp.body()).unwrap();
        let expected_response_json = serde_json::json!({
            "node_id": config.node_id,
            "metastore_uri": "postgresql://username:***redacted***@db",
        });
        assert_json_include!(actual: resp_json, expected: expected_response_json);
    }
}


================================================
FILE: quickwit/quickwit-serve/src/openapi.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::mem;

use quickwit_config::ConfigApiSchemas;
use quickwit_doc_mapper::DocMapperApiSchemas;
use quickwit_indexing::IndexingApiSchemas;
use quickwit_janitor::JanitorApiSchemas;
use quickwit_metastore::MetastoreApiSchemas;
use utoipa::OpenApi;
use utoipa::openapi::Tag;

use crate::cluster_api::ClusterApi;
use crate::delete_task_api::DeleteTaskApi;
use crate::developer_api::DeveloperApi;
use crate::elasticsearch_api::ElasticCompatibleApi;
use crate::health_check_api::HealthCheckApi;
use crate::index_api::IndexApi;
use crate::indexing_api::IndexingApi;
use crate::ingest_api::{IngestApi, IngestApiSchemas};
use crate::jaeger_api::JaegerApi;
use crate::metrics_api::MetricsApi;
use crate::node_info_handler::NodeInfoApi;
use crate::otlp_api::OtlpApi;
use crate::search_api::SearchApi;
use crate::template_api::IndexTemplateApi;

/// Builds the OpenApi docs structure using the registered/merged docs.
pub fn build_docs() -> utoipa::openapi::OpenApi {
    let mut docs_base = utoipa::openapi::OpenApiBuilder::new()
        .info(
            utoipa::openapi::InfoBuilder::new()
                .title("Quickwit")
                .version(env!("CARGO_PKG_VERSION"))
                .description(Some(env!("CARGO_PKG_DESCRIPTION")))
                .license(Some(utoipa::openapi::License::new(env!(
                    "CARGO_PKG_LICENSE"
                ))))
                .contact(Some(
                    utoipa::openapi::ContactBuilder::new()
                        .name(Some("Quickwit, Inc."))
                        .email(Some("hello@quickwit.io"))
                        .build(),
                ))
                .build(),
        )
        .paths(utoipa::openapi::Paths::new())
        .components(Some(utoipa::openapi::Components::new()))
        .build();

    // Tags use for grouping and sorting routes.
    let tags = vec![
        Tag::new("Search"),
        Tag::new("Indexes"),
        Tag::new("Ingest"),
        Tag::new("Delete Tasks"),
        Tag::new("Node Health"),
        Tag::new("Sources"),
        Tag::new("Get Metrics"),
        Tag::new("Cluster Info"),
        Tag::new("Node Info"),
        Tag::new("Indexing"),
        Tag::new("Splits"),
        Tag::new("Jaeger"),
        Tag::new("Open Telemetry"),
        Tag::new("Debug"),
    ];
    docs_base.tags = Some(tags);

    // Routing
    docs_base.merge_components_and_paths(ClusterApi::openapi().with_path_prefix("/api/v1"));
    docs_base.merge_components_and_paths(DeleteTaskApi::openapi().with_path_prefix("/api/v1"));
    docs_base
        .merge_components_and_paths(DeveloperApi::openapi().with_path_prefix("/api/developer"));
    docs_base
        .merge_components_and_paths(ElasticCompatibleApi::openapi().with_path_prefix("/api/v1"));
    docs_base.merge_components_and_paths(OtlpApi::openapi().with_path_prefix("/api/v1"));
    docs_base.merge_components_and_paths(HealthCheckApi::openapi().with_path_prefix("/health"));
    docs_base.merge_components_and_paths(IndexApi::openapi().with_path_prefix("/api/v1"));
    docs_base.merge_components_and_paths(IndexingApi::openapi().with_path_prefix("/api/v1"));
    docs_base.merge_components_and_paths(IndexTemplateApi::openapi().with_path_prefix("/api/v1"));
    docs_base.merge_components_and_paths(IngestApi::openapi().with_path_prefix("/api/v1"));
    docs_base.merge_components_and_paths(JaegerApi::openapi().with_path_prefix("/api/v1"));
    docs_base.merge_components_and_paths(MetricsApi::openapi().with_path_prefix("/metrics"));
    docs_base.merge_components_and_paths(NodeInfoApi::openapi().with_path_prefix("/api/v1"));
    docs_base.merge_components_and_paths(SearchApi::openapi().with_path_prefix("/api/v1"));

    // Schemas
    docs_base.merge_components_and_paths(MetastoreApiSchemas::openapi());
    docs_base.merge_components_and_paths(ConfigApiSchemas::openapi());
    docs_base.merge_components_and_paths(JanitorApiSchemas::openapi());
    docs_base.merge_components_and_paths(DocMapperApiSchemas::openapi());
    docs_base.merge_components_and_paths(IndexingApiSchemas::openapi());
    docs_base.merge_components_and_paths(IngestApiSchemas::openapi());

    docs_base
}

pub trait OpenApiMerger {
    /// Merges a given [OpenApi] schema into another schema.
    fn merge_components_and_paths(&mut self, schema: utoipa::openapi::OpenApi);

    /// Modifies all of the paths for a given OpenAPI instance
    /// and appends the provided prefix to the paths.
    fn with_path_prefix(self, path: &str) -> Self;
}

impl OpenApiMerger for utoipa::openapi::OpenApi {
    fn merge_components_and_paths(&mut self, schema: utoipa::openapi::OpenApi) {
        self.paths.paths.extend(schema.paths.paths);

        if let Some(tags) = &mut self.tags {
            tags.extend(schema.tags.unwrap_or_default());
        } else {
            self.tags = schema.tags;
        }

        if let Some(components) = &mut self.components {
            let other_components = schema.components.unwrap_or_default();

            components.responses.extend(other_components.responses);
            components.schemas.extend(other_components.schemas);
            components
                .security_schemes
                .extend(other_components.security_schemes);
        } else {
            self.components = schema.components;
        }
    }

    fn with_path_prefix(mut self, prefix: &str) -> Self {
        let paths = mem::take(&mut self.paths.paths);
        for (path, detail) in paths {
            // We can panic here as it will be raised during unit tests.
            assert!(
                path.starts_with('/'),
                "Path {path:?} does not start with `/`."
            );

            let adjusted_path = if path != "/" {
                format!("{prefix}{path}")
            } else {
                prefix.to_owned()
            };
            self.paths.paths.insert(adjusted_path, detail);
        }

        self
    }
}

#[cfg(test)]
mod openapi_schema_tests {
    use std::collections::BTreeSet;

    use itertools::Itertools;
    use utoipa::openapi::schema::AdditionalProperties;
    use utoipa::openapi::{RefOr, Schema};

    use super::*;

    #[test]
    fn ensure_schemas_resolve() {
        let docs = build_docs();
        resolve_openapi_schemas(&docs).expect("All schemas should be resolved.");
    }

    fn resolve_openapi_schemas(openapi: &utoipa::openapi::OpenApi) -> anyhow::Result<()> {
        let schemas_lookup = if let Some(components) = &openapi.components {
            resolve_component_schemas(components)?
        } else {
            BTreeSet::new()
        };

        let mut errors = Vec::new();
        for (path, detail) in openapi.paths.paths.iter() {
            let path = path.as_str();
            for (method, operation) in detail.operations.iter() {
                let method = serde_json::to_string(method).unwrap();
                let contents = operation
                    .request_body
                    .as_ref()
                    .map(|v| &v.content)
                    .cloned()
                    .unwrap_or_default();
                for (key, content) in contents {
                    let location = match content.schema {
                        RefOr::Ref(r) => r.ref_location,
                        RefOr::T(_) => continue,
                    };

                    if !schemas_lookup.contains(&location) {
                        let info = format!("key:{key:?}");
                        errors.push((location, method.clone(), path, info));
                    }
                }

                for (status, resp) in operation.responses.responses.iter() {
                    let location = match resp {
                        RefOr::Ref(r) => &r.ref_location,
                        RefOr::T(_) => continue,
                    };

                    if !schemas_lookup.contains(location) {
                        let info = format!("status:{status}");
                        errors.push((location.clone(), method.clone(), path, info));
                    }
                }

                for parameter in operation.parameters.as_deref().unwrap_or(&[]) {
                    let location = match &parameter.schema {
                        Some(RefOr::Ref(r)) => &r.ref_location,
                        Some(RefOr::T(schema)) => {
                            let parent = format!("param: {}", &parameter.name);
                            check_schema(
                                &method,
                                path,
                                &schemas_lookup,
                                &mut errors,
                                &parent,
                                schema,
                            );
                            continue;
                        }
                        _ => continue,
                    };

                    if !schemas_lookup.contains(location) {
                        let info = format!("param:{}", parameter.name);
                        errors.push((location.clone(), method.clone(), path, info));
                    }
                }
            }
        }

        if !errors.is_empty() {
            let errors = errors
                .into_iter()
                .map(|(location, method, path, info)| {
                    format!("{method} {path:?} {info} - location: {location}")
                })
                .join("\n");

            anyhow::bail!(
                "failed to resolve schemas, do these types implement `ToSchema`?:\n\n{errors}"
            )
        }

        Ok(())
    }

    /// Builds a lookup set of all of the schemas that can be referenced.
    fn resolve_component_schemas(
        components: &utoipa::openapi::Components,
    ) -> anyhow::Result<BTreeSet<String>> {
        // Loads the core schemas which is used by most references
        // This can have references in and of itself however, so we
        // need to track those to resolve later.
        let mut schema_lookup = BTreeSet::new();
        let mut pending_resolved = Vec::new();
        let mut resolve_once = Vec::new();

        for (schema_item, maybe_ref) in &components.schemas {
            let path = format!("#/components/schemas/{schema_item}");
            match maybe_ref {
                RefOr::Ref(r) => {
                    pending_resolved.push((path, r.ref_location.clone()));
                }
                RefOr::T(schema) => {
                    resolve_schema(&mut resolve_once, schema_item, schema);
                    schema_lookup.insert(path);
                }
            };
        }

        for schema_item in components.security_schemes.keys() {
            let path = format!("#/components/securitySchemes/{schema_item}");
            schema_lookup.insert(path);
        }

        // Although responses aren't technically a schema, they can be referenced and contain
        // references, so it's easier to merge them into one.
        for (schema_item, maybe_ref) in &components.responses {
            let path = format!("#/components/responses/{schema_item}");
            match maybe_ref {
                RefOr::Ref(r) => {
                    pending_resolved.push((path, r.ref_location.clone()));
                }
                RefOr::T(schema) => {
                    for (_, content) in &schema.content {
                        if let RefOr::Ref(r) = &content.schema
                            && !schema_lookup.contains(&r.ref_location)
                        {
                            resolve_once.push(CheckResolve::new(
                                r.ref_location.clone(),
                                schema_item.clone(),
                            ));
                        }
                    }
                    schema_lookup.insert(path);
                }
            };
        }

        // Walks through the list of references that need to be resolved.
        // Technically a reference can lead to a reference, so if one
        // location is resolved later on, we might then be able to resolve
        // others, hence the loop.
        loop {
            for (path, location) in mem::take(&mut pending_resolved) {
                if schema_lookup.contains(&location) {
                    schema_lookup.insert(path);
                } else {
                    pending_resolved.push((path, location));
                }
            }

            if pending_resolved.is_empty() {
                break;
            }
        }

        let mut failed_to_resolve = Vec::new();
        for resolve in resolve_once {
            if !schema_lookup.contains(&resolve.location) {
                failed_to_resolve.push(resolve);
            }
        }

        if !pending_resolved.is_empty() || !failed_to_resolve.is_empty() {
            let errors_pending = pending_resolved
                .into_iter()
                .map(|(path, _)| format!("{path:?}"))
                .join("\n");
            let errors_resolve_once = failed_to_resolve
                .into_iter()
                .map(|resolve| format!("Struct: {:?} - {:?}", resolve.parent, resolve.location,))
                .join("\n");
            anyhow::bail!(
                "failed to resolve schemas for OpenAPI \
                 spec:\n{errors_pending}\n{errors_resolve_once}"
            );
        }

        Ok(schema_lookup)
    }

    fn resolve_schema(
        resolve_once: &mut Vec<CheckResolve>,
        parent_location: &str,
        schema: &Schema,
    ) {
        match schema {
            Schema::Array(array) => {
                let parent = format!("{parent_location}.Vec");
                match &*array.items {
                    RefOr::Ref(r) => {
                        resolve_once.push(CheckResolve::new(r.ref_location.clone(), parent))
                    }
                    RefOr::T(schema) => resolve_schema(resolve_once, &parent, schema),
                }
            }
            Schema::Object(object) => {
                for (key, r) in object.properties.iter() {
                    let parent = format!("{parent_location}.{key}");
                    match r {
                        RefOr::Ref(r) => {
                            resolve_once.push(CheckResolve::new(r.ref_location.clone(), parent))
                        }
                        RefOr::T(schema) => resolve_schema(resolve_once, &parent, schema),
                    }
                }

                if let Some(ref props) = object.additional_properties
                    && let AdditionalProperties::RefOr(ref r) = **props
                {
                    match r {
                        RefOr::Ref(r) => resolve_once.push(CheckResolve::new(
                            r.ref_location.clone(),
                            parent_location.to_owned(),
                        )),
                        RefOr::T(schema) => resolve_schema(resolve_once, parent_location, schema),
                    }
                }
            }
            Schema::OneOf(one_of) => {
                let parent = format!("{parent_location}.Enum");
                for r in &one_of.items {
                    match r {
                        RefOr::Ref(r) => resolve_once
                            .push(CheckResolve::new(r.ref_location.clone(), parent.clone())),
                        RefOr::T(schema) => resolve_schema(resolve_once, &parent, schema),
                    }
                }
            }
            Schema::AllOf(all_of) => {
                for r in &all_of.items {
                    match r {
                        RefOr::Ref(r) => resolve_once.push(CheckResolve::new(
                            r.ref_location.clone(),
                            parent_location.to_owned(),
                        )),
                        RefOr::T(schema) => resolve_schema(resolve_once, parent_location, schema),
                    }
                }
            }
            _ => unimplemented!("Unknown schema variant"),
        }
    }

    fn check_schema<'a>(
        method: &str,
        path: &'a str,
        schemas_lookup: &BTreeSet<String>,
        errors: &mut Vec<(String, String, &'a str, String)>,
        parent_location: &str,
        schema: &Schema,
    ) {
        match schema {
            Schema::Array(array) => {
                let parent = format!("{parent_location}.Vec");
                match &*array.items {
                    RefOr::Ref(r) => {
                        if !schemas_lookup.contains(&r.ref_location) {
                            errors.push((parent, method.to_string(), path, String::new()));
                        }
                    }
                    RefOr::T(schema) => {
                        check_schema(method, path, schemas_lookup, errors, &parent, schema)
                    }
                }
            }
            Schema::Object(object) => {
                for (key, r) in object.properties.iter() {
                    let parent = format!("{parent_location}.{key}");
                    match r {
                        RefOr::Ref(r) => {
                            if !schemas_lookup.contains(&r.ref_location) {
                                errors.push((parent, method.to_string(), path, String::new()));
                            }
                        }
                        RefOr::T(schema) => {
                            check_schema(method, path, schemas_lookup, errors, &parent, schema)
                        }
                    }
                }

                if let Some(ref props) = object.additional_properties
                    && let AdditionalProperties::RefOr(ref r) = **props
                {
                    match r {
                        RefOr::Ref(r) => {
                            if !schemas_lookup.contains(&r.ref_location) {
                                errors.push((
                                    parent_location.to_string(),
                                    method.to_string(),
                                    path,
                                    String::new(),
                                ));
                            }
                        }
                        RefOr::T(schema) => check_schema(
                            method,
                            path,
                            schemas_lookup,
                            errors,
                            parent_location,
                            schema,
                        ),
                    }
                }
            }
            Schema::OneOf(one_of) => {
                let parent = format!("{parent_location}.Enum");
                for r in &one_of.items {
                    match r {
                        RefOr::Ref(r) => {
                            if !schemas_lookup.contains(&r.ref_location) {
                                errors.push((
                                    parent.clone(),
                                    method.to_string(),
                                    path,
                                    String::new(),
                                ));
                            }
                        }
                        RefOr::T(schema) => {
                            check_schema(method, path, schemas_lookup, errors, &parent, schema)
                        }
                    }
                }
            }
            Schema::AllOf(all_of) => {
                for r in &all_of.items {
                    match r {
                        RefOr::Ref(r) => {
                            let (_, type_name) = r.ref_location.rsplit_once('/').unwrap();
                            let parent = format!("{parent_location}.{type_name}");
                            if !schemas_lookup.contains(&r.ref_location) {
                                errors.push((parent, method.to_string(), path, String::new()));
                            }
                        }
                        RefOr::T(schema) => check_schema(
                            method,
                            path,
                            schemas_lookup,
                            errors,
                            parent_location,
                            schema,
                        ),
                    }
                }
            }
            _ => unimplemented!("Unknown schema variant"),
        }
    }

    struct CheckResolve {
        location: String,
        parent: String,
    }

    impl CheckResolve {
        fn new(location: String, parent: String) -> Self {
            Self { location, parent }
        }
    }
}


================================================
FILE: quickwit/quickwit-serve/src/otlp_api/mod.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

mod rest_handler;
pub use rest_handler::OtlpApi;
pub(crate) use rest_handler::otlp_ingest_api_handlers;


================================================
FILE: quickwit/quickwit-serve/src/otlp_api/rest_handler.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use quickwit_common::rate_limited_error;
use quickwit_opentelemetry::otlp::{OtelSignal, OtlpGrpcLogsService, OtlpGrpcTracesService};
use quickwit_proto::opentelemetry::proto::collector::logs::v1::logs_service_server::LogsService;
use quickwit_proto::opentelemetry::proto::collector::logs::v1::{
    ExportLogsServiceRequest, ExportLogsServiceResponse,
};
use quickwit_proto::opentelemetry::proto::collector::trace::v1::trace_service_server::TraceService;
use quickwit_proto::opentelemetry::proto::collector::trace::v1::{
    ExportTraceServiceRequest, ExportTraceServiceResponse,
};
use quickwit_proto::types::IndexId;
use quickwit_proto::{ServiceError, ServiceErrorCode, tonic};
use serde::{self, Serialize};
use warp::{Filter, Rejection};

use crate::decompression::get_body_bytes;
use crate::rest::recover_fn;
use crate::rest_api_response::into_rest_api_response;
use crate::{Body, BodyFormat, require, with_arg};

#[derive(utoipa::OpenApi)]
#[openapi(paths(
    otlp_default_logs_handler,
    otlp_logs_handler,
    otlp_default_traces_handler,
    otlp_ingest_traces_handler
))]
pub struct OtlpApi;

/// Setup OpenTelemetry API handlers.
pub(crate) fn otlp_ingest_api_handlers(
    otlp_logs_service: Option<OtlpGrpcLogsService>,
    otlp_traces_service: Option<OtlpGrpcTracesService>,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    otlp_default_logs_handler(otlp_logs_service.clone())
        .or(otlp_default_traces_handler(otlp_traces_service.clone()).recover(recover_fn))
        .or(otlp_logs_handler(otlp_logs_service).recover(recover_fn))
        .or(otlp_ingest_traces_handler(otlp_traces_service).recover(recover_fn))
        .boxed()
}

/// Open Telemetry REST/Protobuf logs ingest endpoint.
#[utoipa::path(
    post,
    tag = "Open Telemetry",
    path = "/otlp/v1/logs",
    request_body(content = String, description = "`ExportLogsServiceRequest` protobuf message", content_type = "application/x-protobuf"),
    responses(
        (status = 200, description = "Successfully exported logs.", body = ExportLogsServiceResponse)
    ),
)]
pub(crate) fn otlp_default_logs_handler(
    otlp_logs_service: Option<OtlpGrpcLogsService>,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    require(otlp_logs_service)
        .and(warp::path!("otlp" / "v1" / "logs"))
        .and(warp::header::exact_ignore_case(
            "content-type",
            "application/x-protobuf",
        ))
        .and(warp::header::optional::<String>(
            OtelSignal::Logs.header_name(),
        ))
        .and(warp::post())
        .and(get_body_bytes())
        .then(
            |otlp_logs_service, index_id: Option<String>, body| async move {
                let index_id =
                    index_id.unwrap_or_else(|| OtelSignal::Logs.default_index_id().to_string());
                otlp_ingest_logs(otlp_logs_service, index_id, body).await
            },
        )
        .and(with_arg(BodyFormat::default()))
        .map(into_rest_api_response)
        .boxed()
}
/// Open Telemetry REST/Protobuf logs ingest endpoint.
#[utoipa::path(
    post,
    tag = "Open Telemetry",
    path = "/{index}/otlp/v1/logs",
    request_body(content = String, description = "`ExportLogsServiceRequest` protobuf message", content_type = "application/x-protobuf"),
    responses(
        (status = 200, description = "Successfully exported logs.", body = ExportLogsServiceResponse)
    ),
)]
pub(crate) fn otlp_logs_handler(
    otlp_log_service: Option<OtlpGrpcLogsService>,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    require(otlp_log_service)
        .and(warp::path!(String / "otlp" / "v1" / "logs"))
        .and(warp::header::exact_ignore_case(
            "content-type",
            "application/x-protobuf",
        ))
        .and(warp::post())
        .and(get_body_bytes())
        .then(otlp_ingest_logs)
        .and(with_arg(BodyFormat::default()))
        .map(into_rest_api_response)
        .boxed()
}

/// Open Telemetry REST/Protobuf traces ingest endpoint.
#[utoipa::path(
    post,
    tag = "Open Telemetry",
    path = "/otlp/v1/traces",
    request_body(content = String, description = "`ExportTraceServiceRequest` protobuf message", content_type = "application/x-protobuf"),
    responses(
        (status = 200, description = "Successfully exported traces.", body = ExportTracesServiceResponse)
    ),
)]
pub(crate) fn otlp_default_traces_handler(
    otlp_traces_service: Option<OtlpGrpcTracesService>,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    require(otlp_traces_service)
        .and(warp::path!("otlp" / "v1" / "traces"))
        .and(warp::header::exact_ignore_case(
            "content-type",
            "application/x-protobuf",
        ))
        .and(warp::header::optional::<String>(
            OtelSignal::Traces.header_name(),
        ))
        .and(warp::post())
        .and(get_body_bytes())
        .then(
            |otlp_traces_service, index_id: Option<String>, body| async move {
                let index_id =
                    index_id.unwrap_or_else(|| OtelSignal::Traces.default_index_id().to_string());
                otlp_ingest_traces(otlp_traces_service, index_id, body).await
            },
        )
        .and(with_arg(BodyFormat::default()))
        .map(into_rest_api_response)
        .boxed()
}
/// Open Telemetry REST/Protobuf traces ingest endpoint.
#[utoipa::path(
    post,
    tag = "Open Telemetry",
    path = "/{index}/otlp/v1/traces",
    request_body(content = String, description = "`ExportTraceServiceRequest` protobuf message", content_type = "application/x-protobuf"),
    responses(
        (status = 200, description = "Successfully exported traces.", body = ExportTracesServiceResponse)
    ),
)]
pub(crate) fn otlp_ingest_traces_handler(
    otlp_traces_service: Option<OtlpGrpcTracesService>,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    require(otlp_traces_service)
        .and(warp::path!(String / "otlp" / "v1" / "traces"))
        .and(warp::header::exact_ignore_case(
            "content-type",
            "application/x-protobuf",
        ))
        .and(warp::post())
        .and(get_body_bytes())
        .then(otlp_ingest_traces)
        .and(with_arg(BodyFormat::default()))
        .map(into_rest_api_response)
        .boxed()
}

#[derive(Debug, Clone, thiserror::Error, Serialize)]
pub enum OtlpApiError {
    #[error("invalid OTLP request: {0}")]
    InvalidPayload(String),
    #[error("error when ingesting payload: {0}")]
    Ingest(String),
}

impl ServiceError for OtlpApiError {
    fn error_code(&self) -> ServiceErrorCode {
        match self {
            OtlpApiError::InvalidPayload(_) => ServiceErrorCode::BadRequest,
            OtlpApiError::Ingest(err_msg) => {
                rate_limited_error!(limit_per_min = 6, "otlp internal error: {err_msg}");
                ServiceErrorCode::Internal
            }
        }
    }
}

async fn otlp_ingest_logs(
    otlp_logs_service: OtlpGrpcLogsService,
    index_id: IndexId,
    body: Body,
) -> Result<ExportLogsServiceResponse, OtlpApiError> {
    let export_logs_request: ExportLogsServiceRequest =
        prost::Message::decode(&body.content[..])
            .map_err(|err| OtlpApiError::InvalidPayload(err.to_string()))?;
    let mut request = tonic::Request::new(export_logs_request);
    let index = index_id
        .try_into()
        .map_err(|_| OtlpApiError::InvalidPayload("invalid index id".to_string()))?;
    request
        .metadata_mut()
        .insert(OtelSignal::Logs.header_name(), index);
    let result = otlp_logs_service
        .export(request)
        .await
        .map_err(|err| OtlpApiError::Ingest(err.to_string()))?;
    Ok(result.into_inner())
}

async fn otlp_ingest_traces(
    otlp_traces_service: OtlpGrpcTracesService,
    index_id: IndexId,
    body: Body,
) -> Result<ExportTraceServiceResponse, OtlpApiError> {
    let export_traces_request: ExportTraceServiceRequest =
        prost::Message::decode(&body.content[..])
            .map_err(|err| OtlpApiError::InvalidPayload(err.to_string()))?;
    let mut request = tonic::Request::new(export_traces_request);
    let index = index_id
        .try_into()
        .map_err(|_| OtlpApiError::InvalidPayload("invalid index id".to_string()))?;
    request
        .metadata_mut()
        .insert(OtelSignal::Traces.header_name(), index);
    let response = otlp_traces_service
        .export(request)
        .await
        .map_err(|err| OtlpApiError::Ingest(err.to_string()))?;
    Ok(response.into_inner())
}

#[cfg(test)]
mod tests {
    use std::io::Write;

    use flate2::Compression;
    use flate2::write::GzEncoder;
    use prost::Message;
    use quickwit_ingest::CommitType;
    use quickwit_opentelemetry::otlp::{
        OtlpGrpcLogsService, OtlpGrpcTracesService, make_resource_spans_for_test,
    };
    use quickwit_proto::ingest::router::{
        IngestResponseV2, IngestRouterServiceClient, IngestSuccess, MockIngestRouterService,
    };
    use quickwit_proto::opentelemetry::proto::collector::logs::v1::{
        ExportLogsServiceRequest, ExportLogsServiceResponse,
    };
    use quickwit_proto::opentelemetry::proto::collector::trace::v1::{
        ExportTraceServiceRequest, ExportTraceServiceResponse,
    };
    use quickwit_proto::opentelemetry::proto::logs::v1::{LogRecord, ResourceLogs, ScopeLogs};
    use quickwit_proto::opentelemetry::proto::resource::v1::Resource;
    use warp::Filter;

    use super::otlp_ingest_api_handlers;
    use crate::rest::recover_fn;

    fn compress(body: &[u8]) -> Vec<u8> {
        let mut encoder = GzEncoder::new(Vec::new(), Compression::default());
        encoder.write_all(body).expect("Failed to write to encoder");
        encoder.finish().expect("Failed to finish compression")
    }

    #[tokio::test]
    async fn test_otlp_ingest_logs_handler() {
        let mut mock_ingest_router = MockIngestRouterService::new();
        mock_ingest_router
            .expect_ingest()
            .times(2)
            .withf(|request| {
                if request.subrequests.len() == 1 {
                    let subrequest = &request.subrequests[0];
                    subrequest.doc_batch.is_some()
                    // && request.commit == CommitType::Auto as i32
                    && subrequest.doc_batch.as_ref().unwrap().doc_lengths.len() == 1
                    && subrequest.index_id == quickwit_opentelemetry::otlp::OTEL_LOGS_INDEX_ID
                } else {
                    false
                }
            })
            .returning(|_| {
                Ok(IngestResponseV2 {
                    successes: vec![IngestSuccess {
                        num_ingested_docs: 1,
                        ..Default::default()
                    }],
                    failures: Vec::new(),
                })
            });
        mock_ingest_router
            .expect_ingest()
            .times(2)
            .withf(|request| {
                if request.subrequests.len() == 1 {
                    let subrequest = &request.subrequests[0];
                    subrequest.doc_batch.is_some()
                    // && request.commit == CommitType::Auto as i32
                    && subrequest.doc_batch.as_ref().unwrap().doc_lengths.len() == 1
                    && subrequest.index_id == "otel-logs-v0_6"
                } else {
                    false
                }
            })
            .returning(|_| {
                Ok(IngestResponseV2 {
                    successes: vec![IngestSuccess {
                        num_ingested_docs: 1,
                        ..Default::default()
                    }],
                    failures: Vec::new(),
                })
            });
        let ingest_router = IngestRouterServiceClient::from_mock(mock_ingest_router);
        let logs_service = OtlpGrpcLogsService::new(ingest_router.clone());
        let traces_service = OtlpGrpcTracesService::new(ingest_router, Some(CommitType::Force));
        let export_logs_request = ExportLogsServiceRequest {
            resource_logs: vec![ResourceLogs {
                resource: Some(Resource {
                    attributes: Vec::new(),
                    dropped_attributes_count: 0,
                }),
                scope_logs: vec![ScopeLogs {
                    log_records: vec![LogRecord {
                        body: None,
                        attributes: Vec::new(),
                        dropped_attributes_count: 0,
                        time_unix_nano: 1704036033047000000,
                        severity_number: 0,
                        severity_text: "ERROR".to_string(),
                        span_id: Vec::new(),
                        trace_id: Vec::new(),
                        flags: 0,
                        observed_time_unix_nano: 0,
                    }],
                    scope: None,
                    schema_url: "".to_string(),
                }],
                schema_url: "".to_string(),
            }],
        };
        let body = export_logs_request.encode_to_vec();
        let otlp_traces_api_handler =
            otlp_ingest_api_handlers(Some(logs_service), Some(traces_service)).recover(recover_fn);
        {
            // Test default otlp endpoint
            let resp = warp::test::request()
                .path("/otlp/v1/logs")
                .method("POST")
                .header("content-type", "application/x-protobuf")
                .body(body.clone())
                .reply(&otlp_traces_api_handler)
                .await;
            assert_eq!(resp.status(), 200);
            let actual_response: ExportLogsServiceResponse =
                serde_json::from_slice(resp.body()).unwrap();
            assert!(actual_response.partial_success.is_some());
            assert_eq!(
                actual_response
                    .partial_success
                    .unwrap()
                    .rejected_log_records,
                0
            );
        }
        {
            // Test default otlp endpoint with compression
            let resp = warp::test::request()
                .path("/otlp/v1/logs")
                .method("POST")
                .header("content-type", "application/x-protobuf")
                .header("content-encoding", "gzip")
                .body(compress(&body))
                .reply(&otlp_traces_api_handler)
                .await;
            assert_eq!(resp.status(), 200);
            let actual_response: ExportLogsServiceResponse =
                serde_json::from_slice(resp.body()).unwrap();
            assert!(actual_response.partial_success.is_some());
            assert_eq!(
                actual_response
                    .partial_success
                    .unwrap()
                    .rejected_log_records,
                0
            );
        }
        {
            // Test endpoint with index ID through header
            let resp = warp::test::request()
                .path("/otlp/v1/logs")
                .method("POST")
                .header("content-type", "application/x-protobuf")
                .header("qw-otel-logs-index", "otel-logs-v0_6")
                .body(body.clone())
                .reply(&otlp_traces_api_handler)
                .await;
            assert_eq!(resp.status(), 200);
            let actual_response: ExportLogsServiceResponse =
                serde_json::from_slice(resp.body()).unwrap();
            assert!(actual_response.partial_success.is_some());
            assert_eq!(
                actual_response
                    .partial_success
                    .unwrap()
                    .rejected_log_records,
                0
            );
        }
        {
            // Test endpoint with given index ID through path.
            let resp = warp::test::request()
                .path("/otel-logs-v0_6/otlp/v1/logs")
                .method("POST")
                .header("content-type", "application/x-protobuf")
                .body(body.clone())
                .reply(&otlp_traces_api_handler)
                .await;
            assert_eq!(resp.status(), 200);
            let actual_response: ExportLogsServiceResponse =
                serde_json::from_slice(resp.body()).unwrap();
            assert!(actual_response.partial_success.is_some());
            assert_eq!(
                actual_response
                    .partial_success
                    .unwrap()
                    .rejected_log_records,
                0
            );
        }
    }

    #[tokio::test]
    async fn test_otlp_ingest_traces_handler() {
        let mut mock_ingest_router = MockIngestRouterService::new();
        mock_ingest_router
            .expect_ingest()
            .times(2)
            .withf(|request| {
                if request.subrequests.len() == 1 {
                    let subrequest = &request.subrequests[0];
                    subrequest.doc_batch.is_some()
                    // && request.commit == CommitType::Auto as i32
                    && subrequest.doc_batch.as_ref().unwrap().doc_lengths.len() == 5
                    && subrequest.index_id == quickwit_opentelemetry::otlp::OTEL_TRACES_INDEX_ID
                } else {
                    false
                }
            })
            .returning(|_| {
                Ok(IngestResponseV2 {
                    successes: vec![IngestSuccess {
                        num_ingested_docs: 1,
                        ..Default::default()
                    }],
                    failures: Vec::new(),
                })
            });
        mock_ingest_router
            .expect_ingest()
            .times(2)
            .withf(|request| {
                if request.subrequests.len() == 1 {
                    let subrequest = &request.subrequests[0];
                    subrequest.doc_batch.is_some()
                    // && request.commit == CommitType::Auto as i32
                    && subrequest.doc_batch.as_ref().unwrap().doc_lengths.len() == 5
                    && subrequest.index_id == "otel-traces-v0_6"
                } else {
                    false
                }
            })
            .returning(|_| {
                Ok(IngestResponseV2 {
                    successes: vec![IngestSuccess {
                        num_ingested_docs: 1,
                        ..Default::default()
                    }],
                    failures: Vec::new(),
                })
            });
        let ingest_router = IngestRouterServiceClient::from_mock(mock_ingest_router);
        let logs_service = OtlpGrpcLogsService::new(ingest_router.clone());
        let traces_service = OtlpGrpcTracesService::new(ingest_router, Some(CommitType::Force));
        let export_trace_request = ExportTraceServiceRequest {
            resource_spans: make_resource_spans_for_test(),
        };
        let body = export_trace_request.encode_to_vec();
        let otlp_traces_api_handler =
            otlp_ingest_api_handlers(Some(logs_service), Some(traces_service)).recover(recover_fn);
        {
            // Test default otlp endpoint
            let resp = warp::test::request()
                .path("/otlp/v1/traces")
                .method("POST")
                .header("content-type", "application/x-protobuf")
                .body(body.clone())
                .reply(&otlp_traces_api_handler)
                .await;
            assert_eq!(resp.status(), 200);
            let actual_response: ExportTraceServiceResponse =
                serde_json::from_slice(resp.body()).unwrap();
            assert!(actual_response.partial_success.is_some());
            assert_eq!(actual_response.partial_success.unwrap().rejected_spans, 0);
        }
        {
            // Test default otlp endpoint with compression
            let resp = warp::test::request()
                .path("/otlp/v1/traces")
                .method("POST")
                .header("content-type", "application/x-protobuf")
                .header("content-encoding", "gzip")
                .body(compress(&body))
                .reply(&otlp_traces_api_handler)
                .await;
            assert_eq!(resp.status(), 200);
            let actual_response: ExportTraceServiceResponse =
                serde_json::from_slice(resp.body()).unwrap();
            assert!(actual_response.partial_success.is_some());
            assert_eq!(actual_response.partial_success.unwrap().rejected_spans, 0);
        }
        {
            // Test endpoint with given index ID through header.
            let resp = warp::test::request()
                .path("/otlp/v1/traces")
                .method("POST")
                .header("content-type", "application/x-protobuf")
                .header("qw-otel-traces-index", "otel-traces-v0_6")
                .body(body.clone())
                .reply(&otlp_traces_api_handler)
                .await;
            assert_eq!(resp.status(), 200);
            let actual_response: ExportTraceServiceResponse =
                serde_json::from_slice(resp.body()).unwrap();
            assert!(actual_response.partial_success.is_some());
            assert_eq!(actual_response.partial_success.unwrap().rejected_spans, 0);
        }
        {
            // Test endpoint with given index ID through path.
            let resp = warp::test::request()
                .path("/otel-traces-v0_6/otlp/v1/traces")
                .method("POST")
                .header("content-type", "application/x-protobuf")
                .body(body)
                .reply(&otlp_traces_api_handler)
                .await;
            assert_eq!(resp.status(), 200);
            let actual_response: ExportTraceServiceResponse =
                serde_json::from_slice(resp.body()).unwrap();
            assert!(actual_response.partial_success.is_some());
            assert_eq!(actual_response.partial_success.unwrap().rejected_spans, 0);
        }
    }
}


================================================
FILE: quickwit/quickwit-serve/src/rate_modulator.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::time::Duration;

use quickwit_common::tower::{ConstantRate, Rate};
use quickwit_ingest::MemoryCapacity;

#[derive(Clone)]
pub struct RateModulator<R> {
    rate_estimator: R,
    memory_capacity: MemoryCapacity,
    min_rate: ConstantRate,
}

impl<R> RateModulator<R>
where R: Rate
{
    /// Creates a new [`RateModulator`] instance.
    ///
    /// # Panics
    ///
    /// Panics if `rate_estimator` and `min_rate` have different periods.
    pub fn new(rate_estimator: R, memory_capacity: MemoryCapacity, min_rate: ConstantRate) -> Self {
        assert_eq!(
            rate_estimator.period(),
            min_rate.period(),
            "Rate estimator and min rate periods must be equal."
        );

        Self {
            rate_estimator,
            memory_capacity,
            min_rate,
        }
    }
}

impl<R> Rate for RateModulator<R>
where R: Rate
{
    fn work(&self) -> u64 {
        let memory_usage_ratio = self.memory_capacity.usage_ratio();
        let work = self.rate_estimator.work().max(self.min_rate.work());

        if memory_usage_ratio < 0.25 {
            work * 2
        } else if memory_usage_ratio > 0.99 {
            work / 32
        } else if memory_usage_ratio > 0.98 {
            work / 16
        } else if memory_usage_ratio > 0.95 {
            work / 8
        } else if memory_usage_ratio > 0.90 {
            work / 4
        } else if memory_usage_ratio > 0.80 {
            work / 2
        } else if memory_usage_ratio > 0.70 {
            work * 2 / 3
        } else {
            work
        }
    }

    fn period(&self) -> Duration {
        self.rate_estimator.period()
    }
}


================================================
FILE: quickwit/quickwit-serve/src/rest.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::fmt::Formatter;
use std::io;
use std::sync::Arc;

use hyper_util::rt::{TokioExecutor, TokioIo};
use hyper_util::server::conn::auto::Builder;
use hyper_util::service::TowerToHyperService;
use quickwit_common::tower::BoxFutureInfaillible;
use quickwit_config::{disable_ingest_v1, enable_ingest_v2};
use quickwit_search::SearchService;
use tokio::io::{AsyncRead, AsyncWrite};
use tokio::net::{TcpListener, TcpStream};
use tokio_rustls::TlsAcceptor;
use tokio_util::either::Either;
use tower::ServiceBuilder;
use tower_http::compression::CompressionLayer;
use tower_http::compression::predicate::{NotForContentType, Predicate, SizeAbove};
use tower_http::cors::{AllowOrigin, CorsLayer};
use tracing::{error, info};
use warp::filters::log::Info;
use warp::hyper::http::HeaderValue;
use warp::hyper::{Method, StatusCode, http};
use warp::{Filter, Rejection, Reply, redirect};

use crate::cluster_api::cluster_handler;
use crate::decompression::{CorruptedData, UnsupportedEncoding};
use crate::delete_task_api::delete_task_api_handlers;
use crate::developer_api::developer_api_routes;
use crate::elasticsearch_api::elastic_api_handlers;
use crate::health_check_api::health_check_handlers;
use crate::index_api::index_management_handlers;
use crate::indexing_api::indexing_get_handler;
use crate::ingest_api::ingest_api_handlers;
use crate::jaeger_api::jaeger_api_handlers;
use crate::metrics_api::metrics_handler;
use crate::node_info_handler::node_info_handler;
use crate::otlp_api::otlp_ingest_api_handlers;
use crate::rest_api_response::{RestApiError, RestApiResponse};
use crate::search_api::{
    search_get_handler, search_plan_get_handler, search_plan_post_handler, search_post_handler,
};
use crate::template_api::index_template_api_handlers;
use crate::ui_handler::ui_handler;
use crate::{BodyFormat, BuildInfo, QuickwitServices, RuntimeInfo};

#[derive(Debug)]
pub(crate) struct InvalidJsonRequest(pub serde_json::Error);

impl warp::reject::Reject for InvalidJsonRequest {}

#[derive(Debug)]
pub(crate) struct InvalidArgument(pub String);

impl warp::reject::Reject for InvalidArgument {}

#[derive(Debug)]
pub struct TooManyRequests;

impl warp::reject::Reject for TooManyRequests {}

impl std::fmt::Display for TooManyRequests {
    fn fmt(&self, f: &mut Formatter) -> std::fmt::Result {
        write!(f, "too many requests")
    }
}

/// Env variable key to define the minimum size above which a response should be compressed.
/// If unset, no compression is applied.
const QW_MINIMUM_COMPRESSION_SIZE_KEY: &str = "QW_MINIMUM_COMPRESSION_SIZE";

#[derive(Clone, Copy)]
struct CompressionPredicate {
    size_above_opt: Option<SizeAbove>,
}

impl CompressionPredicate {
    fn from_env() -> CompressionPredicate {
        let minimum_compression_size_opt: Option<u16> =
            quickwit_common::get_from_env_opt::<usize>(QW_MINIMUM_COMPRESSION_SIZE_KEY, false).map(
                |minimum_compression_size: usize| {
                    u16::try_from(minimum_compression_size).unwrap_or(u16::MAX)
                },
            );
        let size_above_opt = minimum_compression_size_opt.map(SizeAbove::new);
        CompressionPredicate { size_above_opt }
    }
}

impl Predicate for CompressionPredicate {
    fn should_compress<B>(&self, response: &http::Response<B>) -> bool
    where B: http_body::Body {
        if let Some(size_above) = self.size_above_opt {
            size_above.should_compress(response)
        } else {
            false
        }
    }
}

async fn apply_tls_if_necessary(
    tcp_stream: TcpStream,
    tls_acceptor_opt: &Option<TlsAcceptor>,
) -> io::Result<impl AsyncRead + AsyncWrite + Unpin + 'static> {
    let Some(tls_acceptor) = &tls_acceptor_opt else {
        return Ok(Either::Right(tcp_stream));
    };
    let tls_stream_res = tls_acceptor
        .accept(tcp_stream)
        .await
        .inspect_err(|err| error!("failed to perform tls handshake: {err:#}"))?;
    Ok(Either::Left(tls_stream_res))
}

/// Starts REST services.
pub(crate) async fn start_rest_server(
    tcp_listener: TcpListener,
    quickwit_services: Arc<QuickwitServices>,
    readiness_trigger: BoxFutureInfaillible<()>,
    shutdown_signal: BoxFutureInfaillible<()>,
) -> anyhow::Result<()> {
    let request_counter = warp::log::custom(|info: Info| {
        let elapsed = info.elapsed();
        let status = info.status();
        let label_values: [&str; 2] = [info.method().as_str(), status.as_str()];
        crate::SERVE_METRICS
            .request_duration_secs
            .with_label_values(label_values)
            .observe(elapsed.as_secs_f64());
        crate::SERVE_METRICS
            .http_requests_total
            .with_label_values(label_values)
            .inc();
    });
    // Docs routes
    let api_doc = warp::path("openapi.json")
        .and(warp::get())
        .map(|| warp::reply::json(&crate::openapi::build_docs()))
        .recover(recover_fn)
        .boxed();

    // `/health/*` routes.
    let health_check_routes = health_check_handlers(
        quickwit_services.cluster.clone(),
        quickwit_services.indexing_service_opt.clone(),
        quickwit_services.janitor_service_opt.clone(),
    )
    .boxed();

    // `/metrics` route.
    let metrics_routes = warp::path("metrics")
        .and(warp::get())
        .map(metrics_handler)
        .recover(recover_fn)
        .boxed();

    // `/api/developer/*` route.
    let developer_routes = developer_api_routes(
        quickwit_services.cluster.clone(),
        quickwit_services.env_filter_reload_fn.clone(),
    )
    .boxed();

    // `/api/v1/*` routes.
    let api_v1_root_route = api_v1_routes(quickwit_services.clone());

    let redirect_root_to_ui_route = warp::path::end()
        .and(warp::get())
        .map(|| redirect(http::Uri::from_static("/ui/search")))
        .recover(recover_fn)
        .boxed();

    let extra_headers = warp::reply::with::headers(
        quickwit_services
            .node_config
            .rest_config
            .extra_headers
            .clone(),
    );

    // Combine all the routes together.
    let rest_routes = api_v1_root_route
        .or(api_doc)
        .or(redirect_root_to_ui_route)
        .or(ui_handler())
        .or(health_check_routes)
        .or(metrics_routes)
        .or(developer_routes)
        .with(request_counter)
        .recover(recover_fn_final)
        .with(extra_headers)
        .boxed();

    let warp_service = warp::service(rest_routes);
    let compression_predicate = CompressionPredicate::from_env().and(NotForContentType::IMAGES);
    let cors = build_cors(&quickwit_services.node_config.rest_config.cors_allow_origins);

    let service = ServiceBuilder::new()
        .layer(
            CompressionLayer::new()
                .zstd(true)
                .gzip(true)
                .quality(tower_http::CompressionLevel::Fastest)
                .compress_when(compression_predicate),
        )
        .layer(cors)
        .service(warp_service);

    let rest_listen_addr = tcp_listener.local_addr()?;
    info!(
        rest_listen_addr=?rest_listen_addr,
        "starting REST server listening on {rest_listen_addr}"
    );

    let service = TowerToHyperService::new(service);

    let server = Builder::new(TokioExecutor::new());
    let graceful = hyper_util::server::graceful::GracefulShutdown::new();
    let mut shutdown_signal = std::pin::pin!(shutdown_signal);
    readiness_trigger.await;

    let tls_acceptor_opt: Option<TlsAcceptor> =
        if let Some(tls_config) = &quickwit_services.node_config.rest_config.tls {
            let rustls_config = tls::make_rustls_config(tls_config)?;
            Some(TlsAcceptor::from(rustls_config))
        } else {
            None
        };

    loop {
        tokio::select! {
            tcp_accept_res = tcp_listener.accept() => {
                let tcp_stream = match tcp_accept_res {
                    Ok((tcp_stream, _remote_addr)) => tcp_stream,
                    Err(err) => {
                        error!("failed to accept connection: {err:#}");
                        continue;
                    }
                };

                let Ok(tcp_or_tls_stream) = apply_tls_if_necessary(tcp_stream, &tls_acceptor_opt).await else {
                    continue;
                };

                let serve_fut = server.serve_connection_with_upgrades(TokioIo::new(tcp_or_tls_stream), service.clone());
                let serve_with_shutdown_fut = graceful.watch(serve_fut.into_owned());
                tokio::spawn(async move {
                    if let Err(err) = serve_with_shutdown_fut.await {
                        error!("failed to serve connection: {err:#}");
                    }
                });
            },
            _ = &mut shutdown_signal => {
                info!("REST server shutdown signal received");
                break;
            }
        }
    }

    graceful.shutdown().await;
    info!("gracefully shutdown");

    Ok(())
}

fn search_routes(
    search_service: Arc<dyn SearchService>,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    search_get_handler(search_service.clone())
        .or(search_post_handler(search_service.clone()))
        .or(search_plan_get_handler(search_service.clone()))
        .or(search_plan_post_handler(search_service.clone()))
        .recover(recover_fn)
        .boxed()
}

fn api_v1_routes(
    quickwit_services: Arc<QuickwitServices>,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    let api_v1_root_url = warp::path!("api" / "v1" / ..);
    api_v1_root_url.and(
        elastic_api_handlers(
            quickwit_services.cluster.clone(),
            quickwit_services.node_config.clone(),
            quickwit_services.search_service.clone(),
            quickwit_services.ingest_service.clone(),
            quickwit_services.ingest_router_service.clone(),
            quickwit_services.metastore_client.clone(),
            quickwit_services.index_manager.clone(),
            !disable_ingest_v1(),
            enable_ingest_v2(),
        )
        .or(cluster_handler(quickwit_services.cluster.clone()))
        .boxed()
        .or(node_info_handler(
            BuildInfo::get(),
            RuntimeInfo::get(),
            quickwit_services.node_config.clone(),
        ))
        .boxed()
        .or(indexing_get_handler(
            quickwit_services.indexing_service_opt.clone(),
        ))
        .boxed()
        .or(search_routes(quickwit_services.search_service.clone()))
        .boxed()
        .or(ingest_api_handlers(
            quickwit_services.ingest_router_service.clone(),
            quickwit_services.ingest_service.clone(),
            quickwit_services.node_config.ingest_api_config.clone(),
            !disable_ingest_v1(),
            enable_ingest_v2(),
        ))
        .boxed()
        .or(otlp_ingest_api_handlers(
            quickwit_services.otlp_logs_service_opt.clone(),
            quickwit_services.otlp_traces_service_opt.clone(),
        ))
        .boxed()
        .or(index_management_handlers(
            quickwit_services.index_manager.clone(),
            quickwit_services.node_config.clone(),
        ))
        .boxed()
        .or(delete_task_api_handlers(
            quickwit_services.metastore_client.clone(),
        ))
        .boxed()
        .or(jaeger_api_handlers(
            quickwit_services.jaeger_service_opt.clone(),
        ))
        .boxed()
        .or(index_template_api_handlers(
            quickwit_services.metastore_client.clone(),
        ))
        .boxed(),
    )
}

/// This function returns a formatted error based on the given rejection reason.
///
/// The ordering of rejection processing is very important, we need to start
/// with the most specific rejections and end with the most generic. If not, Quickwit
/// will return useless errors to the user.
// TODO: we may want in the future revamp rejections as our usage does not exactly
// match rejection behaviour. When a filter returns a rejection, it means that it
// did not match, but maybe another filter can. Consequently warp will continue
// to try to match other filters. Once a filter is matched, we can enter into
// our own logic and return a proper reply.
// More on this here: https://github.com/seanmonstar/warp/issues/388.
// We may use this work on the PR is merged: https://github.com/seanmonstar/warp/pull/909.
pub async fn recover_fn(rejection: Rejection) -> Result<impl Reply, Rejection> {
    let error = get_status_with_error(rejection)?;
    let status_code = error.status_code;
    Ok(RestApiResponse::new::<(), _>(
        &Err(error),
        status_code,
        BodyFormat::default(),
    ))
}

pub async fn recover_fn_final(rejection: Rejection) -> Result<impl Reply, Rejection> {
    let error = get_status_with_error(rejection).unwrap_or_else(|rejection: Rejection| {
        if rejection.is_not_found() {
            RestApiError {
                status_code: StatusCode::NOT_FOUND,
                message: "Route not found".to_string(),
            }
        } else {
            error!("REST server error: {:?}", rejection);
            RestApiError {
                status_code: StatusCode::INTERNAL_SERVER_ERROR,
                message: "internal server error".to_string(),
            }
        }
    });
    let status_code = error.status_code;
    Ok(RestApiResponse::new::<(), _>(
        &Err(error),
        status_code,
        BodyFormat::default(),
    ))
}

fn get_status_with_error(rejection: Rejection) -> Result<RestApiError, Rejection> {
    if let Some(error) = rejection.find::<crate::format::UnsupportedMediaType>() {
        Ok(RestApiError {
            status_code: StatusCode::UNSUPPORTED_MEDIA_TYPE,
            message: error.to_string(),
        })
    } else if let Some(error) = rejection.find::<serde_qs::Error>() {
        Ok(RestApiError {
            status_code: StatusCode::BAD_REQUEST,
            message: error.to_string(),
        })
    } else if let Some(error) = rejection.find::<InvalidJsonRequest>() {
        // Happens when the request body could not be deserialized correctly.
        Ok(RestApiError {
            status_code: StatusCode::BAD_REQUEST,
            message: error.0.to_string(),
        })
    } else if let Some(error) = rejection.find::<warp::filters::body::BodyDeserializeError>() {
        // Happens when the request body could not be deserialized correctly.
        Ok(RestApiError {
            status_code: StatusCode::BAD_REQUEST,
            message: error.to_string(),
        })
    } else if let Some(error) = rejection.find::<warp::reject::UnsupportedMediaType>() {
        Ok(RestApiError {
            status_code: StatusCode::UNSUPPORTED_MEDIA_TYPE,
            message: error.to_string(),
        })
    } else if let Some(error) = rejection.find::<UnsupportedEncoding>() {
        Ok(RestApiError {
            status_code: StatusCode::UNSUPPORTED_MEDIA_TYPE,
            message: error.to_string(),
        })
    } else if let Some(error) = rejection.find::<CorruptedData>() {
        Ok(RestApiError {
            status_code: StatusCode::BAD_REQUEST,
            message: error.to_string(),
        })
    } else if let Some(error) = rejection.find::<warp::reject::InvalidQuery>() {
        Ok(RestApiError {
            status_code: StatusCode::BAD_REQUEST,
            message: error.to_string(),
        })
    } else if let Some(error) = rejection.find::<warp::reject::LengthRequired>() {
        Ok(RestApiError {
            status_code: StatusCode::LENGTH_REQUIRED,
            message: error.to_string(),
        })
    } else if let Some(error) = rejection.find::<warp::reject::MissingHeader>() {
        Ok(RestApiError {
            status_code: StatusCode::BAD_REQUEST,
            message: error.to_string(),
        })
    } else if let Some(error) = rejection.find::<warp::reject::InvalidHeader>() {
        Ok(RestApiError {
            status_code: StatusCode::BAD_REQUEST,
            message: error.to_string(),
        })
    } else if let Some(error) = rejection.find::<warp::reject::PayloadTooLarge>() {
        Ok(RestApiError {
            status_code: StatusCode::PAYLOAD_TOO_LARGE,
            message: error.to_string(),
        })
    } else if let Some(err) = rejection.find::<TooManyRequests>() {
        Ok(RestApiError {
            status_code: StatusCode::TOO_MANY_REQUESTS,
            message: err.to_string(),
        })
    } else if let Some(error) = rejection.find::<InvalidArgument>() {
        // Happens when the url path or request body contains invalid argument(s).
        Ok(RestApiError {
            status_code: StatusCode::BAD_REQUEST,
            message: error.0.to_string(),
        })
    } else if let Some(error) = rejection.find::<warp::reject::MethodNotAllowed>() {
        Ok(RestApiError {
            status_code: StatusCode::METHOD_NOT_ALLOWED,
            message: error.to_string(),
        })
    } else {
        Err(rejection)
    }
}

fn build_cors(cors_origins: &[String]) -> CorsLayer {
    let debug_mode = quickwit_common::get_bool_from_env("QW_ENABLE_CORS_DEBUG", false);
    if debug_mode {
        info!("CORS debug mode is enabled, localhost and 127.0.0.1 origins will be allowed");
        return CorsLayer::new()
            .allow_methods([
                Method::GET,
                Method::POST,
                Method::PUT,
                Method::PATCH,
                Method::DELETE,
            ])
            .allow_origin(AllowOrigin::predicate(|origin, _parts| {
                [b"https://localhost:", b"https://127.0.0.1:"]
                    .iter()
                    .any(|prefix| origin.as_bytes().starts_with(*prefix))
            }))
            .allow_headers([http::header::CONTENT_TYPE]);
    }

    let mut cors = CorsLayer::new().allow_methods([
        Method::GET,
        Method::POST,
        Method::PUT,
        Method::DELETE,
        Method::OPTIONS,
    ]);
    if !cors_origins.is_empty() {
        let allow_any = cors_origins.iter().any(|origin| origin.as_str() == "*");

        if allow_any {
            info!("CORS is enabled, all origins will be allowed");
            cors = cors.allow_origin(tower_http::cors::Any);
        } else {
            info!(origins = ?cors_origins, "CORS is enabled, the following origins will be allowed");
            let origins = cors_origins
                .iter()
                .map(|origin| origin.parse::<HeaderValue>().unwrap())
                .collect::<Vec<_>>();
            cors = cors.allow_origin(origins);
        };
    }
    cors
}

mod tls {
    // most of this module is copied from hyper-tls examples, licensed under Apache 2.0, MIT or ISC

    use std::sync::Arc;
    use std::vec::Vec;
    use std::{fs, io};

    use quickwit_config::TlsConfig;
    use rustls::pki_types::{CertificateDer, PrivateKeyDer};
    use tokio_rustls::rustls::ServerConfig;

    fn io_error(error: String) -> io::Error {
        io::Error::other(error)
    }

    // Load public certificate from file.
    fn load_certs(filename: &str) -> io::Result<Vec<CertificateDer<'static>>> {
        // Open certificate file.
        let certfile = fs::File::open(filename)
            .map_err(|error| io_error(format!("failed to open {filename}: {error}")))?;
        let mut reader = io::BufReader::new(certfile);
        // Load and return certificate.
        rustls_pemfile::certs(&mut reader).collect()
    }

    // Load private key from file.
    fn load_private_key(filename: &str) -> io::Result<PrivateKeyDer<'static>> {
        // Open keyfile.
        let keyfile = fs::File::open(filename)
            .map_err(|error| io_error(format!("failed to open {filename}: {error}")))?;
        let mut reader = io::BufReader::new(keyfile);

        // Load and return a single private key.
        rustls_pemfile::private_key(&mut reader).map(|key| key.unwrap())
    }

    pub fn make_rustls_config(config: &TlsConfig) -> anyhow::Result<Arc<ServerConfig>> {
        let certs = load_certs(&config.cert_path)?;
        let key = load_private_key(&config.key_path)?;

        // TODO we could add support for client authorization, it seems less important than on the
        // gRPC side though
        if config.validate_client {
            anyhow::bail!("mTLS isn't supported on rest api");
        }

        let mut cfg = rustls::ServerConfig::builder()
            .with_no_client_auth()
            .with_single_cert(certs, key)
            .map_err(|error| io_error(error.to_string()))?;
        // Configure ALPN to accept HTTP/2, HTTP/1.1, and HTTP/1.0 in that order.
        cfg.alpn_protocols = vec![b"h2".to_vec(), b"http/1.1".to_vec(), b"http/1.0".to_vec()];
        Ok(Arc::new(cfg))
    }
}

#[cfg(test)]
mod tests {
    use std::future::Future;
    use std::pin::Pin;
    use std::task::{Context, Poll};

    use quickwit_cluster::{ChannelTransport, create_cluster_for_test};
    use quickwit_config::NodeConfig;
    use quickwit_index_management::IndexService;
    use quickwit_ingest::{IngestApiService, IngestServiceClient};
    use quickwit_proto::control_plane::ControlPlaneServiceClient;
    use quickwit_proto::ingest::router::IngestRouterServiceClient;
    use quickwit_proto::metastore::MetastoreServiceClient;
    use quickwit_search::MockSearchService;
    use quickwit_storage::StorageResolver;
    use tower::Service;
    use warp::http::HeaderName;
    use warp::hyper::{Request, Response, StatusCode};

    use super::*;
    use crate::rest::recover_fn_final;

    pub(crate) fn ingest_service_client() -> IngestServiceClient {
        let universe = quickwit_actors::Universe::new();
        let (ingest_service_mailbox, _) = universe.create_test_mailbox::<IngestApiService>();
        IngestServiceClient::from_mailbox(ingest_service_mailbox)
    }

    #[tokio::test]
    async fn test_cors() {
        // No cors enabled
        {
            let cors = build_cors(&[]);

            let mut layer = ServiceBuilder::new().layer(cors).service(HelloWorld);

            let resp = layer.call(Request::new(())).await.unwrap();
            let headers = resp.headers();
            assert_eq!(headers.get("Access-Control-Allow-Origin"), None);
            assert_eq!(headers.get("Access-Control-Allow-Methods"), None);
            assert_eq!(headers.get("Access-Control-Allow-Headers"), None);
            assert_eq!(headers.get("Access-Control-Max-Age"), None);

            let resp = layer
                .call(cors_request("http://localhost:3000"))
                .await
                .unwrap();
            let headers = resp.headers();
            assert_eq!(headers.get("Access-Control-Allow-Origin"), None);
            assert_eq!(
                headers.get("Access-Control-Allow-Methods"),
                Some(
                    &"GET,POST,PUT,DELETE,OPTIONS"
                        .parse::<HeaderValue>()
                        .unwrap()
                )
            );
            assert_eq!(headers.get("Access-Control-Allow-Headers"), None);
            assert_eq!(headers.get("Access-Control-Max-Age"), None);
        }

        // Wildcard cors enabled
        {
            let cors = build_cors(&["*".to_string()]);

            let mut layer = ServiceBuilder::new().layer(cors).service(HelloWorld);

            let resp = layer.call(Request::new(())).await.unwrap();
            let headers = resp.headers();
            assert_eq!(
                headers.get("Access-Control-Allow-Origin"),
                Some(&"*".parse::<HeaderValue>().unwrap())
            );
            assert_eq!(headers.get("Access-Control-Allow-Methods"), None);
            assert_eq!(headers.get("Access-Control-Allow-Headers"), None);
            assert_eq!(headers.get("Access-Control-Max-Age"), None);

            let resp = layer
                .call(cors_request("http://localhost:3000"))
                .await
                .unwrap();
            let headers = resp.headers();
            assert_eq!(
                headers.get("Access-Control-Allow-Origin"),
                Some(&"*".parse::<HeaderValue>().unwrap())
            );
            assert_eq!(
                headers.get("Access-Control-Allow-Methods"),
                Some(
                    &"GET,POST,PUT,DELETE,OPTIONS"
                        .parse::<HeaderValue>()
                        .unwrap()
                )
            );
            assert_eq!(headers.get("Access-Control-Allow-Headers"), None);
            assert_eq!(headers.get("Access-Control-Max-Age"), None);
        }

        // Specific origin cors enabled
        {
            let cors = build_cors(&["https://quickwit.io".to_string()]);

            let mut layer = ServiceBuilder::new().layer(cors).service(HelloWorld);

            let resp = layer.call(Request::new(())).await.unwrap();
            let headers = resp.headers();
            assert_eq!(headers.get("Access-Control-Allow-Origin"), None);
            assert_eq!(headers.get("Access-Control-Allow-Methods"), None);
            assert_eq!(headers.get("Access-Control-Allow-Headers"), None);
            assert_eq!(headers.get("Access-Control-Max-Age"), None);

            let resp = layer
                .call(cors_request("http://localhost:3000"))
                .await
                .unwrap();
            let headers = resp.headers();
            assert_eq!(headers.get("Access-Control-Allow-Origin"), None);
            assert_eq!(
                headers.get("Access-Control-Allow-Methods"),
                Some(
                    &"GET,POST,PUT,DELETE,OPTIONS"
                        .parse::<HeaderValue>()
                        .unwrap()
                )
            );
            assert_eq!(headers.get("Access-Control-Allow-Headers"), None);
            assert_eq!(headers.get("Access-Control-Max-Age"), None);

            let resp = layer
                .call(cors_request("https://quickwit.io"))
                .await
                .unwrap();
            let headers = resp.headers();
            assert_eq!(
                headers.get("Access-Control-Allow-Origin"),
                Some(&"https://quickwit.io".parse::<HeaderValue>().unwrap())
            );
            assert_eq!(
                headers.get("Access-Control-Allow-Methods"),
                Some(
                    &"GET,POST,PUT,DELETE,OPTIONS"
                        .parse::<HeaderValue>()
                        .unwrap()
                )
            );
            assert_eq!(headers.get("Access-Control-Allow-Headers"), None);
            assert_eq!(headers.get("Access-Control-Max-Age"), None);
        }

        // Specific multiple-origin cors enabled
        {
            let cors = build_cors(&[
                "https://quickwit.io".to_string(),
                "http://localhost:3000".to_string(),
            ]);

            let mut layer = ServiceBuilder::new().layer(cors).service(HelloWorld);

            let resp = layer.call(Request::new(())).await.unwrap();
            let headers = resp.headers();
            assert_eq!(headers.get("Access-Control-Allow-Origin"), None);
            assert_eq!(headers.get("Access-Control-Allow-Methods"), None);
            assert_eq!(headers.get("Access-Control-Allow-Headers"), None);
            assert_eq!(headers.get("Access-Control-Max-Age"), None);

            let resp = layer
                .call(cors_request("http://localhost:3000"))
                .await
                .unwrap();
            let headers = resp.headers();
            assert_eq!(
                headers.get("Access-Control-Allow-Origin"),
                Some(&"http://localhost:3000".parse::<HeaderValue>().unwrap())
            );
            assert_eq!(
                headers.get("Access-Control-Allow-Methods"),
                Some(
                    &"GET,POST,PUT,DELETE,OPTIONS"
                        .parse::<HeaderValue>()
                        .unwrap()
                )
            );
            assert_eq!(headers.get("Access-Control-Allow-Headers"), None);
            assert_eq!(headers.get("Access-Control-Max-Age"), None);

            let resp = layer
                .call(cors_request("https://quickwit.io"))
                .await
                .unwrap();
            let headers = resp.headers();
            assert_eq!(
                headers.get("Access-Control-Allow-Origin"),
                Some(&"https://quickwit.io".parse::<HeaderValue>().unwrap())
            );
            assert_eq!(
                headers.get("Access-Control-Allow-Methods"),
                Some(
                    &"GET,POST,PUT,DELETE,OPTIONS"
                        .parse::<HeaderValue>()
                        .unwrap()
                )
            );
            assert_eq!(headers.get("Access-Control-Allow-Headers"), None);
            assert_eq!(headers.get("Access-Control-Max-Age"), None);
        }
    }

    fn cors_request(origin: &'static str) -> Request<()> {
        let mut request = Request::new(());
        (*request.method_mut()) = Method::OPTIONS;
        request
            .headers_mut()
            .insert("Origin", HeaderValue::from_static(origin));
        request
    }

    struct HelloWorld;

    impl Service<Request<()>> for HelloWorld {
        type Response = Response<String>;
        type Error = http::Error;
        type Future = Pin<Box<dyn Future<Output = Result<Self::Response, Self::Error>>>>;

        fn poll_ready(&mut self, _cx: &mut Context<'_>) -> Poll<Result<(), Self::Error>> {
            Poll::Ready(Ok(()))
        }

        fn call(&mut self, _req: Request<()>) -> Self::Future {
            let body = "hello, world!\n".to_string();
            let resp = Response::builder()
                .status(StatusCode::OK)
                .body(body)
                .expect("Unable to create `http::Response`");

            let fut = async { Ok(resp) };

            Box::pin(fut)
        }
    }

    #[tokio::test]
    async fn test_extra_headers() {
        let mut node_config = NodeConfig::for_test();
        node_config.rest_config.extra_headers.insert(
            HeaderName::from_static("x-custom-header"),
            HeaderValue::from_static("custom-value"),
        );
        node_config.rest_config.extra_headers.insert(
            HeaderName::from_static("x-custom-header-2"),
            HeaderValue::from_static("custom-value-2"),
        );
        let metastore_client = MetastoreServiceClient::mocked();
        let index_service =
            IndexService::new(metastore_client.clone(), StorageResolver::unconfigured());
        let control_plane_client = ControlPlaneServiceClient::mocked();
        let transport = ChannelTransport::default();
        let cluster = create_cluster_for_test(Vec::new(), &[], &transport, false)
            .await
            .unwrap();
        let quickwit_services = QuickwitServices {
            _report_splits_subscription_handle_opt: None,
            _local_shards_update_listener_handle_opt: None,
            cluster,
            control_plane_server_opt: None,
            control_plane_client,
            indexing_service_opt: None,
            index_manager: index_service,
            ingest_service: ingest_service_client(),
            ingest_router_opt: None,
            ingest_router_service: IngestRouterServiceClient::mocked(),
            ingester_opt: None,
            janitor_service_opt: None,
            otlp_logs_service_opt: None,
            otlp_traces_service_opt: None,
            metastore_client,
            metastore_server_opt: None,
            node_config: Arc::new(node_config.clone()),
            search_service: Arc::new(MockSearchService::new()),
            jaeger_service_opt: None,
            env_filter_reload_fn: crate::do_nothing_env_filter_reload_fn(),
        };

        let handler = api_v1_routes(Arc::new(quickwit_services))
            .recover(recover_fn_final)
            .with(warp::reply::with::headers(
                node_config.rest_config.extra_headers.clone(),
            ));

        let resp = warp::test::request()
            .path("/api/v1/version")
            .reply(&handler.clone())
            .await;

        assert_eq!(resp.status(), 200);
        assert_eq!(
            resp.headers().get("x-custom-header").unwrap(),
            "custom-value"
        );
        assert_eq!(
            resp.headers().get("x-custom-header-2").unwrap(),
            "custom-value-2"
        );

        let resp_404 = warp::test::request()
            .path("/api/v1/version404")
            .reply(&handler)
            .await;

        assert_eq!(resp_404.status(), 404);
        assert_eq!(
            resp_404.headers().get("x-custom-header").unwrap(),
            "custom-value"
        );
        assert_eq!(
            resp_404.headers().get("x-custom-header-2").unwrap(),
            "custom-value-2"
        );
    }
}


================================================
FILE: quickwit/quickwit-serve/src/rest_api_response.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use quickwit_proto::ServiceError;
use serde::{self, Serialize};
use warp::Reply;
use warp::hyper::StatusCode;
use warp::hyper::header::CONTENT_TYPE;
use warp::hyper::http::HeaderValue;

use crate::format::BodyFormat;

const JSON_SERIALIZATION_ERROR: &str = "JSON serialization failed.";

#[derive(Serialize)]
pub(crate) struct RestApiError {
    // For now, we want to keep [`RestApiError`] as simple as possible
    // and return just a message.
    #[serde(skip_serializing)]
    pub status_code: StatusCode,
    pub message: String,
}

/// Makes a JSON API response from a result.
/// The error is wrapped into an [`RestApiError`] to publicly expose
/// a consistent error format.
pub(crate) fn into_rest_api_response<T: serde::Serialize, E: ServiceError>(
    result: Result<T, E>,
    body_format: BodyFormat,
) -> RestApiResponse {
    let rest_api_result = result.map_err(|error| RestApiError {
        status_code: error.error_code().http_status_code(),
        message: error.to_string(),
    });
    let status_code = match &rest_api_result {
        Ok(_) => StatusCode::OK,
        Err(error) => error.status_code,
    };
    RestApiResponse::new(&rest_api_result, status_code, body_format)
}

/// A JSON reply for the REST API.
pub struct RestApiResponse {
    status_code: StatusCode,
    inner: Result<Vec<u8>, ()>,
}

impl RestApiResponse {
    pub fn new<T: serde::Serialize, E: serde::Serialize>(
        result: &Result<T, E>,
        status_code: StatusCode,
        body_format: BodyFormat,
    ) -> Self {
        let inner = body_format.result_to_vec(result);
        RestApiResponse { status_code, inner }
    }
}

impl Reply for RestApiResponse {
    #[inline]
    fn into_response(self) -> warp::reply::Response {
        match self.inner {
            Ok(body) => {
                let mut response = warp::reply::Response::new(body.into());
                response
                    .headers_mut()
                    .insert(CONTENT_TYPE, HeaderValue::from_static("application/json"));
                *response.status_mut() = self.status_code;
                response
            }
            Err(()) => {
                quickwit_common::rate_limited_error!(
                    limit_per_min = 10,
                    "REST body json serialization error."
                );
                warp::reply::json(&RestApiError {
                    status_code: StatusCode::INTERNAL_SERVER_ERROR,
                    message: JSON_SERIALIZATION_ERROR.to_string(),
                })
                .into_response()
            }
        }
    }
}


================================================
FILE: quickwit/quickwit-serve/src/search_api/grpc_adapter.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::sync::Arc;

use async_trait::async_trait;
use quickwit_proto::error::convert_to_grpc_result;
use quickwit_proto::search::{
    GetKvRequest, GetKvResponse, LeafListFieldsRequest, ListFieldsRequest, ListFieldsResponse,
    ReportSplitsRequest, ReportSplitsResponse, search_service_server as grpc,
};
use quickwit_proto::{set_parent_span_from_request_metadata, tonic};
use quickwit_search::SearchService;
use tracing::instrument;

#[derive(Clone)]
pub struct GrpcSearchAdapter(Arc<dyn SearchService>);

impl From<Arc<dyn SearchService>> for GrpcSearchAdapter {
    fn from(search_service_arc: Arc<dyn SearchService>) -> Self {
        GrpcSearchAdapter(search_service_arc)
    }
}

#[async_trait]
impl grpc::SearchService for GrpcSearchAdapter {
    #[instrument(skip(self, request))]
    async fn root_search(
        &self,
        request: tonic::Request<quickwit_proto::search::SearchRequest>,
    ) -> Result<tonic::Response<quickwit_proto::search::SearchResponse>, tonic::Status> {
        set_parent_span_from_request_metadata(request.metadata());
        let search_request = request.into_inner();
        let search_result = self.0.root_search(search_request).await;
        convert_to_grpc_result(search_result)
    }

    #[instrument(skip(self, request))]
    async fn leaf_search(
        &self,
        request: tonic::Request<quickwit_proto::search::LeafSearchRequest>,
    ) -> Result<tonic::Response<quickwit_proto::search::LeafSearchResponse>, tonic::Status> {
        set_parent_span_from_request_metadata(request.metadata());
        let leaf_search_request = request.into_inner();
        let leaf_search_result = self.0.leaf_search(leaf_search_request).await;
        convert_to_grpc_result(leaf_search_result)
    }

    #[instrument(skip(self, request))]
    async fn fetch_docs(
        &self,
        request: tonic::Request<quickwit_proto::search::FetchDocsRequest>,
    ) -> Result<tonic::Response<quickwit_proto::search::FetchDocsResponse>, tonic::Status> {
        set_parent_span_from_request_metadata(request.metadata());
        let fetch_docs_request = request.into_inner();
        let fetch_docs_result = self.0.fetch_docs(fetch_docs_request).await;
        convert_to_grpc_result(fetch_docs_result)
    }

    #[instrument(skip(self, request))]
    async fn root_list_terms(
        &self,
        request: tonic::Request<quickwit_proto::search::ListTermsRequest>,
    ) -> Result<tonic::Response<quickwit_proto::search::ListTermsResponse>, tonic::Status> {
        set_parent_span_from_request_metadata(request.metadata());
        let search_request = request.into_inner();
        let search_result = self.0.root_list_terms(search_request).await;
        convert_to_grpc_result(search_result)
    }

    #[instrument(skip(self, request))]
    async fn leaf_list_terms(
        &self,
        request: tonic::Request<quickwit_proto::search::LeafListTermsRequest>,
    ) -> Result<tonic::Response<quickwit_proto::search::LeafListTermsResponse>, tonic::Status> {
        set_parent_span_from_request_metadata(request.metadata());
        let leaf_search_request = request.into_inner();
        let leaf_search_result = self.0.leaf_list_terms(leaf_search_request).await;
        convert_to_grpc_result(leaf_search_result)
    }

    async fn scroll(
        &self,
        request: tonic::Request<quickwit_proto::search::ScrollRequest>,
    ) -> Result<tonic::Response<quickwit_proto::search::SearchResponse>, tonic::Status> {
        let scroll_request = request.into_inner();
        let scroll_result = self.0.scroll(scroll_request).await;
        convert_to_grpc_result(scroll_result)
    }

    #[instrument(skip(self, request))]
    async fn put_kv(
        &self,
        request: tonic::Request<quickwit_proto::search::PutKvRequest>,
    ) -> Result<tonic::Response<quickwit_proto::search::PutKvResponse>, tonic::Status> {
        set_parent_span_from_request_metadata(request.metadata());
        let put_request = request.into_inner();
        self.0.put_kv(put_request).await;
        Ok(tonic::Response::new(
            quickwit_proto::search::PutKvResponse {},
        ))
    }

    #[instrument(skip(self, request))]
    async fn get_kv(
        &self,
        request: tonic::Request<GetKvRequest>,
    ) -> Result<tonic::Response<GetKvResponse>, tonic::Status> {
        set_parent_span_from_request_metadata(request.metadata());
        let get_search_after_context_request = request.into_inner();
        let payload = self.0.get_kv(get_search_after_context_request).await;
        let get_response = GetKvResponse { payload };
        Ok(tonic::Response::new(get_response))
    }

    #[instrument(skip(self, request))]
    async fn report_splits(
        &self,
        request: tonic::Request<ReportSplitsRequest>,
    ) -> Result<tonic::Response<ReportSplitsResponse>, tonic::Status> {
        set_parent_span_from_request_metadata(request.metadata());
        let get_search_after_context_request = request.into_inner();
        self.0.report_splits(get_search_after_context_request).await;
        Ok(tonic::Response::new(ReportSplitsResponse {}))
    }

    #[instrument(skip(self, request))]
    async fn list_fields(
        &self,
        request: tonic::Request<ListFieldsRequest>,
    ) -> Result<tonic::Response<ListFieldsResponse>, tonic::Status> {
        set_parent_span_from_request_metadata(request.metadata());
        let resp = self.0.root_list_fields(request.into_inner()).await;
        convert_to_grpc_result(resp)
    }
    #[instrument(skip(self, request))]
    async fn leaf_list_fields(
        &self,
        request: tonic::Request<LeafListFieldsRequest>,
    ) -> Result<tonic::Response<ListFieldsResponse>, tonic::Status> {
        set_parent_span_from_request_metadata(request.metadata());
        let resp = self.0.leaf_list_fields(request.into_inner()).await;
        convert_to_grpc_result(resp)
    }

    #[instrument(skip(self, request))]
    async fn search_plan(
        &self,
        request: tonic::Request<quickwit_proto::search::SearchRequest>,
    ) -> Result<tonic::Response<quickwit_proto::search::SearchPlanResponse>, tonic::Status> {
        set_parent_span_from_request_metadata(request.metadata());
        let search_request = request.into_inner();
        let search_result = self.0.search_plan(search_request).await;
        convert_to_grpc_result(search_result)
    }
}


================================================
FILE: quickwit/quickwit-serve/src/search_api/mod.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

mod grpc_adapter;
mod rest_handler;

pub use self::grpc_adapter::GrpcSearchAdapter;
pub use self::rest_handler::{
    SearchApi, SearchRequestQueryString, SortBy, search_get_handler, search_plan_get_handler,
    search_plan_post_handler, search_post_handler, search_request_from_api_request,
};
pub(crate) use self::rest_handler::{extract_index_id_patterns, extract_index_id_patterns_default};


================================================
FILE: quickwit/quickwit-serve/src/search_api/rest_handler.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::convert::TryFrom;
use std::sync::Arc;

use percent_encoding::percent_decode_str;
use quickwit_config::validate_index_id_pattern;
use quickwit_proto::search::{CountHits, SortField, SortOrder};
use quickwit_query::query_ast::query_ast_from_user_text;
use quickwit_search::{SearchError, SearchPlanResponseRest, SearchResponseRest, SearchService};
use serde::{Deserialize, Deserializer, Serialize, Serializer};
use serde_json::Value as JsonValue;
use tracing::info;
use warp::{Filter, Rejection};

use crate::rest_api_response::into_rest_api_response;
use crate::simple_list::{from_simple_list, to_simple_list};
use crate::{BodyFormat, with_arg};

#[derive(utoipa::OpenApi)]
#[openapi(
    paths(
        search_get_handler,
        search_post_handler,
        search_plan_get_handler,
        search_plan_post_handler,
    ),
    components(schemas(
        BodyFormat,
        SearchRequestQueryString,
        SearchResponseRest,
        SearchPlanResponseRest,
        SortBy,
        SortField,
        SortOrder,
    ),)
)]
pub struct SearchApi;

pub(crate) async fn extract_index_id_patterns_default() -> Result<Vec<String>, Rejection> {
    let index_id_patterns = Vec::new();
    Ok(index_id_patterns)
}

pub(crate) async fn extract_index_id_patterns(
    comma_separated_index_id_patterns: String,
) -> Result<Vec<String>, Rejection> {
    let percent_decoded_comma_separated_index_id_patterns =
        percent_decode_str(&comma_separated_index_id_patterns)
            .decode_utf8()
            .map_err(|error| {
                let message = format!(
                    "failed to percent decode comma-separated index ID patterns \
                     `{comma_separated_index_id_patterns}`: {error}"
                );
                crate::rest::InvalidArgument(message)
            })?;
    let mut index_id_patterns = Vec::new();

    for index_id_pattern in percent_decoded_comma_separated_index_id_patterns.split(',') {
        validate_index_id_pattern(index_id_pattern, true)
            .map_err(|error| crate::rest::InvalidArgument(error.to_string()))?;
        index_id_patterns.push(index_id_pattern.to_string());
    }
    assert!(!index_id_patterns.is_empty());
    Ok(index_id_patterns)
}

#[derive(Debug, Default, Eq, PartialEq, Deserialize, utoipa::ToSchema)]
pub struct SortBy {
    /// Fields to sort on.
    pub sort_fields: Vec<SortField>,
}

impl SortBy {
    pub fn is_empty(&self) -> bool {
        self.sort_fields.is_empty()
    }
}

impl From<String> for SortBy {
    fn from(sort_by: String) -> Self {
        let mut sort_fields = Vec::new();

        for field_name in sort_by.split(',') {
            if field_name.is_empty() {
                continue;
            }
            let (field_name, sort_order) = if let Some(tail) = field_name.strip_prefix('+') {
                (tail.trim().to_string(), SortOrder::Desc)
            } else if let Some(tail) = field_name.strip_prefix('-') {
                (tail.trim().to_string(), SortOrder::Asc)
            } else {
                let trimmed_field_name = field_name.trim().to_string();

                (trimmed_field_name, SortOrder::Desc)
            };
            let sort_field = SortField {
                field_name,
                sort_order: sort_order as i32,
                sort_datetime_format: None,
            };
            sort_fields.push(sort_field);
        }
        Self { sort_fields }
    }
}

pub fn sort_by_mini_dsl<'de, D>(deserializer: D) -> Result<SortBy, D::Error>
where D: Deserializer<'de> {
    let sort_by_mini_dsl = String::deserialize(deserializer)?;
    Ok(SortBy::from(sort_by_mini_dsl))
}

impl Serialize for SortBy {
    fn serialize<S>(&self, serializer: S) -> Result<S::Ok, S::Error>
    where S: Serializer {
        let mut sort_by_mini_dsl = String::new();

        for sort_field in &self.sort_fields {
            if sort_field.sort_order() == SortOrder::Desc {
                sort_by_mini_dsl.push('-');
            }
            sort_by_mini_dsl.push_str(&sort_field.field_name);
        }
        serializer.serialize_str(&sort_by_mini_dsl)
    }
}

fn default_max_hits() -> u64 {
    20
}

/// This struct represents the QueryString passed to
/// the rest API.
#[derive(
    Debug, Default, Eq, PartialEq, Serialize, Deserialize, utoipa::IntoParams, utoipa::ToSchema,
)]
#[into_params(parameter_in = Query)]
#[serde(deny_unknown_fields)]
pub struct SearchRequestQueryString {
    /// Query text. The query language is that of tantivy.
    pub query: String,
    #[param(value_type = Object)]
    #[schema(value_type = Object)]
    /// The aggregation JSON string.
    #[serde(skip_serializing_if = "Option::is_none")]
    pub aggs: Option<JsonValue>,
    // Fields to search on
    #[param(rename = "search_field")]
    #[schema(rename = "search_field")]
    #[serde(default)]
    #[serde(rename = "search_field")]
    #[serde(deserialize_with = "from_simple_list")]
    #[serde(skip_serializing_if = "Option::is_none")]
    #[serde(serialize_with = "to_simple_list")]
    pub search_fields: Option<Vec<String>>,
    /// Fields to extract snippets on.
    #[serde(default)]
    #[serde(deserialize_with = "from_simple_list")]
    #[serde(skip_serializing_if = "Option::is_none")]
    #[serde(serialize_with = "to_simple_list")]
    pub snippet_fields: Option<Vec<String>>,
    /// If set, restrict search to documents with a `timestamp >= start_timestamp`.
    /// This timestamp is expressed in seconds.
    #[serde(skip_serializing_if = "Option::is_none")]
    pub start_timestamp: Option<i64>,
    /// If set, restrict search to documents with a `timestamp < end_timestamp``.
    /// This timestamp is expressed in seconds.
    #[serde(skip_serializing_if = "Option::is_none")]
    pub end_timestamp: Option<i64>,
    /// Maximum number of hits to return (by default 20).
    #[serde(default = "default_max_hits")]
    pub max_hits: u64,
    /// First hit to return. Together with num_hits, this parameter
    /// can be used for pagination.
    ///
    /// E.g.
    /// The results with rank [start_offset..start_offset + max_hits) are returned
    #[serde(default)] // Default to 0. (We are 0-indexed)
    pub start_offset: u64,
    /// The output format.
    #[serde(default)]
    pub format: BodyFormat,
    /// Specifies how documents are sorted.
    #[serde(alias = "sort_by_field")]
    #[serde(deserialize_with = "sort_by_mini_dsl")]
    #[serde(default)]
    #[serde(skip_serializing_if = "SortBy::is_empty")]
    #[param(value_type = String)]
    pub sort_by: SortBy,
    #[param(value_type = bool)]
    #[schema(value_type = bool)]
    #[serde(with = "count_hits_from_bool")]
    #[serde(default = "count_hits_from_bool::default")]
    pub count_all: CountHits,
    #[param(value_type = bool)]
    #[schema(value_type = bool)]
    #[serde(default)]
    pub allow_failed_splits: bool,
}

mod count_hits_from_bool {
    use quickwit_proto::search::CountHits;
    use serde::{self, Deserialize, Deserializer, Serializer};

    pub fn serialize<S>(count_hits: &CountHits, serializer: S) -> Result<S::Ok, S::Error>
    where S: Serializer {
        if count_hits == &CountHits::Underestimate {
            serializer.serialize_bool(false)
        } else {
            serializer.serialize_none()
        }
    }

    pub fn deserialize<'de, D>(deserializer: D) -> Result<CountHits, D::Error>
    where D: Deserializer<'de> {
        let count_all = Option::<bool>::deserialize(deserializer)?.unwrap_or(true);
        Ok(if count_all {
            CountHits::CountAll
        } else {
            CountHits::Underestimate
        })
    }

    pub fn default() -> CountHits {
        CountHits::CountAll
    }
}

pub fn search_request_from_api_request(
    index_id_patterns: Vec<String>,
    search_request: SearchRequestQueryString,
) -> Result<quickwit_proto::search::SearchRequest, SearchError> {
    // The query ast below may still contain user input query. The actual
    // parsing of the user query will happen in the root service, and might require
    // the user of the docmapper default fields (which we do not have at this point).
    let query_ast = query_ast_from_user_text(&search_request.query, search_request.search_fields);
    let query_ast_json = serde_json::to_string(&query_ast)?;
    let search_request = quickwit_proto::search::SearchRequest {
        index_id_patterns,
        query_ast: query_ast_json,
        snippet_fields: search_request.snippet_fields.unwrap_or_default(),
        start_timestamp: search_request.start_timestamp,
        end_timestamp: search_request.end_timestamp,
        max_hits: search_request.max_hits,
        start_offset: search_request.start_offset,
        aggregation_request: search_request
            .aggs
            .map(|agg| serde_json::to_string(&agg).expect("could not serialize JsonValue")),
        sort_fields: search_request.sort_by.sort_fields,
        scroll_ttl_secs: None,
        search_after: None,
        count_hits: search_request.count_all.into(),
        ignore_missing_indexes: false,
        skip_aggregation_finalization: false,
    };
    Ok(search_request)
}

async fn search_endpoint(
    index_id_patterns: Vec<String>,
    search_request: SearchRequestQueryString,
    search_service: &dyn SearchService,
) -> Result<SearchResponseRest, SearchError> {
    let allow_failed_splits = search_request.allow_failed_splits;
    let search_request = search_request_from_api_request(index_id_patterns, search_request)?;
    let search_response =
        search_service
            .root_search(search_request)
            .await
            .and_then(|search_response| {
                if (!allow_failed_splits || search_response.num_successful_splits == 0)
                    && let Some(search_error) =
                        SearchError::from_split_errors(&search_response.failed_splits[..])
                {
                    return Err(search_error);
                }
                Ok(search_response)
            })?;
    let search_response_rest = SearchResponseRest::try_from(search_response)?;
    Ok(search_response_rest)
}

fn search_get_filter()
-> impl Filter<Extract = (Vec<String>, SearchRequestQueryString), Error = Rejection> + Clone {
    warp::path!(String / "search")
        .and_then(extract_index_id_patterns)
        .and(warp::get())
        .and(warp::query())
}

fn search_post_filter()
-> impl Filter<Extract = (Vec<String>, SearchRequestQueryString), Error = Rejection> + Clone {
    warp::path!(String / "search")
        .and_then(extract_index_id_patterns)
        .and(warp::post())
        .and(warp::body::content_length_limit(1024 * 1024))
        .and(warp::body::json())
}

fn search_plan_get_filter()
-> impl Filter<Extract = (Vec<String>, SearchRequestQueryString), Error = Rejection> + Clone {
    warp::path!(String / "search-plan")
        .and_then(extract_index_id_patterns)
        .and(warp::get())
        .and(warp::query())
}

fn search_plan_post_filter()
-> impl Filter<Extract = (Vec<String>, SearchRequestQueryString), Error = Rejection> + Clone {
    warp::path!(String / "search-plan")
        .and_then(extract_index_id_patterns)
        .and(warp::post())
        .and(warp::body::content_length_limit(1024 * 1024))
        .and(warp::body::json())
}

async fn search(
    index_id_patterns: Vec<String>,
    search_request: SearchRequestQueryString,
    search_service: Arc<dyn SearchService>,
) -> impl warp::Reply {
    info!(request =? search_request, "search");
    let body_format = search_request.format;
    let result = search_endpoint(index_id_patterns, search_request, &*search_service).await;
    into_rest_api_response(result, body_format)
}

async fn search_plan(
    index_id_patterns: Vec<String>,
    search_request: SearchRequestQueryString,
    search_service: Arc<dyn SearchService>,
) -> impl warp::Reply {
    let body_format = search_request.format;
    let result: Result<SearchPlanResponseRest, SearchError> = async {
        let plan_request = search_request_from_api_request(index_id_patterns, search_request)?;
        let plan_response = search_service.search_plan(plan_request).await?;
        let response = serde_json::from_str(&plan_response.result)?;
        Ok(response)
    }
    .await;
    into_rest_api_response(result, body_format)
}

#[utoipa::path(
    get,
    tag = "Search",
    path = "/{index_id}/search",
    responses(
        (status = 200, description = "Successfully executed search.", body = SearchResponseRest)
    ),
    params(
        SearchRequestQueryString,
        ("index_id" = String, Path, description = "The index ID to search."),
    )
)]
/// Search Index (GET Variant)
///
/// Parses the search request from the request query string.
pub fn search_get_handler(
    search_service: Arc<dyn SearchService>,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    search_get_filter()
        .and(with_arg(search_service))
        .then(search)
}

#[utoipa::path(
    post,
    tag = "Search",
    path = "/{index_id}/search",
    request_body = SearchRequestQueryString,
    responses(
        (status = 200, description = "Successfully executed search.", body = SearchResponseRest)
    ),
    params(
        ("index_id" = String, Path, description = "The index ID to search."),
    )
)]
/// Search Index (POST Variant)
///
/// REST POST search handler.
///
/// Parses the search request from the request body.
pub fn search_post_handler(
    search_service: Arc<dyn SearchService>,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    search_post_filter()
        .and(with_arg(search_service))
        .then(search)
}

#[utoipa::path(
    get,
    tag = "Search",
    path = "/{index_id}/search-plan",
    responses(
        (status = 200, description = "Metadata about how a request would be executed.", body = SearchPlanResponseRest)
    ),
    params(
        SearchRequestQueryString,
        ("index_id" = String, Path, description = "The index ID to search."),
    )
)]
/// Plan Query (GET Variant)
///
/// Parses the search request from the request query string.
pub fn search_plan_get_handler(
    search_service: Arc<dyn SearchService>,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    search_plan_get_filter()
        .and(with_arg(search_service))
        .then(search_plan)
}

#[utoipa::path(
    post,
    tag = "Search",
    path = "/{index_id}/search-plan",
    request_body = SearchRequestQueryString,
    responses(
        (status = 200, description = "Metadata about how a request would be executed.", body = SearchPlanResponseRest)
    ),
    params(
        ("index_id" = String, Path, description = "The index ID to search."),
    )
)]
/// Plan Query (POST Variant)
///
/// Parses the search request from the request body.
pub fn search_plan_post_handler(
    search_service: Arc<dyn SearchService>,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    search_plan_post_filter()
        .and(with_arg(search_service))
        .then(search_plan)
}

#[cfg(test)]
mod tests {
    use assert_json_diff::{assert_json_eq, assert_json_include};
    use mockall::predicate;
    use quickwit_search::{MockSearchService, SearchError};
    use serde_json::{Value as JsonValue, json};

    use super::*;
    use crate::recover_fn;

    fn search_handler(
        mock_search_service: MockSearchService,
    ) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
        let mock_search_service_in_arc = Arc::new(mock_search_service);
        search_get_handler(mock_search_service_in_arc.clone())
            .or(search_post_handler(mock_search_service_in_arc.clone()))
            .or(search_plan_get_handler(mock_search_service_in_arc.clone()))
            .or(search_plan_post_handler(mock_search_service_in_arc.clone()))
            .recover(recover_fn)
    }

    #[tokio::test]
    async fn test_extract_index_id_patterns() {
        extract_index_id_patterns("my-index".to_string())
            .await
            .unwrap();
        assert_eq!(
            extract_index_id_patterns("my-index-1,my-index-2%2A".to_string())
                .await
                .unwrap(),
            vec!["my-index-1".to_string(), "my-index-2*".to_string()]
        );
        assert_eq!(
            extract_index_id_patterns("my-index-1%2Cmy-index-%2A".to_string())
                .await
                .unwrap(),
            vec!["my-index-1".to_string(), "my-index-*".to_string()]
        );
        extract_index_id_patterns("".to_string()).await.unwrap_err();
        extract_index_id_patterns(" ".to_string())
            .await
            .unwrap_err();
    }

    #[test]
    fn test_serialize_search_response() -> anyhow::Result<()> {
        let search_response = SearchResponseRest {
            num_hits: 55,
            hits: Vec::new(),
            snippets: None,
            elapsed_time_micros: 0u64,
            errors: Vec::new(),
            aggregations: None,
        };
        let search_response_json: JsonValue = serde_json::to_value(search_response)?;
        let expected_search_response_json: JsonValue = json!({
            "num_hits": 55,
            "hits": [],
            "elapsed_time_micros": 0,
        });
        assert_json_include!(
            actual: search_response_json,
            expected: expected_search_response_json
        );
        Ok(())
    }

    #[tokio::test]
    async fn test_rest_search_api_route_post() {
        let rest_search_api_filter = search_post_filter();
        let (indexes, req) = warp::test::request()
            .method("POST")
            .path("/quickwit-demo-index/search")
            .json(&true)
            .body(r#"{"query": "*", "max_hits":10, "aggs": {"range":[]} }"#)
            .filter(&rest_search_api_filter)
            .await
            .unwrap();
        assert_eq!(indexes, vec!["quickwit-demo-index".to_string()]);
        assert_eq!(
            &req,
            &super::SearchRequestQueryString {
                query: "*".to_string(),
                search_fields: None,
                start_timestamp: None,
                max_hits: 10,
                format: BodyFormat::default(),
                sort_by: SortBy::default(),
                aggs: Some(json!({"range":[]})),
                count_all: CountHits::CountAll,
                ..Default::default()
            }
        );
    }

    #[tokio::test]
    async fn test_rest_search_api_route_post_multi_indexes() {
        let rest_search_api_filter = search_post_filter();
        let (indexes, req) = warp::test::request()
            .method("POST")
            .path("/quickwit-demo-index,quickwit-demo,quickwit-demo-index-*/search")
            .json(&true)
            .body(r#"{"query": "*", "max_hits":10, "aggs": {"range":[]} }"#)
            .filter(&rest_search_api_filter)
            .await
            .unwrap();
        assert_eq!(
            indexes,
            vec![
                "quickwit-demo-index".to_string(),
                "quickwit-demo".to_string(),
                "quickwit-demo-index-*".to_string()
            ]
        );
        assert_eq!(
            &req,
            &super::SearchRequestQueryString {
                query: "*".to_string(),
                search_fields: None,
                start_timestamp: None,
                max_hits: 10,
                format: BodyFormat::default(),
                sort_by: SortBy::default(),
                aggs: Some(json!({"range":[]})),
                ..Default::default()
            }
        );
    }

    #[tokio::test]
    async fn test_rest_search_api_route_post_multi_indexes_bad_pattern() {
        let rest_search_api_filter = search_post_filter();
        let bad_pattern_rejection = warp::test::request()
            .method("POST")
            .path("/quickwit-demo-index**/search")
            .json(&true)
            .body(r#"{"query": "*", "max_hits":10, "aggs": {"range":[]} }"#)
            .filter(&rest_search_api_filter)
            .await
            .unwrap_err();
        let rejection = bad_pattern_rejection
            .find::<crate::rest::InvalidArgument>()
            .unwrap();
        assert_eq!(
            rejection.0,
            "index ID pattern `quickwit-demo-index**` is invalid: patterns must not contain \
             multiple consecutive `*`"
        );
    }

    #[tokio::test]
    async fn test_rest_search_api_route_simple() {
        let rest_search_api_filter = search_get_filter();
        let (indexes, req) = warp::test::request()
            .path(
                "/quickwit-demo-index/search?query=*&end_timestamp=1450720000&max_hits=10&\
                 start_offset=22",
            )
            .filter(&rest_search_api_filter)
            .await
            .unwrap();
        assert_eq!(indexes, vec!["quickwit-demo-index".to_string()]);
        assert_eq!(
            &req,
            &super::SearchRequestQueryString {
                query: "*".to_string(),
                search_fields: None,
                start_timestamp: None,
                end_timestamp: Some(1450720000),
                max_hits: 10,
                start_offset: 22,
                format: BodyFormat::default(),
                sort_by: SortBy::default(),
                ..Default::default()
            }
        );
    }

    #[tokio::test]
    async fn test_rest_search_api_route_count_all() {
        let rest_search_api_filter = search_get_filter();
        let (indexes, req) = warp::test::request()
            .path("/quickwit-demo-index/search?query=*&count_all=true")
            .filter(&rest_search_api_filter)
            .await
            .unwrap();
        assert_eq!(indexes, vec!["quickwit-demo-index".to_string()]);
        assert_eq!(
            &req,
            &super::SearchRequestQueryString {
                query: "*".to_string(),
                format: BodyFormat::default(),
                sort_by: SortBy::default(),
                max_hits: 20,
                count_all: CountHits::CountAll,
                ..Default::default()
            }
        );
        let rest_search_api_filter = search_get_filter();
        let (indexes, req) = warp::test::request()
            .path("/quickwit-demo-index/search?query=*&count_all=false")
            .filter(&rest_search_api_filter)
            .await
            .unwrap();
        assert_eq!(indexes, vec!["quickwit-demo-index".to_string()]);
        assert_eq!(
            &req,
            &super::SearchRequestQueryString {
                query: "*".to_string(),
                format: BodyFormat::default(),
                sort_by: SortBy::default(),
                max_hits: 20,
                count_all: CountHits::Underestimate,
                ..Default::default()
            }
        );
    }

    #[tokio::test]
    async fn test_rest_search_api_route_simple_default_num_hits_default_offset() {
        let rest_search_api_filter = search_get_filter();
        let (indexes, req) = warp::test::request()
            .path(
                "/quickwit-demo-index/search?query=*&end_timestamp=1450720000&search_field=title,\
                 body",
            )
            .filter(&rest_search_api_filter)
            .await
            .unwrap();
        assert_eq!(indexes, vec!["quickwit-demo-index".to_string()]);
        assert_eq!(
            &req,
            &super::SearchRequestQueryString {
                query: "*".to_string(),
                search_fields: Some(vec!["title".to_string(), "body".to_string()]),
                start_timestamp: None,
                end_timestamp: Some(1450720000),
                max_hits: 20,
                start_offset: 0,
                format: BodyFormat::default(),
                sort_by: SortBy::default(),
                ..Default::default()
            }
        );
    }

    #[tokio::test]
    async fn test_rest_search_api_route_simple_format() {
        let rest_search_api_filter = search_get_filter();
        let (indexes, req) = warp::test::request()
            .path("/quickwit-demo-index/search?query=*&format=json")
            .filter(&rest_search_api_filter)
            .await
            .unwrap();
        assert_eq!(indexes, vec!["quickwit-demo-index".to_string()]);
        assert_eq!(
            &req,
            &super::SearchRequestQueryString {
                query: "*".to_string(),
                start_timestamp: None,
                end_timestamp: None,
                max_hits: 20,
                start_offset: 0,
                format: BodyFormat::Json,
                search_fields: None,
                sort_by: SortBy::default(),
                ..Default::default()
            }
        );
    }

    #[tokio::test]
    async fn test_rest_search_api_route_sort_by() {
        for (sort_by_query_param, expected_sort_fields) in [
            ("", Vec::new()),
            (",", Vec::new()),
            (
                "field1",
                vec![SortField {
                    field_name: "field1".to_string(),
                    sort_order: SortOrder::Desc as i32,
                    sort_datetime_format: None,
                }],
            ),
            (
                "+field1",
                vec![SortField {
                    field_name: "field1".to_string(),
                    sort_order: SortOrder::Desc as i32,
                    sort_datetime_format: None,
                }],
            ),
            (
                "-field1",
                vec![SortField {
                    field_name: "field1".to_string(),
                    sort_order: SortOrder::Asc as i32,
                    sort_datetime_format: None,
                }],
            ),
            (
                "_score",
                vec![SortField {
                    field_name: "_score".to_string(),
                    sort_order: SortOrder::Desc as i32,
                    sort_datetime_format: None,
                }],
            ),
            (
                "-_score",
                vec![SortField {
                    field_name: "_score".to_string(),
                    sort_order: SortOrder::Asc as i32,
                    sort_datetime_format: None,
                }],
            ),
            (
                "+_score",
                vec![SortField {
                    field_name: "_score".to_string(),
                    sort_order: SortOrder::Desc as i32,
                    sort_datetime_format: None,
                }],
            ),
            (
                "field1,field2",
                vec![
                    SortField {
                        field_name: "field1".to_string(),
                        sort_order: SortOrder::Desc as i32,
                        sort_datetime_format: None,
                    },
                    SortField {
                        field_name: "field2".to_string(),
                        sort_order: SortOrder::Desc as i32,
                        sort_datetime_format: None,
                    },
                ],
            ),
            (
                "+field1,-field2",
                vec![
                    SortField {
                        field_name: "field1".to_string(),
                        sort_order: SortOrder::Desc as i32,
                        sort_datetime_format: None,
                    },
                    SortField {
                        field_name: "field2".to_string(),
                        sort_order: SortOrder::Asc as i32,
                        sort_datetime_format: None,
                    },
                ],
            ),
            (
                "-field1,+field2",
                vec![
                    SortField {
                        field_name: "field1".to_string(),
                        sort_order: SortOrder::Asc as i32,
                        sort_datetime_format: None,
                    },
                    SortField {
                        field_name: "field2".to_string(),
                        sort_order: SortOrder::Desc as i32,
                        sort_datetime_format: None,
                    },
                ],
            ),
        ] {
            let path = format!(
                "/quickwit-demo-index/search?query=*&format=json&sort_by={sort_by_query_param}"
            );
            let rest_search_api_filter = search_get_filter();
            let (_, req) = warp::test::request()
                .path(&path)
                .filter(&rest_search_api_filter)
                .await
                .unwrap();

            assert_eq!(
                &req.sort_by.sort_fields, &expected_sort_fields,
                "Expected sort fields `{:?}` for query param `{sort_by_query_param}`, got: {:?}",
                expected_sort_fields, req.sort_by.sort_fields
            );
        }

        let rest_search_api_filter = search_get_filter();
        let (_, req) = warp::test::request()
            .path("/quickwit-demo-index/search?query=*&format=json&sort_by_field=fiel1")
            .filter(&rest_search_api_filter)
            .await
            .unwrap();

        assert_eq!(
            &req.sort_by.sort_fields,
            &[SortField {
                field_name: "fiel1".to_string(),
                sort_order: SortOrder::Desc as i32,
                sort_datetime_format: None,
            }],
        );
    }

    #[tokio::test]
    async fn test_rest_search_api_route_invalid_key() {
        let resp = warp::test::request()
            .path("/quickwit-demo-index/search?query=*&end_unix_timestamp=1450720000")
            .reply(&search_handler(MockSearchService::new()))
            .await;
        assert_eq!(resp.status(), 400);
        let resp_json: JsonValue = serde_json::from_slice(resp.body()).unwrap();
        assert!(
            resp_json
                .get("message")
                .unwrap()
                .as_str()
                .unwrap()
                .contains("Invalid query string")
        );
    }

    #[tokio::test]
    async fn test_rest_search_api_route_post_with_invalid_payload() -> anyhow::Result<()> {
        let resp = warp::test::request()
            .method("POST")
            .path("/quickwit-demo-index/search")
            .json(&true)
            .body(r#"{"query": "*", "bad_param":10, "aggs": {"range":[]} }"#)
            .reply(&search_handler(MockSearchService::new()))
            .await;
        assert_eq!(resp.status(), 400);
        let content = String::from_utf8_lossy(resp.body());
        assert!(content.contains("Request body deserialize error: unknown field `bad_param`"));
        Ok(())
    }

    #[tokio::test]
    async fn test_rest_search_api_route_serialize_with_results() -> anyhow::Result<()> {
        let mut mock_search_service = MockSearchService::new();
        mock_search_service.expect_root_search().returning(|_| {
            Ok(quickwit_proto::search::SearchResponse {
                hits: Vec::new(),
                num_hits: 10,
                elapsed_time_micros: 16,
                errors: Vec::new(),
                ..Default::default()
            })
        });
        let rest_search_api_handler = search_handler(mock_search_service);
        let resp = warp::test::request()
            .path("/quickwit-demo-index/search?query=*")
            .reply(&rest_search_api_handler)
            .await;
        assert_eq!(resp.status(), 200);
        let resp_json: JsonValue = serde_json::from_slice(resp.body())?;
        let expected_response_json = serde_json::json!({
            "num_hits": 10,
            "hits": [],
            "elapsed_time_micros": 16,
        });
        assert_json_include!(actual: resp_json, expected: expected_response_json);
        Ok(())
    }

    #[tokio::test]
    async fn test_rest_search_api_start_offset_and_num_hits_parameter() -> anyhow::Result<()> {
        let mut mock_search_service = MockSearchService::new();
        mock_search_service
            .expect_root_search()
            .with(predicate::function(
                |search_request: &quickwit_proto::search::SearchRequest| {
                    search_request.start_offset == 5 && search_request.max_hits == 30
                },
            ))
            .returning(|_| Ok(Default::default()));
        let rest_search_api_handler = search_handler(mock_search_service);
        assert_eq!(
            warp::test::request()
                .path("/quickwit-demo-index/search?query=*&start_offset=5&max_hits=30")
                .reply(&rest_search_api_handler)
                .await
                .status(),
            200
        );
        Ok(())
    }

    #[tokio::test]
    async fn test_rest_search_api_with_index_does_not_exist() -> anyhow::Result<()> {
        let mut mock_search_service = MockSearchService::new();
        mock_search_service.expect_root_search().returning(|_| {
            Err(SearchError::IndexesNotFound {
                index_ids: vec!["not-found-index".to_string()],
            })
        });
        let rest_search_api_handler = search_handler(mock_search_service);
        assert_eq!(
            warp::test::request()
                .path("/index-does-not-exist/search?query=myfield:test")
                .reply(&rest_search_api_handler)
                .await
                .status(),
            404
        );
        Ok(())
    }

    #[tokio::test]
    async fn test_rest_search_api_with_wrong_fieldname() -> anyhow::Result<()> {
        let mut mock_search_service = MockSearchService::new();
        mock_search_service
            .expect_root_search()
            .returning(|_| Err(SearchError::Internal("ty".to_string())));
        let rest_search_api_handler = search_handler(mock_search_service);
        assert_eq!(
            warp::test::request()
                .path("/index-does-not-exist/search?query=myfield:test")
                .reply(&rest_search_api_handler)
                .await
                .status(),
            500
        );
        Ok(())
    }

    #[tokio::test]
    async fn test_rest_search_api_with_invalid_query() -> anyhow::Result<()> {
        let mut mock_search_service = MockSearchService::new();
        mock_search_service
            .expect_root_search()
            .returning(|_| Err(SearchError::InvalidQuery("invalid query".to_string())));
        let rest_search_api_handler = search_handler(mock_search_service);
        let response = warp::test::request()
            .path("/my-index/search?query=myfield:test")
            .reply(&rest_search_api_handler)
            .await;
        assert_eq!(response.status(), 400);
        let body = String::from_utf8_lossy(response.body());
        assert!(body.contains("invalid query"));
        Ok(())
    }

    #[tokio::test]
    async fn test_rest_search_api_route_serialize_results_with_snippet() -> anyhow::Result<()> {
        let mut mock_search_service = MockSearchService::new();
        mock_search_service.expect_root_search().returning(|_| {
            Ok(quickwit_proto::search::SearchResponse {
                hits: vec![quickwit_proto::search::Hit {
                    json: r#"{"title": "foo", "body": "foo bar baz"}"#.to_string(),
                    partial_hit: None,
                    snippet: Some(r#"{"title": [], "body": ["foo <em>bar</em> baz"]}"#.to_string()),
                    index_id: "quickwit-demo-index".to_string(),
                }],
                num_hits: 1,
                elapsed_time_micros: 16,
                errors: Vec::new(),
                ..Default::default()
            })
        });
        let rest_search_api_handler = search_handler(mock_search_service);
        let resp = warp::test::request()
            .path(
                "/quickwit-demo-index/search?query=bar&search_field=title,body&\
                 snippet_fields=title,body",
            )
            .reply(&rest_search_api_handler)
            .await;

        assert_eq!(resp.status(), 200);
        let resp_json: JsonValue = serde_json::from_slice(resp.body())?;
        let expected_response_json = serde_json::json!({
            "num_hits": 1,
            "hits": [{"title": "foo", "body": "foo bar baz"}],
            "snippets": [{"title": [], "body": ["foo <em>bar</em> baz"]}],
            "elapsed_time_micros": 16,
            "errors": [],
        });
        assert_json_eq!(resp_json, expected_response_json);
        Ok(())
    }

    #[tokio::test]
    async fn test_rest_search_api_multi_indexes() {
        {
            let mut mock_search_service = MockSearchService::new();
            mock_search_service
                .expect_root_search()
                .with(predicate::function(
                    |search_request: &quickwit_proto::search::SearchRequest| {
                        search_request.index_id_patterns
                            == vec!["quickwit-demo-*".to_string(), "quickwit-demo2".to_string()]
                    },
                ))
                .returning(|_| Ok(Default::default()));
            let rest_search_api_handler = search_handler(mock_search_service);
            assert_eq!(
                warp::test::request()
                    .path("/quickwit-demo-*,quickwit-demo2/search?query=*")
                    .reply(&rest_search_api_handler)
                    .await
                    .status(),
                200
            );
            assert_eq!(
                warp::test::request()
                    .path("/quickwit-demo-*%2Cquickwit-demo2/search?query=*")
                    .reply(&rest_search_api_handler)
                    .await
                    .status(),
                200
            );
        }
        {
            let mut mock_search_service = MockSearchService::new();
            mock_search_service
                .expect_root_search()
                .returning(|_| Ok(Default::default()));
            let rest_search_api_handler = search_handler(mock_search_service);
            assert_eq!(
                warp::test::request()
                    .path("/*/search?query=*")
                    .reply(&rest_search_api_handler)
                    .await
                    .status(),
                200
            );
            let response = warp::test::request()
                .path("/abc!/search?query=*")
                .reply(&rest_search_api_handler)
                .await;
            assert_eq!(response.status(), 400);
        }
    }
}


================================================
FILE: quickwit/quickwit-serve/src/simple_list.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::str::FromStr;

use serde::{Deserialize, Deserializer, Serializer};

/// Serializes an `Option<&[Serialize]>` with
/// `Some(value)` to a comma separated string of values.
/// Used to serialize values within the query string
pub fn to_simple_list<S, T>(
    value: &Option<Vec<T>>,
    serializer: S,
) -> Result<<S as Serializer>::Ok, <S as Serializer>::Error>
where
    S: Serializer,
    T: ToString,
{
    let vec = &value
        .as_ref()
        .expect("attempt to serialize Option::None value");

    let serialized_str = vec
        .iter()
        .map(|value| value.to_string())
        .collect::<Vec<_>>() // do not collect here
        .join(",");

    serializer.serialize_str(&serialized_str)
}

/// Deserializes a comma separated string of values
/// into a [`Vec<T>`].
/// Used to deserialize list of values from the query string.
pub fn from_simple_list<'de, D, T>(deserializer: D) -> Result<Option<Vec<T>>, D::Error>
where
    D: Deserializer<'de>,
    T: FromStr,
    <T as FromStr>::Err: ToString,
{
    let str_sequence = String::deserialize(deserializer)?;
    let list = str_sequence
        .trim_matches(',')
        .split(',')
        .map(|item| T::from_str(item))
        .collect::<Result<Vec<_>, _>>()
        .map_err(|err| serde::de::Error::custom(err.to_string()))?;
    Ok(Some(list))
}


================================================
FILE: quickwit/quickwit-serve/src/tcp_listener.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::net::SocketAddr;

use quickwit_proto::tonic;
use tokio::net::TcpListener;
use tonic::async_trait;

/// Resolve `SocketAddr` into `TcpListener` instances.
///
/// This trait can be used to inject existing [`TcpListener`] instances to the
/// Quickwit REST and gRPC servers when running them in tests.
#[async_trait]
pub trait TcpListenerResolver: Clone + Send + 'static {
    async fn resolve(&self, addr: SocketAddr) -> anyhow::Result<TcpListener>;
}

#[derive(Clone)]
pub struct DefaultTcpListenerResolver;

#[async_trait]
impl TcpListenerResolver for DefaultTcpListenerResolver {
    async fn resolve(&self, addr: SocketAddr) -> anyhow::Result<TcpListener> {
        TcpListener::bind(addr)
            .await
            .map_err(|err| anyhow::anyhow!(err))
    }
}

#[cfg(any(test, feature = "testsuite"))]
pub mod for_tests {
    use std::collections::HashMap;
    use std::sync::Arc;

    use anyhow::Context;
    use tokio::sync::Mutex;

    use super::*;

    #[derive(Clone, Default)]
    pub struct TestTcpListenerResolver {
        listeners: Arc<Mutex<HashMap<SocketAddr, TcpListener>>>,
    }

    #[async_trait]
    impl TcpListenerResolver for TestTcpListenerResolver {
        async fn resolve(&self, addr: SocketAddr) -> anyhow::Result<TcpListener> {
            self.listeners
                .lock()
                .await
                .remove(&addr)
                .context(format!("No listener found for address {addr}"))
        }
    }

    impl TestTcpListenerResolver {
        pub async fn add_listener(&self, listener: TcpListener) {
            self.listeners
                .lock()
                .await
                .insert(listener.local_addr().unwrap(), listener);
        }
    }
}


================================================
FILE: quickwit/quickwit-serve/src/template_api/mod.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

mod rest_handler;

pub(crate) use rest_handler::{IndexTemplateApi, index_template_api_handlers};


================================================
FILE: quickwit/quickwit-serve/src/template_api/rest_handler.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::any::type_name;

use bytes::Bytes;
use quickwit_config::{ConfigFormat, IndexTemplate, IndexTemplateId, VersionedIndexTemplate};
use quickwit_proto::metastore::{
    CreateIndexTemplateRequest, DeleteIndexTemplatesRequest, GetIndexTemplateRequest,
    ListIndexTemplatesRequest, MetastoreError, MetastoreResult, MetastoreService,
    MetastoreServiceClient, serde_utils,
};
use serde_json::Value as JsonValue;
use warp::reject::Rejection;
use warp::{Filter, Reply};

use crate::format::{extract_config_format, extract_format_from_qs};
use crate::rest::recover_fn;
use crate::rest_api_response::into_rest_api_response;
use crate::with_arg;

#[derive(utoipa::OpenApi)]
#[openapi(
    paths(
        create_index_template,
        get_index_template,
        update_index_template,
        delete_index_template,
        list_index_templates,
    ),
    components(schemas(VersionedIndexTemplate))
)]
pub(crate) struct IndexTemplateApi;

pub(crate) fn index_template_api_handlers(
    metastore: MetastoreServiceClient,
) -> impl Filter<Extract = (impl Reply,), Error = Rejection> + Clone {
    create_index_template_handler(metastore.clone())
        .or(get_index_template_handler(metastore.clone()))
        .or(update_index_template_handler(metastore.clone()))
        .or(delete_index_template_handler(metastore.clone()))
        .or(list_index_templates_handler(metastore.clone()))
        .recover(recover_fn)
        .boxed()
}

fn create_index_template_handler(
    metastore: MetastoreServiceClient,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    warp::path!("templates")
        .and(warp::post())
        .and(warp::filters::body::bytes())
        .and(extract_config_format())
        .and(with_arg(metastore))
        .then(create_index_template)
        .and(extract_format_from_qs())
        .map(into_rest_api_response)
}

#[utoipa::path(
    post,
    tag = "Templates",
    path = "/templates",
    request_body = VersionedIndexTemplate,
    responses(
        (status = 200, description = "The index template was successfully created.", body = VersionedIndexTemplate)
    ),
)]
/// Creates a new index template.
async fn create_index_template(
    body: Bytes,
    config_format: ConfigFormat,
    metastore: MetastoreServiceClient,
) -> MetastoreResult<IndexTemplate> {
    let index_template: IndexTemplate =
        config_format
            .parse(&body)
            .map_err(|error| MetastoreError::JsonDeserializeError {
                struct_name: type_name::<IndexTemplate>().to_string(),
                message: error.to_string(),
            })?;
    index_template.validate().map_err(|error| {
        let message = format!("invalid index template: {error}");
        MetastoreError::InvalidArgument { message }
    })?;
    let index_template_json = serde_utils::to_json_str(&index_template)?;
    let create_index_template = CreateIndexTemplateRequest {
        index_template_json,
        overwrite: false,
    };
    metastore
        .create_index_template(create_index_template)
        .await?;
    Ok(index_template)
}

fn get_index_template_handler(
    metastore: MetastoreServiceClient,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    warp::path!("templates" / String)
        .and(warp::get())
        .and(with_arg(metastore))
        .then(get_index_template)
        .and(extract_format_from_qs())
        .map(into_rest_api_response)
}

#[utoipa::path(
    get,
    tag = "Templates",
    path = "/templates/{template_id}",
    responses(
        (status = 200, description = "The index template was successfully retrieved.", body = VersionedIndexTemplate),
        (status = 404, description = "The index template was not found.")
    ),
)]
/// Retrieves the index template identified by `template_id`.
async fn get_index_template(
    template_id: IndexTemplateId,
    metastore: MetastoreServiceClient,
) -> MetastoreResult<IndexTemplate> {
    let get_index_template_request = GetIndexTemplateRequest { template_id };
    let get_index_template_response = metastore
        .get_index_template(get_index_template_request)
        .await?;
    let index_template: IndexTemplate =
        serde_utils::from_json_str(&get_index_template_response.index_template_json)?;
    Ok(index_template)
}

fn update_index_template_handler(
    metastore: MetastoreServiceClient,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    warp::path!("templates" / String)
        .and(warp::put())
        .and(warp::filters::body::bytes())
        .and(extract_config_format())
        .and(with_arg(metastore))
        .then(update_index_template)
        .and(extract_format_from_qs())
        .map(into_rest_api_response)
}

#[utoipa::path(
    put,
    tag = "Templates",
    path = "/templates/{template_id}",
    request_body = VersionedIndexTemplate,
    responses(
        (status = 200, description = "The index template was successfully retrieved.", body = VersionedIndexTemplate),
        (status = 404, description = "The index template was not found.")
    ),
)]
/// Updates the index template identified by `template_id`.
async fn update_index_template(
    template_id: IndexTemplateId,
    body: Bytes,
    config_format: ConfigFormat,
    metastore: MetastoreServiceClient,
) -> MetastoreResult<IndexTemplate> {
    let mut json_value: JsonValue =
        config_format
            .parse(&body)
            .map_err(|error| MetastoreError::JsonDeserializeError {
                struct_name: type_name::<IndexTemplate>().to_string(),
                message: error.to_string(),
            })?;
    json_value["template_id"] = JsonValue::String(template_id);

    if let Some(JsonValue::Number(number)) = json_value.get("version") {
        json_value["version"] = JsonValue::String(number.to_string());
    }
    let index_template: IndexTemplate = serde_utils::from_json_value(json_value)?;
    index_template.validate().map_err(|error| {
        let message = format!("invalid index template: {error}");
        MetastoreError::InvalidArgument { message }
    })?;
    let index_template_json = serde_utils::to_json_str(&index_template)?;
    let create_index_template = CreateIndexTemplateRequest {
        index_template_json,
        overwrite: true,
    };
    metastore
        .create_index_template(create_index_template)
        .await?;
    Ok(index_template)
}

fn delete_index_template_handler(
    metastore: MetastoreServiceClient,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    warp::path!("templates" / String)
        .and(warp::delete())
        .and(with_arg(metastore))
        .then(delete_index_template)
        .and(extract_format_from_qs())
        .map(into_rest_api_response)
}

#[utoipa::path(
    delete,
    tag = "Templates",
    path = "/templates/{template_id}",
    responses(
        (status = 200, description = "The index template was successfully deleted."),
        (status = 404, description = "The index template was not found.")
    ),
)]
/// Deletes the index template identified by the provided `template_id`.
async fn delete_index_template(
    template_id: IndexTemplateId,
    metastore: MetastoreServiceClient,
) -> MetastoreResult<()> {
    let template_ids = vec![template_id];
    let delete_index_templates_request = DeleteIndexTemplatesRequest { template_ids };
    metastore
        .delete_index_templates(delete_index_templates_request)
        .await?;
    Ok(())
}

fn list_index_templates_handler(
    metastore: MetastoreServiceClient,
) -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    warp::path!("templates")
        .and(warp::get())
        .and(with_arg(metastore))
        .then(list_index_templates)
        .and(extract_format_from_qs())
        .map(into_rest_api_response)
}

#[utoipa::path(
    get,
    tag = "Templates",
    path = "/templates",
    responses(
        (status = 200, description = "The index template was successfully retrieved.", body = [VersionedIndexTemplate]),
    ),
)]
/// Retrieves all the index templates stored in the metastore.
async fn list_index_templates(
    metastore: MetastoreServiceClient,
) -> MetastoreResult<Vec<IndexTemplate>> {
    let list_index_templates_request = ListIndexTemplatesRequest {};
    let list_index_templates_response = metastore
        .list_index_templates(list_index_templates_request)
        .await?;
    let index_templates: Vec<IndexTemplate> = list_index_templates_response
        .index_templates_json
        .into_iter()
        .map(|index_template_json| {
            serde_utils::from_json_str::<IndexTemplate>(&index_template_json)
        })
        .collect::<MetastoreResult<_>>()?;
    Ok(index_templates)
}

#[cfg(test)]
mod tests {
    use quickwit_proto::metastore::{
        EmptyResponse, EntityKind, GetIndexTemplateResponse, ListIndexTemplatesResponse,
        MockMetastoreService,
    };
    use serde_json::json;

    use super::*;

    #[tokio::test]
    async fn test_create_index_template() {
        let mut mock_metastore = MockMetastoreService::new();
        mock_metastore
            .expect_create_index_template()
            .return_once(|request| {
                assert!(!request.overwrite);

                let index_template: IndexTemplate =
                    serde_json::from_str(&request.index_template_json).unwrap();

                assert_eq!(index_template.template_id, "test-template-foo");
                assert_eq!(index_template.index_id_patterns, ["test-index-foo*"]);

                Ok(EmptyResponse {})
            });
        let metastore = MetastoreServiceClient::from_mock(mock_metastore);
        let create_index_template_handler = create_index_template_handler(metastore);
        let response = warp::test::request()
            .path("/templates")
            .method("POST")
            .json(&json!({
                "version": "0.7",
                "template_id": "test-template-foo",
                "index_id_patterns": ["test-index-foo*"],
                "doc_mapping": {},
            }))
            .reply(&create_index_template_handler)
            .await;
        assert_eq!(response.status(), 200);
    }

    #[tokio::test]
    async fn test_get_index_template() {
        let mut mock_metastore = MockMetastoreService::new();
        mock_metastore
            .expect_get_index_template()
            .withf(|request| request.template_id == "test-template-foo")
            .return_once(|request| {
                assert_eq!(request.template_id, "test-template-foo");

                let error = MetastoreError::NotFound(EntityKind::IndexTemplate {
                    template_id: request.template_id,
                });
                Err(error)
            });
        mock_metastore
            .expect_get_index_template()
            .withf(|request| request.template_id == "test-template-bar")
            .return_once(|request| {
                assert_eq!(request.template_id, "test-template-bar");

                let index_template =
                    IndexTemplate::for_test("test-template-bar", &["test-index-bar*"], 100);
                let index_template_json = serde_utils::to_json_str(&index_template).unwrap();
                let response = GetIndexTemplateResponse {
                    index_template_json,
                };
                Ok(response)
            });
        let metastore = MetastoreServiceClient::from_mock(mock_metastore);
        let get_index_template_handler = get_index_template_handler(metastore);

        let response = warp::test::request()
            .path("/templates/test-template-foo")
            .reply(&get_index_template_handler)
            .await;
        assert_eq!(response.status(), 404);

        let response = warp::test::request()
            .path("/templates/test-template-bar")
            .reply(&get_index_template_handler)
            .await;
        assert_eq!(response.status(), 200);

        let index_template: IndexTemplate = serde_json::from_slice(response.body()).unwrap();
        assert_eq!(index_template.template_id, "test-template-bar");
        assert_eq!(index_template.index_id_patterns, ["test-index-bar*"]);
        assert_eq!(index_template.priority, 100);
    }

    #[tokio::test]
    async fn test_update_index_template() {
        let mut mock_metastore = MockMetastoreService::new();
        mock_metastore
            .expect_create_index_template()
            .return_once(|request| {
                assert!(request.overwrite);

                let index_template: IndexTemplate =
                    serde_json::from_str(&request.index_template_json).unwrap();

                assert_eq!(index_template.template_id, "test-template-foo");
                assert_eq!(index_template.index_id_patterns, ["test-index-foo*"]);

                Ok(EmptyResponse {})
            });
        let metastore = MetastoreServiceClient::from_mock(mock_metastore);
        let update_index_template_handler = update_index_template_handler(metastore);
        let response = warp::test::request()
            .path("/templates/test-template-foo")
            .method("PUT")
            .json(&json!({
                "version": "0.7",
                "template_id": "test-template-bar", // This `template_id` should be ignored and overridden by the path parameter.
                "index_id_patterns": ["test-index-foo*"],
                "doc_mapping": {},
            }))
            .reply(&update_index_template_handler)
            .await;
        assert_eq!(response.status(), 200);
    }

    #[tokio::test]
    async fn test_delete_index_template() {
        let mut mock_metastore = MockMetastoreService::new();
        mock_metastore
            .expect_delete_index_templates()
            .return_once(|request| {
                assert_eq!(request.template_ids, ["test-template-foo"]);
                Ok(EmptyResponse {})
            });
        let metastore = MetastoreServiceClient::from_mock(mock_metastore);
        let delete_index_template_handler = delete_index_template_handler(metastore);
        let response = warp::test::request()
            .path("/templates/test-template-foo")
            .method("DELETE")
            .reply(&delete_index_template_handler)
            .await;
        assert_eq!(response.status(), 200);
    }

    #[tokio::test]
    async fn test_list_index_templates() {
        let mut mock_metastore = MockMetastoreService::new();
        mock_metastore
            .expect_list_index_templates()
            .return_once(|_request| {
                let index_template_foo =
                    IndexTemplate::for_test("test-template-foo", &["test-index-foo*"], 100);
                let index_template_foo_json = serde_json::to_string(&index_template_foo).unwrap();

                let index_template_bar =
                    IndexTemplate::for_test("test-template-bar", &["test-index-bar*"], 200);
                let index_template_bar_json = serde_json::to_string(&index_template_bar).unwrap();

                let response = ListIndexTemplatesResponse {
                    index_templates_json: vec![index_template_foo_json, index_template_bar_json],
                };
                Ok(response)
            });
        let metastore = MetastoreServiceClient::from_mock(mock_metastore);
        let list_index_templates_handler = list_index_templates_handler(metastore);
        let response = warp::test::request()
            .path("/templates")
            .method("GET")
            .reply(&list_index_templates_handler)
            .await;
        assert_eq!(response.status(), 200);

        let mut index_templates: Vec<IndexTemplate> =
            serde_json::from_slice(response.body()).unwrap();
        index_templates.sort_unstable_by(|left, right| left.template_id.cmp(&right.template_id));

        assert_eq!(index_templates.len(), 2);
        assert_eq!(index_templates[0].template_id, "test-template-bar");
        assert_eq!(index_templates[1].template_id, "test-template-foo");
    }
}


================================================
FILE: quickwit/quickwit-serve/src/ui_handler.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use once_cell::sync::Lazy;
use quickwit_telemetry::payload::TelemetryEvent;
use regex::Regex;
use rust_embed::RustEmbed;
use warp::hyper::header::HeaderValue;
use warp::path::Tail;
use warp::reply::Response;
use warp::{Filter, Rejection};

use crate::rest::recover_fn;

/// Regular expression to identify which path should serve an asset file.
/// If not matched, the server serves the `index.html` file.
const PATH_PATTERN: &str = r"(^static|\.(png|json|txt|ico|js|map|css|woff2|ttf)$)";

const UI_INDEX_FILE_NAME: &str = "index.html";

#[derive(RustEmbed)]
#[folder = "../quickwit-ui/build/"]
struct Asset;

pub fn ui_handler() -> impl Filter<Extract = (impl warp::Reply,), Error = Rejection> + Clone {
    warp::path("ui")
        .and(warp::path::tail())
        .and_then(serve_file)
        .recover(recover_fn)
        .boxed()
}

async fn serve_file(path: Tail) -> Result<impl warp::Reply, Rejection> {
    serve_impl(path.as_str()).await
}

async fn serve_impl(path: &str) -> Result<impl warp::Reply + use<>, Rejection> {
    static PATH_PTN: Lazy<Regex> = Lazy::new(|| Regex::new(PATH_PATTERN).unwrap());
    let path_to_file = if PATH_PTN.is_match(path) {
        path
    } else {
        // Quickwit UI is a single page application.
        // Any path request that is not an asset should serve the `index.html` file.
        // The client (browser) usually request `index.html` once unless the user refreshes the
        // page.
        quickwit_telemetry::send_telemetry_event(TelemetryEvent::UiIndexPageLoad).await;
        UI_INDEX_FILE_NAME
    };
    let asset = Asset::get(path_to_file).ok_or_else(warp::reject::not_found)?;
    let mime = mime_guess::from_path(path_to_file).first_or_octet_stream();

    let mut res = Response::new(asset.data.into_owned().into());
    res.headers_mut().insert(
        "content-type",
        HeaderValue::from_str(mime.as_ref()).unwrap(),
    );
    Ok(res)
}

#[cfg(test)]
mod tests {
    use super::*;

    #[test]
    fn test_path_regex() {
        let path_ptn = Regex::new(PATH_PATTERN).unwrap();

        assert!(path_ptn.is_match("manifest.json"));
        assert!(path_ptn.is_match("favicon.ico"));
        assert!(path_ptn.is_match("static/js/main.df380554.js.map"));
        assert!(path_ptn.is_match("android-chrome-192x192.png"));
        assert!(!path_ptn.is_match("search"));
        assert!(!path_ptn.is_match(""));
    }
}


================================================
FILE: quickwit/quickwit-storage/Cargo.toml
================================================
[package]
name = "quickwit-storage"
description = "Storage layer"

version.workspace = true
edition.workspace = true
homepage.workspace = true
documentation.workspace = true
repository.workspace = true
authors.workspace = true
license.workspace = true

[dependencies]
anyhow = { workspace = true }
async-trait = { workspace = true }
base64 = { workspace = true }
bytes = { workspace = true }
bytesize = { workspace = true }
fnv = { workspace = true }
futures = { workspace = true }
http-body-util = { workspace = true}
hyper = { workspace = true }
lru = { workspace = true }
md5 = { workspace = true }
mini-moka = { workspace = true }
mockall = { workspace = true, optional = true }
once_cell = { workspace = true }
pin-project = { workspace = true }
quick_cache = { workspace = true }
regex = { workspace = true }
serde = { workspace = true }
serde_json = { workspace = true }
tantivy = { workspace = true }
tempfile = { workspace = true }
thiserror = { workspace = true }
tokio = { workspace = true, features = ["test-util"] }
tokio-stream = { workspace = true }
tokio-util = { workspace = true }
tracing = { workspace = true }
ulid = { workspace = true }

aws-config = { workspace = true }
aws-credential-types = { workspace = true }
aws-sdk-s3 = { workspace = true }
aws-smithy-types = { workspace = true }

azure_core = { workspace = true, optional = true }
azure_identity = { workspace = true, optional = true }
azure_storage = { workspace = true, optional = true }
azure_storage_blobs = { workspace = true, optional = true }

quickwit-aws = { workspace = true }
quickwit-common = { workspace = true }
quickwit-config = { workspace = true }
quickwit-proto = { workspace = true }

opendal = { workspace = true, optional = true }
reqwest = { workspace = true, optional = true }

[dev-dependencies]
http = { workspace = true }
mockall = { workspace = true }
proptest = { workspace = true }
tokio = { workspace = true }
tracing-subscriber = { workspace = true }

aws-sdk-s3 = { workspace = true }
aws-smithy-runtime = { workspace = true, features = ["test-util"] }

quickwit-common = { workspace = true, features = ["testsuite"] }

[features]
azure = [
  "azure_core",
  "azure_identity",
  "azure_storage",
  "azure_storage_blobs",
  "azure_core/hmac_rust",
  "azure_core/enable_reqwest_rustls",
  "azure_storage/enable_reqwest_rustls",
  "azure_storage_blobs/enable_reqwest_rustls",
]
gcs = ["dep:opendal", "opendal/services-gcs"]
ci-test = []
integration-testsuite = [
  "azure",
  "azure_core/azurite_workaround",
  "azure_storage_blobs/azurite_workaround",
  "gcs",                                    # Stands for Google cloud storage.
  "dep:reqwest",
]
testsuite = ["mockall"]


================================================
FILE: quickwit/quickwit-storage/src/bundle_storage.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::HashMap;
use std::convert::TryInto;
use std::fmt::Debug;
use std::ops::Range;
use std::path::{Path, PathBuf};
use std::sync::Arc;
use std::{fmt, io};

use anyhow::Context;
use async_trait::async_trait;
use quickwit_common::chunk_range;
use quickwit_common::uri::Uri;
use serde::{Deserialize, Serialize};
use tantivy::HasLen;
use tantivy::directory::FileSlice;
use tokio::io::{AsyncRead, AsyncWriteExt};
use tracing::error;

use crate::storage::SendableAsync;
use crate::{
    BulkDeleteError, OwnedBytes, Storage, StorageError, StorageResult, VersionedComponent,
};

/// BundleStorage bundles together multiple files into a single file.
/// with some metadata
pub struct BundleStorage {
    storage: Arc<dyn Storage>,
    /// The file path of the bundle in the storage.
    bundle_filepath: PathBuf,
    metadata: BundleStorageFileOffsets,
}

impl BundleStorage {
    /// Opens a BundleStorage.
    ///
    /// The provided data must include the footer_bytes at the end of the slice, but it can have
    /// more up front.
    ///
    /// Returns (Hotcache, Self)
    pub fn open_from_split_data_with_owned_bytes(
        storage: Arc<dyn Storage>,
        bundle_filepath: PathBuf,
        split_data: OwnedBytes,
    ) -> anyhow::Result<(FileSlice, Self)> {
        Self::open_from_split_data(
            storage,
            bundle_filepath,
            FileSlice::new(Arc::new(split_data)),
        )
    }
    /// Opens a BundleStorage.
    ///
    /// The provided data must include the footer_bytes at the end of the slice, but it can have
    /// more up front.
    ///
    /// Returns (Hotcache, Self)
    pub fn open_from_split_data(
        storage: Arc<dyn Storage>,
        bundle_filepath: PathBuf,
        split_data: FileSlice,
    ) -> anyhow::Result<(FileSlice, Self)> {
        let (hotcache, metadata) = BundleStorageFileOffsets::open_from_split_data(split_data)?;
        Ok((
            hotcache,
            BundleStorage {
                storage,
                bundle_filepath,
                metadata,
            },
        ))
    }

    /// Returns Iterator over files contained in the bundle.
    pub fn iter_files(&self) -> impl Iterator<Item = &PathBuf> {
        self.metadata.files.keys()
    }
}

const SPLIT_HOTBYTES_FOOTER_LENGTH_NUM_BYTES: usize = std::mem::size_of::<u32>();
const BUNDLE_METADATA_LENGTH_NUM_BYTES: usize = std::mem::size_of::<u32>();

#[derive(Copy, Clone, Default)]
#[repr(u32)]
pub enum BundleStorageFileOffsetsVersions {
    #[default]
    V1 = 1,
}

impl VersionedComponent for BundleStorageFileOffsetsVersions {
    const MAGIC_NUMBER: u32 = 403_881_646u32;

    type Component = BundleStorageFileOffsets;

    fn to_version_code(self) -> u32 {
        self as u32
    }

    fn try_from_version_code_impl(version_code: u32) -> Option<Self> {
        match version_code {
            1 => Some(Self::V1),
            _ => None,
        }
    }

    fn serialize_impl(component: &BundleStorageFileOffsets, output: &mut Vec<u8>) {
        let metadata_json = serde_json::to_string(component).unwrap();
        output.extend_from_slice(metadata_json.as_bytes());
    }

    fn deserialize_impl(&self, bytes: &mut OwnedBytes) -> anyhow::Result<Self::Component> {
        serde_json::from_reader(bytes).context("deserializing bundle storage file offsets failed")
    }
}

/// Returns the file offsets in the file bundle.
#[derive(Debug, Default, Serialize, Deserialize, Clone)]
pub struct BundleStorageFileOffsets {
    /// The files and their offsets in the body
    pub files: HashMap<PathBuf, Range<u64>>,
}

impl BundleStorageFileOffsets {
    /// File need to include split data (with hotcache at the end).
    /// See docs/internals/split-format.md
    /// [Files, FileMetadata, FileMetadata Len, HotCache, HotCache Len]
    /// Returns (Hotcache, Self)
    fn open_from_split_data(file: FileSlice) -> anyhow::Result<(FileSlice, Self)> {
        let (bundle_and_hotcache_bytes, hotcache_num_bytes_data) =
            file.split_from_end(SPLIT_HOTBYTES_FOOTER_LENGTH_NUM_BYTES);
        let hotcache_num_bytes: u32 = u32::from_le_bytes(
            hotcache_num_bytes_data
                .read_bytes()?
                .as_ref()
                .try_into()
                .unwrap(),
        );
        let (bundle, hotcache) =
            bundle_and_hotcache_bytes.split_from_end(hotcache_num_bytes as usize);
        Ok((hotcache, Self::open(bundle)?))
    }

    /// FileSlice needs to end with the bundle (without hotcache from the split at the end).
    /// See docs/internals/split-format.md
    /// [Files, FileMetadata, FileMetadata Len]
    pub fn open(file: FileSlice) -> anyhow::Result<Self> {
        let (tantivy_files_data, num_bytes_file_metadata) =
            file.split_from_end(BUNDLE_METADATA_LENGTH_NUM_BYTES);
        let footer_num_bytes: u32 = u32::from_le_bytes(
            num_bytes_file_metadata
                .read_bytes()?
                .as_slice()
                .try_into()
                .unwrap(),
        );

        let mut bundle_storage_file_offsets_data = tantivy_files_data
            .slice_from_end(footer_num_bytes as usize)
            .read_bytes()?;
        BundleStorageFileOffsetsVersions::try_read_component(&mut bundle_storage_file_offsets_data)
    }

    /// Returns file offsets for given path.
    pub fn get(&self, path: &Path) -> Option<Range<u64>> {
        self.files.get(path).cloned()
    }

    /// Returns whether file exists in metadata.
    pub fn exists(&self, path: &Path) -> bool {
        self.files.contains_key(path)
    }
}

#[async_trait]
impl Storage for BundleStorage {
    async fn check_connectivity(&self) -> anyhow::Result<()> {
        if !self
            .storage
            .exists(&self.bundle_filepath)
            .await
            .unwrap_or(false)
        {
            anyhow::bail!("`{}` not found in storage", self.bundle_filepath.display())
        }
        Ok(())
    }

    async fn put(
        &self,
        path: &Path,
        _payload: Box<dyn crate::PutPayload>,
    ) -> crate::StorageResult<()> {
        Err(unsupported_operation(&[path]))
    }

    async fn copy_to(
        &self,
        path: &Path,
        output: &mut dyn SendableAsync,
    ) -> crate::StorageResult<()> {
        let file_num_bytes = self.file_num_bytes(path).await? as usize;
        let block_size = 100_000_000;
        for block in chunk_range(0..file_num_bytes, block_size) {
            let file_content = self.get_slice(path, block).await?;
            output.write_all(&file_content).await?;
        }
        output.flush().await?;
        Ok(())
    }

    async fn get_slice(
        &self,
        path: &Path,
        range: Range<usize>,
    ) -> crate::StorageResult<OwnedBytes> {
        let file_offsets = self.metadata.get(path).ok_or_else(|| {
            crate::StorageErrorKind::NotFound
                .with_error(anyhow::anyhow!("missing file `{}`", path.display()))
        })?;
        let new_range =
            file_offsets.start as usize + range.start..file_offsets.start as usize + range.end;
        self.storage
            .get_slice(&self.bundle_filepath, new_range)
            .await
    }

    async fn get_slice_stream(
        &self,
        path: &Path,
        _range: Range<usize>,
    ) -> StorageResult<Box<dyn AsyncRead + Send + Unpin>> {
        Err(unsupported_operation(&[path]))
    }

    async fn get_all(&self, path: &Path) -> crate::StorageResult<OwnedBytes> {
        let file_offsets = self.metadata.get(path).ok_or_else(|| {
            crate::StorageErrorKind::NotFound
                .with_error(anyhow::anyhow!("missing file `{}`", path.display()))
        })?;
        self.storage
            .get_slice(
                &self.bundle_filepath,
                file_offsets.start as usize..file_offsets.end as usize,
            )
            .await
    }

    async fn delete(&self, path: &Path) -> crate::StorageResult<()> {
        Err(unsupported_operation(&[path]))
    }

    async fn bulk_delete<'a>(&self, paths: &[&'a Path]) -> Result<(), BulkDeleteError> {
        Err(BulkDeleteError {
            error: Some(unsupported_operation(paths)),
            ..Default::default()
        })
    }

    async fn exists(&self, path: &Path) -> crate::StorageResult<bool> {
        // also check if self.bundle_file_name exists ?
        Ok(self.metadata.exists(path))
    }

    async fn file_num_bytes(&self, path: &Path) -> StorageResult<u64> {
        let file_range = self.metadata.get(path).ok_or_else(|| {
            crate::StorageErrorKind::NotFound
                .with_error(anyhow::anyhow!("missing file `{}`", path.display()))
        })?;
        Ok(file_range.end - file_range.start)
    }

    fn uri(&self) -> &Uri {
        self.storage.uri()
    }
}

impl HasLen for BundleStorage {
    fn len(&self) -> usize {
        unimplemented!()
    }
}

impl fmt::Debug for BundleStorage {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        write!(
            f,
            "BundleStorage({:?}, files={:?})",
            &self.bundle_filepath, self.metadata
        )
    }
}

fn unsupported_operation(paths: &[&Path]) -> StorageError {
    let msg = "Unsupported operation. BundleStorage only supports async reads";
    error!(paths=?paths, msg);
    io::Error::other(format!("{msg}: {paths:?}")).into()
}

#[cfg(test)]
mod tests {
    use std::fs::{self, File};
    use std::io::Write;

    use super::*;
    use crate::{PutPayload, RamStorageBuilder, SplitPayloadBuilder};

    #[tokio::test]
    async fn bundle_storage_file_offsets() -> anyhow::Result<()> {
        let temp_dir = tempfile::tempdir()?;
        let test_filepath1 = temp_dir.path().join("f1");
        let test_filepath2 = temp_dir.path().join("f2");

        let mut file1 = File::create(&test_filepath1)?;
        file1.write_all(&[123, 76])?;

        let mut file2 = File::create(&test_filepath2)?;
        file2.write_all(&[99, 55, 44])?;

        let buffer = SplitPayloadBuilder::get_split_payload(
            &[test_filepath1.clone(), test_filepath2.clone()],
            &[],
            &[5, 5, 5],
        )?
        .read_all()
        .await?;

        let bundle_filepath = Path::new("bundle");
        let bundle_file_slice = FileSlice::new(Arc::new(buffer.clone()));
        let (hotcache, metadata) =
            BundleStorageFileOffsets::open_from_split_data(bundle_file_slice)?;
        assert_eq!(hotcache.read_bytes().unwrap().as_ref(), &[5, 5, 5]);
        let ram_storage = RamStorageBuilder::default()
            .put(&bundle_filepath.to_string_lossy(), &buffer)
            .build();

        let bundle_storage = BundleStorage {
            metadata,
            bundle_filepath: bundle_filepath.to_path_buf(),
            storage: Arc::new(ram_storage),
        };
        let f1_data = bundle_storage.get_all(Path::new("f1")).await?;
        assert_eq!(&*f1_data, &[123u8, 76u8]);

        let f2_data = bundle_storage.get_all(Path::new("f2")).await?;
        assert_eq!(&f2_data[..], &[99, 55, 44]);

        Ok(())
    }
    #[tokio::test]
    async fn bundle_storage_test() -> anyhow::Result<()> {
        let temp_dir = tempfile::tempdir()?;
        let test_filepath1 = temp_dir.path().join("f1");
        let test_filepath2 = temp_dir.path().join("f2");

        let mut file1 = File::create(&test_filepath1)?;
        file1.write_all(&[123, 76])?;

        let mut file2 = File::create(&test_filepath2)?;
        file2.write_all(&[99, 55, 44])?;

        let buffer = SplitPayloadBuilder::get_split_payload(
            &[test_filepath1.clone(), test_filepath2.clone()],
            &[],
            &[1, 3, 3, 7],
        )?
        .read_all()
        .await?;

        let (hotcache, metadata) =
            BundleStorageFileOffsets::open_from_split_data(FileSlice::from(buffer.to_vec()))?;
        assert_eq!(hotcache.read_bytes().unwrap().as_ref(), &[1, 3, 3, 7]);

        let bundle_filepath = Path::new("bundle");
        let ram_storage = RamStorageBuilder::default()
            .put(&bundle_filepath.to_string_lossy(), &buffer)
            .build();

        let bundle_storage = BundleStorage {
            metadata,
            bundle_filepath: bundle_filepath.to_path_buf(),
            storage: Arc::new(ram_storage),
        };
        let f1_data = bundle_storage.get_all(Path::new("f1")).await?;
        assert_eq!(&*f1_data, &[123u8, 76u8]);

        let f2_data = bundle_storage.get_all(Path::new("f2")).await?;
        assert_eq!(&f2_data[..], &[99, 55, 44]);

        let copy_to_file = temp_dir.path().join("copy_file");
        bundle_storage
            .copy_to_file(Path::new("f2"), &copy_to_file)
            .await?;
        let file_content = fs::read(copy_to_file).unwrap();
        assert_eq!(&f2_data[..], file_content);

        Ok(())
    }

    #[tokio::test]
    async fn bundlestorage_test_empty() -> anyhow::Result<()> {
        let buffer = SplitPayloadBuilder::get_split_payload(&[], &[], &[])?
            .read_all()
            .await?;

        let (_hotcache, metadata) =
            BundleStorageFileOffsets::open_from_split_data(FileSlice::from(buffer.to_vec()))?;

        let bundle_filepath = PathBuf::from("bundle");
        let ram_storage = RamStorageBuilder::default()
            .put(&bundle_filepath.to_string_lossy(), &buffer)
            .build();
        let bundle_storage = BundleStorage {
            metadata,
            bundle_filepath,
            storage: Arc::new(ram_storage),
        };

        assert_eq!(bundle_storage.exists(Path::new("blub")).await?, false);

        Ok(())
    }
}


================================================
FILE: quickwit/quickwit-storage/src/cache/base_cache.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::borrow::Borrow;
use std::hash::Hash;
use std::sync::{Arc, Weak};
use std::time::Duration;

use bytesize::ByteSize;
use lru::LruCache;
use mini_moka::sync::Cache as MokaCache;
use quick_cache::unsync::Cache as QuickCache;
use quickwit_config::CachePolicy;
use tokio::time::Instant;
use tracing::{error, warn};

use crate::OwnedBytes;
use crate::cache::stored_item::{StoredItem, ValueLen};
use crate::metrics::SingleCacheMetrics;

/// We do not evict anything that has been accessed in the last 60s.
///
/// The goal is to behave better on scan access patterns, without being as aggressive as
/// using a MRU strategy.
///
/// TLDR is:
///
/// If two items have been access in the last 60s it is not really worth considering the
/// latter too be more recent than the previous and do an eviction.
/// The difference is not significant enough to raise the probability of its future access.
///
/// On the other hand, for very large queries involving enough data to saturate the cache,
/// we are facing a scanning pattern. If variations of this  query is repeated over and over
/// a regular LRU eviction policy would yield a hit rate of 0.
pub(crate) const LRU_MIN_TIME_SINCE_LAST_ACCESS: Duration = Duration::from_secs(60);

// A fake entry inside a cache, which the cache believe to be of the given size
#[derive(Clone)]
pub(crate) struct FakeCacheEntry(pub usize);

impl ValueLen for FakeCacheEntry {
    fn len(&self) -> usize {
        self.0
    }
}

#[derive(Clone, Copy, Debug, PartialEq)]
pub(crate) enum Capacity {
    Unlimited,
    InBytes(usize),
}

impl Capacity {
    fn exceeds_capacity(&self, num_bytes: usize) -> bool {
        match *self {
            Capacity::Unlimited => false,
            Capacity::InBytes(capacity_in_bytes) => num_bytes > capacity_in_bytes,
        }
    }
}

pub(crate) enum AnyCache<K: Hash + Eq, V: ValueLen = OwnedBytes> {
    Lru(Lru<K, V>),
    S3Fifo(S3Fifo<K, V>),
    TinyLfu(TinyLfu<K, V>),
}

impl<K: Hash + Eq + Send + Sync + 'static, V: ValueLen + Clone + Send + Sync + 'static>
    AnyCache<K, V>
{
    pub fn from_policy_and_capacity(
        policy: CachePolicy,
        capacity: ByteSize,
        cache_metrics: SingleCacheMetrics,
    ) -> Self {
        match policy {
            CachePolicy::Lru => AnyCache::Lru(Lru::with_capacity(
                Capacity::InBytes(capacity.as_u64().try_into().unwrap_or(usize::MAX)),
                cache_metrics,
            )),
            CachePolicy::S3Fifo => {
                AnyCache::S3Fifo(S3Fifo::with_capacity(capacity.as_u64(), cache_metrics))
            }
            CachePolicy::TinyLfu => {
                AnyCache::TinyLfu(TinyLfu::with_capacity(capacity.as_u64(), cache_metrics))
            }
        }
    }
    pub fn unbounded(cache_metrics: SingleCacheMetrics) -> Self {
        AnyCache::Lru(Lru::with_capacity(Capacity::Unlimited, cache_metrics))
    }

    pub fn get<Q>(&mut self, cache_key: &Q) -> Option<V>
    where
        K: Borrow<Q>,
        Arc<K>: Borrow<Q>,
        Q: Hash + Eq + ?Sized,
    {
        match self {
            AnyCache::Lru(lru) => lru.get(cache_key),
            AnyCache::S3Fifo(s3fifo) => s3fifo.get(cache_key),
            AnyCache::TinyLfu(tiny_lfu) => tiny_lfu.get(cache_key),
        }
    }
    pub fn put(&mut self, key: K, value: V) {
        match self {
            AnyCache::Lru(lru) => lru.put(key, value),
            AnyCache::S3Fifo(s3fifo) => s3fifo.put(key, value),
            AnyCache::TinyLfu(tiny_lfu) => tiny_lfu.put(key, value),
        }
    }
}

pub struct Lru<K: Hash + Eq, V> {
    lru_cache: LruCache<K, StoredItem<V>>,
    num_items: usize,
    num_bytes: u64,
    capacity: Capacity,
    cache_metrics: SingleCacheMetrics,
}

impl<K: Hash + Eq, V> Drop for Lru<K, V> {
    fn drop(&mut self) {
        // we don't count this toward evicted entries, as we are clearing the whole cache
        self.cache_metrics.in_cache_count.sub(self.num_items as i64);
        self.cache_metrics
            .in_cache_num_bytes
            .sub(self.num_bytes as i64);
    }
}

impl<K: Hash + Eq, V: ValueLen + Clone> Lru<K, V> {
    /// Creates a new NeedMutSliceCache with the given capacity.
    fn with_capacity(capacity: Capacity, cache_metrics: SingleCacheMetrics) -> Self {
        Lru {
            // The limit will be decided by the amount of memory in the cache,
            // not the number of items in the cache.
            // Enforcing this limit is done in the `NeedMutCache` impl.
            lru_cache: LruCache::unbounded(),
            num_items: 0,
            num_bytes: 0,
            capacity,
            cache_metrics,
        }
    }

    fn record_item(&mut self, num_bytes: u64) {
        self.num_items += 1;
        self.num_bytes += num_bytes;
        self.cache_metrics.in_cache_count.inc();
        self.cache_metrics.in_cache_num_bytes.add(num_bytes as i64);
    }

    fn drop_item(&mut self, num_bytes: u64) {
        self.num_items -= 1;
        self.num_bytes -= num_bytes;
        self.cache_metrics.in_cache_count.dec();
        self.cache_metrics.in_cache_num_bytes.sub(num_bytes as i64);
        self.cache_metrics.evict_num_items.inc();
        self.cache_metrics.evict_num_bytes.inc_by(num_bytes);
    }

    pub fn get<Q>(&mut self, cache_key: &Q) -> Option<V>
    where
        K: Borrow<Q>,
        Q: Hash + Eq + ?Sized,
    {
        let item_opt = self.lru_cache.get_mut(cache_key);
        if let Some(item) = item_opt {
            self.cache_metrics.hits_num_items.inc();
            self.cache_metrics.hits_num_bytes.inc_by(item.len() as u64);
            Some(item.payload())
        } else {
            self.cache_metrics.misses_num_items.inc();
            None
        }
    }

    /// Attempt to put the given amount of data in the cache.
    /// This may fail silently if the owned_bytes slice is larger than the cache
    /// capacity.
    fn put(&mut self, key: K, bytes: V) {
        if self.capacity.exceeds_capacity(bytes.len()) {
            // The value does not fit in the cache. We simply don't store it.
            if self.capacity != Capacity::InBytes(0) {
                warn!(
                    capacity_in_bytes = ?self.capacity,
                    len = bytes.len(),
                    "Downloaded a byte slice larger than the cache capacity."
                );
            }
            return;
        }
        if let Some(previous_data) = self.lru_cache.pop(&key) {
            self.drop_item(previous_data.len() as u64);
        }

        let now = Instant::now();
        while self
            .capacity
            .exceeds_capacity(self.num_bytes as usize + bytes.len())
        {
            if let Some((_, candidate_for_eviction)) = self.lru_cache.peek_lru() {
                let time_since_last_access =
                    now.duration_since(candidate_for_eviction.last_access_time());
                if time_since_last_access < LRU_MIN_TIME_SINCE_LAST_ACCESS {
                    // It is not worth doing an eviction.
                    // TODO: It is sub-optimal that we might have needlessly evicted items in this
                    // loop before just returning.
                    return;
                }
            }
            if let Some((_, bytes)) = self.lru_cache.pop_lru() {
                self.drop_item(bytes.len() as u64);
            } else {
                error!(
                    "Logical error. Even after removing all of the items in the cache the \
                     capacity is insufficient. This case is guarded against and should never \
                     happen."
                );
                return;
            }
        }
        self.record_item(bytes.len() as u64);
        self.lru_cache.put(key, StoredItem::new(bytes, now));
    }
}

// actually, quick_cache is a Clock-PRO, not a S3-fifo contrary to what quick-cache and Moka's
// readme says. While both are clearly distinct (one being clock-based, the other being fifo
// based), they are not too disimilar in term of strenght/weaknesses.
pub struct S3Fifo<K: Hash + Eq, V: ValueLen> {
    cache:
        QuickCache<K, V, QuickCacheWeighter, quick_cache::DefaultHashBuilder, QuickCacheLifecycle>,
    capacity: u64,
    cache_metrics: SingleCacheMetrics,
}

impl<K: Hash + Eq, V: ValueLen> Drop for S3Fifo<K, V> {
    fn drop(&mut self) {
        // we don't count this toward evicted entries, as we are clearing the whole cache
        self.cache_metrics
            .in_cache_count
            .sub(self.cache.len() as i64);
        self.cache_metrics
            .in_cache_num_bytes
            .sub(self.cache.weight() as i64);
    }
}

struct QuickCacheWeighter;
impl<K, V: ValueLen> quick_cache::Weighter<K, V> for QuickCacheWeighter {
    fn weight(&self, _key: &K, value: &V) -> u64 {
        value.len() as u64
    }
}

struct QuickCacheLifecycle;
#[derive(Default)]
struct QuickCacheQueryEffect {
    count: u64,
    bytes: u64,
}
impl<K, V: ValueLen> quick_cache::Lifecycle<K, V> for QuickCacheLifecycle {
    type RequestState = QuickCacheQueryEffect;

    fn begin_request(&self) -> Self::RequestState {
        QuickCacheQueryEffect::default()
    }
    fn on_evict(&self, state: &mut Self::RequestState, _key: K, val: V) {
        state.count += 1;
        state.bytes += val.len() as u64;
    }
}

impl<K: Hash + Eq, V: ValueLen + Clone> S3Fifo<K, V> {
    /// Creates a new NeedMutSliceCache with the given capacity.
    fn with_capacity(capacity: u64, cache_metrics: SingleCacheMetrics) -> Self {
        S3Fifo {
            cache: QuickCache::with(
                (capacity / (128 * 1024)) as usize,
                capacity,
                QuickCacheWeighter,
                quick_cache::DefaultHashBuilder::new(),
                QuickCacheLifecycle,
            ),
            capacity,
            cache_metrics,
        }
    }

    pub fn get<Q>(&mut self, cache_key: &Q) -> Option<V>
    where
        K: Borrow<Q>,
        Q: Hash + Eq + ?Sized,
    {
        let item_opt = self.cache.get(cache_key);
        if let Some(item) = item_opt {
            self.cache_metrics.hits_num_items.inc();
            self.cache_metrics.hits_num_bytes.inc_by(item.len() as u64);
            Some(item.clone())
        } else {
            self.cache_metrics.misses_num_items.inc();
            None
        }
    }

    /// Attempt to put the given amount of data in the cache.
    /// This may fail silently if the owned_bytes slice is larger than the cache
    /// capacity.
    fn put(&mut self, key: K, value: V) {
        if self.capacity < value.len() as u64 {
            // The value does not fit in the cache. We simply don't store it.
            if self.capacity != 0 {
                warn!(
                    capacity_in_bytes = ?self.capacity,
                    len = value.len(),
                    "Downloaded a byte slice larger than the cache capacity."
                );
            }
            return;
        }

        self.cache_metrics.in_cache_count.inc();
        self.cache_metrics
            .in_cache_num_bytes
            .add(value.len() as i64);
        let evicted = self.cache.insert_with_lifecycle(key, value);
        self.cache_metrics.in_cache_count.sub(evicted.count as i64);
        self.cache_metrics
            .in_cache_num_bytes
            .sub(evicted.bytes as i64);
        self.cache_metrics.evict_num_items.inc_by(evicted.count);
        self.cache_metrics.evict_num_bytes.inc_by(evicted.bytes);
    }
}

// We don't make this value Clone to ensure each item is dropped only once
struct CapacityTracker<V: ValueLen> {
    item: V,
    cache_metrics: Weak<SingleCacheMetrics>,
}

impl<V: ValueLen> Drop for CapacityTracker<V> {
    fn drop(&mut self) {
        if let Some(cache_metrics) = self.cache_metrics.upgrade() {
            cache_metrics.in_cache_count.dec();
            cache_metrics.in_cache_num_bytes.sub(self.item.len() as i64);
            cache_metrics.evict_num_items.inc();
            cache_metrics.evict_num_bytes.inc_by(self.item.len() as u64);
        }
    }
}

pub struct TinyLfu<K: Hash + Eq, V: ValueLen> {
    // this field is put first so it's dropped before the cache
    // we use that to not count removed entries as "evicted", by
    // calling CapacityTracker's Drop only after its Weak has expired.
    cache_metrics: Arc<SingleCacheMetrics>,

    // we store an Arc because moka does a lot of internal cloning, and it's hard to not double
    // evict/forget to count eviction otherwise
    cache: MokaCache<K, Arc<CapacityTracker<V>>>,
    capacity: u64,
}

impl<K: Hash + Eq, V: ValueLen> Drop for TinyLfu<K, V> {
    fn drop(&mut self) {
        // we don't count this toward evicted entries, as we are clearing the whole cache
        self.cache_metrics
            .in_cache_count
            .sub(self.cache.entry_count() as i64);
        self.cache_metrics
            .in_cache_num_bytes
            .sub(self.cache.weighted_size() as i64);
    }
}

impl<K: Hash + Eq + Send + Sync + 'static, V: ValueLen + Clone + Send + Sync + 'static>
    TinyLfu<K, V>
{
    /// Creates a new NeedMutSliceCache with the given capacity.
    fn with_capacity(capacity: u64, cache_metrics: SingleCacheMetrics) -> Self {
        TinyLfu {
            cache: MokaCache::builder()
                .max_capacity(capacity)
                .weigher(|_k, v: &Arc<CapacityTracker<V>>| {
                    v.item.len().try_into().unwrap_or(u32::MAX)
                })
                .build(),
            capacity,
            cache_metrics: cache_metrics.into(),
        }
    }

    pub fn get<Q>(&mut self, cache_key: &Q) -> Option<V>
    where
        Arc<K>: Borrow<Q>,
        Q: Hash + Eq + ?Sized,
    {
        let item_opt = self.cache.get(cache_key);
        if let Some(item) = item_opt {
            self.cache_metrics.hits_num_items.inc();
            self.cache_metrics
                .hits_num_bytes
                .inc_by(item.item.len() as u64);
            Some(item.item.clone())
        } else {
            self.cache_metrics.misses_num_items.inc();
            None
        }
    }

    /// Attempt to put the given amount of data in the cache.
    /// This may fail silently if the owned_bytes slice is larger than the cache
    /// capacity.
    fn put(&mut self, key: K, value: V) {
        if self.capacity < value.len() as u64 {
            // The value does not fit in the cache. We simply don't store it.
            if self.capacity != 0 {
                warn!(
                    capacity_in_bytes = ?self.capacity,
                    len = value.len(),
                    "Downloaded a byte slice larger than the cache capacity."
                );
            }
            return;
        }

        self.cache_metrics.in_cache_count.inc();
        self.cache_metrics
            .in_cache_num_bytes
            .add(value.len() as i64);
        self.cache.insert(
            key,
            CapacityTracker {
                item: value,
                cache_metrics: Arc::downgrade(&self.cache_metrics),
            }
            .into(),
        );
    }
}


================================================
FILE: quickwit/quickwit-storage/src/cache/byte_range_cache.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::borrow::{Borrow, Cow};
use std::collections::BTreeMap;
use std::ops::Range;
use std::path::{Path, PathBuf};
use std::sync::atomic::{AtomicU64, Ordering};
use std::sync::{Arc, Mutex};

use tantivy::directory::OwnedBytes;

use crate::metrics::{CacheMetrics, SingleCacheMetrics};

#[derive(Clone, PartialOrd, Ord, PartialEq, Eq)]
struct CacheKey<'a, T: ToOwned + ?Sized> {
    tag: Cow<'a, T>,
    range_start: usize,
}

impl<T: ToOwned + ?Sized> CacheKey<'static, T> {
    fn from_owned(tag: T::Owned, range_start: usize) -> Self {
        CacheKey {
            tag: Cow::Owned(tag),
            range_start,
        }
    }
}

impl<'a, T: ToOwned + ?Sized> CacheKey<'a, T> {
    fn from_borrowed(tag: &'a T, range_start: usize) -> Self {
        CacheKey {
            tag: Cow::Borrowed(tag),
            range_start,
        }
    }
}

struct CacheValue {
    range_end: usize,
    bytes: OwnedBytes,
}

/// T is a tag, usually a file path.
struct NeedMutByteRangeCache<T: 'static + ToOwned + ?Sized> {
    cache: BTreeMap<CacheKey<'static, T>, CacheValue>,
    // this is hardly significant as items can get merged if they overlap
    num_items: u64,
    num_bytes: u64,
    cache_counters: &'static SingleCacheMetrics,
}

impl<T: 'static + ToOwned + ?Sized + Ord> NeedMutByteRangeCache<T> {
    fn with_infinite_capacity(cache_counters: &'static CacheMetrics) -> Self {
        NeedMutByteRangeCache {
            cache: BTreeMap::new(),
            num_items: 0,
            num_bytes: 0,
            cache_counters: &cache_counters.cache_metrics,
        }
    }

    fn get_slice(&mut self, tag: &T, byte_range: Range<usize>) -> Option<OwnedBytes> {
        if byte_range.start == byte_range.end {
            return Some(OwnedBytes::empty());
        }

        let key = CacheKey::from_borrowed(tag, byte_range.start);
        let (k, v) = if let Some((k, v)) = self.get_block(&key, byte_range.end) {
            (k, v)
        } else if let Some((k, v)) = self.merge_ranges(&key, byte_range.end) {
            (k, v)
        } else {
            self.cache_counters.misses_num_items.inc();
            return None;
        };

        let start = byte_range.start - k.range_start;
        let end = byte_range.end - k.range_start;
        let result = v.bytes.slice(start..end);

        self.cache_counters.hits_num_items.inc();
        self.cache_counters
            .hits_num_bytes
            .inc_by((end - start) as u64);

        Some(result)
    }

    fn put_slice(&mut self, tag: T::Owned, byte_range: Range<usize>, bytes: OwnedBytes) {
        let len = byte_range.end - byte_range.start;
        assert_eq!(len, bytes.len());
        if len == 0 {
            return;
        }

        // try to find a block with which we overlap (and not just touch)
        let start_key = CacheKey::from_borrowed(tag.borrow(), byte_range.start);
        let first_matching_block = self
            .get_block(&start_key, byte_range.start + 1)
            .map(|(k, _v)| k);

        let end_key = CacheKey::from_borrowed(tag.borrow(), byte_range.end - 1);
        let last_matching_block = self.get_block(&end_key, byte_range.end).map(|(k, _v)| k);

        if first_matching_block.is_some() && first_matching_block == last_matching_block {
            // same start and end: all the range is already covered
            return;
        }

        let first_matching_block = first_matching_block.unwrap_or(&start_key);
        let last_matching_block = last_matching_block.unwrap_or(&end_key);

        let overlapping: Vec<Range<usize>> = self
            .cache
            .range(first_matching_block..=last_matching_block)
            .map(|(k, v)| k.range_start..v.range_end)
            .collect();

        let can_drop_first = overlapping
            .first()
            .map(|r| byte_range.start <= r.start)
            .unwrap_or(true);

        let can_drop_last = overlapping
            .last()
            .map(|r| byte_range.end >= r.end)
            .unwrap_or(true);

        let (final_range, final_bytes) = if can_drop_first && can_drop_last {
            // if we are here, either there was no overlapping block, or there was, but this buffer
            // covers entirely every block it overlapped with. There is no merging to do.
            (byte_range, bytes)
        } else {
            // if we are here, we have to do some merging

            // first find the final buffer start and end position.
            let start = if can_drop_first {
                byte_range.start
            } else {
                // if no first, can_drop_first is true
                overlapping.first().unwrap().start
            };
            let end = if can_drop_last {
                byte_range.end
            } else {
                // if no last, can_drop_last is true
                overlapping.last().unwrap().end
            };

            let mut buffer = Vec::with_capacity(end - start);

            // if this buffer overlap, but does not contain the 1st buffer, copy the
            // non-overlapping part at the start of the final buffer.
            if !can_drop_first {
                let first_range = overlapping.first().unwrap();
                let key = CacheKey::from_borrowed(tag.borrow(), first_range.start);
                let block = self.cache.get(&key).unwrap();

                let len = first_range.end.min(byte_range.start) - first_range.start;
                buffer.extend_from_slice(&block.bytes[..len]);
            }

            // copy the entire current buffer
            buffer.extend_from_slice(&bytes);

            // if this buffer overlap, but does not contain the last buffer, copy the
            // non-overlapping part ad the end of the final buffer.
            if !can_drop_last {
                let last_range = overlapping.last().unwrap();
                let key = CacheKey::from_borrowed(tag.borrow(), last_range.start);
                let block = self.cache.get(&key).unwrap();

                let start = last_range.start.max(byte_range.end) - last_range.start;
                buffer.extend_from_slice(&block.bytes[start..]);
            }

            // sanity check, we copied as much as expected
            debug_assert_eq!(end - start, buffer.len());

            (start..end, OwnedBytes::new(buffer))
        };

        // not sure why, but the borrow check gets unhappy if I create a borrowed
        // in the loop. It works with .get() instead of .remove() (?).
        let mut key = CacheKey::from_owned(tag, 0);
        for range in overlapping.into_iter() {
            // remove every block with which we overlapped, including the 1st and last, as they
            // were included as prefix/suffix to the final block.
            key.range_start = range.start;
            self.cache.remove(&key);
            self.update_counter_drop_item(range.end - range.start);
        }

        // and finally insert the newly added buffer
        key.range_start = final_range.start;
        let value = CacheValue {
            range_end: final_range.end,
            bytes: final_bytes,
        };
        self.cache.insert(key, value);
        self.update_counter_record_item(final_range.end - final_range.start);
    }

    // Return a block that contain everything between query.range_start and range_end
    fn get_block<'a>(
        &self,
        query: &CacheKey<'a, T>,
        range_end: usize,
    ) -> Option<(&CacheKey<'a, T>, &CacheValue)> {
        self.cache
            .range(..=query)
            .next_back()
            .filter(|(k, v)| k.tag == query.tag && range_end <= v.range_end)
    }

    /// Try to merge all blocks in the given range. Fails if some bytes were not already stored.
    fn merge_ranges<'a>(
        &mut self,
        start: &CacheKey<'a, T>,
        range_end: usize,
    ) -> Option<(&CacheKey<'a, T>, &CacheValue)> {
        let own_key = |key: &CacheKey<T>| {
            CacheKey::from_owned(T::borrow(&key.tag).to_owned(), key.range_start)
        };

        let first_block = self.get_block(start, start.range_start)?;

        // query cache for all blocks which overlap with our query
        let overlapping_blocks = self
            .cache
            .range(first_block.0..)
            .take_while(|(k, _)| k.tag == start.tag && k.range_start <= range_end);

        // verify there are no hole, and each range touches the next one. There can't be overlap
        // due to how we fill our data-structure.
        let mut last_block = first_block;
        for (k, v) in overlapping_blocks.clone().skip(1) {
            if k.range_start != last_block.1.range_end {
                return None;
            }

            last_block = (k, v);
        }
        if last_block.1.range_end < range_end {
            // we got a gap at the end
            return None;
        }

        // we have everything we need. Merge every sub-buffer into a single large buffer.
        let mut buffer = Vec::with_capacity(last_block.1.range_end - first_block.0.range_start);
        let mut part_count = 0i64;
        for (_, v) in overlapping_blocks {
            part_count += 1;
            buffer.extend_from_slice(&v.bytes);
        }
        assert_eq!(
            buffer.len(),
            (last_block.1.range_end - first_block.0.range_start)
        );

        let new_key = own_key(first_block.0);
        let new_value = CacheValue {
            range_end: last_block.1.range_end,
            bytes: OwnedBytes::new(buffer),
        };

        // cleanup is sub-optimal, we'd need a BTreeMap::drain_range or something like that
        let last_key = own_key(last_block.0);

        // remove previous buffers from the cache
        let blocks_to_remove: Vec<_> = self
            .cache
            .range(&new_key..=&last_key)
            .map(|(k, _)| own_key(k))
            .collect();
        for block in blocks_to_remove {
            self.cache.remove(&block);
        }

        // and insert the new merged buffer
        self.cache.insert(new_key, new_value);

        self.num_items -= (part_count - 1) as u64;
        self.cache_counters.in_cache_count.sub(part_count - 1);

        self.get_block(start, range_end)
    }

    fn update_counter_record_item(&mut self, num_bytes: usize) {
        self.num_items += 1;
        self.num_bytes += num_bytes as u64;
        self.cache_counters.in_cache_count.inc();
        self.cache_counters.in_cache_num_bytes.add(num_bytes as i64);
    }

    fn update_counter_drop_item(&mut self, num_bytes: usize) {
        self.num_items -= 1;
        self.num_bytes -= num_bytes as u64;
        self.cache_counters.in_cache_count.dec();
        self.cache_counters.in_cache_num_bytes.sub(num_bytes as i64);
        self.cache_counters.evict_num_items.inc();
        self.cache_counters.evict_num_bytes.inc_by(num_bytes as u64);
    }
}

impl<T: 'static + ToOwned + ?Sized> Drop for NeedMutByteRangeCache<T> {
    fn drop(&mut self) {
        self.cache_counters
            .in_cache_count
            .sub(self.num_items as i64);
        self.cache_counters
            .in_cache_num_bytes
            .sub(self.num_bytes as i64);
    }
}

/// Cache for ranges of bytes in files.
///
/// This cache is used in the contraption that makes it possible for Quickwit
/// to use tantivy while doing asynchronous io.
/// Quickwit manually populates this cache in an asynchronous "warmup" phase.
/// tantivy then gets its data from this cache without performing any IO.
///
/// Contrary to `MemorySizedCache`, it's able to answer subset of known ranges,
/// does not have any eviction, and assumes an infinite capacity.
///
/// This cache assume immutable data: if you put a new slice and it overlap with
/// cached data, the changes may or may not get recorded.
///
/// At the moment this is hardly a cache as it features no eviction policy.
#[derive(Clone)]
pub struct ByteRangeCache {
    inner_arc: Arc<Inner>,
}

struct Inner {
    num_stored_bytes: AtomicU64,
    need_mut_byte_range_cache: Mutex<NeedMutByteRangeCache<Path>>,
}

impl ByteRangeCache {
    /// Creates a slice cache that never removes any entry.
    pub fn with_infinite_capacity(cache_counters: &'static CacheMetrics) -> Self {
        let need_mut_byte_range_cache =
            NeedMutByteRangeCache::with_infinite_capacity(cache_counters);
        let inner = Inner {
            num_stored_bytes: AtomicU64::default(),
            need_mut_byte_range_cache: Mutex::new(need_mut_byte_range_cache),
        };
        ByteRangeCache {
            inner_arc: Arc::new(inner),
        }
    }

    /// Overall amount of bytes stored in the cache.
    pub fn get_num_bytes(&self) -> u64 {
        self.inner_arc.num_stored_bytes.load(Ordering::Relaxed)
    }

    /// If available, returns the cached view of the slice.
    pub fn get_slice(&self, path: &Path, byte_range: Range<usize>) -> Option<OwnedBytes> {
        self.inner_arc
            .need_mut_byte_range_cache
            .lock()
            .unwrap()
            .get_slice(path, byte_range)
    }

    /// Put the given amount of data in the cache.
    pub fn put_slice(&self, path: PathBuf, byte_range: Range<usize>, bytes: OwnedBytes) {
        let mut need_mut_byte_range_cache_locked =
            self.inner_arc.need_mut_byte_range_cache.lock().unwrap();
        need_mut_byte_range_cache_locked.put_slice(path, byte_range, bytes);
        let num_bytes = need_mut_byte_range_cache_locked.num_bytes;
        drop(need_mut_byte_range_cache_locked);
        self.inner_arc
            .num_stored_bytes
            .store(num_bytes, Ordering::Relaxed);
    }
}

#[cfg(test)]
mod tests {
    use std::collections::HashMap;
    use std::ops::Range;
    use std::path::Path;

    use once_cell::sync::Lazy;
    use proptest::prelude::*;

    use super::ByteRangeCache;
    use crate::OwnedBytes;
    use crate::metrics::{CACHE_METRICS_FOR_TESTS, CacheMetrics};

    #[derive(Debug)]
    enum Operation {
        Insert {
            range: Range<usize>,
            tag: &'static str,
        },
        Get {
            range: Range<usize>,
            tag: &'static str,
        },
    }

    fn tag_strategy() -> impl Strategy<Value = &'static str> {
        prop_oneof![Just("path1"), Just("path2"),]
    }

    #[allow(deprecated)]
    fn range_strategy() -> impl Strategy<Value = Range<usize>> {
        (0usize..11usize).prop_perturb(|start, mut rng| start..rng.gen_range(start..12usize))
    }

    fn op_strategy() -> impl Strategy<Value = Operation> {
        prop_oneof![
            (tag_strategy(), range_strategy())
                .prop_map(|(tag, range)| Operation::Insert { range, tag }),
            (tag_strategy(), range_strategy())
                .prop_map(|(tag, range)| Operation::Get { range, tag }),
        ]
    }

    fn ops_strategy() -> impl Strategy<Value = Vec<Operation>> {
        prop::collection::vec(op_strategy(), 1..100)
    }

    proptest::proptest! {
        #[test]
        fn test_proptest_byte_range_cache(ops in ops_strategy()) {
            let mut state: HashMap<&'static str, Vec<bool>> = HashMap::new();
            state.insert("path1", vec![false; 12]);
            state.insert("path2", vec![false; 12]);

            let cache = ByteRangeCache::with_infinite_capacity(&CACHE_METRICS_FOR_TESTS);

            for op in ops {
                match op {
                    Operation::Insert {
                        range,
                        tag,
                    } => {
                        state.get_mut(tag).unwrap()
                            [range.clone()].fill(true);
                        let bytes = range.clone().map(|i| (i%256) as u8).collect::<Vec<_>>();
                        cache.put_slice(tag.into(), range, OwnedBytes::new(bytes));


                        let expected_item_count: usize = state.values()
                            .map(|tagged_state| {
                                count_items(tagged_state)
                            })
                            .sum();
                        // in some case we have ranges touching each other, count_items count them
                        // as only one, but cache count them as 2.
                        assert!(cache.inner_arc.need_mut_byte_range_cache.lock().unwrap().num_items >= expected_item_count as u64);

                        let expected_byte_count = state.values()
                            .flatten()
                            .filter(|stored| **stored)
                            .count();
                        assert_eq!(cache.inner_arc.need_mut_byte_range_cache.lock().unwrap().num_bytes, expected_byte_count as u64);
                    }
                    Operation::Get {
                        range,
                        tag,
                    } => {
                        let slice = cache.get_slice(Path::new(tag), range.clone());
                        if state[tag][range.clone()].iter().all(|t| *t) {
                            let slice = slice.unwrap();
                            let bytes = range.clone().map(|i| (i%256) as u8).collect::<Vec<_>>();
                            assert_eq!(slice[..], bytes[..]);

                        } else {
                            assert!(slice.is_none());
                        }
                    },
                }
            }
        }
    }

    fn count_items(state: &[bool]) -> usize {
        state
            .iter()
            .fold((false, 0), |(last_val, count), next| {
                if *next && !last_val {
                    (*next, count + 1)
                } else {
                    (*next, count)
                }
            })
            .1
    }

    #[test]
    fn test_byte_range_cache_doesnt_merge_unnecessarily() {
        // we need to get a 'static ref to metrics, and want a dedicated metrics because we assert
        // on it
        static METRICS: Lazy<CacheMetrics> =
            Lazy::new(|| CacheMetrics::for_component("byterange_cache_test"));

        let cache = ByteRangeCache::with_infinite_capacity(&METRICS);

        let key: std::path::PathBuf = "key".into();

        cache.put_slice(
            key.clone(),
            0..5,
            OwnedBytes::new((0..5).collect::<Vec<_>>()),
        );
        cache.put_slice(
            key.clone(),
            5..10,
            OwnedBytes::new((5..10).collect::<Vec<_>>()),
        );
        cache.put_slice(
            key.clone(),
            10..15,
            OwnedBytes::new((10..15).collect::<Vec<_>>()),
        );
        cache.put_slice(
            key.clone(),
            15..20,
            OwnedBytes::new((15..20).collect::<Vec<_>>()),
        );

        {
            let mutable_cache = cache.inner_arc.need_mut_byte_range_cache.lock().unwrap();
            assert_eq!(mutable_cache.cache.len(), 4);
            assert_eq!(mutable_cache.num_items, 4);
            assert_eq!(mutable_cache.cache_counters.in_cache_count.get(), 4);
            assert_eq!(mutable_cache.num_bytes, 20);
            assert_eq!(mutable_cache.cache_counters.in_cache_num_bytes.get(), 20);
        }

        cache.get_slice(&key, 3..12).unwrap();

        {
            // now they should've been merged, except the last one
            let mutable_cache = cache.inner_arc.need_mut_byte_range_cache.lock().unwrap();
            assert_eq!(mutable_cache.cache.len(), 2);
            assert_eq!(mutable_cache.num_items, 2);
            assert_eq!(mutable_cache.cache_counters.in_cache_count.get(), 2);
            assert_eq!(mutable_cache.num_bytes, 20);
            assert_eq!(mutable_cache.cache_counters.in_cache_num_bytes.get(), 20);
        }
    }
}


================================================
FILE: quickwit/quickwit-storage/src/cache/memory_sized_cache.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::borrow::Borrow;
use std::hash::Hash;
use std::ops::Range;
use std::path::{Path, PathBuf};
use std::sync::{Arc, Mutex};

use quickwit_config::CacheConfig;

use crate::OwnedBytes;
use crate::cache::base_cache::{AnyCache, FakeCacheEntry};
use crate::cache::slice_address::{SliceAddress, SliceAddressKey, SliceAddressRef};
use crate::metrics::CacheMetrics;

struct CacheState<K: Hash + Eq> {
    cache: AnyCache<K>,
    virtual_caches: Vec<AnyCache<K, FakeCacheEntry>>,
}

impl<K: Hash + Eq + Clone + Send + Sync + 'static> CacheState<K> {
    fn from_config(cache_config: &CacheConfig, cache_counters: &'static CacheMetrics) -> Self {
        let cache = AnyCache::from_policy_and_capacity(
            cache_config.policy(),
            cache_config.capacity(),
            cache_counters.cache_metrics.clone(),
        );
        let virtual_caches = cache_config
            .virtual_caches
            .iter()
            .cloned()
            .map(|mut virtual_cache_config| {
                AnyCache::from_policy_and_capacity(
                    virtual_cache_config.policy_for_virtual_cache(cache_config.policy()),
                    virtual_cache_config.capacity_for_virtual_cache(cache_config.capacity()),
                    cache_counters.virtual_cache(&virtual_cache_config),
                )
            })
            .collect();
        CacheState {
            cache,
            virtual_caches,
        }
    }

    fn infinite(cache_counters: &'static CacheMetrics) -> Self {
        CacheState {
            cache: AnyCache::unbounded(cache_counters.cache_metrics.clone()),
            // there is no point in having virtual caches for an unbounded cache
            virtual_caches: Vec::new(),
        }
    }

    pub fn get<Q>(&mut self, cache_key: &Q) -> Option<OwnedBytes>
    where
        K: Borrow<Q>,
        Arc<K>: Borrow<Q>,
        Q: Hash + Eq + ?Sized,
    {
        for virtual_cache in &mut self.virtual_caches {
            // we simulate an access on all virtual caches
            virtual_cache.get(cache_key);
        }
        self.cache.get(cache_key)
    }

    fn put(&mut self, key: K, bytes: OwnedBytes) {
        for virtual_cache in &mut self.virtual_caches {
            // we simulate an access on all virtual caches
            virtual_cache.put(key.clone(), FakeCacheEntry(bytes.len()));
        }

        self.cache.put(key, bytes)
    }
}

/// A simple in-resident memory slice cache.
pub struct MemorySizedCache<K: Hash + Eq = SliceAddress> {
    inner: Mutex<CacheState<K>>,
}

impl<K: Hash + Eq + Clone + Send + Sync + 'static> MemorySizedCache<K> {
    /// Creates an slice cache with the given capacity.
    pub fn from_config(cache_config: &CacheConfig, cache_counters: &'static CacheMetrics) -> Self {
        MemorySizedCache {
            inner: Mutex::new(CacheState::from_config(cache_config, cache_counters)),
        }
    }

    /// Creates a slice cache that never removes any entry.
    pub fn with_infinite_capacity(cache_counters: &'static CacheMetrics) -> Self {
        MemorySizedCache {
            inner: Mutex::new(CacheState::infinite(cache_counters)),
        }
    }

    /// If available, returns the cached view of the slice.
    pub fn get<Q>(&self, cache_key: &Q) -> Option<OwnedBytes>
    where
        K: Borrow<Q>,
        Arc<K>: Borrow<Q>,
        Q: Hash + Eq + ?Sized,
    {
        self.inner.lock().unwrap().get(cache_key)
    }

    /// Attempt to put the given amount of data in the cache.
    /// This may fail silently if the owned_bytes slice is larger than the cache
    /// capacity.
    pub fn put(&self, val: K, bytes: OwnedBytes) {
        self.inner.lock().unwrap().put(val, bytes);
    }
}

impl MemorySizedCache<SliceAddress> {
    /// If available, returns the cached view of the slice.
    pub fn get_slice(&self, path: &Path, byte_range: Range<usize>) -> Option<OwnedBytes> {
        let slice_address_ref = SliceAddressRef { path, byte_range };
        self.get(&slice_address_ref as &dyn SliceAddressKey)
    }

    /// Attempt to put the given amount of data in the cache.
    /// This may fail silently if the owned_bytes slice is larger than the cache
    /// capacity.
    pub fn put_slice(&self, path: PathBuf, byte_range: Range<usize>, bytes: OwnedBytes) {
        let slice_address = SliceAddress { path, byte_range };
        self.put(slice_address, bytes);
    }
}

#[cfg(test)]
mod tests {
    use bytesize::ByteSize;

    use super::*;
    use crate::cache::base_cache::LRU_MIN_TIME_SINCE_LAST_ACCESS;
    use crate::metrics::CACHE_METRICS_FOR_TESTS;

    #[tokio::test]
    async fn test_cache_edge_condition() {
        tokio::time::pause();
        let cache = MemorySizedCache::<String>::from_config(
            &ByteSize::b(5).into(),
            &CACHE_METRICS_FOR_TESTS,
        );
        {
            let data = OwnedBytes::new(&b"abc"[..]);
            cache.put("3".to_string(), data);
            assert_eq!(cache.get(&"3".to_string()).unwrap(), &b"abc"[..]);
        }
        {
            let data = OwnedBytes::new(&b"de"[..]);
            cache.put("2".to_string(), data);
            // our first entry should still be here.
            assert_eq!(cache.get(&"3".to_string()).unwrap(), &b"abc"[..]);
            assert_eq!(cache.get(&"2".to_string()).unwrap(), &b"de"[..]);
        }
        {
            let data = OwnedBytes::new(&b"fghij"[..]);
            cache.put("5".to_string(), data);
            // Eviction should not happen, because all items in cache are too young.
            assert!(cache.get(&"5".to_string()).is_none());
        }
        tokio::time::advance(LRU_MIN_TIME_SINCE_LAST_ACCESS.mul_f32(1.1f32)).await;
        {
            let data = OwnedBytes::new(&b"fghij"[..]);
            cache.put("5".to_string(), data);
            assert_eq!(cache.get(&"5".to_string()).unwrap(), &b"fghij"[..]);
            // our two first entries should have be removed from the cache
            assert!(cache.get(&"2".to_string()).is_none());
            assert!(cache.get(&"3".to_string()).is_none());
        }
        tokio::time::advance(LRU_MIN_TIME_SINCE_LAST_ACCESS.mul_f32(1.1f32)).await;
        {
            let data = OwnedBytes::new(&b"klmnop"[..]);
            cache.put("6".to_string(), data);
            // The entry put should have been dismissed as it is too large for the cache
            assert!(cache.get(&"6".to_string()).is_none());
            // The previous entry should however be remaining.
            assert_eq!(cache.get(&"5".to_string()).unwrap(), &b"fghij"[..]);
        }
    }

    #[test]
    fn test_cache_edge_unlimited_capacity() {
        let cache = MemorySizedCache::with_infinite_capacity(&CACHE_METRICS_FOR_TESTS);
        {
            let data = OwnedBytes::new(&b"abc"[..]);
            cache.put("3".to_string(), data);
            assert_eq!(cache.get(&"3".to_string()).unwrap(), &b"abc"[..]);
        }
        {
            let data = OwnedBytes::new(&b"de"[..]);
            cache.put("2".to_string(), data);
            assert_eq!(cache.get(&"3".to_string()).unwrap(), &b"abc"[..]);
            assert_eq!(cache.get(&"2".to_string()).unwrap(), &b"de"[..]);
        }
    }

    #[test]
    fn test_cache() {
        let cache =
            MemorySizedCache::from_config(&ByteSize::kb(10).into(), &CACHE_METRICS_FOR_TESTS);
        assert!(cache.get(&"hello.seg").is_none());
        let data = OwnedBytes::new(&b"werwer"[..]);
        cache.put("hello.seg", data);
        assert_eq!(cache.get(&"hello.seg").unwrap(), &b"werwer"[..]);
    }

    #[test]
    fn test_cache_no_cache() {
        let cache =
            MemorySizedCache::from_config(&CacheConfig::no_cache(), &CACHE_METRICS_FOR_TESTS);
        assert!(cache.get(&"hello.seg").is_none());
        let data = OwnedBytes::new(&b"werwer"[..]);
        cache.put("hello.seg", data);
        assert!(cache.get(&"hello.seg").is_none());
    }
}


================================================
FILE: quickwit/quickwit-storage/src/cache/mod.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

mod base_cache;
mod byte_range_cache;
mod memory_sized_cache;
mod quickwit_cache;
mod slice_address;
mod storage_with_cache;
mod stored_item;

use std::ops::Range;
use std::path::{Path, PathBuf};
use std::sync::Arc;

use async_trait::async_trait;
pub use quickwit_cache::QuickwitCache;
pub use storage_with_cache::StorageWithCache;

pub use self::byte_range_cache::ByteRangeCache;
pub use self::memory_sized_cache::MemorySizedCache;
use crate::{OwnedBytes, Storage};

/// Wraps the given directory with a slice cache that is actually global
/// to quickwit.
///
/// FIXME The current approach is quite horrible in that:
/// - it uses a global
/// - it relies on the idea that all of the files we attempt to cache have universally unique names.
///   It happens to be true today, but this might be very error prone in the future.
pub fn wrap_storage_with_cache(
    long_term_cache: Arc<dyn StorageCache>,
    storage: Arc<dyn Storage>,
) -> Arc<dyn Storage> {
    Arc::new(StorageWithCache {
        storage,
        cache: long_term_cache,
    })
}

/// The `StorageCache` trait is the abstraction used to describe the caching logic
/// used in front of a storage. See `StorageWithCache`.
#[cfg_attr(any(test, feature = "testsuite"), mockall::automock)]
#[async_trait]
pub trait StorageCache: Send + Sync + 'static {
    /// Try to get a slice from the cache.
    async fn get(&self, path: &Path, byte_range: Range<usize>) -> Option<OwnedBytes>;
    /// Try to get the entire file.
    async fn get_all(&self, path: &Path) -> Option<OwnedBytes>;
    /// Put a slice of data into the cache.
    async fn put(&self, path: PathBuf, byte_range: Range<usize>, bytes: OwnedBytes);
    /// Put an entire file into the cache.
    async fn put_all(&self, path: PathBuf, bytes: OwnedBytes);
}


================================================
FILE: quickwit/quickwit-storage/src/cache/quickwit_cache.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::ops::Range;
use std::path::{Path, PathBuf};
use std::sync::Arc;

use async_trait::async_trait;
use quickwit_config::CacheConfig;

use crate::OwnedBytes;
use crate::cache::{MemorySizedCache, StorageCache};
use crate::metrics::CacheMetrics;

const FULL_SLICE: Range<usize> = 0..usize::MAX;

/// Quickwit storage cache with a size limit.
/// It is used currently by to cache only fast fields data.
pub struct QuickwitCache {
    router: Vec<(&'static str, Arc<dyn StorageCache>)>,
}

impl From<Vec<(&'static str, Arc<dyn StorageCache>)>> for QuickwitCache {
    fn from(router: Vec<(&'static str, Arc<dyn StorageCache>)>) -> Self {
        QuickwitCache { router }
    }
}

impl QuickwitCache {
    /// Creates a [`QuickwitCache`] with a cache on fast fields.
    pub fn new(cache_config: &CacheConfig) -> Self {
        let mut quickwit_cache = QuickwitCache::empty();
        let fast_field_cache_counters: &'static CacheMetrics =
            &crate::STORAGE_METRICS.fast_field_cache;
        quickwit_cache.add_route(
            ".fast",
            Arc::new(SimpleCache::from_config(
                cache_config,
                fast_field_cache_counters,
            )),
        );
        quickwit_cache
    }

    /// Empties cache.
    pub fn empty() -> QuickwitCache {
        QuickwitCache::from(Vec::new())
    }

    /// Adds a caching route defined by a path suffix. All elements with a path matching
    /// this suffix will be cached.
    pub fn add_route(&mut self, path_suffix: &'static str, route_cache: Arc<dyn StorageCache>) {
        self.router.push((path_suffix, route_cache));
    }

    fn get_relevant_cache(&self, path: &Path) -> Option<&dyn StorageCache> {
        for (suffix, cache) in &self.router {
            if path.to_string_lossy().ends_with(suffix) {
                return Some(cache.as_ref());
            }
        }
        None
    }
}

#[async_trait]
impl StorageCache for QuickwitCache {
    async fn get(&self, path: &Path, byte_range: Range<usize>) -> Option<OwnedBytes> {
        // We don't check for the presence of the entire file in the
        // cache.
        // That's voluntary to avoid messing with the cache miss counts.
        if let Some(cache) = self.get_relevant_cache(path) {
            return cache.get(path, byte_range).await;
        }
        None
    }

    async fn get_all(&self, path: &Path) -> Option<OwnedBytes> {
        if let Some(cache) = self.get_relevant_cache(path) {
            return cache.get_all(path).await;
        }
        None
    }

    async fn put(&self, path: PathBuf, byte_range: Range<usize>, bytes: OwnedBytes) {
        if let Some(cache) = self.get_relevant_cache(&path) {
            cache.put(path, byte_range, bytes).await;
        }
    }

    async fn put_all(&self, path: PathBuf, bytes: OwnedBytes) {
        if let Some(cache) = self.get_relevant_cache(&path) {
            cache.put(path, FULL_SLICE, bytes).await;
        }
    }
}

/// The Quickwit cache logic is very simple for the moment.
///
/// It stores hotcache files using an LRU cache.
///
/// HACK! We use `0..usize::MAX` to signify the "entire file".
/// TODO fixme
struct SimpleCache {
    slice_cache: MemorySizedCache,
}

impl SimpleCache {
    fn from_config(cache_config: &CacheConfig, cache_counters: &'static CacheMetrics) -> Self {
        SimpleCache {
            slice_cache: MemorySizedCache::from_config(cache_config, cache_counters),
        }
    }
}

#[async_trait]
impl StorageCache for SimpleCache {
    async fn get(&self, path: &Path, byte_range: Range<usize>) -> Option<OwnedBytes> {
        if let Some(bytes) = self.slice_cache.get_slice(path, byte_range) {
            return Some(bytes);
        }
        None
    }

    async fn put(&self, path: PathBuf, byte_range: Range<usize>, bytes: OwnedBytes) {
        self.slice_cache.put_slice(path, byte_range, bytes);
    }

    async fn get_all(&self, path: &Path) -> Option<OwnedBytes> {
        self.slice_cache.get_slice(path, FULL_SLICE)
    }

    async fn put_all(&self, path: PathBuf, bytes: OwnedBytes) {
        self.slice_cache.put_slice(path, FULL_SLICE.clone(), bytes);
    }
}

#[cfg(test)]
mod tests {
    use std::path::Path;
    use std::sync::Arc;

    use super::QuickwitCache;
    use crate::cache::StorageCache;
    use crate::{MockStorageCache, OwnedBytes};

    #[tokio::test]
    async fn test_quickwit_cache_get_all() {
        let mock_cache_hotcache = MockStorageCache::default();
        let mut mock_cache_fast = MockStorageCache::default();
        mock_cache_fast
            .expect_get_all()
            .times(1)
            .withf(|path| path == Path::new("bubu/toto.fast"))
            .returning(|_| Some(OwnedBytes::new(&b"aaaa"[..])));
        let mut quickwit_cache = QuickwitCache::empty();
        quickwit_cache.add_route("hotcache", Arc::new(mock_cache_hotcache));
        quickwit_cache.add_route("fast", Arc::new(mock_cache_fast));
        quickwit_cache.get_all(Path::new("bubu/toto.fast")).await;
    }

    #[tokio::test]
    async fn test_quickwit_cache_get() {
        let mock_cache_hotcache = MockStorageCache::default();
        let mut mock_cache = MockStorageCache::default();
        mock_cache
            .expect_get()
            .times(1)
            .withf(|path, _| path == Path::new("bubu/toto.fast"))
            .returning(|_, _| Some(OwnedBytes::new(&b"aaaaa"[..])));
        let mut quickwit_cache = QuickwitCache::empty();
        quickwit_cache.add_route("hotcache", Arc::new(mock_cache_hotcache));
        quickwit_cache.add_route("fast", Arc::new(mock_cache));
        quickwit_cache.get(Path::new("bubu/toto.fast"), 5..10).await;
    }

    #[tokio::test]
    async fn test_quickwit_cache_priority() {
        let mut mock_cache_ast = MockStorageCache::default();
        mock_cache_ast
            .expect_get()
            .times(1)
            .withf(|path, _| path == Path::new("bubu/toto.fast"))
            .returning(|_, _| Some(OwnedBytes::new(&b"aaaaa"[..])));
        let mock_cache_fast = MockStorageCache::default();
        let mut quickwit_cache = QuickwitCache::empty();
        quickwit_cache.add_route("ast", Arc::new(mock_cache_ast));
        quickwit_cache.add_route("fast", Arc::new(mock_cache_fast));
        assert_eq!(
            quickwit_cache
                .get(Path::new("bubu/toto.fast"), 5..10)
                .await
                .unwrap(),
            &b"aaaaa"[..]
        );
    }
}


================================================
FILE: quickwit/quickwit-storage/src/cache/slice_address.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::borrow::Borrow;
use std::hash::{Hash, Hasher};
use std::ops::Range;
use std::path::{Path, PathBuf};

#[derive(Hash, Clone, Debug, Eq, PartialEq)]
pub struct SliceAddress {
    pub path: PathBuf,
    pub byte_range: Range<usize>,
}

// ------------------------------------------------------------
// The following struct exists to make it possible to
// fetch a slice from a cache without cloning PathBuf.

// The trick is described in https://github.com/sunshowers-code/borrow-complex-key-example/blob/main/src/lib.rs

#[derive(Clone, Debug, Eq, Hash, PartialEq)]
pub(crate) struct SliceAddressRef<'a> {
    pub path: &'a Path,
    pub byte_range: Range<usize>,
}

pub(crate) trait SliceAddressKey {
    fn key(&self) -> SliceAddressRef<'_>;
}

impl SliceAddressKey for SliceAddress {
    fn key(&self) -> SliceAddressRef<'_> {
        SliceAddressRef {
            path: self.path.as_path(),
            byte_range: self.byte_range.clone(),
        }
    }
}

impl SliceAddressKey for SliceAddressRef<'_> {
    fn key(&self) -> SliceAddressRef<'_> {
        self.clone()
    }
}

impl<'a> Borrow<dyn SliceAddressKey + 'a> for std::sync::Arc<SliceAddress> {
    fn borrow(&self) -> &(dyn SliceAddressKey + 'a) {
        &**self
    }
}

impl<'a> Borrow<dyn SliceAddressKey + 'a> for SliceAddress {
    fn borrow(&self) -> &(dyn SliceAddressKey + 'a) {
        self
    }
}
impl PartialEq for dyn SliceAddressKey + '_ {
    fn eq(&self, other: &Self) -> bool {
        self.key().eq(&other.key())
    }
}

impl Eq for dyn SliceAddressKey + '_ {}

impl Hash for dyn SliceAddressKey + '_ {
    fn hash<H: Hasher>(&self, state: &mut H) {
        self.key().hash(state)
    }
}


================================================
FILE: quickwit/quickwit-storage/src/cache/storage_with_cache.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::fmt;
use std::ops::Range;
use std::path::Path;
use std::sync::Arc;

use async_trait::async_trait;
use quickwit_common::uri::Uri;
use tokio::io::AsyncRead;

use crate::cache::StorageCache;
use crate::storage::SendableAsync;
use crate::{BulkDeleteError, OwnedBytes, Storage, StorageResult};

/// Use with care, StorageWithCache is read-only.
pub struct StorageWithCache {
    pub storage: Arc<dyn Storage>,
    pub cache: Arc<dyn StorageCache>,
}

impl fmt::Debug for StorageWithCache {
    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
        f.debug_struct("StorageWithCache").finish()
    }
}

#[async_trait]
impl Storage for StorageWithCache {
    async fn check_connectivity(&self) -> anyhow::Result<()> {
        self.storage.check_connectivity().await
    }

    async fn put(
        &self,
        path: &Path,
        _payload: Box<dyn crate::PutPayload>,
    ) -> crate::StorageResult<()> {
        unimplemented!("StorageWithCache is readonly. Failed to put {:?}", path)
    }

    async fn copy_to(&self, path: &Path, output: &mut dyn SendableAsync) -> StorageResult<()> {
        self.storage.copy_to(path, output).await
    }

    async fn get_slice(&self, path: &Path, byte_range: Range<usize>) -> StorageResult<OwnedBytes> {
        if let Some(bytes) = self.cache.get(path, byte_range.clone()).await {
            Ok(bytes)
        } else {
            let bytes = self.storage.get_slice(path, byte_range.clone()).await?;
            self.cache
                .put(path.to_owned(), byte_range, bytes.clone())
                .await;
            Ok(bytes)
        }
    }

    async fn get_slice_stream(
        &self,
        path: &Path,
        _range: Range<usize>,
    ) -> StorageResult<Box<dyn AsyncRead + Send + Unpin>> {
        unimplemented!(
            "StorageWithCache does not support streamed read yet. Failed to get {:?}",
            path
        )
    }

    async fn get_all(&self, path: &Path) -> StorageResult<OwnedBytes> {
        if let Some(bytes) = self.cache.get_all(path).await {
            Ok(bytes)
        } else {
            let bytes = self.storage.get_all(path).await?;
            self.cache.put_all(path.to_owned(), bytes.clone()).await;
            Ok(bytes)
        }
    }

    async fn delete(&self, path: &Path) -> StorageResult<()> {
        unimplemented!("Failed to delete file `{path:?}`. `StorageWithCache` is read-only.")
    }

    async fn bulk_delete<'a>(&self, paths: &[&'a Path]) -> Result<(), BulkDeleteError> {
        unimplemented!("Failed to delete files `{paths:?}`. `StorageWithCache` is read-only.")
    }

    async fn exists(&self, path: &Path) -> StorageResult<bool> {
        self.storage.exists(path).await
    }

    async fn file_num_bytes(&self, path: &Path) -> StorageResult<u64> {
        self.storage.file_num_bytes(path).await
    }

    fn uri(&self) -> &Uri {
        self.storage.uri()
    }
}

#[cfg(test)]
mod tests {
    use std::collections::HashMap;
    use std::path::PathBuf;
    use std::sync::Mutex;

    use super::*;
    use crate::{MockStorage, MockStorageCache, OwnedBytes};

    #[tokio::test]
    async fn put_in_cache_test() {
        let mut mock_storage = MockStorage::default();
        let mut mock_cache = MockStorageCache::default();
        let actual_cache: Arc<Mutex<HashMap<PathBuf, OwnedBytes>>> =
            Arc::new(Mutex::new(HashMap::new()));

        let cache1 = actual_cache.clone();
        mock_cache
            .expect_get_all()
            .times(2)
            .returning(move |path| cache1.lock().unwrap().get(path).cloned());
        mock_cache
            .expect_put_all()
            .times(1)
            .returning(move |path, data| {
                let actual_cache = actual_cache.clone();
                actual_cache.lock().unwrap().insert(path, data);
            });

        mock_storage
            .expect_get_all()
            .times(1)
            .returning(|_path| Ok(OwnedBytes::new(vec![1, 2, 3])));

        let storage_with_cache = StorageWithCache {
            storage: Arc::new(mock_storage),
            cache: Arc::new(mock_cache),
        };

        let data1 = storage_with_cache
            .get_all(Path::new("cool_file"))
            .await
            .unwrap();
        // hitting the cache
        let data2 = storage_with_cache
            .get_all(Path::new("cool_file"))
            .await
            .unwrap();
        assert_eq!(data1, data2);
    }
}


================================================
FILE: quickwit/quickwit-storage/src/cache/stored_item.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use tantivy::directory::OwnedBytes;
use tokio::time::Instant;

/// It is a bit overkill to put this in its own module, but I
/// wanted to ensure that no one would access payload without updating `last_access_time`.
pub(super) struct StoredItem<V = OwnedBytes> {
    last_access_time: Instant,
    payload: V,
}

impl<V> StoredItem<V> {
    pub fn new(payload: V, now: Instant) -> Self {
        StoredItem {
            last_access_time: now,
            payload,
        }
    }
}

impl<V: ValueLen + Clone> StoredItem<V> {
    pub fn payload(&mut self) -> V {
        self.last_access_time = Instant::now();
        self.payload.clone()
    }

    pub fn len(&self) -> usize {
        self.payload.len()
    }

    pub fn last_access_time(&self) -> Instant {
        self.last_access_time
    }
}

pub(crate) trait ValueLen {
    fn len(&self) -> usize;
}

impl ValueLen for OwnedBytes {
    fn len(&self) -> usize {
        OwnedBytes::len(self)
    }
}


================================================
FILE: quickwit/quickwit-storage/src/debouncer.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::fmt;
use std::hash::Hash;
use std::ops::Range;
use std::path::{Path, PathBuf};
use std::sync::{Arc, Mutex};

use async_trait::async_trait;
use fnv::FnvHashMap;
use futures::future::{BoxFuture, WeakShared};
use futures::{Future, FutureExt};
use quickwit_common::uri::Uri;
use tantivy::directory::OwnedBytes;
use tokio::io::AsyncRead;

use crate::storage::SendableAsync;
use crate::{BulkDeleteError, Storage, StorageResult};

/// The AsyncDebouncer debounces inflight Futures, so that concurrent async request to the same data
/// source can be deduplicated.
///
/// Since we pass the Future potentially to multiple consumer, everything needs to be cloneable. The
/// data and the future. This is reflected on the generic type bounds for the value V: Clone.
///
/// Since most Futures return an Result<V, Error>, this also encompasses the error.
pub struct AsyncDebouncer<K, V: Clone> {
    cache: Mutex<FnvHashMap<K, WeakShared<BoxFuture<'static, V>>>>,
}

impl<K, V: Clone> Default for AsyncDebouncer<K, V> {
    fn default() -> Self {
        Self {
            cache: Default::default(),
        }
    }
}

impl<K: Hash + Eq + Clone, V: Clone> AsyncDebouncer<K, V> {
    /// Returns the number of inflight futures.
    pub fn len(&self) -> usize {
        self.cache.lock().unwrap().len()
    }

    /// Cleanup
    /// In case there is already an existing Future for the passed key, the constructor is not
    /// used.
    fn cleanup(&self) {
        let mut guard = self.cache.lock().unwrap();
        guard.retain(|_, v| v.upgrade().is_some());
    }

    /// Instead of the future directly, a constructor to build the future is passed.
    /// In case there is already an existing Future for the passed key, the constructor is not
    /// used.
    pub async fn get_or_create<T, F>(&self, key: K, build_a_future: T) -> V
    where
        T: FnOnce() -> F,
        F: Future<Output = V> + Send + 'static,
    {
        self.cleanup();

        // explicit scope to drop the lock
        let weak_fut_opt = { self.cache.lock().unwrap().get(&key).cloned() };
        if let Some(weak_future) = weak_fut_opt
            && let Some(future) = weak_future.upgrade()
        {
            return future.await;
        }

        let fut = Box::pin(build_a_future()) as BoxFuture<'static, V>;
        let fut = fut.shared();
        self.cache.lock().unwrap().insert(
            key.clone(),
            fut.clone().downgrade().expect(
                "future has been dropped, but that shouldn't happen since it's still in scope",
            ),
        );
        let res = fut.await;

        self.cache.lock().unwrap().remove(&key);

        res
    }
}

type DebouncerKey = (PathBuf, Range<usize>);

/// Just to keep in mind there is a race condition on debouncing, when combined with delete
///
/// All on the same key
/// start get R1
/// start delete R2
/// end delete R2
/// start get R3
/// end get R1
/// end get R3
///
/// ==> R3 would return the cached result, although the resource has been deleted.
pub(crate) struct DebouncedStorage<T> {
    // wrap both in Arc, because the Future is stored in the cache, which has 'static lifetime
    // associated
    underlying: Arc<T>,
    slice_debouncer: Arc<AsyncDebouncer<DebouncerKey, StorageResult<OwnedBytes>>>,
}

impl<T> fmt::Debug for DebouncedStorage<T> {
    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
        f.debug_struct("DebouncedStorage").finish()
    }
}

impl<T: Storage> DebouncedStorage<T> {
    pub(crate) fn new(underlying: T) -> Self {
        Self {
            underlying: Arc::new(underlying),
            slice_debouncer: Arc::new(AsyncDebouncer::default()),
        }
    }
}

#[async_trait]
impl<T: Storage> Storage for DebouncedStorage<T> {
    async fn check_connectivity(&self) -> anyhow::Result<()> {
        self.underlying.check_connectivity().await
    }

    async fn put(
        &self,
        path: &Path,
        payload: Box<dyn crate::PutPayload>,
    ) -> crate::StorageResult<()> {
        self.underlying.put(path, payload).await
    }

    async fn copy_to(&self, path: &Path, output: &mut dyn SendableAsync) -> StorageResult<()> {
        self.underlying.copy_to(path, output).await
    }

    async fn get_slice(&self, path: &Path, range: Range<usize>) -> StorageResult<OwnedBytes> {
        let (debouncer, underlying) = (self.slice_debouncer.clone(), self.underlying.clone());
        let key = (path.to_owned(), range);
        debouncer
            .get_or_create(key.clone(), || async move {
                underlying.get_slice(&key.0, key.1).await
            })
            .await
    }

    async fn get_slice_stream(
        &self,
        path: &Path,
        range: Range<usize>,
    ) -> StorageResult<Box<dyn AsyncRead + Send + Unpin>> {
        // Getting a stream bypasses the debouncer
        self.underlying.get_slice_stream(path, range).await
    }

    async fn delete(&self, path: &Path) -> StorageResult<()> {
        self.underlying.delete(path).await
    }

    async fn bulk_delete<'a>(&self, paths: &[&'a Path]) -> Result<(), BulkDeleteError> {
        self.underlying.bulk_delete(paths).await
    }

    async fn get_all(&self, path: &Path) -> StorageResult<OwnedBytes> {
        let (debouncer, underlying) = (self.slice_debouncer.clone(), self.underlying.clone());
        let key = (path.to_owned(), 0..usize::MAX);
        debouncer
            .get_or_create(
                key.clone(),
                || async move { underlying.get_all(&key.0).await },
            )
            .await
    }

    fn uri(&self) -> &Uri {
        self.underlying.uri()
    }

    async fn file_num_bytes(&self, path: &Path) -> StorageResult<u64> {
        self.underlying.file_num_bytes(path).await
    }
}

#[cfg(test)]
mod tests {

    use std::ops::Range;
    use std::path::PathBuf;
    use std::sync::Arc;
    use std::sync::atomic::{AtomicU32, Ordering};
    use std::time::Duration;

    use once_cell::sync::OnceCell;
    use tempfile::TempDir;
    use tokio::fs::{self, File};
    use tokio::io::AsyncWriteExt;
    use tokio::task;

    use super::*;

    #[test]
    fn test_sync_and_send() {
        fn is_sync<T: Sync>() {}
        fn is_send<T: Send>() {}
        is_sync::<AsyncDebouncer<String, Result<String, String>>>();
        is_send::<AsyncDebouncer<String, Result<String, String>>>();
    }

    #[derive(Hash, Clone, Debug, Eq, PartialEq)]
    pub struct SliceAddress {
        pub path: PathBuf,
        pub byte_range: Range<usize>,
    }

    async fn get_test_file(temp_dir: &TempDir) -> Arc<PathBuf> {
        let test_filepath1 = Arc::new(temp_dir.path().join("f1"));

        let mut file1 = File::create(test_filepath1.as_ref()).await.unwrap();
        file1.write_all("nice cache dude".as_bytes()).await.unwrap();
        test_filepath1
    }

    #[tokio::test]
    async fn test_async_slice_cache() {
        // test data

        let temp_dir = tempfile::tempdir().unwrap();
        let test_filepath1 = get_test_file(&temp_dir).await;

        let cache: AsyncDebouncer<SliceAddress, Result<String, String>> = AsyncDebouncer::default();

        let addr1 = SliceAddress {
            path: test_filepath1.as_ref().clone(),
            byte_range: 10..20,
        };

        static COUNT: AtomicU32 = AtomicU32::new(0);

        // Load via closure
        let _val = cache
            .get_or_create(addr1.clone(), || {
                let test_filepath1 = test_filepath1.clone();
                async move {
                    COUNT.fetch_add(1, Ordering::SeqCst);
                    let contents = Box::pin(fs::read_to_string(test_filepath1.as_ref().clone()))
                        .await
                        // to string, so that the error is cloneable
                        .map_err(|err| err.to_string())?;

                    Ok(contents)
                }
            })
            .await
            .unwrap();

        // Load via function
        let _val = cache
            .get_or_create(addr1, || {
                load_via_fn(test_filepath1.as_ref().clone(), &COUNT)
            })
            .await
            .unwrap();

        assert_eq!(COUNT.load(Ordering::SeqCst), 2);

        // Load via function, new entry
        let addr2 = SliceAddress {
            path: test_filepath1.as_ref().clone(),
            byte_range: 10..30,
        };

        let _val = cache
            .get_or_create(addr2.to_owned(), || {
                load_via_fn(test_filepath1.as_ref().clone(), &COUNT)
            })
            .await
            .unwrap();

        assert_eq!(COUNT.load(Ordering::SeqCst), 3);

        let load = || load_via_fn(test_filepath1.as_ref().clone(), &COUNT);

        let handles = vec![
            cache.get_or_create(addr2.to_owned(), load),
            cache.get_or_create(addr2.to_owned(), load),
        ];

        futures::future::join_all(handles).await;

        // Count is only increased by one, because of debouncing
        assert_eq!(COUNT.load(Ordering::SeqCst), 4);

        // Quadruple debouncing
        let handles = vec![
            cache.get_or_create(addr2.to_owned(), load),
            cache.get_or_create(addr2.to_owned(), load),
            cache.get_or_create(addr2.to_owned(), load),
            cache.get_or_create(addr2.to_owned(), load),
        ];
        futures::future::join_all(handles).await;

        // Count is only increased by one, because of debouncing
        assert_eq!(COUNT.load(Ordering::SeqCst), 5);
    }

    #[tokio::test]
    async fn test_debounce() {
        let temp_dir = tempfile::tempdir().unwrap();
        let test_filepath1 = get_test_file(&temp_dir).await;

        let cache: AsyncDebouncer<SliceAddress, Result<String, String>> = AsyncDebouncer::default();

        let addr2 = SliceAddress {
            path: test_filepath1.as_ref().clone(),
            byte_range: 10..20,
        };
        static COUNT: AtomicU32 = AtomicU32::new(0);

        let load = || load_via_fn(test_filepath1.as_ref().clone(), &COUNT);

        let handles = vec![
            cache.get_or_create(addr2.to_owned(), load),
            cache.get_or_create(addr2.to_owned(), load),
        ];

        futures::future::join_all(handles).await;

        // Count is only increased by one, because of debouncing
        assert_eq!(COUNT.load(Ordering::SeqCst), 1);
    }

    #[tokio::test]
    async fn test_cancellation_future() {
        use tokio::time::timeout;
        let cache: AsyncDebouncer<String, Result<String, String>> = AsyncDebouncer::default();

        let load = || async {
            timeout(Duration::from_millis(10), load_via_fn2())
                .await
                .map_err(|err| err.to_string())
        };

        cache
            .get_or_create("key1".to_owned(), load)
            .await
            .unwrap_err();
        tokio::time::sleep(Duration::from_secs(1)).await;
        let val = cache.get_or_create("key1".to_owned(), load).await;
        assert!(val.is_err());
    }

    async fn load_via_fn2() -> String {
        tokio::time::sleep(Duration::from_millis(500)).await;
        "blub".to_string()
    }

    pub static GLOBAL_DEBOUNCER: once_cell::sync::OnceCell<AsyncDebouncer<String, String>> =
        OnceCell::new();
    pub fn get_global_debouncer() -> &'static AsyncDebouncer<String, String> {
        GLOBAL_DEBOUNCER.get_or_init(AsyncDebouncer::default)
    }

    #[tokio::test]
    async fn test_cancellation_task() {
        let load = || async { load_via_fn2().await };

        let handle = task::spawn(async move {
            get_global_debouncer()
                .get_or_create("key1".to_owned(), load)
                .await
        });
        tokio::time::sleep(Duration::from_millis(10)).await;
        // This will cause  the Future to be cancelled, so it will not be polled anymore.
        // That also means the remove in the cache is not called, which is awaiting the future
        handle.abort();

        tokio::time::sleep(Duration::from_secs(1)).await;
        // The task still hangs unfinished
        assert_eq!(get_global_debouncer().len(), 1);

        // The next get clears
        get_global_debouncer()
            .get_or_create("key1".to_owned(), load)
            .await;

        tokio::time::sleep(Duration::from_secs(1)).await;
        assert_eq!(get_global_debouncer().len(), 0);
    }

    async fn load_via_fn(path: PathBuf, cnt: &AtomicU32) -> Result<String, String> {
        cnt.fetch_add(1, Ordering::SeqCst);
        let contents = Box::pin(fs::read_to_string(path))
            .await
            .map_err(|err| err.to_string())?;
        // sleep so the requests can be reproducible debounced
        tokio::time::sleep(Duration::from_millis(10)).await;
        Ok(contents)
    }
}


================================================
FILE: quickwit/quickwit-storage/src/error.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::HashMap;
use std::path::PathBuf;
use std::sync::Arc;
use std::{fmt, io};

use serde::{Deserialize, Serialize};
use tantivy::directory::error::{OpenDirectoryError, OpenReadError};
use thiserror::Error;

/// Storage error kind.
#[derive(Clone, Copy, Debug, Eq, PartialEq, Serialize, Deserialize)]
pub enum StorageErrorKind {
    /// The target file does not exist.
    NotFound,
    /// The request credentials do not allow for this operation.
    Unauthorized,
    /// A third-party service forbids this operation, or is misconfigured.
    Service,
    /// Any generic internal error.
    Internal,
    /// A timeout occurred during the operation.
    Timeout,
    /// Io error.
    Io,
}

/// Generic Storage Resolver Error.
#[allow(missing_docs)]
#[derive(Debug, Clone, thiserror::Error, Serialize, Deserialize)]
pub enum StorageResolverError {
    /// The storage config is invalid.
    #[error("invalid storage config: `{0}`")]
    InvalidConfig(String),

    /// The URI is malformed or does not contain sufficient information to connect to the storage.
    #[error("invalid storage URI: `{0}`")]
    InvalidUri(String),

    /// The requested backend is unsupported or unavailable.
    #[error("unsupported storage backend: `{0}`")]
    UnsupportedBackend(String),

    /// The URI is valid, and is meant to be handled by this resolver,
    /// but the resolver failed to actually connect to the storage.
    /// e.g. connection error, credentials error, incompatible version,
    /// internal error in third party, etc.
    #[error("failed to open storage {kind:?}: {message}")]
    FailedToOpenStorage {
        kind: crate::StorageErrorKind,
        message: String,
    },
}

impl StorageErrorKind {
    /// Creates a StorageError.
    pub fn with_error(self, source: impl Into<anyhow::Error>) -> StorageError {
        StorageError {
            kind: self,
            source: Arc::new(source.into()),
        }
    }
}

impl From<StorageError> for io::Error {
    fn from(storage_err: StorageError) -> Self {
        let io_error_kind = match storage_err.kind() {
            StorageErrorKind::NotFound => io::ErrorKind::NotFound,
            _ => io::ErrorKind::Other,
        };
        // TODO: This is swallowing the context of the source error.
        io::Error::new(io_error_kind, storage_err.source.to_string())
    }
}

/// Generic StorageError.
#[derive(Debug, Clone, Error)]
#[error("storage error(kind={kind:?}, source={source})")]
#[allow(missing_docs)]
pub struct StorageError {
    pub kind: StorageErrorKind,
    #[source]
    source: Arc<anyhow::Error>,
}

/// Generic Result type for storage operations.
pub type StorageResult<T> = Result<T, StorageError>;

impl StorageError {
    /// Add some context to the wrapper error.
    pub fn add_context<C>(self, ctx: C) -> Self
    where C: fmt::Display + Send + Sync + 'static {
        StorageError {
            kind: self.kind,
            source: Arc::new(anyhow::anyhow!("{ctx}").context(self.source)),
        }
    }

    /// Returns the corresponding `StorageErrorKind` for this error.
    pub fn kind(&self) -> StorageErrorKind {
        self.kind
    }
}

impl From<io::Error> for StorageError {
    fn from(err: io::Error) -> StorageError {
        match err.kind() {
            io::ErrorKind::NotFound => StorageErrorKind::NotFound.with_error(err),
            _ => StorageErrorKind::Io.with_error(err),
        }
    }
}

impl From<OpenDirectoryError> for StorageError {
    fn from(err: OpenDirectoryError) -> StorageError {
        match err {
            OpenDirectoryError::DoesNotExist(_) => StorageErrorKind::NotFound.with_error(err),
            _ => StorageErrorKind::Io.with_error(err),
        }
    }
}

impl From<OpenReadError> for StorageError {
    fn from(err: OpenReadError) -> StorageError {
        match err {
            OpenReadError::FileDoesNotExist(_) => StorageErrorKind::NotFound.with_error(err),
            _ => StorageErrorKind::Io.with_error(err),
        }
    }
}

/// Error returned by `bulk_delete`. Under the hood, `bulk_delete` groups the files to
/// delete into multiple batches of fixed size and issues one delete objects request per batch. The
/// whole operation can fail in multiples ways, which is reflected by the quirkiness of the API of
/// [`BulkDeleteError`]. First, a batch can fail partially, i.e. some objects are deleted while
/// others are not. The `successes` and `failures` attributes of the error will be populated
/// accordingly. Second, a batch can fail completely, in which case the `error` field will be set.
/// Because a batch failing entirely usually indicates a systemic error, for instance, a connection
/// or credentials issue, `bulk_delete` does not attempt to delete the remaining batches and
/// populates the `unattempted` attribute. Consequently, the attributes of this error are not
/// "mutually exclusive": there exists a path where all those fields are not empty. The caller is
/// expected to handle this error carefully and inspect the instance thoroughly before any retry
/// attempt.
#[must_use]
#[derive(Debug, Default, thiserror::Error)]
pub struct BulkDeleteError {
    /// Error that occurred for a whole batch and caused the entire deletion operation to be
    /// aborted.
    pub error: Option<StorageError>,
    /// List of files that were successfully deleted, including non-existing files.
    pub successes: Vec<PathBuf>,
    /// List of files that failed to be deleted along with the corresponding failure descriptions.
    pub failures: HashMap<PathBuf, DeleteFailure>,
    /// List of remaining files to delete before the operation was aborted.
    pub unattempted: Vec<PathBuf>,
}

/// Describes the failure for an individual file in a batch delete operation.
#[derive(Debug, Default)]
pub struct DeleteFailure {
    /// The error that occurred for this file.
    pub error: Option<StorageError>,
    /// The failure code is a string that uniquely identifies an error condition. It is meant to be
    /// read and understood by programs that detect and handle errors by type.
    pub code: Option<String>,
    /// The error message contains a generic description of the error condition in English. It is
    /// intended for a human audience. Simple programs display the message directly to the end user
    /// if they encounter an error condition they don't know how or don't care to handle.
    /// Sophisticated programs with more exhaustive error handling and proper internationalization
    /// are more likely to ignore the error message.
    pub message: Option<String>,
}

impl fmt::Display for BulkDeleteError {
    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
        write!(
            f,
            "bulk delete error ({} success(es),  {} failure(s), {} unattempted)",
            self.successes.len(),
            self.failures.len(),
            self.unattempted.len()
        )?;
        Ok(())
    }
}


================================================
FILE: quickwit/quickwit-storage/src/file_descriptor_cache.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::fs::File;
use std::io;
use std::num::{NonZeroU32, NonZeroUsize};
use std::ops::Range;
use std::path::{Path, PathBuf};
use std::sync::{Arc, Mutex};

use tantivy::directory::OwnedBytes;
use tokio::sync::{OwnedSemaphorePermit, Semaphore};
use ulid::Ulid;

use crate::metrics::SingleCacheMetrics;

pub struct FileDescriptorCache {
    fd_cache: Mutex<lru::LruCache<Ulid, SplitFile>>,
    fd_semaphore: Arc<Semaphore>,
    fd_cache_metrics: SingleCacheMetrics,
}

#[derive(Clone)]
pub struct SplitFile(Arc<SplitFileInner>);

struct SplitFileInner {
    num_bytes: u64,
    // Order matters here. We want file to be dropped (closed) before the semaphore.
    file: File,
    _fd_semaphore_guard: OwnedSemaphorePermit,
}

fn get_split_file_path(root_path: &Path, split_id: Ulid) -> PathBuf {
    let split_filename = quickwit_common::split_file(split_id);
    root_path.join(split_filename)
}

impl FileDescriptorCache {
    /// Creates a new file descriptor cache.
    /// `max_fd_limit` is the total number of file descriptors that can be open at the same time.
    /// `fd_cache_capacity` is the number of file descriptors that can be cached. It is required to
    /// be less than `max_fd_limit`.
    ///
    /// # Warning
    ///
    /// The file descriptor cache can be prone to deadlocks.
    /// Currently the risk is only avoided due to the split search concurrency limit.
    ///
    /// When setting the two limit, ensure the max_fd_limit is higher than the split search
    /// concurrency limit and that you have set some margin between the two, and also make sure
    /// the `max_fd_limit` is sufficient to avoid deadlocks.
    ///
    /// TODO It would be good to refactor this to enforce this with a bit of a refactoring.
    /// For instance, client could be forced to declare upfront the number of file descriptors they
    /// will need. In Quickwit however, one task is hitting one split at a time, so the risk is
    /// absent.
    fn new(
        max_fd_limit: NonZeroU32,
        fd_cache_capacity: NonZeroU32,
        fd_cache_metrics: SingleCacheMetrics,
    ) -> FileDescriptorCache {
        assert!(max_fd_limit.get() > fd_cache_capacity.get());
        let fd_cache = Mutex::new(lru::LruCache::new(
            NonZeroUsize::new(fd_cache_capacity.get() as usize).unwrap(),
        ));
        let fd_semaphore = Arc::new(Semaphore::new(max_fd_limit.get() as usize));
        FileDescriptorCache {
            fd_cache,
            fd_semaphore,
            fd_cache_metrics,
        }
    }

    pub fn with_fd_cache_capacity(fd_cache_capacity: NonZeroU32) -> FileDescriptorCache {
        let max_fd_limit = (fd_cache_capacity.get() * 2)
            .clamp(fd_cache_capacity.get() + 100, fd_cache_capacity.get() + 200);
        Self::new(
            NonZeroU32::new(max_fd_limit).unwrap(),
            fd_cache_capacity,
            crate::STORAGE_METRICS
                .fd_cache_metrics
                .cache_metrics
                .clone(),
        )
    }

    fn get_split_file(&self, split_id: Ulid) -> Option<SplitFile> {
        self.fd_cache.lock().unwrap().get(&split_id).cloned()
    }

    fn put_split_file(&self, split_id: Ulid, split_file: SplitFile) {
        let mut fd_cache_lock = self.fd_cache.lock().unwrap();
        fd_cache_lock.push(split_id, split_file);
        self.fd_cache_metrics
            .in_cache_count
            .set(fd_cache_lock.len() as i64);
    }

    /// Evicts the given list of split ids from the file descriptor cache.
    /// This method does NOT remove the actual files.
    pub fn evict_split_files(&self, split_ids: &[Ulid]) {
        let mut fd_cache_lock = self.fd_cache.lock().unwrap();
        for split_id in split_ids {
            fd_cache_lock.pop(split_id);
        }
        self.fd_cache_metrics
            .in_cache_count
            .set(fd_cache_lock.len() as i64);
        self.fd_cache_metrics
            .evict_num_items
            .inc_by(split_ids.len() as u64);
    }

    pub async fn get_or_open_split_file(
        &self,
        root_path: &Path,
        split_id: Ulid,
        num_bytes: u64,
    ) -> std::io::Result<SplitFile> {
        if let Some(split_file) = self.get_split_file(split_id) {
            self.fd_cache_metrics.hits_num_items.inc();
            return Ok(split_file);
        } else {
            self.fd_cache_metrics.misses_num_items.inc();
        }
        let split_path = get_split_file_path(root_path, split_id);
        let fd_semaphore_guard = Semaphore::acquire_owned(self.fd_semaphore.clone())
            .await
            .expect("fd_semaphore acquire failed. please report");
        let file: File = tokio::task::spawn_blocking(move || std::fs::File::open(split_path))
            .await
            .map_err(|join_error| {
                io::Error::other(format!("failed to open file: {join_error:?}"))
            })??;
        let split_file = SplitFile(Arc::new(SplitFileInner {
            num_bytes,
            file,
            _fd_semaphore_guard: fd_semaphore_guard,
        }));
        self.put_split_file(split_id, split_file.clone());
        Ok(split_file)
    }
}

impl SplitFile {
    pub async fn get_range(&self, range: Range<usize>) -> io::Result<OwnedBytes> {
        use std::os::unix::fs::FileExt;
        let file = self.clone();
        let buf = tokio::task::spawn_blocking(move || {
            let mut buf = Vec::with_capacity(range.len());
            #[allow(clippy::uninit_vec)]
            unsafe {
                buf.set_len(range.len());
            }
            file.0.file.read_exact_at(&mut buf, range.start as u64)?;
            io::Result::Ok(buf)
        })
        .await
        .unwrap()?;
        Ok(OwnedBytes::new(buf))
    }

    pub async fn get_all(&self) -> io::Result<OwnedBytes> {
        self.get_range(0..self.0.num_bytes as usize).await
    }
}

#[cfg(test)]
mod tests {
    use std::num::NonZeroU32;

    use tokio::fs;
    use ulid::Ulid;

    use super::FileDescriptorCache;
    use crate::metrics::CacheMetrics;

    #[tokio::test]
    async fn test_fd_cache_big_cache() {
        let cache_metrics = CacheMetrics::for_component("fdtest").cache_metrics;
        let fd_cache = FileDescriptorCache::new(
            NonZeroU32::new(20).unwrap(),
            NonZeroU32::new(10).unwrap(),
            cache_metrics.clone(),
        );
        let tempdir = tempfile::tempdir().unwrap();
        let split_ids: Vec<Ulid> = std::iter::repeat_with(Ulid::new).take(100).collect();
        for &split_id in &split_ids {
            let split_filepath = super::get_split_file_path(tempdir.path(), split_id);
            let content = split_id.to_string();
            assert_eq!(content.len(), 26);
            fs::write(split_filepath, content.as_bytes()).await.unwrap();
        }
        for &split_id in &split_ids[0..10] {
            fd_cache
                .get_or_open_split_file(tempdir.path(), split_id, 26)
                .await
                .unwrap();
        }
        for &split_id in &split_ids[0..10] {
            fd_cache
                .get_or_open_split_file(tempdir.path(), split_id, 26)
                .await
                .unwrap();
        }
        for &split_id in &split_ids[0..10] {
            fd_cache
                .get_or_open_split_file(tempdir.path(), split_id, 26)
                .await
                .unwrap();
        }
        assert_eq!(cache_metrics.in_cache_count.get(), 10);
        assert_eq!(cache_metrics.hits_num_items.get(), 20);
        assert_eq!(cache_metrics.misses_num_items.get(), 10);
    }

    // This mimics Quickwit's workload where the fd cache is much smaller than the number of
    // splits. Each search will read from the same split file, and the cache will help avoid
    // opening the file several times.
    #[tokio::test]
    async fn test_fd_cache_small_cache() {
        let cache_metrics = CacheMetrics::for_component("fdtest2").cache_metrics;
        let fd_cache = FileDescriptorCache::new(
            NonZeroU32::new(20).unwrap(),
            NonZeroU32::new(10).unwrap(),
            cache_metrics.clone(),
        );
        let tempdir = tempfile::tempdir().unwrap();
        let split_ids: Vec<Ulid> = std::iter::repeat_with(Ulid::new).take(100).collect();
        for &split_id in &split_ids {
            let split_filepath = super::get_split_file_path(tempdir.path(), split_id);
            let content = split_id.to_string();
            assert_eq!(content.len(), 26);
            fs::write(split_filepath, content.as_bytes()).await.unwrap();
        }
        for &split_id in &split_ids[0..100] {
            for _ in 0..10 {
                fd_cache
                    .get_or_open_split_file(tempdir.path(), split_id, 26)
                    .await
                    .unwrap();
            }
        }
        assert_eq!(cache_metrics.in_cache_count.get(), 10);
        assert_eq!(cache_metrics.hits_num_items.get(), 100 * 9);
        assert_eq!(cache_metrics.misses_num_items.get(), 100);
    }

    #[tokio::test]
    async fn test_split_file() {
        let fd_cache = FileDescriptorCache::with_fd_cache_capacity(NonZeroU32::new(20).unwrap());
        let tempdir = tempfile::tempdir().unwrap();
        let split_id: Ulid = Ulid::new();
        let split_filepath = super::get_split_file_path(tempdir.path(), split_id);
        let content = split_id.to_string();
        assert_eq!(content.len(), 26);
        fs::write(split_filepath, content.as_bytes()).await.unwrap();
        let split_file = fd_cache
            .get_or_open_split_file(tempdir.path(), split_id, 26)
            .await
            .unwrap();
        {
            let bytes = split_file.get_all().await.unwrap();
            assert_eq!(bytes.as_slice(), content.as_bytes());
        }
        {
            let bytes = split_file.get_range(1..3).await.unwrap();
            assert_eq!(bytes.as_slice(), &content.as_bytes()[1..3]);
        }
    }
}


================================================
FILE: quickwit/quickwit-storage/src/lib.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#![warn(missing_docs)]
#![allow(clippy::bool_assert_comparison)]
#![allow(clippy::len_without_is_empty)]
#![deny(clippy::disallowed_methods)]

//! `quickwit-storage` is the abstraction used in quickwit to interface itself
//! to different storage:
//! - object storages (S3)
//! - local filesystem
//! - distributed filesystems.
//! - etc.
//!
//! The `BundleStorage` bundles together multiple files into a single file.
mod cache;
mod debouncer;
mod file_descriptor_cache;
mod metrics;
mod storage;
mod timeout_and_retry_storage;
pub use debouncer::AsyncDebouncer;
pub(crate) use debouncer::DebouncedStorage;

pub use self::metrics::STORAGE_METRICS;
pub use self::payload::PutPayload;
pub use self::storage::Storage;

mod bundle_storage;
mod error;

mod local_file_storage;
mod object_storage;
#[cfg(feature = "gcs")]
mod opendal_storage;
mod payload;
mod prefix_storage;
mod ram_storage;
mod split;
mod split_cache;
mod storage_factory;
mod storage_resolver;
mod versioned_component;

use quickwit_common::uri::Uri;
pub use split_cache::SplitCache;
pub use tantivy::directory::OwnedBytes;
pub use versioned_component::VersionedComponent;

pub use self::bundle_storage::{BundleStorage, BundleStorageFileOffsets};
#[cfg(any(test, feature = "testsuite"))]
pub use self::cache::MockStorageCache;
pub use self::cache::{
    ByteRangeCache, MemorySizedCache, QuickwitCache, StorageCache, wrap_storage_with_cache,
};
pub use self::local_file_storage::{LocalFileStorage, LocalFileStorageFactory};
#[cfg(feature = "azure")]
pub use self::object_storage::{AzureBlobStorage, AzureBlobStorageFactory};
pub use self::object_storage::{
    MultiPartPolicy, S3CompatibleObjectStorage, S3CompatibleObjectStorageFactory,
};
#[cfg(feature = "gcs")]
pub use self::opendal_storage::GoogleCloudStorageFactory;
#[cfg(all(feature = "gcs", feature = "integration-testsuite"))]
pub use self::opendal_storage::test_config_helpers;
pub use self::ram_storage::{RamStorage, RamStorageBuilder};
pub use self::split::{SplitPayload, SplitPayloadBuilder};
#[cfg(any(test, feature = "testsuite"))]
pub use self::storage::MockStorage;
#[cfg(any(test, feature = "testsuite"))]
pub use self::storage_factory::MockStorageFactory;
pub use self::storage_factory::{StorageFactory, UnsupportedStorage};
pub use self::storage_resolver::StorageResolver;
#[cfg(feature = "integration-testsuite")]
pub use self::test_suite::{
    storage_test_multi_part_upload, storage_test_single_part_upload, storage_test_suite,
    test_write_and_bulk_delete,
};
pub use self::timeout_and_retry_storage::TimeoutAndRetryStorage;
pub use crate::error::{
    BulkDeleteError, DeleteFailure, StorageError, StorageErrorKind, StorageResolverError,
    StorageResult,
};

/// Loads an entire local or remote file into memory.
pub async fn load_file(
    storage_resolver: &StorageResolver,
    uri: &Uri,
) -> anyhow::Result<OwnedBytes> {
    let parent = uri
        .parent()
        .ok_or_else(|| anyhow::anyhow!("URI `{uri}` is not a valid file URI"))?;
    let storage = storage_resolver.resolve(&parent).await?;
    let file_name = uri
        .file_name()
        .ok_or_else(|| anyhow::anyhow!("URI `{uri}` is not a valid file URI"))?;
    let bytes = storage.get_all(file_name).await?;
    Ok(bytes)
}

// this function isn't meant to be called, just to break compilation if
// serde_json::Map is an ordered map and not a btree map
#[allow(dead_code)]
#[cfg(not(any(test, feature = "testsuite", feature = "integration-testsuite")))]
unsafe fn serde_json_preserve_order_canary(
    val: serde_json::Map<String, serde_json::Value>,
) -> std::collections::BTreeMap<String, serde_json::Value> {
    use std::mem::transmute as assert_serde_json__preserve_order__disabled;
    unsafe { assert_serde_json__preserve_order__disabled(val) }
}

#[cfg(any(test, feature = "testsuite", feature = "integration-testsuite"))]
mod for_test {
    use std::sync::Arc;

    use crate::{RamStorage, Storage};

    /// Returns a storage backed by an "in-memory file" for testing.
    pub fn storage_for_test() -> Arc<dyn Storage> {
        Arc::new(RamStorage::default())
    }
}

#[cfg(any(test, feature = "testsuite", feature = "integration-testsuite"))]
pub use for_test::storage_for_test;

#[cfg(test)]
mod tests {
    use std::str::FromStr;

    use super::*;

    #[tokio::test]
    async fn test_load_file() {
        let storage_resolver = StorageResolver::builder()
            .register(LocalFileStorageFactory)
            .build()
            .unwrap();
        let expected_bytes = tokio::fs::read_to_string("Cargo.toml").await.unwrap();
        assert_eq!(
            load_file(&storage_resolver, &Uri::from_str("Cargo.toml").unwrap())
                .await
                .unwrap()
                .as_slice(),
            expected_bytes.as_bytes()
        );
    }
}

#[cfg(any(test, feature = "integration-testsuite"))]
pub(crate) mod test_suite {

    use std::path::Path;

    use anyhow::Context;
    use tokio::io::AsyncReadExt;

    use crate::{Storage, StorageErrorKind};

    async fn test_get_inexistent_file(storage: &mut dyn Storage) -> anyhow::Result<()> {
        let err = storage
            .get_slice(Path::new("missingfile"), 0..3)
            .await
            .map_err(|err| err.kind());
        assert!(matches!(err, Err(StorageErrorKind::NotFound)));
        Ok(())
    }

    async fn test_write_and_get_slice(storage: &mut dyn Storage) -> anyhow::Result<()> {
        let test_path = Path::new("write_and_read_slice");
        storage
            .put(
                test_path,
                Box::new(b"abcdefghiklmnopqrstuvxyz"[..].to_vec()),
            )
            .await?;
        let payload = storage.get_slice(test_path, 3..6).await?;
        assert_eq!(&payload[..], b"def");
        Ok(())
    }

    async fn test_write_and_get_slice_stream(storage: &mut dyn Storage) -> anyhow::Result<()> {
        let test_path = Path::new("write_and_read_slice_stream");
        storage
            .put(
                test_path,
                Box::new(b"abcdefghiklmnopqrstuvxyz"[..].to_vec()),
            )
            .await?;
        let mut reader = storage.get_slice_stream(test_path, 3..6).await?;
        let mut buf = vec![0; 3];
        reader.read_exact(&mut buf).await?;
        assert_eq!(&buf[..], b"def");
        Ok(())
    }

    async fn test_write_get_all(storage: &mut dyn Storage) -> anyhow::Result<()> {
        let test_path = Path::new("write_and_read_all");
        storage
            .put(test_path, Box::new(b"abcdef"[..].to_vec()))
            .await?;
        let payload = storage.get_all(test_path).await?;
        assert_eq!(&payload[..], &b"abcdef"[..]);
        Ok(())
    }

    async fn test_write_and_cp(storage: &mut dyn Storage) -> anyhow::Result<()> {
        let test_path = Path::new("write_and_cp");
        let payload_bytes = b"abcdefghijklmnopqrstuvwxyz";
        storage
            .put(test_path, Box::new(payload_bytes.to_vec()))
            .await?;
        let temp_dir = tempfile::tempdir()?;
        let dest_path = temp_dir.path().to_path_buf();
        let local_copy = dest_path.join("local_copy");
        storage.copy_to_file(test_path, &local_copy).await?;
        let payload = std::fs::read(&local_copy)?;
        assert_eq!(&payload[..], payload_bytes);
        Ok(())
    }

    async fn test_write_and_delete(storage: &mut dyn Storage) -> anyhow::Result<()> {
        let test_path = Path::new("write_and_delete");
        let payload_bytes = b"abcdefghijklmnopqrstuvwxyz";
        storage
            .put(test_path, Box::new(payload_bytes.to_vec()))
            .await?;
        assert!(storage.exists(test_path).await?);
        storage.delete(test_path).await?;
        assert!(!storage.exists(test_path).await?);
        storage.delete(test_path).await?;
        Ok(())
    }

    /// Tests `Storage::bulk_delete`.
    pub async fn test_write_and_bulk_delete(storage: &mut dyn Storage) -> anyhow::Result<()> {
        let test_paths = [
            Path::new("foo"),
            Path::new("bar"),
            Path::new("qux"),
            Path::new("baz"),
            Path::new("file-does-not-exist"),
        ];
        for test_path in &test_paths[0..4] {
            storage
                .put(Path::new(test_path), Box::new(b"123".to_vec()))
                .await?;
            assert!(storage.exists(test_path).await?);
        }
        storage.bulk_delete(&test_paths).await?;

        for test_path in test_paths {
            assert!(!storage.exists(test_path).await?);
        }
        Ok(())
    }

    async fn test_file_size(storage: &mut dyn Storage) -> anyhow::Result<()> {
        let test_path = Path::new("write_for_filesize");
        let payload_bytes = b"abcdefghijklmnopqrstuvwxyz";
        storage
            .put(test_path, Box::new(payload_bytes.to_vec()))
            .await?;
        assert_eq!(storage.file_num_bytes(test_path).await?, 26u64);
        storage.delete(test_path).await?;
        Ok(())
    }

    async fn test_exists(storage: &mut dyn Storage) -> anyhow::Result<()> {
        let test_path = Path::new("exists");
        assert!(!storage.exists(test_path).await.unwrap());
        storage
            .put(test_path, Box::<std::vec::Vec<u8>>::default())
            .await?;
        assert!(storage.exists(test_path).await.unwrap());
        storage.delete(test_path).await.unwrap();
        Ok(())
    }

    async fn test_delete_missing_file(storage: &mut dyn Storage) -> anyhow::Result<()> {
        let test_path = Path::new("missing_file");
        assert!(!storage.exists(test_path).await.unwrap());
        assert!(storage.delete(test_path).await.is_ok());
        Ok(())
    }

    async fn test_write_and_delete_with_dir_separator(
        storage: &mut dyn Storage,
    ) -> anyhow::Result<()> {
        let test_path = Path::new("foo/bar/write_and_delete_with_separator");
        let payload_bytes = b"abcdefghijklmnopqrstuvwxyz";
        storage
            .put(test_path, Box::new(payload_bytes.to_vec()))
            .await?;
        assert!(matches!(
            storage.exists(Path::new("foo/bar")).await,
            Ok(false)
        ));
        storage.delete(test_path).await?;

        assert!(matches!(
            storage.exists(Path::new("foo/bar")).await,
            Ok(false)
        ));
        assert!(matches!(storage.exists(Path::new("foo")).await, Ok(false)));
        Ok(())
    }

    /// Generic test suite for a storage.
    pub async fn storage_test_suite(storage: &mut dyn Storage) -> anyhow::Result<()> {
        test_get_inexistent_file(storage)
            .await
            .context("get_inexistent_file")?;
        test_write_and_get_slice(storage)
            .await
            .context("write_and_get_slice")?;
        test_write_and_get_slice_stream(storage)
            .await
            .context("write_and_get_slice_stream")?;
        test_write_get_all(storage)
            .await
            .context("write_and_get_all")?;
        test_write_and_cp(storage).await.context("write_and_cp")?;
        test_write_and_delete(storage)
            .await
            .context("write_and_delete")?;
        test_write_and_bulk_delete(storage)
            .await
            .context("write_and_bulk_delete")?;
        test_exists(storage).await.context("exists")?;
        test_write_and_delete_with_dir_separator(storage)
            .await
            .context("write_and_delete_with_separator")?;
        test_file_size(storage).await.context("file_size")?;
        test_delete_missing_file(storage)
            .await
            .context("delete_missing_file")?;
        Ok(())
    }

    /// Generic single-part upload test.
    #[cfg(feature = "integration-testsuite")]
    pub async fn storage_test_single_part_upload(storage: &mut dyn Storage) -> anyhow::Result<()> {
        use std::ops::Range;

        let test_path = Path::new("hello_small.txt");
        let data = b"hello, happy tax payer!";
        let data_size = data.len() as u64;
        storage.put(test_path, Box::new(data.to_vec())).await?;
        // file_num_bytes
        assert_eq!(storage.file_num_bytes(test_path).await?, data_size);
        // get_all
        let all_bytes = storage.get_all(test_path).await?;
        assert_eq!(all_bytes.as_slice(), data);
        // get_slice
        let happy_bytes = storage
            .get_slice(test_path, Range { start: 7, end: 12 })
            .await?;
        assert_eq!(happy_bytes.as_slice(), &data[7..12]);
        // get_slice_stream
        let mut happy_byte_stream = storage
            .get_slice_stream(test_path, Range { start: 7, end: 12 })
            .await?;
        let mut happy_bytes_read = Vec::new();
        happy_byte_stream.read_to_end(&mut happy_bytes_read).await?;
        assert_eq!(happy_bytes_read.as_slice(), &data[7..12]);
        Ok(())
    }

    /// Generic multi-part upload test.
    #[cfg(feature = "integration-testsuite")]
    pub async fn storage_test_multi_part_upload(storage: &mut dyn Storage) -> anyhow::Result<()> {
        let test_path = Path::new("hello_large.txt");

        let mut test_buffer = Vec::with_capacity(15_000_000);
        for i in 0..15_000_000u32 {
            test_buffer.push((i % 256) as u8);
        }

        storage
            .put(test_path, Box::new(test_buffer.clone()))
            .await?;

        assert_eq!(storage.file_num_bytes(test_path).await?, 15_000_000);

        let downloaded_data = storage.get_all(test_path).await?;

        assert_eq!(test_buffer.len(), downloaded_data.len(), "Length mismatch");
        // dont use assert_eq since we dont want large buffers to be printed
        // if assert fails
        assert!(
            test_buffer.as_slice() == downloaded_data.as_slice(),
            "Content mismatch - data corruption detected!"
        );

        Ok(())
    }
}


================================================
FILE: quickwit/quickwit-storage/src/local_file_storage.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::{BTreeSet, HashMap};
use std::fmt;
use std::io::{ErrorKind, SeekFrom};
use std::ops::Range;
use std::path::{Component, Path, PathBuf};
use std::sync::Arc;

use async_trait::async_trait;
use futures::StreamExt;
use futures::future::{BoxFuture, FutureExt};
use quickwit_common::ignore_error_kind;
use quickwit_common::uri::Uri;
use quickwit_config::StorageBackend;
use tokio::io::{AsyncRead, AsyncReadExt, AsyncSeekExt, AsyncWriteExt};
use tracing::warn;

use crate::metrics::object_storage_get_slice_in_flight_guards;
use crate::storage::SendableAsync;
use crate::{
    BulkDeleteError, DebouncedStorage, DeleteFailure, OwnedBytes, Storage, StorageError,
    StorageErrorKind, StorageFactory, StorageResolverError, StorageResult,
};

/// File system compatible storage implementation.
#[derive(Clone)]
pub struct LocalFileStorage {
    uri: Uri,
    root: PathBuf,
}

impl fmt::Debug for LocalFileStorage {
    fn fmt(&self, formatter: &mut fmt::Formatter) -> fmt::Result {
        formatter
            .debug_struct("LocalFileStorage")
            .field("root", &self.root.display())
            .finish()
    }
}

impl LocalFileStorage {
    fn full_path(&self, relative_path: &Path) -> crate::StorageResult<PathBuf> {
        ensure_valid_relative_path(relative_path)?;
        Ok(self.root.join(relative_path))
    }

    /// Creates a local file storage instance given a URI.
    pub fn from_uri(uri: &Uri) -> Result<Self, StorageResolverError> {
        uri.filepath()
            .map(|root| Self {
                uri: uri.clone(),
                root: root.to_path_buf(),
            })
            .ok_or_else(|| {
                let message = format!("URI `{uri}` is not a valid file URI");
                StorageResolverError::InvalidUri(message)
            })
    }

    /// Moves a file from a source to a destination.
    /// from here is an external path, and to is an internal path.
    pub async fn move_into(&self, from_external: &Path, to: &Path) -> crate::StorageResult<()> {
        let to_full_path = self.full_path(to)?;
        tokio::fs::rename(from_external, to_full_path).await?;
        Ok(())
    }

    /// Moves a file from a source to a destination.
    /// from here is an internal path, and to is an external path.
    pub async fn move_out(&self, from_internal: &Path, to: &Path) -> crate::StorageResult<()> {
        let from_full_path = self.full_path(from_internal)?;
        tokio::fs::rename(from_full_path, to).await?;
        Ok(())
    }

    async fn delete_single_file(&self, relative_path: &Path) -> StorageResult<()> {
        let full_path = self.full_path(relative_path)?;
        ignore_error_kind!(ErrorKind::NotFound, tokio::fs::remove_file(full_path).await)?;
        Ok(())
    }
}

/// Ensure that the path given does not include any ".." for security reasons.
///
/// In order to reduce the attack surface, we want to make sure the `FileStorage`
/// only access/delete files that are children of its root_directory.
fn ensure_valid_relative_path(path: &Path) -> StorageResult<()> {
    for component in path.components() {
        match component {
            Component::RootDir | Component::ParentDir | Component::Prefix(_) => {
                // We forbid `Path` components that are breaking the assumption that
                // root.join(path) is a child of root (if we omit fs links).
                return Err(StorageErrorKind::Unauthorized.with_error(anyhow::anyhow!(
                    "path `{}` is forbidden. only simple relative path are allowed",
                    path.display()
                )));
            }
            Component::CurDir | Component::Normal(_) => {
                // we accept `./` and subdir/
            }
        }
    }
    Ok(())
}

/// Delete empty directories starting from `{root}/{path}` directory and stopping at `{root}`
/// directory. Note that the `{root}` directory is not deleted.
fn delete_all_dirs_if_empty<'a>(
    root: &'a Path,
    path: &'a Path,
) -> BoxFuture<'a, std::io::Result<()>> {
    async move {
        let full_path = root.join(path);
        let path_entries_result = full_path.read_dir();
        if let Err(err) = &path_entries_result {
            // Ignore `ErrorKind::NotFound` as this could be deleted by another concurrent task.
            if err.kind() == ErrorKind::NotFound {
                return Ok(());
            }
        }

        let is_not_empty = path_entries_result?.next().is_some();
        if is_not_empty {
            return Ok(());
        }

        let delete_result = tokio::fs::remove_dir(full_path).await;
        if let Err(err) = &delete_result {
            // Ignore `ErrorKind::NotFound` as this could be deleted by another concurrent task.
            if err.kind() == ErrorKind::NotFound {
                return Ok(());
            }
            delete_result?;
        }

        match &path.parent() {
            Some(path) => {
                if path == &Path::new("") || path == &Path::new(".") {
                    return Ok(());
                }
                delete_all_dirs_if_empty(root, path).await?;
            }
            _ => return Ok(()),
        }

        Ok(())
    }
    .boxed()
}

#[async_trait]
impl Storage for LocalFileStorage {
    async fn check_connectivity(&self) -> anyhow::Result<()> {
        if !self.root.try_exists()? {
            // By creating directories, we check if we have the right permissions.
            tokio::fs::create_dir_all(&self.root).await?
        }
        Ok(())
    }

    async fn put(
        &self,
        path: &Path,
        payload: Box<dyn crate::PutPayload>,
    ) -> crate::StorageResult<()> {
        let full_path = self.full_path(path)?;
        let parent_dir = full_path.parent().ok_or_else(|| {
            let err = anyhow::anyhow!("no parent directory for {full_path:?}");
            StorageErrorKind::Internal.with_error(err)
        })?;

        tokio::fs::create_dir_all(parent_dir).await?;
        let mut reader = payload.byte_stream().await?.into_async_read();
        let named_temp_file = tempfile::NamedTempFile::new_in(parent_dir)?;
        let (temp_std_file, temp_filepath) = named_temp_file.into_parts();
        let mut temp_tokio_file = tokio::fs::File::from_std(temp_std_file);
        tokio::io::copy(&mut reader, &mut temp_tokio_file).await?;
        temp_tokio_file.flush().await?;
        temp_tokio_file.sync_data().await?;
        temp_filepath
            .persist(&full_path)
            .map_err(|err| StorageErrorKind::Io.with_error(err))?;
        // We also need to sync the parent directory to ensure it
        // the file move has been persisted on all file systems.
        tokio::fs::File::open(parent_dir).await?.sync_data().await?;
        Ok(())
    }

    async fn copy_to(&self, path: &Path, output: &mut dyn SendableAsync) -> StorageResult<()> {
        let full_path = self.full_path(path)?;
        let mut file = tokio::fs::File::open(&full_path).await?;
        tokio::io::copy(&mut file, output).await?;
        Ok(())
    }

    #[tracing::instrument(skip(self), level = "debug")]
    async fn get_slice(&self, path: &Path, range: Range<usize>) -> StorageResult<OwnedBytes> {
        let full_path = self.full_path(path)?;
        tokio::task::spawn_blocking(move || {
            use std::io::{Read, Seek};
            // we run these io in a spawn_blocking so there is no scheduling delay between each
            // step, as there would be if using tokio async File.
            let mut file = std::fs::File::open(full_path)?;
            file.seek(SeekFrom::Start(range.start as u64))?;
            let _in_flight_guards = object_storage_get_slice_in_flight_guards(range.len());
            let mut content_bytes: Vec<u8> = Vec::with_capacity(range.len());
            #[allow(clippy::uninit_vec)]
            unsafe {
                content_bytes.set_len(range.len());
            }
            file.read_exact(&mut content_bytes)?;
            Ok(OwnedBytes::new(content_bytes))
        })
        .await
        .map_err(|_| {
            StorageErrorKind::Internal.with_error(anyhow::anyhow!("reading file panicked"))
        })?
    }

    #[tracing::instrument(skip(self), level = "debug")]
    async fn get_slice_stream(
        &self,
        path: &Path,
        range: Range<usize>,
    ) -> StorageResult<Box<dyn AsyncRead + Send + Unpin>> {
        let full_path = self.full_path(path)?;
        let mut file = tokio::fs::File::open(&full_path).await?;
        file.seek(SeekFrom::Start(range.start as u64)).await?;
        Ok(Box::new(file.take(range.len() as u64)))
    }

    async fn delete(&self, path: &Path) -> StorageResult<()> {
        self.delete_single_file(path).await?;
        if let Some(parent) = path.parent()
            && let Err(error) = delete_all_dirs_if_empty(&self.root, parent).await
        {
            warn!(error=?error, path=%path.display(), "failed to delete directory");
        }
        Ok(())
    }

    /// Deletes the files identified by `paths` concurrently, with a maximum of `10` syscalls at a
    /// time. Additionally, deletes the parent directories of `paths` if they are empty after the
    /// first round of deletions.
    async fn bulk_delete<'a>(&self, paths: &[&'a Path]) -> Result<(), BulkDeleteError> {
        let mut successes = Vec::with_capacity(paths.len());
        let mut failures = HashMap::new();
        let mut parent_paths = BTreeSet::new();

        let remove_file_res_futures: Vec<_> = paths
            .iter()
            .map(|path| async move {
                let remove_file_res = self.delete_single_file(path).await;
                (path, remove_file_res)
            })
            .collect();

        let mut stream = futures::stream::iter(remove_file_res_futures).buffer_unordered(10);

        while let Some((path, remove_file_res)) = stream.next().await {
            match remove_file_res {
                Ok(_) => {
                    successes.push(path.to_path_buf());

                    if let Some(parent) = path.parent() {
                        parent_paths.insert(parent);
                    }
                }
                Err(error) => {
                    let failure = DeleteFailure {
                        error: Some(error),
                        ..Default::default()
                    };
                    failures.insert(path.to_path_buf(), failure);
                }
            }
        }
        // Delete parent directories of `paths` if they are empty.
        // Traverse the parent directories in reverse order, so that we delete the deepest ones
        // first.
        for parent_path in parent_paths.into_iter().rev() {
            if let Err(error) = delete_all_dirs_if_empty(&self.root, parent_path).await {
                warn!(error=?error, path=%parent_path.display(), "failed to delete directory");
            }
        }
        if failures.is_empty() {
            return Ok(());
        }
        Err(BulkDeleteError {
            successes,
            failures,
            ..Default::default()
        })
    }

    async fn get_all(&self, path: &Path) -> StorageResult<OwnedBytes> {
        let full_path = self.full_path(path)?;
        let content_bytes = tokio::fs::read(full_path).await.map_err(|err| {
            StorageError::from(err).add_context(format!(
                "failed to read file {}/{}",
                self.uri(),
                path.to_string_lossy()
            ))
        })?;
        Ok(OwnedBytes::new(content_bytes))
    }

    fn uri(&self) -> &Uri {
        &self.uri
    }

    async fn file_num_bytes(&self, path: &Path) -> StorageResult<u64> {
        let full_path = self.full_path(path)?;
        match tokio::fs::metadata(full_path).await {
            Ok(metadata) => {
                if metadata.is_file() {
                    Ok(metadata.len())
                } else {
                    Err(StorageErrorKind::NotFound.with_error(anyhow::anyhow!(
                        "file `{}` is not a regular file, cannot determine its size",
                        path.display()
                    )))
                }
            }
            Err(err) => {
                if err.kind() == ErrorKind::NotFound {
                    Err(StorageErrorKind::NotFound.with_error(err))
                } else {
                    Err(err.into())
                }
            }
        }
    }
}

/// A File storage resolver
#[derive(Clone, Debug, Default)]
pub struct LocalFileStorageFactory;

#[async_trait]
impl StorageFactory for LocalFileStorageFactory {
    fn backend(&self) -> StorageBackend {
        StorageBackend::File
    }

    async fn resolve(&self, uri: &Uri) -> Result<Arc<dyn Storage>, StorageResolverError> {
        let storage = LocalFileStorage::from_uri(uri)?;
        Ok(Arc::new(DebouncedStorage::new(storage)))
    }
}

#[cfg(test)]
mod tests {

    use std::str::FromStr;

    use super::*;
    use crate::test_suite::storage_test_suite;

    #[tokio::test]
    async fn test_local_file_storage() -> anyhow::Result<()> {
        let temp_dir = tempfile::tempdir()?;
        let uri = Uri::from_str(&format!("{}", temp_dir.path().display())).unwrap();
        let mut local_file_storage = LocalFileStorage::from_uri(&uri)?;
        storage_test_suite(&mut local_file_storage).await?;
        Ok(())
    }

    #[tokio::test]
    async fn test_local_file_storage_forbids_double_dot() {
        let temp_dir = tempfile::tempdir().unwrap();
        let uri = Uri::from_str(&format!("{}", temp_dir.path().display())).unwrap();
        let local_file_storage = LocalFileStorage::from_uri(&uri).unwrap();
        assert_eq!(
            local_file_storage
                .exists(Path::new("hello/toto"))
                .await
                .unwrap(),
            false
        );
        let exist_error = local_file_storage
            .exists(Path::new("hello/../toto"))
            .await
            .unwrap_err();
        assert_eq!(exist_error.kind(), StorageErrorKind::Unauthorized);
    }

    #[tokio::test]
    async fn test_local_file_storage_factory() -> anyhow::Result<()> {
        let temp_dir = tempfile::tempdir()?;
        let index_uri =
            Uri::from_str(&format!("file://{}/foo/bar", temp_dir.path().display())).unwrap();
        let local_file_storage_factory = LocalFileStorageFactory;
        let local_file_storage = local_file_storage_factory.resolve(&index_uri).await?;
        assert_eq!(local_file_storage.uri(), &index_uri);

        let err = local_file_storage_factory
            .resolve(&Uri::for_test("s3://foo/bar"))
            .await
            .err()
            .unwrap();
        assert!(matches!(err, StorageResolverError::InvalidUri { .. }));

        let err = local_file_storage_factory
            .resolve(&Uri::for_test("s3://"))
            .await
            .err()
            .unwrap();
        assert!(matches!(err, StorageResolverError::InvalidUri { .. }));
        Ok(())
    }

    #[tokio::test]
    async fn test_local_file_storage_bulk_delete() {
        let temp_dir = tempfile::tempdir().unwrap();
        tokio::fs::create_dir(temp_dir.path().join("foo-dir"))
            .await
            .unwrap();
        tokio::fs::create_dir(temp_dir.path().join("bar-dir"))
            .await
            .unwrap();
        tokio::fs::File::create(temp_dir.path().join("foo-dir/foo"))
            .await
            .unwrap();

        let uri = Uri::from_str(&format!("{}", temp_dir.path().display())).unwrap();
        let local_file_storage = LocalFileStorage::from_uri(&uri).unwrap();
        let error = local_file_storage
            .bulk_delete(&[Path::new("foo-dir/foo"), Path::new("bar-dir")])
            .await
            .unwrap_err();
        assert_eq!(error.successes, [PathBuf::from("foo-dir/foo")]);

        let failure = error.failures.get(Path::new("bar-dir")).unwrap();
        assert_eq!(failure.error.as_ref().unwrap().kind(), StorageErrorKind::Io);

        assert!(!temp_dir.path().join("foo-dir").try_exists().unwrap());
    }

    #[tokio::test]
    async fn test_try_delete_dir_all() -> anyhow::Result<()> {
        let path_root = tempfile::tempdir()?.keep();
        let dir_path = path_root.clone().join("foo/bar/baz");
        tokio::fs::create_dir_all(dir_path.clone()).await?;

        // check all empty directory
        assert_eq!(dir_path.try_exists().unwrap(), true);
        delete_all_dirs_if_empty(&path_root, dir_path.as_path()).await?;
        assert_eq!(dir_path.try_exists().unwrap(), false);
        assert_eq!(dir_path.parent().unwrap().try_exists().unwrap(), false);

        // check with intermediate file
        tokio::fs::create_dir_all(dir_path.clone()).await?;
        let intermediate_file = dir_path.parent().unwrap().join("fizz.txt");
        tokio::fs::File::create(intermediate_file.clone()).await?;
        assert_eq!(dir_path.try_exists().unwrap(), true);
        assert_eq!(intermediate_file.try_exists().unwrap(), true);
        delete_all_dirs_if_empty(&path_root, dir_path.as_path()).await?;
        assert_eq!(dir_path.try_exists().unwrap(), false);
        assert_eq!(dir_path.parent().unwrap().try_exists().unwrap(), true);

        // make sure it does not go beyond the path
        tokio::fs::create_dir_all(path_root.join("home/foo/bar")).await?;
        delete_all_dirs_if_empty(&path_root.join("home/foo"), Path::new("bar")).await?;
        assert_eq!(path_root.join("home/foo").try_exists().unwrap(), true);

        Ok(())
    }
}


================================================
FILE: quickwit/quickwit-storage/src/metrics.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

// See https://prometheus.io/docs/practices/naming/

use std::collections::HashMap;
use std::sync::RwLock;

use once_cell::sync::Lazy;
use quickwit_common::metrics::{
    GaugeGuard, Histogram, IntCounter, IntCounterVec, IntGauge, new_counter, new_counter_vec,
    new_gauge, new_histogram_vec,
};
use quickwit_config::CacheConfig;

/// Counters associated to storage operations.
pub struct StorageMetrics {
    pub shortlived_cache: CacheMetrics,
    pub partial_request_cache: CacheMetrics,
    pub predicate_cache: CacheMetrics,
    pub fd_cache_metrics: CacheMetrics,
    pub fast_field_cache: CacheMetrics,
    pub split_footer_cache: CacheMetrics,
    pub searcher_split_cache: CacheMetrics,
    pub get_slice_timeout_successes: [IntCounter; 3],
    pub get_slice_timeout_all_timeouts: IntCounter,
    pub object_storage_get_total: IntCounter,
    pub object_storage_get_errors_total: IntCounterVec<1>,
    pub object_storage_get_slice_in_flight_count: IntGauge,
    pub object_storage_get_slice_in_flight_num_bytes: IntGauge,
    pub object_storage_put_total: IntCounter,
    pub object_storage_put_parts: IntCounter,
    pub object_storage_download_num_bytes: IntCounter,
    pub object_storage_upload_num_bytes: IntCounter,

    pub object_storage_delete_requests_total: IntCounter,
    pub object_storage_bulk_delete_requests_total: IntCounter,
    pub object_storage_delete_request_duration: Histogram,
    pub object_storage_bulk_delete_request_duration: Histogram,
}

impl Default for StorageMetrics {
    fn default() -> Self {
        let get_slice_timeout_outcome_total_vec = new_counter_vec(
            "get_slice_timeout_outcome",
            "Outcome of get_slice operations. success_after_1_timeout means the operation \
             succeeded after a retry caused by a timeout.",
            "storage",
            &[],
            ["outcome"],
        );
        let get_slice_timeout_successes = [
            get_slice_timeout_outcome_total_vec.with_label_values(["success_after_0_timeout"]),
            get_slice_timeout_outcome_total_vec.with_label_values(["success_after_1_timeout"]),
            get_slice_timeout_outcome_total_vec.with_label_values(["success_after_2+_timeout"]),
        ];
        let get_slice_timeout_all_timeouts =
            get_slice_timeout_outcome_total_vec.with_label_values(["all_timeouts"]);

        let object_storage_requests_total = new_counter_vec(
            "object_storage_requests_total",
            "Total number of object storage requests performed.",
            "storage",
            &[],
            ["action"],
        );
        let object_storage_delete_requests_total =
            object_storage_requests_total.with_label_values(["delete_object"]);
        let object_storage_bulk_delete_requests_total =
            object_storage_requests_total.with_label_values(["delete_objects"]);

        let object_storage_request_duration = new_histogram_vec(
            "object_storage_request_duration_seconds",
            "Duration of object storage requests in seconds.",
            "storage",
            &[],
            ["action"],
            vec![0.1, 0.5, 1.0, 5.0, 10.0, 30.0, 60.0],
        );
        let object_storage_delete_request_duration =
            object_storage_request_duration.with_label_values(["delete_object"]);
        let object_storage_bulk_delete_request_duration =
            object_storage_request_duration.with_label_values(["delete_objects"]);

        StorageMetrics {
            fast_field_cache: CacheMetrics::for_component("fastfields"),
            fd_cache_metrics: CacheMetrics::for_component("fd"),
            partial_request_cache: CacheMetrics::for_component("partial_request"),
            predicate_cache: CacheMetrics::for_component("predicate"),
            searcher_split_cache: CacheMetrics::for_component("searcher_split"),
            shortlived_cache: CacheMetrics::for_component("shortlived"),
            split_footer_cache: CacheMetrics::for_component("splitfooter"),
            get_slice_timeout_successes,
            get_slice_timeout_all_timeouts,
            object_storage_get_total: new_counter(
                "object_storage_gets_total",
                "Number of objects fetched. Might be lower than get_slice_timeout_outcome if \
                 queries are debounced.",
                "storage",
                &[],
            ),
            object_storage_get_errors_total: new_counter_vec::<1>(
                "object_storage_get_errors_total",
                "Number of GetObject errors.",
                "storage",
                &[],
                ["code"],
            ),
            object_storage_get_slice_in_flight_count: new_gauge(
                "object_storage_get_slice_in_flight_count",
                "Number of GetObject for which the memory was allocated but the download is still \
                 in progress.",
                "storage",
                &[],
            ),
            object_storage_get_slice_in_flight_num_bytes: new_gauge(
                "object_storage_get_slice_in_flight_num_bytes",
                "Memory allocated for GetObject requests that are still in progress.",
                "storage",
                &[],
            ),
            object_storage_put_total: new_counter(
                "object_storage_puts_total",
                "Number of objects uploaded. May differ from object_storage_requests_parts due to \
                 multipart upload.",
                "storage",
                &[],
            ),
            object_storage_put_parts: new_counter(
                "object_storage_puts_parts",
                "Number of object parts uploaded.",
                "",
                &[],
            ),
            object_storage_download_num_bytes: new_counter(
                "object_storage_download_num_bytes",
                "Amount of data downloaded from an object storage.",
                "storage",
                &[],
            ),
            object_storage_upload_num_bytes: new_counter(
                "object_storage_upload_num_bytes",
                "Amount of data uploaded to an object storage.",
                "storage",
                &[],
            ),
            object_storage_delete_requests_total,
            object_storage_bulk_delete_requests_total,
            object_storage_delete_request_duration,
            object_storage_bulk_delete_request_duration,
        }
    }
}

/// Counters associated to a cache.
pub struct CacheMetrics {
    pub component_name: String,
    pub cache_metrics: SingleCacheMetrics,
    virtual_caches_metrics: RwLock<HashMap<CacheConfig, SingleCacheMetrics>>,
}

#[derive(Clone)]
pub struct SingleCacheMetrics {
    pub in_cache_count: IntGauge,
    pub in_cache_num_bytes: IntGauge,
    pub hits_num_items: IntCounter,
    pub hits_num_bytes: IntCounter,
    pub misses_num_items: IntCounter,
    pub evict_num_items: IntCounter,
    pub evict_num_bytes: IntCounter,
}

impl CacheMetrics {
    pub fn for_component(component_name: &str) -> Self {
        const CACHE_METRICS_NAMESPACE: &str = "cache";
        let labels = [("component_name", component_name)];
        CacheMetrics {
            component_name: component_name.to_string(),
            cache_metrics: SingleCacheMetrics {
                in_cache_count: new_gauge(
                    "in_cache_count",
                    "Count of in cache by component",
                    CACHE_METRICS_NAMESPACE,
                    &labels,
                ),
                in_cache_num_bytes: new_gauge(
                    "in_cache_num_bytes",
                    "Number of bytes in cache by component",
                    CACHE_METRICS_NAMESPACE,
                    &labels,
                ),
                hits_num_items: new_counter(
                    "cache_hits_total",
                    "Number of cache hits by component",
                    CACHE_METRICS_NAMESPACE,
                    &labels,
                ),
                hits_num_bytes: new_counter(
                    "cache_hits_bytes",
                    "Number of cache hits in bytes by component",
                    CACHE_METRICS_NAMESPACE,
                    &labels,
                ),
                misses_num_items: new_counter(
                    "cache_misses_total",
                    "Number of cache misses by component",
                    CACHE_METRICS_NAMESPACE,
                    &labels,
                ),
                evict_num_items: new_counter(
                    "cache_evict_total",
                    "Number of cache entry evicted by component",
                    CACHE_METRICS_NAMESPACE,
                    &labels,
                ),
                evict_num_bytes: new_counter(
                    "cache_evict_bytes",
                    "Number of cache entry evicted in bytes by component",
                    CACHE_METRICS_NAMESPACE,
                    &labels,
                ),
            },
            virtual_caches_metrics: RwLock::default(),
        }
    }

    pub fn virtual_cache(&self, config: &CacheConfig) -> SingleCacheMetrics {
        if let Some(virtual_cache_metrics) = self.virtual_caches_metrics.read().unwrap().get(config)
        {
            return virtual_cache_metrics.clone();
        }

        const CACHE_METRICS_NAMESPACE: &str = "cache";
        let capacity = config.capacity().as_u64().to_string();
        let policy = config.policy().to_string();
        let labels = [
            ("component_name", self.component_name.as_str()),
            ("capacity", &capacity),
            ("policy", &policy),
        ];
        let new_virtual_cache_metrics = SingleCacheMetrics {
            in_cache_count: new_gauge(
                "virtual_in_cache_count",
                "Count of in cache by component",
                CACHE_METRICS_NAMESPACE,
                &labels,
            ),
            in_cache_num_bytes: new_gauge(
                "virtual_in_cache_num_bytes",
                "Number of bytes in cache by component",
                CACHE_METRICS_NAMESPACE,
                &labels,
            ),
            hits_num_items: new_counter(
                "virtual_cache_hits_total",
                "Number of cache hits by component",
                CACHE_METRICS_NAMESPACE,
                &labels,
            ),
            hits_num_bytes: new_counter(
                "virtual_cache_hits_bytes",
                "Number of cache hits in bytes by component",
                CACHE_METRICS_NAMESPACE,
                &labels,
            ),
            misses_num_items: new_counter(
                "virtual_cache_misses_total",
                "Number of cache misses by component",
                CACHE_METRICS_NAMESPACE,
                &labels,
            ),
            evict_num_items: new_counter(
                "virtual_cache_evict_total",
                "Number of cache entry evicted by component",
                CACHE_METRICS_NAMESPACE,
                &labels,
            ),
            evict_num_bytes: new_counter(
                "virtual_cache_evict_bytes",
                "Number of cache entry evicted in bytes by component",
                CACHE_METRICS_NAMESPACE,
                &labels,
            ),
        };

        self.virtual_caches_metrics
            .write()
            .unwrap()
            .entry(config.clone())
            .or_insert(new_virtual_cache_metrics)
            .clone()
    }
}

/// Storage counters exposes a bunch a set of storage/cache related metrics through a prometheus
/// endpoint.
pub static STORAGE_METRICS: Lazy<StorageMetrics> = Lazy::new(StorageMetrics::default);

#[cfg(test)]
pub static CACHE_METRICS_FOR_TESTS: Lazy<CacheMetrics> =
    Lazy::new(|| CacheMetrics::for_component("fortest"));

pub fn object_storage_get_slice_in_flight_guards(
    get_request_size: usize,
) -> (GaugeGuard<'static>, GaugeGuard<'static>) {
    let mut bytes_guard = GaugeGuard::from_gauge(
        &crate::STORAGE_METRICS.object_storage_get_slice_in_flight_num_bytes,
    );
    bytes_guard.add(get_request_size as i64);
    let mut count_guard =
        GaugeGuard::from_gauge(&crate::STORAGE_METRICS.object_storage_get_slice_in_flight_count);
    count_guard.add(1);
    (bytes_guard, count_guard)
}


================================================
FILE: quickwit/quickwit-storage/src/object_storage/azure_blob_storage.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::HashMap;
use std::num::NonZeroU32;
use std::ops::Range;
use std::path::{Path, PathBuf};
use std::sync::Arc;
use std::{fmt, io};

use async_trait::async_trait;
use azure_core::error::ErrorKind;
use azure_core::{Pageable, StatusCode};
use azure_storage::Error as AzureError;
use azure_storage::prelude::*;
use azure_storage_blobs::blob::operations::GetBlobResponse;
use azure_storage_blobs::prelude::*;
use bytes::Bytes;
use futures::io::Error as FutureError;
use futures::stream::{StreamExt, TryStreamExt};
use md5::Digest;
use once_cell::sync::OnceCell;
use quickwit_common::retry::{RetryParams, Retryable, retry};
use quickwit_common::uri::Uri;
use quickwit_common::{chunk_range, ignore_error_kind, into_u64_range};
use quickwit_config::{AzureStorageConfig, StorageBackend};
use regex::Regex;
use tantivy::directory::OwnedBytes;
use thiserror::Error;
use tokio::io::{AsyncRead, AsyncWriteExt, BufReader};
use tokio_util::compat::FuturesAsyncReadCompatExt;
use tokio_util::io::StreamReader;
use tracing::{instrument, warn};

use crate::debouncer::DebouncedStorage;
use crate::metrics::object_storage_get_slice_in_flight_guards;
use crate::storage::SendableAsync;
use crate::{
    BulkDeleteError, DeleteFailure, MultiPartPolicy, PutPayload, STORAGE_METRICS, Storage,
    StorageError, StorageErrorKind, StorageFactory, StorageResolverError, StorageResult,
};

/// Azure object storage resolver.
pub struct AzureBlobStorageFactory {
    storage_config: AzureStorageConfig,
}

impl AzureBlobStorageFactory {
    /// Creates a new Azure blob storage factory.
    pub fn new(storage_config: AzureStorageConfig) -> Self {
        Self { storage_config }
    }
}

#[async_trait]
impl StorageFactory for AzureBlobStorageFactory {
    fn backend(&self) -> StorageBackend {
        StorageBackend::Azure
    }

    async fn resolve(&self, uri: &Uri) -> Result<Arc<dyn Storage>, StorageResolverError> {
        let storage = AzureBlobStorage::from_uri(&self.storage_config, uri)?;
        Ok(Arc::new(DebouncedStorage::new(storage)))
    }
}

/// Azure object storage implementation
pub struct AzureBlobStorage {
    container_client: ContainerClient,
    uri: Uri,
    prefix: PathBuf,
    multipart_policy: MultiPartPolicy,
    retry_params: RetryParams,
}

impl fmt::Debug for AzureBlobStorage {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        f.debug_struct("AzureBlobStorage")
            .field("uri", &self.uri)
            .field("prefix", &self.prefix)
            .finish()
    }
}

impl AzureBlobStorage {
    /// Creates a new [`AzureBlobStorage`] instance.
    pub fn new(
        storage_account_name: String,
        storage_credentials: StorageCredentials,
        uri: Uri,
        container_name: String,
    ) -> Self {
        let container_client = BlobServiceClient::new(storage_account_name, storage_credentials)
            .container_client(container_name);
        Self {
            container_client,
            uri,
            prefix: PathBuf::new(),
            multipart_policy: MultiPartPolicy {
                // Azure max part size is 100MB
                // https://azure.microsoft.com/en-us/blog/general-availability-larger-block-blobs-in-azure-storage/
                target_part_num_bytes: 100_000_000,
                multipart_threshold_num_bytes: 100_000_000,
                max_num_parts: 50_000, // Azure allows up to 50,000 blocks
                max_object_num_bytes: 4_770_000_000_000u64, // Azure allows up to 4.77TB objects
                max_concurrent_uploads: 100,
            },
            retry_params: RetryParams::aggressive(),
        }
    }

    /// Sets the prefix path.
    ///
    /// The existing prefix is overwritten.
    pub fn with_prefix(self, prefix: PathBuf) -> Self {
        Self {
            container_client: self.container_client,
            uri: self.uri,
            prefix,
            multipart_policy: self.multipart_policy,
            retry_params: self.retry_params,
        }
    }

    /// Creates an emulated storage for testing.
    #[cfg(feature = "integration-testsuite")]
    pub fn new_emulated(container: &str) -> Self {
        use std::str::FromStr;

        let container_client = ClientBuilder::emulator().container_client(container);
        let uri = Uri::from_str(&format!("azure://tester/{container}")).unwrap();

        Self {
            container_client,
            uri,
            prefix: PathBuf::new(),
            multipart_policy: MultiPartPolicy::default(),
            retry_params: RetryParams::no_retries(),
        }
    }

    /// Sets the multipart policy.
    ///
    /// See `MultiPartPolicy`.
    #[cfg(feature = "integration-testsuite")]
    pub fn set_policy(&mut self, multipart_policy: MultiPartPolicy) {
        self.multipart_policy = multipart_policy;
    }

    /// Builds instance from URI.
    pub fn from_uri(
        azure_storage_config: &AzureStorageConfig,
        uri: &Uri,
    ) -> Result<AzureBlobStorage, StorageResolverError> {
        let storage_account_name =
            azure_storage_config.resolve_account_name().ok_or_else(|| {
                let message = format!(
                    "could not find Azure storage account name in environment variable `{}` or \
                     storage config",
                    AzureStorageConfig::AZURE_STORAGE_ACCOUNT_ENV_VAR
                );
                StorageResolverError::InvalidConfig(message)
            })?;
        let storage_credentials = if let Some(access_key) =
            azure_storage_config.resolve_access_key()
        {
            StorageCredentials::access_key(storage_account_name.clone(), access_key)
        } else if let Ok(credential) = azure_identity::create_credential() {
            StorageCredentials::token_credential(credential)
        } else {
            return Err(StorageResolverError::InvalidConfig(
                "could not find Azure storage account credentials using the following credential \
                 providers: environment, managed identity, and storage account access key"
                    .to_string(),
            ));
        };
        let (container_name, prefix) = parse_azure_uri(uri).ok_or_else(|| {
            let message = format!("failed to extract container name from Azure URI `{uri}`");
            StorageResolverError::InvalidUri(message)
        })?;
        let azure_blob_storage = AzureBlobStorage::new(
            storage_account_name,
            storage_credentials,
            uri.clone(),
            container_name,
        );
        Ok(azure_blob_storage.with_prefix(prefix))
    }

    /// Returns the blob name (a.k.a blob key).
    fn blob_name(&self, relative_path: &Path) -> String {
        let key_path = self.prefix.join(relative_path);
        key_path.to_string_lossy().to_string()
    }

    /// Downloads a blob as vector of bytes.
    async fn get_to_vec(
        &self,
        path: &Path,
        range_opt: Option<Range<usize>>,
    ) -> StorageResult<Vec<u8>> {
        let name = self.blob_name(path);
        let capacity = range_opt.as_ref().map(Range::len).unwrap_or(0);
        retry(&self.retry_params, || async {
            let (mut response_stream, _in_flight_guards) = if let Some(range) = range_opt.as_ref() {
                let stream = self
                    .container_client
                    .blob_client(&name)
                    .get()
                    .range(range.clone())
                    .into_stream();
                // only record ranged get request as being in flight
                let in_flight_guards = object_storage_get_slice_in_flight_guards(capacity);
                (stream, Some(in_flight_guards))
            } else {
                let stream = self.container_client.blob_client(&name).get().into_stream();
                (stream, None)
            };
            let mut buf: Vec<u8> = Vec::with_capacity(capacity);
            download_all(&mut response_stream, &mut buf).await?;

            Result::<_, AzureErrorWrapper>::Ok(buf)
        })
        .await
        .map_err(StorageError::from)
    }

    /// Performs a single part upload.
    async fn put_single_part<'a>(
        &'a self,
        name: &'a str,
        payload: Box<dyn crate::PutPayload>,
    ) -> StorageResult<()> {
        crate::STORAGE_METRICS.object_storage_put_parts.inc();
        crate::STORAGE_METRICS
            .object_storage_upload_num_bytes
            .inc_by(payload.len());
        retry(&self.retry_params, || async {
            let data = Bytes::from(payload.read_all().await?.to_vec());
            let hash = azure_storage_blobs::prelude::Hash::from(md5::compute(&data[..]).0);
            self.container_client
                .blob_client(name)
                .put_block_blob(data)
                .hash(hash)
                .into_future()
                .await?;
            Result::<(), AzureErrorWrapper>::Ok(())
        })
        .await?;
        Ok(())
    }

    /// Performs a multipart upload.
    async fn put_multi_part<'a>(
        &'a self,
        name: &'a str,
        payload: Box<dyn PutPayload>,
        part_len: u64,
        total_len: u64,
    ) -> StorageResult<()> {
        assert!(total_len > 0);
        let multipart_ranges =
            chunk_range(0..total_len as usize, part_len as usize).map(into_u64_range);

        let blob_client = self.container_client.blob_client(name);
        let upload_blocks_stream = tokio_stream::iter(multipart_ranges.enumerate())
            .map(|(num, range)| {
                let moved_blob_client = blob_client.clone();
                let moved_payload = payload.clone();
                crate::STORAGE_METRICS.object_storage_put_parts.inc();
                crate::STORAGE_METRICS
                    .object_storage_upload_num_bytes
                    .inc_by(range.end - range.start);
                async move {
                    retry(&self.retry_params, || async {
                        // zero pad block ids to make them sortable as strings
                        let block_id = format!("block:{:05}", num);
                        let (data, hash_digest) =
                            extract_range_data_and_hash(moved_payload.box_clone(), range.clone())
                                .await?;
                        let hash = azure_storage_blobs::prelude::Hash::from(hash_digest.0);
                        moved_blob_client
                            .put_block(block_id.clone(), data)
                            .hash(hash)
                            .into_future()
                            .await?;
                        Result::<_, AzureErrorWrapper>::Ok(block_id)
                    })
                    .await
                }
            })
            .buffer_unordered(self.multipart_policy.max_concurrent_uploads());

        // Collect and sort block ids to preserve part order for put_block_list.
        // Azure docs: "The put block list operation enforces the order in which blocks
        // are to be combined to create a blob".
        // https://docs.microsoft.com/en-us/rest/api/storageservices/put-block-list
        let mut block_ids: Vec<String> = upload_blocks_stream
            .try_collect()
            .await
            .map_err(StorageError::from)?;
        block_ids.sort_unstable();

        let block_list = BlockList {
            blocks: block_ids
                .into_iter()
                .map(BlobBlockType::new_uncommitted)
                .collect(),
        };

        // Commit all uploaded blocks.
        blob_client
            .put_block_list(block_list)
            .into_future()
            .await
            .map_err(AzureErrorWrapper::from)?;

        Ok(())
    }
}

#[async_trait]
impl Storage for AzureBlobStorage {
    async fn check_connectivity(&self) -> anyhow::Result<()> {
        if let Some(first_blob_result) = self
            .container_client
            .list_blobs()
            .max_results(NonZeroU32::new(1u32).expect("1 is always non-zero."))
            .into_stream()
            .next()
            .await
        {
            let _ = first_blob_result?;
        }
        Ok(())
    }

    async fn put(
        &self,
        path: &Path,
        payload: Box<dyn crate::PutPayload>,
    ) -> crate::StorageResult<()> {
        crate::STORAGE_METRICS.object_storage_put_total.inc();
        let name = self.blob_name(path);
        let total_len = payload.len();
        let part_num_bytes = self.multipart_policy.part_num_bytes(total_len);

        if part_num_bytes >= total_len {
            self.put_single_part(&name, payload).await?;
        } else {
            self.put_multi_part(&name, payload, part_num_bytes, total_len)
                .await?;
        }
        Ok(())
    }

    async fn copy_to(&self, path: &Path, output: &mut dyn SendableAsync) -> StorageResult<()> {
        let name = self.blob_name(path);
        let mut output_stream = self.container_client.blob_client(name).get().into_stream();

        while let Some(chunk_result) = output_stream.next().await {
            let chunk_response = chunk_result.map_err(AzureErrorWrapper::from)?;
            let chunk_response_body_stream = chunk_response
                .data
                .map_err(FutureError::other)
                .into_async_read()
                .compat();
            let mut body_stream_reader = BufReader::new(chunk_response_body_stream);
            let num_bytes_copied = tokio::io::copy_buf(&mut body_stream_reader, output).await?;
            STORAGE_METRICS
                .object_storage_download_num_bytes
                .inc_by(num_bytes_copied);
        }
        output.flush().await?;
        Ok(())
    }

    async fn delete(&self, path: &Path) -> StorageResult<()> {
        let blob_name = self.blob_name(path);
        let delete_res: Result<_, StorageError> = self
            .container_client
            .blob_client(blob_name)
            .delete()
            .into_future()
            .await
            .map_err(|err| AzureErrorWrapper::from(err).into());
        ignore_error_kind!(StorageErrorKind::NotFound, delete_res)?;
        Ok(())
    }

    async fn bulk_delete<'a>(&self, paths: &[&'a Path]) -> Result<(), BulkDeleteError> {
        // See https://github.com/Azure/azure-sdk-for-rust/issues/1068
        warn!(
            num_files = paths.len(),
            "`AzureBlobStorage` does not support batch delete. Falling back to sequential delete, \
             which might be slow and issue many requests."
        );
        let mut successes = Vec::with_capacity(paths.len());
        let mut failures = HashMap::new();

        let futures = paths
            .iter()
            .map(|path| async move {
                let delete_res = self.delete(path).await;
                (path, delete_res)
            })
            .collect::<Vec<_>>();
        let mut stream = futures::stream::iter(futures).buffer_unordered(100);

        while let Some((path, delete_res)) = stream.next().await {
            match delete_res {
                Ok(_) => successes.push(path.to_path_buf()),
                Err(error) => {
                    let failure = DeleteFailure {
                        error: Some(error),
                        ..Default::default()
                    };
                    failures.insert(path.to_path_buf(), failure);
                }
            };
        }
        if failures.is_empty() {
            Ok(())
        } else {
            Err(BulkDeleteError {
                successes,
                failures,
                ..Default::default()
            })
        }
    }

    #[instrument(level = "debug", skip(self, range), fields(range.start = range.start, range.end = range.end))]
    async fn get_slice(&self, path: &Path, range: Range<usize>) -> StorageResult<OwnedBytes> {
        self.get_to_vec(path, Some(range.clone()))
            .await
            .map(OwnedBytes::new)
            .map_err(|err| {
                err.add_context(format!(
                    "failed to fetch slice {:?} for object: {}/{}",
                    range,
                    self.uri,
                    path.display(),
                ))
            })
    }

    #[instrument(level = "debug", skip(self, range), fields(range.start = range.start, range.end = range.end))]
    async fn get_slice_stream(
        &self,
        path: &Path,
        range: Range<usize>,
    ) -> StorageResult<Box<dyn AsyncRead + Send + Unpin>> {
        retry(&self.retry_params, || async {
            let range = range.clone();
            let name = self.blob_name(path);
            let page_stream = self
                .container_client
                .blob_client(name)
                .get()
                .range(range)
                .into_stream();
            let mut bytes_stream = page_stream
                .map(|page_res| page_res.map(|page| page.data).map_err(FutureError::other))
                .try_flatten()
                .map(|bytes_res| bytes_res.map_err(FutureError::other));
            // Peek into the stream so that any early error can be retried
            let first_chunk = bytes_stream.next().await;
            let reader: Box<dyn AsyncRead + Send + Unpin> = if let Some(res) = first_chunk {
                let first_chunk = res.map_err(AzureErrorWrapper::from)?;
                let reconstructed_stream =
                    Box::pin(futures::stream::once(async { Ok(first_chunk) }).chain(bytes_stream));
                Box::new(StreamReader::new(reconstructed_stream))
            } else {
                Box::new(tokio::io::empty())
            };
            Result::<Box<dyn AsyncRead + Send + Unpin>, AzureErrorWrapper>::Ok(reader)
        })
        .await
        .map_err(|e| e.into())
    }

    #[instrument(level = "debug", skip(self), fields(fetched_bytes_len))]
    async fn get_all(&self, path: &Path) -> StorageResult<OwnedBytes> {
        let data = self
            .get_to_vec(path, None)
            .await
            .map(OwnedBytes::new)
            .map_err(|err| {
                err.add_context(format!(
                    "failed to fetch object: {}/{}",
                    self.uri,
                    path.display()
                ))
            })?;
        tracing::Span::current().record("fetched_bytes_len", data.len());
        Ok(data)
    }

    async fn file_num_bytes(&self, path: &Path) -> StorageResult<u64> {
        let name = self.blob_name(path);
        let properties_result = self
            .container_client
            .blob_client(name)
            .get_properties()
            .into_future()
            .await;
        match properties_result {
            Ok(response) => Ok(response.blob.properties.content_length),
            Err(err) => Err(StorageError::from(AzureErrorWrapper::from(err))),
        }
    }

    fn uri(&self) -> &Uri {
        &self.uri
    }
}

/// Copy range of payload into `Bytes` and return the computed md5.
async fn extract_range_data_and_hash(
    payload: Box<dyn PutPayload>,
    range: Range<u64>,
) -> io::Result<(Bytes, Digest)> {
    let mut reader = payload
        .range_byte_stream(range.clone())
        .await?
        .into_async_read();
    let mut buf: Vec<u8> = Vec::with_capacity(range.count());
    tokio::io::copy(&mut reader, &mut buf).await?;
    let data = Bytes::from(buf);
    let hash = md5::compute(&data[..]);
    Ok((data, hash))
}

pub fn parse_azure_uri(uri: &Uri) -> Option<(String, PathBuf)> {
    // Ex: azure://container/prefix.
    static URI_PTN: OnceCell<Regex> = OnceCell::new();

    let captures = URI_PTN
        .get_or_init(|| {
            Regex::new(r"azure(\+[^:]+)?://(?P<container>[^/]+)(/(?P<prefix>.+))?")
                .expect("The regular expression should compile.")
        })
        .captures(uri.as_str())?;

    let container = captures.name("container")?.as_str().to_string();
    let prefix = captures
        .name("prefix")
        .map(|prefix_match| PathBuf::from(prefix_match.as_str()))
        .unwrap_or_default();
    Some((container, prefix))
}

/// Collect a download stream into an output buffer.
async fn download_all(
    chunk_stream: &mut Pageable<GetBlobResponse, AzureError>,
    output: &mut Vec<u8>,
) -> Result<(), AzureErrorWrapper> {
    output.clear();
    while let Some(chunk_result) = chunk_stream.next().await {
        let chunk_response = chunk_result?;
        let chunk_response_body_stream = chunk_response
            .data
            .map_err(FutureError::other)
            .into_async_read()
            .compat();
        let mut body_stream_reader = BufReader::new(chunk_response_body_stream);
        let num_bytes_copied = tokio::io::copy_buf(&mut body_stream_reader, output).await?;
        crate::STORAGE_METRICS
            .object_storage_download_num_bytes
            .inc_by(num_bytes_copied);
    }
    // When calling `get_all`, the Vec capacity is not properly set.
    output.shrink_to_fit();
    Ok(())
}

#[derive(Error, Debug)]
#[error("Azure error wrapper(inner={inner})")]
struct AzureErrorWrapper {
    inner: AzureError,
}

impl Retryable for AzureErrorWrapper {
    fn is_retryable(&self) -> bool {
        match self.inner.kind() {
            ErrorKind::HttpResponse { status, .. } => !matches!(
                status,
                StatusCode::NotFound
                    | StatusCode::Unauthorized
                    | StatusCode::BadRequest
                    | StatusCode::Forbidden
            ),
            ErrorKind::Io => true,
            _ => false,
        }
    }
}

impl From<AzureError> for AzureErrorWrapper {
    fn from(err: AzureError) -> Self {
        AzureErrorWrapper { inner: err }
    }
}

impl From<io::Error> for AzureErrorWrapper {
    fn from(err: io::Error) -> Self {
        AzureErrorWrapper {
            inner: AzureError::new(ErrorKind::Io, err),
        }
    }
}

impl From<AzureErrorWrapper> for StorageError {
    fn from(err: AzureErrorWrapper) -> Self {
        match err.inner.kind() {
            ErrorKind::HttpResponse { status, .. } => match status {
                StatusCode::NotFound => StorageErrorKind::NotFound.with_error(err),
                _ => StorageErrorKind::Service.with_error(err),
            },
            ErrorKind::Io => StorageErrorKind::Io.with_error(err),
            ErrorKind::Credential => StorageErrorKind::Unauthorized.with_error(err),
            _ => StorageErrorKind::Internal.with_error(err),
        }
    }
}

#[cfg(test)]
mod tests {
    use quickwit_common::uri::Uri;

    use crate::object_storage::azure_blob_storage::parse_azure_uri;

    #[test]
    fn test_parse_azure_uri() {
        assert!(parse_azure_uri(&Uri::for_test("azure://")).is_none());

        let (container, prefix) =
            parse_azure_uri(&Uri::for_test("azure://test-container")).unwrap();
        assert_eq!(container, "test-container");
        assert!(prefix.to_str().unwrap().is_empty());

        let (container, prefix) =
            parse_azure_uri(&Uri::for_test("azure://test-container/")).unwrap();
        assert_eq!(container, "test-container");
        assert!(prefix.to_str().unwrap().is_empty());

        let (container, prefix) =
            parse_azure_uri(&Uri::for_test("azure://test-container/indexes")).unwrap();
        assert_eq!(container, "test-container");
        assert_eq!(prefix.to_str().unwrap(), "indexes");
    }
}


================================================
FILE: quickwit/quickwit-storage/src/object_storage/error.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use aws_sdk_s3::error::{DisplayErrorContext, ProvideErrorMetadata, SdkError};
use aws_sdk_s3::operation::abort_multipart_upload::AbortMultipartUploadError;
use aws_sdk_s3::operation::complete_multipart_upload::CompleteMultipartUploadError;
use aws_sdk_s3::operation::create_multipart_upload::CreateMultipartUploadError;
use aws_sdk_s3::operation::delete_object::DeleteObjectError;
use aws_sdk_s3::operation::delete_objects::DeleteObjectsError;
use aws_sdk_s3::operation::get_object::GetObjectError;
use aws_sdk_s3::operation::head_object::HeadObjectError;
use aws_sdk_s3::operation::put_object::PutObjectError;
use aws_sdk_s3::operation::upload_part::UploadPartError;

use crate::{StorageError, StorageErrorKind};

impl<E> From<SdkError<E>> for StorageError
where E: std::error::Error + ToStorageErrorKind + Send + Sync + 'static
{
    fn from(error: SdkError<E>) -> StorageError {
        let error_kind = match &error {
            SdkError::ConstructionFailure(_) => StorageErrorKind::Internal,
            SdkError::DispatchFailure(failure) => {
                if failure.is_io() {
                    StorageErrorKind::Io
                } else if failure.is_timeout() {
                    StorageErrorKind::Timeout
                } else {
                    StorageErrorKind::Internal
                }
            }
            SdkError::ResponseError(response_error) => {
                match response_error.raw().status().as_u16() {
                    404 /* NOT_FOUND */ => StorageErrorKind::NotFound,
                    403 /* UNAUTHORIZED */ => StorageErrorKind::Unauthorized,
                    _ => StorageErrorKind::Internal,
                }
            }
            SdkError::ServiceError(service_error) => service_error.err().to_storage_error_kind(),
            SdkError::TimeoutError(_) => StorageErrorKind::Timeout,
            _ => StorageErrorKind::Internal,
        };
        let source = anyhow::anyhow!("{}", DisplayErrorContext(error));
        error_kind.with_error(source)
    }
}

pub trait ToStorageErrorKind {
    fn to_storage_error_kind(&self) -> StorageErrorKind;
}

impl ToStorageErrorKind for GetObjectError {
    fn to_storage_error_kind(&self) -> StorageErrorKind {
        let error_code = self.code().unwrap_or("unknown");
        crate::STORAGE_METRICS
            .object_storage_get_errors_total
            .with_label_values([error_code])
            .inc();
        match self {
            GetObjectError::InvalidObjectState(_) => StorageErrorKind::Service,
            GetObjectError::NoSuchKey(_) => StorageErrorKind::NotFound,
            _ => StorageErrorKind::Service,
        }
    }
}

impl ToStorageErrorKind for DeleteObjectError {
    fn to_storage_error_kind(&self) -> StorageErrorKind {
        StorageErrorKind::Service
    }
}

impl ToStorageErrorKind for DeleteObjectsError {
    fn to_storage_error_kind(&self) -> StorageErrorKind {
        StorageErrorKind::Service
    }
}

impl ToStorageErrorKind for UploadPartError {
    fn to_storage_error_kind(&self) -> StorageErrorKind {
        StorageErrorKind::Service
    }
}

impl ToStorageErrorKind for CompleteMultipartUploadError {
    fn to_storage_error_kind(&self) -> StorageErrorKind {
        StorageErrorKind::Service
    }
}

impl ToStorageErrorKind for AbortMultipartUploadError {
    fn to_storage_error_kind(&self) -> StorageErrorKind {
        match self {
            AbortMultipartUploadError::NoSuchUpload(_) => StorageErrorKind::Internal,
            _ => StorageErrorKind::Service,
        }
    }
}

impl ToStorageErrorKind for CreateMultipartUploadError {
    fn to_storage_error_kind(&self) -> StorageErrorKind {
        StorageErrorKind::Service
    }
}

impl ToStorageErrorKind for PutObjectError {
    fn to_storage_error_kind(&self) -> StorageErrorKind {
        StorageErrorKind::Service
    }
}

impl ToStorageErrorKind for HeadObjectError {
    fn to_storage_error_kind(&self) -> StorageErrorKind {
        match self {
            HeadObjectError::NotFound(_) => StorageErrorKind::NotFound,
            _ => StorageErrorKind::Service,
        }
    }
}


================================================
FILE: quickwit/quickwit-storage/src/object_storage/mod.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

mod error;

mod s3_compatible_storage;
pub use self::s3_compatible_storage::S3CompatibleObjectStorage;
pub use self::s3_compatible_storage_resolver::S3CompatibleObjectStorageFactory;

mod policy;
pub use crate::object_storage::policy::MultiPartPolicy;

mod s3_compatible_storage_resolver;

#[cfg(feature = "azure")]
mod azure_blob_storage;
#[cfg(feature = "azure")]
pub use self::azure_blob_storage::{AzureBlobStorage, AzureBlobStorageFactory};


================================================
FILE: quickwit/quickwit-storage/src/object_storage/policy.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

/// The multipart policy defines when and how multipart upload / download should happen.
///
/// The right settings might be vendor specific, but if not available the default values
/// should be safe.
pub struct MultiPartPolicy {
    /// Ideal part size.
    /// Since S3 has a constraint on the number of parts, it cannot always be
    /// respected.
    pub target_part_num_bytes: usize,
    /// Maximum number of parts allowed.
    pub max_num_parts: usize,
    /// Threshold above which multipart is triggered.
    pub multipart_threshold_num_bytes: u64,
    /// Maximum size allowed for an object.
    pub max_object_num_bytes: u64,
    /// Maximum number of parts to be upload concurrently.
    pub max_concurrent_uploads: usize,
}

impl MultiPartPolicy {
    /// This function returns the size of the part that should
    /// be used. We should have `part_num_bytes(len)` <= `len`.
    ///
    /// If this function returns `len`, then multipart upload
    /// will not be used.
    pub fn part_num_bytes(&self, len: u64) -> u64 {
        assert!(
            len < self.max_object_num_bytes,
            "This object storage does not support object of that size {}",
            self.max_object_num_bytes
        );
        assert!(
            self.max_num_parts > 0,
            "Misconfiguration: max_num_parts == 0 makes no sense."
        );
        if len < self.multipart_threshold_num_bytes || self.max_num_parts == 1 {
            return len;
        }
        let max_num_parts = self.max_num_parts as u64;
        // complete part is the smallest integer such that
        // <max_num_parts> * <min_part_len> >= len.
        let min_part_len = 1u64 + (len - 1u64) / max_num_parts;
        (min_part_len).max(self.target_part_num_bytes as u64)
    }

    /// Limits the number of parts that can be concurrently uploaded.
    pub fn max_concurrent_uploads(&self) -> usize {
        self.max_concurrent_uploads
    }
}

// The best default value may differ depending on vendors.
impl Default for MultiPartPolicy {
    fn default() -> Self {
        MultiPartPolicy {
            // S3 limits part size from 5M to 5GB, we want to end up with as few parts as possible
            // since each part is charged as a put request.
            target_part_num_bytes: 5_000_000_000, // 5GB
            multipart_threshold_num_bytes: 128 * 1_024 * 1_024, // 128 MiB
            max_num_parts: 10_000,
            max_object_num_bytes: 5_000_000_000_000u64, // S3 allows up to 5TB objects
            max_concurrent_uploads: 100,
        }
    }
}


================================================
FILE: quickwit/quickwit-storage/src/object_storage/s3_compatible_storage.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::HashMap;
use std::ops::Range;
use std::path::{Path, PathBuf};
use std::pin::Pin;
use std::task::{Context, Poll};
use std::{fmt, io};

use anyhow::{Context as AnyhhowContext, anyhow};
use async_trait::async_trait;
use aws_credential_types::provider::SharedCredentialsProvider;
use aws_sdk_s3::Client as S3Client;
use aws_sdk_s3::config::{Credentials, Region};
use aws_sdk_s3::error::{ProvideErrorMetadata, SdkError};
use aws_sdk_s3::operation::delete_objects::DeleteObjectsOutput;
use aws_sdk_s3::operation::get_object::{GetObjectError, GetObjectOutput};
use aws_sdk_s3::primitives::ByteStream;
use aws_sdk_s3::types::builders::ObjectIdentifierBuilder;
use aws_sdk_s3::types::{CompletedMultipartUpload, CompletedPart, Delete, ObjectIdentifier};
use base64::prelude::{BASE64_STANDARD, Engine};
use futures::{StreamExt, stream};
use once_cell::sync::{Lazy, OnceCell};
use quickwit_aws::retry::{AwsRetryable, aws_retry};
use quickwit_aws::{aws_behavior_version, get_aws_config};
use quickwit_common::retry::{Retry, RetryParams};
use quickwit_common::uri::Uri;
use quickwit_common::{chunk_range, into_u64_range};
use quickwit_config::S3StorageConfig;
use regex::Regex;
use tokio::io::{AsyncRead, AsyncReadExt, AsyncWriteExt, BufReader, ReadBuf};
use tokio::sync::Semaphore;
use tracing::{info, instrument, warn};

use crate::metrics::object_storage_get_slice_in_flight_guards;
use crate::object_storage::MultiPartPolicy;
use crate::storage::SendableAsync;
use crate::{
    BulkDeleteError, DeleteFailure, OwnedBytes, STORAGE_METRICS, Storage, StorageError,
    StorageErrorKind, StorageResolverError, StorageResult,
};

/// Semaphore to limit the number of concurrent requests to the object store. Some object stores
/// (R2, SeaweedFs...) return errors when too many concurrent requests are emitted.
static REQUEST_SEMAPHORE: Lazy<Semaphore> = Lazy::new(|| {
    let num_permits: usize =
        quickwit_common::get_from_env("QW_S3_MAX_CONCURRENCY", 10_000usize, false);
    Semaphore::new(num_permits)
});

/// Wrap the async read handle together with a permit to keep the permit alive
/// until the handle is dropped
struct S3AsyncRead<T: AsyncRead + Send + Unpin> {
    pub read: T,
    pub _permit: Result<tokio::sync::SemaphorePermit<'static>, tokio::sync::AcquireError>,
}

impl<T: AsyncRead + Send + Unpin> AsyncRead for S3AsyncRead<T> {
    fn poll_read(
        self: Pin<&mut Self>,
        cx: &mut Context<'_>,
        buf: &mut ReadBuf<'_>,
    ) -> Poll<io::Result<()>> {
        let self_unpin = self.get_mut();
        Pin::new(&mut self_unpin.read).poll_read(cx, buf)
    }
}

/// S3-compatible object storage implementation.
pub struct S3CompatibleObjectStorage {
    s3_client: S3Client,
    uri: Uri,
    bucket: String,
    prefix: PathBuf,
    multipart_policy: MultiPartPolicy,
    retry_params: RetryParams,
    disable_multi_object_delete: bool,
    disable_multipart_upload: bool,
}

impl fmt::Debug for S3CompatibleObjectStorage {
    fn fmt(&self, formatter: &mut fmt::Formatter) -> fmt::Result {
        formatter
            .debug_struct("S3CompatibleObjectStorage")
            .field("bucket", &self.bucket)
            .field("prefix", &self.prefix)
            .finish()
    }
}

fn get_credentials_provider(
    s3_storage_config: &S3StorageConfig,
) -> Option<SharedCredentialsProvider> {
    match (
        &s3_storage_config.access_key_id,
        &s3_storage_config.secret_access_key,
    ) {
        (Some(access_key_id), Some(secret_access_key)) => {
            info!("using S3 credentials defined in storage config");
            let credentials = Credentials::from_keys(access_key_id, secret_access_key, None);
            let credentials_provider = SharedCredentialsProvider::new(credentials);
            Some(credentials_provider)
        }
        _ => None,
    }
}

fn get_region(s3_storage_config: &S3StorageConfig) -> Option<Region> {
    s3_storage_config.region.clone().map(|region| {
        info!(region=%region, "using S3 region defined in storage config");
        Region::new(region)
    })
}

pub async fn create_s3_client(s3_storage_config: &S3StorageConfig) -> S3Client {
    let aws_config = get_aws_config().await;
    let credentials_provider =
        get_credentials_provider(s3_storage_config).or(aws_config.credentials_provider());
    let region = get_region(s3_storage_config).or(aws_config.region().cloned());
    let mut s3_config = aws_sdk_s3::Config::builder()
        .behavior_version(aws_behavior_version())
        .region(region);

    if let Some(identity_cache) = aws_config.identity_cache() {
        s3_config.set_identity_cache(identity_cache);
    }
    s3_config.set_credentials_provider(credentials_provider);
    s3_config.set_force_path_style(s3_storage_config.force_path_style_access());
    s3_config.set_http_client(aws_config.http_client());
    s3_config.set_retry_config(aws_config.retry_config().cloned());
    s3_config.set_sleep_impl(aws_config.sleep_impl());
    s3_config.set_stalled_stream_protection(aws_config.stalled_stream_protection());
    s3_config.set_timeout_config(aws_config.timeout_config().cloned());

    if let Some(endpoint) = s3_storage_config.endpoint() {
        info!(endpoint=%endpoint, "using S3 endpoint defined in storage config or environment variable");
        s3_config.set_endpoint_url(Some(endpoint));
    }
    S3Client::from_conf(s3_config.build())
}

impl S3CompatibleObjectStorage {
    /// Creates an object storage given a region and an uri.
    pub async fn from_uri(
        s3_storage_config: &S3StorageConfig,
        uri: &Uri,
    ) -> Result<Self, StorageResolverError> {
        let s3_client = create_s3_client(s3_storage_config).await;
        Self::from_uri_and_client(s3_storage_config, uri, s3_client).await
    }

    /// Creates an object storage given a region, an uri and an S3 client.
    pub async fn from_uri_and_client(
        s3_storage_config: &S3StorageConfig,
        uri: &Uri,
        s3_client: S3Client,
    ) -> Result<Self, StorageResolverError> {
        let (bucket, prefix) = parse_s3_uri(uri).ok_or_else(|| {
            let message = format!("failed to extract bucket name from S3 URI: {uri}");
            StorageResolverError::InvalidUri(message)
        })?;
        let retry_params = RetryParams::aggressive();
        let disable_multi_object_delete = s3_storage_config.disable_multi_object_delete;
        let disable_multipart_upload = s3_storage_config.disable_multipart_upload;
        Ok(Self {
            s3_client,
            uri: uri.clone(),
            bucket,
            prefix,
            multipart_policy: MultiPartPolicy::default(),
            retry_params,
            disable_multi_object_delete,
            disable_multipart_upload,
        })
    }

    /// Sets a specific for all buckets.
    ///
    /// This method overrides any existing prefix. (It does NOT
    /// append the argument to any existing prefix.)
    pub fn with_prefix(self, prefix: PathBuf) -> Self {
        Self {
            s3_client: self.s3_client,
            uri: self.uri,
            bucket: self.bucket,
            prefix,
            multipart_policy: self.multipart_policy,
            retry_params: self.retry_params,
            disable_multi_object_delete: self.disable_multi_object_delete,
            disable_multipart_upload: self.disable_multipart_upload,
        }
    }

    /// Sets the multipart policy.
    ///
    /// See `MultiPartPolicy`.
    #[cfg(feature = "integration-testsuite")]
    pub fn set_policy(&mut self, multipart_policy: MultiPartPolicy) {
        self.multipart_policy = multipart_policy;
    }
}

pub fn parse_s3_uri(uri: &Uri) -> Option<(String, PathBuf)> {
    static S3_URI_PTN: OnceCell<Regex> = OnceCell::new();

    let captures = S3_URI_PTN
        .get_or_init(|| {
            // s3://bucket/path/to/object
            Regex::new(r"s3(\+[^:]+)?://(?P<bucket>[^/]+)(/(?P<prefix>.+))?")
                .expect("The regular expression should compile.")
        })
        .captures(uri.as_str())?;

    let bucket = captures.name("bucket")?.as_str().to_string();
    let prefix = captures
        .name("prefix")
        .map(|prefix_match| PathBuf::from(prefix_match.as_str()))
        .unwrap_or_default();
    Some((bucket, prefix))
}

#[derive(Clone, Debug)]
struct MultipartUploadId(pub String);

#[derive(Clone, Debug)]
struct Part {
    pub part_number: usize,
    pub range: Range<u64>,
    pub md5: md5::Digest,
}

impl Part {
    fn len(&self) -> u64 {
        self.range.end - self.range.start
    }
}

const MD5_CHUNK_SIZE: usize = 1_000_000;

async fn compute_md5<T: AsyncRead + std::marker::Unpin>(mut read: T) -> io::Result<md5::Digest> {
    let mut checksum = md5::Context::new();
    let mut buf = vec![0; MD5_CHUNK_SIZE];
    loop {
        let read_len = read.read(&mut buf).await?;
        checksum.consume(&buf[..read_len]);
        if read_len == 0 {
            return Ok(checksum.finalize());
        }
    }
}

impl S3CompatibleObjectStorage {
    fn key(&self, relative_path: &Path) -> String {
        // FIXME: This may not work on Windows.
        let key_path = self.prefix.join(relative_path);
        key_path.to_string_lossy().to_string()
    }

    fn relative_path(&self, key: &str) -> PathBuf {
        // FIXME: This may not work on Windows.
        Path::new(key)
            .strip_prefix(&self.prefix)
            .expect("The prefix should have been prepended to the key before this method call.")
            .to_path_buf()
    }

    async fn put_single_part_single_try<'a>(
        &'a self,
        bucket: &'a str,
        key: &'a str,
        payload: Box<dyn crate::PutPayload>,
        len: u64,
    ) -> Result<(), Retry<StorageError>> {
        let body = payload
            .byte_stream()
            .await
            .map_err(|io_error| Retry::Permanent(StorageError::from(io_error)))?;

        crate::STORAGE_METRICS.object_storage_put_parts.inc();
        crate::STORAGE_METRICS
            .object_storage_upload_num_bytes
            .inc_by(len);

        self.s3_client
            .put_object()
            .bucket(bucket)
            .key(key)
            .body(body)
            .content_length(len as i64)
            .send()
            .await
            .map_err(|sdk_error| {
                if sdk_error.is_retryable() {
                    Retry::Transient(StorageError::from(sdk_error))
                } else {
                    Retry::Permanent(StorageError::from(sdk_error))
                }
            })?;
        Ok(())
    }

    async fn put_single_part<'a>(
        &'a self,
        key: &'a str,
        payload: Box<dyn crate::PutPayload>,
        len: u64,
    ) -> StorageResult<()> {
        let bucket = &self.bucket;
        aws_retry(&self.retry_params, || async {
            self.put_single_part_single_try(bucket, key, payload.clone(), len)
                .await
        })
        .await
        .map_err(|error| error.into_inner())?;
        Ok(())
    }

    async fn create_multipart_upload(&self, key: &str) -> StorageResult<MultipartUploadId> {
        let upload_id = aws_retry(&self.retry_params, || async {
            self.s3_client
                .create_multipart_upload()
                .bucket(self.bucket.clone())
                .key(key)
                .send()
                .await
        })
        .await?
        .upload_id
        .ok_or_else(|| {
            StorageErrorKind::Internal
                .with_error(anyhow!("the returned multipart upload id was null"))
        })?;
        Ok(MultipartUploadId(upload_id))
    }

    async fn create_multipart_requests(
        &self,
        payload: Box<dyn crate::PutPayload>,
        len: u64,
        part_len: u64,
    ) -> io::Result<Vec<Part>> {
        assert!(len > 0);
        let multipart_ranges = chunk_range(0..len as usize, part_len as usize)
            .map(into_u64_range)
            .collect::<Vec<_>>();

        let mut parts = Vec::with_capacity(multipart_ranges.len());

        for (multipart_id, multipart_range) in multipart_ranges.into_iter().enumerate() {
            let read = payload
                .range_byte_stream(multipart_range.clone())
                .await?
                .into_async_read();
            let md5 = compute_md5(read).await?;

            let part = Part {
                part_number: multipart_id + 1, // parts are 1-indexed
                range: multipart_range,
                md5,
            };
            parts.push(part);
        }
        Ok(parts)
    }

    fn build_delete_batch_requests<'a>(
        &self,
        delete_paths: &'a [&'a Path],
    ) -> anyhow::Result<Vec<(&'a [&'a Path], Delete)>> {
        #[cfg(test)]
        const MAX_NUM_KEYS: usize = 3;

        #[cfg(not(test))]
        const MAX_NUM_KEYS: usize = 1_000;

        let path_chunks = delete_paths.chunks(MAX_NUM_KEYS);
        let num_delete_requests = path_chunks.len();
        let mut delete_requests: Vec<(&[&Path], Delete)> = Vec::with_capacity(num_delete_requests);

        for path_chunk in path_chunks {
            let object_ids: Vec<ObjectIdentifier> = path_chunk
                .iter()
                .map(|path| {
                    let key = self.key(path);
                    ObjectIdentifierBuilder::default()
                        .key(key)
                        .build()
                        .context("failed to build object identifier")
                })
                .collect::<anyhow::Result<_>>()?;
            let delete = Delete::builder()
                .set_objects(Some(object_ids))
                .build()
                .context("failed to build delete request")?;
            delete_requests.push((path_chunk, delete));
        }
        Ok(delete_requests)
    }

    async fn upload_part<'a>(
        &'a self,
        upload_id: MultipartUploadId,
        key: &'a str,
        part: Part,
        payload: Box<dyn crate::PutPayload>,
    ) -> Result<CompletedPart, Retry<StorageError>> {
        let byte_stream = payload
            .range_byte_stream(part.range.clone())
            .await
            .map_err(StorageError::from)
            .map_err(Retry::Permanent)?;
        let md5 = BASE64_STANDARD.encode(part.md5.0);

        crate::STORAGE_METRICS.object_storage_put_parts.inc();
        crate::STORAGE_METRICS
            .object_storage_upload_num_bytes
            .inc_by(part.len());

        let upload_part_output = self
            .s3_client
            .upload_part()
            .bucket(self.bucket.clone())
            .key(key)
            .body(byte_stream)
            .content_length(part.len() as i64)
            .content_md5(md5)
            .part_number(part.part_number as i32)
            .upload_id(upload_id.0)
            .send()
            .await
            .map_err(|s3_err| {
                if s3_err.is_retryable() {
                    Retry::Transient(StorageError::from(s3_err))
                } else {
                    Retry::Permanent(StorageError::from(s3_err))
                }
            })?;

        let completed_part = CompletedPart::builder()
            .set_e_tag(upload_part_output.e_tag)
            .part_number(part.part_number as i32)
            .build();
        Ok(completed_part)
    }

    async fn put_multipart<'a>(
        &'a self,
        key: &'a str,
        payload: Box<dyn crate::PutPayload>,
        part_len: u64,
        total_len: u64,
    ) -> StorageResult<()> {
        let upload_id = self.create_multipart_upload(key).await?;
        let parts = self
            .create_multipart_requests(payload.clone(), total_len, part_len)
            .await?;
        let max_concurrent_upload = self.multipart_policy.max_concurrent_uploads();
        let completed_parts_res: StorageResult<Vec<CompletedPart>> =
            stream::iter(parts.into_iter().map(|part| {
                let payload = payload.clone();
                let upload_id = upload_id.clone();
                aws_retry(&self.retry_params, move || {
                    self.upload_part(upload_id.clone(), key, part.clone(), payload.clone())
                })
            }))
            .buffered(max_concurrent_upload)
            .collect::<Vec<_>>()
            .await
            .into_iter()
            .map(|res| res.map_err(|e| e.into_inner()))
            .collect();
        match completed_parts_res {
            Ok(completed_parts) => {
                self.complete_multipart_upload(key, completed_parts, &upload_id.0)
                    .await
            }
            Err(upload_error) => {
                let abort_multipart_upload_res: StorageResult<()> =
                    self.abort_multipart_upload(key, &upload_id.0).await;
                if let Err(abort_error) = abort_multipart_upload_res {
                    warn!(
                        key = %key,
                        error = ?abort_error,
                        "Failed to abort multipart upload."
                    );
                }
                Err(upload_error)
            }
        }
    }

    async fn complete_multipart_upload(
        &self,
        key: &str,
        completed_parts: Vec<CompletedPart>,
        upload_id: &str,
    ) -> StorageResult<()> {
        let completed_upload = CompletedMultipartUpload::builder()
            .set_parts(Some(completed_parts))
            .build();
        aws_retry(&self.retry_params, || async {
            self.s3_client
                .complete_multipart_upload()
                .bucket(self.bucket.clone())
                .key(key)
                .multipart_upload(completed_upload.clone())
                .upload_id(upload_id)
                .send()
                .await
        })
        .await?;
        Ok(())
    }

    async fn abort_multipart_upload(&self, key: &str, upload_id: &str) -> StorageResult<()> {
        aws_retry(&self.retry_params, || async {
            self.s3_client
                .abort_multipart_upload()
                .bucket(self.bucket.clone())
                .key(key)
                .upload_id(upload_id)
                .send()
                .await
        })
        .await?;
        Ok(())
    }

    async fn get_object(
        &self,
        path: &Path,
        range_opt: Option<Range<usize>>,
    ) -> Result<GetObjectOutput, SdkError<GetObjectError>> {
        let key = self.key(path);
        let range_str = range_opt.map(|range| format!("bytes={}-{}", range.start, range.end - 1));

        crate::STORAGE_METRICS.object_storage_get_total.inc();

        let get_object_output = self
            .s3_client
            .get_object()
            .bucket(self.bucket.clone())
            .key(key)
            .set_range(range_str)
            .send()
            .await?;
        Ok(get_object_output)
    }

    async fn get_to_vec(
        &self,
        path: &Path,
        range_opt: Option<Range<usize>>,
    ) -> StorageResult<Vec<u8>> {
        let cap = range_opt.as_ref().map(Range::len).unwrap_or(0);
        let get_object_output = aws_retry(&self.retry_params, || {
            self.get_object(path, range_opt.clone())
        })
        .await?;
        // only record ranged get request as being in flight
        let _in_flight_guards =
            range_opt.map(|range| object_storage_get_slice_in_flight_guards(range.len()));
        let mut buf: Vec<u8> = Vec::with_capacity(cap);
        download_all(get_object_output.body, &mut buf).await?;
        Ok(buf)
    }

    /// Bulk delete implementation based on the DeleteObject API:
    /// <https://docs.aws.amazon.com/AmazonS3/latest/API/API_DeleteObject.html>
    async fn bulk_delete_single(&self, paths: &[&Path]) -> Result<(), BulkDeleteError> {
        let mut successes = Vec::with_capacity(paths.len());
        let mut failures = HashMap::new();

        let futures = paths
            .iter()
            .map(|path| async move {
                let delete_res = self.delete(path).await;
                (path, delete_res)
            })
            .collect::<Vec<_>>();
        let mut stream = futures::stream::iter(futures).buffer_unordered(100);

        while let Some((path, delete_res)) = stream.next().await {
            match delete_res {
                Ok(_) => successes.push(path.to_path_buf()),
                Err(error) => {
                    let failure = DeleteFailure {
                        error: Some(error),
                        ..Default::default()
                    };
                    failures.insert(path.to_path_buf(), failure);
                }
            };
        }
        if failures.is_empty() {
            Ok(())
        } else {
            Err(BulkDeleteError {
                successes,
                failures,
                ..Default::default()
            })
        }
    }

    /// Bulk delete implementation based on the DeleteObjects API, also called Multi-Object Delete
    /// API: <https://docs.aws.amazon.com/AmazonS3/latest/API/API_DeleteObjects.html>
    async fn bulk_delete_multi(&self, paths: &[&Path]) -> Result<(), BulkDeleteError> {
        let _permit = REQUEST_SEMAPHORE.acquire().await;

        let delete_requests: Vec<(&[&Path], Delete)> = self
            .build_delete_batch_requests(paths)
            .map_err(|error: anyhow::Error| {
                let unattempted = paths.iter().copied().map(Path::to_path_buf).collect();
                BulkDeleteError {
                    error: Some(StorageErrorKind::Internal.with_error(error)),
                    successes: Default::default(),
                    failures: Default::default(),
                    unattempted,
                }
            })?;

        let mut error = None;
        let mut successes = Vec::with_capacity(paths.len());
        let mut failures = HashMap::new();
        let mut unattempted = Vec::new();

        let mut delete_requests_it = delete_requests.iter();

        for (path_chunk, delete) in &mut delete_requests_it {
            let delete_objects_res: StorageResult<DeleteObjectsOutput> =
                aws_retry(&self.retry_params, || async {
                    crate::STORAGE_METRICS
                        .object_storage_bulk_delete_requests_total
                        .inc();
                    let _timer = crate::STORAGE_METRICS
                        .object_storage_bulk_delete_request_duration
                        .start_timer();
                    self.s3_client
                        .delete_objects()
                        .bucket(self.bucket.clone())
                        .delete(delete.clone())
                        .send()
                        .await
                })
                .await
                .map_err(Into::into);

            match delete_objects_res {
                Ok(delete_objects_output) => {
                    if let Some(deleted_objects) = delete_objects_output.deleted {
                        for deleted_object in deleted_objects {
                            if let Some(key) = deleted_object.key {
                                let path = self.relative_path(&key);
                                successes.push(path);
                            }
                        }
                    }
                    if let Some(s3_errors) = delete_objects_output.errors {
                        for s3_error in s3_errors {
                            if let Some(key) = s3_error.key {
                                let path = self.relative_path(&key);
                                match s3_error.code {
                                    Some(code) if code == "NoSuchKey" => {
                                        successes.push(path);
                                    }
                                    _ => {
                                        let failure = DeleteFailure {
                                            code: s3_error.code,
                                            message: s3_error.message,
                                            ..Default::default()
                                        };
                                        failures.insert(path, failure);
                                    }
                                }
                            }
                        }
                    }
                }
                Err(delete_objects_error) => {
                    error = Some(delete_objects_error);
                    unattempted.extend(path_chunk.iter().copied().map(PathBuf::from));
                    break;
                }
            }
        }

        if error.is_none() && failures.is_empty() {
            return Ok(());
        }

        // Do we have remaining requests?
        for (path_chunk, _) in delete_requests_it {
            unattempted.extend(path_chunk.iter().copied().map(PathBuf::from));
        }

        Err(BulkDeleteError {
            error,
            successes,
            failures,
            unattempted,
        })
    }
}

async fn download_all(byte_stream: ByteStream, output: &mut Vec<u8>) -> io::Result<()> {
    output.clear();
    let mut body_stream_reader = BufReader::new(byte_stream.into_async_read());
    let num_bytes_copied = tokio::io::copy_buf(&mut body_stream_reader, output).await?;
    STORAGE_METRICS
        .object_storage_download_num_bytes
        .inc_by(num_bytes_copied);
    // When calling `get_all`, the Vec capacity is not properly set.
    output.shrink_to_fit();
    Ok(())
}

#[async_trait]
impl Storage for S3CompatibleObjectStorage {
    async fn check_connectivity(&self) -> anyhow::Result<()> {
        // we ignore error as we never close the semaphore
        let _permit = REQUEST_SEMAPHORE.acquire().await;
        self.s3_client
            .list_objects_v2()
            .bucket(self.bucket.clone())
            .max_keys(1)
            .send()
            .await?;
        Ok(())
    }

    async fn put(
        &self,
        path: &Path,
        payload: Box<dyn crate::PutPayload>,
    ) -> crate::StorageResult<()> {
        crate::STORAGE_METRICS.object_storage_put_total.inc();
        let _permit = REQUEST_SEMAPHORE.acquire().await;
        let key = self.key(path);
        let total_len = payload.len();
        let part_num_bytes = self.multipart_policy.part_num_bytes(total_len);
        if self.disable_multipart_upload || part_num_bytes >= total_len {
            self.put_single_part(&key, payload, total_len).await?;
        } else {
            self.put_multipart(&key, payload, part_num_bytes, total_len)
                .await?;
        }
        Ok(())
    }

    async fn copy_to(&self, path: &Path, output: &mut dyn SendableAsync) -> StorageResult<()> {
        let _permit = REQUEST_SEMAPHORE.acquire().await;
        let get_object_output =
            aws_retry(&self.retry_params, || self.get_object(path, None)).await?;
        let mut body_read = BufReader::new(get_object_output.body.into_async_read());
        let num_bytes_copied = tokio::io::copy_buf(&mut body_read, output).await?;
        STORAGE_METRICS
            .object_storage_download_num_bytes
            .inc_by(num_bytes_copied);
        output.flush().await?;
        Ok(())
    }

    async fn delete(&self, path: &Path) -> StorageResult<()> {
        let _permit = REQUEST_SEMAPHORE.acquire().await;
        let bucket = self.bucket.clone();
        let key = self.key(path);
        let delete_res = aws_retry(&self.retry_params, || async {
            crate::STORAGE_METRICS
                .object_storage_delete_requests_total
                .inc();
            let _timer = crate::STORAGE_METRICS
                .object_storage_delete_request_duration
                .start_timer();
            self.s3_client
                .delete_object()
                .bucket(&bucket)
                .key(&key)
                .send()
                .await
        })
        .await;

        match delete_res {
            Ok(_) => Ok(()),
            Err(error) if error.code() == Some("NoSuchKey") => Ok(()),
            Err(error) => Err(error.into()),
        }
    }

    async fn bulk_delete<'a>(&self, paths: &[&'a Path]) -> Result<(), BulkDeleteError> {
        if self.disable_multi_object_delete {
            self.bulk_delete_single(paths).await
        } else {
            self.bulk_delete_multi(paths).await
        }
    }

    #[instrument(level = "debug", skip(self, range), fields(range.start = range.start, range.end = range.end))]
    async fn get_slice(&self, path: &Path, range: Range<usize>) -> StorageResult<OwnedBytes> {
        let _permit = REQUEST_SEMAPHORE.acquire().await;
        self.get_to_vec(path, Some(range.clone()))
            .await
            .map(OwnedBytes::new)
            .map_err(|err| {
                err.add_context(format!(
                    "failed to fetch slice {:?} for object: {}/{}",
                    range,
                    self.uri,
                    path.display(),
                ))
            })
    }

    #[instrument(level = "debug", skip(self, range), fields(range.start = range.start, range.end = range.end))]
    async fn get_slice_stream(
        &self,
        path: &Path,
        range: Range<usize>,
    ) -> crate::StorageResult<Box<dyn AsyncRead + Send + Unpin>> {
        let permit = REQUEST_SEMAPHORE.acquire().await;
        let get_object_output = aws_retry(&self.retry_params, || {
            self.get_object(path, Some(range.clone()))
        })
        .await?;
        Ok(Box::new(S3AsyncRead {
            read: get_object_output.body.into_async_read(),
            _permit: permit,
        }))
    }

    #[instrument(level = "debug", skip(self), fields(num_bytes_fetched))]
    async fn get_all(&self, path: &Path) -> StorageResult<OwnedBytes> {
        let _permit = REQUEST_SEMAPHORE.acquire().await;
        let bytes = self
            .get_to_vec(path, None)
            .await
            .map(OwnedBytes::new)
            .map_err(|err| {
                err.add_context(format!(
                    "failed to fetch object: {}/{}",
                    self.uri,
                    path.display()
                ))
            })?;
        tracing::Span::current().record("num_bytes_fetched", bytes.len());
        Ok(bytes)
    }

    async fn file_num_bytes(&self, path: &Path) -> StorageResult<u64> {
        let _permit = REQUEST_SEMAPHORE.acquire().await;
        let bucket = self.bucket.clone();
        let key = self.key(path);
        let head_object_output = aws_retry(&self.retry_params, || async {
            self.s3_client
                .head_object()
                .bucket(&bucket)
                .key(&key)
                .send()
                .await
        })
        .await?;

        Ok(head_object_output.content_length().unwrap_or(0) as u64)
    }

    fn uri(&self) -> &Uri {
        &self.uri
    }
}

#[cfg(test)]
mod tests {

    use std::path::PathBuf;

    use aws_sdk_s3::config::{Credentials, Region};
    use aws_sdk_s3::primitives::SdkBody;
    use aws_smithy_runtime::client::http::test_util::{ReplayEvent, StaticReplayClient};
    use hyper::http;
    use quickwit_aws::aws_behavior_version;
    use quickwit_common::chunk_range;
    use quickwit_common::uri::Uri;

    use super::*;
    use crate::{MultiPartPolicy, S3CompatibleObjectStorage};

    #[tokio::test]
    async fn test_md5_calc() -> std::io::Result<()> {
        let data = (0..1_500_000).map(|el| el as u8).collect::<Vec<_>>();
        let md5 = compute_md5(data.as_slice()).await?;
        assert_eq!(md5, md5::compute(data));

        Ok(())
    }

    #[test]
    fn test_split_range_into_chunks_inexact() {
        assert_eq!(
            chunk_range(0..11, 3).collect::<Vec<_>>(),
            vec![0..3, 3..6, 6..9, 9..11]
        );
    }
    #[test]
    fn test_split_range_into_chunks_exact() {
        assert_eq!(
            chunk_range(0..9, 3).collect::<Vec<_>>(),
            vec![0..3, 3..6, 6..9]
        );
    }

    #[test]
    fn test_split_range_empty() {
        assert!(chunk_range(0..0, 1).collect::<Vec<_>>().is_empty());
    }

    #[test]
    fn test_parse_uri() {
        assert_eq!(
            parse_s3_uri(&Uri::for_test("s3://bucket/path/to/object")),
            Some(("bucket".to_string(), PathBuf::from("path/to/object")))
        );
        assert_eq!(
            parse_s3_uri(&Uri::for_test("s3://bucket/path")),
            Some(("bucket".to_string(), PathBuf::from("path")))
        );
        assert_eq!(
            parse_s3_uri(&Uri::for_test("s3://bucket/path/to/object")),
            Some(("bucket".to_string(), PathBuf::from("path/to/object")))
        );
        assert_eq!(
            parse_s3_uri(&Uri::for_test("s3://bucket/")),
            Some(("bucket".to_string(), PathBuf::from("")))
        );
        assert_eq!(
            parse_s3_uri(&Uri::for_test("s3://bucket")),
            Some(("bucket".to_string(), PathBuf::from("")))
        );
        assert_eq!(parse_s3_uri(&Uri::for_test("ram://path/to/file")), None);
    }

    #[tokio::test]
    async fn test_s3_compatible_storage_relative_path() {
        let sdk_config = aws_config::defaults(aws_behavior_version()).load().await;
        let s3_client = S3Client::new(&sdk_config);
        let uri = Uri::for_test("s3://bucket/indexes");
        let bucket = "bucket".to_string();
        let prefix = PathBuf::new();

        let mut s3_storage = S3CompatibleObjectStorage {
            s3_client,
            uri,
            bucket,
            prefix,
            multipart_policy: MultiPartPolicy::default(),
            retry_params: RetryParams::for_test(),
            disable_multi_object_delete: false,
            disable_multipart_upload: false,
        };
        assert_eq!(
            s3_storage.relative_path("indexes/foo"),
            PathBuf::from("indexes/foo")
        );

        s3_storage.prefix = PathBuf::from("indexes");

        assert_eq!(
            s3_storage.relative_path("indexes/foo"),
            PathBuf::from("foo")
        );
    }

    #[tokio::test]
    async fn test_s3_compatible_storage_bulk_delete_single() {
        let client = StaticReplayClient::new(vec![
            ReplayEvent::new(
                http::Request::builder().body(SdkBody::empty()).unwrap(),
                http::Response::builder().body(SdkBody::empty()).unwrap(),
            ),
            ReplayEvent::new(
                http::Request::builder().body(SdkBody::empty()).unwrap(),
                http::Response::builder().body(SdkBody::empty()).unwrap(),
            ),
        ]);
        let credentials = Credentials::new("mock_key", "mock_secret", None, None, "mock_provider");
        let config = aws_sdk_s3::Config::builder()
            .behavior_version(aws_behavior_version())
            .region(Some(Region::new("Foo")))
            .http_client(client.clone())
            .credentials_provider(credentials)
            .build();
        let s3_client = S3Client::from_conf(config);
        let uri = Uri::for_test("s3://bucket/indexes");
        let bucket = "bucket".to_string();
        let prefix = PathBuf::new();

        let s3_storage = S3CompatibleObjectStorage {
            s3_client,
            uri,
            bucket,
            prefix,
            multipart_policy: MultiPartPolicy::default(),
            retry_params: RetryParams::for_test(),
            disable_multi_object_delete: true,
            disable_multipart_upload: false,
        };
        let _ = s3_storage
            .bulk_delete(&[Path::new("foo"), Path::new("bar")])
            .await;

        let requests = client.actual_requests().collect::<Vec<_>>();
        assert_eq!(requests.len(), 2);
        assert!(requests[0].uri().to_string().ends_with("DeleteObject"));
    }

    #[tokio::test]
    async fn test_s3_compatible_storage_bulk_delete_multi() {
        let client = StaticReplayClient::new(vec![ReplayEvent::new(
            http::Request::builder().body(SdkBody::empty()).unwrap(),
            http::Response::builder().body(SdkBody::empty()).unwrap(),
        )]);
        let credentials = Credentials::new("mock_key", "mock_secret", None, None, "mock_provider");
        let config = aws_sdk_s3::Config::builder()
            .behavior_version(aws_behavior_version())
            .region(Some(Region::new("Foo")))
            .http_client(client.clone())
            .credentials_provider(credentials)
            .build();
        let s3_client = S3Client::from_conf(config);
        let uri = Uri::for_test("s3://bucket/indexes");
        let bucket = "bucket".to_string();
        let prefix = PathBuf::new();

        let s3_storage = S3CompatibleObjectStorage {
            s3_client,
            uri,
            bucket,
            prefix,
            multipart_policy: MultiPartPolicy::default(),
            retry_params: RetryParams::for_test(),
            disable_multi_object_delete: false,
            disable_multipart_upload: false,
        };
        let _ = s3_storage
            .bulk_delete(&[Path::new("foo"), Path::new("bar")])
            .await;

        let requests = client.actual_requests().collect::<Vec<_>>();
        assert_eq!(requests.len(), 1);
        assert!(requests[0].uri().to_string().ends_with("delete"));
    }

    #[tokio::test]
    async fn test_s3_compatible_storage_bulk_delete_multi_errors() {
        let client = StaticReplayClient::new(vec![
            ReplayEvent::new(
                // This is quite fragile, currently this is *not* validated by the SDK
                // but may in future, that being said, there is no way to know what the
                // request should look like until it raises an error in reality as this
                // is up to how the validation is implemented.
                http::Request::builder().body(SdkBody::empty()).unwrap(),
                http::Response::builder()
                    .status(200)
                    .body(SdkBody::from(
                        r#"<?xml version="1.0" encoding="UTF-8"?>
                        <DeleteResult xmlns="http://s3.amazonaws.com/doc/2006-03-01/">
                            <Deleted>
                                <Key>foo</Key>
                            </Deleted>
                            <Error>
                                <Key>bar</Key>
                                <Code>NoSuchKey</Code>
                                <Message>The specified key does not exist</Message>
                            </Error>
                            <Error>
                                <Key>baz</Key>
                                <Code>AccessDenied</Code>
                                <Message>Access Denied</Message>
                            </Error>
                        </DeleteResult>"#
                    ))
                    .unwrap()
            ),
            ReplayEvent::new(
                // This is quite fragile, currently this is *not* validated by the SDK
                // but may in future, that being said, there is no way to know what the
                // request should look like until it raises an error in reality as this
                // is up to how the validation is implemented.
                http::Request::builder().body(SdkBody::empty()).unwrap(),
                http::Response::builder()
                    .status(400)
                    .body(SdkBody::from(
                        r#"<?xml version="1.0" encoding="UTF-8"?>
                        <Error>
                            <Code>MalformedXML</Code>
                            <Message>The XML you provided was not well-formed or did not validate against our published schema.</Message>
                            <RequestId>264A17BF16E9E80A</RequestId>
                            <HostId>P3xqrhuhYxlrefdw3rEzmJh8z5KDtGzb+/FB7oiQaScI9Yaxd8olYXc7d1111ab+</HostId>
                        </Error>"#
                    ))
                    .unwrap()
            ),
        ]);
        let credentials = Credentials::new("mock_key", "mock_secret", None, None, "mock_provider");
        let config = aws_sdk_s3::Config::builder()
            .behavior_version(aws_behavior_version())
            .region(Some(Region::new("Foo")))
            .http_client(client)
            .credentials_provider(credentials)
            .build();
        let s3_client = S3Client::from_conf(config);
        let uri = Uri::for_test("s3://bucket/indexes");
        let bucket = "bucket".to_string();
        let prefix = PathBuf::new();

        let s3_storage = S3CompatibleObjectStorage {
            s3_client,
            uri,
            bucket,
            prefix,
            multipart_policy: MultiPartPolicy::default(),
            retry_params: RetryParams::for_test(),
            disable_multi_object_delete: false,
            disable_multipart_upload: false,
        };
        let bulk_delete_error = s3_storage
            .bulk_delete(&[
                Path::new("foo"),
                Path::new("bar"),
                Path::new("baz"),
                Path::new("foobar"),
                Path::new("foobaz"),
                Path::new("barfoo"),
                Path::new("barbaz"),
            ])
            .await
            .unwrap_err();

        assert_eq!(
            bulk_delete_error.successes,
            [PathBuf::from("foo"), PathBuf::from("bar")]
        );
        let failure = bulk_delete_error.failures.get(Path::new("baz")).unwrap();
        assert_eq!(failure.code.as_ref().unwrap(), "AccessDenied");
        assert_eq!(failure.message.as_ref().unwrap(), "Access Denied");
        assert!(failure.error.is_none());

        assert_eq!(
            bulk_delete_error.unattempted,
            [
                PathBuf::from("foobar"),
                PathBuf::from("foobaz"),
                PathBuf::from("barfoo"),
                PathBuf::from("barbaz")
            ]
        );
        let delete_objects_error = bulk_delete_error.error.unwrap();
        assert!(delete_objects_error.to_string().contains("MalformedXML"));
    }

    #[tokio::test]
    async fn test_s3_compatible_storage_retry_put() {
        let client = StaticReplayClient::new(vec![
            ReplayEvent::new(
                // This is quite fragile, currently this is *not* validated by the SDK
                // but may in future, that being said, there is no way to know what the
                // request should look like until it raises an error in reality as this
                // is up to how the validation is implemented.
                http::Request::builder().body(SdkBody::empty()).unwrap(),
                http::Response::builder()
                    .status(429)
                    .body(SdkBody::from(
                        r#"<?xml version="1.0" encoding="UTF-8"?>
                        <Error>
                          <Code>SlowDown</Code>
                          <Message>message</Message>
                          <Resource>/my-path</Resource>
                          <RequestId>4442587FB7D0A2F9</RequestId>
                        </Error>"#,
                    ))
                    .unwrap(),
            ),
            ReplayEvent::new(
                // This is quite fragile, currently this is *not* validated by the SDK
                // but may in future, that being said, there is no way to know what the
                // request should look like until it raises an error in reality as this
                // is up to how the validation is implemented.
                http::Request::builder().body(SdkBody::empty()).unwrap(),
                http::Response::builder()
                    .status(200)
                    .body(SdkBody::empty())
                    .unwrap(),
            ),
        ]);
        let credentials = Credentials::new("mock_key", "mock_secret", None, None, "mock_provider");
        let config = aws_sdk_s3::Config::builder()
            .behavior_version(aws_behavior_version())
            .region(Some(Region::new("Foo")))
            .http_client(client)
            .credentials_provider(credentials)
            .build();
        let s3_client = S3Client::from_conf(config);
        let uri = Uri::for_test("s3://bucket/indexes");
        let bucket = "bucket".to_string();
        let prefix = PathBuf::new();

        let s3_storage = S3CompatibleObjectStorage {
            s3_client,
            uri,
            bucket,
            prefix,
            multipart_policy: MultiPartPolicy::default(),
            retry_params: RetryParams::for_test(),
            disable_multi_object_delete: false,
            disable_multipart_upload: false,
        };
        s3_storage
            .put(Path::new("my-path"), Box::new(vec![1, 2, 3]))
            .await
            .unwrap();
    }
}


================================================
FILE: quickwit/quickwit-storage/src/object_storage/s3_compatible_storage_resolver.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::sync::Arc;

use async_trait::async_trait;
use aws_sdk_s3::Client as S3Client;
use quickwit_common::uri::Uri;
use quickwit_config::{S3StorageConfig, StorageBackend};
use tokio::sync::OnceCell;

use super::s3_compatible_storage::create_s3_client;
use crate::{
    DebouncedStorage, S3CompatibleObjectStorage, Storage, StorageFactory, StorageResolverError,
};

/// S3 compatible object storage resolver.
pub struct S3CompatibleObjectStorageFactory {
    storage_config: S3StorageConfig,
    // we cache the S3Client so we don't rebuild one every time we build a new Storage (for
    // every search query).
    // We don't build it in advance because we don't know if this factory is one that will
    // end up being used, or if something like azure, gcs, or even local files, will be used
    // instead.
    s3_client: OnceCell<S3Client>,
}

impl S3CompatibleObjectStorageFactory {
    /// Creates a new S3-compatible storage factory.
    pub fn new(storage_config: S3StorageConfig) -> Self {
        Self {
            storage_config,
            s3_client: OnceCell::new(),
        }
    }
}

#[async_trait]
impl StorageFactory for S3CompatibleObjectStorageFactory {
    fn backend(&self) -> StorageBackend {
        StorageBackend::S3
    }

    async fn resolve(&self, uri: &Uri) -> Result<Arc<dyn Storage>, StorageResolverError> {
        let s3_client = self
            .s3_client
            .get_or_init(|| create_s3_client(&self.storage_config))
            .await
            .clone();
        let storage =
            S3CompatibleObjectStorage::from_uri_and_client(&self.storage_config, uri, s3_client)
                .await?;
        Ok(Arc::new(DebouncedStorage::new(storage)))
    }
}


================================================
FILE: quickwit/quickwit-storage/src/opendal_storage/base.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::fmt;
use std::ops::Range;
use std::path::Path;

use async_trait::async_trait;
use futures::AsyncWriteExt as FuturesAsyncWriteExt;
use opendal::{DeleteInput, IntoDeleteInput, Operator};
use quickwit_common::uri::Uri;
use tokio::io::{AsyncRead, AsyncWriteExt as TokioAsyncWriteExt};
use tokio_util::compat::{FuturesAsyncReadCompatExt, FuturesAsyncWriteCompatExt};

use crate::metrics::object_storage_get_slice_in_flight_guards;
use crate::storage::SendableAsync;
use crate::{
    BulkDeleteError, MultiPartPolicy, OwnedBytes, PutPayload, Storage, StorageError,
    StorageErrorKind, StorageResolverError, StorageResult,
};

/// OpenDAL based storage implementation.
/// # TODO
///
/// - Implement REQUEST_SEMAPHORE to control the concurrency.
/// - Implement STORAGE_METRICS for metrics.
pub struct OpendalStorage {
    uri: Uri,
    op: Operator,
    multipart_policy: MultiPartPolicy,
}

impl fmt::Debug for OpendalStorage {
    fn fmt(&self, formatter: &mut fmt::Formatter) -> fmt::Result {
        formatter
            .debug_struct("OpendalStorage")
            .field("operator", &self.op.info())
            .finish()
    }
}

impl OpendalStorage {
    /// Create a new google cloud storage.
    pub fn new_google_cloud_storage(
        uri: Uri,
        cfg: opendal::services::Gcs,
    ) -> Result<Self, StorageResolverError> {
        let op = Operator::new(cfg)?.finish();
        Ok(Self {
            uri,
            op,
            // limits are the same as on S3
            multipart_policy: MultiPartPolicy::default(),
        })
    }

    #[cfg(feature = "integration-testsuite")]
    pub fn set_policy(&mut self, multipart_policy: MultiPartPolicy) {
        self.multipart_policy = multipart_policy;
    }
}

#[async_trait]
impl Storage for OpendalStorage {
    async fn check_connectivity(&self) -> anyhow::Result<()> {
        self.op.check().await?;
        Ok(())
    }

    async fn put(&self, path: &Path, payload: Box<dyn PutPayload>) -> StorageResult<()> {
        crate::STORAGE_METRICS.object_storage_put_total.inc();
        let path = path.as_os_str().to_string_lossy();
        let mut payload_reader = payload.byte_stream().await?.into_async_read();

        let mut storage_writer = self
            .op
            .writer_with(&path)
            .chunk(self.multipart_policy.part_num_bytes(payload.len()) as usize)
            .await?
            .into_futures_async_write()
            .compat_write();
        tokio::io::copy(&mut payload_reader, &mut storage_writer).await?;
        storage_writer.get_mut().close().await?;
        crate::STORAGE_METRICS
            .object_storage_upload_num_bytes
            .inc_by(payload.len());
        Ok(())
    }

    async fn copy_to(&self, path: &Path, output: &mut dyn SendableAsync) -> StorageResult<()> {
        let path = path.as_os_str().to_string_lossy();
        let mut storage_reader = self
            .op
            .reader(&path)
            .await?
            .into_futures_async_read(..)
            .await?
            .compat();
        let num_bytes_copied = tokio::io::copy(&mut storage_reader, output).await?;
        crate::STORAGE_METRICS
            .object_storage_download_num_bytes
            .inc_by(num_bytes_copied);
        output.flush().await?;
        Ok(())
    }

    async fn get_slice(&self, path: &Path, range: Range<usize>) -> StorageResult<OwnedBytes> {
        let path = path.as_os_str().to_string_lossy();
        let size = range.len();
        let range = range.start as u64..range.end as u64;
        // Unlike other object store implementations, in flight requests are
        // recorded before issuing the query to the object store.
        let _inflight_guards = object_storage_get_slice_in_flight_guards(size);
        crate::STORAGE_METRICS.object_storage_get_total.inc();
        let storage_content = self.op.read_with(&path).range(range).await?.to_vec();
        Ok(OwnedBytes::new(storage_content))
    }

    async fn get_slice_stream(
        &self,
        path: &Path,
        range: Range<usize>,
    ) -> StorageResult<Box<dyn AsyncRead + Send + Unpin>> {
        let path = path.as_os_str().to_string_lossy();
        let range = range.start as u64..range.end as u64;
        let storage_reader = self
            .op
            .reader_with(&path)
            .await?
            .into_futures_async_read(range)
            .await?
            .compat();
        Ok(Box::new(storage_reader))
    }

    async fn get_all(&self, path: &Path) -> StorageResult<OwnedBytes> {
        let path = path.as_os_str().to_string_lossy();
        let storage_content = self.op.read(&path).await?.to_vec();
        Ok(OwnedBytes::new(storage_content))
    }

    async fn delete(&self, path: &Path) -> StorageResult<()> {
        let path = path.as_os_str().to_string_lossy();
        crate::STORAGE_METRICS
            .object_storage_delete_requests_total
            .inc();
        let _timer = crate::STORAGE_METRICS
            .object_storage_delete_request_duration
            .start_timer();
        self.op.delete(&path).await?;
        Ok(())
    }

    async fn bulk_delete<'a>(&self, paths: &[&'a Path]) -> Result<(), BulkDeleteError> {
        // The mock service we used in integration testsuite doesn't support bulk delete.
        // Let's fallback to delete one by one in this case.
        #[cfg(feature = "integration-testsuite")]
        {
            let storage_info = self.op.info();
            if storage_info.name().starts_with("sample-bucket") && storage_info.scheme() == "gcs" {
                let mut bulk_error = BulkDeleteError::default();
                for (index, path) in paths.iter().enumerate() {
                    crate::STORAGE_METRICS
                        .object_storage_bulk_delete_requests_total
                        .inc();
                    let _timer = crate::STORAGE_METRICS
                        .object_storage_bulk_delete_request_duration
                        .start_timer();
                    let result = self.op.delete(&path.as_os_str().to_string_lossy()).await;
                    if let Err(err) = result {
                        let storage_error_kind = err.kind();
                        let storage_error: StorageError = err.into();
                        bulk_error.failures.insert(
                            path.to_path_buf(),
                            crate::DeleteFailure {
                                code: Some(storage_error_kind.to_string()),
                                message: Some(storage_error.to_string()),
                                error: Some(storage_error.clone()),
                            },
                        );
                        bulk_error.error = Some(storage_error);
                        for path in paths[index..].iter() {
                            bulk_error.unattempted.push(path.to_path_buf())
                        }
                        break;
                    } else {
                        bulk_error.successes.push(path.to_path_buf())
                    }
                }

                return if bulk_error.error.is_some() {
                    Err(bulk_error)
                } else {
                    Ok(())
                };
            }
        }
        let delete_inputs: Vec<DeleteInput> = paths
            .iter()
            .map(|path| path.as_os_str().to_string_lossy().into_delete_input())
            .collect();

        self.op
            .delete_iter(delete_inputs)
            .await
            .map_err(|error| BulkDeleteError {
                error: Some(error.into()),
                ..Default::default()
            })?;
        Ok(())
    }

    async fn file_num_bytes(&self, path: &Path) -> StorageResult<u64> {
        let path = path.as_os_str().to_string_lossy();
        let meta = self.op.stat(&path).await?;
        Ok(meta.content_length())
    }

    fn uri(&self) -> &Uri {
        &self.uri
    }
}

impl From<opendal::Error> for StorageError {
    fn from(err: opendal::Error) -> Self {
        match err.kind() {
            opendal::ErrorKind::NotFound => StorageErrorKind::NotFound.with_error(err),
            opendal::ErrorKind::PermissionDenied => StorageErrorKind::Unauthorized.with_error(err),
            opendal::ErrorKind::ConfigInvalid => StorageErrorKind::Service.with_error(err),
            _ => StorageErrorKind::Io.with_error(err),
        }
    }
}

impl From<opendal::Error> for StorageResolverError {
    fn from(err: opendal::Error) -> Self {
        StorageResolverError::InvalidConfig(err.to_string())
    }
}


================================================
FILE: quickwit/quickwit-storage/src/opendal_storage/google_cloud_storage.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::path::PathBuf;
use std::sync::Arc;

use async_trait::async_trait;
use once_cell::sync::OnceCell;
use quickwit_common::uri::Uri;
use quickwit_config::{GoogleCloudStorageConfig, StorageBackend};
use regex::Regex;
use tracing::info;

use super::OpendalStorage;
use crate::debouncer::DebouncedStorage;
use crate::{Storage, StorageFactory, StorageResolverError};

/// Google cloud storage resolver.
pub struct GoogleCloudStorageFactory {
    storage_config: GoogleCloudStorageConfig,
}

impl GoogleCloudStorageFactory {
    /// Create a new google cloud storage factory via config.
    pub fn new(storage_config: GoogleCloudStorageConfig) -> Self {
        Self { storage_config }
    }
}

#[async_trait]
impl StorageFactory for GoogleCloudStorageFactory {
    fn backend(&self) -> StorageBackend {
        StorageBackend::Google
    }

    async fn resolve(&self, uri: &Uri) -> Result<Arc<dyn Storage>, StorageResolverError> {
        let storage = from_uri(&self.storage_config, uri)?;
        Ok(Arc::new(DebouncedStorage::new(storage)))
    }
}

/// Helpers to configure the GCP local test setup.
#[cfg(feature = "integration-testsuite")]
pub mod test_config_helpers {
    use super::*;

    /// URL of the local GCP emulator.
    pub const LOCAL_GCP_EMULATOR_ENDPOINT: &str = "http://127.0.0.1:4443";
    /// Creates a storage connecting to a local emulated google cloud storage.
    pub fn new_emulated_google_cloud_storage(
        uri: &Uri,
    ) -> Result<OpendalStorage, StorageResolverError> {
        let (bucket, root) = parse_google_uri(uri).expect("must be valid google uri");

        let cfg = opendal::services::Gcs::default()
            .bucket(&bucket)
            .root(&root.to_string_lossy())
            .endpoint(LOCAL_GCP_EMULATOR_ENDPOINT)
            .allow_anonymous() // Disable authentication for fake GCS server
            .disable_vm_metadata(); // Disable GCE metadata server requests
        let store = OpendalStorage::new_google_cloud_storage(uri.clone(), cfg)?;
        Ok(store)
    }
}

fn from_uri(
    google_cloud_storage_config: &GoogleCloudStorageConfig,
    uri: &Uri,
) -> Result<OpendalStorage, StorageResolverError> {
    let (bucket_name, prefix) = parse_google_uri(uri).ok_or_else(|| {
        let message = format!("failed to extract bucket name from google URI: {uri}");
        StorageResolverError::InvalidUri(message)
    })?;

    let mut cfg = opendal::services::Gcs::default()
        .bucket(&bucket_name)
        .root(&prefix.to_string_lossy());

    if let Some(credential_path) = google_cloud_storage_config.resolve_credential_path() {
        info!(path=%credential_path, "fetching google cloud storage credentials from path");
        cfg = cfg.credential_path(&credential_path);
    }
    let store = OpendalStorage::new_google_cloud_storage(uri.clone(), cfg)?;
    Ok(store)
}

fn parse_google_uri(uri: &Uri) -> Option<(String, PathBuf)> {
    // Ex: gs://bucket/prefix.
    static URI_PTN: OnceCell<Regex> = OnceCell::new();

    let captures = URI_PTN
        .get_or_init(|| {
            Regex::new(r"gs(\+[^:]+)?://(?P<bucket>[^/]+)(/(?P<prefix>.*))?$")
                .expect("The regular expression should compile.")
        })
        .captures(uri.as_str())?;

    let bucket = captures.name("bucket")?.as_str().to_string();
    let prefix = captures
        .name("prefix")
        .map(|prefix_match| PathBuf::from(prefix_match.as_str()))
        .unwrap_or_default();
    Some((bucket, prefix))
}

#[cfg(test)]
mod tests {
    use quickwit_common::uri::Uri;

    use super::parse_google_uri;

    #[test]
    fn test_parse_google_uri() {
        assert!(parse_google_uri(&Uri::for_test("gs://")).is_none());

        let (bucket, prefix) = parse_google_uri(&Uri::for_test("gs://test-bucket")).unwrap();
        assert_eq!(bucket, "test-bucket");
        assert!(prefix.to_str().unwrap().is_empty());

        let (bucket, prefix) = parse_google_uri(&Uri::for_test("gs://test-bucket/")).unwrap();
        assert_eq!(bucket, "test-bucket");
        assert!(prefix.to_str().unwrap().is_empty());

        let (bucket, prefix) =
            parse_google_uri(&Uri::for_test("gs://test-bucket/indexes")).unwrap();
        assert_eq!(bucket, "test-bucket");
        assert_eq!(prefix.to_str().unwrap(), "indexes");
    }
}


================================================
FILE: quickwit/quickwit-storage/src/opendal_storage/mod.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

mod base;
use base::OpendalStorage;

mod google_cloud_storage;

pub use google_cloud_storage::GoogleCloudStorageFactory;
#[cfg(feature = "integration-testsuite")]
pub use google_cloud_storage::test_config_helpers;


================================================
FILE: quickwit/quickwit-storage/src/payload.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::io;
use std::ops::Range;

use async_trait::async_trait;
use aws_sdk_s3::primitives::ByteStream;
use tantivy::directory::OwnedBytes;

#[async_trait]
/// PutPayload is used to upload data and support multipart.
pub trait PutPayload: PutPayloadClone + Send + Sync {
    /// Return the total length of the payload.
    fn len(&self) -> u64;

    /// Retrieve bytestream for specified range.
    async fn range_byte_stream(&self, range: Range<u64>) -> io::Result<ByteStream>;

    /// Retrieve complete bytestream.
    async fn byte_stream(&self) -> io::Result<ByteStream> {
        let total_len = self.len();
        let range = 0..total_len;
        self.range_byte_stream(range).await
    }

    /// Load the whole Payload into memory.
    async fn read_all(&self) -> io::Result<OwnedBytes> {
        let total_len = self.len();
        let range = 0..total_len;
        let mut reader = self.range_byte_stream(range).await?.into_async_read();

        let mut data: Vec<u8> = Vec::with_capacity(total_len as usize);
        tokio::io::copy(&mut reader, &mut data).await?;

        Ok(OwnedBytes::new(data))
    }
}

pub trait PutPayloadClone {
    fn box_clone(&self) -> Box<dyn PutPayload>;
}

impl<T> PutPayloadClone for T
where T: 'static + PutPayload + Clone
{
    fn box_clone(&self) -> Box<dyn PutPayload> {
        Box::new(self.clone())
    }
}

impl Clone for Box<dyn PutPayload> {
    fn clone(&self) -> Box<dyn PutPayload> {
        self.box_clone()
    }
}

#[async_trait]
impl PutPayload for Vec<u8> {
    fn len(&self) -> u64 {
        self.len() as u64
    }

    async fn range_byte_stream(&self, range: Range<u64>) -> io::Result<ByteStream> {
        Ok(ByteStream::from(
            self[range.start as usize..range.end as usize].to_vec(),
        ))
    }
}


================================================
FILE: quickwit/quickwit-storage/src/prefix_storage.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::fmt;
use std::ops::Range;
use std::path::{Path, PathBuf};
use std::sync::Arc;

use async_trait::async_trait;
use quickwit_common::uri::Uri;
use tokio::io::AsyncRead;

use crate::storage::SendableAsync;
use crate::{BulkDeleteError, OwnedBytes, Storage};

/// This storage acts as a proxy to another storage that simply modifies each API call
/// by preceding each path with a given a prefix.
struct PrefixStorage {
    pub storage: Arc<dyn Storage>,
    pub prefix: PathBuf,
    uri: Uri,
}

impl fmt::Debug for PrefixStorage {
    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
        f.debug_struct("PrefixStorage")
            .field("uri", &self.uri)
            .field("prefix", &self.prefix)
            .finish()
    }
}

#[async_trait]
impl Storage for PrefixStorage {
    async fn check_connectivity(&self) -> anyhow::Result<()> {
        self.storage.check_connectivity().await
    }

    async fn put(
        &self,
        path: &Path,
        payload: Box<dyn crate::PutPayload>,
    ) -> crate::StorageResult<()> {
        self.storage.put(&self.prefix.join(path), payload).await
    }

    async fn copy_to(
        &self,
        path: &Path,
        output: &mut dyn SendableAsync,
    ) -> crate::StorageResult<()> {
        self.storage.copy_to(&self.prefix.join(path), output).await
    }

    async fn get_slice(
        &self,
        path: &Path,
        range: Range<usize>,
    ) -> crate::StorageResult<OwnedBytes> {
        self.storage.get_slice(&self.prefix.join(path), range).await
    }

    async fn get_all(&self, path: &Path) -> crate::StorageResult<OwnedBytes> {
        self.storage.get_all(&self.prefix.join(path)).await
    }

    async fn get_slice_stream(
        &self,
        path: &Path,
        range: Range<usize>,
    ) -> crate::StorageResult<Box<dyn AsyncRead + Send + Unpin>> {
        self.storage
            .get_slice_stream(&self.prefix.join(path), range)
            .await
    }

    async fn delete(&self, path: &Path) -> crate::StorageResult<()> {
        self.storage.delete(&self.prefix.join(path)).await
    }

    async fn bulk_delete<'a>(&self, paths: &[&'a Path]) -> Result<(), BulkDeleteError> {
        let prefixed_pathbufs: Vec<PathBuf> =
            paths.iter().map(|path| self.prefix.join(path)).collect();
        let prefixed_paths: Vec<&Path> = prefixed_pathbufs
            .iter()
            .map(|pathbuf| pathbuf.as_path())
            .collect();
        self.storage
            .bulk_delete(&prefixed_paths)
            .await
            .map_err(|error| strip_prefix_from_error(error, &self.prefix))?;
        Ok(())
    }

    async fn exists(&self, path: &Path) -> crate::StorageResult<bool> {
        self.storage.exists(&self.prefix.join(path)).await
    }

    fn uri(&self) -> &Uri {
        &self.uri
    }

    async fn file_num_bytes(&self, path: &Path) -> crate::StorageResult<u64> {
        self.storage.file_num_bytes(&self.prefix.join(path)).await
    }
}

/// Creates a [`PrefixStorage`] using an underlying storage and a prefix.
pub(crate) fn add_prefix_to_storage(
    storage: Arc<dyn Storage>,
    prefix: PathBuf,
    uri: Uri,
) -> Arc<dyn Storage> {
    Arc::new(PrefixStorage {
        storage,
        prefix,
        uri,
    })
}

fn strip_prefix_from_error(error: BulkDeleteError, prefix: &Path) -> BulkDeleteError {
    if prefix == Path::new("") {
        return error;
    }
    let successes = error
        .successes
        .into_iter()
        .map(|path| {
            path.strip_prefix(prefix)
                .expect(
                    "The prefix should have been prepended to the path before the bulk delete \
                     call.",
                )
                .to_path_buf()
        })
        .collect();
    let failures = error
        .failures
        .into_iter()
        .map(|(path, failure)| {
            (
                path.strip_prefix(prefix)
                    .expect(
                        "The prefix should have been prepended to the path before the bulk delete \
                         call.",
                    )
                    .to_path_buf(),
                failure,
            )
        })
        .collect();
    let unattempted = error
        .unattempted
        .into_iter()
        .map(|path| {
            path.strip_prefix(prefix)
                .expect(
                    "The prefix should have been prepended to the path before the bulk delete \
                     call.",
                )
                .to_path_buf()
        })
        .collect();
    BulkDeleteError {
        error: error.error,
        successes,
        failures,
        unattempted,
    }
}

#[cfg(test)]
mod tests {

    use std::collections::HashMap;

    use super::*;
    use crate::DeleteFailure;

    #[test]
    fn test_strip_prefix_from_error() {
        {
            let error = BulkDeleteError {
                error: None,
                successes: vec![PathBuf::from("ram:///indexes/foo")],
                unattempted: vec![PathBuf::from("ram:///indexes/bar")],
                failures: HashMap::from_iter([(
                    PathBuf::from("ram:///indexes/baz"),
                    DeleteFailure::default(),
                )]),
            };
            let stripped_error = strip_prefix_from_error(error, Path::new(""));

            assert_eq!(
                stripped_error.successes,
                vec![PathBuf::from("ram:///indexes/foo")],
            );
            assert_eq!(
                stripped_error.unattempted,
                vec![PathBuf::from("ram:///indexes/bar")],
            );
            assert_eq!(
                stripped_error.failures.keys().next().unwrap(),
                &PathBuf::from("ram:///indexes/baz"),
            );
        }
        {
            let error = BulkDeleteError {
                error: None,
                successes: vec![PathBuf::from("ram:///indexes/foo")],
                unattempted: vec![PathBuf::from("ram:///indexes/bar")],
                failures: HashMap::from_iter([(
                    PathBuf::from("ram:///indexes/baz"),
                    DeleteFailure::default(),
                )]),
            };
            let stripped_error = strip_prefix_from_error(error, Path::new("ram:///indexes"));

            assert_eq!(stripped_error.successes, vec![PathBuf::from("foo")],);
            assert_eq!(stripped_error.unattempted, vec![PathBuf::from("bar")],);
            assert_eq!(
                stripped_error.failures.keys().next().unwrap(),
                &PathBuf::from("baz"),
            );
        }
        {
            let error = BulkDeleteError {
                error: None,
                successes: vec![PathBuf::from("ram:///indexes/foo")],
                unattempted: vec![PathBuf::from("ram:///indexes/bar")],
                failures: HashMap::from_iter([(
                    PathBuf::from("ram:///indexes/baz"),
                    DeleteFailure::default(),
                )]),
            };
            let stripped_error = strip_prefix_from_error(error, Path::new("ram:///indexes/"));

            assert_eq!(stripped_error.successes, vec![PathBuf::from("foo")],);
            assert_eq!(stripped_error.unattempted, vec![PathBuf::from("bar")],);
            assert_eq!(
                stripped_error.failures.keys().next().unwrap(),
                &PathBuf::from("baz"),
            );
        }
    }
}


================================================
FILE: quickwit/quickwit-storage/src/ram_storage.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::HashMap;
use std::fmt;
use std::io::Cursor;
use std::ops::Range;
use std::path::{Path, PathBuf};
use std::sync::Arc;

use async_trait::async_trait;
use quickwit_common::uri::{Protocol, Uri};
use quickwit_config::StorageBackend;
use tokio::io::{AsyncRead, AsyncWriteExt};
use tokio::sync::RwLock;

use crate::prefix_storage::add_prefix_to_storage;
use crate::storage::SendableAsync;
use crate::{
    BulkDeleteError, OwnedBytes, Storage, StorageErrorKind, StorageFactory, StorageResolverError,
    StorageResult,
};

/// In Ram implementation of quickwit's storage.
///
/// This implementation is mostly useful in unit tests.
#[derive(Clone)]
pub struct RamStorage {
    uri: Uri,
    files: Arc<RwLock<HashMap<PathBuf, OwnedBytes>>>,
}

impl fmt::Debug for RamStorage {
    fn fmt(&self, formatter: &mut fmt::Formatter) -> fmt::Result {
        formatter
            .debug_struct("RamStorage")
            .field("uri", &self.uri)
            .finish()
    }
}

impl Default for RamStorage {
    fn default() -> Self {
        Self {
            uri: Uri::for_test("ram:///"),
            files: Arc::new(RwLock::new(HashMap::new())),
        }
    }
}

impl RamStorage {
    /// Creates a [`RamStorageBuilder`]
    pub fn builder() -> RamStorageBuilder {
        RamStorageBuilder::default()
    }

    async fn put_data(&self, path: &Path, payload: OwnedBytes) {
        self.files.write().await.insert(path.to_path_buf(), payload);
    }

    async fn get_data(&self, path: &Path) -> Option<OwnedBytes> {
        self.files.read().await.get(path).cloned()
    }

    /// Returns the list of files that are present in the RamStorage.
    pub async fn list_files(&self) -> Vec<PathBuf> {
        self.files.read().await.keys().cloned().collect()
    }
}

#[async_trait]
impl Storage for RamStorage {
    async fn check_connectivity(&self) -> anyhow::Result<()> {
        Ok(())
    }

    async fn put(
        &self,
        path: &Path,
        payload: Box<dyn crate::PutPayload>,
    ) -> crate::StorageResult<()> {
        let payload_bytes = payload.read_all().await?;
        self.put_data(path, payload_bytes).await;
        Ok(())
    }

    async fn copy_to(&self, path: &Path, output: &mut dyn SendableAsync) -> StorageResult<()> {
        let payload_bytes = self.get_data(path).await.ok_or_else(|| {
            StorageErrorKind::NotFound
                .with_error(anyhow::anyhow!("failed to find dest_path {:?}", path))
        })?;
        output.write_all(&payload_bytes).await?;
        output.flush().await?;
        Ok(())
    }

    async fn get_slice(&self, path: &Path, range: Range<usize>) -> StorageResult<OwnedBytes> {
        let payload_bytes = self.get_data(path).await.ok_or_else(|| {
            StorageErrorKind::NotFound
                .with_error(anyhow::anyhow!("failed to find dest_path {:?}", path))
        })?;
        Ok(payload_bytes.slice(range.start..range.end))
    }

    async fn get_slice_stream(
        &self,
        path: &Path,
        range: Range<usize>,
    ) -> StorageResult<Box<dyn AsyncRead + Send + Unpin>> {
        let bytes = self.get_slice(path, range).await?;
        Ok(Box::new(Cursor::new(bytes)))
    }

    async fn delete(&self, path: &Path) -> StorageResult<()> {
        self.files.write().await.remove(path);
        Ok(())
    }

    async fn bulk_delete<'a>(&self, paths: &[&'a Path]) -> Result<(), BulkDeleteError> {
        let mut files = self.files.write().await;
        for &path in paths {
            files.remove(path);
        }
        Ok(())
    }

    async fn get_all(&self, path: &Path) -> StorageResult<OwnedBytes> {
        let payload_bytes = self.get_data(path).await.ok_or_else(|| {
            StorageErrorKind::NotFound
                .with_error(anyhow::anyhow!("failed to find dest_path {:?}", path))
        })?;
        Ok(payload_bytes)
    }

    fn uri(&self) -> &Uri {
        &self.uri
    }

    async fn file_num_bytes(&self, path: &Path) -> StorageResult<u64> {
        if let Some(file_bytes) = self.files.read().await.get(path) {
            Ok(file_bytes.len() as u64)
        } else {
            let err = anyhow::anyhow!("missing file `{}`", path.display());
            Err(StorageErrorKind::NotFound.with_error(err))
        }
    }
}

/// Builder to create a prepopulated [`RamStorage`]. This is mostly useful for tests.
#[derive(Default)]
pub struct RamStorageBuilder {
    files: HashMap<PathBuf, OwnedBytes>,
}

impl RamStorageBuilder {
    /// Adds a new file into the [`RamStorageBuilder`].
    pub fn put(mut self, path: &str, payload: &[u8]) -> Self {
        self.files
            .insert(PathBuf::from(path), OwnedBytes::new(payload.to_vec()));
        self
    }

    /// Finalizes the [`RamStorage`] creation.
    pub fn build(self) -> RamStorage {
        RamStorage {
            uri: Uri::for_test("ram:///"),
            files: Arc::new(RwLock::new(self.files)),
        }
    }
}

/// Storage resolver for [`RamStorage`].
pub struct RamStorageFactory {
    ram_storage: Arc<dyn Storage>,
}

impl Default for RamStorageFactory {
    fn default() -> Self {
        RamStorageFactory {
            ram_storage: Arc::new(RamStorage::default()),
        }
    }
}

#[async_trait]
impl StorageFactory for RamStorageFactory {
    fn backend(&self) -> StorageBackend {
        StorageBackend::Ram
    }

    async fn resolve(&self, uri: &Uri) -> Result<Arc<dyn Storage>, StorageResolverError> {
        match uri.filepath() {
            Some(prefix) if uri.protocol() == Protocol::Ram => Ok(add_prefix_to_storage(
                self.ram_storage.clone(),
                prefix.to_path_buf(),
                uri.clone(),
            )),
            _ => {
                let message = format!("URI `{uri}` is not a valid RAM URI");
                Err(StorageResolverError::InvalidUri(message))
            }
        }
    }
}

#[cfg(test)]
mod tests {

    use super::*;
    use crate::test_suite::storage_test_suite;

    #[tokio::test]
    async fn test_storage() -> anyhow::Result<()> {
        let mut ram_storage = RamStorage::default();
        storage_test_suite(&mut ram_storage).await?;
        Ok(())
    }

    #[tokio::test]
    async fn test_ram_storage_factory() {
        let ram_storage_factory = RamStorageFactory::default();
        let ram_uri = Uri::for_test("s3:///foo");
        let err = ram_storage_factory.resolve(&ram_uri).await.err().unwrap();
        assert!(matches!(err, StorageResolverError::InvalidUri { .. }));

        let data_uri = Uri::for_test("ram:///data");
        let data_storage = ram_storage_factory.resolve(&data_uri).await.ok().unwrap();
        let home_uri = Uri::for_test("ram:///home");
        let home_storage = ram_storage_factory.resolve(&home_uri).await.ok().unwrap();
        assert_ne!(data_storage.uri(), home_storage.uri());

        let data_storage_two = ram_storage_factory.resolve(&data_uri).await.ok().unwrap();
        assert_eq!(data_storage.uri(), data_storage_two.uri());
    }

    #[tokio::test]
    async fn test_ram_storage_builder() -> anyhow::Result<()> {
        let storage = RamStorage::builder()
            .put("path1", b"path1_payload")
            .put("path2", b"path2_payload")
            .put("path1", b"path1_payloadb")
            .build();
        assert_eq!(
            &storage.get_all(Path::new("path1")).await?,
            &b"path1_payloadb"[..]
        );
        assert_eq!(
            &storage.get_all(Path::new("path2")).await?,
            &b"path2_payload"[..]
        );
        Ok(())
    }
}


================================================
FILE: quickwit/quickwit-storage/src/split.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::HashMap;
use std::io;
use std::ops::Range;
use std::path::{Path, PathBuf};
use std::pin::Pin;

use async_trait::async_trait;
use aws_sdk_s3::primitives::{ByteStream, FsBuilder, Length, SdkBody};
use futures::{Stream, StreamExt, stream};
use hyper::body::{Bytes, Frame};
use pin_project::pin_project;
use quickwit_common::shared_consts::SPLIT_FIELDS_FILE_NAME;

use crate::bundle_storage::BundleStorageFileOffsetsVersions;
use crate::{BundleStorageFileOffsets, PutPayload, VersionedComponent};

/// Payload of a split which builds the split bundle and hotcache on the fly and streams it to the
/// storage.
#[derive(Clone)]
pub struct SplitPayload {
    payloads: Vec<Box<dyn PutPayload>>,
    /// bytes range of the footer (hotcache + bundle metadata)
    pub footer_range: Range<u64>,
}

async fn range_byte_stream_from_payloads(
    payloads: &[Box<dyn PutPayload>],
    range: Range<u64>,
) -> io::Result<ByteStream> {
    let mut bytestreams: Vec<ByteStream> = Vec::new();

    let payloads_and_ranges =
        chunk_payload_ranges(payloads, range.start as usize..range.end as usize);

    for (payload, range) in payloads_and_ranges {
        bytestreams.push(
            payload
                .range_byte_stream(range.start as u64..range.end as u64)
                .await?,
        );
    }

    let body = stream::iter(bytestreams)
        .map(StreamAdaptor)
        .flatten()
        .map(|result| result.map(Frame::data));
    let stream_body = http_body_util::StreamBody::new(body);
    let concat_stream = ByteStream::new(SdkBody::from_body_1_x(stream_body));
    Ok(concat_stream)
}

// With sdk 1.0, ByteStream no longer implement Stream, despite having analogous functions
// this adaptor is just meant to make it implement Stream for places where we really need it
#[pin_project]
struct StreamAdaptor(#[pin] ByteStream);

impl Stream for StreamAdaptor {
    type Item = Result<Bytes, aws_smithy_types::byte_stream::error::Error>;

    fn poll_next(
        self: Pin<&mut Self>,
        ctx: &mut std::task::Context<'_>,
    ) -> std::task::Poll<Option<Self::Item>> {
        self.project().0.poll_next(ctx)
    }

    fn size_hint(&self) -> (usize, Option<usize>) {
        let (lower_bound_u64, upper_bound_u64) = self.0.size_hint();
        // if conversion fails, it means lower_bound is too large to fit in an usize on this
        // platform. When that's the case, we return usize::MAX as best effort. Any value is valid,
        // but MAX is the most informative.
        let lower_bound = lower_bound_u64.try_into().unwrap_or(usize::MAX);
        // for the upperbound, if conversion fails, we just say the upper bound is unknown
        let upper_bound =
            upper_bound_u64.and_then(|upper_bound_u64| upper_bound_u64.try_into().ok());
        (lower_bound, upper_bound)
    }
}

#[async_trait]
impl PutPayload for SplitPayload {
    fn len(&self) -> u64 {
        self.payloads.iter().map(|payload| payload.len()).sum()
    }

    async fn range_byte_stream(&self, range: Range<u64>) -> io::Result<ByteStream> {
        range_byte_stream_from_payloads(&self.payloads, range).await
    }
}

#[derive(Clone)]
struct FilePayload {
    len: u64,
    path: PathBuf,
}

#[async_trait]
impl PutPayload for FilePayload {
    fn len(&self) -> u64 {
        self.len
    }

    async fn range_byte_stream(&self, range: Range<u64>) -> io::Result<ByteStream> {
        assert!(!range.is_empty());
        assert!(range.end <= self.len);

        let len = range.end - range.start;
        let mut fs_builder = FsBuilder::new().path(&self.path);

        if range.start > 0 {
            fs_builder = fs_builder.offset(range.start);
        }
        fs_builder = fs_builder.length(Length::Exact(len));

        fs_builder
            .build()
            .await
            .map_err(|error| io::Error::other(format!("failed to create byte stream: {error}")))
    }
}

/// SplitPayloadBuilder is used to create a `SplitPayload`.
#[derive(Default)]
pub struct SplitPayloadBuilder {
    /// File name, payload, and range of the payload in the bundle file
    /// Range could be computed on the fly, and is just kept here for convenience.
    payloads: Vec<(String, Box<dyn PutPayload>, Range<u64>)>,
    current_offset: usize,
}

impl SplitPayloadBuilder {
    /// Creates a new SplitPayloadBuilder for given files and hotcache.
    pub fn get_split_payload(
        split_files: &[PathBuf],
        serialized_split_fields: &[u8],
        hotcache: &[u8],
    ) -> anyhow::Result<SplitPayload> {
        let mut split_payload_builder = SplitPayloadBuilder::default();
        for file in split_files {
            split_payload_builder.add_file(file)?;
        }
        split_payload_builder.add_payload(
            SPLIT_FIELDS_FILE_NAME.to_string(),
            Box::new(serialized_split_fields.to_vec()),
        );
        let offsets = split_payload_builder.finalize(hotcache)?;
        Ok(offsets)
    }

    /// Adds the payload to the bundle file.
    pub fn add_payload(&mut self, file_name: String, payload: Box<dyn PutPayload>) {
        let range = self.current_offset as u64..self.current_offset as u64 + payload.len();
        self.current_offset += payload.len() as usize;
        self.payloads.push((file_name, payload, range));
    }

    /// Adds the file to the bundle file.
    pub fn add_file(&mut self, path: &Path) -> io::Result<()> {
        let file = std::fs::metadata(path)?;
        let file_name = path
            .file_name()
            .and_then(std::ffi::OsStr::to_str)
            .map(ToOwned::to_owned)
            .ok_or_else(|| {
                io::Error::new(
                    io::ErrorKind::InvalidData,
                    format!("Invalid file name in path {path:?}"),
                )
            })?;

        let file_payload = FilePayload {
            path: path.to_owned(),
            len: file.len(),
        };

        self.add_payload(file_name, Box::new(file_payload));

        Ok(())
    }

    /// Writes the bundle file offsets metadata at the end of the bundle file,
    /// and returns the byte-range of this metadata information.
    pub fn finalize(self, hotcache: &[u8]) -> anyhow::Result<SplitPayload> {
        // Add the fields metadata to the bundle metadata.
        // Build the footer.
        let metadata_with_fixed_paths = self
            .payloads
            .iter()
            .map(|(file_name, _, range)| {
                let file_name = PathBuf::from(file_name);
                Ok((file_name, range.start..range.end))
            })
            .collect::<Result<HashMap<_, _>, anyhow::Error>>()?;

        let bundle_storage_file_offsets = BundleStorageFileOffsets {
            files: metadata_with_fixed_paths,
        };
        let metadata_json =
            BundleStorageFileOffsetsVersions::serialize(&bundle_storage_file_offsets);

        // The hotcache needs to be the next to the metadata in order to be able to read both
        // in one continuous read.
        let mut footer_bytes = Vec::new();
        footer_bytes.extend(&metadata_json);
        footer_bytes.extend((metadata_json.len() as u32).to_le_bytes());
        footer_bytes.extend(hotcache);
        footer_bytes.extend((hotcache.len() as u32).to_le_bytes());

        let mut payloads: Vec<Box<dyn PutPayload>> = self
            .payloads
            .into_iter()
            .map(|(_, payload, _)| payload)
            .collect();

        payloads.push(Box::new(footer_bytes.to_vec()));

        Ok(SplitPayload {
            payloads,
            footer_range: self.current_offset as u64
                ..self.current_offset as u64 + footer_bytes.len() as u64,
        })
    }
}

/// Returns the payloads with their absolute ranges.
fn get_payloads_with_absolute_range(
    payloads: &[Box<dyn PutPayload>],
) -> Vec<(Box<dyn PutPayload>, Range<usize>)> {
    let mut current = 0;
    payloads
        .iter()
        .map(|payload| {
            let start = current;
            current += payload.len();
            (payload.clone(), start as usize..current as usize)
        })
        .collect()
}

fn get_ranges_overlap(range1: &Range<usize>, range2: &Range<usize>) -> Range<usize> {
    range1.start.max(range2.start)..range1.end.min(range2.end)
}

// Returns payloads and their relative ranges for an absolute range.
fn chunk_payload_ranges(
    payloads: &[Box<dyn PutPayload>],
    range: Range<usize>,
) -> Vec<(Box<dyn PutPayload>, Range<usize>)> {
    let mut ranges = Vec::new();
    for (payload, payload_absolute_range) in get_payloads_with_absolute_range(payloads) {
        let absolute_range_overlap = get_ranges_overlap(&payload_absolute_range, &range);
        if !absolute_range_overlap.is_empty() {
            // Push the range relative to this payload as we will read from it.
            ranges.push((
                payload.clone(),
                (absolute_range_overlap.start - payload_absolute_range.start)
                    ..(absolute_range_overlap.end - payload_absolute_range.start),
            ));
        }
    }
    ranges
}

#[cfg(test)]
mod tests {
    use std::fs::File;
    use std::io::Write;

    use super::*;

    #[tokio::test]
    async fn test_split_offset_computer() -> anyhow::Result<()> {
        let temp_dir = tempfile::tempdir()?;
        let test_filepath1 = temp_dir.path().join("f1");
        let test_filepath2 = temp_dir.path().join("f2");

        let mut file1 = File::create(&test_filepath1)?;
        file1.write_all(b"hello")?;

        let mut file2 = File::create(&test_filepath2)?;
        file2.write_all(b"world")?;

        let split_payload =
            SplitPayloadBuilder::get_split_payload(&[test_filepath1, test_filepath2], &[], b"abc")?;

        assert_eq!(split_payload.len(), 128);

        Ok(())
    }

    #[cfg(test)]
    async fn fetch_data(
        split_streamer: &SplitPayload,
        range: Range<u64>,
    ) -> anyhow::Result<Vec<u8>> {
        use tokio::io::AsyncReadExt as _;

        let mut data = Vec::new();
        split_streamer
            .range_byte_stream(range)
            .await?
            .into_async_read()
            .read_to_end(&mut data)
            .await?;
        Ok(data)
    }

    #[test]
    fn test_chunk_payloads() -> anyhow::Result<()> {
        let payloads: Vec<Box<dyn PutPayload>> = vec![
            Box::new(vec![1, 2, 3]),
            Box::new(vec![4, 5, 6]),
            Box::new(vec![7, 8, 9, 10]),
        ];

        assert_eq!(
            chunk_payload_ranges(&payloads, 0..1)
                .iter()
                .map(|el| el.1.clone())
                .collect::<Vec<_>>(),
            vec![0..1]
        );
        assert_eq!(
            chunk_payload_ranges(&payloads, 0..2)
                .iter()
                .map(|el| el.1.clone())
                .collect::<Vec<_>>(),
            vec![0..2]
        );
        assert_eq!(
            chunk_payload_ranges(&payloads, 1..2)
                .iter()
                .map(|el| el.1.clone())
                .collect::<Vec<_>>(),
            vec![1..2]
        );
        assert_eq!(
            chunk_payload_ranges(&payloads, 2..3)
                .iter()
                .map(|el| el.1.clone())
                .collect::<Vec<_>>(),
            vec![2..3]
        );
        assert_eq!(
            chunk_payload_ranges(&payloads, 0..6)
                .iter()
                .map(|el| el.1.clone())
                .collect::<Vec<_>>(),
            vec![0..3, 0..3]
        );
        assert_eq!(
            chunk_payload_ranges(&payloads, 0..5)
                .iter()
                .map(|el| el.1.clone())
                .collect::<Vec<_>>(),
            vec![0..3, 0..2]
        );
        assert_eq!(
            chunk_payload_ranges(&payloads, 3..6)
                .iter()
                .map(|el| el.1.clone())
                .collect::<Vec<_>>(),
            vec![0..3]
        );
        assert_eq!(
            chunk_payload_ranges(&payloads, 4..6)
                .iter()
                .map(|el| el.1.clone())
                .collect::<Vec<_>>(),
            vec![1..3]
        );
        assert_eq!(
            chunk_payload_ranges(&payloads, 5..6)
                .iter()
                .map(|el| el.1.clone())
                .collect::<Vec<_>>(),
            vec![2..3]
        );
        assert_eq!(
            chunk_payload_ranges(&payloads, 2..6)
                .iter()
                .map(|el| el.1.clone())
                .collect::<Vec<_>>(),
            vec![2..3, 0..3]
        );
        assert_eq!(
            chunk_payload_ranges(&payloads, 2..5)
                .iter()
                .map(|el| el.1.clone())
                .collect::<Vec<_>>(),
            vec![2..3, 0..2]
        );

        assert_eq!(
            chunk_payload_ranges(&payloads, 7..8)
                .iter()
                .map(|el| el.1.clone())
                .collect::<Vec<_>>(),
            vec![1..2]
        );

        Ok(())
    }

    #[tokio::test]
    async fn test_split_streamer() -> anyhow::Result<()> {
        let temp_dir = tempfile::tempdir()?;
        let test_filepath1 = temp_dir.path().join("a");
        let test_filepath2 = temp_dir.path().join("b");

        let mut file1 = File::create(&test_filepath1)?;
        file1.write_all(&[123, 76])?;

        let mut file2 = File::create(&test_filepath2)?;
        file2.write_all(&[99, 55, 44])?;

        let split_streamer = SplitPayloadBuilder::get_split_payload(
            &[test_filepath1.clone(), test_filepath2.clone()],
            &[],
            &[1, 2, 3],
        )?;

        // border case 1 exact start of first block
        assert_eq!(fetch_data(&split_streamer, 0..1).await?, vec![123]);
        assert_eq!(fetch_data(&split_streamer, 0..2).await?, vec![123, 76]);
        assert_eq!(fetch_data(&split_streamer, 0..3).await?, vec![123, 76, 99]);

        // border 2 case skip and take cross adjacent blocks
        assert_eq!(fetch_data(&split_streamer, 1..3).await?, vec![76, 99]);

        // border 3 case skip and take in separate blocks with full block between
        assert_eq!(
            fetch_data(&split_streamer, 1..6).await?,
            vec![76, 99, 55, 44, 174]
        );

        // border case 4 exact middle block
        assert_eq!(fetch_data(&split_streamer, 2..5).await?, vec![99, 55, 44]);

        // border case 5, no skip but take in middle block
        assert_eq!(fetch_data(&split_streamer, 2..4).await?, vec![99, 55]);

        // border case 6 skip and take in middle block
        assert_eq!(fetch_data(&split_streamer, 3..4).await?, vec![55]);

        // border case 7 start exact last block - footer
        assert_eq!(
            fetch_data(&split_streamer, 5..10).await?,
            vec![174, 190, 18, 24, 1]
        );
        // border case 8 skip and take in last block  - footer
        assert_eq!(
            fetch_data(&split_streamer, 6..10).await?,
            vec![190, 18, 24, 1]
        );

        let total_len = split_streamer.len();
        let all_data = fetch_data(&split_streamer, 0..total_len).await?;

        // last 8 bytes are the length of the hotcache bytes
        assert_eq!(all_data[all_data.len() - 4..], 3_u32.to_le_bytes());
        Ok(())
    }
}


================================================
FILE: quickwit/quickwit-storage/src/split_cache/download_task.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::num::NonZeroU32;
use std::path::Path;
use std::sync::Arc;
use std::time::Duration;

use quickwit_common::split_file;
use tokio::sync::{OwnedSemaphorePermit, Semaphore};

use crate::split_cache::split_table::{CandidateSplit, DownloadOpportunity};
use crate::{SplitCache, StorageResolver};

async fn download_split(
    root_path: &Path,
    candidate_split: &CandidateSplit,
    storage_resolver: StorageResolver,
) -> anyhow::Result<u64> {
    let CandidateSplit {
        split_ulid,
        storage_uri,
        living_token: _,
    } = candidate_split;
    let split_filename = split_file(*split_ulid);
    let target_filepath = root_path.join(&split_filename);
    let storage = storage_resolver.resolve(storage_uri).await?;
    let num_bytes = storage
        .copy_to_file(Path::new(&split_filename), &target_filepath)
        .await?;
    Ok(num_bytes)
}

async fn perform_eviction_and_download(
    download_opportunity: DownloadOpportunity,
    split_cache: Arc<SplitCache>,
    storage_resolver: StorageResolver,
    _download_permit: OwnedSemaphorePermit,
) -> anyhow::Result<()> {
    let DownloadOpportunity {
        splits_to_delete,
        split_to_download,
    } = download_opportunity;
    let split_ulid = split_to_download.split_ulid;
    // tokio io runs on `spawn_blocking` threads anyway.
    let split_cache_clone = split_cache.clone();
    let _ = tokio::task::spawn_blocking(move || {
        split_cache_clone.evict(&splits_to_delete[..]);
    })
    .await;
    let num_bytes =
        download_split(&split_cache.root_path, &split_to_download, storage_resolver).await?;
    let mut shared_split_table_lock = split_cache.split_table.lock().unwrap();
    shared_split_table_lock.register_as_downloaded(split_ulid, num_bytes);
    Ok(())
}

pub(crate) fn spawn_download_task(
    split_cache: Arc<SplitCache>,
    storage_resolver: StorageResolver,
    num_concurrent_downloads: NonZeroU32,
) {
    let semaphore = Arc::new(Semaphore::new(num_concurrent_downloads.get() as usize));
    tokio::task::spawn(async move {
        loop {
            let download_permit = Semaphore::acquire_owned(semaphore.clone()).await.unwrap();
            let download_opportunity_opt = split_cache
                .split_table
                .lock()
                .unwrap()
                .find_download_opportunity();
            if let Some(download_opportunity) = download_opportunity_opt {
                let split_cache_clone = split_cache.clone();
                tokio::task::spawn(perform_eviction_and_download(
                    download_opportunity,
                    split_cache_clone,
                    storage_resolver.clone(),
                    download_permit,
                ));
            } else {
                // We wait 1 sec before retrying, to avoid wasting CPU.
                tokio::time::sleep(Duration::from_secs(1)).await;
            }
        }
    });
}


================================================
FILE: quickwit/quickwit-storage/src/split_cache/mod.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

mod download_task;
mod split_table;

use std::collections::BTreeMap;
use std::ffi::OsStr;
use std::io;
use std::ops::Range;
use std::path::{Path, PathBuf};
use std::str::FromStr;
use std::sync::{Arc, Mutex};

use async_trait::async_trait;
use quickwit_common::split_file;
use quickwit_common::uri::Uri;
use quickwit_config::SplitCacheLimits;
use quickwit_proto::search::ReportSplit;
use tantivy::directory::OwnedBytes;
use tracing::{error, info, instrument, warn};
use ulid::Ulid;

use crate::file_descriptor_cache::{FileDescriptorCache, SplitFile};
use crate::split_cache::download_task::spawn_download_task;
use crate::split_cache::split_table::SplitTable;
use crate::{Storage, StorageCache, wrap_storage_with_cache};

/// On disk Cache of splits for searchers.
///
/// The search acts receives reports of splits.
pub struct SplitCache {
    // Directory containing the cached split files.
    // Split ids are universally unique, so we all put them in the same directory.
    root_path: PathBuf,
    // In memory structure, listing the splits we know about regardless
    // of whether they are in cache, being downloaded, or just available for download.
    split_table: Mutex<SplitTable>,
    fd_cache: FileDescriptorCache,
}

impl SplitCache {
    /// Creates a new SplitCache and spawns the task that will continuously search for
    /// download opportunities.
    pub fn with_root_path(
        root_path: PathBuf,
        storage_resolver: crate::StorageResolver,
        limits: SplitCacheLimits,
    ) -> io::Result<Arc<SplitCache>> {
        std::fs::create_dir_all(&root_path)?;
        let mut existing_splits: BTreeMap<Ulid, u64> = Default::default();
        for dir_entry_res in std::fs::read_dir(&root_path)? {
            let dir_entry = dir_entry_res?;
            let path = dir_entry.path();
            let meta = std::fs::metadata(&path)?;
            if meta.is_dir() {
                continue;
            }
            let ext = path.extension().and_then(OsStr::to_str).unwrap_or("");
            match ext {
                "temp" => {
                    // This file is a temporary file that was being downloaded, when Quickwit was
                    // stopped (killed for instance) in a way that prevented
                    // their cleanup. It is important to remove it.
                    if let Err(io_err) = std::fs::remove_file(&path)
                        && io_err.kind() != io::ErrorKind::NotFound
                    {
                        error!(path=?path, "failed to remove temporary file");
                    }
                }
                "split" => {
                    if let Some(split_ulid) = split_id_from_path(&path) {
                        existing_splits.insert(split_ulid, meta.len());
                    } else {
                        warn!(path=%path.display(), ".split file with invalid ulid in split cache directory, ignoring");
                    }
                }
                _ => {
                    warn!(path=%path.display(), "unknown file in split cache directory, ignoring");
                }
            }
        }
        let mut split_table = SplitTable::with_limits_and_existing_splits(limits, existing_splits);

        // In case of a setting change, it could be useful to evict some splits on startup.
        let splits_to_remove_res = split_table.make_room_for_split_if_necessary(u64::MAX);
        if let Ok(splits_to_remove) = splits_to_remove_res {
            info!(
                num_splits = splits_to_remove.len(),
                "Evicting splits from the searcher cache. Has the node configuration changed?"
            );
            delete_evicted_splits(&root_path, &splits_to_remove[..]);
        }
        let fd_cache = FileDescriptorCache::with_fd_cache_capacity(limits.max_file_descriptors);
        let split_cache = Arc::new(SplitCache {
            root_path,
            split_table: Mutex::new(split_table),
            fd_cache,
        });

        spawn_download_task(
            split_cache.clone(),
            storage_resolver,
            limits.num_concurrent_downloads,
        );

        Ok(split_cache)
    }

    /// Remove splits from both the fd cache and the split cache.
    /// This method does NOT update the split table.
    pub(crate) fn evict(&self, splits_to_evict: &[Ulid]) {
        self.fd_cache.evict_split_files(splits_to_evict);
        delete_evicted_splits(&self.root_path, splits_to_evict);
    }

    /// Wraps a storage with our split cache.
    pub fn wrap_storage(self_arc: Arc<Self>, storage: Arc<dyn Storage>) -> Arc<dyn Storage> {
        let cache = Arc::new(SplitCacheBackingStorage {
            split_cache: self_arc,
            storage_root_uri: storage.uri().clone(),
        });
        wrap_storage_with_cache(cache, storage)
    }

    /// Report the split cache about the existence of new splits.
    pub fn report_splits(&self, report_splits: Vec<ReportSplit>) {
        let mut split_table = self.split_table.lock().unwrap();
        for report_split in report_splits {
            let Ok(split_ulid) = Ulid::from_str(&report_split.split_id) else {
                error!(split_id=%report_split.split_id, "received invalid split ulid: ignoring");
                continue;
            };
            let Ok(storage_uri) = Uri::from_str(&report_split.storage_uri) else {
                error!(storage_uri=%report_split.storage_uri, "received invalid storage uri: ignoring");
                continue;
            };
            split_table.report(split_ulid, storage_uri);
        }
    }

    // Returns a split guard object. As long as it is not dropped, the
    // split won't be evinced from the cache.
    async fn get_split_file(&self, split_id: Ulid, storage_uri: &Uri) -> Option<SplitFile> {
        // We touch before even checking the fd cache in order to update the file's last access time
        // for the file cache.
        let num_bytes_opt: Option<u64> = self
            .split_table
            .lock()
            .unwrap()
            .touch(split_id, storage_uri);

        let num_bytes = num_bytes_opt?;
        self.fd_cache
            .get_or_open_split_file(&self.root_path, split_id, num_bytes)
            .await
            .ok()
    }
}

/// Removes the evicted split files from the file system.
/// This function just logs errors, and swallows them.
///
/// At this point, the disk space is already accounted as released,
/// so the error could result in a "disk space leak".
#[instrument]
fn delete_evicted_splits(root_path: &Path, splits_to_delete: &[Ulid]) {
    for &split_to_delete in splits_to_delete {
        let split_file_path = root_path.join(split_file(split_to_delete));
        if let Err(_io_err) = std::fs::remove_file(&split_file_path) {
            // This is an pretty critical error. The split size is not tracked anymore at this
            // point.
            error!(path=%split_file_path.display(), "failed to remove split file from cache directory. This is critical as the file is now not taken in account in the cache size limits");
        }
    }
}

fn split_id_from_path(split_path: &Path) -> Option<Ulid> {
    let split_filename = split_path.file_name()?.to_str()?;
    let split_id_str = split_filename.strip_suffix(".split")?;
    Ulid::from_str(split_id_str).ok()
}

struct SplitCacheBackingStorage {
    split_cache: Arc<SplitCache>,
    storage_root_uri: Uri,
}

impl SplitCacheBackingStorage {
    async fn get_impl(&self, path: &Path, byte_range: Range<usize>) -> Option<OwnedBytes> {
        let split_id = split_id_from_path(path)?;
        let split_file: SplitFile = self
            .split_cache
            .get_split_file(split_id, &self.storage_root_uri)
            .await?;
        split_file.get_range(byte_range).await.ok()
    }

    async fn get_all_impl(&self, path: &Path) -> Option<OwnedBytes> {
        let split_id = split_id_from_path(path)?;
        let split_file = self
            .split_cache
            .get_split_file(split_id, &self.storage_root_uri)
            .await?;
        split_file.get_all().await.ok()
    }

    fn record_hit_metrics(&self, result_opt: Option<&OwnedBytes>) {
        let split_metrics = &crate::STORAGE_METRICS.searcher_split_cache.cache_metrics;
        if let Some(result) = result_opt {
            split_metrics.hits_num_items.inc();
            split_metrics.hits_num_bytes.inc_by(result.len() as u64);
        } else {
            split_metrics.misses_num_items.inc();
        }
    }
}

#[async_trait]
impl StorageCache for SplitCacheBackingStorage {
    async fn get(&self, path: &Path, byte_range: Range<usize>) -> Option<OwnedBytes> {
        let result = self.get_impl(path, byte_range).await;
        self.record_hit_metrics(result.as_ref());
        result
    }

    async fn get_all(&self, path: &Path) -> Option<OwnedBytes> {
        let result = self.get_all_impl(path).await;
        self.record_hit_metrics(result.as_ref());
        result
    }

    async fn put(&self, _path: PathBuf, _byte_range: Range<usize>, _bytes: OwnedBytes) {}
    async fn put_all(&self, _path: PathBuf, _bytes: OwnedBytes) {}
}


================================================
FILE: quickwit/quickwit-storage/src/split_cache/split_table.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::cmp::Ordering;
use std::collections::{BTreeMap, BTreeSet, HashMap};
use std::sync::{Arc, Weak};
use std::time::{Duration, Instant};

use quickwit_common::uri::Uri;
use quickwit_config::SplitCacheLimits;
use ulid::Ulid;

type LastAccessDate = u64;

/// Maximum number of splits to track.
const MAX_NUM_CANDIDATES: usize = 1_000;

/// Splits that are freshly reported get a last access time of `now - NEWLY_REPORT_SPLIT_LAST_TIME`.
const NEWLY_REPORTED_SPLIT_LAST_TIME: Duration = Duration::from_secs(60 * 10); // 10mn

#[derive(Clone, Copy)]
pub(crate) struct SplitKey {
    pub last_accessed: LastAccessDate,
    pub split_ulid: Ulid,
}

impl PartialOrd for SplitKey {
    fn partial_cmp(&self, other: &Self) -> Option<Ordering> {
        Some(self.cmp(other))
    }
}

impl Ord for SplitKey {
    fn cmp(&self, other: &Self) -> Ordering {
        (self.last_accessed, &self.split_ulid).cmp(&(other.last_accessed, &other.split_ulid))
    }
}

impl PartialEq for SplitKey {
    fn eq(&self, other: &Self) -> bool {
        (self.last_accessed, &self.split_ulid) == (other.last_accessed, &other.split_ulid)
    }
}

impl Eq for SplitKey {}

#[derive(Clone, Debug)]
enum Status {
    Candidate(CandidateSplit),
    Downloading { alive_token: Weak<()> },
    OnDisk { num_bytes: u64 },
}

impl PartialEq for Status {
    fn eq(&self, other: &Status) -> bool {
        match (self, other) {
            (Status::Candidate(candidate_split), Status::Candidate(other_candidate_split)) => {
                candidate_split == other_candidate_split
            }
            (Status::Downloading { .. }, Status::Downloading { .. }) => true,
            (
                Status::OnDisk { num_bytes },
                Status::OnDisk {
                    num_bytes: other_num_bytes,
                },
            ) => num_bytes == other_num_bytes,
            _ => false,
        }
    }
}

pub struct SplitInfo {
    pub(crate) split_key: SplitKey,
    status: Status,
}

/// The split table keeps track of splits we know about (regardless of whether they have already
/// been downloaded or not).
///
/// Invariant:
/// Each split appearing into split_to_status, should be listed 1 and exactly once in the
/// either
/// - on_disk_splits
/// - downloading_splits
/// - candidate_splits.
///
/// It is possible for the split table size in bytes to exceed its limits, by at
/// most one split.
pub struct SplitTable {
    on_disk_splits: BTreeSet<SplitKey>,
    downloading_splits: BTreeSet<SplitKey>,
    candidate_splits: BTreeSet<SplitKey>,
    split_to_status: HashMap<Ulid, SplitInfo>,
    origin_time: Instant,
    limits: SplitCacheLimits,
    on_disk_bytes: u64,
}

impl SplitTable {
    pub(crate) fn with_limits_and_existing_splits(
        limits: SplitCacheLimits,
        existing_filepaths: BTreeMap<Ulid, u64>,
    ) -> SplitTable {
        let origin_time = Instant::now() - NEWLY_REPORTED_SPLIT_LAST_TIME;
        let mut split_table = SplitTable {
            on_disk_splits: BTreeSet::default(),
            candidate_splits: BTreeSet::default(),
            downloading_splits: BTreeSet::default(),
            split_to_status: HashMap::default(),
            origin_time,
            limits,
            on_disk_bytes: 0u64,
        };
        split_table.acknowledge_on_disk_splits(existing_filepaths);
        split_table
    }

    fn acknowledge_on_disk_splits(&mut self, existing_filepaths: BTreeMap<Ulid, u64>) {
        for (split_ulid, num_bytes) in existing_filepaths {
            let split_info = SplitInfo {
                split_key: SplitKey {
                    last_accessed: 0,
                    split_ulid,
                },
                status: Status::OnDisk { num_bytes },
            };
            self.insert(split_info);
        }
    }
}

fn compute_timestamp(start: Instant) -> LastAccessDate {
    start.elapsed().as_micros() as u64
}

impl SplitTable {
    fn remove(&mut self, split_ulid: Ulid) -> Option<SplitInfo> {
        let split_info = self.split_to_status.remove(&split_ulid)?;
        let split_queue: &mut BTreeSet<SplitKey> = match split_info.status {
            Status::Candidate { .. } => &mut self.candidate_splits,
            Status::Downloading { .. } => &mut self.downloading_splits,
            Status::OnDisk { num_bytes } => {
                self.on_disk_bytes -= num_bytes;
                crate::metrics::STORAGE_METRICS
                    .searcher_split_cache
                    .cache_metrics
                    .in_cache_count
                    .dec();
                crate::metrics::STORAGE_METRICS
                    .searcher_split_cache
                    .cache_metrics
                    .in_cache_num_bytes
                    .sub(num_bytes as i64);
                crate::metrics::STORAGE_METRICS
                    .searcher_split_cache
                    .cache_metrics
                    .evict_num_items
                    .inc();
                crate::metrics::STORAGE_METRICS
                    .searcher_split_cache
                    .cache_metrics
                    .evict_num_bytes
                    .inc_by(num_bytes);
                &mut self.on_disk_splits
            }
        };
        let is_in_queue = split_queue.remove(&split_info.split_key);
        assert!(is_in_queue);
        if let Status::Downloading { alive_token } = &split_info.status
            && alive_token.strong_count() == 0
        {
            return None;
        }
        Some(split_info)
    }

    fn gc_downloading_splits_if_necessary(&mut self) {
        if self.downloading_splits.len()
            < (self.limits.num_concurrent_downloads.get() as usize + 10)
        {
            return;
        }
        let mut splits_to_remove = Vec::new();
        for split in &self.downloading_splits {
            if let Some(split_info) = self.split_to_status.get(&split.split_ulid)
                && let Status::Downloading { alive_token } = &split_info.status
                && alive_token.strong_count() == 0
            {
                splits_to_remove.push(split.split_ulid);
            }
        }
        for split in splits_to_remove {
            self.remove(split);
        }
    }

    /// Insert a `split_info`. This methods assumes the split was not present in the split table
    /// to begin with. It will panic if the split was already present.
    ///
    /// Keep this method private.
    fn insert(&mut self, split_info: SplitInfo) {
        let was_not_in_queue = match split_info.status {
            Status::Candidate { .. } => {
                // we truncate *before* inserting, otherwise way may end up in an inconsistent
                // state which make truncate_candidate_list loop indefinitely
                self.truncate_candidate_list();
                self.candidate_splits.insert(split_info.split_key)
            }
            Status::Downloading { .. } => self.downloading_splits.insert(split_info.split_key),
            Status::OnDisk { num_bytes } => {
                self.on_disk_bytes += num_bytes;
                crate::metrics::STORAGE_METRICS
                    .searcher_split_cache
                    .cache_metrics
                    .in_cache_count
                    .inc();
                crate::metrics::STORAGE_METRICS
                    .searcher_split_cache
                    .cache_metrics
                    .in_cache_num_bytes
                    .add(num_bytes as i64);
                self.on_disk_splits.insert(split_info.split_key)
            }
        };
        // this is fine to do in an inconsistent state, the last entry will just be ignored while
        // gcing
        self.gc_downloading_splits_if_necessary();
        assert!(was_not_in_queue);
        let split_ulid_was_absent = self
            .split_to_status
            .insert(split_info.split_key.split_ulid, split_info)
            .is_none();
        assert!(split_ulid_was_absent);
    }

    /// Touch the file, updating its last access time, possibly extending its life in the
    /// cache (if in cache).
    ///
    /// If the file is already on the disk cache, return `Some(num_bytes)`.
    /// If the file is not in cache, return `None`, and register the file in the candidate for
    /// download list.
    pub fn touch(&mut self, split_ulid: Ulid, storage_uri: &Uri) -> Option<u64> {
        let timestamp = compute_timestamp(self.origin_time);
        let status = self.mutate_split(split_ulid, |old_split_info| {
            if let Some(mut split_info) = old_split_info {
                split_info.split_key.last_accessed = timestamp;
                split_info
            } else {
                SplitInfo {
                    split_key: SplitKey {
                        split_ulid,
                        last_accessed: timestamp,
                    },
                    status: Status::Candidate(CandidateSplit {
                        storage_uri: storage_uri.clone(),
                        split_ulid,
                        living_token: Arc::new(()),
                    }),
                }
            }
        });
        if let Status::OnDisk { num_bytes } = status {
            Some(num_bytes)
        } else {
            None
        }
    }

    /// Mutates a split ulid.
    ///
    /// By design this function maintains the invariant.
    /// It removes the split with the given ulid, modifies, and re
    fn mutate_split(
        &mut self,
        split_ulid: Ulid,
        mutate_fn: impl FnOnce(Option<SplitInfo>) -> SplitInfo,
    ) -> Status {
        let split_info_opt = self.remove(split_ulid);
        let new_split: SplitInfo = mutate_fn(split_info_opt);
        let new_status = new_split.status.clone();
        self.insert(new_split);
        new_status
    }

    fn change_split_status(&mut self, split_ulid: Ulid, status: Status) {
        let start_time = self.origin_time;
        self.mutate_split(split_ulid, move |split_info_opt| {
            if let Some(mut split_info) = split_info_opt {
                split_info.status = status;
                split_info
            } else {
                SplitInfo {
                    split_key: SplitKey {
                        last_accessed: compute_timestamp(start_time),
                        split_ulid,
                    },
                    status,
                }
            }
        });
    }

    pub(crate) fn report(&mut self, split_ulid: Ulid, storage_uri: Uri) {
        let origin_time = self.origin_time;
        self.mutate_split(split_ulid, move |split_info_opt| {
            if let Some(split_info) = split_info_opt {
                return split_info;
            }
            SplitInfo {
                split_key: SplitKey {
                    last_accessed: compute_timestamp(origin_time)
                        .saturating_sub(NEWLY_REPORTED_SPLIT_LAST_TIME.as_micros() as u64),
                    split_ulid,
                },
                status: Status::Candidate(CandidateSplit {
                    storage_uri,
                    split_ulid,
                    living_token: Arc::new(()),
                }),
            }
        });
    }

    /// Make sure we have at most `MAX_CANDIDATES` candidate splits.
    fn truncate_candidate_list(&mut self) {
        // we remove one more to make place for one candidate about to be inserted
        while self.candidate_splits.len() >= MAX_NUM_CANDIDATES {
            let worst_candidate = self.candidate_splits.first().unwrap().split_ulid;
            self.remove(worst_candidate);
        }
    }

    pub(crate) fn register_as_downloaded(&mut self, split_ulid: Ulid, num_bytes: u64) {
        self.change_split_status(split_ulid, Status::OnDisk { num_bytes });
    }

    /// Change the state of the given split from candidate to downloading state,
    /// and returns its URI.
    ///
    /// This function does NOT trigger the download itself. It is up to
    /// the caller to actually initiate the download.
    pub(crate) fn start_download(&mut self, split_ulid: Ulid) -> Option<CandidateSplit> {
        let split_info = self.remove(split_ulid)?;
        let Status::Candidate(candidate_split) = split_info.status else {
            self.insert(split_info);
            return None;
        };
        let alive_token = Arc::downgrade(&candidate_split.living_token);
        self.insert(SplitInfo {
            split_key: split_info.split_key,
            status: Status::Downloading { alive_token },
        });
        Some(candidate_split)
    }

    fn best_candidate(&self) -> Option<SplitKey> {
        self.candidate_splits.last().copied()
    }

    fn is_out_of_limits(&self) -> bool {
        if self.on_disk_splits.is_empty() {
            return false;
        }
        if self.on_disk_splits.len() + self.downloading_splits.len()
            >= self.limits.max_num_splits.get() as usize
        {
            return true;
        }
        if self.on_disk_bytes > self.limits.max_num_bytes.as_u64() {
            return true;
        }
        false
    }

    /// Evicts splits to reach the target limits.
    ///
    /// Returns false if the first candidate for eviction is
    /// fresher that the candidate split. (Note this is suboptimal.
    ///
    /// Returns `None` if this would mean evicting splits that
    /// have been accessed more recently than the candidate split.
    pub(crate) fn make_room_for_split_if_necessary(
        &mut self,
        last_access_date: LastAccessDate,
    ) -> Result<Vec<Ulid>, NoRoomAvailable> {
        let mut split_infos = Vec::new();
        while self.is_out_of_limits() {
            if let Some(first_split) = self.on_disk_splits.first() {
                if first_split.last_accessed > last_access_date {
                    // This is not worth doing the eviction.
                    break;
                }
                split_infos.extend(self.remove(first_split.split_ulid));
            } else {
                break;
            }
        }
        if self.is_out_of_limits() {
            // We are still out of limits.
            // Let's not go through with the eviction, and reinsert the splits.
            for split_info in split_infos {
                self.insert(split_info);
            }
            Err(NoRoomAvailable)
        } else {
            Ok(split_infos
                .into_iter()
                .map(|split_info| split_info.split_key.split_ulid)
                .collect())
        }
    }

    pub(crate) fn find_download_opportunity(&mut self) -> Option<DownloadOpportunity> {
        let best_candidate_split_key = self.best_candidate()?;
        let splits_to_delete: Vec<Ulid> = self
            .make_room_for_split_if_necessary(best_candidate_split_key.last_accessed)
            .ok()?;
        let split_to_download: CandidateSplit =
            self.start_download(best_candidate_split_key.split_ulid)?;
        Some(DownloadOpportunity {
            splits_to_delete,
            split_to_download,
        })
    }

    #[cfg(test)]
    pub fn num_bytes(&self) -> u64 {
        self.on_disk_bytes
    }
}

#[derive(Clone, Copy, Debug)]
pub(crate) struct NoRoomAvailable;

#[derive(Clone, Debug, Eq, PartialEq)]
pub(crate) struct CandidateSplit {
    pub storage_uri: Uri,
    pub split_ulid: Ulid,
    pub living_token: Arc<()>,
}

pub(crate) struct DownloadOpportunity {
    // At this point, the split have already been removed from the split table.
    // The file however need to be deleted.
    pub splits_to_delete: Vec<Ulid>,
    pub split_to_download: CandidateSplit,
}

#[cfg(test)]
mod tests {
    use std::num::NonZeroU32;
    use std::sync::Arc;

    use bytesize::ByteSize;
    use quickwit_common::uri::Uri;
    use quickwit_config::SplitCacheLimits;
    use ulid::Ulid;

    use crate::split_cache::split_table::{
        CandidateSplit, DownloadOpportunity, SplitInfo, SplitKey, SplitTable, Status,
    };

    const TEST_STORAGE_URI: &str = "s3://test";

    fn sorted_split_ulids(num_splits: usize) -> Vec<Ulid> {
        let mut split_ulids: Vec<Ulid> =
            std::iter::repeat_with(Ulid::new).take(num_splits).collect();
        split_ulids.sort();
        split_ulids
    }

    #[test]
    fn test_split_table() {
        let mut split_table = SplitTable::with_limits_and_existing_splits(
            SplitCacheLimits {
                max_num_bytes: ByteSize::kb(1),
                max_num_splits: NonZeroU32::new(1).unwrap(),
                num_concurrent_downloads: NonZeroU32::new(1).unwrap(),
                max_file_descriptors: NonZeroU32::new(100).unwrap(),
            },
            Default::default(),
        );
        let ulids = sorted_split_ulids(2);
        let ulid1 = ulids[0];
        let ulid2 = ulids[1];
        split_table.report(ulid1, Uri::for_test(TEST_STORAGE_URI));
        split_table.report(ulid2, Uri::for_test(TEST_STORAGE_URI));
        let candidate = split_table.best_candidate().unwrap();
        assert_eq!(candidate.split_ulid, ulid2);
    }

    #[test]
    fn test_split_table_prefer_last_touched() {
        let mut split_table = SplitTable::with_limits_and_existing_splits(
            SplitCacheLimits {
                max_num_bytes: ByteSize::kb(1),
                max_num_splits: NonZeroU32::new(1).unwrap(),
                num_concurrent_downloads: NonZeroU32::new(1).unwrap(),
                max_file_descriptors: NonZeroU32::new(100).unwrap(),
            },
            Default::default(),
        );
        let ulids = sorted_split_ulids(2);
        let ulid1 = ulids[0];
        let ulid2 = ulids[1];
        split_table.report(ulid1, Uri::for_test(TEST_STORAGE_URI));
        split_table.report(ulid2, Uri::for_test(TEST_STORAGE_URI));
        let num_bytes_opt = split_table.touch(ulid1, &Uri::for_test("s3://test1/"));
        assert!(num_bytes_opt.is_none());
        let candidate = split_table.best_candidate().unwrap();
        assert_eq!(candidate.split_ulid, ulid1);
    }

    #[test]
    fn test_split_table_prefer_start_download_prevent_new_report() {
        let mut split_table = SplitTable::with_limits_and_existing_splits(
            SplitCacheLimits {
                max_num_bytes: ByteSize::kb(1),
                max_num_splits: NonZeroU32::new(1).unwrap(),
                num_concurrent_downloads: NonZeroU32::new(1).unwrap(),
                max_file_descriptors: NonZeroU32::new(100).unwrap(),
            },
            Default::default(),
        );
        let ulid1 = Ulid::new();
        split_table.report(ulid1, Uri::for_test(TEST_STORAGE_URI));
        assert_eq!(split_table.num_bytes(), 0);
        let download = split_table.start_download(ulid1);
        assert!(download.is_some());
        assert!(split_table.start_download(ulid1).is_none());
        split_table.register_as_downloaded(ulid1, 10_000_000);
        assert_eq!(split_table.num_bytes(), 10_000_000);
        assert_eq!(
            split_table.touch(ulid1, &Uri::for_test(TEST_STORAGE_URI)),
            Some(10_000_000)
        );
        let ulid2 = Ulid::new();
        split_table.report(ulid2, Uri::for_test("s3://test`/"));
        let download = split_table.start_download(ulid2);
        assert!(download.is_some());
        assert!(split_table.start_download(ulid2).is_none());
        assert_eq!(split_table.num_bytes(), 10_000_000);
        split_table.register_as_downloaded(ulid2, 3_000_000);
        assert_eq!(split_table.num_bytes(), 13_000_000);
    }

    #[test]
    fn test_eviction_due_to_size() {
        let mut split_table = SplitTable::with_limits_and_existing_splits(
            SplitCacheLimits {
                max_num_bytes: ByteSize::mb(1),
                max_num_splits: NonZeroU32::new(30).unwrap(),
                num_concurrent_downloads: NonZeroU32::new(1).unwrap(),
                max_file_descriptors: NonZeroU32::new(100).unwrap(),
            },
            Default::default(),
        );
        let mut split_ulids: Vec<Ulid> = std::iter::repeat_with(Ulid::new).take(6).collect();
        split_ulids.sort();
        let splits = [
            (split_ulids[0], 10_000),
            (split_ulids[1], 20_000),
            (split_ulids[2], 300_000),
            (split_ulids[3], 400_000),
            (split_ulids[4], 100_000),
            (split_ulids[5], 300_000),
        ];
        for (split_ulid, num_bytes) in splits {
            split_table.report(split_ulid, Uri::for_test(TEST_STORAGE_URI));
            split_table.register_as_downloaded(split_ulid, num_bytes);
        }
        let new_ulid = Ulid::new();
        split_table.report(new_ulid, Uri::for_test(TEST_STORAGE_URI));
        let DownloadOpportunity {
            splits_to_delete,
            split_to_download,
        } = split_table.find_download_opportunity().unwrap();
        assert_eq!(
            &splits_to_delete[..],
            &[splits[0].0, splits[1].0, splits[2].0][..]
        );
        assert_eq!(split_to_download.split_ulid, new_ulid);
    }

    #[test]
    fn test_eviction_due_to_num_splits() {
        let mut split_table = SplitTable::with_limits_and_existing_splits(
            SplitCacheLimits {
                max_num_bytes: ByteSize::mb(10),
                max_num_splits: NonZeroU32::new(5).unwrap(),
                num_concurrent_downloads: NonZeroU32::new(1).unwrap(),
                max_file_descriptors: NonZeroU32::new(100).unwrap(),
            },
            Default::default(),
        );
        let mut split_ulids: Vec<Ulid> = std::iter::repeat_with(Ulid::new).take(6).collect();
        split_ulids.sort();
        let splits = [
            (split_ulids[0], 10_000),
            (split_ulids[1], 20_000),
            (split_ulids[2], 300_000),
            (split_ulids[3], 400_000),
            (split_ulids[4], 100_000),
            (split_ulids[5], 300_000),
        ];
        for (split_ulid, num_bytes) in splits {
            split_table.report(split_ulid, Uri::for_test(TEST_STORAGE_URI));
            split_table.register_as_downloaded(split_ulid, num_bytes);
        }
        let new_ulid = Ulid::new();
        split_table.report(new_ulid, Uri::for_test(TEST_STORAGE_URI));
        let DownloadOpportunity {
            splits_to_delete,
            split_to_download,
        } = split_table.find_download_opportunity().unwrap();
        assert_eq!(&splits_to_delete[..], &[splits[0].0, splits[1].0]);
        assert_eq!(split_to_download.split_ulid, new_ulid);
    }

    #[test]
    fn test_failed_download_can_be_re_reported() {
        let mut split_table = SplitTable::with_limits_and_existing_splits(
            SplitCacheLimits {
                max_num_bytes: ByteSize::mb(10),
                max_num_splits: NonZeroU32::new(5).unwrap(),
                num_concurrent_downloads: NonZeroU32::new(1).unwrap(),
                max_file_descriptors: NonZeroU32::new(100).unwrap(),
            },
            Default::default(),
        );
        let split_ulid = Ulid::new();
        split_table.report(split_ulid, Uri::for_test(TEST_STORAGE_URI));
        let candidate = split_table.start_download(split_ulid).unwrap();
        // This report should be cancelled as we have a download currently running.
        split_table.report(split_ulid, Uri::for_test(TEST_STORAGE_URI));

        assert!(split_table.start_download(split_ulid).is_none());
        std::mem::drop(candidate);

        // Still not possible to start a download.
        assert!(split_table.start_download(split_ulid).is_none());

        // This report should be considered as our candidate (and its alive token has been dropped)
        split_table.report(split_ulid, Uri::for_test(TEST_STORAGE_URI));

        let candidate2 = split_table.start_download(split_ulid).unwrap();
        assert_eq!(candidate2.split_ulid, split_ulid);
    }

    #[test]
    fn test_split_table_truncate_candidates() {
        let mut split_table = SplitTable::with_limits_and_existing_splits(
            SplitCacheLimits {
                max_num_bytes: ByteSize::mb(10),
                max_num_splits: NonZeroU32::new(5).unwrap(),
                num_concurrent_downloads: NonZeroU32::new(1).unwrap(),
                max_file_descriptors: NonZeroU32::new(100).unwrap(),
            },
            Default::default(),
        );
        for i in 1..2_000 {
            let split_ulid = Ulid::new();
            split_table.report(split_ulid, Uri::for_test(TEST_STORAGE_URI));
            assert_eq!(
                split_table.candidate_splits.len(),
                i.min(super::MAX_NUM_CANDIDATES)
            );
        }
    }

    // Unit test for #5334
    #[test]
    fn test_split_inserted_is_the_worst_candidate_5334() {
        let mut split_table = SplitTable::with_limits_and_existing_splits(
            SplitCacheLimits {
                max_num_bytes: ByteSize::mb(10),
                max_num_splits: NonZeroU32::new(2).unwrap(),
                num_concurrent_downloads: NonZeroU32::new(1).unwrap(),
                max_file_descriptors: NonZeroU32::new(100).unwrap(),
            },
            Default::default(),
        );
        for i in (0u128..=super::MAX_NUM_CANDIDATES as u128).rev() {
            let split_ulid = Ulid(i);
            let candidate_split = CandidateSplit {
                storage_uri: Uri::for_test(TEST_STORAGE_URI),
                split_ulid,
                living_token: Arc::new(()),
            };
            let split_info = SplitInfo {
                split_key: SplitKey {
                    last_accessed: 0u64,
                    split_ulid,
                },
                status: Status::Candidate(candidate_split),
            };
            split_table.insert(split_info);
        }
        assert_eq!(
            split_table.candidate_splits.len(),
            super::MAX_NUM_CANDIDATES
        );
    }
}


================================================
FILE: quickwit/quickwit-storage/src/split_cache/tests.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::num::NonZeroU32;

use bytesize::ByteSize;
use quickwit_common::uri::Uri;
use quickwit_config::SplitCacheLimits;
use ulid::Ulid;

use crate::split_cache::split_table::{DownloadOpportunity, SplitTable};

const TEST_STORAGE_URI: &'static str = "s3://test";

#[test]
fn test_split_table() {
    let mut split_table = SplitTable::with_limits(SplitCacheLimits {
        max_num_bytes: ByteSize::kb(1),
        max_num_splits: NonZeroU32::new(1).unwrap(),
        num_concurrent_downloads: NonZeroU32::new(1).unwrap(),
    });
    let ulid1 = Ulid::new();
    let ulid2 = Ulid::new();
    split_table.report(ulid1, Uri::for_test(TEST_STORAGE_URI));
    split_table.report(ulid2, Uri::for_test(TEST_STORAGE_URI));
    let candidate = split_table.best_candidate().unwrap();
    assert_eq!(candidate.split_ulid, ulid2);
}

#[test]
fn test_split_table_prefer_last_touched() {
    let mut split_table = SplitTable::with_limits(SplitCacheLimits {
        max_num_bytes: ByteSize::kb(1),
        max_num_splits: NonZeroU32::new(1).unwrap(),
        num_concurrent_downloads: NonZeroU32::new(1).unwrap(),
    });
    let ulid1 = Ulid::new();
    let ulid2 = Ulid::new();
    split_table.report(ulid1, Uri::for_test(TEST_STORAGE_URI));
    split_table.report(ulid2, Uri::for_test(TEST_STORAGE_URI));
    let split_guard_opt = split_table.get_split_guard(ulid1, &Uri::for_test("s3://test1/"));
    assert!(split_guard_opt.is_none());
    let candidate = split_table.best_candidate().unwrap();
    assert_eq!(candidate.split_ulid, ulid1);
}

#[test]
fn test_split_table_prefer_start_download_prevent_new_report() {
    let mut split_table = SplitTable::with_limits(SplitCacheLimits {
        max_num_bytes: ByteSize::kb(1),
        max_num_splits: NonZeroU32::new(1).unwrap(),
        num_concurrent_downloads: NonZeroU32::new(1).unwrap(),
    });
    let ulid1 = Ulid::new();
    split_table.report(ulid1, Uri::for_test(TEST_STORAGE_URI));
    assert_eq!(split_table.num_bytes(), 0);
    let download = split_table.start_download(ulid1);
    assert!(download.is_some());
    assert!(split_table.start_download(ulid1).is_none());
    split_table.register_as_downloaded(ulid1, 10_000_000);
    assert_eq!(split_table.num_bytes(), 10_000_000);
    split_table.get_split_guard(ulid1, &Uri::for_test(TEST_STORAGE_URI));
    let ulid2 = Ulid::new();
    split_table.report(ulid2, Uri::for_test("s3://test`/"));
    let download = split_table.start_download(ulid2);
    assert!(download.is_some());
    assert!(split_table.start_download(ulid2).is_none());
    assert_eq!(split_table.num_bytes(), 10_000_000);
    split_table.register_as_downloaded(ulid2, 3_000_000);
    assert_eq!(split_table.num_bytes(), 13_000_000);
}

#[test]
fn test_eviction_due_to_size() {
    let mut split_table = SplitTable::with_limits(SplitCacheLimits {
        max_num_bytes: ByteSize::mb(1),
        max_num_splits: NonZeroU32::new(30).unwrap(),
        num_concurrent_downloads: NonZeroU32::new(1).unwrap(),
    });
    let mut split_ulids: Vec<Ulid> = std::iter::repeat_with(Ulid::new).take(6).collect();
    split_ulids.sort();
    let splits = [
        (split_ulids[0], 10_000),
        (split_ulids[1], 20_000),
        (split_ulids[2], 300_000),
        (split_ulids[3], 400_000),
        (split_ulids[4], 100_000),
        (split_ulids[5], 300_000),
    ];
    for (split_ulid, num_bytes) in splits {
        split_table.report(split_ulid, Uri::for_test(TEST_STORAGE_URI));
        split_table.register_as_downloaded(split_ulid, num_bytes);
    }
    let new_ulid = Ulid::new();
    split_table.report(new_ulid, Uri::for_test(TEST_STORAGE_URI));
    let DownloadOpportunity {
        splits_to_delete,
        split_to_download,
    } = split_table.find_download_opportunity().unwrap();
    assert_eq!(
        &splits_to_delete[..],
        &[splits[0].0, splits[1].0, splits[2].0][..]
    );
    assert_eq!(split_to_download.split_ulid, new_ulid);
}

#[test]
fn test_eviction_due_to_num_splits() {
    let mut split_table = SplitTable::with_limits(SplitCacheLimits {
        max_num_bytes: ByteSize::mb(10),
        max_num_splits: NonZeroU32::new(5).unwrap(),
        num_concurrent_downloads: NonZeroU32::new(1).unwrap(),
    });
    let mut split_ulids: Vec<Ulid> = std::iter::repeat_with(Ulid::new).take(6).collect();
    split_ulids.sort();
    let splits = [
        (split_ulids[0], 10_000),
        (split_ulids[1], 20_000),
        (split_ulids[2], 300_000),
        (split_ulids[3], 400_000),
        (split_ulids[4], 100_000),
        (split_ulids[5], 300_000),
    ];
    for (split_ulid, num_bytes) in splits {
        split_table.report(split_ulid, Uri::for_test(TEST_STORAGE_URI));
        split_table.register_as_downloaded(split_ulid, num_bytes);
    }
    let new_ulid = Ulid::new();
    split_table.report(new_ulid, Uri::for_test(TEST_STORAGE_URI));
    let DownloadOpportunity {
        splits_to_delete,
        split_to_download,
    } = split_table.find_download_opportunity().unwrap();
    assert_eq!(&splits_to_delete[..], &[splits[0].0][..]);
    assert_eq!(split_to_download.split_ulid, new_ulid);
}

#[test]
fn test_failed_download_can_be_re_reported() {
    let mut split_table = SplitTable::with_limits(SplitCacheLimits {
        max_num_bytes: ByteSize::mb(10),
        max_num_splits: NonZeroU32::new(5).unwrap(),
        num_concurrent_downloads: NonZeroU32::new(1).unwrap(),
    });
    let split_ulid = Ulid::new();
    split_table.report(split_ulid, Uri::for_test(TEST_STORAGE_URI));
    let candidate = split_table.start_download(split_ulid).unwrap();
    // This report should be cancelled as we have a download currently running.
    split_table.report(split_ulid, Uri::for_test(TEST_STORAGE_URI));

    assert!(split_table.start_download(split_ulid).is_none());
    std::mem::drop(candidate);

    // Still not possible to start a download.
    assert!(split_table.start_download(split_ulid).is_none());

    // This report should be considered as our candidate (and its alive token has been dropped)
    split_table.report(split_ulid, Uri::for_test(TEST_STORAGE_URI));

    let candidate2 = split_table.start_download(split_ulid).unwrap();
    assert_eq!(candidate2.split_ulid, split_ulid);
}


================================================
FILE: quickwit/quickwit-storage/src/storage.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::fmt;
use std::io::{self};
use std::ops::Range;
use std::path::{Path, PathBuf};

use async_trait::async_trait;
use quickwit_common::uri::Uri;
use tempfile::TempPath;
use tokio::fs::File;
use tokio::io::{AsyncRead, AsyncWrite};
use tracing::error;

use crate::{BulkDeleteError, OwnedBytes, PutPayload, StorageErrorKind, StorageResult};

/// This trait is only used to make it build trait object with `AsyncWrite + Send + Unpin`.
pub trait SendableAsync: AsyncWrite + Send + Unpin {}
impl<W: AsyncWrite + Send + Unpin> SendableAsync for W {}

/// Storage meant to receive and serve quickwit's split.
///
/// Object storage are the primary target implementation of this trait,
/// and its interface is meant to allow for multipart download/upload.
///
/// Note that Storage does not have the notion of directory separators.
/// For underlying implementation where directory separator have meaning,
/// The implementation should treat directory separators as exactly the same way
/// object storage treat them. This means when directory separators a present
/// in the storage operation path, the storage implementation should create and remove transparently
/// these intermediate directories.
#[cfg_attr(any(test, feature = "testsuite"), mockall::automock)]
#[async_trait]
pub trait Storage: fmt::Debug + Send + Sync + 'static {
    /// Check storage connection if applicable
    async fn check_connectivity(&self) -> anyhow::Result<()>;

    /// Saves a file into the storage.
    async fn put(&self, path: &Path, payload: Box<dyn PutPayload>) -> StorageResult<()>;

    /// Copies the file associated to `Path` into an `AsyncWrite`.
    /// This function is required to call `.flush()` before it successfully returns.
    ///
    /// See also `copy_to_file`.
    ///
    /// async_trait Expansion of
    /// async fn copy_to(&self, path: &Path, output: &mut dyn SendableAsync) -> StorageResult<()>;
    ///
    /// Just putting the async form is breaking mockall.
    fn copy_to<'life0, 'life1, 'life2, 'async_trait>(
        &'life0 self,
        path: &'life1 Path,
        output: &'life2 mut dyn SendableAsync,
    ) -> ::core::pin::Pin<
        Box<
            dyn ::core::future::Future<Output = StorageResult<()>>
                + ::core::marker::Send
                + 'async_trait,
        >,
    >
    where
        'life0: 'async_trait,
        'life1: 'async_trait,
        'life2: 'async_trait,
        Self: 'async_trait;

    /// Downloads an entire file and writes it into a local file.
    /// `output_path` is expected to be a file path (not a directory path)
    /// without any existing file yet.
    ///
    /// This function will attempt to download things to a temporary file
    /// in the same directory as the `output_path`, and then atomically move it
    /// to the actual `output_path`.
    ///
    /// In case of failure, `quickwit` (not the OS) will attempt to delete the file
    /// using some `Drop` mechanic.
    /// If quickwit is killed for instance, this may result in the temporary file not
    /// being deleted. It is important, upon started to identify these ".temp"
    /// files and delete them.
    ///
    /// See also `copy_to`.
    async fn copy_to_file(&self, path: &Path, output_path: &Path) -> StorageResult<u64> {
        default_copy_to_file(self, path, output_path).await
    }

    /// Downloads a slice of a file from the storage, and returns an in memory buffer
    async fn get_slice(&self, path: &Path, range: Range<usize>) -> StorageResult<OwnedBytes>;

    /// Opens a stream handle on the file from the storage.
    ///
    /// Might panic, return an error or an empty stream if the range is empty.
    async fn get_slice_stream(
        &self,
        path: &Path,
        range: Range<usize>,
    ) -> StorageResult<Box<dyn AsyncRead + Send + Unpin>>;

    /// Downloads the entire content of a "small" file, returns an in memory buffer.
    /// For large files prefer `copy_to_file`.
    async fn get_all(&self, path: &Path) -> StorageResult<OwnedBytes>;

    /// Deletes a file.
    ///
    /// This method should return Ok(()) if the file did not exist.
    async fn delete(&self, path: &Path) -> StorageResult<()>;

    /// Deletes multiple files at once.
    ///
    /// The implementation may call `[`Storage::delete`] in a loop if the underlying storage does
    /// not support deleting objects in bulk. The request can fail partially, i.e. some objects are
    /// successfully deleted while others are not.
    async fn bulk_delete<'a>(&self, paths: &[&'a Path]) -> Result<(), BulkDeleteError>;

    /// Returns whether a file exists or not.
    async fn exists(&self, path: &Path) -> StorageResult<bool> {
        match self.file_num_bytes(path).await {
            Ok(_) => Ok(true),
            Err(storage_err) if storage_err.kind() == StorageErrorKind::NotFound => Ok(false),
            Err(other_storage_err) => Err(other_storage_err),
        }
    }

    /// Returns a file size.
    async fn file_num_bytes(&self, path: &Path) -> StorageResult<u64>;

    /// Returns an URI identifying the storage
    fn uri(&self) -> &Uri;
}

async fn default_copy_to_file<S: Storage + ?Sized>(
    storage: &S,
    path: &Path,
    output_path: &Path,
) -> StorageResult<u64> {
    let mut download_temp_file =
        DownloadTempFile::with_target_path(output_path.to_path_buf()).await?;
    storage.copy_to(path, download_temp_file.as_mut()).await?;
    let num_bytes = download_temp_file.persist().await?;
    Ok(num_bytes)
}

struct DownloadTempFile {
    target_filepath: PathBuf,
    temp_filepath: PathBuf,
    file: File,
    has_attempted_deletion: bool,
}

impl DownloadTempFile {
    /// Creates or truncate temp file.
    pub async fn with_target_path(target_filepath: PathBuf) -> io::Result<DownloadTempFile> {
        let Some(filename) = target_filepath.file_name() else {
            return Err(io::Error::other(
                "Target filepath is not a directory path. Expected a filepath.",
            ));
        };
        let filename: &str = filename
            .to_str()
            .ok_or_else(|| io::Error::other("target filepath is not a valid UTF-8 string"))?;
        let mut temp_filepath = target_filepath.clone();
        temp_filepath.set_file_name(format!("{filename}.temp"));
        let file = tokio::fs::File::create(temp_filepath.clone()).await?;
        Ok(DownloadTempFile {
            target_filepath,
            temp_filepath,
            file,
            has_attempted_deletion: false,
        })
    }

    pub async fn persist(mut self) -> io::Result<u64> {
        TempPath::from_path(&self.temp_filepath).persist(&self.target_filepath)?;
        self.has_attempted_deletion = true;
        let num_bytes = std::fs::metadata(&self.target_filepath)?.len();
        Ok(num_bytes)
    }
}

impl Drop for DownloadTempFile {
    fn drop(&mut self) {
        if self.has_attempted_deletion {
            return;
        }
        let temp_filepath = self.temp_filepath.clone();
        self.has_attempted_deletion = true;
        tokio::task::spawn_blocking(move || {
            if let Err(io_error) = std::fs::remove_file(&temp_filepath) {
                error!(temp_filepath=%temp_filepath.display(), io_error=?io_error, "Failed to remove temporary file");
            }
        });
    }
}

impl AsMut<File> for DownloadTempFile {
    fn as_mut(&mut self) -> &mut File {
        &mut self.file
    }
}

#[cfg(test)]
mod tests {
    use std::time::Duration;

    use super::*;
    use crate::{RamStorage, StorageError};

    const CONTENT: &[u8] = b"hello world";

    #[tokio::test]
    async fn test_copy_to_file() {
        let ram_storage = RamStorage::default();
        let temp_dir = tempfile::tempdir().unwrap();
        let dest_filepath = temp_dir.path().join("bar");
        let path = Path::new("foo/bar");
        ram_storage
            .put(path, Box::new(CONTENT.to_owned()))
            .await
            .unwrap();
        let num_bytes = ram_storage
            .copy_to_file(path, &dest_filepath)
            .await
            .unwrap();
        assert_eq!(num_bytes, 11);
        let content = std::fs::read(&dest_filepath).unwrap();
        assert_eq!(&content, CONTENT);
    }

    #[tokio::test]
    async fn test_copy_to_file_deletes_tempfile_on_failure() {
        let mut storage = MockStorage::default();
        storage.expect_copy_to().return_once(|_, _| {
            Box::pin(futures::future::err(StorageError::from(io::Error::other(
                "fake storage error",
            ))))
        });
        let path = Path::new("foo/bar");
        let temp_dir = tempfile::tempdir().unwrap();
        let dest_filepath = temp_dir.path().join("bar");
        default_copy_to_file(&storage, path, &dest_filepath)
            .await
            .unwrap_err();
        tokio::time::sleep(Duration::from_millis(100)).await;
        let mut read_dir = tokio::fs::read_dir(dest_filepath.parent().unwrap())
            .await
            .unwrap();
        let entry_opt = read_dir
            .next_entry()
            .await
            .unwrap()
            .map(|dir_entry| dir_entry.path());
        assert_eq!(entry_opt, None);
    }
}


================================================
FILE: quickwit/quickwit-storage/src/storage_factory.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::sync::Arc;

use async_trait::async_trait;
use quickwit_common::uri::Uri;
use quickwit_config::StorageBackend;

use crate::{Storage, StorageResolverError};

/// A storage factory builds a [`Storage`] object for a target [`StorageBackend`] from a
/// [`Uri`].
#[cfg_attr(any(test, feature = "testsuite"), mockall::automock)]
#[async_trait]
pub trait StorageFactory: Send + Sync + 'static {
    /// Returns the storage backend targeted by the factory.
    fn backend(&self) -> StorageBackend;

    /// Returns the appropriate [`Storage`] object for the URI.
    async fn resolve(&self, uri: &Uri) -> Result<Arc<dyn Storage>, StorageResolverError>;
}

/// A storage factory for handling unsupported or unavailable storage backends.
#[derive(Debug, Clone)]
pub struct UnsupportedStorage {
    backend: StorageBackend,
    message: &'static str,
}

impl UnsupportedStorage {
    /// Creates a new [`UnsupportedStorage`].
    pub fn new(backend: StorageBackend, message: &'static str) -> Self {
        Self { backend, message }
    }
}

#[async_trait]
impl StorageFactory for UnsupportedStorage {
    fn backend(&self) -> StorageBackend {
        self.backend
    }

    async fn resolve(&self, _uri: &Uri) -> Result<Arc<dyn Storage>, StorageResolverError> {
        Err(StorageResolverError::UnsupportedBackend(
            self.message.to_string(),
        ))
    }
}


================================================
FILE: quickwit/quickwit-storage/src/storage_resolver.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::HashMap;
use std::fmt;
use std::sync::Arc;

use once_cell::sync::Lazy;
use quickwit_common::uri::{Protocol, Uri};
use quickwit_config::{StorageBackend, StorageConfigs};

#[cfg(feature = "azure")]
use crate::AzureBlobStorageFactory;
#[cfg(feature = "gcs")]
use crate::GoogleCloudStorageFactory;
use crate::local_file_storage::LocalFileStorageFactory;
use crate::ram_storage::RamStorageFactory;
use crate::{S3CompatibleObjectStorageFactory, Storage, StorageFactory, StorageResolverError};

/// Returns the [`Storage`] instance associated with the protocol of a URI. The actual creation of
/// storage objects is delegated to pre-registered [`StorageFactory`]. The resolver is only
/// responsible for dispatching to the appropriate factory.
#[derive(Clone)]
pub struct StorageResolver {
    per_backend_factories: Arc<HashMap<StorageBackend, Box<dyn StorageFactory>>>,
}

impl fmt::Debug for StorageResolver {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        f.debug_struct("StorageResolver").finish()
    }
}

impl StorageResolver {
    /// Creates an empty [`StorageResolverBuilder`].
    pub fn builder() -> StorageResolverBuilder {
        StorageResolverBuilder::default()
    }

    /// Resolves the given URI.
    pub async fn resolve(&self, uri: &Uri) -> Result<Arc<dyn Storage>, StorageResolverError> {
        let backend = match uri.protocol() {
            Protocol::Azure => StorageBackend::Azure,
            Protocol::File => StorageBackend::File,
            Protocol::Ram => StorageBackend::Ram,
            Protocol::S3 => StorageBackend::S3,
            Protocol::Google => StorageBackend::Google,
            _ => {
                let message = format!(
                    "Quickwit does not support {} as a storage backend",
                    uri.protocol()
                );
                return Err(StorageResolverError::UnsupportedBackend(message));
            }
        };
        let storage_factory = self.per_backend_factories.get(&backend).ok_or({
            let message = format!("no storage factory is registered for {}", uri.protocol());
            StorageResolverError::UnsupportedBackend(message)
        })?;
        let storage = storage_factory.resolve(uri).await?;
        Ok(storage)
    }

    /// Creates and returns a default [`StorageResolver`] with the default storage configuration for
    /// each backend. Note that if the environment (env vars, instance metadata, ...) fails to
    /// provide the necessary credentials, the default Azure or S3 storage returned by this
    /// resolver will not work.
    pub fn unconfigured() -> Self {
        static STORAGE_RESOLVER: Lazy<StorageResolver> = Lazy::new(|| {
            let storage_configs = StorageConfigs::default();
            StorageResolver::configured(&storage_configs)
        });
        STORAGE_RESOLVER.clone()
    }

    /// Creates and returns a [`StorageResolver`].
    pub fn configured(storage_configs: &StorageConfigs) -> Self {
        let mut builder = StorageResolver::builder()
            .register(LocalFileStorageFactory)
            .register(RamStorageFactory::default())
            .register(S3CompatibleObjectStorageFactory::new(
                storage_configs.find_s3().cloned().unwrap_or_default(),
            ));
        #[cfg(feature = "azure")]
        {
            builder = builder.register(AzureBlobStorageFactory::new(
                storage_configs.find_azure().cloned().unwrap_or_default(),
            ));
        }
        #[cfg(not(feature = "azure"))]
        {
            use crate::storage_factory::UnsupportedStorage;

            builder = builder.register(UnsupportedStorage::new(
                StorageBackend::Azure,
                "Quickwit was compiled without the `azure` feature",
            ))
        }
        #[cfg(feature = "gcs")]
        {
            builder = builder.register(GoogleCloudStorageFactory::new(
                storage_configs.find_google().cloned().unwrap_or_default(),
            ));
        }
        #[cfg(not(feature = "gcs"))]
        {
            use crate::storage_factory::UnsupportedStorage;

            builder = builder.register(UnsupportedStorage::new(
                StorageBackend::Google,
                "Quickwit was compiled without the `gcs` feature",
            ))
        }
        builder
            .build()
            .expect("storage factory and config backends should match")
    }

    /// Returns a [`StorageResolver`] for testing purposes. Unlike
    /// [`StorageResolver::unconfigured`], this resolver does not return a singleton.
    #[cfg(any(test, feature = "testsuite"))]
    pub fn for_test() -> Self {
        StorageResolver::builder()
            .register(RamStorageFactory::default())
            .register(LocalFileStorageFactory)
            .build()
            .expect("storage factory and config backends should match")
    }
}

#[derive(Default)]
pub struct StorageResolverBuilder {
    per_backend_factories: HashMap<StorageBackend, Box<dyn StorageFactory>>,
}

impl StorageResolverBuilder {
    /// Registers a [`StorageFactory`].
    pub fn register<S: StorageFactory>(mut self, storage_factory: S) -> Self {
        self.per_backend_factories
            .insert(storage_factory.backend(), Box::new(storage_factory));
        self
    }

    /// Builds the [`StorageResolver`].
    pub fn build(self) -> anyhow::Result<StorageResolver> {
        let storage_resolver = StorageResolver {
            per_backend_factories: Arc::new(self.per_backend_factories),
        };
        Ok(storage_resolver)
    }
}

#[cfg(test)]
mod tests {
    use std::path::Path;

    use super::*;
    use crate::{MockStorageFactory, RamStorage};

    #[tokio::test]
    async fn test_storage_resolver_simple() -> anyhow::Result<()> {
        let mut file_storage_factory = MockStorageFactory::new();
        file_storage_factory
            .expect_backend()
            .returning(|| StorageBackend::File);

        let mut ram_storage_factory = MockStorageFactory::new();
        ram_storage_factory
            .expect_backend()
            .returning(|| StorageBackend::Ram);
        ram_storage_factory.expect_resolve().returning(|_uri| {
            Ok(Arc::new(
                RamStorage::builder()
                    .put("hello", b"hello_content_second")
                    .build(),
            ))
        });
        let storage_resolver = StorageResolver::builder()
            .register(file_storage_factory)
            .register(ram_storage_factory)
            .build()
            .unwrap();
        let storage = storage_resolver.resolve(&Uri::for_test("ram:///")).await?;
        let data = storage.get_all(Path::new("hello")).await?;
        assert_eq!(&data[..], b"hello_content_second");
        Ok(())
    }

    #[tokio::test]
    async fn test_storage_resolver_override() -> anyhow::Result<()> {
        let mut first_ram_storage_factory = MockStorageFactory::new();
        first_ram_storage_factory
            .expect_backend()
            .returning(|| StorageBackend::Ram);

        let mut second_ram_storage_factory = MockStorageFactory::new();
        second_ram_storage_factory
            .expect_backend()
            .returning(|| StorageBackend::Ram);
        second_ram_storage_factory
            .expect_resolve()
            .returning(|uri| {
                assert_eq!(uri.as_str(), "ram:///home");
                Ok(Arc::new(
                    RamStorage::builder()
                        .put("hello", b"hello_content_second")
                        .build(),
                ))
            });
        let storage_resolver = StorageResolver::builder()
            .register(first_ram_storage_factory)
            .register(second_ram_storage_factory)
            .build()
            .unwrap();
        let storage = storage_resolver
            .resolve(&Uri::for_test("ram:///home"))
            .await?;
        let data = storage.get_all(Path::new("hello")).await?;
        assert_eq!(&data[..], b"hello_content_second");
        Ok(())
    }

    #[tokio::test]
    async fn test_storage_resolver_unsupported_protocol() {
        let storage_resolver = StorageResolver::unconfigured();
        let storage_uri = Uri::for_test("postgresql://localhost:5432/metastore");
        let resolver_error = storage_resolver.resolve(&storage_uri).await.unwrap_err();
        assert!(matches!(
            resolver_error,
            StorageResolverError::UnsupportedBackend(_)
        ));
    }
}


================================================
FILE: quickwit/quickwit-storage/src/timeout_and_retry_storage.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::ops::Range;
use std::path::Path;
use std::sync::Arc;

use async_trait::async_trait;
use quickwit_common::uri::Uri;
use quickwit_common::{rate_limited_info, rate_limited_warn};
use quickwit_config::StorageTimeoutPolicy;
use tantivy::directory::OwnedBytes;
use tokio::io::AsyncRead;

use crate::storage::SendableAsync;
use crate::{BulkDeleteError, PutPayload, Storage, StorageErrorKind, StorageResult};

/// Storage proxy that implements a retry operation if the underlying storage
/// takes too long.
///
/// This is useful in order to ensure a low latency on S3.
/// Retrying agressively is recommended for S3.
///
/// <https://docs.aws.amazon.com/whitepapers/latest/s3-optimizing-performance-best-practices/timeouts-and-retries-for-latency-sensitive-applications.html>
#[derive(Clone, Debug)]
pub struct TimeoutAndRetryStorage {
    underlying: Arc<dyn Storage>,
    storage_timeout_policy: StorageTimeoutPolicy,
}

impl TimeoutAndRetryStorage {
    /// Creates a new `TimeoutAndRetryStorage`.
    ///
    /// See [StorageTimeoutPolicy] for more information.
    pub fn new(storage: Arc<dyn Storage>, storage_timeout_policy: StorageTimeoutPolicy) -> Self {
        TimeoutAndRetryStorage {
            underlying: storage,
            storage_timeout_policy,
        }
    }
}

#[async_trait]
impl Storage for TimeoutAndRetryStorage {
    async fn check_connectivity(&self) -> anyhow::Result<()> {
        self.underlying.check_connectivity().await
    }

    async fn put(&self, path: &Path, payload: Box<dyn PutPayload>) -> StorageResult<()> {
        self.underlying.put(path, payload).await
    }

    fn copy_to<'life0, 'life1, 'life2, 'async_trait>(
        &'life0 self,
        path: &'life1 Path,
        output: &'life2 mut dyn SendableAsync,
    ) -> ::core::pin::Pin<
        Box<
            dyn ::core::future::Future<Output = StorageResult<()>>
                + ::core::marker::Send
                + 'async_trait,
        >,
    >
    where
        'life0: 'async_trait,
        'life1: 'async_trait,
        'life2: 'async_trait,
        Self: 'async_trait,
    {
        self.underlying.copy_to(path, output)
    }

    async fn copy_to_file(&self, path: &Path, output_path: &Path) -> StorageResult<u64> {
        self.underlying.copy_to_file(path, output_path).await
    }

    /// Downloads a slice of a file from the storage, and returns an in memory buffer
    async fn get_slice(&self, path: &Path, range: Range<usize>) -> StorageResult<OwnedBytes> {
        let num_bytes = range.len();
        for (attempt_id, timeout_duration) in self
            .storage_timeout_policy
            .compute_timeout(num_bytes)
            .enumerate()
        {
            let get_slice_fut = self.underlying.get_slice(path, range.clone());
            // TODO test avoid aborting timed out requests. #5468
            match tokio::time::timeout(timeout_duration, get_slice_fut).await {
                Ok(result) => {
                    crate::STORAGE_METRICS
                        .get_slice_timeout_successes
                        .get(attempt_id)
                        .or(crate::STORAGE_METRICS.get_slice_timeout_successes.last())
                        .unwrap()
                        .inc();
                    return result;
                }
                Err(_elapsed) => {
                    rate_limited_info!(limit_per_min=60, num_bytes=num_bytes, path=%path.display(), timeout_secs=timeout_duration.as_secs_f32(), "get timeout elapsed");
                    continue;
                }
            }
        }
        rate_limited_warn!(limit_per_min=60, num_bytes=num_bytes, path=%path.display(), "all get_slice attempts timeouted");
        crate::STORAGE_METRICS.get_slice_timeout_all_timeouts.inc();
        return Err(
            StorageErrorKind::Timeout.with_error(anyhow::anyhow!("internal timeout on get_slice"))
        );
    }

    async fn get_slice_stream(
        &self,
        path: &Path,
        range: Range<usize>,
    ) -> StorageResult<Box<dyn AsyncRead + Send + Unpin>> {
        self.underlying.get_slice_stream(path, range).await
    }

    async fn get_all(&self, path: &Path) -> StorageResult<OwnedBytes> {
        self.underlying.get_all(path).await
    }

    async fn delete(&self, path: &Path) -> StorageResult<()> {
        self.underlying.delete(path).await
    }

    async fn bulk_delete<'a>(&self, paths: &[&'a Path]) -> Result<(), BulkDeleteError> {
        self.underlying.bulk_delete(paths).await
    }

    async fn exists(&self, path: &Path) -> StorageResult<bool> {
        self.underlying.exists(path).await
    }

    async fn file_num_bytes(&self, path: &Path) -> StorageResult<u64> {
        self.underlying.file_num_bytes(path).await
    }

    fn uri(&self) -> &Uri {
        self.underlying.uri()
    }
}

#[cfg(test)]
mod tests {

    use std::sync::Mutex;
    use std::time::Duration;

    use tokio::time::Instant;

    use super::*;

    #[derive(Debug)]
    struct StorageWithDelay {
        delays: Mutex<Vec<Duration>>,
    }

    impl StorageWithDelay {
        pub fn new(mut delays: Vec<Duration>) -> StorageWithDelay {
            delays.reverse();
            StorageWithDelay {
                delays: Mutex::new(delays),
            }
        }
    }

    #[async_trait]
    impl Storage for StorageWithDelay {
        fn uri(&self) -> &Uri {
            todo!();
        }

        async fn check_connectivity(&self) -> anyhow::Result<()> {
            todo!()
        }
        async fn put(&self, _path: &Path, _payload: Box<dyn PutPayload>) -> StorageResult<()> {
            todo!();
        }
        fn copy_to<'life0, 'life1, 'life2, 'async_trait>(
            &'life0 self,
            _path: &'life1 Path,
            _output: &'life2 mut dyn SendableAsync,
        ) -> ::core::pin::Pin<
            Box<
                dyn ::core::future::Future<Output = StorageResult<()>>
                    + ::core::marker::Send
                    + 'async_trait,
            >,
        >
        where
            'life0: 'async_trait,
            'life1: 'async_trait,
            'life2: 'async_trait,
            Self: 'async_trait,
        {
            todo!();
        }

        async fn get_slice(&self, _path: &Path, range: Range<usize>) -> StorageResult<OwnedBytes> {
            let duration_opt = self.delays.lock().unwrap().pop();
            let Some(delay) = duration_opt else {
                return Err(
                    StorageErrorKind::Internal.with_error(anyhow::anyhow!("internal error"))
                );
            };
            tokio::time::sleep(delay).await;
            let buf = vec![0u8; range.len()];
            Ok(OwnedBytes::new(buf))
        }
        async fn get_slice_stream(
            &self,
            _path: &Path,
            _range: Range<usize>,
        ) -> StorageResult<Box<dyn AsyncRead + Send + Unpin>> {
            todo!()
        }
        async fn get_all(&self, _path: &Path) -> StorageResult<OwnedBytes> {
            todo!();
        }
        async fn delete(&self, _path: &Path) -> StorageResult<()> {
            todo!();
        }
        async fn bulk_delete<'a>(&self, _paths: &[&'a Path]) -> Result<(), BulkDeleteError> {
            todo!();
        }
        async fn exists(&self, _path: &Path) -> StorageResult<bool> {
            todo!()
        }
        async fn file_num_bytes(&self, _path: &Path) -> StorageResult<u64> {
            todo!();
        }
    }

    #[tokio::test]
    async fn test_timeout_and_retry_storage() {
        tokio::time::pause();

        let timeout_policy = StorageTimeoutPolicy {
            min_throughtput_bytes_per_secs: 100_000,
            timeout_millis: 2_000,
            max_num_retries: 1,
        };

        let path = Path::new("foo/bar");

        {
            let now = Instant::now();
            let storage_with_delay =
                StorageWithDelay::new(vec![Duration::from_secs(5), Duration::from_secs(3)]);
            let storage =
                TimeoutAndRetryStorage::new(Arc::new(storage_with_delay), timeout_policy.clone());
            assert_eq!(
                storage.get_slice(path, 10..100).await.unwrap_err().kind,
                StorageErrorKind::Timeout
            );
            let elapsed = now.elapsed().as_millis();
            assert!(elapsed.abs_diff(2 * 2_000) < 100);
        }
        {
            let now = Instant::now();
            let storage_with_delay =
                StorageWithDelay::new(vec![Duration::from_secs(5), Duration::from_secs(1)]);
            let storage = TimeoutAndRetryStorage::new(Arc::new(storage_with_delay), timeout_policy);
            assert!(storage.get_slice(path, 10..100).await.is_ok(),);
            let elapsed = now.elapsed().as_millis();
            assert!(elapsed.abs_diff(2_000 + 1_000) < 100);
        }
    }
}


================================================
FILE: quickwit/quickwit-storage/src/versioned_component.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::io::Read;

use anyhow::Context;
use tantivy::directory::OwnedBytes;

/// Helper trait for versioning.
///
/// See the unit test for an example.
pub trait VersionedComponent: Default + Copy + Clone {
    /// This number is used to identify that the type.
    const MAGIC_NUMBER: u32;
    /// Type of the component we are versioning.
    type Component;
    /// Component name, used to make explicit error messages.
    fn component_name() -> &'static str {
        std::any::type_name::<Self::Component>()
    }
    /// Return the version code.
    fn to_version_code(self) -> u32;

    /// Serialize the header.
    /// Only the current version is meant to be serialized.
    fn header() -> [u8; 8] {
        let mut header = [0u8; 8];
        header[0..4].copy_from_slice(&Self::MAGIC_NUMBER.to_le_bytes());
        header[4..8].copy_from_slice(&Self::default().to_version_code().to_le_bytes());
        header
    }

    /// Deserialize the header from a `Read` trait.
    /// This method will check for the magic number and version code.
    fn try_read_component(bytes: &mut OwnedBytes) -> anyhow::Result<Self::Component> {
        let version = try_read_version::<Self>(bytes)?;
        version.deserialize_impl(bytes)
    }

    /// Parse the version code.
    /// This version is meant to be implemented but only to be called
    /// from `try_deserialize_from_bytes`.
    ///
    /// If the version is unknown, this method should return `None`.
    fn try_from_version_code_impl(version_code: u32) -> Option<Self>;

    /// Function to serialize a given component with the current codec.
    fn serialize(component: &Self::Component) -> Vec<u8> {
        let mut output = Vec::with_capacity(8);
        output.extend_from_slice(&Self::header());
        Self::serialize_impl(component, &mut output);
        output
    }

    /// Serialize the component using the current format.
    ///
    /// This function should NOT serialize the header.
    /// It should only append content to the `output` buffer.
    ///
    /// This function is meant to be implemented but should not be called directly.
    /// Instead, client should use `.serialize(..)`.
    fn serialize_impl(component: &Self::Component, output: &mut Vec<u8>);

    /// This method is meant to be implemented but not called, except by `try_read_component`.
    ///
    /// This method should consume the bytes from the `OwnedBytes`.
    fn deserialize_impl(&self, bytes: &mut OwnedBytes) -> anyhow::Result<Self::Component>;
}

/// Deserialize the header from a `Read` trait.
///
/// (This function is not part of the trait to make it private.)
fn try_read_version<V: VersionedComponent>(bytes: &mut OwnedBytes) -> anyhow::Result<V> {
    let mut header_bytes: [u8; 8] = [0u8; 8];
    bytes
        .read_exact(&mut header_bytes[..])
        .with_context(|| format!("failed to read header for {}", V::component_name()))?;
    try_deserialize_from_bytes::<V>(header_bytes)
}

/// Deserialize the header from 8 bytes.
/// An error is returned if the magic number does not match,
/// or if the version is unsupported.
///
/// (This function is not part of the trait to make it private.)
fn try_deserialize_from_bytes<V: VersionedComponent>(header_bytes: [u8; 8]) -> anyhow::Result<V> {
    let magic_number = u32::from_le_bytes(header_bytes[0..4].try_into().unwrap());
    if magic_number != V::MAGIC_NUMBER {
        anyhow::bail!("hot directory metadata's magic number does not match");
    }
    let version_code: u32 = u32::from_le_bytes(header_bytes[4..8].try_into().unwrap());
    V::try_from_version_code_impl(version_code).with_context(|| {
        format!(
            "version code {} is not supported for {}",
            version_code,
            V::component_name()
        )
    })
}

#[cfg(test)]
mod tests {
    use tantivy::directory::OwnedBytes;

    use crate::VersionedComponent;

    #[derive(Copy, Clone, Default)]
    #[repr(u32)]
    enum FakeComponentCodec {
        V1,
        #[default]
        V2 = 2,
    }

    #[derive(Debug)]
    struct FakeComponent {
        value: u32,
    }

    impl VersionedComponent for FakeComponentCodec {
        const MAGIC_NUMBER: u32 = 332_221_734u32;

        type Component = FakeComponent;

        fn to_version_code(self) -> u32 {
            self as u32
        }

        fn try_from_version_code_impl(version_code: u32) -> Option<Self> {
            match version_code {
                1u32 => Some(Self::V1),
                2u32 => Some(Self::V2),
                _ => None,
            }
        }

        fn serialize_impl(component: &Self::Component, output: &mut Vec<u8>) {
            output.extend_from_slice(&component.value.to_le_bytes());
        }

        fn deserialize_impl(&self, bytes: &mut OwnedBytes) -> anyhow::Result<Self::Component> {
            match self {
                FakeComponentCodec::V1 => {
                    if bytes.len() < 8 {
                        anyhow::bail!("not enough bytes to deserialize");
                    }
                    let value_bytes: [u8; 8] = bytes[0..8].try_into().unwrap();
                    let value: u32 = u64::from_le_bytes(value_bytes) as u32;
                    Ok(FakeComponent { value })
                }
                FakeComponentCodec::V2 => {
                    if bytes.len() < 4 {
                        anyhow::bail!("not enough bytes to deserialize");
                    }
                    let value_bytes: [u8; 4] = bytes[0..4].try_into().unwrap();
                    bytes.advance(4);
                    let value: u32 = u32::from_le_bytes(value_bytes);
                    Ok(FakeComponent { value })
                }
            }
        }
    }

    #[test]
    fn test_versioned_component() {
        let component = FakeComponent { value: 42 };
        let buf = FakeComponentCodec::serialize(&component);
        {
            let mut payload = OwnedBytes::new(buf.clone());
            let fake_component = FakeComponentCodec::try_read_component(&mut payload).unwrap();
            assert_eq!(fake_component.value, 42u32);
        }
        {
            let mut buf_clone = buf.clone();
            buf_clone[0] = 0u8;
            let mut payload = OwnedBytes::new(buf_clone);
            let fake_component_err =
                FakeComponentCodec::try_read_component(&mut payload).unwrap_err();
            assert!(
                fake_component_err
                    .to_string()
                    .to_lowercase()
                    .contains("magic number")
            );
        }
        {
            let mut buf_clone = buf;
            buf_clone.truncate(4);
            buf_clone.extend_from_slice(&1u32.to_le_bytes());
            buf_clone.extend_from_slice(&32u64.to_le_bytes());
            let mut payload = OwnedBytes::new(buf_clone);
            let fake_component = FakeComponentCodec::try_read_component(&mut payload).unwrap();
            assert_eq!(fake_component.value, 32u32);
        }
    }
}


================================================
FILE: quickwit/quickwit-storage/tests/azure_storage.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

// This file is an integration test that assumes that a connection
// to Azurite (the emulated azure blob storage environment)
// with default `loose` config is possible.

#[cfg(feature = "integration-testsuite")]
#[tokio::test]
#[cfg_attr(not(feature = "ci-test"), ignore)]
async fn azure_storage_test_suite() -> anyhow::Result<()> {
    use std::path::PathBuf;

    use anyhow::Context;
    use azure_storage_blobs::prelude::ClientBuilder;
    use quickwit_common::rand::append_random_suffix;
    use quickwit_storage::{AzureBlobStorage, MultiPartPolicy};
    let _ = tracing_subscriber::fmt::try_init();

    // Setup container.
    let container_name = append_random_suffix("quickwit").to_lowercase();
    let container_client = ClientBuilder::emulator().container_client(&container_name);
    container_client.create().into_future().await?;

    let mut object_storage = AzureBlobStorage::new_emulated(&container_name);
    quickwit_storage::storage_test_suite(&mut object_storage).await?;

    let mut object_storage = AzureBlobStorage::new_emulated(&container_name).with_prefix(
        PathBuf::from("/integration-tests/test-azure-compatible-storage"),
    );
    quickwit_storage::storage_test_single_part_upload(&mut object_storage)
        .await
        .context("test single-part upload failed")?;

    object_storage.set_policy(MultiPartPolicy {
        // On azure, block size is limited between 64KB and 100MB.
        target_part_num_bytes: 5 * 1_024 * 1_024, // 5MiB
        max_num_parts: 10_000,
        multipart_threshold_num_bytes: 10_000_000,
        max_object_num_bytes: 5_000_000_000_000,
        max_concurrent_uploads: 100,
    });
    quickwit_storage::storage_test_multi_part_upload(&mut object_storage)
        .await
        .context("test multipart upload failed")?;

    // Teardown container.
    container_client.delete().into_future().await?;
    Ok(())
}


================================================
FILE: quickwit/quickwit-storage/tests/google_cloud_storage.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

// This file is an integration test that assumes that a connection
// to Fake GCS Server (the emulated google cloud storage environment)

#[cfg(all(feature = "integration-testsuite", feature = "gcs"))]
#[cfg_attr(not(feature = "ci-test"), ignore)]
mod gcp_storage_test_suite {
    use std::str::FromStr;

    use anyhow::Context;
    use quickwit_common::rand::append_random_suffix;
    use quickwit_common::setup_logging_for_tests;
    use quickwit_common::uri::Uri;
    use quickwit_storage::test_config_helpers::{
        LOCAL_GCP_EMULATOR_ENDPOINT, new_emulated_google_cloud_storage,
    };

    pub fn sign_gcs_request(req: &mut reqwest::Request) {
        req.headers_mut().insert(
            reqwest::header::AUTHORIZATION,
            reqwest::header::HeaderValue::from_str("Bearer dummy").unwrap(),
        );
    }

    async fn create_gcs_bucket(bucket_name: &str) -> anyhow::Result<()> {
        let client = reqwest::Client::new();
        let url = format!("{LOCAL_GCP_EMULATOR_ENDPOINT}/storage/v1/b");
        let mut request = client
            .post(url)
            .body(serde_json::to_vec(&serde_json::json!({
                "name": bucket_name,
            }))?)
            .header(reqwest::header::CONTENT_TYPE, "application/json")
            .build()?;

        sign_gcs_request(&mut request);

        let response = client.execute(request).await?;

        if !response.status().is_success() {
            let error_text = response.text().await?;
            anyhow::bail!("Failed to create bucket: {}", error_text);
        };
        Ok(())
    }

    #[tokio::test]
    async fn google_cloud_storage_test_suite() -> anyhow::Result<()> {
        setup_logging_for_tests();

        let bucket_name = append_random_suffix("sample-bucket").to_lowercase();
        create_gcs_bucket(bucket_name.as_str())
            .await
            .context("Failed to create test GCS bucket")?;

        let mut object_storage =
            new_emulated_google_cloud_storage(&Uri::from_str(&format!("gs://{bucket_name}"))?)?;

        quickwit_storage::storage_test_suite(&mut object_storage).await?;

        let mut object_storage = new_emulated_google_cloud_storage(&Uri::from_str(&format!(
            "gs://{bucket_name}/integration-tests/test-gcs-storage"
        ))?)?;

        quickwit_storage::storage_test_single_part_upload(&mut object_storage)
            .await
            .context("test single-part upload failed")?;

        // TODO: Uncomment storage_test_multi_part_upload when the XML API is
        // supported in the emulated GCS server
        // (https://github.com/fsouza/fake-gcs-server/pull/1164)

        // object_storage.set_policy(MultiPartPolicy {
        //     target_part_num_bytes: 5 * 1_024 * 1_024,
        //     max_num_parts: 10_000,
        //     multipart_threshold_num_bytes: 10_000_000,
        //     max_object_num_bytes: 5_000_000_000_000,
        //     max_concurrent_uploads: 100,
        // });
        // quickwit_storage::storage_test_multi_part_upload(&mut object_storage)
        //     .await
        //     .context("test multipart upload failed")?;
        Ok(())
    }
}


================================================
FILE: quickwit/quickwit-storage/tests/s3_storage.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

// This file is an integration test that assumes that the environment
// makes it po

#[cfg(feature = "integration-testsuite")]
pub mod s3_storage_test_suite {

    use std::path::PathBuf;
    use std::str::FromStr;

    use anyhow::Context;
    use once_cell::sync::OnceCell;
    use quickwit_common::setup_logging_for_tests;
    use quickwit_common::uri::Uri;
    use quickwit_config::S3StorageConfig;
    use quickwit_storage::{MultiPartPolicy, S3CompatibleObjectStorage};
    use tokio::runtime::Runtime;

    // Introducing a common runtime for the unit tests in this file.
    //
    // By default, tokio creates a new runtime, for each unit test.
    // Here, we want to use the singleton `AwsSdkConfig` object.
    // This object packs a smithy connector which itself includes a
    // hyper client pool. A hyper client cannot be used from multiple runtimes.
    fn test_runtime_singleton() -> &'static Runtime {
        static RUNTIME_CACHE: OnceCell<tokio::runtime::Runtime> = OnceCell::new();
        RUNTIME_CACHE.get_or_init(|| {
            tokio::runtime::Builder::new_multi_thread()
                .worker_threads(1)
                .enable_all()
                .build()
                .unwrap()
        })
    }

    async fn run_s3_storage_test_suite(s3_storage_config: S3StorageConfig, bucket_uri: &str) {
        setup_logging_for_tests();

        let storage_uri = Uri::from_str(bucket_uri).unwrap();
        let mut object_storage =
            S3CompatibleObjectStorage::from_uri(&s3_storage_config, &storage_uri)
                .await
                .unwrap();

        quickwit_storage::storage_test_suite(&mut object_storage)
            .await
            .context("S3 storage test suite failed")
            .unwrap();

        let mut object_storage =
            S3CompatibleObjectStorage::from_uri(&s3_storage_config, &storage_uri)
                .await
                .unwrap()
                .with_prefix(PathBuf::from("test-s3-compatible-storage"));

        quickwit_storage::storage_test_single_part_upload(&mut object_storage)
            .await
            .context("test single-part upload failed")
            .unwrap();

        object_storage.set_policy(MultiPartPolicy {
            target_part_num_bytes: 5 * 1_024 * 1_024, //< the minimum on S3 is 5MB.
            max_num_parts: 10_000,
            multipart_threshold_num_bytes: 10_000_000,
            max_object_num_bytes: 5_000_000_000_000,
            max_concurrent_uploads: 100,
        });

        quickwit_storage::storage_test_multi_part_upload(&mut object_storage)
            .await
            .context("test multipart upload failed")
            .unwrap();
    }

    #[test]
    #[cfg_attr(not(feature = "ci-test"), ignore)]
    fn test_suite_on_s3_storage_path_style_access() {
        use quickwit_common::rand::append_random_suffix;

        let s3_storage_config = S3StorageConfig {
            force_path_style_access: true,
            ..Default::default()
        };
        let bucket_uri =
            append_random_suffix("s3://quickwit-integration-tests/test-path-style-access");
        let test_runtime = test_runtime_singleton();
        test_runtime.block_on(run_s3_storage_test_suite(s3_storage_config, &bucket_uri));
    }

    #[test]
    #[cfg_attr(not(feature = "ci-test"), ignore)]
    fn test_suite_on_s3_storage_virtual_hosted_style_access() {
        use quickwit_common::rand::append_random_suffix;

        let s3_storage_config = S3StorageConfig {
            force_path_style_access: false,
            ..Default::default()
        };
        let bucket_uri = append_random_suffix(
            "s3://quickwit-integration-tests/test-virtual-hosted-style-access",
        );
        let test_runtime = test_runtime_singleton();
        test_runtime.block_on(run_s3_storage_test_suite(s3_storage_config, &bucket_uri));
    }

    #[test]
    #[cfg_attr(not(feature = "ci-test"), ignore)]
    fn test_suite_on_s3_storage_bulk_delete_single_object_delete_api() {
        use std::str::FromStr;

        use anyhow::Context;
        use quickwit_common::rand::append_random_suffix;
        use quickwit_common::uri::Uri;

        let s3_storage_config = S3StorageConfig {
            disable_multi_object_delete: true,
            ..Default::default()
        };
        let bucket_uri = append_random_suffix(
            "s3://quickwit-integration-tests/test-bulk-delete-single-object-delete-api",
        );
        let storage_uri = Uri::from_str(&bucket_uri).unwrap();
        let test_runtime = test_runtime_singleton();
        test_runtime.block_on(async move {
            let mut object_storage =
                S3CompatibleObjectStorage::from_uri(&s3_storage_config, &storage_uri)
                    .await
                    .unwrap();
            quickwit_storage::test_write_and_bulk_delete(&mut object_storage)
                .await
                .context("test bulk delete single-object delete API failed")
                .unwrap();
        });
    }
}


================================================
FILE: quickwit/quickwit-telemetry/Cargo.toml
================================================
[package]
name = "quickwit-telemetry"
description = "Open Telemetry services"

version.workspace = true
edition.workspace = true
homepage.workspace = true
documentation.workspace = true
repository.workspace = true
authors.workspace = true
license.workspace = true

[dependencies]
async-trait = { workspace = true }
hostname = { workspace = true }
md5 = { workspace = true }
once_cell = { workspace = true }
reqwest = { workspace = true }
serde = { workspace = true }
tokio = { workspace = true }
tracing = { workspace = true }
username = { workspace = true }
uuid = { workspace = true }

# This is actually not used directly the goal is to fix the version
# used by reqwest. 0.8.30 has an unclear license.
encoding_rs = { workspace = true }

quickwit-common = { workspace = true }

[dev-dependencies]
serde_json = { workspace = true }

[package.metadata.cargo-machete]
# see above
ignored = ["encoding_rs"]


================================================
FILE: quickwit/quickwit-telemetry/src/lib.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#![allow(clippy::bool_assert_comparison)]
#![deny(clippy::disallowed_methods)]

pub mod payload;
/// This crate contains  the code responsible for sending usage data to Quickwit inc's server.
mod sender;
pub(crate) mod sink;

use once_cell::sync::OnceCell;
use payload::QuickwitTelemetryInfo;
use tracing::info;

use crate::payload::TelemetryEvent;
pub use crate::sender::is_telemetry_disabled;
use crate::sender::{TelemetryLoopHandle, TelemetrySender};

static TELEMETRY_SENDER: OnceCell<TelemetrySender> = OnceCell::new();

/// Returns a `TelemetryLoopHandle` if the telemetry loop is not yet started.
pub fn start_telemetry_loop(quickwit_info: QuickwitTelemetryInfo) -> Option<TelemetryLoopHandle> {
    let telemetry_sender =
        TELEMETRY_SENDER.get_or_init(|| TelemetrySender::from_quickwit_info(quickwit_info));
    // This should not happen... unless telemetry is enabled and you are running tests in parallel
    // in the same process.
    if telemetry_sender.loop_started() {
        info!("telemetry loop already started. please disable telemetry during tests");
        return None;
    }
    Some(telemetry_sender.start_loop())
}

/// Sends a telemetry event to Quickwit's server via HTTP.
///
/// Telemetry guarantees to send at most 1 request per minute.
/// Each requests can ship at most 10 messages.
///
/// If this methods is called too often, some events will be dropped.
///
/// If the http requests fail, the error will be silent.
///
/// We voluntarily use an enum here to make it easier for reader
/// to audit the type of information that is send home.
pub async fn send_telemetry_event(event: TelemetryEvent) {
    if let Some(telemetry_sender) = TELEMETRY_SENDER.get() {
        telemetry_sender.send(event).await;
    }
}

/// This environment variable can be set to disable sending telemetry events.
pub const DISABLE_TELEMETRY_ENV_KEY: &str = "QW_DISABLE_TELEMETRY";


================================================
FILE: quickwit/quickwit-telemetry/src/payload.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::collections::HashSet;
use std::env;
use std::time::UNIX_EPOCH;

use serde::{Deserialize, Serialize};
use uuid::Uuid;

/// Represents the payload of the request sent with telemetry requests.
#[derive(Debug, Serialize, Deserialize)]
pub struct TelemetryPayload {
    /// Client information. See details in `[ClientInformation]`.
    pub client_info: ClientInfo,
    /// Quickwit information. See details in `[QuickwitInfo]`.
    pub quickwit_info: QuickwitTelemetryInfo,
    pub events: Vec<EventWithTimestamp>,
    /// Represents the number of events that where drops due to the
    /// combination of the `TELEMETRY_PUSH_COOLDOWN` and `MAX_EVENT_IN_QUEUE`.
    pub num_dropped_events: usize,
}

#[derive(Debug, Serialize, Deserialize)]
pub struct EventWithTimestamp {
    /// Unix time in seconds.
    pub unixtime: u64,
    /// Telemetry event.
    #[serde(flatten)]
    pub event: TelemetryEvent,
}

/// Returns the number of seconds elapsed since UNIX_EPOCH.
///
/// If the system clock is set before 1970, returns 0.
fn unixtime() -> u64 {
    match UNIX_EPOCH.elapsed() {
        Ok(duration) => duration.as_secs(),
        Err(_) => 0u64,
    }
}

impl From<TelemetryEvent> for EventWithTimestamp {
    fn from(event: TelemetryEvent) -> Self {
        EventWithTimestamp {
            unixtime: unixtime(),
            event,
        }
    }
}

/// Represents a Telemetry Event send to Quickwit's telemetry server for usage information.
#[derive(Debug, Serialize, Deserialize, PartialEq, Eq)]
#[serde(tag = "type")]
#[serde(rename_all = "snake_case")]
pub enum TelemetryEvent {
    RunCommand,
    /// EndCommand (with the return code).
    EndCommand {
        return_code: i32,
    },
    /// Event sent every 12h to signal the server is running.
    Running,
    /// UI index.html was requested.
    UiIndexPageLoad,
}

#[derive(Clone, Debug, Serialize, Deserialize)]
pub struct ClientInfo {
    session_uuid: uuid::Uuid,
    os: String,
    arch: String,
    hashed_host_username: String,
    kubernetes: bool,
}

#[derive(Clone, Debug, Serialize, Deserialize)]
pub struct QuickwitTelemetryInfo {
    pub version: String,
    pub services: HashSet<String>,
    pub features: HashSet<QuickwitFeature>,
}

impl QuickwitTelemetryInfo {
    pub fn new(services: HashSet<String>, features: HashSet<QuickwitFeature>) -> Self {
        Self {
            features,
            version: env!("CARGO_PKG_VERSION").to_string(),
            services,
        }
    }
}

impl Default for QuickwitTelemetryInfo {
    fn default() -> Self {
        Self {
            features: HashSet::new(),
            version: env!("CARGO_PKG_VERSION").to_string(),
            services: HashSet::new(),
        }
    }
}

#[derive(Clone, Debug, Serialize, Deserialize, PartialEq, Eq, Hash)]
#[serde(rename_all = "snake_case")]
pub enum QuickwitFeature {
    FileBackedMetastore,
    Jaeger,
    Otlp,
    PostgresqMetastore,
}

fn hashed_host_username() -> String {
    let hostname = hostname::get()
        .map(|hostname| hostname.to_string_lossy().to_string())
        .unwrap_or_default();
    let username = username::get_user_name().unwrap_or_default();
    let hashed_value = format!("{hostname}:{username}");
    let digest = md5::compute(hashed_value.as_bytes());
    format!("{digest:x}")
}

impl Default for ClientInfo {
    fn default() -> ClientInfo {
        ClientInfo {
            session_uuid: Uuid::new_v4(),
            os: env::consts::OS.to_string(),
            arch: env::consts::ARCH.to_string(),
            hashed_host_username: hashed_host_username(),
            kubernetes: std::env::var_os("KUBERNETES_SERVICE_HOST").is_some(),
        }
    }
}

#[cfg(test)]
mod tests {
    use serde_json;

    use super::{EventWithTimestamp, TelemetryEvent};

    #[test]
    fn test_serialize_payload_as_expected() {
        let event = EventWithTimestamp {
            unixtime: 0,
            event: TelemetryEvent::EndCommand { return_code: 0 },
        };
        let json = serde_json::to_string(&event).unwrap();
        assert_eq!(
            json,
            r#"{"unixtime":0,"type":"end_command","return_code":0}"#
        );
    }
}


================================================
FILE: quickwit/quickwit-telemetry/src/sender.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::mem;
use std::sync::Arc;
use std::sync::atomic::{AtomicBool, Ordering};
use std::time::Duration;

use tokio::sync::mpsc::{Receiver, Sender};
use tokio::sync::{Mutex, RwLock, oneshot};
use tokio::task::JoinHandle;
use tokio::time::Interval;
use tracing::info;

use crate::payload::{
    ClientInfo, EventWithTimestamp, QuickwitTelemetryInfo, TelemetryEvent, TelemetryPayload,
};
use crate::sink::{HttpClient, Sink};

/// At most 1 Request per minutes.
const TELEMETRY_PUSH_COOLDOWN: Duration = Duration::from_secs(60);

/// Interval at which to send telemetry `Running` event.
const TELEMETRY_RUNNING_EVENT_INTERVAL: Duration =
    Duration::from_secs(if cfg!(test) { 3 } else { 60 * 60 * 12 }); // 12h

/// Upon termination of the program, we send one last telemetry request with pending events.
/// This duration is the amount of time we wait for at most to send that last telemetry request.
const LAST_REQUEST_TIMEOUT: Duration = Duration::from_secs(1);

const MAX_NUM_EVENTS_IN_QUEUE: usize = 10;

#[cfg(test)]
struct ClockButton(Sender<()>);

#[cfg(test)]
impl ClockButton {
    async fn tick(&self) {
        let _ = self.0.send(()).await;
    }
}

enum Clock {
    Periodical(Mutex<Interval>),
    #[cfg(test)]
    Manual(Mutex<Receiver<()>>),
}

impl Clock {
    pub fn periodical(period: Duration) -> Clock {
        let interval = tokio::time::interval(period);
        Clock::Periodical(Mutex::new(interval))
    }

    #[cfg(test)]
    pub async fn manual() -> (ClockButton, Clock) {
        let (tx, rx) = tokio::sync::mpsc::channel(1);
        let _ = tx.send(()).await;
        let button = ClockButton(tx);
        (button, Clock::Manual(Mutex::new(rx)))
    }

    async fn tick(&self) {
        match self {
            Clock::Periodical(interval) => {
                interval.lock().await.tick().await;
            }
            #[cfg(test)]
            Clock::Manual(channel) => {
                channel.lock().await.recv().await;
            }
        }
    }
}

#[derive(Default)]
struct EventsState {
    events: Vec<EventWithTimestamp>,
    num_dropped_events: usize,
}

impl EventsState {
    fn drain_events(&mut self) -> EventsState {
        mem::replace(
            self,
            EventsState {
                events: Vec::new(),
                num_dropped_events: 0,
            },
        )
    }

    /// Adds an event.
    /// If the queue is already saturated, (ie. it has reached the len `MAX_NUM_EVENTS_IN_QUEUE`)
    // Returns true iff it was the first event in the queue.
    fn push_event(&mut self, event: TelemetryEvent) -> bool {
        if self.events.len() >= MAX_NUM_EVENTS_IN_QUEUE {
            self.num_dropped_events += 1;
            return false;
        }
        let events_was_empty = self.events.is_empty();
        self.events.push(EventWithTimestamp::from(event));
        events_was_empty
    }
}

struct Events {
    state: RwLock<EventsState>,
    items_available_tx: Sender<()>,
    items_available_rx: RwLock<Receiver<()>>,
}

impl Default for Events {
    fn default() -> Self {
        let (items_available_tx, items_available_rx) = tokio::sync::mpsc::channel(1);
        Events {
            state: RwLock::new(EventsState::default()),
            items_available_tx,
            items_available_rx: RwLock::new(items_available_rx),
        }
    }
}

impl Events {
    /// Wait for events to be available (if there are pending events, then do not wait)
    /// and then send them to the ingest API server.
    async fn drain_events(&self) -> EventsState {
        self.items_available_rx.write().await.recv().await;
        self.state.write().await.drain_events()
    }

    async fn push_event(&self, event: TelemetryEvent) {
        let is_first_event = self.state.write().await.push_event(event);
        if is_first_event {
            let _ = self.items_available_tx.send(()).await;
        }
    }
}

pub(crate) struct Inner {
    sink: Option<Box<dyn Sink>>,
    client_info: ClientInfo,
    quickwit_info: QuickwitTelemetryInfo,
    /// This channel is just used to signal there are new items available.
    events: Events,
    clock: Clock,
    is_started: AtomicBool,
}

impl Inner {
    pub fn is_disabled(&self) -> bool {
        self.sink.is_none()
    }

    async fn create_telemetry_payload(&self) -> TelemetryPayload {
        let events_state = self.events.drain_events().await;
        TelemetryPayload {
            client_info: self.client_info.clone(),
            quickwit_info: self.quickwit_info.clone(),
            events: events_state.events,
            num_dropped_events: events_state.num_dropped_events,
        }
    }

    /// Wait for events to be available (if there are pending events, then do not wait)
    /// and then send them to the ingest API server.
    ///
    /// If the requests fails, it fails silently.
    async fn send_pending_events(&self) {
        if let Some(sink) = self.sink.as_ref() {
            let payload = self.create_telemetry_payload().await;
            sink.send_payload(payload).await;
        }
    }

    async fn send(&self, event: TelemetryEvent) {
        if self.is_disabled() {
            return;
        }
        self.events.push_event(event).await;
    }
}

pub struct TelemetrySender {
    pub(crate) inner: Arc<Inner>,
}

pub enum TelemetryLoopHandle {
    NoLoop,
    WithLoop {
        join_handle: JoinHandle<()>,
        terminate_command_tx: oneshot::Sender<()>,
    },
}

impl TelemetryLoopHandle {
    /// Terminate telemetry will exit the telemetry loop
    /// and possibly send the last request, possibly ignoring the
    /// telemetry cooldown.
    pub async fn terminate_telemetry(self) {
        if let Self::WithLoop {
            join_handle,
            terminate_command_tx,
        } = self
        {
            let _ = terminate_command_tx.send(());
            let _ = tokio::time::timeout(LAST_REQUEST_TIMEOUT, join_handle).await;
        }
    }
}

impl TelemetrySender {
    pub fn from_quickwit_info(quickwit_info: QuickwitTelemetryInfo) -> Self {
        let http_client = create_http_client();
        TelemetrySender::new(
            quickwit_info,
            http_client,
            Clock::periodical(TELEMETRY_PUSH_COOLDOWN),
        )
    }

    fn new<S: Sink>(
        quickwit_info: QuickwitTelemetryInfo,
        sink_opt: Option<S>,
        clock: Clock,
    ) -> Self {
        let sink_opt: Option<Box<dyn Sink>> = if let Some(sink) = sink_opt {
            Some(Box::new(sink))
        } else {
            None
        };
        Self {
            inner: Arc::new(Inner {
                sink: sink_opt,
                client_info: ClientInfo::default(),
                quickwit_info,
                events: Events::default(),
                clock,
                is_started: AtomicBool::new(false),
            }),
        }
    }

    pub fn loop_started(&self) -> bool {
        self.inner.is_started.load(Ordering::Relaxed)
    }

    pub fn start_loop(&self) -> TelemetryLoopHandle {
        let (terminate_command_tx, mut terminate_command_rx) = oneshot::channel();
        if self.inner.is_disabled() {
            return TelemetryLoopHandle::NoLoop;
        }

        assert!(
            self.inner
                .is_started
                .compare_exchange(false, true, Ordering::SeqCst, Ordering::SeqCst)
                .is_ok(),
            "The telemetry loop is already started."
        );

        let inner = self.inner.clone();
        start_monitor_if_server_running_task(inner.clone());
        let join_handle = tokio::task::spawn(async move {
            // This channel is used to send the command to terminate telemetry.
            loop {
                let quit_loop = tokio::select! {
                    _ = (&mut terminate_command_rx) => { true }
                    _ = inner.clock.tick() => { false }
                };
                inner.send_pending_events().await;
                if quit_loop {
                    break;
                }
            }
        });
        TelemetryLoopHandle::WithLoop {
            join_handle,
            terminate_command_tx,
        }
    }

    pub async fn send(&self, event: TelemetryEvent) {
        self.inner.send(event).await;
    }
}

/// telemetry is disabled in tests.
#[cfg(test)]
pub fn is_telemetry_disabled() -> bool {
    true
}
/// Check to see if telemetry is enabled.
#[cfg(not(test))]
pub fn is_telemetry_disabled() -> bool {
    quickwit_common::get_bool_from_env(crate::DISABLE_TELEMETRY_ENV_KEY, false)
}

fn start_monitor_if_server_running_task(telemetry_sender: Arc<Inner>) {
    let mut clock = tokio::time::interval(TELEMETRY_RUNNING_EVENT_INTERVAL);
    tokio::spawn(async move {
        // Drop the first immediate tick.
        clock.tick().await;
        loop {
            clock.tick().await;
            telemetry_sender.send(TelemetryEvent::Running).await;
        }
    });
}

fn create_http_client() -> Option<HttpClient> {
    if is_telemetry_disabled() {
        info!("telemetry to quickwit is disabled");
        return None;
    }
    let client = HttpClient::try_new()?;
    info!("telemetry to {} is enabled", client.endpoint());
    Some(client)
}

#[cfg(test)]
mod tests {

    use std::env;

    use super::*;

    #[ignore]
    #[tokio::test]
    async fn test_enabling_and_disabling_telemetry() {
        // SAFETY: this test may not be entirely sound if not run with nextest or --test-threads=1
        // as this is only a test, and it would be extremly inconvenient to run it in a different
        // way, we are keeping it that way

        // We group the two in a single test to ensure it happens on the same thread.
        unsafe { env::set_var(crate::DISABLE_TELEMETRY_ENV_KEY, "") };
        assert_eq!(
            TelemetrySender::from_quickwit_info(QuickwitTelemetryInfo::default())
                .inner
                .is_disabled(),
            true
        );
        unsafe { env::remove_var(crate::DISABLE_TELEMETRY_ENV_KEY) };
        assert_eq!(
            TelemetrySender::from_quickwit_info(QuickwitTelemetryInfo::default())
                .inner
                .is_disabled(),
            false
        );
    }

    #[tokio::test]
    async fn test_telemetry_no_wait_for_first_event() {
        let (tx, mut rx) = tokio::sync::mpsc::unbounded_channel();
        let (_clock_btn, clock) = Clock::manual().await;
        let telemetry_sender =
            TelemetrySender::new(QuickwitTelemetryInfo::default(), Some(tx), clock);
        let loop_handler = telemetry_sender.start_loop();
        telemetry_sender.send(TelemetryEvent::UiIndexPageLoad).await;
        let payload_opt = rx.recv().await;
        assert!(payload_opt.is_some());
        let payload = payload_opt.unwrap();
        assert_eq!(payload.events.len(), 1);
        loop_handler.terminate_telemetry().await;
    }

    #[tokio::test]
    async fn test_telemetry_two_events() {
        let (tx, mut rx) = tokio::sync::mpsc::unbounded_channel();
        let (clock_btn, clock) = Clock::manual().await;
        let telemetry_sender =
            TelemetrySender::new(QuickwitTelemetryInfo::default(), Some(tx), clock);
        let loop_handler = telemetry_sender.start_loop();
        telemetry_sender.send(TelemetryEvent::UiIndexPageLoad).await;
        {
            let payload = rx.recv().await.unwrap();
            assert_eq!(payload.events.len(), 1);
        }
        clock_btn.tick().await;
        telemetry_sender.send(TelemetryEvent::UiIndexPageLoad).await;
        {
            let payload = rx.recv().await.unwrap();
            assert_eq!(payload.events.len(), 1);
        }
        loop_handler.terminate_telemetry().await;
    }

    #[tokio::test]
    async fn test_telemetry_uptime_events() {
        let (tx, mut rx) = tokio::sync::mpsc::unbounded_channel();
        let (clock_btn, clock) = Clock::manual().await;
        let telemetry_sender =
            TelemetrySender::new(QuickwitTelemetryInfo::default(), Some(tx), clock);
        let loop_handler = telemetry_sender.start_loop();
        telemetry_sender.send(TelemetryEvent::UiIndexPageLoad).await;
        {
            let payload = rx.recv().await.unwrap();
            assert_eq!(payload.events.len(), 1);
        }
        clock_btn.tick().await;
        tokio::time::sleep(TELEMETRY_RUNNING_EVENT_INTERVAL + Duration::from_secs(1)).await;
        {
            let payload = rx.recv().await.unwrap();
            assert_eq!(payload.events.len(), 1);
            assert_eq!(payload.events[0].event, TelemetryEvent::Running);
        }
        loop_handler.terminate_telemetry().await;
    }

    #[tokio::test]
    async fn test_telemetry_cooldown_observed() {
        let (tx, mut rx) = tokio::sync::mpsc::unbounded_channel();
        let (clock_btn, clock) = Clock::manual().await;
        let telemetry_sender =
            TelemetrySender::new(QuickwitTelemetryInfo::default(), Some(tx), clock);
        let loop_handler = telemetry_sender.start_loop();
        telemetry_sender.send(TelemetryEvent::UiIndexPageLoad).await;
        {
            let payload = rx.recv().await.unwrap();
            assert_eq!(payload.events.len(), 1);
        }
        tokio::task::yield_now().await;
        telemetry_sender.send(TelemetryEvent::UiIndexPageLoad).await;

        let timeout_res = tokio::time::timeout(Duration::from_millis(1), rx.recv()).await;
        assert!(timeout_res.is_err());

        telemetry_sender.send(TelemetryEvent::UiIndexPageLoad).await;
        clock_btn.tick().await;
        {
            let payload = rx.recv().await.unwrap();
            assert_eq!(payload.events.len(), 2);
        }
        loop_handler.terminate_telemetry().await;
    }

    #[tokio::test]
    async fn test_terminate_telemetry_sends_pending_events() {
        let (tx, mut rx) = tokio::sync::mpsc::unbounded_channel();
        let (_clock_btn, clock) = Clock::manual().await;
        let telemetry_sender =
            TelemetrySender::new(QuickwitTelemetryInfo::default(), Some(tx), clock);
        let loop_handler = telemetry_sender.start_loop();
        telemetry_sender.send(TelemetryEvent::UiIndexPageLoad).await;
        let payload = rx.recv().await.unwrap();
        assert_eq!(payload.events.len(), 1);
        telemetry_sender
            .send(TelemetryEvent::EndCommand { return_code: 2i32 })
            .await;
        loop_handler.terminate_telemetry().await;
        let payload = rx.recv().await.unwrap();
        assert_eq!(payload.events.len(), 1);
        assert!(matches!(
            &payload.events[0].event,
            &TelemetryEvent::EndCommand { .. }
        ));
    }
}


================================================
FILE: quickwit/quickwit-telemetry/src/sink.rs
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use std::time::Duration;

use async_trait::async_trait;
use reqwest::Client;
use reqwest::redirect::Policy;
use tokio::sync::mpsc::UnboundedSender;

use crate::payload::TelemetryPayload;

/// Telemetry ingest API URL
const DEFAULT_TELEMETRY_INGEST_API_URL: &str = "https://telemetry.quickwit.io/";

fn telemetry_ingest_api_url() -> String {
    if let Some(ingest_api_url) = std::env::var_os("TELEMETRY_INGEST_API") {
        ingest_api_url.to_string_lossy().to_string()
    } else {
        DEFAULT_TELEMETRY_INGEST_API_URL.to_string()
    }
}

#[async_trait]
pub trait Sink: Send + Sync + 'static {
    async fn send_payload(&self, payload: TelemetryPayload);
}
pub struct HttpClient {
    client: Client,
    endpoint: String,
}

impl HttpClient {
    pub fn try_new() -> Option<Self> {
        let client = Client::builder()
            .redirect(Policy::limited(3))
            .timeout(Duration::from_secs(10))
            .build()
            .ok()?;
        Some(HttpClient {
            client,
            endpoint: telemetry_ingest_api_url(),
        })
    }

    pub fn endpoint(&self) -> &str {
        &self.endpoint
    }
}

#[async_trait]
impl Sink for UnboundedSender<TelemetryPayload> {
    async fn send_payload(&self, payload: TelemetryPayload) {
        let _ = self.send(payload);
    }
}

#[async_trait]
impl Sink for HttpClient {
    async fn send_payload(&self, payload: TelemetryPayload) {
        // Note that we swallow the error if any
        let _ = self.client.post(&self.endpoint).json(&payload).send().await;
    }
}


================================================
FILE: quickwit/quickwit-ui/.gitignore
================================================
# See https://help.github.com/articles/ignoring-files/ for more about ignoring files.

# dependencies
/node_modules
/.pnp
.pnp.js

# testing
/coverage
/cypress/videos
/cypress/screenshots

# misc
.DS_Store
.env.local
.env.development.local
.env.test.local
.env.production.local

npm-debug.log*
yarn-debug.log*
yarn-error.log*


================================================
FILE: quickwit/quickwit-ui/.gitignore_for_build_directory
================================================
# Ignore all files in this directory
*
# except .gitignore
!.gitignore


================================================
FILE: quickwit/quickwit-ui/Makefile
================================================
.PHONY: build install start

build:
	yarn build

install:
	yarn install --frozen-lockfile --network-timeout 300000

start:
	yarn start


================================================
FILE: quickwit/quickwit-ui/README.md
================================================
# quickwit-ui


## Prerequisites

`node` and `yarn` need to be installed on your system.
The project then relies on misc nodejs tools that can be installed locally by 
running `yarn`.

## Available Scripts


In the project directory, you can run:


### `yarn start`

Runs the app in the development mode.\
Open [http://localhost:3000](http://localhost:3000) to view it in the browser.

The page will reload if you make edits.\
You will also see any lint errors in the console.

### `yarn test`

Launches the test runner.

### `yarn e2e-test`

Launches the e2e test runner with [cypress](https://www.cypress.io/). To make them work, you need to start a
searcher beforehand with `cargo r run --service searcher --config config/quickwit.yaml`.

### `yarn format`

Re-writes files with the correct formatting if needed.\
You might want to configure your IDE to do that [automatically](https://biomejs.dev/guides/editors/first-party-extensions/).

### `yarn build`

Builds the app for production to the `build` folder.\
It correctly bundles React in production mode and optimizes the build for the best performance.

The build is minified and the filenames include the hashes.\
Your app is ready to be deployed!


================================================
FILE: quickwit/quickwit-ui/biome.json
================================================
{
  "$schema": "./node_modules/@biomejs/biome/configuration_schema.json",
  "formatter": {
    "enabled": true,
    "indentStyle": "space",
    "includes": ["**", "!build/**"]
  },
  "linter": {
    "enabled": true,
    "rules": {
      "recommended": true,
      "style": "off",
      "complexity": "off",
      "correctness": {
        "useExhaustiveDependencies": "off"
      },
      "suspicious": {
        "noTsIgnore": "off",
        "useIterableCallbackReturn": "off",
        "noExplicitAny": "off",
        "noArrayIndexKey": "off"
      }
    },
    "includes": ["**", "!build/**"]
  }
}


================================================
FILE: quickwit/quickwit-ui/build/.gitignore
================================================
# Ignore all files in this directory
*
# except .gitignore
!.gitignore


================================================
FILE: quickwit/quickwit-ui/e2e/homepage.spec.ts
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

import { expect, test } from "@playwright/test";

test.describe("Home navigation", () => {
  test("Should display sidebar links", async ({ page }) => {
    await page.goto("/ui");
    await expect(page.locator("a")).toContainText([
      "Query editor",
      "Indexes",
      "Cluster",
    ]);
  });

  test("Should navigate to cluster state", async ({ page }) => {
    await page.goto("/ui");
    await page.getByRole("link", { name: "Cluster" }).click();
    await expect(page.getByLabel("breadcrumb")).toContainText("Cluster");
    await expect(page.getByText("cluster_id")).toBeVisible();
  });

  test("Should display otel logs index page", async ({ page }) => {
    await page.goto("/ui/indexes/otel-logs-v0_7");
    await expect(
      page.getByLabel("breadcrumb").getByRole("link", { name: "Indexes" }),
    ).toBeVisible();
  });
});


================================================
FILE: quickwit/quickwit-ui/index.html
================================================
<!DOCTYPE html>
<html lang="en">
  <head>
    <meta charset="utf-8" />
    <link rel="icon" href="favicon.ico" />
    <meta name="viewport" content="width=device-width, initial-scale=1" />
    <meta name="theme-color" content="#000000" />
    <meta
      name="description"
      content="Sub-second search & analytics engine on cloud storage"
    />
    <link rel="apple-touch-icon" href="logo192.png" />
    <!--
      manifest.json provides metadata used when your web app is installed on a
      user's mobile device or desktop. See https://developers.google.com/web/fundamentals/web-app-manifest/
    -->
    <link rel="manifest" href="manifest.json" />
    <!--
      TODO: remove and replace with Quickwit fonts.
    -->
    <link
      rel="stylesheet"
      href="https://fonts.googleapis.com/css?family=Roboto:300,400,500,700&display=swap"
    />
    <title>Quickwit UI</title>
  </head>
  <body>
    <noscript>You need to enable JavaScript to run this app.</noscript>
    <div id="root"></div>
    <script type="module" src="src/index.tsx"></script>
  </body>
</html>


================================================
FILE: quickwit/quickwit-ui/jest/setup.js
================================================
global.TextEncoder = require("util").TextEncoder;


================================================
FILE: quickwit/quickwit-ui/jest.config.js
================================================
module.exports = {
  setupFiles: [
    "react-app-polyfill/jsdom", // polyfill jsdom api (such as fetch)
    "<rootDir>/jest/setup.js", // polyfill textEncode
  ],

  setupFilesAfterEnv: ["@testing-library/jest-dom"],

  testEnvironment: "jsdom",

  transform: {
    // transform js file (typescript and es6 import)
    "^.+\\.(js|jsx|mjs|cjs|ts|tsx)$": [
      "babel-jest",
      {
        presets: [["babel-preset-react-app", { runtime: "automatic" }]],
        plugins: [
          [
            "@dr.pogodin/babel-plugin-transform-assets",
            { extensions: ["svg", "woff2"] },
          ],
        ],
        babelrc: false,
        configFile: false,
      },
    ],
  },

  moduleNameMapper: {
    "@monaco-editor/react": "<rootDir>/mocks/monacoMock.js",
    "swagger-ui-react": "<rootDir>/mocks/swaggerUIMock.js",
    "@mui/x-charts": "<rootDir>/mocks/x-charts.js",
  },

  testPathIgnorePatterns: ["/node_modules/", "<rootDir>/e2e/"],

  resetMocks: true,
};


================================================
FILE: quickwit/quickwit-ui/mocks/monacoMock.js
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

// Mock MonocoEditor as the current jest setup does not work when Monaco JS files
// are loaded.
export const Editor = (props) => {
  return <div>{props.value}</div>;
};


================================================
FILE: quickwit/quickwit-ui/mocks/swaggerUIMock.js
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

// Mock SwaggerUI as the current jest setup does not work when Monaco JS files
// are loaded.
export default function SwaggerUI(props) {
  return <div>{props.url}</div>;
}


================================================
FILE: quickwit/quickwit-ui/mocks/x-charts.js
================================================
export const LineChart = ({ children }) => children;


================================================
FILE: quickwit/quickwit-ui/package.json
================================================
{
  "name": "quickwit-ui",
  "version": "0.8.0",
  "license": "Apache-2.0",
  "private": true,
  "packageManager": "yarn@1.22.22",
  "dependencies": {
    "@babel/core": "7.29.0",
    "@babel/runtime": "7.28.6",
    "@biomejs/biome": "2.4.4",
    "@dr.pogodin/babel-plugin-transform-assets": "1.2.6",
    "@emotion/react": "11.14.0",
    "@emotion/styled": "11.14.1",
    "@monaco-editor/react": "4.7.0",
    "@mui/icons-material": "7.3.8",
    "@mui/lab": "7.0.1-beta.22",
    "@mui/material": "7.3.8",
    "@mui/system": "7.3.8",
    "@mui/x-charts": "8.27.0",
    "@mui/x-date-pickers": "8.27.2",
    "@testing-library/dom": "10.4.1",
    "@testing-library/jest-dom": "6.9.1",
    "@testing-library/react": "16.3.2",
    "@testing-library/user-event": "14.6.1",
    "@types/jest": "30.0.0",
    "@types/node": "24.10.9",
    "@types/react": "19.2.14",
    "@types/react-dom": "19.2.3",
    "@types/swagger-ui-react": "5.18.0",
    "babel-jest": "30.2.0",
    "babel-preset-react-app": "10.1.0",
    "dayjs": "1.11.19",
    "jest": "30.2.0",
    "jest-environment-jsdom": "30.2.0",
    "monaco-editor": "0.55.1",
    "react": "19.2.4",
    "react-app-polyfill": "3.0.0",
    "react-dom": "19.2.4",
    "react-number-format": "5.4.4",
    "react-router": "7.13.1",
    "styled-components": "6.1.19",
    "styled-icons": "10.47.1",
    "swagger-ui-react": "5.32.0",
    "typescript": "5.9.3",
    "vite": "7.3.1"
  },
  "resolutions": {
    "@types/react": "19.2.14",
    "@types/react-dom": "19.2.3",
    "dompurify": "3.3.1",
    "glob": "11.1.0"
  },
  "scripts": {
    "start": "vite",
    "build": "vite build --outDir build",
    "test": "jest",
    "postbuild": "cp .gitignore_for_build_directory build/.gitignore",
    "lint": "biome check",
    "format": "biome check --write",
    "type": "tsc",
    "e2e-test": "playwright test"
  },
  "devDependencies": {
    "@playwright/test": "^1.58.2"
  }
}


================================================
FILE: quickwit/quickwit-ui/playwright.config.ts
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

import { defineConfig } from "@playwright/test";

export default defineConfig({
  testDir: "./e2e",
  use: {
    baseURL: "http://127.0.0.1:7280/ui",
    browserName: "chromium",
    video: "off",
    screenshot: "off",
  },
});


================================================
FILE: quickwit/quickwit-ui/public/manifest.json
================================================
{
  "short_name": "Quickwit UI",
  "name": "Quickwit UI: Search and manage your indexes.",
  "icons": [
    {
      "src": "favicon.ico",
      "sizes": "32x32 16x16",
      "type": "image/x-icon"
    },
    {
      "src": "android-chrome-192x192.png",
      "sizes": "192x192",
      "type": "image/png"
    },
    {
      "src": "android-chrome-512x512.png",
      "sizes": "512x512",
      "type": "image/png"
    }
  ],
  "start_url": ".",
  "display": "standalone",
  "theme_color": "#000000",
  "background_color": "#ffffff"
}


================================================
FILE: quickwit/quickwit-ui/public/robots.txt
================================================
# https://www.robotstxt.org/robotstxt.html
User-agent: *
Disallow:


================================================
FILE: quickwit/quickwit-ui/src/components/ApiUrlFooter.tsx
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

import ContentCopyIcon from "@mui/icons-material/ContentCopy";
import { Box, Button, styled, Typography } from "@mui/material";
import { QUICKWIT_LIGHT_GREY } from "../utils/theme";

const Footer = styled(Box)`
  display: flex;
  height: 25px;
  padding: 0px 5px;
  position: absolute;
  bottom: 0px;
  font-size: 0.9em;
  background-color: ${QUICKWIT_LIGHT_GREY};
  opacity: 0.7;
`;

export default function ApiUrlFooter(url: string) {
  const urlMaxLength = 80;
  const origin =
    // @ts-ignore
    process.env.NODE_ENV === "development"
      ? "http://localhost:7280"
      : window.location.origin;
  const completeUrl = `${origin}/${url}`;
  const isTooLong = completeUrl.length > urlMaxLength;
  // TODO show generated aggregation
  return (
    <Footer>
      <Typography sx={{ padding: "4px 5px", fontSize: "0.95em" }}>
        API URL:
      </Typography>
      <Button
        sx={{
          fontSize: "0.93em",
          textTransform: "inherit",
          whiteSpace: "nowrap",
          overflow: "hidden",
          textOverflow: "clip",
        }}
        onClick={() => {
          if (window.isSecureContext) {
            navigator.clipboard.writeText(completeUrl);
          } else {
            window.open(completeUrl, "_blank");
          }
        }}
        endIcon={<ContentCopyIcon />}
        size="small"
      >
        {completeUrl.substring(0, urlMaxLength)}
        {isTooLong && "..."}
      </Button>
    </Footer>
  );
}


================================================
FILE: quickwit/quickwit-ui/src/components/IndexSideBar.tsx
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

import styled from "@emotion/styled";
import { ChevronRight, KeyboardArrowDown } from "@mui/icons-material";
import {
  Autocomplete,
  Box,
  Chip,
  CircularProgress,
  IconButton,
  List,
  ListItem,
  ListItemText,
  TextField,
  Typography,
} from "@mui/material";
import Tooltip from "@mui/material/Tooltip";
import React, { useEffect, useMemo, useState } from "react";
import { Client } from "../services/client";
import { FieldMapping, getAllFields, IndexMetadata } from "../utils/models";

const IndexBarWrapper = styled("div")({
  display: "flex",
  height: "100%",
  flex: "0 0 260px",
  maxWidth: "260px",
  flexDirection: "column",
  borderRight: "1px solid rgba(0, 0, 0, 0.12)",
  overflow: "auto",
});

function IndexAutocomplete(props: IndexMetadataProps) {
  const [open, setOpen] = React.useState(false);
  const [options, setOptions] = React.useState<readonly IndexMetadata[]>([]);
  const [value, setValue] = React.useState<IndexMetadata | null>(null);
  const [loading, setLoading] = React.useState(false);
  // We want to show the circular progress only if we are loading some results and
  // when there is no option available.
  const showLoading = loading && options.length === 0;
  const quickwitClient = useMemo(() => new Client(), []);

  useEffect(() => {
    if (loading) {
      return;
    }
    setLoading(true);
    quickwitClient.listIndexes().then(
      (indexesMetadata) => {
        setOptions([...indexesMetadata]);
        setLoading(false);
      },
      (error) => {
        console.log("Index autocomplete error", error);
        setLoading(false);
      },
    );
  }, [quickwitClient, open]);

  useEffect(() => {
    if (!open) {
      if (props.indexMetadata !== null && options.length === 0) {
        setOptions([props.indexMetadata]);
      }
    }
  }, [open, props.indexMetadata, options.length]);

  useEffect(() => {
    setValue(props.indexMetadata);
  }, [props.indexMetadata]);

  return (
    <Autocomplete
      size="small"
      sx={{ width: 210 }}
      open={open}
      value={value}
      onChange={(_, updatedValue) => {
        setValue(updatedValue);

        if (
          updatedValue == null ||
          updatedValue.index_config.index_id == null
        ) {
          props.onIndexMetadataUpdate(null);
        } else {
          props.onIndexMetadataUpdate(updatedValue);
        }
      }}
      onOpen={() => {
        setOpen(true);
      }}
      onClose={() => {
        setOpen(false);
        setLoading(false);
      }}
      isOptionEqualToValue={(option, value) =>
        option.index_config.index_id === value.index_config.index_id
      }
      getOptionLabel={(option) => option.index_config.index_id}
      options={options}
      noOptionsText="No indexes."
      loading={loading}
      renderInput={(params) => (
        <TextField
          {...params}
          placeholder="Select an index"
          InputProps={{
            ...params.InputProps,
            endAdornment: (
              <React.Fragment>
                {showLoading ? (
                  <CircularProgress color="inherit" size={20} />
                ) : null}
                {params.InputProps.endAdornment}
              </React.Fragment>
            ),
          }}
        />
      )}
    />
  );
}

export interface IndexMetadataProps {
  indexMetadata: null | IndexMetadata;
  onIndexMetadataUpdate(indexMetadata: IndexMetadata | null): void;
}

function fieldTypeLabel(fieldMapping: FieldMapping): string {
  if (fieldMapping.type[0] !== undefined) {
    return fieldMapping.type[0].toUpperCase();
  } else {
    return "";
  }
}

export function IndexSideBar(props: IndexMetadataProps) {
  const [open, setOpen] = useState(true);
  const fields =
    props.indexMetadata === null
      ? []
      : getAllFields(
          props.indexMetadata.index_config.doc_mapping.field_mappings,
        );
  return (
    <IndexBarWrapper>
      <Box sx={{ px: 3, py: 2 }}>
        <Typography variant="body1" mb={1}>
          Index ID
        </Typography>
        <IndexAutocomplete {...props} />
      </Box>
      <Box sx={{ paddingLeft: "10px", height: "100%" }}>
        <IconButton
          aria-label="expand row"
          size="small"
          onClick={() => setOpen(!open)}
        >
          {open ? <KeyboardArrowDown /> : <ChevronRight />}
        </IconButton>
        Fields
        {open && (
          <List
            dense={true}
            sx={{ paddingTop: "0", overflowWrap: "break-word" }}
          >
            {fields.map(function (field) {
              return (
                <ListItem
                  key={field.json_path}
                  secondaryAction={
                    <IconButton edge="end" aria-label="add"></IconButton>
                  }
                  sx={{ paddingLeft: "10px" }}
                >
                  <Tooltip
                    title={field.field_mapping.type}
                    arrow
                    placement="left"
                  >
                    <Chip
                      label={fieldTypeLabel(field.field_mapping)}
                      size="small"
                      sx={{
                        marginRight: "10px",
                        borderRadius: "3px",
                        fontSize: "0.6rem",
                      }}
                    />
                  </Tooltip>
                  <ListItemText primary={field.json_path} />
                </ListItem>
              );
            })}
          </List>
        )}
      </Box>
    </IndexBarWrapper>
  );
}


================================================
FILE: quickwit/quickwit-ui/src/components/IndexSummary.tsx
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

import styled from "@emotion/styled";
import { Alert, Paper } from "@mui/material";
import dayjs from "dayjs";
import utc from "dayjs/plugin/utc";
import { FC, ReactNode } from "react";
import { NumericFormat } from "react-number-format";
import { Index } from "../utils/models";

dayjs.extend(utc);

const ItemContainer = styled.div`
  padding: 10px;
  display: flex;
  flex-direction: column;
`;
const Row = styled.div`
  padding: 5px;
  display: flex;
  flex-direction: row;
  &:nth-of-type(odd) {
    background: rgba(0, 0, 0, 0.05);
  }
`;
const RowKey = styled.div`
  width: 350px;
`;
const IndexRow: FC<{ title: string; children: ReactNode }> = ({
  title,
  children,
}) => (
  <Row>
    <RowKey>{title}</RowKey>
    <div>{children}</div>
  </Row>
);

export function IndexSummary({ index }: { index: Index }) {
  const all_splits = index.splits;
  const published_splits = all_splits.filter(
    (split) => split.split_state === "Published",
  );
  const num_of_staged_splits = all_splits.filter(
    (split) => split.split_state === "Staged",
  ).length;
  const num_of_marked_for_delete_splits = all_splits.filter(
    (split) => split.split_state === "MarkedForDeletion",
  ).length;
  const total_num_docs = published_splits
    .map((split) => split.num_docs)
    .reduce((sum, current) => sum + current, 0);
  const total_num_bytes = published_splits
    .map((split) => {
      return split.footer_offsets.end;
    })
    .reduce((sum, current) => sum + current, 0);
  const total_uncompressed_num_bytes = published_splits
    .map((split) => {
      return split.uncompressed_docs_size_in_bytes;
    })
    .reduce((sum, current) => sum + current, 0);
  return (
    <Paper variant="outlined">
      <ItemContainer>
        {index.split_limit_reached && (
          <Alert severity="warning" sx={{ mb: 2 }}>
            Split limit reached. Only the first 10,000 splits were retrieved.
            The actual total may be higher. Statistics shown are incomplete.
          </Alert>
        )}
        <IndexRow title="Created at:">
          {dayjs
            .unix(index.metadata.create_timestamp)
            .utc()
            .format("YYYY/MM/DD HH:mm")}
        </IndexRow>
        <IndexRow title="URI:">
          {index.metadata.index_config.index_uri}
        </IndexRow>
        <IndexRow title="Number of published documents:">
          <NumericFormat
            value={total_num_docs}
            displayType={"text"}
            thousandSeparator={true}
          />
        </IndexRow>
        <IndexRow title="Size of published documents (uncompressed):">
          <NumericFormat
            value={total_uncompressed_num_bytes / 1000000}
            displayType={"text"}
            thousandSeparator={true}
            suffix=" MB"
            decimalScale={2}
          />
        </IndexRow>
        <IndexRow title="Number of published splits:">
          {published_splits.length}
        </IndexRow>
        <IndexRow title="Size of published splits:">
          <NumericFormat
            value={total_num_bytes / 1000000}
            displayType={"text"}
            thousandSeparator={true}
            suffix=" MB"
            decimalScale={2}
          />
        </IndexRow>
        <IndexRow title="Number of staged splits:">
          {num_of_staged_splits}
        </IndexRow>
        <IndexRow title="Number of splits marked for deletion:">
          {num_of_marked_for_delete_splits}
        </IndexRow>
      </ItemContainer>
    </Paper>
  );
}


================================================
FILE: quickwit/quickwit-ui/src/components/IndexesTable.tsx
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

import {
  Paper,
  Table,
  TableBody,
  TableCell,
  TableContainer,
  TableHead,
  TableRow,
} from "@mui/material";
import dayjs from "dayjs";
import utc from "dayjs/plugin/utc";
import { useNavigate } from "react-router";
import { IndexMetadata } from "../utils/models";

dayjs.extend(utc);

const IndexesTable = ({
  indexesMetadata,
}: Readonly<{ indexesMetadata: IndexMetadata[] }>) => {
  const navigate = useNavigate();
  const handleClick = (indexId: string) => {
    navigate(`/indexes/${indexId}`);
  };

  return (
    <TableContainer component={Paper}>
      <Table sx={{ minWidth: 650 }} aria-label="Indexes">
        <TableHead>
          <TableRow>
            <TableCell align="left">ID</TableCell>
            <TableCell align="left">URI</TableCell>
            <TableCell align="left">Created on</TableCell>
            <TableCell align="left">Sources</TableCell>
          </TableRow>
        </TableHead>
        <TableBody>
          {indexesMetadata.map((indexMetadata) => (
            <TableRow
              key={indexMetadata.index_config.index_id}
              sx={{
                "&:last-child td, &:last-child th": { border: 0 },
                cursor: "pointer",
              }}
              hover={true}
              onClick={() => handleClick(indexMetadata.index_config.index_id)}
            >
              <TableCell component="th" scope="row">
                {indexMetadata.index_config.index_id}
              </TableCell>
              <TableCell align="left">
                {indexMetadata.index_config.index_uri}
              </TableCell>
              <TableCell align="left">
                {dayjs
                  .unix(indexMetadata.create_timestamp)
                  .utc()
                  .format("YYYY/MM/DD HH:mm")}
              </TableCell>
              <TableCell align="left">
                {indexMetadata.sources?.length || "None"}
              </TableCell>
            </TableRow>
          ))}
        </TableBody>
      </Table>
    </TableContainer>
  );
};

export default IndexesTable;


================================================
FILE: quickwit/quickwit-ui/src/components/JsonEditor.tsx
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

import { BeforeMount, Editor, OnMount } from "@monaco-editor/react";
import { useCallback } from "react";
import { EDITOR_THEME } from "../utils/theme";

export function JsonEditor({
  content,
  resizeOnMount,
}: {
  content: unknown;
  resizeOnMount: boolean;
}) {
  // Setting editor height based on lines height and count to stretch and fit its content.
  const onMount: OnMount = useCallback(
    (editor) => {
      if (!resizeOnMount) {
        return;
      }
      const editorElement = editor.getDomNode();

      if (!editorElement) {
        return;
      }

      // Weirdly enough, we have to wait a few ms to get the right height
      // from `editor.getContentHeight()`. If not, we sometimes end up with
      // a height > 7000px... and I don't know why.
      setTimeout(() => {
        const height = Math.min(800, editor.getContentHeight());
        editorElement.style.height = `${height}px`;
        editor.layout();
      }, 10);
    },
    [resizeOnMount],
  );

  const beforeMount: BeforeMount = (monaco) => {
    monaco.editor.defineTheme("quickwit-light", EDITOR_THEME);
  };

  return (
    <Editor
      language="json"
      value={JSON.stringify(content, null, 2)}
      beforeMount={beforeMount}
      onMount={onMount}
      options={{
        readOnly: true,
        fontFamily: "monospace",
        overviewRulerBorder: false,
        overviewRulerLanes: 0,
        minimap: {
          enabled: false,
        },
        scrollbar: {
          alwaysConsumeMouseWheel: false,
        },
        renderLineHighlight: "gutter",
        fontSize: 12,
        fixedOverflowWidgets: true,
        scrollBeyondLastLine: false,
        automaticLayout: true,
        wordWrap: "on",
        wrappingIndent: "deepIndent",
      }}
      theme="quickwit-light"
    />
  );
}


================================================
FILE: quickwit/quickwit-ui/src/components/LayoutUtils.tsx
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

import { Box, Breadcrumbs, styled } from "@mui/material";

export const APP_BAR_HEIGHT_PX = "48px";
export const ViewUnderAppBarBox = styled(Box)`
display: flex;
flex-direction: column;
margin-top: ${APP_BAR_HEIGHT_PX};
height: calc(100% - ${APP_BAR_HEIGHT_PX});
width: 100%;
`;
export const FullBoxContainer = styled(Box)`
display: flex;
flex-direction: column;
height: 100%;
width: 100%;
padding: 16px 24px;
`;
export const QBreadcrumbs = styled(Breadcrumbs)`
padding-bottom: 8px;
`;


================================================
FILE: quickwit/quickwit-ui/src/components/Loader.tsx
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

import { Box, keyframes, styled } from "@mui/material";
import loadinIcongUrl from "../assets/img/quickwit-logo-monochrome.svg";

const spin = keyframes`
from {
  transform: rotate(0deg);
}
to {
  transform: rotate(360deg);
}
`;

const LoadingIcon = (props: React.ComponentProps<"img">) => (
  <img {...props} src={loadinIcongUrl} alt="loading icon" />
);

const SpinningLoadingIcon = styled(LoadingIcon)`
  height: 10vmin;
  pointer-events: none;
  fill: #cbd1dd;
  animation: ${spin} infinite 5s linear;
`;

export default function Loader() {
  return (
    <Box
      display="flex"
      justifyContent="center"
      alignItems="center"
      minHeight="40vh"
    >
      <SpinningLoadingIcon></SpinningLoadingIcon>
    </Box>
  );
}


================================================
FILE: quickwit/quickwit-ui/src/components/QueryActionBar.tsx
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

import PlayArrowIcon from "@mui/icons-material/PlayArrow";
import { Box, Button, Tab, Tabs } from "@mui/material";
import { SearchComponentProps } from "../utils/SearchComponentProps";
import { TimeRangeSelect } from "./TimeRangeSelect";

export function QueryEditorActionBar(props: SearchComponentProps) {
  const timestamp_field_name =
    props.index?.metadata.index_config.doc_mapping.timestamp_field;
  const shouldDisplayTimeRangeSelect = timestamp_field_name ?? false;

  const handleChange = (_event: React.SyntheticEvent, newTab: number) => {
    const updatedSearchRequest = {
      ...props.searchRequest,
      aggregation: newTab !== 0,
    };
    props.onSearchRequestUpdate(updatedSearchRequest);
    props.runSearch(updatedSearchRequest);
  };

  return (
    <Box sx={{ display: "flex" }}>
      <Box sx={{ flexGrow: 0, padding: "10px" }}>
        <Button
          onClick={() => props.runSearch(props.searchRequest)}
          variant="contained"
          startIcon={<PlayArrowIcon />}
          disableElevation
          sx={{ flexGrow: 1 }}
          disabled={props.queryRunning || !props.searchRequest.indexId}
        >
          Run
        </Button>
      </Box>
      <Box sx={{ flexGrow: 0 }}>
        <Box sx={{ borderBottom: 1, borderColor: "divider", flexGrow: 1 }}>
          <Tabs
            value={Number(props.searchRequest.aggregation)}
            onChange={handleChange}
          >
            <Tab label="Search" />
            <Tab label="Aggregation" />
          </Tabs>
        </Box>
      </Box>
      <Box sx={{ flexGrow: 1 }}></Box>
      {shouldDisplayTimeRangeSelect && (
        <TimeRangeSelect
          timeRange={{
            startTimestamp: props.searchRequest.startTimestamp,
            endTimestamp: props.searchRequest.endTimestamp,
          }}
          onUpdate={(timeRange) => {
            props.runSearch({ ...props.searchRequest, ...timeRange });
          }}
          disabled={props.queryRunning || !props.searchRequest.indexId}
        />
      )}
    </Box>
  );
}


================================================
FILE: quickwit/quickwit-ui/src/components/QueryEditor/AggregationEditor.tsx
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

import { Box } from "@mui/material";
import FormControl from "@mui/material/FormControl";
import MenuItem from "@mui/material/MenuItem";
import Select, { SelectChangeEvent } from "@mui/material/Select";
import TextField from "@mui/material/TextField";
import { useEffect, useRef, useState } from "react";
import { HistogramAgg, TermAgg } from "../../utils/models";
import { SearchComponentProps } from "../../utils/SearchComponentProps";

export function AggregationEditor(props: SearchComponentProps) {
  return (
    <Box hidden={!props.searchRequest.aggregation}>
      <MetricKind
        searchRequest={props.searchRequest}
        onSearchRequestUpdate={props.onSearchRequestUpdate}
        runSearch={props.runSearch}
        index={props.index}
        queryRunning={props.queryRunning}
      />
      <AggregationKind
        searchRequest={props.searchRequest}
        onSearchRequestUpdate={props.onSearchRequestUpdate}
        runSearch={props.runSearch}
        index={props.index}
        queryRunning={props.queryRunning}
      />
    </Box>
  );
}

export function MetricKind(props: SearchComponentProps) {
  // TODO add percentiles
  const metricRef = useRef(props.searchRequest.aggregationConfig.metric);

  const handleTypeChange = (event: SelectChangeEvent) => {
    const value = event.target.value;
    const updatedMetric =
      value !== "count" ? { ...metricRef.current!, type: value } : null;
    const updatedAggregation = {
      ...props.searchRequest.aggregationConfig,
      metric: updatedMetric,
    };
    const updatedSearchRequest = {
      ...props.searchRequest,
      aggregationConfig: updatedAggregation,
    };
    props.onSearchRequestUpdate(updatedSearchRequest);
    metricRef.current = updatedMetric;
  };

  const handleNameChange = (event: React.ChangeEvent<HTMLInputElement>) => {
    const value = event.target.value;
    if (metricRef.current == null) {
      return;
    }
    const updatedMetric = { ...metricRef.current!, field: value };
    const updatedAggregation = {
      ...props.searchRequest.aggregationConfig,
      metric: updatedMetric,
    };
    const updatedSearchRequest = {
      ...props.searchRequest,
      aggregationConfig: updatedAggregation,
    };
    props.onSearchRequestUpdate(updatedSearchRequest);
    metricRef.current = updatedMetric;
  };

  return (
    <Box sx={{ m: 1, minWidth: 120, display: "flex", flexDirection: "row" }}>
      <FormControl variant="standard">
        <Select
          value={metricRef.current ? metricRef.current.type : "count"}
          onChange={handleTypeChange}
          sx={{ minHeight: "44px" }}
        >
          <MenuItem value="count">Count</MenuItem>
          <MenuItem value="avg">Average</MenuItem>
          <MenuItem value="sum">Sum</MenuItem>
          <MenuItem value="max">Max</MenuItem>
          <MenuItem value="min">Min</MenuItem>
        </Select>
      </FormControl>
      <FormControl variant="standard">
        <TextField
          variant="standard"
          label="Field"
          onChange={handleNameChange}
          sx={{
            marginLeft: "10px",
            ...(!metricRef.current && { display: "none" }),
          }}
        />
      </FormControl>
    </Box>
  );
}

export function AggregationKind(props: SearchComponentProps) {
  const defaultAgg = {
    histogram: {
      interval: "1d",
    },
  };
  const [aggregations, setAggregations] = useState<
    ({ term: TermAgg } | { histogram: HistogramAgg })[]
  >([defaultAgg]);

  useEffect(() => {
    // do the initial filling of parameters
    const aggregationConfig = props.searchRequest.aggregationConfig;
    if (
      aggregationConfig.histogram === null &&
      aggregationConfig.term === null
    ) {
      const initialAggregation = Object.assign({}, ...aggregations);
      const initialSearchRequest = {
        ...props.searchRequest,
        aggregationConfig: initialAggregation,
      };
      props.onSearchRequestUpdate(initialSearchRequest);
    }
  }, []); // Empty dependency array means this runs once after mount

  useEffect(() => {
    // Update search request whenever aggregations change
    const metric = props.searchRequest.aggregationConfig.metric;
    const updatedAggregation = Object.assign(
      {},
      { metric: metric },
      ...aggregations,
    );
    const updatedSearchRequest = {
      ...props.searchRequest,
      aggregationConfig: updatedAggregation,
    };
    props.onSearchRequestUpdate(updatedSearchRequest);
  }, [aggregations]);

  const handleAggregationChange = (pos: number, event: SelectChangeEvent) => {
    const value = event.target.value;
    setAggregations((agg) => {
      const newAggregations = [...agg];
      switch (value) {
        case "histogram": {
          newAggregations[pos] = {
            histogram: {
              interval: "1d",
            },
          };
          break;
        }
        case "term": {
          newAggregations[pos] = {
            term: {
              field: "",
              size: 10,
            },
          };
          break;
        }
        case "rm": {
          newAggregations.splice(pos, 1);
        }
      }
      return newAggregations;
    });
  };

  const handleHistogramChange = (pos: number, event: SelectChangeEvent) => {
    const value = event.target.value;
    setAggregations((agg) => {
      const newAggregations = [...agg];
      newAggregations[pos] = { histogram: { interval: value } };
      return newAggregations;
    });
  };

  const handleTermFieldChange = (
    pos: number,
    event: React.ChangeEvent<HTMLInputElement | HTMLTextAreaElement>,
  ) => {
    const value = event.target.value;
    setAggregations((agg) => {
      const newAggregations = [...agg];
      const term = newAggregations[pos];
      if (isTerm(term)) {
        term.term.field = value;
      }
      return newAggregations;
    });
  };

  const handleTermCountChange = (
    pos: number,
    event: React.ChangeEvent<HTMLInputElement | HTMLTextAreaElement>,
  ) => {
    const value = event.target.value;
    setAggregations((agg) => {
      const newAggregations = [...agg];
      const term = newAggregations[pos];
      if (isTerm(term)) {
        term.term.size = Number(value);
      }
      return newAggregations;
    });
  };

  function isHistogram(
    agg: { term: TermAgg } | { histogram: HistogramAgg } | undefined,
  ): agg is { histogram: HistogramAgg } {
    if (!agg) return false;
    return "histogram" in agg;
  }

  function isTerm(
    agg: { term: TermAgg } | { histogram: HistogramAgg } | undefined,
  ): agg is { term: TermAgg } {
    if (!agg) return false;
    return "term" in agg;
  }

  const getAggregationKind = (
    agg: { term: TermAgg } | { histogram: HistogramAgg } | undefined,
  ) => {
    if (isHistogram(agg)) {
      return "histogram";
    }
    if (isTerm(agg)) {
      return "term";
    }
    return "new";
  };

  const makeOptions = (
    pos: number,
    agg: ({ term: TermAgg } | { histogram: HistogramAgg })[],
  ) => {
    const options = [];
    if (pos >= agg.length) {
      options.push(
        <MenuItem value="new" key="new">
          Add aggregation
        </MenuItem>,
      );
    }
    let addHistogram = true;
    let addTerm = true;
    for (let i = 0; i < agg.length; i++) {
      if (i === pos) continue;
      if (getAggregationKind(agg[i]) === "histogram") addHistogram = false;
      if (getAggregationKind(agg[i]) === "term") addTerm = false;
    }
    if (addHistogram) {
      options.push(
        <MenuItem value="histogram" key="histogram">
          Histogram aggregation
        </MenuItem>,
      );
    }
    if (addTerm) {
      options.push(
        <MenuItem value="term" key="term">
          Term aggregation
        </MenuItem>,
      );
    }
    if (agg.length > 1) {
      options.push(
        <MenuItem value="rm" key="rm">
          Remove aggregation
        </MenuItem>,
      );
    }
    return options;
  };

  const drawAdditional = (
    pos: number,
    aggs: ({ term: TermAgg } | { histogram: HistogramAgg })[],
  ) => {
    const agg = aggs[pos];
    if (isHistogram(agg)) {
      return (
        <FormControl variant="standard">
          <Select
            value={agg.histogram.interval}
            onChange={(e) => handleHistogramChange(pos, e)}
            sx={{ marginLeft: "10px", minHeight: "44px" }}
          >
            <MenuItem value="10s">10 seconds</MenuItem>
            <MenuItem value="1m">1 minute</MenuItem>
            <MenuItem value="5m">5 minutes</MenuItem>
            <MenuItem value="10m">10 minutes</MenuItem>
            <MenuItem value="1h">1 hour</MenuItem>
            <MenuItem value="1d">1 day</MenuItem>
          </Select>
        </FormControl>
      );
    }
    if (isTerm(agg)) {
      return (
        <>
          <FormControl variant="standard">
            <TextField
              variant="standard"
              label="Field"
              onChange={(e) => handleTermFieldChange(pos, e)}
              sx={{ marginLeft: "10px" }}
            />
          </FormControl>
          <FormControl variant="standard">
            <TextField
              variant="standard"
              label="Return top"
              type="number"
              onChange={(e) => handleTermCountChange(pos, e)}
              value={agg.term.size}
              sx={{ marginLeft: "10px" }}
            />
          </FormControl>
        </>
      );
    }
    return null;
  };

  return (
    <>
      <Box sx={{ m: 1, minWidth: 120, display: "flex", flexDirection: "row" }}>
        <FormControl variant="standard">
          <Select
            value={getAggregationKind(aggregations[0])}
            onChange={(e) => handleAggregationChange(0, e)}
            sx={{ minHeight: "44px", width: "190px" }}
          >
            {makeOptions(0, aggregations)}
          </Select>
        </FormControl>
        {drawAdditional(0, aggregations)}
      </Box>
      <Box sx={{ m: 1, minWidth: 120, display: "flex", flexDirection: "row" }}>
        <FormControl
          variant="standard"
          sx={{ m: 1, minWidth: 120, display: "flex", flexDirection: "row" }}
        >
          <Select
            value={getAggregationKind(aggregations[1])}
            onChange={(e) => handleAggregationChange(1, e)}
            sx={{ minHeight: "44px", width: "190px" }}
          >
            {makeOptions(1, aggregations)}
          </Select>
          {drawAdditional(1, aggregations)}
        </FormControl>
      </Box>
    </>
  );
}


================================================
FILE: quickwit/quickwit-ui/src/components/QueryEditor/QueryEditor.tsx
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

import { Editor } from "@monaco-editor/react";
import { Box } from "@mui/material";
import * as monacoEditor from "monaco-editor/esm/vs/editor/editor.api";
import React, { useEffect, useRef, useState } from "react";
import { SearchComponentProps } from "../../utils/SearchComponentProps";
import { EDITOR_THEME } from "../../utils/theme";
import {
  createIndexCompletionProvider,
  LANGUAGE_CONFIG,
  LanguageFeatures,
} from "./config";

const QUICKWIT_EDITOR_THEME_ID = "quickwit-light";

function getLanguageId(indexId: string | null): string {
  if (indexId === null) {
    return "";
  }
  return `${indexId}-query-language`;
}

export function QueryEditor(props: SearchComponentProps) {
  const monacoRef = useRef<null | typeof monacoEditor>(null);
  const [languageId, setLanguageId] = useState<string>("");
  const runSearchRef = useRef(props.runSearch);
  const searchRequestRef = useRef(props.searchRequest);
  const defaultValue =
    props.searchRequest.query === null
      ? `// Select an index and type your query. Example: field_name:"phrase query"`
      : props.searchRequest.query;
  let resize: () => void;

  function handleEditorDidMount(editor: any, monaco: any) {
    monacoRef.current = monaco;
    editor.addAction({
      id: "SEARCH",
      label: "Run search",
      keybindings: [
        monaco.KeyCode.F9,
        monaco.KeyMod.CtrlCmd | monaco.KeyCode.Enter,
      ],
      run: () => {
        runSearchRef.current(searchRequestRef.current);
      },
    });
    resize = () => {
      editor.layout({
        width: Math.max(window.innerWidth - (260 + 180 + 2 * 24), 200),
        height: 84,
      });
    };
    window.addEventListener("resize", resize);
  }

  React.useEffect(() => {
    return () => window.removeEventListener("resize", resize);
  });

  useEffect(() => {
    const updatedLanguageId = getLanguageId(props.searchRequest.indexId);
    if (
      monacoRef.current !== null &&
      updatedLanguageId !== "" &&
      props.index !== null
    ) {
      const monaco = monacoRef.current;
      if (
        !monaco.languages
          .getLanguages()
          .some(({ id }: { id: string }) => id === updatedLanguageId)
      ) {
        console.log("register language", updatedLanguageId);
        monaco.languages.register({ id: updatedLanguageId });
        monaco.languages.setMonarchTokensProvider(
          updatedLanguageId,
          LanguageFeatures(),
        );
        if (props.index != null) {
          monaco.languages.registerCompletionItemProvider(
            updatedLanguageId,
            createIndexCompletionProvider(props.index.metadata),
          );
          monaco.languages.setLanguageConfiguration(
            updatedLanguageId,
            LANGUAGE_CONFIG,
          );
        }
      }
      setLanguageId(updatedLanguageId);
    }
  }, [monacoRef, props.index]);

  useEffect(() => {
    if (monacoRef.current !== null) {
      runSearchRef.current = props.runSearch;
    }
  }, [monacoRef, props.runSearch]);

  function handleEditorChange(value: any) {
    const updatedSearchRequest = Object.assign({}, props.searchRequest, {
      query: value,
    });
    searchRequestRef.current = updatedSearchRequest;
    props.onSearchRequestUpdate(updatedSearchRequest);
  }

  function handleEditorWillMount(monaco: any) {
    monaco.editor.defineTheme(QUICKWIT_EDITOR_THEME_ID, EDITOR_THEME);
  }

  return (
    <Box sx={{ height: "100px", py: 1 }}>
      <Editor
        beforeMount={handleEditorWillMount}
        onMount={handleEditorDidMount}
        onChange={handleEditorChange}
        language={languageId}
        value={defaultValue}
        options={{
          fontFamily: "monospace",
          minimap: {
            enabled: false,
          },
          renderLineHighlight: "gutter",
          fontSize: 14,
          fixedOverflowWidgets: true,
          scrollBeyondLastLine: false,
        }}
        theme={QUICKWIT_EDITOR_THEME_ID}
      />
    </Box>
  );
}


================================================
FILE: quickwit/quickwit-ui/src/components/QueryEditor/config.ts
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

import { getAllFields, IndexMetadata } from "../../utils/models";

export enum CompletionItemKind {
  Field = 3,
  Operator = 11,
}

const BRACES: [string, string] = ["{", "}"];
const BRACKETS: [string, string] = ["[", "]"];
const PARENTHESES: [string, string] = ["(", ")"];

export const LANGUAGE_CONFIG = {
  comments: {
    lineComment: "//",
  },
  brackets: [BRACES, BRACKETS, PARENTHESES],
  autoClosingPairs: [
    { open: "{", close: "}" },
    { open: "[", close: "]" },
    { open: "(", close: ")" },
    { open: '"', close: '"' },
    { open: "'", close: "'" },
  ],
  surroundingPairs: [
    { open: "{", close: "}" },
    { open: "[", close: "]" },
    { open: "(", close: ")" },
    { open: '"', close: '"' },
    { open: "'", close: "'" },
  ],
};

// TODO: clean language features as I (fmassot) did not dig into it yet.
export function LanguageFeatures(): any {
  return {
    defaultToken: "invalid",
    //wordDefinition: /(-?\d*\.\d\w*)|([^\`\~\!\#\%\^\&\*\(\)\-\=\+\[\{\]\}\\\|\;\:\'\"\,\.\<\>\/\?\s]+)/g,
    operators: ["+", "-"],
    brackets: [{ open: "(", close: ")", token: "delimiter.parenthesis" }],
    keywords: ["AND", "OR"],
    symbols: /[=><!~?:&|+\-*/^%]+/,
    escapes:
      /\\(?:[abfnrtv\\"']|x[0-9A-Fa-f]{1,4}|u[0-9A-Fa-f]{4}|U[0-9A-Fa-f]{8})/,
    tokenizer: {
      root: [
        // identifiers and keywords
        [
          /[a-z_$][\w$]*/,
          {
            cases: {
              "@keywords": "keyword",
              "@default": "identifier",
            },
          },
        ],
        [/[A-Z][\w$]*/, "type.identifier"], // to show class names nicely

        // whitespace
        { include: "@whitespace" },

        // delimiters and operators
        [/[{}()[]]/, "@brackets"],
        [/[<>](?!@symbols)/, "@brackets"],
        [/@symbols/, { cases: { "@operators": "operator", "@default": "" } }],

        // @ annotations.
        // As an example, we emit a debugging log message on these tokens.
        // Note: message are suppressed during the first load -- change some lines to see them.
        [
          /@\s*[a-zA-Z_$][\w$]*/,
          { token: "annotation", log: "annotation token: $0" },
        ],

        // numbers
        [/\d*\.\d+([eE][-+]?\d+)?/, "number.float"],
        [/0[xX][0-9a-fA-F]+/, "number.hex"],
        [/\d+/, "number"],

        // delimiter: after number because of .\d floats
        [/[;,.]/, "delimiter"],

        // strings
        [/"([^"\\]|\\.)*$/, "string.invalid"], // non-terminated string
        [/"/, { token: "string.quote", bracket: "@open", next: "@string" }],

        // characters
        [/'[^\\']'/, "string"],
        [/(')(@escapes)(')/, ["string", "string.escape", "string"]],
        [/'/, "string.invalid"],
      ],
      comment: [
        [/[^/*]+/, "comment"],
        [/\/\*/, "comment", "@push"], // nested comment
        ["\\*/", "comment", "@pop"],
        [/[/*]/, "comment"],
      ],
      string: [
        [/[^\\"]+/, "string"],
        [/@escapes/, "string.escape"],
        [/\\./, "string.escape.invalid"],
        [/"/, { token: "string.quote", bracket: "@close", next: "@pop" }],
      ],

      whitespace: [
        [/[ \t\r\n]+/, "white"],
        [/\/\*/, "comment", "@comment"],
        [/\/\/.*$/, "comment"],
      ],
    },
  };
}

export const createIndexCompletionProvider = (indexMetadata: IndexMetadata) => {
  const fields = getAllFields(
    indexMetadata.index_config.doc_mapping.field_mappings,
  );
  const completionProvider = {
    provideCompletionItems(model: any, position: any) {
      const word = model.getWordUntilPosition(position);

      const range = {
        startLineNumber: position.lineNumber,
        endLineNumber: position.lineNumber,
        startColumn: word.startColumn,
        endColumn: word.endColumn,
      };

      // We want to auto complete all fields except timestamp that is handled with `TimeRangeSelect` component.
      const fieldSuggestions = fields
        .filter(
          (field) =>
            field.json_path !==
            indexMetadata.index_config.doc_mapping.timestamp_field,
        )
        .map((field) => {
          return {
            label: field.json_path,
            kind: CompletionItemKind.Field,
            insertText:
              field.field_mapping.type === "json"
                ? field.json_path + "."
                : field.json_path + ":",
            range: range,
          };
        });

      return {
        suggestions: fieldSuggestions.concat([
          {
            label: "OR",
            kind: CompletionItemKind.Operator,
            insertText: "OR ",
            range: range,
          },
          {
            label: "AND",
            kind: CompletionItemKind.Operator,
            insertText: "AND ",
            range: range,
          },
        ]),
      };
    },
  };

  return completionProvider;
};

export const setErrorMarker = (
  monaco: any,
  editor: any,
  startlineNumber: number,
  startColumnNumber: number,
  message: string,
) => {
  const model = editor.getModel();

  if (model) {
    monaco.editor.setModelMarkers(model, "QuestDBLanguageName", [
      {
        message,
        severity: monaco.MarkerSeverity.Error,
        startLineNumber: startlineNumber,
        endLineNumber: startlineNumber,
        startColumn: startColumnNumber,
        endColumn: startColumnNumber,
      },
    ]);
  }
};


================================================
FILE: quickwit/quickwit-ui/src/components/ResponseErrorDisplay.tsx
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

import SentimentVeryDissatisfiedIcon from "@mui/icons-material/SentimentVeryDissatisfied";
import { Box } from "@mui/material";
import { ResponseError } from "../utils/models";

function renderMessage(error: ResponseError) {
  if (
    error.message !== null &&
    error.message.includes("No search node available.")
  ) {
    return (
      <Box sx={{ fontSize: 16, pt: 2 }}>
        Your cluster does not contain any search node. You need at least one
        search node.
      </Box>
    );
  } else {
    return (
      <>
        <Box sx={{ fontSize: 16, pt: 2 }}>
          {error.status && <span>Status: {error.status}</span>}
        </Box>
        <Box sx={{ fontSize: 14, pt: 1, alignItems: "center" }}>
          Error: {error.message}
        </Box>
      </>
    );
  }
}

export default function ErrorResponseDisplay(error: ResponseError) {
  return (
    <Box
      sx={{
        pt: 2,
        display: "flex",
        flexDirection: "column",
        alignItems: "center",
      }}
    >
      <SentimentVeryDissatisfiedIcon sx={{ fontSize: 60 }} />
      {renderMessage(error)}
    </Box>
  );
}


================================================
FILE: quickwit/quickwit-ui/src/components/SearchResult/AggregationResult.tsx
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

import { BarChart } from "@mui/x-charts/BarChart";
import { LineChart } from "@mui/x-charts/LineChart";
import {
  extractAggregationResults,
  HistogramResult,
  ParsedAggregationResult,
  SearchResponse,
  TermResult,
} from "../../utils/models";

function isHistogram(agg: ParsedAggregationResult): agg is HistogramResult {
  return agg != null && "timestamps" in agg;
}

function isTerm(agg: ParsedAggregationResult): agg is TermResult {
  return Array.isArray(agg);
}

export function AggregationResult({
  searchResponse,
}: {
  searchResponse: SearchResponse;
}) {
  const result = extractAggregationResults(searchResponse.aggregations);
  if (isHistogram(result)) {
    const xAxis: React.ComponentProps<typeof LineChart>["xAxis"] = [
      {
        data: result.timestamps,
        valueFormatter: (date: number) => {
          return new Date(date).toISOString();
        },
      },
    ];
    const series: React.ComponentProps<typeof LineChart>["series"] =
      result.data.map((line) => {
        return {
          curve: "monotoneX",
          label: line.name,
          data: line.value,
        };
      });
    // we don't customize colors because we would need a full palette.
    return <LineChart xAxis={xAxis} series={series} yAxis={[{ min: 0 }]} />;
  } else if (isTerm(result)) {
    return (
      <BarChart
        series={[
          { data: result.map((entry) => entry.value), color: "#004BD9A5" },
        ]}
        xAxis={[{ data: result.map((entry) => entry.term), scaleType: "band" }]}
        margin={{ top: 10, bottom: 30, left: 40, right: 10 }}
      />
    );
  } else {
    return <p>no result to display</p>;
  }
}


================================================
FILE: quickwit/quickwit-ui/src/components/SearchResult/ResultTable.tsx
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

import { Box, styled, Table, TableBody, TableContainer } from "@mui/material";
import { Field, getAllFields, Index, SearchResponse } from "../../utils/models";
import { Row } from "./Row";

const TableBox = styled(Box)`
display: flex;
flex-direction: column;
overflow: auto;
flex: 1 1 100%;
height: 100%;
`;

export function ResultTable({
  searchResponse,
  index,
}: {
  searchResponse: SearchResponse;
  index: Index;
}) {
  const timestampField = getTimestampField(index);
  return (
    <TableBox>
      <TableContainer>
        <Table size="small">
          <TableBody>
            {searchResponse.hits.map((hit, idx) => (
              <Row key={idx} row={hit} timestampField={timestampField} />
            ))}
          </TableBody>
        </Table>
      </TableContainer>
    </TableBox>
  );
}

function getTimestampField(index: Index): Field | null {
  const fields = getAllFields(
    index.metadata.index_config.doc_mapping.field_mappings,
  );
  const timestamp_field_name =
    index.metadata.index_config.doc_mapping.timestamp_field;
  const timestamp_field = fields.filter(
    (field) => field.field_mapping.name === timestamp_field_name,
  )[0];
  return timestamp_field ?? null;
}


================================================
FILE: quickwit/quickwit-ui/src/components/SearchResult/Row.tsx
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

import { KeyboardArrowDown } from "@mui/icons-material";
import ChevronRight from "@mui/icons-material/ChevronRight";
import { Box, IconButton, styled, TableCell, TableRow } from "@mui/material";
import dayjs from "dayjs";
import relativeTime from "dayjs/plugin/relativeTime";
import utc from "dayjs/plugin/utc";
import React, { useState } from "react";
import {
  DATE_TIME_WITH_SECONDS_FORMAT as DATE_TIME_WITH_MILLISECONDS_FORMAT,
  DATE_TIME_WITH_SECONDS_FORMAT,
  Entry,
  Field,
  RawDoc,
} from "../../utils/models";
import { QUICKWIT_INTERMEDIATE_GREY } from "../../utils/theme";
import { JsonEditor } from "../JsonEditor";

dayjs.extend(relativeTime);
dayjs.extend(utc);

interface RowProps {
  timestampField: Field | null;
  row: RawDoc;
}

const EntryName = styled("dt")`
  display: inline;
  background-color: ${QUICKWIT_INTERMEDIATE_GREY};
  color: #343741;
  padding: 2px 1px 2px 4px;
  margin-right: 4px;
  word-break: normal;
  border-radius: 3px;
`;

const EntryValue = styled("dd")`
  display: inline;
  margin: 0;
  padding: 0;
  margin-inline-end: 5px;
`;

function EntryFormatter(entry: Entry) {
  // Some field can contains objects, stringify them to render them otherwise React will crash.
  const value =
    typeof entry.value === "object" ? JSON.stringify(entry.value) : entry.value;
  return (
    <>
      <EntryName>{entry.key}:</EntryName>
      <EntryValue>{value}</EntryValue>
    </>
  );
}

// Display the timestamp value if found in a `TableCell`.
function DisplayTimestampValue(row: RawDoc, timestampField: Field | null) {
  if (
    timestampField === null ||
    timestampField.field_mapping.output_format === null
  ) {
    return <></>;
  }
  let field_value = row;
  for (const path_segment of timestampField.path_segments) {
    field_value = field_value[path_segment];
  }
  if (!field_value) {
    return <></>;
  }
  return (
    <TableCell sx={{ verticalAlign: "top", padding: "4px" }}>
      <Box
        sx={{
          maxHeight: "115px",
          width: "90px",
          display: "inline-block",
          wordBreak: "break-word",
        }}
      >
        {formatDateTime(
          field_value,
          timestampField.field_mapping.output_format,
        )}
      </Box>
    </TableCell>
  );
}

function formatDateTime(field_value: any, timestampOutputFormat: string): any {
  // A unix timestamp can be in secs/millis/micros/nanos and need to be converted properly.
  if (
    timestampOutputFormat === "unix_timestamp_secs" &&
    typeof field_value === "number"
  ) {
    return dayjs(field_value * 1000)
      .utc()
      .format(DATE_TIME_WITH_SECONDS_FORMAT);
  } else if (
    timestampOutputFormat === "unix_timestamp_millis" &&
    typeof field_value === "number"
  ) {
    return dayjs(field_value).utc().format(DATE_TIME_WITH_MILLISECONDS_FORMAT);
  } else if (
    timestampOutputFormat === "unix_timestamp_micros" &&
    typeof field_value === "number"
  ) {
    return dayjs(field_value / 1000)
      .utc()
      .format(DATE_TIME_WITH_MILLISECONDS_FORMAT);
  } else if (
    timestampOutputFormat === "unix_timestamp_nanos" &&
    typeof field_value === "number"
  ) {
    return dayjs(field_value / 1000000)
      .utc()
      .format(DATE_TIME_WITH_MILLISECONDS_FORMAT);
  } else {
    // Other formats are string values and we can just display it as is.
    return field_value;
  }
}

const BreakWordBox = styled("dl")({
  verticalAlign: "top",
  display: "inline-block",
  color: "#464646",
  wordBreak: "break-all",
  wordWrap: "break-word",
  margin: 1,
  overflow: "hidden",
  lineHeight: "1.8em",
});

export function Row(props: RowProps) {
  const [open, setOpen] = useState(false);
  const entries: Entry[] = [];
  for (const [key, value] of Object.entries(props.row)) {
    entries.push({ key: key, value: value });
  }
  return (
    <>
      <TableRow>
        <TableCell
          sx={{ px: 0, py: 0, verticalAlign: "top", padding: "0  px" }}
        >
          <IconButton
            aria-label="expand row"
            size="small"
            onClick={() => setOpen(!open)}
          >
            {open ? <KeyboardArrowDown /> : <ChevronRight />}
          </IconButton>
        </TableCell>
        {DisplayTimestampValue(props.row, props.timestampField)}
        <TableCell sx={{ padding: "4px" }}>
          {!open && (
            <BreakWordBox sx={{ maxHeight: "100px" }}>
              {entries.map((entry) => (
                <React.Fragment key={entry.key}>
                  {EntryFormatter(entry)}
                </React.Fragment>
              ))}
            </BreakWordBox>
          )}
          {open && <JsonEditor content={props.row} resizeOnMount={true} />}
        </TableCell>
      </TableRow>
    </>
  );
}


================================================
FILE: quickwit/quickwit-ui/src/components/SearchResult/SearchResult.tsx
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

import { Box, Typography } from "@mui/material";
import { useMemo } from "react";
import { NumericFormat } from "react-number-format";
import { Index, ResponseError, SearchResponse } from "../../utils/models";
import Loader from "../Loader";
import ErrorResponseDisplay from "../ResponseErrorDisplay";
import { AggregationResult } from "./AggregationResult";
import { ResultTable } from "./ResultTable";

function HitCount({ searchResponse }: { searchResponse: SearchResponse }) {
  return (
    <Box>
      <Typography variant="body2" color="textSecondary">
        <NumericFormat
          displayType="text"
          value={searchResponse.num_hits}
          thousandSeparator=","
        />{" "}
        hits found in&nbsp;
        <NumericFormat
          decimalScale={2}
          displayType="text"
          value={searchResponse.elapsed_time_micros / 1000000}
          thousandSeparator=","
        />{" "}
        seconds
      </Typography>
    </Box>
  );
}

interface SearchResultProps {
  queryRunning: boolean;
  index: null | Index;
  searchResponse: null | SearchResponse;
  searchError: null | ResponseError;
}

export default function SearchResult(props: SearchResultProps) {
  const result = useMemo(() => {
    if (props.searchResponse == null || props.index == null) {
      return null;
    } else if (props.searchResponse.aggregations === undefined) {
      return (
        <ResultTable
          searchResponse={props.searchResponse}
          index={props.index}
        />
      );
    } else {
      return <AggregationResult searchResponse={props.searchResponse} />;
    }
  }, [props.searchResponse, props.index]);

  if (props.queryRunning) {
    return <Loader />;
  }

  if (props.searchError !== null) {
    return ErrorResponseDisplay(props.searchError);
  }

  if (props.searchResponse == null || props.index == null) {
    return <></>;
  }

  return (
    <Box sx={{ pt: 1, flexGrow: "1", flexBasis: "0%", overflow: "hidden" }}>
      <Box
        sx={{
          height: "100%",
          flexDirection: "column",
          flexGrow: 1,
          display: "flex",
        }}
      >
        <Box
          sx={{
            flexShrink: 0,
            display: "flex",
            flexGrow: 0,
            flexBasis: "auto",
          }}
        >
          <HitCount searchResponse={props.searchResponse} />
        </Box>
        <Box
          sx={{
            pt: 2,
            flexGrow: 1,
            flexBasis: "0%",
            minHeight: 0,
            display: "flex",
            flexDirection: "column",
          }}
        >
          {result}
        </Box>
      </Box>
    </Box>
  );
}


================================================
FILE: quickwit/quickwit-ui/src/components/SideBar.tsx
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

import {
  ListItemButton,
  ListSubheader,
  styled,
  Typography,
} from "@mui/material";
import List from "@mui/material/List";
import ListItemIcon from "@mui/material/ListItemIcon";
import ListItemText from "@mui/material/ListItemText";
import { Database } from "@styled-icons/feather/Database";
import { Settings } from "@styled-icons/feather/Settings";
import { GroupWork } from "@styled-icons/material-outlined/GroupWork";
import { CodeSSlash } from "@styled-icons/remix-line/CodeSSlash";
import * as React from "react";
import { Link as RouterLink, LinkProps as RouterLinkProps } from "react-router";
import { useLocalStorage } from "../providers/LocalStorageProvider";
import { toUrlSearchRequestParams } from "../utils/urls";
import { APP_BAR_HEIGHT_PX } from "./LayoutUtils";

interface ListItemLinkProps {
  icon?: React.ReactElement;
  primary: React.ReactElement;
  to: string;
}

function ListItemLink(props: ListItemLinkProps) {
  const { icon, primary, to } = props;

  const renderLink = React.useMemo(
    () =>
      React.forwardRef<HTMLAnchorElement, Omit<RouterLinkProps, "to">>(
        function Link(itemProps, ref) {
          return (
            // biome-ignore lint/a11y/useValidAriaRole: remove the role
            <RouterLink to={to} ref={ref} {...itemProps} role={undefined} />
          );
        },
      ),
    [to],
  );

  return (
    <ListItemButton component={renderLink}>
      {icon ? (
        <ListItemIcon sx={{ minWidth: "40px" }}>{icon}</ListItemIcon>
      ) : null}
      <ListItemText primary={primary} />
    </ListItemButton>
  );
}

const SideBarWrapper = styled("div")({
  display: "flex",
  marginTop: `${APP_BAR_HEIGHT_PX}`,
  height: `calc(100% - ${APP_BAR_HEIGHT_PX})`,
  flex: "0 0 180px",
  flexDirection: "column",
  borderRight: "1px solid rgba(0, 0, 0, 0.12)",
});

const SideBar = () => {
  const lastSearchRequest = useLocalStorage().lastSearchRequest;
  let searchUrl = "/search";
  if (lastSearchRequest.indexId || lastSearchRequest.query) {
    searchUrl =
      "/search?" + toUrlSearchRequestParams(lastSearchRequest).toString();
  }
  return (
    <SideBarWrapper sx={{ px: 0, py: 2 }}>
      <List dense={true} sx={{ py: 0 }}>
        <ListSubheader sx={{ lineHeight: "25px" }}>
          <Typography variant="body1">Discover</Typography>
        </ListSubheader>
        <ListItemLink
          to={searchUrl}
          primary={<Typography variant="body1">Query editor</Typography>}
          icon={<CodeSSlash size="18px" />}
        />
        <ListSubheader sx={{ lineHeight: "25px", paddingTop: "10px" }}>
          <Typography variant="body1">Admin</Typography>
        </ListSubheader>
        <ListItemLink
          to="/indexes"
          primary={<Typography variant="body1">Indexes</Typography>}
          icon={<Database size="18px" />}
        />
        <ListItemLink
          to="/cluster"
          primary={<Typography variant="body1">Cluster</Typography>}
          icon={<GroupWork size="18px" />}
        />
        <ListItemLink
          to="/node-info"
          primary={<Typography variant="body1">Node info</Typography>}
          icon={<Settings size="18px" />}
        />
        <ListItemLink
          to="/api-playground"
          primary={<Typography variant="body1">API </Typography>}
          icon={<CodeSSlash size="18px" />}
        />
      </List>
    </SideBarWrapper>
  );
};

export default SideBar;


================================================
FILE: quickwit/quickwit-ui/src/components/TimeRangeSelect.tsx
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

import { AccessTime, ChevronRight, DateRange } from "@mui/icons-material";
import {
  Box,
  Button,
  Divider,
  List,
  ListItemButton,
  ListItemIcon,
  ListItemText,
  Popover,
} from "@mui/material";
import { DateTimePicker, LocalizationProvider } from "@mui/x-date-pickers";
import { AdapterDayjs } from "@mui/x-date-pickers/AdapterDayjs";
import { Dayjs, default as dayjs } from "dayjs";
import relativeTime from "dayjs/plugin/relativeTime";
import utc from "dayjs/plugin/utc";
import React, { JSX, useEffect, useMemo, useState } from "react";
import { DATE_TIME_WITH_SECONDS_FORMAT } from "../utils/models";

dayjs.extend(relativeTime);
dayjs.extend(utc);

const TIME_RANGE_CHOICES = [
  ["Last 15 min", 15 * 60],
  ["Last 30 min", 30 * 60],
  ["Last 1 hour", 60 * 60],
  ["Last 7 days", 7 * 24 * 60 * 60],
  ["Last 30 days", 30 * 24 * 60 * 60],
  ["Last 3 months", 90 * 24 * 60 * 60],
  ["Last year", 365 * 24 * 60 * 60],
];

type TimeRange = {
  startTimestamp: number | null;
  endTimestamp: number | null;
};

export interface TimeRangeSelectProps {
  timeRange: TimeRange;
  disabled?: boolean;
  onUpdate(newTimeRange: TimeRange): void;
}

interface TimeRangeSelectState {
  anchor: HTMLElement | null;
  customDatesPanelOpen: boolean;
  width: number;
}

export function TimeRangeSelect(props: TimeRangeSelectProps): JSX.Element {
  const getInitialState = () => {
    return { width: 220, anchor: null, customDatesPanelOpen: false };
  };
  const initialState = useMemo(() => {
    return getInitialState();
  }, []);
  const [state, setState] = useState<TimeRangeSelectState>(initialState);

  const handleOpenClick = (event: React.MouseEvent<HTMLButtonElement>) => {
    setState((prevState) => {
      return { ...prevState, anchor: event.currentTarget };
    });
  };

  const handleOpenCustomDatesPanelClick = () => {
    setState((prevState) => {
      return { ...prevState, customDatesPanelOpen: true, width: 500 };
    });
  };

  useEffect(() => {
    setState(initialState);
  }, [props.disabled, initialState]);

  const handleClose = () => {
    setState(initialState);
  };

  const handleTimeRangeChoiceClick = (
    secondsBeforeNow: number | string | undefined,
  ) => {
    if (secondsBeforeNow === undefined) {
      return;
    }
    // Ensures that we have a number.
    secondsBeforeNow = +secondsBeforeNow;
    setState(initialState);
    const startTimestamp = Math.trunc(Date.now() / 1000) - secondsBeforeNow;
    props.onUpdate({ startTimestamp, endTimestamp: null });
  };

  const handleReset = () => {
    props.onUpdate({ startTimestamp: null, endTimestamp: null });
  };

  const open = Boolean(state.anchor);
  const id = open ? "time-range-select-popover" : undefined;

  return (
    <Box sx={{ padding: "10px" }}>
      <Button
        variant="contained"
        disableElevation
        onClick={handleOpenClick}
        startIcon={<AccessTime />}
        disabled={props.disabled}
      >
        <DateTimeRangeLabel
          startTimestamp={props.timeRange.startTimestamp}
          endTimestamp={props.timeRange.endTimestamp}
        />
      </Button>
      <Popover
        id={id}
        open={open}
        anchorEl={state.anchor}
        onClose={handleClose}
        anchorOrigin={{
          vertical: "bottom",
          horizontal: "center",
        }}
        transformOrigin={{
          vertical: "top",
          horizontal: "center",
        }}
        PaperProps={{
          style: { width: state.width },
        }}
      >
        <Box display="flex" flexDirection="column">
          <Box p={1.5}>
            <b>Select a period</b>
          </Box>
          <Divider />
          <Box display="flex" flexDirection="row">
            <Box flexGrow={1} borderRight={1} borderColor="grey.300">
              <List disablePadding>
                {TIME_RANGE_CHOICES.map((value, idx) => {
                  return (
                    <ListItemButton
                      key={idx}
                      onClick={() => handleTimeRangeChoiceClick(value[1])}
                    >
                      <ListItemText primary={value[0]} />
                    </ListItemButton>
                  );
                })}
                <ListItemButton onClick={handleReset}>
                  <ListItemText primary="Reset" />
                </ListItemButton>
                <ListItemButton onClick={handleOpenCustomDatesPanelClick}>
                  <ListItemIcon
                    sx={{
                      alignItems: "left",
                      minWidth: "inherit",
                      paddingRight: "8px",
                    }}
                  >
                    <DateRange />
                  </ListItemIcon>
                  <ListItemText
                    primary="Custom dates"
                    sx={{ paddingRight: "16px" }}
                  />
                  <ListItemIcon sx={{ minWidth: "inherit" }}>
                    <ChevronRight />
                  </ListItemIcon>
                </ListItemButton>
              </List>
            </Box>
            {state.anchor !== null && state.customDatesPanelOpen && (
              <CustomDatesPanel {...props} />
            )}
          </Box>
        </Box>
      </Popover>
    </Box>
  );
}

function CustomDatesPanel(props: TimeRangeSelectProps): JSX.Element {
  const [startDate, setStartDate] = useState<Dayjs | null>(null);
  const [endDate, setEndDate] = useState<Dayjs | null>(null);

  useEffect(() => {
    setStartDate(
      props.timeRange.startTimestamp
        ? convertTimestampSecsIntoDateUtc(props.timeRange.startTimestamp)
        : null,
    );
    setEndDate(
      props.timeRange.endTimestamp
        ? convertTimestampSecsIntoDateUtc(props.timeRange.endTimestamp)
        : null,
    );
  }, [props.timeRange.startTimestamp, props.timeRange.endTimestamp]);
  const handleReset = (event: React.MouseEvent<HTMLButtonElement>) => {
    event.preventDefault();
    setStartDate(null);
    setEndDate(null);
    props.onUpdate({ startTimestamp: null, endTimestamp: null });
  };
  const handleApply = (event: React.MouseEvent<HTMLButtonElement>) => {
    event.preventDefault();
    const startTimestamp = startDate ? startDate.valueOf() / 1000 : null;
    const endTimestamp = endDate ? endDate.valueOf() / 1000 : null;
    props.onUpdate({ startTimestamp, endTimestamp });
  };

  return (
    <LocalizationProvider dateAdapter={AdapterDayjs}>
      <Box
        display="flex"
        flexDirection="column"
        p={2}
        sx={{ minWidth: "300px" }}
      >
        <Box flexGrow={1}>
          <Box pb={1.5}>
            <DateTimePicker
              label="Start Date"
              value={startDate}
              format={DATE_TIME_WITH_SECONDS_FORMAT}
              onChange={(newValue: null | Dayjs) => {
                // By default, newValue is a datetime defined on the local time zone and for now we consider
                // input/output only in UTC.
                setStartDate(
                  newValue
                    ? dayjs(
                        newValue.valueOf() + newValue.utcOffset() * 60 * 1000,
                      ).utc()
                    : null,
                );
              }}
              slotProps={{ textField: { sx: { width: "100%" } } }}
            />
          </Box>
          <Box>
            <DateTimePicker
              label="End Date"
              value={endDate}
              format={DATE_TIME_WITH_SECONDS_FORMAT}
              onChange={(newValue: null | Dayjs) => {
                // By default, newValue is a datetime defined on the local time zone and for now we consider
                // input/output only in UTC.
                setEndDate(
                  newValue
                    ? dayjs(
                        newValue.valueOf() + newValue.utcOffset() * 60 * 1000,
                      ).utc()
                    : null,
                );
              }}
              slotProps={{ textField: { sx: { width: "100%" } } }}
            />
          </Box>
        </Box>
        <Box display="flex">
          <Button
            variant="outlined"
            color="primary"
            onClick={handleReset}
            disableElevation
            style={{ marginRight: 10 }}
          >
            Reset
          </Button>
          <Button
            variant="contained"
            color="primary"
            onClick={handleApply}
            disableElevation
          >
            Apply
          </Button>
        </Box>
      </Box>
    </LocalizationProvider>
  );
}

interface DateTimeRangeLabelProps {
  startTimestamp: number | null;
  endTimestamp: number | null;
}

function DateTimeRangeLabel(props: DateTimeRangeLabelProps): JSX.Element {
  function Label() {
    if (props.startTimestamp !== null && props.endTimestamp !== null) {
      return (
        <>
          {convertTimestampSecsIntoDateUtc(props.startTimestamp).format(
            DATE_TIME_WITH_SECONDS_FORMAT,
          )}{" "}
          -{" "}
          {convertTimestampSecsIntoDateUtc(props.endTimestamp).format(
            DATE_TIME_WITH_SECONDS_FORMAT,
          )}
        </>
      );
    } else if (props.startTimestamp !== null && props.endTimestamp === null) {
      return (
        <>
          Since{" "}
          {convertTimestampSecsIntoDateUtc(props.startTimestamp).fromNow(true)}
        </>
      );
    } else if (props.startTimestamp == null && props.endTimestamp != null) {
      return (
        <>
          Before{" "}
          {convertTimestampSecsIntoDateUtc(props.endTimestamp).format(
            DATE_TIME_WITH_SECONDS_FORMAT,
          )}
        </>
      );
    }
    return <>No date range</>;
  }

  return (
    <span style={{ textTransform: "none" }}>
      <Label />
    </span>
  );
}

function convertTimestampSecsIntoDateUtc(timestamp_secs: number): Dayjs {
  return dayjs(timestamp_secs * 1000).utc();
}


================================================
FILE: quickwit/quickwit-ui/src/components/TopBar.tsx
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

import GitHubIcon from "@mui/icons-material/GitHub";
import {
  Box,
  IconButton,
  Link,
  SvgIcon,
  styled,
  Tooltip,
  Typography,
} from "@mui/material";
import AppBar from "@mui/material/AppBar";
import Toolbar from "@mui/material/Toolbar";
import { Discord } from "@styled-icons/fa-brands/Discord";
import { useEffect, useMemo, useState } from "react";
import quickwitLogoUrl from "../assets/img/quickwit-logo-with-title.svg";
import { Client } from "../services/client";

const Logo = (props: React.ComponentProps<"img">) => (
  <img {...props} src={quickwitLogoUrl} alt="quickwit logo" />
);

const StyledAppBar = styled(AppBar)(({ theme }) => ({
  zIndex: theme.zIndex.drawer + 1,
}));

// Update the Button's color prop options
declare module "@mui/material/AppBar" {
  interface AppBarPropsColorOverrides {
    neutral: true;
  }
}

const TopBar = () => {
  const [clusterId, setClusterId] = useState<string>("");
  const quickwitClient = useMemo(() => new Client(), []);

  useEffect(() => {
    quickwitClient.cluster().then((cluster) => {
      setClusterId(cluster.cluster_id);
    });
  }, [quickwitClient]);

  return (
    <StyledAppBar position="fixed" elevation={0} color="neutral">
      <Toolbar variant="dense">
        <Box
          sx={{
            flexGrow: 1,
            p: 0,
            m: 0,
            display: "flex",
            alignItems: "center",
          }}
        >
          <Logo height="25px"></Logo>
          <Tooltip title="Cluster ID" placement="right">
            <Typography mx={2}>{clusterId}</Typography>
          </Tooltip>
        </Box>
        <Link href="https://quickwit.io/docs" target="_blank" sx={{ px: 2 }}>
          Docs
        </Link>
        <Link href="https://discord.gg/rpRRTezWhW" target="_blank">
          <IconButton size="large">
            <SvgIcon>
              <Discord />
            </SvgIcon>
          </IconButton>
        </Link>
        <Link href="https://github.com/quickwit-inc/quickwit" target="_blank">
          <IconButton size="large">
            <GitHubIcon />
          </IconButton>
        </Link>
      </Toolbar>
    </StyledAppBar>
  );
};

export default TopBar;


================================================
FILE: quickwit/quickwit-ui/src/index.css
================================================
/*
Copyright 2021-Present Datadog, Inc.

Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

    http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
*/
html,
body {
  height: 100%;
}

#root {
  height: 100%;
}

div.swagger-ui div.information-container {
  display: none;
}


================================================
FILE: quickwit/quickwit-ui/src/index.test.js
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

import { describe, expect, it } from "@jest/globals";
import { render, screen } from "@testing-library/react";
import { BrowserRouter } from "react-router";
import App from "./views/App";

describe("App", () => {
  it("Should display side bar links", () => {
    render(
      <BrowserRouter>
        <App />
      </BrowserRouter>,
    );
    expect(screen.getByText(/Discover/)).toBeInTheDocument();
    expect(screen.getByText(/Query editor/)).toBeInTheDocument();
    expect(screen.getByText(/Admin/)).toBeInTheDocument();
  });
});


================================================
FILE: quickwit/quickwit-ui/src/index.tsx
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

import React from "react";
import { createRoot } from "react-dom/client";
import "./index.css";
import { BrowserRouter } from "react-router";
import App from "./views/App";

const root = createRoot(document.getElementById("root")!);
root.render(
  <React.StrictMode>
    <BrowserRouter basename={import.meta.env.BASE_URL}>
      <App />
    </BrowserRouter>
  </React.StrictMode>,
);


================================================
FILE: quickwit/quickwit-ui/src/providers/EditorProvider.tsx
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

import * as monacoEditor from "monaco-editor/esm/vs/editor/editor.api";
import {
  createContext,
  MutableRefObject,
  PropsWithChildren,
  useContext,
  useRef,
} from "react";

type ContextProps = {
  editorRef: MutableRefObject<unknown | null> | null;
  monacoRef: MutableRefObject<typeof monacoEditor | null> | null;
};

const defaultValues = {
  editorRef: null,
  monacoRef: null,
};

const EditorContext = createContext<ContextProps>(defaultValues);

export const EditorProvider = ({ children }: PropsWithChildren<unknown>) => {
  const editorRef = useRef<unknown | null>(null);
  const monacoRef = useRef<typeof monacoEditor | null>(null);

  return (
    <EditorContext.Provider
      value={{
        editorRef,
        monacoRef,
      }}
    >
      {children}
    </EditorContext.Provider>
  );
};

export const useEditor = () => {
  return useContext(EditorContext);
};


================================================
FILE: quickwit/quickwit-ui/src/providers/LocalStorageProvider.tsx
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

import {
  createContext,
  PropsWithChildren,
  useContext,
  useEffect,
  useState,
} from "react";
import { EMPTY_SEARCH_REQUEST, SearchRequest } from "../utils/models";

type Props = Record<string, unknown>;

type ContextProps = {
  lastSearchRequest: SearchRequest;
  updateLastSearchRequest: (searchRequest: SearchRequest) => void;
};

const defaultValues = {
  lastSearchRequest: EMPTY_SEARCH_REQUEST,
  updateLastSearchRequest: () => undefined,
};

function parseSearchRequest(value: string | null): SearchRequest {
  if (value === null) {
    return EMPTY_SEARCH_REQUEST;
  }
  return JSON.parse(value);
}

export const LocalStorageContext = createContext<ContextProps>(defaultValues);

export const LocalStorageProvider = ({
  children,
}: PropsWithChildren<Props>) => {
  const [lastSearchRequest, setLastSearchRequest] =
    useState<SearchRequest>(EMPTY_SEARCH_REQUEST);

  useEffect(() => {
    if (localStorage.getItem("lastSearchRequest") !== null) {
      const lastSearchRequest = parseSearchRequest(
        localStorage.getItem("lastSearchRequest"),
      );
      setLastSearchRequest(lastSearchRequest);
    }
  }, []);

  useEffect(() => {
    localStorage.setItem(
      "lastSearchRequest",
      JSON.stringify(lastSearchRequest),
    );
  }, [lastSearchRequest]);

  function updateLastSearchRequest(searchRequest: SearchRequest) {
    setLastSearchRequest(searchRequest);
  }

  return (
    <LocalStorageContext.Provider
      value={{
        lastSearchRequest,
        updateLastSearchRequest,
      }}
    >
      {children}
    </LocalStorageContext.Provider>
  );
};

export const useLocalStorage = () => {
  return useContext(LocalStorageContext);
};


================================================
FILE: quickwit/quickwit-ui/src/services/client.test.ts
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

import { describe, expect, it, jest } from "@jest/globals";
import { SearchRequest } from "../utils/models";
import { Client } from "./client";

describe("Client unit test", () => {
  it("Should construct correct search URL", async () => {
    // Mocking the fetch function to simulate network requests
    const mockFetch = jest.fn((_url: string, _options?: unknown) =>
      Promise.resolve({ ok: true, json: () => Promise.resolve({}) }),
    );
    (global as any).fetch = mockFetch;

    const searchRequest: SearchRequest = {
      indexId: "my-new-fresh-index-id",
      query: "severity_error:ERROR",
      startTimestamp: 100,
      endTimestamp: 200,
      maxHits: 20,
      sortByField: {
        field_name: "timestamp",
        order: "Desc",
      },
      aggregation: false,
      aggregationConfig: {
        metric: null,
        term: null,
        histogram: null,
      },
    };

    const client = new Client();
    expect(client.buildSearchBody(searchRequest, null)).toBe(
      '{"query":"severity_error:ERROR","max_hits":20,"start_timestamp":100,"end_timestamp":200,"sort_by_field":"+timestamp"}',
    );

    await client.search(searchRequest, null);
    const expectedUrl = `${client.apiRoot()}my-new-fresh-index-id/search`;
    expect(mockFetch).toHaveBeenCalledTimes(1);
    expect(mockFetch).toHaveBeenCalledWith(expectedUrl, expect.any(Object));
  });
});


================================================
FILE: quickwit/quickwit-ui/src/services/client.ts
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

import {
  Cluster,
  Index,
  IndexMetadata,
  QuickwitBuildInfo,
  SearchRequest,
  SearchResponse,
  SplitMetadata,
} from "../utils/models";
import { serializeSortByField } from "../utils/urls";

export class Client {
  private readonly _host: string;

  constructor(host?: string) {
    if (!host) {
      this._host = window.location.origin;
    } else {
      this._host = host;
    }
  }

  apiRoot(): string {
    return this._host + "/api/v1/";
  }

  async search(
    request: SearchRequest,
    timestamp_field: string | null,
  ): Promise<SearchResponse> {
    // TODO: improve validation of request.
    if (request.indexId === null || request.indexId === undefined) {
      throw Error("Search request must have and index id.");
    }
    const url = `${this.apiRoot()}${request.indexId}/search`;
    const body = this.buildSearchBody(request, timestamp_field);
    return this.fetch(url, this.defaultGetRequestParams(), body);
  }

  async cluster(): Promise<Cluster> {
    return await this.fetch(
      `${this.apiRoot()}cluster`,
      this.defaultGetRequestParams(),
    );
  }

  async buildInfo(): Promise<QuickwitBuildInfo> {
    return await this.fetch(
      `${this.apiRoot()}version`,
      this.defaultGetRequestParams(),
    );
  }

  async config(): Promise<Record<string, any>> {
    return await this.fetch(
      `${this.apiRoot()}config`,
      this.defaultGetRequestParams(),
    );
  }
  //
  // Index management API
  //
  async getIndex(indexId: string): Promise<Index> {
    const [metadata, splits] = await Promise.all([
      this.getIndexMetadata(indexId),
      this.getAllSplits(indexId),
    ]);
    return {
      metadata: metadata,
      splits: splits[0],
      split_limit_reached: splits[1],
    };
  }

  async getIndexMetadata(indexId: string): Promise<IndexMetadata> {
    return this.fetch(`${this.apiRoot()}indexes/${indexId}`, {});
  }

  async getAllSplits(
    indexId: string,
  ): Promise<[Array<SplitMetadata>, boolean]> {
    // TODO: restrieve all the splits.
    const results: { splits: Array<SplitMetadata> } = await this.fetch(
      `${this.apiRoot()}indexes/${indexId}/splits?limit=10000`,
      {},
    );

    return [results["splits"], results["splits"].length === 10000];
  }

  async listIndexes(): Promise<Array<IndexMetadata>> {
    return this.fetch(`${this.apiRoot()}indexes`, {});
  }

  async fetch<T>(
    url: string,
    params: RequestInit,
    body: string | null = null,
  ): Promise<T> {
    if (body !== null) {
      params.method = "POST";
      params.body = body;
      params.headers = {
        ...params.headers,
        "content-type": "application/json",
      };
    }
    const response = await fetch(url, params);
    if (response.ok) {
      return response.json() as Promise<T>;
    }
    const message = await response.text();
    return await Promise.reject({
      message: message,
      status: response.status,
    });
  }

  private defaultGetRequestParams(): RequestInit {
    return {
      method: "GET",
      headers: { Accept: "application/json" },
      mode: "cors",
      cache: "default",
    };
  }

  buildSearchBody(
    request: SearchRequest,
    timestamp_field: string | null,
  ): string {
    const body: any = {
      // TODO: the trim should be done in the backend.
      query: request.query.trim() || "*",
    };

    if (request.aggregation) {
      const qw_aggregation = this.buildAggregation(request, timestamp_field);
      body["aggs"] = qw_aggregation;
      body["max_hits"] = 0;
    } else {
      body["max_hits"] = 20;
    }
    if (request.startTimestamp) {
      body["start_timestamp"] = request.startTimestamp;
    }
    if (request.endTimestamp) {
      body["end_timestamp"] = request.endTimestamp;
    }
    if (request.sortByField) {
      body["sort_by_field"] = serializeSortByField(request.sortByField);
    }
    return JSON.stringify(body);
  }

  buildAggregation(
    request: SearchRequest,
    timestamp_field: string | null,
  ): any {
    let aggregation: any;
    if (request.aggregationConfig.metric) {
      const metric = request.aggregationConfig.metric;
      aggregation = {
        metric: {
          [metric.type]: {
            field: metric.field,
          },
        },
      };
    }
    if (request.aggregationConfig.histogram && timestamp_field) {
      const histogram = request.aggregationConfig.histogram;
      const interval = histogram.interval;
      let extended_bounds: any;
      if (request.startTimestamp && request.endTimestamp) {
        extended_bounds = {
          min: request.startTimestamp,
          max: request.endTimestamp,
        };
      } else {
        extended_bounds = undefined;
      }
      aggregation = {
        histo_agg: {
          aggs: aggregation,
          date_histogram: {
            field: timestamp_field,
            fixed_interval: interval,
            min_doc_count: 0,
            extended_bounds: extended_bounds,
          },
        },
      };
    }
    if (request.aggregationConfig.term) {
      const term = request.aggregationConfig.term;
      aggregation = {
        term_agg: {
          aggs: aggregation,
          terms: {
            field: term.field,
            size: term.size,
            order: {
              _count: "desc",
            },
            min_doc_count: 1,
          },
        },
      };
    }
    return aggregation;
  }
}


================================================
FILE: quickwit/quickwit-ui/src/utils/SearchComponentProps.ts
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

import { Index, SearchRequest } from "./models";

export interface SearchComponentProps {
  searchRequest: SearchRequest;
  queryRunning: boolean;
  index: null | Index;
  onSearchRequestUpdate(searchRequest: SearchRequest): void;
  runSearch(searchRequest: SearchRequest): void;
}


================================================
FILE: quickwit/quickwit-ui/src/utils/models.ts
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

export type RawDoc = Record<string, any>;

export type FieldMapping = {
  description: string | null;
  name: string;
  type: string;
  stored: boolean | null;
  fast: boolean | null;
  indexed: boolean | null;
  // Specific datetime field attributes.
  output_format: string | null;
  field_mappings?: FieldMapping[];
};

export type Field = {
  // Json path (path segments concatenated as a string with dots between segments).
  json_path: string;
  // Json path of the field.
  path_segments: string[];
  field_mapping: FieldMapping;
};

export type Entry = {
  key: string;
  value: any;
};

export const DATE_TIME_WITH_SECONDS_FORMAT = "YYYY/MM/DD HH:mm:ss";
export const DATE_TIME_WITH_MILLISECONDS_FORMAT = "YYYY/MM/DD HH:mm:ss.SSS";

// Returns a flatten array of fields and nested fields found in the given `FieldMapping` array.
export function getAllFields(field_mappings: Array<FieldMapping>): Field[] {
  const fields: Field[] = [];
  for (const field_mapping of field_mappings) {
    if (
      field_mapping.type === "object" &&
      field_mapping.field_mappings !== undefined
    ) {
      for (const child_field_mapping of getAllFields(
        field_mapping.field_mappings,
      )) {
        fields.push({
          json_path: field_mapping.name + "." + child_field_mapping.json_path,
          path_segments: [field_mapping.name].concat(
            child_field_mapping.path_segments,
          ),
          field_mapping: child_field_mapping.field_mapping,
        });
      }
    } else {
      fields.push({
        json_path: field_mapping.name,
        path_segments: [field_mapping.name],
        field_mapping: field_mapping,
      });
    }
  }

  return fields;
}

export type DocMapping = {
  field_mappings: FieldMapping[];
  tag_fields: string[];
  store: boolean;
  dynamic_mapping: boolean;
  timestamp_field: string | null;
};

export type SortOrder = "Asc" | "Desc";

export type SortByField = {
  field_name: string;
  order: SortOrder;
};

export type SearchRequest = {
  indexId: string | null;
  query: string;
  startTimestamp: number | null;
  endTimestamp: number | null;
  maxHits: number;
  sortByField: SortByField | null;
  aggregation: boolean;
  aggregationConfig: Aggregation;
};

export type Aggregation = {
  metric: Metric | null;
  term: TermAgg | null;
  histogram: HistogramAgg | null;
};

export type Metric = {
  type: string;
  field: string;
};

export type TermAgg = {
  field: string;
  size: number;
};

export type HistogramAgg = {
  interval: string;
};

export type ParsedAggregationResult = TermResult | HistogramResult | null;

export type TermResult = { term: string; value: number }[];

export type HistogramResult = {
  timestamps: Date[];
  data: { name: string | undefined; value: number[] }[];
};

export function extractAggregationResults(
  aggregation: any,
): ParsedAggregationResult {
  const extract_value = (entry: any) => {
    if ("metric" in entry) {
      return entry.metric.value || 0;
    } else {
      return entry.doc_count;
    }
  };
  if ("histo_agg" in aggregation) {
    const buckets = aggregation.histo_agg.buckets;
    const timestamps = buckets.map((entry: any) => entry.key);
    const value = buckets.map(extract_value);
    // we are in the "simple histogram" case
    return {
      timestamps,
      data: [{ name: undefined, value }],
    };
  } else if ("term_agg" in aggregation) {
    // we have a term aggregation, but maybe there is an histogram inside
    const term_buckets = aggregation.term_agg.buckets;
    if (term_buckets.length === 0) {
      return null;
    }
    if (term_buckets.length > 0 && "histo_agg" in term_buckets[0]) {
      // we have a term+histo aggregation
      const timestamps_set: Set<number> = new Set();
      term_buckets.forEach((bucket: any) =>
        bucket.histo_agg.buckets.forEach((entry: any) =>
          timestamps_set.add(entry.key),
        ),
      );
      const timestamps = [...timestamps_set];
      timestamps.sort();

      const data = term_buckets.map((bucket: any) => {
        const histo_buckets = bucket.histo_agg.buckets;
        const first_elem_key = histo_buckets[0].key;
        const last_elem_key = histo_buckets[histo_buckets.length - 1].key;
        const prefix_len = timestamps.indexOf(first_elem_key);
        const suffix_len =
          timestamps.length - timestamps.indexOf(last_elem_key) - 1;
        const value = Array(prefix_len)
          .fill(0)
          .concat(histo_buckets.map(extract_value), Array(suffix_len).fill(0));

        return { name: bucket.key, value };
      });
      return {
        timestamps: timestamps.map((date) => new Date(date)),
        data,
      };
    } else {
      return term_buckets.map((bucket: any) => {
        return {
          term: bucket.key,
          value: extract_value(bucket),
        };
      });
    }
  }
  // we are in neither case??
  return null;
}

export const EMPTY_SEARCH_REQUEST: SearchRequest = {
  indexId: "",
  query: "",
  startTimestamp: null,
  endTimestamp: null,
  maxHits: 100,
  sortByField: null,
  aggregation: false,
  aggregationConfig: {
    metric: null,
    term: null,
    histogram: null,
  },
};

export type ResponseError = {
  status: number | null;
  message: string | null;
};

export type SearchResponse = {
  num_hits: number;
  hits: Array<RawDoc>;
  elapsed_time_micros: number;
  errors: Array<any> | undefined;
  aggregations: any | undefined;
};

export type IndexConfig = {
  version: string;
  index_id: string;
  index_uri: string;
  doc_mapping: DocMapping;
  indexing_settings: object;
  search_settings: object;
  retention: object;
};

export type IndexMetadata = {
  index_config: IndexConfig;
  checkpoint: object;
  sources: object[] | undefined;
  create_timestamp: number;
};

export const EMPTY_INDEX_METADATA: IndexMetadata = {
  index_config: {
    version: "",
    index_uri: "",
    index_id: "",
    doc_mapping: {
      field_mappings: [],
      tag_fields: [],
      store: false,
      dynamic_mapping: false,
      timestamp_field: null,
    },
    indexing_settings: {},
    search_settings: {},
    retention: {},
  },
  checkpoint: {},
  sources: undefined,
  create_timestamp: 0,
};

export type SplitMetadata = {
  split_id: string;
  split_state: string;
  num_docs: number;
  uncompressed_docs_size_in_bytes: number;
  time_range: null | Range;
  update_timestamp: number;
  version: number;
  create_timestamp: number;
  tags: string[];
  demux_num_ops: number;
  footer_offsets: Range;
};

export type Range = {
  start: number;
  end: number;
};

export type Index = {
  metadata: IndexMetadata;
  splits: SplitMetadata[];
  split_limit_reached: boolean;
};

export type Cluster = {
  node_id: string;
  cluster_id: string;
  state: ClusterState;
};

export type ClusterState = {
  state: ClusterStateSnapshot;
  live_nodes: any[];
  dead_nodes: any[];
};

export type ClusterStateSnapshot = {
  seed_addrs: string[];
  node_states: Record<string, NodeState>;
};

export type NodeState = {
  key_values: KeyValues;
  max_version: number;
};

export type KeyValues = {
  available_services: KeyValue;
  grpc_address: KeyValue;
  heartbeat: KeyValue;
};

export type KeyValue = {
  value: any;
  version: number;
};

export type QuickwitBuildInfo = {
  commit_version_tag: string;
  cargo_pkg_version: string;
  cargo_build_target: string;
  commit_short_hash: string;
  commit_date: string;
  version: string;
};

export type NodeId = {
  id: string;
  grpc_address: string;
  self: boolean;
};


================================================
FILE: quickwit/quickwit-ui/src/utils/theme.ts
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

import { createTheme } from "@mui/material";
import SoehneMonoDreiviertelfettWoff2 from "./../assets/fonts/soehne-mono-web-dreiviertelfett.woff2";
import SoehneMonoKraftigWoff2 from "./../assets/fonts/soehne-mono-web-kraftig.woff2";
import SoehneBuchWoff2 from "./../assets/fonts/soehne-web-buch.woff2";
import SoehneHalbfettWoff2 from "./../assets/fonts/soehne-web-halbfett.woff2";

export const QUICKWIT_BLUE = "#004BD9";
export const QUICKWIT_RED = "#FF0026";
export const QUICKWIT_GREEN = "#00D588";
export const QUICKWIT_GREY = "#CBD1DE";
export const QUICKWIT_INTERMEDIATE_GREY = "rgba(203,209,222,0.5)";
export const QUICKWIT_LIGHT_GREY = "#F8F9FB";
export const QUICKWIT_BLACK = "#1F232A";

// Update the Typography's var@iant prop options
declare module "@mui/material/Typography" {
  interface TypographyPropsVariantOverrides {
    fontSize: true;
    poster: true;
    h3: false;
  }
}

declare module "@mui/material/styles" {
  interface Theme {
    status: {
      danger: React.CSSProperties["color"];
    };
  }

  interface PaletteOptions {
    neutral: PaletteOptions["primary"];
  }

  interface Palette {
    primary: Palette["primary"];
    secondary: Palette["secondary"];
    text: Palette["text"];
    neutral: Palette["primary"];
  }
}

export const theme = createTheme({
  palette: {
    primary: {
      main: "#000000",
      contrastText: "#ffffff",
    },
    secondary: {
      main: "#000000",
    },
    text: {
      primary: "#000000",
    },
    neutral: {
      main: "#F8F9FB",
      contrastText: "#000000",
    },
  },
  typography: {
    fontSize: 12,
    fontFamily: "SoehneMono, Arial",
    body1: {
      fontSize: "0.8rem",
    },
  },
  components: {
    MuiCssBaseline: {
      styleOverrides: `
        @font-face {
          font-family: 'SoehneMono';
          font-style: normal;
          font-display: swap;
          font-weight: 500;
          src: local('SoehneMonoKraftig'), local('SoehneMonoKraftig'), url(${SoehneMonoKraftigWoff2}) format('woff2');
        }
        @font-face {
          font-family: 'SoehneMono';
          font-style: normal;
          font-display: swap;
          font-weight: 700;
          src: local('SoehneMonoDreiviertelfett'), local('SoehneMonoDreiviertelfett'), url(${SoehneMonoDreiviertelfettWoff2}) format('woff2');
        }
        @font-face {
          font-family: 'Soehne';
          font-style: bold;
          font-display: swap;
          font-weight: 600;
          src: local('SoehneHalbfett'), local('SoehneHalbfett'), url(${SoehneHalbfettWoff2}) format('woff2');
        }
        @font-face {
          font-family: 'Soehne';
          font-style: normal;
          font-display: swap;
          font-weight: 300;
          src: local('SoehneBuch'), local('SoehneBuch'), url(${SoehneBuchWoff2}) format('woff2');
        }
      `,
    },
  },
});

export const EDITOR_THEME = {
  base: "vs" as const,
  inherit: true,
  rules: [
    { token: "comment", foreground: "#1F232A", fontStyle: "italic" },
    { token: "keyword", foreground: QUICKWIT_BLUE },
  ],
  colors: {
    "editor.comment.foreground": "#CBD1DE",
    "editor.foreground": "#000000",
    "editor.background": QUICKWIT_LIGHT_GREY,
    "editorLineNumber.foreground": "black",
    "editor.lineHighlightBackground": "#DFE0E1",
  },
};


================================================
FILE: quickwit/quickwit-ui/src/utils/urls.ts
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

import { Aggregation, SearchRequest, SortByField, SortOrder } from "./models";

export function hasSearchParams(historySearch: string): boolean {
  const searchParams = new URLSearchParams(historySearch);

  return (
    searchParams.has("index_id") ||
    searchParams.has("query") ||
    searchParams.has("start_timestamp") ||
    searchParams.has("end_timestamp")
  );
}

export function parseSearchUrl(historySearch: string): SearchRequest {
  const searchParams = new URLSearchParams(historySearch);
  const startTimestampString = searchParams.get("start_timestamp");
  let startTimestamp = null;
  const startTimeStampParsedInt = parseInt(startTimestampString || "", 10);
  if (!Number.isNaN(startTimeStampParsedInt)) {
    startTimestamp = startTimeStampParsedInt;
  }
  let endTimestamp = null;
  const endTimestampString = searchParams.get("end_timestamp");
  const endTimestampParsedInt = parseInt(endTimestampString || "", 10);
  if (!Number.isNaN(endTimestampParsedInt)) {
    endTimestamp = endTimestampParsedInt;
  }
  let indexId = null;
  const indexIdParam = searchParams.get("index_id");
  if (indexIdParam !== null && indexIdParam.length > 0) {
    indexId = searchParams.get("index_id");
  }
  let sortByField = null;
  const sortByFieldParam = searchParams.get("sort_by_field");
  if (sortByFieldParam !== null) {
    if (sortByFieldParam.startsWith("+")) {
      const order: SortOrder = "Desc";
      sortByField = { field_name: sortByFieldParam.substring(1), order: order };
    } else if (sortByFieldParam.startsWith("-")) {
      const order: SortOrder = "Asc";
      sortByField = { field_name: sortByFieldParam.substring(1), order: order };
    } else {
      const order: SortOrder = "Desc";
      sortByField = { field_name: sortByFieldParam, order: order };
    }
  }
  const aggregationParam = searchParams.get("aggregation");
  const aggregation = parseAggregation(aggregationParam);
  return {
    indexId: indexId,
    query: searchParams.get("query") || "",
    maxHits: 10,
    startTimestamp: startTimestamp,
    endTimestamp: endTimestamp,
    sortByField: sortByField,
    aggregation: aggregationParam != null,
    aggregationConfig: aggregation,
  };
}

function parseAggregation(param: string | null): Aggregation {
  const empty: Aggregation = {
    metric: null,
    term: null,
    histogram: null,
  };
  if (param !== null) {
    try {
      const aggregation: Aggregation = JSON.parse(param);
      return aggregation;
    } catch {
      // ignore malformed param
    }
  }
  return empty;
}

export function toUrlSearchRequestParams(
  request: SearchRequest,
): URLSearchParams {
  const params = new URLSearchParams();
  params.append("query", request.query || "*");
  // We have to set the index ID in url params as it's not present in the UI path params.
  // This enables the react app to be able to get index ID from url params
  // if the user enter directly the UI url.
  params.append("index_id", request.indexId || "");
  if (request.maxHits) {
    params.append("max_hits", request.maxHits.toString());
  }
  if (request.startTimestamp) {
    params.append("start_timestamp", request.startTimestamp.toString());
  }
  if (request.endTimestamp) {
    params.append("end_timestamp", request.endTimestamp.toString());
  }
  if (request.sortByField) {
    params.append("sort_by_field", serializeSortByField(request.sortByField));
  }
  if (request.aggregation) {
    params.append(
      "aggregation",
      JSON.stringify(request.aggregationConfig, (_, val) => {
        if (val == null) {
          return undefined;
        } else {
          return val;
        }
      }),
    );
  }
  return params;
}

export function serializeSortByField(sortByField: SortByField): string {
  const order = sortByField.order === "Desc" ? "+" : "-";
  return `${order}${sortByField.field_name}`;
}


================================================
FILE: quickwit/quickwit-ui/src/views/ApiView.tsx
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

import "swagger-ui-react/swagger-ui.css";
import SwaggerUI from "swagger-ui-react";
import {
  FullBoxContainer,
  ViewUnderAppBarBox,
} from "../components/LayoutUtils";

function ApiView() {
  return (
    <ViewUnderAppBarBox>
      <FullBoxContainer>
        <SwaggerUI
          layout="BaseLayout"
          defaultModelsExpandDepth={-1}
          url="/openapi.json"
        />
      </FullBoxContainer>
    </ViewUnderAppBarBox>
  );
}

export default ApiView;


================================================
FILE: quickwit/quickwit-ui/src/views/App.tsx
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

import { CssBaseline, ThemeProvider } from "@mui/material";
import { Navigate, Route, Routes } from "react-router";
import { FullBoxContainer } from "../components/LayoutUtils";
import SideBar from "../components/SideBar";
import TopBar from "../components/TopBar";
import { LocalStorageProvider } from "../providers/LocalStorageProvider";
import { theme } from "../utils/theme";
import ApiView from "./ApiView";
import ClusterView from "./ClusterView";
import IndexesView from "./IndexesView";
import IndexView from "./IndexView";
import NodeInfoView from "./NodeInfoView";
import SearchView from "./SearchView";

function App() {
  return (
    <ThemeProvider theme={theme}>
      <LocalStorageProvider>
        <FullBoxContainer sx={{ flexDirection: "row", p: 0 }}>
          <CssBaseline />
          <TopBar />
          <SideBar />
          <Routes>
            <Route path="/" element={<Navigate to="/search" />} />
            <Route path="search" element={<SearchView />} />
            <Route path="indexes" element={<IndexesView />} />
            <Route path="indexes/:indexId" element={<IndexView />} />
            <Route path="cluster" element={<ClusterView />} />
            <Route path="node-info" element={<NodeInfoView />} />
            <Route path="api-playground" element={<ApiView />} />
          </Routes>
        </FullBoxContainer>
      </LocalStorageProvider>
    </ThemeProvider>
  );
}

export default App;


================================================
FILE: quickwit/quickwit-ui/src/views/ClusterView.test.jsx
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

import { render, screen, waitFor } from "@testing-library/react";
import { act } from "react";
import { Client } from "../services/client";
import ClusterView from "./ClusterView";

jest.mock("../services/client");

let container = null;
beforeEach(() => {
  // setup a DOM element as a render target
  container = document.createElement("div");
  document.body.appendChild(container);
});

afterEach(() => {
  // cleanup on exiting
  container.remove();
  container = null;
});

test("renders ClusterStateView", async () => {
  const clusterState = {
    state: {
      seed_addrs: [],
      node_states: {
        "node-green-uCdq/1656700092": {
          key_values: {
            available_services: {
              value: "searcher",
              version: 3,
            },
            grpc_address: {
              value: "127.0.0.1:7281",
              version: 2,
            },
            heartbeat: {
              value: "24",
              version: 27,
            },
          },
          max_version: 27,
        },
      },
    },
    live_nodes: [],
    dead_nodes: [],
  };
  Client.prototype.cluster.mockImplementation(() =>
    Promise.resolve(clusterState),
  );

  await act(async () => {
    render(<ClusterView />, container);
  });

  await waitFor(() =>
    expect(screen.getByText(/node-green-uCdq/)).toBeInTheDocument(),
  );
});


================================================
FILE: quickwit/quickwit-ui/src/views/ClusterView.tsx
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

import { Typography } from "@mui/material";
import { useEffect, useMemo, useState } from "react";
import ApiUrlFooter from "../components/ApiUrlFooter";
import { JsonEditor } from "../components/JsonEditor";
import {
  FullBoxContainer,
  QBreadcrumbs,
  ViewUnderAppBarBox,
} from "../components/LayoutUtils";
import Loader from "../components/Loader";
import ErrorResponseDisplay from "../components/ResponseErrorDisplay";
import { Client } from "../services/client";
import { Cluster, ResponseError } from "../utils/models";

function ClusterView() {
  const [loading, setLoading] = useState(false);
  const [cluster, setCluster] = useState<null | Cluster>(null);
  const [responseError, setResponseError] = useState<ResponseError | null>(
    null,
  );
  const quickwitClient = useMemo(() => new Client(), []);

  useEffect(() => {
    setLoading(true);
    quickwitClient.cluster().then(
      (cluster) => {
        setResponseError(null);
        setLoading(false);
        setCluster(cluster);
      },
      (error) => {
        setLoading(false);
        setResponseError(error);
      },
    );
  }, [quickwitClient]);

  const renderResult = () => {
    if (responseError !== null) {
      return ErrorResponseDisplay(responseError);
    }
    if (loading || cluster == null) {
      return <Loader />;
    }
    return <JsonEditor content={cluster} resizeOnMount={false} />;
  };

  return (
    <ViewUnderAppBarBox>
      <FullBoxContainer>
        <QBreadcrumbs aria-label="breadcrumb">
          <Typography color="text.primary">Cluster</Typography>
        </QBreadcrumbs>
        <FullBoxContainer sx={{ px: 0 }}>{renderResult()}</FullBoxContainer>
      </FullBoxContainer>
      {ApiUrlFooter("api/v1/cluster")}
    </ViewUnderAppBarBox>
  );
}

export default ClusterView;


================================================
FILE: quickwit/quickwit-ui/src/views/IndexView.test.jsx
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

import { render, screen, waitFor } from "@testing-library/react";
import { act } from "react";
import { BrowserRouter } from "react-router";
import { Client } from "../services/client";
import IndexView from "./IndexView";

jest.mock("../services/client");
jest.mock("react-router", () => ({
  ...jest.requireActual("react-router"),
  useParams: () => ({
    indexId: "my-new-fresh-index-id",
  }),
}));

test("renders IndexView", async () => {
  const index = {
    metadata: {
      index_config: {
        index_uri: "my-new-fresh-index-uri",
      },
    },
    splits: [],
  };
  Client.prototype.getIndex.mockImplementation(() => Promise.resolve(index));

  await act(async () => {
    render(<IndexView />, { wrapper: BrowserRouter });
  });

  await waitFor(() =>
    expect(screen.getByText(/my-new-fresh-index-uri/)).toBeInTheDocument(),
  );
});


================================================
FILE: quickwit/quickwit-ui/src/views/IndexView.tsx
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

import { TabContext, TabList, TabPanel } from "@mui/lab";
import { Box, styled, Tab, Typography } from "@mui/material";
import Link, { LinkProps } from "@mui/material/Link";
import React, { useCallback, useEffect, useMemo, useState } from "react";
import { Link as RouterLink, useParams } from "react-router";
import ApiUrlFooter from "../components/ApiUrlFooter";
import { IndexSummary } from "../components/IndexSummary";
import { JsonEditor } from "../components/JsonEditor";
import {
  FullBoxContainer,
  QBreadcrumbs,
  ViewUnderAppBarBox,
} from "../components/LayoutUtils";
import Loader from "../components/Loader";
import { Client } from "../services/client";
import { Index } from "../utils/models";

export type ErrorResult = {
  error: string;
};

const CustomTabPanel = styled(TabPanel)`
  padding-left: 0;
  padding-right: 0;
  height: 100%;
`;

// NOTE : https://mui.com/material-ui/react-breadcrumbs/#integration-with-react-router
interface LinkRouterProps extends LinkProps {
  to: string;
  replace?: boolean;
}

function LinkRouter(props: LinkRouterProps) {
  return <Link {...props} component={RouterLink} />;
}

function IndexView() {
  const { indexId } = useParams();
  const [loading, setLoading] = useState(false);
  const [, setLoadingError] = useState<ErrorResult | null>(null);
  const [tabIndex, setTabIndex] = useState("1");
  const [index, setIndex] = useState<Index>();
  const quickwitClient = useMemo(() => new Client(), []);

  const handleTabIndexChange = (_: React.SyntheticEvent, newValue: string) => {
    setTabIndex(newValue);
  };

  const fetchIndex = useCallback(() => {
    setLoading(true);
    if (indexId === undefined) {
      console.warn("`indexId` should always be set.");
      return;
    } else {
      quickwitClient.getIndex(indexId).then(
        (fetchedIndex) => {
          setLoadingError(null);
          setLoading(false);
          setIndex(fetchedIndex);
        },
        (error) => {
          setLoading(false);
          setLoadingError({ error: error });
        },
      );
    }
  }, [indexId, quickwitClient]);

  const renderFetchIndexResult = () => {
    if (loading || index === undefined) {
      return <Loader />;
    } else {
      // TODO: remove this css with magic number `48px`.
      return (
        <Box
          sx={{
            display: "flex",
            flexDirection: "column",
            height: "calc(100% - 48px)",
          }}
        >
          <TabContext value={tabIndex}>
            <Box sx={{ borderBottom: 1, borderColor: "divider" }}>
              <TabList onChange={handleTabIndexChange} aria-label="Index tabs">
                <Tab label="Summary" value="1" />
                <Tab label="Sources" value="2" />
                <Tab label="Doc Mapping" value="3" />
                <Tab label="Indexing settings" value="4" />
                <Tab label="Search settings" value="5" />
                <Tab label="Retention settings" value="6" />
                <Tab label="Splits" value="7" />
              </TabList>
            </Box>
            <CustomTabPanel value="1">
              <IndexSummary index={index} />
            </CustomTabPanel>
            <CustomTabPanel value="2">
              <JsonEditor
                content={index.metadata.sources}
                resizeOnMount={false}
              />
            </CustomTabPanel>
            <CustomTabPanel value="3">
              <JsonEditor
                content={index.metadata.index_config.doc_mapping}
                resizeOnMount={false}
              />
            </CustomTabPanel>
            <CustomTabPanel value="4">
              <JsonEditor
                content={index.metadata.index_config.indexing_settings}
                resizeOnMount={false}
              />
            </CustomTabPanel>
            <CustomTabPanel value="5">
              <JsonEditor
                content={index.metadata.index_config.search_settings}
                resizeOnMount={false}
              />
            </CustomTabPanel>
            <CustomTabPanel value="6">
              <JsonEditor
                content={index.metadata.index_config.retention || {}}
                resizeOnMount={false}
              />
            </CustomTabPanel>
            <CustomTabPanel value="7">
              <JsonEditor content={index.splits} resizeOnMount={false} />
            </CustomTabPanel>
          </TabContext>
        </Box>
      );
    }
  };

  useEffect(() => {
    fetchIndex();
  }, [fetchIndex]);

  return (
    <ViewUnderAppBarBox>
      <FullBoxContainer>
        <QBreadcrumbs aria-label="breadcrumb">
          <LinkRouter underline="hover" color="inherit" to="/indexes">
            <Typography color="text.primary">Indexes</Typography>
          </LinkRouter>
          <Typography color="text.primary">{indexId}</Typography>
        </QBreadcrumbs>
        {renderFetchIndexResult()}
      </FullBoxContainer>
      {ApiUrlFooter("api/v1/indexes/" + indexId)}
    </ViewUnderAppBarBox>
  );
}

export default IndexView;


================================================
FILE: quickwit/quickwit-ui/src/views/IndexesView.test.jsx
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

import { render, screen } from "@testing-library/react";
import { act } from "react";
import { Client } from "../services/client";
import IndexesView from "./IndexesView";

jest.mock("../services/client");
const mockedUsedNavigate = jest.fn();
jest.mock("react-router", () => ({
  ...jest.requireActual("react-router"),
  useNavigate: () => mockedUsedNavigate,
}));

let container = null;
beforeEach(() => {
  // setup a DOM element as a render target
  container = document.createElement("div");
  document.body.appendChild(container);
});

afterEach(() => {
  // cleanup on exiting
  container.remove();
  container = null;
});

test("renders IndexesView", async () => {
  const indexes = [
    {
      index_config: {
        index_id: "my-new-fresh-index",
        index_uri: "my-uri",
        indexing_settings: {
          timestamp_field: "timestamp",
        },
        search_settings: {},
        doc_mapping: {
          store: false,
          field_mappings: [],
          tag_fields: [],
          dynamic_mapping: false,
        },
      },
      sources: [],
      create_timestamp: 1000,
      update_timestamp: 1000,
    },
  ];
  Client.prototype.listIndexes.mockResolvedValueOnce(() => indexes);

  await act(async () => {
    render(<IndexesView />, container);
  });

  expect(
    screen.getByText(indexes[0].index_config.index_id),
  ).toBeInTheDocument();
});


================================================
FILE: quickwit/quickwit-ui/src/views/IndexesView.tsx
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

import { Box, Typography } from "@mui/material";
import { useEffect, useMemo, useState } from "react";
import ApiUrlFooter from "../components/ApiUrlFooter";
import IndexesTable from "../components/IndexesTable";
import {
  FullBoxContainer,
  QBreadcrumbs,
  ViewUnderAppBarBox,
} from "../components/LayoutUtils";
import Loader from "../components/Loader";
import ErrorResponseDisplay from "../components/ResponseErrorDisplay";
import { Client } from "../services/client";
import { IndexMetadata, ResponseError } from "../utils/models";

function IndexesView() {
  const [loading, setLoading] = useState(false);
  const [responseError, setResponseError] = useState<ResponseError | null>(
    null,
  );
  const [indexesMetadata, setIndexesMetadata] = useState<IndexMetadata[]>();
  const quickwitClient = useMemo(() => new Client(), []);

  const renderFetchIndexesResult = () => {
    if (responseError !== null) {
      return ErrorResponseDisplay(responseError);
    }
    if (loading || indexesMetadata === undefined) {
      return <Loader />;
    }
    if (indexesMetadata.length > 0) {
      return (
        <FullBoxContainer sx={{ px: 0 }}>
          <IndexesTable indexesMetadata={indexesMetadata} />
        </FullBoxContainer>
      );
    }
    return <Box>You have no index registered in your metastore.</Box>;
  };

  useEffect(() => {
    setLoading(true);
    quickwitClient.listIndexes().then(
      (indexesMetadata) => {
        setResponseError(null);
        setLoading(false);
        setIndexesMetadata(indexesMetadata);
      },
      (error) => {
        setLoading(false);
        setResponseError(error);
      },
    );
  }, [quickwitClient]);

  return (
    <ViewUnderAppBarBox>
      <FullBoxContainer>
        <QBreadcrumbs aria-label="breadcrumb">
          <Typography color="text.primary">Indexes</Typography>
        </QBreadcrumbs>
        {renderFetchIndexesResult()}
      </FullBoxContainer>
      {ApiUrlFooter("api/v1/indexes")}
    </ViewUnderAppBarBox>
  );
}

export default IndexesView;


================================================
FILE: quickwit/quickwit-ui/src/views/NodeInfoView.test.jsx
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

import { render, screen, waitFor } from "@testing-library/react";
import { act } from "react";
import { Client } from "../services/client";
import NodeInfoView from "./NodeInfoView";

jest.mock("../services/client");

let container = null;
beforeEach(() => {
  // setup a DOM element as a render target
  container = document.createElement("div");
  document.body.appendChild(container);
});

afterEach(() => {
  // cleanup on exiting
  container.remove();
  container = null;
});

test("renders NodeInfoView", async () => {
  const cluster = {
    cluster_id: "my cluster id",
  };
  Client.prototype.cluster.mockImplementation(() => Promise.resolve(cluster));

  const config = {
    node_id: "my-node-id",
  };
  Client.prototype.config.mockImplementation(() => Promise.resolve(config));

  const buildInfo = {
    version: "0.3.2",
  };
  Client.prototype.buildInfo.mockImplementation(() =>
    Promise.resolve(buildInfo),
  );
  await act(async () => {
    render(<NodeInfoView />, container);
  });

  await waitFor(() =>
    expect(screen.getByText(/my-node-id/)).toBeInTheDocument(),
  );
});


================================================
FILE: quickwit/quickwit-ui/src/views/NodeInfoView.tsx
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

import { TabContext, TabList, TabPanel } from "@mui/lab";
import { Box, styled, Tab, Typography } from "@mui/material";
import { useEffect, useMemo, useState } from "react";
import ApiUrlFooter from "../components/ApiUrlFooter";
import { JsonEditor } from "../components/JsonEditor";
import {
  FullBoxContainer,
  QBreadcrumbs,
  ViewUnderAppBarBox,
} from "../components/LayoutUtils";
import Loader from "../components/Loader";
import { Client } from "../services/client";
import { QuickwitBuildInfo } from "../utils/models";

const CustomTabPanel = styled(TabPanel)`
  padding-left: 0;
  padding-right: 0;
  height: 100%;
`;

function NodeInfoView() {
  const [loadingCounter, setLoadingCounter] = useState(2);
  const [nodeId, setNodeId] = useState<string>("");
  const [nodeConfig, setNodeConfig] = useState<null | Record<string, any>>(
    null,
  );
  const [buildInfo, setBuildInfo] = useState<null | QuickwitBuildInfo>(null);
  const [tabIndex, setTabIndex] = useState("1");
  const quickwitClient = useMemo(() => new Client(), []);

  const urlByTab: Record<string, string> = {
    "1": "api/v1/config",
    "2": "api/v1/version",
  };

  const handleTabIndexChange = (_: React.SyntheticEvent, newValue: string) => {
    setTabIndex(newValue);
  };

  useEffect(() => {
    quickwitClient.cluster().then(
      (cluster) => {
        setNodeId(cluster.node_id);
      },
      (error) => {
        console.log("Error when fetching cluster info:", error);
      },
    );
  });
  useEffect(() => {
    setLoadingCounter(2);
    quickwitClient.buildInfo().then(
      (fetchedBuildInfo) => {
        setLoadingCounter((prevCounter) => prevCounter - 1);
        setBuildInfo(fetchedBuildInfo);
      },
      (error) => {
        setLoadingCounter((prevCounter) => prevCounter - 1);
        console.log("Error when fetching build info: ", error);
      },
    );
    quickwitClient.config().then(
      (fetchedConfig) => {
        setLoadingCounter((prevCounter) => prevCounter - 1);
        setNodeConfig(fetchedConfig);
      },
      (error) => {
        setLoadingCounter((prevCounter) => prevCounter - 1);
        console.log("Error when fetching node config: ", error);
      },
    );
  }, [quickwitClient]);

  const renderResult = () => {
    if (loadingCounter !== 0) {
      return <Loader />;
    } else {
      return (
        <FullBoxContainer sx={{ px: 0 }}>
          <TabContext value={tabIndex}>
            <Box sx={{ borderBottom: 1, borderColor: "divider" }}>
              <TabList onChange={handleTabIndexChange} aria-label="Index tabs">
                <Tab label="Node config" value="1" />
                <Tab label="Build info" value="2" />
              </TabList>
            </Box>
            <CustomTabPanel value="1">
              <JsonEditor content={nodeConfig} resizeOnMount={false} />
            </CustomTabPanel>
            <CustomTabPanel value="2">
              <JsonEditor content={buildInfo} resizeOnMount={false} />
            </CustomTabPanel>
          </TabContext>
        </FullBoxContainer>
      );
    }
  };

  return (
    <ViewUnderAppBarBox>
      <FullBoxContainer>
        <QBreadcrumbs aria-label="breadcrumb">
          <Typography color="text.primary">Node ID: {nodeId} (self)</Typography>
        </QBreadcrumbs>
        {renderResult()}
      </FullBoxContainer>
      {ApiUrlFooter(urlByTab[tabIndex] || "")}
    </ViewUnderAppBarBox>
  );
}

export default NodeInfoView;


================================================
FILE: quickwit/quickwit-ui/src/views/SearchView.test.jsx
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

import { render, screen, waitFor } from "@testing-library/react";
import { act } from "react";
import { Client } from "../services/client";
import SearchView from "./SearchView";

jest.mock("../services/client");
const mockedUsedNavigate = jest.fn();
jest.mock("react-router", () => ({
  ...jest.requireActual("react-router"),
  useLocation: () => ({
    pathname: "/search",
    search:
      "index_id=my-new-fresh-index-idmax_hits=10&start_timestamp=1460554590&end_timestamp=1460554592&sort_by_field=-timestamp",
  }),
  useNavigate: () => mockedUsedNavigate,
}));

let container = null;
beforeEach(() => {
  // setup a DOM element as a render target
  container = document.createElement("div");
  document.body.appendChild(container);
});

afterEach(() => {
  // cleanup on exiting
  container.remove();
  container = null;
});

test("renders SearchView", async () => {
  const index = {
    metadata: {
      index_config: {
        index_id: "my-new-fresh-index-id",
        index_uri: "my-new-fresh-index-uri",
        indexing_settings: {},
        doc_mapping: {
          field_mappings: [
            {
              name: "timestamp",
              type: "i64",
            },
          ],
        },
      },
    },
    splits: [],
  };
  Client.prototype.getIndex.mockImplementation(() => Promise.resolve(index));
  Client.prototype.listIndexes.mockImplementation(() =>
    Promise.resolve([index.metadata]),
  );

  const searchResponse = {
    num_hits: 2,
    hits: [
      { body: "INFO This is an info log" },
      { body: "WARN This is a warn log" },
    ],
    elapsed_time_micros: 10,
    errors: [],
  };
  Client.prototype.search.mockImplementation(() =>
    Promise.resolve(searchResponse),
  );

  await act(async () => {
    render(<SearchView />, container);
  });

  await waitFor(() =>
    expect(screen.getByText(/This is an info log/)).toBeInTheDocument(),
  );
});


================================================
FILE: quickwit/quickwit-ui/src/views/SearchView.tsx
================================================
// Copyright 2021-Present Datadog, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

import { useEffect, useMemo, useRef, useState } from "react";
import { useLocation, useNavigate } from "react-router";
import ApiUrlFooter from "../components/ApiUrlFooter";
import { IndexSideBar } from "../components/IndexSideBar";
import {
  FullBoxContainer,
  ViewUnderAppBarBox,
} from "../components/LayoutUtils";
import { QueryEditorActionBar } from "../components/QueryActionBar";
import { AggregationEditor } from "../components/QueryEditor/AggregationEditor";
import { QueryEditor } from "../components/QueryEditor/QueryEditor";
import SearchResult from "../components/SearchResult/SearchResult";
import { useLocalStorage } from "../providers/LocalStorageProvider";
import { Client } from "../services/client";
import {
  EMPTY_SEARCH_REQUEST,
  Index,
  IndexMetadata,
  ResponseError,
  SearchRequest,
  SearchResponse,
} from "../utils/models";
import {
  hasSearchParams,
  parseSearchUrl,
  toUrlSearchRequestParams,
} from "../utils/urls";

function updateSearchRequestWithIndex(
  index: Index | null,
  searchRequest: SearchRequest,
) {
  // If we have a timestamp field, order by desc on the timestamp field.
  if (index?.metadata.index_config.doc_mapping.timestamp_field) {
    searchRequest.sortByField = {
      field_name: index?.metadata.index_config.doc_mapping.timestamp_field,
      order: "Desc",
    };
  } else {
    searchRequest.sortByField = null;
    searchRequest.startTimestamp = null;
    searchRequest.endTimestamp = null;
  }
  if (index?.metadata.index_config.index_id) {
    searchRequest.indexId = index?.metadata.index_config.index_id;
  }
}

function SearchView() {
  const location = useLocation();
  const navigate = useNavigate();
  const [index, setIndex] = useState<null | Index>(null);
  const prevIndexIdRef = useRef<string | null>(null);
  const [searchResponse, setSearchResponse] = useState<null | SearchResponse>(
    null,
  );
  const [searchError, setSearchError] = useState<null | ResponseError>(null);
  const [queryRunning, setQueryRunning] = useState(false);
  const [searchRequest, setSearchRequest] = useState<SearchRequest>(
    hasSearchParams(location.search)
      ? parseSearchUrl(location.search)
      : EMPTY_SEARCH_REQUEST,
  );
  const updateLastSearchRequest = useLocalStorage().updateLastSearchRequest;
  const quickwitClient = useMemo(() => new Client(), []);

  const runSearch = (updatedSearchRequest: SearchRequest) => {
    if (!updatedSearchRequest || !updatedSearchRequest.indexId) {
      return;
    }

    console.log("Run search...", updatedSearchRequest);
    updateSearchRequestWithIndex(index, updatedSearchRequest);
    setSearchRequest(updatedSearchRequest);
    setQueryRunning(true);
    setSearchError(null);
    navigate(
      "/search?" + toUrlSearchRequestParams(updatedSearchRequest).toString(),
    );
    const timestamp_field =
      index?.metadata.index_config.doc_mapping.timestamp_field || null;
    quickwitClient.search(updatedSearchRequest, timestamp_field).then(
      (response) => {
        updateLastSearchRequest(updatedSearchRequest);
        setSearchResponse(response);
        setQueryRunning(false);
      },
      (error) => {
        setQueryRunning(false);
        setSearchError(error);
        console.error("Error when running search request", error);
      },
    );
  };
  const onIndexMetadataUpdate = (indexMetadata: IndexMetadata | null) => {
    setSearchRequest((previousRequest) => {
      updateSearchRequestWithIndex(index, previousRequest);
      return {
        ...previousRequest,
        indexId:
          indexMetadata === null ? null : indexMetadata.index_config.index_id,
      };
    });
  };
  const onSearchRequestUpdate = (searchRequest: SearchRequest) => {
    setSearchRequest(searchRequest);
  };
  useEffect(() => {
    if (prevIndexIdRef.current !== index?.metadata.index_config.index_id) {
      setSearchResponse(null);
    }
    // Run search only if this is the first time we set the index.
    if (prevIndexIdRef.current === null) {
      runSearch(searchRequest);
    }
    prevIndexIdRef.current =
      index === null ? null : index.metadata.index_config.index_id;
  }, [index]);
  useEffect(() => {
    if (!searchRequest.indexId) {
      return;
    }

    if (
      index !== null &&
      index.metadata.index_config.index_id === searchRequest.indexId
    ) {
      return;
    }
    // If index id is changing, it's better to reset timestamps as the time unit may be different
    // between indexes.
    if (
      prevIndexIdRef.current !== null &&
      prevIndexIdRef.current !== index?.metadata.index_config.index_id
    ) {
      searchRequest.startTimestamp = null;
      searchRequest.endTimestamp = null;
    }
    quickwitClient.getIndex(searchRequest.indexId).then((fetchedIndex) => {
      setIndex(fetchedIndex);
    });
  }, [searchRequest, quickwitClient, index]);

  const searchParams = toUrlSearchRequestParams(searchRequest);
  // `toUrlSearchRequestParams` is used for the UI urls. We need to remove the `indexId` request parameter to generate
  // the correct API url, this is the only difference.
  searchParams.delete("index_id");
  return (
    <ViewUnderAppBarBox sx={{ flexDirection: "row" }}>
      <IndexSideBar
        indexMetadata={index === null ? null : index.metadata}
        onIndexMetadataUpdate={onIndexMetadataUpdate}
      />
      <FullBoxContainer sx={{ padding: 0 }}>
        <FullBoxContainer>
          <QueryEditorActionBar
            searchRequest={searchRequest}
            onSearchRequestUpdate={onSearchRequestUpdate}
            runSearch={runSearch}
            index={index}
            queryRunning={queryRunning}
          />
          <QueryEditor
            searchRequest={searchRequest}
            onSearchRequestUpdate={onSearchRequestUpdate}
            runSearch={runSearch}
            index={index}
            queryRunning={queryRunning}
          />
          <AggregationEditor
            searchRequest={searchRequest}
            onSearchRequestUpdate={onSearchRequestUpdate}
            runSearch={runSearch}
            index={index}
            queryRunning={queryRunning}
          />
          <SearchResult
            queryRunning={queryRunning}
            searchError={searchError}
            searchResponse={searchResponse}
            index={index}
          />
        </FullBoxContainer>
        {index !== null &&
          ApiUrlFooter(
            `api/v1/${index?.metadata.index_config.index_id}/search?${searchParams.toString()}`,
          )}
      </FullBoxContainer>
    </ViewUnderAppBarBox>
  );
}

export default SearchView;


================================================
FILE: quickwit/quickwit-ui/tsconfig.json
================================================
{
  "compilerOptions": {
    "target": "ESNext",
    "lib": ["dom", "dom.iterable", "esnext"],
    "allowJs": true,
    "skipLibCheck": true,
    "esModuleInterop": true,
    "allowSyntheticDefaultImports": true,
    "strict": true,
    "noPropertyAccessFromIndexSignature": true,
    "noUncheckedIndexedAccess": true,
    "noUnusedLocals": true,
    "noUnusedParameters": true,
    "forceConsistentCasingInFileNames": true,
    "noFallthroughCasesInSwitch": true,
    "module": "esnext",
    "moduleResolution": "node",
    "resolveJsonModule": true,
    "isolatedModules": true,
    "noEmit": true,
    "jsx": "react-jsx",
    "types": ["vite/client"]
  },
  "exclude": ["build"]
}


================================================
FILE: quickwit/quickwit-ui/vite.config.ts
================================================
import { UserConfig } from "vite";

export default {
  base: "/ui",
  server: {
    proxy: {
      "/api": "http://127.0.0.1:7280",
      "/openapi.json": "http://127.0.0.1:7280",
    },
    port: 3000,
  },
  build: {
    rollupOptions: {
      onwarn(warning, warn) {
        // Suppress "use client" directive warnings from material-ui
        if (
          warning.code === "MODULE_LEVEL_DIRECTIVE" &&
          warning.message.includes('"use client"')
        ) {
          return;
        }
        warn(warning);
      },
    },
  },
} satisfies UserConfig;


================================================
FILE: quickwit/rest-api-tests/Pipfile
================================================
[[source]]
url = "https://pypi.org/simple"
verify_ssl = true
name = "pypi"

[packages]
requests = "*"
pyaml = "*"

[dev-packages]

[requires]
python_version = "3.11"


================================================
FILE: quickwit/rest-api-tests/README.md
================================================
# Rest API tests

This directory is meant to test quickwit at the Rest API level.
It was initially meant to iterate over the elastic search compatibility API,
but it can also be used as a convenient way to create integration tests.

# Setting up the Python environment

## Installing Pipenv

```bash
pip install --user pipenv
```

[Pipenv installation](https://pipenv.pypa.io/en/latest/installation/)

## Installing the dependencies in a virtual environment

```bash
pipenv shell
pipenv install
```

# Running the tests

The test script is meant to target `elasticsearch` and `quickwit`.

When targeting quickwit, the script expects a fresh quickwit instance
running on `http://localhost:7280`. The data involved is small, and
running in DEBUG mode is fine.

```bash
./run_tests.py --engine quickwit
```

When targeting elasticsearch, the script expects elastic to be running on
`http://localhost:9200` (see [compose script](./docker-compose.yaml)).

In both cases, the test will take care of setting up, ingesting and tearing down the
indexes involved.

```./run_tests.py --engine elasticsearch```

# Writing a new test suite

Writing a new test suite only requires to create a new subdirectory somewhere in the scenarii/` tree.
The test script recursively browse the directories and executes some setup / teardown operation.

## setup

Setup consists in two things. First a context is built by loading and merging the content of the files `_ctx.yaml` and `_ctx.<engine>.yaml`.
This context will be used to prepopulate our steps dictionary.

This engine-specific context is perfect if you know all steps will target a specific endpoint, or a specific method.

Once the context is loaded, the steps described in `_setup.yaml` and `_setup.<engine>.yaml` (if present) will be executed.

These steps are just like any other steps except you are guaranteed they will be executed respectively before and after all other steps.
In particular, when targeting one specific test using the `--test flag`,
the necessary `setup` and `teardown` script will be automatically executed.

# teardown

It then executes the tests described in .yaml files, in their lexicographical order.
A single file can contain more than one tests, by separating them by `---`.

Here is an example of a test

```yaml
# Query string takes priority over query defined in body
method: [GET, POST]
params:
  # this overrides the query sent in body
  q: type:PushEvent
  size: 3
json:
  query:
    term:
      type:
        value: "whatever"
expected:
  hits:
    total:
      value: 60
      relation: "eq"
    hits:
      $expect: "len(val) == 3"
```

A test will just run a REST HTTP call, and check that the resulting JSON matches
some expectation.


- **method**: gives the list of HTTP methods to test. If there is more than one, they will be all tested.
- **params**: describes the parameters that should be sent as query strings.
- **json**: describes the JSON body, sent with the query
- **expected**: describes the expectation.

# Expectations

The expectation is an object that mirrors the structure of the response.
It does not need to contain its entire tree.

For instance, given the following json object:
```json
{"name": "Droopy", "age": 31}
```

It is possible to test for the name part only by using the following expectation:
```yaml
# ...
expected:
  name: Droopy
```

Sometimes, it might be cumbersome or even impossible to check a result against a value.
In that case, it is possible to express the condition as a python expression, by using the reserved keyword "$expect".

In the following, we could check that the age is greater than 30, like this:
```yaml
# ...
expected:
  age:
      $expect: "val >= 3"
```

Note that the value of the node (here `31`) is injected as a variable `val` in the expression.


================================================
FILE: quickwit/rest-api-tests/docker-compose.yaml
================================================
# This docker-compose file is useful to start up
# a single node elasticsearch to test our rest api tests
# against.
version: "3.7"

services:
  elasticsearch:
    image: docker.elastic.co/elasticsearch/elasticsearch:8.9.0
    container_name: elasticsearch
    environment:
      - xpack.security.enabled=false
      - discovery.type=single-node
      - "ES_JAVA_OPTS=-Xms512m -Xmx512m"
    ports:
      - 9200:9200
      - 9300:9300
    # If you see elasticsearch lacking disk space, you can mount a local directory
    # as follows like this.
    #volumes:
    #  - /Users/fulmicoton/git/quickwit/quickwit/rest-api-tests/esdata:/usr/share/elasticsearch/data


================================================
FILE: quickwit/rest-api-tests/run_tests.py
================================================
#!/usr/bin/env python3

import copy
import glob
import gzip
import http
import json
import os
import requests
import random
import shutil
import subprocess
import sys
import tempfile
import time
import yaml

from os import mkdir
from os import path as osp

# Simple !include constructor for YAML to allow reusing fragments across files.
# Usage examples:
#   - !include path/to/file.yaml                -> includes full file content
#   - !include path/to/file.yaml::doc_mapping   -> includes the 'doc_mapping' key
#   - !include path/to/file.yaml::a.b.c         -> includes nested key a -> b -> c
def _yaml_include(loader, node):
    value = loader.construct_scalar(node)
    if "::" in value:
        filepath, subpath = value.split("::", 1)
    else:
        filepath, subpath = value, None
    with open(filepath, "r") as f:
        included = yaml.load(f, Loader=yaml.Loader)
    if subpath:
        cur = included
        for seg in filter(None, subpath.split(".")):
            if not isinstance(cur, dict) or seg not in cur:
                raise KeyError(f"!include path '{subpath}' not found in {filepath}")
            cur = cur[seg]
        return cur
    return included

# Register the constructor on the default Loader used by this script.
yaml.Loader.add_constructor("!include", _yaml_include)

def debug_http():
    old_send = http.client.HTTPConnection.send
    def new_send(self, data):
        print(f'{"-"*9} BEGIN REQUEST {"-"*9}')
        if len(data) > 500:
            print("Data too big")
            print(data[:500])
        else:
            print(data.decode('utf-8').strip())
        print(f'{"-"*10} END REQUEST {"-"*10}')
        return old_send(self, data)
    http.client.HTTPConnection.send = new_send

def open_scenario(scenario_filepath):
    data = open(scenario_filepath).read()
    steps_data = data.split("\n---")
    for step_data in steps_data:
        step_data  = step_data.strip()
        if step_data == "":
            continue
        step_dict = yaml.load(step_data, Loader=yaml.Loader)
        if type(step_dict) == dict:
            yield step_dict

def run_step(step, previous_result):
    result = {}
    if "method" in step:
        methods = step["method"]
        if type(methods) != list:
            methods = [methods]
        for method in methods:
            result = run_request_step(method, step, previous_result)
    if "sleep_after" in step:
        time.sleep(step["sleep_after"])
    return result

def run_request_with_retry(run_req, expected_status_code=None, num_retries=10, wait_time=0.5):
    for try_number in range(num_retries + 1):
        r = run_req()
        if expected_status_code is None or r.status_code == expected_status_code:
            return r
        print("Failed with", r.text, r.status_code)
        if try_number < num_retries:
            print("Retrying...")
            time.sleep(wait_time)
    raise Exception("Wrong status code. Got %s, expected %s, url %s" % (r.status_code, expected_status_code, run_req().url))


def resolve_previous_result(c, previous_result):
    if type(c) == dict:
        result = {}
        if len(c) == 1 and "$previous" in c:
            return eval(c["$previous"], None, {"val": previous_result})
        for (k, v) in c.items():
            result[k] = resolve_previous_result(v, previous_result)
        return result
    if type(c) == list:
        return [
            resolve_previous_result(v, previous_result)
            for v in c
        ]
    return c

def run_request_step(method, step, previous_result):
    assert method in {"GET", "POST", "PUT", "DELETE"}
    if "headers" not in step:
        step["headers"] = {'user-agent': 'my-app/0.0.1'}
    method_req = getattr(requests, method.lower())
    endpoint = step.get("endpoint", "")
    url = "{}/{}".format(step["api_root"].rstrip('/'), endpoint.lstrip('/'))
    kvargs = {
        k: v
        for k, v in step.items()
        if k in {"params", "data", "json", "headers"}
    }
    body_from_file = step.get("body_from_file", None)
    if body_from_file is not None:
        body_from_file = osp.join(step["cwd"], body_from_file)
        kvargs["data"] = open(body_from_file, 'rb').read()

    kvargs = resolve_previous_result(kvargs, previous_result)
    shuffle_ndjson = step.get("shuffle_ndjson", None)
    if shuffle_ndjson is not None:
        docs_per_split = distribute_items(shuffle_ndjson, step.get("min_splits", 1), step.get("max_splits", 5), step.get("seed", None))

        for i, bucket in enumerate(docs_per_split):
            new_step = copy.deepcopy(step)
            del new_step["shuffle_ndjson"]
            new_step["ndjson"] = bucket
            run_request_step(method, new_step, previous_result)
        return;
    ndjson = step.get("ndjson", None)
    if ndjson is not None:
        # Add a newline at the end to please elasticsearch -> "The bulk request must be terminated by a newline [\\n]".
        kvargs["data"] = "\n".join([json.dumps(doc) for doc in ndjson]) + "\n"
        kvargs.setdefault("headers")["Content-Type"] = "application/json"
    expected_status_code = step.get("status_code", 200)
    debug = step.get("debug", False)
    num_retries = step.get("num_retries", 0)
    run_req = lambda : method_req(url, **kvargs)
    r = run_request_with_retry(run_req, expected_status_code, num_retries)
    expected_resp = step.get("expected", None)
    json_resp = r.json()
    if debug:
        print(expected_status_code)
        print(json_resp)
    if expected_resp is not None:
        try:
            check_result(json_resp, expected_resp, context_path="")
        except Exception as e:
            print(json.dumps(json_resp, indent=2))
            raise e
    return json_resp

def distribute_items(items, min_buckets, max_buckets, seed=None):
    if seed is None:
        seed = random.randint(0, 10000)
    random.seed(seed)
    
    # Determine the number of buckets
    num_buckets = random.randint(min_buckets, max_buckets)
    
    # Initialize empty buckets
    buckets = [[] for _ in range(num_buckets)]
    
    # Distribute items randomly into buckets
    for item in items:
        random_bucket = random.randint(0, num_buckets - 1)
        buckets[random_bucket].append(item)
    
    # Print the seed for reproducibility
    print(f"Seed: {seed}")
    
    return buckets

def check_result(result, expected, context_path = ""):
    if type(expected) == dict and "$expect" in expected:
        expectations = expected["$expect"]
        if type(expectations) == str:
            expectations = [expectations]
        for expectation in expectations:
            if not eval(expectation, None, {"val": result}):
                print(result)
                raise Exception("Failed to meet expectation %s at %s" % (expectation, context_path))
            return
    if type(result) != type(expected):
        raise Exception("Wrong type at context %s. Got %s, Expected %s" % (context_path, type(result), type(expected)))
    elif type(result) == dict:
        check_result_dict(result, expected, context_path)
    elif type(result) == list:
        check_result_list(result, expected, context_path)
    elif result != expected:
        raise Exception("Expected %s at context %s, got %s" % (expected, context_path, result))

def check_result_list(result, expected, context_path=""):
    if len(result) != len(expected):
        if len(expected) != 0:
            # get keys from the expected dicts and filter result to print only the keys that are in the expected dicts
            expected_keys = set().union(*expected)
            filtered_result = [{k: v for k, v in d.items() if k in expected_keys} for d in result]
            # Check if the length differs by more than five
            if abs(len(filtered_result) - len(expected)) > 5:
                # Show only the first 5 elements followed by ellipsis if there are more
                display_filtered_result = filtered_result[:5] + ['...'] if len(filtered_result) > 5 else filtered_result
            else:
                display_filtered_result = filtered_result
            raise Exception("Wrong length at context %s. Expected: %s Received: %s,\n Expected \n%s \n Received \n%s" % (context_path, len(expected), len(result), expected, display_filtered_result))
        raise Exception("Wrong length at context %s. Expected: %s Received: %s" % (context_path, len(expected), len(result)))
    for (i, (left, right)) in enumerate(zip(result, expected)):
        check_result(left, right, context_path + "[%s]" % i)

def check_result_dict(result, expected, context_path=""):
    for key, value in expected.items():
        try:
            child = result[key]
        except KeyError:
            raise Exception("Missing key `%s` at context %s" % (key, context_path))
        check_result(child, value, context_path + "." + key)

class PathTree:
    def __init__(self):
        self.children = {}
        self.scripts = []

    def add_child(self, seg):
        child = self.children.get(seg, None)
        if child is None:
            self.children[seg] = PathTree()
        return self.children[seg]

    def add_script(self, script):
        self.scripts.append(script)

    def add_path(self, path):
        path_segs = path.split("/")
        if path_segs[-1].startswith("_"):
            return
        path_tree = self
        for path_seg in path_segs[:-1]:
            path_tree = path_tree.add_child(path_seg)
        path_tree.add_script(path_segs[-1])

    def visit_nodes(self, visitor, path=[]):
        success = True
        success &= visitor.enter_directory(path)
        for script in self.scripts:
            success &= visitor.run_scenario(path, script)
        for k in sorted(self.children.keys()):
            child_path = path + [k]
            success &= self.children[k].visit_nodes(visitor, child_path)
        success &= visitor.exit_directory(path)
        return success

# Returns a new dictionary without modifying the arguments.
# The new dictionary is the result of merging the two dictionaries
# in that order:
# The second dictionary may shadow/override the keys of the first dictionar
def stack_dicts(context, overriding):
    context = context.copy()
    context.update(overriding)
    return context

class Visitor:
    def __init__(self, engine):
        self.engine = engine
        self.context_stack = []
        self.context = {}
    def run_setup_teardown_scripts(self, script_name, path):
        cwd = "/".join(path)
        success = True
        for file_name in [script_name + ".yaml", script_name + "." + self.engine + ".yaml"]:
            script_fullpath = cwd + "/" + file_name
            if osp.exists(script_fullpath):
                success &= self.run_scenario(path, file_name)
        return success
    def load_context(self, path):
        context = {"cwd": "/".join(path)}
        for file_name in ["_ctx.yaml", "_ctx." + self.engine + ".yaml"]:
            ctx_filepath = "/".join(path + [file_name])
            if osp.exists(ctx_filepath):
                ctx = yaml.load(open(ctx_filepath), Loader=yaml.Loader)
                context.update(ctx)
        self.context_stack.append(context)
        self.context.update(context)
    def enter_directory(self, path):
        print("============")
        self.load_context(path)
        return self.run_setup_teardown_scripts("_setup", path)
    def exit_directory(self, path):
        success = self.run_setup_teardown_scripts("_teardown", path)
        self.context_stack.pop()
        self.context = {}
        for ctx in self.context_stack:
            self.context.update(ctx)
        return success
    def run_scenario(self, path, script):
        scenario_path = "/".join(path + [script])
        steps = list(open_scenario(scenario_path))
        num_steps_executed = 0
        num_steps_skipped = 0
        previous_result = {}
        for (i, step) in enumerate(steps, 1):
            step = stack_dicts(self.context, step)
            applicable_engine = step.get("engines", None)
            if applicable_engine is not None:
                if self.engine not in applicable_engine:
                    num_steps_skipped += 1
                    continue
            try:
                previous_result = run_step(step, previous_result)
                num_steps_executed += 1
            except Exception as e:
                print("🔴 %s" % scenario_path)
                print(f"Failed at step '{step['desc']}'" if 'desc' in step else f"Failed at step {i}")
                print(step)
                print(e)
                print("--------------")
                return False
        else:
            print("🟢 %s: %d steps (%d skipped)" % (scenario_path, num_steps_executed, num_steps_skipped))
        return True

def build_path_tree(paths):
    paths.sort()
    path_tree = PathTree()
    for path in paths:
        path_tree.add_path(path)
    return path_tree

def run(scenario_paths, engine):
    path_tree = build_path_tree(scenario_paths)
    visitor = Visitor(engine=engine)
    return path_tree.visit_nodes(visitor)

def filter_test(prefixes, test_name):
    for prefix in prefixes:
        if test_name.startswith(prefix):
            return True
    return False

def filter_tests(prefixes, test_names):
    print("Filtering tests prefixes: %s" % prefixes)
    if prefixes is None or len(prefixes) == 0:
        return test_names
    return [
        test_name
        for test_name in test_names
        if filter_test(prefixes, test_name)
    ]

class QuickwitRunner:
    def __init__(self, quickwit_bin_path):
        self.quickwit_dir = tempfile.TemporaryDirectory()
        print('created temporary directory', self.quickwit_dir, self.quickwit_dir.name)
        qwdata = osp.join(self.quickwit_dir.name, "qwdata")
        config = osp.join(self.quickwit_dir.name, "config")
        mkdir(qwdata)
        mkdir(config)
        shutil.copy("../../config/quickwit.yaml", config)
        shutil.copy(quickwit_bin_path, self.quickwit_dir.name)
        self.proc = subprocess.Popen(["./quickwit", "run"], stdout=subprocess.DEVNULL, stderr=subprocess.DEVNULL, cwd=self.quickwit_dir.name)
        for i in range(100):
            try:
                print("Checking on quickwit")
                res = requests.get("http://localhost:7280/health/readyz")
                if res.status_code == 200 and res.text.strip() == "true":
                    print("Quickwit started")
                    time.sleep(6)
                    break
            except:
                pass
            print("Server not ready yet. Sleep and retry...")
            time.sleep(1)
        else:
            print("Quickwit never started. Exiting.")
            sys.exit(2)
    def __del__(self):
        print("Killing Quickwit")
        subprocess.Popen.kill(self.proc)

def main():
    import argparse
    arg_parser = argparse.ArgumentParser(
        prog="rest-api-test",
        description="Runs a set of calls against a REST API and checks for conditions over the results."
    )
    arg_parser.add_argument("--engine", help="Targeted engine (elastic/quickwit).", default="quickwit")
    arg_parser.add_argument("--test", help="Specific prefix to select the tests to run. If not specified, all tests are run.", nargs="*")
    arg_parser.add_argument("--binary", help="Specific the quickwit binary to run.", nargs="?")
    parsed_args = arg_parser.parse_args()

    print(parsed_args)

    quickwit_process = None
    if parsed_args.binary is not None:
        if parsed_args.engine != "quickwit":
            print("The --binary option is only supported for quickwit engine.")
            sys.exit(3)
        binary = parsed_args.binary
        quickwit_process = QuickwitRunner(binary)
    quickwit_process

    scenario_filepaths = glob.glob("scenarii/**/*.yaml", recursive=True)
    scenario_filepaths = list(filter_tests(parsed_args.test, scenario_filepaths))
    return run(scenario_filepaths, engine=parsed_args.engine)

if __name__ == "__main__":
    import sys
    if main():
        sys.exit(0)
    else:
        sys.exit(1)


================================================
FILE: quickwit/rest-api-tests/scenarii/aggregations/0001-aggregations.yaml
================================================
# Test date histogram aggregation
method: [GET]
engines:
  - quickwit
endpoint: _elastic/aggregations/_search
json:
  query: { match_all: {} }
  aggs:
    date_histo:
      date_histogram:
        field: "date"
        fixed_interval: "30d"
        offset: "-4d"
expected:
  aggregations:
    date_histo:
      buckets:
        -  { "doc_count": 5, "key": 1420070400000.0, "key_as_string": "2015-01-01T00:00:00Z" }
        -  { "doc_count": 2, "key": 1422662400000.0, "key_as_string": "2015-01-31T00:00:00Z" }
---
# Test date histogram with extended bounds
method: [GET]
engines:
  - quickwit
endpoint: _elastic/aggregations/_search
json:
  query: { match_all: {} }
  aggs:
    date_histo:
      date_histogram:
        field: "date"
        fixed_interval: "30d"
        offset: "-4d"
        extended_bounds:
          min: 1420070400000
          max: 1425254400000
expected:
  aggregations:
    date_histo:
      buckets:
        -  { "doc_count": 5, "key": 1420070400000.0, "key_as_string": "2015-01-01T00:00:00Z" }
        -  { "doc_count": 2, "key": 1422662400000.0, "key_as_string": "2015-01-31T00:00:00Z" }
        -  { "doc_count": 0, "key": 1425254400000.0, "key_as_string": "2015-03-02T00:00:00Z" }
---
# Test date histogram aggregation and sub-aggregation 
method: [GET]
engines:
  - quickwit
endpoint: _elastic/aggregations/_search
json:
  query: { match_all: {} }
  aggs:
    date_histo: 
      date_histogram: 
        field: "date"
        fixed_interval: "30d"
        offset: "-4d"
      aggs:
        response:
          stats:
            field: response
expected:
  aggregations:
    date_histo:
      buckets:
        -  { "doc_count": 5, "key": 1420070400000.0, "key_as_string": "2015-01-01T00:00:00Z", "response": { "avg": 85.0, "count": 4, "max": 120.0, "min": 20.0, "sum": 340.0 } }
        -  { "doc_count": 2, "key": 1422662400000.0, "key_as_string": "2015-01-31T00:00:00Z", "response": { "avg": 80.0, "count": 2, "max": 130.0, "min": 30.0, "sum": 160.0 }  }
--- 
# Test date histogram aggregation + exists and sub-aggregation 
method: [GET]
engines:
  - quickwit
endpoint: _elastic/aggregations/_search
json:
  query:
    bool:
      must:
        - exists:
            field: response
  aggs:
    date_histo: 
      date_histogram: 
        field: "date"
        fixed_interval: "30d"
        offset: "-4d"
      aggs:
        response:
          stats:
            field: response
expected:
  aggregations:
    date_histo:
      buckets:
        -  { "doc_count": 4, "key": 1420070400000.0, "key_as_string": "2015-01-01T00:00:00Z", "response": { "avg": 85.0, "count": 4, "max": 120.0, "min": 20.0, "sum": 340.0 } }
        -  { "doc_count": 2, "key": 1422662400000.0, "key_as_string": "2015-01-31T00:00:00Z", "response": { "avg": 80.0, "count": 2, "max": 130.0, "min": 30.0, "sum": 160.0 }  }
--- 
# Test range aggregation
method: [GET]
engines:
  - quickwit
endpoint: _elastic/aggregations/_search
json:
  query: { match_all: {} }
  aggs:
    my_range:
      range: 
        field: response
        ranges:
        - { to: 50, key: fast }
        - { from: 50, to: 80, key: medium }
        - { from: 80, key: slow }
expected:
  aggregations:
    my_range:
      buckets:
        - { "doc_count": 5, "key": "fast", "to": 50.0 }
        - { "doc_count": 0, "from": 50.0, "key": "medium", "to": 80.0 }
        - { "doc_count": 4, "from": 80.0, "key": "slow" }
--- 
# Test term aggs
method: [GET]
engines:
  - quickwit
endpoint: _elastic/aggregations/_search
json:
  query: { match_all: {} }
  aggs:
    hosts: 
      terms: 
        field: "host"
    tags: 
      terms: 
        field: "tags"
expected:
  aggregations:
    hosts:
      buckets:
      - doc_count: 4
        key: 192.168.0.10
      - doc_count: 2
        key: 192.168.0.1
      - doc_count: 1
        key: 192.168.0.11
      doc_count_error_upper_bound: 0
      sum_other_doc_count: 0
    tags:
      buckets:
      - doc_count: 5
        key: nice
      - doc_count: 2
        key: cool
      doc_count_error_upper_bound: 0
      sum_other_doc_count: 0
--- 
# Test term aggs with split_size
# We set split_size to 1, so one document with name "Fritz" will be missing from one split.
method: [GET]
engines:
  - quickwit
endpoint: _elastic/aggregations/_search
json:
  query: { match_all: {} }
  aggs:
    names: 
      terms: 
        field: "name"
        size: 1
        split_size: 1
expected:
  aggregations:
    names:
      buckets:
        # There are 3 documents with name "Fritz" but we only get 2. One does not get passed to the 
        # root node, because it gets cut off due to the split_size parameter set to 1.
        # We also get doc_count_error_upper_bound: 2, which signals that the result is approximate.
      - doc_count: 2 
        key: "Fritz"
      sum_other_doc_count: 8
      doc_count_error_upper_bound: 2
--- 
# Test term aggs with shard_size
# segment_size is an alias to shard_size
method: [GET]
engines:
  - quickwit
endpoint: _elastic/aggregations/_search
json:
  query: { match_all: {} }
  aggs:
    names: 
      terms: 
        field: "name"
        size: 1
        segment_size: 1
expected:
  aggregations:
    names:
      buckets:
        # There are 3 documents with name "Fritz" but we only get 2. One does not get passed to the 
        # root node, because it gets cut off due to the split_size parameter set to 1.
        # We also get doc_count_error_upper_bound: 2, which signals that the result is approximate.
      - doc_count: 2 
        key: "Fritz"
      sum_other_doc_count: 8
      doc_count_error_upper_bound: 2
--- 
# Test term aggs with shard_size
method: [GET]
engines:
  - quickwit
endpoint: _elastic/aggregations/_search
json:
  query: { match_all: {} }
  aggs:
    names: 
      terms: 
        field: "name"
        size: 1
        shard_size: 1
expected:
  aggregations:
    names:
      buckets:
        # There are 3 documents with name "Fritz" but we only get 2. One does not get passed to the 
        # root node, because it gets cut off due to the split_size parameter set to 1.
        # We also get doc_count_error_upper_bound: 2, which signals that the result is approximate.
      - doc_count: 2 
        key: "Fritz"
      sum_other_doc_count: 8
      doc_count_error_upper_bound: 2
---
# Test term aggs with split_size
# Here we increase split_size to 5, so we will get the 3 documents with name "Fritz"
method: [GET]
engines:
  - quickwit
endpoint: _elastic/aggregations/_search
json:
  query: { match_all: {} }
  aggs:
    names: 
      terms: 
        field: "name"
        size: 1
        split_size: 5
expected:
  aggregations:
    names:
      buckets:
        # We get all 3 documents with name "Fritz"
        # We also get doc_count_error_upper_bound: 0, to the result is exact.
      - doc_count: 3 
        key: "Fritz"
      sum_other_doc_count: 7
      doc_count_error_upper_bound: 0
--- 
# Test date histogram + percentiles sub-aggregation
method: [GET]
engines:
  - quickwit
endpoint: _elastic/aggregations/_search
json:
  query: { match_all: {} }
  aggs:
    metrics:
      date_histogram:
        field: date
        fixed_interval: 30d
        offset: "-4d"
      aggs:
        response:
          percentiles:
            field: response
            percents:
            - 85
            keyed: false
expected:
  aggregations:
    metrics:
      buckets:
      - doc_count: 5
        key: 1420070400000.0
        key_as_string: '2015-01-01T00:00:00Z'
        response:
          values:
          - key: 85.0
            value: 100.49456770856702
      - doc_count: 2
        key: 1422662400000.0
        key_as_string: '2015-01-31T00:00:00Z'
        response:
          values:
          - key: 85.0
            value: 30.26717133872237
--- 
# Test histogram
method: [GET]
engines:
  - quickwit
endpoint: _elastic/aggregations/_search
json:
  query: { match_all: {} }
  aggs:
    metrics:
      histogram:
        field: response
        interval: 50
expected:
  aggregations:
    metrics:
      buckets:
      - doc_count: 5
        key: 0.0
      - doc_count: 0
        key: 50.0
      - doc_count: 4
        key: 100.0

--- 
# Test histogram empty result on empty index
method: [GET]
engines:
  - quickwit
endpoint: _elastic/empty_aggregations/_search
json:
  query: { match_all: {} }
  aggs:
    metrics:
      histogram:
        field: response
        interval: 50
expected:
  aggregations:
    metrics:
      buckets: []
---
# Test cardinality aggregation
method: [GET]
engines:
  - quickwit
endpoint: _elastic/aggregations/_search
json:
  query: { match_all: {} }
  aggs:
    unique_names:
      cardinality:
        field: "name"
    unique_response:
      cardinality:
        field: "response"
    unique_dates:
      cardinality:
        field: "date"
expected:
  aggregations:
    unique_names:
      value: 8.0
    unique_response:
      value: 5.0 # TODO: Check. The correct number is 6
    unique_dates:
      value: 6.0 
---
# Test extended stats aggregation
method: [GET]
engines:
  - quickwit
endpoint: _elastic/aggregations/_search
json:
  query: { match_all: {} }
  aggs:
    response_stats:
      extended_stats:
        field: "response"
expected:
  aggregations:
    response_stats:
      sum_of_squares: 55300.0
# Test term aggs number precision
method: [GET]
engines:
  - quickwit
endpoint: _elastic/aggregations/_search
json:
  query: { match_all: {} }
  size: 0
  aggs:
    names: 
      terms: 
        field: "high_prec_test"
expected:
  aggregations:
    names:
      buckets:
      - doc_count: 1 
        key: 1769070189829214200


================================================
FILE: quickwit/rest-api-tests/scenarii/aggregations/0002-doc-len.yaml
================================================
# Test summing doc len
method: [GET]
engines:
  - quickwit
endpoint: _elastic/aggregations/_search
json:
  query: { match_all: {} }
  aggs:
    doc_len:
      sum:
        field: "_doc_length"
expected:
  aggregations:
    doc_len:
      value: 952.0
---
# Test doc len isn't shown when querying documents
method: [GET]
engines:
  - quickwit
endpoint: _elastic/aggregations/_search
json:
  query:
    term:
      id:
        value: 1
expected:
  hits:
    hits:
      - _source:
          $expect: "not '_doc_length' in val"
---


================================================
FILE: quickwit/rest-api-tests/scenarii/aggregations/_ctx.yaml
================================================
method: GET
engines: ["quickwit"]
api_root: "http://localhost:7280/api/v1/"
headers:
  Content-Type: application/json


================================================
FILE: quickwit/rest-api-tests/scenarii/aggregations/_setup.quickwit.yaml
================================================
# Delete possibly remaining index
method: DELETE
endpoint: indexes/aggregations
status_code: null
---
method: DELETE
endpoint: indexes/empty_aggregations
status_code: null
---
# Create index
method: POST
endpoint: indexes/
json:
  version: "0.8"
  index_id: aggregations
  doc_mapping:
    mode: dynamic
    dynamic_mapping:
      tokenizer: default
      fast: true
    field_mappings:
      - name: date
        type: datetime
        input_formats:
          - rfc3339
        fast_precision: seconds
        fast: true
      - name: high_prec_test
        type: u64
        fast: true
    store_document_size: true
---
# Create empty index
method: POST
endpoint: indexes/
json:
  version: "0.8"
  index_id: empty_aggregations
  doc_mapping:
    mode: dynamic
    dynamic_mapping:
      tokenizer: default
      fast: true
    field_mappings:
      - name: date
        type: datetime
        input_formats:
          - rfc3339
        fast_precision: seconds
        fast: true
---
# Ingest documents
method: POST
endpoint: aggregations/ingest
params:
  commit: force
ndjson:
  - {"name": "Albert", "response": 100, "id": 1, "date": "2015-01-01T12:10:30Z", "host": "192.168.0.10", "tags": ["nice"]}
  - {"name": "Fred", "response": 100, "id": 3, "date": "2015-01-01T12:10:30Z", "host": "192.168.0.1", "tags": ["nice"]}
  - {"name": "Manfred", "response": 120, "id": 13, "date": "2015-01-11T12:10:30Z", "host": "192.168.0.11", "tags": ["nice"]}
  - {"name": "Horst", "id": 2, "date": "2015-01-01T11:11:30Z", "host": "192.168.0.10", "tags": ["nice", "cool"]}
  - {"name": "Fritz", "response": 30, "id": 5, "host": "192.168.0.1", "tags": ["nice", "cool"]}
---
# Ingest documents split #2
method: POST
endpoint: aggregations/ingest
params:
  commit: force
ndjson:
  - {"name": "Fritz", "high_prec_test": 1769070189829214200, "response": 30, "id": 0}
  - {"name": "Fritz", "response": 30, "id": 0}
  - {"name": "Holger", "response": 30, "id": 4, "date": "2015-02-06T00:00:00Z", "host": "192.168.0.10"}
  - {"name": "Werner", "response": 20, "id": 5, "date": "2015-01-02T00:00:00Z", "host": "192.168.0.10"}
  - {"name": "Bernhard", "response": 130, "id": 14, "date": "2015-02-16T00:00:00Z"}


================================================
FILE: quickwit/rest-api-tests/scenarii/aggregations/_teardown.quickwit.yaml
================================================
# # Delete index
method: DELETE
endpoint: indexes/aggregations
---
method: DELETE
endpoint: indexes/empty_aggregations


================================================
FILE: quickwit/rest-api-tests/scenarii/concat_fields/0001_concat_field.yaml
================================================
# we use the tokenizer from the concat field, not the underlying field
endpoint: concat/search
params:
  query: "concat_raw:AB-CD"
expected:
  num_hits: 1
---
endpoint: concat/search
params:
  query: "concat_raw:EF-GH"
expected:
  num_hits: 1
---
endpoint: concat/search
params:
  query: "concat_raw:'AB CD'"
expected:
  num_hits: 0
---
endpoint: concat/search
params:
  query: "concat_raw:'EF GH'"
expected:
  num_hits: 0
---
endpoint: concat/search
params:
  query: "concat_default:AB"
expected:
  num_hits: 1
---
endpoint: concat/search
params:
  query: "concat_default:GH"
expected:
  num_hits: 1
---
# we find bool both in text and in bool fields
endpoint: concat/search
params:
  query: "concat_raw:true"
expected:
  num_hits: 2
---
endpoint: concat/search
params:
  query: "concat_default:true"
expected:
  num_hits: 2
---
# we find numbers both in text and int fields
endpoint: concat/search
params:
  query: "concat_raw:42"
expected:
  num_hits: 1 # only 1 hit, 42 doesn't get tokenized on this field
---
endpoint: concat/search
params:
  query: "concat_default:42"
expected:
  num_hits: 2 # 2 hits, the number, and the tokenized text
---
endpoint: concat/search
params:
  query: "concat_raw:otherfieldvalue"
expected:
  num_hits: 1
---
endpoint: concat/search
params:
  query: "concat_raw:9"
expected:
  num_hits: 1
---
endpoint: concat/search
params:
  query: "concat_raw:false"
expected:
  num_hits: 2 # also include the document with a json field
---
endpoint: concat/search
params:
  query: "concat_default:otherfieldvalue OR concat_default:9"
expected:
  num_hits: 0 # this field doesn't include _dynamic
---
endpoint: concat/search
params:
  query: "concat_default:false"
expected:
  num_hits: 1 # only include the document with a json field
---
endpoint: concat/search
params:
  query: "concat_raw:10"
expected:
  num_hits: 1
---
endpoint: concat/search
params:
  query: "concat_raw:nestedstring"
expected:
  num_hits: 1
---
endpoint: concat/search
params:
  query: "concat_default:10"
expected:
  num_hits: 1
---
endpoint: concat/search
params:
  query: "concat_default:nestedstring"
expected:
  num_hits: 1
---
endpoint: concat/search
params:
  query: "concat_default:1.5"
expected:
  num_hits: 1
---
endpoint: concat/search
params:
  query: "concat_default:2.5"
expected:
  num_hits: 1
---
endpoint: concat/search
params:
  query: "concat_default:3.5"
expected:
  num_hits: 0
---
endpoint: concat/search
params:
  query: "concat_raw:1.5"
expected:
  num_hits: 1
---
endpoint: concat/search
params:
  query: "concat_raw:2.5"
expected:
  num_hits: 1
---
endpoint: concat/search
params:
  query: "concat_raw:3.5"
expected:
  num_hits: 1
---
endpoint: concat/search
params:
  query: "concat_raw:9223372036854775808"
expected:
  num_hits: 1
---
endpoint: concat/search
params:
  query: "concat_raw:-5"
expected:
  num_hits: 1
---
endpoint: concat/search
params:
  # concat date values are stored as strings to enable some level of range
  # querying even though they don't support fast fields
  query: "concat_raw:\"2024-01-01\"*"
expected:
  num_hits: 1
---


================================================
FILE: quickwit/rest-api-tests/scenarii/concat_fields/_ctx.yaml
================================================
method: GET
engines: ["quickwit"]
api_root: "http://localhost:7280/api/v1/"
headers:
  Content-Type: application/json


================================================
FILE: quickwit/rest-api-tests/scenarii/concat_fields/_setup.quickwit.yaml
================================================
# Delete possibly remaining index
method: DELETE
endpoint: indexes/concat
status_code: null
---
# Create index
method: POST
endpoint: indexes/
json:
  version: "0.7"
  index_id: concat
  doc_mapping:
    mode: dynamic
    field_mappings:
      - name: text1
        type: text
        tokenizer: default
      - name: text2
        type: text
        tokenizer: raw
      - name: boolean
        type: bool
      - name: int
        type: u64
      - name: float
        type: f64
      - name: json
        type: json
      - name: concat_raw
        type: concatenate
        concatenate_fields:
          - text1
          - text2
          - boolean
          - int
          - json
          - float
        tokenizer: raw
        include_dynamic_fields: true
      - name: concat_default
        type: concatenate
        concatenate_fields:
          - text1
          - text2
          - boolean
          - int
          - json
          - float
        tokenizer: default
    dynamic_mapping:
      tokenizer: default
      expand_dots: true
sleep_after: 3
---
# Ingest documents
method: POST
endpoint: concat/ingest
num_retries: 10
params:
  commit: force
ndjson:
  - {"text1": "AB-CD", "text2": "EF-GH"}
  - {"text1": "true"}
  - {"boolean": true}
  - {"text2": "i like 42"}
  - {"int": 42}
  - {"other-field": "otherfieldvalue", "other-field-number": 9, "other-field-bool": false}
  - {"json": {"some_bool": false, "some_int": 10, "nested": {"some_string": "nestedstring"}}}
  - {"float": 1.5}
  - {"json": {"val:": 2.5, "date": "2024-01-01T00:13:00Z"}}
  - {"other": 3.5}
  # too big to be a i64, parsed as a u64
  - {"big": 9223372036854775808}
  - {"neg": -5}


================================================
FILE: quickwit/rest-api-tests/scenarii/concat_fields/_teardown.quickwit.yaml
================================================
# Delete index
method: DELETE
endpoint: indexes/concat


================================================
FILE: quickwit/rest-api-tests/scenarii/default_search_fields/0001_default_fields.yaml
================================================
endpoint: defaultsearchfields/search
params:
  query: hello
expected:
  num_hits: 1
  hits:
    - id: 1
      some_dynamic_field: hello
---
endpoint: defaultsearchfields/search
params:
  query: allo
expected:
  num_hits: 1
  hits:
    - id: 2
      inner_json: {'somefieldinjson': 'allo'}
---
endpoint: defaultsearchfields/search
params:
  query: bonjour
expected:
  num_hits: 1
  hits:
    - id: 3
      regular_field: bonjour


================================================
FILE: quickwit/rest-api-tests/scenarii/default_search_fields/0002_invalid_default_fields.yaml
================================================
# should fail because we are not in dynamic,
# yet we are targeting a field not in the field mapping.
method: POST
endpoint: indexes/
json:
  version: "0.7"
  index_id: failing1
  doc_mapping:
    mode: lenient
    field_mappings: []
  search_settings:
    default_search_fields:
      - regular_field
status_code: 400
expected:
  message:
    $expect: "\"unknown default search field `regular_field`\" in val"
---
# should fail because default search field targets a sub field of a
# non-json field
method: POST
endpoint: indexes/
json:
  version: "0.7"
  index_id: failing2
  doc_mapping:
    mode: dynamic
    field_mappings:
      - name: text
        type: text
  search_settings:
    default_search_fields:
      - text.inner
status_code: 400
expected:
  message:
    $expect: "\"unknown default search field `text.inner`\" in val"
---
# should fail because dynamic field is not indexed.
method: POST
endpoint: indexes/
json:
  version: "0.7"
  index_id: failing3
  doc_mapping:
    mode: dynamic
    field_mappings: []
    dynamic_mapping:
      indexed: false
  search_settings:
    default_search_fields:
      - some_field
status_code: 400
expected:
  message:
    $expect: "\"default search field `some_field` is not indexed\" in val"


================================================
FILE: quickwit/rest-api-tests/scenarii/default_search_fields/_ctx.yaml
================================================
method: GET
engines: ["quickwit"]
api_root: "http://localhost:7280/api/v1/"
headers:
  Content-Type: application/json


================================================
FILE: quickwit/rest-api-tests/scenarii/default_search_fields/_setup.quickwit.yaml
================================================
# Delete possibly remaining index
method: DELETE
endpoint: indexes/defaultsearchfields
status_code: null
---
# Create index
method: POST
endpoint: indexes/
json:
  version: "0.7"
  index_id: defaultsearchfields
  doc_mapping:
    mode: dynamic
    field_mappings:
      - name: id
        type: u64
      - name: inner_json
        type: json
      - name: regular_field
        type: text
    dynamic_mapping:
      expand_dots: true
      fast: true
  search_settings:
    default_search_fields:
      - regular_field
      - some_dynamic_field
      - inner_json.somefieldinjson
---
method: POST
endpoint: defaultsearchfields/ingest
params:
  commit: force
ndjson:
  - {"id": 1, "some_dynamic_field": "hello"}
  - {"id": 2, "inner_json": {"somefieldinjson": "allo"}}
  - {"id": 3, "regular_field": "bonjour"}


================================================
FILE: quickwit/rest-api-tests/scenarii/default_search_fields/_teardown.quickwit.yaml
================================================
# Delete index
method: DELETE
endpoint: indexes/defaultsearchfields


================================================
FILE: quickwit/rest-api-tests/scenarii/es_compatibility/0001-noquery.yaml
================================================
# This tests a simple request with no queries.
expected:
  hits:
    total:
      value: 100
      relation: "eq"


================================================
FILE: quickwit/rest-api-tests/scenarii/es_compatibility/0002-query_string.yaml
================================================
params:
  q: type:PushEvent
expected:
  hits:
    total:
      value: 60
      relation: "eq"
    hits:
      $expect: "len(val) == 10"
---
# Testing size.
params:
  q: type:PushEvent
  size: 3
expected:
  hits:
    total:
      value: 60
      relation: "eq"
    hits:
      $expect: "len(val) == 3"
---
# Query string takes priority over query defined in body
params:
  # this overrides the query sent in body
  q: type:PushEvent
  size: 3
json:
  query:
    term:
      type:
        value: "whatever"
expected:
  hits:
    total:
      value: 60
      relation: "eq"
    hits:
      $expect: "len(val) == 3"
---
params:
  # this overrides the query sent in body
  size: 3
json:
  query:
    term:
      type:
        value: "PushEvent"
        # By default case_insensitive is false and prevents matching
        # case_insensitive: false
expected:
  hits:
    total:
      value: 0
      relation: "eq"
    hits:
      $expect: "len(val) == 0"


================================================
FILE: quickwit/rest-api-tests/scenarii/es_compatibility/0003-match.yaml
================================================
json:
  query:
    match:
      type:
        query:  PushEvent
expected:
  hits:
    total:
      value: 60
---
json:
  query:
    match:
      # It is strangely possible to supply the
      # query directly as a string.
      type: PushEvent
expected:
  hits:
    total:
      value: 60
---
json:
  query:
    match:
      type: "," # this will result in a zero-ter query
expected:
  hits:
    total:
      value: 0
---
json:
  query:
    match:
      type:
        query: ", " # this will result in a zero term query.
        zero_terms_query: all
expected:
  hits:
    total:
      value: 100
---
json:
  query:
    match:
      payload.commits.message:
        query: "intial commit" # by default this is a disjunction
expected:
  hits:
    total:
      value: 6
---
json:
  query:
    match:
      payload.commits.message:
        query: "intial commit" # by default this is a disjunction
        operator: AND
expected:
  hits:
    total:
      value: 1


================================================
FILE: quickwit/rest-api-tests/scenarii/es_compatibility/0004-term_aggregations.yaml
================================================
# disabled due to the previous lack of fast field specific tokenizer.
params:
  size: 0
json:
  aggs:
    mytypeagg:
      terms:
        field: type
        size: 5
expected:
  hits:
    total:
      value: 100
    hits:
      $expect: "len(val) == 0"
  aggregations:
    mytypeagg:
      doc_count_error_upper_bound: 0
      sum_other_doc_count: 9
      buckets:
        - { "key": "pushevent", "doc_count": 60 }
        - { "key": "createevent", "doc_count" : 12 }
        - { "key": "issuecommentevent", "doc_count" : 8 }
        - { "key": "watchevent", "doc_count" : 6 }
        - { "key": "pullrequestevent", "doc_count" : 5 }


================================================
FILE: quickwit/rest-api-tests/scenarii/es_compatibility/0005-query_string_query.yaml
================================================
params:
  size: 10
json:
  query:
    query_string:
      query: "type:PushEvent AND actor.login:jadonk"
expected:
  hits:
    total:
      value: 2
    hits:
      $expect: "len(val) == 2"
---
params:
  size: 10
json:
  query:
    query_string:
      query: "PushEvent"
      fields: ["type"]
expected:
  hits:
    total:
      value: 60
---
params:
  size: 10
json:
  query:
    query_string:
      query: "PushEvent"
      fields: "type"
status_code: 400
---
params:
  size: 10
json:
  query:
    query_string:
      query: "type:PushEvent OR"
      fields: []
status_code: 400
---
params:
  size: 10
json:
  query:
    query_string:
      query: "type:PushEvent OR"
      fields: ["body"]
      lenient: true
# Lenient is not about the syntax.
status_code: 400
---
params:
  size: 10
json:
  query:
    query_string:
      query: "type:PushEvent"
      fields: []
      lenient: true
expected:
  hits:
    total:
      value: 60
---
params:
  size: 10
json:
  query:
    query_string:
      query: "type:PushEvent"
      fields: []
      lenient: true
expected:
  hits:
    total:
      value: 60
---
params:
  size: 10
json:
  query:
    query_string:
      query: "actor.id:1315639"
      fields: []
expected:
  hits:
    total:
      value: 1
---
# This test does not work on quickwit.
# Quickwit always act like elasticsearch's lenient mode.
engines: [elasticsearch]
params:
  size: 10
json:
  query:
    query_string:
      query: "type:PushEvent OR actor.id:shouldhavebeenanumber"
      fields: []
      lenient: false
status_code: 400
---
params:
  size: 10
json:
  query:
    query_string:
      query: "type:PushEvent OR actor.id:shouldhavebeenanumber"
      fields: []
      lenient: true
expected:
  hits:
    total:
      value: 60
---
params:
  size: 10
json:
  query:
    query_string:
      query: "type:PushEvent AND actor.id:shouldhavebeenanumber"
      fields: []
      lenient: true
expected:
  hits:
    total:
      value: 0
---
# Default field
json:
  query:
    query_string:
      default_field: payload.commits.message
      lenient: true
      query: "to AND the"
expected:
  hits:
    total:
      value: 3
---
# Default field + fields
json:
  query:
    query_string:
      default_field: payload.commits.message
      fields:
        - payload.comments.body
      lenient: true
      query: "to AND the"
status_code: 400
---
# wildcard
json:
  query:
    query_string:
      default_field: payload.description
      lenient: true
      query: "Jou*al AND unix"
expected:
  hits:
    total:
      value: 2
---
# wildcard
json:
  query:
    query_string:
      default_field: payload.description
      lenient: true
      query: "Jour?al AND unix"
expected:
  hits:
    total:
      value: 2
---
# wildcard
json:
  query:
    query_string:
      default_field: payload.description
      lenient: true
      query: "jou*al AND unix"
expected:
  hits:
    total:
      value: 2
---
# trailing wildcard
json:
  query:
    query_string:
      default_field: payload.description
      lenient: true
      query: "jour*"
expected:
  hits:
    total:
      value: 3
---
# escaped wildcard
json:
  query:
    query_string:
      default_field: payload.description
      lenient: true
      # ? char removed by tokenizer
      query: "jour\\?"
expected:
  hits:
    total:
      value: 1
---
json:
  query:
    regexp:
      payload.description:
          value: "jour.*"
expected:
  hits:
    total:
      value: 3
---
json:
  query:
    query_string:
      default_field: actor.id
      query: ">=10791466"
      lenient: true
expected:
  hits:
    total:
      value: 2
---
json:
  query:
    query_string:
      default_field: actor.id
      query: ">10791466"
      lenient: true
expected:
  hits:
    total:
      value: 1
---
json:
  query:
    query_string:
      query: "true"
      fields: ["public", "public.notdefined", "notdefined"]
      lenient: true
expected:
  hits:
    total:
      value: 100
---
# trailing wildcard
json:
  query:
    query_string:
      query: "jour*"
      fields: ["payload.description", "payload.notdefined", "notdefined"]
      lenient: true
expected:
  hits:
    total:
      value: 3
---
# elasticsearch accepts this query
engines:
  - quickwit
json:
  query:
    query_string:
      query: "true"
      fields: ["public", "public.notdefined"]
status_code: 400


================================================
FILE: quickwit/rest-api-tests/scenarii/es_compatibility/0006-term_query.yaml
================================================
params:
  # this overrides the query sent in body apparently
  size: 3
json:
  track_total_hits: true
  query:
    term:
      type:
        value: "PushEvent"
        case_insensitive: true
expected:
  hits:
    total:
      value: 60
      relation: "eq"
    hits:
      $expect: "len(val) == 3"
---
# Terms must be pushed in their form post tokenization
params:
  size: 0
json:
  track_total_hits: true
  query:
    term:
      type:
        # this does not match because push event has been lowercased by the tokenizer.
        value: "PushEvent"
expected:
  hits:
    total:
      value: 0
      relation: "eq"
---
params:
  size: 0
json:
  track_total_hits: true
  query:
    term:
      type:
        value: "pushevent"
expected:
  hits:
    total:
      value: 60
      relation: "eq"
---
params:
  size: 0
# Testing the format without the "value" object
json:
  track_total_hits: true
  query:
    term:
      type: "pushevent"
expected:
  hits:
    total:
      value: 60
      relation: "eq"
# Also testing numbers, and numbers as string in the JSON query
---
engines: ["elasticsearch"]
params:
  size: 0
json:
  track_total_hits: true
  query:
    term:
      actor.id: 1762355
expected:
  hits:
    total:
      value: 1
      relation: "eq"
---
params:
  size: 0
json:
  track_total_hits: true
  query:
    term:
      actor.id: "1762355"
expected:
  hits:
    total:
      value: 1
      relation: "eq"
---
params:
  size: 0
json:
  track_total_hits: true
  query:
    term:
      actor.id:
        value: 1762355
expected:
  hits:
    total:
      value: 1
      relation: "eq"
---
params:
  size: 0
json:
  track_total_hits: true
  query:
    term:
      actor.id:
        value: "1762355"
expected:
  hits:
    total:
      value: 1
      relation: "eq"
---
# id is a text field
params:
  size: 0
json:
  track_total_hits: true
  query:
    term:
      id:
        value: "2549961272"
expected:
  hits:
    total:
      value: 1
      relation: "eq"
---
params:
  size: 0
json:
  track_total_hits: true
  query:
    term:
      id:
        value: 2549961272
expected:
  hits:
    total:
      value: 1
      relation: "eq"
---
params:
  size: 0
json:
  track_total_hits: true
  query:
    term:
      id: 2549961272
expected:
  hits:
    total:
      value: 1
      relation: "eq"
---
params:
  size: 0
json:
  track_total_hits: true
  query:
    term:
      id: "2549961272"
expected:
  hits:
    total:
      value: 1
      relation: "eq"


================================================
FILE: quickwit/rest-api-tests/scenarii/es_compatibility/0007-range_queries.yaml
================================================
json:
  query:
    range:
      actor.id:
        gte: 10791466
expected:
  hits:
    total:
      value: 2
      relation: "eq"
---
json:
  query:
    range:
      actor.id:
        gt: 10791466
expected:
  hits:
    total:
      value: 1
      relation: "eq"
---
json:
  query:
    range:
      actor.id:
        lt: 10791466
expected:
  hits:
    total:
      value: 98
      relation: "eq"
---
json:
  query:
    range:
      actor.id:
        lte: 10791466
expected:
  hits:
    total:
      value: 99
      relation: "eq"
---
json:
  query:
    range:
      actor.id:
        gt: 467872
expected:
  hits:
    total:
      value: 84
      relation: "eq"
---
json:
  query:
    range:
      actor.id:
        gte: 467872
expected:
  hits:
    total:
      value: 85
      relation: "eq"
---
json:
  query:
    range:
      actor.id:
        lte: 467872
expected:
  hits:
    total:
      value: 16
      relation: "eq"
---
json:
  query:
    range:
      actor.id:
        gt: 467872
        lt: 10791466
expected:
  hits:
    total:
      value: 82
      relation: "eq"
---
# Missing in some documents
json:
  query:
    range:
      payload.size:
        gte: 2
expected:
  hits:
    total:
      value: 13
      relation: "eq"
---
# Field not present in all documents
json:
  query:
    range:
      payload.size:
        lt: 2
expected:
  hits:
    total:
      value: 47
      relation: "eq"
---
# Timestamp field
json:
  query:
    range:
      created_at:
        lt: "2015-02-01T00:00:13Z"
        gte: "2015-02-01T00:00:10Z"
expected:
  hits:
    total:
      value: 44
      relation: "eq"
---
# Timestamp field using timestamp
json:
  query:
    range:
      created_at:
        lt: 1422748813000
expected:
  hits:
    total:
      value: 86
      relation: "eq"
---
# Timestamp field
json:
  query:
    range:
      created_at:
        gte: "2015-02-01T00:00:10Z"
expected:
  hits:
    total:
      value: 58
      relation: "eq"
---
# Timestamp field
json:
  query:
    range:
      created_at:
        lt: "2015-02-01T00:00:13Z"
expected:
  hits:
    total:
      value: 86
      relation: "eq"
---
# Timestamp field with milliseconds precision 2015-02-01T00:00:00.001
json:
  query:
    range:
      created_at:
        gte: "2015-02-01T00:00:00.001Z"
        lt: "2015-02-01T00:00:00.002Z"
expected:
  hits:
    total:
      value: 1
      relation: "eq"
---
# Timestamp field with range in microseconds.
# Datetime will be truncated at milliseconds as
# defined in the doc mapper.
json:
  query:
    range:
      created_at:
        gte: "2015-02-01T00:00:00.001999Z"
        lte: "2015-02-01T00:00:00.001999Z"
expected:
  hits:
    total:
      value: 1
      relation: "eq"
---
# This field is not a JSON field and doesn not have fast field normalization.
# That means it is case sensitive
json:
  query:
    range:
      repo.name:
        gte: "h"
        lte: "i"
expected:
  hits:
    total:
      value: 1
      relation: "eq"
---
# This field is a JSON field and has fast field normalization.
# That means it is case insensitive
json:
  query:
    range:
      actor.login:
        gte: "H" # should automatically be normalized
        lte: "Z"
expected:
  hits:
    total:
      value: 68
      relation: "eq"
---
# This field is a JSON field and has fast field normalization.
# That means it is case insensitive
engines:
    - quickwit
json:
  query:
    range:
      actor.login:
        gte: "h" # should automatically be normalized
        lte: "z"
expected:
  hits:
    total:
      value: 68
      relation: "eq"
---
# This field is a JSON field and has fast field normalization.
# That means it is case insensitive
json:
  query:
    range:
      actor.login:
        gte: "H" # should automatically be normalized
        lte: "Z"
expected:
  hits:
    total:
      value: 68
      relation: "eq"
---
# Timestamp field with a custom format.
json:
  query:
    range:
      created_at:
        gte: "2015|02|01 T00:00:00.001999Z"
        lte: "2015|02|01 T00:00:00.001999Z"
        # Elasticsearch date format requires text to be escaped with single quotes
        format: yyyy|MM|dd 'T'HH:mm:ss.SSSSSS'Z'
expected:
  hits:
    total:
      value: 1
      relation: "eq"


================================================
FILE: quickwit/rest-api-tests/scenarii/es_compatibility/0008-sort_by.yaml
================================================
json:
  size: 1
  query:
      match_all: {}
  sort:
    - actor.id:
        order: desc
expected:
  hits:
    total:
      value: 100
      relation: eq
    hits:
      - _source:
          actor:
            id: 10791502
---
# Checking that passing the sort params as a query string works.
params:
    sort: "actor.id:desc"
    q: "*"
    size: 1
expected:
    hits:
        total:
            value: 100
            relation: eq
        hits:
            - _source:
                actor:
                    id: 10791502
---
json:
  size: 1
  query:
      match_all: {}
  sort:
    - actor.id:
        order: asc
expected:
  hits:
    total:
      value: 100
      relation: eq
    hits:
      - _source:
          actor:
            id: 5688
---
json:
  size: 1
  query:
      match_all: {}
  sort:
    - actor.id
expected:
  hits:
    total:
      value: 100
      relation: eq
    hits:
      - _source:
          actor:
            id: 5688
---
json:
  size: 1
  query:
      match_all: {}
  sort:
    actor.id: {}
expected:
  hits:
    total:
      value: 100
      relation: eq
    hits:
      - _source:
          actor:
            id: 5688
---
json:
  size: 1
  query:
      match_all: {}
  sort:
    _doc:
      order: desc
expected:
  hits:
    total:
      value: 100
      relation: eq
    hits:
      - _source:
          actor:
            id: 9018
---
json:
  size: 1
  query:
      match_all: {}
  sort:
    _doc:
      order: asc
expected:
  hits:
    total:
      value: 100
      relation: eq
    hits:
      - _source:
          actor:
            id: 1762355
---
json:
  size: 1
  query:
      match_all: {}
  sort:
    _doc: {}
expected:
  hits:
    total:
      value: 100
      relation: eq
    hits:
      - _source:
          actor:
            id: 1762355


================================================
FILE: quickwit/rest-api-tests/scenarii/es_compatibility/0009-bool_query.yaml
================================================
# Motivated by #3249
json:
  query:
      match_all: {}
expected:
  hits:
    total:
      value: 100
---
json:
  query:
      bool:
        filter:
          - match_all: {}
expected:
  hits:
    total:
      value: 100
---
json:
  query:
      bool: {}
expected:
  hits:
    total:
      value: 100
---
json:
  query:
      bool:
        must_not:
          - match_none: {}
expected:
  hits:
    total:
      value: 100
---
json:
  query:
      bool:
        must_not:
          - {"query_string": {"query": "type:PushEvent AND actor.login:jadonk"}}
expected:
  hits:
    total:
      value: 98
---
# Silly edge case 1
json:
  query:
      bool:
        should:
          - match_none: {}
expected:
  hits:
    total:
      value: 0
---
# Silly edge case 2
json:
  query:
      bool:
        should:
          - match_none: {}
        must_not:
          - match_none: {}
expected:
  hits:
    total:
      value: 0
---
# Silly edge case 3
json:
  query:
      bool:
        must_not:
          - match_none: {}
expected:
  hits:
    total:
      value: 100
---
# Silly edge case 4
json:
  query:
      bool:
        must:
          - match_all: {}
        should:
          - match_none: {}
expected:
  hits:
    total:
      value: 100
---
# Silly edge case 4
json:
  query:
      bool:
        filter:
          - match_all: {}
        should:
          - match_none: {}
expected:
  hits:
    total:
      value: 100
---
# Support null values
# This format is not supported by Elasticsearch
engines: ["quickwit"]
json:
  query:
      bool:
        must: null
        must_not: null
        should: null
        filter: null
        boost: null
expected:
  hits:
    total:
      value: 100
---
json:
    query:
        bool:
            should:
                - {"query_string": {"query": "type:PushEvent"}}
                - {"query_string": {"query": "actor.login:jadonk"}}
                - {"query_string": {"query": "actor.login:teozfrank"}}
                - {"query_string": {"query": "type:IssueCommentEvent"}}
            minimum_should_match: 1
expected:
    hits:
        total:
            value: 69
---
json:
  query:
      bool:
        should:
          - {"query_string": {"query": "type:PushEvent"}}
          - {"query_string": {"query": "actor.login:jadonk"}}
          - {"query_string": {"query": "actor.login:teozfrank"}}
          - {"query_string": {"query": "type:IssueCommentEvent"}}
        minimum_should_match: 2
expected:
  hits:
    total:
      value: 3
---
json:
    query:
        bool:
            should:
                - {"query_string": {"query": "type:PushEvent"}}
                - {"query_string": {"query": "actor.login:jadonk"}}
                - {"query_string": {"query": "actor.login:teozfrank"}}
                - {"query_string": {"query": "type:IssueCommentEvent"}}
            minimum_should_match: 3
expected:
    hits:
        total:
            value: 0
---
json:
  query:
      bool:
        must:
          - {"query_string": {"query": "type:PushEvent"}}
        should:
          - {"query_string": {"query": "actor.login:jadonk"}}
          - {"query_string": {"query": "actor.login:teozfrank"}}
          - {"query_string": {"query": "type:IssueCommentEvent"}}
        minimum_should_match: 1
expected:
  hits:
    total:
      value: 2
---
json:
  query:
      bool:
        must:
          - {"query_string": {"query": "type:PushEvent"}}
        should:
          - {"query_string": {"query": "actor.login:jadonk"}}
        minimum_should_match: 2 # that's one too many'
expected:
  hits:
    total:
      value: 0
---
json:
    query:
        bool:
            should:
            - {"query_string": {"query": "type:PushEvent"}}
            - {"query_string": {"query": "actor.login:jadonk"}}
            - {"query_string": {"query": "actor.login:teozfrank"}}
            - {"query_string": {"query": "type:IssueCommentEvent"}}
            minimum_should_match: 50%
expected:
    hits:
        total:
            value: 3
---
json:
    query:
        bool:
            should:
            - {"query_string": {"query": "type:PushEvent"}}
            - {"query_string": {"query": "actor.login:jadonk"}}
            - {"query_string": {"query": "actor.login:teozfrank"}}
            - {"query_string": {"query": "type:IssueCommentEvent"}}
            minimum_should_match: -2
expected:
    hits:
        total:
            value: 3
---
json:
    query:
        bool:
            should:
            - {"query_string": {"query": "type:PushEvent"}}
            - {"query_string": {"query": "actor.login:jadonk"}}
            - {"query_string": {"query": "actor.login:teozfrank"}}
            - {"query_string": {"query": "type:IssueCommentEvent"}}
            minimum_should_match: -3
expected:
    hits:
        total:
            value: 69
---
# corner case: a minimum should match that is too negative is just discarded.
json:
    query:
        bool:
            should:
            - {"query_string": {"query": "type:PushEvent"}}
            - {"query_string": {"query": "actor.login:jadonk"}}
            - {"query_string": {"query": "actor.login:teozfrank"}}
            - {"query_string": {"query": "type:IssueCommentEvent"}}
            minimum_should_match: -10
expected:
    hits:
        total:
            value: 69
---
# corner case: a minimum should match that is too negative is just discarded.
json:
    query:
        bool:
            must:
                - {"query_string": {"query": "type:PushEvent"}}
            should:
                - {"query_string": {"query": "actor.login:jadonk"}}
                - {"query_string": {"query": "actor.login:teozfrank"}}
                - {"query_string": {"query": "type:IssueCommentEvent"}}
            minimum_should_match: -10
expected:
    hits:
        total:
            value: 60
---
json:
    query:
        bool:
            should:
            - {"query_string": {"query": "type:PushEvent"}}
            - {"query_string": {"query": "actor.login:jadonk"}}
            - {"query_string": {"query": "actor.login:teozfrank"}}
            - {"query_string": {"query": "type:IssueCommentEvent"}}
            minimum_should_match: 0
expected:
    hits:
        total:
            value: 69


================================================
FILE: quickwit/rest-api-tests/scenarii/es_compatibility/0010-match_phrase_prefix_query.yaml
================================================
method: [GET]
json:
  query:
    match_phrase_prefix:
      payload.pull_request.body:
        query: "p"
expected:
  hits:
    total:
      value: 2
      relation: "eq"
---
method: [GET]
json:
  query:
    match_phrase_prefix:
      payload.pull_request.body:
        query: "to p"
expected:
  hits:
    total:
      value: 1
      relation: "eq"
---
method: [GET]
json:
  query:
    match_phrase_prefix:
      payload.pull_request.body:
        query: "be to p"
expected:
  hits:
    total:
      value: 1
      relation: "eq"
---
method: [GET]
json:
  query:
    match_phrase_prefix:
      payload.commits.message:
        query: "automated comm"
expected:
  hits:
    total:
      value: 1
      relation: "eq"
    hits:
      - _source:
          payload:
            commits:
              - message: "automated commit"
---
method: [GET]
json:
  query:
    match_phrase_prefix:
      payload.commits.message:
        query: "fix"
        max_expansions: 2
expected:
  hits:
    total:
      value: 6
      relation: "eq"
---
# This is a bit of a sloppy just testing that the tokenizer property is
# plugged
#
# We only apply it to quickwit because the raw tokenizer does not exist in ES.
method: [GET]
engines:
  - quickwit
json:
  query:
    match_phrase_prefix:
      payload.commits.message:
        query: "automated comm"
        analyzer: raw
expected:
  hits:
    total:
      value: 0
      relation: "eq"
---
# This is a bit of a sloppy just testing that the tokenizer property is
# plugged
#
# We only apply it to quickwit because the raw tokenizer does not exist in ES.
method: [GET]
json:
  query:
    match_phrase_prefix:
      payload.commits.message:
        query: "automated comm"
        analyzer: inexistent_tokenizer
status_code: 400


================================================
FILE: quickwit/rest-api-tests/scenarii/es_compatibility/0011-exists-query.yaml
================================================
json:
  query:
    exists:
      field: type
expected:
  hits:
    total:
      value: 100
---
json:
  query:
    exists:
      field: thisfielddoesnotexists
expected:
  hits:
    total:
      value: 0
---
json:
  query:
    exists:
      field: payload.size
expected:
  hits:
    total:
      value: 60
---
json:
  query:
    exists:
      field: payload
expected:
  hits:
    total:
      # one of the docs contains `"payload":{}`
      value: 99
---
# Fortunately, ES does not accept this quirky syntax in the
# case of exists query.
json:
  query:
    exists: payload.size
status_code: 400


================================================
FILE: quickwit/rest-api-tests/scenarii/es_compatibility/0012-scroll-api.yaml
================================================
---
engines: ["quickwit"]
params:
    size: 1
    scroll: 30m
    allow_partial_search_results: "false"
json:
    query:
        match_all: {}
status_code: 400
expected:
    error:
        reason: "Invalid argument: Quickwit only supports scroll API with allow_partial_search_results set to true"
---
params:
  size: 1
  scroll: 30m
json:
  query:
    match_all: {}
  sort:
    - actor.id:
        order: desc
  aggs:
    mytypeagg:
      terms:
        field: type
        size: 5
store:
  scroll_id: _scroll_id
expected:
  _scroll_id:
    $expect: "len(val) > 4"
  aggregations:
    mytypeagg: {}
  hits:
    hits:
      - _source: {actor: {login: "miyuotsuki"}}
    total:
      value: 100
      relation: "eq"
---
method: GET
endpoint: "_search/scroll"
params:
  scroll: 30m
json:
  scroll_id:
    $previous: "val[\"_scroll_id\"]"
expected:
  _scroll_id:
    $expect: "len(val) > 4"
  hits:
    hits:
      - _source: {actor: {login: "ScottThiessen"}}
    total:
      value: 100
---
method: GET
endpoint: "_search/scroll"
params:
  scroll: 30m
json:
  scroll_id:
    $previous: "val[\"_scroll_id\"]"
expected:
  _scroll_id:
    $expect: "len(val) > 4"
  hits:
    hits:
      - _source: {actor: {login: "seenajon"}}
    total:
      value: 100
---
engines: ["quickwit"]
params:
  size: 1
  scroll: 31m
json:
  query:
    match_all: {}
  sort:
    - actor.id:
        order: desc
status_code: 400
expected:
  status: 400
  error:
    reason: "Invalid argument: Quickwit only supports scroll TTL period up to 1800 secs"
---
params:
  size: 40
  scroll: 30m
json:
  query:
    match_all: {}
  sort:
    - actor.id:
        order: desc
  aggs:
    mytypeagg:
      terms:
        field: type
        size: 5
store:
  scroll_id: _scroll_id
expected:
  _scroll_id:
    $expect: "len(val) > 4"
  aggregations:
    mytypeagg: {}
  hits:
    hits:
      $expect: "len(val) == 40"
    total:
      value: 100
      relation: "eq"
---
method: GET
endpoint: "_search/scroll"
params:
  scroll: 30m
json:
  scroll_id:
    $previous: "val[\"_scroll_id\"]"
expected:
  _scroll_id:
    $expect: "len(val) > 4"
  hits:
    hits:
      $expect: len(val) == 40
    total:
      value: 100
---
method: GET
endpoint: "_search/scroll"
params:
  scroll: 30m
json:
  scroll_id:
    $previous: "val[\"_scroll_id\"]"
expected:
  _scroll_id:
    $expect: "len(val) > 4"
  hits:
    hits:
      $expect: len(val) == 20
    total:
      value: 100
---
method: GET
endpoint: "_search/scroll"
params:
  scroll: 30m
json:
  scroll_id:
    $previous: "val[\"_scroll_id\"]"
expected:
  _scroll_id:
    $expect: "len(val) > 4"
  hits:
    hits:
      $expect: len(val) == 0
    total:
      value: 100
---
method: GET
endpoint: "_search/scroll"
params:
  scroll: 30m
json:
  scroll_id:
    $previous: "val[\"_scroll_id\"]"
expected:
  _scroll_id:
    $expect: "len(val) > 4"
  hits:
    hits:
      $expect: len(val) == 0
    total:
      value: 100


================================================
FILE: quickwit/rest-api-tests/scenarii/es_compatibility/0013-phrase-query.yaml
================================================
json:
  query:
    match_phrase:
      payload.commits.message: sign decoration
expected:
  hits:
    total:
      value: 1
---
json:
  query:
    match_phrase:
      payload.commits.message:
        query: sign decoration
expected:
  hits:
    total:
      value: 1
---
json:
  query:
    match_phrase:
      # There is a "zone of explosion" message.
      # Without slop no matches!
      payload.commits.message: zone explosion
expected:
  hits:
    total:
      value: 0
---
json:
  query:
    match_phrase:
      # There is a "zone of explosion" message.
      # Without slop no matches!
      payload.commits.message:
        query: zone explosion
        slop: 1
expected:
  hits:
    total:
      value: 1


================================================
FILE: quickwit/rest-api-tests/scenarii/es_compatibility/0014-multi-match-query.yaml
================================================
json:
  engines:
    - quickwit
  query:
    multi_match:
      query: sign decoration
      fields: []
status_code:
  400
expected:
---
json:
  query:
    multi_match:
      query: sign decoration
      fields: ["payload.commits.message"]
expected:
  hits:
    total:
      value: 1
---
json:
  query:
    multi_match:
      query: sign decoration
      # Apparently elasticsearch accepts a string here.
      fields: "payload.commits.message"
expected:
  hits:
    total:
      value: 1
---
json:
  query:
    multi_match:
      query: sign decoration
      fields:
        - inexistent_field
        - payload.commits.message
expected:
  hits:
    total:
      value: 1
---
json:
  query:
    multi_match:
      type: phrase
      query: sign decoration
      fields: ["payload.commits.message"]
expected:
  hits:
    total:
      value: 1
---
json:
  query:
    multi_match:
      type: phrase
      query: zone explosion
      fields: ["payload.commits.message"]
expected:
  hits:
    total:
      value: 0
---
json:
  query:
    multi_match:
      type: phrase
      query: zone explosion
      slop: 1
      fields: ["payload.commits.message"]
expected:
  hits:
    total:
      value: 1
---
engines:
    # TODO check the discrepancy with ES
    - quickwit
json:
  query:
    multi_match:
      type: most_fields
      query: the pomle missingtoken
      fields: ["payload.commits.message", "actor.login"]
expected:
  hits:
    total:
      value: 4
---
json:
  query:
    multi_match:
      type: phrase
      query: zone of expl
      fields: ["payload.commits.message"]
expected:
  hits:
    total:
      value: 0
---
json:
  query:
    multi_match:
      type: phrase_prefix
      query: zone of expl
      fields: ["payload.commits.message"]
expected:
  hits:
    total:
      value: 1
---
json:
  query:
    multi_match:
      type: phrase_prefix
      query: zone of expl
      # Yeah it makes no sense at all, but elastic accepts it.
      lenient: true
      fields: ["payload.commits.message"]
---
json:
  query:
    multi_match:
      type: most_fields
      query: the
      lenient: false
      fields: ["payload.commits.message", "hello"]


================================================
FILE: quickwit/rest-api-tests/scenarii/es_compatibility/0015-terms-query.yaml
================================================
json:
  query:
    terms:
      type:
        - PushEvent
        - CommitCommentEvent
expected:
  hits:
    total:
      value: 0
---
json:
  query:
    terms:
      type:
        - pushevent
        - commitcommentevent
expected:
  hits:
    total:
      value: 61


================================================
FILE: quickwit/rest-api-tests/scenarii/es_compatibility/0016-misc-query.yaml
================================================
json:
  query:
    multi_match:
      fields:
        - payload.commits.message
        - payload.description
        - payload.comment.body
      lenient: true
      query: to be
      type: phrase
expected:
  hits:
    total:
      value: 2
---
json:
  query:
    multi_match:
      fields:
        - payload.commits.message
        - payload.description
      lenient: true
      query: to b
      type: phrase
expected:
  hits:
    total:
      value: 0
---
json:
  query:
    multi_match:
      fields:
        - payload.commits.message
        - payload.description
        - payload.comment.body
      lenient: true
      query: to be
      type: phrase_prefix
expected:
  hits:
    total:
      value: 2
---
json:
  query:
    multi_match:
      fields:
        - payload.commits.message
        - payload.description
        - payload.comment.body
      lenient: true
      query: to b
      type: phrase_prefix
expected:
  hits:
    total:
      value: 3
---
json:
  query:
    query_string:
      default_field: payload.commits.message
      lenient: true
      query: "to AND the"
expected:
  hits:
    total:
      value: 3
---
json:
  query:
    query_string:
      fields:
        - payload.commits.message
      lenient: true
      query: "to AND the"
expected:
  hits:
    total:
      value: 3
---
engines: ["quickwit"]
json:
  query:
    exists:
      field: payload.commits.message
expected:
  hits:
    total:
      value: 59  # There are actually 60 documents where this field is not empty, but one of them has a field longer than 255 chars
---
# test exists for a non-fast field
json:
  query:
    exists:
      field: public
expected:
  hits:
    total:
      value: 100
---
json:
  query:
    match_all: {}
expected:
  hits:
    total:
      value: 100
---
json:
  query:
    terms:
      payload.commits.message:
        - fix
        - bug
        - problem
        - closes
expected:
  hits:
    total:
      value: 3


================================================
FILE: quickwit/rest-api-tests/scenarii/es_compatibility/0017-match-bool-prefix-query.yaml
================================================
method: [GET]
json:
  query:
    match_bool_prefix:
      payload.pull_request.body:
        query: "file not ch"
expected:
  hits:
    total:
      value: 1
      relation: "eq"
---
method: [GET]
json:
  query:
    match_bool_prefix:
      payload.pull_request.body:
        query: "file not chzn"
        operator: AND
expected:
  hits:
    total:
      value: 0
      relation: "eq"
---
method: [GET]
json:
  query:
    match_bool_prefix:
      payload.pull_request.body:
        query: "file not ch"
        operator: AND
expected:
  hits:
    total:
      value: 1
      relation: "eq"
---
method: [GET]
json:
  query:
    match_bool_prefix:
      payload.pull_request.body: "file not ch"
expected:
  hits:
    total:
      value: 1
      relation: "eq"
---
method: [GET]
json:
  query:
    match_phrase_prefix:
      payload.commits.message:
        query: "fix"
expected:
  hits:
    total:
      value: 7
      relation: "eq"


================================================
FILE: quickwit/rest-api-tests/scenarii/es_compatibility/0018-search_after.yaml
================================================
json:
  size: 1
  query:
      match_all: {}
  sort:
    - actor.id:
        order: desc
expected:
  hits:
    total:
      value: 100
      relation: eq
    hits:
      - sort: [10791502]
---
json:
  size: 1
  query:
      match_all: {}
  sort:
    - actor.id:
        order: desc
  search_after: [10791502]
expected:
  hits:
    total:
      value: 100
      relation: eq
    hits:
      - sort: [10791466]
---
json:
  size: 1
  query:
      match_all: {}
  sort:
    - actor.id:
        order: asc
  search_after: [5688]
expected:
  hits:
    total:
      value: 100
      relation: eq
    hits:
      - sort: [9018]
---
# Test with a search after value as string
# Quickwit should convert it to the correct type
json:
  size: 1
  query:
      match_all: {}
  sort:
    - actor.id:
        order: asc
  search_after: ["5688"]
expected:
  hits:
    total:
      value: 100
      relation: eq
    hits:
      - sort: [9018]
---
json:
  size: 1
  query:
      match_all: {}
  sort:
    - actor.id:
        order: asc
  search_after: [5688]
expected:
  hits:
    total:
      value: 100
      relation: eq
    hits:
      - sort: [9018]
---
json:
  size: 100
  track_total_hits: true
  query:
      match_all: {}
  sort:
    - created_at:
        order: asc
  search_after: [1422748815000]
expected:
  hits:
    hits:
      $expect: "len(val) == 4"
---
# Quickwit should accept timestamp as string.
json:
  size: 100
  track_total_hits: true
  query:
      match_all: {}
  sort:
    - created_at:
        order: asc
  search_after: ["1422748815000"]
expected:
  hits:
    hits:
      $expect: "len(val) == 4"
---
json:
  size: 100
  track_total_hits: true
  query:
      match_all: {}
  sort:
    - created_at:
        order: desc
  search_after: ["1422748800001"]
expected:
  hits:
    hits:
      $expect: "len(val) == 7"
---
# Only works for quickwit engine,
# `epoch_nanos_int` format is quickwit specific
engines:
  - quickwit
json:
  size: 100
  track_total_hits: true
  query:
      match_all: {}
  sort:
    - created_at:
        order: asc
        format: epoch_nanos_int
  search_after: [1422748815000000000]
expected:
  hits:
    hits:
      - sort: [1422748816000000000]
      - sort: [1422748816000000000]
      - sort: [1422748816000000000]
      - sort: [1422748816000000000]


================================================
FILE: quickwit/rest-api-tests/scenarii/es_compatibility/0019-count.yaml
================================================
endpoint: "gharchive/_count"
params:
  q: type:PushEvent
expected:
  count: 60
---
endpoint: "gharchive/_count"
expected:
  count: 100


================================================
FILE: quickwit/rest-api-tests/scenarii/es_compatibility/0020-stats.yaml
================================================
method: [GET]
engines:
  - quickwit
  - elasticsearch
endpoint: "gharchive/_stats"
expected:
  _all:
    primaries:
      docs:
        count: 100
      store:
        size_in_bytes:
          $expect: "val > 278300"
    total:
      segments:
        count: 1
      docs:
        count: 100
  indices:
    gharchive:
      primaries:
        docs:
          count: 100
        store:
          size_in_bytes:
            $expect: "val > 278300"
      total:
        segments:
          count: 1
        docs:
          count: 100
---
method: [GET]
engines:
  - quickwit
  - elasticsearch
endpoint: "ghar*/_stats"
expected:
  _all:
    primaries:
      docs:
        count: 100
    total:
      segments:
        count: 1
      docs:
        count: 100
  indices:
    gharchive:
      primaries:
        docs:
          count: 100
      total:
        segments:
          count: 1
        docs:
          count: 100
---
method: [GET]
engines:
  - quickwit
endpoint: "_stats"
expected:
  _all:
    primaries:
      docs:
        count: 104
    total:
      segments:
        count: 3
      docs:
        count: 104
  indices:
    gharchive:
      primaries:
        docs:
          count: 100
      total:
        segments:
          count: 1
        docs:
          count: 100
    fast_only:
      primaries:
        docs:
          count: 2
      total:
        segments:
          count: 1
        docs:
          count: 2
    empty_index:
      primaries:
        docs:
          count: 0
      total:
        segments:
          count: 0
        docs:
          count: 0


================================================
FILE: quickwit/rest-api-tests/scenarii/es_compatibility/0021-cat-indices.yaml
================================================
method: [GET]
engines:
  - quickwit
endpoint: "_cat/indices?format=json"
expected:
- index: empty_index
  docs.count: '0'
- index: fast_only
  docs.count: '2'
- index: gharchive
  dataset.size: 222.8kb
  docs.count: '100'
  docs.deleted: '0'
  health: green
  pri: '1'
  pri.store.size:
      $expect: 270 < float(val[:-2]) < 280
  rep: '1'
  status: open
  store.size:
      #272.4kb
      $expect: 270 < float(val[:-2]) < 280
  rep: '1'
  #uuid: gharchive:01HN2SDANHDN6WFAFNH7BBMQ8C
- index: otel-logs-v0_9
  docs.count: '0'
- index: otel-traces-v0_9
  docs.count: '0'
- index: simple_es_compat
  docs.count: '2'
---
method: [GET]
engines:
  - quickwit
endpoint: "_cat/indices/gharchive?format=json"
expected:
- dataset.size:
    # 222.8kb
    $expect: 220 < float(val[:-2]) < 230
  docs.count: '100'
  docs.deleted: '0'
  health: green
  index: gharchive
  pri: '1'
  pri.store.size:
      #272.4kb
      $expect: 270 < float(val[:-2]) < 280
  rep: '1'
  status: open
  store.size:
      # 272.4kb
      $expect: 270 < float(val[:-2]) < 280
  #uuid: gharchive:01HN2SDANHDN6WFAFNH7BBMQ8C
---
method: [GET]
engines:
  - quickwit
  - elasticsearch
endpoint: "_cat/indices/gharchive?format=json&h=docs.count,index"
expected:
- docs.count: '100'
  index: gharchive
--- # Wildcard test
method: [GET]
engines:
  - quickwit
  - elasticsearch
endpoint: "_cat/indices/gharc*?format=json&h=docs.count,index"
expected:
- docs.count: '100'
  index: gharchive
--- # health green test
method: [GET]
engines:
  - quickwit
  - elasticsearch
endpoint: "_cat/indices/gharchive?format=json&health=green"
expected:
- docs.count: '100'
  index: gharchive
--- # health red test
method: [GET]
engines:
  - quickwit
  - elasticsearch
endpoint: "_cat/indices/gharchive?format=json&health=red"
expected: []
---
# Quickwit only supports JSON output. (Elastic has a table like text output.)
method: [GET]
engines:
  - quickwit
endpoint: "_cat/indices/gharchive" # missing format=json
status_code: 400
---
# Quickwit does not supports the `v` parameter.
method: [GET]
engines:
  - quickwit
endpoint: "_cat/indices/gharchive?format=json&v=true" # invalid h=true
status_code: 400
---
method: [GET]
engines:
  - quickwit
  - elasticsearch
endpoint: "_cat/indices/gharchive?format=json&b=b" # unsupported bytes parameter
status_code: 400


================================================
FILE: quickwit/rest-api-tests/scenarii/es_compatibility/0022-source.yaml
================================================
--- # _source_excludes
params:
  _source_excludes: ["actor"]
json:
  size: 1
  query:
      match_all: {}
expected:
  hits:
    total:
      value: 100
      relation: eq
    hits:
      - _source:
          $expect: "not 'actor' in val" 
--- # _source_includes
params:
  _source_includes: ["actor"]
json:
  size: 1
  query:
      match_all: {}
expected:
  hits:
    total:
      value: 100
      relation: eq
    hits:
      - _source:
          $expect: "len(val) == 1" # Contains only 'actor'
          actor:
            id: 5688
--- # _source_includes and _source_excludes
params:
  _source_includes: "actor,id"
  _source_excludes: ["actor"]
json:
  size: 1
  query:
      match_all: {}
expected:
  hits:
    total:
      value: 100
      relation: eq
    hits:
      - _source:
          $expect: "len(val) == 1" # Contains only 'actor'
          id: 5688
--- # _source_includes with path
params:
  _source_includes: "actor.id"
json:
  size: 1
  query:
      match_all: {}
expected:
  hits:
    total:
      value: 100
      relation: eq
    hits:
      - _source:
          actor: 
            $expect: "len(val) == 1" # Contains only 'actor'
            id: 5688


================================================
FILE: quickwit/rest-api-tests/scenarii/es_compatibility/0023-extra_filters.yaml
================================================
# Extra filters are additional filters that are applied to the query. Useful for permissions and other use cases. 
engines:
  - quickwit
json:
  query:
      match_all: {}
params:
  extra_filters: "type:PushEvent"
expected:
  hits:
    total:
      value: 60
--- # 2 extra filters
engines:
  - quickwit
json:
  query:
      match_all: {}
params:
  extra_filters: "type:PushEvent,actor.login:jadonk"
expected:
  hits:
    total:
      value: 2
--- # Test mixing
engines:
  - quickwit
json:
  query:
    query_string:
      query: "type:PushEvent"
params:
  extra_filters: "actor.login:jadonk"
expected:
  hits:
    total:
      value: 2
--- # Test mixing
engines:
  - quickwit
json:
  query:
    query_string:
      query: "type:PushEvent"
params:
  extra_filters: "type:PushEvent,actor.login:jadonk"
expected:
  hits:
    total:
      value: 2


================================================
FILE: quickwit/rest-api-tests/scenarii/es_compatibility/0024-delete_indices.yaml
================================================
--- #Create indices quickwit
engines:
  - quickwit
method: POST
api_root: http://localhost:7280/api/v1/
endpoint: indexes/
json:
  version: "0.7"
  index_id: test_index1
  doc_mapping:
    mode: dynamic
sleep_after: 3
---
engines:
  - quickwit
method: POST
api_root: http://localhost:7280/api/v1/
endpoint: indexes/
json:
  version: "0.7"
  index_id: test_index2
  doc_mapping:
    mode: dynamic
sleep_after: 3
--- # create indices elasticsearch
engines:
  - elasticsearch
method: PUT
endpoint: test_index1
json: {
  "mappings": {
    "properties": {
      "created_at": {
        "type": "date",
        "store": true
      }
    }
  }
}
--- # create indices elasticsearch
engines:
  - elasticsearch
method: PUT
endpoint: test_index2
json: {
  "mappings": {
    "properties": {
      "created_at": {
        "type": "date",
        "store": true
      }
    }
  }
}
---
engines:
  - quickwit
  - elasticsearch
method: DELETE
endpoint: test_index1,does_not_exist
status_code: 404
--- # delete partially matching with ignore_unavailable
engines:
  - quickwit
  - elasticsearch
method: DELETE
endpoint: test_index1,does_not_exist
status_code: 200
params:
  ignore_unavailable: "true"
--- # already deleted
engines:
  - quickwit
  - elasticsearch
method: DELETE 
endpoint: test_index1
status_code: 404
---
engines:
  - quickwit
  - elasticsearch
method: DELETE
endpoint: test_index2
status_code: 200


================================================
FILE: quickwit/rest-api-tests/scenarii/es_compatibility/0025-msearch.yaml
================================================
endpoint: "_msearch"
method: POST
ndjson:
  - {"index":"gharchive"}
  - {"query" : {"match" : { "type": "PushEvent"}}, "size": 0, "track_total_hits": true}
expected:
  responses:
    - hits:
        total:
          value: 60
---
endpoint: "_msearch"
engines: ["quickwit"]
method: POST
params:
  extra_filters: "type:PushEvent,actor.login:jadonk"
ndjson:
  - {"index":"gharchive"}
  - {"query" : {"match" : { "type": "PushEvent"}}, "size": 0, "track_total_hits": true}
expected:
  responses:
    - hits:
        total:
          value: 2
---
# `_source_excludes` is not supported in elasticsearch' msearch.
# This parameter is quickwit specific.
# To get more info about the quirks of msearch parameters,
# https://github.com/elastic/elasticsearch/issues/4227
endpoint: "_msearch"
engines: ["quickwit"]
method: POST
params:
  _source_excludes: ["actor"]
ndjson:
  - {"index":"gharchive"}
  - {"query" : {"match_all" : {}}, "size": 1}
expected:
  responses:
    - hits:
        total:
          value: 100
          relation: eq
        hits:
          - _source:
              $expect: "not 'actor' in val"
---
# `_source_includes` is not supported in elasticsearch' msearch.
# This parameter is quickwit specific.
endpoint: "_msearch"
engines: ["quickwit"]
method: POST
params:
  _source_includes: ["actor"]
ndjson:
  - {"index":"gharchive"}
  - {"query" : {"match_all" : {}}, "size": 1}
expected:
  responses:
    - hits:
        total:
          value: 100
          relation: eq
        hits:
          - _source:
              $expect: "len(val) == 1" # Contains only 'actor'
              actor:
                id: 5688
---
# `{_sources: {"excludes": [..]}}` is currently not supported in Quickwit.
# To get more info about the quirks of msearch parameters,
# https://github.com/elastic/elasticsearch/issues/4227
endpoint: "_msearch"
engines: ["elasticsearch"]
method: POST
ndjson:
  - {"index":"gharchive"}
  - {"query" : {"match_all" : {}}, "size": 1, "_source": {"excludes": ["actor"]} }
expected:
  responses:
    - hits:
        total:
          value: 100
          relation: eq
        hits:
          - _source:
              $expect: "not 'actor' in val"
---
# Same as above
endpoint: "_msearch"
engines: ["elasticsearch"]
method: POST
ndjson:
  - {"index":"gharchive"}
  - {"query" : {"match_all" : {}}, "size": 1, "_source": {"includes": ["actor"]}}
expected:
  responses:
    - hits:
        total:
          value: 100
          relation: eq
        hits:
          - _source:
              $expect: "len(val) == 1" # Contains only 'actor'
              actor:
                id: 5688
---
# test missing index
endpoint: "_msearch"
method: POST
ndjson:
  - {"index":"idontexist"}
  - {"query" : {"match" : { "type": "PushEvent"}}, "size": 0, "track_total_hits": true}
expected:
  responses:
    - status: 404
---
endpoint: "_msearch"
method: POST
ndjson:
  - {"index":"idontexist", "ignore_unavailable": true}
  - {"query" : {"match" : { "type": "PushEvent"}}, "size": 0}
expected:
  responses:
    - hits:
        total:
          value: 0
      status: 200


================================================
FILE: quickwit/rest-api-tests/scenarii/es_compatibility/0026-resolve.yaml
================================================
method: GET
endpoint: /_resolve/index/gh*
expected:
  indices:
    - name: gharchive
      attributes:
        - open
  aliases: []
  data_streams: []


================================================
FILE: quickwit/rest-api-tests/scenarii/es_compatibility/0027-cluster-health.yaml
================================================
method: GET
endpoint: /_cluster/health
status_code: 200


================================================
FILE: quickwit/rest-api-tests/scenarii/es_compatibility/0028-fast_only_field_query.yaml
================================================
# Search for a term in a field that is not indexed but is a fast field
engines:
  - quickwit
endpoint: "fast_only/_search"
params:
  size: 0
json:
  track_total_hits: true
  query:
    term:
      fast_text: "abc-123"
expected:
  hits:
    total:
      value: 1
      relation: "eq"
--- # term query with no matches
engines:
  - quickwit
endpoint: "fast_only/_search"
params:
  size: 0
json:
  track_total_hits: true
  query:
    term:
      fast_text: "zzz"
expected:
  hits:
    total:
      value: 0
      relation: "eq"

--- # term set query with partial match
engines:
  - quickwit
endpoint: "fast_only/_search"
params:
  size: 0
json:
  track_total_hits: true
  query:
    terms:
      fast_text:
        - "abc-123"
        - "zzz"
expected:
  hits:
    total:
      value: 1
      relation: "eq"

--- # term set query with multiple matches
engines:
  - quickwit
endpoint: "fast_only/_search"
params:
  size: 0
json:
  track_total_hits: true
  query:
    terms:
      fast_text:
        - "abc-123"
        - "def-456"
expected:
  hits:
    total:
      value: 2
      relation: "eq"

--- # term query on nested JSON field
engines:
  - quickwit
endpoint: "fast_only/_search"
params:
  size: 0
json:
  track_total_hits: true
  query:
    term:
      obj.nested_text: "abc-123"
expected:
  hits:
    total:
      value: 1
      relation: "eq"

--- # term query with no matches
engines:
  - quickwit
endpoint: "fast_only/_search"
params:
  size: 0
json:
  track_total_hits: true
  query:
    term:
      obj.nested_text: "zzz"
expected:
  hits:
    total:
      value: 0
      relation: "eq"

--- # term set query
engines:
  - quickwit
endpoint: "fast_only/_search"
params:
  size: 0
json:
  track_total_hits: true
  query:
    terms:
      obj.nested_text:
        - "abc-123"
        - "ghi-789"
expected:
  hits:
    total:
      value: 2
      relation: "eq"

--- # term set query with no matches
engines:
  - quickwit
endpoint: "fast_only/_search"
params:
  size: 0
json:
  track_total_hits: true
  query:
    terms:
      obj.nested_text:
        - "zzz"
expected:
  hits:
    total:
      value: 0
      relation: "eq"


================================================
FILE: quickwit/rest-api-tests/scenarii/es_compatibility/0029-wildcard.yaml
================================================
json:
  query:
    wildcard:
      actor.login:
        value: jad?nk
expected:
  hits:
    total:
      value: 2
---
json:
  query:
    wildcard:
      actor.login:
        value: j*nk
expected:
  hits:
    total:
      value: 2
---
json:
  query:
    wildcard:
      actor.login: jad?nk
expected:
  hits:
    total:
      value: 2
---
json:
  query:
    wildcard:
      repo.name:
        value: RUS*
        case_insensitive: true
expected:
  hits:
    total:
      value: 1
---
json:
  query:
    wildcard:
      repo.name:
        value: RUS*
        case_insensitive: false
expected:
  hits:
    total:
      value: 0


================================================
FILE: quickwit/rest-api-tests/scenarii/es_compatibility/0030-prefix.yaml
================================================
json:
  query:
    prefix:
      actor.login:
        value: jado
expected:
  hits:
    total:
      value: 2
---
json:
  query:
    prefix:
      actor.login:
        value: j
expected:
  hits:
    total:
      value: 10
---
json:
  query:
    prefix:
      actor.login: jado
expected:
  hits:
    total:
      value: 2
---
json:
  query:
    prefix:
      repo.name:
        value: RUST
        case_insensitive: true
expected:
  hits:
    total:
      value: 1
---
json:
  query:
    prefix:
      repo.name:
        value: RUST
        case_insensitive: false
expected:
  hits:
    total:
      value: 0


================================================
FILE: quickwit/rest-api-tests/scenarii/es_compatibility/0031-regex.yaml
================================================
# Basic regex match
params:
  size: 0
json:
  track_total_hits: true
  query:
    regexp:
      type:
        value: ".*event"
expected:
  hits:
    total:
      value: 100
      relation: "eq"
---
# Regex always match from start to end (`(re)` equivalent to `^(re)$`)
params:
  size: 3
json:
  track_total_hits: true
  query:
    regexp:
      type:
        value: "event"
expected:
  hits:
    total:
      value: 0
      relation: "eq"
---
# Regex with case_insensitive flag
params:
  size: 3
json:
  track_total_hits: true
  query:
    regexp:
      repo.name:
        # lowercased by the tokenizer
        value: "RUST.*"
        case_insensitive: true
expected:
  hits:
    total:
      value: 1
      relation: "eq"
---
params:
  size: 3
json:
  track_total_hits: true
  query:
    regexp:
      type:
        # lowercased by the tokenizer
        value: "RUST.*"
        case_insensitive: false
expected:
  hits:
    total:
      value: 0
      relation: "eq"
---
# In Elasticsearch, ^ and $ are escaped when they are used as anchors, so
# ^pushevent$ only matches if the original term is "^pushevent$". In Quickwit
# this fails (for now) because tantivy-fst returns an error on all zero width
# assertions.
engines:
  - elasticsearch
endpoint: "simple_es_compat/_search"
params:
  size: 3
json:
  track_total_hits: true
  query:
    regexp:
      keyword_text:
        value: "red$"
expected:
  hits:
    total:
      value: 0
      relation: "eq"
---
engines:
  - elasticsearch
endpoint: "simple_es_compat/_search"
params:
  size: 3
json:
  track_total_hits: true
  query:
    regexp:
      keyword_text:
        value: "gold$"
expected:
  hits:
    total:
      value: 1
      relation: "eq"
---
# regex in query_string
params:
  size: 10
json:
  query:
    query_string:
      query: "type:/pushevent/"
expected:
  hits:
    total:
      value: 60
      relation: "eq"


================================================
FILE: quickwit/rest-api-tests/scenarii/es_compatibility/0032-mappings.yaml
================================================
method: [GET]
engines:
  - elasticsearch
endpoint: "gharchive/_mappings"
expected:
  gharchive: {}
  # _all:
  #   primaries:
  #     docs:
  #       count: 100
  #     store:
  #       size_in_bytes:
  #         $expect: "val > 278300"
  #   total:
  #     segments:
  #       count: 1
  #     docs:
  #       count: 100
  # indices:
  #   gharchive:
  #     primaries:
  #       docs:
  #         count: 100
  #       store:
  #         size_in_bytes:
  #           $expect: "val > 278300"
  #     total:
  #       segments:
  #         count: 1
  #       docs:
  #         count: 100
---
# method: [GET]
# engines:
#   - quickwit
#   - elasticsearch
# endpoint: "ghar*/_stats"
# expected:
#   _all:
#     primaries:
#       docs:
#         count: 100
#     total:
#       segments:
#         count: 1
#       docs:
#         count: 100
#   indices:
#     gharchive:
#       primaries:
#         docs:
#           count: 100
#       total:
#         segments:
#           count: 1
#         docs:
#           count: 100
# ---
# method: [GET]
# engines:
#   - quickwit
# endpoint: "_stats"
# expected:
#   _all:
#     primaries:
#       docs:
#         count: 102
#     total:
#       segments:
#         count: 2
#       docs:
#         count: 102
#   indices:
#     gharchive:
#       primaries:
#         docs:
#           count: 100
#       total:
#         segments:
#           count: 1
#         docs:
#           count: 100
#     fast_only:
#       primaries:
#         docs:
#           count: 2
#       total:
#         segments:
#           count: 1
#         docs:
#           count: 2
#     empty_index:
#       primaries:
#         docs:
#           count: 0
#       total:
#         segments:
#           count: 0
#         docs:
#           count: 0


================================================
FILE: quickwit/rest-api-tests/scenarii/es_compatibility/_ctx.elasticsearch.yaml
================================================
api_root: http://localhost:9200/


================================================
FILE: quickwit/rest-api-tests/scenarii/es_compatibility/_ctx.quickwit.yaml
================================================
api_root: "http://localhost:7280/api/v1/_elastic/"


================================================
FILE: quickwit/rest-api-tests/scenarii/es_compatibility/_ctx.yaml
================================================
method: [GET, POST]
endpoint: "gharchive/_search"


================================================
FILE: quickwit/rest-api-tests/scenarii/es_compatibility/_setup.elasticsearch.yaml
================================================
# Delete possibly remaining index
method: DELETE
endpoint: gharchive
status_code: null
---
method: DELETE
endpoint: empty_index
status_code: null
---
method: DELETE
endpoint: simple_es_compat
status_code: null
---
# empty index
method: PUT
endpoint: empty_index
json: {
  "mappings": {
    "properties": {
      "created_at": {
        "type": "date",
        "store": true
      }
    }
  }
}
---
# Create index
method: PUT
endpoint: gharchive
json: {
  "settings": {
    "analysis": {
    "normalizer": {
      "keyword_lowercase": {
        "type": "custom",
        "filter": ["lowercase"]
      },
      "keyword_keepcase": { "type": "custom" }
    }
  }
  },
  "mappings": {
    "properties": {
      "id": {
        "type": "text",
        "store": true,
        "norms": false,
        "index_options": "docs"
      },
      "type": {
        "type": "text",
        "store": true,
        "norms": false,
        "index_options": "docs",
        "fielddata": true
      },
      "actor": {
        "properties": {
          "id": {
            "type": "long",
            "store": true
          },
          "login": {
            "type": "keyword",
            "normalizer": "keyword_lowercase",
            "store": true,
            "norms": false,
            "index_options": "docs"
          },
          "gravatar_id": {
            "type": "text",
            "store": true,
            "norms": false,
            "index_options": "docs"
          },
          "url": {
            "type": "text",
            "store": true,
            "norms": false,
            "index_options": "docs"
          },
          "avatar_url": {
            "type": "text",
            "store": true,
            "norms": false,
            "index_options": "docs"
          }
        }
      },
      "repo": {
        "properties": {
          "id": {
            "type": "long",
            "store": true
          },
          "name": {
            "type": "keyword",
            "normalizer": "keyword_keepcase",
            "store": true
          },
          "url": {
            "type": "text",
            "store": true,
            "norms": false,
            "index_options": "docs"
          }
        }
      },
      "payload": {
        "type": "object"
      },
      "created_at": {
        "type": "date",
        "store": true
      }
    }
  }
}
---
method: PUT
endpoint: gharchive/_settings
json: { "number_of_replicas": 0 }
---
# Create index
method: PUT
endpoint: simple_es_compat
json: {
  "mappings": {
    "properties": {
      "keyword_text": {
        "type": "keyword",
      }
    }
  }
}
---
method: PUT
endpoint: simple_es_compat/_settings
json: { "number_of_replicas": 0 }
---
# Ingest documents
method: POST
endpoint: _bulk
params:
  refresh: "true"
headers: {"Content-Type": "application/json", "content-encoding": "gzip"}
body_from_file: gharchive-bulk.json.gz
---
method: POST
endpoint: _bulk
params:
  refresh: "true"
headers: {"Content-Type": "application/json"}
ndjson:
  - {"index":{"_index":"simple_es_compat"}}
  - {"keyword_text": "red"}
  - {"index":{"_index":"simple_es_compat"}}
  - {"keyword_text": "gold$"}


================================================
FILE: quickwit/rest-api-tests/scenarii/es_compatibility/_setup.quickwit.yaml
================================================
# Delete possibly remaining index
method: DELETE
api_root: http://localhost:7280/api/v1/
endpoint: indexes/gharchive
status_code: null
---
# Delete possibly remaining index
method: DELETE
api_root: http://localhost:7280/api/v1/
endpoint: indexes/empty_index
status_code: null
---
# Delete possibly remaining index
method: DELETE
api_root: http://localhost:7280/api/v1/
endpoint: indexes/simple_es_compat
status_code: null
---
# Create index
method: POST
api_root: http://localhost:7280/api/v1/
endpoint: indexes/
json:
  version: "0.7"
  index_id: empty_index
  doc_mapping:
    field_mappings:
        - name: created_at
          type: datetime
          fast: true
sleep_after: 3
---
# Create index
method: POST
api_root: http://localhost:7280/api/v1/
endpoint: indexes/
json:
  version: "0.7"
  index_id: gharchive
  doc_mapping:
    index_field_presence: true
    timestamp_field: created_at
    mode: dynamic
    field_mappings:
        - name: repo
          type: object
          field_mappings:
              - name: name
                type: text
                fast: true
                indexed: true
                tokenizer: raw
        - name: public
          type: bool
          fast: false
          indexed: true
        - name: created_at
          type: datetime
          fast: true
          fast_precision: milliseconds
    dynamic_mapping:
      expand_dots: true
      tokenizer: default
      fast:
        normalizer: lowercase
      record: position
---
# Ingest documents
method: POST
endpoint: _bulk
params:
  refresh: "true"
headers: {"Content-Type": "application/json", "content-encoding": "gzip"}
body_from_file: gharchive-bulk.json.gz
---
# Delete possibly remaining index
method: DELETE
api_root: http://localhost:7280/api/v1/
endpoint: indexes/fast_only
status_code: null
---
# Create a dedicated index with a root fast-only field
method: POST
api_root: http://localhost:7280/api/v1/
endpoint: indexes/
json:
  version: "0.7"
  index_id: fast_only
  doc_mapping:
    field_mappings:
      - name: fast_text
        type: text
        fast: true
        indexed: false
      - name: obj
        type: object
        field_mappings:
          - name: nested_text
            type: text
            fast: true
            indexed: false
sleep_after: 1
---
# Ingest a couple documents into fast_only
method: POST
api_root: http://localhost:7280/api/v1/
endpoint: fast_only/ingest
params:
  commit: force
ndjson:
  - {"fast_text": "abc-123", "obj": {"nested_text": "abc-123"}}
  - {"fast_text": "def-456", "obj": {"nested_text": "ghi-789"}}

---
# Create simple_es_compat index
method: POST
api_root: http://localhost:7280/api/v1/
endpoint: indexes/
json:
  version: "0.7"
  index_id: simple_es_compat
  doc_mapping:
    field_mappings:
      - name: keyword_text
        type: text
        fast: true
        indexed: true
        tokenizer: raw
sleep_after: 1
---
# Ingest documents into simple_es_compat
method: POST
api_root: http://localhost:7280/api/v1/
endpoint: simple_es_compat/ingest
params:
  commit: force
ndjson:
  - {"keyword_text": "red"}
  - {"keyword_text": "gold$"}


================================================
FILE: quickwit/rest-api-tests/scenarii/es_compatibility/_teardown.elasticsearch.yaml
================================================
# Delete possibly remaining index
method: DELETE
endpoint: gharchive
---
method: DELETE
endpoint: empty_index
---
method: DELETE
endpoint: test_index1
status_code: null
---
method: DELETE
endpoint: test_index2
status_code: null


================================================
FILE: quickwit/rest-api-tests/scenarii/es_compatibility/_teardown.quickwit.yaml
================================================
# Delete index
method: DELETE
api_root: http://localhost:7280/api/v1/
endpoint: indexes/gharchive
---
# Delete index
method: DELETE
api_root: http://localhost:7280/api/v1/
endpoint: indexes/empty_index
---
method: DELETE
api_root: http://localhost:7280/api/v1/
endpoint: indexes/fast_only
status_code: null
---
method: DELETE
api_root: http://localhost:7280/api/v1/
endpoint: indexes/test_index1
status_code: null
--- # Cleanup
method: DELETE
api_root: http://localhost:7280/api/v1/
endpoint: indexes/test_index2
status_code: null
--- # Cleanup
method: DELETE
api_root: http://localhost:7280/api/v1/
endpoint: indexes/test_index1
status_code: null
--- # Cleanup
method: DELETE
api_root: http://localhost:7280/api/v1/
endpoint: indexes/search_after
status_code: null


================================================
FILE: quickwit/rest-api-tests/scenarii/es_compatibility/bulk/0001-happy-path.yaml
================================================
ndjson:
  - index: { "_index": "test-index", "_id": "1" }
  - message: Hello, World!
  - index: { "_index": "test-index" }
  - message: Hola, Mundo!
status_code: 200
expected:
  errors: false
  items:
    - index:
        _index: test-index
        _id: "1"
        status: 201
    - index:
        _index: test-index
        status: 201


================================================
FILE: quickwit/rest-api-tests/scenarii/es_compatibility/bulk/0002-malformed-action.yaml
================================================
ndjson:
  - del: { "_index": "test-index", "_id": "1" }
status_code: 400
expected:
  status: 400
  error:
    type: illegal_argument_exception
    reason:
      $expect: val.startswith('Malformed action/metadata line [1]')


================================================
FILE: quickwit/rest-api-tests/scenarii/es_compatibility/bulk/0003-validation-failed-index-missing.yaml
================================================
ndjson:
  - index: { "_id": "1" }
  - message: Hello, World!
status_code: 400
expected:
  status: 400
  error:
    type: action_request_validation_exception
    reason: "Validation Failed: 1: index is missing;"


================================================
FILE: quickwit/rest-api-tests/scenarii/es_compatibility/bulk/0004-put-request.yaml
================================================
method: PUT
ndjson:
  - index: { "_index": "test-index" }
  - message: Hello, World!
status_code: 200
expected:
  errors: false
  items:
    - index:
        _index: test-index
        status: 201


================================================
FILE: quickwit/rest-api-tests/scenarii/es_compatibility/bulk/0005-document-parsing-exception.yaml
================================================
ndjson:
  - index: { "_index": "test-index", "_id": "5" }
  - message: Hello, World!
    timestamp: timestamp
status_code: 200
expected:
  errors: true
  items:
    - index:
        _index: test-index
        _id: "5"
        status: 400
        error:
          type: document_parsing_exception
          reason:
            $expect: "'timestamp' in val"


================================================
FILE: quickwit/rest-api-tests/scenarii/es_compatibility/bulk/0006-partial-index-not-found.yaml
================================================
ndjson:
  - index: { "_index": "test-index-not-found" }
  - message: Hello, World!"
  - index: { "_index": "test-index" }
  - message: Hola, Mundo!
  - index: { "_index": "test-index-pattern-777" }
  - message: Hola, Mundo!
status_code: 200
expected:
  errors: true
  items:
    - index:
        _index: test-index-not-found
        status: 404
        error:
          index: test-index-not-found
          type: index_not_found_exception
          reason:
            $expect: val.startswith('no such index [test-index-not-found]')
    - index:
        _index: test-index
        status: 201
    - index:
        _index: test-index-pattern-777
        status: 201


================================================
FILE: quickwit/rest-api-tests/scenarii/es_compatibility/bulk/0007-illegal-index-name.yaml
================================================
# allowed characters are different between ES and Quickwit
engines:
  - quickwit
ndjson:
  - index: { "_index": "test-index" }
  - message: Hola, Mundo!
  - index: { "_index": "test-index-pattern-11" }
  - message: Hola, Mundo!
  - index: { "_index": "test-index-pattern-&1" }
  - message: Hola, Mundo!
status_code: 200
expected:
  errors: true
  items:
    - index:
        _index: test-index
        status: 201
    - index:
        _index: test-index-pattern-11
        status: 201
    - index:
        _index: test-index-pattern-&1
        status: 400


================================================
FILE: quickwit/rest-api-tests/scenarii/es_compatibility/bulk/_ctx.elasticsearch.yaml
================================================
api_root: http://localhost:9200


================================================
FILE: quickwit/rest-api-tests/scenarii/es_compatibility/bulk/_ctx.quickwit.yaml
================================================
api_root: http://localhost:7280/api/v1/_elastic


================================================
FILE: quickwit/rest-api-tests/scenarii/es_compatibility/bulk/_ctx.yaml
================================================
method: [POST]
endpoint: "_bulk"


================================================
FILE: quickwit/rest-api-tests/scenarii/es_compatibility/bulk/_setup.elasticsearch.yaml
================================================
# Delete possibly remaining index
method: DELETE
endpoint: test-index*
status_code: null
---
method: PUT
endpoint: test-index
json: {
  "mappings": {
    "properties": {
      "message": {
        "type": "text",
        "store": true
      },
      "timestamp": {
        "type": "integer",
        "store": true
      }
    }
  }
}
---
# Only create indexes automatically for specific pattern
method: PUT
endpoint: _cluster/settings
json:
  transient:
    action.auto_create_index: "test-index-pattern-*"


================================================
FILE: quickwit/rest-api-tests/scenarii/es_compatibility/bulk/_setup.quickwit.yaml
================================================
# Delete possibly remaining index and template
method: DELETE
api_root: http://localhost:7280/api/v1/
endpoint: indexes/test-index
status_code: null
---
method: DELETE
api_root: http://localhost:7280/api/v1/
endpoint: indexes/test-index-pattern-11
status_code: null
---
method: DELETE
api_root: http://localhost:7280/api/v1/
endpoint: indexes/test-index-pattern-777
status_code: null
---
method: DELETE
api_root: http://localhost:7280/api/v1/
endpoint: templates/test-index-template
status_code: null
---
method: POST
api_root: http://localhost:7280/api/v1/
endpoint: indexes/
json:
  version: "0.8"
  index_id: test-index
  doc_mapping:
    field_mappings:
        - name: message
          type: text
        - name: timestamp
          type: datetime
sleep_after: 3
---
# Create index template
method: POST
api_root: http://localhost:7280/api/v1/
endpoint: templates
json:
  version: "0.8"
  template_id: test-index-template
  index_id_patterns:
    - test-index-pattern-*
  doc_mapping:
    mode: dynamic
  indexing_settings:
    commit_timeout_secs: 1


================================================
FILE: quickwit/rest-api-tests/scenarii/es_compatibility/bulk/_teardown.elasticsearch.yaml
================================================
# Reconfigure with the default settings
method: PUT
endpoint: _cluster/settings
json:
  transient:
    action.auto_create_index: "true"
---
method: DELETE
endpoint: test-index*
status_code: null


================================================
FILE: quickwit/rest-api-tests/scenarii/es_compatibility/bulk/_teardown.quickwit.yaml
================================================
method: DELETE
api_root: http://localhost:7280/api/v1/
endpoint: indexes/test-index
---
method: DELETE
api_root: http://localhost:7280/api/v1/
endpoint: indexes/test-index-pattern-11
---
method: DELETE
api_root: http://localhost:7280/api/v1/
endpoint: indexes/test-index-pattern-777
---
method: DELETE
api_root: http://localhost:7280/api/v1/
endpoint: templates/test-index-template


================================================
FILE: quickwit/rest-api-tests/scenarii/es_compatibility/multi-indices/0001-muti_indices_query.yaml
================================================
endpoint: "gharchive-*/_search"
params:
  q: "*"
expected:
  hits:
    total:
      value: 4
      relation: "eq"
    hits:
      $expect: "len(val) == 4"
---
endpoint: "gharchive-*/_search"
params:
  q: "actor.login:fmassot OR actor.login:guilload"
expected:
  hits:
    total:
      value: 2
      relation: "eq"
    hits:
      $expect: "len(val) == 2"
---
endpoint: "gharchive-1,gharchive-2/_search"
params:
  q: "actor.login:fmassot OR actor.login:guilload"
expected:
  hits:
    total:
      value: 2
      relation: "eq"
    hits:
      $expect: "len(val) == 2"
---
endpoint: "gharchive-1%2Cgharchive-2/_search"
params:
  q: "actor.login:fmassot OR actor.login:guilload"
expected:
  hits:
    total:
      value: 2
      relation: "eq"
    hits:
      $expect: "len(val) == 2"
---
# Index information
endpoint: "gharchive-1%2Cgharchive-2/_search"
params:
  size: 2
json:
  query:
    match_all: {}
  sort:
    created_at:
      order: desc
expected:
  hits:
    total:
      value: 4
      relation: "eq"
    hits:
      - _source:
          actor:
            login: trinity
        _index: "gharchive-2"
      - _source:
          actor:
            login: fulmicoton
        _index: "gharchive-1"
---
endpoint: "gharchive-*,-gharchive-2/_search"
params:
  q: "*"
expected:
  hits:
    total:
      value: 2
      relation: "eq"
    hits:
      $expect: "len(val) == 2"
---
endpoint: "gharchive-*,-*-2/_search"
params:
  q: "*"
expected:
  hits:
    total:
      value: 2
      relation: "eq"
    hits:
      $expect: "len(val) == 2"
---
# It is valid to have a pattern that does not match
# any index.
endpoint: "invalidptn-*/_search"
params:
  size: 2
json:
  query:
    match_all: {}
  sort:
    created_at:
      order: desc
expected:
  hits:
    total:
      value: 0
      relation: "eq"
    hits: []
---
# If a specific index (not a pattern) does not exist,
# this returns an error.
endpoint: "invalidptn*-,nonexistingindex/_search"
params:
  size: 2
json:
  query:
    match_all: {}
  sort:
    created_at:
      order: desc
status_code: 404
---
# If one of the pattern matches no index,
# but another matches some indices, it is valid too.
endpoint: "invalidptn*-,gharchive*/_search"
params:
  size: 2
json:
  query:
    match_all: {}
  sort:
    created_at:
      order: desc
expected:
  hits:
    total:
      value: 104
      relation: "eq"
    hits:
      $expect: "len(val) == 2"


================================================
FILE: quickwit/rest-api-tests/scenarii/es_compatibility/multi-indices/0002-muti_indices_scroll.yaml
================================================
endpoint: "gharchive-*/_search"
params:
  size: 1
  scroll: 30m
json:
  query:
    match_all: {}
  sort:
    - actor.id:
        order: desc
store:
  scroll_id: _scroll_id
expected:
  _scroll_id:
    $expect: "len(val) > 4"
  hits:
    hits:
      - _source: {actor: {login: "trinity"}}
    total:
      value: 4
      relation: "eq"
---
method: GET
endpoint: "_search/scroll"
params:
  scroll: 30m
json:
  scroll_id:
    $previous: "val[\"_scroll_id\"]"
expected:
  _scroll_id:
    $expect: "len(val) > 4"
  hits:
    hits:
      - _source: {actor: {login: "guilload"}}
    total:
      value: 4
---
method: GET
endpoint: "_search/scroll"
params:
  scroll: 30m
json:
  scroll_id:
    $previous: "val[\"_scroll_id\"]"
expected:
  _scroll_id:
    $expect: "len(val) > 4"
  hits:
    hits:
      - _source: {actor: {login: "fulmicoton"}}
    total:
      value: 4
---
endpoint: "gharchive-*,non-existing-index/_search"
params:
  size: 1
  scroll: 30m
json:
  query:
    match_all: {}
  sort:
    - actor.id:
        order: desc
store:
  scroll_id: _scroll_id
status_code: 404
---
endpoint: "non-existing-index-*/_search"
params:
  size: 1
  scroll: 30m
json:
  query:
    match_all: {}
  sort:
    - actor.id:
        order: desc
expected:
  $expect: "'_scroll_id' in val"


================================================
FILE: quickwit/rest-api-tests/scenarii/es_compatibility/multi-indices/0003-multi_indices_aggs.yaml
================================================
# Test date histogram aggregation
method: [POST]
engines:
  - quickwit
endpoint: "gharchive-*/_search"
json:
  query: { match_all: {} }
  aggs:
    logins: 
      terms: 
        field: "actor.login"
        order:
          _key: asc
expected:
  aggregations:
    logins:
      buckets:
      - doc_count: 1
        key: fmassot
      - doc_count: 1
        key: fulmicoton
      - doc_count: 1
        key: guilload
      - doc_count: 1
        key: trinity
      sum_other_doc_count: 0
---
# Test date histogram aggregation
method: [POST]
endpoint: "noindexmatching-*/_search"
json:
  query: { match_all: {} }
  aggs:
    logins:
      terms:
        field: "actor.login"
        order:
          _key: asc
expected:
  $expect: "not 'aggregations' in val"

================================================
FILE: quickwit/rest-api-tests/scenarii/es_compatibility/multi-indices/0004-missing_index_query.yaml
================================================
endpoint: "idontexist/_search"
params:
  q: "*"
status_code: 404
---
endpoint: "idontexist/_search"
params:
  q: "*"
  ignore_unavailable: "true"
expected:
  hits:
    total:
      value: 0
---
endpoint: "gharchive-*,idontexist/_search"
params:
  q: "*"
status_code: 404
---
endpoint: "gharchive-*,idontexist/_search"
params:
  q: "*"
  ignore_unavailable: "true"
expected:
  hits:
    total:
      value: 4


================================================
FILE: quickwit/rest-api-tests/scenarii/es_compatibility/multi-indices/_ctx.yaml
================================================
method: [GET, POST]


================================================
FILE: quickwit/rest-api-tests/scenarii/es_compatibility/multi-indices/_setup.elasticsearch.yaml
================================================
# Delete possibly remaining index
method: DELETE
endpoint: gharchive-1
status_code: null
---
# Delete possibly remaining index
method: DELETE
endpoint: gharchive-2
status_code: null
---
# Create index 1
method: PUT
endpoint: gharchive-1
json: {
  "mappings": {
    "properties": {
      "id": {
        "type": "text",
        "store": true,
        "norms": false,
        "index_options": "docs"
      },
      "type": {
        "type": "text",
        "store": true,
        "norms": false,
        "index_options": "docs",
        "fielddata": true
      },
      "actor": {
        "properties": {
          "id": {
            "type": "long",
            "store": true
          },
          "login": {
            "type": "text",
            "store": true,
            "norms": false,
            "index_options": "docs"
          }
        }
      },
      "created_at": {
        "type": "date",
        "store": true
      }
    }
  }
}
---
# Create index 2
method: PUT
endpoint: gharchive-2
json: {
  "mappings": {
    "properties": {
      "id": {
        "type": "text",
        "store": true,
        "norms": false,
        "index_options": "docs"
      },
      "type": {
        "type": "text",
        "store": true,
        "norms": false,
        "index_options": "docs",
        "fielddata": true
      },
      "actor": {
        "properties": {
          "id": {
            "type": "long",
            "store": true
          },
          "login": {
            "type": "text",
            "store": true,
            "norms": false,
            "index_options": "docs"
          }
        }
      },
      "created_at": {
        "type": "date",
        "store": true
      }
    }
  }
}
---
# Ingest documents in index 1 and 2
method: POST
endpoint: _bulk
params:
  refresh: "true"
headers: {"Content-Type": "application/json"}
ndjson:
  - "index": { "_index": "gharchive-1" }
  - {"id": 1, "created_at":"2015-02-01T00:00:14Z", "type": "CreateEvent", "actor": { "id": 1, "login": "fmassot" } }
  - "index": { "_index": "gharchive-1" }
  - {"id": 2, "created_at":"2015-02-01T00:00:16Z", "type": "CreateEvent", "actor": { "id": 2, "login": "fulmicoton" } }
  - "index": { "_index": "gharchive-2" }
  - {"id": 3, "created_at":"2015-02-01T00:00:15Z", "type": "CreateEvent", "actor": { "id": 3, "login": "guilload" } }
  - "index": { "_index": "gharchive-2" }
  - {"id": 4, "created_at":"2015-02-01T00:00:17Z", "type": "CreateEvent", "actor": { "id": 4, "login": "trinity" } }


================================================
FILE: quickwit/rest-api-tests/scenarii/es_compatibility/multi-indices/_setup.quickwit.yaml
================================================
# Delete possibly remaining index
method: DELETE
api_root: http://localhost:7280/api/v1/
endpoint: indexes/gharchive-1
status_code: null
---
method: DELETE
api_root: http://localhost:7280/api/v1/
endpoint: indexes/gharchive-2
status_code: null
---
# Create index 1
method: POST
api_root: http://localhost:7280/api/v1/
endpoint: indexes/
json:
  version: "0.7"
  index_id: gharchive-1
  doc_mapping:
    index_field_presence: true
    timestamp_field: created_at
    mode: dynamic
    field_mappings:
        - name: created_at
          type: datetime
          fast: true
    dynamic_mapping:
      expand_dots: true
      tokenizer: default
      fast:
        normalizer: lowercase
      record: position
---
# Create index 2
method: POST
api_root: http://localhost:7280/api/v1/
endpoint: indexes/
json:
  version: "0.7"
  index_id: gharchive-2
  doc_mapping:
    index_field_presence: true
    timestamp_field: created_at
    mode: strict
    field_mappings:
      - name: created_at
        type: datetime
        fast: true
      - name: id
        type: u64
        fast: true
      - name: type
        type: text
        fast: true
      - name: actor
        type: object
        fast: true
        field_mappings:
          - name: id
            type: u64
            fast: true
          - name: login
            type: text
            fast: true
---
# Ingest documents in index 1
method: POST
api_root: http://localhost:7280/api/v1/
endpoint: gharchive-1/ingest
params:
  commit: "force"
headers: {"Content-Type": "application/json"}
ndjson:
  - {"id": 1, "created_at":"2015-02-01T00:00:14Z", "type": "CreateEvent", "actor": { "id": 1, "login": "fmassot" } }
  - {"id": 2, "created_at":"2015-02-01T00:00:16Z", "type": "CreateEvent", "actor": { "id": 2, "login": "fulmicoton" } }
---
# Ingest documents in index 2
method: POST
api_root: http://localhost:7280/api/v1/
endpoint: gharchive-2/ingest
params:
  commit: "force"
headers: {"Content-Type": "application/json"}
ndjson:
  - {"id": 3, "created_at":"2015-02-01T00:00:15Z", "type": "CreateEvent", "actor": { "id": 3, "login": "guilload" } }
  - {"id": 4, "created_at":"2015-02-01T00:00:17Z", "type": "CreateEvent", "actor": { "id": 4, "login": "trinity" } }


================================================
FILE: quickwit/rest-api-tests/scenarii/es_compatibility/multi-indices/_teardown.elasticsearch.yaml
================================================
method: DELETE
endpoint: gharchive-1
---
method: DELETE
endpoint: gharchive-2


================================================
FILE: quickwit/rest-api-tests/scenarii/es_compatibility/multi-indices/_teardown.quickwit.yaml
================================================
method: DELETE
api_root: http://localhost:7280/api/v1/
endpoint: indexes/gharchive-1
---
method: DELETE
api_root: http://localhost:7280/api/v1/
endpoint: indexes/gharchive-2


================================================
FILE: quickwit/rest-api-tests/scenarii/es_compatibility_info/0001-info.yaml
================================================
expected:
  cluster_name:
    $expect: "val != ''"
  version:
    build_date:
      $expect: "val != ''"


================================================
FILE: quickwit/rest-api-tests/scenarii/es_compatibility_info/_ctx.elasticsearch.yaml
================================================
api_root: http://localhost:9200


================================================
FILE: quickwit/rest-api-tests/scenarii/es_compatibility_info/_ctx.quickwit.yaml
================================================
api_root: "http://localhost:7280/api/v1/_elastic"


================================================
FILE: quickwit/rest-api-tests/scenarii/es_compatibility_info/_ctx.yaml
================================================
method: [GET]
endpoint: "/"


================================================
FILE: quickwit/rest-api-tests/scenarii/es_field_capabilities/0001-field-capabilities.yaml
================================================
# Test _field_caps API
method: [GET]
engines:
  - quickwit
endpoint: fieldcaps/_field_caps
expected:
  indices:
  - fieldcaps
  fields:
    nested.response:
      long:
        type: long
        metadata_field: false
        searchable: true
        aggregatable: true
    nested.name:
      keyword:
        type: keyword
        metadata_field: false
        searchable: true
        aggregatable: true
      text:
        type: text
        metadata_field: false
        searchable: true
        aggregatable: true
    host:
      ip:
        type: ip
        metadata_field: false
        searchable: true
        aggregatable: true
    mixed: # This is a little weird case (values [5, -5.5]), since coercion happens only on the columnar side. That's why `long` is not aggregatable.
      long:
        metadata_field: false
        searchable: true
        aggregatable: false
      double:
        metadata_field: false
        searchable: true
        aggregatable: true
    date:
      date_nanos:
        metadata_field: false
        searchable: true
        aggregatable: true
    response:
      long:
        metadata_field: false
        searchable: true
        aggregatable: true
    id:
      long:
        metadata_field: false
        searchable: true
        aggregatable: true
      double:
        metadata_field: false
        searchable: true
        aggregatable: true
    name:
      keyword:
        metadata_field: false
        searchable: true
        aggregatable: true
      text:
        metadata_field: false
        searchable: true
        aggregatable: true
    tags:
      keyword:
        metadata_field: false
        searchable: true
        aggregatable: true
      text:
        metadata_field: false
        searchable: true
        aggregatable: true
---
# Test _field_caps API with timestamp filter
method: [GET]
engines:
  - quickwit
endpoint: fieldcaps/_field_caps?start_timestamp=1684993001
expected:
  indices:
  - fieldcaps
  fields:
    $expect: "not 'id' in val" # Filtered by start_timestamp
    mixed: # This is a little weird case (values [5, -5.5]), since coercion happens only on the columnar side. That's why `long` is not aggregatable.
      long:
        metadata_field: false
        searchable: true
        aggregatable: false
      double:
        metadata_field: false
        searchable: true
        aggregatable: true
    date:
      date_nanos:
        metadata_field: false
        searchable: true
        aggregatable: true
---
# Test fields parameter with `.dynamic` suffix
method: [GET]
engines:
  - quickwit
endpoint: fieldcaps/_field_caps?fields=nested.response,nested.name
expected:
  indices:
  - fieldcaps
  fields:
    nested.response:
      long:
        metadata_field: false
        searchable: true
        aggregatable: true
    nested.name:
      keyword:
        metadata_field: false
        searchable: true
        aggregatable: true
      text:
        metadata_field: false
        searchable: true
        aggregatable: true
---
# Test fields parameter with wildcard
method: [GET]
engines:
  - quickwit
endpoint: fieldcaps/_field_caps?fields=nest*
expected:
  indices:
  - fieldcaps
  fields:
    nested.response:
      long:
        metadata_field: false
        searchable: true
        aggregatable: true
    nested.name:
      keyword:
        metadata_field: false
        searchable: true
        aggregatable: true
      text:
        metadata_field: false
        searchable: true
        aggregatable: true
---
# Test fields parameter with wildcard
method: [GET]
engines:
  - quickwit
endpoint: fieldcaps/_field_caps?fields=nest*
expected:
  indices:
  - fieldcaps
  fields:
    nested.response:
      long:
        metadata_field: false
        searchable: true
        aggregatable: true
    nested.name:
      keyword:
        metadata_field: false
        searchable: true
        aggregatable: true
      text:
        metadata_field: false
        searchable: true
        aggregatable: true
---
# Test fields parameter with wildcard
method: [GET]
engines:
  - quickwit
endpoint: fieldcaps/_field_caps?fields=nested.*ponse
expected:
  indices:
  - fieldcaps
  fields:
    nested.response:
      long:
        metadata_field: false
        searchable: true
        aggregatable: true
---
# Compare with elastic search
method: [GET]
endpoint: fieldcaps/_field_caps?fields=nested.*ponse
expected:
  indices:
  - fieldcaps
  fields:
    nested.response:
      long:
        type: long
        metadata_field: false
        searchable: true
        aggregatable: true
---
# Compare ip field with elastic search
method: [GET]
endpoint: fieldcaps*/_field_caps?fields=host
expected:
  indices:
  - fieldcaps
  - fieldcaps-2
  fields:
    host:
      ip:
        type: ip
        metadata_field: false
        searchable: true
        aggregatable: true
---
# Compare ip field with elastic search
method: [GET]
engines:
  - quickwit
  - elasticsearch
endpoint: fieldcaps/_field_caps?fields=date
expected:
  indices:
  - fieldcaps
  fields:
    date:
      date_nanos:
        type: date_nanos
        metadata_field: false
        searchable: true
        aggregatable: true
---
# Wildcard on index name
method: [GET]
engines:
  - quickwit
endpoint: fieldca*/_field_caps?fields=tags*
expected:
  indices:
  - fieldcaps
  - fieldcaps-2
  fields:
    tags:
      keyword:
        type: keyword
        metadata_field: false
        searchable: true
        aggregatable: true
    tags-2:
      keyword:
        type: keyword
        metadata_field: false
        searchable: true
        aggregatable: true
        indices:
          - fieldcaps-2
---
# _field_caps without index endpoint
method: [GET]
engines:
  - quickwit
endpoint: _field_caps?fields=tags*
expected:
  indices:
  - fieldcaps
  - fieldcaps-2
  fields:
    tags:
      keyword:
        type: keyword
        metadata_field: false
        searchable: true
        aggregatable: true
    tags-2:
      keyword:
        type: keyword
        metadata_field: false
        searchable: true
        aggregatable: true
        indices:
          - fieldcaps-2
---
# Wildcard on index name + Wildcard without match
method: [GET]
endpoint: fieldca*,blub*/_field_caps?fields=date
expected:
  indices:
  - fieldcaps
  - fieldcaps-2
  fields:
    date:
      date_nanos:
        type: date_nanos
        metadata_field: false
        searchable: true
        aggregatable: true
---
# Exact match index + Non matching exact index
method: [GET]
endpoint: fieldcaps,blub/_field_caps?fields=date
status_code: 404
---
# Compare ip field with elastic search
method: [GET]
endpoint: doesnotexist/_field_caps?fields=date
status_code: 404
---
# Compare ip field with elastic search
method: [GET]
endpoint: doesno*texist/_field_caps?fields=date
status_code: 200
---
# Test _field_caps API with index_filter (term query)
# Note: term queries require exact token match; 'fritz' is lowercase due to default tokenizer
method: [POST]
endpoint: fieldcaps/_field_caps?fields=*
json:
  index_filter:
    term:
      name: "fritz"
expected:
  indices:
  - fieldcaps
  fields:
    name:
      keyword:
        type: keyword
        metadata_field: false
        searchable: true
        aggregatable: true
      text:
        type: text
        metadata_field: false
        searchable: true
        aggregatable: true
---
# Test _field_caps API with index_filter (match_all query)
method: [POST]
endpoint: fieldcaps/_field_caps?fields=name
json:
  index_filter:
    match_all: {}
expected:
  indices:
  - fieldcaps
  fields:
    name:
      keyword:
        type: keyword
        metadata_field: false
        searchable: true
        aggregatable: true
      text:
        type: text
        metadata_field: false
        searchable: true
        aggregatable: true
---
# Test _field_caps API with index_filter (bool query)
method: [POST]
endpoint: fieldcaps/_field_caps?fields=response,name
json:
  index_filter:
    bool:
      must:
        - term:
            name: "fritz"
      filter:
        - range:
            response:
              gte: 30
expected:
  indices:
  - fieldcaps
  fields:
    response:
      long:
        type: long
        metadata_field: false
        searchable: true
        aggregatable: true
    name:
      keyword:
        type: keyword
        metadata_field: false
        searchable: true
        aggregatable: true
      text:
        type: text
        metadata_field: false
        searchable: true
        aggregatable: true
---
# Test _field_caps API with invalid index_filter
method: [POST]
endpoint: fieldcaps/_field_caps?fields=*
json:
  index_filter:
    invalid_query_type:
      field: "value"
status_code: 400
---
# Test _field_caps API with empty index_filter (should return 400 like ES)
method: [POST]
engines:
  - quickwit
  - elasticsearch
endpoint: fieldcaps/_field_caps?fields=name
json:
  index_filter: {}
status_code: 400
---
# Test _field_caps API with index_filter using tag field for split pruning (QW-only)
method: [POST]
engines:
  - quickwit
endpoint: fieldcaps/_field_caps?fields=name
json:
  index_filter:
    term:
      tags: "nice"
expected:
  indices:
  - fieldcaps
  fields:
    name:
      keyword:
        type: keyword
        metadata_field: false
        searchable: true
        aggregatable: true
      text:
        type: text
        metadata_field: false
        searchable: true
        aggregatable: true


================================================
FILE: quickwit/rest-api-tests/scenarii/es_field_capabilities/_ctx.elasticsearch.yaml
================================================
api_root: http://localhost:9200/


================================================
FILE: quickwit/rest-api-tests/scenarii/es_field_capabilities/_ctx.quickwit.yaml
================================================
api_root: "http://localhost:7280/api/v1/_elastic/"


================================================
FILE: quickwit/rest-api-tests/scenarii/es_field_capabilities/_ctx.yaml
================================================
method: [GET, POST]
headers:
  Content-Type: application/json


================================================
FILE: quickwit/rest-api-tests/scenarii/es_field_capabilities/_setup.elasticsearch.yaml
================================================
# Delete possibly remaining index
method: DELETE
endpoint: fieldcaps
status_code: null
---
method: DELETE
endpoint: fieldcaps-2
status_code: null
---
# Create index 1
method: PUT
endpoint: fieldcaps
json: {
  "mappings": {
    "properties": {
      "host": {
        "type": "ip",
        "store": true
      },
      "date": {
        "type": "date_nanos"
      },
    }
  }
}
---
# Create index 2
method: PUT
endpoint: fieldcaps-2
json: {
  "mappings": {
    "properties": {
      "host": {
        "type": "ip",
        "store": true
      },
      "date": {
        "type": "date_nanos"
      },
    }
  }
}
---
# Ingest documents in fieldcaps
method: POST
endpoint: _bulk
params:
  refresh: "true"
headers: {"Content-Type": "application/json"}
ndjson:
  - "index": { "_index": "fieldcaps" }
  - {"name": "Fritz", "response": 30, "id": 5, "host": "192.168.0.1", "tags": ["nice", "cool"]}
  - "index": { "_index": "fieldcaps" }
  - {"nested": {"name": "Fritz", "response": 30}, "date": "2015-01-11T12:10:30Z", "host": "192.168.0.11", "tags": ["nice"]}
  - "index": { "_index": "fieldcaps-2" }
  - {"name": "Fritz", "response": 30, "id": 6, "host": "192.168.0.1", "tags": ["nice", "cool"], "tags-2": ["awesome"]}


================================================
FILE: quickwit/rest-api-tests/scenarii/es_field_capabilities/_setup.quickwit.yaml
================================================
# Delete possibly remaining index
method: DELETE
api_root: http://localhost:7280/api/v1/
endpoint: indexes/fieldcaps
status_code: null
---
method: DELETE
api_root: http://localhost:7280/api/v1/
endpoint: indexes/fieldcaps-2
status_code: null
---
# Create index
method: POST
api_root: http://localhost:7280/api/v1/
endpoint: indexes/
json:
  version: "0.7"
  index_id: fieldcaps
  doc_mapping:
    mode: dynamic
    dynamic_mapping:
      tokenizer: default
      fast: true
    timestamp_field: date
    tag_fields: ["tags"]
    field_mappings:
      - name: date
        type: datetime
        input_formats:
          - rfc3339
        fast_precision: seconds
        fast: true
      - name: host
        type: ip
        fast: true
      - name: tags
        type: array<text>
        tokenizer: raw
        fast: true
---
# Create index
method: POST
api_root: http://localhost:7280/api/v1/
endpoint: indexes/
json:
  version: "0.7"
  index_id: fieldcaps-2
  doc_mapping:
    mode: dynamic
    dynamic_mapping:
      tokenizer: default
      fast: true
    field_mappings:
      - name: date
        type: datetime
        input_formats:
          - rfc3339
        fast_precision: seconds
        fast: true
      - name: host
        type: ip
        fast: true
---
# Ingest documents
method: POST
api_root: http://localhost:7280/api/v1/
endpoint: fieldcaps/ingest
params:
  commit: force
ndjson:
  - {"name": "Fritz", "response": 30, "id": 5, "date": "2015-01-10T12:00:00Z", "host": "192.168.0.1", "tags": ["nice", "cool"]}
  - {"nested": {"name": "Fritz", "response": 30}, "date": "2015-01-11T12:00:00Z", "host": "192.168.0.11", "tags": ["nice"]}
---
# Ingest documents split #1 index fieldcaps
method: POST
api_root: http://localhost:7280/api/v1/
endpoint: fieldcaps/ingest
params:
  commit: force
ndjson:
  - {"id": -5.5, "date": "2018-01-10T12:00:00Z"} # cross split mixed type
---
# Ingest documents split #2 index fieldcaps
method: POST
api_root: http://localhost:7280/api/v1/
endpoint: fieldcaps/ingest
params:
  commit: force
ndjson:
  - {"mixed": 5, "date": "2023-01-10T12:00:00Z"} # inter split mixed type
  - {"mixed": -5.5, "date": "2024-01-10T12:00:00Z"}
---
# Ingest documents in index fieldcaps-2
method: POST
api_root: http://localhost:7280/api/v1/
endpoint: fieldcaps-2/ingest
params:
  commit: force
ndjson:
  - {"name": "Fritz", "response": 30, "id": 6, "host": "192.168.0.1", "tags": ["nice", "cool"], "tags-2": ["awesome"]}


================================================
FILE: quickwit/rest-api-tests/scenarii/es_field_capabilities/_teardown.elasticsearch.yaml
================================================
# # Delete index
method: DELETE
endpoint: fieldcaps
---
method: DELETE
endpoint: fieldcaps-2


================================================
FILE: quickwit/rest-api-tests/scenarii/es_field_capabilities/_teardown.quickwit.yaml
================================================
# # Delete index
method: DELETE
api_root: http://localhost:7280/api/v1/
endpoint: indexes/fieldcaps
---
method: DELETE
api_root: http://localhost:7280/api/v1/
endpoint: indexes/fieldcaps-2


================================================
FILE: quickwit/rest-api-tests/scenarii/multi_splits/0001-request-optimizations.yaml
================================================
json:
  size: 1
  track_total_hits: true
  query:
      match_all: {}
  sort:
    - timestamp:
        order: asc
expected:
  hits:
    hits:
      - _source: {"timestamp": "2015-01-10T10:00:00Z"}
---
json:
  size: 2
  track_total_hits: true
  query:
      match_all: {}
  sort:
    - timestamp:
        order: asc
expected:
  hits:
    hits:
      - _source: {"timestamp": "2015-01-10T10:00:00Z"}
      - _source: {"timestamp": "2015-01-10T10:00:00Z"}
---
json:
  size: 3
  track_total_hits: true
  query:
      match_all: {}
  sort:
    - timestamp:
        order: asc
expected:
  hits:
    hits:
      - _source: {"timestamp": "2015-01-10T10:00:00Z"}
      - _source: {"timestamp": "2015-01-10T10:00:00Z"}
      - _source: {"timestamp": "2015-01-10T10:00:00Z"}
---
json:
  size: 5
  track_total_hits: true
  query:
      match_all: {}
  sort:
    - timestamp:
        order: asc
expected:
  hits:
    hits:
      - _source: {"timestamp": "2015-01-10T10:00:00Z"}
      - _source: {"timestamp": "2015-01-10T10:00:00Z"}
      - _source: {"timestamp": "2015-01-10T10:00:00Z"}
      - _source: {"timestamp": "2015-01-10T10:00:00Z"}
      - _source: {"timestamp": "2015-01-10T12:00:00Z"}
--- # ASC + TIMESTAMP filter
json:
  size: 5
  track_total_hits: true
  query:
    range:
      timestamp:
        gte: "2015-01-10T12:00:00Z"
  sort:
    - timestamp:
        order: asc
expected:
  hits:
    hits:
      - _source: {"timestamp": "2015-01-10T12:00:00Z"}
      - _source: {"timestamp": "2015-01-10T13:00:00Z"}
      - _source: {"timestamp": "2015-01-10T14:00:00.000000001Z"}
      - _source: {"timestamp": "2015-01-11T12:00:00Z"}
      - _source: {"timestamp": "2015-01-11T12:00:00Z"}
--- # ASC + TIMESTAMP filter
json:
  size: 5
  track_total_hits: true
  query:
    range:
      timestamp:
        lt: "2015-01-10T12:00:00Z"
  sort:
    - timestamp:
        order: asc
expected:
  hits:
    hits:
      - _source: {"timestamp": "2015-01-10T10:00:00Z"}
      - _source: {"timestamp": "2015-01-10T10:00:00Z"}
      - _source: {"timestamp": "2015-01-10T10:00:00Z"}
      - _source: {"timestamp": "2015-01-10T10:00:00Z"}
--- # DESC
json:
  size: 6
  track_total_hits: true
  query:
      match_all: {}
  sort:
    - timestamp:
        order: desc
expected:
  hits:
    hits:
      - _source: {"timestamp": "2016-01-11T12:00:00Z"}
      - _source: {"timestamp": "2016-01-10T10:00:00Z"}
      - _source: {"timestamp": "2015-01-11T12:00:00Z"}
      - _source: {"timestamp": "2015-01-11T12:00:00Z"}
      - _source: {"timestamp": "2015-01-11T12:00:00Z"}
      - _source: {"timestamp": "2015-01-11T12:00:00Z"}
---
json:
  size: 7
  track_total_hits: true
  query:
      match_all: {}
  sort:
    - timestamp:
        order: desc
expected:
  hits:
    hits:
      - _source: {"timestamp": "2016-01-11T12:00:00Z"}
      - _source: {"timestamp": "2016-01-10T10:00:00Z"}
      - _source: {"timestamp": "2015-01-11T12:00:00Z"}
      - _source: {"timestamp": "2015-01-11T12:00:00Z"}
      - _source: {"timestamp": "2015-01-11T12:00:00Z"}
      - _source: {"timestamp": "2015-01-11T12:00:00Z"}
      - _source: {"timestamp": "2015-01-10T14:00:00.000000001Z"}


================================================
FILE: quickwit/rest-api-tests/scenarii/multi_splits/_ctx.yaml
================================================
method: [GET]
endpoint: "multi_splits/_search"
# The entire suite is just for Quickwit
engines: [quickwit]
api_root: "http://localhost:7280/api/v1/_elastic/"


================================================
FILE: quickwit/rest-api-tests/scenarii/multi_splits/_setup.quickwit.yaml
================================================
# Delete possibly remaining index
method: DELETE
endpoint: indexes/multi_splits
status_code: null
---
# Create index
method: POST
api_root: http://localhost:7280/api/v1/
endpoint: indexes/
json:
  version: "0.7"
  index_id: multi_splits
  doc_mapping:
    mode: dynamic
    timestamp_field: timestamp
    field_mappings:
        - name: timestamp
          type: datetime
          input_formats:
            - rfc3339
          fast: true
sleep_after: 3
---
method: POST
api_root: http://localhost:7280/api/v1/
endpoint: multi_splits/ingest
params:
  commit: force
min_splits: 1
max_splits: 10
#seed: 3694
shuffle_ndjson:
  - {"timestamp": "2015-01-10T10:00:00Z"}
  - {"timestamp": "2015-01-11T12:00:00Z"}
  - {"timestamp": "2015-01-10T10:00:00Z"}
  - {"timestamp": "2015-01-10T13:00:00Z"}
  - {"timestamp": "2015-01-11T12:00:00Z"}
  - {"timestamp": "2015-01-10T10:00:00Z"}
  - {"timestamp": "2015-01-10T14:00:00.000000001Z"} # 1h later than 2.doc
  - {"timestamp": "2015-01-11T12:00:00Z"}
  - {"timestamp": "2015-01-10T10:00:00Z"}
  - {"timestamp": "2015-01-10T12:00:00Z"} # 1h earlier than 2. doc
  - {"timestamp": "2015-01-11T12:00:00Z"}
  - {"timestamp": "2016-01-10T10:00:00Z"}
  - {"timestamp": "2016-01-11T12:00:00Z"}


================================================
FILE: quickwit/rest-api-tests/scenarii/multi_splits/_teardown.quickwit.yaml
================================================
method: DELETE
api_root: http://localhost:7280/api/v1/
endpoint: indexes/multi_splits
status_code: null


================================================
FILE: quickwit/rest-api-tests/scenarii/qw_search_api/0001_ts_range.yaml
================================================
# This tests a simple request with no queries.
endpoint: simple/search
params:
  query: "*"
  start_timestamp: 1684993001
  end_timestamp: 1684993002
expected:
  num_hits: 1
---
endpoint: simple/search
params:
  query: "*"
  start_timestamp: 1684993002
  end_timestamp: 1684993004
expected:
  num_hits: 2
---
endpoint: simple/search
params:
  query: "*"
  start_timestamp: 1684993002
  end_timestamp: 1684993004
expected:
  num_hits: 2
---
endpoint: simple/search
params:
  query: "ts:>=2023/05/25"
expected:
  num_hits: 4
---
endpoint: simple/search
params:
  query: "ts:>=1684993002 AND ts:<1684993004"
expected:
  num_hits: 2
---
endpoint: simple/search
params:
  query: "auto_date:>=2023-05-25T00:00:00Z AND auto_date:<2023-05-26T00:00:00Z"
expected:
  num_hits: 2


================================================
FILE: quickwit/rest-api-tests/scenarii/qw_search_api/0002_negative_search.yaml
================================================
# regression test for bizarre handling of - vs NOT when no positive clause is present
endpoint: simple/search
params:
  query: "-ts:1234567890 AND -ts:1234567891"
expected:
  num_hits: 4
---
endpoint: simple/search
params:
  query: "NOT ts:1234567890 AND NOT ts:1234567891"
expected:
  num_hits: 4
---
endpoint: simple/search
params:
  query: "NOT ts:1234567890 AND -ts:1234567891"
expected:
  num_hits: 4
---
endpoint: simple/search
params:
  query: "-ts:1234567890 AND NOT ts:1234567891"
expected:
  num_hits: 4


================================================
FILE: quickwit/rest-api-tests/scenarii/qw_search_api/0003_exists_search.yaml
================================================
endpoint: nested/search
params:
  query: "doesnotexist:*"
expected:
  num_hits: 0
---
# json fast fields:
endpoint: nested/search
params:
  query: "json_fast:*"
expected:
  num_hits: 1
---
endpoint: nested/search
params:
  query: "json_fast.field_c:*"
expected:
  num_hits: 1
---
endpoint: nested/search
params:
  query: "json_fast.doesnotexist:*"
expected:
  num_hits: 0
---
# json text fields:
endpoint: nested/search
params:
  query: "json_text.field_a:*"
expected:
  num_hits: 2
---
endpoint: nested/search
params:
  query: "json_text.field_b:*"
expected:
  num_hits: 1
---
endpoint: nested/search
params:
  query: "json_text:*"
expected:
  num_hits: 2
---
# object fields:
endpoint: nested/search
params:
  query: "object_multi.object_fast_field:*"
expected:
  num_hits: 2
---
endpoint: nested/search
params:
  query: "object_multi.doesnotexist:*"
expected:
  num_hits: 0
---
endpoint: nested/search
params:
  query: "object_multi.object_text_field:*"
expected:
  num_hits: 1
---
endpoint: nested/search
params:
  query: "object_multi:*"
expected:
  num_hits: 3


================================================
FILE: quickwit/rest-api-tests/scenarii/qw_search_api/0004_exact_string.yaml
================================================
## using an index (with the raw tokenizer)
endpoint: nested/search
method: POST
json:
  query: "text_raw:indexed-with-raw-tokenizer-dashes"
expected:
  num_hits: 1
---
endpoint: nested/search
method: POST
json:
  query: "text_raw:indexed_with_raw_tokenizer_dashes"
expected:
  num_hits: 0
---
endpoint: nested/search
method: POST
json:
  query: "text_raw:indexed-with-raw"
expected:
  num_hits: 0
---
endpoint: nested/search
method: POST
json:
  query: 'text_raw:"indexed with raw tokenizer dashes"'
expected:
  num_hits: 1
---
endpoint: nested/search
method: POST
json:
  query: 'text_raw:"indexed with raw"'
expected:
  num_hits: 0
---
## using a fast field (use a range query to force using the fast field)
endpoint: nested/search
method: POST
json:
  query: "text_fast:fast-text-value-dashes"
expected:
  num_hits: 1
---
endpoint: nested/search
method: POST
json:
  query: "text_fast:[fast-text-value-dashes TO fast-text-value-dashes]"
expected:
  num_hits: 1
---
endpoint: nested/search
method: POST
json:
  query: "text_fast:[fast_text_value_dashes TO fast_text_value_dashes]"
expected:
  num_hits: 0
---
endpoint: nested/search
method: POST
json:
  query: "text_fast:[fast-text-value TO fast-text-value]"
expected:
  num_hits: 0
---
# unfortunately, the query parser does not support escaping whitespaces
# use the Elasticsearch API instead
endpoint: nested/search
method: POST
json:
  query: 'text_fast:["fast text value whitespaces" TO "fast text value whitespacesd"]'
status_code: 400
---
endpoint: nested/search
method: POST
json:
  query: "text_fast:[fast text value whitespaces TO fast text value whitespaces]"
status_code: 400
---
endpoint: nested/search
method: POST
json:
  query: "text_fast:[fast\ text\ value\ whitespaces TO fast\ text\ value\ whitespaces]"
status_code: 400


================================================
FILE: quickwit/rest-api-tests/scenarii/qw_search_api/0005_fast_field_search.yaml
================================================
# Validate searching on a fast-only (non-indexed) field
endpoint: nested/search
method: POST
json:
  query: "text_fast:fast-text-value-dashes"
expected:
  num_hits: 1
---
# Non-matching exact value should return no hits
endpoint: nested/search
method: POST
json:
  query: "text_fast:fast_text_value_dashes"
expected:
  num_hits: 0


================================================
FILE: quickwit/rest-api-tests/scenarii/qw_search_api/_ctx.yaml
================================================
method: GET
engines: ["quickwit"]
api_root: "http://localhost:7280/api/v1/"
headers:
  Content-Type: application/json


================================================
FILE: quickwit/rest-api-tests/scenarii/qw_search_api/_setup.quickwit.yaml
================================================
# Delete possibly remaining index
method: DELETE
endpoint: indexes/simple
status_code: null
---
# Create index
method: POST
endpoint: indexes/
json:
  version: "0.7"
  index_id: simple
  doc_mapping:
    timestamp_field: ts
    mode: dynamic
    field_mappings:
      - name: ts
        type: datetime
        fast: true
      - name: not_fast
        type: datetime
        fast: true
    dynamic_mapping:
      tokenizer: default
      expand_dots: true
      fast: true
---
# Ingest documents
method: POST
endpoint: simple/ingest
params:
  commit: force
ndjson:
  - {"ts": 1684993001, "not_fast": 1684993001, "auto_date": "2023-05-25T10:00:00Z"}
  - {"ts": 1684993002, "not_fast": 1684993002, "auto_date": "2023-05-25T11:00:00Z"}
---
# Ingest documents split #2
method: POST
endpoint: simple/ingest
params:
  commit: force
ndjson:
  - {"ts": 1684993003, "not_fast": 1684993003}
  - {"ts": 1684993004, "not_fast": 1684993004}
  # a missing timestamp
  - {"not_fast": 1684993003}
---
method: DELETE
endpoint: indexes/nested
status_code: null
---
method: POST
endpoint: indexes/
json:
  version: "0.7"
  index_id: nested
  doc_mapping:
    index_field_presence: true
    # default mode is dynamic
    field_mappings:
      - name: json_text
        type: json
        indexed: true
      - name: json_fast
        type: json
        stored: true
        fast: true
      - name: object_multi
        type: object
        field_mappings:
          - name: object_text_field
            type: text
          - name: object_fast_field
            type: u64
            fast: true
      - name: text_fast
        type: text
        fast: true
        indexed: false
      - name: text_raw
        type: text
        fast: false
        indexed: true
        tokenizer: raw

---
method: POST
endpoint: nested/ingest
params:
  commit: force
ndjson:
  - {"json_text": {"field_a": "hello", "field_b": "world"}}
  - {"json_text": {"field_a": "hi"}}
  - {"json_fast": {"field_c": 1}}
  - {"object_multi": {"object_text_field": "multi hello"}}
  - {"object_multi": {"object_fast_field": 1}}
  - {"object_multi": {"object_fast_field": 2}}
  - {"text_raw": "indexed-with-raw-tokenizer-dashes"}
  - {"text_raw": "indexed with raw tokenizer dashes"}
  - {"text_fast": "fast-text-value-dashes"}
  - {"text_fast": "fast text value whitespaces"}


================================================
FILE: quickwit/rest-api-tests/scenarii/qw_search_api/_teardown.quickwit.yaml
================================================
method: DELETE
endpoint: indexes/simple
---
method: DELETE
endpoint: indexes/nested


================================================
FILE: quickwit/rest-api-tests/scenarii/search_after/0001-search_after_edge_case.yaml
================================================
json:
  size: 1
  query:
      match_all: {}
  sort:
    - val_u64:
        order: asc
  search_after: [-10]
expected:
  hits:
    total:
      value: 5
      relation: eq
    hits:
      - sort: [0]
--- # f64 to u64
json:
  size: 1
  query:
      match_all: {}
  sort:
    - val_u64:
        order: asc
  search_after: [0.2]
expected:
  hits:
    total:
      value: 5
      relation: eq
    hits:
      - sort: [20]
--- # u64 to i64
desc: "search after u64 to i64 asc"
json:
  size: 5
  query:
      match_all: {}
  sort:
    - val_i64:
        order: asc
  search_after: [250]
expected:
  hits:
    total:
      value: 5
      relation: eq
    hits:
      - sort: [300]
      - sort: [9223372036854775807]
      - sort: [9223372036854775807]
--- # u64 to i64
desc: "search after u64 to i64 desc"
json:
  size: 5
  query:
      match_all: {}
  sort:
    - val_i64:
        order: desc
  search_after: [250]
expected:
  hits:
    total:
      value: 5
      relation: eq
    hits:
      - sort: [200]
      - sort: [-100]
--- # u64 to i64 corner case. We are exceeding i64::MAX, so we don't get any results.
desc: "search after u64 to i64 corner case exceeding i64::MAX asc"
json:
  size: 5
  query:
      match_all: {}
  sort:
    - val_i64:
        order: asc
  search_after: [18_000_000_000_000_000_000]
expected:
  hits:
    total:
      value: 5
      relation: eq
    hits:
      $expect: "len(val) == 0"
--- # u64 to i64 corner case.We are exceeding i64::MAX, but with desc we get ALL the results.
desc: "search after u64 to i64 corner case exceeding i64::MAX desc"
json:
  size: 5
  query:
      match_all: {}
  sort:
    - val_i64:
        order: desc
  search_after: [18_000_000_000_000_000_000]
expected:
  hits:
    total:
      value: 5
      relation: eq
    hits:
      - sort: [9_223_372_036_854_775_807]
      - sort: [9_223_372_036_854_775_807]
      - sort: [300]
      - sort: [200]
      - sort: [-100]
--- # u64 to i64 corner case
desc: "search after u64 to i64 corner case one below i64::MAX asc"
json:
  size: 1
  query:
      match_all: {}
  sort:
    - val_i64:
        order: asc
  search_after: [9_223_372_036_854_775_806]
expected:
  hits:
    total:
      value: 5
      relation: eq
    hits:
      - sort: [9_223_372_036_854_775_807]
---
desc: "search after u64 to i64 corner case exactly i64::MAX asc"
json:
  size: 1
  query:
      match_all: {}
  sort:
    - val_i64:
        order: asc
  search_after: [9_223_372_036_854_775_807]
expected:
  hits:
    total:
      value: 5
      relation: eq
    hits:
      $expect: "len(val) == 0"
---
desc: "search after u64 to i64 corner case one above i64::MAX asc"
json:
  size: 1
  query:
      match_all: {}
  sort:
    - val_i64:
        order: asc
  search_after: [9_223_372_036_854_775_808]
expected:
  hits:
    total:
      value: 5
      relation: eq
    hits:
      $expect: "len(val) == 0"
---
desc: "search after f64 to i64 corner case"
json:
  size: 1
  query:
      match_all: {}
  sort:
    - val_i64:
        order: asc
  search_after: [9_223_372_036_854_500_000.5] # lower the value we seem to hit some f64 accuracy issue here
expected:
  hits:
    total:
      value: 5
      relation: eq
    hits:
      - sort: [9_223_372_036_854_775_807]
---
desc: "search after f64 to i64 out of bounds asc match nothing"
json:
  size: 1
  query:
      match_all: {}
  sort:
    - val_i64:
        order: asc
  search_after: [19_223_372_036_854_500_000.5]
expected:
  hits:
    total:
      value: 5
      relation: eq
    hits:
      $expect: "len(val) == 0"
---
desc: "search after f64 to i64 out of bounds desc match everything"
json:
  size: 5
  query:
      match_all: {}
  sort:
    - val_i64:
        order: desc
  search_after: [19_223_372_036_854_500_000.5]
expected:
  hits:
    total:
      value: 5
      relation: eq
    hits:
      - sort: [9_223_372_036_854_775_807]
      - sort: [9_223_372_036_854_775_807]
      - sort: [300]
      - sort: [200]
      - sort: [-100]
---
desc: "search after on mixed column asc"
json:
  size: 5
  query:
      match_all: {}
  sort:
    - mixed_type:
        order: asc
  search_after: [-10]
expected:
  hits:
    total:
      value: 5
      relation: eq
    hits:
      - sort: [0]
      - sort: [True]
      - sort: [10.5]
      - sort: [18000000000000000000]
---
desc: "search after on mixed column desc match nothing"
json:
  size: 5
  query:
      match_all: {}
  sort:
    - mixed_type:
        order: desc
  search_after: [-10]
expected:
  hits:
    total:
      value: 5
      relation: eq
    hits:
      $expect: "len(val) == 0"
---
desc: "search after on mixed column desc"
json:
  size: 5
  query:
      match_all: {}
  sort:
    - mixed_type:
        order: desc
  search_after: [2]
expected:
  hits:
    total:
      value: 5
      relation: eq
    hits:
      - sort: [True]
      - sort: [0]
      - sort: [-10]


================================================
FILE: quickwit/rest-api-tests/scenarii/search_after/_ctx.yaml
================================================
method: [GET]
endpoint: "search_after/_search"
# The entire suite is just for Quickwit
engines: [quickwit]
api_root: "http://localhost:7280/api/v1/_elastic/"


================================================
FILE: quickwit/rest-api-tests/scenarii/search_after/_setup.quickwit.yaml
================================================
# Delete possibly remaining index
method: DELETE
endpoint: indexes/search_after
status_code: null
---
# Create index
method: POST
api_root: http://localhost:7280/api/v1/
endpoint: indexes/
json:
  version: "0.7"
  index_id: search_after
  doc_mapping:
    mode: dynamic
    dynamic_mapping:
      tokenizer: default
      fast: true
    field_mappings:
      - name: val_u64
        type: u64
        fast: true
      - name: val_f64
        type: f64
        fast: true
      - name: val_i64
        type: i64
        fast: true
sleep_after: 3
---
# Ingest documents split #1
method: POST
api_root: http://localhost:7280/api/v1/
endpoint: search_after/ingest
params:
  commit: force
ndjson:
  - {"mixed_type": 18_000_000_000_000_000_000, "val_i64": -100, "val_f64": 100.5, "val_u64": 0} # mixed_type is a u64
  - {"mixed_type": 0, "val_i64": 9_223_372_036_854_775_807, "val_f64": 110, "val_u64": 18_000_000_000_000_000_000} # to enforce u64 type on val_u64 we need a value > 2^63, or it will take i64 (maybe we should change this)
---
# Ingest documents split #2
method: POST
api_root: http://localhost:7280/api/v1/
endpoint: search_after/ingest
params:
  commit: force
ndjson:
  - {"mixed_type": 10.5, "val_i64": 200, "val_f64": 200.0, "val_u64": 20} #mixed_type is a f64
---
# Ingest documents split #3
method: POST
api_root: http://localhost:7280/api/v1/
endpoint: search_after/ingest
params:
  commit: force
ndjson:
  - {"mixed_type": -10, "val_i64": 300, "val_f64": 300.0, "val_u64": 0} #mixed_type is a i64
---
# Ingest documents split #4
method: POST
api_root: http://localhost:7280/api/v1/
endpoint: search_after/ingest
params:
  commit: force
ndjson:
  - {"mixed_type": true, "val_i64": 9_223_372_036_854_775_807, "val_f64": 300.0, "val_u64": 0} # i64::MAX


================================================
FILE: quickwit/rest-api-tests/scenarii/search_after/_teardown.quickwit.yaml
================================================
method: DELETE
api_root: http://localhost:7280/api/v1/
endpoint: indexes/search_after
status_code: null


================================================
FILE: quickwit/rest-api-tests/scenarii/sort_orders/0001-sort-elasticapi.yaml
================================================
method: [GET]
engines:
  - quickwit
endpoint: _elastic/sortorder/_search
json:
  query:
    bool:
      must_not:
        match:
          count: 10
  sort:
    - id: {"order" : "desc"}
expected:
  hits:
    total:
      value: 4
      relation: "eq"
    hits:
      - _source: { "id": 5 }
      - _source: { "count": -2.5, "id": 4 }
      - _source: { "id": 3 }
      - _source: { "count": 15, "id": 2 }
---
endpoint: _elastic/sortorder/_search
json:
  query:
    bool:
      must_not:
        match:
          count: 10
  sort:
    - id: {"order" : "asc"}
expected:
  hits:
    total:
      value: 4
      relation: "eq"
    hits:
      - _source: {"count": 15, "id": 2 }
      - _source: {"id": 3}
      - _source: {"count": -2.5, "id": 4}
      - _source: {"id": 5}
---
endpoint: _elastic/sortorder/_search
json:
  query:
    match_all: {}
  sort:
    - id: {"order" : "asc"}
    - count: {"order" : "asc"}
expected:
  hits:
    total:
      value: 7
      relation: "eq"
    hits:
      - _source: {"count": 10, "id": 0 }
      - _source: {"count": 10, "id": 1 }
      - _source: {"count": 10, "id": 2 }
      - _source: {"count": 15, "id": 2 }
      - _source: {"id": 3}
      - _source: {"count": -2.5, "id": 4}
      - _source: {"id": 5}
---
endpoint: _elastic/sortorder/_search
json:
  query:
    match_all: {}
  sort:
    - count: {"order" : "desc"}
    - id: {"order" : "desc"}
expected:
  hits:
    total:
      value: 7
      relation: "eq"
    hits:
      - _source: {"count": 15, "id": 2 }
      - _source: {"count": 10, "id": 2 }
      - _source: {"count": 10, "id": 1 }
      - _source: {"count": 10, "id": 0 }
      - _source: {"count": -2.5, "id": 4}
      - _source: {"id": 5}
      - _source: {"id": 3}


================================================
FILE: quickwit/rest-api-tests/scenarii/sort_orders/_ctx.yaml
================================================
method: GET
engines: ["quickwit"]
api_root: "http://localhost:7280/api/v1/"
headers:
  Content-Type: application/json


================================================
FILE: quickwit/rest-api-tests/scenarii/sort_orders/_setup.quickwit.yaml
================================================
# Delete possibly remaining index
method: DELETE
endpoint: indexes/sortorder
status_code: null
---
# Create index
method: POST
endpoint: indexes/
json:
  version: "0.7"
  index_id: sortorder
  doc_mapping:
    mode: dynamic
    dynamic_mapping:
      tokenizer: default
      fast: true
---
# Ingest documents
method: POST
endpoint: sortorder/ingest
params:
  commit: force
min_splits: 1
max_splits: 10
shuffle_ndjson:
  - {"count": 10, "id": 1}
  - {"count": 10, "id": 2}
  - {"count": 15, "id": 2}
  - {"id": 3}
  - {"count": 10, "id": 0}
  - {"count": -2.5, "id": 4}
  - {"id": 5}


================================================
FILE: quickwit/rest-api-tests/scenarii/sort_orders/_teardown.quickwit.yaml
================================================
# # Delete index
method: DELETE
endpoint: indexes/sortorder


================================================
FILE: quickwit/rest-api-tests/scenarii/tag_fields/0001_allowed_types.yaml
================================================
# allowed types
method: POST
endpoint: indexes/
json:
  version: "0.7"
  index_id: allowedtypes
  doc_mapping:
    mode: dynamic
    field_mappings:
      - name: text1
        type: text
        tokenizer: raw
      - name: number1
        type: u64
      - name: number2
        type: i64
    tag_fields: 
      - text1
      - number1
      - number2
---
# tokenized not allowed
method: POST
endpoint: indexes/
json:
  version: "0.7"
  index_id: tokenizedtype
  doc_mapping:
    mode: dynamic
    field_mappings:
      - name: text1
        type: text
        tokenizer: default
    tag_fields: [text1]
status_code: 400
---
# float not allowed
method: POST
endpoint: indexes/
json:
  version: "0.7"
  index_id: floattype
  doc_mapping:
    mode: dynamic
    field_mappings:
      - name: number3
        type: f64
    tag_fields: [number3]
status_code: 400
---
# boolean not allowed
method: POST
endpoint: indexes/
json:
  version: "0.7"
  index_id: booltype
  doc_mapping:
    mode: dynamic
    field_mappings:
      - name: boolean
        type: bool
    tag_fields: [boolean]
status_code: 400
---
# json not allowed
method: POST
endpoint: indexes/
json:
  version: "0.7"
  index_id: jsontype
  doc_mapping:
    mode: dynamic
    field_mappings:
      - name: json1
        type: json
    tag_fields: [json1]
status_code: 400
---
# ip not allowed
method: POST
endpoint: indexes/
json:
  version: "0.7"
  index_id: iptype
  doc_mapping:
    mode: dynamic
    field_mappings:
      - name: ip1
        type: ip
    tag_fields: [ip1]
status_code: 400
---
# bytes not allowed
method: POST
endpoint: indexes/
json:
  version: "0.7"
  index_id: bytestype
  doc_mapping:
    mode: dynamic
    field_mappings:
      - name: bytes1
        type: bytes
    tag_fields: [bytes1]
status_code: 400
---
# bytes not allowed
method: POST
endpoint: indexes/
json:
  version: "0.7"
  index_id: datetype
  doc_mapping:
    mode: dynamic
    field_mappings:
      - name: date1
        type: datetime
        input_formats:
          - rfc3339
    tag_fields: [date1]
status_code: 400
---
# dynamic not allowed
method: POST
endpoint: indexes/
json:
  version: "0.7"
  index_id: dynamictype
  doc_mapping:
    mode: dynamic
    tag_fields: [dynamic1]
status_code: 400
---


================================================
FILE: quickwit/rest-api-tests/scenarii/tag_fields/0002_negative_tags.yaml
================================================
# regression test for https://github.com/quickwit-oss/quickwit/issues/4698
endpoint: tag-simple/search
params:
  query: "tag:1"
expected:
  num_hits: 3
---
endpoint: tag-simple/search
params:
  query: "-tag:2"
expected:
  num_hits: 4
---
endpoint: tag-simple/search
params:
  query: "tag:2"
expected:
  num_hits: 1
---
endpoint: tag-simple/search
params:
  query: "-tag:1"
expected:
  num_hits: 2


================================================
FILE: quickwit/rest-api-tests/scenarii/tag_fields/_ctx.yaml
================================================
method: GET
engines: ["quickwit"]
api_root: "http://localhost:7280/api/v1/"
headers:
  Content-Type: application/json


================================================
FILE: quickwit/rest-api-tests/scenarii/tag_fields/_setup.quickwit.yaml
================================================
# Delete possibly remaining index
method: DELETE
endpoint: indexes/allowedtypes
status_code: null
---
method: DELETE
endpoint: indexes/tag-simple
status_code: null
---
method: POST
endpoint: indexes/
json:
  version: "0.7"
  index_id: tag-simple
  doc_mapping:
    field_mappings:
      - name: seq
        type: u64
      - name: tag
        type: u64
    tag_fields: ["tag"]
---
method: POST
endpoint: tag-simple/ingest
params:
  commit: force
ndjson:
  - {"seq": 1, "tag": 1}
  - {"seq": 2, "tag": 2}
---
method: POST
endpoint: tag-simple/ingest
params:
  commit: force
ndjson:
  - {"seq": 1, "tag": 1}
  - {"seq": 3, "tag": null}
---
method: POST
endpoint: tag-simple/ingest
params:
  commit: force
ndjson:
  - {"seq": 4, "tag": 1}
---


================================================
FILE: quickwit/rest-api-tests/scenarii/tag_fields/_teardown.quickwit.yaml
================================================
method: DELETE
endpoint: indexes/allowedtypes
status_code: null
---
method: DELETE
endpoint: indexes/tag-simple


================================================
FILE: quickwit/rust-toolchain.toml
================================================
[toolchain]
channel = "1.93"
components = ["cargo", "clippy", "rustfmt", "rust-docs"]


================================================
FILE: quickwit/rustfmt.toml
================================================
ignore = [
   "**/codegen/**/*.rs",
]

comment_width = 120
format_strings = true
group_imports = "StdExternalCrate"
imports_granularity = "Module"
normalize_comments = false
where_single_line = true
wrap_comments = true


================================================
FILE: quickwit/scripts/about.hbs
================================================
<html>

<head>
    <style>
        @media (prefers-color-scheme: dark) {
            body {
                background: #333;
                color: white;
            }
            a {
                color: skyblue;
            }
        }
        .container {
            font-family: sans-serif;
            max-width: 800px;
            margin: 0 auto;
        }
        .intro {
            text-align: center;
        }
        .licenses-list {
            list-style-type: none;
            margin: 0;
            padding: 0;
        }
        .license-used-by {
            margin-top: -10px;
        }
        .license-text {
            max-height: 200px;
            overflow-y: scroll;
            white-space: pre-wrap;
        }
    </style>
</head>

<body>
    <main class="container">
        <div class="intro">
            <h1>Third Party Licenses</h1>
            <p>This page lists the licenses of the projects used in cargo-about.</p>
        </div>
    
        <h2>Overview of licenses:</h2>
        <ul class="licenses-overview">
            {{#each overview}}
            <li><a href="#{{id}}">{{name}}</a> ({{count}})</li>
            {{/each}}
        </ul>

        <h2>All license text:</h2>
        <ul class="licenses-list">
            {{#each licenses}}
            <li class="license">
                <h3 id="{{id}}">{{name}}</h3>
                <h4>Used by:</h4>
                <ul class="license-used-by">
                    {{#each used_by}}
                    <li><a href="{{#if crate.repository}} {{crate.repository}} {{else}} https://crates.io/crates/{{crate.name}} {{/if}}">{{crate.name}} {{crate.version}}</a></li>
                    {{/each}}
                </ul>
                <pre class="license-text">{{text}}</pre>
            </li>
            {{/each}}
        </ul>
    </main>
</body>

</html>


================================================
FILE: quickwit/scripts/about.toml
================================================
accepted = [
    "0BSD",
    "AGPL-3.0",
    "LicenseRef-AGPL-3.0-or-later",
    "Apache-2.0",
    "BSD-2-Clause",
    "BSD-3-Clause",
"CC0-1.0",
    "ISC",
    "MIT",
    "MPL-2.0",
    "OpenSSL",
    "Unicode-DFS-2016",
    "Unlicense",
    "Zlib",
    "zlib-acknowledgement"
]

workarounds = [
    "ring",
    "rustls",
]

[whichlang.clarify]
license = "MIT"


[plotters.clarify]
license = "MIT"


[plotters-svg.clarify]
license = "MIT"


[advapi32-sys.clarify]
license = "MIT"


================================================
FILE: quickwit/scripts/check_license_headers.sh
================================================
#!/bin/bash

RESULT=0

for file in $(git ls-files | \
    grep "build\|src\|proto" | \
    grep -e "\.proto\|\.rs\|\.ts" | \
    grep -v "quickwit-proto/protos/third-party" | \
    grep -v "quickwit-proto/src" | \
    grep -v "/codegen/" \
)
do
    diff <(sed 's/{\\d+}/2021/' .license_header.txt) <(head -n 14 $file) > /dev/null
    DIFFRESULT=$?
    if [ $DIFFRESULT -ne 0 ]; then
        grep -q -i 'begin quickwit-codegen' $file
        GREPRESULT=$?
        if [ $GREPRESULT -ne 0 ]; then
            echo "Incomplete or missing license header in $file"
            RESULT=1
        fi
    fi
done

exit $RESULT


================================================
FILE: quickwit/scripts/check_log_format.sh
================================================
#!/bin/bash

RESULT=0

for file in $(git ls-files | grep -E "src/.*\.rs$")
do
    LOG_STARTING_WITH_UPPERCASE=$(grep -E -n "(warn|info|error|debug)!\(\"[A-Z][a-z]" $file)
    DIFFRESULT=$?
    LOG_ENDING_WITH_PERIOD=$(grep -E -n "(warn|info|error|debug)!.*\.\"\);" $file)
    DIFFRESULT=$(($DIFFRESULT && $?))
    if [ $DIFFRESULT -eq 0 ]; then
      echo "===================="
      echo $file
      echo $LOG_STARTING_WITH_UPPERCASE
      echo $LOG_ENDING_WITH_PERIOD
      echo $FAULTY_LINES
      RESULT=1
    fi
done

exit $RESULT


================================================
FILE: quickwit/scripts/dep-tree.py
================================================
import fileinput
from collections import defaultdict
import graphviz

FILTER = {
	"quickwit-backward-compat",
	"quickwit-actors",
	"quickwit-cli",
    "quickwit-rest-client",
	"quickwit-doc-mapper",
	"quickwit-search",
	"quickwit-common",
	"quickwit-indexing",
	"quickwit-metastore",
	"quickwit-proto",
	"quickwit-directories",
	"quickwit-common",
    "quickwit-rest-client",
	"quickwit-serve",
	"quickwit-storage",
	"quickwit-cluster",
	"quickwit-index-management",
    "tantivy"
}

def deps():
    deps = defaultdict(set)
    last_level = {}
    old_code = 10
    for line in fileinput.input():
        line = line.strip()
        if len(line) < 2:
            continue
        (code, package) = (line[0], line[1:])
        if package not in FILTER:
            continue
        code = int(code)
        last_level[code] = package
        print(line)
        if code > 0:
            if (code - 1) in last_level:
                deps[last_level[code - 1]].add(package)
    return dict(deps)


deps_graph = deps()

dot = graphviz.Digraph(filename='deps', directory='.', format='svg')

for (from_node, to_nodes) in deps_graph.items():
    if from_node not in FILTER:
        continue
    dot.node(from_node, from_node)
    for to_node in to_nodes:
        print((from_node, to_node))
        if to_node == from_node:
            continue
        if to_node not in FILTER:
            continue
        dot.edge(from_node, to_node)

dot.render()